// Protocol Buffers - Google's data interchange format
// Copyright 2022 Google Inc. All rights reserved.
//
// Use of this source code is governed by a BSD-style
// license that can be found in the LICENSE file or at
// https://developers.google.com/open-source/licenses/bsd
//
// This file defines the internal class ThreadSafeArena.
#ifndef GOOGLE_PROTOBUF_THREAD_SAFE_ARENA_H__
#define GOOGLE_PROTOBUF_THREAD_SAFE_ARENA_H__
#include <atomic>
#include <cstddef>
#include <cstdint>
#include <type_traits>
#include <vector>
#include "absl/base/attributes.h"
#include "absl/base/optimization.h"
#include "absl/synchronization/mutex.h"
#include "google/protobuf/arena_align.h"
#include "google/protobuf/arena_allocation_policy.h"
#include "google/protobuf/arena_cleanup.h"
#include "google/protobuf/arenaz_sampler.h"
#include "google/protobuf/port.h"
#include "google/protobuf/serial_arena.h"
// Must be included last.
#include "google/protobuf/port_def.inc"
namespace google {
namespace protobuf {
namespace internal {
// This class provides the core Arena memory allocation library. Different
// implementations only need to implement the public interface below. Arena
// is not a template type, as that would only be useful if all protos were in
// turn templates, which will not (and cannot) happen. However, by separating
// the memory allocation part from the cruft of the API users expect, we can
// use #ifdef to select the best implementation based on hardware / OS.
class PROTOBUF_EXPORT ThreadSafeArena {
public:
ThreadSafeArena();
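// These overloads seed the arena with a user-provided initial block; the
// three-argument form also installs a custom allocation policy.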
ThreadSafeArena(char* mem, size_t size);
explicit ThreadSafeArena(void* mem, size_t size,
const AllocationPolicy& policy);
// All protos have pointers back to the arena hence Arena must have
// pointer stability.
ThreadSafeArena(const ThreadSafeArena&) = delete;
ThreadSafeArena& operator=(const ThreadSafeArena&) = delete;
ThreadSafeArena(ThreadSafeArena&&) = delete;
ThreadSafeArena& operator=(ThreadSafeArena&&) = delete;
// The destructor deletes all owned heap-allocated objects and destructs
// objects that have non-trivial destructors, except for proto2 message
// objects whose destructors can be skipped. It also frees all blocks except
// the initial block, if one was passed in.
~ThreadSafeArena();
uint64_t Reset();
uint64_t SpaceAllocated() const;
uint64_t SpaceUsed() const;
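// Allocates n bytes. On the fast path, the calling thread's cached
// SerialArena serves the request; otherwise the fallback looks up or
// creates a SerialArena for this thread first.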
template <AllocationClient alloc_client = AllocationClient::kDefault>
void* AllocateAligned(size_t n) {
SerialArena* arena;
if (ABSL_PREDICT_TRUE(GetSerialArenaFast(&arena))) {
return arena->AllocateAligned<alloc_client>(n);
} else {
return AllocateAlignedFallback<alloc_client>(n);
}
}
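// Returns array memory to this thread's SerialArena so it can be reused. If
// this thread has no cached SerialArena for this arena, the memory is simply
// not recycled; it still belongs to the arena's blocks and is reclaimed when
// the arena is reset or destroyed.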
void ReturnArrayMemory(void* p, size_t size) {
SerialArena* arena = nullptr;
if (ABSL_PREDICT_TRUE(GetSerialArenaFast(&arena))) {
arena->ReturnArrayMemory(p, size);
}
}
// This function allocates n bytes if the common happy case is true and
// returns true. Otherwise it does nothing and returns false. These unusual
// semantics are necessary to let callers write functions whose only
// fallback calls are in tail position, which substantially improves the
// generated code for the happy path.
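//
// For example, a caller can keep its fallback call in tail position along
// these lines (a hedged sketch; "AllocBytes" is illustrative, not part of
// this API):
//
//   void* AllocBytes(ThreadSafeArena& arena, size_t n) {
//     void* ptr;
//     if (ABSL_PREDICT_TRUE(arena.MaybeAllocateAligned(n, &ptr))) return ptr;
//     return arena.AllocateAligned(n);  // fallback stays in tail position
//   }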
PROTOBUF_NDEBUG_INLINE bool MaybeAllocateAligned(size_t n, void** out) {
SerialArena* arena = nullptr;
if (ABSL_PREDICT_TRUE(GetSerialArenaFast(&arena))) {
return arena->MaybeAllocateAligned(n, out);
}
return false;
}
void* AllocateAlignedWithCleanup(size_t n, size_t align,
void (*destructor)(void*));
// Adds an object pointer and a cleanup function pointer to the list.
void AddCleanup(void* elem, void (*cleanup)(void*));
void* AllocateFromStringBlock();
std::vector<void*> PeekCleanupListForTesting();
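//
// A hedged usage sketch (ThreadSafeArena is internal; most callers go
// through google::protobuf::Arena, which wraps this class):
//
//   ThreadSafeArena arena;
//   void* p = arena.AllocateAligned(64);  // per-thread fast path
//   arena.AddCleanup(p, +[](void* q) { /* destroy *q here */ });
//   uint64_t n = arena.Reset();  // runs cleanups; arena becomes reusable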
private:
friend class ArenaBenchmark;
friend class TcParser;
friend class SerialArena;
friend struct SerialArenaChunkHeader;
friend class cleanup::ChunkList;
static uint64_t GetNextLifeCycleId();
class SerialArenaChunk;
// Returns a new SerialArenaChunk that has {id, serial} at slot 0. It may
// grow based on "prev_capacity".
static SerialArenaChunk* NewSerialArenaChunk(uint32_t prev_capacity, void* id,
SerialArena* serial);
static SerialArenaChunk* SentrySerialArenaChunk();
// Returns the first ArenaBlock* for the first SerialArena. If the user
// provided a buffer and it is acceptable, uses it; otherwise returns a
// sentry block.
ArenaBlock* FirstBlock(void* buf, size_t size);
// Same as above, but returns a valid block if "policy" is not the default.
ArenaBlock* FirstBlock(void* buf, size_t size,
const AllocationPolicy& policy);
// Adds SerialArena to the chunked list. May create a new chunk.
void AddSerialArena(void* id, SerialArena* serial);
void UnpoisonAllArenaBlocks() const;
// Members are declared here to track sizeof(ThreadSafeArena) and hotness
// centrally.
// Unique for each arena. Changes on Reset().
uint64_t tag_and_id_ = 0;
TaggedAllocationPolicyPtr alloc_policy_; // Tagged pointer to AllocPolicy.
ThreadSafeArenaStatsHandle arena_stats_;
// Adding a new chunk to head_ must be protected by mutex_.
absl::Mutex mutex_;
// Pointer to a linked list of SerialArenaChunk.
std::atomic<SerialArenaChunk*> head_{nullptr};
void* first_owner_;
// Must be declared after alloc_policy_; otherwise, it may lose info on the
// user-provided initial block.
SerialArena first_arena_;
static_assert(std::is_trivially_destructible<SerialArena>{},
"SerialArena needs to be trivially destructible.");
const AllocationPolicy* AllocPolicy() const { return alloc_policy_.get(); }
void InitializeWithPolicy(const AllocationPolicy& policy);
void* AllocateAlignedWithCleanupFallback(size_t n, size_t align,
void (*destructor)(void*));
void Init();
// Deletes or destructs all objects owned by the arena.
void CleanupList();
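// Records "serial" in the calling thread's cache so that subsequent
// GetSerialArenaFast() calls from this thread hit the fast path.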
inline void CacheSerialArena(SerialArena* serial) {
thread_cache().last_serial_arena = serial;
thread_cache().last_lifecycle_id_seen = tag_and_id_;
}
PROTOBUF_NDEBUG_INLINE bool GetSerialArenaFast(SerialArena** arena) {
// If this thread already owns a block in this arena then try to use that.
// This fast path optimizes the case where multiple threads allocate from
// the same arena.
ThreadCache* tc = &thread_cache();
if (ABSL_PREDICT_TRUE(tc->last_lifecycle_id_seen == tag_and_id_)) {
*arena = tc->last_serial_arena;
return true;
}
return false;
}
// Finds this thread's SerialArena, or creates one if not found. When
// creating a new one, creates a block big enough to accommodate n bytes.
SerialArena* GetSerialArenaFallback(size_t n);
SerialArena* GetSerialArena();
template <AllocationClient alloc_client = AllocationClient::kDefault>
void* AllocateAlignedFallback(size_t n);
// Executes the callback for each SerialArenaChunk, passing a
// const SerialArenaChunk*.
template <typename Callback>
void WalkConstSerialArenaChunk(Callback fn) const;
// Executes the callback for each SerialArenaChunk.
template <typename Callback>
void WalkSerialArenaChunk(Callback fn);
// Visits each SerialArena, including "first_arena_" and those on chunks,
// and calls "fn" on it. Do not rely on the visit order. The callback must
// accept `const SerialArena*`.
template <typename Callback>
void VisitSerialArena(Callback fn) const;
// Releases all memory except the first block, which it returns. The first
// block might be owned by the user and thus needs some extra checks before
// deletion.
SizedPtr Free();
// ThreadCache is accessed very frequently, so we align it such that it's
// located within a single cache line.
static constexpr size_t kThreadCacheAlignment = 32;
#ifdef _MSC_VER
#pragma warning(disable : 4324)
#endif
struct alignas(kThreadCacheAlignment) ThreadCache {
// Number of per-thread lifecycle IDs to reserve. Must be power of two.
// To reduce contention on a global atomic, each thread reserves a batch of
// IDs. The following number is calculated based on a stress test with
// ~6500 threads all frequently allocating a new arena.
static constexpr size_t kPerThreadIds = 256;
// Next lifecycle ID available to this thread. We need to reserve a new
// batch if `next_lifecycle_id & (kPerThreadIds - 1) == 0`.
uint64_t next_lifecycle_id{0};
// The ThreadCache is considered valid as long as this matches the
// lifecycle_id of the arena being used.
uint64_t last_lifecycle_id_seen{static_cast<uint64_t>(-1)};
SerialArena* last_serial_arena{nullptr};
};
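// A hedged sketch of how GetNextLifeCycleId() is expected to use the fields
// above (assumed shape; the memory order is an assumption, not taken from
// this header):
//
//   ThreadCache& tc = thread_cache();
//   uint64_t id = tc.next_lifecycle_id;
//   if (ABSL_PREDICT_FALSE((id & (ThreadCache::kPerThreadIds - 1)) == 0)) {
//     id = lifecycle_id_.fetch_add(ThreadCache::kPerThreadIds,
//                                  std::memory_order_relaxed);
//   }
//   tc.next_lifecycle_id = id + 1;
//   return id;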
static_assert(sizeof(ThreadCache) <= kThreadCacheAlignment,
"ThreadCache may span several cache lines");
// lifecycle_id_ can be a highly contended variable when many arenas are
// created. Make sure that other global variables are not sharing its cache
// line.
#ifdef _MSC_VER
#pragma warning(disable : 4324)
#endif
using LifecycleId = uint64_t;
alignas(kCacheAlignment) ABSL_CONST_INIT
static std::atomic<LifecycleId> lifecycle_id_;
#if defined(PROTOBUF_NO_THREADLOCAL)
// iOS does not support the __thread keyword, so we use a custom
// thread-local storage class that we implemented.
static ThreadCache& thread_cache();
#elif defined(PROTOBUF_USE_DLLS) && defined(_WIN32)
// Thread-local variables cannot be exposed through the MSVC DLL interface,
// but we can wrap them in static functions.
static ThreadCache& thread_cache();
#else
PROTOBUF_CONSTINIT static PROTOBUF_THREAD_LOCAL ThreadCache thread_cache_;
static ThreadCache& thread_cache() { return thread_cache_; }
#endif
public:
// kBlockHeaderSize is sizeof(ArenaBlock), aligned up to the nearest multiple
// of 8 to protect the invariant that pos is always at a multiple of 8.
static constexpr size_t kBlockHeaderSize = SerialArena::kBlockHeaderSize;
static constexpr size_t kSerialArenaSize =
(sizeof(SerialArena) + 7) & static_cast<size_t>(-8);
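// (kSerialArenaSize rounds sizeof(SerialArena) up to the next multiple of
// 8: "& static_cast<size_t>(-8)" clears the low three bits.)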
static constexpr size_t kAllocPolicySize =
ArenaAlignDefault::Ceil(sizeof(AllocationPolicy));
static constexpr size_t kMaxCleanupNodeSize = 16;
static_assert(kBlockHeaderSize % 8 == 0,
"kBlockHeaderSize must be a multiple of 8.");
static_assert(kSerialArenaSize % 8 == 0,
"kSerialArenaSize must be a multiple of 8.");
};
} // namespace internal
} // namespace protobuf
} // namespace google
#include "google/protobuf/port_undef.inc"
#endif // GOOGLE_PROTOBUF_THREAD_SAFE_ARENA_H__