// Protocol Buffers - Google's data interchange format
// Copyright 2008 Google Inc. All rights reserved.
//
// Use of this source code is governed by a BSD-style
// license that can be found in the LICENSE file or at
// https://developers.google.com/open-source/licenses/bsd
#include "google/protobuf/arena.h"
#include <algorithm>
#include <atomic>
#include <cstddef>
#include <cstdint>
#include <limits>
#include <string>
#include <typeinfo>
#include <vector>
#include "absl/base/attributes.h"
#include "absl/container/internal/layout.h"
#include "absl/synchronization/mutex.h"
#include "google/protobuf/arena_allocation_policy.h"
#include "google/protobuf/arenaz_sampler.h"
#include "google/protobuf/port.h"
#include "google/protobuf/serial_arena.h"
#include "google/protobuf/thread_safe_arena.h"
#ifdef ADDRESS_SANITIZER
#include <sanitizer/asan_interface.h>
#endif // ADDRESS_SANITIZER
// Must be included last.
#include "google/protobuf/port_def.inc"
namespace google {
namespace protobuf {
namespace internal {
namespace {
#if defined(__GNUC__) && __GNUC__ >= 5
// kSentryArenaBlock is used for arenas which can be referenced pre-main. So,
// constexpr is required.
constexpr ArenaBlock kSentryArenaBlock;
ArenaBlock* SentryArenaBlock() {
// const_cast<> is okay as kSentryArenaBlock will never be mutated.
return const_cast<ArenaBlock*>(&kSentryArenaBlock);
}
#else
// TODO Remove this once we're not using GCC 4.9 for tests.
// There is a compiler bug in this version that causes the above constexpr to
// fail. This version is no longer in our support window, but we use it in
// some of our aarch64 docker images.
ArenaBlock* SentryArenaBlock() {
static const ArenaBlock kSentryArenaBlock;
// const_cast<> is okay as kSentryArenaBlock will never be mutated.
return const_cast<ArenaBlock*>(&kSentryArenaBlock);
}
#endif
} // namespace
static SizedPtr AllocateMemory(const AllocationPolicy* policy_ptr,
size_t last_size, size_t min_bytes) {
AllocationPolicy policy; // default policy
if (policy_ptr) policy = *policy_ptr;
size_t size;
if (last_size != 0) {
// Double the current block size, up to a limit.
auto max_size = policy.max_block_size;
size = std::min(2 * last_size, max_size);
} else {
size = policy.start_block_size;
}
// Verify that min_bytes + kBlockHeaderSize won't overflow.
ABSL_CHECK_LE(min_bytes, std::numeric_limits<size_t>::max() -
SerialArena::kBlockHeaderSize);
size = std::max(size, SerialArena::kBlockHeaderSize + min_bytes);
if (policy.block_alloc == nullptr) {
return AllocateAtLeast(size);
}
return {policy.block_alloc(size), size};
}
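// Illustrative sketch (comment only, not part of the build): assuming the
// default AllocationPolicy uses start_block_size = 256 bytes and
// max_block_size = 32 KiB, successive calls grow the block size roughly as
//
//   AllocateMemory(nullptr, /*last_size=*/0,     /*min_bytes=*/16);  // ~256 B
//   AllocateMemory(nullptr, /*last_size=*/256,   /*min_bytes=*/16);  // ~512 B
//   AllocateMemory(nullptr, /*last_size=*/512,   /*min_bytes=*/16);  // ~1 KiB
//   ...
//   AllocateMemory(nullptr, /*last_size=*/32768, /*min_bytes=*/16);  // ~32 KiB (cap)
//
// A single request larger than the doubled size instead yields at least
// kBlockHeaderSize + min_bytes, and AllocateAtLeast may round any of these up.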
class GetDeallocator {
public:
GetDeallocator(const AllocationPolicy* policy, size_t* space_allocated)
: dealloc_(policy ? policy->block_dealloc : nullptr),
space_allocated_(space_allocated) {}
void operator()(SizedPtr mem) const {
#ifdef ADDRESS_SANITIZER
// This memory was provided by the underlying allocator as unpoisoned,
// so return it in an unpoisoned state.
ASAN_UNPOISON_MEMORY_REGION(mem.p, mem.n);
#endif // ADDRESS_SANITIZER
if (dealloc_) {
dealloc_(mem.p, mem.n);
} else {
internal::SizedDelete(mem.p, mem.n);
}
*space_allocated_ += mem.n;
}
private:
void (*dealloc_)(void*, size_t);
size_t* space_allocated_;
};
// It is guaranteed that this is constructed in `b`. In other words, this is
// not the first arena and `b` cannot be a sentry.
SerialArena::SerialArena(ArenaBlock* b, ThreadSafeArena& parent)
: ptr_{b->Pointer(kBlockHeaderSize + ThreadSafeArena::kSerialArenaSize)},
limit_{b->Limit()},
prefetch_ptr_(
b->Pointer(kBlockHeaderSize + ThreadSafeArena::kSerialArenaSize)),
prefetch_limit_(b->Limit()),
head_{b},
space_allocated_{b->size},
parent_{parent} {
ABSL_DCHECK(!b->IsSentry());
}
// It is guaranteed that this is the first SerialArena. Use sentry block.
SerialArena::SerialArena(ThreadSafeArena& parent)
: head_{SentryArenaBlock()}, parent_{parent} {}
// It is guaranteed that this is the first SerialArena but `b` may be user
// provided or newly allocated to store AllocationPolicy.
SerialArena::SerialArena(FirstSerialArena, ArenaBlock* b,
ThreadSafeArena& parent)
: head_{b}, space_allocated_{b->size}, parent_{parent} {
if (b->IsSentry()) return;
set_range(b->Pointer(kBlockHeaderSize), b->Limit());
}
std::vector<void*> SerialArena::PeekCleanupListForTesting() {
std::vector<void*> res;
ArenaBlock* b = head();
if (b->IsSentry()) return res;
const auto peek_list = [&](const char* pos, const char* end) {
while (pos != end) {
pos += cleanup::PeekNode(pos, res);
}
};
peek_list(limit_, b->Limit());
for (b = b->next; b; b = b->next) {
peek_list(reinterpret_cast<char*>(b->cleanup_nodes), b->Limit());
}
return res;
}
std::vector<void*> ThreadSafeArena::PeekCleanupListForTesting() {
return GetSerialArena()->PeekCleanupListForTesting();
}
void SerialArena::Init(ArenaBlock* b, size_t offset) {
set_range(b->Pointer(offset), b->Limit());
head_.store(b, std::memory_order_relaxed);
space_used_.store(0, std::memory_order_relaxed);
space_allocated_.store(b->size, std::memory_order_relaxed);
cached_block_length_ = 0;
cached_blocks_ = nullptr;
string_block_.store(nullptr, std::memory_order_relaxed);
string_block_unused_.store(0, std::memory_order_relaxed);
}
SerialArena* SerialArena::New(SizedPtr mem, ThreadSafeArena& parent) {
ABSL_DCHECK_LE(kBlockHeaderSize + ThreadSafeArena::kSerialArenaSize, mem.n);
ThreadSafeArenaStats::RecordAllocateStats(parent.arena_stats_.MutableStats(),
/*used=*/0, /*allocated=*/mem.n,
/*wasted=*/0);
auto b = new (mem.p) ArenaBlock{nullptr, mem.n};
return new (b->Pointer(kBlockHeaderSize)) SerialArena(b, parent);
}
template <typename Deallocator>
SizedPtr SerialArena::Free(Deallocator deallocator) {
ArenaBlock* b = head();
SizedPtr mem = {b, b->size};
while (b->next) {
b = b->next; // We must first advance before deleting this block
deallocator(mem);
mem = {b, b->size};
}
return mem;
}
PROTOBUF_NOINLINE
void* SerialArena::AllocateAlignedFallback(size_t n) {
AllocateNewBlock(n);
void* ret;
bool res = MaybeAllocateAligned(n, &ret);
ABSL_DCHECK(res);
return ret;
}
PROTOBUF_NOINLINE
void* SerialArena::AllocateFromStringBlockFallback() {
ABSL_DCHECK_EQ(string_block_unused_.load(std::memory_order_relaxed), 0U);
StringBlock* sb = string_block_.load(std::memory_order_relaxed);
if (sb) {
AddSpaceUsed(sb->effective_size());
}
void* ptr;
StringBlock* new_sb;
size_t size = StringBlock::NextSize(sb);
if (MaybeAllocateAligned(size, &ptr)) {
// Correct space_used_ to avoid double counting
AddSpaceUsed(-size);
new_sb = StringBlock::Emplace(ptr, size, sb);
} else {
new_sb = StringBlock::New(sb);
AddSpaceAllocated(new_sb->allocated_size());
}
string_block_.store(new_sb, std::memory_order_release);
size_t unused = new_sb->effective_size() - sizeof(std::string);
string_block_unused_.store(unused, std::memory_order_relaxed);
return new_sb->AtOffset(unused);
}
PROTOBUF_NOINLINE
void* SerialArena::AllocateAlignedWithCleanupFallback(
size_t n, size_t align, void (*destructor)(void*)) {
size_t required = AlignUpTo(n, align) + cleanup::Size(destructor);
AllocateNewBlock(required);
return AllocateAlignedWithCleanup(n, align, destructor);
}
PROTOBUF_NOINLINE
void SerialArena::AddCleanupFallback(void* elem, void (*destructor)(void*)) {
size_t required = cleanup::Size(destructor);
AllocateNewBlock(required);
AddCleanupFromExisting(elem, destructor);
}
void SerialArena::AllocateNewBlock(size_t n) {
size_t used = 0;
size_t wasted = 0;
ArenaBlock* old_head = head();
if (!old_head->IsSentry()) {
// Sync limit to block
old_head->cleanup_nodes = limit_;
    // Record how much of this block was used.
used = static_cast<size_t>(ptr() - old_head->Pointer(kBlockHeaderSize));
wasted = old_head->size - used - kBlockHeaderSize;
AddSpaceUsed(used);
}
  // TODO: Evaluate whether pushing unused space into the cached blocks is a
  // win. Preliminary testing showed increased memory savings as expected, but
  // with a CPU regression. The regression might have been an artifact of the
  // microbenchmark.
auto mem = AllocateMemory(parent_.AllocPolicy(), old_head->size, n);
// We don't want to emit an expensive RMW instruction that requires
// exclusive access to a cacheline. Hence we write it in terms of a
// regular add.
AddSpaceAllocated(mem.n);
ThreadSafeArenaStats::RecordAllocateStats(parent_.arena_stats_.MutableStats(),
/*used=*/used,
/*allocated=*/mem.n, wasted);
auto* new_head = new (mem.p) ArenaBlock{old_head, mem.n};
set_range(new_head->Pointer(kBlockHeaderSize), new_head->Limit());
// Previous writes must take effect before writing new head.
head_.store(new_head, std::memory_order_release);
#ifdef ADDRESS_SANITIZER
ASAN_POISON_MEMORY_REGION(ptr(), limit_ - ptr());
#endif // ADDRESS_SANITIZER
}
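// Illustrative sketch (comment only, not part of the build): if the old head
// is a 1024-byte block, kBlockHeaderSize is, say, 24 bytes, and ptr() sits
// 600 bytes past the header, then the stats recorded by AllocateNewBlock
// would be roughly
//   used   = 600
//   wasted = 1024 - 600 - 24 = 400
// before set_range() switches over to the freshly allocated block.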
uint64_t SerialArena::SpaceUsed() const {
// Note: the calculation below technically causes a race with
// AllocateNewBlock when called from another thread (which happens in
// ThreadSafeArena::SpaceUsed). However, worst-case space_used_ will have
// stale data and the calculation will incorrectly assume 100%
// usage of the *current* block.
// TODO Consider eliminating this race in exchange for a possible
// performance hit on ARM (see cl/455186837).
uint64_t space_used = 0;
StringBlock* sb = string_block_.load(std::memory_order_acquire);
if (sb) {
size_t unused = string_block_unused_.load(std::memory_order_relaxed);
space_used += sb->effective_size() - unused;
}
const ArenaBlock* h = head_.load(std::memory_order_acquire);
if (h->IsSentry()) return space_used;
const uint64_t current_block_size = h->size;
space_used += std::min(
static_cast<uint64_t>(
ptr() - const_cast<ArenaBlock*>(h)->Pointer(kBlockHeaderSize)),
current_block_size);
return space_used + space_used_.load(std::memory_order_relaxed);
}
size_t SerialArena::FreeStringBlocks(StringBlock* string_block,
size_t unused_bytes) {
ABSL_DCHECK(string_block != nullptr);
StringBlock* next = string_block->next();
std::string* end = string_block->end();
for (std::string* s = string_block->AtOffset(unused_bytes); s != end; ++s) {
s->~basic_string();
}
size_t deallocated = StringBlock::Delete(string_block);
while ((string_block = next) != nullptr) {
next = string_block->next();
for (std::string& s : *string_block) {
s.~basic_string();
}
deallocated += StringBlock::Delete(string_block);
}
return deallocated;
}
void SerialArena::CleanupList() {
ArenaBlock* b = head();
if (b->IsSentry()) return;
b->cleanup_nodes = limit_;
do {
char* limit = b->Limit();
char* it = reinterpret_cast<char*>(b->cleanup_nodes);
ABSL_DCHECK(!b->IsSentry() || it == limit);
while (it < limit) {
it += cleanup::DestroyNode(it);
}
b = b->next;
} while (b);
}
// Stores arrays of void* and SerialArena* instead of a linked list of
// SerialArena* to speed up traversing all SerialArenas. The cost of walking is
// non-trivial when there are many nodes. Separately storing the "ids" minimizes
// the cache footprint and is more efficient when looking for a matching arena.
// (A worked size example follows the class definition below.)
//
// Uses absl::container_internal::Layout to emulate the following:
//
// struct SerialArenaChunk {
// struct SerialArenaChunkHeader {
// SerialArenaChunk* next_chunk;
// uint32_t capacity;
// std::atomic<uint32_t> size;
// } header;
// std::atomic<void*> ids[];
// std::atomic<SerialArena*> arenas[];
// };
//
// where the size of "ids" and "arenas" is determined at runtime; hence the use
// of Layout.
struct SerialArenaChunkHeader {
constexpr SerialArenaChunkHeader(uint32_t capacity, uint32_t size)
: next_chunk(nullptr), capacity(capacity), size(size) {}
ThreadSafeArena::SerialArenaChunk* next_chunk;
uint32_t capacity;
std::atomic<uint32_t> size;
};
class ThreadSafeArena::SerialArenaChunk {
public:
SerialArenaChunk(uint32_t capacity, void* me, SerialArena* serial) {
new (&header()) SerialArenaChunkHeader{capacity, 1};
new (&id(0)) std::atomic<void*>{me};
for (uint32_t i = 1; i < capacity; ++i) {
new (&id(i)) std::atomic<void*>{nullptr};
}
new (&arena(0)) std::atomic<SerialArena*>{serial};
for (uint32_t i = 1; i < capacity; ++i) {
      new (&arena(i)) std::atomic<SerialArena*>{nullptr};
}
}
bool IsSentry() const { return capacity() == 0; }
// next_chunk
const SerialArenaChunk* next_chunk() const { return header().next_chunk; }
SerialArenaChunk* next_chunk() { return header().next_chunk; }
void set_next(SerialArenaChunk* next_chunk) {
header().next_chunk = next_chunk;
}
// capacity
uint32_t capacity() const { return header().capacity; }
void set_capacity(uint32_t capacity) { header().capacity = capacity; }
// ids: returns up to size().
absl::Span<const std::atomic<void*>> ids() const {
return Layout(capacity()).Slice<kIds>(ptr()).first(safe_size());
}
absl::Span<std::atomic<void*>> ids() {
return Layout(capacity()).Slice<kIds>(ptr()).first(safe_size());
}
std::atomic<void*>& id(uint32_t i) {
ABSL_DCHECK_LT(i, capacity());
return Layout(capacity()).Pointer<kIds>(ptr())[i];
}
// arenas: returns up to size().
absl::Span<const std::atomic<SerialArena*>> arenas() const {
return Layout(capacity()).Slice<kArenas>(ptr()).first(safe_size());
}
absl::Span<std::atomic<SerialArena*>> arenas() {
return Layout(capacity()).Slice<kArenas>(ptr()).first(safe_size());
}
const std::atomic<SerialArena*>& arena(uint32_t i) const {
ABSL_DCHECK_LT(i, capacity());
return Layout(capacity()).Pointer<kArenas>(ptr())[i];
}
std::atomic<SerialArena*>& arena(uint32_t i) {
ABSL_DCHECK_LT(i, capacity());
return Layout(capacity()).Pointer<kArenas>(ptr())[i];
}
// Tries to insert {id, serial} to head chunk. Returns false if the head is
// already full.
//
  // Note that updating "size", "id", and "arena" is individually atomic, but
  // these updates are not protected by a mutex. This is acceptable because
  // concurrent lookups from SpaceUsed or SpaceAllocated tolerate the resulting
  // inaccuracy. On other paths, either the race is not possible
  // (GetSerialArenaFallback) or it must be prevented by users (CleanupList,
  // Free).
bool insert(void* me, SerialArena* serial) {
uint32_t idx = size().fetch_add(1, std::memory_order_relaxed);
// Bail out if this chunk is full.
if (idx >= capacity()) {
// Write old value back to avoid potential overflow.
size().store(capacity(), std::memory_order_relaxed);
return false;
}
id(idx).store(me, std::memory_order_relaxed);
arena(idx).store(serial, std::memory_order_release);
return true;
}
constexpr static size_t AllocSize(size_t n) { return Layout(n).AllocSize(); }
private:
constexpr static int kHeader = 0;
constexpr static int kIds = 1;
constexpr static int kArenas = 2;
using layout_type = absl::container_internal::Layout<
SerialArenaChunkHeader, std::atomic<void*>, std::atomic<SerialArena*>>;
const char* ptr() const { return reinterpret_cast<const char*>(this); }
char* ptr() { return reinterpret_cast<char*>(this); }
SerialArenaChunkHeader& header() {
return *layout_type::Partial().Pointer<kHeader>(ptr());
}
const SerialArenaChunkHeader& header() const {
return *layout_type::Partial().Pointer<kHeader>(ptr());
}
std::atomic<uint32_t>& size() { return header().size; }
const std::atomic<uint32_t>& size() const { return header().size; }
// Returns the size capped by the capacity as fetch_add may result in a size
// greater than capacity.
uint32_t safe_size() const {
return std::min(capacity(), size().load(std::memory_order_relaxed));
}
constexpr static layout_type Layout(size_t n) {
return layout_type(
/*header*/ 1,
/*ids*/ n,
/*arenas*/ n);
}
};
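// Illustrative sketch (comment only, not part of the build): on a typical
// 64-bit target, assuming a 16-byte SerialArenaChunkHeader and 8-byte atomics,
// a chunk with capacity 4 would be laid out roughly as
//
//   offset  0: SerialArenaChunkHeader (next_chunk, capacity, size)
//   offset 16: std::atomic<void*>        ids[4]     (32 bytes)
//   offset 48: std::atomic<SerialArena*> arenas[4]  (32 bytes)
//
// giving SerialArenaChunk::AllocSize(4) == 80 bytes.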
constexpr SerialArenaChunkHeader kSentryArenaChunk = {0, 0};
ThreadSafeArena::SerialArenaChunk* ThreadSafeArena::SentrySerialArenaChunk() {
// const_cast is okay because the sentry chunk is never mutated. Also,
// reinterpret_cast is acceptable here as it should be identical to
// SerialArenaChunk with zero payload. This is a necessary trick to
// constexpr initialize kSentryArenaChunk.
return reinterpret_cast<SerialArenaChunk*>(
const_cast<SerialArenaChunkHeader*>(&kSentryArenaChunk));
}
alignas(kCacheAlignment) ABSL_CONST_INIT
std::atomic<ThreadSafeArena::LifecycleId> ThreadSafeArena::lifecycle_id_{0};
#if defined(PROTOBUF_NO_THREADLOCAL)
ThreadSafeArena::ThreadCache& ThreadSafeArena::thread_cache() {
static internal::ThreadLocalStorage<ThreadCache>* thread_cache_ =
new internal::ThreadLocalStorage<ThreadCache>();
return *thread_cache_->Get();
}
#elif defined(PROTOBUF_USE_DLLS) && defined(_WIN32)
ThreadSafeArena::ThreadCache& ThreadSafeArena::thread_cache() {
static PROTOBUF_THREAD_LOCAL ThreadCache thread_cache;
return thread_cache;
}
#else
PROTOBUF_CONSTINIT PROTOBUF_THREAD_LOCAL
ThreadSafeArena::ThreadCache ThreadSafeArena::thread_cache_;
#endif
ThreadSafeArena::ThreadSafeArena() : first_arena_(*this) { Init(); }
ThreadSafeArena::ThreadSafeArena(char* mem, size_t size)
: first_arena_(FirstSerialArena{}, FirstBlock(mem, size), *this) {
Init();
}
ThreadSafeArena::ThreadSafeArena(void* mem, size_t size,
const AllocationPolicy& policy)
: first_arena_(FirstSerialArena{}, FirstBlock(mem, size, policy), *this) {
InitializeWithPolicy(policy);
}
ArenaBlock* ThreadSafeArena::FirstBlock(void* buf, size_t size) {
ABSL_DCHECK_EQ(reinterpret_cast<uintptr_t>(buf) & 7, 0u);
if (buf == nullptr || size <= kBlockHeaderSize) {
return SentryArenaBlock();
}
// Record user-owned block.
alloc_policy_.set_is_user_owned_initial_block(true);
return new (buf) ArenaBlock{nullptr, size};
}
ArenaBlock* ThreadSafeArena::FirstBlock(void* buf, size_t size,
const AllocationPolicy& policy) {
if (policy.IsDefault()) return FirstBlock(buf, size);
ABSL_DCHECK_EQ(reinterpret_cast<uintptr_t>(buf) & 7, 0u);
SizedPtr mem;
if (buf == nullptr || size < kBlockHeaderSize + kAllocPolicySize) {
mem = AllocateMemory(&policy, 0, kAllocPolicySize);
} else {
mem = {buf, size};
// Record user-owned block.
alloc_policy_.set_is_user_owned_initial_block(true);
}
return new (mem.p) ArenaBlock{nullptr, mem.n};
}
void ThreadSafeArena::InitializeWithPolicy(const AllocationPolicy& policy) {
Init();
if (policy.IsDefault()) return;
#ifndef NDEBUG
const uint64_t old_alloc_policy = alloc_policy_.get_raw();
// If there was a policy (e.g., in Reset()), make sure flags were preserved.
#define ABSL_DCHECK_POLICY_FLAGS_() \
if (old_alloc_policy > 3) \
ABSL_CHECK_EQ(old_alloc_policy & 3, alloc_policy_.get_raw() & 3)
#else
#define ABSL_DCHECK_POLICY_FLAGS_()
#endif // NDEBUG
// We ensured enough space so this cannot fail.
void* p;
if (!first_arena_.MaybeAllocateAligned(kAllocPolicySize, &p)) {
ABSL_LOG(FATAL) << "MaybeAllocateAligned cannot fail here.";
return;
}
new (p) AllocationPolicy{policy};
// Low bits store flags, so they mustn't be overwritten.
ABSL_DCHECK_EQ(0u, reinterpret_cast<uintptr_t>(p) & 3);
alloc_policy_.set_policy(reinterpret_cast<AllocationPolicy*>(p));
ABSL_DCHECK_POLICY_FLAGS_();
#undef ABSL_DCHECK_POLICY_FLAGS_
}
uint64_t ThreadSafeArena::GetNextLifeCycleId() {
ThreadCache& tc = thread_cache();
uint64_t id = tc.next_lifecycle_id;
constexpr uint64_t kInc = ThreadCache::kPerThreadIds;
if (PROTOBUF_PREDICT_FALSE((id & (kInc - 1)) == 0)) {
    // On platforms that don't support uint64_t atomics, we certainly cannot
    // afford to increment by large intervals and expect uniqueness due to
    // wrapping; hence we only add 1 to the global counter.
id = lifecycle_id_.fetch_add(1, std::memory_order_relaxed) * kInc;
}
tc.next_lifecycle_id = id + 1;
return id;
}
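// Illustrative sketch (comment only, not part of the build), assuming
// ThreadCache::kPerThreadIds == 256: when a thread's cached id is a multiple
// of 256 it claims a fresh batch from the global counter, e.g.
//
//   lifecycle_id_.fetch_add(1) == 7   =>   id = 7 * 256 = 1792
//
// and then hands out 1792, 1793, ..., 2047 from tc.next_lifecycle_id without
// touching the global atomic again.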
// We assume that the number of threads per arena is bimodal; i.e., most arenas
// are small and single-threaded, but some big ones are highly concurrent. To
// balance memory overhead against pointer chasing, we start with few entries
// and grow exponentially (4x) up to a limit (255 entries). Note that the
// parameters are picked for x64 architectures as a hint; the actual size is
// calculated by Layout.
ThreadSafeArena::SerialArenaChunk* ThreadSafeArena::NewSerialArenaChunk(
uint32_t prev_capacity, void* id, SerialArena* serial) {
constexpr size_t kMaxBytes = 4096; // Can hold up to 255 entries.
constexpr size_t kGrowthFactor = 4;
constexpr size_t kHeaderSize = SerialArenaChunk::AllocSize(0);
constexpr size_t kEntrySize = SerialArenaChunk::AllocSize(1) - kHeaderSize;
// On x64 arch: {4, 16, 64, 256, 256, ...} * 16.
size_t prev_bytes = SerialArenaChunk::AllocSize(prev_capacity);
size_t next_bytes = std::min(kMaxBytes, prev_bytes * kGrowthFactor);
uint32_t next_capacity =
static_cast<uint32_t>(next_bytes - kHeaderSize) / kEntrySize;
// Growth based on bytes needs to be adjusted by AllocSize.
next_bytes = SerialArenaChunk::AllocSize(next_capacity);
  // If the allocator returns more memory than requested, expand the capacity
  // to use that extra space and add the extra entries it permits.
SizedPtr mem = AllocateAtLeast(next_bytes);
next_capacity = static_cast<uint32_t>(mem.n - kHeaderSize) / kEntrySize;
ABSL_DCHECK_LE(SerialArenaChunk::AllocSize(next_capacity), mem.n);
return new (mem.p) SerialArenaChunk{next_capacity, id, serial};
}
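// Illustrative sketch (comment only, not part of the build): starting from the
// sentry chunk (capacity 0), and assuming a 16-byte header with 16 bytes per
// entry on x64, successive chunks grow roughly as
//
//   capacity   0 ->   3 entries (  64 bytes)
//   capacity   3 ->  15 entries ( 256 bytes)
//   capacity  15 ->  63 entries (1024 bytes)
//   capacity  63 -> 255 entries (4096 bytes, the cap)
//
// AllocateAtLeast may return extra space, in which case next_capacity is
// recomputed to use it.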
// Tries to reserve an entry by atomic fetch_add. If the head chunk is already
// full (size >= capacity), acquires the mutex and adds a new head.
void ThreadSafeArena::AddSerialArena(void* id, SerialArena* serial) {
SerialArenaChunk* head = head_.load(std::memory_order_acquire);
// Fast path without acquiring mutex.
if (!head->IsSentry() && head->insert(id, serial)) {
return;
}
// Slow path with acquiring mutex.
absl::MutexLock lock(&mutex_);
  // Refetch; if someone else installed a new head, try inserting into it.
SerialArenaChunk* new_head = head_.load(std::memory_order_acquire);
if (new_head != head) {
if (new_head->insert(id, serial)) return;
// Update head to link to the latest one.
head = new_head;
}
new_head = NewSerialArenaChunk(head->capacity(), id, serial);
new_head->set_next(head);
// Use "std::memory_order_release" to make sure prior stores are visible after
// this one.
head_.store(new_head, std::memory_order_release);
}
void ThreadSafeArena::Init() {
tag_and_id_ = GetNextLifeCycleId();
arena_stats_ = Sample();
head_.store(SentrySerialArenaChunk(), std::memory_order_relaxed);
first_owner_ = &thread_cache();
// Record allocation for the first block that was either user-provided or
// newly allocated.
ThreadSafeArenaStats::RecordAllocateStats(
arena_stats_.MutableStats(),
/*used=*/0,
/*allocated=*/first_arena_.SpaceAllocated(),
/*wasted=*/0);
CacheSerialArena(&first_arena_);
}
ThreadSafeArena::~ThreadSafeArena() {
// Have to do this in a first pass, because some of the destructors might
// refer to memory in other blocks.
CleanupList();
size_t space_allocated = 0;
auto mem = Free(&space_allocated);
if (alloc_policy_.is_user_owned_initial_block()) {
#ifdef ADDRESS_SANITIZER
// Unpoison the initial block, now that it's going back to the user.
ASAN_UNPOISON_MEMORY_REGION(mem.p, mem.n);
#endif // ADDRESS_SANITIZER
space_allocated += mem.n;
} else if (mem.n > 0) {
GetDeallocator(alloc_policy_.get(), &space_allocated)(mem);
}
}
SizedPtr ThreadSafeArena::Free(size_t* space_allocated) {
auto deallocator = GetDeallocator(alloc_policy_.get(), space_allocated);
WalkSerialArenaChunk([&](SerialArenaChunk* chunk) {
absl::Span<std::atomic<SerialArena*>> span = chunk->arenas();
    // Walk the arenas backward so the first serial arena is handled last.
    // Freeing in reverse order of creation may not actually be necessary for
    // Free; we should revisit this. (b/247560530)
for (auto it = span.rbegin(); it != span.rend(); ++it) {
SerialArena* serial = it->load(std::memory_order_relaxed);
ABSL_DCHECK_NE(serial, nullptr);
// Free string blocks
*space_allocated += serial->FreeStringBlocks();
// Always frees the first block of "serial" as it cannot be user-provided.
SizedPtr mem = serial->Free(deallocator);
ABSL_DCHECK_NE(mem.p, nullptr);
deallocator(mem);
}
// Delete the chunk as we're done with it.
internal::SizedDelete(chunk,
SerialArenaChunk::AllocSize(chunk->capacity()));
});
  // The first block of the first arena is special; let the caller handle it.
*space_allocated += first_arena_.FreeStringBlocks();
return first_arena_.Free(deallocator);
}
uint64_t ThreadSafeArena::Reset() {
// Have to do this in a first pass, because some of the destructors might
// refer to memory in other blocks.
CleanupList();
// Discard all blocks except the first one. Whether it is user-provided or
// allocated, always reuse the first block for the first arena.
size_t space_allocated = 0;
auto mem = Free(&space_allocated);
space_allocated += mem.n;
  // Reset the first arena with the first block. This avoids a redundant
  // free / allocation and re-allocating the AllocationPolicy. Adjust the offset
  // if we need to preserve alloc_policy_.
if (alloc_policy_.is_user_owned_initial_block() ||
alloc_policy_.get() != nullptr) {
size_t offset = alloc_policy_.get() == nullptr
? kBlockHeaderSize
: kBlockHeaderSize + kAllocPolicySize;
first_arena_.Init(new (mem.p) ArenaBlock{nullptr, mem.n}, offset);
} else {
first_arena_.Init(SentryArenaBlock(), 0);
}
  // Since the first block (and any alloc_policy_ stored in it) is preserved,
  // the rest can be reinitialized by Init().
Init();
return space_allocated;
}
void* ThreadSafeArena::AllocateAlignedWithCleanup(size_t n, size_t align,
void (*destructor)(void*)) {
SerialArena* arena;
if (PROTOBUF_PREDICT_TRUE(GetSerialArenaFast(&arena))) {
return arena->AllocateAlignedWithCleanup(n, align, destructor);
} else {
return AllocateAlignedWithCleanupFallback(n, align, destructor);
}
}
void ThreadSafeArena::AddCleanup(void* elem, void (*cleanup)(void*)) {
GetSerialArena()->AddCleanup(elem, cleanup);
}
SerialArena* ThreadSafeArena::GetSerialArena() {
SerialArena* arena;
if (PROTOBUF_PREDICT_FALSE(!GetSerialArenaFast(&arena))) {
arena = GetSerialArenaFallback(kMaxCleanupNodeSize);
}
return arena;
}
PROTOBUF_NOINLINE
void* ThreadSafeArena::AllocateAlignedWithCleanupFallback(
size_t n, size_t align, void (*destructor)(void*)) {
return GetSerialArenaFallback(n + kMaxCleanupNodeSize)
->AllocateAlignedWithCleanup(n, align, destructor);
}
PROTOBUF_NOINLINE
void* ThreadSafeArena::AllocateFromStringBlock() {
return GetSerialArena()->AllocateFromStringBlock();
}
template <typename Functor>
void ThreadSafeArena::WalkConstSerialArenaChunk(Functor fn) const {
const SerialArenaChunk* chunk = head_.load(std::memory_order_acquire);
for (; !chunk->IsSentry(); chunk = chunk->next_chunk()) {
fn(chunk);
}
}
template <typename Functor>
void ThreadSafeArena::WalkSerialArenaChunk(Functor fn) {
  // By omitting an acquire barrier we help the sanitizer: any user code that
  // doesn't properly synchronize Reset() or the destructor will trigger a
  // TSAN warning.
SerialArenaChunk* chunk = head_.load(std::memory_order_relaxed);
while (!chunk->IsSentry()) {
// Cache next chunk in case this chunk is destroyed.
SerialArenaChunk* next_chunk = chunk->next_chunk();
fn(chunk);
chunk = next_chunk;
}
}
template <typename Functor>
void ThreadSafeArena::PerConstSerialArenaInChunk(Functor fn) const {
WalkConstSerialArenaChunk([&fn](const SerialArenaChunk* chunk) {
for (const auto& each : chunk->arenas()) {
const SerialArena* serial = each.load(std::memory_order_acquire);
      // It is possible that a newly added SerialArena has not been published
      // yet even though the size already was. This is acceptable for
      // SpaceAllocated and SpaceUsed.
if (serial == nullptr) continue;
fn(serial);
}
});
}
uint64_t ThreadSafeArena::SpaceAllocated() const {
uint64_t space_allocated = first_arena_.SpaceAllocated();
PerConstSerialArenaInChunk([&space_allocated](const SerialArena* serial) {
space_allocated += serial->SpaceAllocated();
});
return space_allocated;
}
uint64_t ThreadSafeArena::SpaceUsed() const {
  // The first arena is inlined into ThreadSafeArena, so the first block's
  // overhead is smaller than that of other blocks, which embed a SerialArena.
uint64_t space_used = first_arena_.SpaceUsed();
PerConstSerialArenaInChunk([&space_used](const SerialArena* serial) {
    // SerialArenas on chunks are allocated directly from their block and need
    // to be subtracted from SpaceUsed.
space_used += serial->SpaceUsed() - kSerialArenaSize;
});
return space_used - (alloc_policy_.get() ? sizeof(AllocationPolicy) : 0);
}
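// Illustrative sketch (comment only, not part of the build): if first_arena_
// reports 1000 bytes used and two chunk-hosted SerialArenas report 500 bytes
// each, SpaceUsed() returns roughly
//   1000 + (500 - kSerialArenaSize) * 2 - sizeof(AllocationPolicy)
// where the last term applies only when a non-default policy was stored in
// the first block.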
template <AllocationClient alloc_client>
PROTOBUF_NOINLINE void* ThreadSafeArena::AllocateAlignedFallback(size_t n) {
return GetSerialArenaFallback(n)->AllocateAligned<alloc_client>(n);
}
template void* ThreadSafeArena::AllocateAlignedFallback<
AllocationClient::kDefault>(size_t);
template void*
ThreadSafeArena::AllocateAlignedFallback<AllocationClient::kArray>(size_t);
void ThreadSafeArena::CleanupList() {
WalkSerialArenaChunk([](SerialArenaChunk* chunk) {
absl::Span<std::atomic<SerialArena*>> span = chunk->arenas();
    // Walk the arenas backward so the first serial arena is handled last.
    // Destroying in reverse order of construction is often assumed by users and
    // is required to avoid breaking inter-object dependencies. (b/247560530)
for (auto it = span.rbegin(); it != span.rend(); ++it) {
SerialArena* serial = it->load(std::memory_order_relaxed);
ABSL_DCHECK_NE(serial, nullptr);
serial->CleanupList();
}
});
// First arena must be cleaned up last. (b/247560530)
first_arena_.CleanupList();
}
PROTOBUF_NOINLINE
SerialArena* ThreadSafeArena::GetSerialArenaFallback(size_t n) {
void* const id = &thread_cache();
if (id == first_owner_) {
CacheSerialArena(&first_arena_);
return &first_arena_;
}
// Search matching SerialArena.
SerialArena* serial = nullptr;
WalkConstSerialArenaChunk([&serial, id](const SerialArenaChunk* chunk) {
absl::Span<const std::atomic<void*>> ids = chunk->ids();
for (uint32_t i = 0; i < ids.size(); ++i) {
if (ids[i].load(std::memory_order_relaxed) == id) {
serial = chunk->arena(i).load(std::memory_order_relaxed);
ABSL_DCHECK_NE(serial, nullptr);
break;
}
}
});
if (!serial) {
// This thread doesn't have any SerialArena, which also means it doesn't
// have any blocks yet. So we'll allocate its first block now. It must be
// big enough to host SerialArena and the pending request.
serial = SerialArena::New(
AllocateMemory(alloc_policy_.get(), 0, n + kSerialArenaSize), *this);
AddSerialArena(id, serial);
}
CacheSerialArena(serial);
return serial;
}
} // namespace internal
void* Arena::Allocate(size_t n) { return impl_.AllocateAligned(n); }
void* Arena::AllocateForArray(size_t n) {
return impl_.AllocateAligned<internal::AllocationClient::kArray>(n);
}
void* Arena::AllocateAlignedWithCleanup(size_t n, size_t align,
void (*destructor)(void*)) {
return impl_.AllocateAlignedWithCleanup(n, align, destructor);
}
std::vector<void*> Arena::PeekCleanupListForTesting() {
return impl_.PeekCleanupListForTesting();
}
} // namespace protobuf
} // namespace google
#include "google/protobuf/port_undef.inc"