| // |
| // Copyright 2020 The Abseil Authors. |
| // |
| // Licensed under the Apache License, Version 2.0 (the "License"); |
| // you may not use this file except in compliance with the License. |
| // You may obtain a copy of the License at |
| // |
| // https://www.apache.org/licenses/LICENSE-2.0 |
| // |
| // Unless required by applicable law or agreed to in writing, software |
| // distributed under the License is distributed on an "AS IS" BASIS, |
| // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| // See the License for the specific language governing permissions and |
| // limitations under the License. |
| |
| #ifndef ABSL_FLAGS_INTERNAL_SEQUENCE_LOCK_H_ |
| #define ABSL_FLAGS_INTERNAL_SEQUENCE_LOCK_H_ |
| |
| #include <stddef.h> |
| #include <stdint.h> |
| |
| #include <atomic> |
| #include <cassert> |
| #include <cstring> |
| |
| #include "absl/base/optimization.h" |
| |
| namespace absl { |
| ABSL_NAMESPACE_BEGIN |
| namespace flags_internal { |
| |
// Align 'x' up to the nearest multiple of 'align' bytes.
| inline constexpr size_t AlignUp(size_t x, size_t align) { |
| return align * ((x + align - 1) / align); |
| } |
| |
| // A SequenceLock implements lock-free reads. A sequence counter is incremented |
| // before and after each write, and readers access the counter before and after |
| // accessing the protected data. If the counter is verified to not change during |
| // the access, and the sequence counter value was even, then the reader knows |
| // that the read was race-free and valid. Otherwise, the reader must fall back |
| // to a Mutex-based code path. |
| // |
| // This particular SequenceLock starts in an "uninitialized" state in which |
| // TryRead() returns false. It must be enabled by calling MarkInitialized(). |
// The uninitialized state serves as a marker that the associated flag value
// has not yet been initialized, so a slow path needs to be taken.
| // |
| // The memory reads and writes protected by this lock must use the provided |
| // `TryRead()` and `Write()` functions. These functions behave similarly to |
| // `memcpy()`, with one oddity: the protected data must be an array of |
// `std::atomic<uint64_t>`. This is to comply with the C++ standard, which
| // considers data races on non-atomic objects to be undefined behavior. See "Can |
| // Seqlocks Get Along With Programming Language Memory Models?"[1] by Hans J. |
| // Boehm for more details. |
| // |
| // [1] https://www.hpl.hp.com/techreports/2012/HPL-2012-68.pdf |
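//
// An illustrative usage sketch (not taken from this header; the two-word
// payload and the mutex-based fallback are assumptions made for the example):
//
//   SequenceLock seq_lock;
//   std::atomic<uint64_t> data[2];  // protected payload, in 64-bit words
//   seq_lock.MarkInitialized();
//
//   // Writer side (must be externally synchronized against other writers):
//   uint64_t new_value[2] = {1, 2};
//   seq_lock.Write(data, new_value, sizeof(new_value));
//
//   // Reader side:
//   uint64_t buf[2];
//   if (!seq_lock.TryRead(buf, data, sizeof(buf))) {
//     // Raced with a concurrent Write() (or the lock is uninitialized);
//     // fall back to a mutex-protected read.
//   }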
| class SequenceLock { |
| public: |
| constexpr SequenceLock() : lock_(kUninitialized) {} |
| |
| // Mark that this lock is ready for use. |
| void MarkInitialized() { |
| assert(lock_.load(std::memory_order_relaxed) == kUninitialized); |
| lock_.store(0, std::memory_order_release); |
| } |
| |
| // Copy "size" bytes of data from "src" to "dst", protected as a read-side |
| // critical section of the sequence lock. |
| // |
  // Unlike traditional sequence lock implementations, which loop until they
  // get a clean read, this implementation returns false if it races with a
  // concurrent call to `Write`. In that case, the caller should fall back
  // to a locking-based slow path.
| // |
| // Returns false if the sequence lock was not yet marked as initialized. |
| // |
| // NOTE: If this returns false, "dst" may be overwritten with undefined |
| // (potentially uninitialized) data. |
| bool TryRead(void* dst, const std::atomic<uint64_t>* src, size_t size) const { |
    // The acquire load ensures that no loads done by RelaxedCopyFromAtomic()
    // below are reordered above this first load of the sequence counter.
| int64_t seq_before = lock_.load(std::memory_order_acquire); |
    if (ABSL_PREDICT_FALSE((seq_before & 1) == 1)) return false;
| RelaxedCopyFromAtomic(dst, src, size); |
    // Another acquire fence ensures that the load of 'lock_' below is
    // strictly ordered after the RelaxedCopyFromAtomic() call above.
| std::atomic_thread_fence(std::memory_order_acquire); |
| int64_t seq_after = lock_.load(std::memory_order_relaxed); |
| return ABSL_PREDICT_TRUE(seq_before == seq_after); |
| } |
| |
| // Copy "size" bytes from "src" to "dst" as a write-side critical section |
  // of the sequence lock. Readers that run concurrently with this write will
  // observe the sequence counter change (or an odd value), so their TryRead()
  // calls will return false and they must fall back to the locking slow path.
| // |
| // This call must be externally synchronized against other calls to Write, |
| // but may proceed concurrently with reads. |
| void Write(std::atomic<uint64_t>* dst, const void* src, size_t size) { |
    // We can use relaxed operations to increment the counter since we are
    // externally synchronized. The std::atomic_thread_fence below ensures
    // that the counter updates don't get interleaved with the copy to the
    // data.
| int64_t orig_seq = lock_.load(std::memory_order_relaxed); |
| assert((orig_seq & 1) == 0); // Must be initially unlocked. |
| lock_.store(orig_seq + 1, std::memory_order_relaxed); |
| |
    // We put a release fence between the update to lock_ and the writes to
    // shared data. Thus all stores to the shared data are effectively release
    // operations, and the update to lock_ above cannot be reordered past any
    // of them. Note that this fence is not for the counter store above; a
    // release barrier for that store would have to be placed before it, not
    // after it.
| std::atomic_thread_fence(std::memory_order_release); |
| RelaxedCopyToAtomic(dst, src, size); |
| // "Release" semantics ensure that none of the writes done by |
| // RelaxedCopyToAtomic() can be reordered after the following modification. |
| lock_.store(orig_seq + 2, std::memory_order_release); |
| } |
| |
  // Return the number of times the protected data has been modified (the
  // number of calls to Write() or IncrementModificationCount()).
| // |
| // REQUIRES: This must be externally synchronized against concurrent calls to |
| // `Write()` or `IncrementModificationCount()`. |
| // REQUIRES: `MarkInitialized()` must have been previously called. |
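  //
  // For example, immediately after MarkInitialized() this returns 0, and
  // after a single call to Write() it returns 1.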
| int64_t ModificationCount() const { |
| int64_t val = lock_.load(std::memory_order_relaxed); |
| assert(val != kUninitialized && (val & 1) == 0); |
| return val / 2; |
| } |
| |
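  // Increment the modification count (as reported by ModificationCount())
  // without modifying the protected data.
  //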
| // REQUIRES: This must be externally synchronized against concurrent calls to |
| // `Write()` or `ModificationCount()`. |
| // REQUIRES: `MarkInitialized()` must have been previously called. |
| void IncrementModificationCount() { |
| int64_t val = lock_.load(std::memory_order_relaxed); |
| assert(val != kUninitialized); |
| lock_.store(val + 2, std::memory_order_relaxed); |
| } |
| |
| private: |
  // Perform the equivalent of "memcpy(dst, src, size)", but using relaxed
  // atomic loads of the source words.
| static void RelaxedCopyFromAtomic(void* dst, const std::atomic<uint64_t>* src, |
| size_t size) { |
| char* dst_byte = static_cast<char*>(dst); |
| while (size >= sizeof(uint64_t)) { |
| uint64_t word = src->load(std::memory_order_relaxed); |
| std::memcpy(dst_byte, &word, sizeof(word)); |
| dst_byte += sizeof(word); |
| src++; |
| size -= sizeof(word); |
| } |
| if (size > 0) { |
| uint64_t word = src->load(std::memory_order_relaxed); |
| std::memcpy(dst_byte, &word, size); |
| } |
| } |
| |
  // Perform the equivalent of "memcpy(dst, src, size)", but using relaxed
  // atomic stores to the destination words.
| static void RelaxedCopyToAtomic(std::atomic<uint64_t>* dst, const void* src, |
| size_t size) { |
| const char* src_byte = static_cast<const char*>(src); |
| while (size >= sizeof(uint64_t)) { |
| uint64_t word; |
| std::memcpy(&word, src_byte, sizeof(word)); |
| dst->store(word, std::memory_order_relaxed); |
| src_byte += sizeof(word); |
| dst++; |
| size -= sizeof(word); |
| } |
| if (size > 0) { |
| uint64_t word = 0; |
| std::memcpy(&word, src_byte, size); |
| dst->store(word, std::memory_order_relaxed); |
| } |
| } |
| |
| static constexpr int64_t kUninitialized = -1; |
| std::atomic<int64_t> lock_; |
| }; |
| |
| } // namespace flags_internal |
| ABSL_NAMESPACE_END |
| } // namespace absl |
| |
| #endif // ABSL_FLAGS_INTERNAL_SEQUENCE_LOCK_H_ |