| /* |
| * Copyright (C) 2008 The Android Open Source Project |
| * |
| * Licensed under the Apache License, Version 2.0 (the "License"); |
| * you may not use this file except in compliance with the License. |
| * You may obtain a copy of the License at |
| * |
| * http://www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, software |
| * distributed under the License is distributed on an "AS IS" BASIS, |
| * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| * See the License for the specific language governing permissions and |
| * limitations under the License. |
| */ |
| |
| #ifndef ART_RUNTIME_ATOMIC_H_ |
| #define ART_RUNTIME_ATOMIC_H_ |
| |
| #ifdef __clang__ |
| #define ART_HAVE_STDATOMIC 1 |
| #endif |
| |
| #include <stdint.h> |
| #if ART_HAVE_STDATOMIC |
| #include <atomic> |
| #endif |
| #include <limits> |
| #include <vector> |
| |
| #include "base/logging.h" |
| #include "base/macros.h" |
| |
| namespace art { |
| |
| class Mutex; |
| |
| #if ART_HAVE_STDATOMIC |
| template<typename T> |
| class Atomic : public std::atomic<T> { |
| public: |
| COMPILE_ASSERT(sizeof(T) == sizeof(std::atomic<T>), |
| std_atomic_size_differs_from_that_of_underlying_type); |
| COMPILE_ASSERT(alignof(T) == alignof(std::atomic<T>), |
| std_atomic_alignment_differs_from_that_of_underlying_type); |
| |
| Atomic<T>() : std::atomic<T>() { } |
| |
| explicit Atomic<T>(T value) : std::atomic<T>(value) { } |
| |
| // Load from memory without ordering or synchronization constraints. |
| T LoadRelaxed() const { |
| return this->load(std::memory_order_relaxed); |
| } |
| |
| // Load from memory with a total ordering. |
| T LoadSequentiallyConsistent() const { |
| return this->load(std::memory_order_seq_cst); |
| } |
| |
| // Store to memory without ordering or synchronization constraints. |
| void StoreRelaxed(T desired) { |
| this->store(desired, std::memory_order_relaxed); |
| } |
| |
| // Store to memory with a total ordering. |
| void StoreSequentiallyConsistent(T desired) { |
| this->store(desired, std::memory_order_seq_cst); |
| } |
| |
| // Atomically replace the value with desired value if it matches the expected value. Doesn't |
| // imply ordering or synchronization constraints. |
| bool CompareExchangeWeakRelaxed(T expected_value, T desired_value) { |
| return this->compare_exchange_weak(expected_value, desired_value, std::memory_order_relaxed); |
| } |
| |
| // Atomically replace the value with desired value if it matches the expected value. Prior writes |
| // made to other memory locations by the thread that did the release become visible in this |
| // thread. |
| bool CompareExchangeWeakAcquire(T expected_value, T desired_value) { |
| return this->compare_exchange_weak(expected_value, desired_value, std::memory_order_acquire); |
| } |
| |
| // Atomically replace the value with desired value if it matches the expected value. prior writes |
| // to other memory locations become visible to the threads that do a consume or an acquire on the |
| // same location. |
| bool CompareExchangeWeakRelease(T expected_value, T desired_value) { |
| return this->compare_exchange_weak(expected_value, desired_value, std::memory_order_release); |
| } |
| |
| T FetchAndAddSequentiallyConsistent(const T value) { |
| return this->fetch_add(value, std::memory_order_seq_cst); // Return old_value. |
| } |
| |
| T FetchAndSubSequentiallyConsistent(const T value) { |
| return this->fetch_sub(value, std::memory_order_seq_cst); // Return old value. |
| } |
| |
| volatile T* Address() { |
| return reinterpret_cast<T*>(this); |
| } |
| |
| static T MaxValue() { |
| return std::numeric_limits<T>::max(); |
| } |
| }; |
| #else |
| template<typename T> |
| class Atomic { |
| public: |
| Atomic<T>() : value_(0) { } |
| |
| explicit Atomic<T>(T value) : value_(value) { } |
| |
| // Load from memory without ordering or synchronization constraints. |
| T LoadRelaxed() const { |
| return value_; |
| } |
| |
| // Load from memory with a total ordering. |
| T LoadSequentiallyConsistent() const; |
| |
| // Store to memory without ordering or synchronization constraints. |
| void StoreRelaxed(T desired) { |
| value_ = desired; |
| } |
| |
| // Store to memory with a total ordering. |
| void StoreSequentiallyConsistent(T desired); |
| |
| // Atomically replace the value with desired value if it matches the expected value. Doesn't |
| // imply ordering or synchronization constraints. |
| bool CompareExchangeWeakRelaxed(T expected_value, T desired_value) { |
| // TODO: make this relaxed. |
| return __sync_bool_compare_and_swap(&value_, expected_value, desired_value); |
| } |
| |
| // Atomically replace the value with desired value if it matches the expected value. Prior writes |
| // made to other memory locations by the thread that did the release become visible in this |
| // thread. |
| bool CompareExchangeWeakAcquire(T expected_value, T desired_value) { |
| // TODO: make this acquire. |
| return __sync_bool_compare_and_swap(&value_, expected_value, desired_value); |
| } |
| |
| // Atomically replace the value with desired value if it matches the expected value. prior writes |
| // to other memory locations become visible to the threads that do a consume or an acquire on the |
| // same location. |
| bool CompareExchangeWeakRelease(T expected_value, T desired_value) { |
| // TODO: make this release. |
| return __sync_bool_compare_and_swap(&value_, expected_value, desired_value); |
| } |
| |
| volatile T* Address() { |
| return &value_; |
| } |
| |
| T FetchAndAddSequentiallyConsistent(const T value) { |
| return __sync_fetch_and_add(&value_, value); // Return old_value. |
| } |
| |
| T FetchAndSubSequentiallyConsistent(const T value) { |
| return __sync_fetch_and_sub(&value_, value); // Return old value. |
| } |
| |
| T operator++() { // Prefix operator. |
| return __sync_add_and_fetch(&value_, 1); // Return new value. |
| } |
| |
| T operator++(int) { // Postfix operator. |
| return __sync_fetch_and_add(&value_, 1); // Return old value. |
| } |
| |
| T operator--() { // Prefix operator. |
| return __sync_sub_and_fetch(&value_, 1); // Return new value. |
| } |
| |
| T operator--(int) { // Postfix operator. |
| return __sync_fetch_and_sub(&value_, 1); // Return old value. |
| } |
| |
| static T MaxValue() { |
| return std::numeric_limits<T>::max(); |
| } |
| |
| private: |
| T value_; |
| }; |
| #endif |
| |
| typedef Atomic<int32_t> AtomicInteger; |
| |
| // NOTE: Two "quasiatomic" operations on the exact same memory address |
| // are guaranteed to operate atomically with respect to each other, |
| // but no guarantees are made about quasiatomic operations mixed with |
| // non-quasiatomic operations on the same address, nor about |
| // quasiatomic operations that are performed on partially-overlapping |
| // memory. |
| class QuasiAtomic { |
| #if defined(__mips__) && !defined(__LP64__) |
| static constexpr bool kNeedSwapMutexes = true; |
| #else |
| static constexpr bool kNeedSwapMutexes = false; |
| #endif |
| |
| public: |
| static void Startup(); |
| |
| static void Shutdown(); |
| |
| // Reads the 64-bit value at "addr" without tearing. |
| static int64_t Read64(volatile const int64_t* addr) { |
| if (!kNeedSwapMutexes) { |
| int64_t value; |
| #if defined(__LP64__) |
| value = *addr; |
| #else |
| #if defined(__arm__) |
| #if defined(__ARM_FEATURE_LPAE) |
| // With LPAE support (such as Cortex-A15) then ldrd is defined not to tear. |
| __asm__ __volatile__("@ QuasiAtomic::Read64\n" |
| "ldrd %0, %H0, %1" |
| : "=r" (value) |
| : "m" (*addr)); |
| #else |
| // Exclusive loads are defined not to tear, clearing the exclusive state isn't necessary. |
| __asm__ __volatile__("@ QuasiAtomic::Read64\n" |
| "ldrexd %0, %H0, %1" |
| : "=r" (value) |
| : "Q" (*addr)); |
| #endif |
| #elif defined(__i386__) |
| __asm__ __volatile__( |
| "movq %1, %0\n" |
| : "=x" (value) |
| : "m" (*addr)); |
| #else |
| LOG(FATAL) << "Unsupported architecture"; |
| #endif |
| #endif // defined(__LP64__) |
| return value; |
| } else { |
| return SwapMutexRead64(addr); |
| } |
| } |
| |
| // Writes to the 64-bit value at "addr" without tearing. |
| static void Write64(volatile int64_t* addr, int64_t value) { |
| if (!kNeedSwapMutexes) { |
| #if defined(__LP64__) |
| *addr = value; |
| #else |
| #if defined(__arm__) |
| #if defined(__ARM_FEATURE_LPAE) |
| // If we know that ARM architecture has LPAE (such as Cortex-A15) strd is defined not to tear. |
| __asm__ __volatile__("@ QuasiAtomic::Write64\n" |
| "strd %1, %H1, %0" |
| : "=m"(*addr) |
| : "r" (value)); |
| #else |
| // The write is done as a swap so that the cache-line is in the exclusive state for the store. |
| int64_t prev; |
| int status; |
| do { |
| __asm__ __volatile__("@ QuasiAtomic::Write64\n" |
| "ldrexd %0, %H0, %2\n" |
| "strexd %1, %3, %H3, %2" |
| : "=&r" (prev), "=&r" (status), "+Q"(*addr) |
| : "r" (value) |
| : "cc"); |
| } while (UNLIKELY(status != 0)); |
| #endif |
| #elif defined(__i386__) |
| __asm__ __volatile__( |
| "movq %1, %0" |
| : "=m" (*addr) |
| : "x" (value)); |
| #else |
| LOG(FATAL) << "Unsupported architecture"; |
| #endif |
| #endif // defined(__LP64__) |
| } else { |
| SwapMutexWrite64(addr, value); |
| } |
| } |
| |
| // Atomically compare the value at "addr" to "old_value", if equal replace it with "new_value" |
| // and return true. Otherwise, don't swap, and return false. |
| static bool Cas64(int64_t old_value, int64_t new_value, volatile int64_t* addr) { |
| if (!kNeedSwapMutexes) { |
| return __sync_bool_compare_and_swap(addr, old_value, new_value); |
| } else { |
| return SwapMutexCas64(old_value, new_value, addr); |
| } |
| } |
| |
| // Does the architecture provide reasonable atomic long operations or do we fall back on mutexes? |
| static bool LongAtomicsUseMutexes() { |
| return kNeedSwapMutexes; |
| } |
| |
| static void MembarLoadStore() { |
| #if defined(__arm__) || defined(__aarch64__) |
| __asm__ __volatile__("dmb ish" : : : "memory"); |
| #elif defined(__i386__) || defined(__x86_64__) |
| __asm__ __volatile__("" : : : "memory"); |
| #elif defined(__mips__) |
| __asm__ __volatile__("sync" : : : "memory"); |
| #else |
| #error Unexpected architecture |
| #endif |
| } |
| |
| static void MembarLoadLoad() { |
| #if defined(__arm__) || defined(__aarch64__) |
| __asm__ __volatile__("dmb ish" : : : "memory"); |
| #elif defined(__i386__) || defined(__x86_64__) |
| __asm__ __volatile__("" : : : "memory"); |
| #elif defined(__mips__) |
| __asm__ __volatile__("sync" : : : "memory"); |
| #else |
| #error Unexpected architecture |
| #endif |
| } |
| |
| static void MembarStoreStore() { |
| #if defined(__arm__) || defined(__aarch64__) |
| __asm__ __volatile__("dmb ishst" : : : "memory"); |
| #elif defined(__i386__) || defined(__x86_64__) |
| __asm__ __volatile__("" : : : "memory"); |
| #elif defined(__mips__) |
| __asm__ __volatile__("sync" : : : "memory"); |
| #else |
| #error Unexpected architecture |
| #endif |
| } |
| |
| static void MembarStoreLoad() { |
| #if defined(__arm__) || defined(__aarch64__) |
| __asm__ __volatile__("dmb ish" : : : "memory"); |
| #elif defined(__i386__) || defined(__x86_64__) |
| __asm__ __volatile__("mfence" : : : "memory"); |
| #elif defined(__mips__) |
| __asm__ __volatile__("sync" : : : "memory"); |
| #else |
| #error Unexpected architecture |
| #endif |
| } |
| |
| private: |
| static Mutex* GetSwapMutex(const volatile int64_t* addr); |
| static int64_t SwapMutexRead64(volatile const int64_t* addr); |
| static void SwapMutexWrite64(volatile int64_t* addr, int64_t val); |
| static bool SwapMutexCas64(int64_t old_value, int64_t new_value, volatile int64_t* addr); |
| |
| // We stripe across a bunch of different mutexes to reduce contention. |
| static constexpr size_t kSwapMutexCount = 32; |
| static std::vector<Mutex*>* gSwapMutexes; |
| |
| DISALLOW_COPY_AND_ASSIGN(QuasiAtomic); |
| }; |
| |
| #if !ART_HAVE_STDATOMIC |
| template<typename T> |
| inline T Atomic<T>::LoadSequentiallyConsistent() const { |
| T result = value_; |
| QuasiAtomic::MembarLoadLoad(); |
| return result; |
| } |
| |
| template<typename T> |
| inline void Atomic<T>::StoreSequentiallyConsistent(T desired) { |
| QuasiAtomic::MembarStoreStore(); |
| value_ = desired; |
| QuasiAtomic::MembarStoreLoad(); |
| } |
| |
| #endif |
| |
| } // namespace art |
| |
| #endif // ART_RUNTIME_ATOMIC_H_ |