mirror of
https://github.com/beefytech/Beef.git
synced 2025-07-01 13:56:00 +02:00
412 lines
12 KiB
C
412 lines
12 KiB
C
![]() |
// Copyright (c) 2011, Google Inc.
|
||
|
// All rights reserved.
|
||
|
//
|
||
|
// Redistribution and use in source and binary forms, with or without
|
||
|
// modification, are permitted provided that the following conditions are
|
||
|
// met:
|
||
|
//
|
||
|
// * Redistributions of source code must retain the above copyright
|
||
|
// notice, this list of conditions and the following disclaimer.
|
||
|
// * Redistributions in binary form must reproduce the above
|
||
|
// copyright notice, this list of conditions and the following disclaimer
|
||
|
// in the documentation and/or other materials provided with the
|
||
|
// distribution.
|
||
|
// * Neither the name of Google Inc. nor the names of its
|
||
|
// contributors may be used to endorse or promote products derived from
|
||
|
// this software without specific prior written permission.
|
||
|
//
|
||
|
// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
|
||
|
// "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
|
||
|
// LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
|
||
|
// A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
|
||
|
// OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
|
||
|
// SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
|
||
|
// LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
|
||
|
// DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
|
||
|
// THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
|
||
|
// (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
|
||
|
// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
||
|
// ---
|
||
|
//
|
||
|
// Author: Sasha Levitskiy
|
||
|
// based on atomicops-internals by Sanjay Ghemawat
|
||
|
//
|
||
|
// This file is an internal atomic implementation, use base/atomicops.h instead.
|
||
|
//
|
||
|
// This code implements ARM atomics for architectures V6 and newer.
|
||
|
|
||
|
#ifndef BASE_ATOMICOPS_INTERNALS_ARM_V6PLUS_H_
|
||
|
#define BASE_ATOMICOPS_INTERNALS_ARM_V6PLUS_H_
|
||
|
|
||
|
#include <stdio.h>
|
||
|
#include <stdlib.h>
|
||
|
#include "base/basictypes.h" // For COMPILE_ASSERT
|
||
|
|
||
|
// The LDREXD and STREXD instructions in ARM all v7 variants or above. In v6,
|
||
|
// only some variants support it. For simplicity, we only use exclusive
|
||
|
// 64-bit load/store in V7 or above.
|
||
|
#if defined(ARMV7)
|
||
|
# define BASE_ATOMICOPS_HAS_LDREXD_AND_STREXD
|
||
|
#endif
|
||
|
|
||
|
typedef int32_t Atomic32;
|
||
|
|
||
|
namespace base {
|
||
|
namespace subtle {
|
||
|
|
||
|
typedef int64_t Atomic64;
|
||
|
|
||
|
// 32-bit low-level ops
|
||
|
|
||
|
inline Atomic32 NoBarrier_CompareAndSwap(volatile Atomic32* ptr,
|
||
|
Atomic32 old_value,
|
||
|
Atomic32 new_value) {
|
||
|
Atomic32 oldval, res;
|
||
|
do {
|
||
|
__asm__ __volatile__(
|
||
|
"ldrex %1, [%3]\n"
|
||
|
"mov %0, #0\n"
|
||
|
"teq %1, %4\n"
|
||
|
// The following IT (if-then) instruction is needed for the subsequent
|
||
|
// conditional instruction STREXEQ when compiling in THUMB mode.
|
||
|
// In ARM mode, the compiler/assembler will not generate any code for it.
|
||
|
"it eq\n"
|
||
|
"strexeq %0, %5, [%3]\n"
|
||
|
: "=&r" (res), "=&r" (oldval), "+Qo" (*ptr)
|
||
|
: "r" (ptr), "Ir" (old_value), "r" (new_value)
|
||
|
: "cc");
|
||
|
} while (res);
|
||
|
return oldval;
|
||
|
}
|
||
|
|
||
|
inline Atomic32 NoBarrier_AtomicExchange(volatile Atomic32* ptr,
|
||
|
Atomic32 new_value) {
|
||
|
Atomic32 tmp, old;
|
||
|
__asm__ __volatile__(
|
||
|
"1:\n"
|
||
|
"ldrex %1, [%2]\n"
|
||
|
"strex %0, %3, [%2]\n"
|
||
|
"teq %0, #0\n"
|
||
|
"bne 1b"
|
||
|
: "=&r" (tmp), "=&r" (old)
|
||
|
: "r" (ptr), "r" (new_value)
|
||
|
: "cc", "memory");
|
||
|
return old;
|
||
|
}
|
||
|
|
||
|
inline void MemoryBarrier() {
|
||
|
#if defined(__ARM_ARCH_6__) || defined(__ARM_ARCH_6J__) || defined(__ARM_ARCH_6K__) || defined(__ARM_ARCH_6Z__) || defined(__ARM_ARCH_6KZ__) || defined(__ARM_ARCH_6T2__)
|
||
|
uint32_t dest = 0;
|
||
|
__asm__ __volatile__("mcr p15,0,%0,c7,c10,5" :"=&r"(dest) : : "memory");
|
||
|
#else
|
||
|
__asm__ __volatile__("dmb" : : : "memory");
|
||
|
#endif
|
||
|
}
|
||
|
|
||
|
inline Atomic32 Acquire_AtomicExchange(volatile Atomic32* ptr,
|
||
|
Atomic32 new_value) {
|
||
|
Atomic32 old_value = NoBarrier_AtomicExchange(ptr, new_value);
|
||
|
MemoryBarrier();
|
||
|
return old_value;
|
||
|
}
|
||
|
|
||
|
inline Atomic32 Release_AtomicExchange(volatile Atomic32* ptr,
|
||
|
Atomic32 new_value) {
|
||
|
MemoryBarrier();
|
||
|
return NoBarrier_AtomicExchange(ptr, new_value);
|
||
|
}
|
||
|
|
||
|
inline Atomic32 NoBarrier_AtomicIncrement(volatile Atomic32* ptr,
|
||
|
Atomic32 increment) {
|
||
|
Atomic32 tmp, res;
|
||
|
__asm__ __volatile__(
|
||
|
"1:\n"
|
||
|
"ldrex %1, [%2]\n"
|
||
|
"add %1, %1, %3\n"
|
||
|
"strex %0, %1, [%2]\n"
|
||
|
"teq %0, #0\n"
|
||
|
"bne 1b"
|
||
|
: "=&r" (tmp), "=&r"(res)
|
||
|
: "r" (ptr), "r"(increment)
|
||
|
: "cc", "memory");
|
||
|
return res;
|
||
|
}
|
||
|
|
||
|
inline Atomic32 Barrier_AtomicIncrement(volatile Atomic32* ptr,
|
||
|
Atomic32 increment) {
|
||
|
Atomic32 tmp, res;
|
||
|
__asm__ __volatile__(
|
||
|
"1:\n"
|
||
|
"ldrex %1, [%2]\n"
|
||
|
"add %1, %1, %3\n"
|
||
|
"dmb\n"
|
||
|
"strex %0, %1, [%2]\n"
|
||
|
"teq %0, #0\n"
|
||
|
"bne 1b"
|
||
|
: "=&r" (tmp), "=&r"(res)
|
||
|
: "r" (ptr), "r"(increment)
|
||
|
: "cc", "memory");
|
||
|
return res;
|
||
|
}
|
||
|
|
||
|
inline Atomic32 Acquire_CompareAndSwap(volatile Atomic32* ptr,
|
||
|
Atomic32 old_value,
|
||
|
Atomic32 new_value) {
|
||
|
Atomic32 value = NoBarrier_CompareAndSwap(ptr, old_value, new_value);
|
||
|
MemoryBarrier();
|
||
|
return value;
|
||
|
}
|
||
|
|
||
|
inline Atomic32 Release_CompareAndSwap(volatile Atomic32* ptr,
|
||
|
Atomic32 old_value,
|
||
|
Atomic32 new_value) {
|
||
|
MemoryBarrier();
|
||
|
return NoBarrier_CompareAndSwap(ptr, old_value, new_value);
|
||
|
}
|
||
|
|
||
|
inline void NoBarrier_Store(volatile Atomic32* ptr, Atomic32 value) {
|
||
|
*ptr = value;
|
||
|
}
|
||
|
|
||
|
inline void Acquire_Store(volatile Atomic32* ptr, Atomic32 value) {
|
||
|
*ptr = value;
|
||
|
MemoryBarrier();
|
||
|
}
|
||
|
|
||
|
inline void Release_Store(volatile Atomic32* ptr, Atomic32 value) {
|
||
|
MemoryBarrier();
|
||
|
*ptr = value;
|
||
|
}
|
||
|
|
||
|
inline Atomic32 NoBarrier_Load(volatile const Atomic32* ptr) {
|
||
|
return *ptr;
|
||
|
}
|
||
|
|
||
|
inline Atomic32 Acquire_Load(volatile const Atomic32* ptr) {
|
||
|
Atomic32 value = *ptr;
|
||
|
MemoryBarrier();
|
||
|
return value;
|
||
|
}
|
||
|
|
||
|
inline Atomic32 Release_Load(volatile const Atomic32* ptr) {
|
||
|
MemoryBarrier();
|
||
|
return *ptr;
|
||
|
}
|
||
|
|
||
|
// 64-bit versions are only available if LDREXD and STREXD instructions
|
||
|
// are available.
|
||
|
#ifdef BASE_ATOMICOPS_HAS_LDREXD_AND_STREXD
|
||
|
|
||
|
#define BASE_HAS_ATOMIC64 1
|
||
|
|
||
|
inline Atomic64 NoBarrier_CompareAndSwap(volatile Atomic64* ptr,
|
||
|
Atomic64 old_value,
|
||
|
Atomic64 new_value) {
|
||
|
Atomic64 oldval, res;
|
||
|
do {
|
||
|
__asm__ __volatile__(
|
||
|
"ldrexd %1, [%3]\n"
|
||
|
"mov %0, #0\n"
|
||
|
"teq %Q1, %Q4\n"
|
||
|
// The following IT (if-then) instructions are needed for the subsequent
|
||
|
// conditional instructions when compiling in THUMB mode.
|
||
|
// In ARM mode, the compiler/assembler will not generate any code for it.
|
||
|
"it eq\n"
|
||
|
"teqeq %R1, %R4\n"
|
||
|
"it eq\n"
|
||
|
"strexdeq %0, %5, [%3]\n"
|
||
|
: "=&r" (res), "=&r" (oldval), "+Q" (*ptr)
|
||
|
: "r" (ptr), "Ir" (old_value), "r" (new_value)
|
||
|
: "cc");
|
||
|
} while (res);
|
||
|
return oldval;
|
||
|
}
|
||
|
|
||
|
inline Atomic64 NoBarrier_AtomicExchange(volatile Atomic64* ptr,
|
||
|
Atomic64 new_value) {
|
||
|
int store_failed;
|
||
|
Atomic64 old;
|
||
|
__asm__ __volatile__(
|
||
|
"1:\n"
|
||
|
"ldrexd %1, [%2]\n"
|
||
|
"strexd %0, %3, [%2]\n"
|
||
|
"teq %0, #0\n"
|
||
|
"bne 1b"
|
||
|
: "=&r" (store_failed), "=&r" (old)
|
||
|
: "r" (ptr), "r" (new_value)
|
||
|
: "cc", "memory");
|
||
|
return old;
|
||
|
}
|
||
|
|
||
|
inline Atomic64 Acquire_AtomicExchange(volatile Atomic64* ptr,
|
||
|
Atomic64 new_value) {
|
||
|
Atomic64 old_value = NoBarrier_AtomicExchange(ptr, new_value);
|
||
|
MemoryBarrier();
|
||
|
return old_value;
|
||
|
}
|
||
|
|
||
|
inline Atomic64 Release_AtomicExchange(volatile Atomic64* ptr,
|
||
|
Atomic64 new_value) {
|
||
|
MemoryBarrier();
|
||
|
return NoBarrier_AtomicExchange(ptr, new_value);
|
||
|
}
|
||
|
|
||
|
inline Atomic64 NoBarrier_AtomicIncrement(volatile Atomic64* ptr,
|
||
|
Atomic64 increment) {
|
||
|
int store_failed;
|
||
|
Atomic64 res;
|
||
|
__asm__ __volatile__(
|
||
|
"1:\n"
|
||
|
"ldrexd %1, [%2]\n"
|
||
|
"adds %Q1, %Q1, %Q3\n"
|
||
|
"adc %R1, %R1, %R3\n"
|
||
|
"strexd %0, %1, [%2]\n"
|
||
|
"teq %0, #0\n"
|
||
|
"bne 1b"
|
||
|
: "=&r" (store_failed), "=&r"(res)
|
||
|
: "r" (ptr), "r"(increment)
|
||
|
: "cc", "memory");
|
||
|
return res;
|
||
|
}
|
||
|
|
||
|
inline Atomic64 Barrier_AtomicIncrement(volatile Atomic64* ptr,
|
||
|
Atomic64 increment) {
|
||
|
int store_failed;
|
||
|
Atomic64 res;
|
||
|
__asm__ __volatile__(
|
||
|
"1:\n"
|
||
|
"ldrexd %1, [%2]\n"
|
||
|
"adds %Q1, %Q1, %Q3\n"
|
||
|
"adc %R1, %R1, %R3\n"
|
||
|
"dmb\n"
|
||
|
"strexd %0, %1, [%2]\n"
|
||
|
"teq %0, #0\n"
|
||
|
"bne 1b"
|
||
|
: "=&r" (store_failed), "=&r"(res)
|
||
|
: "r" (ptr), "r"(increment)
|
||
|
: "cc", "memory");
|
||
|
return res;
|
||
|
}
|
||
|
|
||
|
inline void NoBarrier_Store(volatile Atomic64* ptr, Atomic64 value) {
|
||
|
int store_failed;
|
||
|
Atomic64 dummy;
|
||
|
__asm__ __volatile__(
|
||
|
"1:\n"
|
||
|
// Dummy load to lock cache line.
|
||
|
"ldrexd %1, [%3]\n"
|
||
|
"strexd %0, %2, [%3]\n"
|
||
|
"teq %0, #0\n"
|
||
|
"bne 1b"
|
||
|
: "=&r" (store_failed), "=&r"(dummy)
|
||
|
: "r"(value), "r" (ptr)
|
||
|
: "cc", "memory");
|
||
|
}
|
||
|
|
||
|
inline Atomic64 NoBarrier_Load(volatile const Atomic64* ptr) {
|
||
|
Atomic64 res;
|
||
|
__asm__ __volatile__(
|
||
|
"ldrexd %0, [%1]\n"
|
||
|
"clrex\n"
|
||
|
: "=r" (res)
|
||
|
: "r"(ptr), "Q"(*ptr));
|
||
|
return res;
|
||
|
}
|
||
|
|
||
|
#else // BASE_ATOMICOPS_HAS_LDREXD_AND_STREXD
|
||
|
|
||
|
inline void NotImplementedFatalError(const char *function_name) {
|
||
|
fprintf(stderr, "64-bit %s() not implemented on this platform\n",
|
||
|
function_name);
|
||
|
abort();
|
||
|
}
|
||
|
|
||
|
inline Atomic64 NoBarrier_CompareAndSwap(volatile Atomic64* ptr,
|
||
|
Atomic64 old_value,
|
||
|
Atomic64 new_value) {
|
||
|
NotImplementedFatalError("NoBarrier_CompareAndSwap");
|
||
|
return 0;
|
||
|
}
|
||
|
|
||
|
inline Atomic64 NoBarrier_AtomicExchange(volatile Atomic64* ptr,
|
||
|
Atomic64 new_value) {
|
||
|
NotImplementedFatalError("NoBarrier_AtomicExchange");
|
||
|
return 0;
|
||
|
}
|
||
|
|
||
|
inline Atomic64 Acquire_AtomicExchange(volatile Atomic64* ptr,
|
||
|
Atomic64 new_value) {
|
||
|
NotImplementedFatalError("Acquire_AtomicExchange");
|
||
|
return 0;
|
||
|
}
|
||
|
|
||
|
inline Atomic64 Release_AtomicExchange(volatile Atomic64* ptr,
|
||
|
Atomic64 new_value) {
|
||
|
NotImplementedFatalError("Release_AtomicExchange");
|
||
|
return 0;
|
||
|
}
|
||
|
|
||
|
inline Atomic64 NoBarrier_AtomicIncrement(volatile Atomic64* ptr,
|
||
|
Atomic64 increment) {
|
||
|
NotImplementedFatalError("NoBarrier_AtomicIncrement");
|
||
|
return 0;
|
||
|
}
|
||
|
|
||
|
inline Atomic64 Barrier_AtomicIncrement(volatile Atomic64* ptr,
|
||
|
Atomic64 increment) {
|
||
|
NotImplementedFatalError("Barrier_AtomicIncrement");
|
||
|
return 0;
|
||
|
}
|
||
|
|
||
|
inline void NoBarrier_Store(volatile Atomic64* ptr, Atomic64 value) {
|
||
|
NotImplementedFatalError("NoBarrier_Store");
|
||
|
}
|
||
|
|
||
|
inline Atomic64 NoBarrier_Load(volatile const Atomic64* ptr) {
|
||
|
NotImplementedFatalError("NoBarrier_Load");
|
||
|
return 0;
|
||
|
}
|
||
|
|
||
|
#endif // BASE_ATOMICOPS_HAS_LDREXD_AND_STREXD
|
||
|
|
||
|
inline void Acquire_Store(volatile Atomic64* ptr, Atomic64 value) {
|
||
|
NoBarrier_Store(ptr, value);
|
||
|
MemoryBarrier();
|
||
|
}
|
||
|
|
||
|
inline void Release_Store(volatile Atomic64* ptr, Atomic64 value) {
|
||
|
MemoryBarrier();
|
||
|
NoBarrier_Store(ptr, value);
|
||
|
}
|
||
|
|
||
|
inline Atomic64 Acquire_Load(volatile const Atomic64* ptr) {
|
||
|
Atomic64 value = NoBarrier_Load(ptr);
|
||
|
MemoryBarrier();
|
||
|
return value;
|
||
|
}
|
||
|
|
||
|
inline Atomic64 Release_Load(volatile const Atomic64* ptr) {
|
||
|
MemoryBarrier();
|
||
|
return NoBarrier_Load(ptr);
|
||
|
}
|
||
|
|
||
|
inline Atomic64 Acquire_CompareAndSwap(volatile Atomic64* ptr,
|
||
|
Atomic64 old_value,
|
||
|
Atomic64 new_value) {
|
||
|
Atomic64 value = NoBarrier_CompareAndSwap(ptr, old_value, new_value);
|
||
|
MemoryBarrier();
|
||
|
return value;
|
||
|
}
|
||
|
|
||
|
inline Atomic64 Release_CompareAndSwap(volatile Atomic64* ptr,
|
||
|
Atomic64 old_value,
|
||
|
Atomic64 new_value) {
|
||
|
MemoryBarrier();
|
||
|
return NoBarrier_CompareAndSwap(ptr, old_value, new_value);
|
||
|
}
|
||
|
|
||
|
} // namespace subtle ends
|
||
|
} // namespace base ends
|
||
|
|
||
|
#endif // BASE_ATOMICOPS_INTERNALS_ARM_V6PLUS_H_
|