|
|
@ -38,12 +38,16 @@ namespace protobuf { |
|
|
|
namespace internal { |
|
|
|
namespace internal { |
|
|
|
|
|
|
|
|
|
|
|
// Full memory barrier: emits a "dmb ish" data memory barrier instruction.
// The "memory" clobber additionally tells the compiler that memory may have
// changed, so it does not cache or move memory accesses across this statement.
inline void MemoryBarrier() {
  __asm__ __volatile__ ("dmb ish" ::: "memory");  // NOLINT
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
// NoBarrier versions of the operation include "memory" in the clobber list.
|
|
|
|
|
|
|
|
// This is not required for direct usage of the NoBarrier versions of the
|
|
|
|
|
|
|
|
// operations. However this is required for correctness when they are used as
|
|
|
|
|
|
|
|
// part of the Acquire or Release versions, to ensure that nothing from outside
|
|
|
|
|
|
|
|
// the call is reordered between the operation and the memory barrier. This does
|
|
|
|
|
|
|
|
// not change the code generated, so has no or minimal impact on the
|
|
|
|
|
|
|
|
// NoBarrier operations.
|
|
|
|
|
|
|
|
|
|
|
|
inline Atomic32 NoBarrier_CompareAndSwap(volatile Atomic32* ptr, |
|
|
|
inline Atomic32 NoBarrier_CompareAndSwap(volatile Atomic32* ptr, |
|
|
|
Atomic32 old_value, |
|
|
|
Atomic32 old_value, |
|
|
@ -59,13 +63,12 @@ inline Atomic32 NoBarrier_CompareAndSwap(volatile Atomic32* ptr, |
|
|
|
"stxr %w[temp], %w[new_value], %[ptr] \n\t" // Try to store the new value.
|
|
|
|
"stxr %w[temp], %w[new_value], %[ptr] \n\t" // Try to store the new value.
|
|
|
|
"cbnz %w[temp], 0b \n\t" // Retry if it did not work.
|
|
|
|
"cbnz %w[temp], 0b \n\t" // Retry if it did not work.
|
|
|
|
"1: \n\t" |
|
|
|
"1: \n\t" |
|
|
|
"clrex \n\t" // In case we didn't swap.
|
|
|
|
|
|
|
|
: [prev]"=&r" (prev), |
|
|
|
: [prev]"=&r" (prev), |
|
|
|
[temp]"=&r" (temp), |
|
|
|
[temp]"=&r" (temp), |
|
|
|
[ptr]"+Q" (*ptr) |
|
|
|
[ptr]"+Q" (*ptr) |
|
|
|
: [old_value]"r" (old_value), |
|
|
|
: [old_value]"IJr" (old_value), |
|
|
|
[new_value]"r" (new_value) |
|
|
|
[new_value]"r" (new_value) |
|
|
|
: "memory", "cc" |
|
|
|
: "cc", "memory" |
|
|
|
); // NOLINT
|
|
|
|
); // NOLINT
|
|
|
|
|
|
|
|
|
|
|
|
return prev; |
|
|
|
return prev; |
|
|
@ -105,7 +108,7 @@ inline Atomic32 NoBarrier_AtomicIncrement(volatile Atomic32* ptr, |
|
|
|
: [result]"=&r" (result), |
|
|
|
: [result]"=&r" (result), |
|
|
|
[temp]"=&r" (temp), |
|
|
|
[temp]"=&r" (temp), |
|
|
|
[ptr]"+Q" (*ptr) |
|
|
|
[ptr]"+Q" (*ptr) |
|
|
|
: [increment]"r" (increment) |
|
|
|
: [increment]"IJr" (increment) |
|
|
|
: "memory" |
|
|
|
: "memory" |
|
|
|
); // NOLINT
|
|
|
|
); // NOLINT
|
|
|
|
|
|
|
|
|
|
|
@ -114,8 +117,10 @@ inline Atomic32 NoBarrier_AtomicIncrement(volatile Atomic32* ptr, |
|
|
|
|
|
|
|
|
|
|
|
inline Atomic32 Barrier_AtomicIncrement(volatile Atomic32* ptr, |
|
|
|
inline Atomic32 Barrier_AtomicIncrement(volatile Atomic32* ptr, |
|
|
|
Atomic32 increment) { |
|
|
|
Atomic32 increment) { |
|
|
|
|
|
|
|
Atomic32 result; |
|
|
|
|
|
|
|
|
|
|
|
MemoryBarrier(); |
|
|
|
MemoryBarrier(); |
|
|
|
Atomic32 result = NoBarrier_AtomicIncrement(ptr, increment); |
|
|
|
result = NoBarrier_AtomicIncrement(ptr, increment); |
|
|
|
MemoryBarrier(); |
|
|
|
MemoryBarrier(); |
|
|
|
|
|
|
|
|
|
|
|
return result; |
|
|
|
return result; |
|
|
@ -125,27 +130,9 @@ inline Atomic32 Acquire_CompareAndSwap(volatile Atomic32* ptr, |
|
|
|
Atomic32 old_value, |
|
|
|
Atomic32 old_value, |
|
|
|
Atomic32 new_value) { |
|
|
|
Atomic32 new_value) { |
|
|
|
Atomic32 prev; |
|
|
|
Atomic32 prev; |
|
|
|
int32_t temp; |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
__asm__ __volatile__ ( // NOLINT
|
|
|
|
prev = NoBarrier_CompareAndSwap(ptr, old_value, new_value); |
|
|
|
"0: \n\t" |
|
|
|
MemoryBarrier(); |
|
|
|
"ldxr %w[prev], %[ptr] \n\t" // Load the previous value.
|
|
|
|
|
|
|
|
"cmp %w[prev], %w[old_value] \n\t" |
|
|
|
|
|
|
|
"bne 1f \n\t" |
|
|
|
|
|
|
|
"stxr %w[temp], %w[new_value], %[ptr] \n\t" // Try to store the new value.
|
|
|
|
|
|
|
|
"cbnz %w[temp], 0b \n\t" // Retry if it did not work.
|
|
|
|
|
|
|
|
"dmb ish \n\t" // Data memory barrier.
|
|
|
|
|
|
|
|
"1: \n\t" |
|
|
|
|
|
|
|
// If the compare failed the 'dmb' is unnecessary, but we still need a
|
|
|
|
|
|
|
|
// 'clrex'.
|
|
|
|
|
|
|
|
"clrex \n\t" |
|
|
|
|
|
|
|
: [prev]"=&r" (prev), |
|
|
|
|
|
|
|
[temp]"=&r" (temp), |
|
|
|
|
|
|
|
[ptr]"+Q" (*ptr) |
|
|
|
|
|
|
|
: [old_value]"r" (old_value), |
|
|
|
|
|
|
|
[new_value]"r" (new_value) |
|
|
|
|
|
|
|
: "memory", "cc" |
|
|
|
|
|
|
|
); // NOLINT
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
return prev; |
|
|
|
return prev; |
|
|
|
} |
|
|
|
} |
|
|
@ -154,27 +141,9 @@ inline Atomic32 Release_CompareAndSwap(volatile Atomic32* ptr, |
|
|
|
Atomic32 old_value, |
|
|
|
Atomic32 old_value, |
|
|
|
Atomic32 new_value) { |
|
|
|
Atomic32 new_value) { |
|
|
|
Atomic32 prev; |
|
|
|
Atomic32 prev; |
|
|
|
int32_t temp; |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
MemoryBarrier(); |
|
|
|
MemoryBarrier(); |
|
|
|
|
|
|
|
prev = NoBarrier_CompareAndSwap(ptr, old_value, new_value); |
|
|
|
__asm__ __volatile__ ( // NOLINT
|
|
|
|
|
|
|
|
"0: \n\t" |
|
|
|
|
|
|
|
"ldxr %w[prev], %[ptr] \n\t" // Load the previous value.
|
|
|
|
|
|
|
|
"cmp %w[prev], %w[old_value] \n\t" |
|
|
|
|
|
|
|
"bne 1f \n\t" |
|
|
|
|
|
|
|
"stxr %w[temp], %w[new_value], %[ptr] \n\t" // Try to store the new value.
|
|
|
|
|
|
|
|
"cbnz %w[temp], 0b \n\t" // Retry if it did not work.
|
|
|
|
|
|
|
|
"1: \n\t" |
|
|
|
|
|
|
|
// If the compare failed we still need a 'clrex'.
|
|
|
|
|
|
|
|
"clrex \n\t" |
|
|
|
|
|
|
|
: [prev]"=&r" (prev), |
|
|
|
|
|
|
|
[temp]"=&r" (temp), |
|
|
|
|
|
|
|
[ptr]"+Q" (*ptr) |
|
|
|
|
|
|
|
: [old_value]"r" (old_value), |
|
|
|
|
|
|
|
[new_value]"r" (new_value) |
|
|
|
|
|
|
|
: "memory", "cc" |
|
|
|
|
|
|
|
); // NOLINT
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
return prev; |
|
|
|
return prev; |
|
|
|
} |
|
|
|
} |
|
|
@ -189,8 +158,12 @@ inline void Acquire_Store(volatile Atomic32* ptr, Atomic32 value) { |
|
|
|
} |
|
|
|
} |
|
|
|
|
|
|
|
|
|
|
|
// Stores |value| to |*ptr| using a single store-release instruction (stlr),
// so no separate MemoryBarrier() call is needed before the store.
//
//   ptr:   location to write; passed with the "Q" constraint, i.e. a memory
//          operand addressed through a single base register.
//   value: the 32-bit value to store (%w selects the W view of the register).
inline void Release_Store(volatile Atomic32* ptr, Atomic32 value) {
  __asm__ __volatile__ (  // NOLINT
    "stlr %w[value], %[ptr] \n\t"
    : [ptr]"=Q" (*ptr)
    : [value]"r" (value)
    : "memory"  // Keep the compiler from reordering memory accesses around it.
  );  // NOLINT
}
|
|
|
|
|
|
|
|
|
|
|
inline Atomic32 NoBarrier_Load(volatile const Atomic32* ptr) { |
|
|
|
inline Atomic32 NoBarrier_Load(volatile const Atomic32* ptr) { |
|
|
@ -198,8 +171,15 @@ inline Atomic32 NoBarrier_Load(volatile const Atomic32* ptr) { |
|
|
|
} |
|
|
|
} |
|
|
|
|
|
|
|
|
|
|
|
// Loads and returns the 32-bit value at |*ptr| using a single load-acquire
// instruction (ldar), so no separate MemoryBarrier() call is needed after the
// load.
//
//   ptr: location to read; passed with the "Q" constraint, i.e. a memory
//        operand addressed through a single base register.
inline Atomic32 Acquire_Load(volatile const Atomic32* ptr) {
  Atomic32 value;

  __asm__ __volatile__ (  // NOLINT
    "ldar %w[value], %[ptr] \n\t"
    : [value]"=r" (value)
    : [ptr]"Q" (*ptr)
    : "memory"  // Keep the compiler from reordering memory accesses around it.
  );  // NOLINT

  return value;
}
|
|
|
|
|
|
|
|
|
|
@ -225,13 +205,12 @@ inline Atomic64 NoBarrier_CompareAndSwap(volatile Atomic64* ptr, |
|
|
|
"stxr %w[temp], %[new_value], %[ptr] \n\t" |
|
|
|
"stxr %w[temp], %[new_value], %[ptr] \n\t" |
|
|
|
"cbnz %w[temp], 0b \n\t" |
|
|
|
"cbnz %w[temp], 0b \n\t" |
|
|
|
"1: \n\t" |
|
|
|
"1: \n\t" |
|
|
|
"clrex \n\t" |
|
|
|
|
|
|
|
: [prev]"=&r" (prev), |
|
|
|
: [prev]"=&r" (prev), |
|
|
|
[temp]"=&r" (temp), |
|
|
|
[temp]"=&r" (temp), |
|
|
|
[ptr]"+Q" (*ptr) |
|
|
|
[ptr]"+Q" (*ptr) |
|
|
|
: [old_value]"r" (old_value), |
|
|
|
: [old_value]"IJr" (old_value), |
|
|
|
[new_value]"r" (new_value) |
|
|
|
[new_value]"r" (new_value) |
|
|
|
: "memory", "cc" |
|
|
|
: "cc", "memory" |
|
|
|
); // NOLINT
|
|
|
|
); // NOLINT
|
|
|
|
|
|
|
|
|
|
|
|
return prev; |
|
|
|
return prev; |
|
|
@ -271,7 +250,7 @@ inline Atomic64 NoBarrier_AtomicIncrement(volatile Atomic64* ptr, |
|
|
|
: [result]"=&r" (result), |
|
|
|
: [result]"=&r" (result), |
|
|
|
[temp]"=&r" (temp), |
|
|
|
[temp]"=&r" (temp), |
|
|
|
[ptr]"+Q" (*ptr) |
|
|
|
[ptr]"+Q" (*ptr) |
|
|
|
: [increment]"r" (increment) |
|
|
|
: [increment]"IJr" (increment) |
|
|
|
: "memory" |
|
|
|
: "memory" |
|
|
|
); // NOLINT
|
|
|
|
); // NOLINT
|
|
|
|
|
|
|
|
|
|
|
@ -280,8 +259,10 @@ inline Atomic64 NoBarrier_AtomicIncrement(volatile Atomic64* ptr, |
|
|
|
|
|
|
|
|
|
|
|
inline Atomic64 Barrier_AtomicIncrement(volatile Atomic64* ptr, |
|
|
|
inline Atomic64 Barrier_AtomicIncrement(volatile Atomic64* ptr, |
|
|
|
Atomic64 increment) { |
|
|
|
Atomic64 increment) { |
|
|
|
|
|
|
|
Atomic64 result; |
|
|
|
|
|
|
|
|
|
|
|
MemoryBarrier(); |
|
|
|
MemoryBarrier(); |
|
|
|
Atomic64 result = NoBarrier_AtomicIncrement(ptr, increment); |
|
|
|
result = NoBarrier_AtomicIncrement(ptr, increment); |
|
|
|
MemoryBarrier(); |
|
|
|
MemoryBarrier(); |
|
|
|
|
|
|
|
|
|
|
|
return result; |
|
|
|
return result; |
|
|
@ -291,25 +272,9 @@ inline Atomic64 Acquire_CompareAndSwap(volatile Atomic64* ptr, |
|
|
|
Atomic64 old_value, |
|
|
|
Atomic64 old_value, |
|
|
|
Atomic64 new_value) { |
|
|
|
Atomic64 new_value) { |
|
|
|
Atomic64 prev; |
|
|
|
Atomic64 prev; |
|
|
|
int32_t temp; |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
__asm__ __volatile__ ( // NOLINT
|
|
|
|
prev = NoBarrier_CompareAndSwap(ptr, old_value, new_value); |
|
|
|
"0: \n\t" |
|
|
|
MemoryBarrier(); |
|
|
|
"ldxr %[prev], %[ptr] \n\t" |
|
|
|
|
|
|
|
"cmp %[prev], %[old_value] \n\t" |
|
|
|
|
|
|
|
"bne 1f \n\t" |
|
|
|
|
|
|
|
"stxr %w[temp], %[new_value], %[ptr] \n\t" |
|
|
|
|
|
|
|
"cbnz %w[temp], 0b \n\t" |
|
|
|
|
|
|
|
"dmb ish \n\t" |
|
|
|
|
|
|
|
"1: \n\t" |
|
|
|
|
|
|
|
"clrex \n\t" |
|
|
|
|
|
|
|
: [prev]"=&r" (prev), |
|
|
|
|
|
|
|
[temp]"=&r" (temp), |
|
|
|
|
|
|
|
[ptr]"+Q" (*ptr) |
|
|
|
|
|
|
|
: [old_value]"r" (old_value), |
|
|
|
|
|
|
|
[new_value]"r" (new_value) |
|
|
|
|
|
|
|
: "memory", "cc" |
|
|
|
|
|
|
|
); // NOLINT
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
return prev; |
|
|
|
return prev; |
|
|
|
} |
|
|
|
} |
|
|
@ -318,26 +283,9 @@ inline Atomic64 Release_CompareAndSwap(volatile Atomic64* ptr, |
|
|
|
Atomic64 old_value, |
|
|
|
Atomic64 old_value, |
|
|
|
Atomic64 new_value) { |
|
|
|
Atomic64 new_value) { |
|
|
|
Atomic64 prev; |
|
|
|
Atomic64 prev; |
|
|
|
int32_t temp; |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
MemoryBarrier(); |
|
|
|
MemoryBarrier(); |
|
|
|
|
|
|
|
prev = NoBarrier_CompareAndSwap(ptr, old_value, new_value); |
|
|
|
__asm__ __volatile__ ( // NOLINT
|
|
|
|
|
|
|
|
"0: \n\t" |
|
|
|
|
|
|
|
"ldxr %[prev], %[ptr] \n\t" |
|
|
|
|
|
|
|
"cmp %[prev], %[old_value] \n\t" |
|
|
|
|
|
|
|
"bne 1f \n\t" |
|
|
|
|
|
|
|
"stxr %w[temp], %[new_value], %[ptr] \n\t" |
|
|
|
|
|
|
|
"cbnz %w[temp], 0b \n\t" |
|
|
|
|
|
|
|
"1: \n\t" |
|
|
|
|
|
|
|
"clrex \n\t" |
|
|
|
|
|
|
|
: [prev]"=&r" (prev), |
|
|
|
|
|
|
|
[temp]"=&r" (temp), |
|
|
|
|
|
|
|
[ptr]"+Q" (*ptr) |
|
|
|
|
|
|
|
: [old_value]"r" (old_value), |
|
|
|
|
|
|
|
[new_value]"r" (new_value) |
|
|
|
|
|
|
|
: "memory", "cc" |
|
|
|
|
|
|
|
); // NOLINT
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
return prev; |
|
|
|
return prev; |
|
|
|
} |
|
|
|
} |
|
|
@ -352,8 +300,12 @@ inline void Acquire_Store(volatile Atomic64* ptr, Atomic64 value) { |
|
|
|
} |
|
|
|
} |
|
|
|
|
|
|
|
|
|
|
|
// 64-bit variant: stores |value| to |*ptr| using a single store-release
// instruction (stlr), so no separate MemoryBarrier() call is needed before the
// store.
//
//   ptr:   location to write; passed with the "Q" constraint, i.e. a memory
//          operand addressed through a single base register.
//   value: the 64-bit value to store (%x selects the X view of the register).
inline void Release_Store(volatile Atomic64* ptr, Atomic64 value) {
  __asm__ __volatile__ (  // NOLINT
    "stlr %x[value], %[ptr] \n\t"
    : [ptr]"=Q" (*ptr)
    : [value]"r" (value)
    : "memory"  // Keep the compiler from reordering memory accesses around it.
  );  // NOLINT
}
|
|
|
|
|
|
|
|
|
|
|
inline Atomic64 NoBarrier_Load(volatile const Atomic64* ptr) { |
|
|
|
inline Atomic64 NoBarrier_Load(volatile const Atomic64* ptr) { |
|
|
@ -361,8 +313,15 @@ inline Atomic64 NoBarrier_Load(volatile const Atomic64* ptr) { |
|
|
|
} |
|
|
|
} |
|
|
|
|
|
|
|
|
|
|
|
// 64-bit variant: loads and returns the value at |*ptr| using a single
// load-acquire instruction (ldar), so no separate MemoryBarrier() call is
// needed after the load.
//
//   ptr: location to read; passed with the "Q" constraint, i.e. a memory
//        operand addressed through a single base register.
inline Atomic64 Acquire_Load(volatile const Atomic64* ptr) {
  // The destination must be Atomic64 to match both the 64-bit "%x" register
  // view used below and the return type; declaring it as Atomic32 would
  // narrow the loaded value before it is returned.
  Atomic64 value;

  __asm__ __volatile__ (  // NOLINT
    "ldar %x[value], %[ptr] \n\t"
    : [value]"=r" (value)
    : [ptr]"Q" (*ptr)
    : "memory"  // Keep the compiler from reordering memory accesses around it.
  );  // NOLINT

  return value;
}
|
|
|
|
|
|
|
|
|
|
|