• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1 /* Copyright (c) 2008, Google Inc.
2  * All rights reserved.
3  *
4  * Redistribution and use in source and binary forms, with or without
5  * modification, are permitted provided that the following conditions are
6  * met:
7  *
8  *     * Redistributions of source code must retain the above copyright
9  * notice, this list of conditions and the following disclaimer.
10  *     * Redistributions in binary form must reproduce the above
11  * copyright notice, this list of conditions and the following disclaimer
12  * in the documentation and/or other materials provided with the
13  * distribution.
14  *     * Neither the name of Google Inc. nor the names of its
15  * contributors may be used to endorse or promote products derived from
16  * this software without specific prior written permission.
17  *
18  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
19  * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
20  * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
21  * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
22  * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
23  * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
24  * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
25  * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
26  * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
27  * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
28  * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
29  *
30  * ---
31  */
32 
33 // Implementation of atomic operations for ppc-linux.  This file should not
34 // be included directly.  Clients should instead include
35 // "base/atomicops.h".
36 
37 #ifndef BASE_ATOMICOPS_INTERNALS_LINUXPPC_H_
38 #define BASE_ATOMICOPS_INTERNALS_LINUXPPC_H_
39 
// Signed 32-bit integer type that the 32-bit atomic operations in this file
// operate on.
typedef int32_t Atomic32;

// The 64-bit atomic operations in this file are compiled only for 64-bit
// PowerPC targets; BASE_HAS_ATOMIC64 is defined in exactly that case.
#ifdef __PPC64__
#define BASE_HAS_ATOMIC64 1
#endif
45 
46 namespace base {
47 namespace subtle {
48 
// Emits the PowerPC "sync" instruction.  The "memory" clobber also keeps the
// compiler from moving memory accesses across this point.
static inline void _sync(void) {
  __asm__ __volatile__("sync" : : : "memory");
}
52 
// Emits "lwsync", or "msync" on targets for which the compiler defines
// __NO_LWSYNC__.  The "memory" clobber also acts as a compiler barrier.
static inline void _lwsync(void) {
  // gcc defines __NO_LWSYNC__ when appropriate; see
  //    http://gcc.gnu.org/ml/gcc-patches/2006-11/msg01238.html
#ifndef __NO_LWSYNC__
  __asm__ __volatile__("lwsync" : : : "memory");
#else
  __asm__ __volatile__("msync" : : : "memory");
#endif
}
62 
// Emits the PowerPC "isync" instruction.  The "memory" clobber also keeps the
// compiler from moving memory accesses across this point.
static inline void _isync(void) {
  __asm__ __volatile__("isync" : : : "memory");
}
66 
OSAtomicAdd32(Atomic32 amount,Atomic32 * value)67 static inline Atomic32 OSAtomicAdd32(Atomic32 amount, Atomic32 *value) {
68   Atomic32 t;
69   __asm__ __volatile__(
70 "1:		lwarx   %0,0,%3\n\
71 		add     %0,%2,%0\n\
72 		stwcx.  %0,0,%3 \n\
73 		bne-    1b"
74 		: "=&r" (t), "+m" (*value)
75 		: "r" (amount), "r" (value)
76                 : "cc");
77   return t;
78 }
79 
OSAtomicAdd32Barrier(Atomic32 amount,Atomic32 * value)80 static inline Atomic32 OSAtomicAdd32Barrier(Atomic32 amount, Atomic32 *value) {
81   Atomic32 t;
82   _lwsync();
83   t = OSAtomicAdd32(amount, value);
84   // This is based on the code snippet in the architecture manual (Vol
85   // 2, Appendix B).  It's a little tricky: correctness depends on the
86   // fact that the code right before this (in OSAtomicAdd32) has a
87   // conditional branch with a data dependency on the update.
88   // Otherwise, we'd have to use sync.
89   _isync();
90   return t;
91 }
92 
OSAtomicCompareAndSwap32(Atomic32 old_value,Atomic32 new_value,Atomic32 * value)93 static inline bool OSAtomicCompareAndSwap32(Atomic32 old_value,
94                                             Atomic32 new_value,
95                                             Atomic32 *value) {
96   Atomic32 prev;
97   __asm__ __volatile__(
98 "1:		lwarx   %0,0,%2\n\
99 		cmpw    0,%0,%3\n\
100 		bne-    2f\n\
101 		stwcx.  %4,0,%2\n\
102 		bne-    1b\n\
103 2:"
104                 : "=&r" (prev), "+m" (*value)
105                 : "r" (value), "r" (old_value), "r" (new_value)
106                 : "cc");
107   return prev == old_value;
108 }
109 
OSAtomicCompareAndSwap32Acquire(Atomic32 old_value,Atomic32 new_value,Atomic32 * value)110 static inline Atomic32 OSAtomicCompareAndSwap32Acquire(Atomic32 old_value,
111                                                        Atomic32 new_value,
112                                                        Atomic32 *value) {
113   Atomic32 t;
114   t = OSAtomicCompareAndSwap32(old_value, new_value, value);
115   // This is based on the code snippet in the architecture manual (Vol
116   // 2, Appendix B).  It's a little tricky: correctness depends on the
117   // fact that the code right before this (in
118   // OSAtomicCompareAndSwap32) has a conditional branch with a data
119   // dependency on the update.  Otherwise, we'd have to use sync.
120   _isync();
121   return t;
122 }
123 
OSAtomicCompareAndSwap32Release(Atomic32 old_value,Atomic32 new_value,Atomic32 * value)124 static inline Atomic32 OSAtomicCompareAndSwap32Release(Atomic32 old_value,
125                                                        Atomic32 new_value,
126                                                        Atomic32 *value) {
127   _lwsync();
128   return OSAtomicCompareAndSwap32(old_value, new_value, value);
129 }
130 
// Signed 64-bit integer type that the 64-bit atomic operations in this file
// operate on.
typedef int64_t Atomic64;
132 
MemoryBarrier()133 inline void MemoryBarrier() {
134   // This can't be _lwsync(); we need to order the immediately
135   // preceding stores against any load that may follow, but lwsync
136   // doesn't guarantee that.
137   _sync();
138 }
139 
140 // 32-bit Versions.
141 
// Compare-and-swap on |*ptr| with no memory barrier.  Returns |old_value| if
// |new_value| was stored; otherwise returns a value read from |*ptr| that
// differs from |old_value|.
inline Atomic32 NoBarrier_CompareAndSwap(volatile Atomic32 *ptr,
                                         Atomic32 old_value,
                                         Atomic32 new_value) {
  Atomic32 *const target = const_cast<Atomic32*>(ptr);
  for (;;) {
    if (OSAtomicCompareAndSwap32(old_value, new_value, target)) {
      return old_value;
    }
    // The swap failed.  Re-read the location; if it now holds old_value
    // again, try the swap once more instead of reporting a misleading value.
    const Atomic32 observed = *ptr;
    if (observed != old_value) {
      return observed;
    }
  }
}
155 
// Atomically stores |new_value| into |*ptr| and returns the value it
// replaced.  No memory barrier is issued.
inline Atomic32 NoBarrier_AtomicExchange(volatile Atomic32 *ptr,
                                         Atomic32 new_value) {
  Atomic32 *const target = const_cast<Atomic32*>(ptr);
  for (;;) {
    // Snapshot the current value and try to swap it out; retry if the
    // location changed in between.
    const Atomic32 snapshot = *ptr;
    if (OSAtomicCompareAndSwap32(snapshot, new_value, target)) {
      return snapshot;
    }
  }
}
165 
// Atomically adds |increment| to |*ptr| via OSAtomicAdd32() and returns the
// resulting value.  No memory barrier is issued.
inline Atomic32 NoBarrier_AtomicIncrement(volatile Atomic32 *ptr,
                                          Atomic32 increment) {
  Atomic32 *const target = const_cast<Atomic32*>(ptr);
  return OSAtomicAdd32(increment, target);
}
170 
// Atomically adds |increment| to |*ptr| via OSAtomicAdd32Barrier() and
// returns the resulting value.
inline Atomic32 Barrier_AtomicIncrement(volatile Atomic32 *ptr,
                                        Atomic32 increment) {
  Atomic32 *const target = const_cast<Atomic32*>(ptr);
  return OSAtomicAdd32Barrier(increment, target);
}
175 
// Compare-and-swap on |*ptr| built on OSAtomicCompareAndSwap32Acquire().
// Returns |old_value| if |new_value| was stored; otherwise returns a value
// read from |*ptr| that differs from |old_value|.
inline Atomic32 Acquire_CompareAndSwap(volatile Atomic32 *ptr,
                                       Atomic32 old_value,
                                       Atomic32 new_value) {
  Atomic32 *const target = const_cast<Atomic32*>(ptr);
  for (;;) {
    if (OSAtomicCompareAndSwap32Acquire(old_value, new_value, target)) {
      return old_value;
    }
    // The swap failed.  Re-read the location; if it now holds old_value
    // again, try the swap once more.
    const Atomic32 observed = *ptr;
    if (observed != old_value) {
      return observed;
    }
  }
}
189 
// Compare-and-swap on |*ptr| built on OSAtomicCompareAndSwap32Release().
// Returns |old_value| if |new_value| was stored; otherwise returns a value
// read from |*ptr| that differs from |old_value|.
inline Atomic32 Release_CompareAndSwap(volatile Atomic32 *ptr,
                                       Atomic32 old_value,
                                       Atomic32 new_value) {
  Atomic32 *const target = const_cast<Atomic32*>(ptr);
  for (;;) {
    if (OSAtomicCompareAndSwap32Release(old_value, new_value, target)) {
      return old_value;
    }
    // The swap failed.  Re-read the location; if it now holds old_value
    // again, try the swap once more.
    const Atomic32 observed = *ptr;
    if (observed != old_value) {
      return observed;
    }
  }
}
203 
204 #ifdef __PPC64__
205 
206 // 64-bit Versions.
207 
OSAtomicAdd64(Atomic64 amount,Atomic64 * value)208 static inline Atomic64 OSAtomicAdd64(Atomic64 amount, Atomic64 *value) {
209   Atomic64 t;
210   __asm__ __volatile__(
211 "1:		ldarx   %0,0,%3\n\
212 		add     %0,%2,%0\n\
213 		stdcx.  %0,0,%3 \n\
214 		bne-    1b"
215 		: "=&r" (t), "+m" (*value)
216 		: "r" (amount), "r" (value)
217                 : "cc");
218   return t;
219 }
220 
OSAtomicAdd64Barrier(Atomic64 amount,Atomic64 * value)221 static inline Atomic64 OSAtomicAdd64Barrier(Atomic64 amount, Atomic64 *value) {
222   Atomic64 t;
223   _lwsync();
224   t = OSAtomicAdd64(amount, value);
225   // This is based on the code snippet in the architecture manual (Vol
226   // 2, Appendix B).  It's a little tricky: correctness depends on the
227   // fact that the code right before this (in OSAtomicAdd64) has a
228   // conditional branch with a data dependency on the update.
229   // Otherwise, we'd have to use sync.
230   _isync();
231   return t;
232 }
233 
OSAtomicCompareAndSwap64(Atomic64 old_value,Atomic64 new_value,Atomic64 * value)234 static inline bool OSAtomicCompareAndSwap64(Atomic64 old_value,
235                                             Atomic64 new_value,
236                                             Atomic64 *value) {
237   Atomic64 prev;
238   __asm__ __volatile__(
239 "1:		ldarx   %0,0,%2\n\
240 		cmpw    0,%0,%3\n\
241 		bne-    2f\n\
242 		stdcx.  %4,0,%2\n\
243 		bne-    1b\n\
244 2:"
245                 : "=&r" (prev), "+m" (*value)
246                 : "r" (value), "r" (old_value), "r" (new_value)
247                 : "cc");
248   return prev == old_value;
249 }
250 
OSAtomicCompareAndSwap64Acquire(Atomic64 old_value,Atomic64 new_value,Atomic64 * value)251 static inline Atomic64 OSAtomicCompareAndSwap64Acquire(Atomic64 old_value,
252                                                        Atomic64 new_value,
253                                                        Atomic64 *value) {
254   Atomic64 t;
255   t = OSAtomicCompareAndSwap64(old_value, new_value, value);
256   // This is based on the code snippet in the architecture manual (Vol
257   // 2, Appendix B).  It's a little tricky: correctness depends on the
258   // fact that the code right before this (in
259   // OSAtomicCompareAndSwap64) has a conditional branch with a data
260   // dependency on the update.  Otherwise, we'd have to use sync.
261   _isync();
262   return t;
263 }
264 
OSAtomicCompareAndSwap64Release(Atomic64 old_value,Atomic64 new_value,Atomic64 * value)265 static inline Atomic64 OSAtomicCompareAndSwap64Release(Atomic64 old_value,
266                                                        Atomic64 new_value,
267                                                        Atomic64 *value) {
268   _lwsync();
269   return OSAtomicCompareAndSwap64(old_value, new_value, value);
270 }
271 
272 
// Compare-and-swap on |*ptr| with no memory barrier.  Returns |old_value| if
// |new_value| was stored; otherwise returns a value read from |*ptr| that
// differs from |old_value|.
inline Atomic64 NoBarrier_CompareAndSwap(volatile Atomic64 *ptr,
                                         Atomic64 old_value,
                                         Atomic64 new_value) {
  Atomic64 *const target = const_cast<Atomic64*>(ptr);
  for (;;) {
    if (OSAtomicCompareAndSwap64(old_value, new_value, target)) {
      return old_value;
    }
    // The swap failed.  Re-read the location; if it now holds old_value
    // again, try the swap once more instead of reporting a misleading value.
    const Atomic64 observed = *ptr;
    if (observed != old_value) {
      return observed;
    }
  }
}
286 
// Atomically stores |new_value| into |*ptr| and returns the value it
// replaced.  No memory barrier is issued.
inline Atomic64 NoBarrier_AtomicExchange(volatile Atomic64 *ptr,
                                         Atomic64 new_value) {
  Atomic64 *const target = const_cast<Atomic64*>(ptr);
  for (;;) {
    // Snapshot the current value and try to swap it out; retry if the
    // location changed in between.
    const Atomic64 snapshot = *ptr;
    if (OSAtomicCompareAndSwap64(snapshot, new_value, target)) {
      return snapshot;
    }
  }
}
296 
// Atomically adds |increment| to |*ptr| via OSAtomicAdd64() and returns the
// resulting value.  No memory barrier is issued.
inline Atomic64 NoBarrier_AtomicIncrement(volatile Atomic64 *ptr,
                                          Atomic64 increment) {
  Atomic64 *const target = const_cast<Atomic64*>(ptr);
  return OSAtomicAdd64(increment, target);
}
301 
// Atomically adds |increment| to |*ptr| via OSAtomicAdd64Barrier() and
// returns the resulting value.
inline Atomic64 Barrier_AtomicIncrement(volatile Atomic64 *ptr,
                                        Atomic64 increment) {
  Atomic64 *const target = const_cast<Atomic64*>(ptr);
  return OSAtomicAdd64Barrier(increment, target);
}
306 
// Compare-and-swap on |*ptr| built on OSAtomicCompareAndSwap64Acquire().
// Returns |old_value| if |new_value| was stored; otherwise returns a value
// read from |*ptr| that differs from |old_value|.
inline Atomic64 Acquire_CompareAndSwap(volatile Atomic64 *ptr,
                                       Atomic64 old_value,
                                       Atomic64 new_value) {
  Atomic64 *const target = const_cast<Atomic64*>(ptr);
  for (;;) {
    if (OSAtomicCompareAndSwap64Acquire(old_value, new_value, target)) {
      return old_value;
    }
    // The swap failed.  Re-read the location; if it now holds old_value
    // again, try the swap once more.
    const Atomic64 observed = *ptr;
    if (observed != old_value) {
      return observed;
    }
  }
}
320 
// Compare-and-swap on |*ptr| built on OSAtomicCompareAndSwap64Release().
// Returns |old_value| if |new_value| was stored; otherwise returns a value
// read from |*ptr| that differs from |old_value|.
inline Atomic64 Release_CompareAndSwap(volatile Atomic64 *ptr,
                                       Atomic64 old_value,
                                       Atomic64 new_value) {
  Atomic64 *const target = const_cast<Atomic64*>(ptr);
  for (;;) {
    if (OSAtomicCompareAndSwap64Release(old_value, new_value, target)) {
      return old_value;
    }
    // The swap failed.  Re-read the location; if it now holds old_value
    // again, try the swap once more.
    const Atomic64 observed = *ptr;
    if (observed != old_value) {
      return observed;
    }
  }
}
334 
335 #endif
336 
// Writes |value| to |*ptr| with a plain volatile store; no barrier is issued.
inline void NoBarrier_Store(volatile Atomic32 *ptr, Atomic32 value) {
  *ptr = value;
}
340 
Acquire_Store(volatile Atomic32 * ptr,Atomic32 value)341 inline void Acquire_Store(volatile Atomic32 *ptr, Atomic32 value) {
342   *ptr = value;
343   // This can't be _lwsync(); we need to order the immediately
344   // preceding stores against any load that may follow, but lwsync
345   // doesn't guarantee that.
346   _sync();
347 }
348 
Release_Store(volatile Atomic32 * ptr,Atomic32 value)349 inline void Release_Store(volatile Atomic32 *ptr, Atomic32 value) {
350   _lwsync();
351   *ptr = value;
352 }
353 
// Reads |*ptr| with a plain volatile load; no barrier is issued.
inline Atomic32 NoBarrier_Load(volatile const Atomic32 *ptr) {
  const Atomic32 loaded = *ptr;
  return loaded;
}
357 
// Reads |*ptr|, then issues _lwsync(), and returns the value that was read.
inline Atomic32 Acquire_Load(volatile const Atomic32 *ptr) {
  const Atomic32 loaded = *ptr;
  _lwsync();
  return loaded;
}
363 
// Issues _sync() and then reads and returns |*ptr|.
inline Atomic32 Release_Load(volatile const Atomic32 *ptr) {
  // _lwsync() is not enough here: stores just before this point must be
  // ordered against the load below, and lwsync does not guarantee that.
  _sync();
  const Atomic32 loaded = *ptr;
  return loaded;
}
371 
372 #ifdef __PPC64__
373 
374 // 64-bit Versions.
375 
// Writes |value| to |*ptr| with a plain volatile store; no barrier is issued.
inline void NoBarrier_Store(volatile Atomic64 *ptr, Atomic64 value) {
  *ptr = value;
}
379 
Acquire_Store(volatile Atomic64 * ptr,Atomic64 value)380 inline void Acquire_Store(volatile Atomic64 *ptr, Atomic64 value) {
381   *ptr = value;
382   // This can't be _lwsync(); we need to order the immediately
383   // preceding stores against any load that may follow, but lwsync
384   // doesn't guarantee that.
385   _sync();
386 }
387 
Release_Store(volatile Atomic64 * ptr,Atomic64 value)388 inline void Release_Store(volatile Atomic64 *ptr, Atomic64 value) {
389   _lwsync();
390   *ptr = value;
391 }
392 
// Reads |*ptr| with a plain volatile load; no barrier is issued.
inline Atomic64 NoBarrier_Load(volatile const Atomic64 *ptr) {
  const Atomic64 loaded = *ptr;
  return loaded;
}
396 
// Reads |*ptr|, then issues _lwsync(), and returns the value that was read.
inline Atomic64 Acquire_Load(volatile const Atomic64 *ptr) {
  const Atomic64 loaded = *ptr;
  _lwsync();
  return loaded;
}
402 
// Issues _sync() and then reads and returns |*ptr|.
inline Atomic64 Release_Load(volatile const Atomic64 *ptr) {
  // _lwsync() is not enough here: stores just before this point must be
  // ordered against the load below, and lwsync does not guarantee that.
  _sync();
  const Atomic64 loaded = *ptr;
  return loaded;
}
410 
411 #endif
412 
413 }   // namespace base::subtle
414 }   // namespace base
415 
416 #endif  // BASE_ATOMICOPS_INTERNALS_LINUXPPC_H_
417