• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1 /*
2  * Copyright 2010 Tilera Corporation. All Rights Reserved.
3  *
4  *   This program is free software; you can redistribute it and/or
5  *   modify it under the terms of the GNU General Public License
6  *   as published by the Free Software Foundation, version 2.
7  *
8  *   This program is distributed in the hope that it will be useful, but
9  *   WITHOUT ANY WARRANTY; without even the implied warranty of
10  *   MERCHANTABILITY OR FITNESS FOR A PARTICULAR PURPOSE, GOOD TITLE or
11  *   NON INFRINGEMENT.  See the GNU General Public License for
12  *   more details.
13  */
14 
15 #include <linux/cache.h>
16 #include <linux/delay.h>
17 #include <linux/uaccess.h>
18 #include <linux/module.h>
19 #include <linux/mm.h>
20 #include <linux/atomic.h>
21 #include <arch/chip.h>
22 
23 /* This page is remapped on startup to be hash-for-home. */
24 int atomic_locks[PAGE_SIZE / sizeof(int)] __page_aligned_bss;
25 
__atomic_hashed_lock(volatile void * v)26 int *__atomic_hashed_lock(volatile void *v)
27 {
28 	/* NOTE: this code must match "sys_cmpxchg" in kernel/intvec_32.S */
29 	/*
30 	 * Use bits [3, 3 + ATOMIC_HASH_SHIFT) as the lock index.
31 	 * Using mm works here because atomic_locks is page aligned.
32 	 */
33 	unsigned long ptr = __insn_mm((unsigned long)v >> 1,
34 				      (unsigned long)atomic_locks,
35 				      2, (ATOMIC_HASH_SHIFT + 2) - 1);
36 	return (int *)ptr;
37 }
38 
39 #ifdef CONFIG_SMP
40 /* Return whether the passed pointer is a valid atomic lock pointer. */
is_atomic_lock(int * p)41 static int is_atomic_lock(int *p)
42 {
43 	return p >= &atomic_locks[0] && p < &atomic_locks[ATOMIC_HASH_SIZE];
44 }
45 
/*
 * Reset the given atomic lock word to 0.
 *
 * The pointer must refer to an entry of atomic_locks[] and the word
 * must contain 1 on entry; either violation triggers BUG().
 */
void __atomic_fault_unlock(int *irqlock_word)
{
	/* Validate the pointer before it is dereferenced below. */
	BUG_ON(!is_atomic_lock(irqlock_word));

	/* The word is expected to hold exactly 1 at this point. */
	BUG_ON(irqlock_word[0] != 1);

	irqlock_word[0] = 0;
}
52 
53 #endif /* CONFIG_SMP */
54 
/*
 * Common prologue for the atomic wrappers in this file: read the target
 * once, then return the lock word selected for its address.
 */
static inline int *__atomic_setup(volatile void *v)
{
	volatile int *target = v;

	/* Volatile read whose value is discarded; it pulls the target into cache. */
	*target;

	return __atomic_hashed_lock(v);
}
61 
_atomic_xchg(int * v,int n)62 int _atomic_xchg(int *v, int n)
63 {
64 	return __atomic32_xchg(v, __atomic_setup(v), n).val;
65 }
66 EXPORT_SYMBOL(_atomic_xchg);
67 
_atomic_xchg_add(int * v,int i)68 int _atomic_xchg_add(int *v, int i)
69 {
70 	return __atomic32_xchg_add(v, __atomic_setup(v), i).val;
71 }
72 EXPORT_SYMBOL(_atomic_xchg_add);
73 
_atomic_xchg_add_unless(int * v,int a,int u)74 int _atomic_xchg_add_unless(int *v, int a, int u)
75 {
76 	/*
77 	 * Note: argument order is switched here since it is easier
78 	 * to use the first argument consistently as the "old value"
79 	 * in the assembly, as is done for _atomic_cmpxchg().
80 	 */
81 	return __atomic32_xchg_add_unless(v, __atomic_setup(v), u, a).val;
82 }
83 EXPORT_SYMBOL(_atomic_xchg_add_unless);
84 
_atomic_cmpxchg(int * v,int o,int n)85 int _atomic_cmpxchg(int *v, int o, int n)
86 {
87 	return __atomic32_cmpxchg(v, __atomic_setup(v), o, n).val;
88 }
89 EXPORT_SYMBOL(_atomic_cmpxchg);
90 
_atomic_fetch_or(volatile unsigned long * p,unsigned long mask)91 unsigned long _atomic_fetch_or(volatile unsigned long *p, unsigned long mask)
92 {
93 	return __atomic32_fetch_or((int *)p, __atomic_setup(p), mask).val;
94 }
95 EXPORT_SYMBOL(_atomic_fetch_or);
96 
_atomic_fetch_and(volatile unsigned long * p,unsigned long mask)97 unsigned long _atomic_fetch_and(volatile unsigned long *p, unsigned long mask)
98 {
99 	return __atomic32_fetch_and((int *)p, __atomic_setup(p), mask).val;
100 }
101 EXPORT_SYMBOL(_atomic_fetch_and);
102 
_atomic_fetch_andn(volatile unsigned long * p,unsigned long mask)103 unsigned long _atomic_fetch_andn(volatile unsigned long *p, unsigned long mask)
104 {
105 	return __atomic32_fetch_andn((int *)p, __atomic_setup(p), mask).val;
106 }
107 EXPORT_SYMBOL(_atomic_fetch_andn);
108 
_atomic_fetch_xor(volatile unsigned long * p,unsigned long mask)109 unsigned long _atomic_fetch_xor(volatile unsigned long *p, unsigned long mask)
110 {
111 	return __atomic32_fetch_xor((int *)p, __atomic_setup(p), mask).val;
112 }
113 EXPORT_SYMBOL(_atomic_fetch_xor);
114 
115 
/*
 * 64-bit exchange on *v with operand n.  Looks up the lock word for v
 * and returns whatever __atomic64_xchg() returns.
 */
long long _atomic64_xchg(long long *v, long long n)
{
	int *lock = __atomic_setup(v);

	return __atomic64_xchg(v, lock, n);
}
EXPORT_SYMBOL(_atomic64_xchg);
121 
/*
 * 64-bit exchange-and-add on *v with addend i.  Looks up the lock word
 * for v and returns whatever __atomic64_xchg_add() returns.
 */
long long _atomic64_xchg_add(long long *v, long long i)
{
	int *lock = __atomic_setup(v);

	return __atomic64_xchg_add(v, lock, i);
}
EXPORT_SYMBOL(_atomic64_xchg_add);
127 
/*
 * 64-bit "add a unless equal to u" on *v.  Returns whatever
 * __atomic64_xchg_add_unless() returns.
 */
long long _atomic64_xchg_add_unless(long long *v, long long a, long long u)
{
	int *lock = __atomic_setup(v);

	/*
	 * The helper takes (u, a), i.e. the reverse of our own argument
	 * order: the assembly consistently treats its first value
	 * argument as the "old value", as is done for _atomic_cmpxchg().
	 */
	return __atomic64_xchg_add_unless(v, lock, u, a);
}
EXPORT_SYMBOL(_atomic64_xchg_add_unless);
138 
/*
 * 64-bit compare-and-exchange on *v with old value o and new value n.
 * Looks up the lock word for v and returns whatever
 * __atomic64_cmpxchg() returns.
 */
long long _atomic64_cmpxchg(long long *v, long long o, long long n)
{
	int *lock = __atomic_setup(v);

	return __atomic64_cmpxchg(v, lock, o, n);
}
EXPORT_SYMBOL(_atomic64_cmpxchg);
144 
/*
 * 64-bit fetch-and-AND on *v with operand n.  Looks up the lock word
 * for v and returns whatever __atomic64_fetch_and() returns.
 */
long long _atomic64_fetch_and(long long *v, long long n)
{
	int *lock = __atomic_setup(v);

	return __atomic64_fetch_and(v, lock, n);
}
EXPORT_SYMBOL(_atomic64_fetch_and);
150 
/*
 * 64-bit fetch-and-OR on *v with operand n.  Looks up the lock word
 * for v and returns whatever __atomic64_fetch_or() returns.
 */
long long _atomic64_fetch_or(long long *v, long long n)
{
	int *lock = __atomic_setup(v);

	return __atomic64_fetch_or(v, lock, n);
}
EXPORT_SYMBOL(_atomic64_fetch_or);
156 
/*
 * 64-bit fetch-and-XOR on *v with operand n.  Looks up the lock word
 * for v and returns whatever __atomic64_fetch_xor() returns.
 */
long long _atomic64_fetch_xor(long long *v, long long n)
{
	int *lock = __atomic_setup(v);

	return __atomic64_fetch_xor(v, lock, n);
}
EXPORT_SYMBOL(_atomic64_fetch_xor);
162 
163 /*
164  * If any of the atomic or futex routines hit a bad address (not in
165  * the page tables at kernel PL) this routine is called.  The futex
166  * routines are never used on kernel space, and the normal atomics and
167  * bitops are never used on user space.  So a fault on kernel space
168  * must be fatal, but a fault on userspace is a futex fault and we
169  * need to return -EFAULT.  Note that the context this routine is
170  * invoked in is the context of the "_atomic_xxx()" routines called
171  * by the functions in this file.
172  */
__atomic_bad_address(int __user * addr)173 struct __get_user __atomic_bad_address(int __user *addr)
174 {
175 	if (unlikely(!access_ok(VERIFY_WRITE, addr, sizeof(int))))
176 		panic("Bad address used for kernel atomic op: %p\n", addr);
177 	return (struct __get_user) { .err = -EFAULT };
178 }
179 
180 
__init_atomic_per_cpu(void)181 void __init __init_atomic_per_cpu(void)
182 {
183 	/* Validate power-of-two and "bigger than cpus" assumption */
184 	BUILD_BUG_ON(ATOMIC_HASH_SIZE & (ATOMIC_HASH_SIZE-1));
185 	BUG_ON(ATOMIC_HASH_SIZE < nr_cpu_ids);
186 
187 	/*
188 	 * On TILEPro we prefer to use a single hash-for-home
189 	 * page, since this means atomic operations are less
190 	 * likely to encounter a TLB fault and thus should
191 	 * in general perform faster.  You may wish to disable
192 	 * this in situations where few hash-for-home tiles
193 	 * are configured.
194 	 */
195 	BUG_ON((unsigned long)atomic_locks % PAGE_SIZE != 0);
196 
197 	/* The locks must all fit on one page. */
198 	BUILD_BUG_ON(ATOMIC_HASH_SIZE * sizeof(int) > PAGE_SIZE);
199 
200 	/*
201 	 * We use the page offset of the atomic value's address as
202 	 * an index into atomic_locks, excluding the low 3 bits.
203 	 * That should not produce more indices than ATOMIC_HASH_SIZE.
204 	 */
205 	BUILD_BUG_ON((PAGE_SIZE >> 3) > ATOMIC_HASH_SIZE);
206 }
207