H. Peter Anvin | 1965aae | 2008-10-22 22:26:29 -0700 | [diff] [blame] | 1 | #ifndef _ASM_X86_PERCPU_H |
| 2 | #define _ASM_X86_PERCPU_H |
travis@sgi.com | 3334052 | 2008-01-30 13:32:53 +0100 | [diff] [blame] | 3 | |
/*
 * Per-cpu data is reached through a segment register: gs together with
 * 64-bit moves on x86_64, fs together with 32-bit moves otherwise.
 */
#if defined(CONFIG_X86_64)
# define __percpu_seg		gs
# define __percpu_mov_op	movq
#else
# define __percpu_seg		fs
# define __percpu_mov_op	movl
#endif
travis@sgi.com | 3334052 | 2008-01-30 13:32:53 +0100 | [diff] [blame] | 11 | |
| 12 | #ifdef __ASSEMBLY__ |
| 13 | |
| 14 | /* |
| 15 | * PER_CPU finds an address of a per-cpu variable. |
| 16 | * |
| 17 | * Args: |
| 18 | * var - variable name |
| 19 | * reg - register of native width (32bit on i386, 64bit on x86_64) |
| 20 | * |
| 21 | * The resulting address is stored in the "reg" argument. |
| 22 | * |
| 23 | * Example: |
| 24 | * PER_CPU(cpu_gdt_descr, %ebx) |
| 25 | */ |
#if defined(CONFIG_SMP)
/*
 * SMP: load this_cpu_off through the per-cpu segment into reg, then add
 * the variable's own offset with lea.
 */
# define PER_CPU(var, reg)						\
	__percpu_mov_op %__percpu_seg:this_cpu_off, reg;		\
	lea var(reg), reg
# define PER_CPU_VAR(var)	%__percpu_seg:var
#else /* !CONFIG_SMP */
/* UP: the symbol's address is used directly, without a segment prefix. */
# define PER_CPU(var, reg)	__percpu_mov_op $var, reg
# define PER_CPU_VAR(var)	var
#endif /* CONFIG_SMP */
| 35 | |
/*
 * Assembler-side spelling of init_per_cpu_var(): the symbol gains an
 * init_per_cpu__ prefix on 64-bit SMP builds and is used as-is elsewhere.
 */
#ifndef CONFIG_X86_64_SMP
# define INIT_PER_CPU_VAR(var)	var
#else
# define INIT_PER_CPU_VAR(var)	init_per_cpu__##var
#endif
| 41 | |
travis@sgi.com | 3334052 | 2008-01-30 13:32:53 +0100 | [diff] [blame] | 42 | #else /* ...!ASSEMBLY */ |
| 43 | |
Tejun Heo | e59a1bb | 2009-06-22 11:56:24 +0900 | [diff] [blame] | 44 | #include <linux/kernel.h> |
Tejun Heo | 9939dda | 2009-01-13 20:41:35 +0900 | [diff] [blame] | 45 | #include <linux/stringify.h> |
| 46 | |
#if defined(CONFIG_SMP)
/* Segment-override text placed in front of every per-cpu asm operand. */
# define __percpu_prefix	"%%"__stringify(__percpu_seg)":"
# define __my_cpu_offset	percpu_read(this_cpu_off)

/*
 * __this_cpu_ptr - translate a per-cpu pointer into this CPU's address.
 * @ptr: per-cpu pointer (checked by __verify_pcpu_ptr())
 *
 * A single "add" of the segment-relative this_cpu_off is applied to @ptr.
 * Compared to the generic version built on __my_cpu_offset this saves one
 * instruction and avoids clobbering a temporary register.
 */
# define __this_cpu_ptr(ptr)						\
({									\
	unsigned long this_addr__;					\
									\
	__verify_pcpu_ptr(ptr);						\
	asm volatile("add " __percpu_arg(1) ", %0"			\
		     : "=r" (this_addr__)				\
		     : "m" (this_cpu_off), "0" (ptr));			\
	(typeof(*(ptr)) __kernel __force *)this_addr__;			\
})
#else /* !CONFIG_SMP */
/* UP: per-cpu operands carry no segment prefix. */
# define __percpu_prefix	""
#endif /* CONFIG_SMP */

/* Asm template text for operand number x, addressed as per-cpu memory. */
#define __percpu_arg(x)		__percpu_prefix "%P" #x
| 69 | |
/*
 * Pointers to per-cpu variables that are initialized at build time and
 * needed by the boot processor have to name the variable through these
 * macros, so that on SMP the address is offset from __per_cpu_load.
 *
 * Each such variable also needs an entry in vmlinux_64.lds.S.
 */
#ifdef CONFIG_X86_64_SMP
# define init_per_cpu_var(var)	init_per_cpu__##var
#else
# define init_per_cpu_var(var)	var
#endif

/* Declare the init_per_cpu_var() alias of var with var's own type. */
#define DECLARE_INIT_PER_CPU(var)					\
	extern typeof(var) init_per_cpu_var(var)
| 85 | |
/*
 * Arch-specific code may use the direct single-instruction operations
 * below; note that they do not yield an lvalue.
 */
extern void __bad_percpu_size(void);

/*
 * percpu_to_op - apply "op val, var" to the per-cpu variable var.
 * @op:  instruction mnemonic without size suffix (e.g. "mov", "and")
 * @var: per-cpu variable of 1, 2, 4 or 8 bytes
 * @val: source operand; it must be assignable to typeof(var)
 *
 * The operand-size suffix is picked from sizeof(var).  Any other size
 * ends up calling __bad_percpu_size(), which is only declared here
 * (presumably so that an unsupported size fails at link time).
 */
#define percpu_to_op(op, var, val)					\
do {									\
	typedef typeof(var) pto_type__;					\
									\
	/* never executed: only checks that val converts to var's type */ \
	if (0) {							\
		pto_type__ pto_probe__;					\
		pto_probe__ = (val);					\
		(void)pto_probe__;					\
	}								\
	switch (sizeof(var)) {						\
	case 1:								\
		asm(op "b %1,"__percpu_arg(0)				\
		    : "+m" (var)					\
		    : "qi" ((pto_type__)(val)));			\
		break;							\
	case 2:								\
		asm(op "w %1,"__percpu_arg(0)				\
		    : "+m" (var)					\
		    : "ri" ((pto_type__)(val)));			\
		break;							\
	case 4:								\
		asm(op "l %1,"__percpu_arg(0)				\
		    : "+m" (var)					\
		    : "ri" ((pto_type__)(val)));			\
		break;							\
	case 8:								\
		asm(op "q %1,"__percpu_arg(0)				\
		    : "+m" (var)					\
		    : "re" ((pto_type__)(val)));			\
		break;							\
	default:							\
		__bad_percpu_size();					\
	}								\
} while (0)
travis@sgi.com | 3334052 | 2008-01-30 13:32:53 +0100 | [diff] [blame] | 122 | |
/*
 * percpu_add_op - add val to the per-cpu variable var in memory.
 * @var: per-cpu variable of 1, 2, 4 or 8 bytes
 * @val: addend; it must be assignable to typeof(var)
 *
 * When val is the compile-time constant 1 or -1 the shorter inc/dec
 * instruction is emitted instead of add.
 */
#define percpu_add_op(var, val)						\
do {									\
	typedef typeof(var) pao_type__;					\
	/* 1 or -1 when val is that compile-time constant, otherwise 0 */ \
	const int pao_unit__ = (__builtin_constant_p(val) &&		\
				((val) == 1 || (val) == -1)) ? (val) : 0; \
									\
	/* never executed: only checks that val converts to var's type */ \
	if (0) {							\
		pao_type__ pao_probe__;					\
		pao_probe__ = (val);					\
		(void)pao_probe__;					\
	}								\
	switch (sizeof(var)) {						\
	case 1:								\
		if (pao_unit__ == 1)					\
			asm("incb "__percpu_arg(0) : "+m" (var));	\
		else if (pao_unit__ == -1)				\
			asm("decb "__percpu_arg(0) : "+m" (var));	\
		else							\
			asm("addb %1, "__percpu_arg(0)			\
			    : "+m" (var)				\
			    : "qi" ((pao_type__)(val)));		\
		break;							\
	case 2:								\
		if (pao_unit__ == 1)					\
			asm("incw "__percpu_arg(0) : "+m" (var));	\
		else if (pao_unit__ == -1)				\
			asm("decw "__percpu_arg(0) : "+m" (var));	\
		else							\
			asm("addw %1, "__percpu_arg(0)			\
			    : "+m" (var)				\
			    : "ri" ((pao_type__)(val)));		\
		break;							\
	case 4:								\
		if (pao_unit__ == 1)					\
			asm("incl "__percpu_arg(0) : "+m" (var));	\
		else if (pao_unit__ == -1)				\
			asm("decl "__percpu_arg(0) : "+m" (var));	\
		else							\
			asm("addl %1, "__percpu_arg(0)			\
			    : "+m" (var)				\
			    : "ri" ((pao_type__)(val)));		\
		break;							\
	case 8:								\
		if (pao_unit__ == 1)					\
			asm("incq "__percpu_arg(0) : "+m" (var));	\
		else if (pao_unit__ == -1)				\
			asm("decq "__percpu_arg(0) : "+m" (var));	\
		else							\
			asm("addq %1, "__percpu_arg(0)			\
			    : "+m" (var)				\
			    : "re" ((pao_type__)(val)));		\
		break;							\
	default:							\
		__bad_percpu_size();					\
	}								\
} while (0)
| 181 | |
/*
 * percpu_from_op - run "op var, reg" and return the register's value.
 * @op:         instruction mnemonic without size suffix (e.g. "mov")
 * @var:        per-cpu variable of 1, 2, 4 or 8 bytes
 * @constraint: complete asm input operand describing var, such as
 *              "m" (var)
 *
 * The result has the type of var.
 */
#define percpu_from_op(op, var, constraint)				\
({									\
	typeof(var) pfo_val__;						\
									\
	switch (sizeof(var)) {						\
	case 1:								\
		asm(op "b "__percpu_arg(1)",%0"				\
		    : "=q" (pfo_val__)					\
		    : constraint);					\
		break;							\
	case 2:								\
		asm(op "w "__percpu_arg(1)",%0"				\
		    : "=r" (pfo_val__)					\
		    : constraint);					\
		break;							\
	case 4:								\
		asm(op "l "__percpu_arg(1)",%0"				\
		    : "=r" (pfo_val__)					\
		    : constraint);					\
		break;							\
	case 8:								\
		asm(op "q "__percpu_arg(1)",%0"				\
		    : "=r" (pfo_val__)					\
		    : constraint);					\
		break;							\
	default:							\
		__bad_percpu_size();					\
	}								\
	pfo_val__;							\
})
travis@sgi.com | 3334052 | 2008-01-30 13:32:53 +0100 | [diff] [blame] | 210 | |
/*
 * percpu_unary_op - apply a one-operand instruction to a per-cpu variable.
 * @op:  instruction mnemonic without size suffix (e.g. "inc")
 * @var: per-cpu variable of 1, 2, 4 or 8 bytes, modified in place
 */
#define percpu_unary_op(op, var)					\
({									\
	switch (sizeof(var)) {						\
	case 1:								\
		asm(op "b "__percpu_arg(0) : "+m" (var));		\
		break;							\
	case 2:								\
		asm(op "w "__percpu_arg(0) : "+m" (var));		\
		break;							\
	case 4:								\
		asm(op "l "__percpu_arg(0) : "+m" (var));		\
		break;							\
	case 8:								\
		asm(op "q "__percpu_arg(0) : "+m" (var));		\
		break;							\
	default:							\
		__bad_percpu_size();					\
	}								\
})
| 233 | |
/*
 * percpu_add_return_op - add val to a per-cpu variable, return the result.
 * @var: per-cpu variable of 1, 2, 4 or 8 bytes
 * @val: addend
 *
 * xadd stores the sum in memory and leaves the previous contents in the
 * register operand, so the addend is added once more to obtain the new
 * value that is returned.
 *
 * @val is evaluated exactly once (an argument with side effects used to
 * be expanded twice) and is converted to typeof(var) up front.  The
 * register operand uses a plain "r" constraint for the 8-byte case since
 * xadd cannot take an immediate.
 */
#define percpu_add_return_op(var, val)					\
({									\
	typeof(var) paro_inc__ = (val);					\
	typeof(var) paro_ret__ = paro_inc__;				\
									\
	switch (sizeof(var)) {						\
	case 1:								\
		asm("xaddb %0, "__percpu_arg(1)				\
		    : "+q" (paro_ret__), "+m" (var)			\
		    : : "memory");					\
		break;							\
	case 2:								\
		asm("xaddw %0, "__percpu_arg(1)				\
		    : "+r" (paro_ret__), "+m" (var)			\
		    : : "memory");					\
		break;							\
	case 4:								\
		asm("xaddl %0, "__percpu_arg(1)				\
		    : "+r" (paro_ret__), "+m" (var)			\
		    : : "memory");					\
		break;							\
	case 8:								\
		asm("xaddq %0, "__percpu_arg(1)				\
		    : "+r" (paro_ret__), "+m" (var)			\
		    : : "memory");					\
		break;							\
	default:							\
		__bad_percpu_size();					\
	}								\
	/* paro_ret__ now holds the old value; turn it into the new one */ \
	paro_ret__ += paro_inc__;					\
	paro_ret__;							\
})
| 266 | |
/*
 * percpu_xchg_op - store nval in a per-cpu variable, return the old value.
 * @var:  per-cpu variable of 1, 2, 4 or 8 bytes
 * @nval: value to store
 *
 * The exchange is built from a cmpxchg loop without a lock prefix.  A real
 * xchg is expensive because of its implied lock prefix, and the processor
 * cannot prefetch cachelines when xchg is used.
 */
#define percpu_xchg_op(var, nval)					\
({									\
	typeof(var) pxo_prev__;						\
	typeof(var) pxo_next__ = (nval);				\
									\
	switch (sizeof(var)) {						\
	case 1:								\
		asm("\n\tmov "__percpu_arg(1)",%%al"			\
		    "\n1:\tcmpxchgb %2, "__percpu_arg(1)		\
		    "\n\tjnz 1b"					\
		    : "=&a" (pxo_prev__), "+m" (var)			\
		    : "q" (pxo_next__)					\
		    : "memory");					\
		break;							\
	case 2:								\
		asm("\n\tmov "__percpu_arg(1)",%%ax"			\
		    "\n1:\tcmpxchgw %2, "__percpu_arg(1)		\
		    "\n\tjnz 1b"					\
		    : "=&a" (pxo_prev__), "+m" (var)			\
		    : "r" (pxo_next__)					\
		    : "memory");					\
		break;							\
	case 4:								\
		asm("\n\tmov "__percpu_arg(1)",%%eax"			\
		    "\n1:\tcmpxchgl %2, "__percpu_arg(1)		\
		    "\n\tjnz 1b"					\
		    : "=&a" (pxo_prev__), "+m" (var)			\
		    : "r" (pxo_next__)					\
		    : "memory");					\
		break;							\
	case 8:								\
		asm("\n\tmov "__percpu_arg(1)",%%rax"			\
		    "\n1:\tcmpxchgq %2, "__percpu_arg(1)		\
		    "\n\tjnz 1b"					\
		    : "=&a" (pxo_prev__), "+m" (var)			\
		    : "r" (pxo_next__)					\
		    : "memory");					\
		break;							\
	default:							\
		__bad_percpu_size();					\
	}								\
	pxo_prev__;							\
})
| 313 | |
/*
 * percpu_cmpxchg_op - compare-and-exchange on a per-cpu variable.
 * @var:  per-cpu variable of 1, 2, 4 or 8 bytes
 * @oval: value expected in var
 * @nval: value offered as the replacement
 *
 * Returns whatever cmpxchg leaves in the accumulator.  Unlike xchg,
 * cmpxchg has no implied lock semantics, which makes it much more
 * efficient for cpu-local operations.
 */
#define percpu_cmpxchg_op(var, oval, nval)				\
({									\
	typeof(var) pco_seen__;						\
	typeof(var) pco_expect__ = (oval);				\
	typeof(var) pco_repl__ = (nval);				\
									\
	switch (sizeof(var)) {						\
	case 1:								\
		asm("cmpxchgb %2, "__percpu_arg(1)			\
		    : "=a" (pco_seen__), "+m" (var)			\
		    : "q" (pco_repl__), "0" (pco_expect__)		\
		    : "memory");					\
		break;							\
	case 2:								\
		asm("cmpxchgw %2, "__percpu_arg(1)			\
		    : "=a" (pco_seen__), "+m" (var)			\
		    : "r" (pco_repl__), "0" (pco_expect__)		\
		    : "memory");					\
		break;							\
	case 4:								\
		asm("cmpxchgl %2, "__percpu_arg(1)			\
		    : "=a" (pco_seen__), "+m" (var)			\
		    : "r" (pco_repl__), "0" (pco_expect__)		\
		    : "memory");					\
		break;							\
	case 8:								\
		asm("cmpxchgq %2, "__percpu_arg(1)			\
		    : "=a" (pco_seen__), "+m" (var)			\
		    : "r" (pco_repl__), "0" (pco_expect__)		\
		    : "memory");					\
		break;							\
	default:							\
		__bad_percpu_size();					\
	}								\
	pco_seen__;							\
})
| 352 | |
/*
 * percpu_read() makes gcc load the percpu variable every time it is
 * accessed, while percpu_read_stable() allows the value to be cached.
 * percpu_read_stable() is more efficient and can be used if its value
 * is guaranteed to be valid across cpus.  The current users include
 * get_current() and get_thread_info(), both of which are actually
 * per-thread variables implemented as per-cpu variables and thus
 * stable for the duration of the respective task.
 *
 * percpu_sub() negates val only after converting it to the type of var.
 * Negating in val's own type would zero-extend an unsigned val that is
 * narrower than var, turning the subtraction into a large addition.
 */
#define percpu_read(var)		percpu_from_op("mov", var, "m" (var))
#define percpu_read_stable(var)		percpu_from_op("mov", var, "p" (&(var)))
#define percpu_write(var, val)		percpu_to_op("mov", var, val)
#define percpu_add(var, val)		percpu_add_op(var, val)
#define percpu_sub(var, val)		percpu_add_op(var, -(typeof(var))(val))
#define percpu_and(var, val)		percpu_to_op("and", var, val)
#define percpu_or(var, val)		percpu_to_op("or", var, val)
#define percpu_xor(var, val)		percpu_to_op("xor", var, val)
#define percpu_inc(var)			percpu_unary_op("inc", var)
Tejun Heo | 9939dda | 2009-01-13 20:41:35 +0900 | [diff] [blame] | 371 | |
/*
 * __this_cpu_*() operations on 1-, 2- and 4-byte per-cpu data, each mapped
 * onto one of the single-instruction helpers defined earlier in this file.
 */
#define __this_cpu_read_1(pcp)		percpu_from_op("mov", (pcp), "m"(pcp))
#define __this_cpu_read_2(pcp)		percpu_from_op("mov", (pcp), "m"(pcp))
#define __this_cpu_read_4(pcp)		percpu_from_op("mov", (pcp), "m"(pcp))

#define __this_cpu_write_1(pcp, val)	percpu_to_op("mov", (pcp), val)
#define __this_cpu_write_2(pcp, val)	percpu_to_op("mov", (pcp), val)
#define __this_cpu_write_4(pcp, val)	percpu_to_op("mov", (pcp), val)
#define __this_cpu_add_1(pcp, val)	percpu_add_op((pcp), val)
#define __this_cpu_add_2(pcp, val)	percpu_add_op((pcp), val)
#define __this_cpu_add_4(pcp, val)	percpu_add_op((pcp), val)
#define __this_cpu_and_1(pcp, val)	percpu_to_op("and", (pcp), val)
#define __this_cpu_and_2(pcp, val)	percpu_to_op("and", (pcp), val)
#define __this_cpu_and_4(pcp, val)	percpu_to_op("and", (pcp), val)
#define __this_cpu_or_1(pcp, val)	percpu_to_op("or", (pcp), val)
#define __this_cpu_or_2(pcp, val)	percpu_to_op("or", (pcp), val)
#define __this_cpu_or_4(pcp, val)	percpu_to_op("or", (pcp), val)
#define __this_cpu_xor_1(pcp, val)	percpu_to_op("xor", (pcp), val)
#define __this_cpu_xor_2(pcp, val)	percpu_to_op("xor", (pcp), val)
#define __this_cpu_xor_4(pcp, val)	percpu_to_op("xor", (pcp), val)
/*
 * Generic fallback operations for __this_cpu_xchg_[1-4] are okay and much
 * faster than an xchg with forced lock semantics.
 *
 * The 8-byte variants expand to 64-bit instructions (movq/cmpxchgq using
 * %rax), so they are provided on x86_64 only.  Elsewhere the names stay
 * undefined; NOTE(review): this relies on the generic percpu header
 * supplying the fallbacks on 32-bit -- confirm.
 */
#ifdef CONFIG_X86_64
#define __this_cpu_xchg_8(pcp, nval)	percpu_xchg_op(pcp, nval)
#define __this_cpu_cmpxchg_8(pcp, oval, nval)	percpu_cmpxchg_op(pcp, oval, nval)
#endif
Christoph Lameter | 30ed1a7 | 2009-10-03 19:48:22 +0900 | [diff] [blame] | 397 | |
/* this_cpu_*() operations on 1-, 2- and 4-byte per-cpu data. */

/* loads and stores */
#define this_cpu_read_1(pcp)		percpu_from_op("mov", (pcp), "m"(pcp))
#define this_cpu_read_2(pcp)		percpu_from_op("mov", (pcp), "m"(pcp))
#define this_cpu_read_4(pcp)		percpu_from_op("mov", (pcp), "m"(pcp))
#define this_cpu_write_1(pcp, val)	percpu_to_op("mov", (pcp), val)
#define this_cpu_write_2(pcp, val)	percpu_to_op("mov", (pcp), val)
#define this_cpu_write_4(pcp, val)	percpu_to_op("mov", (pcp), val)

/* arithmetic and bitwise read-modify-write */
#define this_cpu_add_1(pcp, val)	percpu_add_op((pcp), val)
#define this_cpu_add_2(pcp, val)	percpu_add_op((pcp), val)
#define this_cpu_add_4(pcp, val)	percpu_add_op((pcp), val)
#define this_cpu_and_1(pcp, val)	percpu_to_op("and", (pcp), val)
#define this_cpu_and_2(pcp, val)	percpu_to_op("and", (pcp), val)
#define this_cpu_and_4(pcp, val)	percpu_to_op("and", (pcp), val)
#define this_cpu_or_1(pcp, val)		percpu_to_op("or", (pcp), val)
#define this_cpu_or_2(pcp, val)		percpu_to_op("or", (pcp), val)
#define this_cpu_or_4(pcp, val)		percpu_to_op("or", (pcp), val)
#define this_cpu_xor_1(pcp, val)	percpu_to_op("xor", (pcp), val)
#define this_cpu_xor_2(pcp, val)	percpu_to_op("xor", (pcp), val)
#define this_cpu_xor_4(pcp, val)	percpu_to_op("xor", (pcp), val)

/* exchange */
#define this_cpu_xchg_1(pcp, nval)	percpu_xchg_op(pcp, nval)
#define this_cpu_xchg_2(pcp, nval)	percpu_xchg_op(pcp, nval)
#define this_cpu_xchg_4(pcp, nval)	percpu_xchg_op(pcp, nval)
Christoph Lameter | 30ed1a7 | 2009-10-03 19:48:22 +0900 | [diff] [blame] | 419 | |
/*
 * irqsafe_cpu_*() operations on 1-, 2- and 4-byte per-cpu data.  They
 * expand to the same helpers as the this_cpu_*() forms.
 */
#define irqsafe_cpu_add_1(pcp, val)	percpu_add_op((pcp), val)
#define irqsafe_cpu_add_2(pcp, val)	percpu_add_op((pcp), val)
#define irqsafe_cpu_add_4(pcp, val)	percpu_add_op((pcp), val)

#define irqsafe_cpu_and_1(pcp, val)	percpu_to_op("and", (pcp), val)
#define irqsafe_cpu_and_2(pcp, val)	percpu_to_op("and", (pcp), val)
#define irqsafe_cpu_and_4(pcp, val)	percpu_to_op("and", (pcp), val)

#define irqsafe_cpu_or_1(pcp, val)	percpu_to_op("or", (pcp), val)
#define irqsafe_cpu_or_2(pcp, val)	percpu_to_op("or", (pcp), val)
#define irqsafe_cpu_or_4(pcp, val)	percpu_to_op("or", (pcp), val)

#define irqsafe_cpu_xor_1(pcp, val)	percpu_to_op("xor", (pcp), val)
#define irqsafe_cpu_xor_2(pcp, val)	percpu_to_op("xor", (pcp), val)
#define irqsafe_cpu_xor_4(pcp, val)	percpu_to_op("xor", (pcp), val)

#define irqsafe_cpu_xchg_1(pcp, nval)	percpu_xchg_op(pcp, nval)
#define irqsafe_cpu_xchg_2(pcp, nval)	percpu_xchg_op(pcp, nval)
#define irqsafe_cpu_xchg_4(pcp, nval)	percpu_xchg_op(pcp, nval)
Christoph Lameter | 30ed1a7 | 2009-10-03 19:48:22 +0900 | [diff] [blame] | 435 | |
/*
 * The xadd- and cmpxchg-based operations are left out when CONFIG_M386 is
 * set (presumably because the 80386 lacks those instructions).
 */
#if !defined(CONFIG_M386)

/* add-and-return */
#define __this_cpu_add_return_1(pcp, val)	percpu_add_return_op(pcp, val)
#define __this_cpu_add_return_2(pcp, val)	percpu_add_return_op(pcp, val)
#define __this_cpu_add_return_4(pcp, val)	percpu_add_return_op(pcp, val)
#define this_cpu_add_return_1(pcp, val)		percpu_add_return_op(pcp, val)
#define this_cpu_add_return_2(pcp, val)		percpu_add_return_op(pcp, val)
#define this_cpu_add_return_4(pcp, val)		percpu_add_return_op(pcp, val)

/* compare-and-exchange */
#define __this_cpu_cmpxchg_1(pcp, oval, nval)	percpu_cmpxchg_op(pcp, oval, nval)
#define __this_cpu_cmpxchg_2(pcp, oval, nval)	percpu_cmpxchg_op(pcp, oval, nval)
#define __this_cpu_cmpxchg_4(pcp, oval, nval)	percpu_cmpxchg_op(pcp, oval, nval)
#define this_cpu_cmpxchg_1(pcp, oval, nval)	percpu_cmpxchg_op(pcp, oval, nval)
#define this_cpu_cmpxchg_2(pcp, oval, nval)	percpu_cmpxchg_op(pcp, oval, nval)
#define this_cpu_cmpxchg_4(pcp, oval, nval)	percpu_cmpxchg_op(pcp, oval, nval)
#define irqsafe_cpu_cmpxchg_1(pcp, oval, nval)	percpu_cmpxchg_op(pcp, oval, nval)
#define irqsafe_cpu_cmpxchg_2(pcp, oval, nval)	percpu_cmpxchg_op(pcp, oval, nval)
#define irqsafe_cpu_cmpxchg_4(pcp, oval, nval)	percpu_cmpxchg_op(pcp, oval, nval)

#endif /* !CONFIG_M386 */
| 455 | |
#ifdef CONFIG_X86_CMPXCHG64
/*
 * percpu_cmpxchg8b_double - compare-and-exchange an 8-byte per-cpu pair.
 * @pcp1:   first per-cpu word; cmpxchg8b operates on the 8 bytes starting
 *          at it (assumes the second word directly follows -- TODO confirm
 *          against callers)
 * @o1, @o2: expected values, passed in eax and edx
 * @n1, @n2: replacement values, passed in ebx and ecx
 *
 * Evaluates to the result of "setz", i.e. nonzero when the zero flag was
 * set by cmpxchg8b.
 *
 * The memory operand is read as well as written, hence "+m".  Only the
 * first word can be named as an operand, so a "memory" clobber tells the
 * compiler that the rest of the pair may change too (the 16-byte variant
 * in this file does the same).  Every argument is evaluated exactly once.
 */
#define percpu_cmpxchg8b_double(pcp1, o1, o2, n1, n2)			\
({									\
	char __ret;							\
	typeof(o1) __o1 = (o1);						\
	typeof(o1) __n1 = (n1);						\
	typeof(o2) __o2 = (o2);						\
	typeof(o2) __n2 = (n2);						\
	typeof(o2) __dummy;	/* receives edx; value is not used */	\
	asm volatile("cmpxchg8b "__percpu_arg(1)"\n\tsetz %0\n\t"	\
		     : "=a"(__ret), "+m" (pcp1), "=d"(__dummy)		\
		     : "b"(__n1), "c"(__n2), "a"(__o1), "d"(__o2)	\
		     : "memory");					\
	__ret;								\
})

#define __this_cpu_cmpxchg_double_4(pcp1, pcp2, o1, o2, n1, n2)		percpu_cmpxchg8b_double(pcp1, o1, o2, n1, n2)
#define this_cpu_cmpxchg_double_4(pcp1, pcp2, o1, o2, n1, n2)		percpu_cmpxchg8b_double(pcp1, o1, o2, n1, n2)
#define irqsafe_cpu_cmpxchg_double_4(pcp1, pcp2, o1, o2, n1, n2)	percpu_cmpxchg8b_double(pcp1, o1, o2, n1, n2)
#endif /* CONFIG_X86_CMPXCHG64 */
| 475 | |
Christoph Lameter | 30ed1a7 | 2009-10-03 19:48:22 +0900 | [diff] [blame] | 476 | /* |
| 477 | * Per cpu atomic 64 bit operations are only available under 64 bit. |
| 478 | * 32 bit must fall back to generic operations. |
| 479 | */ |
| 480 | #ifdef CONFIG_X86_64 |
/* __this_cpu_*() on 8-byte per-cpu data */
#define __this_cpu_read_8(pcp)			percpu_from_op("mov", (pcp), "m"(pcp))
#define __this_cpu_write_8(pcp, val)		percpu_to_op("mov", (pcp), val)
#define __this_cpu_add_8(pcp, val)		percpu_add_op((pcp), val)
#define __this_cpu_and_8(pcp, val)		percpu_to_op("and", (pcp), val)
#define __this_cpu_or_8(pcp, val)		percpu_to_op("or", (pcp), val)
#define __this_cpu_xor_8(pcp, val)		percpu_to_op("xor", (pcp), val)
#define __this_cpu_add_return_8(pcp, val)	percpu_add_return_op(pcp, val)

/* this_cpu_*() on 8-byte per-cpu data */
#define this_cpu_read_8(pcp)			percpu_from_op("mov", (pcp), "m"(pcp))
#define this_cpu_write_8(pcp, val)		percpu_to_op("mov", (pcp), val)
#define this_cpu_add_8(pcp, val)		percpu_add_op((pcp), val)
#define this_cpu_and_8(pcp, val)		percpu_to_op("and", (pcp), val)
#define this_cpu_or_8(pcp, val)			percpu_to_op("or", (pcp), val)
#define this_cpu_xor_8(pcp, val)		percpu_to_op("xor", (pcp), val)
#define this_cpu_add_return_8(pcp, val)		percpu_add_return_op(pcp, val)
#define this_cpu_xchg_8(pcp, nval)		percpu_xchg_op(pcp, nval)
#define this_cpu_cmpxchg_8(pcp, oval, nval)	percpu_cmpxchg_op(pcp, oval, nval)

/* irqsafe_cpu_*() on 8-byte per-cpu data */
#define irqsafe_cpu_add_8(pcp, val)		percpu_add_op((pcp), val)
#define irqsafe_cpu_and_8(pcp, val)		percpu_to_op("and", (pcp), val)
#define irqsafe_cpu_or_8(pcp, val)		percpu_to_op("or", (pcp), val)
#define irqsafe_cpu_xor_8(pcp, val)		percpu_to_op("xor", (pcp), val)
#define irqsafe_cpu_xchg_8(pcp, nval)		percpu_xchg_op(pcp, nval)
#define irqsafe_cpu_cmpxchg_8(pcp, oval, nval)	percpu_cmpxchg_op(pcp, oval, nval)
Christoph Lameter | b9ec40a | 2011-02-28 11:02:24 +0100 | [diff] [blame] | 505 | |
| 506 | /* |
| 507 | * Pretty complex macro to generate cmpxchg16 instruction. The instruction |
| 508 | * is not supported on early AMD64 processors so we must be able to emulate |
| 509 | * it in software. The address used in the cmpxchg16 instruction must be |
| 510 | * aligned to a 16 byte boundary. |
| 511 | */ |
Eric Dumazet | 5f55924 | 2011-03-28 18:06:58 +0200 | [diff] [blame] | 512 | #ifdef CONFIG_SMP |
Linus Torvalds | 5129df0 | 2011-05-24 11:53:42 -0700 | [diff] [blame] | 513 | #define CMPXCHG16B_EMU_CALL "call this_cpu_cmpxchg16b_emu\n\t" ASM_NOP3 |
Eric Dumazet | 5f55924 | 2011-03-28 18:06:58 +0200 | [diff] [blame] | 514 | #else |
Linus Torvalds | 5129df0 | 2011-05-24 11:53:42 -0700 | [diff] [blame] | 515 | #define CMPXCHG16B_EMU_CALL "call this_cpu_cmpxchg16b_emu\n\t" ASM_NOP2 |
Eric Dumazet | 5f55924 | 2011-03-28 18:06:58 +0200 | [diff] [blame] | 516 | #endif |
/*
 * percpu_cmpxchg16b_double - 16-byte compare-and-exchange on per-cpu data
 * @pcp1: per-cpu lvalue at the start of the 16-byte area; only its address
 *        is used (passed in %rsi)
 * @o1:   expected old value, passed in %rax
 * @o2:   expected old value, passed in %rdx
 * @n1:   new value, passed in %rbx
 * @n2:   new value, passed in %rcx
 *
 * Evaluates to the byte left in %al by the selected instruction sequence.
 * With X86_FEATURE_CX16 that is "cmpxchg16b; setz", i.e. 1 when the exchange
 * happened and 0 otherwise.  Without the feature the sequence is a call to
 * this_cpu_cmpxchg16b_emu, which is presumably expected to leave the same
 * flag in %al.
 *
 * All arguments are evaluated exactly once and are parenthesized at their
 * point of use, so arbitrary expressions may be passed.  __dummy exists only
 * to declare %rdx as an output, since the instruction may overwrite it.
 *
 * NOTE(review): the local copies take their types from @o1/@o2 rather than
 * from the per-cpu variables.  A caller passing a narrower expression (e.g.
 * a plain int constant) would get a narrower register operand -- confirm
 * that all callers pass values of the variables' own types.
 */
#define percpu_cmpxchg16b_double(pcp1, o1, o2, n1, n2)			\
({									\
	char __ret;							\
	typeof(o1) __o1 = (o1);						\
	typeof(o1) __n1 = (n1);						\
	typeof(o2) __o2 = (o2);						\
	typeof(o2) __n2 = (n2);						\
	typeof(o2) __dummy;						\
	alternative_io(CMPXCHG16B_EMU_CALL,				\
		       "cmpxchg16b " __percpu_prefix "(%%rsi)\n\tsetz %0\n\t",	\
		       X86_FEATURE_CX16,				\
		       ASM_OUTPUT2("=a"(__ret), "=d"(__dummy)),		\
		       "S" (&(pcp1)), "b"(__n1), "c"(__n2),		\
		       "a"(__o1), "d"(__o2) : "memory");		\
	__ret;								\
})
| 533 | |
/*
 * cmpxchg_double entry points for the "_8" flavour.  All three variants
 * (__this_cpu, this_cpu and irqsafe_cpu) map onto the same
 * percpu_cmpxchg16b_double() expansion.
 *
 * pcp2 is accepted but not forwarded: the underlying operation is addressed
 * through pcp1 alone, so pcp2 presumably has to be the 8 bytes that
 * immediately follow pcp1 in memory.
 */
#define __this_cpu_cmpxchg_double_8(pcp1, pcp2, o1, o2, n1, n2)		\
	percpu_cmpxchg16b_double(pcp1, o1, o2, n1, n2)

#define this_cpu_cmpxchg_double_8(pcp1, pcp2, o1, o2, n1, n2)		\
	percpu_cmpxchg16b_double(pcp1, o1, o2, n1, n2)

#define irqsafe_cpu_cmpxchg_double_8(pcp1, pcp2, o1, o2, n1, n2)	\
	percpu_cmpxchg16b_double(pcp1, o1, o2, n1, n2)
| 537 | |
Christoph Lameter | 30ed1a7 | 2009-10-03 19:48:22 +0900 | [diff] [blame] | 538 | #endif |
| 539 | |
/*
 * x86_test_and_clear_bit_percpu - clear a bit in a per-cpu variable
 * @bit: number of the bit to clear
 * @var: per-cpu lvalue holding the bit
 *
 * Clears the bit with "btr" and converts the resulting carry flag into the
 * value of the expression: 0 if the bit was clear before, -1 (all ones) if
 * it was set.
 *
 * The operation is not atomic with respect to other CPUs, so the caller
 * must keep preemption disabled around it.
 */
#define x86_test_and_clear_bit_percpu(bit, var)				\
({									\
	int prev__;							\
	asm volatile("btr %2,"__percpu_arg(1)"\n\tsbbl %0,%0"		\
		     : "=r" (prev__), "+m" (var)			\
		     : "dIr" (bit));					\
	prev__;								\
})
| 549 | |
Christoph Lameter | 349c004 | 2011-03-12 12:50:10 +0100 | [diff] [blame] | 550 | static __always_inline int x86_this_cpu_constant_test_bit(unsigned int nr, |
| 551 | const unsigned long __percpu *addr) |
| 552 | { |
| 553 | unsigned long __percpu *a = (unsigned long *)addr + nr / BITS_PER_LONG; |
| 554 | |
| 555 | return ((1UL << (nr % BITS_PER_LONG)) & percpu_read(*a)) != 0; |
| 556 | } |
| 557 | |
| 558 | static inline int x86_this_cpu_variable_test_bit(int nr, |
| 559 | const unsigned long __percpu *addr) |
| 560 | { |
| 561 | int oldbit; |
| 562 | |
| 563 | asm volatile("bt "__percpu_arg(2)",%1\n\t" |
| 564 | "sbb %0,%0" |
| 565 | : "=r" (oldbit) |
| 566 | : "m" (*(unsigned long *)addr), "Ir" (nr)); |
| 567 | |
| 568 | return oldbit; |
| 569 | } |
| 570 | |
/*
 * x86_this_cpu_test_bit - test a bit in a per-cpu bitmap
 * @nr:   bit number
 * @addr: per-cpu pointer to the first word of the bitmap
 *
 * Dispatches on whether @nr is a compile-time constant: constant bit numbers
 * use the C implementation, everything else uses the "bt" based one.
 *
 * The two implementations report a set bit differently (1 versus -1), so the
 * result should only be tested for zero / non-zero.
 */
#define x86_this_cpu_test_bit(nr, addr) \
	(__builtin_constant_p((nr)) \
	? x86_this_cpu_constant_test_bit((nr), (addr)) \
	: x86_this_cpu_variable_test_bit((nr), (addr)))
| 575 | |
| 576 | |
Ingo Molnar | 6dbde35 | 2009-01-15 22:15:53 +0900 | [diff] [blame] | 577 | #include <asm-generic/percpu.h> |
| 578 | |
/*
 * We can use this directly for local CPU (faster).
 *
 * this_cpu_off is itself a per-cpu variable; the assembly PER_CPU() helper
 * in this header reads it through the per-cpu segment and adds it to a
 * variable's address to obtain that variable's address on the running CPU.
 */
DECLARE_PER_CPU(unsigned long, this_cpu_off);
| 581 | |
travis@sgi.com | 3334052 | 2008-01-30 13:32:53 +0100 | [diff] [blame] | 582 | #endif /* !__ASSEMBLY__ */ |
Mike Travis | 23ca4bb | 2008-05-12 21:21:12 +0200 | [diff] [blame] | 583 | |
| 584 | #ifdef CONFIG_SMP |
| 585 | |
| 586 | /* |
| 587 | * Define the "EARLY_PER_CPU" macros. These are used for some per_cpu |
| 588 | * variables that are initialized and accessed before there are per_cpu |
| 589 | * areas allocated. |
| 590 | */ |
| 591 | |
/*
 * DEFINE_EARLY_PER_CPU - define a per-cpu variable plus its early stand-ins
 * @_type:      type of the variable
 * @_name:      name of the variable
 * @_initvalue: initializer, used for the variable and for every map entry
 *
 * Emits three definitions:
 *   _name              the per-cpu variable itself
 *   _name##_early_map  an __initdata array with NR_CPUS entries, each set to
 *                      @_initvalue
 *   _name##_early_ptr  a __refdata pointer that initially points at the map
 *
 * The last definition has no trailing semicolon; the user of the macro
 * supplies it.
 */
#define DEFINE_EARLY_PER_CPU(_type, _name, _initvalue) \
	DEFINE_PER_CPU(_type, _name) = _initvalue; \
	__typeof__(_type) _name##_early_map[NR_CPUS] __initdata = \
		{ [0 ... NR_CPUS-1] = _initvalue }; \
	__typeof__(_type) *_name##_early_ptr __refdata = _name##_early_map

/* Exports the per-cpu variable only; the early map and pointer are not exported. */
#define EXPORT_EARLY_PER_CPU_SYMBOL(_name) \
	EXPORT_PER_CPU_SYMBOL(_name)

/*
 * Declaration counterpart of DEFINE_EARLY_PER_CPU(): declares the per-cpu
 * variable and extern declarations for the early pointer and the early map.
 */
#define DECLARE_EARLY_PER_CPU(_type, _name) \
	DECLARE_PER_CPU(_type, _name); \
	extern __typeof__(_type) *_name##_early_ptr; \
	extern __typeof__(_type) _name##_early_map[]
| 605 | |
/* The early pointer of _name; NULL once the early map is no longer in use. */
#define early_per_cpu_ptr(_name) (_name##_early_ptr)

/* Entry _idx of the early map of _name, regardless of the early pointer. */
#define early_per_cpu_map(_name, _idx) (_name##_early_map[_idx])

/*
 * early_per_cpu - access _name for CPU _cpu, before or after per-cpu setup
 *
 * Yields an lvalue.  While the early pointer is non-NULL the access goes to
 * entry _cpu of the array it points to; afterwards it goes to the real
 * per-cpu variable via per_cpu().
 *
 * The whole expansion is parenthesized so that postfix operators applied to
 * the result (member access, indexing, ++/--) bind to the selected object
 * and not to the pointer expression inside the dereference.
 */
#define early_per_cpu(_name, _cpu)				\
	(*(early_per_cpu_ptr(_name) ?				\
		&early_per_cpu_ptr(_name)[_cpu] :		\
		&per_cpu(_name, _cpu)))
Mike Travis | 23ca4bb | 2008-05-12 21:21:12 +0200 | [diff] [blame] | 612 | |
| 613 | #else /* !CONFIG_SMP */ |
/*
 * Uniprocessor variants: there is no early map, so every EARLY_PER_CPU macro
 * collapses to its plain per-cpu counterpart.
 */

/* Defines just the per-cpu variable _name, initialised to _initvalue. */
#define DEFINE_EARLY_PER_CPU(_type, _name, _initvalue) \
	DEFINE_PER_CPU(_type, _name) = _initvalue

/* Same as EXPORT_PER_CPU_SYMBOL(). */
#define EXPORT_EARLY_PER_CPU_SYMBOL(_name) \
	EXPORT_PER_CPU_SYMBOL(_name)

/* Same as DECLARE_PER_CPU(). */
#define DECLARE_EARLY_PER_CPU(_type, _name) \
	DECLARE_PER_CPU(_type, _name)

/* Always accesses the real per-cpu variable. */
#define early_per_cpu(_name, _cpu) per_cpu(_name, _cpu)
/* Always NULL, so callers that test the early pointer take the per-cpu path. */
#define early_per_cpu_ptr(_name) NULL
/* no early_per_cpu_map() */
| 626 | |
| 627 | #endif /* !CONFIG_SMP */ |
| 628 | |
H. Peter Anvin | 1965aae | 2008-10-22 22:26:29 -0700 | [diff] [blame] | 629 | #endif /* _ASM_X86_PERCPU_H */ |