/* Snapshot at v5.0-rc2 (562 lines, 14 kB) */
1/* 2 * Copyright (C) 2004, 2007-2010, 2011-2012 Synopsys, Inc. (www.synopsys.com) 3 * 4 * This program is free software; you can redistribute it and/or modify 5 * it under the terms of the GNU General Public License version 2 as 6 * published by the Free Software Foundation. 7 */ 8 9#ifndef _ASM_ARC_ATOMIC_H 10#define _ASM_ARC_ATOMIC_H 11 12#ifndef __ASSEMBLY__ 13 14#include <linux/types.h> 15#include <linux/compiler.h> 16#include <asm/cmpxchg.h> 17#include <asm/barrier.h> 18#include <asm/smp.h> 19 20#define ATOMIC_INIT(i) { (i) } 21 22#ifndef CONFIG_ARC_PLAT_EZNPS 23 24#define atomic_read(v) READ_ONCE((v)->counter) 25 26#ifdef CONFIG_ARC_HAS_LLSC 27 28#define atomic_set(v, i) WRITE_ONCE(((v)->counter), (i)) 29 30#define ATOMIC_OP(op, c_op, asm_op) \ 31static inline void atomic_##op(int i, atomic_t *v) \ 32{ \ 33 unsigned int val; \ 34 \ 35 __asm__ __volatile__( \ 36 "1: llock %[val], [%[ctr]] \n" \ 37 " " #asm_op " %[val], %[val], %[i] \n" \ 38 " scond %[val], [%[ctr]] \n" \ 39 " bnz 1b \n" \ 40 : [val] "=&r" (val) /* Early clobber to prevent reg reuse */ \ 41 : [ctr] "r" (&v->counter), /* Not "m": llock only supports reg direct addr mode */ \ 42 [i] "ir" (i) \ 43 : "cc"); \ 44} \ 45 46#define ATOMIC_OP_RETURN(op, c_op, asm_op) \ 47static inline int atomic_##op##_return(int i, atomic_t *v) \ 48{ \ 49 unsigned int val; \ 50 \ 51 /* \ 52 * Explicit full memory barrier needed before/after as \ 53 * LLOCK/SCOND thmeselves don't provide any such semantics \ 54 */ \ 55 smp_mb(); \ 56 \ 57 __asm__ __volatile__( \ 58 "1: llock %[val], [%[ctr]] \n" \ 59 " " #asm_op " %[val], %[val], %[i] \n" \ 60 " scond %[val], [%[ctr]] \n" \ 61 " bnz 1b \n" \ 62 : [val] "=&r" (val) \ 63 : [ctr] "r" (&v->counter), \ 64 [i] "ir" (i) \ 65 : "cc"); \ 66 \ 67 smp_mb(); \ 68 \ 69 return val; \ 70} 71 72#define ATOMIC_FETCH_OP(op, c_op, asm_op) \ 73static inline int atomic_fetch_##op(int i, atomic_t *v) \ 74{ \ 75 unsigned int val, orig; \ 76 \ 77 /* \ 78 * Explicit full memory barrier needed 
before/after as \ 79 * LLOCK/SCOND thmeselves don't provide any such semantics \ 80 */ \ 81 smp_mb(); \ 82 \ 83 __asm__ __volatile__( \ 84 "1: llock %[orig], [%[ctr]] \n" \ 85 " " #asm_op " %[val], %[orig], %[i] \n" \ 86 " scond %[val], [%[ctr]] \n" \ 87 " bnz 1b \n" \ 88 : [val] "=&r" (val), \ 89 [orig] "=&r" (orig) \ 90 : [ctr] "r" (&v->counter), \ 91 [i] "ir" (i) \ 92 : "cc"); \ 93 \ 94 smp_mb(); \ 95 \ 96 return orig; \ 97} 98 99#else /* !CONFIG_ARC_HAS_LLSC */ 100 101#ifndef CONFIG_SMP 102 103 /* violating atomic_xxx API locking protocol in UP for optimization sake */ 104#define atomic_set(v, i) WRITE_ONCE(((v)->counter), (i)) 105 106#else 107 108static inline void atomic_set(atomic_t *v, int i) 109{ 110 /* 111 * Independent of hardware support, all of the atomic_xxx() APIs need 112 * to follow the same locking rules to make sure that a "hardware" 113 * atomic insn (e.g. LD) doesn't clobber an "emulated" atomic insn 114 * sequence 115 * 116 * Thus atomic_set() despite being 1 insn (and seemingly atomic) 117 * requires the locking. 
118 */ 119 unsigned long flags; 120 121 atomic_ops_lock(flags); 122 WRITE_ONCE(v->counter, i); 123 atomic_ops_unlock(flags); 124} 125 126#define atomic_set_release(v, i) atomic_set((v), (i)) 127 128#endif 129 130/* 131 * Non hardware assisted Atomic-R-M-W 132 * Locking would change to irq-disabling only (UP) and spinlocks (SMP) 133 */ 134 135#define ATOMIC_OP(op, c_op, asm_op) \ 136static inline void atomic_##op(int i, atomic_t *v) \ 137{ \ 138 unsigned long flags; \ 139 \ 140 atomic_ops_lock(flags); \ 141 v->counter c_op i; \ 142 atomic_ops_unlock(flags); \ 143} 144 145#define ATOMIC_OP_RETURN(op, c_op, asm_op) \ 146static inline int atomic_##op##_return(int i, atomic_t *v) \ 147{ \ 148 unsigned long flags; \ 149 unsigned long temp; \ 150 \ 151 /* \ 152 * spin lock/unlock provides the needed smp_mb() before/after \ 153 */ \ 154 atomic_ops_lock(flags); \ 155 temp = v->counter; \ 156 temp c_op i; \ 157 v->counter = temp; \ 158 atomic_ops_unlock(flags); \ 159 \ 160 return temp; \ 161} 162 163#define ATOMIC_FETCH_OP(op, c_op, asm_op) \ 164static inline int atomic_fetch_##op(int i, atomic_t *v) \ 165{ \ 166 unsigned long flags; \ 167 unsigned long orig; \ 168 \ 169 /* \ 170 * spin lock/unlock provides the needed smp_mb() before/after \ 171 */ \ 172 atomic_ops_lock(flags); \ 173 orig = v->counter; \ 174 v->counter c_op i; \ 175 atomic_ops_unlock(flags); \ 176 \ 177 return orig; \ 178} 179 180#endif /* !CONFIG_ARC_HAS_LLSC */ 181 182#define ATOMIC_OPS(op, c_op, asm_op) \ 183 ATOMIC_OP(op, c_op, asm_op) \ 184 ATOMIC_OP_RETURN(op, c_op, asm_op) \ 185 ATOMIC_FETCH_OP(op, c_op, asm_op) 186 187ATOMIC_OPS(add, +=, add) 188ATOMIC_OPS(sub, -=, sub) 189 190#define atomic_andnot atomic_andnot 191#define atomic_fetch_andnot atomic_fetch_andnot 192 193#undef ATOMIC_OPS 194#define ATOMIC_OPS(op, c_op, asm_op) \ 195 ATOMIC_OP(op, c_op, asm_op) \ 196 ATOMIC_FETCH_OP(op, c_op, asm_op) 197 198ATOMIC_OPS(and, &=, and) 199ATOMIC_OPS(andnot, &= ~, bic) 200ATOMIC_OPS(or, |=, or) 
201ATOMIC_OPS(xor, ^=, xor) 202 203#else /* CONFIG_ARC_PLAT_EZNPS */ 204 205static inline int atomic_read(const atomic_t *v) 206{ 207 int temp; 208 209 __asm__ __volatile__( 210 " ld.di %0, [%1]" 211 : "=r"(temp) 212 : "r"(&v->counter) 213 : "memory"); 214 return temp; 215} 216 217static inline void atomic_set(atomic_t *v, int i) 218{ 219 __asm__ __volatile__( 220 " st.di %0,[%1]" 221 : 222 : "r"(i), "r"(&v->counter) 223 : "memory"); 224} 225 226#define ATOMIC_OP(op, c_op, asm_op) \ 227static inline void atomic_##op(int i, atomic_t *v) \ 228{ \ 229 __asm__ __volatile__( \ 230 " mov r2, %0\n" \ 231 " mov r3, %1\n" \ 232 " .word %2\n" \ 233 : \ 234 : "r"(i), "r"(&v->counter), "i"(asm_op) \ 235 : "r2", "r3", "memory"); \ 236} \ 237 238#define ATOMIC_OP_RETURN(op, c_op, asm_op) \ 239static inline int atomic_##op##_return(int i, atomic_t *v) \ 240{ \ 241 unsigned int temp = i; \ 242 \ 243 /* Explicit full memory barrier needed before/after */ \ 244 smp_mb(); \ 245 \ 246 __asm__ __volatile__( \ 247 " mov r2, %0\n" \ 248 " mov r3, %1\n" \ 249 " .word %2\n" \ 250 " mov %0, r2" \ 251 : "+r"(temp) \ 252 : "r"(&v->counter), "i"(asm_op) \ 253 : "r2", "r3", "memory"); \ 254 \ 255 smp_mb(); \ 256 \ 257 temp c_op i; \ 258 \ 259 return temp; \ 260} 261 262#define ATOMIC_FETCH_OP(op, c_op, asm_op) \ 263static inline int atomic_fetch_##op(int i, atomic_t *v) \ 264{ \ 265 unsigned int temp = i; \ 266 \ 267 /* Explicit full memory barrier needed before/after */ \ 268 smp_mb(); \ 269 \ 270 __asm__ __volatile__( \ 271 " mov r2, %0\n" \ 272 " mov r3, %1\n" \ 273 " .word %2\n" \ 274 " mov %0, r2" \ 275 : "+r"(temp) \ 276 : "r"(&v->counter), "i"(asm_op) \ 277 : "r2", "r3", "memory"); \ 278 \ 279 smp_mb(); \ 280 \ 281 return temp; \ 282} 283 284#define ATOMIC_OPS(op, c_op, asm_op) \ 285 ATOMIC_OP(op, c_op, asm_op) \ 286 ATOMIC_OP_RETURN(op, c_op, asm_op) \ 287 ATOMIC_FETCH_OP(op, c_op, asm_op) 288 289ATOMIC_OPS(add, +=, CTOP_INST_AADD_DI_R2_R2_R3) 290#define atomic_sub(i, v) 
atomic_add(-(i), (v)) 291#define atomic_sub_return(i, v) atomic_add_return(-(i), (v)) 292#define atomic_fetch_sub(i, v) atomic_fetch_add(-(i), (v)) 293 294#undef ATOMIC_OPS 295#define ATOMIC_OPS(op, c_op, asm_op) \ 296 ATOMIC_OP(op, c_op, asm_op) \ 297 ATOMIC_FETCH_OP(op, c_op, asm_op) 298 299ATOMIC_OPS(and, &=, CTOP_INST_AAND_DI_R2_R2_R3) 300ATOMIC_OPS(or, |=, CTOP_INST_AOR_DI_R2_R2_R3) 301ATOMIC_OPS(xor, ^=, CTOP_INST_AXOR_DI_R2_R2_R3) 302 303#endif /* CONFIG_ARC_PLAT_EZNPS */ 304 305#undef ATOMIC_OPS 306#undef ATOMIC_FETCH_OP 307#undef ATOMIC_OP_RETURN 308#undef ATOMIC_OP 309 310#ifdef CONFIG_GENERIC_ATOMIC64 311 312#include <asm-generic/atomic64.h> 313 314#else /* Kconfig ensures this is only enabled with needed h/w assist */ 315 316/* 317 * ARCv2 supports 64-bit exclusive load (LLOCKD) / store (SCONDD) 318 * - The address HAS to be 64-bit aligned 319 * - There are 2 semantics involved here: 320 * = exclusive implies no interim update between load/store to same addr 321 * = both words are observed/updated together: this is guaranteed even 322 * for regular 64-bit load (LDD) / store (STD). Thus atomic64_set() 323 * is NOT required to use LLOCKD+SCONDD, STD suffices 324 */ 325 326typedef struct { 327 aligned_u64 counter; 328} atomic64_t; 329 330#define ATOMIC64_INIT(a) { (a) } 331 332static inline long long atomic64_read(const atomic64_t *v) 333{ 334 unsigned long long val; 335 336 __asm__ __volatile__( 337 " ldd %0, [%1] \n" 338 : "=r"(val) 339 : "r"(&v->counter)); 340 341 return val; 342} 343 344static inline void atomic64_set(atomic64_t *v, long long a) 345{ 346 /* 347 * This could have been a simple assignment in "C" but would need 348 * explicit volatile. Otherwise gcc optimizers could elide the store 349 * which borked atomic64 self-test 350 * In the inline asm version, memory clobber needed for exact same 351 * reason, to tell gcc about the store. 
352 * 353 * This however is not needed for sibling atomic64_add() etc since both 354 * load/store are explicitly done in inline asm. As long as API is used 355 * for each access, gcc has no way to optimize away any load/store 356 */ 357 __asm__ __volatile__( 358 " std %0, [%1] \n" 359 : 360 : "r"(a), "r"(&v->counter) 361 : "memory"); 362} 363 364#define ATOMIC64_OP(op, op1, op2) \ 365static inline void atomic64_##op(long long a, atomic64_t *v) \ 366{ \ 367 unsigned long long val; \ 368 \ 369 __asm__ __volatile__( \ 370 "1: \n" \ 371 " llockd %0, [%1] \n" \ 372 " " #op1 " %L0, %L0, %L2 \n" \ 373 " " #op2 " %H0, %H0, %H2 \n" \ 374 " scondd %0, [%1] \n" \ 375 " bnz 1b \n" \ 376 : "=&r"(val) \ 377 : "r"(&v->counter), "ir"(a) \ 378 : "cc"); \ 379} \ 380 381#define ATOMIC64_OP_RETURN(op, op1, op2) \ 382static inline long long atomic64_##op##_return(long long a, atomic64_t *v) \ 383{ \ 384 unsigned long long val; \ 385 \ 386 smp_mb(); \ 387 \ 388 __asm__ __volatile__( \ 389 "1: \n" \ 390 " llockd %0, [%1] \n" \ 391 " " #op1 " %L0, %L0, %L2 \n" \ 392 " " #op2 " %H0, %H0, %H2 \n" \ 393 " scondd %0, [%1] \n" \ 394 " bnz 1b \n" \ 395 : [val] "=&r"(val) \ 396 : "r"(&v->counter), "ir"(a) \ 397 : "cc"); /* memory clobber comes from smp_mb() */ \ 398 \ 399 smp_mb(); \ 400 \ 401 return val; \ 402} 403 404#define ATOMIC64_FETCH_OP(op, op1, op2) \ 405static inline long long atomic64_fetch_##op(long long a, atomic64_t *v) \ 406{ \ 407 unsigned long long val, orig; \ 408 \ 409 smp_mb(); \ 410 \ 411 __asm__ __volatile__( \ 412 "1: \n" \ 413 " llockd %0, [%2] \n" \ 414 " " #op1 " %L1, %L0, %L3 \n" \ 415 " " #op2 " %H1, %H0, %H3 \n" \ 416 " scondd %1, [%2] \n" \ 417 " bnz 1b \n" \ 418 : "=&r"(orig), "=&r"(val) \ 419 : "r"(&v->counter), "ir"(a) \ 420 : "cc"); /* memory clobber comes from smp_mb() */ \ 421 \ 422 smp_mb(); \ 423 \ 424 return orig; \ 425} 426 427#define ATOMIC64_OPS(op, op1, op2) \ 428 ATOMIC64_OP(op, op1, op2) \ 429 ATOMIC64_OP_RETURN(op, op1, op2) \ 430 
ATOMIC64_FETCH_OP(op, op1, op2) 431 432#define atomic64_andnot atomic64_andnot 433#define atomic64_fetch_andnot atomic64_fetch_andnot 434 435ATOMIC64_OPS(add, add.f, adc) 436ATOMIC64_OPS(sub, sub.f, sbc) 437ATOMIC64_OPS(and, and, and) 438ATOMIC64_OPS(andnot, bic, bic) 439ATOMIC64_OPS(or, or, or) 440ATOMIC64_OPS(xor, xor, xor) 441 442#undef ATOMIC64_OPS 443#undef ATOMIC64_FETCH_OP 444#undef ATOMIC64_OP_RETURN 445#undef ATOMIC64_OP 446 447static inline long long 448atomic64_cmpxchg(atomic64_t *ptr, long long expected, long long new) 449{ 450 long long prev; 451 452 smp_mb(); 453 454 __asm__ __volatile__( 455 "1: llockd %0, [%1] \n" 456 " brne %L0, %L2, 2f \n" 457 " brne %H0, %H2, 2f \n" 458 " scondd %3, [%1] \n" 459 " bnz 1b \n" 460 "2: \n" 461 : "=&r"(prev) 462 : "r"(ptr), "ir"(expected), "r"(new) 463 : "cc"); /* memory clobber comes from smp_mb() */ 464 465 smp_mb(); 466 467 return prev; 468} 469 470static inline long long atomic64_xchg(atomic64_t *ptr, long long new) 471{ 472 long long prev; 473 474 smp_mb(); 475 476 __asm__ __volatile__( 477 "1: llockd %0, [%1] \n" 478 " scondd %2, [%1] \n" 479 " bnz 1b \n" 480 "2: \n" 481 : "=&r"(prev) 482 : "r"(ptr), "r"(new) 483 : "cc"); /* memory clobber comes from smp_mb() */ 484 485 smp_mb(); 486 487 return prev; 488} 489 490/** 491 * atomic64_dec_if_positive - decrement by 1 if old value positive 492 * @v: pointer of type atomic64_t 493 * 494 * The function returns the old value of *v minus 1, even if 495 * the atomic variable, v, was not decremented. 
496 */ 497 498static inline long long atomic64_dec_if_positive(atomic64_t *v) 499{ 500 long long val; 501 502 smp_mb(); 503 504 __asm__ __volatile__( 505 "1: llockd %0, [%1] \n" 506 " sub.f %L0, %L0, 1 # w0 - 1, set C on borrow\n" 507 " sub.c %H0, %H0, 1 # if C set, w1 - 1\n" 508 " brlt %H0, 0, 2f \n" 509 " scondd %0, [%1] \n" 510 " bnz 1b \n" 511 "2: \n" 512 : "=&r"(val) 513 : "r"(&v->counter) 514 : "cc"); /* memory clobber comes from smp_mb() */ 515 516 smp_mb(); 517 518 return val; 519} 520#define atomic64_dec_if_positive atomic64_dec_if_positive 521 522/** 523 * atomic64_fetch_add_unless - add unless the number is a given value 524 * @v: pointer of type atomic64_t 525 * @a: the amount to add to v... 526 * @u: ...unless v is equal to u. 527 * 528 * Atomically adds @a to @v, if it was not @u. 529 * Returns the old value of @v 530 */ 531static inline long long atomic64_fetch_add_unless(atomic64_t *v, long long a, 532 long long u) 533{ 534 long long old, temp; 535 536 smp_mb(); 537 538 __asm__ __volatile__( 539 "1: llockd %0, [%2] \n" 540 " brne %L0, %L4, 2f # continue to add since v != u \n" 541 " breq.d %H0, %H4, 3f # return since v == u \n" 542 "2: \n" 543 " add.f %L1, %L0, %L3 \n" 544 " adc %H1, %H0, %H3 \n" 545 " scondd %1, [%2] \n" 546 " bnz 1b \n" 547 "3: \n" 548 : "=&r"(old), "=&r" (temp) 549 : "r"(&v->counter), "r"(a), "r"(u) 550 : "cc"); /* memory clobber comes from smp_mb() */ 551 552 smp_mb(); 553 554 return old; 555} 556#define atomic64_fetch_add_unless atomic64_fetch_add_unless 557 558#endif /* !CONFIG_GENERIC_ATOMIC64 */ 559 560#endif /* !__ASSEMBLY__ */ 561 562#endif