at v2.6.34 506 lines 17 kB view raw
1/* 2 * Read-Copy Update mechanism for mutual exclusion 3 * 4 * This program is free software; you can redistribute it and/or modify 5 * it under the terms of the GNU General Public License as published by 6 * the Free Software Foundation; either version 2 of the License, or 7 * (at your option) any later version. 8 * 9 * This program is distributed in the hope that it will be useful, 10 * but WITHOUT ANY WARRANTY; without even the implied warranty of 11 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the 12 * GNU General Public License for more details. 13 * 14 * You should have received a copy of the GNU General Public License 15 * along with this program; if not, write to the Free Software 16 * Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. 17 * 18 * Copyright IBM Corporation, 2001 19 * 20 * Author: Dipankar Sarma <dipankar@in.ibm.com> 21 * 22 * Based on the original work by Paul McKenney <paulmck@us.ibm.com> 23 * and inputs from Rusty Russell, Andrea Arcangeli and Andi Kleen. 24 * Papers: 25 * http://www.rdrop.com/users/paulmck/paper/rclockpdcsproof.pdf 26 * http://lse.sourceforge.net/locking/rclock_OLS.2001.05.01c.sc.pdf (OLS2001) 27 * 28 * For detailed explanation of Read-Copy Update mechanism see - 29 * http://lse.sourceforge.net/locking/rcupdate.html 30 * 31 */ 32 33#ifndef __LINUX_RCUPDATE_H 34#define __LINUX_RCUPDATE_H 35 36#include <linux/cache.h> 37#include <linux/spinlock.h> 38#include <linux/threads.h> 39#include <linux/cpumask.h> 40#include <linux/seqlock.h> 41#include <linux/lockdep.h> 42#include <linux/completion.h> 43 44#ifdef CONFIG_RCU_TORTURE_TEST 45extern int rcutorture_runnable; /* for sysctl */ 46#endif /* #ifdef CONFIG_RCU_TORTURE_TEST */ 47 48/** 49 * struct rcu_head - callback structure for use with RCU 50 * @next: next update requests in a list 51 * @func: actual update function to call after the grace period. 52 */ 53struct rcu_head { 54 struct rcu_head *next; 55 void (*func)(struct rcu_head *head); 56}; 57 58/* Exported common interfaces */ 59extern void synchronize_rcu_bh(void); 60extern void synchronize_sched(void); 61extern void rcu_barrier(void); 62extern void rcu_barrier_bh(void); 63extern void rcu_barrier_sched(void); 64extern void synchronize_sched_expedited(void); 65extern int sched_expedited_torture_stats(char *page); 66 67/* Internal to kernel */ 68extern void rcu_init(void); 69extern int rcu_scheduler_active; 70extern void rcu_scheduler_starting(void); 71 72#if defined(CONFIG_TREE_RCU) || defined(CONFIG_TREE_PREEMPT_RCU) 73#include <linux/rcutree.h> 74#elif defined(CONFIG_TINY_RCU) 75#include <linux/rcutiny.h> 76#else 77#error "Unknown RCU implementation specified to kernel configuration" 78#endif 79 80#define RCU_HEAD_INIT { .next = NULL, .func = NULL } 81#define RCU_HEAD(head) struct rcu_head head = RCU_HEAD_INIT 82#define INIT_RCU_HEAD(ptr) do { \ 83 (ptr)->next = NULL; (ptr)->func = NULL; \ 84} while (0) 85 86#ifdef CONFIG_DEBUG_LOCK_ALLOC 87 88extern struct lockdep_map rcu_lock_map; 89# define rcu_read_acquire() \ 90 lock_acquire(&rcu_lock_map, 0, 0, 2, 1, NULL, _THIS_IP_) 91# define rcu_read_release() lock_release(&rcu_lock_map, 1, _THIS_IP_) 92 93extern struct lockdep_map rcu_bh_lock_map; 94# define rcu_read_acquire_bh() \ 95 lock_acquire(&rcu_bh_lock_map, 0, 0, 2, 1, NULL, _THIS_IP_) 96# define rcu_read_release_bh() lock_release(&rcu_bh_lock_map, 1, _THIS_IP_) 97 98extern struct lockdep_map rcu_sched_lock_map; 99# define rcu_read_acquire_sched() \ 100 lock_acquire(&rcu_sched_lock_map, 0, 0, 2, 1, NULL, _THIS_IP_) 101# define rcu_read_release_sched() \ 102 lock_release(&rcu_sched_lock_map, 1, _THIS_IP_) 103 104extern int debug_lockdep_rcu_enabled(void); 105 106/** 107 * rcu_read_lock_held - might we be in RCU read-side critical section? 108 * 109 * If CONFIG_PROVE_LOCKING is selected and enabled, returns nonzero iff in 110 * an RCU read-side critical section. In absence of CONFIG_PROVE_LOCKING, 111 * this assumes we are in an RCU read-side critical section unless it can 112 * prove otherwise. 113 * 114 * Check rcu_scheduler_active to prevent false positives during boot. 115 */ 116static inline int rcu_read_lock_held(void) 117{ 118 if (!debug_lockdep_rcu_enabled()) 119 return 1; 120 return lock_is_held(&rcu_lock_map); 121} 122 123/* 124 * rcu_read_lock_bh_held() is defined out of line to avoid #include-file 125 * hell. 126 */ 127extern int rcu_read_lock_bh_held(void); 128 129/** 130 * rcu_read_lock_sched_held - might we be in RCU-sched read-side critical section? 131 * 132 * If CONFIG_PROVE_LOCKING is selected and enabled, returns nonzero iff in an 133 * RCU-sched read-side critical section. In absence of CONFIG_PROVE_LOCKING, 134 * this assumes we are in an RCU-sched read-side critical section unless it 135 * can prove otherwise. Note that disabling of preemption (including 136 * disabling irqs) counts as an RCU-sched read-side critical section. 137 * 138 * Check rcu_scheduler_active to prevent false positives during boot. 139 */ 140#ifdef CONFIG_PREEMPT 141static inline int rcu_read_lock_sched_held(void) 142{ 143 int lockdep_opinion = 0; 144 145 if (!debug_lockdep_rcu_enabled()) 146 return 1; 147 if (debug_locks) 148 lockdep_opinion = lock_is_held(&rcu_sched_lock_map); 149 return lockdep_opinion || preempt_count() != 0 || irqs_disabled(); 150} 151#else /* #ifdef CONFIG_PREEMPT */ 152static inline int rcu_read_lock_sched_held(void) 153{ 154 return 1; 155} 156#endif /* #else #ifdef CONFIG_PREEMPT */ 157 158#else /* #ifdef CONFIG_DEBUG_LOCK_ALLOC */ 159 160# define rcu_read_acquire() do { } while (0) 161# define rcu_read_release() do { } while (0) 162# define rcu_read_acquire_bh() do { } while (0) 163# define rcu_read_release_bh() do { } while (0) 164# define rcu_read_acquire_sched() do { } while (0) 165# define rcu_read_release_sched() do { } while (0) 166 167static inline int rcu_read_lock_held(void) 168{ 169 return 1; 170} 171 172static inline int rcu_read_lock_bh_held(void) 173{ 174 return 1; 175} 176 177#ifdef CONFIG_PREEMPT 178static inline int rcu_read_lock_sched_held(void) 179{ 180 return !rcu_scheduler_active || preempt_count() != 0 || irqs_disabled(); 181} 182#else /* #ifdef CONFIG_PREEMPT */ 183static inline int rcu_read_lock_sched_held(void) 184{ 185 return 1; 186} 187#endif /* #else #ifdef CONFIG_PREEMPT */ 188 189#endif /* #else #ifdef CONFIG_DEBUG_LOCK_ALLOC */ 190 191#ifdef CONFIG_PROVE_RCU 192 193extern int rcu_my_thread_group_empty(void); 194 195/** 196 * rcu_dereference_check - rcu_dereference with debug checking 197 * @p: The pointer to read, prior to dereferencing 198 * @c: The conditions under which the dereference will take place 199 * 200 * Do an rcu_dereference(), but check that the conditions under which the 201 * dereference will take place are correct. Typically the conditions indicate 202 * the various locking conditions that should be held at that point. The check 203 * should return true if the conditions are satisfied. 204 * 205 * For example: 206 * 207 * bar = rcu_dereference_check(foo->bar, rcu_read_lock_held() || 208 * lockdep_is_held(&foo->lock)); 209 * 210 * could be used to indicate to lockdep that foo->bar may only be dereferenced 211 * if either the RCU read lock is held, or that the lock required to replace 212 * the bar struct at foo->bar is held. 213 * 214 * Note that the list of conditions may also include indications of when a lock 215 * need not be held, for example during initialisation or destruction of the 216 * target struct: 217 * 218 * bar = rcu_dereference_check(foo->bar, rcu_read_lock_held() || 219 * lockdep_is_held(&foo->lock) || 220 * atomic_read(&foo->usage) == 0); 221 */ 222#define rcu_dereference_check(p, c) \ 223 ({ \ 224 if (debug_lockdep_rcu_enabled() && !(c)) \ 225 lockdep_rcu_dereference(__FILE__, __LINE__); \ 226 rcu_dereference_raw(p); \ 227 }) 228 229/** 230 * rcu_dereference_protected - fetch RCU pointer when updates prevented 231 * 232 * Return the value of the specified RCU-protected pointer, but omit 233 * both the smp_read_barrier_depends() and the ACCESS_ONCE(). This 234 * is useful in cases where update-side locks prevent the value of the 235 * pointer from changing. Please note that this primitive does -not- 236 * prevent the compiler from repeating this reference or combining it 237 * with other references, so it should not be used without protection 238 * of appropriate locks. 239 */ 240#define rcu_dereference_protected(p, c) \ 241 ({ \ 242 if (debug_lockdep_rcu_enabled() && !(c)) \ 243 lockdep_rcu_dereference(__FILE__, __LINE__); \ 244 (p); \ 245 }) 246 247#else /* #ifdef CONFIG_PROVE_RCU */ 248 249#define rcu_dereference_check(p, c) rcu_dereference_raw(p) 250#define rcu_dereference_protected(p, c) (p) 251 252#endif /* #else #ifdef CONFIG_PROVE_RCU */ 253 254/** 255 * rcu_access_pointer - fetch RCU pointer with no dereferencing 256 * 257 * Return the value of the specified RCU-protected pointer, but omit the 258 * smp_read_barrier_depends() and keep the ACCESS_ONCE(). This is useful 259 * when the value of this pointer is accessed, but the pointer is not 260 * dereferenced, for example, when testing an RCU-protected pointer against 261 * NULL. This may also be used in cases where update-side locks prevent 262 * the value of the pointer from changing, but rcu_dereference_protected() 263 * is a lighter-weight primitive for this use case. 264 */ 265#define rcu_access_pointer(p) ACCESS_ONCE(p) 266 267/** 268 * rcu_read_lock - mark the beginning of an RCU read-side critical section. 269 * 270 * When synchronize_rcu() is invoked on one CPU while other CPUs 271 * are within RCU read-side critical sections, then the 272 * synchronize_rcu() is guaranteed to block until after all the other 273 * CPUs exit their critical sections. Similarly, if call_rcu() is invoked 274 * on one CPU while other CPUs are within RCU read-side critical 275 * sections, invocation of the corresponding RCU callback is deferred 276 * until after the all the other CPUs exit their critical sections. 277 * 278 * Note, however, that RCU callbacks are permitted to run concurrently 279 * with RCU read-side critical sections. One way that this can happen 280 * is via the following sequence of events: (1) CPU 0 enters an RCU 281 * read-side critical section, (2) CPU 1 invokes call_rcu() to register 282 * an RCU callback, (3) CPU 0 exits the RCU read-side critical section, 283 * (4) CPU 2 enters a RCU read-side critical section, (5) the RCU 284 * callback is invoked. This is legal, because the RCU read-side critical 285 * section that was running concurrently with the call_rcu() (and which 286 * therefore might be referencing something that the corresponding RCU 287 * callback would free up) has completed before the corresponding 288 * RCU callback is invoked. 289 * 290 * RCU read-side critical sections may be nested. Any deferred actions 291 * will be deferred until the outermost RCU read-side critical section 292 * completes. 293 * 294 * It is illegal to block while in an RCU read-side critical section. 295 */ 296static inline void rcu_read_lock(void) 297{ 298 __rcu_read_lock(); 299 __acquire(RCU); 300 rcu_read_acquire(); 301} 302 303/* 304 * So where is rcu_write_lock()? It does not exist, as there is no 305 * way for writers to lock out RCU readers. This is a feature, not 306 * a bug -- this property is what provides RCU's performance benefits. 307 * Of course, writers must coordinate with each other. The normal 308 * spinlock primitives work well for this, but any other technique may be 309 * used as well. RCU does not care how the writers keep out of each 310 * others' way, as long as they do so. 311 */ 312 313/** 314 * rcu_read_unlock - marks the end of an RCU read-side critical section. 315 * 316 * See rcu_read_lock() for more information. 317 */ 318static inline void rcu_read_unlock(void) 319{ 320 rcu_read_release(); 321 __release(RCU); 322 __rcu_read_unlock(); 323} 324 325/** 326 * rcu_read_lock_bh - mark the beginning of a softirq-only RCU critical section 327 * 328 * This is equivalent of rcu_read_lock(), but to be used when updates 329 * are being done using call_rcu_bh(). Since call_rcu_bh() callbacks 330 * consider completion of a softirq handler to be a quiescent state, 331 * a process in RCU read-side critical section must be protected by 332 * disabling softirqs. Read-side critical sections in interrupt context 333 * can use just rcu_read_lock(). 334 * 335 */ 336static inline void rcu_read_lock_bh(void) 337{ 338 __rcu_read_lock_bh(); 339 __acquire(RCU_BH); 340 rcu_read_acquire_bh(); 341} 342 343/* 344 * rcu_read_unlock_bh - marks the end of a softirq-only RCU critical section 345 * 346 * See rcu_read_lock_bh() for more information. 347 */ 348static inline void rcu_read_unlock_bh(void) 349{ 350 rcu_read_release_bh(); 351 __release(RCU_BH); 352 __rcu_read_unlock_bh(); 353} 354 355/** 356 * rcu_read_lock_sched - mark the beginning of a RCU-classic critical section 357 * 358 * Should be used with either 359 * - synchronize_sched() 360 * or 361 * - call_rcu_sched() and rcu_barrier_sched() 362 * on the write-side to insure proper synchronization. 363 */ 364static inline void rcu_read_lock_sched(void) 365{ 366 preempt_disable(); 367 __acquire(RCU_SCHED); 368 rcu_read_acquire_sched(); 369} 370 371/* Used by lockdep and tracing: cannot be traced, cannot call lockdep. */ 372static inline notrace void rcu_read_lock_sched_notrace(void) 373{ 374 preempt_disable_notrace(); 375 __acquire(RCU_SCHED); 376} 377 378/* 379 * rcu_read_unlock_sched - marks the end of a RCU-classic critical section 380 * 381 * See rcu_read_lock_sched for more information. 382 */ 383static inline void rcu_read_unlock_sched(void) 384{ 385 rcu_read_release_sched(); 386 __release(RCU_SCHED); 387 preempt_enable(); 388} 389 390/* Used by lockdep and tracing: cannot be traced, cannot call lockdep. */ 391static inline notrace void rcu_read_unlock_sched_notrace(void) 392{ 393 __release(RCU_SCHED); 394 preempt_enable_notrace(); 395} 396 397 398/** 399 * rcu_dereference_raw - fetch an RCU-protected pointer 400 * 401 * The caller must be within some flavor of RCU read-side critical 402 * section, or must be otherwise preventing the pointer from changing, 403 * for example, by holding an appropriate lock. This pointer may later 404 * be safely dereferenced. It is the caller's responsibility to have 405 * done the right thing, as this primitive does no checking of any kind. 406 * 407 * Inserts memory barriers on architectures that require them 408 * (currently only the Alpha), and, more importantly, documents 409 * exactly which pointers are protected by RCU. 410 */ 411#define rcu_dereference_raw(p) ({ \ 412 typeof(p) _________p1 = ACCESS_ONCE(p); \ 413 smp_read_barrier_depends(); \ 414 (_________p1); \ 415 }) 416 417/** 418 * rcu_dereference - fetch an RCU-protected pointer, checking for RCU 419 * 420 * Makes rcu_dereference_check() do the dirty work. 421 */ 422#define rcu_dereference(p) \ 423 rcu_dereference_check(p, rcu_read_lock_held()) 424 425/** 426 * rcu_dereference_bh - fetch an RCU-protected pointer, checking for RCU-bh 427 * 428 * Makes rcu_dereference_check() do the dirty work. 429 */ 430#define rcu_dereference_bh(p) \ 431 rcu_dereference_check(p, rcu_read_lock_bh_held()) 432 433/** 434 * rcu_dereference_sched - fetch RCU-protected pointer, checking for RCU-sched 435 * 436 * Makes rcu_dereference_check() do the dirty work. 437 */ 438#define rcu_dereference_sched(p) \ 439 rcu_dereference_check(p, rcu_read_lock_sched_held()) 440 441/** 442 * rcu_assign_pointer - assign (publicize) a pointer to a newly 443 * initialized structure that will be dereferenced by RCU read-side 444 * critical sections. Returns the value assigned. 445 * 446 * Inserts memory barriers on architectures that require them 447 * (pretty much all of them other than x86), and also prevents 448 * the compiler from reordering the code that initializes the 449 * structure after the pointer assignment. More importantly, this 450 * call documents which pointers will be dereferenced by RCU read-side 451 * code. 452 */ 453 454#define rcu_assign_pointer(p, v) \ 455 ({ \ 456 if (!__builtin_constant_p(v) || \ 457 ((v) != NULL)) \ 458 smp_wmb(); \ 459 (p) = (v); \ 460 }) 461 462/* Infrastructure to implement the synchronize_() primitives. */ 463 464struct rcu_synchronize { 465 struct rcu_head head; 466 struct completion completion; 467}; 468 469extern void wakeme_after_rcu(struct rcu_head *head); 470 471/** 472 * call_rcu - Queue an RCU callback for invocation after a grace period. 473 * @head: structure to be used for queueing the RCU updates. 474 * @func: actual update function to be invoked after the grace period 475 * 476 * The update function will be invoked some time after a full grace 477 * period elapses, in other words after all currently executing RCU 478 * read-side critical sections have completed. RCU read-side critical 479 * sections are delimited by rcu_read_lock() and rcu_read_unlock(), 480 * and may be nested. 481 */ 482extern void call_rcu(struct rcu_head *head, 483 void (*func)(struct rcu_head *head)); 484 485/** 486 * call_rcu_bh - Queue an RCU for invocation after a quicker grace period. 487 * @head: structure to be used for queueing the RCU updates. 488 * @func: actual update function to be invoked after the grace period 489 * 490 * The update function will be invoked some time after a full grace 491 * period elapses, in other words after all currently executing RCU 492 * read-side critical sections have completed. call_rcu_bh() assumes 493 * that the read-side critical sections end on completion of a softirq 494 * handler. This means that read-side critical sections in process 495 * context must not be interrupted by softirqs. This interface is to be 496 * used when most of the read-side critical sections are in softirq context. 497 * RCU read-side critical sections are delimited by : 498 * - rcu_read_lock() and rcu_read_unlock(), if in interrupt context. 499 * OR 500 * - rcu_read_lock_bh() and rcu_read_unlock_bh(), if in process context. 501 * These may be nested. 502 */ 503extern void call_rcu_bh(struct rcu_head *head, 504 void (*func)(struct rcu_head *head)); 505 506#endif /* __LINUX_RCUPDATE_H */