]> bbs.cooldavid.org Git - net-next-2.6.git/blame - include/linux/rcupdate.h
rcu: refactor RCU's context-switch handling
[net-next-2.6.git] / include / linux / rcupdate.h
CommitLineData
1da177e4 1/*
a71fca58 2 * Read-Copy Update mechanism for mutual exclusion
1da177e4
LT
3 *
4 * This program is free software; you can redistribute it and/or modify
5 * it under the terms of the GNU General Public License as published by
6 * the Free Software Foundation; either version 2 of the License, or
7 * (at your option) any later version.
8 *
9 * This program is distributed in the hope that it will be useful,
10 * but WITHOUT ANY WARRANTY; without even the implied warranty of
11 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
12 * GNU General Public License for more details.
13 *
14 * You should have received a copy of the GNU General Public License
15 * along with this program; if not, write to the Free Software
16 * Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
17 *
01c1c660 18 * Copyright IBM Corporation, 2001
1da177e4
LT
19 *
20 * Author: Dipankar Sarma <dipankar@in.ibm.com>
a71fca58 21 *
595182bc 22 * Based on the original work by Paul McKenney <paulmck@us.ibm.com>
1da177e4
LT
23 * and inputs from Rusty Russell, Andrea Arcangeli and Andi Kleen.
24 * Papers:
25 * http://www.rdrop.com/users/paulmck/paper/rclockpdcsproof.pdf
26 * http://lse.sourceforge.net/locking/rclock_OLS.2001.05.01c.sc.pdf (OLS2001)
27 *
28 * For detailed explanation of Read-Copy Update mechanism see -
a71fca58 29 * http://lse.sourceforge.net/locking/rcupdate.html
1da177e4
LT
30 *
31 */
32
33#ifndef __LINUX_RCUPDATE_H
34#define __LINUX_RCUPDATE_H
35
1da177e4
LT
36#include <linux/cache.h>
37#include <linux/spinlock.h>
38#include <linux/threads.h>
1da177e4
LT
39#include <linux/cpumask.h>
40#include <linux/seqlock.h>
851a67b8 41#include <linux/lockdep.h>
4446a36f 42#include <linux/completion.h>
1da177e4 43
e5ab6772
DY
#if defined(CONFIG_RCU_TORTURE_TEST)
/* Declared in this header so that the sysctl code can reference it. */
extern int rcutorture_runnable;
#endif /* #if defined(CONFIG_RCU_TORTURE_TEST) */
47
1da177e4
LT
/**
 * struct rcu_head - callback structure for use with RCU
 * @next: next update request in the list
 * @func: update function to call once the grace period is over; it is
 *	  handed a pointer to this rcu_head
 */
struct rcu_head {
	struct rcu_head *next;
	void (*func)(struct rcu_head *head);
};
57
/*
 * Exported common interfaces.
 */
extern void rcu_barrier(void);
extern void rcu_barrier_bh(void);
extern void rcu_barrier_sched(void);
extern void synchronize_sched_expedited(void);
extern int sched_expedited_torture_stats(char *page);

/*
 * Internal to kernel.
 */
extern void rcu_init(void);
extern int rcu_scheduler_active;
extern void rcu_scheduler_starting(void);
a6826048 69
f41d911f 70#if defined(CONFIG_TREE_RCU) || defined(CONFIG_TREE_PREEMPT_RCU)
64db4cff 71#include <linux/rcutree.h>
2c28e245 72#elif defined(CONFIG_TINY_RCU)
9b1d82fa 73#include <linux/rcutiny.h>
64db4cff
PM
74#else
75#error "Unknown RCU implementation specified to kernel configuration"
6b3ef48a 76#endif
01c1c660 77
/* Static initializer: an rcu_head with no successor and no callback. */
#define RCU_HEAD_INIT	{ .next = NULL, .func = NULL }

/* Define a struct rcu_head variable called @head, statically initialized. */
#define RCU_HEAD(head) struct rcu_head head = RCU_HEAD_INIT

/*
 * Run-time counterpart of RCU_HEAD_INIT: clear both fields of the
 * rcu_head that @ptr points to.
 *
 * @ptr is copied into a local first so that it is evaluated exactly once;
 * an argument with side effects (for example "p++") therefore behaves as
 * it would for a function call.
 */
#define INIT_RCU_HEAD(ptr) do { \
	struct rcu_head *__rcu_head_ptr = (ptr); \
	__rcu_head_ptr->next = NULL; \
	__rcu_head_ptr->func = NULL; \
} while (0)
83
bc33f24b 84#ifdef CONFIG_DEBUG_LOCK_ALLOC
632ee200 85
/*
 * Lockdep annotations for the three read-side flavors.  Each flavor has
 * its own lockdep_map; the *_acquire() macro is used on entry to a
 * read-side critical section and the matching *_release() on exit.
 */
extern struct lockdep_map rcu_lock_map;
# define rcu_read_acquire() \
		lock_acquire(&rcu_lock_map, 0, 0, 2, 1, NULL, _THIS_IP_)
# define rcu_read_release() \
		lock_release(&rcu_lock_map, 1, _THIS_IP_)

extern struct lockdep_map rcu_bh_lock_map;
# define rcu_read_acquire_bh() \
		lock_acquire(&rcu_bh_lock_map, 0, 0, 2, 1, NULL, _THIS_IP_)
# define rcu_read_release_bh() \
		lock_release(&rcu_bh_lock_map, 1, _THIS_IP_)

extern struct lockdep_map rcu_sched_lock_map;
# define rcu_read_acquire_sched() \
		lock_acquire(&rcu_sched_lock_map, 0, 0, 2, 1, NULL, _THIS_IP_)
# define rcu_read_release_sched() \
		lock_release(&rcu_sched_lock_map, 1, _THIS_IP_)

/* Consulted by the *_held() helpers and by the dereference checks. */
extern int debug_lockdep_rcu_enabled(void);
54dbf96c 103
632ee200
PM
104/**
105 * rcu_read_lock_held - might we be in RCU read-side critical section?
106 *
d20200b5
PM
107 * If CONFIG_DEBUG_LOCK_ALLOC is selected, returns nonzero iff in an RCU
108 * read-side critical section. In absence of CONFIG_DEBUG_LOCK_ALLOC,
632ee200
PM
109 * this assumes we are in an RCU read-side critical section unless it can
110 * prove otherwise.
54dbf96c 111 *
32c141a0
PM
112 * Check debug_lockdep_rcu_enabled() to prevent false positives during boot
113 * and while lockdep is disabled.
632ee200
PM
114 */
115static inline int rcu_read_lock_held(void)
116{
54dbf96c
PM
117 if (!debug_lockdep_rcu_enabled())
118 return 1;
119 return lock_is_held(&rcu_lock_map);
632ee200
PM
120}
121
e3818b8d
PM
/*
 * rcu_read_lock_bh_held() lives out of line: defining it here would drag
 * in more headers and lead to #include-file hell.
 */
extern int rcu_read_lock_bh_held(void);
632ee200
PM
127
128/**
129 * rcu_read_lock_sched_held - might we be in RCU-sched read-side critical section?
130 *
d20200b5
PM
131 * If CONFIG_DEBUG_LOCK_ALLOC is selected, returns nonzero iff in an
132 * RCU-sched read-side critical section. In absence of
133 * CONFIG_DEBUG_LOCK_ALLOC, this assumes we are in an RCU-sched read-side
134 * critical section unless it can prove otherwise. Note that disabling
135 * of preemption (including disabling irqs) counts as an RCU-sched
136 * read-side critical section.
54dbf96c 137 *
32c141a0
PM
138 * Check debug_lockdep_rcu_enabled() to prevent false positives during boot
139 * and while lockdep is disabled.
632ee200 140 */
#ifdef CONFIG_PREEMPT
static inline int rcu_read_lock_sched_held(void)
{
	int held_per_lockdep;

	/* Checking not enabled: assume we are in a critical section. */
	if (!debug_lockdep_rcu_enabled())
		return 1;

	/* Ask lockdep only while debug_locks is still set. */
	held_per_lockdep = debug_locks ?
				lock_is_held(&rcu_sched_lock_map) : 0;
	if (held_per_lockdep)
		return 1;

	/* Disabled preemption or disabled irqs also count as RCU-sched. */
	return preempt_count() != 0 || irqs_disabled();
}
#else /* #ifdef CONFIG_PREEMPT */
static inline int rcu_read_lock_sched_held(void)
{
	/* This configuration always reports "held". */
	return 1;
}
#endif /* #else #ifdef CONFIG_PREEMPT */
632ee200
PM
158
159#else /* #ifdef CONFIG_DEBUG_LOCK_ALLOC */
160
/* Without CONFIG_DEBUG_LOCK_ALLOC the lockdep annotations are no-ops. */
# define rcu_read_acquire()		do { } while (0)
# define rcu_read_release()		do { } while (0)
# define rcu_read_acquire_bh()		do { } while (0)
# define rcu_read_release_bh()		do { } while (0)
# define rcu_read_acquire_sched()	do { } while (0)
# define rcu_read_release_sched()	do { } while (0)
167
static inline int rcu_read_lock_held(void)
{
	/* No lockdep state to consult in this configuration. */
	return 1;
}
172
static inline int rcu_read_lock_bh_held(void)
{
	/* No lockdep state to consult in this configuration. */
	return 1;
}
177
#ifdef CONFIG_PREEMPT
static inline int rcu_read_lock_sched_held(void)
{
	/* Until rcu_scheduler_active is set, always report "held". */
	if (!rcu_scheduler_active)
		return 1;

	/* Disabled preemption or disabled irqs count as RCU-sched. */
	return preempt_count() != 0 || irqs_disabled();
}
#else /* #ifdef CONFIG_PREEMPT */
static inline int rcu_read_lock_sched_held(void)
{
	/* This configuration always reports "held". */
	return 1;
}
#endif /* #else #ifdef CONFIG_PREEMPT */
632ee200
PM
189
190#endif /* #else #ifdef CONFIG_DEBUG_LOCK_ALLOC */
191
192#ifdef CONFIG_PROVE_RCU
193
ee84b824
PM
extern int rcu_my_thread_group_empty(void);

/*
 * Complain through lockdep_rcu_dereference() when condition @c is false.
 * @c is evaluated only while debug_lockdep_rcu_enabled() returns nonzero
 * and this expansion has not warned yet; the static flag limits each
 * expansion of the macro to a single report.
 */
#define __do_rcu_dereference_check(c)					\
	do {								\
		static bool __warned;					\
									\
		if (debug_lockdep_rcu_enabled() && !__warned && !(c)) {	\
			__warned = true;				\
			lockdep_rcu_dereference(__FILE__, __LINE__);	\
		}							\
	} while (0)
204
632ee200
PM
/**
 * rcu_dereference_check - rcu_dereference with debug checking
 * @p: The pointer to read, prior to dereferencing
 * @c: The conditions under which the dereference will take place
 *
 * Do an rcu_dereference(), but also check that the conditions under which
 * the dereference takes place are correct.  Typically @c describes the
 * locking conditions that should hold at that point; it should evaluate
 * to true when those conditions are satisfied.
 *
 * For example:
 *
 *	bar = rcu_dereference_check(foo->bar, rcu_read_lock_held() ||
 *					      lockdep_is_held(&foo->lock));
 *
 * could be used to indicate to lockdep that foo->bar may only be
 * dereferenced if either the RCU read lock is held, or the lock required
 * to replace the bar struct at foo->bar is held.
 *
 * The list of conditions may also include indications of when a lock need
 * not be held, for example during initialisation or destruction of the
 * target struct:
 *
 *	bar = rcu_dereference_check(foo->bar, rcu_read_lock_held() ||
 *					      lockdep_is_held(&foo->lock) ||
 *					      atomic_read(&foo->usage) == 0);
 */
#define rcu_dereference_check(p, c)					\
	({								\
		__do_rcu_dereference_check(c);				\
		rcu_dereference_raw(p);					\
	})
237
b62730ba
PM
/**
 * rcu_dereference_protected - fetch RCU pointer when updates prevented
 * @p: The pointer to read
 * @c: The conditions under which the read will take place
 *
 * Return the value of the specified RCU-protected pointer, omitting both
 * the smp_read_barrier_depends() and the ACCESS_ONCE().  This is useful
 * in cases where update-side locks prevent the value of the pointer from
 * changing.  Please note that this primitive does -not- prevent the
 * compiler from repeating this reference or combining it with other
 * references, so it should not be used without protection of appropriate
 * locks.
 */
#define rcu_dereference_protected(p, c)					\
	({								\
		__do_rcu_dereference_check(c);				\
		(p);							\
	})
254
632ee200
PM
255#else /* #ifdef CONFIG_PROVE_RCU */
256
/* Without CONFIG_PROVE_RCU the condition argument is simply dropped. */
#define rcu_dereference_check(p, c)	rcu_dereference_raw(p)
#define rcu_dereference_protected(p, c)	(p)
632ee200
PM
259
260#endif /* #else #ifdef CONFIG_PROVE_RCU */
bc33f24b 261
b62730ba
PM
/**
 * rcu_access_pointer - fetch RCU pointer with no dereferencing
 * @p: The pointer to read
 *
 * Return the value of the specified RCU-protected pointer, omitting the
 * smp_read_barrier_depends() but keeping the ACCESS_ONCE().  This is
 * useful when the value of the pointer is accessed but the pointer is not
 * dereferenced, for example, when testing an RCU-protected pointer
 * against NULL.  It may also be used in cases where update-side locks
 * prevent the value of the pointer from changing, although
 * rcu_dereference_protected() is a lighter-weight primitive for that use
 * case.
 */
#define rcu_access_pointer(p)	ACCESS_ONCE(p)
274
1da177e4
LT
275/**
276 * rcu_read_lock - mark the beginning of an RCU read-side critical section.
277 *
9b06e818 278 * When synchronize_rcu() is invoked on one CPU while other CPUs
1da177e4 279 * are within RCU read-side critical sections, then the
9b06e818 280 * synchronize_rcu() is guaranteed to block until after all the other
1da177e4
LT
281 * CPUs exit their critical sections. Similarly, if call_rcu() is invoked
282 * on one CPU while other CPUs are within RCU read-side critical
283 * sections, invocation of the corresponding RCU callback is deferred
284 * until after all the other CPUs exit their critical sections.
285 *
286 * Note, however, that RCU callbacks are permitted to run concurrently
287 * with RCU read-side critical sections. One way that this can happen
288 * is via the following sequence of events: (1) CPU 0 enters an RCU
289 * read-side critical section, (2) CPU 1 invokes call_rcu() to register
290 * an RCU callback, (3) CPU 0 exits the RCU read-side critical section,
291 * (4) CPU 2 enters an RCU read-side critical section, (5) the RCU
292 * callback is invoked. This is legal, because the RCU read-side critical
293 * section that was running concurrently with the call_rcu() (and which
294 * therefore might be referencing something that the corresponding RCU
295 * callback would free up) has completed before the corresponding
296 * RCU callback is invoked.
297 *
298 * RCU read-side critical sections may be nested. Any deferred actions
299 * will be deferred until the outermost RCU read-side critical section
300 * completes.
301 *
302 * It is illegal to block while in an RCU read-side critical section.
303 */
bc33f24b
PM
304static inline void rcu_read_lock(void)
305{
306 __rcu_read_lock();
307 __acquire(RCU);
308 rcu_read_acquire();
309}
1da177e4 310
1da177e4
LT
311/*
312 * So where is rcu_write_lock()? It does not exist, as there is no
313 * way for writers to lock out RCU readers. This is a feature, not
314 * a bug -- this property is what provides RCU's performance benefits.
315 * Of course, writers must coordinate with each other. The normal
316 * spinlock primitives work well for this, but any other technique may be
317 * used as well. RCU does not care how the writers keep out of each
318 * others' way, as long as they do so.
319 */
3d76c082
PM
320
321/**
322 * rcu_read_unlock - marks the end of an RCU read-side critical section.
323 *
324 * See rcu_read_lock() for more information.
325 */
bc33f24b
PM
326static inline void rcu_read_unlock(void)
327{
328 rcu_read_release();
329 __release(RCU);
330 __rcu_read_unlock();
331}
1da177e4
LT
332
333/**
334 * rcu_read_lock_bh - mark the beginning of a softirq-only RCU critical section
335 *
336 * This is equivalent of rcu_read_lock(), but to be used when updates
337 * are being done using call_rcu_bh(). Since call_rcu_bh() callbacks
338 * consider completion of a softirq handler to be a quiescent state,
339 * a process in RCU read-side critical section must be protected by
340 * disabling softirqs. Read-side critical sections in interrupt context
341 * can use just rcu_read_lock().
342 *
343 */
bc33f24b
PM
344static inline void rcu_read_lock_bh(void)
345{
346 __rcu_read_lock_bh();
347 __acquire(RCU_BH);
632ee200 348 rcu_read_acquire_bh();
bc33f24b 349}
1da177e4
LT
350
351/*
352 * rcu_read_unlock_bh - marks the end of a softirq-only RCU critical section
353 *
354 * See rcu_read_lock_bh() for more information.
355 */
bc33f24b
PM
356static inline void rcu_read_unlock_bh(void)
357{
632ee200 358 rcu_read_release_bh();
bc33f24b
PM
359 __release(RCU_BH);
360 __rcu_read_unlock_bh();
361}
1da177e4 362
1c50b728
MD
363/**
364 * rcu_read_lock_sched - mark the beginning of a RCU-classic critical section
365 *
366 * Should be used with either
367 * - synchronize_sched()
368 * or
369 * - call_rcu_sched() and rcu_barrier_sched()
370 * on the write-side to insure proper synchronization.
371 */
d6714c22
PM
372static inline void rcu_read_lock_sched(void)
373{
374 preempt_disable();
bc33f24b 375 __acquire(RCU_SCHED);
632ee200 376 rcu_read_acquire_sched();
d6714c22 377}
1eba8f84
PM
378
379/* Used by lockdep and tracing: cannot be traced, cannot call lockdep. */
7c614d64 380static inline notrace void rcu_read_lock_sched_notrace(void)
d6714c22
PM
381{
382 preempt_disable_notrace();
bc33f24b 383 __acquire(RCU_SCHED);
d6714c22 384}
1c50b728
MD
385
386/*
387 * rcu_read_unlock_sched - marks the end of a RCU-classic critical section
388 *
389 * See rcu_read_lock_sched for more information.
390 */
d6714c22
PM
391static inline void rcu_read_unlock_sched(void)
392{
632ee200 393 rcu_read_release_sched();
bc33f24b 394 __release(RCU_SCHED);
d6714c22
PM
395 preempt_enable();
396}
1eba8f84
PM
397
398/* Used by lockdep and tracing: cannot be traced, cannot call lockdep. */
7c614d64 399static inline notrace void rcu_read_unlock_sched_notrace(void)
d6714c22 400{
bc33f24b 401 __release(RCU_SCHED);
d6714c22
PM
402 preempt_enable_notrace();
403}
1c50b728
MD
404
405
/**
 * rcu_dereference_raw - fetch an RCU-protected pointer
 * @p: The pointer to read, prior to dereferencing
 *
 * The caller must be within some flavor of RCU read-side critical
 * section, or must otherwise be preventing the pointer from changing, for
 * example, by holding an appropriate lock.  The returned pointer may later
 * be safely dereferenced.  Doing the right thing is entirely the caller's
 * responsibility, as this primitive does no checking of any kind.
 *
 * Inserts memory barriers on architectures that require them (currently
 * only the Alpha), and, more importantly, documents exactly which
 * pointers are protected by RCU.
 */
#define rcu_dereference_raw(p)						\
	({								\
		typeof(p) _________p1 = ACCESS_ONCE(p);			\
		smp_read_barrier_depends();				\
		(_________p1);						\
	})
424
c26d34a5
PM
/**
 * rcu_dereference - fetch an RCU-protected pointer, checking for RCU
 * @p: The pointer to read, prior to dereferencing
 *
 * Makes rcu_dereference_check() do the dirty work, with
 * rcu_read_lock_held() as the condition.
 */
#define rcu_dereference(p)	rcu_dereference_check(p, rcu_read_lock_held())
432
/**
 * rcu_dereference_bh - fetch an RCU-protected pointer, checking for RCU-bh
 * @p: The pointer to read, prior to dereferencing
 *
 * Makes rcu_dereference_check() do the dirty work, with
 * rcu_read_lock_bh_held() as the condition.
 */
#define rcu_dereference_bh(p)						\
	rcu_dereference_check(p, rcu_read_lock_bh_held())
440
/**
 * rcu_dereference_sched - fetch RCU-protected pointer, checking for RCU-sched
 * @p: The pointer to read, prior to dereferencing
 *
 * Makes rcu_dereference_check() do the dirty work, with
 * rcu_read_lock_sched_held() as the condition.
 */
#define rcu_dereference_sched(p)					\
	rcu_dereference_check(p, rcu_read_lock_sched_held())
448
1da177e4
LT
/**
 * rcu_assign_pointer - assign (publicize) a pointer to a newly
 * initialized structure that will be dereferenced by RCU read-side
 * critical sections.  Returns the value assigned.
 * @p: The pointer to assign to
 * @v: The value to assign (publish)
 *
 * Inserts memory barriers on architectures that require them (pretty much
 * all of them other than x86), and also prevents the compiler from
 * reordering the code that initializes the structure after the pointer
 * assignment.  More importantly, this call documents which pointers will
 * be dereferenced by RCU read-side code.
 *
 * The barrier is skipped only when @v is a compile-time constant NULL.
 */
#define rcu_assign_pointer(p, v)					\
	({								\
		if (!(__builtin_constant_p(v) && ((v) == NULL)))	\
			smp_wmb();					\
		(p) = (v);						\
	})
1da177e4 469
4446a36f
PM
470/* Infrastructure to implement the synchronize_() primitives. */
471
472struct rcu_synchronize {
473 struct rcu_head head;
474 struct completion completion;
475};
476
477extern void wakeme_after_rcu(struct rcu_head *head);
478
01c1c660
PM
/**
 * call_rcu - Queue an RCU callback for invocation after a grace period.
 * @head: structure to be used for queueing the RCU updates.
 * @func: actual update function to be invoked after the grace period
 *
 * The update function will be invoked some time after a full grace period
 * elapses, in other words after all currently executing RCU read-side
 * critical sections have completed.  RCU read-side critical sections are
 * delimited by rcu_read_lock() and rcu_read_unlock(), and may be nested.
 */
extern void call_rcu(struct rcu_head *head,
		     void (*func)(struct rcu_head *head));
492
/**
 * call_rcu_bh - Queue an RCU callback for invocation after a quicker
 * grace period.
 * @head: structure to be used for queueing the RCU updates.
 * @func: actual update function to be invoked after the grace period
 *
 * The update function will be invoked some time after a full grace period
 * elapses, in other words after all currently executing RCU read-side
 * critical sections have completed.  call_rcu_bh() assumes that the
 * read-side critical sections end on completion of a softirq handler.
 * This means that read-side critical sections in process context must not
 * be interrupted by softirqs.  This interface is to be used when most of
 * the read-side critical sections are in softirq context.
 *
 * RCU read-side critical sections are delimited by:
 *  - rcu_read_lock() and rcu_read_unlock(), if in interrupt context,
 *  OR
 *  - rcu_read_lock_bh() and rcu_read_unlock_bh(), if in process context.
 * These may be nested.
 */
extern void call_rcu_bh(struct rcu_head *head,
			void (*func)(struct rcu_head *head));
513
1da177e4 514#endif /* __LINUX_RCUPDATE_H */