blob: 87bd390df73fb58987d09d281aaf365e65d8a795 [file] [log] [blame]
Linus Torvalds1da177e2005-04-16 15:20:36 -07001/*
Paul E. McKenneya71fca52009-09-18 10:28:19 -07002 * Read-Copy Update mechanism for mutual exclusion
Linus Torvalds1da177e2005-04-16 15:20:36 -07003 *
4 * This program is free software; you can redistribute it and/or modify
5 * it under the terms of the GNU General Public License as published by
6 * the Free Software Foundation; either version 2 of the License, or
7 * (at your option) any later version.
8 *
9 * This program is distributed in the hope that it will be useful,
10 * but WITHOUT ANY WARRANTY; without even the implied warranty of
11 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
12 * GNU General Public License for more details.
13 *
14 * You should have received a copy of the GNU General Public License
15 * along with this program; if not, write to the Free Software
16 * Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
17 *
Paul E. McKenney01c1c662008-01-25 21:08:24 +010018 * Copyright IBM Corporation, 2001
Linus Torvalds1da177e2005-04-16 15:20:36 -070019 *
20 * Author: Dipankar Sarma <dipankar@in.ibm.com>
Paul E. McKenneya71fca52009-09-18 10:28:19 -070021 *
Josh Triplett595182b2006-10-04 02:17:21 -070022 * Based on the original work by Paul McKenney <paulmck@us.ibm.com>
Linus Torvalds1da177e2005-04-16 15:20:36 -070023 * and inputs from Rusty Russell, Andrea Arcangeli and Andi Kleen.
24 * Papers:
25 * http://www.rdrop.com/users/paulmck/paper/rclockpdcsproof.pdf
26 * http://lse.sourceforge.net/locking/rclock_OLS.2001.05.01c.sc.pdf (OLS2001)
27 *
28 * For detailed explanation of Read-Copy Update mechanism see -
Paul E. McKenneya71fca52009-09-18 10:28:19 -070029 * http://lse.sourceforge.net/locking/rcupdate.html
Linus Torvalds1da177e2005-04-16 15:20:36 -070030 *
31 */
32
33#ifndef __LINUX_RCUPDATE_H
34#define __LINUX_RCUPDATE_H
35
Paul E. McKenney99098752011-05-31 21:03:55 -070036#include <linux/types.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070037#include <linux/cache.h>
38#include <linux/spinlock.h>
39#include <linux/threads.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070040#include <linux/cpumask.h>
41#include <linux/seqlock.h>
Peter Zijlstra851a67b2007-10-11 22:11:12 +020042#include <linux/lockdep.h>
Paul E. McKenney4446a362008-05-12 21:21:05 +020043#include <linux/completion.h>
Mathieu Desnoyers551d55a2010-04-17 08:48:42 -040044#include <linux/debugobjects.h>
Paul E. McKenneyca5ecdd2010-04-28 14:39:09 -070045#include <linux/compiler.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070046
#ifdef CONFIG_RCU_TORTURE_TEST
extern int rcutorture_runnable; /* for sysctl */
#endif /* #ifdef CONFIG_RCU_TORTURE_TEST */

/*
 * rcutorture bookkeeping hooks.  The tree-based RCU configurations get
 * out-of-line versions (declared here, defined elsewhere); every other
 * configuration gets empty inline stubs so callers need no #ifdefs.
 */
#if defined(CONFIG_TREE_RCU) || defined(CONFIG_TREE_PREEMPT_RCU)
extern void rcutorture_record_test_transition(void);
extern void rcutorture_record_progress(unsigned long vernum);
#else
static inline void rcutorture_record_test_transition(void)
{
}
static inline void rcutorture_record_progress(unsigned long vernum)
{
}
#endif
62
/*
 * Wraparound-tolerant comparisons: the unsigned difference (a) - (b) is
 * compared against half of the type's range, so "a >= b" holds whenever
 * a is at most half the range ahead of b, modulo overflow.
 * NOTE(review): assumes both arguments are unsigned values of the width
 * named by the macro (unsigned int / unsigned long) -- confirm at callers.
 */
#define UINT_CMP_GE(a, b)	(UINT_MAX / 2 >= (a) - (b))
#define UINT_CMP_LT(a, b)	(UINT_MAX / 2 < (a) - (b))
#define ULONG_CMP_GE(a, b)	(ULONG_MAX / 2 >= (a) - (b))
#define ULONG_CMP_LT(a, b)	(ULONG_MAX / 2 < (a) - (b))
67
/* Exported common interfaces */
extern void call_rcu_sched(struct rcu_head *head,
			   void (*func)(struct rcu_head *rcu));
extern void synchronize_sched(void);
extern void rcu_barrier_bh(void);
extern void rcu_barrier_sched(void);
Paul E. McKenney03b042b2009-06-25 09:08:16 -070074
/* Low-level entry into an RCU-bh read-side section: local_bh_disable(). */
static inline void __rcu_read_lock_bh(void)
{
	local_bh_disable();
}
79
/* Low-level exit from an RCU-bh read-side section: local_bh_enable(). */
static inline void __rcu_read_unlock_bh(void)
{
	local_bh_enable();
}
Paul E. McKenneya6826042009-02-25 18:03:42 -080084
Paul E. McKenneya3dc3fb2010-08-13 16:16:25 -070085#ifdef CONFIG_PREEMPT_RCU
86
extern void __rcu_read_lock(void);
extern void __rcu_read_unlock(void);
void synchronize_rcu(void);

/*
 * Defined as a macro as it is a very low level header included from
 * areas that don't even know about current.  This gives the rcu_read_lock()
 * nesting depth, but makes sense only if CONFIG_PREEMPT_RCU -- in other
 * types of kernel builds, the rcu_read_lock() nesting depth is unknowable.
 */
#define rcu_preempt_depth() (current->rcu_read_lock_nesting)
98
Paul E. McKenney7b0b7592010-08-17 14:18:46 -070099#else /* #ifdef CONFIG_PREEMPT_RCU */
100
/* Non-preemptible RCU: entering a read-side section is preempt_disable(). */
static inline void __rcu_read_lock(void)
{
	preempt_disable();
}
105
/* Non-preemptible RCU: leaving a read-side section is preempt_enable(). */
static inline void __rcu_read_unlock(void)
{
	preempt_enable();
}
110
/* Non-preemptible RCU: synchronize_rcu() simply maps to synchronize_sched(). */
static inline void synchronize_rcu(void)
{
	synchronize_sched();
}
115
/* Without CONFIG_PREEMPT_RCU no nesting depth is tracked: always report 0. */
static inline int rcu_preempt_depth(void)
{
	return 0;
}
120
121#endif /* #else #ifdef CONFIG_PREEMPT_RCU */
122
/* Internal to kernel */
extern void rcu_sched_qs(int cpu);
extern void rcu_bh_qs(int cpu);
extern void rcu_check_callbacks(int cpu, int user);
struct notifier_block;
128
/*
 * Hooks called around dyntick-idle (NO_HZ) periods.  They are real
 * functions only under CONFIG_NO_HZ; otherwise they are empty stubs.
 */
#ifdef CONFIG_NO_HZ

extern void rcu_enter_nohz(void);
extern void rcu_exit_nohz(void);

#else /* #ifdef CONFIG_NO_HZ */

static inline void rcu_enter_nohz(void)
{
}

static inline void rcu_exit_nohz(void)
{
}

#endif /* #else #ifdef CONFIG_NO_HZ */
Paul E. McKenneya3dc3fb2010-08-13 16:16:25 -0700145
Paul E. McKenneyf41d9112009-08-22 13:56:52 -0700146#if defined(CONFIG_TREE_RCU) || defined(CONFIG_TREE_PREEMPT_RCU)
Paul E. McKenney64db4cf2008-12-18 21:55:32 +0100147#include <linux/rcutree.h>
Paul E. McKenneya57eb942010-06-29 16:49:16 -0700148#elif defined(CONFIG_TINY_RCU) || defined(CONFIG_TINY_PREEMPT_RCU)
Paul E. McKenney9b1d82f2009-10-25 19:03:50 -0700149#include <linux/rcutiny.h>
Paul E. McKenney64db4cf2008-12-18 21:55:32 +0100150#else
151#error "Unknown RCU implementation specified to kernel configuration"
Paul E. McKenney6b3ef482009-08-22 13:56:53 -0700152#endif
Paul E. McKenney01c1c662008-01-25 21:08:24 +0100153
Mathieu Desnoyers551d55a2010-04-17 08:48:42 -0400154/*
155 * init_rcu_head_on_stack()/destroy_rcu_head_on_stack() are needed for dynamic
156 * initialization and destruction of rcu_head on the stack. rcu_head structures
157 * allocated dynamically in the heap or defined statically don't need any
158 * initialization.
159 */
#ifdef CONFIG_DEBUG_OBJECTS_RCU_HEAD
extern void init_rcu_head_on_stack(struct rcu_head *head);
extern void destroy_rcu_head_on_stack(struct rcu_head *head);
#else /* !CONFIG_DEBUG_OBJECTS_RCU_HEAD */
/* Without rcu_head debug-object tracking both hooks compile to nothing. */
static inline void init_rcu_head_on_stack(struct rcu_head *head)
{
}

static inline void destroy_rcu_head_on_stack(struct rcu_head *head)
{
}
#endif /* #else !CONFIG_DEBUG_OBJECTS_RCU_HEAD */
Mathieu Desnoyers43760302010-04-17 08:48:39 -0400172
Paul E. McKenneybc33f242009-08-22 13:56:47 -0700173#ifdef CONFIG_DEBUG_LOCK_ALLOC
Paul E. McKenney632ee202010-02-22 17:04:45 -0800174
/*
 * One lockdep map per RCU flavor, plus the acquire/release wrappers that
 * the rcu_read_lock*() / rcu_read_unlock*() families invoke on it.
 */
extern struct lockdep_map rcu_lock_map;
# define rcu_read_acquire() \
		lock_acquire(&rcu_lock_map, 0, 0, 2, 1, NULL, _THIS_IP_)
# define rcu_read_release()	lock_release(&rcu_lock_map, 1, _THIS_IP_)

extern struct lockdep_map rcu_bh_lock_map;
# define rcu_read_acquire_bh() \
		lock_acquire(&rcu_bh_lock_map, 0, 0, 2, 1, NULL, _THIS_IP_)
# define rcu_read_release_bh()	lock_release(&rcu_bh_lock_map, 1, _THIS_IP_)

extern struct lockdep_map rcu_sched_lock_map;
# define rcu_read_acquire_sched() \
		lock_acquire(&rcu_sched_lock_map, 0, 0, 2, 1, NULL, _THIS_IP_)
# define rcu_read_release_sched() \
		lock_release(&rcu_sched_lock_map, 1, _THIS_IP_)

extern int debug_lockdep_rcu_enabled(void);
Paul E. McKenney54dbf962010-03-03 07:46:57 -0800192
Paul E. McKenney632ee202010-02-22 17:04:45 -0800193/**
Paul E. McKenneyca5ecdd2010-04-28 14:39:09 -0700194 * rcu_read_lock_held() - might we be in RCU read-side critical section?
Paul E. McKenney632ee202010-02-22 17:04:45 -0800195 *
Paul E. McKenneyd20200b2010-03-30 10:52:21 -0700196 * If CONFIG_DEBUG_LOCK_ALLOC is selected, returns nonzero iff in an RCU
197 * read-side critical section. In absence of CONFIG_DEBUG_LOCK_ALLOC,
Paul E. McKenney632ee202010-02-22 17:04:45 -0800198 * this assumes we are in an RCU read-side critical section unless it can
Paul E. McKenneyca5ecdd2010-04-28 14:39:09 -0700199 * prove otherwise. This is useful for debug checks in functions that
200 * require that they be called within an RCU read-side critical section.
Paul E. McKenney54dbf962010-03-03 07:46:57 -0800201 *
Paul E. McKenneyca5ecdd2010-04-28 14:39:09 -0700202 * Checks debug_lockdep_rcu_enabled() to prevent false positives during boot
Paul E. McKenney32c141a2010-03-30 10:59:28 -0700203 * and while lockdep is disabled.
Paul E. McKenney632ee202010-02-22 17:04:45 -0800204 */
205static inline int rcu_read_lock_held(void)
206{
Paul E. McKenney54dbf962010-03-03 07:46:57 -0800207 if (!debug_lockdep_rcu_enabled())
208 return 1;
209 return lock_is_held(&rcu_lock_map);
Paul E. McKenney632ee202010-02-22 17:04:45 -0800210}
211
/*
 * rcu_read_lock_bh_held() is defined out of line to avoid #include-file
 * hell.
 */
extern int rcu_read_lock_bh_held(void);
Paul E. McKenney632ee202010-02-22 17:04:45 -0800217
218/**
Paul E. McKenneyca5ecdd2010-04-28 14:39:09 -0700219 * rcu_read_lock_sched_held() - might we be in RCU-sched read-side critical section?
Paul E. McKenney632ee202010-02-22 17:04:45 -0800220 *
Paul E. McKenneyd20200b2010-03-30 10:52:21 -0700221 * If CONFIG_DEBUG_LOCK_ALLOC is selected, returns nonzero iff in an
222 * RCU-sched read-side critical section. In absence of
223 * CONFIG_DEBUG_LOCK_ALLOC, this assumes we are in an RCU-sched read-side
224 * critical section unless it can prove otherwise. Note that disabling
225 * of preemption (including disabling irqs) counts as an RCU-sched
Paul E. McKenneyca5ecdd2010-04-28 14:39:09 -0700226 * read-side critical section. This is useful for debug checks in functions
 * that require that they be called within an RCU-sched read-side
228 * critical section.
Paul E. McKenney54dbf962010-03-03 07:46:57 -0800229 *
Paul E. McKenney32c141a2010-03-30 10:59:28 -0700230 * Check debug_lockdep_rcu_enabled() to prevent false positives during boot
231 * and while lockdep is disabled.
Paul E. McKenney632ee202010-02-22 17:04:45 -0800232 */
Frederic Weisbeckerbdd4e852011-06-08 01:13:27 +0200233#ifdef CONFIG_PREEMPT_COUNT
Paul E. McKenney632ee202010-02-22 17:04:45 -0800234static inline int rcu_read_lock_sched_held(void)
235{
236 int lockdep_opinion = 0;
237
Paul E. McKenney54dbf962010-03-03 07:46:57 -0800238 if (!debug_lockdep_rcu_enabled())
239 return 1;
Paul E. McKenney632ee202010-02-22 17:04:45 -0800240 if (debug_locks)
241 lockdep_opinion = lock_is_held(&rcu_sched_lock_map);
Lai Jiangshan0cff8102010-03-18 12:25:33 -0700242 return lockdep_opinion || preempt_count() != 0 || irqs_disabled();
Paul E. McKenney632ee202010-02-22 17:04:45 -0800243}
Frederic Weisbeckerbdd4e852011-06-08 01:13:27 +0200244#else /* #ifdef CONFIG_PREEMPT_COUNT */
/* No CONFIG_PREEMPT_COUNT: nothing can be disproved, so assume "held". */
static inline int rcu_read_lock_sched_held(void)
{
	return 1;
}
Frederic Weisbeckerbdd4e852011-06-08 01:13:27 +0200249#endif /* #else #ifdef CONFIG_PREEMPT_COUNT */
Paul E. McKenney632ee202010-02-22 17:04:45 -0800250
251#else /* #ifdef CONFIG_DEBUG_LOCK_ALLOC */
252
/* Without CONFIG_DEBUG_LOCK_ALLOC the lockdep annotations are no-ops. */
# define rcu_read_acquire()		do { } while (0)
# define rcu_read_release()		do { } while (0)
# define rcu_read_acquire_bh()		do { } while (0)
# define rcu_read_release_bh()		do { } while (0)
# define rcu_read_acquire_sched()	do { } while (0)
# define rcu_read_release_sched()	do { } while (0)
259
/* No lockdep information available: assume we are inside a reader. */
static inline int rcu_read_lock_held(void)
{
	return 1;
}
264
/* No lockdep information available: assume we are inside an RCU-bh reader. */
static inline int rcu_read_lock_bh_held(void)
{
	return 1;
}
269
Frederic Weisbeckerbdd4e852011-06-08 01:13:27 +0200270#ifdef CONFIG_PREEMPT_COUNT
/* Without lockdep, rely on the preempt count and the irq-disabled state. */
static inline int rcu_read_lock_sched_held(void)
{
	return preempt_count() != 0 || irqs_disabled();
}
Frederic Weisbeckerbdd4e852011-06-08 01:13:27 +0200275#else /* #ifdef CONFIG_PREEMPT_COUNT */
/* Neither lockdep nor a preempt count to consult: assume "held". */
static inline int rcu_read_lock_sched_held(void)
{
	return 1;
}
Frederic Weisbeckerbdd4e852011-06-08 01:13:27 +0200280#endif /* #else #ifdef CONFIG_PREEMPT_COUNT */
Paul E. McKenney632ee202010-02-22 17:04:45 -0800281
282#endif /* #else #ifdef CONFIG_DEBUG_LOCK_ALLOC */
283
284#ifdef CONFIG_PROVE_RCU
285
extern int rcu_my_thread_group_empty(void);

/**
 * rcu_lockdep_assert - emit lockdep splat if specified condition not met
 * @c: condition to check
 * @s: informative message
 *
 * Each expansion owns a private static flag, so a given call site reports
 * at most once.  @c is not evaluated when debug_lockdep_rcu_enabled()
 * returns false or once that site has already reported.
 */
#define rcu_lockdep_assert(c, s)					\
	do {								\
		static bool __warned;					\
		if (debug_lockdep_rcu_enabled() && !__warned && !(c)) {	\
			__warned = true;				\
			lockdep_rcu_suspicious(__FILE__, __LINE__, s);	\
		}							\
	} while (0)
301
/*
 * Complain (via rcu_lockdep_assert()) if the RCU-bh or RCU-sched lockdep
 * map is held at the point where this macro is expanded.
 */
#define rcu_sleep_check()						\
	do {								\
		rcu_lockdep_assert(!lock_is_held(&rcu_bh_lock_map),	\
				   "Illegal context switch in RCU-bh"	\
				   " read-side critical section");	\
		rcu_lockdep_assert(!lock_is_held(&rcu_sched_lock_map),	\
				   "Illegal context switch in RCU-sched"\
				   " read-side critical section");	\
	} while (0)
311
Paul E. McKenneyca5ecdd2010-04-28 14:39:09 -0700312#else /* #ifdef CONFIG_PROVE_RCU */
313
/* !CONFIG_PROVE_RCU: both checks vanish; their arguments are not evaluated. */
#define rcu_lockdep_assert(c, s) do { } while (0)
#define rcu_sleep_check() do { } while (0)
Paul E. McKenneyca5ecdd2010-04-28 14:39:09 -0700316
317#endif /* #else #ifdef CONFIG_PROVE_RCU */
318
319/*
320 * Helper functions for rcu_dereference_check(), rcu_dereference_protected()
321 * and rcu_assign_pointer(). Some of these could be folded into their
322 * callers, but they are left separate in order to ease introduction of
323 * multiple flavors of pointers to match the multiple flavors of RCU
 * (e.g., __rcu_bh, __rcu_sched, and __srcu), should this make sense in
325 * the future.
326 */
Paul E. McKenney53ecfba2010-09-13 17:24:21 -0700327
/*
 * Under __CHECKER__, compare @p with itself cast to the @space address
 * space so that a mismatching annotation is diagnosed; in normal builds
 * this expands to nothing.
 */
#ifdef __CHECKER__
#define rcu_dereference_sparse(p, space) \
	((void)(((typeof(*(p)) space *)(p)) == (p)))
#else /* #ifdef __CHECKER__ */
#define rcu_dereference_sparse(p, space)
#endif /* #else #ifdef __CHECKER__ */
334
/*
 * Fetch @p exactly once via ACCESS_ONCE() and hand it back with the
 * address-space annotation stripped; no read barrier is issued.
 */
#define __rcu_access_pointer(p, space) \
	({ \
		typeof(*(p)) *_________p1 = \
			(typeof(*(p)) *__force)ACCESS_ONCE(p); \
		rcu_dereference_sparse(p, space); \
		((typeof(*(p)) __force __kernel *)(_________p1)); \
	})
/*
 * Fetch @p exactly once, assert condition @c through rcu_lockdep_assert(),
 * and issue smp_read_barrier_depends() before handing the pointer back.
 */
#define __rcu_dereference_check(p, c, space) \
	({ \
		typeof(*(p)) *_________p1 = \
			(typeof(*(p)) *__force)ACCESS_ONCE(p); \
		rcu_lockdep_assert(c, "suspicious rcu_dereference_check()" \
				      " usage"); \
		rcu_dereference_sparse(p, space); \
		smp_read_barrier_depends(); \
		((typeof(*(p)) __force __kernel *)(_________p1)); \
	})
/*
 * Update-side fetch: assert condition @c, then return @p as a plain
 * pointer.  Neither ACCESS_ONCE() nor a read barrier is used here.
 */
#define __rcu_dereference_protected(p, c, space) \
	({ \
		rcu_lockdep_assert(c, "suspicious rcu_dereference_protected()" \
				      " usage"); \
		rcu_dereference_sparse(p, space); \
		((typeof(*(p)) __force __kernel *)(p)); \
	})
357
/*
 * Fetch the index @p exactly once via ACCESS_ONCE(); no read barrier.
 * NOTE(review): rcu_dereference_sparse() dereferences its argument under
 * __CHECKER__, which the rcu_dereference_index_check() documentation says
 * cannot work for integers -- confirm whether this check belongs here.
 */
#define __rcu_access_index(p, space) \
	({ \
		typeof(p) _________p1 = ACCESS_ONCE(p); \
		rcu_dereference_sparse(p, space); \
		(_________p1); \
	})
/*
 * Index flavor of __rcu_dereference_check(): fetch @p once, assert @c,
 * issue smp_read_barrier_depends(); no sparse address-space check.
 */
#define __rcu_dereference_index_check(p, c) \
	({ \
		typeof(p) _________p1 = ACCESS_ONCE(p); \
		rcu_lockdep_assert(c, \
				   "suspicious rcu_dereference_index_check()" \
				   " usage"); \
		smp_read_barrier_depends(); \
		(_________p1); \
	})
/*
 * Publish @v through @p.  smp_wmb() is issued first unless @v is a
 * compile-time constant NULL, the one case this macro exempts from
 * the barrier.
 */
#define __rcu_assign_pointer(p, v, space) \
	({ \
		if (!__builtin_constant_p(v) || \
		    ((v) != NULL)) \
			smp_wmb(); \
		(p) = (typeof(*(v)) __force space *)(v); \
	})
380
381
Paul E. McKenney632ee202010-02-22 17:04:45 -0800382/**
Paul E. McKenneyca5ecdd2010-04-28 14:39:09 -0700383 * rcu_access_pointer() - fetch RCU pointer with no dereferencing
384 * @p: The pointer to read
385 *
386 * Return the value of the specified RCU-protected pointer, but omit the
387 * smp_read_barrier_depends() and keep the ACCESS_ONCE(). This is useful
388 * when the value of this pointer is accessed, but the pointer is not
389 * dereferenced, for example, when testing an RCU-protected pointer against
390 * NULL. Although rcu_access_pointer() may also be used in cases where
391 * update-side locks prevent the value of the pointer from changing, you
392 * should instead use rcu_dereference_protected() for this use case.
393 */
#define rcu_access_pointer(p) __rcu_access_pointer((p), __rcu)
395
396/**
397 * rcu_dereference_check() - rcu_dereference with debug checking
David Howellsc08c68d2010-04-09 15:39:11 -0700398 * @p: The pointer to read, prior to dereferencing
399 * @c: The conditions under which the dereference will take place
Paul E. McKenney632ee202010-02-22 17:04:45 -0800400 *
David Howellsc08c68d2010-04-09 15:39:11 -0700401 * Do an rcu_dereference(), but check that the conditions under which the
Paul E. McKenneyca5ecdd2010-04-28 14:39:09 -0700402 * dereference will take place are correct. Typically the conditions
403 * indicate the various locking conditions that should be held at that
404 * point. The check should return true if the conditions are satisfied.
405 * An implicit check for being in an RCU read-side critical section
406 * (rcu_read_lock()) is included.
David Howellsc08c68d2010-04-09 15:39:11 -0700407 *
408 * For example:
409 *
Paul E. McKenneyca5ecdd2010-04-28 14:39:09 -0700410 * bar = rcu_dereference_check(foo->bar, lockdep_is_held(&foo->lock));
David Howellsc08c68d2010-04-09 15:39:11 -0700411 *
412 * could be used to indicate to lockdep that foo->bar may only be dereferenced
Paul E. McKenneyca5ecdd2010-04-28 14:39:09 -0700413 * if either rcu_read_lock() is held, or that the lock required to replace
David Howellsc08c68d2010-04-09 15:39:11 -0700414 * the bar struct at foo->bar is held.
415 *
416 * Note that the list of conditions may also include indications of when a lock
417 * need not be held, for example during initialisation or destruction of the
418 * target struct:
419 *
Paul E. McKenneyca5ecdd2010-04-28 14:39:09 -0700420 * bar = rcu_dereference_check(foo->bar, lockdep_is_held(&foo->lock) ||
David Howellsc08c68d2010-04-09 15:39:11 -0700421 * atomic_read(&foo->usage) == 0);
Paul E. McKenneyca5ecdd2010-04-28 14:39:09 -0700422 *
423 * Inserts memory barriers on architectures that require them
424 * (currently only the Alpha), prevents the compiler from refetching
425 * (and from merging fetches), and, more importantly, documents exactly
426 * which pointers are protected by RCU and checks that the pointer is
427 * annotated as __rcu.
Paul E. McKenney632ee202010-02-22 17:04:45 -0800428 */
#define rcu_dereference_check(p, c) \
	__rcu_dereference_check((p), rcu_read_lock_held() || (c), __rcu)
Paul E. McKenney632ee202010-02-22 17:04:45 -0800431
Paul E. McKenneyb62730b2010-04-09 15:39:10 -0700432/**
Paul E. McKenneyca5ecdd2010-04-28 14:39:09 -0700433 * rcu_dereference_bh_check() - rcu_dereference_bh with debug checking
434 * @p: The pointer to read, prior to dereferencing
435 * @c: The conditions under which the dereference will take place
436 *
437 * This is the RCU-bh counterpart to rcu_dereference_check().
438 */
#define rcu_dereference_bh_check(p, c) \
	__rcu_dereference_check((p), rcu_read_lock_bh_held() || (c), __rcu)
441
442/**
443 * rcu_dereference_sched_check() - rcu_dereference_sched with debug checking
444 * @p: The pointer to read, prior to dereferencing
445 * @c: The conditions under which the dereference will take place
446 *
447 * This is the RCU-sched counterpart to rcu_dereference_check().
448 */
#define rcu_dereference_sched_check(p, c) \
	__rcu_dereference_check((p), rcu_read_lock_sched_held() || (c), \
				__rcu)
452
#define rcu_dereference_raw(p) rcu_dereference_check(p, 1) /*@@@ needed? @@@*/
454
455/**
Paul E. McKenneya4dd9922011-04-01 07:15:14 -0700456 * rcu_access_index() - fetch RCU index with no dereferencing
457 * @p: The index to read
458 *
459 * Return the value of the specified RCU-protected index, but omit the
460 * smp_read_barrier_depends() and keep the ACCESS_ONCE(). This is useful
461 * when the value of this index is accessed, but the index is not
462 * dereferenced, for example, when testing an RCU-protected index against
463 * -1. Although rcu_access_index() may also be used in cases where
464 * update-side locks prevent the value of the index from changing, you
465 * should instead use rcu_dereference_index_protected() for this use case.
466 */
#define rcu_access_index(p) __rcu_access_index((p), __rcu)
468
469/**
Paul E. McKenneyca5ecdd2010-04-28 14:39:09 -0700470 * rcu_dereference_index_check() - rcu_dereference for indices with debug checking
 * @p: The index to read, prior to using it as an array index
472 * @c: The conditions under which the dereference will take place
473 *
474 * Similar to rcu_dereference_check(), but omits the sparse checking.
475 * This allows rcu_dereference_index_check() to be used on integers,
476 * which can then be used as array indices. Attempting to use
477 * rcu_dereference_check() on an integer will give compiler warnings
478 * because the sparse address-space mechanism relies on dereferencing
479 * the RCU-protected pointer. Dereferencing integers is not something
480 * that even gcc will put up with.
481 *
482 * Note that this function does not implicitly check for RCU read-side
483 * critical sections. If this function gains lots of uses, it might
484 * make sense to provide versions for each flavor of RCU, but it does
485 * not make sense as of early 2010.
486 */
#define rcu_dereference_index_check(p, c) \
	__rcu_dereference_index_check((p), (c))
489
490/**
491 * rcu_dereference_protected() - fetch RCU pointer when updates prevented
492 * @p: The pointer to read, prior to dereferencing
493 * @c: The conditions under which the dereference will take place
Paul E. McKenneyb62730b2010-04-09 15:39:10 -0700494 *
495 * Return the value of the specified RCU-protected pointer, but omit
496 * both the smp_read_barrier_depends() and the ACCESS_ONCE(). This
497 * is useful in cases where update-side locks prevent the value of the
498 * pointer from changing. Please note that this primitive does -not-
499 * prevent the compiler from repeating this reference or combining it
500 * with other references, so it should not be used without protection
501 * of appropriate locks.
Paul E. McKenneyca5ecdd2010-04-28 14:39:09 -0700502 *
503 * This function is only for update-side use. Using this function
504 * when protected only by rcu_read_lock() will result in infrequent
505 * but very ugly failures.
Paul E. McKenneyb62730b2010-04-09 15:39:10 -0700506 */
#define rcu_dereference_protected(p, c) \
	__rcu_dereference_protected((p), (c), __rcu)
Paul E. McKenneybc33f242009-08-22 13:56:47 -0700509
Linus Torvalds1da177e2005-04-16 15:20:36 -0700510/**
Paul E. McKenneyca5ecdd2010-04-28 14:39:09 -0700511 * rcu_dereference_bh_protected() - fetch RCU-bh pointer when updates prevented
512 * @p: The pointer to read, prior to dereferencing
513 * @c: The conditions under which the dereference will take place
Paul E. McKenneyb62730b2010-04-09 15:39:10 -0700514 *
Paul E. McKenneyca5ecdd2010-04-28 14:39:09 -0700515 * This is the RCU-bh counterpart to rcu_dereference_protected().
Paul E. McKenneyb62730b2010-04-09 15:39:10 -0700516 */
#define rcu_dereference_bh_protected(p, c) \
	__rcu_dereference_protected((p), (c), __rcu)
Paul E. McKenneyb62730b2010-04-09 15:39:10 -0700519
520/**
Paul E. McKenneyca5ecdd2010-04-28 14:39:09 -0700521 * rcu_dereference_sched_protected() - fetch RCU-sched pointer when updates prevented
522 * @p: The pointer to read, prior to dereferencing
523 * @c: The conditions under which the dereference will take place
524 *
525 * This is the RCU-sched counterpart to rcu_dereference_protected().
526 */
#define rcu_dereference_sched_protected(p, c) \
	__rcu_dereference_protected((p), (c), __rcu)
529
530
531/**
532 * rcu_dereference() - fetch RCU-protected pointer for dereferencing
533 * @p: The pointer to read, prior to dereferencing
534 *
535 * This is a simple wrapper around rcu_dereference_check().
536 */
#define rcu_dereference(p) rcu_dereference_check(p, 0)
538
/**
 * rcu_dereference_bh() - fetch an RCU-bh-protected pointer for dereferencing
 * @p: The pointer to read, prior to dereferencing
 *
 * Makes rcu_dereference_bh_check() do the dirty work.
 */
#define rcu_dereference_bh(p) rcu_dereference_bh_check(p, 0)
546
/**
 * rcu_dereference_sched() - fetch RCU-sched-protected pointer for dereferencing
 * @p: The pointer to read, prior to dereferencing
 *
 * Makes rcu_dereference_sched_check() do the dirty work.
 */
#define rcu_dereference_sched(p) rcu_dereference_sched_check(p, 0)
554
555/**
556 * rcu_read_lock() - mark the beginning of an RCU read-side critical section
Linus Torvalds1da177e2005-04-16 15:20:36 -0700557 *
Paul E. McKenney9b06e812005-05-01 08:59:04 -0700558 * When synchronize_rcu() is invoked on one CPU while other CPUs
Linus Torvalds1da177e2005-04-16 15:20:36 -0700559 * are within RCU read-side critical sections, then the
Paul E. McKenney9b06e812005-05-01 08:59:04 -0700560 * synchronize_rcu() is guaranteed to block until after all the other
Linus Torvalds1da177e2005-04-16 15:20:36 -0700561 * CPUs exit their critical sections. Similarly, if call_rcu() is invoked
562 * on one CPU while other CPUs are within RCU read-side critical
563 * sections, invocation of the corresponding RCU callback is deferred
 * until after all the other CPUs exit their critical sections.
565 *
566 * Note, however, that RCU callbacks are permitted to run concurrently
Paul E. McKenney77d84852010-07-08 17:38:59 -0700567 * with new RCU read-side critical sections. One way that this can happen
Linus Torvalds1da177e2005-04-16 15:20:36 -0700568 * is via the following sequence of events: (1) CPU 0 enters an RCU
569 * read-side critical section, (2) CPU 1 invokes call_rcu() to register
570 * an RCU callback, (3) CPU 0 exits the RCU read-side critical section,
571 * (4) CPU 2 enters a RCU read-side critical section, (5) the RCU
572 * callback is invoked. This is legal, because the RCU read-side critical
573 * section that was running concurrently with the call_rcu() (and which
574 * therefore might be referencing something that the corresponding RCU
575 * callback would free up) has completed before the corresponding
576 * RCU callback is invoked.
577 *
578 * RCU read-side critical sections may be nested. Any deferred actions
579 * will be deferred until the outermost RCU read-side critical section
580 * completes.
581 *
Paul E. McKenney9079fd72010-08-07 21:59:54 -0700582 * You can avoid reading and understanding the next paragraph by
583 * following this rule: don't put anything in an rcu_read_lock() RCU
584 * read-side critical section that would block in a !PREEMPT kernel.
585 * But if you want the full story, read on!
586 *
587 * In non-preemptible RCU implementations (TREE_RCU and TINY_RCU), it
588 * is illegal to block while in an RCU read-side critical section. In
589 * preemptible RCU implementations (TREE_PREEMPT_RCU and TINY_PREEMPT_RCU)
590 * in CONFIG_PREEMPT kernel builds, RCU read-side critical sections may
591 * be preempted, but explicit blocking is illegal. Finally, in preemptible
592 * RCU implementations in real-time (CONFIG_PREEMPT_RT) kernel builds,
593 * RCU read-side critical sections may be preempted and they may also
594 * block, but only when acquiring spinlocks that are subject to priority
595 * inheritance.
Linus Torvalds1da177e2005-04-16 15:20:36 -0700596 */
Paul E. McKenneybc33f242009-08-22 13:56:47 -0700597static inline void rcu_read_lock(void)
598{
599 __rcu_read_lock();
600 __acquire(RCU);
601 rcu_read_acquire();
602}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700603
Linus Torvalds1da177e2005-04-16 15:20:36 -0700604/*
605 * So where is rcu_write_lock()? It does not exist, as there is no
606 * way for writers to lock out RCU readers. This is a feature, not
607 * a bug -- this property is what provides RCU's performance benefits.
608 * Of course, writers must coordinate with each other. The normal
609 * spinlock primitives work well for this, but any other technique may be
610 * used as well. RCU does not care how the writers keep out of each
611 * others' way, as long as they do so.
612 */
Paul E. McKenney3d76c082009-09-28 07:46:32 -0700613
614/**
Paul E. McKenneyca5ecdd2010-04-28 14:39:09 -0700615 * rcu_read_unlock() - marks the end of an RCU read-side critical section.
Paul E. McKenney3d76c082009-09-28 07:46:32 -0700616 *
617 * See rcu_read_lock() for more information.
618 */
Paul E. McKenneybc33f242009-08-22 13:56:47 -0700619static inline void rcu_read_unlock(void)
620{
621 rcu_read_release();
622 __release(RCU);
623 __rcu_read_unlock();
624}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700625
626/**
Paul E. McKenneyca5ecdd2010-04-28 14:39:09 -0700627 * rcu_read_lock_bh() - mark the beginning of an RCU-bh critical section
Linus Torvalds1da177e2005-04-16 15:20:36 -0700628 *
629 * This is equivalent of rcu_read_lock(), but to be used when updates
Paul E. McKenneyca5ecdd2010-04-28 14:39:09 -0700630 * are being done using call_rcu_bh() or synchronize_rcu_bh(). Since
631 * both call_rcu_bh() and synchronize_rcu_bh() consider completion of a
632 * softirq handler to be a quiescent state, a process in RCU read-side
633 * critical section must be protected by disabling softirqs. Read-side
634 * critical sections in interrupt context can use just rcu_read_lock(),
635 * though this should at least be commented to avoid confusing people
636 * reading the code.
Linus Torvalds1da177e2005-04-16 15:20:36 -0700637 */
Paul E. McKenneybc33f242009-08-22 13:56:47 -0700638static inline void rcu_read_lock_bh(void)
639{
640 __rcu_read_lock_bh();
641 __acquire(RCU_BH);
Paul E. McKenney632ee202010-02-22 17:04:45 -0800642 rcu_read_acquire_bh();
Paul E. McKenneybc33f242009-08-22 13:56:47 -0700643}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700644
645/*
646 * rcu_read_unlock_bh - marks the end of a softirq-only RCU critical section
647 *
648 * See rcu_read_lock_bh() for more information.
649 */
Paul E. McKenneybc33f242009-08-22 13:56:47 -0700650static inline void rcu_read_unlock_bh(void)
651{
Paul E. McKenney632ee202010-02-22 17:04:45 -0800652 rcu_read_release_bh();
Paul E. McKenneybc33f242009-08-22 13:56:47 -0700653 __release(RCU_BH);
654 __rcu_read_unlock_bh();
655}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700656
657/**
Paul E. McKenneyca5ecdd2010-04-28 14:39:09 -0700658 * rcu_read_lock_sched() - mark the beginning of a RCU-sched critical section
Mathieu Desnoyers1c50b722008-09-29 11:06:46 -0400659 *
Paul E. McKenneyca5ecdd2010-04-28 14:39:09 -0700660 * This is equivalent of rcu_read_lock(), but to be used when updates
661 * are being done using call_rcu_sched() or synchronize_rcu_sched().
662 * Read-side critical sections can also be introduced by anything that
663 * disables preemption, including local_irq_disable() and friends.
Mathieu Desnoyers1c50b722008-09-29 11:06:46 -0400664 */
Paul E. McKenneyd6714c22009-08-22 13:56:46 -0700665static inline void rcu_read_lock_sched(void)
666{
667 preempt_disable();
Paul E. McKenneybc33f242009-08-22 13:56:47 -0700668 __acquire(RCU_SCHED);
Paul E. McKenney632ee202010-02-22 17:04:45 -0800669 rcu_read_acquire_sched();
Paul E. McKenneyd6714c22009-08-22 13:56:46 -0700670}
Paul E. McKenney1eba8f82009-09-23 09:50:42 -0700671
672/* Used by lockdep and tracing: cannot be traced, cannot call lockdep. */
Paul E. McKenney7c614d62009-08-24 09:42:00 -0700673static inline notrace void rcu_read_lock_sched_notrace(void)
Paul E. McKenneyd6714c22009-08-22 13:56:46 -0700674{
675 preempt_disable_notrace();
Paul E. McKenneybc33f242009-08-22 13:56:47 -0700676 __acquire(RCU_SCHED);
Paul E. McKenneyd6714c22009-08-22 13:56:46 -0700677}
Mathieu Desnoyers1c50b722008-09-29 11:06:46 -0400678
679/*
680 * rcu_read_unlock_sched - marks the end of a RCU-classic critical section
681 *
682 * See rcu_read_lock_sched for more information.
683 */
Paul E. McKenneyd6714c22009-08-22 13:56:46 -0700684static inline void rcu_read_unlock_sched(void)
685{
Paul E. McKenney632ee202010-02-22 17:04:45 -0800686 rcu_read_release_sched();
Paul E. McKenneybc33f242009-08-22 13:56:47 -0700687 __release(RCU_SCHED);
Paul E. McKenneyd6714c22009-08-22 13:56:46 -0700688 preempt_enable();
689}
Paul E. McKenney1eba8f82009-09-23 09:50:42 -0700690
691/* Used by lockdep and tracing: cannot be traced, cannot call lockdep. */
Paul E. McKenney7c614d62009-08-24 09:42:00 -0700692static inline notrace void rcu_read_unlock_sched_notrace(void)
Paul E. McKenneyd6714c22009-08-22 13:56:46 -0700693{
Paul E. McKenneybc33f242009-08-22 13:56:47 -0700694 __release(RCU_SCHED);
Paul E. McKenneyd6714c22009-08-22 13:56:46 -0700695 preempt_enable_notrace();
696}
Mathieu Desnoyers1c50b722008-09-29 11:06:46 -0400697
/**
 * rcu_assign_pointer() - assign to RCU-protected pointer
 * @p: pointer to assign to
 * @v: value to assign (publish)
 *
 * Assigns the specified value to the specified RCU-protected
 * pointer, ensuring that any concurrent RCU readers will see
 * any prior initialization.  Returns the value assigned.
 *
 * Inserts memory barriers on architectures that require them
 * (pretty much all of them other than x86), and also prevents
 * the compiler from reordering the code that initializes the
 * structure after the pointer assignment.  More importantly, this
 * call documents which pointers will be dereferenced by RCU read-side
 * code.
 */
#define rcu_assign_pointer(p, v) \
	__rcu_assign_pointer((p), (v), __rcu)

/**
 * RCU_INIT_POINTER() - initialize an RCU protected pointer
 * @p: pointer to initialize (an lvalue)
 * @v: value to store in @p
 *
 * Initialize an RCU-protected pointer in such a way to avoid RCU-lockdep
 * splats.  This expands to a plain assignment of @v, cast to the
 * __rcu-qualified pointer type, with nothing else around it.
 *
 * Both arguments are parenthesized in the expansion so that compound
 * expressions (for example a conditional expression passed as @v) are
 * handled as a unit, both inside typeof() and in the assignment itself.
 */
#define RCU_INIT_POINTER(p, v) \
	((p) = (typeof(*(v)) __force __rcu *)(v))

Paul E. McKenney4446a362008-05-12 21:21:05 +0200726/* Infrastructure to implement the synchronize_() primitives. */
727
728struct rcu_synchronize {
729 struct rcu_head head;
730 struct completion completion;
731};
732
733extern void wakeme_after_rcu(struct rcu_head *head);
734
#ifdef CONFIG_PREEMPT_RCU

/**
 * call_rcu() - Queue an RCU callback for invocation after a grace period.
 * @head: structure to be used for queueing the RCU updates.
 * @func: actual callback function to be invoked after the grace period
 *
 * The callback function will be invoked some time after a full grace
 * period elapses, in other words after all pre-existing RCU read-side
 * critical sections have completed.  However, the callback function
 * might well execute concurrently with RCU read-side critical sections
 * that started after call_rcu() was invoked.  RCU read-side critical
 * sections are delimited by rcu_read_lock() and rcu_read_unlock(),
 * and may be nested.
 */
extern void call_rcu(struct rcu_head *head,
		     void (*func)(struct rcu_head *head));

#else /* #ifdef CONFIG_PREEMPT_RCU */

/* In classic RCU, call_rcu() is just call_rcu_sched(). */
#define	call_rcu	call_rcu_sched

#endif /* #else #ifdef CONFIG_PREEMPT_RCU */

/**
 * call_rcu_bh() - Queue an RCU callback for invocation after a quicker grace period.
 * @head: structure to be used for queueing the RCU updates.
 * @func: actual callback function to be invoked after the grace period
 *
 * The callback function will be invoked some time after a full grace
 * period elapses, in other words after all currently executing RCU
 * read-side critical sections have completed.  call_rcu_bh() assumes
 * that the read-side critical sections end on completion of a softirq
 * handler.  This means that read-side critical sections in process
 * context must not be interrupted by softirqs.  This interface is to be
 * used when most of the read-side critical sections are in softirq context.
 * RCU read-side critical sections are delimited by:
 *  - rcu_read_lock() and rcu_read_unlock(), if in interrupt context.
 *  OR
 *  - rcu_read_lock_bh() and rcu_read_unlock_bh(), if in process context.
 *  These may be nested.
 */
extern void call_rcu_bh(struct rcu_head *head,
			void (*func)(struct rcu_head *head));

/*
 * debug_rcu_head_queue()/debug_rcu_head_unqueue() are used internally
 * by call_rcu() and rcu callback execution, and are therefore not part of the
 * RCU API. Leaving in rcupdate.h because they are used by all RCU flavors.
 *
 * With CONFIG_DEBUG_OBJECTS_RCU_HEAD they track each rcu_head through the
 * READY -> QUEUED -> READY states; without it they compile to nothing.
 */

#ifdef CONFIG_DEBUG_OBJECTS_RCU_HEAD
# define STATE_RCU_HEAD_READY	0
# define STATE_RCU_HEAD_QUEUED	1

extern struct debug_obj_descr rcuhead_debug_descr;

static inline void debug_rcu_head_queue(struct rcu_head *head)
{
	/* Warn (once) if either of the two low-order address bits is set. */
	WARN_ON_ONCE((unsigned long)head & 0x3);
	debug_object_activate(head, &rcuhead_debug_descr);
	debug_object_active_state(head, &rcuhead_debug_descr,
				  STATE_RCU_HEAD_READY,
				  STATE_RCU_HEAD_QUEUED);
}

static inline void debug_rcu_head_unqueue(struct rcu_head *head)
{
	/* Reverse of debug_rcu_head_queue(): QUEUED -> READY, then deactivate. */
	debug_object_active_state(head, &rcuhead_debug_descr,
				  STATE_RCU_HEAD_QUEUED,
				  STATE_RCU_HEAD_READY);
	debug_object_deactivate(head, &rcuhead_debug_descr);
}
#else	/* !CONFIG_DEBUG_OBJECTS_RCU_HEAD */
static inline void debug_rcu_head_queue(struct rcu_head *head)
{
}

static inline void debug_rcu_head_unqueue(struct rcu_head *head)
{
}
#endif	/* #else !CONFIG_DEBUG_OBJECTS_RCU_HEAD */

Lai Jiangshan9ab15442011-03-18 11:15:47 +0800819static __always_inline bool __is_kfree_rcu_offset(unsigned long offset)
820{
821 return offset < 4096;
822}
823
824static __always_inline
825void __kfree_rcu(struct rcu_head *head, unsigned long offset)
826{
827 typedef void (*rcu_callback)(struct rcu_head *);
828
829 BUILD_BUG_ON(!__builtin_constant_p(offset));
830
831 /* See the kfree_rcu() header comment. */
832 BUILD_BUG_ON(!__is_kfree_rcu_offset(offset));
833
834 call_rcu(head, (rcu_callback)offset);
835}
836
837extern void kfree(const void *);
838
839static inline void __rcu_reclaim(struct rcu_head *head)
840{
841 unsigned long offset = (unsigned long)head->func;
842
843 if (__is_kfree_rcu_offset(offset))
844 kfree((void *)head - offset);
845 else
846 head->func(head);
847}
848
849/**
850 * kfree_rcu() - kfree an object after a grace period.
851 * @ptr: pointer to kfree
852 * @rcu_head: the name of the struct rcu_head within the type of @ptr.
853 *
854 * Many rcu callbacks functions just call kfree() on the base structure.
855 * These functions are trivial, but their size adds up, and furthermore
856 * when they are used in a kernel module, that module must invoke the
857 * high-latency rcu_barrier() function at module-unload time.
858 *
859 * The kfree_rcu() function handles this issue. Rather than encoding a
860 * function address in the embedded rcu_head structure, kfree_rcu() instead
861 * encodes the offset of the rcu_head structure within the base structure.
862 * Because the functions are not allowed in the low-order 4096 bytes of
863 * kernel virtual memory, offsets up to 4095 bytes can be accommodated.
864 * If the offset is larger than 4095 bytes, a compile-time error will
865 * be generated in __kfree_rcu(). If this error is triggered, you can
866 * either fall back to use of call_rcu() or rearrange the structure to
867 * position the rcu_head structure into the first 4096 bytes.
868 *
869 * Note that the allowable offset might decrease in the future, for example,
870 * to allow something like kmem_cache_free_rcu().
871 */
872#define kfree_rcu(ptr, rcu_head) \
873 __kfree_rcu(&((ptr)->rcu_head), offsetof(typeof(*(ptr)), rcu_head))
874
Linus Torvalds1da177e2005-04-16 15:20:36 -0700875#endif /* __LINUX_RCUPDATE_H */