blob: 77b86be8ce4f66fc2dea72d164004e485cb28558 [file] [log] [blame]
Linus Torvalds1da177e2005-04-16 15:20:36 -07001#ifndef __LINUX_PERCPU_H
2#define __LINUX_PERCPU_H
Martin Peschke7ff6f082006-09-25 23:31:21 -07003
Robert P. J. Day0a3021f2007-07-15 23:39:57 -07004#include <linux/preempt.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -07005#include <linux/slab.h> /* For kmalloc() */
6#include <linux/smp.h>
Martin Peschke7ff6f082006-09-25 23:31:21 -07007#include <linux/cpumask.h>
Tejun Heo6a242902009-03-06 14:33:58 +09008#include <linux/pfn.h>
Martin Peschke7ff6f082006-09-25 23:31:21 -07009
Linus Torvalds1da177e2005-04-16 15:20:36 -070010#include <asm/percpu.h>
11
/*
 * Space set aside for per-cpu variables defined by modules: enough to
 * cover all DEFINE_PER_CPUs in modules, and nothing at all when modules
 * are not configured.
 */
#ifndef CONFIG_MODULES
#define PERCPU_MODULE_RESERVE	0
#else
#define PERCPU_MODULE_RESERVE	(8 << 10)
#endif
18
/*
 * Default room for the per-cpu area: the span between __per_cpu_start
 * and __per_cpu_end aligned to SMP_CACHE_BYTES, plus the module
 * reserve.  A definition made before this point takes precedence.
 */
#ifndef PERCPU_ENOUGH_ROOM
#define PERCPU_ENOUGH_ROOM						\
	(PERCPU_MODULE_RESERVE +					\
	 ALIGN(__per_cpu_end - __per_cpu_start, SMP_CACHE_BYTES))
#endif
Jeremy Fitzhardingeb00742d32007-05-02 19:27:11 +020024
/*
 * get_cpu_var() disables preemption and then evaluates to the lvalue
 * produced by __get_cpu_var(@var).  put_cpu_var() is the matching
 * release: it simply re-enables preemption.
 *
 * @var must be a simple identifier.  It is pasted into the name of a
 * dummy extern declaration, so anything else is a syntax error.
 */
#define get_cpu_var(var)						\
(*({									\
	extern int simple_identifier_##var(void);			\
	preempt_disable();						\
	&__get_cpu_var(var);						\
}))
#define put_cpu_var(var)	preempt_enable()
34
35#ifdef CONFIG_SMP
36
Tejun Heoe74e3962009-03-30 19:07:44 +090037#ifndef CONFIG_HAVE_LEGACY_PER_CPU_AREA
Tejun Heofbf59bc2009-02-20 16:29:08 +090038
/*
 * Minimum unit size: 64KB passed through PFN_ALIGN().  This is also
 * the maximum supported allocation size.
 */
#define PCPU_MIN_UNIT_SIZE		PFN_ALIGN(64 << 10)
Tejun Heo8d408b42009-02-24 11:57:21 +090041
/*
 * PERCPU_DYNAMIC_RESERVE is the amount of free area to piggyback on
 * the first chunk for dynamic percpu allocation when the arch is
 * manually allocating and mapping that chunk for faster access (as
 * part of a large page mapping, for example).
 *
 * The values below leave between one and two pages of free space after
 * a typical minimal boot (2-way SMP, single disk and NIC) with both
 * defconfig and a distro config on 64-bit and 32-bit x86.  A more
 * intelligent way to determine this would be nice.
 */
#if BITS_PER_LONG <= 32
#define PERCPU_DYNAMIC_RESERVE		(12 << 10)
#else
#define PERCPU_DYNAMIC_RESERVE		(20 << 10)
#endif
Tejun Heo8d408b42009-02-24 11:57:21 +090058
/* Per-cpu allocator globals; both are defined outside this header. */
extern void *pcpu_base_addr;		/* NOTE(review): presumably the first chunk's base address - confirm */
extern const int *pcpu_unit_map;	/* NOTE(review): presumably a cpu -> unit index table - confirm */
Tejun Heofbf59bc2009-02-20 16:29:08 +090061
/*
 * Description of one group of units, as stored in the groups[] array
 * of struct pcpu_alloc_info.
 */
struct pcpu_group_info {
	/* aligned number of units */
	int			nr_units;
	/* base address offset */
	unsigned long		base_offset;
	/* unit->cpu map; empty entries contain NR_CPUS */
	unsigned int		*cpu_map;
};
68
69struct pcpu_alloc_info {
70 size_t static_size;
71 size_t reserved_size;
72 size_t dyn_size;
73 size_t unit_size;
74 size_t atom_size;
75 size_t alloc_size;
76 size_t __ai_size; /* internal, don't use */
77 int nr_groups; /* 0 if grouping unnecessary */
78 struct pcpu_group_info groups[];
79};
80
/*
 * Selector for the "fc" variants; judging by the pcpu_*_first_chunk()
 * helpers declared in this header these are the first chunk allocators.
 * PCPU_FC_NR is not a choice itself: it counts the entries before it
 * and sizes pcpu_fc_names[].
 */
enum pcpu_fc {
	PCPU_FC_AUTO,
	PCPU_FC_EMBED,
	PCPU_FC_PAGE,
	PCPU_FC_LPAGE,

	PCPU_FC_NR,	/* number of entries above; must stay last */
};

/* one string per enum pcpu_fc value */
extern const char *pcpu_fc_names[PCPU_FC_NR];

/* NOTE(review): presumably the variant actually selected - confirm */
extern enum pcpu_fc pcpu_chosen_fc;
92
/*
 * Callback types taken by the first chunk helpers declared in this
 * header.
 *
 * Note that pcpu_fc_cpu_distance_fn_t names a function type, not a
 * pointer-to-function type like the others.  Used as a parameter type
 * it is adjusted to a pointer; anywhere else it must be written as
 * "pcpu_fc_cpu_distance_fn_t *".
 */
typedef void *(*pcpu_fc_alloc_fn_t)(unsigned int cpu, size_t size,
				    size_t align);
typedef void (*pcpu_fc_free_fn_t)(void *ptr, size_t size);
typedef void (*pcpu_fc_populate_pte_fn_t)(unsigned long addr);
typedef int (pcpu_fc_cpu_distance_fn_t)(unsigned int from, unsigned int to);
typedef void (*pcpu_fc_map_fn_t)(void *ptr, size_t size, void *addr);
Tejun Heofbf59bc2009-02-20 16:29:08 +090099
Tejun Heofd1e8a12009-08-14 15:00:51 +0900100extern struct pcpu_alloc_info * __init pcpu_alloc_alloc_info(int nr_groups,
101 int nr_units);
102extern void __init pcpu_free_alloc_info(struct pcpu_alloc_info *ai);
Tejun Heo033e48f2009-08-14 15:00:51 +0900103
Tejun Heofd1e8a12009-08-14 15:00:51 +0900104extern struct pcpu_alloc_info * __init pcpu_build_alloc_info(
105 size_t reserved_size, ssize_t dyn_size,
106 size_t atom_size,
107 pcpu_fc_cpu_distance_fn_t cpu_distance_fn);
108
109extern size_t __init pcpu_setup_first_chunk(const struct pcpu_alloc_info *ai,
110 void *base_addr);
Tejun Heo8d408b42009-02-24 11:57:21 +0900111
/* Declared only when the arch selects the embedding first chunk helper. */
#ifdef CONFIG_NEED_PER_CPU_EMBED_FIRST_CHUNK
extern ssize_t __init pcpu_embed_first_chunk(size_t reserved_size,
					     ssize_t dyn_size);
#endif

/* Declared only when the arch selects the page-based first chunk helper. */
#ifdef CONFIG_NEED_PER_CPU_PAGE_FIRST_CHUNK
extern ssize_t __init pcpu_page_first_chunk(
				size_t reserved_size,
				pcpu_fc_alloc_fn_t alloc_fn,
				pcpu_fc_free_fn_t free_fn,
				pcpu_fc_populate_pte_fn_t populate_pte_fn);
#endif
Tejun Heod4b95f82009-07-04 08:10:59 +0900124
#ifndef CONFIG_NEED_PER_CPU_LPAGE_FIRST_CHUNK
/*
 * Without CONFIG_NEED_PER_CPU_LPAGE_FIRST_CHUNK this stub stands in
 * for the out-of-line version: it always returns NULL.
 */
static inline void *pcpu_lpage_remapped(void *kaddr)
{
	return NULL;
}
#else
/* Large page first chunk helper and its remap lookup. */
extern ssize_t __init pcpu_lpage_first_chunk(
				const struct pcpu_alloc_info *ai,
				pcpu_fc_alloc_fn_t alloc_fn,
				pcpu_fc_free_fn_t free_fn,
				pcpu_fc_map_fn_t map_fn);

extern void *pcpu_lpage_remapped(void *kaddr);
#endif
139
/*
 * per_cpu_ptr(ptr, cpu) - reach @cpu's version of a dynamically
 * allocated per-cpu object by shifting @ptr by per_cpu_offset(@cpu).
 *
 * Non-atomic access to the current CPU's version should probably be
 * combined with get_cpu()/put_cpu().
 */
#define per_cpu_ptr(ptr, cpu)						\
	SHIFT_PERCPU_PTR((ptr), per_cpu_offset((cpu)))
146
/*
 * NOTE(review): by its name this allocates from the reserved part of
 * the per-cpu area; the implementation is outside this header - confirm.
 */
extern void *__alloc_reserved_percpu(size_t size, size_t align);
148
Tejun Heoe74e3962009-03-30 19:07:44 +0900149#else /* CONFIG_HAVE_LEGACY_PER_CPU_AREA */
Tejun Heofbf59bc2009-02-20 16:29:08 +0900150
/*
 * Legacy dynamic per-cpu bookkeeping: a table of per-CPU object
 * pointers.  ptrs[] is declared with a single element but per_cpu_ptr()
 * below indexes it by cpu number, so the object has to be allocated
 * large enough for every cpu that will be looked up
 * (NOTE(review): the allocation is done outside this header - confirm).
 */
struct percpu_data {
	void *ptrs[1];
};

/*
 * Convert between a struct percpu_data pointer and the handle users
 * hold.  Normally the handle is the bitwise complement of the pointer;
 * complementing twice gives the original back, so the one macro works
 * in both directions.  With CONFIG_DEBUG_KMEMLEAK the pointer is passed
 * through unchanged because pointer disguising messes up the kmemleak
 * objects tracking.
 *
 * The expansion is wrapped in parentheses so that a postfix operator
 * applied to the result (e.g. __percpu_disguise(p)->ptrs[i]) acts on
 * the converted pointer rather than on the macro argument.
 */
#ifndef CONFIG_DEBUG_KMEMLEAK
#define __percpu_disguise(pdata)					\
	((struct percpu_data *)~(unsigned long)(pdata))
#else
#define __percpu_disguise(pdata)					\
	((struct percpu_data *)(pdata))
#endif

/*
 * per_cpu_ptr(ptr, cpu) - undo the disguise on @ptr and fetch @cpu's
 * slot from the pointer table, cast back to the type of @ptr.
 */
#define per_cpu_ptr(ptr, cpu)						\
({									\
	struct percpu_data *__p = __percpu_disguise(ptr);		\
	(__typeof__(ptr))__p->ptrs[(cpu)];				\
})
Linus Torvalds1da177e2005-04-16 15:20:36 -0700167
Tejun Heoe74e3962009-03-30 19:07:44 +0900168#endif /* CONFIG_HAVE_LEGACY_PER_CPU_AREA */
Tejun Heofbf59bc2009-02-20 16:29:08 +0900169
Tejun Heof2a82052009-02-20 16:29:08 +0900170extern void *__alloc_percpu(size_t size, size_t align);
171extern void free_percpu(void *__pdata);
172
Tejun Heoe74e3962009-03-30 19:07:44 +0900173#ifndef CONFIG_HAVE_SETUP_PER_CPU_AREA
174extern void __init setup_per_cpu_areas(void);
175#endif
176
Tejun Heof2a82052009-02-20 16:29:08 +0900177#else /* CONFIG_SMP */
178
/*
 * UP version: @cpu is evaluated once and discarded, and the result is
 * @ptr itself.
 */
#define per_cpu_ptr(ptr, cpu)						\
({									\
	(void)(cpu);							\
	(ptr);								\
})
180
181static inline void *__alloc_percpu(size_t size, size_t align)
182{
183 /*
184 * Can't easily make larger alignment work with kmalloc. WARN
185 * on it. Larger alignment should only be used for module
186 * percpu sections on SMP for which this path isn't used.
187 */
Tejun Heoe3176032009-02-26 10:54:17 +0900188 WARN_ON_ONCE(align > SMP_CACHE_BYTES);
Ingo Molnard2b02612009-02-25 14:36:45 +0100189 return kzalloc(size, GFP_KERNEL);
Tejun Heof2a82052009-02-20 16:29:08 +0900190}
191
/* UP version of free_percpu(): hands @p straight to kfree(). */
static inline void free_percpu(void *p)
{
	kfree(p);
}
196
Tejun Heoe74e3962009-03-30 19:07:44 +0900197static inline void __init setup_per_cpu_areas(void) { }
198
/* UP stub: ignores @kaddr and always returns NULL. */
static inline void *pcpu_lpage_remapped(void *kaddr)
{
	return NULL;
}
203
Tejun Heof2a82052009-02-20 16:29:08 +0900204#endif /* CONFIG_SMP */
205
/*
 * alloc_percpu(type) - allocate a dynamic per-cpu object of @type
 *
 * Calls __alloc_percpu() with the size and alignment of @type and casts
 * the result to "type *".
 *
 * The whole expansion is parenthesized so that the result can be used
 * directly with a postfix operator ([] or ->) without the operator
 * binding to the untyped __alloc_percpu() return value instead.
 */
#define alloc_percpu(type)						\
	((type *)__alloc_percpu(sizeof(type), __alignof__(type)))
208
/*
 * Optional methods for optimized non-lvalue per-cpu variable access.
 *
 * @var can be a percpu variable or a field of it, and its size should
 * equal that of char, int or long.  percpu_read() evaluates to the
 * value read (not an lvalue); all the other operations produce no
 * value.
 *
 * These operations are guaranteed to be atomic w.r.t. preemption.
 * The generic versions use plain get/put_cpu_var().  Archs are
 * encouraged to implement single-instruction alternatives which don't
 * require preemption protection.
 */
#ifndef percpu_read
# define percpu_read(var)						\
  ({									\
	__typeof__(per_cpu_var(var)) __tmp_var__;			\
									\
	__tmp_var__ = get_cpu_var(var);					\
	put_cpu_var(var);						\
	__tmp_var__;							\
  })
#endif
230
/*
 * Generic fallback for the percpu_*() modifiers: apply assignment
 * operator @op with operand @val to @var between get_cpu_var() and
 * put_cpu_var().  Expands to a statement, not an expression.
 */
#define __percpu_generic_to_op(var, val, op)				\
	do {								\
		get_cpu_var(var) op val;				\
		put_cpu_var(var);					\
	} while (0)
236
/*
 * Generic percpu modifiers.  Each one is defined only if no definition
 * was provided earlier, and maps onto __percpu_generic_to_op() with
 * the matching assignment operator.
 */
#ifndef percpu_write
# define percpu_write(var, val)	__percpu_generic_to_op(var, (val), =)
#endif

#ifndef percpu_add
# define percpu_add(var, val)	__percpu_generic_to_op(var, (val), +=)
#endif

#ifndef percpu_sub
# define percpu_sub(var, val)	__percpu_generic_to_op(var, (val), -=)
#endif

#ifndef percpu_and
# define percpu_and(var, val)	__percpu_generic_to_op(var, (val), &=)
#endif

#ifndef percpu_or
# define percpu_or(var, val)	__percpu_generic_to_op(var, (val), |=)
#endif

#ifndef percpu_xor
# define percpu_xor(var, val)	__percpu_generic_to_op(var, (val), ^=)
#endif
260
Linus Torvalds1da177e2005-04-16 15:20:36 -0700261#endif /* __LINUX_PERCPU_H */