#ifndef _LINUX_SLUB_DEF_H
#define _LINUX_SLUB_DEF_H

/*
 * SLUB : A Slab allocator without object queues.
 *
 * (C) 2007 SGI, Christoph Lameter
 */
#include <linux/types.h>
#include <linux/gfp.h>
#include <linux/bug.h>
#include <linux/workqueue.h>
#include <linux/kobject.h>

#include <linux/kmemleak.h>

enum stat_item {
	ALLOC_FASTPATH,		/* Allocation from cpu slab */
	ALLOC_SLOWPATH,		/* Allocation by getting a new cpu slab */
	FREE_FASTPATH,		/* Free to cpu slab */
	FREE_SLOWPATH,		/* Freeing not to cpu slab */
	FREE_FROZEN,		/* Freeing to frozen slab */
	FREE_ADD_PARTIAL,	/* Freeing moves slab to partial list */
	FREE_REMOVE_PARTIAL,	/* Freeing removes last object */
	ALLOC_FROM_PARTIAL,	/* Cpu slab acquired from node partial list */
	ALLOC_SLAB,		/* Cpu slab acquired from page allocator */
	ALLOC_REFILL,		/* Refill cpu slab from slab freelist */
	ALLOC_NODE_MISMATCH,	/* Switching cpu slab */
	FREE_SLAB,		/* Slab freed to the page allocator */
	CPUSLAB_FLUSH,		/* Abandoning of the cpu slab */
	DEACTIVATE_FULL,	/* Cpu slab was full when deactivated */
	DEACTIVATE_EMPTY,	/* Cpu slab was empty when deactivated */
	DEACTIVATE_TO_HEAD,	/* Cpu slab was moved to the head of partials */
	DEACTIVATE_TO_TAIL,	/* Cpu slab was moved to the tail of partials */
	DEACTIVATE_REMOTE_FREES,/* Slab contained remotely freed objects */
	DEACTIVATE_BYPASS,	/* Implicit deactivation */
	ORDER_FALLBACK,		/* Number of times fallback was necessary */
	CMPXCHG_DOUBLE_CPU_FAIL,/* Failure of this_cpu_cmpxchg_double */
	CMPXCHG_DOUBLE_FAIL,	/* Number of times that cmpxchg double did not match */
	CPU_PARTIAL_ALLOC,	/* Used cpu partial on alloc */
	CPU_PARTIAL_FREE,	/* Refill cpu partial on free */
	CPU_PARTIAL_NODE,	/* Refill cpu partial from node partial */
	CPU_PARTIAL_DRAIN,	/* Drain cpu partial to node partial */
	NR_SLUB_STAT_ITEMS };

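/*
 * Illustrative note (not part of the original header): with
 * CONFIG_SLUB_STATS enabled, slub.c bumps one of these counters on each
 * event and exposes each item as a read-only, lower-cased sysfs file,
 * e.g.:
 *
 *	# cat /sys/kernel/slab/kmalloc-64/alloc_fastpath
 *
 * which prints the total followed by the non-zero per-cpu counts.
 */
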
struct kmem_cache_cpu {
	void **freelist;	/* Pointer to next available object */
	unsigned long tid;	/* Globally unique transaction id */
	struct page *page;	/* The slab from which we are allocating */
	struct page *partial;	/* Partially allocated frozen slabs */
#ifdef CONFIG_SLUB_STATS
	unsigned stat[NR_SLUB_STAT_ITEMS];
#endif
};

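/*
 * Illustrative sketch (simplified from slub.c, not a verbatim copy):
 * the allocation fastpath pops freelist without locking by pairing it
 * with tid in a this_cpu_cmpxchg_double(), so a preempting alloc/free
 * on the same cpu changes tid and forces a retry:
 *
 *	object = c->freelist;
 *	tid = c->tid;
 *	if (!this_cpu_cmpxchg_double(s->cpu_slab->freelist,
 *			s->cpu_slab->tid,
 *			object, tid,
 *			get_freepointer(s, object), next_tid(tid)))
 *		goto redo;
 */
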
struct kmem_cache_node {
	spinlock_t list_lock;	/* Protect partial list and nr_partial */
	unsigned long nr_partial;
	struct list_head partial;
#ifdef CONFIG_SLUB_DEBUG
	atomic_long_t nr_slabs;
	atomic_long_t total_objects;
	struct list_head full;
#endif
};

/*
 * Word size structure that can be atomically updated or read and that
 * contains both the order and the number of objects that a slab of the
 * given order would contain.
 */
struct kmem_cache_order_objects {
	unsigned long x;
};

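/*
 * Illustrative example: slub.c packs both values into this single word
 * (OO_SHIFT is 16 there), so readers see order and object count
 * tear-free without taking a lock:
 *
 *	x = (order << OO_SHIFT) + objects;	(oo_make)
 *	order = x >> OO_SHIFT;			(oo_order)
 *	objects = x & OO_MASK;			(oo_objects)
 */
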
/*
 * Slab cache management.
 */
struct kmem_cache {
	struct kmem_cache_cpu __percpu *cpu_slab;
	/* Used for retrieving partial slabs etc */
	unsigned long flags;
	unsigned long min_partial;
	int size;		/* The size of an object including metadata */
	int object_size;	/* The size of an object without metadata */
	int offset;		/* Free pointer offset. */
	int cpu_partial;	/* Number of per cpu partial objects to keep around */
	struct kmem_cache_order_objects oo;

	/* Allocation and freeing of slabs */
	struct kmem_cache_order_objects max;
	struct kmem_cache_order_objects min;
	gfp_t allocflags;	/* gfp flags to use on each alloc */
	int refcount;		/* Refcount for slab cache destroy */
	void (*ctor)(void *);
	int inuse;		/* Offset to metadata */
	int align;		/* Alignment */
	int reserved;		/* Reserved bytes at the end of slabs */
	const char *name;	/* Name (only for display!) */
	struct list_head list;	/* List of slab caches */
#ifdef CONFIG_SYSFS
	struct kobject kobj;	/* For sysfs */
#endif
#ifdef CONFIG_MEMCG_KMEM
	struct memcg_cache_params *memcg_params;
	int max_attr_size;	/* for propagation, maximum size of a stored attr */
#endif

#ifdef CONFIG_NUMA
	/*
	 * Defragmentation by allocating from a remote node.
	 */
	int remote_node_defrag_ratio;
#endif
	struct kmem_cache_node *node[MAX_NUMNODES];
};

/*
 * Kmalloc subsystem.
 */
#if defined(ARCH_DMA_MINALIGN) && ARCH_DMA_MINALIGN > 8
#define KMALLOC_MIN_SIZE ARCH_DMA_MINALIGN
#else
#define KMALLOC_MIN_SIZE 8
#endif

#define KMALLOC_SHIFT_LOW ilog2(KMALLOC_MIN_SIZE)

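/*
 * Worked example: on a configuration without a larger ARCH_DMA_MINALIGN,
 * KMALLOC_MIN_SIZE is 8 and KMALLOC_SHIFT_LOW is ilog2(8) = 3, so the
 * smallest general cache is kmalloc-8 at index 3 (matching the
 * "size <= 8 => 3" rung of kmalloc_index() below).
 */
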
/*
 * Maximum kmalloc object size handled by SLUB. Larger object allocations
 * are passed through to the page allocator. The page allocator "fastpath"
 * is relatively slow, so this value needs to be high enough that
 * performance-critical objects are still allocated through the SLUB
 * fastpath.
 *
 * This should be dropped to PAGE_SIZE / 2 once the page allocator
 * "fastpath" becomes competitive with the slab allocator fastpaths.
 */
#define SLUB_MAX_SIZE (2 * PAGE_SIZE)

#define SLUB_PAGE_SHIFT (PAGE_SHIFT + 2)

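/*
 * Worked example with 4K pages (PAGE_SHIFT == 12): SLUB_MAX_SIZE is
 * 8192 and SLUB_PAGE_SHIFT is 14, so kmalloc_caches[] below has slots
 * for indices 0..13, and index 13 covers exactly the 8K maximum.
 */
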
#ifdef CONFIG_ZONE_DMA
#define SLUB_DMA __GFP_DMA
#else
/* Disable DMA functionality */
#define SLUB_DMA (__force gfp_t)0
#endif

/*
 * We keep the general caches in an array of slab caches that are used for
 * 2^x bytes of allocations.
 */
extern struct kmem_cache *kmalloc_caches[SLUB_PAGE_SHIFT];

/*
 * Sorry that the following has to be that ugly but some versions of GCC
 * have trouble with constant propagation and loops.
 */
static __always_inline int kmalloc_index(size_t size)
{
	if (!size)
		return 0;

	if (size <= KMALLOC_MIN_SIZE)
		return KMALLOC_SHIFT_LOW;

	if (KMALLOC_MIN_SIZE <= 32 && size > 64 && size <= 96)
		return 1;
	if (KMALLOC_MIN_SIZE <= 64 && size > 128 && size <= 192)
		return 2;
	if (size <=          8) return 3;
	if (size <=         16) return 4;
	if (size <=         32) return 5;
	if (size <=         64) return 6;
	if (size <=        128) return 7;
	if (size <=        256) return 8;
	if (size <=        512) return 9;
	if (size <=       1024) return 10;
	if (size <=   2 * 1024) return 11;
	if (size <=   4 * 1024) return 12;
/*
 * The following is only needed to support architectures with a larger page
 * size than 4k. We need to support 2 * PAGE_SIZE here. So for a 64k page
 * size we would have to go up to 128k.
 */
	if (size <=   8 * 1024) return 13;
	if (size <=  16 * 1024) return 14;
	if (size <=  32 * 1024) return 15;
	if (size <=  64 * 1024) return 16;
	if (size <= 128 * 1024) return 17;
	if (size <= 256 * 1024) return 18;
	if (size <= 512 * 1024) return 19;
	if (size <= 1024 * 1024) return 20;
	if (size <=  2 * 1024 * 1024) return 21;
	BUG();
	return -1; /* Will never be reached */

/*
 * What we really wanted to do and cannot do because of compiler issues is:
 *	int i;
 *	for (i = KMALLOC_SHIFT_LOW; i <= KMALLOC_SHIFT_HIGH; i++)
 *		if (size <= (1 << i))
 *			return i;
 */
}

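/*
 * Worked examples: kmalloc_index(100) returns 7 (64 < 100 <= 128, the
 * kmalloc-128 cache); kmalloc_index(96) returns 1 when
 * KMALLOC_MIN_SIZE <= 32, selecting the odd-sized kmalloc-96 cache
 * that cuts waste for a common allocation size.
 */
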
/*
 * Find the slab cache for a given combination of allocation flags and size.
 *
 * This ought to end up with a global pointer to the right cache
 * in kmalloc_caches.
 */
static __always_inline struct kmem_cache *kmalloc_slab(size_t size)
{
	int index = kmalloc_index(size);

	if (index == 0)
		return NULL;

	return kmalloc_caches[index];
}

void *kmem_cache_alloc(struct kmem_cache *, gfp_t);
void *__kmalloc(size_t size, gfp_t flags);

static __always_inline void *
kmalloc_order(size_t size, gfp_t flags, unsigned int order)
{
	void *ret;

	flags |= (__GFP_COMP | __GFP_KMEMCG);
	ret = (void *) __get_free_pages(flags, order);
	kmemleak_alloc(ret, size, 1, flags);
	return ret;
}

/**
 * verify_mem_not_deleted - check that allocated memory is still in use
 * @x: pointer to the allocated memory
 *
 * Calling this on allocated memory will check that the memory
 * is expected to be in use, and print warnings if not.
 */
#ifdef CONFIG_SLUB_DEBUG
extern bool verify_mem_not_deleted(const void *x);
#else
static inline bool verify_mem_not_deleted(const void *x)
{
	return true;
}
#endif

#ifdef CONFIG_TRACING
extern void *
kmem_cache_alloc_trace(struct kmem_cache *s, gfp_t gfpflags, size_t size);
extern void *kmalloc_order_trace(size_t size, gfp_t flags, unsigned int order);
#else
static __always_inline void *
kmem_cache_alloc_trace(struct kmem_cache *s, gfp_t gfpflags, size_t size)
{
	return kmem_cache_alloc(s, gfpflags);
}

static __always_inline void *
kmalloc_order_trace(size_t size, gfp_t flags, unsigned int order)
{
	return kmalloc_order(size, flags, order);
}
#endif

static __always_inline void *kmalloc_large(size_t size, gfp_t flags)
{
	unsigned int order = get_order(size);
	return kmalloc_order_trace(size, flags, order);
}

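/*
 * Worked example (4K pages, illustrative): kmalloc(10000, GFP_KERNEL)
 * exceeds SLUB_MAX_SIZE (8192), so kmalloc() below routes it here;
 * get_order(10000) is 2, and __get_free_pages() hands back a 16K
 * compound allocation straight from the page allocator.
 */
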
static __always_inline void *kmalloc(size_t size, gfp_t flags)
{
	if (__builtin_constant_p(size)) {
		if (size > SLUB_MAX_SIZE)
			return kmalloc_large(size, flags);

		if (!(flags & SLUB_DMA)) {
			struct kmem_cache *s = kmalloc_slab(size);

			if (!s)
				return ZERO_SIZE_PTR;

			return kmem_cache_alloc_trace(s, flags, size);
		}
	}
	return __kmalloc(size, flags);
}

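/*
 * Usage sketch (illustrative): with a compile-time-constant size the
 * whole cache lookup constant-folds away; a variable size takes the
 * out-of-line __kmalloc() path:
 *
 *	struct foo *f = kmalloc(sizeof(*f), GFP_KERNEL);  (direct cache hit)
 *	char *buf = kmalloc(len, GFP_KERNEL);             (__kmalloc path)
 *	kfree(buf);
 *	kfree(f);
 *
 * "struct foo" and "len" are stand-ins, not names from this header.
 */
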
#ifdef CONFIG_NUMA
void *__kmalloc_node(size_t size, gfp_t flags, int node);
void *kmem_cache_alloc_node(struct kmem_cache *, gfp_t flags, int node);

#ifdef CONFIG_TRACING
extern void *kmem_cache_alloc_node_trace(struct kmem_cache *s,
					   gfp_t gfpflags,
					   int node, size_t size);
#else
static __always_inline void *
kmem_cache_alloc_node_trace(struct kmem_cache *s,
			      gfp_t gfpflags,
			      int node, size_t size)
{
	return kmem_cache_alloc_node(s, gfpflags, node);
}
#endif

static __always_inline void *kmalloc_node(size_t size, gfp_t flags, int node)
{
	if (__builtin_constant_p(size) &&
		size <= SLUB_MAX_SIZE && !(flags & SLUB_DMA)) {
		struct kmem_cache *s = kmalloc_slab(size);

		if (!s)
			return ZERO_SIZE_PTR;

		return kmem_cache_alloc_node_trace(s, flags, node, size);
	}
	return __kmalloc_node(size, flags, node);
}
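
/*
 * Usage sketch (illustrative): allocate near a device's NUMA node;
 * "dev" is a stand-in for any object carrying a node id:
 *
 *	buf = kmalloc_node(size, GFP_KERNEL, dev_to_node(dev));
 *
 * A constant size resolves to kmem_cache_alloc_node_trace() on the
 * matching cache; anything else falls back to __kmalloc_node().
 */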
#endif

#endif /* _LINUX_SLUB_DEF_H */