Matt Mackall | 10cef60 | 2006-01-08 01:01:45 -0800 | [diff] [blame] | 1 | /* |
| 2 | * SLOB Allocator: Simple List Of Blocks |
| 3 | * |
| 4 | * Matt Mackall <mpm@selenic.com> 12/30/03 |
| 5 | * |
| 6 | * How SLOB works: |
| 7 | * |
| 8 | * The core of SLOB is a traditional K&R style heap allocator, with |
| 9 | * support for returning aligned objects. The granularity of this |
| 10 | * allocator is 8 bytes on x86, though it's perhaps possible to reduce |
| 11 | * this to 4 if it's deemed worth the effort. The slob heap is a |
| 12 | * singly-linked list of pages from __get_free_page, grown on demand |
| 13 | * and allocation from the heap is currently first-fit. |
| 14 | * |
| 15 | * Above this is an implementation of kmalloc/kfree. Blocks returned |
| 16 | * from kmalloc are 8-byte aligned and prepended with an 8-byte header. |
| 17 | * If kmalloc is asked for objects of PAGE_SIZE or larger, it calls |
| 18 | * __get_free_pages directly so that it can return page-aligned blocks |
| 19 | * and keeps a linked list of such pages and their orders. These |
| 20 | * objects are detected in kfree() by their page alignment. |
| 21 | * |
| 22 | * SLAB is emulated on top of SLOB by simply calling constructors and |
| 23 | * destructors for every SLAB allocation. Objects are returned with |
| 24 | * the 8-byte alignment unless the SLAB_MUST_HWCACHE_ALIGN flag is |
| 25 | * set, in which case the low-level allocator will fragment blocks to |
| 26 | * create the proper alignment. Again, objects of page-size or greater |
| 27 | * are allocated by calling __get_free_pages. As SLAB objects know |
| 28 | * their size, no separate size bookkeeping is necessary and there is |
| 29 | * essentially no allocation space overhead. |
| 30 | */ |
| 31 | |
| 32 | #include <linux/config.h> |
| 33 | #include <linux/slab.h> |
| 34 | #include <linux/mm.h> |
| 35 | #include <linux/cache.h> |
| 36 | #include <linux/init.h> |
| 37 | #include <linux/module.h> |
| 38 | #include <linux/timer.h> |
| 39 | |
/*
 * Node of the free list, and at the same time the unit of allocation:
 * every request is rounded up to a whole number of these.
 */
typedef struct slob_block {
	int units;			/* length of this block, in SLOB_UNITs */
	struct slob_block *next;	/* following block on the circular free list */
} slob_t;

/* Bytes in one allocation unit. */
#define SLOB_UNIT sizeof(slob_t)
/* Units needed to hold 'size' bytes, rounded up. */
#define SLOB_UNITS(size) (((size) + SLOB_UNIT - 1)/SLOB_UNIT)
/* Alignment used for caches created with SLAB_MUST_HWCACHE_ALIGN. */
#define SLOB_ALIGN L1_CACHE_BYTES
| 49 | |
/*
 * Record describing one allocation made directly from the page
 * allocator: the pages, their order, and a link to the next record.
 */
typedef struct bigblock {
	int order;		/* order passed to __get_free_pages() */
	void *pages;		/* address handed back to the kmalloc() caller */
	struct bigblock *next;	/* next record on the bigblocks list */
} bigblock_t;
| 56 | |
| 57 | static slob_t arena = { .next = &arena, .units = 1 }; |
| 58 | static slob_t *slobfree = &arena; |
| 59 | static bigblock_t *bigblocks; |
| 60 | static DEFINE_SPINLOCK(slob_lock); |
| 61 | static DEFINE_SPINLOCK(block_lock); |
| 62 | |
| 63 | static void slob_free(void *b, int size); |
| 64 | |
| 65 | static void *slob_alloc(size_t size, gfp_t gfp, int align) |
| 66 | { |
| 67 | slob_t *prev, *cur, *aligned = 0; |
| 68 | int delta = 0, units = SLOB_UNITS(size); |
| 69 | unsigned long flags; |
| 70 | |
| 71 | spin_lock_irqsave(&slob_lock, flags); |
| 72 | prev = slobfree; |
| 73 | for (cur = prev->next; ; prev = cur, cur = cur->next) { |
| 74 | if (align) { |
| 75 | aligned = (slob_t *)ALIGN((unsigned long)cur, align); |
| 76 | delta = aligned - cur; |
| 77 | } |
| 78 | if (cur->units >= units + delta) { /* room enough? */ |
| 79 | if (delta) { /* need to fragment head to align? */ |
| 80 | aligned->units = cur->units - delta; |
| 81 | aligned->next = cur->next; |
| 82 | cur->next = aligned; |
| 83 | cur->units = delta; |
| 84 | prev = cur; |
| 85 | cur = aligned; |
| 86 | } |
| 87 | |
| 88 | if (cur->units == units) /* exact fit? */ |
| 89 | prev->next = cur->next; /* unlink */ |
| 90 | else { /* fragment */ |
| 91 | prev->next = cur + units; |
| 92 | prev->next->units = cur->units - units; |
| 93 | prev->next->next = cur->next; |
| 94 | cur->units = units; |
| 95 | } |
| 96 | |
| 97 | slobfree = prev; |
| 98 | spin_unlock_irqrestore(&slob_lock, flags); |
| 99 | return cur; |
| 100 | } |
| 101 | if (cur == slobfree) { |
| 102 | spin_unlock_irqrestore(&slob_lock, flags); |
| 103 | |
| 104 | if (size == PAGE_SIZE) /* trying to shrink arena? */ |
| 105 | return 0; |
| 106 | |
| 107 | cur = (slob_t *)__get_free_page(gfp); |
| 108 | if (!cur) |
| 109 | return 0; |
| 110 | |
| 111 | slob_free(cur, PAGE_SIZE); |
| 112 | spin_lock_irqsave(&slob_lock, flags); |
| 113 | cur = slobfree; |
| 114 | } |
| 115 | } |
| 116 | } |
| 117 | |
| 118 | static void slob_free(void *block, int size) |
| 119 | { |
| 120 | slob_t *cur, *b = (slob_t *)block; |
| 121 | unsigned long flags; |
| 122 | |
| 123 | if (!block) |
| 124 | return; |
| 125 | |
| 126 | if (size) |
| 127 | b->units = SLOB_UNITS(size); |
| 128 | |
| 129 | /* Find reinsertion point */ |
| 130 | spin_lock_irqsave(&slob_lock, flags); |
| 131 | for (cur = slobfree; !(b > cur && b < cur->next); cur = cur->next) |
| 132 | if (cur >= cur->next && (b > cur || b < cur->next)) |
| 133 | break; |
| 134 | |
| 135 | if (b + b->units == cur->next) { |
| 136 | b->units += cur->next->units; |
| 137 | b->next = cur->next->next; |
| 138 | } else |
| 139 | b->next = cur->next; |
| 140 | |
| 141 | if (cur + cur->units == b) { |
| 142 | cur->units += b->units; |
| 143 | cur->next = b->next; |
| 144 | } else |
| 145 | cur->next = b; |
| 146 | |
| 147 | slobfree = cur; |
| 148 | |
| 149 | spin_unlock_irqrestore(&slob_lock, flags); |
| 150 | } |
| 151 | |
/*
 * Return the smallest page order whose span (PAGE_SIZE << order) can
 * hold 'size' bytes.  Any size of PAGE_SIZE or less, including zero and
 * negative values, gives order 0.
 */
static int FASTCALL(find_order(int size));
static int fastcall find_order(int size)
{
	unsigned long span = PAGE_SIZE;
	int order = 0;

	if (size <= 0)
		return 0;

	/*
	 * Double the span instead of halving size: halving throws away the
	 * low bits, so a size such as two pages plus one byte would come
	 * out one order too small.
	 */
	while (span < (unsigned long)size) {
		span <<= 1;
		order++;
	}
	return order;
}
| 160 | |
| 161 | void *kmalloc(size_t size, gfp_t gfp) |
| 162 | { |
| 163 | slob_t *m; |
| 164 | bigblock_t *bb; |
| 165 | unsigned long flags; |
| 166 | |
| 167 | if (size < PAGE_SIZE - SLOB_UNIT) { |
| 168 | m = slob_alloc(size + SLOB_UNIT, gfp, 0); |
| 169 | return m ? (void *)(m + 1) : 0; |
| 170 | } |
| 171 | |
| 172 | bb = slob_alloc(sizeof(bigblock_t), gfp, 0); |
| 173 | if (!bb) |
| 174 | return 0; |
| 175 | |
| 176 | bb->order = find_order(size); |
| 177 | bb->pages = (void *)__get_free_pages(gfp, bb->order); |
| 178 | |
| 179 | if (bb->pages) { |
| 180 | spin_lock_irqsave(&block_lock, flags); |
| 181 | bb->next = bigblocks; |
| 182 | bigblocks = bb; |
| 183 | spin_unlock_irqrestore(&block_lock, flags); |
| 184 | return bb->pages; |
| 185 | } |
| 186 | |
| 187 | slob_free(bb, sizeof(bigblock_t)); |
| 188 | return 0; |
| 189 | } |
| 190 | |
| 191 | EXPORT_SYMBOL(kmalloc); |
| 192 | |
| 193 | void kfree(const void *block) |
| 194 | { |
| 195 | bigblock_t *bb, **last = &bigblocks; |
| 196 | unsigned long flags; |
| 197 | |
| 198 | if (!block) |
| 199 | return; |
| 200 | |
| 201 | if (!((unsigned long)block & (PAGE_SIZE-1))) { |
| 202 | /* might be on the big block list */ |
| 203 | spin_lock_irqsave(&block_lock, flags); |
| 204 | for (bb = bigblocks; bb; last = &bb->next, bb = bb->next) { |
| 205 | if (bb->pages == block) { |
| 206 | *last = bb->next; |
| 207 | spin_unlock_irqrestore(&block_lock, flags); |
| 208 | free_pages((unsigned long)block, bb->order); |
| 209 | slob_free(bb, sizeof(bigblock_t)); |
| 210 | return; |
| 211 | } |
| 212 | } |
| 213 | spin_unlock_irqrestore(&block_lock, flags); |
| 214 | } |
| 215 | |
| 216 | slob_free((slob_t *)block - 1, 0); |
| 217 | return; |
| 218 | } |
| 219 | |
| 220 | EXPORT_SYMBOL(kfree); |
| 221 | |
| 222 | unsigned int ksize(const void *block) |
| 223 | { |
| 224 | bigblock_t *bb; |
| 225 | unsigned long flags; |
| 226 | |
| 227 | if (!block) |
| 228 | return 0; |
| 229 | |
| 230 | if (!((unsigned long)block & (PAGE_SIZE-1))) { |
| 231 | spin_lock_irqsave(&block_lock, flags); |
| 232 | for (bb = bigblocks; bb; bb = bb->next) |
| 233 | if (bb->pages == block) { |
| 234 | spin_unlock_irqrestore(&slob_lock, flags); |
| 235 | return PAGE_SIZE << bb->order; |
| 236 | } |
| 237 | spin_unlock_irqrestore(&block_lock, flags); |
| 238 | } |
| 239 | |
| 240 | return ((slob_t *)block - 1)->units * SLOB_UNIT; |
| 241 | } |
| 242 | |
/* Cache descriptor: just the parameters recorded by kmem_cache_create(). */
struct kmem_cache {
	unsigned int size;	/* object size in bytes */
	unsigned int align;	/* alignment passed to slob_alloc(); 0 for none */
	const char *name;	/* caller's name string; the pointer is stored, not a copy */
	/* optional hooks run on every allocation (ctor) and free (dtor) */
	void (*ctor)(void *, struct kmem_cache *, unsigned long);
	void (*dtor)(void *, struct kmem_cache *, unsigned long);
};
| 249 | |
| 250 | struct kmem_cache *kmem_cache_create(const char *name, size_t size, |
| 251 | size_t align, unsigned long flags, |
| 252 | void (*ctor)(void*, struct kmem_cache *, unsigned long), |
| 253 | void (*dtor)(void*, struct kmem_cache *, unsigned long)) |
| 254 | { |
| 255 | struct kmem_cache *c; |
| 256 | |
| 257 | c = slob_alloc(sizeof(struct kmem_cache), flags, 0); |
| 258 | |
| 259 | if (c) { |
| 260 | c->name = name; |
| 261 | c->size = size; |
| 262 | c->ctor = ctor; |
| 263 | c->dtor = dtor; |
| 264 | /* ignore alignment unless it's forced */ |
| 265 | c->align = (flags & SLAB_MUST_HWCACHE_ALIGN) ? SLOB_ALIGN : 0; |
| 266 | if (c->align < align) |
| 267 | c->align = align; |
| 268 | } |
| 269 | |
| 270 | return c; |
| 271 | } |
| 272 | EXPORT_SYMBOL(kmem_cache_create); |
| 273 | |
| 274 | int kmem_cache_destroy(struct kmem_cache *c) |
| 275 | { |
| 276 | slob_free(c, sizeof(struct kmem_cache)); |
| 277 | return 0; |
| 278 | } |
| 279 | EXPORT_SYMBOL(kmem_cache_destroy); |
| 280 | |
| 281 | void *kmem_cache_alloc(struct kmem_cache *c, gfp_t flags) |
| 282 | { |
| 283 | void *b; |
| 284 | |
| 285 | if (c->size < PAGE_SIZE) |
| 286 | b = slob_alloc(c->size, flags, c->align); |
| 287 | else |
| 288 | b = (void *)__get_free_pages(flags, find_order(c->size)); |
| 289 | |
| 290 | if (c->ctor) |
| 291 | c->ctor(b, c, SLAB_CTOR_CONSTRUCTOR); |
| 292 | |
| 293 | return b; |
| 294 | } |
| 295 | EXPORT_SYMBOL(kmem_cache_alloc); |
| 296 | |
Pekka Enberg | a8c0f9a | 2006-03-25 03:06:42 -0800 | [diff] [blame] | 297 | void *kmem_cache_zalloc(struct kmem_cache *c, gfp_t flags) |
| 298 | { |
| 299 | void *ret = kmem_cache_alloc(c, flags); |
| 300 | if (ret) |
| 301 | memset(ret, 0, c->size); |
| 302 | |
| 303 | return ret; |
| 304 | } |
| 305 | EXPORT_SYMBOL(kmem_cache_zalloc); |
| 306 | |
Matt Mackall | 10cef60 | 2006-01-08 01:01:45 -0800 | [diff] [blame] | 307 | void kmem_cache_free(struct kmem_cache *c, void *b) |
| 308 | { |
| 309 | if (c->dtor) |
| 310 | c->dtor(b, c, 0); |
| 311 | |
| 312 | if (c->size < PAGE_SIZE) |
| 313 | slob_free(b, c->size); |
| 314 | else |
| 315 | free_pages((unsigned long)b, find_order(c->size)); |
| 316 | } |
| 317 | EXPORT_SYMBOL(kmem_cache_free); |
| 318 | |
| 319 | unsigned int kmem_cache_size(struct kmem_cache *c) |
| 320 | { |
| 321 | return c->size; |
| 322 | } |
| 323 | EXPORT_SYMBOL(kmem_cache_size); |
| 324 | |
| 325 | const char *kmem_cache_name(struct kmem_cache *c) |
| 326 | { |
| 327 | return c->name; |
| 328 | } |
| 329 | EXPORT_SYMBOL(kmem_cache_name); |
| 330 | |
| 331 | static struct timer_list slob_timer = TIMER_INITIALIZER( |
| 332 | (void (*)(unsigned long))kmem_cache_init, 0, 0); |
| 333 | |
| 334 | void kmem_cache_init(void) |
| 335 | { |
| 336 | void *p = slob_alloc(PAGE_SIZE, 0, PAGE_SIZE-1); |
| 337 | |
| 338 | if (p) |
| 339 | free_page((unsigned long)p); |
| 340 | |
| 341 | mod_timer(&slob_timer, jiffies + HZ); |
| 342 | } |
| 343 | |
| 344 | atomic_t slab_reclaim_pages = ATOMIC_INIT(0); |
| 345 | EXPORT_SYMBOL(slab_reclaim_pages); |
| 346 | |
| 347 | #ifdef CONFIG_SMP |
| 348 | |
Ingo Molnar | 9934a79 | 2006-02-08 10:11:56 +0100 | [diff] [blame] | 349 | void *__alloc_percpu(size_t size) |
Matt Mackall | 10cef60 | 2006-01-08 01:01:45 -0800 | [diff] [blame] | 350 | { |
| 351 | int i; |
| 352 | struct percpu_data *pdata = kmalloc(sizeof (*pdata), GFP_KERNEL); |
| 353 | |
| 354 | if (!pdata) |
| 355 | return NULL; |
| 356 | |
John Hawkes | 75129e2 | 2006-04-18 22:20:33 -0700 | [diff] [blame] | 357 | for_each_possible_cpu(i) { |
Matt Mackall | 10cef60 | 2006-01-08 01:01:45 -0800 | [diff] [blame] | 358 | pdata->ptrs[i] = kmalloc(size, GFP_KERNEL); |
| 359 | if (!pdata->ptrs[i]) |
| 360 | goto unwind_oom; |
| 361 | memset(pdata->ptrs[i], 0, size); |
| 362 | } |
| 363 | |
| 364 | /* Catch derefs w/o wrappers */ |
| 365 | return (void *) (~(unsigned long) pdata); |
| 366 | |
| 367 | unwind_oom: |
| 368 | while (--i >= 0) { |
| 369 | if (!cpu_possible(i)) |
| 370 | continue; |
| 371 | kfree(pdata->ptrs[i]); |
| 372 | } |
| 373 | kfree(pdata); |
| 374 | return NULL; |
| 375 | } |
| 376 | EXPORT_SYMBOL(__alloc_percpu); |
| 377 | |
| 378 | void |
| 379 | free_percpu(const void *objp) |
| 380 | { |
| 381 | int i; |
| 382 | struct percpu_data *p = (struct percpu_data *) (~(unsigned long) objp); |
| 383 | |
John Hawkes | 75129e2 | 2006-04-18 22:20:33 -0700 | [diff] [blame] | 384 | for_each_possible_cpu(i) |
Matt Mackall | 10cef60 | 2006-01-08 01:01:45 -0800 | [diff] [blame] | 385 | kfree(p->ptrs[i]); |
John Hawkes | 75129e2 | 2006-04-18 22:20:33 -0700 | [diff] [blame] | 386 | |
Matt Mackall | 10cef60 | 2006-01-08 01:01:45 -0800 | [diff] [blame] | 387 | kfree(p); |
| 388 | } |
| 389 | EXPORT_SYMBOL(free_percpu); |
| 390 | |
| 391 | #endif |