blob: b68d5df147317295514e61ccae2b9f65f5311895 [file] [log] [blame]
/*
 * mm/percpu-km.c - kernel memory based chunk allocation
 *
 * Copyright (C) 2010		SUSE Linux Products GmbH
 * Copyright (C) 2010		Tejun Heo <tj@kernel.org>
 *
 * This file is released under the GPLv2.
 *
 * Chunks are allocated as contiguous kernel memory using gfp
 * allocation.  This is to be used on nommu architectures.
 *
 * To use percpu-km,
 *
 * - define CONFIG_NEED_PER_CPU_KM from the arch Kconfig.
 *
 * - CONFIG_NEED_PER_CPU_PAGE_FIRST_CHUNK must not be defined.  It's
 *   not compatible with PER_CPU_KM.  EMBED_FIRST_CHUNK should work
 *   fine.
 *
 * - NUMA is not supported.  When setting up the first chunk,
 *   @cpu_distance_fn should be NULL or report all CPUs to be nearer
 *   than or at LOCAL_DISTANCE.
 *
 * - It's best if the chunk size is a power-of-two multiple of
 *   PAGE_SIZE.  Because each chunk is allocated as a contiguous
 *   kernel memory block using alloc_pages(), memory will be wasted if
 *   the chunk size is not aligned.  percpu-km code will warn about it.
 */
29
/*
 * Build-time guard: refuse to compile when both CONFIG_SMP and
 * CONFIG_NEED_PER_CPU_PAGE_FIRST_CHUNK are defined, since this
 * contiguous allocator cannot be combined with a paged first chunk.
 */
#ifdef CONFIG_SMP
#ifdef CONFIG_NEED_PER_CPU_PAGE_FIRST_CHUNK
#error "contiguous percpu allocation is incompatible with paged first chunk"
#endif
#endif
33
34#include <linux/log2.h>
35
Tejun Heoa93ace42014-09-02 14:46:02 -040036static int pcpu_populate_chunk(struct pcpu_chunk *chunk,
Dennis Zhou47504ee2018-02-16 12:07:19 -060037 int page_start, int page_end, gfp_t gfp)
Tejun Heob0c97782010-04-09 18:57:01 +090038{
Tejun Heob0c97782010-04-09 18:57:01 +090039 return 0;
40}
41
/*
 * pcpu_depopulate_chunk - depopulate hook for the kernel-memory backend
 * @chunk: chunk of interest (unused)
 * @page_start: first page index of the range (unused)
 * @page_end: end page index of the range (unused)
 *
 * Intentionally empty.  The pages backing a chunk are only released by
 * pcpu_destroy_chunk() in this file, which frees the whole block at once.
 */
static void pcpu_depopulate_chunk(struct pcpu_chunk *chunk,
				  int page_start, int page_end)
{
	/* nothing to depopulate */
}
47
Dennis Zhou47504ee2018-02-16 12:07:19 -060048static struct pcpu_chunk *pcpu_create_chunk(gfp_t gfp)
Tejun Heob0c97782010-04-09 18:57:01 +090049{
50 const int nr_pages = pcpu_group_sizes[0] >> PAGE_SHIFT;
51 struct pcpu_chunk *chunk;
52 struct page *pages;
Dennis Zhou6ab7d472018-12-18 08:42:27 -080053 unsigned long flags;
Tejun Heob0c97782010-04-09 18:57:01 +090054 int i;
55
Dennis Zhou47504ee2018-02-16 12:07:19 -060056 chunk = pcpu_alloc_chunk(gfp);
Tejun Heob0c97782010-04-09 18:57:01 +090057 if (!chunk)
58 return NULL;
59
Dennis Zhou554fef12018-02-16 12:09:58 -060060 pages = alloc_pages(gfp, order_base_2(nr_pages));
Tejun Heob0c97782010-04-09 18:57:01 +090061 if (!pages) {
62 pcpu_free_chunk(chunk);
63 return NULL;
64 }
65
66 for (i = 0; i < nr_pages; i++)
67 pcpu_set_page_chunk(nth_page(pages, i), chunk);
68
69 chunk->data = pages;
Peng Fan1b046b42019-02-24 13:13:50 +000070 chunk->base_addr = page_address(pages);
Tejun Heoa63d4ac2014-09-02 14:46:02 -040071
Dennis Zhou6ab7d472018-12-18 08:42:27 -080072 spin_lock_irqsave(&pcpu_lock, flags);
Dennis Zhou (Facebook)40064ae2017-07-12 11:27:32 -070073 pcpu_chunk_populated(chunk, 0, nr_pages, false);
Dennis Zhou6ab7d472018-12-18 08:42:27 -080074 spin_unlock_irqrestore(&pcpu_lock, flags);
Tejun Heoa63d4ac2014-09-02 14:46:02 -040075
Dennis Zhou30a5b532017-06-19 19:28:31 -040076 pcpu_stats_chunk_alloc();
Dennis Zhoudf95e792017-06-19 19:28:32 -040077 trace_percpu_create_chunk(chunk->base_addr);
Dennis Zhou30a5b532017-06-19 19:28:31 -040078
Tejun Heob0c97782010-04-09 18:57:01 +090079 return chunk;
80}
81
82static void pcpu_destroy_chunk(struct pcpu_chunk *chunk)
83{
84 const int nr_pages = pcpu_group_sizes[0] >> PAGE_SHIFT;
85
Dennis Zhoue3efe3d2017-06-29 10:56:26 -040086 if (!chunk)
87 return;
88
Dennis Zhou30a5b532017-06-19 19:28:31 -040089 pcpu_stats_chunk_dealloc();
Dennis Zhoudf95e792017-06-19 19:28:32 -040090 trace_percpu_destroy_chunk(chunk->base_addr);
Dennis Zhou30a5b532017-06-19 19:28:31 -040091
Dennis Zhoue3efe3d2017-06-29 10:56:26 -040092 if (chunk->data)
Tejun Heob0c97782010-04-09 18:57:01 +090093 __free_pages(chunk->data, order_base_2(nr_pages));
94 pcpu_free_chunk(chunk);
95}
96
/*
 * pcpu_addr_to_page - translate an address to its struct page
 * @addr: address to translate
 *
 * Return: the result of virt_to_page() on @addr.
 */
static struct page *pcpu_addr_to_page(void *addr)
{
	struct page *page = virt_to_page(addr);

	return page;
}
101
102static int __init pcpu_verify_alloc_info(const struct pcpu_alloc_info *ai)
103{
104 size_t nr_pages, alloc_pages;
105
106 /* all units must be in a single group */
107 if (ai->nr_groups != 1) {
Joe Perches870d4b12016-03-17 14:19:53 -0700108 pr_crit("can't handle more than one group\n");
Tejun Heob0c97782010-04-09 18:57:01 +0900109 return -EINVAL;
110 }
111
112 nr_pages = (ai->groups[0].nr_units * ai->unit_size) >> PAGE_SHIFT;
113 alloc_pages = roundup_pow_of_two(nr_pages);
114
115 if (alloc_pages > nr_pages)
Joe Perches870d4b12016-03-17 14:19:53 -0700116 pr_warn("wasting %zu pages per chunk\n",
Joe Perches11705322016-03-17 14:19:50 -0700117 alloc_pages - nr_pages);
Tejun Heob0c97782010-04-09 18:57:01 +0900118
119 return 0;
120}