blob: 66338a60aa6ef961c6017731b6fd6d9d169736e1 [file] [log] [blame]
/*
 * ACPI 3.0 based NUMA setup
 * Copyright 2004 Andi Kleen, SuSE Labs.
 *
 * Reads the ACPI SRAT table to figure out what memory belongs to which CPUs.
 *
 * Called from acpi_numa_init while reading the SRAT and SLIT tables.
 * Assumes all memory regions belonging to a single proximity domain
 * are in one chunk. Holes between them will be included in the node.
 */
11
12#include <linux/kernel.h>
13#include <linux/acpi.h>
14#include <linux/mmzone.h>
15#include <linux/bitmap.h>
16#include <linux/module.h>
17#include <linux/topology.h>
Andi Kleen68a3a7f2006-04-07 19:49:18 +020018#include <linux/bootmem.h>
Yinghai Lua9ce6bc2010-08-25 13:39:17 -070019#include <linux/memblock.h>
Andi Kleen68a3a7f2006-04-07 19:49:18 +020020#include <linux/mm.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070021#include <asm/proto.h>
22#include <asm/numa.h>
Andi Kleen8a6fdd32006-01-11 22:44:39 +010023#include <asm/e820.h>
Ingo Molnar7b6aa332009-02-17 13:58:15 +010024#include <asm/apic.h>
Ingo Molnar4ec71fa2009-01-21 10:24:27 +010025#include <asm/uv/uv.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070026
Andi Kleenc31fbb12006-09-26 10:52:33 +020027int acpi_numa __initdata;
28
Linus Torvalds1da177e2005-04-16 15:20:36 -070029static __init int setup_node(int pxm)
30{
Yasunori Goto762834e2006-06-23 02:03:19 -070031 return acpi_map_pxm_to_node(pxm);
Linus Torvalds1da177e2005-04-16 15:20:36 -070032}
33
Linus Torvalds1da177e2005-04-16 15:20:36 -070034static __init void bad_srat(void)
35{
36 printk(KERN_ERR "SRAT: SRAT not used.\n");
37 acpi_numa = -1;
38}
39
40static __init inline int srat_disabled(void)
41{
Tejun Heoffe77a42011-02-16 12:13:06 +010042 return acpi_numa < 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -070043}
44
Toshi Kania85eba82014-01-21 14:33:15 -080045/*
46 * Callback for SLIT parsing. pxm_to_node() returns NUMA_NO_NODE for
47 * I/O localities since SRAT does not list them. I/O localities are
48 * not supported at this point.
49 */
Linus Torvalds1da177e2005-04-16 15:20:36 -070050void __init acpi_numa_slit_init(struct acpi_table_slit *slit)
51{
Tejun Heoac7136b62011-02-16 17:11:09 +010052 int i, j;
Yinghai Luf302a5bb2008-07-10 20:36:37 -070053
Toshi Kania85eba82014-01-21 14:33:15 -080054 for (i = 0; i < slit->locality_count; i++) {
Yinghai Luba6a328f2014-01-26 13:01:42 -080055 const int from_node = pxm_to_node(i);
56
57 if (from_node == NUMA_NO_NODE)
Toshi Kania85eba82014-01-21 14:33:15 -080058 continue;
Yinghai Luba6a328f2014-01-26 13:01:42 -080059
Toshi Kania85eba82014-01-21 14:33:15 -080060 for (j = 0; j < slit->locality_count; j++) {
Yinghai Luba6a328f2014-01-26 13:01:42 -080061 const int to_node = pxm_to_node(j);
62
63 if (to_node == NUMA_NO_NODE)
Toshi Kania85eba82014-01-21 14:33:15 -080064 continue;
Yinghai Luba6a328f2014-01-26 13:01:42 -080065
66 numa_set_distance(from_node, to_node,
Tejun Heoac7136b62011-02-16 17:11:09 +010067 slit->entry[slit->locality_count * i + j]);
Toshi Kania85eba82014-01-21 14:33:15 -080068 }
69 }
Linus Torvalds1da177e2005-04-16 15:20:36 -070070}
71
Suresh Siddha7237d3d2009-03-30 13:55:30 -080072/* Callback for Proximity Domain -> x2APIC mapping */
73void __init
74acpi_numa_x2apic_affinity_init(struct acpi_srat_x2apic_cpu_affinity *pa)
75{
76 int pxm, node;
77 int apic_id;
78
79 if (srat_disabled())
80 return;
81 if (pa->header.length < sizeof(struct acpi_srat_x2apic_cpu_affinity)) {
82 bad_srat();
83 return;
84 }
85 if ((pa->flags & ACPI_SRAT_CPU_ENABLED) == 0)
86 return;
87 pxm = pa->proximity_domain;
Yinghai Lua35fd282011-12-21 17:45:16 -080088 apic_id = pa->apic_id;
Steffen Persvoldb7157ac2012-03-16 20:25:35 +010089 if (!apic->apic_id_valid(apic_id)) {
Yinghai Lua35fd282011-12-21 17:45:16 -080090 printk(KERN_INFO "SRAT: PXM %u -> X2APIC 0x%04x ignored\n",
91 pxm, apic_id);
92 return;
93 }
Suresh Siddha7237d3d2009-03-30 13:55:30 -080094 node = setup_node(pxm);
95 if (node < 0) {
96 printk(KERN_ERR "SRAT: Too many proximity domains %x\n", pxm);
97 bad_srat();
98 return;
99 }
100
Yinghai Lud3bd0582010-12-16 19:09:58 -0800101 if (apic_id >= MAX_LOCAL_APIC) {
102 printk(KERN_INFO "SRAT: PXM %u -> APIC 0x%04x -> Node %u skipped apicid that is too big\n", pxm, apic_id, node);
103 return;
104 }
Tejun Heobbc9e2f2011-01-23 14:37:39 +0100105 set_apicid_to_node(apic_id, node);
Tejun Heo92d4a432011-02-16 17:11:09 +0100106 node_set(node, numa_nodes_parsed);
Suresh Siddha7237d3d2009-03-30 13:55:30 -0800107 acpi_numa = 1;
Yinghai Lu163d3862009-11-21 00:23:37 -0800108 printk(KERN_INFO "SRAT: PXM %u -> APIC 0x%04x -> Node %u\n",
Suresh Siddha7237d3d2009-03-30 13:55:30 -0800109 pxm, apic_id, node);
110}
111
Linus Torvalds1da177e2005-04-16 15:20:36 -0700112/* Callback for Proximity Domain -> LAPIC mapping */
113void __init
Alexey Starikovskiy15a58ed2007-02-02 19:48:22 +0300114acpi_numa_processor_affinity_init(struct acpi_srat_cpu_affinity *pa)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700115{
116 int pxm, node;
travis@sgi.comef970012008-01-30 13:33:10 +0100117 int apic_id;
118
Andi Kleend22fe802006-02-03 21:51:26 +0100119 if (srat_disabled())
120 return;
Alexey Starikovskiy15a58ed2007-02-02 19:48:22 +0300121 if (pa->header.length != sizeof(struct acpi_srat_cpu_affinity)) {
Andi Kleenfad79062006-05-15 18:19:44 +0200122 bad_srat();
Andi Kleend22fe802006-02-03 21:51:26 +0100123 return;
124 }
Alexey Starikovskiy15a58ed2007-02-02 19:48:22 +0300125 if ((pa->flags & ACPI_SRAT_CPU_ENABLED) == 0)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700126 return;
Alexey Starikovskiy15a58ed2007-02-02 19:48:22 +0300127 pxm = pa->proximity_domain_lo;
Kurt Garloffcd298f62012-01-17 04:20:31 -0500128 if (acpi_srat_revision >= 2)
129 pxm |= *((unsigned int*)pa->proximity_domain_hi) << 8;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700130 node = setup_node(pxm);
131 if (node < 0) {
132 printk(KERN_ERR "SRAT: Too many proximity domains %x\n", pxm);
133 bad_srat();
134 return;
135 }
Yinghai Lubeafe912008-02-16 23:00:22 -0800136
Jack Steiner2e420602008-09-23 15:37:13 -0500137 if (get_uv_system_type() >= UV_X2APIC)
Jack Steinera65d1d62008-03-28 14:12:08 -0500138 apic_id = (pa->apic_id << 8) | pa->local_sapic_eid;
139 else
140 apic_id = pa->apic_id;
Yinghai Lud3bd0582010-12-16 19:09:58 -0800141
142 if (apic_id >= MAX_LOCAL_APIC) {
143 printk(KERN_INFO "SRAT: PXM %u -> APIC 0x%02x -> Node %u skipped apicid that is too big\n", pxm, apic_id, node);
144 return;
145 }
146
Tejun Heobbc9e2f2011-01-23 14:37:39 +0100147 set_apicid_to_node(apic_id, node);
Tejun Heo92d4a432011-02-16 17:11:09 +0100148 node_set(node, numa_nodes_parsed);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700149 acpi_numa = 1;
Yinghai Lu163d3862009-11-21 00:23:37 -0800150 printk(KERN_INFO "SRAT: PXM %u -> APIC 0x%02x -> Node %u\n",
travis@sgi.comef970012008-01-30 13:33:10 +0100151 pxm, apic_id, node);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700152}
153
/*
 * Whether hot-pluggable SRAT memory ranges are recorded: 1 when built with
 * CONFIG_MEMORY_HOTPLUG, 0 otherwise.  acpi_numa_memory_affinity_init()
 * skips hot-pluggable ranges when this returns 0.
 */
#ifdef CONFIG_MEMORY_HOTPLUG
static inline int save_add_info(void) {return 1;}
#else
static inline int save_add_info(void) {return 0;}
#endif
Andi Kleen68a3a7f2006-04-07 19:49:18 +0200159
Linus Torvalds1da177e2005-04-16 15:20:36 -0700160/* Callback for parsing of the Proximity Domain <-> Memory Area mappings */
Thomas Renninger095adbb2012-07-31 17:41:09 +0200161int __init
Alexey Starikovskiy15a58ed2007-02-02 19:48:22 +0300162acpi_numa_memory_affinity_init(struct acpi_srat_mem_affinity *ma)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700163{
Tejun Heoeca9ad32011-05-02 14:18:52 +0200164 u64 start, end;
Tang Chend7b2c3d2013-08-14 17:37:06 +0800165 u32 hotpluggable;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700166 int node, pxm;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700167
Andi Kleend22fe802006-02-03 21:51:26 +0100168 if (srat_disabled())
Davidlohr Bueso479a99a2013-01-08 16:18:41 -0800169 goto out_err;
170 if (ma->header.length != sizeof(struct acpi_srat_mem_affinity))
171 goto out_err_bad_srat;
Alexey Starikovskiy15a58ed2007-02-02 19:48:22 +0300172 if ((ma->flags & ACPI_SRAT_MEM_ENABLED) == 0)
Davidlohr Bueso479a99a2013-01-08 16:18:41 -0800173 goto out_err;
Tang Chend7b2c3d2013-08-14 17:37:06 +0800174 hotpluggable = ma->flags & ACPI_SRAT_MEM_HOT_PLUGGABLE;
175 if (hotpluggable && !save_add_info())
Davidlohr Bueso479a99a2013-01-08 16:18:41 -0800176 goto out_err;
177
Alexey Starikovskiy15a58ed2007-02-02 19:48:22 +0300178 start = ma->base_address;
179 end = start + ma->length;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700180 pxm = ma->proximity_domain;
Kurt Garloffcd298f62012-01-17 04:20:31 -0500181 if (acpi_srat_revision <= 1)
182 pxm &= 0xff;
Davidlohr Bueso479a99a2013-01-08 16:18:41 -0800183
Linus Torvalds1da177e2005-04-16 15:20:36 -0700184 node = setup_node(pxm);
185 if (node < 0) {
186 printk(KERN_ERR "SRAT: Too many proximity domains.\n");
Davidlohr Bueso479a99a2013-01-08 16:18:41 -0800187 goto out_err_bad_srat;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700188 }
Tejun Heoef396ec2011-02-16 17:11:07 +0100189
Davidlohr Bueso479a99a2013-01-08 16:18:41 -0800190 if (numa_add_memblk(node, start, end) < 0)
191 goto out_err_bad_srat;
Andi Kleen68a3a7f2006-04-07 19:49:18 +0200192
Yasuaki Ishimatsu4af463d2012-06-04 11:42:32 +0900193 node_set(node, numa_nodes_parsed);
194
Tang Chend7b2c3d2013-08-14 17:37:06 +0800195 pr_info("SRAT: Node %u PXM %u [mem %#010Lx-%#010Lx]%s\n",
196 node, pxm,
197 (unsigned long long) start, (unsigned long long) end - 1,
198 hotpluggable ? " hotplug" : "");
Davidlohr Bueso479a99a2013-01-08 16:18:41 -0800199
Tang Chen05d1d8c2014-01-21 15:49:29 -0800200 /* Mark hotplug range in memblock. */
201 if (hotpluggable && memblock_mark_hotplug(start, ma->length))
202 pr_warn("SRAT: Failed to mark hotplug range [mem %#010Lx-%#010Lx] in memblock\n",
203 (unsigned long long)start, (unsigned long long)end - 1);
204
Thomas Renninger095adbb2012-07-31 17:41:09 +0200205 return 0;
Davidlohr Bueso479a99a2013-01-08 16:18:41 -0800206out_err_bad_srat:
207 bad_srat();
208out_err:
209 return -1;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700210}
211
212void __init acpi_numa_arch_fixup(void) {}
213
Tejun Heoa9aec562011-02-16 12:13:06 +0100214int __init x86_acpi_numa_init(void)
215{
216 int ret;
217
218 ret = acpi_numa_init();
219 if (ret < 0)
220 return ret;
221 return srat_disabled() ? -EINVAL : 0;
222}