blob: 026e4931d16259fe624eef5b5bb269436ad3e81e [file] [log] [blame]
Linus Torvalds1da177e2005-04-16 15:20:36 -07001#include <linux/init.h>
2#include <linux/pci.h>
Robert Richterd199a042008-07-02 22:50:26 +02003#include <linux/topology.h>
Robert Richter91ede002008-08-22 20:23:38 +02004#include <linux/cpu.h>
Yinghai Lu27811d82010-02-10 01:20:07 -08005#include <linux/range.h>
6
Jan Beulich24d9b702011-01-10 16:20:23 +00007#include <asm/amd_nb.h>
Jaswinder Singh Rajput82487712008-12-27 18:32:28 +05308#include <asm/pci_x86.h>
Robert Richter3a27dd12008-06-12 20:19:23 +02009
Yinghai Lu871d5f82008-02-19 03:20:09 -080010#include <asm/pci-direct.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070011
Yinghai Lu99935a72009-10-04 21:54:24 -070012#include "bus_numa.h"
13
Linus Torvalds1da177e2005-04-16 15:20:36 -070014/*
15 * This discovers the pcibus <-> node mapping on AMD K8.
Yinghai Lu30a18d62008-02-19 03:21:20 -080016 * also get peer root bus resource for io,mmio
Linus Torvalds1da177e2005-04-16 15:20:36 -070017 */
18
Yinghai Lu30a18d62008-02-19 03:21:20 -080019struct pci_hostbridge_probe {
20 u32 bus;
21 u32 slot;
22 u32 vendor;
23 u32 device;
24};
25
26static struct pci_hostbridge_probe pci_probes[] __initdata = {
27 { 0, 0x18, PCI_VENDOR_ID_AMD, 0x1100 },
28 { 0, 0x18, PCI_VENDOR_ID_AMD, 0x1200 },
29 { 0xff, 0, PCI_VENDOR_ID_AMD, 0x1200 },
30 { 0, 0x18, PCI_VENDOR_ID_AMD, 0x1300 },
31};
32
Yinghai Lu6e184f22008-03-06 01:15:31 -080033static u64 __initdata fam10h_mmconf_start;
34static u64 __initdata fam10h_mmconf_end;
35static void __init get_pci_mmcfg_amd_fam10h_range(void)
36{
37 u32 address;
38 u64 base, msr;
39 unsigned segn_busn_bits;
40
41 /* assume all cpus from fam10h have mmconf */
42 if (boot_cpu_data.x86 < 0x10)
43 return;
44
45 address = MSR_FAM10H_MMIO_CONF_BASE;
46 rdmsrl(address, msr);
47
48 /* mmconfig is not enable */
49 if (!(msr & FAM10H_MMIO_CONF_ENABLE))
50 return;
51
52 base = msr & (FAM10H_MMIO_CONF_BASE_MASK<<FAM10H_MMIO_CONF_BASE_SHIFT);
53
54 segn_busn_bits = (msr >> FAM10H_MMIO_CONF_BUSRANGE_SHIFT) &
55 FAM10H_MMIO_CONF_BUSRANGE_MASK;
56
57 fam10h_mmconf_start = base;
58 fam10h_mmconf_end = base + (1ULL<<(segn_busn_bits + 20)) - 1;
59}
60
Yinghai Lu27811d82010-02-10 01:20:07 -080061#define RANGE_NUM 16
62
Linus Torvalds1da177e2005-04-16 15:20:36 -070063/**
Yinghai Lu871d5f82008-02-19 03:20:09 -080064 * early_fill_mp_bus_to_node()
65 * called before pcibios_scan_root and pci_scan_bus
Linus Torvalds1da177e2005-04-16 15:20:36 -070066 * fills the mp_bus_to_cpumask array based according to the LDT Bus Number
67 * Registers found in the K8 northbridge
68 */
Yinghai Lu30a18d62008-02-19 03:21:20 -080069static int __init early_fill_mp_bus_info(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -070070{
Yinghai Lu30a18d62008-02-19 03:21:20 -080071 int i;
72 int j;
73 unsigned bus;
Yinghai Lu871d5f82008-02-19 03:20:09 -080074 unsigned slot;
Yinghai Lu35ddd062008-02-19 03:15:08 -080075 int node;
Yinghai Lu30a18d62008-02-19 03:21:20 -080076 int link;
77 int def_node;
78 int def_link;
79 struct pci_root_info *info;
80 u32 reg;
81 struct resource *res;
Yinghai Lu97445c32010-02-10 01:20:10 -080082 u64 start;
83 u64 end;
Yinghai Lu27811d82010-02-10 01:20:07 -080084 struct range range[RANGE_NUM];
Yinghai Lu30a18d62008-02-19 03:21:20 -080085 u64 val;
86 u32 address;
Yinghai Lu3e3da002010-02-10 01:20:09 -080087 bool found;
Yinghai Lu35ddd062008-02-19 03:15:08 -080088
Yinghai Lu871d5f82008-02-19 03:20:09 -080089 if (!early_pci_allowed())
90 return -1;
91
Yinghai Lu3e3da002010-02-10 01:20:09 -080092 found = false;
Yinghai Lu30a18d62008-02-19 03:21:20 -080093 for (i = 0; i < ARRAY_SIZE(pci_probes); i++) {
94 u32 id;
95 u16 device;
96 u16 vendor;
Linus Torvalds1da177e2005-04-16 15:20:36 -070097
Yinghai Lu30a18d62008-02-19 03:21:20 -080098 bus = pci_probes[i].bus;
99 slot = pci_probes[i].slot;
100 id = read_pci_config(bus, slot, 0, PCI_VENDOR_ID);
Yinghai Lu35ddd062008-02-19 03:15:08 -0800101
Yinghai Lu30a18d62008-02-19 03:21:20 -0800102 vendor = id & 0xffff;
103 device = (id>>16) & 0xffff;
104 if (pci_probes[i].vendor == vendor &&
105 pci_probes[i].device == device) {
Yinghai Lu3e3da002010-02-10 01:20:09 -0800106 found = true;
Yinghai Lu30a18d62008-02-19 03:21:20 -0800107 break;
108 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700109 }
110
Yinghai Lu3e3da002010-02-10 01:20:09 -0800111 if (!found)
Yinghai Lu30a18d62008-02-19 03:21:20 -0800112 return 0;
113
114 pci_root_num = 0;
115 for (i = 0; i < 4; i++) {
116 int min_bus;
117 int max_bus;
118 reg = read_pci_config(bus, slot, 1, 0xe0 + (i << 2));
119
120 /* Check if that register is enabled for bus range */
121 if ((reg & 7) != 3)
122 continue;
123
124 min_bus = (reg >> 16) & 0xff;
125 max_bus = (reg >> 24) & 0xff;
126 node = (reg >> 4) & 0x07;
127#ifdef CONFIG_NUMA
128 for (j = min_bus; j <= max_bus; j++)
Jesse Barnes25470892009-07-10 14:04:30 -0700129 set_mp_bus_to_node(j, node);
Yinghai Lu30a18d62008-02-19 03:21:20 -0800130#endif
131 link = (reg >> 8) & 0x03;
132
133 info = &pci_root_info[pci_root_num];
134 info->bus_min = min_bus;
135 info->bus_max = max_bus;
136 info->node = node;
137 info->link = link;
138 sprintf(info->name, "PCI Bus #%02x", min_bus);
139 pci_root_num++;
140 }
141
142 /* get the default node and link for left over res */
143 reg = read_pci_config(bus, slot, 0, 0x60);
144 def_node = (reg >> 8) & 0x07;
145 reg = read_pci_config(bus, slot, 0, 0x64);
146 def_link = (reg >> 8) & 0x03;
147
148 memset(range, 0, sizeof(range));
Yinghai Lue9a00642010-02-10 01:20:13 -0800149 add_range(range, RANGE_NUM, 0, 0, 0xffff + 1);
Yinghai Lu30a18d62008-02-19 03:21:20 -0800150 /* io port resource */
151 for (i = 0; i < 4; i++) {
152 reg = read_pci_config(bus, slot, 1, 0xc0 + (i << 3));
153 if (!(reg & 3))
154 continue;
155
156 start = reg & 0xfff000;
157 reg = read_pci_config(bus, slot, 1, 0xc4 + (i << 3));
158 node = reg & 0x07;
159 link = (reg >> 4) & 0x03;
160 end = (reg & 0xfff000) | 0xfff;
161
162 /* find the position */
163 for (j = 0; j < pci_root_num; j++) {
164 info = &pci_root_info[j];
165 if (info->node == node && info->link == link)
166 break;
167 }
168 if (j == pci_root_num)
169 continue; /* not found */
170
171 info = &pci_root_info[j];
Yinghai Lu6e184f22008-03-06 01:15:31 -0800172 printk(KERN_DEBUG "node %d link %d: io port [%llx, %llx]\n",
Yinghai Lu97445c32010-02-10 01:20:10 -0800173 node, link, start, end);
Yinghai Lue8ee6f02008-04-13 01:41:58 -0700174
175 /* kernel only handle 16 bit only */
176 if (end > 0xffff)
177 end = 0xffff;
178 update_res(info, start, end, IORESOURCE_IO, 1);
Yinghai Lue9a00642010-02-10 01:20:13 -0800179 subtract_range(range, RANGE_NUM, start, end + 1);
Yinghai Lu30a18d62008-02-19 03:21:20 -0800180 }
181 /* add left over io port range to def node/link, [0, 0xffff] */
182 /* find the position */
183 for (j = 0; j < pci_root_num; j++) {
184 info = &pci_root_info[j];
185 if (info->node == def_node && info->link == def_link)
186 break;
187 }
188 if (j < pci_root_num) {
189 info = &pci_root_info[j];
190 for (i = 0; i < RANGE_NUM; i++) {
191 if (!range[i].end)
192 continue;
193
Yinghai Lue9a00642010-02-10 01:20:13 -0800194 update_res(info, range[i].start, range[i].end - 1,
Yinghai Lu30a18d62008-02-19 03:21:20 -0800195 IORESOURCE_IO, 1);
196 }
197 }
198
199 memset(range, 0, sizeof(range));
200 /* 0xfd00000000-0xffffffffff for HT */
Yinghai Lue9a00642010-02-10 01:20:13 -0800201 end = cap_resource((0xfdULL<<32) - 1);
202 end++;
203 add_range(range, RANGE_NUM, 0, 0, end);
Yinghai Lu30a18d62008-02-19 03:21:20 -0800204
205 /* need to take out [0, TOM) for RAM*/
206 address = MSR_K8_TOP_MEM1;
207 rdmsrl(address, val);
Yinghai Lu8004dd92008-05-12 17:40:39 -0700208 end = (val & 0xffffff800000ULL);
Yinghai Lu97445c32010-02-10 01:20:10 -0800209 printk(KERN_INFO "TOM: %016llx aka %lldM\n", end, end>>20);
Yinghai Lu30a18d62008-02-19 03:21:20 -0800210 if (end < (1ULL<<32))
Yinghai Lue9a00642010-02-10 01:20:13 -0800211 subtract_range(range, RANGE_NUM, 0, end);
Yinghai Lu30a18d62008-02-19 03:21:20 -0800212
Yinghai Lu6e184f22008-03-06 01:15:31 -0800213 /* get mmconfig */
214 get_pci_mmcfg_amd_fam10h_range();
215 /* need to take out mmconf range */
216 if (fam10h_mmconf_end) {
217 printk(KERN_DEBUG "Fam 10h mmconf [%llx, %llx]\n", fam10h_mmconf_start, fam10h_mmconf_end);
Yinghai Lue9a00642010-02-10 01:20:13 -0800218 subtract_range(range, RANGE_NUM, fam10h_mmconf_start,
219 fam10h_mmconf_end + 1);
Yinghai Lu6e184f22008-03-06 01:15:31 -0800220 }
221
Yinghai Lu30a18d62008-02-19 03:21:20 -0800222 /* mmio resource */
223 for (i = 0; i < 8; i++) {
224 reg = read_pci_config(bus, slot, 1, 0x80 + (i << 3));
225 if (!(reg & 3))
226 continue;
227
228 start = reg & 0xffffff00; /* 39:16 on 31:8*/
229 start <<= 8;
230 reg = read_pci_config(bus, slot, 1, 0x84 + (i << 3));
231 node = reg & 0x07;
232 link = (reg >> 4) & 0x03;
233 end = (reg & 0xffffff00);
234 end <<= 8;
235 end |= 0xffff;
236
237 /* find the position */
238 for (j = 0; j < pci_root_num; j++) {
239 info = &pci_root_info[j];
240 if (info->node == node && info->link == link)
241 break;
242 }
243 if (j == pci_root_num)
244 continue; /* not found */
245
246 info = &pci_root_info[j];
Yinghai Lu6e184f22008-03-06 01:15:31 -0800247
248 printk(KERN_DEBUG "node %d link %d: mmio [%llx, %llx]",
Yinghai Lu97445c32010-02-10 01:20:10 -0800249 node, link, start, end);
Yinghai Lu6e184f22008-03-06 01:15:31 -0800250 /*
251 * some sick allocation would have range overlap with fam10h
252 * mmconf range, so need to update start and end.
253 */
254 if (fam10h_mmconf_end) {
255 int changed = 0;
256 u64 endx = 0;
257 if (start >= fam10h_mmconf_start &&
258 start <= fam10h_mmconf_end) {
259 start = fam10h_mmconf_end + 1;
260 changed = 1;
261 }
262
263 if (end >= fam10h_mmconf_start &&
264 end <= fam10h_mmconf_end) {
265 end = fam10h_mmconf_start - 1;
266 changed = 1;
267 }
268
269 if (start < fam10h_mmconf_start &&
270 end > fam10h_mmconf_end) {
271 /* we got a hole */
272 endx = fam10h_mmconf_start - 1;
273 update_res(info, start, endx, IORESOURCE_MEM, 0);
Yinghai Lue9a00642010-02-10 01:20:13 -0800274 subtract_range(range, RANGE_NUM, start,
275 endx + 1);
Yinghai Lu97445c32010-02-10 01:20:10 -0800276 printk(KERN_CONT " ==> [%llx, %llx]", start, endx);
Yinghai Lu6e184f22008-03-06 01:15:31 -0800277 start = fam10h_mmconf_end + 1;
278 changed = 1;
279 }
280 if (changed) {
281 if (start <= end) {
Yinghai Lu97445c32010-02-10 01:20:10 -0800282 printk(KERN_CONT " %s [%llx, %llx]", endx ? "and" : "==>", start, end);
Yinghai Lu6e184f22008-03-06 01:15:31 -0800283 } else {
284 printk(KERN_CONT "%s\n", endx?"":" ==> none");
285 continue;
286 }
287 }
288 }
289
Yinghai Lu9ad3f2c2010-02-10 01:20:11 -0800290 update_res(info, cap_resource(start), cap_resource(end),
291 IORESOURCE_MEM, 1);
Yinghai Lue9a00642010-02-10 01:20:13 -0800292 subtract_range(range, RANGE_NUM, start, end + 1);
Yinghai Lu6e184f22008-03-06 01:15:31 -0800293 printk(KERN_CONT "\n");
Yinghai Lu30a18d62008-02-19 03:21:20 -0800294 }
295
296 /* need to take out [4G, TOM2) for RAM*/
297 /* SYS_CFG */
298 address = MSR_K8_SYSCFG;
299 rdmsrl(address, val);
300 /* TOP_MEM2 is enabled? */
301 if (val & (1<<21)) {
302 /* TOP_MEM2 */
303 address = MSR_K8_TOP_MEM2;
304 rdmsrl(address, val);
Yinghai Lu8004dd92008-05-12 17:40:39 -0700305 end = (val & 0xffffff800000ULL);
Yinghai Lu97445c32010-02-10 01:20:10 -0800306 printk(KERN_INFO "TOM2: %016llx aka %lldM\n", end, end>>20);
Yinghai Lue9a00642010-02-10 01:20:13 -0800307 subtract_range(range, RANGE_NUM, 1ULL<<32, end);
Yinghai Lu30a18d62008-02-19 03:21:20 -0800308 }
309
310 /*
311 * add left over mmio range to def node/link ?
312 * that is tricky, just record range in from start_min to 4G
313 */
314 for (j = 0; j < pci_root_num; j++) {
315 info = &pci_root_info[j];
316 if (info->node == def_node && info->link == def_link)
317 break;
318 }
319 if (j < pci_root_num) {
320 info = &pci_root_info[j];
321
322 for (i = 0; i < RANGE_NUM; i++) {
323 if (!range[i].end)
324 continue;
325
Yinghai Lu9ad3f2c2010-02-10 01:20:11 -0800326 update_res(info, cap_resource(range[i].start),
Yinghai Lue9a00642010-02-10 01:20:13 -0800327 cap_resource(range[i].end - 1),
Yinghai Lu30a18d62008-02-19 03:21:20 -0800328 IORESOURCE_MEM, 1);
329 }
330 }
331
Yinghai Lu30a18d62008-02-19 03:21:20 -0800332 for (i = 0; i < pci_root_num; i++) {
333 int res_num;
334 int busnum;
335
336 info = &pci_root_info[i];
337 res_num = info->res_num;
338 busnum = info->bus_min;
Yinghai Lu99935a72009-10-04 21:54:24 -0700339 printk(KERN_DEBUG "bus: [%02x, %02x] on node %x link %x\n",
Yinghai Lu30a18d62008-02-19 03:21:20 -0800340 info->bus_min, info->bus_max, info->node, info->link);
341 for (j = 0; j < res_num; j++) {
342 res = &info->res[j];
Yinghai Lu284f9332010-02-10 01:20:12 -0800343 printk(KERN_DEBUG "bus: %02x index %x %pR\n",
344 busnum, j, res);
Yinghai Lu30a18d62008-02-19 03:21:20 -0800345 }
346 }
347
Linus Torvalds1da177e2005-04-16 15:20:36 -0700348 return 0;
349}
350
Robert Richter3a27dd12008-06-12 20:19:23 +0200351#define ENABLE_CF8_EXT_CFG (1ULL << 46)
352
Jan Beulich691269f2011-02-09 08:26:53 +0000353static void __cpuinit enable_pci_io_ecs(void *unused)
Robert Richter3a27dd12008-06-12 20:19:23 +0200354{
355 u64 reg;
356 rdmsrl(MSR_AMD64_NB_CFG, reg);
357 if (!(reg & ENABLE_CF8_EXT_CFG)) {
358 reg |= ENABLE_CF8_EXT_CFG;
359 wrmsrl(MSR_AMD64_NB_CFG, reg);
360 }
361}
362
Robert Richter91ede002008-08-22 20:23:38 +0200363static int __cpuinit amd_cpu_notify(struct notifier_block *self,
364 unsigned long action, void *hcpu)
Robert Richter3a27dd12008-06-12 20:19:23 +0200365{
Robert Richter91ede002008-08-22 20:23:38 +0200366 int cpu = (long)hcpu;
Robert Richtered217632008-08-22 20:23:38 +0200367 switch (action) {
Robert Richter91ede002008-08-22 20:23:38 +0200368 case CPU_ONLINE:
369 case CPU_ONLINE_FROZEN:
370 smp_call_function_single(cpu, enable_pci_io_ecs, NULL, 0);
371 break;
372 default:
373 break;
374 }
375 return NOTIFY_OK;
376}
377
378static struct notifier_block __cpuinitdata amd_cpu_notifier = {
379 .notifier_call = amd_cpu_notify,
380};
381
Jan Beulich24d9b702011-01-10 16:20:23 +0000382static void __init pci_enable_pci_io_ecs(void)
383{
384#ifdef CONFIG_AMD_NB
385 unsigned int i, n;
386
387 for (n = i = 0; !n && amd_nb_bus_dev_ranges[i].dev_limit; ++i) {
388 u8 bus = amd_nb_bus_dev_ranges[i].bus;
389 u8 slot = amd_nb_bus_dev_ranges[i].dev_base;
390 u8 limit = amd_nb_bus_dev_ranges[i].dev_limit;
391
392 for (; slot < limit; ++slot) {
393 u32 val = read_pci_config(bus, slot, 3, 0);
394
395 if (!early_is_amd_nb(val))
396 continue;
397
398 val = read_pci_config(bus, slot, 3, 0x8c);
399 if (!(val & (ENABLE_CF8_EXT_CFG >> 32))) {
400 val |= ENABLE_CF8_EXT_CFG >> 32;
401 write_pci_config(bus, slot, 3, 0x8c, val);
402 }
403 ++n;
404 }
405 }
406 pr_info("Extended Config Space enabled on %u nodes\n", n);
407#endif
408}
409
Robert Richter91ede002008-08-22 20:23:38 +0200410static int __init pci_io_ecs_init(void)
411{
412 int cpu;
413
Robert Richter3a27dd12008-06-12 20:19:23 +0200414 /* assume all cpus from fam10h have IO ECS */
415 if (boot_cpu_data.x86 < 0x10)
416 return 0;
Robert Richter91ede002008-08-22 20:23:38 +0200417
Jan Beulich24d9b702011-01-10 16:20:23 +0000418 /* Try the PCI method first. */
419 if (early_pci_allowed())
420 pci_enable_pci_io_ecs();
421
Robert Richter91ede002008-08-22 20:23:38 +0200422 register_cpu_notifier(&amd_cpu_notifier);
423 for_each_online_cpu(cpu)
424 amd_cpu_notify(&amd_cpu_notifier, (unsigned long)CPU_ONLINE,
425 (void *)(long)cpu);
Robert Richter3a27dd12008-06-12 20:19:23 +0200426 pci_probe |= PCI_HAS_IO_ECS;
Robert Richter91ede002008-08-22 20:23:38 +0200427
Robert Richter3a27dd12008-06-12 20:19:23 +0200428 return 0;
429}
430
Robert Richter9b4e27b2008-08-22 20:23:37 +0200431static int __init amd_postcore_init(void)
432{
433 if (boot_cpu_data.x86_vendor != X86_VENDOR_AMD)
434 return 0;
435
436 early_fill_mp_bus_info();
Robert Richter91ede002008-08-22 20:23:38 +0200437 pci_io_ecs_init();
Robert Richter9b4e27b2008-08-22 20:23:37 +0200438
439 return 0;
440}
441
442postcore_initcall(amd_postcore_init);