blob: 95ecbd495955094ac22c7502fe992ea2af7ad444 [file] [log] [blame]
Linus Torvalds1da177e2005-04-16 15:20:36 -07001#include <linux/init.h>
2#include <linux/pci.h>
Robert Richterd199a042008-07-02 22:50:26 +02003#include <linux/topology.h>
Robert Richter91ede002008-08-22 20:23:38 +02004#include <linux/cpu.h>
Jaswinder Singh Rajput82487712008-12-27 18:32:28 +05305#include <asm/pci_x86.h>
Robert Richter3a27dd12008-06-12 20:19:23 +02006
7#ifdef CONFIG_X86_64
Yinghai Lu871d5f82008-02-19 03:20:09 -08008#include <asm/pci-direct.h>
Robert Richterd199a042008-07-02 22:50:26 +02009#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -070010
Yinghai Lu99935a72009-10-04 21:54:24 -070011#include "bus_numa.h"
12
Linus Torvalds1da177e2005-04-16 15:20:36 -070013/*
14 * This discovers the pcibus <-> node mapping on AMD K8.
Yinghai Lu30a18d62008-02-19 03:21:20 -080015 * also get peer root bus resource for io,mmio
Linus Torvalds1da177e2005-04-16 15:20:36 -070016 */
17
Robert Richterd199a042008-07-02 22:50:26 +020018#ifdef CONFIG_X86_64
Yinghai Lu871d5f82008-02-19 03:20:09 -080019
Yinghai Lu30a18d62008-02-19 03:21:20 -080020#define RANGE_NUM 16
21
22struct res_range {
23 size_t start;
24 size_t end;
25};
26
27static void __init update_range(struct res_range *range, size_t start,
28 size_t end)
29{
30 int i;
31 int j;
32
33 for (j = 0; j < RANGE_NUM; j++) {
34 if (!range[j].end)
35 continue;
Yinghai Lue8ee6f02008-04-13 01:41:58 -070036
37 if (start <= range[j].start && end >= range[j].end) {
Yinghai Lu30a18d62008-02-19 03:21:20 -080038 range[j].start = 0;
39 range[j].end = 0;
Yinghai Lue8ee6f02008-04-13 01:41:58 -070040 continue;
41 }
42
43 if (start <= range[j].start && end < range[j].end && range[j].start < end + 1) {
44 range[j].start = end + 1;
45 continue;
46 }
47
48
49 if (start > range[j].start && end >= range[j].end && range[j].end > start - 1) {
Yinghai Lu30a18d62008-02-19 03:21:20 -080050 range[j].end = start - 1;
Yinghai Lue8ee6f02008-04-13 01:41:58 -070051 continue;
52 }
53
54 if (start > range[j].start && end < range[j].end) {
Yinghai Lu30a18d62008-02-19 03:21:20 -080055 /* find the new spare */
56 for (i = 0; i < RANGE_NUM; i++) {
57 if (range[i].end == 0)
58 break;
59 }
60 if (i < RANGE_NUM) {
61 range[i].end = range[j].end;
62 range[i].start = end + 1;
63 } else {
64 printk(KERN_ERR "run of slot in ranges\n");
65 }
66 range[j].end = start - 1;
Yinghai Lue8ee6f02008-04-13 01:41:58 -070067 continue;
Yinghai Lu30a18d62008-02-19 03:21:20 -080068 }
69 }
70}
71
Yinghai Lu30a18d62008-02-19 03:21:20 -080072struct pci_hostbridge_probe {
73 u32 bus;
74 u32 slot;
75 u32 vendor;
76 u32 device;
77};
78
79static struct pci_hostbridge_probe pci_probes[] __initdata = {
80 { 0, 0x18, PCI_VENDOR_ID_AMD, 0x1100 },
81 { 0, 0x18, PCI_VENDOR_ID_AMD, 0x1200 },
82 { 0xff, 0, PCI_VENDOR_ID_AMD, 0x1200 },
83 { 0, 0x18, PCI_VENDOR_ID_AMD, 0x1300 },
84};
85
Yinghai Lu6e184f22008-03-06 01:15:31 -080086static u64 __initdata fam10h_mmconf_start;
87static u64 __initdata fam10h_mmconf_end;
88static void __init get_pci_mmcfg_amd_fam10h_range(void)
89{
90 u32 address;
91 u64 base, msr;
92 unsigned segn_busn_bits;
93
94 /* assume all cpus from fam10h have mmconf */
95 if (boot_cpu_data.x86 < 0x10)
96 return;
97
98 address = MSR_FAM10H_MMIO_CONF_BASE;
99 rdmsrl(address, msr);
100
101 /* mmconfig is not enable */
102 if (!(msr & FAM10H_MMIO_CONF_ENABLE))
103 return;
104
105 base = msr & (FAM10H_MMIO_CONF_BASE_MASK<<FAM10H_MMIO_CONF_BASE_SHIFT);
106
107 segn_busn_bits = (msr >> FAM10H_MMIO_CONF_BUSRANGE_SHIFT) &
108 FAM10H_MMIO_CONF_BUSRANGE_MASK;
109
110 fam10h_mmconf_start = base;
111 fam10h_mmconf_end = base + (1ULL<<(segn_busn_bits + 20)) - 1;
112}
113
Linus Torvalds1da177e2005-04-16 15:20:36 -0700114/**
Yinghai Lu871d5f82008-02-19 03:20:09 -0800115 * early_fill_mp_bus_to_node()
116 * called before pcibios_scan_root and pci_scan_bus
Linus Torvalds1da177e2005-04-16 15:20:36 -0700117 * fills the mp_bus_to_cpumask array based according to the LDT Bus Number
118 * Registers found in the K8 northbridge
119 */
Yinghai Lu30a18d62008-02-19 03:21:20 -0800120static int __init early_fill_mp_bus_info(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700121{
Yinghai Lu30a18d62008-02-19 03:21:20 -0800122 int i;
123 int j;
124 unsigned bus;
Yinghai Lu871d5f82008-02-19 03:20:09 -0800125 unsigned slot;
Yinghai Lu35ddd062008-02-19 03:15:08 -0800126 int node;
Yinghai Lu30a18d62008-02-19 03:21:20 -0800127 int link;
128 int def_node;
129 int def_link;
130 struct pci_root_info *info;
131 u32 reg;
132 struct resource *res;
133 size_t start;
134 size_t end;
135 struct res_range range[RANGE_NUM];
136 u64 val;
137 u32 address;
Yinghai Lu35ddd062008-02-19 03:15:08 -0800138
Yinghai Lu871d5f82008-02-19 03:20:09 -0800139 if (!early_pci_allowed())
140 return -1;
141
Yinghai Lu99935a72009-10-04 21:54:24 -0700142 found_all_numa_early = 0;
Yinghai Lu30a18d62008-02-19 03:21:20 -0800143 for (i = 0; i < ARRAY_SIZE(pci_probes); i++) {
144 u32 id;
145 u16 device;
146 u16 vendor;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700147
Yinghai Lu30a18d62008-02-19 03:21:20 -0800148 bus = pci_probes[i].bus;
149 slot = pci_probes[i].slot;
150 id = read_pci_config(bus, slot, 0, PCI_VENDOR_ID);
Yinghai Lu35ddd062008-02-19 03:15:08 -0800151
Yinghai Lu30a18d62008-02-19 03:21:20 -0800152 vendor = id & 0xffff;
153 device = (id>>16) & 0xffff;
154 if (pci_probes[i].vendor == vendor &&
155 pci_probes[i].device == device) {
Yinghai Lu99935a72009-10-04 21:54:24 -0700156 found_all_numa_early = 1;
Yinghai Lu30a18d62008-02-19 03:21:20 -0800157 break;
158 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700159 }
160
Yinghai Lu99935a72009-10-04 21:54:24 -0700161 if (!found_all_numa_early)
Yinghai Lu30a18d62008-02-19 03:21:20 -0800162 return 0;
163
164 pci_root_num = 0;
165 for (i = 0; i < 4; i++) {
166 int min_bus;
167 int max_bus;
168 reg = read_pci_config(bus, slot, 1, 0xe0 + (i << 2));
169
170 /* Check if that register is enabled for bus range */
171 if ((reg & 7) != 3)
172 continue;
173
174 min_bus = (reg >> 16) & 0xff;
175 max_bus = (reg >> 24) & 0xff;
176 node = (reg >> 4) & 0x07;
177#ifdef CONFIG_NUMA
178 for (j = min_bus; j <= max_bus; j++)
Jesse Barnes25470892009-07-10 14:04:30 -0700179 set_mp_bus_to_node(j, node);
Yinghai Lu30a18d62008-02-19 03:21:20 -0800180#endif
181 link = (reg >> 8) & 0x03;
182
183 info = &pci_root_info[pci_root_num];
184 info->bus_min = min_bus;
185 info->bus_max = max_bus;
186 info->node = node;
187 info->link = link;
188 sprintf(info->name, "PCI Bus #%02x", min_bus);
189 pci_root_num++;
190 }
191
192 /* get the default node and link for left over res */
193 reg = read_pci_config(bus, slot, 0, 0x60);
194 def_node = (reg >> 8) & 0x07;
195 reg = read_pci_config(bus, slot, 0, 0x64);
196 def_link = (reg >> 8) & 0x03;
197
198 memset(range, 0, sizeof(range));
199 range[0].end = 0xffff;
200 /* io port resource */
201 for (i = 0; i < 4; i++) {
202 reg = read_pci_config(bus, slot, 1, 0xc0 + (i << 3));
203 if (!(reg & 3))
204 continue;
205
206 start = reg & 0xfff000;
207 reg = read_pci_config(bus, slot, 1, 0xc4 + (i << 3));
208 node = reg & 0x07;
209 link = (reg >> 4) & 0x03;
210 end = (reg & 0xfff000) | 0xfff;
211
212 /* find the position */
213 for (j = 0; j < pci_root_num; j++) {
214 info = &pci_root_info[j];
215 if (info->node == node && info->link == link)
216 break;
217 }
218 if (j == pci_root_num)
219 continue; /* not found */
220
221 info = &pci_root_info[j];
Yinghai Lu6e184f22008-03-06 01:15:31 -0800222 printk(KERN_DEBUG "node %d link %d: io port [%llx, %llx]\n",
223 node, link, (u64)start, (u64)end);
Yinghai Lue8ee6f02008-04-13 01:41:58 -0700224
225 /* kernel only handle 16 bit only */
226 if (end > 0xffff)
227 end = 0xffff;
228 update_res(info, start, end, IORESOURCE_IO, 1);
Yinghai Lu30a18d62008-02-19 03:21:20 -0800229 update_range(range, start, end);
230 }
231 /* add left over io port range to def node/link, [0, 0xffff] */
232 /* find the position */
233 for (j = 0; j < pci_root_num; j++) {
234 info = &pci_root_info[j];
235 if (info->node == def_node && info->link == def_link)
236 break;
237 }
238 if (j < pci_root_num) {
239 info = &pci_root_info[j];
240 for (i = 0; i < RANGE_NUM; i++) {
241 if (!range[i].end)
242 continue;
243
244 update_res(info, range[i].start, range[i].end,
245 IORESOURCE_IO, 1);
246 }
247 }
248
249 memset(range, 0, sizeof(range));
250 /* 0xfd00000000-0xffffffffff for HT */
Yinghai Lu6e184f22008-03-06 01:15:31 -0800251 range[0].end = (0xfdULL<<32) - 1;
Yinghai Lu30a18d62008-02-19 03:21:20 -0800252
253 /* need to take out [0, TOM) for RAM*/
254 address = MSR_K8_TOP_MEM1;
255 rdmsrl(address, val);
Yinghai Lu8004dd92008-05-12 17:40:39 -0700256 end = (val & 0xffffff800000ULL);
Yinghai Lu30a18d62008-02-19 03:21:20 -0800257 printk(KERN_INFO "TOM: %016lx aka %ldM\n", end, end>>20);
258 if (end < (1ULL<<32))
259 update_range(range, 0, end - 1);
260
Yinghai Lu6e184f22008-03-06 01:15:31 -0800261 /* get mmconfig */
262 get_pci_mmcfg_amd_fam10h_range();
263 /* need to take out mmconf range */
264 if (fam10h_mmconf_end) {
265 printk(KERN_DEBUG "Fam 10h mmconf [%llx, %llx]\n", fam10h_mmconf_start, fam10h_mmconf_end);
266 update_range(range, fam10h_mmconf_start, fam10h_mmconf_end);
267 }
268
Yinghai Lu30a18d62008-02-19 03:21:20 -0800269 /* mmio resource */
270 for (i = 0; i < 8; i++) {
271 reg = read_pci_config(bus, slot, 1, 0x80 + (i << 3));
272 if (!(reg & 3))
273 continue;
274
275 start = reg & 0xffffff00; /* 39:16 on 31:8*/
276 start <<= 8;
277 reg = read_pci_config(bus, slot, 1, 0x84 + (i << 3));
278 node = reg & 0x07;
279 link = (reg >> 4) & 0x03;
280 end = (reg & 0xffffff00);
281 end <<= 8;
282 end |= 0xffff;
283
284 /* find the position */
285 for (j = 0; j < pci_root_num; j++) {
286 info = &pci_root_info[j];
287 if (info->node == node && info->link == link)
288 break;
289 }
290 if (j == pci_root_num)
291 continue; /* not found */
292
293 info = &pci_root_info[j];
Yinghai Lu6e184f22008-03-06 01:15:31 -0800294
295 printk(KERN_DEBUG "node %d link %d: mmio [%llx, %llx]",
296 node, link, (u64)start, (u64)end);
297 /*
298 * some sick allocation would have range overlap with fam10h
299 * mmconf range, so need to update start and end.
300 */
301 if (fam10h_mmconf_end) {
302 int changed = 0;
303 u64 endx = 0;
304 if (start >= fam10h_mmconf_start &&
305 start <= fam10h_mmconf_end) {
306 start = fam10h_mmconf_end + 1;
307 changed = 1;
308 }
309
310 if (end >= fam10h_mmconf_start &&
311 end <= fam10h_mmconf_end) {
312 end = fam10h_mmconf_start - 1;
313 changed = 1;
314 }
315
316 if (start < fam10h_mmconf_start &&
317 end > fam10h_mmconf_end) {
318 /* we got a hole */
319 endx = fam10h_mmconf_start - 1;
320 update_res(info, start, endx, IORESOURCE_MEM, 0);
321 update_range(range, start, endx);
322 printk(KERN_CONT " ==> [%llx, %llx]", (u64)start, endx);
323 start = fam10h_mmconf_end + 1;
324 changed = 1;
325 }
326 if (changed) {
327 if (start <= end) {
328 printk(KERN_CONT " %s [%llx, %llx]", endx?"and":"==>", (u64)start, (u64)end);
329 } else {
330 printk(KERN_CONT "%s\n", endx?"":" ==> none");
331 continue;
332 }
333 }
334 }
335
Yinghai Lue8ee6f02008-04-13 01:41:58 -0700336 update_res(info, start, end, IORESOURCE_MEM, 1);
Yinghai Lu30a18d62008-02-19 03:21:20 -0800337 update_range(range, start, end);
Yinghai Lu6e184f22008-03-06 01:15:31 -0800338 printk(KERN_CONT "\n");
Yinghai Lu30a18d62008-02-19 03:21:20 -0800339 }
340
341 /* need to take out [4G, TOM2) for RAM*/
342 /* SYS_CFG */
343 address = MSR_K8_SYSCFG;
344 rdmsrl(address, val);
345 /* TOP_MEM2 is enabled? */
346 if (val & (1<<21)) {
347 /* TOP_MEM2 */
348 address = MSR_K8_TOP_MEM2;
349 rdmsrl(address, val);
Yinghai Lu8004dd92008-05-12 17:40:39 -0700350 end = (val & 0xffffff800000ULL);
Yinghai Lu30a18d62008-02-19 03:21:20 -0800351 printk(KERN_INFO "TOM2: %016lx aka %ldM\n", end, end>>20);
352 update_range(range, 1ULL<<32, end - 1);
353 }
354
355 /*
356 * add left over mmio range to def node/link ?
357 * that is tricky, just record range in from start_min to 4G
358 */
359 for (j = 0; j < pci_root_num; j++) {
360 info = &pci_root_info[j];
361 if (info->node == def_node && info->link == def_link)
362 break;
363 }
364 if (j < pci_root_num) {
365 info = &pci_root_info[j];
366
367 for (i = 0; i < RANGE_NUM; i++) {
368 if (!range[i].end)
369 continue;
370
371 update_res(info, range[i].start, range[i].end,
372 IORESOURCE_MEM, 1);
373 }
374 }
375
Yinghai Lu30a18d62008-02-19 03:21:20 -0800376 for (i = 0; i < pci_root_num; i++) {
377 int res_num;
378 int busnum;
379
380 info = &pci_root_info[i];
381 res_num = info->res_num;
382 busnum = info->bus_min;
Yinghai Lu99935a72009-10-04 21:54:24 -0700383 printk(KERN_DEBUG "bus: [%02x, %02x] on node %x link %x\n",
Yinghai Lu30a18d62008-02-19 03:21:20 -0800384 info->bus_min, info->bus_max, info->node, info->link);
385 for (j = 0; j < res_num; j++) {
386 res = &info->res[j];
387 printk(KERN_DEBUG "bus: %02x index %x %s: [%llx, %llx]\n",
388 busnum, j,
389 (res->flags & IORESOURCE_IO)?"io port":"mmio",
390 res->start, res->end);
391 }
392 }
393
Linus Torvalds1da177e2005-04-16 15:20:36 -0700394 return 0;
395}
396
Robert Richter9b4e27b2008-08-22 20:23:37 +0200397#else /* !CONFIG_X86_64 */
Robert Richter3a27dd12008-06-12 20:19:23 +0200398
Robert Richter9b4e27b2008-08-22 20:23:37 +0200399static int __init early_fill_mp_bus_info(void) { return 0; }
400
401#endif /* !CONFIG_X86_64 */
Robert Richter3a27dd12008-06-12 20:19:23 +0200402
403/* common 32/64 bit code */
404
405#define ENABLE_CF8_EXT_CFG (1ULL << 46)
406
Robert Richter91ede002008-08-22 20:23:38 +0200407static void enable_pci_io_ecs(void *unused)
Robert Richter3a27dd12008-06-12 20:19:23 +0200408{
409 u64 reg;
410 rdmsrl(MSR_AMD64_NB_CFG, reg);
411 if (!(reg & ENABLE_CF8_EXT_CFG)) {
412 reg |= ENABLE_CF8_EXT_CFG;
413 wrmsrl(MSR_AMD64_NB_CFG, reg);
414 }
415}
416
Robert Richter91ede002008-08-22 20:23:38 +0200417static int __cpuinit amd_cpu_notify(struct notifier_block *self,
418 unsigned long action, void *hcpu)
Robert Richter3a27dd12008-06-12 20:19:23 +0200419{
Robert Richter91ede002008-08-22 20:23:38 +0200420 int cpu = (long)hcpu;
Robert Richtered217632008-08-22 20:23:38 +0200421 switch (action) {
Robert Richter91ede002008-08-22 20:23:38 +0200422 case CPU_ONLINE:
423 case CPU_ONLINE_FROZEN:
424 smp_call_function_single(cpu, enable_pci_io_ecs, NULL, 0);
425 break;
426 default:
427 break;
428 }
429 return NOTIFY_OK;
430}
431
432static struct notifier_block __cpuinitdata amd_cpu_notifier = {
433 .notifier_call = amd_cpu_notify,
434};
435
436static int __init pci_io_ecs_init(void)
437{
438 int cpu;
439
Robert Richter3a27dd12008-06-12 20:19:23 +0200440 /* assume all cpus from fam10h have IO ECS */
441 if (boot_cpu_data.x86 < 0x10)
442 return 0;
Robert Richter91ede002008-08-22 20:23:38 +0200443
444 register_cpu_notifier(&amd_cpu_notifier);
445 for_each_online_cpu(cpu)
446 amd_cpu_notify(&amd_cpu_notifier, (unsigned long)CPU_ONLINE,
447 (void *)(long)cpu);
Robert Richter3a27dd12008-06-12 20:19:23 +0200448 pci_probe |= PCI_HAS_IO_ECS;
Robert Richter91ede002008-08-22 20:23:38 +0200449
Robert Richter3a27dd12008-06-12 20:19:23 +0200450 return 0;
451}
452
Robert Richter9b4e27b2008-08-22 20:23:37 +0200453static int __init amd_postcore_init(void)
454{
455 if (boot_cpu_data.x86_vendor != X86_VENDOR_AMD)
456 return 0;
457
458 early_fill_mp_bus_info();
Robert Richter91ede002008-08-22 20:23:38 +0200459 pci_io_ecs_init();
Robert Richter9b4e27b2008-08-22 20:23:37 +0200460
461 return 0;
462}
463
464postcore_initcall(amd_postcore_init);