Book a Demo!
CoCalc Logo Icon
StoreFeaturesDocsShareSupportNewsAboutPoliciesSign UpSign In
awilliam
GitHub Repository: awilliam/linux-vfio
Path: blob/master/arch/x86/pci/amd_bus.c
10818 views
1
#include <linux/init.h>
2
#include <linux/pci.h>
3
#include <linux/topology.h>
4
#include <linux/cpu.h>
5
#include <linux/range.h>
6
7
#include <asm/amd_nb.h>
8
#include <asm/pci_x86.h>
9
10
#include <asm/pci-direct.h>
11
12
#include "bus_numa.h"
13
14
/*
15
* This discovers the pcibus <-> node mapping on AMD K8.
16
* also get peer root bus resource for io,mmio
17
*/
18
19
struct pci_hostbridge_probe {
20
u32 bus;
21
u32 slot;
22
u32 vendor;
23
u32 device;
24
};
25
26
static struct pci_hostbridge_probe pci_probes[] __initdata = {
27
{ 0, 0x18, PCI_VENDOR_ID_AMD, 0x1100 },
28
{ 0, 0x18, PCI_VENDOR_ID_AMD, 0x1200 },
29
{ 0xff, 0, PCI_VENDOR_ID_AMD, 0x1200 },
30
{ 0, 0x18, PCI_VENDOR_ID_AMD, 0x1300 },
31
};
32
33
static u64 __initdata fam10h_mmconf_start;
34
static u64 __initdata fam10h_mmconf_end;
35
static void __init get_pci_mmcfg_amd_fam10h_range(void)
36
{
37
u32 address;
38
u64 base, msr;
39
unsigned segn_busn_bits;
40
41
/* assume all cpus from fam10h have mmconf */
42
if (boot_cpu_data.x86 < 0x10)
43
return;
44
45
address = MSR_FAM10H_MMIO_CONF_BASE;
46
rdmsrl(address, msr);
47
48
/* mmconfig is not enable */
49
if (!(msr & FAM10H_MMIO_CONF_ENABLE))
50
return;
51
52
base = msr & (FAM10H_MMIO_CONF_BASE_MASK<<FAM10H_MMIO_CONF_BASE_SHIFT);
53
54
segn_busn_bits = (msr >> FAM10H_MMIO_CONF_BUSRANGE_SHIFT) &
55
FAM10H_MMIO_CONF_BUSRANGE_MASK;
56
57
fam10h_mmconf_start = base;
58
fam10h_mmconf_end = base + (1ULL<<(segn_busn_bits + 20)) - 1;
59
}
60
61
#define RANGE_NUM 16
62
63
/**
64
* early_fill_mp_bus_to_node()
65
* called before pcibios_scan_root and pci_scan_bus
66
* fills the mp_bus_to_cpumask array based according to the LDT Bus Number
67
* Registers found in the K8 northbridge
68
*/
69
static int __init early_fill_mp_bus_info(void)
70
{
71
int i;
72
int j;
73
unsigned bus;
74
unsigned slot;
75
int node;
76
int link;
77
int def_node;
78
int def_link;
79
struct pci_root_info *info;
80
u32 reg;
81
struct resource *res;
82
u64 start;
83
u64 end;
84
struct range range[RANGE_NUM];
85
u64 val;
86
u32 address;
87
bool found;
88
89
if (!early_pci_allowed())
90
return -1;
91
92
found = false;
93
for (i = 0; i < ARRAY_SIZE(pci_probes); i++) {
94
u32 id;
95
u16 device;
96
u16 vendor;
97
98
bus = pci_probes[i].bus;
99
slot = pci_probes[i].slot;
100
id = read_pci_config(bus, slot, 0, PCI_VENDOR_ID);
101
102
vendor = id & 0xffff;
103
device = (id>>16) & 0xffff;
104
if (pci_probes[i].vendor == vendor &&
105
pci_probes[i].device == device) {
106
found = true;
107
break;
108
}
109
}
110
111
if (!found)
112
return 0;
113
114
pci_root_num = 0;
115
for (i = 0; i < 4; i++) {
116
int min_bus;
117
int max_bus;
118
reg = read_pci_config(bus, slot, 1, 0xe0 + (i << 2));
119
120
/* Check if that register is enabled for bus range */
121
if ((reg & 7) != 3)
122
continue;
123
124
min_bus = (reg >> 16) & 0xff;
125
max_bus = (reg >> 24) & 0xff;
126
node = (reg >> 4) & 0x07;
127
#ifdef CONFIG_NUMA
128
for (j = min_bus; j <= max_bus; j++)
129
set_mp_bus_to_node(j, node);
130
#endif
131
link = (reg >> 8) & 0x03;
132
133
info = &pci_root_info[pci_root_num];
134
info->bus_min = min_bus;
135
info->bus_max = max_bus;
136
info->node = node;
137
info->link = link;
138
sprintf(info->name, "PCI Bus #%02x", min_bus);
139
pci_root_num++;
140
}
141
142
/* get the default node and link for left over res */
143
reg = read_pci_config(bus, slot, 0, 0x60);
144
def_node = (reg >> 8) & 0x07;
145
reg = read_pci_config(bus, slot, 0, 0x64);
146
def_link = (reg >> 8) & 0x03;
147
148
memset(range, 0, sizeof(range));
149
add_range(range, RANGE_NUM, 0, 0, 0xffff + 1);
150
/* io port resource */
151
for (i = 0; i < 4; i++) {
152
reg = read_pci_config(bus, slot, 1, 0xc0 + (i << 3));
153
if (!(reg & 3))
154
continue;
155
156
start = reg & 0xfff000;
157
reg = read_pci_config(bus, slot, 1, 0xc4 + (i << 3));
158
node = reg & 0x07;
159
link = (reg >> 4) & 0x03;
160
end = (reg & 0xfff000) | 0xfff;
161
162
/* find the position */
163
for (j = 0; j < pci_root_num; j++) {
164
info = &pci_root_info[j];
165
if (info->node == node && info->link == link)
166
break;
167
}
168
if (j == pci_root_num)
169
continue; /* not found */
170
171
info = &pci_root_info[j];
172
printk(KERN_DEBUG "node %d link %d: io port [%llx, %llx]\n",
173
node, link, start, end);
174
175
/* kernel only handle 16 bit only */
176
if (end > 0xffff)
177
end = 0xffff;
178
update_res(info, start, end, IORESOURCE_IO, 1);
179
subtract_range(range, RANGE_NUM, start, end + 1);
180
}
181
/* add left over io port range to def node/link, [0, 0xffff] */
182
/* find the position */
183
for (j = 0; j < pci_root_num; j++) {
184
info = &pci_root_info[j];
185
if (info->node == def_node && info->link == def_link)
186
break;
187
}
188
if (j < pci_root_num) {
189
info = &pci_root_info[j];
190
for (i = 0; i < RANGE_NUM; i++) {
191
if (!range[i].end)
192
continue;
193
194
update_res(info, range[i].start, range[i].end - 1,
195
IORESOURCE_IO, 1);
196
}
197
}
198
199
memset(range, 0, sizeof(range));
200
/* 0xfd00000000-0xffffffffff for HT */
201
end = cap_resource((0xfdULL<<32) - 1);
202
end++;
203
add_range(range, RANGE_NUM, 0, 0, end);
204
205
/* need to take out [0, TOM) for RAM*/
206
address = MSR_K8_TOP_MEM1;
207
rdmsrl(address, val);
208
end = (val & 0xffffff800000ULL);
209
printk(KERN_INFO "TOM: %016llx aka %lldM\n", end, end>>20);
210
if (end < (1ULL<<32))
211
subtract_range(range, RANGE_NUM, 0, end);
212
213
/* get mmconfig */
214
get_pci_mmcfg_amd_fam10h_range();
215
/* need to take out mmconf range */
216
if (fam10h_mmconf_end) {
217
printk(KERN_DEBUG "Fam 10h mmconf [%llx, %llx]\n", fam10h_mmconf_start, fam10h_mmconf_end);
218
subtract_range(range, RANGE_NUM, fam10h_mmconf_start,
219
fam10h_mmconf_end + 1);
220
}
221
222
/* mmio resource */
223
for (i = 0; i < 8; i++) {
224
reg = read_pci_config(bus, slot, 1, 0x80 + (i << 3));
225
if (!(reg & 3))
226
continue;
227
228
start = reg & 0xffffff00; /* 39:16 on 31:8*/
229
start <<= 8;
230
reg = read_pci_config(bus, slot, 1, 0x84 + (i << 3));
231
node = reg & 0x07;
232
link = (reg >> 4) & 0x03;
233
end = (reg & 0xffffff00);
234
end <<= 8;
235
end |= 0xffff;
236
237
/* find the position */
238
for (j = 0; j < pci_root_num; j++) {
239
info = &pci_root_info[j];
240
if (info->node == node && info->link == link)
241
break;
242
}
243
if (j == pci_root_num)
244
continue; /* not found */
245
246
info = &pci_root_info[j];
247
248
printk(KERN_DEBUG "node %d link %d: mmio [%llx, %llx]",
249
node, link, start, end);
250
/*
251
* some sick allocation would have range overlap with fam10h
252
* mmconf range, so need to update start and end.
253
*/
254
if (fam10h_mmconf_end) {
255
int changed = 0;
256
u64 endx = 0;
257
if (start >= fam10h_mmconf_start &&
258
start <= fam10h_mmconf_end) {
259
start = fam10h_mmconf_end + 1;
260
changed = 1;
261
}
262
263
if (end >= fam10h_mmconf_start &&
264
end <= fam10h_mmconf_end) {
265
end = fam10h_mmconf_start - 1;
266
changed = 1;
267
}
268
269
if (start < fam10h_mmconf_start &&
270
end > fam10h_mmconf_end) {
271
/* we got a hole */
272
endx = fam10h_mmconf_start - 1;
273
update_res(info, start, endx, IORESOURCE_MEM, 0);
274
subtract_range(range, RANGE_NUM, start,
275
endx + 1);
276
printk(KERN_CONT " ==> [%llx, %llx]", start, endx);
277
start = fam10h_mmconf_end + 1;
278
changed = 1;
279
}
280
if (changed) {
281
if (start <= end) {
282
printk(KERN_CONT " %s [%llx, %llx]", endx ? "and" : "==>", start, end);
283
} else {
284
printk(KERN_CONT "%s\n", endx?"":" ==> none");
285
continue;
286
}
287
}
288
}
289
290
update_res(info, cap_resource(start), cap_resource(end),
291
IORESOURCE_MEM, 1);
292
subtract_range(range, RANGE_NUM, start, end + 1);
293
printk(KERN_CONT "\n");
294
}
295
296
/* need to take out [4G, TOM2) for RAM*/
297
/* SYS_CFG */
298
address = MSR_K8_SYSCFG;
299
rdmsrl(address, val);
300
/* TOP_MEM2 is enabled? */
301
if (val & (1<<21)) {
302
/* TOP_MEM2 */
303
address = MSR_K8_TOP_MEM2;
304
rdmsrl(address, val);
305
end = (val & 0xffffff800000ULL);
306
printk(KERN_INFO "TOM2: %016llx aka %lldM\n", end, end>>20);
307
subtract_range(range, RANGE_NUM, 1ULL<<32, end);
308
}
309
310
/*
311
* add left over mmio range to def node/link ?
312
* that is tricky, just record range in from start_min to 4G
313
*/
314
for (j = 0; j < pci_root_num; j++) {
315
info = &pci_root_info[j];
316
if (info->node == def_node && info->link == def_link)
317
break;
318
}
319
if (j < pci_root_num) {
320
info = &pci_root_info[j];
321
322
for (i = 0; i < RANGE_NUM; i++) {
323
if (!range[i].end)
324
continue;
325
326
update_res(info, cap_resource(range[i].start),
327
cap_resource(range[i].end - 1),
328
IORESOURCE_MEM, 1);
329
}
330
}
331
332
for (i = 0; i < pci_root_num; i++) {
333
int res_num;
334
int busnum;
335
336
info = &pci_root_info[i];
337
res_num = info->res_num;
338
busnum = info->bus_min;
339
printk(KERN_DEBUG "bus: [%02x, %02x] on node %x link %x\n",
340
info->bus_min, info->bus_max, info->node, info->link);
341
for (j = 0; j < res_num; j++) {
342
res = &info->res[j];
343
printk(KERN_DEBUG "bus: %02x index %x %pR\n",
344
busnum, j, res);
345
}
346
}
347
348
return 0;
349
}
350
351
#define ENABLE_CF8_EXT_CFG (1ULL << 46)
352
353
static void __cpuinit enable_pci_io_ecs(void *unused)
354
{
355
u64 reg;
356
rdmsrl(MSR_AMD64_NB_CFG, reg);
357
if (!(reg & ENABLE_CF8_EXT_CFG)) {
358
reg |= ENABLE_CF8_EXT_CFG;
359
wrmsrl(MSR_AMD64_NB_CFG, reg);
360
}
361
}
362
363
static int __cpuinit amd_cpu_notify(struct notifier_block *self,
364
unsigned long action, void *hcpu)
365
{
366
int cpu = (long)hcpu;
367
switch (action) {
368
case CPU_ONLINE:
369
case CPU_ONLINE_FROZEN:
370
smp_call_function_single(cpu, enable_pci_io_ecs, NULL, 0);
371
break;
372
default:
373
break;
374
}
375
return NOTIFY_OK;
376
}
377
378
static struct notifier_block __cpuinitdata amd_cpu_notifier = {
379
.notifier_call = amd_cpu_notify,
380
};
381
382
static void __init pci_enable_pci_io_ecs(void)
383
{
384
#ifdef CONFIG_AMD_NB
385
unsigned int i, n;
386
387
for (n = i = 0; !n && amd_nb_bus_dev_ranges[i].dev_limit; ++i) {
388
u8 bus = amd_nb_bus_dev_ranges[i].bus;
389
u8 slot = amd_nb_bus_dev_ranges[i].dev_base;
390
u8 limit = amd_nb_bus_dev_ranges[i].dev_limit;
391
392
for (; slot < limit; ++slot) {
393
u32 val = read_pci_config(bus, slot, 3, 0);
394
395
if (!early_is_amd_nb(val))
396
continue;
397
398
val = read_pci_config(bus, slot, 3, 0x8c);
399
if (!(val & (ENABLE_CF8_EXT_CFG >> 32))) {
400
val |= ENABLE_CF8_EXT_CFG >> 32;
401
write_pci_config(bus, slot, 3, 0x8c, val);
402
}
403
++n;
404
}
405
}
406
pr_info("Extended Config Space enabled on %u nodes\n", n);
407
#endif
408
}
409
410
static int __init pci_io_ecs_init(void)
411
{
412
int cpu;
413
414
/* assume all cpus from fam10h have IO ECS */
415
if (boot_cpu_data.x86 < 0x10)
416
return 0;
417
418
/* Try the PCI method first. */
419
if (early_pci_allowed())
420
pci_enable_pci_io_ecs();
421
422
register_cpu_notifier(&amd_cpu_notifier);
423
for_each_online_cpu(cpu)
424
amd_cpu_notify(&amd_cpu_notifier, (unsigned long)CPU_ONLINE,
425
(void *)(long)cpu);
426
pci_probe |= PCI_HAS_IO_ECS;
427
428
return 0;
429
}
430
431
static int __init amd_postcore_init(void)
432
{
433
if (boot_cpu_data.x86_vendor != X86_VENDOR_AMD)
434
return 0;
435
436
early_fill_mp_bus_info();
437
pci_io_ecs_init();
438
439
return 0;
440
}
441
442
postcore_initcall(amd_postcore_init);
443
444