1#include <linux/pci.h> 2#include <linux/acpi.h> 3#include <linux/init.h> 4#include <linux/irq.h> 5#include <linux/dmi.h> 6#include <linux/slab.h> 7#include <asm/numa.h> 8#include <asm/pci_x86.h> 9 10struct pci_root_info { 11 struct acpi_device *bridge; 12 char name[16]; 13 struct pci_sysdata sd; 14#ifdef CONFIG_PCI_MMCONFIG 15 bool mcfg_added; 16 u16 segment; 17 u8 start_bus; 18 u8 end_bus; 19#endif 20}; 21 22static bool pci_use_crs = true; 23static bool pci_ignore_seg = false; 24 25static int __init set_use_crs(const struct dmi_system_id *id) 26{ 27 pci_use_crs = true; 28 return 0; 29} 30 31static int __init set_nouse_crs(const struct dmi_system_id *id) 32{ 33 pci_use_crs = false; 34 return 0; 35} 36 37static int __init set_ignore_seg(const struct dmi_system_id *id) 38{ 39 printk(KERN_INFO "PCI: %s detected: ignoring ACPI _SEG\n", id->ident); 40 pci_ignore_seg = true; 41 return 0; 42} 43 44static const struct dmi_system_id pci_crs_quirks[] __initconst = { 45 /* http://bugzilla.kernel.org/show_bug.cgi?id=14183 */ 46 { 47 .callback = set_use_crs, 48 .ident = "IBM System x3800", 49 .matches = { 50 DMI_MATCH(DMI_SYS_VENDOR, "IBM"), 51 DMI_MATCH(DMI_PRODUCT_NAME, "x3800"), 52 }, 53 }, 54 /* https://bugzilla.kernel.org/show_bug.cgi?id=16007 */ 55 /* 2006 AMD HT/VIA system with two host bridges */ 56 { 57 .callback = set_use_crs, 58 .ident = "ASRock ALiveSATA2-GLAN", 59 .matches = { 60 DMI_MATCH(DMI_PRODUCT_NAME, "ALiveSATA2-GLAN"), 61 }, 62 }, 63 /* https://bugzilla.kernel.org/show_bug.cgi?id=30552 */ 64 /* 2006 AMD HT/VIA system with two host bridges */ 65 { 66 .callback = set_use_crs, 67 .ident = "ASUS M2V-MX SE", 68 .matches = { 69 DMI_MATCH(DMI_BOARD_VENDOR, "ASUSTeK Computer INC."), 70 DMI_MATCH(DMI_BOARD_NAME, "M2V-MX SE"), 71 DMI_MATCH(DMI_BIOS_VENDOR, "American Megatrends Inc."), 72 }, 73 }, 74 /* https://bugzilla.kernel.org/show_bug.cgi?id=42619 */ 75 { 76 .callback = set_use_crs, 77 .ident = "MSI MS-7253", 78 .matches = { 79 DMI_MATCH(DMI_BOARD_VENDOR, "MICRO-STAR INTERNATIONAL CO., LTD"), 80 DMI_MATCH(DMI_BOARD_NAME, "MS-7253"), 81 DMI_MATCH(DMI_BIOS_VENDOR, "Phoenix Technologies, LTD"), 82 }, 83 }, 84 /* https://bugs.launchpad.net/ubuntu/+source/alsa-driver/+bug/931368 */ 85 /* https://bugs.launchpad.net/ubuntu/+source/alsa-driver/+bug/1033299 */ 86 { 87 .callback = set_use_crs, 88 .ident = "Foxconn K8M890-8237A", 89 .matches = { 90 DMI_MATCH(DMI_BOARD_VENDOR, "Foxconn"), 91 DMI_MATCH(DMI_BOARD_NAME, "K8M890-8237A"), 92 DMI_MATCH(DMI_BIOS_VENDOR, "Phoenix Technologies, LTD"), 93 }, 94 }, 95 96 /* Now for the blacklist.. */ 97 98 /* https://bugzilla.redhat.com/show_bug.cgi?id=769657 */ 99 { 100 .callback = set_nouse_crs, 101 .ident = "Dell Studio 1557", 102 .matches = { 103 DMI_MATCH(DMI_BOARD_VENDOR, "Dell Inc."), 104 DMI_MATCH(DMI_PRODUCT_NAME, "Studio 1557"), 105 DMI_MATCH(DMI_BIOS_VERSION, "A09"), 106 }, 107 }, 108 /* https://bugzilla.redhat.com/show_bug.cgi?id=769657 */ 109 { 110 .callback = set_nouse_crs, 111 .ident = "Thinkpad SL510", 112 .matches = { 113 DMI_MATCH(DMI_BOARD_VENDOR, "LENOVO"), 114 DMI_MATCH(DMI_BOARD_NAME, "2847DFG"), 115 DMI_MATCH(DMI_BIOS_VERSION, "6JET85WW (1.43 )"), 116 }, 117 }, 118 119 /* https://bugzilla.kernel.org/show_bug.cgi?id=15362 */ 120 { 121 .callback = set_ignore_seg, 122 .ident = "HP xw9300", 123 .matches = { 124 DMI_MATCH(DMI_SYS_VENDOR, "Hewlett-Packard"), 125 DMI_MATCH(DMI_PRODUCT_NAME, "HP xw9300 Workstation"), 126 }, 127 }, 128 {} 129}; 130 131void __init pci_acpi_crs_quirks(void) 132{ 133 int year; 134 135 if (dmi_get_date(DMI_BIOS_DATE, &year, NULL, NULL) && year < 2008) { 136 if (iomem_resource.end <= 0xffffffff) 137 pci_use_crs = false; 138 } 139 140 dmi_check_system(pci_crs_quirks); 141 142 /* 143 * If the user specifies "pci=use_crs" or "pci=nocrs" explicitly, that 144 * takes precedence over anything we figured out above. 145 */ 146 if (pci_probe & PCI_ROOT_NO_CRS) 147 pci_use_crs = false; 148 else if (pci_probe & PCI_USE__CRS) 149 pci_use_crs = true; 150 151 printk(KERN_INFO "PCI: %s host bridge windows from ACPI; " 152 "if necessary, use \"pci=%s\" and report a bug\n", 153 pci_use_crs ? "Using" : "Ignoring", 154 pci_use_crs ? "nocrs" : "use_crs"); 155} 156 157#ifdef CONFIG_PCI_MMCONFIG 158static int check_segment(u16 seg, struct device *dev, char *estr) 159{ 160 if (seg) { 161 dev_err(dev, 162 "%s can't access PCI configuration " 163 "space under this host bridge.\n", 164 estr); 165 return -EIO; 166 } 167 168 /* 169 * Failure in adding MMCFG information is not fatal, 170 * just can't access extended configuration space of 171 * devices under this host bridge. 172 */ 173 dev_warn(dev, 174 "%s can't access extended PCI configuration " 175 "space under this bridge.\n", 176 estr); 177 178 return 0; 179} 180 181static int setup_mcfg_map(struct pci_root_info *info, u16 seg, u8 start, 182 u8 end, phys_addr_t addr) 183{ 184 int result; 185 struct device *dev = &info->bridge->dev; 186 187 info->start_bus = start; 188 info->end_bus = end; 189 info->mcfg_added = false; 190 191 /* return success if MMCFG is not in use */ 192 if (raw_pci_ext_ops && raw_pci_ext_ops != &pci_mmcfg) 193 return 0; 194 195 if (!(pci_probe & PCI_PROBE_MMCONF)) 196 return check_segment(seg, dev, "MMCONFIG is disabled,"); 197 198 result = pci_mmconfig_insert(dev, seg, start, end, addr); 199 if (result == 0) { 200 /* enable MMCFG if it hasn't been enabled yet */ 201 if (raw_pci_ext_ops == NULL) 202 raw_pci_ext_ops = &pci_mmcfg; 203 info->mcfg_added = true; 204 } else if (result != -EEXIST) 205 return check_segment(seg, dev, 206 "fail to add MMCONFIG information,"); 207 208 return 0; 209} 210 211static void teardown_mcfg_map(struct pci_root_info *info) 212{ 213 if (info->mcfg_added) { 214 pci_mmconfig_delete(info->segment, info->start_bus, 215 info->end_bus); 216 info->mcfg_added = false; 217 } 218} 219#else 220static int setup_mcfg_map(struct pci_root_info *info, 221 u16 seg, u8 start, u8 end, 222 phys_addr_t addr) 223{ 224 return 0; 225} 226static void teardown_mcfg_map(struct pci_root_info *info) 227{ 228} 229#endif 230 231static void validate_resources(struct device *dev, struct list_head *crs_res, 232 unsigned long type) 233{ 234 LIST_HEAD(list); 235 struct resource *res1, *res2, *root = NULL; 236 struct resource_entry *tmp, *entry, *entry2; 237 238 BUG_ON((type & (IORESOURCE_MEM | IORESOURCE_IO)) == 0); 239 root = (type & IORESOURCE_MEM) ? &iomem_resource : &ioport_resource; 240 241 list_splice_init(crs_res, &list); 242 resource_list_for_each_entry_safe(entry, tmp, &list) { 243 bool free = false; 244 resource_size_t end; 245 246 res1 = entry->res; 247 if (!(res1->flags & type)) 248 goto next; 249 250 /* Exclude non-addressable range or non-addressable portion */ 251 end = min(res1->end, root->end); 252 if (end <= res1->start) { 253 dev_info(dev, "host bridge window %pR (ignored, not CPU addressable)\n", 254 res1); 255 free = true; 256 goto next; 257 } else if (res1->end != end) { 258 dev_info(dev, "host bridge window %pR ([%#llx-%#llx] ignored, not CPU addressable)\n", 259 res1, (unsigned long long)end + 1, 260 (unsigned long long)res1->end); 261 res1->end = end; 262 } 263 264 resource_list_for_each_entry(entry2, crs_res) { 265 res2 = entry2->res; 266 if (!(res2->flags & type)) 267 continue; 268 269 /* 270 * I don't like throwing away windows because then 271 * our resources no longer match the ACPI _CRS, but 272 * the kernel resource tree doesn't allow overlaps. 273 */ 274 if (resource_overlaps(res1, res2)) { 275 res2->start = min(res1->start, res2->start); 276 res2->end = max(res1->end, res2->end); 277 dev_info(dev, "host bridge window expanded to %pR; %pR ignored\n", 278 res2, res1); 279 free = true; 280 goto next; 281 } 282 } 283 284next: 285 resource_list_del(entry); 286 if (free) 287 resource_list_free_entry(entry); 288 else 289 resource_list_add_tail(entry, crs_res); 290 } 291} 292 293static void add_resources(struct pci_root_info *info, 294 struct list_head *resources, 295 struct list_head *crs_res) 296{ 297 struct resource_entry *entry, *tmp; 298 struct resource *res, *conflict, *root = NULL; 299 300 validate_resources(&info->bridge->dev, crs_res, IORESOURCE_MEM); 301 validate_resources(&info->bridge->dev, crs_res, IORESOURCE_IO); 302 303 resource_list_for_each_entry_safe(entry, tmp, crs_res) { 304 res = entry->res; 305 if (res->flags & IORESOURCE_MEM) 306 root = &iomem_resource; 307 else if (res->flags & IORESOURCE_IO) 308 root = &ioport_resource; 309 else 310 BUG_ON(res); 311 312 conflict = insert_resource_conflict(root, res); 313 if (conflict) { 314 dev_info(&info->bridge->dev, 315 "ignoring host bridge window %pR (conflicts with %s %pR)\n", 316 res, conflict->name, conflict); 317 resource_list_destroy_entry(entry); 318 } 319 } 320 321 list_splice_tail(crs_res, resources); 322} 323 324static void release_pci_root_info(struct pci_host_bridge *bridge) 325{ 326 struct resource *res; 327 struct resource_entry *entry; 328 struct pci_root_info *info = bridge->release_data; 329 330 resource_list_for_each_entry(entry, &bridge->windows) { 331 res = entry->res; 332 if (res->parent && 333 (res->flags & (IORESOURCE_MEM | IORESOURCE_IO))) 334 release_resource(res); 335 } 336 337 teardown_mcfg_map(info); 338 kfree(info); 339} 340 341/* 342 * An IO port or MMIO resource assigned to a PCI host bridge may be 343 * consumed by the host bridge itself or available to its child 344 * bus/devices. The ACPI specification defines a bit (Producer/Consumer) 345 * to tell whether the resource is consumed by the host bridge itself, 346 * but firmware hasn't used that bit consistently, so we can't rely on it. 347 * 348 * On x86 and IA64 platforms, all IO port and MMIO resources are assumed 349 * to be available to child bus/devices except one special case: 350 * IO port [0xCF8-0xCFF] is consumed by the host bridge itself 351 * to access PCI configuration space. 352 * 353 * So explicitly filter out PCI CFG IO ports[0xCF8-0xCFF]. 354 */ 355static bool resource_is_pcicfg_ioport(struct resource *res) 356{ 357 return (res->flags & IORESOURCE_IO) && 358 res->start == 0xCF8 && res->end == 0xCFF; 359} 360 361static void probe_pci_root_info(struct pci_root_info *info, 362 struct acpi_device *device, 363 int busnum, int domain, 364 struct list_head *list) 365{ 366 int ret; 367 struct resource_entry *entry, *tmp; 368 369 sprintf(info->name, "PCI Bus %04x:%02x", domain, busnum); 370 info->bridge = device; 371 ret = acpi_dev_get_resources(device, list, 372 acpi_dev_filter_resource_type_cb, 373 (void *)(IORESOURCE_IO | IORESOURCE_MEM)); 374 if (ret < 0) 375 dev_warn(&device->dev, 376 "failed to parse _CRS method, error code %d\n", ret); 377 else if (ret == 0) 378 dev_dbg(&device->dev, 379 "no IO and memory resources present in _CRS\n"); 380 else 381 resource_list_for_each_entry_safe(entry, tmp, list) { 382 if ((entry->res->flags & IORESOURCE_DISABLED) || 383 resource_is_pcicfg_ioport(entry->res)) 384 resource_list_destroy_entry(entry); 385 else 386 entry->res->name = info->name; 387 } 388} 389 390struct pci_bus *pci_acpi_scan_root(struct acpi_pci_root *root) 391{ 392 struct acpi_device *device = root->device; 393 struct pci_root_info *info; 394 int domain = root->segment; 395 int busnum = root->secondary.start; 396 struct resource_entry *res_entry; 397 LIST_HEAD(crs_res); 398 LIST_HEAD(resources); 399 struct pci_bus *bus; 400 struct pci_sysdata *sd; 401 int node; 402 403 if (pci_ignore_seg) 404 domain = 0; 405 406 if (domain && !pci_domains_supported) { 407 printk(KERN_WARNING "pci_bus %04x:%02x: " 408 "ignored (multiple domains not supported)\n", 409 domain, busnum); 410 return NULL; 411 } 412 413 node = acpi_get_node(device->handle); 414 if (node == NUMA_NO_NODE) { 415 node = x86_pci_root_bus_node(busnum); 416 if (node != 0 && node != NUMA_NO_NODE) 417 dev_info(&device->dev, FW_BUG "no _PXM; falling back to node %d from hardware (may be inconsistent with ACPI node numbers)\n", 418 node); 419 } 420 421 if (node != NUMA_NO_NODE && !node_online(node)) 422 node = NUMA_NO_NODE; 423 424 info = kzalloc_node(sizeof(*info), GFP_KERNEL, node); 425 if (!info) { 426 printk(KERN_WARNING "pci_bus %04x:%02x: " 427 "ignored (out of memory)\n", domain, busnum); 428 return NULL; 429 } 430 431 sd = &info->sd; 432 sd->domain = domain; 433 sd->node = node; 434 sd->companion = device; 435 436 bus = pci_find_bus(domain, busnum); 437 if (bus) { 438 /* 439 * If the desired bus has been scanned already, replace 440 * its bus->sysdata. 441 */ 442 memcpy(bus->sysdata, sd, sizeof(*sd)); 443 kfree(info); 444 } else { 445 /* insert busn res at first */ 446 pci_add_resource(&resources, &root->secondary); 447 448 /* 449 * _CRS with no apertures is normal, so only fall back to 450 * defaults or native bridge info if we're ignoring _CRS. 451 */ 452 probe_pci_root_info(info, device, busnum, domain, &crs_res); 453 if (pci_use_crs) { 454 add_resources(info, &resources, &crs_res); 455 } else { 456 resource_list_for_each_entry(res_entry, &crs_res) 457 dev_printk(KERN_DEBUG, &device->dev, 458 "host bridge window %pR (ignored)\n", 459 res_entry->res); 460 resource_list_free(&crs_res); 461 x86_pci_root_bus_resources(busnum, &resources); 462 } 463 464 if (!setup_mcfg_map(info, domain, (u8)root->secondary.start, 465 (u8)root->secondary.end, root->mcfg_addr)) 466 bus = pci_create_root_bus(NULL, busnum, &pci_root_ops, 467 sd, &resources); 468 469 if (bus) { 470 pci_scan_child_bus(bus); 471 pci_set_host_bridge_release( 472 to_pci_host_bridge(bus->bridge), 473 release_pci_root_info, info); 474 } else { 475 resource_list_free(&resources); 476 teardown_mcfg_map(info); 477 kfree(info); 478 } 479 } 480 481 /* After the PCI-E bus has been walked and all devices discovered, 482 * configure any settings of the fabric that might be necessary. 483 */ 484 if (bus) { 485 struct pci_bus *child; 486 list_for_each_entry(child, &bus->children, node) 487 pcie_bus_configure_settings(child); 488 } 489 490 if (bus && node != NUMA_NO_NODE) 491 dev_printk(KERN_DEBUG, &bus->dev, "on NUMA node %d\n", node); 492 493 return bus; 494} 495 496int pcibios_root_bridge_prepare(struct pci_host_bridge *bridge) 497{ 498 /* 499 * We pass NULL as parent to pci_create_root_bus(), so if it is not NULL 500 * here, pci_create_root_bus() has been called by someone else and 501 * sysdata is likely to be different from what we expect. Let it go in 502 * that case. 503 */ 504 if (!bridge->dev.parent) { 505 struct pci_sysdata *sd = bridge->bus->sysdata; 506 ACPI_COMPANION_SET(&bridge->dev, sd->companion); 507 } 508 return 0; 509} 510 511int __init pci_acpi_init(void) 512{ 513 struct pci_dev *dev = NULL; 514 515 if (acpi_noirq) 516 return -ENODEV; 517 518 printk(KERN_INFO "PCI: Using ACPI for IRQ routing\n"); 519 acpi_irq_penalty_init(); 520 pcibios_enable_irq = acpi_pci_irq_enable; 521 pcibios_disable_irq = acpi_pci_irq_disable; 522 x86_init.pci.init_irq = x86_init_noop; 523 524 if (pci_routeirq) { 525 /* 526 * PCI IRQ routing is set up by pci_enable_device(), but we 527 * also do it here in case there are still broken drivers that 528 * don't use pci_enable_device(). 529 */ 530 printk(KERN_INFO "PCI: Routing PCI interrupts for all devices because \"pci=routeirq\" specified\n"); 531 for_each_pci_dev(dev) 532 acpi_pci_irq_enable(dev); 533 } 534 535 return 0; 536} 537