/*
 * probe.c - PCI detection and setup code
 */

#include <linux/kernel.h>
#include <linux/delay.h>
#include <linux/init.h>
#include <linux/pci.h>
#include <linux/slab.h>
#include <linux/module.h>
#include <linux/cpumask.h>
#include <linux/pci-aspm.h>
#include <asm-generic/pci-bridge.h>
#include "pci.h"
#define CARDBUS_LATENCY_TIMER	176	/* secondary latency timer */
#define CARDBUS_RESERVE_BUSNR	3

struct resource busn_resource = {
	.name	= "PCI busn",
	.start	= 0,
	.end	= 255,
	.flags	= IORESOURCE_BUS,
};

/* Ugh.  Need to stop exporting this to modules. */
LIST_HEAD(pci_root_buses);
EXPORT_SYMBOL(pci_root_buses);

static LIST_HEAD(pci_domain_busn_res_list);

struct pci_domain_busn_res {
	struct list_head list;
	struct resource res;
	int domain_nr;
};
static struct resource *get_pci_domain_busn_res(int domain_nr)
{
	struct pci_domain_busn_res *r;

	list_for_each_entry(r, &pci_domain_busn_res_list, list)
		if (r->domain_nr == domain_nr)
			return &r->res;

	r = kzalloc(sizeof(*r), GFP_KERNEL);
	if (!r)
		return NULL;

	r->domain_nr = domain_nr;
	r->res.start = 0;
	r->res.end = 0xff;
	r->res.flags = IORESOURCE_BUS | IORESOURCE_PCI_FIXED;

	list_add_tail(&r->list, &pci_domain_busn_res_list);

	return &r->res;
}
static int find_anything(struct device *dev, void *data)
{
	return 1;
}

/*
 * Some device drivers need to know if PCI is initialized.
 * Basically, we consider PCI not initialized when there
 * is no device to be found on the pci_bus_type.
 */
int no_pci_devices(void)
{
	struct device *dev;
	int no_devices;

	dev = bus_find_device(&pci_bus_type, NULL, NULL, find_anything);
	no_devices = (dev == NULL);
	put_device(dev);
	return no_devices;
}
EXPORT_SYMBOL(no_pci_devices);
/*
 * PCI Bus Class
 */
static void release_pcibus_dev(struct device *dev)
{
	struct pci_bus *pci_bus = to_pci_bus(dev);

	if (pci_bus->bridge)
		put_device(pci_bus->bridge);
	pci_bus_remove_resources(pci_bus);
	pci_release_bus_of_node(pci_bus);
	kfree(pci_bus);
}

static struct class pcibus_class = {
	.name		= "pci_bus",
	.dev_release	= &release_pcibus_dev,
	.dev_groups	= pcibus_groups,
};

static int __init pcibus_class_init(void)
{
	return class_register(&pcibus_class);
}
postcore_initcall(pcibus_class_init);
static u64 pci_size(u64 base, u64 maxbase, u64 mask)
{
	u64 size = mask & maxbase;	/* Find the significant bits */

	if (!size)
		return 0;

	/* Get the lowest of them to find the decode size, and
	   from that the extent.  */
	size = (size & ~(size - 1)) - 1;

	/* base == maxbase can be valid only if the BAR has
	   already been programmed with all 1s.  */
	if (base == maxbase && ((base | size) & mask) != mask)
		return 0;

	return size;
}
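
/*
 * Worked example of the sizing arithmetic above (illustrative values, not
 * taken from any particular device): for a 1 MB 32-bit memory BAR, the read
 * back after writing all 1s is maxbase = 0xfff00000, and with
 * mask = PCI_BASE_ADDRESS_MEM_MASK:
 *
 *	size = mask & maxbase           = 0xfff00000
 *	size = (size & ~(size - 1)) - 1 = 0x000fffff
 *
 * i.e. the BAR decodes 0x100000 bytes, and the returned extent 0xfffff is
 * what __pci_read_base() adds to the base to build [start, start + 0xfffff].
 */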
static inline unsigned long decode_bar(struct pci_dev *dev, u32 bar)
{
	u32 mem_type;
	unsigned long flags;

	if ((bar & PCI_BASE_ADDRESS_SPACE) == PCI_BASE_ADDRESS_SPACE_IO) {
		flags = bar & ~PCI_BASE_ADDRESS_IO_MASK;
		flags |= IORESOURCE_IO;
		return flags;
	}

	flags = bar & ~PCI_BASE_ADDRESS_MEM_MASK;
	flags |= IORESOURCE_MEM;
	if (flags & PCI_BASE_ADDRESS_MEM_PREFETCH)
		flags |= IORESOURCE_PREFETCH;

	mem_type = bar & PCI_BASE_ADDRESS_MEM_TYPE_MASK;
	switch (mem_type) {
	case PCI_BASE_ADDRESS_MEM_TYPE_32:
		break;
	case PCI_BASE_ADDRESS_MEM_TYPE_1M:
		/* 1M mem BAR treated as 32-bit BAR */
		break;
	case PCI_BASE_ADDRESS_MEM_TYPE_64:
		flags |= IORESOURCE_MEM_64;
		break;
	default:
		/* mem unknown type treated as 32-bit BAR */
		break;
	}

	return flags;
}
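
/*
 * Example decode (illustrative only): a raw BAR value of 0x0000000c has
 * bit 0 clear (memory space), type bits 2:1 = 10b (64-bit) and bit 3 set
 * (prefetchable), so decode_bar() returns
 * IORESOURCE_MEM | IORESOURCE_PREFETCH | IORESOURCE_MEM_64, with the low
 * attribute bits preserved in the resource flags.
 */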
#define PCI_COMMAND_DECODE_ENABLE	(PCI_COMMAND_MEMORY | PCI_COMMAND_IO)
/**
 * pci_read_base - read a PCI BAR
 * @dev: the PCI device
 * @type: type of the BAR
 * @res: resource buffer to be filled in
 * @pos: BAR position in the config space
 *
 * Returns 1 if the BAR is 64-bit, or 0 if 32-bit.
 */
int __pci_read_base(struct pci_dev *dev, enum pci_bar_type type,
		    struct resource *res, unsigned int pos)
{
	u32 l, sz, mask;
	u16 orig_cmd;
	struct pci_bus_region region, inverted_region;
	bool bar_too_big = false, bar_disabled = false;

	mask = type ? PCI_ROM_ADDRESS_MASK : ~0;

	/* No printks while decoding is disabled! */
	if (!dev->mmio_always_on) {
		pci_read_config_word(dev, PCI_COMMAND, &orig_cmd);
		if (orig_cmd & PCI_COMMAND_DECODE_ENABLE) {
			pci_write_config_word(dev, PCI_COMMAND,
				orig_cmd & ~PCI_COMMAND_DECODE_ENABLE);
		}
	}

	res->name = pci_name(dev);

	pci_read_config_dword(dev, pos, &l);
	pci_write_config_dword(dev, pos, l | mask);
	pci_read_config_dword(dev, pos, &sz);
	pci_write_config_dword(dev, pos, l);

	/*
	 * All bits set in sz means the device isn't working properly.
	 * If the BAR isn't implemented, all bits must be 0.  If it's a
	 * memory BAR or a ROM, bit 0 must be clear; if it's an io BAR, bit
	 * 1 must be clear.
	 */
	if (!sz || sz == 0xffffffff)
		goto fail;

	/*
	 * I don't know how l can have all bits set.  Copied from old code.
	 * Maybe it fixes a bug on some ancient platform.
	 */
	if (l == 0xffffffff)
		l = 0;

	if (type == pci_bar_unknown) {
		res->flags = decode_bar(dev, l);
		res->flags |= IORESOURCE_SIZEALIGN;
		if (res->flags & IORESOURCE_IO) {
			l &= PCI_BASE_ADDRESS_IO_MASK;
			mask = PCI_BASE_ADDRESS_IO_MASK & (u32) IO_SPACE_LIMIT;
		} else {
			l &= PCI_BASE_ADDRESS_MEM_MASK;
			mask = (u32)PCI_BASE_ADDRESS_MEM_MASK;
		}
	} else {
		res->flags |= (l & IORESOURCE_ROM_ENABLE);
		l &= PCI_ROM_ADDRESS_MASK;
		mask = (u32)PCI_ROM_ADDRESS_MASK;
	}

	if (res->flags & IORESOURCE_MEM_64) {
		u64 l64 = l;
		u64 sz64 = sz;
		u64 mask64 = mask | (u64)~0 << 32;

		pci_read_config_dword(dev, pos + 4, &l);
		pci_write_config_dword(dev, pos + 4, ~0);
		pci_read_config_dword(dev, pos + 4, &sz);
		pci_write_config_dword(dev, pos + 4, l);

		l64 |= ((u64)l << 32);
		sz64 |= ((u64)sz << 32);

		sz64 = pci_size(l64, sz64, mask64);

		if (!sz64)
			goto fail;

		if ((sizeof(resource_size_t) < 8) && (sz64 > 0x100000000ULL)) {
			bar_too_big = true;
			goto fail;
		}

		if ((sizeof(resource_size_t) < 8) && l) {
			/* Address above 32-bit boundary; disable the BAR */
			pci_write_config_dword(dev, pos, 0);
			pci_write_config_dword(dev, pos + 4, 0);
			region.start = 0;
			region.end = sz64;
			bar_disabled = true;
		} else {
			region.start = l64;
			region.end = l64 + sz64;
		}
	} else {
		sz = pci_size(l, sz, mask);

		if (!sz)
			goto fail;

		region.start = l;
		region.end = l + sz;
	}

	pcibios_bus_to_resource(dev, res, &region);
	pcibios_resource_to_bus(dev, &inverted_region, res);

	/*
	 * If "A" is a BAR value (a bus address), "bus_to_resource(A)" is
	 * the corresponding resource address (the physical address used by
	 * the CPU).  Converting that resource address back to a bus address
	 * should yield the original BAR value:
	 *
	 *     resource_to_bus(bus_to_resource(A)) == A
	 *
	 * If it doesn't, CPU accesses to "bus_to_resource(A)" will not
	 * be claimed by the device.
	 */
	if (inverted_region.start != region.start) {
		dev_info(&dev->dev, "reg 0x%x: initial BAR value %pa invalid; forcing reassignment\n",
			 pos, &region.start);
		res->flags |= IORESOURCE_UNSET;
		res->end -= res->start;
		res->start = 0;
	}

	goto out;

fail:
	res->flags = 0;
out:
	if (!dev->mmio_always_on &&
	    (orig_cmd & PCI_COMMAND_DECODE_ENABLE))
		pci_write_config_word(dev, PCI_COMMAND, orig_cmd);

	if (bar_too_big)
		dev_err(&dev->dev, "reg 0x%x: can't handle 64-bit BAR\n", pos);
	if (res->flags && !bar_disabled)
		dev_printk(KERN_DEBUG, &dev->dev, "reg 0x%x: %pR\n", pos, res);

	return (res->flags & IORESOURCE_MEM_64) ? 1 : 0;
}
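
/*
 * Illustration of the round-trip check above (the numbers are made up):
 * assume the host bridge translates CPU address 0x80000000 to bus address
 * 0x0, i.e. an offset of 0x80000000.  A BAR read back as bus address
 * A = 0x40000000 converts to resource address 0xc0000000; converting that
 * back yields 0x40000000 == A, so the value is accepted.  If firmware had
 * left a value for which the round trip does not reproduce A, the resource
 * is flagged IORESOURCE_UNSET and reassigned later.
 */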
static void pci_read_bases(struct pci_dev *dev, unsigned int howmany, int rom)
{
	unsigned int pos, reg;

	for (pos = 0; pos < howmany; pos++) {
		struct resource *res = &dev->resource[pos];
		reg = PCI_BASE_ADDRESS_0 + (pos << 2);
		pos += __pci_read_base(dev, pci_bar_unknown, res, reg);
	}

	if (rom) {
		struct resource *res = &dev->resource[PCI_ROM_RESOURCE];
		dev->rom_base_reg = rom;
		res->flags = IORESOURCE_MEM | IORESOURCE_PREFETCH |
				IORESOURCE_READONLY | IORESOURCE_CACHEABLE |
				IORESOURCE_SIZEALIGN;
		__pci_read_base(dev, pci_bar_mem32, res, rom);
	}
}
static void pci_read_bridge_io(struct pci_bus *child)
{
	struct pci_dev *dev = child->self;
	u8 io_base_lo, io_limit_lo;
	unsigned long io_mask, io_granularity, base, limit;
	struct pci_bus_region region;
	struct resource *res;

	io_mask = PCI_IO_RANGE_MASK;
	io_granularity = 0x1000;
	if (dev->io_window_1k) {
		/* Support 1K I/O space granularity */
		io_mask = PCI_IO_1K_RANGE_MASK;
		io_granularity = 0x400;
	}

	res = child->resource[0];
	pci_read_config_byte(dev, PCI_IO_BASE, &io_base_lo);
	pci_read_config_byte(dev, PCI_IO_LIMIT, &io_limit_lo);
	base = (io_base_lo & io_mask) << 8;
	limit = (io_limit_lo & io_mask) << 8;

	if ((io_base_lo & PCI_IO_RANGE_TYPE_MASK) == PCI_IO_RANGE_TYPE_32) {
		u16 io_base_hi, io_limit_hi;

		pci_read_config_word(dev, PCI_IO_BASE_UPPER16, &io_base_hi);
		pci_read_config_word(dev, PCI_IO_LIMIT_UPPER16, &io_limit_hi);
		base |= ((unsigned long) io_base_hi << 16);
		limit |= ((unsigned long) io_limit_hi << 16);
	}

	if (base <= limit) {
		res->flags = (io_base_lo & PCI_IO_RANGE_TYPE_MASK) | IORESOURCE_IO;
		region.start = base;
		region.end = limit + io_granularity - 1;
		pcibios_bus_to_resource(dev, res, &region);
		dev_printk(KERN_DEBUG, &dev->dev, "  bridge window %pR\n", res);
	}
}
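
/*
 * Decoding example for the I/O window above (illustrative register values):
 * with 4K granularity, an I/O base register of 0x20 and a limit register of
 * 0x3f decode as
 *
 *	base  = (0x20 & 0xf0) << 8 = 0x2000
 *	limit = (0x3f & 0xf0) << 8 = 0x3000
 *
 * giving the window [io 0x2000-0x3fff] once io_granularity - 1 is added to
 * the limit.
 */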
static void pci_read_bridge_mmio(struct pci_bus *child)
{
	struct pci_dev *dev = child->self;
	u16 mem_base_lo, mem_limit_lo;
	unsigned long base, limit;
	struct pci_bus_region region;
	struct resource *res;

	res = child->resource[1];
	pci_read_config_word(dev, PCI_MEMORY_BASE, &mem_base_lo);
	pci_read_config_word(dev, PCI_MEMORY_LIMIT, &mem_limit_lo);
	base = ((unsigned long) mem_base_lo & PCI_MEMORY_RANGE_MASK) << 16;
	limit = ((unsigned long) mem_limit_lo & PCI_MEMORY_RANGE_MASK) << 16;
	if (base <= limit) {
		res->flags = (mem_base_lo & PCI_MEMORY_RANGE_TYPE_MASK) | IORESOURCE_MEM;
		region.start = base;
		region.end = limit + 0xfffff;
		pcibios_bus_to_resource(dev, res, &region);
		dev_printk(KERN_DEBUG, &dev->dev, "  bridge window %pR\n", res);
	}
}
static void pci_read_bridge_mmio_pref(struct pci_bus *child)
{
	struct pci_dev *dev = child->self;
	u16 mem_base_lo, mem_limit_lo;
	unsigned long base, limit;
	struct pci_bus_region region;
	struct resource *res;

	res = child->resource[2];
	pci_read_config_word(dev, PCI_PREF_MEMORY_BASE, &mem_base_lo);
	pci_read_config_word(dev, PCI_PREF_MEMORY_LIMIT, &mem_limit_lo);
	base = ((unsigned long) mem_base_lo & PCI_PREF_RANGE_MASK) << 16;
	limit = ((unsigned long) mem_limit_lo & PCI_PREF_RANGE_MASK) << 16;

	if ((mem_base_lo & PCI_PREF_RANGE_TYPE_MASK) == PCI_PREF_RANGE_TYPE_64) {
		u32 mem_base_hi, mem_limit_hi;

		pci_read_config_dword(dev, PCI_PREF_BASE_UPPER32, &mem_base_hi);
		pci_read_config_dword(dev, PCI_PREF_LIMIT_UPPER32, &mem_limit_hi);

		/*
		 * Some bridges set the base > limit by default, and some
		 * (broken) BIOSes do not initialize them.  If we find
		 * this, just assume they are not being used.
		 */
		if (mem_base_hi <= mem_limit_hi) {
#if BITS_PER_LONG == 64
			base |= ((unsigned long) mem_base_hi) << 32;
			limit |= ((unsigned long) mem_limit_hi) << 32;
#else
			if (mem_base_hi || mem_limit_hi) {
				dev_err(&dev->dev, "can't handle 64-bit address space for bridge\n");
				return;
			}
#endif
		}
	}
	if (base <= limit) {
		res->flags = (mem_base_lo & PCI_PREF_RANGE_TYPE_MASK) |
					 IORESOURCE_MEM | IORESOURCE_PREFETCH;
		if (res->flags & PCI_PREF_RANGE_TYPE_64)
			res->flags |= IORESOURCE_MEM_64;
		region.start = base;
		region.end = limit + 0xfffff;
		pcibios_bus_to_resource(dev, res, &region);
		dev_printk(KERN_DEBUG, &dev->dev, "  bridge window %pR\n", res);
	}
}
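
/*
 * Example of the 64-bit prefetchable window assembly above (register values
 * are illustrative): PCI_PREF_MEMORY_BASE = 0xc001 has its low nibble equal
 * to PCI_PREF_RANGE_TYPE_64, so the 32-bit upper registers are read as well.
 * With PCI_PREF_BASE_UPPER32 = 0x4 the window base becomes
 * (0xc000 << 16) | (0x4ULL << 32) = 0x4c0000000 on a 64-bit kernel, while a
 * 32-bit kernel that sees non-zero upper bits bails out with the
 * "can't handle 64-bit address space" error instead.
 */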
void pci_read_bridge_bases(struct pci_bus *child)
{
	struct pci_dev *dev = child->self;
	struct resource *res;
	int i;

	if (pci_is_root_bus(child))	/* It's a host bus, nothing to read */
		return;

	dev_info(&dev->dev, "PCI bridge to %pR%s\n",
		 &child->busn_res,
		 dev->transparent ? " (subtractive decode)" : "");

	pci_bus_remove_resources(child);
	for (i = 0; i < PCI_BRIDGE_RESOURCE_NUM; i++)
		child->resource[i] = &dev->resource[PCI_BRIDGE_RESOURCES+i];

	pci_read_bridge_io(child);
	pci_read_bridge_mmio(child);
	pci_read_bridge_mmio_pref(child);

	if (dev->transparent) {
		pci_bus_for_each_resource(child->parent, res, i) {
			if (res) {
				pci_bus_add_resource(child, res,
						     PCI_SUBTRACTIVE_DECODE);
				dev_printk(KERN_DEBUG, &dev->dev,
					   "  bridge window %pR (subtractive decode)\n",
					   res);
			}
		}
	}
}
static struct pci_bus *pci_alloc_bus(void)
{
	struct pci_bus *b;

	b = kzalloc(sizeof(*b), GFP_KERNEL);
	if (!b)
		return NULL;

	INIT_LIST_HEAD(&b->node);
	INIT_LIST_HEAD(&b->children);
	INIT_LIST_HEAD(&b->devices);
	INIT_LIST_HEAD(&b->slots);
	INIT_LIST_HEAD(&b->resources);
	b->max_bus_speed = PCI_SPEED_UNKNOWN;
	b->cur_bus_speed = PCI_SPEED_UNKNOWN;
	return b;
}
static void pci_release_host_bridge_dev(struct device *dev)
{
	struct pci_host_bridge *bridge = to_pci_host_bridge(dev);

	if (bridge->release_fn)
		bridge->release_fn(bridge);

	pci_free_resource_list(&bridge->windows);

	kfree(bridge);
}

static struct pci_host_bridge *pci_alloc_host_bridge(struct pci_bus *b)
{
	struct pci_host_bridge *bridge;

	bridge = kzalloc(sizeof(*bridge), GFP_KERNEL);
	if (!bridge)
		return NULL;

	INIT_LIST_HEAD(&bridge->windows);
	bridge->bus = b;
	return bridge;
}
const unsigned char pcix_bus_speed[] = {
	PCI_SPEED_UNKNOWN,		/* 0 */
	PCI_SPEED_66MHz_PCIX,		/* 1 */
	PCI_SPEED_100MHz_PCIX,		/* 2 */
	PCI_SPEED_133MHz_PCIX,		/* 3 */
	PCI_SPEED_UNKNOWN,		/* 4 */
	PCI_SPEED_66MHz_PCIX_ECC,	/* 5 */
	PCI_SPEED_100MHz_PCIX_ECC,	/* 6 */
	PCI_SPEED_133MHz_PCIX_ECC,	/* 7 */
	PCI_SPEED_UNKNOWN,		/* 8 */
	PCI_SPEED_66MHz_PCIX_266,	/* 9 */
	PCI_SPEED_100MHz_PCIX_266,	/* A */
	PCI_SPEED_133MHz_PCIX_266,	/* B */
	PCI_SPEED_UNKNOWN,		/* C */
	PCI_SPEED_66MHz_PCIX_533,	/* D */
	PCI_SPEED_100MHz_PCIX_533,	/* E */
	PCI_SPEED_133MHz_PCIX_533	/* F */
};

const unsigned char pcie_link_speed[] = {
	PCI_SPEED_UNKNOWN,		/* 0 */
	PCIE_SPEED_2_5GT,		/* 1 */
	PCIE_SPEED_5_0GT,		/* 2 */
	PCIE_SPEED_8_0GT,		/* 3 */
	PCI_SPEED_UNKNOWN,		/* 4 */
	PCI_SPEED_UNKNOWN,		/* 5 */
	PCI_SPEED_UNKNOWN,		/* 6 */
	PCI_SPEED_UNKNOWN,		/* 7 */
	PCI_SPEED_UNKNOWN,		/* 8 */
	PCI_SPEED_UNKNOWN,		/* 9 */
	PCI_SPEED_UNKNOWN,		/* A */
	PCI_SPEED_UNKNOWN,		/* B */
	PCI_SPEED_UNKNOWN,		/* C */
	PCI_SPEED_UNKNOWN,		/* D */
	PCI_SPEED_UNKNOWN,		/* E */
	PCI_SPEED_UNKNOWN		/* F */
};
void pcie_update_link_speed(struct pci_bus *bus, u16 linksta)
{
	bus->cur_bus_speed = pcie_link_speed[linksta & PCI_EXP_LNKSTA_CLS];
}
EXPORT_SYMBOL_GPL(pcie_update_link_speed);

static unsigned char agp_speeds[] = {
	AGP_UNKNOWN,
	AGP_1X,
	AGP_2X,
	AGP_4X,
	AGP_8X
};

static enum pci_bus_speed agp_speed(int agp3, int agpstat)
{
	int index = 0;

	if (agpstat & 4)
		index = 3;
	else if (agpstat & 2)
		index = 2;
	else if (agpstat & 1)
		index = 1;
	else
		goto out;

	if (agp3) {
		index += 2;
		if (index == 5)
			index = 0;
	}

 out:
	return agp_speeds[index];
}
static void pci_set_bus_speed(struct pci_bus *bus)
{
	struct pci_dev *bridge = bus->self;
	int pos;

	pos = pci_find_capability(bridge, PCI_CAP_ID_AGP);
	if (!pos)
		pos = pci_find_capability(bridge, PCI_CAP_ID_AGP3);
	if (pos) {
		u32 agpstat, agpcmd;

		pci_read_config_dword(bridge, pos + PCI_AGP_STATUS, &agpstat);
		bus->max_bus_speed = agp_speed(agpstat & 8, agpstat & 7);

		pci_read_config_dword(bridge, pos + PCI_AGP_COMMAND, &agpcmd);
		bus->cur_bus_speed = agp_speed(agpstat & 8, agpcmd & 7);
	}

	pos = pci_find_capability(bridge, PCI_CAP_ID_PCIX);
	if (pos) {
		u16 status;
		enum pci_bus_speed max;

		pci_read_config_word(bridge, pos + PCI_X_BRIDGE_SSTATUS,
				     &status);

		if (status & PCI_X_SSTATUS_533MHZ) {
			max = PCI_SPEED_133MHz_PCIX_533;
		} else if (status & PCI_X_SSTATUS_266MHZ) {
			max = PCI_SPEED_133MHz_PCIX_266;
		} else if (status & PCI_X_SSTATUS_133MHZ) {
			if ((status & PCI_X_SSTATUS_VERS) == PCI_X_SSTATUS_V2) {
				max = PCI_SPEED_133MHz_PCIX_ECC;
			} else {
				max = PCI_SPEED_133MHz_PCIX;
			}
		} else {
			max = PCI_SPEED_66MHz_PCIX;
		}

		bus->max_bus_speed = max;
		bus->cur_bus_speed = pcix_bus_speed[
			(status & PCI_X_SSTATUS_FREQ) >> 6];

		return;
	}

	pos = pci_find_capability(bridge, PCI_CAP_ID_EXP);
	if (pos) {
		u32 linkcap;
		u16 linksta;

		pcie_capability_read_dword(bridge, PCI_EXP_LNKCAP, &linkcap);
		bus->max_bus_speed = pcie_link_speed[linkcap & PCI_EXP_LNKCAP_SLS];

		pcie_capability_read_word(bridge, PCI_EXP_LNKSTA, &linksta);
		pcie_update_link_speed(bus, linksta);
	}
}
static struct pci_bus *pci_alloc_child_bus(struct pci_bus *parent,
					   struct pci_dev *bridge, int busnr)
{
	struct pci_bus *child;
	int i;
	int ret;

	/*
	 * Allocate a new bus, and inherit stuff from the parent..
	 */
	child = pci_alloc_bus();
	if (!child)
		return NULL;

	child->parent = parent;
	child->ops = parent->ops;
	child->sysdata = parent->sysdata;
	child->bus_flags = parent->bus_flags;

	/* initialize some portions of the bus device, but don't register it
	 * now as the parent is not properly set up yet.
	 */
	child->dev.class = &pcibus_class;
	dev_set_name(&child->dev, "%04x:%02x", pci_domain_nr(child), busnr);

	/*
	 * Set up the primary, secondary and subordinate
	 * bus numbers.
	 */
	child->number = child->busn_res.start = busnr;
	child->primary = parent->busn_res.start;
	child->busn_res.end = 0xff;

	if (!bridge) {
		child->dev.parent = parent->bridge;
		goto add_dev;
	}

	child->self = bridge;
	child->bridge = get_device(&bridge->dev);
	child->dev.parent = child->bridge;
	pci_set_bus_of_node(child);
	pci_set_bus_speed(child);

	/* Set up default resource pointers and names.. */
	for (i = 0; i < PCI_BRIDGE_RESOURCE_NUM; i++) {
		child->resource[i] = &bridge->resource[PCI_BRIDGE_RESOURCES+i];
		child->resource[i]->name = child->name;
	}
	bridge->subordinate = child;

add_dev:
	ret = device_register(&child->dev);
	WARN_ON(ret < 0);

	pcibios_add_bus(child);

	/* Create legacy_io and legacy_mem files for this bus */
	pci_create_legacy_files(child);

	return child;
}
struct pci_bus *__ref pci_add_new_bus(struct pci_bus *parent, struct pci_dev *dev, int busnr)
{
	struct pci_bus *child;

	child = pci_alloc_child_bus(parent, dev, busnr);
	if (child) {
		down_write(&pci_bus_sem);
		list_add_tail(&child->node, &parent->children);
		up_write(&pci_bus_sem);
	}
	return child;
}
static void pci_fixup_parent_subordinate_busnr(struct pci_bus *child, int max)
{
	struct pci_bus *parent = child->parent;

	/* Attempts to fix that up are really dangerous unless
	   we're going to re-assign all bus numbers. */
	if (!pcibios_assign_all_busses())
		return;

	while (parent->parent && parent->busn_res.end < max) {
		parent->busn_res.end = max;
		pci_write_config_byte(parent->self, PCI_SUBORDINATE_BUS, max);
		parent = parent->parent;
	}
}
/*
 * If it's a bridge, configure it and scan the bus behind it.
 * For CardBus bridges, we don't scan behind as the devices will
 * be handled by the bridge driver itself.
 *
 * We need to process bridges in two passes -- first we scan those
 * already configured by the BIOS and after we are done with all of
 * them, we proceed to assigning numbers to the remaining buses in
 * order to avoid overlaps between old and new bus numbers.
 */
int pci_scan_bridge(struct pci_bus *bus, struct pci_dev *dev, int max, int pass)
{
	struct pci_bus *child;
	int is_cardbus = (dev->hdr_type == PCI_HEADER_TYPE_CARDBUS);
	u32 buses, i, j = 0;
	u16 bctl;
	u8 primary, secondary, subordinate;
	int broken = 0;

	pci_read_config_dword(dev, PCI_PRIMARY_BUS, &buses);
	primary = buses & 0xFF;
	secondary = (buses >> 8) & 0xFF;
	subordinate = (buses >> 16) & 0xFF;

	dev_dbg(&dev->dev, "scanning [bus %02x-%02x] behind bridge, pass %d\n",
		secondary, subordinate, pass);

	if (!primary && (primary != bus->number) && secondary && subordinate) {
		dev_warn(&dev->dev, "Primary bus is hard wired to 0\n");
		primary = bus->number;
	}

	/* Check if setup is sensible at all */
	if (!pass &&
	    (primary != bus->number || secondary <= bus->number ||
	     secondary > subordinate)) {
		dev_info(&dev->dev, "bridge configuration invalid ([bus %02x-%02x]), reconfiguring\n",
			 secondary, subordinate);
		broken = 1;
	}

	/* Disable MasterAbortMode during probing to avoid reporting
	   of bus errors (in some architectures) */
	pci_read_config_word(dev, PCI_BRIDGE_CONTROL, &bctl);
	pci_write_config_word(dev, PCI_BRIDGE_CONTROL,
			      bctl & ~PCI_BRIDGE_CTL_MASTER_ABORT);

	if ((secondary || subordinate) && !pcibios_assign_all_busses() &&
	    !is_cardbus && !broken) {
		unsigned int cmax;
		/*
		 * Bus already configured by firmware, process it in the first
		 * pass and just note the configuration.
		 */
		if (pass)
			goto out;

		/*
		 * If we already got to this bus through a different bridge,
		 * don't re-add it. This can happen with the i450NX chipset.
		 *
		 * However, we continue to descend down the hierarchy and
		 * scan remaining child buses.
		 */
		child = pci_find_bus(pci_domain_nr(bus), secondary);
		if (!child) {
			child = pci_add_new_bus(bus, dev, secondary);
			if (!child)
				goto out;
			child->primary = primary;
			pci_bus_insert_busn_res(child, secondary, subordinate);
			child->bridge_ctl = bctl;
		}

		cmax = pci_scan_child_bus(child);
		if (cmax > max)
			max = cmax;
		if (child->busn_res.end > max)
			max = child->busn_res.end;
	} else {
		/*
		 * We need to assign a number to this bus which we always
		 * do in the second pass.
		 */
		if (!pass) {
			if (pcibios_assign_all_busses() || broken)
				/* Temporarily disable forwarding of the
				   configuration cycles on all bridges in
				   this bus segment to avoid possible
				   conflicts in the second pass between two
				   bridges programmed with overlapping
				   bus ranges. */
				pci_write_config_dword(dev, PCI_PRIMARY_BUS,
						       buses & ~0xffffff);
			goto out;
		}

		/* Clear errors */
		pci_write_config_word(dev, PCI_STATUS, 0xffff);

		/* Prevent assigning a bus number that already exists.
		 * This can happen when a bridge is hot-plugged, so in
		 * this case we only re-scan this bus. */
		child = pci_find_bus(pci_domain_nr(bus), max+1);
		if (!child) {
			child = pci_add_new_bus(bus, dev, ++max);
			if (!child)
				goto out;
			pci_bus_insert_busn_res(child, max, 0xff);
		}
		buses = (buses & 0xff000000)
		      | ((unsigned int)(child->primary)        <<  0)
		      | ((unsigned int)(child->busn_res.start) <<  8)
		      | ((unsigned int)(child->busn_res.end)   << 16);

		/*
		 * yenta.c forces a secondary latency timer of 176.
		 * Copy that behaviour here.
		 */
		if (is_cardbus) {
			buses &= ~0xff000000;
			buses |= CARDBUS_LATENCY_TIMER << 24;
		}

		/*
		 * We need to blast all three values with a single write.
		 */
		pci_write_config_dword(dev, PCI_PRIMARY_BUS, buses);

		if (!is_cardbus) {
			child->bridge_ctl = bctl;
			/*
			 * Adjust subordinate busnr in parent buses.
			 * We do this before scanning for children because
			 * some devices may not be detected if the bios
			 * was lazy.
			 */
			pci_fixup_parent_subordinate_busnr(child, max);
			/* Now we can scan all subordinate buses... */
			max = pci_scan_child_bus(child);
			/*
			 * now fix it up again since we have found
			 * the real value of max.
			 */
			pci_fixup_parent_subordinate_busnr(child, max);
		} else {
			/*
			 * For CardBus bridges, we leave 4 bus numbers
			 * as cards with a PCI-to-PCI bridge can be
			 * inserted later.
			 */
			for (i = 0; i < CARDBUS_RESERVE_BUSNR; i++) {
				struct pci_bus *parent = bus;
				if (pci_find_bus(pci_domain_nr(bus),
						 max+i+1))
					break;
				while (parent->parent) {
					if ((!pcibios_assign_all_busses()) &&
					    (parent->busn_res.end > max) &&
					    (parent->busn_res.end <= max+i)) {
						j = 1;
					}
					parent = parent->parent;
				}
				if (j) {
					/*
					 * Often, there are two cardbus bridges
					 * -- try to leave one valid bus number
					 * for each one.
					 */
					i /= 2;
					break;
				}
			}
			max += i;
			pci_fixup_parent_subordinate_busnr(child, max);
		}
		/*
		 * Set the subordinate bus number to its real value.
		 */
		pci_bus_update_busn_res_end(child, max);
		pci_write_config_byte(dev, PCI_SUBORDINATE_BUS, max);
	}

	sprintf(child->name,
		(is_cardbus ? "PCI CardBus %04x:%02x" : "PCI Bus %04x:%02x"),
		pci_domain_nr(bus), child->number);

	/* Has only triggered on CardBus, fixup is in yenta_socket */
	while (bus->parent) {
		if ((child->busn_res.end > bus->busn_res.end) ||
		    (child->number > bus->busn_res.end) ||
		    (child->number < bus->number) ||
		    (child->busn_res.end < bus->number)) {
			dev_info(&child->dev, "%pR %s hidden behind%s bridge %s %pR\n",
				 &child->busn_res,
				 (bus->number > child->busn_res.end &&
				  bus->busn_res.end < child->number) ?
					"wholly" : "partially",
				 bus->self->transparent ? " transparent" : "",
				 dev_name(&bus->dev),
				 &bus->busn_res);
		}
		bus = bus->parent;
	}

out:
	pci_write_config_word(dev, PCI_BRIDGE_CONTROL, bctl);

	return max;
}
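
/*
 * For reference (layout follows the PCI-to-PCI bridge spec; the example
 * numbers are made up): the PCI_PRIMARY_BUS dword packs, from LSB to MSB,
 * the primary, secondary and subordinate bus numbers plus the secondary
 * latency timer.  A bridge on bus 00 routing buses 01-05 reads back as
 * 0x00050100, which is why the code above rebuilds "buses" with
 * primary << 0, secondary << 8 and subordinate << 16 before issuing the
 * single dword write.
 */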
/*
 * Read interrupt line and base address registers.
 * The architecture-dependent code can tweak these, of course.
 */
static void pci_read_irq(struct pci_dev *dev)
{
	unsigned char irq;

	pci_read_config_byte(dev, PCI_INTERRUPT_PIN, &irq);
	dev->pin = irq;
	if (irq)
		pci_read_config_byte(dev, PCI_INTERRUPT_LINE, &irq);
	dev->irq = irq;
}
void set_pcie_port_type(struct pci_dev *pdev)
{
	int pos;
	u16 reg16;

	pos = pci_find_capability(pdev, PCI_CAP_ID_EXP);
	if (!pos)
		return;
	pdev->is_pcie = 1;
	pdev->pcie_cap = pos;
	pci_read_config_word(pdev, pos + PCI_EXP_FLAGS, &reg16);
	pdev->pcie_flags_reg = reg16;
	pci_read_config_word(pdev, pos + PCI_EXP_DEVCAP, &reg16);
	pdev->pcie_mpss = reg16 & PCI_EXP_DEVCAP_PAYLOAD;
}

void set_pcie_hotplug_bridge(struct pci_dev *pdev)
{
	u32 reg32;

	pcie_capability_read_dword(pdev, PCI_EXP_SLTCAP, &reg32);
	if (reg32 & PCI_EXP_SLTCAP_HPC)
		pdev->is_hotplug_bridge = 1;
}
#define LEGACY_IO_RESOURCE	(IORESOURCE_IO | IORESOURCE_PCI_FIXED)

/**
 * pci_setup_device - fill in class and map information of a device
 * @dev: the device structure to fill
 *
 * Initialize the device structure with information about the device's
 * vendor, class, memory and I/O-space addresses, IRQ lines, etc.
 * Called at initialisation of the PCI subsystem and by CardBus services.
 * Returns 0 on success and negative if unknown type of device (not normal,
 * bridge or CardBus).
 */
int pci_setup_device(struct pci_dev *dev)
{
	u32 class;
	u8 hdr_type;
	struct pci_slot *slot;
	int pos = 0;
	struct pci_bus_region region;
	struct resource *res;

	if (pci_read_config_byte(dev, PCI_HEADER_TYPE, &hdr_type))
		return -EIO;

	dev->sysdata = dev->bus->sysdata;
	dev->dev.parent = dev->bus->bridge;
	dev->dev.bus = &pci_bus_type;
	dev->hdr_type = hdr_type & 0x7f;
	dev->multifunction = !!(hdr_type & 0x80);
	dev->error_state = pci_channel_io_normal;
	set_pcie_port_type(dev);

	list_for_each_entry(slot, &dev->bus->slots, list)
		if (PCI_SLOT(dev->devfn) == slot->number)
			dev->slot = slot;

	/* Assume 32-bit PCI; let 64-bit PCI cards (which are far rarer)
	   set this higher, assuming the system even supports it.  */
	dev->dma_mask = 0xffffffff;

	dev_set_name(&dev->dev, "%04x:%02x:%02x.%d", pci_domain_nr(dev->bus),
		     dev->bus->number, PCI_SLOT(dev->devfn),
		     PCI_FUNC(dev->devfn));

	pci_read_config_dword(dev, PCI_CLASS_REVISION, &class);
	dev->revision = class & 0xff;
	dev->class = class >> 8;		/* upper 3 bytes */

	dev_printk(KERN_DEBUG, &dev->dev, "[%04x:%04x] type %02x class %#08x\n",
		   dev->vendor, dev->device, dev->hdr_type, dev->class);

	/* need to have dev->class ready */
	dev->cfg_size = pci_cfg_space_size(dev);

	/* "Unknown power state" */
	dev->current_state = PCI_UNKNOWN;

	/* Early fixups, before probing the BARs */
	pci_fixup_device(pci_fixup_early, dev);
	/* device class may be changed after fixup */
	class = dev->class >> 8;

	switch (dev->hdr_type) {		/* header type */
	case PCI_HEADER_TYPE_NORMAL:		/* standard header */
		if (class == PCI_CLASS_BRIDGE_PCI)
			goto bad;
		pci_read_irq(dev);
		pci_read_bases(dev, 6, PCI_ROM_ADDRESS);
		pci_read_config_word(dev, PCI_SUBSYSTEM_VENDOR_ID, &dev->subsystem_vendor);
		pci_read_config_word(dev, PCI_SUBSYSTEM_ID, &dev->subsystem_device);

		/*
		 * Do the ugly legacy mode stuff here rather than broken chip
		 * quirk code.  Legacy mode ATA controllers have fixed
		 * addresses.  These are not always echoed in BAR0-3, and
		 * BAR0-3 in a few cases contain junk!
		 */
		if (class == PCI_CLASS_STORAGE_IDE) {
			u8 progif;
			pci_read_config_byte(dev, PCI_CLASS_PROG, &progif);
			if ((progif & 1) == 0) {
				region.start = 0x1F0;
				region.end = 0x1F7;
				res = &dev->resource[0];
				res->flags = LEGACY_IO_RESOURCE;
				pcibios_bus_to_resource(dev, res, &region);
				region.start = 0x3F6;
				region.end = 0x3F6;
				res = &dev->resource[1];
				res->flags = LEGACY_IO_RESOURCE;
				pcibios_bus_to_resource(dev, res, &region);
			}
			if ((progif & 4) == 0) {
				region.start = 0x170;
				region.end = 0x177;
				res = &dev->resource[2];
				res->flags = LEGACY_IO_RESOURCE;
				pcibios_bus_to_resource(dev, res, &region);
				region.start = 0x376;
				region.end = 0x376;
				res = &dev->resource[3];
				res->flags = LEGACY_IO_RESOURCE;
				pcibios_bus_to_resource(dev, res, &region);
			}
		}
		break;

	case PCI_HEADER_TYPE_BRIDGE:		/* bridge header */
		if (class != PCI_CLASS_BRIDGE_PCI)
			goto bad;
		/* The PCI-to-PCI bridge spec requires that subtractive
		   decoding (i.e. transparent) bridge must have programming
		   interface code of 0x01. */
		pci_read_irq(dev);
		dev->transparent = ((dev->class & 0xff) == 1);
		pci_read_bases(dev, 2, PCI_ROM_ADDRESS1);
		set_pcie_hotplug_bridge(dev);
		pos = pci_find_capability(dev, PCI_CAP_ID_SSVID);
		if (pos) {
			pci_read_config_word(dev, pos + PCI_SSVID_VENDOR_ID, &dev->subsystem_vendor);
			pci_read_config_word(dev, pos + PCI_SSVID_DEVICE_ID, &dev->subsystem_device);
		}
		break;

	case PCI_HEADER_TYPE_CARDBUS:		/* CardBus bridge header */
		if (class != PCI_CLASS_BRIDGE_CARDBUS)
			goto bad;
		pci_read_irq(dev);
		pci_read_bases(dev, 1, 0);
		pci_read_config_word(dev, PCI_CB_SUBSYSTEM_VENDOR_ID, &dev->subsystem_vendor);
		pci_read_config_word(dev, PCI_CB_SUBSYSTEM_ID, &dev->subsystem_device);
		break;

	default:				/* unknown header */
		dev_err(&dev->dev, "unknown header type %02x, ignoring device\n",
			dev->hdr_type);
		return -EIO;

	bad:
		dev_err(&dev->dev, "ignoring class %#08x (doesn't match header type %02x)\n",
			dev->class, dev->hdr_type);
		dev->class = PCI_CLASS_NOT_DEFINED;
	}

	/* We found a fine healthy device, go go go... */
	return 0;
}
static void pci_release_capabilities(struct pci_dev *dev)
{
	pci_vpd_release(dev);
	pci_iov_release(dev);
	pci_free_cap_save_buffers(dev);
}

/**
 * pci_release_dev - free a pci device structure when all users of it are finished.
 * @dev: device that's been disconnected
 *
 * Will be called only by the device core when all users of this pci device are
 * done.
 */
static void pci_release_dev(struct device *dev)
{
	struct pci_dev *pci_dev;

	pci_dev = to_pci_dev(dev);
	pci_release_capabilities(pci_dev);
	pci_release_of_node(pci_dev);
	pcibios_release_device(pci_dev);
	pci_bus_put(pci_dev->bus);
	kfree(pci_dev);
}
/**
 * pci_cfg_space_size - get the configuration space size of the PCI device.
 * @dev: PCI device
 *
 * Regular PCI devices have 256 bytes, but PCI-X 2 and PCI Express devices
 * have 4096 bytes.  Even if the device is capable, that doesn't mean we can
 * access it.  Maybe we don't have a way to generate extended config space
 * accesses, or the device is behind a reverse Express bridge.  So we try
 * reading the dword at 0x100 which must either be 0 or a valid extended
 * capability header.
 */
int pci_cfg_space_size_ext(struct pci_dev *dev)
{
	u32 status;
	int pos = PCI_CFG_SPACE_SIZE;

	if (pci_read_config_dword(dev, pos, &status) != PCIBIOS_SUCCESSFUL)
		goto fail;
	if (status == 0xffffffff)
		goto fail;

	return PCI_CFG_SPACE_EXP_SIZE;

 fail:
	return PCI_CFG_SPACE_SIZE;
}

int pci_cfg_space_size(struct pci_dev *dev)
{
	int pos;
	u32 status;
	u16 class;

	class = dev->class >> 8;
	if (class == PCI_CLASS_BRIDGE_HOST)
		return pci_cfg_space_size_ext(dev);

	if (!pci_is_pcie(dev)) {
		pos = pci_find_capability(dev, PCI_CAP_ID_PCIX);
		if (!pos)
			goto fail;

		pci_read_config_dword(dev, pos + PCI_X_STATUS, &status);
		if (!(status & (PCI_X_STATUS_266MHZ | PCI_X_STATUS_533MHZ)))
			goto fail;
	}

	return pci_cfg_space_size_ext(dev);

 fail:
	return PCI_CFG_SPACE_SIZE;
}
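
/*
 * Illustrative note (example value, not read from any particular device):
 * on a working PCIe function the dword at offset 0x100 typically reads back
 * as an extended capability header, e.g. capability ID 0x0001 (Advanced
 * Error Reporting) in the low 16 bits with the version and next-capability
 * offset in the upper bits, whereas a conventional PCI device that aliases
 * the access returns 0xffffffff.  That is why the probe above treats
 * all-ones as "no extended config space".
 */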
struct pci_dev *pci_alloc_dev(struct pci_bus *bus)
{
	struct pci_dev *dev;

	dev = kzalloc(sizeof(struct pci_dev), GFP_KERNEL);
	if (!dev)
		return NULL;

	INIT_LIST_HEAD(&dev->bus_list);
	dev->dev.type = &pci_dev_type;
	dev->bus = pci_bus_get(bus);

	return dev;
}
EXPORT_SYMBOL(pci_alloc_dev);

struct pci_dev *alloc_pci_dev(void)
{
	return pci_alloc_dev(NULL);
}
EXPORT_SYMBOL(alloc_pci_dev);
bool pci_bus_read_dev_vendor_id(struct pci_bus *bus, int devfn, u32 *l,
				int crs_timeout)
{
	int delay = 1;

	if (pci_bus_read_config_dword(bus, devfn, PCI_VENDOR_ID, l))
		return false;

	/* some broken boards return 0 or ~0 if a slot is empty: */
	if (*l == 0xffffffff || *l == 0x00000000 ||
	    *l == 0x0000ffff || *l == 0xffff0000)
		return false;

	/* Configuration request Retry Status */
	while (*l == 0xffff0001) {
		if (!crs_timeout)
			return false;

		msleep(delay);
		delay *= 2;
		if (pci_bus_read_config_dword(bus, devfn, PCI_VENDOR_ID, l))
			return false;
		/* Card hasn't responded in 60 seconds?  Must be stuck. */
		if (delay > crs_timeout) {
			printk(KERN_WARNING "pci %04x:%02x:%02x.%d: not responding\n",
			       pci_domain_nr(bus), bus->number, PCI_SLOT(devfn),
			       PCI_FUNC(devfn));
			return false;
		}
	}

	return true;
}
EXPORT_SYMBOL(pci_bus_read_dev_vendor_id);
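
/*
 * Timing sketch for the CRS loop above (assuming the usual 60 s timeout
 * passed in by pci_scan_device()): the delay doubles on every retry, so the
 * device is re-polled after roughly 1 ms, 2 ms, 4 ms, ... and the loop gives
 * up once the doubled delay exceeds crs_timeout, i.e. after about 16 retries
 * for a 60000 ms budget (2^16 = 65536 > 60000).
 */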
/*
 * Read the config data for a PCI device, sanity-check it
 * and fill in the dev structure...
 */
static struct pci_dev *pci_scan_device(struct pci_bus *bus, int devfn)
{
	struct pci_dev *dev;
	u32 l;

	if (!pci_bus_read_dev_vendor_id(bus, devfn, &l, 60*1000))
		return NULL;

	dev = pci_alloc_dev(bus);
	if (!dev)
		return NULL;

	dev->devfn = devfn;
	dev->vendor = l & 0xffff;
	dev->device = (l >> 16) & 0xffff;

	pci_set_of_node(dev);

	if (pci_setup_device(dev)) {
		pci_bus_put(dev->bus);
		kfree(dev);
		return NULL;
	}

	return dev;
}
static void pci_init_capabilities(struct pci_dev *dev)
{
	/* MSI/MSI-X list */
	pci_msi_init_pci_dev(dev);

	/* Buffers for saving PCIe and PCI-X capabilities */
	pci_allocate_cap_save_buffers(dev);

	/* Power Management */
	pci_pm_init(dev);

	/* Vital Product Data */
	pci_vpd_pci22_init(dev);

	/* Alternative Routing-ID Forwarding */
	pci_configure_ari(dev);

	/* Single Root I/O Virtualization */
	pci_iov_init(dev);

	/* Enable ACS P2P upstream forwarding */
	pci_enable_acs(dev);
}
void pci_device_add(struct pci_dev *dev, struct pci_bus *bus)
{
	int ret;

	device_initialize(&dev->dev);
	dev->dev.release = pci_release_dev;

	set_dev_node(&dev->dev, pcibus_to_node(bus));
	dev->dev.dma_mask = &dev->dma_mask;
	dev->dev.dma_parms = &dev->dma_parms;
	dev->dev.coherent_dma_mask = 0xffffffffull;

	pci_set_dma_max_seg_size(dev, 65536);
	pci_set_dma_seg_boundary(dev, 0xffffffff);

	/* Fix up broken headers */
	pci_fixup_device(pci_fixup_header, dev);

	/* moved out from quirk header fixup code */
	pci_reassigndev_resource_alignment(dev);

	/* Clear the state_saved flag. */
	dev->state_saved = false;

	/* Initialize various capabilities */
	pci_init_capabilities(dev);

	/*
	 * Add the device to our list of discovered devices
	 * and the bus list for fixup functions, etc.
	 */
	down_write(&pci_bus_sem);
	list_add_tail(&dev->bus_list, &bus->devices);
	up_write(&pci_bus_sem);

	ret = pcibios_add_device(dev);
	WARN_ON(ret < 0);

	/* Notifier could use PCI capabilities */
	dev->match_driver = false;
	ret = device_add(&dev->dev);
	WARN_ON(ret < 0);

	pci_proc_attach_device(dev);
}
struct pci_dev *__ref pci_scan_single_device(struct pci_bus *bus, int devfn)
{
	struct pci_dev *dev;

	dev = pci_get_slot(bus, devfn);
	if (dev) {
		pci_dev_put(dev);
		return dev;
	}

	dev = pci_scan_device(bus, devfn);
	if (!dev)
		return NULL;

	pci_device_add(dev, bus);

	return dev;
}
EXPORT_SYMBOL(pci_scan_single_device);
static unsigned next_fn(struct pci_bus *bus, struct pci_dev *dev, unsigned fn)
{
	int pos;
	u16 cap = 0;
	unsigned next_fn;

	if (pci_ari_enabled(bus)) {
		if (!dev)
			return 0;
		pos = pci_find_ext_capability(dev, PCI_EXT_CAP_ID_ARI);
		if (!pos)
			return 0;

		pci_read_config_word(dev, pos + PCI_ARI_CAP, &cap);
		next_fn = PCI_ARI_CAP_NFN(cap);
		if (next_fn <= fn)
			return 0;	/* protect against malformed list */

		return next_fn;
	}

	/* dev may be NULL for non-contiguous multifunction devices */
	if (!dev || dev->multifunction)
		return (fn + 1) % 8;

	return 0;
}
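
/*
 * Example of the two traversal modes above (function numbers are purely
 * illustrative): without ARI, a multifunction device is walked as
 * fn 0, 1, 2, ..., 7 and the scan stops when (fn + 1) % 8 wraps to 0.  With
 * ARI enabled, each function's ARI capability names the next implemented
 * function, so a device exposing functions 0, 4 and 64 is walked as
 * 0 -> 4 -> 64 -> stop without probing the unimplemented function numbers
 * in between.
 */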
static int only_one_child(struct pci_bus *bus)
{
	struct pci_dev *parent = bus->self;

	if (!parent || !pci_is_pcie(parent))
		return 0;
	if (pci_pcie_type(parent) == PCI_EXP_TYPE_ROOT_PORT)
		return 1;
	if (pci_pcie_type(parent) == PCI_EXP_TYPE_DOWNSTREAM &&
	    !pci_has_flag(PCI_SCAN_ALL_PCIE_DEVS))
		return 1;
	return 0;
}
/**
 * pci_scan_slot - scan a PCI slot on a bus for devices.
 * @bus: PCI bus to scan
 * @devfn: slot number to scan (must have zero function)
 *
 * Scan a PCI slot on the specified PCI bus for devices, adding
 * discovered devices to the @bus->devices list.  New devices
 * will not have is_added set.
 *
 * Returns the number of new devices found.
 */
int pci_scan_slot(struct pci_bus *bus, int devfn)
{
	unsigned fn, nr = 0;
	struct pci_dev *dev;

	if (only_one_child(bus) && (devfn > 0))
		return 0; /* Already scanned the entire slot */

	dev = pci_scan_single_device(bus, devfn);
	if (!dev)
		return 0;
	if (!dev->is_added)
		nr++;

	for (fn = next_fn(bus, dev, 0); fn > 0; fn = next_fn(bus, dev, fn)) {
		dev = pci_scan_single_device(bus, devfn + fn);
		if (dev) {
			if (!dev->is_added)
				nr++;
			dev->multifunction = 1;
		}
	}

	/* only one slot has pcie device */
	if (bus->self && nr)
		pcie_aspm_init_link_state(bus->self);

	return nr;
}
static int pcie_find_smpss(struct pci_dev *dev, void *data)
{
	u8 *smpss = data;

	if (!pci_is_pcie(dev))
		return 0;

	/*
	 * We don't have a way to change MPS settings on devices that have
	 * drivers attached.  A hot-added device might support only the
	 * minimum MPS setting (MPS=128).  Therefore, if the fabric contains
	 * a bridge where devices may be hot-added, we limit the fabric MPS
	 * to 128 so hot-added devices will work correctly.
	 *
	 * However, if we hot-add a device to a slot directly below a Root
	 * Port, it's impossible for there to be other existing devices below
	 * the port.  We don't limit the MPS in this case because we can
	 * reconfigure MPS on both the Root Port and the hot-added device,
	 * and there are no other devices involved.
	 *
	 * Note that this PCIE_BUS_SAFE path assumes no peer-to-peer DMA.
	 */
	if (dev->is_hotplug_bridge &&
	    pci_pcie_type(dev) != PCI_EXP_TYPE_ROOT_PORT)
		*smpss = 0;

	if (*smpss > dev->pcie_mpss)
		*smpss = dev->pcie_mpss;

	return 0;
}
static void pcie_write_mps(struct pci_dev *dev, int mps)
{
	int rc;

	if (pcie_bus_config == PCIE_BUS_PERFORMANCE) {
		mps = 128 << dev->pcie_mpss;

		if (pci_pcie_type(dev) != PCI_EXP_TYPE_ROOT_PORT &&
		    dev->bus->self)
			/* For "Performance", the assumption is made that
			 * downstream communication will never be larger than
			 * the MRRS.  So, the MPS only needs to be configured
			 * for the upstream communication.  This being the case,
			 * walk from the top down and set the MPS of the child
			 * to that of the parent bus.
			 *
			 * Configure the device MPS with the smaller of the
			 * device MPSS or the bridge MPS (which is assumed to be
			 * properly configured at this point to the largest
			 * allowable MPS based on its parent bus).
			 */
			mps = min(mps, pcie_get_mps(dev->bus->self));
	}

	rc = pcie_set_mps(dev, mps);
	if (rc)
		dev_err(&dev->dev, "Failed attempting to set the MPS\n");
}
static void pcie_write_mrrs(struct pci_dev *dev)
{
	int rc, mrrs;

	/* In the "safe" case, do not configure the MRRS.  There appear to be
	 * issues with setting MRRS to 0 on a number of devices.
	 */
	if (pcie_bus_config != PCIE_BUS_PERFORMANCE)
		return;

	/* For Max performance, the MRRS must be set to the largest supported
	 * value.  However, it cannot be configured larger than the MPS the
	 * device or the bus can support.  This should already be properly
	 * configured by a prior call to pcie_write_mps.
	 */
	mrrs = pcie_get_mps(dev);

	/* MRRS is a R/W register.  Invalid values can be written, but a
	 * subsequent read will verify if the value is acceptable or not.
	 * If the MRRS value provided is not acceptable (e.g., too large),
	 * shrink the value until it is acceptable to the HW.
	 */
	while (mrrs != pcie_get_readrq(dev) && mrrs >= 128) {
		rc = pcie_set_readrq(dev, mrrs);
		if (!rc)
			break;

		dev_warn(&dev->dev, "Failed attempting to set the MRRS\n");
		mrrs /= 2;
	}

	if (mrrs < 128)
		dev_err(&dev->dev, "MRRS was unable to be configured with a safe value.  If problems are experienced, try running with pci=pcie_bus_safe\n");
}
static void pcie_bus_detect_mps(struct pci_dev *dev)
{
	struct pci_dev *bridge = dev->bus->self;
	int mps, p_mps;

	if (!bridge)
		return;

	mps = pcie_get_mps(dev);
	p_mps = pcie_get_mps(bridge);

	if (mps != p_mps)
		dev_warn(&dev->dev, "Max Payload Size %d, but upstream %s set to %d; if necessary, use \"pci=pcie_bus_safe\" and report a bug\n",
			 mps, pci_name(bridge), p_mps);
}
static int pcie_bus_configure_set(struct pci_dev *dev, void *data)
{
	int mps, orig_mps;

	if (!pci_is_pcie(dev))
		return 0;

	if (pcie_bus_config == PCIE_BUS_TUNE_OFF) {
		pcie_bus_detect_mps(dev);
		return 0;
	}

	mps = 128 << *(u8 *)data;
	orig_mps = pcie_get_mps(dev);

	pcie_write_mps(dev, mps);
	pcie_write_mrrs(dev);

	dev_info(&dev->dev, "Max Payload Size set to %4d/%4d (was %4d), Max Read Rq %4d\n",
		 pcie_get_mps(dev), 128 << dev->pcie_mpss,
		 orig_mps, pcie_get_readrq(dev));

	return 0;
}
/* pcie_bus_configure_settings requires that pci_walk_bus work in a top-down,
 * parents then children fashion.  If this changes, then this code will not
 * work as designed.
 */
void pcie_bus_configure_settings(struct pci_bus *bus)
{
	u8 smpss;

	if (!bus->self)
		return;

	if (!pci_is_pcie(bus->self))
		return;

	/* FIXME - Peer to peer DMA is possible, though the endpoint would need
	 * to be aware of the MPS of the destination.  To work around this,
	 * simply force the MPS of the entire system to the smallest possible.
	 */
	if (pcie_bus_config == PCIE_BUS_PEER2PEER)
		smpss = 0;

	if (pcie_bus_config == PCIE_BUS_SAFE) {
		smpss = bus->self->pcie_mpss;

		pcie_find_smpss(bus->self, &smpss);
		pci_walk_bus(bus, pcie_find_smpss, &smpss);
	}

	pcie_bus_configure_set(bus->self, &smpss);
	pci_walk_bus(bus, pcie_bus_configure_set, &smpss);
}
EXPORT_SYMBOL_GPL(pcie_bus_configure_settings);
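
/*
 * Worked example of the encoding used throughout the MPS code above (values
 * are illustrative): pcie_mpss is the 3-bit Max Payload Size Supported field
 * from DEVCAP, so a device with pcie_mpss = 2 supports 128 << 2 = 512-byte
 * payloads.  In PCIE_BUS_SAFE mode the smallest such value found on the
 * fabric (say 256 bytes) is programmed into every device, while in
 * PCIE_BUS_PERFORMANCE mode each device gets the largest MPS its parent
 * bridge allows, with the MRRS clamped to the same value.
 */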
unsigned int pci_scan_child_bus(struct pci_bus *bus)
{
	unsigned int devfn, pass, max = bus->busn_res.start;
	struct pci_dev *dev;

	dev_dbg(&bus->dev, "scanning bus\n");

	/* Go find them, Rover! */
	for (devfn = 0; devfn < 0x100; devfn += 8)
		pci_scan_slot(bus, devfn);

	/* Reserve buses for SR-IOV capability. */
	max += pci_iov_bus_range(bus);

	/*
	 * After performing arch-dependent fixup of the bus, look behind
	 * all PCI-to-PCI bridges on this bus.
	 */
	if (!bus->is_added) {
		dev_dbg(&bus->dev, "fixups for bus\n");
		pcibios_fixup_bus(bus);
		bus->is_added = 1;
	}

	for (pass = 0; pass < 2; pass++)
		list_for_each_entry(dev, &bus->devices, bus_list) {
			if (dev->hdr_type == PCI_HEADER_TYPE_BRIDGE ||
			    dev->hdr_type == PCI_HEADER_TYPE_CARDBUS)
				max = pci_scan_bridge(bus, dev, max, pass);
		}

	/*
	 * We've scanned the bus and so we know all about what's on
	 * the other side of any bridges that may be on this bus plus
	 * any devices.
	 *
	 * Return how far we've got finding sub-buses.
	 */
	dev_dbg(&bus->dev, "bus scan returning with max=%02x\n", max);
	return max;
}
/**
 * pcibios_root_bridge_prepare - Platform-specific host bridge setup.
 * @bridge: Host bridge to set up.
 *
 * Default empty implementation.  Replace with an architecture-specific setup
 * routine, if necessary.
 */
int __weak pcibios_root_bridge_prepare(struct pci_host_bridge *bridge)
{
	return 0;
}

void __weak pcibios_add_bus(struct pci_bus *bus)
{
}

void __weak pcibios_remove_bus(struct pci_bus *bus)
{
}
struct pci_bus *pci_create_root_bus(struct device *parent, int bus,
		struct pci_ops *ops, void *sysdata, struct list_head *resources)
{
	int error;
	struct pci_host_bridge *bridge;
	struct pci_bus *b, *b2;
	struct pci_host_bridge_window *window, *n;
	struct resource *res;
	resource_size_t offset;
	char bus_addr[64];
	char *fmt;

	b = pci_alloc_bus();
	if (!b)
		return NULL;

	b->sysdata = sysdata;
	b->ops = ops;
	b->number = b->busn_res.start = bus;
	b2 = pci_find_bus(pci_domain_nr(b), bus);
	if (b2) {
		/* If we already got to this bus through a different bridge, ignore it */
		dev_dbg(&b2->dev, "bus already known\n");
		goto err_out;
	}

	bridge = pci_alloc_host_bridge(b);
	if (!bridge)
		goto err_out;

	bridge->dev.parent = parent;
	bridge->dev.release = pci_release_host_bridge_dev;
	dev_set_name(&bridge->dev, "pci%04x:%02x", pci_domain_nr(b), bus);
	error = pcibios_root_bridge_prepare(bridge);
	if (error) {
		kfree(bridge);
		goto err_out;
	}

	error = device_register(&bridge->dev);
	if (error) {
		put_device(&bridge->dev);
		goto err_out;
	}
	b->bridge = get_device(&bridge->dev);
	device_enable_async_suspend(b->bridge);
	pci_set_bus_of_node(b);

	if (!parent)
		set_dev_node(b->bridge, pcibus_to_node(b));

	b->dev.class = &pcibus_class;
	b->dev.parent = b->bridge;
	dev_set_name(&b->dev, "%04x:%02x", pci_domain_nr(b), bus);
	error = device_register(&b->dev);
	if (error)
		goto class_dev_reg_err;

	pcibios_add_bus(b);

	/* Create legacy_io and legacy_mem files for this bus */
	pci_create_legacy_files(b);

	if (parent)
		dev_info(parent, "PCI host bridge to bus %s\n", dev_name(&b->dev));
	else
		printk(KERN_INFO "PCI host bridge to bus %s\n", dev_name(&b->dev));

	/* Add initial resources to the bus */
	list_for_each_entry_safe(window, n, resources, list) {
		list_move_tail(&window->list, &bridge->windows);
		res = window->res;
		offset = window->offset;
		if (res->flags & IORESOURCE_BUS)
			pci_bus_insert_busn_res(b, bus, res->end);
		else
			pci_bus_add_resource(b, res, 0);
		if (offset) {
			if (resource_type(res) == IORESOURCE_IO)
				fmt = " (bus address [%#06llx-%#06llx])";
			else
				fmt = " (bus address [%#010llx-%#010llx])";
			snprintf(bus_addr, sizeof(bus_addr), fmt,
				 (unsigned long long) (res->start - offset),
				 (unsigned long long) (res->end - offset));
		} else
			bus_addr[0] = '\0';
		dev_info(&b->dev, "root bus resource %pR%s\n", res, bus_addr);
	}

	down_write(&pci_bus_sem);
	list_add_tail(&b->node, &pci_root_buses);
	up_write(&pci_bus_sem);

	return b;

class_dev_reg_err:
	put_device(&bridge->dev);
	device_unregister(&bridge->dev);
err_out:
	kfree(b);
	return NULL;
}
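
/*
 * Minimal usage sketch (illustrative only; "my_pci_ops" and the window
 * resources are hypothetical and would come from a host controller driver).
 * A platform typically builds a resource list and then either creates the
 * root bus by hand or lets pci_scan_root_bus() do the scan:
 *
 *	LIST_HEAD(resources);
 *
 *	pci_add_resource(&resources, &my_io_res);
 *	pci_add_resource_offset(&resources, &my_mem_res, my_mem_offset);
 *	pci_add_resource(&resources, &my_busn_res);
 *	bus = pci_scan_root_bus(parent, 0, &my_pci_ops, sysdata, &resources);
 *	if (!bus)
 *		pci_free_resource_list(&resources);
 *
 * pci_scan_bus_parented() and pci_scan_bus() below follow the same pattern
 * using the global ioport/iomem/busn resources.
 */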
int pci_bus_insert_busn_res(struct pci_bus *b, int bus, int bus_max)
{
	struct resource *res = &b->busn_res;
	struct resource *parent_res, *conflict;

	res->start = bus;
	res->end = bus_max;
	res->flags = IORESOURCE_BUS;

	if (!pci_is_root_bus(b))
		parent_res = &b->parent->busn_res;
	else {
		parent_res = get_pci_domain_busn_res(pci_domain_nr(b));
		res->flags |= IORESOURCE_PCI_FIXED;
	}

	conflict = insert_resource_conflict(parent_res, res);

	if (conflict)
		dev_printk(KERN_DEBUG, &b->dev,
			   "busn_res: can not insert %pR under %s%pR (conflicts with %s %pR)\n",
			   res, pci_is_root_bus(b) ? "domain " : "",
			   parent_res, conflict->name, conflict);

	return conflict == NULL;
}
int pci_bus_update_busn_res_end(struct pci_bus *b, int bus_max)
{
	struct resource *res = &b->busn_res;
	struct resource old_res = *res;
	resource_size_t size;
	int ret;

	if (res->start > bus_max)
		return -EINVAL;

	size = bus_max - res->start + 1;
	ret = adjust_resource(res, res->start, size);
	dev_printk(KERN_DEBUG, &b->dev,
		   "busn_res: %pR end %s updated to %02x\n",
		   &old_res, ret ? "can not be" : "is", bus_max);

	if (!ret && !res->parent)
		pci_bus_insert_busn_res(b, res->start, res->end);

	return ret;
}
void pci_bus_release_busn_res(struct pci_bus *b)
{
	struct resource *res = &b->busn_res;
	int ret;

	if (!res->flags || !res->parent)
		return;

	ret = release_resource(res);
	dev_printk(KERN_DEBUG, &b->dev,
		   "busn_res: %pR %s released\n",
		   res, ret ? "can not be" : "is");
}
struct pci_bus *pci_scan_root_bus(struct device *parent, int bus,
		struct pci_ops *ops, void *sysdata, struct list_head *resources)
{
	struct pci_host_bridge_window *window;
	bool found = false;
	struct pci_bus *b;
	int max;

	list_for_each_entry(window, resources, list)
		if (window->res->flags & IORESOURCE_BUS) {
			found = true;
			break;
		}

	b = pci_create_root_bus(parent, bus, ops, sysdata, resources);
	if (!b)
		return NULL;

	if (!found) {
		dev_info(&b->dev,
			 "No busn resource found for root bus, will use [bus %02x-ff]\n",
			 bus);
		pci_bus_insert_busn_res(b, bus, 255);
	}

	max = pci_scan_child_bus(b);

	if (!found)
		pci_bus_update_busn_res_end(b, max);

	pci_bus_add_devices(b);
	return b;
}
EXPORT_SYMBOL(pci_scan_root_bus);
/* Deprecated; use pci_scan_root_bus() instead */
struct pci_bus *pci_scan_bus_parented(struct device *parent,
		int bus, struct pci_ops *ops, void *sysdata)
{
	LIST_HEAD(resources);
	struct pci_bus *b;

	pci_add_resource(&resources, &ioport_resource);
	pci_add_resource(&resources, &iomem_resource);
	pci_add_resource(&resources, &busn_resource);
	b = pci_create_root_bus(parent, bus, ops, sysdata, &resources);
	if (b)
		pci_scan_child_bus(b);
	else
		pci_free_resource_list(&resources);
	return b;
}
EXPORT_SYMBOL(pci_scan_bus_parented);
struct pci_bus *pci_scan_bus(int bus, struct pci_ops *ops,
					void *sysdata)
{
	LIST_HEAD(resources);
	struct pci_bus *b;

	pci_add_resource(&resources, &ioport_resource);
	pci_add_resource(&resources, &iomem_resource);
	pci_add_resource(&resources, &busn_resource);
	b = pci_create_root_bus(NULL, bus, ops, sysdata, &resources);
	if (b) {
		pci_scan_child_bus(b);
		pci_bus_add_devices(b);
	} else {
		pci_free_resource_list(&resources);
	}
	return b;
}
EXPORT_SYMBOL(pci_scan_bus);
/**
 * pci_rescan_bus_bridge_resize - scan a PCI bus for devices.
 * @bridge: PCI bridge for the bus to scan
 *
 * Scan a PCI bus and child buses for new devices, add them,
 * and enable them, resizing bridge mmio/io resource if necessary
 * and possible.  The caller must ensure the child devices are already
 * removed for resizing to occur.
 *
 * Returns the max number of subordinate bus discovered.
 */
unsigned int __ref pci_rescan_bus_bridge_resize(struct pci_dev *bridge)
{
	unsigned int max;
	struct pci_bus *bus = bridge->subordinate;

	max = pci_scan_child_bus(bus);

	pci_assign_unassigned_bridge_resources(bridge);

	pci_bus_add_devices(bus);

	return max;
}
/**
 * pci_rescan_bus - scan a PCI bus for devices.
 * @bus: PCI bus to scan
 *
 * Scan a PCI bus and child buses for new devices, adds them,
 * and enables them.
 *
 * Returns the max number of subordinate bus discovered.
 */
unsigned int __ref pci_rescan_bus(struct pci_bus *bus)
{
	unsigned int max;

	max = pci_scan_child_bus(bus);
	pci_assign_unassigned_bus_resources(bus);
	pci_bus_add_devices(bus);

	return max;
}
EXPORT_SYMBOL_GPL(pci_rescan_bus);

EXPORT_SYMBOL(pci_add_new_bus);
EXPORT_SYMBOL(pci_scan_slot);
EXPORT_SYMBOL(pci_scan_bridge);
EXPORT_SYMBOL_GPL(pci_scan_child_bus);
static int __init pci_sort_bf_cmp(const struct device *d_a, const struct device *d_b)
{
	const struct pci_dev *a = to_pci_dev(d_a);
	const struct pci_dev *b = to_pci_dev(d_b);

	if      (pci_domain_nr(a->bus) < pci_domain_nr(b->bus)) return -1;
	else if (pci_domain_nr(a->bus) > pci_domain_nr(b->bus)) return  1;

	if      (a->bus->number < b->bus->number) return -1;
	else if (a->bus->number > b->bus->number) return  1;

	if      (a->devfn < b->devfn) return -1;
	else if (a->devfn > b->devfn) return  1;

	return 0;
}

void __init pci_sort_breadthfirst(void)
{
	bus_sort_breadthfirst(&pci_bus_type, &pci_sort_bf_cmp);
}