2005-04-16 22:20:36 +00:00
|
|
|
#include <linux/pci.h>
|
|
|
|
#include <linux/acpi.h>
|
|
|
|
#include <linux/init.h>
|
2005-09-30 16:34:42 +00:00
|
|
|
#include <linux/irq.h>
|
2007-10-03 22:56:14 +00:00
|
|
|
#include <linux/dmi.h>
|
2005-09-12 16:49:24 +00:00
|
|
|
#include <asm/numa.h>
|
2008-12-27 13:02:28 +00:00
|
|
|
#include <asm/pci_x86.h>
|
2005-04-16 22:20:36 +00:00
|
|
|
|
2007-10-03 22:56:51 +00:00
|
|
|
struct pci_root_info {
|
2009-10-06 21:33:49 +00:00
|
|
|
struct acpi_device *bridge;
|
2007-10-03 22:56:51 +00:00
|
|
|
char *name;
|
|
|
|
unsigned int res_num;
|
|
|
|
struct resource *res;
|
|
|
|
struct pci_bus *bus;
|
|
|
|
int busnum;
|
|
|
|
};
|
|
|
|
|
|
|
|
static acpi_status
|
|
|
|
resource_to_addr(struct acpi_resource *resource,
|
|
|
|
struct acpi_resource_address64 *addr)
|
|
|
|
{
|
|
|
|
acpi_status status;
|
|
|
|
|
|
|
|
status = acpi_resource_to_address64(resource, addr);
|
|
|
|
if (ACPI_SUCCESS(status) &&
|
|
|
|
(addr->resource_type == ACPI_MEMORY_RANGE ||
|
|
|
|
addr->resource_type == ACPI_IO_RANGE) &&
|
|
|
|
addr->address_length > 0 &&
|
|
|
|
addr->producer_consumer == ACPI_PRODUCER) {
|
|
|
|
return AE_OK;
|
|
|
|
}
|
|
|
|
return AE_ERROR;
|
|
|
|
}
|
|
|
|
|
|
|
|
static acpi_status
|
|
|
|
count_resource(struct acpi_resource *acpi_res, void *data)
|
|
|
|
{
|
|
|
|
struct pci_root_info *info = data;
|
|
|
|
struct acpi_resource_address64 addr;
|
|
|
|
acpi_status status;
|
|
|
|
|
|
|
|
status = resource_to_addr(acpi_res, &addr);
|
|
|
|
if (ACPI_SUCCESS(status))
|
|
|
|
info->res_num++;
|
|
|
|
return AE_OK;
|
|
|
|
}
|
|
|
|
|
2009-11-04 17:39:18 +00:00
|
|
|
static void
|
|
|
|
align_resource(struct acpi_device *bridge, struct resource *res)
|
|
|
|
{
|
|
|
|
int align = (res->flags & IORESOURCE_MEM) ? 16 : 4;
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Host bridge windows are not BARs, but the decoders on the PCI side
|
|
|
|
* that claim this address space have starting alignment and length
|
|
|
|
* constraints, so fix any obvious BIOS goofs.
|
|
|
|
*/
|
2009-11-05 17:17:11 +00:00
|
|
|
if (!IS_ALIGNED(res->start, align)) {
|
2009-11-04 17:39:18 +00:00
|
|
|
dev_printk(KERN_DEBUG, &bridge->dev,
|
|
|
|
"host bridge window %pR invalid; "
|
|
|
|
"aligning start to %d-byte boundary\n", res, align);
|
|
|
|
res->start &= ~(align - 1);
|
|
|
|
}
|
2009-11-05 17:17:11 +00:00
|
|
|
if (!IS_ALIGNED(res->end + 1, align)) {
|
2009-11-04 17:39:18 +00:00
|
|
|
dev_printk(KERN_DEBUG, &bridge->dev,
|
|
|
|
"host bridge window %pR invalid; "
|
|
|
|
"aligning end to %d-byte boundary\n", res, align);
|
2009-11-05 17:17:11 +00:00
|
|
|
res->end = ALIGN(res->end, align) - 1;
|
2009-11-04 17:39:18 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2007-10-03 22:56:51 +00:00
|
|
|
static acpi_status
|
|
|
|
setup_resource(struct acpi_resource *acpi_res, void *data)
|
|
|
|
{
|
|
|
|
struct pci_root_info *info = data;
|
|
|
|
struct resource *res;
|
|
|
|
struct acpi_resource_address64 addr;
|
|
|
|
acpi_status status;
|
|
|
|
unsigned long flags;
|
|
|
|
struct resource *root;
|
2009-06-25 02:01:19 +00:00
|
|
|
u64 start, end;
|
|
|
|
|
2007-10-03 22:56:51 +00:00
|
|
|
status = resource_to_addr(acpi_res, &addr);
|
|
|
|
if (!ACPI_SUCCESS(status))
|
|
|
|
return AE_OK;
|
|
|
|
|
|
|
|
if (addr.resource_type == ACPI_MEMORY_RANGE) {
|
|
|
|
root = &iomem_resource;
|
|
|
|
flags = IORESOURCE_MEM;
|
|
|
|
if (addr.info.mem.caching == ACPI_PREFETCHABLE_MEMORY)
|
|
|
|
flags |= IORESOURCE_PREFETCH;
|
|
|
|
} else if (addr.resource_type == ACPI_IO_RANGE) {
|
|
|
|
root = &ioport_resource;
|
|
|
|
flags = IORESOURCE_IO;
|
|
|
|
} else
|
|
|
|
return AE_OK;
|
|
|
|
|
2009-06-25 02:01:19 +00:00
|
|
|
start = addr.minimum + addr.translation_offset;
|
|
|
|
end = start + addr.address_length - 1;
|
2009-05-27 19:41:44 +00:00
|
|
|
|
2009-06-25 02:01:19 +00:00
|
|
|
res = &info->res[info->res_num];
|
|
|
|
res->name = info->name;
|
|
|
|
res->flags = flags;
|
|
|
|
res->start = start;
|
|
|
|
res->end = end;
|
|
|
|
res->child = NULL;
|
2009-11-04 17:39:18 +00:00
|
|
|
align_resource(info->bridge, res);
|
2009-06-25 02:01:19 +00:00
|
|
|
|
2009-11-04 17:39:13 +00:00
|
|
|
if (!(pci_probe & PCI_USE__CRS)) {
|
|
|
|
dev_printk(KERN_DEBUG, &info->bridge->dev,
|
|
|
|
"host bridge window %pR (ignored)\n", res);
|
|
|
|
return AE_OK;
|
|
|
|
}
|
|
|
|
|
2007-10-03 22:56:51 +00:00
|
|
|
if (insert_resource(root, res)) {
|
2009-10-27 19:26:47 +00:00
|
|
|
dev_err(&info->bridge->dev,
|
|
|
|
"can't allocate host bridge window %pR\n", res);
|
2007-10-03 22:56:51 +00:00
|
|
|
} else {
|
2010-02-23 17:24:36 +00:00
|
|
|
pci_bus_add_resource(info->bus, res, 0);
|
2007-10-03 22:56:51 +00:00
|
|
|
info->res_num++;
|
2009-10-06 21:33:49 +00:00
|
|
|
if (addr.translation_offset)
|
2009-10-27 19:26:47 +00:00
|
|
|
dev_info(&info->bridge->dev, "host bridge window %pR "
|
2009-10-06 21:33:49 +00:00
|
|
|
"(PCI address [%#llx-%#llx])\n",
|
|
|
|
res, res->start - addr.translation_offset,
|
|
|
|
res->end - addr.translation_offset);
|
|
|
|
else
|
|
|
|
dev_info(&info->bridge->dev,
|
2009-10-27 19:26:47 +00:00
|
|
|
"host bridge window %pR\n", res);
|
2007-10-03 22:56:51 +00:00
|
|
|
}
|
|
|
|
return AE_OK;
|
|
|
|
}
|
|
|
|
|
|
|
|
static void
|
|
|
|
get_current_resources(struct acpi_device *device, int busnum,
|
2008-02-08 22:00:52 +00:00
|
|
|
int domain, struct pci_bus *bus)
|
2007-10-03 22:56:51 +00:00
|
|
|
{
|
|
|
|
struct pci_root_info info;
|
|
|
|
size_t size;
|
|
|
|
|
2010-02-23 17:24:36 +00:00
|
|
|
if (pci_probe & PCI_USE__CRS)
|
|
|
|
pci_bus_remove_resources(bus);
|
|
|
|
else
|
2009-11-04 17:39:13 +00:00
|
|
|
dev_info(&device->dev,
|
|
|
|
"ignoring host bridge windows from ACPI; "
|
|
|
|
"boot with \"pci=use_crs\" to use them\n");
|
|
|
|
|
2009-10-06 21:33:49 +00:00
|
|
|
info.bridge = device;
|
2007-10-03 22:56:51 +00:00
|
|
|
info.bus = bus;
|
|
|
|
info.res_num = 0;
|
|
|
|
acpi_walk_resources(device->handle, METHOD_NAME__CRS, count_resource,
|
|
|
|
&info);
|
|
|
|
if (!info.res_num)
|
|
|
|
return;
|
|
|
|
|
|
|
|
size = sizeof(*info.res) * info.res_num;
|
|
|
|
info.res = kmalloc(size, GFP_KERNEL);
|
|
|
|
if (!info.res)
|
|
|
|
goto res_alloc_fail;
|
|
|
|
|
2008-02-08 22:00:52 +00:00
|
|
|
info.name = kmalloc(16, GFP_KERNEL);
|
2007-10-03 22:56:51 +00:00
|
|
|
if (!info.name)
|
|
|
|
goto name_alloc_fail;
|
2008-02-08 22:00:52 +00:00
|
|
|
sprintf(info.name, "PCI Bus %04x:%02x", domain, busnum);
|
2007-10-03 22:56:51 +00:00
|
|
|
|
|
|
|
info.res_num = 0;
|
|
|
|
acpi_walk_resources(device->handle, METHOD_NAME__CRS, setup_resource,
|
|
|
|
&info);
|
|
|
|
|
|
|
|
return;
|
|
|
|
|
|
|
|
name_alloc_fail:
|
|
|
|
kfree(info.res);
|
|
|
|
res_alloc_fail:
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
2005-04-16 22:20:36 +00:00
|
|
|
struct pci_bus * __devinit pci_acpi_scan_root(struct acpi_device *device, int domain, int busnum)
|
|
|
|
{
|
2005-09-12 16:49:24 +00:00
|
|
|
struct pci_bus *bus;
|
2007-07-21 21:23:39 +00:00
|
|
|
struct pci_sysdata *sd;
|
x86: get mp_bus_to_node early
Currently, on an amd k8 system with multi ht chains, the numa_node of
pci devices under /sys/devices/pci0000:80/* is always 0, even if that
chain is on node 1 or 2 or 3.
Workaround: pcibus_to_node(bus) is used when we want to get the node that
pci_device is on.
In struct device, we already have numa_node member, and we could use
dev_to_node()/set_dev_node() to get and set numa_node in the device.
set_dev_node is called in pci_device_add() with pcibus_to_node(bus),
and pcibus_to_node uses bus->sysdata for nodeid.
The problem is when pci_add_device is called, bus->sysdata is not assigned
correct nodeid yet. The result is that numa_node will always be 0.
pcibios_scan_root and pci_scan_root could take sysdata. So we need to get
mp_bus_to_node mapping before these two are called, and thus
get_mp_bus_to_node could get correct node for sysdata in root bus.
In scanning of the root bus, all child busses will take parent bus sysdata.
So all pci_device->dev.numa_node will be assigned correctly and automatically.
Later we could use dev_to_node(&pci_dev->dev) to get numa_node, and we
could also could make other bus specific device get the correct numa_node
too.
This is an updated version of pci_sysdata and Jeff's pci_domain patch.
[ mingo@elte.hu: build fix ]
Signed-off-by: Yinghai Lu <yinghai.lu@sun.com>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
Signed-off-by: Thomas Gleixner <tglx@linutronix.de>
2008-02-19 11:20:09 +00:00
|
|
|
int node;
|
|
|
|
#ifdef CONFIG_ACPI_NUMA
|
2007-07-21 21:23:39 +00:00
|
|
|
int pxm;
|
x86: get mp_bus_to_node early
Currently, on an amd k8 system with multi ht chains, the numa_node of
pci devices under /sys/devices/pci0000:80/* is always 0, even if that
chain is on node 1 or 2 or 3.
Workaround: pcibus_to_node(bus) is used when we want to get the node that
pci_device is on.
In struct device, we already have numa_node member, and we could use
dev_to_node()/set_dev_node() to get and set numa_node in the device.
set_dev_node is called in pci_device_add() with pcibus_to_node(bus),
and pcibus_to_node uses bus->sysdata for nodeid.
The problem is when pci_add_device is called, bus->sysdata is not assigned
correct nodeid yet. The result is that numa_node will always be 0.
pcibios_scan_root and pci_scan_root could take sysdata. So we need to get
mp_bus_to_node mapping before these two are called, and thus
get_mp_bus_to_node could get correct node for sysdata in root bus.
In scanning of the root bus, all child busses will take parent bus sysdata.
So all pci_device->dev.numa_node will be assigned correctly and automatically.
Later we could use dev_to_node(&pci_dev->dev) to get numa_node, and we
could also could make other bus specific device get the correct numa_node
too.
This is an updated version of pci_sysdata and Jeff's pci_domain patch.
[ mingo@elte.hu: build fix ]
Signed-off-by: Yinghai Lu <yinghai.lu@sun.com>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
Signed-off-by: Thomas Gleixner <tglx@linutronix.de>
2008-02-19 11:20:09 +00:00
|
|
|
#endif
|
2007-07-21 21:23:39 +00:00
|
|
|
|
2007-10-11 20:58:30 +00:00
|
|
|
if (domain && !pci_domains_supported) {
|
2009-11-04 17:32:47 +00:00
|
|
|
printk(KERN_WARNING "pci_bus %04x:%02x: "
|
|
|
|
"ignored (multiple domains not supported)\n",
|
|
|
|
domain, busnum);
|
2007-10-11 20:58:30 +00:00
|
|
|
return NULL;
|
|
|
|
}
|
|
|
|
|
x86: get mp_bus_to_node early
Currently, on an amd k8 system with multi ht chains, the numa_node of
pci devices under /sys/devices/pci0000:80/* is always 0, even if that
chain is on node 1 or 2 or 3.
Workaround: pcibus_to_node(bus) is used when we want to get the node that
pci_device is on.
In struct device, we already have numa_node member, and we could use
dev_to_node()/set_dev_node() to get and set numa_node in the device.
set_dev_node is called in pci_device_add() with pcibus_to_node(bus),
and pcibus_to_node uses bus->sysdata for nodeid.
The problem is when pci_add_device is called, bus->sysdata is not assigned
correct nodeid yet. The result is that numa_node will always be 0.
pcibios_scan_root and pci_scan_root could take sysdata. So we need to get
mp_bus_to_node mapping before these two are called, and thus
get_mp_bus_to_node could get correct node for sysdata in root bus.
In scanning of the root bus, all child busses will take parent bus sysdata.
So all pci_device->dev.numa_node will be assigned correctly and automatically.
Later we could use dev_to_node(&pci_dev->dev) to get numa_node, and we
could also could make other bus specific device get the correct numa_node
too.
This is an updated version of pci_sysdata and Jeff's pci_domain patch.
[ mingo@elte.hu: build fix ]
Signed-off-by: Yinghai Lu <yinghai.lu@sun.com>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
Signed-off-by: Thomas Gleixner <tglx@linutronix.de>
2008-02-19 11:20:09 +00:00
|
|
|
node = -1;
|
|
|
|
#ifdef CONFIG_ACPI_NUMA
|
|
|
|
pxm = acpi_get_pxm(device->handle);
|
|
|
|
if (pxm >= 0)
|
|
|
|
node = pxm_to_node(pxm);
|
|
|
|
if (node != -1)
|
|
|
|
set_mp_bus_to_node(busnum, node);
|
|
|
|
else
|
|
|
|
#endif
|
|
|
|
node = get_mp_bus_to_node(busnum);
|
2008-02-20 20:41:52 +00:00
|
|
|
|
|
|
|
if (node != -1 && !node_online(node))
|
|
|
|
node = -1;
|
x86: get mp_bus_to_node early
Currently, on an amd k8 system with multi ht chains, the numa_node of
pci devices under /sys/devices/pci0000:80/* is always 0, even if that
chain is on node 1 or 2 or 3.
Workaround: pcibus_to_node(bus) is used when we want to get the node that
pci_device is on.
In struct device, we already have numa_node member, and we could use
dev_to_node()/set_dev_node() to get and set numa_node in the device.
set_dev_node is called in pci_device_add() with pcibus_to_node(bus),
and pcibus_to_node uses bus->sysdata for nodeid.
The problem is when pci_add_device is called, bus->sysdata is not assigned
correct nodeid yet. The result is that numa_node will always be 0.
pcibios_scan_root and pci_scan_root could take sysdata. So we need to get
mp_bus_to_node mapping before these two are called, and thus
get_mp_bus_to_node could get correct node for sysdata in root bus.
In scanning of the root bus, all child busses will take parent bus sysdata.
So all pci_device->dev.numa_node will be assigned correctly and automatically.
Later we could use dev_to_node(&pci_dev->dev) to get numa_node, and we
could also could make other bus specific device get the correct numa_node
too.
This is an updated version of pci_sysdata and Jeff's pci_domain patch.
[ mingo@elte.hu: build fix ]
Signed-off-by: Yinghai Lu <yinghai.lu@sun.com>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
Signed-off-by: Thomas Gleixner <tglx@linutronix.de>
2008-02-19 11:20:09 +00:00
|
|
|
|
2007-07-21 21:23:39 +00:00
|
|
|
/* Allocate per-root-bus (not per bus) arch-specific data.
|
|
|
|
* TODO: leak; this memory is never freed.
|
|
|
|
* It's arguable whether it's worth the trouble to care.
|
|
|
|
*/
|
|
|
|
sd = kzalloc(sizeof(*sd), GFP_KERNEL);
|
|
|
|
if (!sd) {
|
2009-11-04 17:32:47 +00:00
|
|
|
printk(KERN_WARNING "pci_bus %04x:%02x: "
|
|
|
|
"ignored (out of memory)\n", domain, busnum);
|
2007-07-21 21:23:39 +00:00
|
|
|
return NULL;
|
|
|
|
}
|
2005-09-12 16:49:24 +00:00
|
|
|
|
2007-10-11 20:58:30 +00:00
|
|
|
sd->domain = domain;
|
x86: get mp_bus_to_node early
Currently, on an amd k8 system with multi ht chains, the numa_node of
pci devices under /sys/devices/pci0000:80/* is always 0, even if that
chain is on node 1 or 2 or 3.
Workaround: pcibus_to_node(bus) is used when we want to get the node that
pci_device is on.
In struct device, we already have numa_node member, and we could use
dev_to_node()/set_dev_node() to get and set numa_node in the device.
set_dev_node is called in pci_device_add() with pcibus_to_node(bus),
and pcibus_to_node uses bus->sysdata for nodeid.
The problem is when pci_add_device is called, bus->sysdata is not assigned
correct nodeid yet. The result is that numa_node will always be 0.
pcibios_scan_root and pci_scan_root could take sysdata. So we need to get
mp_bus_to_node mapping before these two are called, and thus
get_mp_bus_to_node could get correct node for sysdata in root bus.
In scanning of the root bus, all child busses will take parent bus sysdata.
So all pci_device->dev.numa_node will be assigned correctly and automatically.
Later we could use dev_to_node(&pci_dev->dev) to get numa_node, and we
could also could make other bus specific device get the correct numa_node
too.
This is an updated version of pci_sysdata and Jeff's pci_domain patch.
[ mingo@elte.hu: build fix ]
Signed-off-by: Yinghai Lu <yinghai.lu@sun.com>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
Signed-off-by: Thomas Gleixner <tglx@linutronix.de>
2008-02-19 11:20:09 +00:00
|
|
|
sd->node = node;
|
2008-04-15 21:34:49 +00:00
|
|
|
/*
|
|
|
|
* Maybe the desired pci bus has been already scanned. In such case
|
|
|
|
* it is unnecessary to scan the pci bus with the given domain,busnum.
|
|
|
|
*/
|
|
|
|
bus = pci_find_bus(domain, busnum);
|
|
|
|
if (bus) {
|
|
|
|
/*
|
|
|
|
* If the desired bus exits, the content of bus->sysdata will
|
|
|
|
* be replaced by sd.
|
|
|
|
*/
|
|
|
|
memcpy(bus->sysdata, sd, sizeof(*sd));
|
|
|
|
kfree(sd);
|
2009-06-25 03:00:12 +00:00
|
|
|
} else {
|
|
|
|
bus = pci_create_bus(NULL, busnum, &pci_root_ops, sd);
|
|
|
|
if (bus) {
|
2009-11-04 17:39:13 +00:00
|
|
|
get_current_resources(device, busnum, domain, bus);
|
2009-06-25 03:00:12 +00:00
|
|
|
bus->subordinate = pci_scan_child_bus(bus);
|
|
|
|
}
|
|
|
|
}
|
2007-07-21 21:23:39 +00:00
|
|
|
|
|
|
|
if (!bus)
|
|
|
|
kfree(sd);
|
|
|
|
|
2008-04-19 08:30:16 +00:00
|
|
|
if (bus && node != -1) {
|
2005-09-12 16:49:24 +00:00
|
|
|
#ifdef CONFIG_ACPI_NUMA
|
2008-04-19 08:30:16 +00:00
|
|
|
if (pxm >= 0)
|
2008-12-18 23:34:51 +00:00
|
|
|
dev_printk(KERN_DEBUG, &bus->dev,
|
|
|
|
"on NUMA node %d (pxm %d)\n", node, pxm);
|
2008-04-19 08:30:16 +00:00
|
|
|
#else
|
2008-12-18 23:34:51 +00:00
|
|
|
dev_printk(KERN_DEBUG, &bus->dev, "on NUMA node %d\n", node);
|
2005-09-12 16:49:24 +00:00
|
|
|
#endif
|
2008-04-19 08:30:16 +00:00
|
|
|
}
|
2007-10-03 22:56:51 +00:00
|
|
|
|
2005-09-12 16:49:24 +00:00
|
|
|
return bus;
|
2005-04-16 22:20:36 +00:00
|
|
|
}
|
|
|
|
|
2008-07-02 20:50:29 +00:00
|
|
|
int __init pci_acpi_init(void)
|
2005-04-16 22:20:36 +00:00
|
|
|
{
|
|
|
|
struct pci_dev *dev = NULL;
|
|
|
|
|
|
|
|
if (pcibios_scanned)
|
|
|
|
return 0;
|
|
|
|
|
|
|
|
if (acpi_noirq)
|
|
|
|
return 0;
|
|
|
|
|
|
|
|
printk(KERN_INFO "PCI: Using ACPI for IRQ routing\n");
|
|
|
|
acpi_irq_penalty_init();
|
|
|
|
pcibios_scanned++;
|
|
|
|
pcibios_enable_irq = acpi_pci_irq_enable;
|
2005-07-28 03:02:00 +00:00
|
|
|
pcibios_disable_irq = acpi_pci_irq_disable;
|
2005-04-16 22:20:36 +00:00
|
|
|
|
|
|
|
if (pci_routeirq) {
|
|
|
|
/*
|
|
|
|
* PCI IRQ routing is set up by pci_enable_device(), but we
|
|
|
|
* also do it here in case there are still broken drivers that
|
|
|
|
* don't use pci_enable_device().
|
|
|
|
*/
|
|
|
|
printk(KERN_INFO "PCI: Routing PCI interrupts for all devices because \"pci=routeirq\" specified\n");
|
2005-11-07 07:39:36 +00:00
|
|
|
for_each_pci_dev(dev)
|
2005-04-16 22:20:36 +00:00
|
|
|
acpi_pci_irq_enable(dev);
|
2008-02-18 16:44:13 +00:00
|
|
|
}
|
2005-04-16 22:20:36 +00:00
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|