c2bf1fc212
Currently Linux does not follow PCIe spec regarding the required delays after reset. A concrete example is a Thunderbolt add-in-card that consists of a PCIe switch and two PCIe endpoints: +-1b.0-[01-6b]----00.0-[02-6b]--+-00.0-[03]----00.0 TBT controller +-01.0-[04-36]-- DS hotplug port +-02.0-[37]----00.0 xHCI controller \-04.0-[38-6b]-- DS hotplug port The root port (1b.0) and the PCIe switch downstream ports are all PCIe gen3 so they support 8GT/s link speeds. We wait for the PCIe hierarchy to enter D3cold (runtime): pcieport 0000:00:1b.0: power state changed by ACPI to D3cold When it wakes up from D3cold, according to the PCIe 4.0 section 5.8 the PCIe switch is put to reset and its power is re-applied. This means that we must follow the rules in PCIe 4.0 section 6.6.1. For the PCIe gen3 ports we are dealing with here, the following applies: With a Downstream Port that supports Link speeds greater than 5.0 GT/s, software must wait a minimum of 100 ms after Link training completes before sending a Configuration Request to the device immediately below that Port. Software can determine when Link training completes by polling the Data Link Layer Link Active bit or by setting up an associated interrupt (see Section 6.7.3.3). 
Translating this into the above topology we would need to do this (DLLLA stands for Data Link Layer Link Active): pcieport 0000:00:1b.0: wait for 100ms after DLLLA is set before access to 0000:01:00.0 pcieport 0000:02:00.0: wait for 100ms after DLLLA is set before access to 0000:03:00.0 pcieport 0000:02:02.0: wait for 100ms after DLLLA is set before access to 0000:37:00.0 I've instrumented the kernel with additional logging so we can see the actual delays the kernel performs: pcieport 0000:00:1b.0: power state changed by ACPI to D0 pcieport 0000:00:1b.0: waiting for D3cold delay of 100 ms pcieport 0000:00:1b.0: waking up bus pcieport 0000:00:1b.0: waiting for D3hot delay of 10 ms pcieport 0000:00:1b.0: restoring config space at offset 0x2c (was 0x60, writing 0x60) ... pcieport 0000:00:1b.0: PME# disabled pcieport 0000:01:00.0: restoring config space at offset 0x3c (was 0x1ff, writing 0x201ff) ... pcieport 0000:01:00.0: PME# disabled pcieport 0000:02:00.0: restoring config space at offset 0x3c (was 0x1ff, writing 0x201ff) ... pcieport 0000:02:00.0: PME# disabled pcieport 0000:02:01.0: restoring config space at offset 0x3c (was 0x1ff, writing 0x201ff) ... pcieport 0000:02:01.0: restoring config space at offset 0x4 (was 0x100000, writing 0x100407) pcieport 0000:02:01.0: PME# disabled pcieport 0000:02:02.0: restoring config space at offset 0x3c (was 0x1ff, writing 0x201ff) ... pcieport 0000:02:02.0: PME# disabled pcieport 0000:02:04.0: restoring config space at offset 0x3c (was 0x1ff, writing 0x201ff) ... pcieport 0000:02:04.0: PME# disabled pcieport 0000:02:01.0: PME# enabled pcieport 0000:02:01.0: waiting for D3hot delay of 10 ms pcieport 0000:02:04.0: PME# enabled pcieport 0000:02:04.0: waiting for D3hot delay of 10 ms thunderbolt 0000:03:00.0: restoring config space at offset 0x14 (was 0x0, writing 0x8a040000) ... thunderbolt 0000:03:00.0: PME# disabled xhci_hcd 0000:37:00.0: restoring config space at offset 0x10 (was 0x0, writing 0x73f00000) ... 
xhci_hcd 0000:37:00.0: PME# disabled For the switch upstream port (01:00.0) we wait for 100ms but not taking into account the DLLLA requirement. We then wait 10ms for D3hot -> D0 transition of the root port and the two downstream hotplug ports. This means that we deviate from what the spec requires. Performing the same check for system sleep (s2idle) transitions we can see following when resuming from s2idle: pcieport 0000:00:1b.0: power state changed by ACPI to D0 pcieport 0000:00:1b.0: restoring config space at offset 0x2c (was 0x60, writing 0x60) ... pcieport 0000:01:00.0: restoring config space at offset 0x3c (was 0x1ff, writing 0x201ff) ... pcieport 0000:02:02.0: restoring config space at offset 0x3c (was 0x1ff, writing 0x201ff) pcieport 0000:02:02.0: restoring config space at offset 0x2c (was 0x0, writing 0x0) pcieport 0000:02:01.0: restoring config space at offset 0x3c (was 0x1ff, writing 0x201ff) pcieport 0000:02:04.0: restoring config space at offset 0x3c (was 0x1ff, writing 0x201ff) pcieport 0000:02:02.0: restoring config space at offset 0x28 (was 0x0, writing 0x0) pcieport 0000:02:00.0: restoring config space at offset 0x3c (was 0x1ff, writing 0x201ff) pcieport 0000:02:02.0: restoring config space at offset 0x24 (was 0x10001, writing 0x1fff1) pcieport 0000:02:01.0: restoring config space at offset 0x2c (was 0x0, writing 0x60) pcieport 0000:02:02.0: restoring config space at offset 0x20 (was 0x0, writing 0x73f073f0) pcieport 0000:02:04.0: restoring config space at offset 0x2c (was 0x0, writing 0x60) pcieport 0000:02:01.0: restoring config space at offset 0x28 (was 0x0, writing 0x60) pcieport 0000:02:00.0: restoring config space at offset 0x2c (was 0x0, writing 0x0) pcieport 0000:02:02.0: restoring config space at offset 0x1c (was 0x101, writing 0x1f1) pcieport 0000:02:04.0: restoring config space at offset 0x28 (was 0x0, writing 0x60) pcieport 0000:02:01.0: restoring config space at offset 0x24 (was 0x10001, writing 0x1ff10001) pcieport 0000:02:00.0: 
restoring config space at offset 0x28 (was 0x0, writing 0x0) pcieport 0000:02:02.0: restoring config space at offset 0x18 (was 0x0, writing 0x373702) pcieport 0000:02:04.0: restoring config space at offset 0x24 (was 0x10001, writing 0x49f12001) pcieport 0000:02:01.0: restoring config space at offset 0x20 (was 0x0, writing 0x73e05c00) pcieport 0000:02:00.0: restoring config space at offset 0x24 (was 0x10001, writing 0x1fff1) pcieport 0000:02:04.0: restoring config space at offset 0x20 (was 0x0, writing 0x89f07400) pcieport 0000:02:01.0: restoring config space at offset 0x1c (was 0x101, writing 0x5151) pcieport 0000:02:00.0: restoring config space at offset 0x20 (was 0x0, writing 0x8a008a00) pcieport 0000:02:02.0: restoring config space at offset 0xc (was 0x10000, writing 0x10020) pcieport 0000:02:04.0: restoring config space at offset 0x1c (was 0x101, writing 0x6161) pcieport 0000:02:01.0: restoring config space at offset 0x18 (was 0x0, writing 0x360402) pcieport 0000:02:00.0: restoring config space at offset 0x1c (was 0x101, writing 0x1f1) pcieport 0000:02:04.0: restoring config space at offset 0x18 (was 0x0, writing 0x6b3802) pcieport 0000:02:02.0: restoring config space at offset 0x4 (was 0x100000, writing 0x100407) pcieport 0000:02:00.0: restoring config space at offset 0x18 (was 0x0, writing 0x30302) pcieport 0000:02:01.0: restoring config space at offset 0xc (was 0x10000, writing 0x10020) pcieport 0000:02:04.0: restoring config space at offset 0xc (was 0x10000, writing 0x10020) pcieport 0000:02:00.0: restoring config space at offset 0xc (was 0x10000, writing 0x10020) pcieport 0000:02:01.0: restoring config space at offset 0x4 (was 0x100000, writing 0x100407) pcieport 0000:02:04.0: restoring config space at offset 0x4 (was 0x100000, writing 0x100407) pcieport 0000:02:00.0: restoring config space at offset 0x4 (was 0x100000, writing 0x100407) xhci_hcd 0000:37:00.0: restoring config space at offset 0x10 (was 0x0, writing 0x73f00000) ... 
thunderbolt 0000:03:00.0: restoring config space at offset 0x14 (was 0x0, writing 0x8a040000) This is even worse. None of the mandatory delays are performed. If this were S3 instead of s2idle, then according to PCI FW spec 3.2 section 4.6.8 there is a specific _DSM that allows the OS to skip the delays, but this platform does not provide the _DSM and does not go to S3 anyway, so no firmware is involved that could already handle these delays. On this particular Intel Coffee Lake platform these delays are not actually needed because there is an additional delay as part of the ACPI power resource that is used to turn on power to the hierarchy. However, since that additional delay is not required by any of the standards (PCIe, ACPI), it is not present on Intel Ice Lake, for example, where missing the mandatory delays causes pciehp to start tearing down the stack too early (links are not yet trained). For this reason, change the PCIe portdrv PM resume hooks so that they perform the mandatory delays before the downstream component gets resumed. We perform the delays before port services are resumed because otherwise pciehp might find that the link is not up (even if it is just training) and tear down the hierarchy. Signed-off-by: Mika Westerberg <mika.westerberg@linux.intel.com> Signed-off-by: Rafael J. Wysocki <rafael.j.wysocki@intel.com>
674 lines
18 KiB
C
674 lines
18 KiB
C
// SPDX-License-Identifier: GPL-2.0
|
|
/*
|
|
* Purpose: PCI Express Port Bus Driver's Core Functions
|
|
*
|
|
* Copyright (C) 2004 Intel
|
|
* Copyright (C) Tom Long Nguyen (tom.l.nguyen@intel.com)
|
|
*/
|
|
|
|
#include <linux/module.h>
|
|
#include <linux/pci.h>
|
|
#include <linux/kernel.h>
|
|
#include <linux/delay.h>
|
|
#include <linux/errno.h>
|
|
#include <linux/pm.h>
|
|
#include <linux/pm_runtime.h>
|
|
#include <linux/string.h>
|
|
#include <linux/slab.h>
|
|
#include <linux/aer.h>
|
|
|
|
#include "../pci.h"
|
|
#include "portdrv.h"
|
|
|
|
struct portdrv_service_data {
|
|
struct pcie_port_service_driver *drv;
|
|
struct device *dev;
|
|
u32 service;
|
|
};
|
|
|
|
/**
 * release_pcie_device - free PCI Express port service device structure
 * @dev: Port service device to release
 *
 * Installed as the ->release() callback of every port service device by
 * pcie_device_init().  Frees the pcie_device that embeds @dev.
 */
static void release_pcie_device(struct device *dev)
{
	struct pcie_device *pcie = to_pcie_device(dev);

	kfree(pcie);
}
|
|
|
|
/*
|
|
* Fill in *pme, *aer, *dpc with the relevant Interrupt Message Numbers if
|
|
* services are enabled in "mask". Return the number of MSI/MSI-X vectors
|
|
* required to accommodate the largest Message Number.
|
|
*/
|
|
static int pcie_message_numbers(struct pci_dev *dev, int mask,
|
|
u32 *pme, u32 *aer, u32 *dpc)
|
|
{
|
|
u32 nvec = 0, pos;
|
|
u16 reg16;
|
|
|
|
/*
|
|
* The Interrupt Message Number indicates which vector is used, i.e.,
|
|
* the MSI-X table entry or the MSI offset between the base Message
|
|
* Data and the generated interrupt message. See PCIe r3.1, sec
|
|
* 7.8.2, 7.10.10, 7.31.2.
|
|
*/
|
|
|
|
if (mask & (PCIE_PORT_SERVICE_PME | PCIE_PORT_SERVICE_HP |
|
|
PCIE_PORT_SERVICE_BWNOTIF)) {
|
|
pcie_capability_read_word(dev, PCI_EXP_FLAGS, ®16);
|
|
*pme = (reg16 & PCI_EXP_FLAGS_IRQ) >> 9;
|
|
nvec = *pme + 1;
|
|
}
|
|
|
|
#ifdef CONFIG_PCIEAER
|
|
if (mask & PCIE_PORT_SERVICE_AER) {
|
|
u32 reg32;
|
|
|
|
pos = dev->aer_cap;
|
|
if (pos) {
|
|
pci_read_config_dword(dev, pos + PCI_ERR_ROOT_STATUS,
|
|
®32);
|
|
*aer = (reg32 & PCI_ERR_ROOT_AER_IRQ) >> 27;
|
|
nvec = max(nvec, *aer + 1);
|
|
}
|
|
}
|
|
#endif
|
|
|
|
if (mask & PCIE_PORT_SERVICE_DPC) {
|
|
pos = pci_find_ext_capability(dev, PCI_EXT_CAP_ID_DPC);
|
|
if (pos) {
|
|
pci_read_config_word(dev, pos + PCI_EXP_DPC_CAP,
|
|
®16);
|
|
*dpc = reg16 & PCI_EXP_DPC_IRQ;
|
|
nvec = max(nvec, *dpc + 1);
|
|
}
|
|
}
|
|
|
|
return nvec;
|
|
}
|
|
|
|
/**
|
|
* pcie_port_enable_irq_vec - try to set up MSI-X or MSI as interrupt mode
|
|
* for given port
|
|
* @dev: PCI Express port to handle
|
|
* @irqs: Array of interrupt vectors to populate
|
|
* @mask: Bitmask of port capabilities returned by get_port_device_capability()
|
|
*
|
|
* Return value: 0 on success, error code on failure
|
|
*/
|
|
static int pcie_port_enable_irq_vec(struct pci_dev *dev, int *irqs, int mask)
|
|
{
|
|
int nr_entries, nvec, pcie_irq;
|
|
u32 pme = 0, aer = 0, dpc = 0;
|
|
|
|
/* Allocate the maximum possible number of MSI/MSI-X vectors */
|
|
nr_entries = pci_alloc_irq_vectors(dev, 1, PCIE_PORT_MAX_MSI_ENTRIES,
|
|
PCI_IRQ_MSIX | PCI_IRQ_MSI);
|
|
if (nr_entries < 0)
|
|
return nr_entries;
|
|
|
|
/* See how many and which Interrupt Message Numbers we actually use */
|
|
nvec = pcie_message_numbers(dev, mask, &pme, &aer, &dpc);
|
|
if (nvec > nr_entries) {
|
|
pci_free_irq_vectors(dev);
|
|
return -EIO;
|
|
}
|
|
|
|
/*
|
|
* If we allocated more than we need, free them and reallocate fewer.
|
|
*
|
|
* Reallocating may change the specific vectors we get, so
|
|
* pci_irq_vector() must be done *after* the reallocation.
|
|
*
|
|
* If we're using MSI, hardware is *allowed* to change the Interrupt
|
|
* Message Numbers when we free and reallocate the vectors, but we
|
|
* assume it won't because we allocate enough vectors for the
|
|
* biggest Message Number we found.
|
|
*/
|
|
if (nvec != nr_entries) {
|
|
pci_free_irq_vectors(dev);
|
|
|
|
nr_entries = pci_alloc_irq_vectors(dev, nvec, nvec,
|
|
PCI_IRQ_MSIX | PCI_IRQ_MSI);
|
|
if (nr_entries < 0)
|
|
return nr_entries;
|
|
}
|
|
|
|
/* PME, hotplug and bandwidth notification share an MSI/MSI-X vector */
|
|
if (mask & (PCIE_PORT_SERVICE_PME | PCIE_PORT_SERVICE_HP |
|
|
PCIE_PORT_SERVICE_BWNOTIF)) {
|
|
pcie_irq = pci_irq_vector(dev, pme);
|
|
irqs[PCIE_PORT_SERVICE_PME_SHIFT] = pcie_irq;
|
|
irqs[PCIE_PORT_SERVICE_HP_SHIFT] = pcie_irq;
|
|
irqs[PCIE_PORT_SERVICE_BWNOTIF_SHIFT] = pcie_irq;
|
|
}
|
|
|
|
if (mask & PCIE_PORT_SERVICE_AER)
|
|
irqs[PCIE_PORT_SERVICE_AER_SHIFT] = pci_irq_vector(dev, aer);
|
|
|
|
if (mask & PCIE_PORT_SERVICE_DPC)
|
|
irqs[PCIE_PORT_SERVICE_DPC_SHIFT] = pci_irq_vector(dev, dpc);
|
|
|
|
return 0;
|
|
}
|
|
|
|
/**
|
|
* pcie_init_service_irqs - initialize irqs for PCI Express port services
|
|
* @dev: PCI Express port to handle
|
|
* @irqs: Array of irqs to populate
|
|
* @mask: Bitmask of port capabilities returned by get_port_device_capability()
|
|
*
|
|
* Return value: Interrupt mode associated with the port
|
|
*/
|
|
static int pcie_init_service_irqs(struct pci_dev *dev, int *irqs, int mask)
|
|
{
|
|
int ret, i;
|
|
|
|
for (i = 0; i < PCIE_PORT_DEVICE_MAXSERVICES; i++)
|
|
irqs[i] = -1;
|
|
|
|
/*
|
|
* If we support PME but can't use MSI/MSI-X for it, we have to
|
|
* fall back to INTx or other interrupts, e.g., a system shared
|
|
* interrupt.
|
|
*/
|
|
if ((mask & PCIE_PORT_SERVICE_PME) && pcie_pme_no_msi())
|
|
goto legacy_irq;
|
|
|
|
/* Try to use MSI-X or MSI if supported */
|
|
if (pcie_port_enable_irq_vec(dev, irqs, mask) == 0)
|
|
return 0;
|
|
|
|
legacy_irq:
|
|
/* fall back to legacy IRQ */
|
|
ret = pci_alloc_irq_vectors(dev, 1, 1, PCI_IRQ_LEGACY);
|
|
if (ret < 0)
|
|
return -ENODEV;
|
|
|
|
for (i = 0; i < PCIE_PORT_DEVICE_MAXSERVICES; i++)
|
|
irqs[i] = pci_irq_vector(dev, 0);
|
|
|
|
return 0;
|
|
}
|
|
|
|
/**
|
|
* get_port_device_capability - discover capabilities of a PCI Express port
|
|
* @dev: PCI Express port to examine
|
|
*
|
|
* The capabilities are read from the port's PCI Express configuration registers
|
|
* as described in PCI Express Base Specification 1.0a sections 7.8.2, 7.8.9 and
|
|
* 7.9 - 7.11.
|
|
*
|
|
* Return value: Bitmask of discovered port capabilities
|
|
*/
|
|
static int get_port_device_capability(struct pci_dev *dev)
|
|
{
|
|
struct pci_host_bridge *host = pci_find_host_bridge(dev->bus);
|
|
int services = 0;
|
|
|
|
if (dev->is_hotplug_bridge &&
|
|
(pcie_ports_native || host->native_pcie_hotplug)) {
|
|
services |= PCIE_PORT_SERVICE_HP;
|
|
|
|
/*
|
|
* Disable hot-plug interrupts in case they have been enabled
|
|
* by the BIOS and the hot-plug service driver is not loaded.
|
|
*/
|
|
pcie_capability_clear_word(dev, PCI_EXP_SLTCTL,
|
|
PCI_EXP_SLTCTL_CCIE | PCI_EXP_SLTCTL_HPIE);
|
|
}
|
|
|
|
#ifdef CONFIG_PCIEAER
|
|
if (dev->aer_cap && pci_aer_available() &&
|
|
(pcie_ports_native || host->native_aer)) {
|
|
services |= PCIE_PORT_SERVICE_AER;
|
|
|
|
/*
|
|
* Disable AER on this port in case it's been enabled by the
|
|
* BIOS (the AER service driver will enable it when necessary).
|
|
*/
|
|
pci_disable_pcie_error_reporting(dev);
|
|
}
|
|
#endif
|
|
|
|
/*
|
|
* Root ports are capable of generating PME too. Root Complex
|
|
* Event Collectors can also generate PMEs, but we don't handle
|
|
* those yet.
|
|
*/
|
|
if (pci_pcie_type(dev) == PCI_EXP_TYPE_ROOT_PORT &&
|
|
(pcie_ports_native || host->native_pme)) {
|
|
services |= PCIE_PORT_SERVICE_PME;
|
|
|
|
/*
|
|
* Disable PME interrupt on this port in case it's been enabled
|
|
* by the BIOS (the PME service driver will enable it when
|
|
* necessary).
|
|
*/
|
|
pcie_pme_interrupt_enable(dev, false);
|
|
}
|
|
|
|
if (pci_find_ext_capability(dev, PCI_EXT_CAP_ID_DPC) &&
|
|
pci_aer_available() && services & PCIE_PORT_SERVICE_AER)
|
|
services |= PCIE_PORT_SERVICE_DPC;
|
|
|
|
if (pci_pcie_type(dev) == PCI_EXP_TYPE_DOWNSTREAM ||
|
|
pci_pcie_type(dev) == PCI_EXP_TYPE_ROOT_PORT)
|
|
services |= PCIE_PORT_SERVICE_BWNOTIF;
|
|
|
|
return services;
|
|
}
|
|
|
|
/**
|
|
* pcie_device_init - allocate and initialize PCI Express port service device
|
|
* @pdev: PCI Express port to associate the service device with
|
|
* @service: Type of service to associate with the service device
|
|
* @irq: Interrupt vector to associate with the service device
|
|
*/
|
|
static int pcie_device_init(struct pci_dev *pdev, int service, int irq)
|
|
{
|
|
int retval;
|
|
struct pcie_device *pcie;
|
|
struct device *device;
|
|
|
|
pcie = kzalloc(sizeof(*pcie), GFP_KERNEL);
|
|
if (!pcie)
|
|
return -ENOMEM;
|
|
pcie->port = pdev;
|
|
pcie->irq = irq;
|
|
pcie->service = service;
|
|
|
|
/* Initialize generic device interface */
|
|
device = &pcie->device;
|
|
device->bus = &pcie_port_bus_type;
|
|
device->release = release_pcie_device; /* callback to free pcie dev */
|
|
dev_set_name(device, "%s:pcie%03x",
|
|
pci_name(pdev),
|
|
get_descriptor_id(pci_pcie_type(pdev), service));
|
|
device->parent = &pdev->dev;
|
|
device_enable_async_suspend(device);
|
|
|
|
retval = device_register(device);
|
|
if (retval) {
|
|
put_device(device);
|
|
return retval;
|
|
}
|
|
|
|
pm_runtime_no_callbacks(device);
|
|
|
|
return 0;
|
|
}
|
|
|
|
/**
|
|
* pcie_port_device_register - register PCI Express port
|
|
* @dev: PCI Express port to register
|
|
*
|
|
* Allocate the port extension structure and register services associated with
|
|
* the port.
|
|
*/
|
|
int pcie_port_device_register(struct pci_dev *dev)
|
|
{
|
|
int status, capabilities, i, nr_service;
|
|
int irqs[PCIE_PORT_DEVICE_MAXSERVICES];
|
|
|
|
/* Enable PCI Express port device */
|
|
status = pci_enable_device(dev);
|
|
if (status)
|
|
return status;
|
|
|
|
/* Get and check PCI Express port services */
|
|
capabilities = get_port_device_capability(dev);
|
|
if (!capabilities)
|
|
return 0;
|
|
|
|
pci_set_master(dev);
|
|
/*
|
|
* Initialize service irqs. Don't use service devices that
|
|
* require interrupts if there is no way to generate them.
|
|
* However, some drivers may have a polling mode (e.g. pciehp_poll_mode)
|
|
* that can be used in the absence of irqs. Allow them to determine
|
|
* if that is to be used.
|
|
*/
|
|
status = pcie_init_service_irqs(dev, irqs, capabilities);
|
|
if (status) {
|
|
capabilities &= PCIE_PORT_SERVICE_HP;
|
|
if (!capabilities)
|
|
goto error_disable;
|
|
}
|
|
|
|
/* Allocate child services if any */
|
|
status = -ENODEV;
|
|
nr_service = 0;
|
|
for (i = 0; i < PCIE_PORT_DEVICE_MAXSERVICES; i++) {
|
|
int service = 1 << i;
|
|
if (!(capabilities & service))
|
|
continue;
|
|
if (!pcie_device_init(dev, service, irqs[i]))
|
|
nr_service++;
|
|
}
|
|
if (!nr_service)
|
|
goto error_cleanup_irqs;
|
|
|
|
return 0;
|
|
|
|
error_cleanup_irqs:
|
|
pci_free_irq_vectors(dev);
|
|
error_disable:
|
|
pci_disable_device(dev);
|
|
return status;
|
|
}
|
|
|
|
#ifdef CONFIG_PM
|
|
typedef int (*pcie_pm_callback_t)(struct pcie_device *);
|
|
|
|
static int pm_iter(struct device *dev, void *data)
|
|
{
|
|
struct pcie_port_service_driver *service_driver;
|
|
size_t offset = *(size_t *)data;
|
|
pcie_pm_callback_t cb;
|
|
|
|
if ((dev->bus == &pcie_port_bus_type) && dev->driver) {
|
|
service_driver = to_service_driver(dev->driver);
|
|
cb = *(pcie_pm_callback_t *)((void *)service_driver + offset);
|
|
if (cb)
|
|
return cb(to_pcie_device(dev));
|
|
}
|
|
return 0;
|
|
}
|
|
|
|
static int get_downstream_delay(struct pci_bus *bus)
|
|
{
|
|
struct pci_dev *pdev;
|
|
int min_delay = 100;
|
|
int max_delay = 0;
|
|
|
|
list_for_each_entry(pdev, &bus->devices, bus_list) {
|
|
if (!pdev->imm_ready)
|
|
min_delay = 0;
|
|
else if (pdev->d3cold_delay < min_delay)
|
|
min_delay = pdev->d3cold_delay;
|
|
if (pdev->d3cold_delay > max_delay)
|
|
max_delay = pdev->d3cold_delay;
|
|
}
|
|
|
|
return max(min_delay, max_delay);
|
|
}
|
|
|
|
/*
|
|
* wait_for_downstream_link - Wait for downstream link to establish
|
|
* @pdev: PCIe port whose downstream link is waited
|
|
*
|
|
* Handle delays according to PCIe 4.0 section 6.6.1 before configuration
|
|
* access to the downstream component is permitted.
|
|
*
|
|
* This blocks PCI core resume of the hierarchy below this port until the
|
|
* link is trained. Should be called before resuming port services to
|
|
* prevent pciehp from starting to tear-down the hierarchy too soon.
|
|
*/
|
|
static void wait_for_downstream_link(struct pci_dev *pdev)
|
|
{
|
|
int delay;
|
|
|
|
if (pci_pcie_type(pdev) != PCI_EXP_TYPE_ROOT_PORT &&
|
|
pci_pcie_type(pdev) != PCI_EXP_TYPE_DOWNSTREAM)
|
|
return;
|
|
|
|
if (pci_dev_is_disconnected(pdev))
|
|
return;
|
|
|
|
if (!pdev->subordinate || list_empty(&pdev->subordinate->devices) ||
|
|
!pdev->bridge_d3)
|
|
return;
|
|
|
|
delay = get_downstream_delay(pdev->subordinate);
|
|
if (!delay)
|
|
return;
|
|
|
|
dev_dbg(&pdev->dev, "waiting downstream link for %d ms\n", delay);
|
|
|
|
/*
|
|
* If downstream port does not support speeds greater than 5 GT/s
|
|
* need to wait 100ms. For higher speeds (gen3) we need to wait
|
|
* first for the data link layer to become active.
|
|
*/
|
|
if (pcie_get_speed_cap(pdev) <= PCIE_SPEED_5_0GT)
|
|
msleep(delay);
|
|
else
|
|
pcie_wait_for_link_delay(pdev, true, delay);
|
|
}
|
|
|
|
/**
|
|
* pcie_port_device_suspend - suspend port services associated with a PCIe port
|
|
* @dev: PCI Express port to handle
|
|
*/
|
|
int pcie_port_device_suspend(struct device *dev)
|
|
{
|
|
size_t off = offsetof(struct pcie_port_service_driver, suspend);
|
|
return device_for_each_child(dev, &off, pm_iter);
|
|
}
|
|
|
|
int pcie_port_device_resume_noirq(struct device *dev)
|
|
{
|
|
size_t off = offsetof(struct pcie_port_service_driver, resume_noirq);
|
|
|
|
wait_for_downstream_link(to_pci_dev(dev));
|
|
return device_for_each_child(dev, &off, pm_iter);
|
|
}
|
|
|
|
/**
|
|
* pcie_port_device_resume - resume port services associated with a PCIe port
|
|
* @dev: PCI Express port to handle
|
|
*/
|
|
int pcie_port_device_resume(struct device *dev)
|
|
{
|
|
size_t off = offsetof(struct pcie_port_service_driver, resume);
|
|
return device_for_each_child(dev, &off, pm_iter);
|
|
}
|
|
|
|
/**
|
|
* pcie_port_device_runtime_suspend - runtime suspend port services
|
|
* @dev: PCI Express port to handle
|
|
*/
|
|
int pcie_port_device_runtime_suspend(struct device *dev)
|
|
{
|
|
size_t off = offsetof(struct pcie_port_service_driver, runtime_suspend);
|
|
return device_for_each_child(dev, &off, pm_iter);
|
|
}
|
|
|
|
/**
|
|
* pcie_port_device_runtime_resume - runtime resume port services
|
|
* @dev: PCI Express port to handle
|
|
*/
|
|
int pcie_port_device_runtime_resume(struct device *dev)
|
|
{
|
|
size_t off = offsetof(struct pcie_port_service_driver, runtime_resume);
|
|
|
|
wait_for_downstream_link(to_pci_dev(dev));
|
|
return device_for_each_child(dev, &off, pm_iter);
|
|
}
|
|
#endif /* PM */
|
|
|
|
static int remove_iter(struct device *dev, void *data)
|
|
{
|
|
if (dev->bus == &pcie_port_bus_type)
|
|
device_unregister(dev);
|
|
return 0;
|
|
}
|
|
|
|
static int find_service_iter(struct device *device, void *data)
|
|
{
|
|
struct pcie_port_service_driver *service_driver;
|
|
struct portdrv_service_data *pdrvs;
|
|
u32 service;
|
|
|
|
pdrvs = (struct portdrv_service_data *) data;
|
|
service = pdrvs->service;
|
|
|
|
if (device->bus == &pcie_port_bus_type && device->driver) {
|
|
service_driver = to_service_driver(device->driver);
|
|
if (service_driver->service == service) {
|
|
pdrvs->drv = service_driver;
|
|
pdrvs->dev = device;
|
|
return 1;
|
|
}
|
|
}
|
|
|
|
return 0;
|
|
}
|
|
|
|
/**
|
|
* pcie_port_find_service - find the service driver
|
|
* @dev: PCI Express port the service is associated with
|
|
* @service: Service to find
|
|
*
|
|
* Find PCI Express port service driver associated with given service
|
|
*/
|
|
struct pcie_port_service_driver *pcie_port_find_service(struct pci_dev *dev,
|
|
u32 service)
|
|
{
|
|
struct pcie_port_service_driver *drv;
|
|
struct portdrv_service_data pdrvs;
|
|
|
|
pdrvs.drv = NULL;
|
|
pdrvs.service = service;
|
|
device_for_each_child(&dev->dev, &pdrvs, find_service_iter);
|
|
|
|
drv = pdrvs.drv;
|
|
return drv;
|
|
}
|
|
|
|
/**
|
|
* pcie_port_find_device - find the struct device
|
|
* @dev: PCI Express port the service is associated with
|
|
* @service: For the service to find
|
|
*
|
|
* Find the struct device associated with given service on a pci_dev
|
|
*/
|
|
struct device *pcie_port_find_device(struct pci_dev *dev,
|
|
u32 service)
|
|
{
|
|
struct device *device;
|
|
struct portdrv_service_data pdrvs;
|
|
|
|
pdrvs.dev = NULL;
|
|
pdrvs.service = service;
|
|
device_for_each_child(&dev->dev, &pdrvs, find_service_iter);
|
|
|
|
device = pdrvs.dev;
|
|
return device;
|
|
}
|
|
EXPORT_SYMBOL_GPL(pcie_port_find_device);
|
|
|
|
/**
|
|
* pcie_port_device_remove - unregister PCI Express port service devices
|
|
* @dev: PCI Express port the service devices to unregister are associated with
|
|
*
|
|
* Remove PCI Express port service devices associated with given port and
|
|
* disable MSI-X or MSI for the port.
|
|
*/
|
|
void pcie_port_device_remove(struct pci_dev *dev)
|
|
{
|
|
device_for_each_child(&dev->dev, NULL, remove_iter);
|
|
pci_free_irq_vectors(dev);
|
|
pci_disable_device(dev);
|
|
}
|
|
|
|
/**
|
|
* pcie_port_probe_service - probe driver for given PCI Express port service
|
|
* @dev: PCI Express port service device to probe against
|
|
*
|
|
* If PCI Express port service driver is registered with
|
|
* pcie_port_service_register(), this function will be called by the driver core
|
|
* whenever match is found between the driver and a port service device.
|
|
*/
|
|
static int pcie_port_probe_service(struct device *dev)
|
|
{
|
|
struct pcie_device *pciedev;
|
|
struct pcie_port_service_driver *driver;
|
|
int status;
|
|
|
|
if (!dev || !dev->driver)
|
|
return -ENODEV;
|
|
|
|
driver = to_service_driver(dev->driver);
|
|
if (!driver || !driver->probe)
|
|
return -ENODEV;
|
|
|
|
pciedev = to_pcie_device(dev);
|
|
status = driver->probe(pciedev);
|
|
if (status)
|
|
return status;
|
|
|
|
get_device(dev);
|
|
return 0;
|
|
}
|
|
|
|
/**
|
|
* pcie_port_remove_service - detach driver from given PCI Express port service
|
|
* @dev: PCI Express port service device to handle
|
|
*
|
|
* If PCI Express port service driver is registered with
|
|
* pcie_port_service_register(), this function will be called by the driver core
|
|
* when device_unregister() is called for the port service device associated
|
|
* with the driver.
|
|
*/
|
|
static int pcie_port_remove_service(struct device *dev)
|
|
{
|
|
struct pcie_device *pciedev;
|
|
struct pcie_port_service_driver *driver;
|
|
|
|
if (!dev || !dev->driver)
|
|
return 0;
|
|
|
|
pciedev = to_pcie_device(dev);
|
|
driver = to_service_driver(dev->driver);
|
|
if (driver && driver->remove) {
|
|
driver->remove(pciedev);
|
|
put_device(dev);
|
|
}
|
|
return 0;
|
|
}
|
|
|
|
/**
 * pcie_port_shutdown_service - shut down given PCI Express port service
 * @dev: PCI Express port service device to handle
 *
 * If PCI Express port service driver is registered with
 * pcie_port_service_register(), this function will be called by the driver core
 * when device_shutdown() is called for the port service device associated
 * with the driver.
 *
 * Intentionally a no-op.
 */
static void pcie_port_shutdown_service(struct device *dev)
{
}
|
|
|
|
/**
|
|
* pcie_port_service_register - register PCI Express port service driver
|
|
* @new: PCI Express port service driver to register
|
|
*/
|
|
int pcie_port_service_register(struct pcie_port_service_driver *new)
|
|
{
|
|
if (pcie_ports_disabled)
|
|
return -ENODEV;
|
|
|
|
new->driver.name = new->name;
|
|
new->driver.bus = &pcie_port_bus_type;
|
|
new->driver.probe = pcie_port_probe_service;
|
|
new->driver.remove = pcie_port_remove_service;
|
|
new->driver.shutdown = pcie_port_shutdown_service;
|
|
|
|
return driver_register(&new->driver);
|
|
}
|
|
EXPORT_SYMBOL(pcie_port_service_register);
|
|
|
|
/**
|
|
* pcie_port_service_unregister - unregister PCI Express port service driver
|
|
* @drv: PCI Express port service driver to unregister
|
|
*/
|
|
void pcie_port_service_unregister(struct pcie_port_service_driver *drv)
|
|
{
|
|
driver_unregister(&drv->driver);
|
|
}
|
|
EXPORT_SYMBOL(pcie_port_service_unregister);
|