2dd9c11b9d
This patch leverages 'struct pci_host_bridge' from the PCI subsystem in order to free the pci_controller only after the last reference to its devices is dropped (avoiding an oops in pcibios_release_device() if the last reference is dropped after pcibios_free_controller()). The patch relies on pci_host_bridge.release_fn() (and .release_data), which is called automatically by the PCI subsystem when the root bus is released (i.e., the last reference is dropped). Those fields are set via pci_set_host_bridge_release() (e.g. in the platform-specific implementation of pcibios_root_bridge_prepare()). It introduces the 'pcibios_free_controller_deferred()' .release_fn() and it expects .release_data to hold a pointer to the pci_controller. The function implicitly calls 'pcibios_free_controller()', so a user must *NOT* explicitly call it if using the new _deferred() callback. The functionality is enabled for pseries (although it isn't platform specific, and may be used by cxl). Details on not-so-elegant design choices: - Use 'pci_host_bridge.release_data' field as pointer to associated 'struct pci_controller' so as *not* to call 'pci_bus_to_host(bridge->bus)' in pcibios_free_controller_deferred(). That's because pci_remove_root_bus() sets 'host_bridge->bus = NULL' (so, if the last reference is released after pci_remove_root_bus() runs, which eventually reaches pcibios_free_controller_deferred(), that would hit a null pointer dereference). The cxl/vphb.c code calls pci_remove_root_bus(), and the cxl folks are interested in this fix. Test-case #1 (hold references) # ls -ld /sys/block/sd* | grep -m1 0021:01:00.0 <...> /sys/block/sdaa -> ../devices/pci0021:01/0021:01:00.0/<...> # ls -ld /sys/block/sd* | grep -m1 0021:01:00.1 <...> /sys/block/sdab -> ../devices/pci0021:01/0021:01:00.1/<...> # cat >/dev/sdaa & pid1=$! # cat >/dev/sdab & pid2=$! # drmgr -w 5 -d 1 -c phb -s 'PHB 33' -r Validating PHB DLPAR capability...yes. 
[ 594.306719] pci_hp_remove_devices: PCI: Removing devices on bus 0021:01 [ 594.306738] pci_hp_remove_devices: Removing 0021:01:00.0... ... [ 598.236381] pci_hp_remove_devices: Removing 0021:01:00.1... ... [ 611.972077] pci_bus 0021:01: busn_res: [bus 01-ff] is released [ 611.972140] rpadlpar_io: slot PHB 33 removed # kill -9 $pid1 # kill -9 $pid2 [ 632.918088] pcibios_free_controller_deferred: domain 33, dynamic 1 Test-case #2 (don't hold references) # drmgr -w 5 -d 1 -c phb -s 'PHB 33' -r Validating PHB DLPAR capability...yes. [ 916.357363] pci_hp_remove_devices: PCI: Removing devices on bus 0021:01 [ 916.357386] pci_hp_remove_devices: Removing 0021:01:00.0... ... [ 920.566527] pci_hp_remove_devices: Removing 0021:01:00.1... ... [ 933.955873] pci_bus 0021:01: busn_res: [bus 01-ff] is released [ 933.955977] pcibios_free_controller_deferred: domain 33, dynamic 1 [ 933.955999] rpadlpar_io: slot PHB 33 removed Suggested-By: Gavin Shan <gwshan@linux.vnet.ibm.com> Signed-off-by: Mauricio Faria de Oliveira <mauricfo@linux.vnet.ibm.com> Reviewed-by: Gavin Shan <gwshan@linux.vnet.ibm.com> Reviewed-by: Andrew Donnellan <andrew.donnellan@au1.ibm.com> Tested-by: Andrew Donnellan <andrew.donnellan@au1.ibm.com> # cxl Signed-off-by: Benjamin Herrenschmidt <benh@kernel.crashing.org>
317 lines
9.7 KiB
C
317 lines
9.7 KiB
C
#ifndef _ASM_POWERPC_PCI_BRIDGE_H
|
|
#define _ASM_POWERPC_PCI_BRIDGE_H
|
|
#ifdef __KERNEL__
|
|
/*
|
|
* This program is free software; you can redistribute it and/or
|
|
* modify it under the terms of the GNU General Public License
|
|
* as published by the Free Software Foundation; either version
|
|
* 2 of the License, or (at your option) any later version.
|
|
*/
|
|
#include <linux/pci.h>
|
|
#include <linux/list.h>
|
|
#include <linux/ioport.h>
|
|
|
|
struct device_node;
|
|
|
|
/*
|
|
* PCI controller operations
|
|
*/
|
|
struct pci_controller_ops {
|
|
void (*dma_dev_setup)(struct pci_dev *pdev);
|
|
void (*dma_bus_setup)(struct pci_bus *bus);
|
|
|
|
int (*probe_mode)(struct pci_bus *bus);
|
|
|
|
/* Called when pci_enable_device() is called. Returns true to
|
|
* allow assignment/enabling of the device. */
|
|
bool (*enable_device_hook)(struct pci_dev *pdev);
|
|
|
|
void (*disable_device)(struct pci_dev *pdev);
|
|
|
|
void (*release_device)(struct pci_dev *pdev);
|
|
|
|
/* Called during PCI resource reassignment */
|
|
resource_size_t (*window_alignment)(struct pci_bus *bus,
|
|
unsigned long type);
|
|
void (*setup_bridge)(struct pci_bus *bus,
|
|
unsigned long type);
|
|
void (*reset_secondary_bus)(struct pci_dev *pdev);
|
|
|
|
#ifdef CONFIG_PCI_MSI
|
|
int (*setup_msi_irqs)(struct pci_dev *pdev,
|
|
int nvec, int type);
|
|
void (*teardown_msi_irqs)(struct pci_dev *pdev);
|
|
#endif
|
|
|
|
int (*dma_set_mask)(struct pci_dev *pdev, u64 dma_mask);
|
|
u64 (*dma_get_required_mask)(struct pci_dev *pdev);
|
|
|
|
void (*shutdown)(struct pci_controller *hose);
|
|
};
|
|
|
|
/*
|
|
* Structure of a PCI controller (host bridge)
|
|
*/
|
|
struct pci_controller {
|
|
struct pci_bus *bus;
|
|
char is_dynamic;
|
|
#ifdef CONFIG_PPC64
|
|
int node;
|
|
#endif
|
|
struct device_node *dn;
|
|
struct list_head list_node;
|
|
struct device *parent;
|
|
|
|
int first_busno;
|
|
int last_busno;
|
|
int self_busno;
|
|
struct resource busn;
|
|
|
|
void __iomem *io_base_virt;
|
|
#ifdef CONFIG_PPC64
|
|
void *io_base_alloc;
|
|
#endif
|
|
resource_size_t io_base_phys;
|
|
resource_size_t pci_io_size;
|
|
|
|
/* Some machines have a special region to forward the ISA
|
|
* "memory" cycles such as VGA memory regions. Left to 0
|
|
* if unsupported
|
|
*/
|
|
resource_size_t isa_mem_phys;
|
|
resource_size_t isa_mem_size;
|
|
|
|
struct pci_controller_ops controller_ops;
|
|
struct pci_ops *ops;
|
|
unsigned int __iomem *cfg_addr;
|
|
void __iomem *cfg_data;
|
|
|
|
/*
|
|
* Used for variants of PCI indirect handling and possible quirks:
|
|
* SET_CFG_TYPE - used on 4xx or any PHB that does explicit type0/1
|
|
* EXT_REG - provides access to PCI-e extended registers
|
|
* SURPRESS_PRIMARY_BUS - we suppress the setting of PCI_PRIMARY_BUS
|
|
* on Freescale PCI-e controllers since they used the PCI_PRIMARY_BUS
|
|
* to determine which bus number to match on when generating type0
|
|
* config cycles
|
|
* NO_PCIE_LINK - the Freescale PCI-e controllers have issues with
|
|
* hanging if we don't have link and try to do config cycles to
|
|
* anything but the PHB. Only allow talking to the PHB if this is
|
|
* set.
|
|
* BIG_ENDIAN - cfg_addr is a big endian register
|
|
* BROKEN_MRM - the 440EPx/GRx chips have an errata that causes hangs on
|
|
* the PLB4. Effectively disable MRM commands by setting this.
|
|
* FSL_CFG_REG_LINK - Freescale controller version in which the PCIe
|
|
* link status is in a RC PCIe cfg register (vs being a SoC register)
|
|
*/
|
|
#define PPC_INDIRECT_TYPE_SET_CFG_TYPE 0x00000001
|
|
#define PPC_INDIRECT_TYPE_EXT_REG 0x00000002
|
|
#define PPC_INDIRECT_TYPE_SURPRESS_PRIMARY_BUS 0x00000004
|
|
#define PPC_INDIRECT_TYPE_NO_PCIE_LINK 0x00000008
|
|
#define PPC_INDIRECT_TYPE_BIG_ENDIAN 0x00000010
|
|
#define PPC_INDIRECT_TYPE_BROKEN_MRM 0x00000020
|
|
#define PPC_INDIRECT_TYPE_FSL_CFG_REG_LINK 0x00000040
|
|
u32 indirect_type;
|
|
/* Currently, we limit ourselves to 1 IO range and 3 mem
|
|
* ranges since the common pci_bus structure can't handle more
|
|
*/
|
|
struct resource io_resource;
|
|
struct resource mem_resources[3];
|
|
resource_size_t mem_offset[3];
|
|
int global_number; /* PCI domain number */
|
|
|
|
resource_size_t dma_window_base_cur;
|
|
resource_size_t dma_window_size;
|
|
|
|
#ifdef CONFIG_PPC64
|
|
unsigned long buid;
|
|
struct pci_dn *pci_data;
|
|
#endif /* CONFIG_PPC64 */
|
|
|
|
void *private_data;
|
|
};
|
|
|
|
/* These are used for config access before all the PCI probing
|
|
has been done. */
|
|
extern int early_read_config_byte(struct pci_controller *hose, int bus,
|
|
int dev_fn, int where, u8 *val);
|
|
extern int early_read_config_word(struct pci_controller *hose, int bus,
|
|
int dev_fn, int where, u16 *val);
|
|
extern int early_read_config_dword(struct pci_controller *hose, int bus,
|
|
int dev_fn, int where, u32 *val);
|
|
extern int early_write_config_byte(struct pci_controller *hose, int bus,
|
|
int dev_fn, int where, u8 val);
|
|
extern int early_write_config_word(struct pci_controller *hose, int bus,
|
|
int dev_fn, int where, u16 val);
|
|
extern int early_write_config_dword(struct pci_controller *hose, int bus,
|
|
int dev_fn, int where, u32 val);
|
|
|
|
extern int early_find_capability(struct pci_controller *hose, int bus,
|
|
int dev_fn, int cap);
|
|
|
|
extern void setup_indirect_pci(struct pci_controller* hose,
|
|
resource_size_t cfg_addr,
|
|
resource_size_t cfg_data, u32 flags);
|
|
|
|
extern int indirect_read_config(struct pci_bus *bus, unsigned int devfn,
|
|
int offset, int len, u32 *val);
|
|
|
|
extern int __indirect_read_config(struct pci_controller *hose,
|
|
unsigned char bus_number, unsigned int devfn,
|
|
int offset, int len, u32 *val);
|
|
|
|
extern int indirect_write_config(struct pci_bus *bus, unsigned int devfn,
|
|
int offset, int len, u32 val);
|
|
|
|
static inline struct pci_controller *pci_bus_to_host(const struct pci_bus *bus)
|
|
{
|
|
return bus->sysdata;
|
|
}
|
|
|
|
#ifndef CONFIG_PPC64
|
|
|
|
/* ppc32 variants are out of line; the ppc64 one is an inline below. */
int pci_device_from_OF_node(struct device_node *node, u8 *bus, u8 *devfn);
void pci_create_OF_bus_map(void);
|
|
|
|
/*
 * ppc32 has no specific ISA handling at this stage (it all goes through
 * PCI), so no address is ever reported as an ISA I/O port.
 */
static inline int isa_vaddr_is_ioport(void __iomem *address)
{
	return 0;
}
|
|
|
|
#else /* CONFIG_PPC64 */
|
|
|
|
/*
|
|
* PCI stuff, for nodes representing PCI devices, pointed to
|
|
* by device_node->data.
|
|
*/
|
|
struct iommu_table;
|
|
|
|
struct pci_dn {
|
|
int flags;
|
|
#define PCI_DN_FLAG_IOV_VF 0x01
|
|
|
|
int busno; /* pci bus number */
|
|
int devfn; /* pci device and function number */
|
|
int vendor_id; /* Vendor ID */
|
|
int device_id; /* Device ID */
|
|
int class_code; /* Device class code */
|
|
|
|
struct pci_dn *parent;
|
|
struct pci_controller *phb; /* for pci devices */
|
|
struct iommu_table_group *table_group; /* for phb's or bridges */
|
|
struct device_node *node; /* back-pointer to the device_node */
|
|
|
|
int pci_ext_config_space; /* for pci devices */
|
|
|
|
struct pci_dev *pcidev; /* back-pointer to the pci device */
|
|
#ifdef CONFIG_EEH
|
|
struct eeh_dev *edev; /* eeh device */
|
|
#endif
|
|
#define IODA_INVALID_PE 0xFFFFFFFF
|
|
#ifdef CONFIG_PPC_POWERNV
|
|
unsigned int pe_number;
|
|
int vf_index; /* VF index in the PF */
|
|
#ifdef CONFIG_PCI_IOV
|
|
u16 vfs_expanded; /* number of VFs IOV BAR expanded */
|
|
u16 num_vfs; /* number of VFs enabled*/
|
|
unsigned int *pe_num_map; /* PE# for the first VF PE or array */
|
|
bool m64_single_mode; /* Use M64 BAR in Single Mode */
|
|
#define IODA_INVALID_M64 (-1)
|
|
int (*m64_map)[PCI_SRIOV_NUM_BARS];
|
|
#endif /* CONFIG_PCI_IOV */
|
|
int mps; /* Maximum Payload Size */
|
|
#endif
|
|
struct list_head child_list;
|
|
struct list_head list;
|
|
};
|
|
|
|
/* Get the pointer to a device_node's pci_dn (stored in dn->data) */
#define PCI_DN(dn)	((struct pci_dn *) (dn)->data)

/* pci_dn lookup, creation and removal helpers */
struct pci_dn *pci_get_pdn_by_devfn(struct pci_bus *bus, int devfn);
struct pci_dn *pci_get_pdn(struct pci_dev *pdev);
struct pci_dn *add_dev_pci_data(struct pci_dev *pdev);
void remove_dev_pci_data(struct pci_dev *pdev);
struct pci_dn *pci_add_device_node_info(struct pci_controller *hose,
					struct device_node *dn);
void pci_remove_device_node_info(struct device_node *dn);
|
|
|
|
/*
 * Report the bus and devfn numbers recorded in the pci_dn attached to @np.
 *
 * Returns 0 and fills *bus / *devfn on success, or -ENODEV (leaving both
 * outputs untouched) when @np has no pci_dn.
 */
static inline int pci_device_from_OF_node(struct device_node *np,
					  u8 *bus, u8 *devfn)
{
	struct pci_dn *pdn = PCI_DN(np);

	if (!pdn)
		return -ENODEV;

	*bus = pdn->busno;
	*devfn = pdn->devfn;

	return 0;
}
|
|
|
|
#if defined(CONFIG_EEH)
/* Map a pci_dn to its eeh_dev; a NULL pci_dn maps to NULL. */
static inline struct eeh_dev *pdn_to_eeh_dev(struct pci_dn *pdn)
{
	if (!pdn)
		return NULL;

	return pdn->edev;
}
#else
#define pdn_to_eeh_dev(x)	(NULL)
#endif
|
|
|
|
/* Find the bus corresponding to the indicated device node */
struct pci_bus *pci_find_bus_by_node(struct device_node *dn);

/* Remove all of the PCI devices under this bus */
void pci_hp_remove_devices(struct pci_bus *bus);

/* Discover new pci devices under this bus, and add them */
void pci_hp_add_devices(struct pci_bus *bus);


void isa_bridge_find_early(struct pci_controller *hose);
|
|
|
|
/*
 * Check if address hits the reserved legacy IO range, i.e. lies in
 * [ISA_IO_BASE, ISA_IO_END). Returns 1 if so, 0 otherwise.
 */
static inline int isa_vaddr_is_ioport(void __iomem *address)
{
	const unsigned long vaddr = (unsigned long)address;

	if (vaddr < ISA_IO_BASE)
		return 0;

	return vaddr < ISA_IO_END;
}
|
|
|
|
int pcibios_unmap_io_space(struct pci_bus *bus);
int pcibios_map_io_space(struct pci_bus *bus);

/*
 * Record the node of a PHB in its 'node' member. Without CONFIG_NUMA the
 * NODE argument is ignored and -1 is stored instead.
 */
#ifdef CONFIG_NUMA
#define PHB_SET_NODE(PHB, NODE)		((PHB)->node = (NODE))
#else
#define PHB_SET_NODE(PHB, NODE)		((PHB)->node = -1)
#endif
|
|
|
|
#endif /* CONFIG_PPC64 */
|
|
|
|
/* Get the PCI host controller for an OF device */
struct pci_controller *pci_find_hose_for_OF_device(struct device_node *node);

/* Fill up host controller resources from the OF node */
void pci_process_bridge_OF_ranges(struct pci_controller *hose,
				  struct device_node *dev, int primary);

/*
 * Allocate & free a PCI host bridge structure.
 *
 * Per the change that introduced it, pcibios_free_controller_deferred()
 * is intended as a pci_host_bridge release callback (installed with
 * pci_set_host_bridge_release(), release_data pointing at the
 * pci_controller). It calls pcibios_free_controller() itself, so code
 * using the deferred variant must NOT also call pcibios_free_controller().
 */
struct pci_controller *pcibios_alloc_controller(struct device_node *dev);
void pcibios_free_controller(struct pci_controller *phb);
void pcibios_free_controller_deferred(struct pci_host_bridge *bridge);
|
|
|
|
#ifdef CONFIG_PCI
|
|
extern int pcibios_vaddr_is_ioport(void __iomem *address);
|
|
#else
|
|
static inline int pcibios_vaddr_is_ioport(void __iomem *address)
|
|
{
|
|
return 0;
|
|
}
|
|
#endif /* CONFIG_PCI */
|
|
|
|
#endif /* __KERNEL__ */
|
|
#endif /* _ASM_POWERPC_PCI_BRIDGE_H */
|