From: Rafael J. Wysocki <rjw@xxxxxxx> If MSI-X interrupt mode is used by the PCI Express port driver, too many vectors are allocated and it is not ensured that the right vectors will be used for various services. Namely, the PCI Express specification states that both PCI Express native PME and PCI Express hotplug will always use the same MSI or MSI-X message for signalling interrupts, which implies that the same vector will be used by both of them. Also, the VC service does not use interrupts at all. Moreover, is not clear which of the vectors allocated by pci_enable_msix() will be used for PME and hotplug and which of them will be used for AER if all of these services are configured. For these reasons, rework the allocation of interrupts for PCI Express ports so that at most two vectors are allocated and ensure that the right vector will be used for the right purpose. Signed-off-by: Rafael J. Wysocki <rjw@xxxxxxx> --- drivers/pci/pcie/portdrv.h | 1 drivers/pci/pcie/portdrv_core.c | 155 +++++++++++++++++++++++++++++----------- 2 files changed, 117 insertions(+), 39 deletions(-) Index: linux-2.6/drivers/pci/pcie/portdrv.h =================================================================== --- linux-2.6.orig/drivers/pci/pcie/portdrv.h +++ linux-2.6/drivers/pci/pcie/portdrv.h @@ -25,6 +25,7 @@ #define PCIE_CAPABILITIES_REG 0x2 #define PCIE_SLOT_CAPABILITIES_REG 0x14 #define PCIE_PORT_DEVICE_MAXSERVICES 4 +#define PORT_MSI_VECTOR_MASK 0x1f #define get_descriptor_id(type, service) (((type - 4) << 4) | service) Index: linux-2.6/drivers/pci/pcie/portdrv_core.c =================================================================== --- linux-2.6.orig/drivers/pci/pcie/portdrv_core.c +++ linux-2.6/drivers/pci/pcie/portdrv_core.c @@ -30,55 +30,120 @@ static void release_pcie_device(struct d } /** + * fix_up_vectors - ensure the right ordering of MSI-X interrupt vectors + * @dev: PCI Express port that is going to use the vectors + * @vectors: Array of interrupt vectors to check (2 entries) + * + * Return value: + * 0 on success, error code if the values read from config registers are not as + * expected + * + * If this function is called, we are going to use two interrupt vectors which + * may be different, but we have to make sure they are in the right order such + * that the vector to be used for PME and hotplug signalling is the first one. + * + * NOTE: The assumption here is that MSI message offset (with respect to the + * base Message Data) equal to N corresponds to index N in the array of vectors + * returned by pci_enable_msix(). + */ +static int fix_up_vectors(struct pci_dev *dev, int *vectors) +{ + int pos, offset; + int vec0, vec1; + u16 reg16; + u32 reg32; + + if (vectors[0] == vectors[1]) + return 0; + + pos = pci_find_capability(dev, PCI_CAP_ID_EXP); + pci_read_config_word(dev, pos + PCIE_CAPABILITIES_REG, ®16); + offset = (reg16 >> 9) & PORT_MSI_VECTOR_MASK; + if (offset > 1) + return -EIO; + else + vec0 = offset ? vectors[1] : vectors[0]; + + pos = pci_find_ext_capability(dev, PCI_EXT_CAP_ID_ERR); + pci_read_config_dword(dev, pos + PCI_ERR_ROOT_STATUS, ®32); + offset = (reg32 >> 27) & PORT_MSI_VECTOR_MASK; + if (offset > 1) + return -EIO; + else + vec1 = offset ? vectors[1] : vectors[0]; + + vectors[0] = vec0; + vectors[1] = vec1; + + return 0; +} + +/** + * pcie_port_enable_msix - try to set up MSI-X as interrupt mode for given port + * @dev: PCI Express port to handle + * @vectors: Array of interrupt vectors to populate (2 entries) + * @mask: Bitmask of port capabilities returned by get_port_device_capability() + * + * Return value: 0 on success, error code on failure + */ +static int pcie_port_enable_msix(struct pci_dev *dev, int *vectors, int mask) +{ + struct msix_entry msix_entries[] = {{0, 0}, {0, 1}}; + int nvec, status; + + /* + * According to the PCI Express specification both PME and PCI Express + * hotplug always use the same interrupt vector, while AER can use + * a different one. + */ + nvec = ((mask & (PCIE_PORT_SERVICE_PME | PCIE_PORT_SERVICE_HP)) + && (mask & PCIE_PORT_SERVICE_AER)) ? 2 : 1; + + status = pci_enable_msix(dev, msix_entries, nvec); + if (status) + return status; + + vectors[0] = msix_entries[0].vector; + vectors[1] = nvec > 1 ? msix_entries[1].vector : vectors[0]; + + status = fix_up_vectors(dev, vectors); + if (status) + pci_disable_msix(dev); + + return status; +} + +/** * assign_interrupt_mode - choose interrupt mode for PCI Express port services * (INTx, MSI-X, MSI) and set up vectors * @dev: PCI Express port to handle - * @vectors: Array of interrupt vectors to populate + * @vectors: Array of interrupt vectors to populate (2 entries) * @mask: Bitmask of port capabilities returned by get_port_device_capability() * * Return value: Interrupt mode associated with the port */ static int assign_interrupt_mode(struct pci_dev *dev, int *vectors, int mask) { - int i, pos, nvec, status = -EINVAL; int interrupt_mode = PCIE_PORT_NO_IRQ; - /* Set INTx as default */ - for (i = 0, nvec = 0; i < PCIE_PORT_DEVICE_MAXSERVICES; i++) { - if (mask & (1 << i)) - nvec++; - vectors[i] = dev->irq; - if (dev->pin) - interrupt_mode = PCIE_PORT_INTx_MODE; + /* Use MSI-X if supported */ + if (!pcie_port_enable_msix(dev, vectors, mask)) { + interrupt_mode = PCIE_PORT_MSIX_MODE; + goto Exit; } - /* Select MSI-X over MSI if supported */ - pos = pci_find_capability(dev, PCI_CAP_ID_MSIX); - if (pos) { - struct msix_entry msix_entries[PCIE_PORT_DEVICE_MAXSERVICES] = - {{0, 0}, {0, 1}, {0, 2}, {0, 3}}; - status = pci_enable_msix(dev, msix_entries, nvec); - if (!status) { - int j = 0; - - interrupt_mode = PCIE_PORT_MSIX_MODE; - for (i = 0; i < PCIE_PORT_DEVICE_MAXSERVICES; i++) { - if (mask & (1 << i)) - vectors[i] = msix_entries[j++].vector; - } - } - } - if (status) { - pos = pci_find_capability(dev, PCI_CAP_ID_MSI); - if (pos) { - status = pci_enable_msi(dev); - if (!status) { - interrupt_mode = PCIE_PORT_MSI_MODE; - for (i = 0;i < PCIE_PORT_DEVICE_MAXSERVICES;i++) - vectors[i] = dev->irq; - } - } - } + /* We can't use MSI-X, so try MSI and fall back to INTx */ + if (!pci_enable_msi(dev)) + interrupt_mode = PCIE_PORT_MSI_MODE; + else if (dev->pin) + interrupt_mode = PCIE_PORT_INTx_MODE; + else + goto Exit; + + vectors[0] = dev->irq; + vectors[1] = vectors[0]; + + Exit: return interrupt_mode; } @@ -205,7 +270,7 @@ int pcie_port_device_probe(struct pci_de int pcie_port_device_register(struct pci_dev *dev) { int status, type, capabilities, irq_mode, i, nr_serv; - int vectors[PCIE_PORT_DEVICE_MAXSERVICES]; + int vectors[] = { -1, -1 }; u16 reg16; /* Get port type */ @@ -229,7 +294,7 @@ int pcie_port_device_register(struct pci /* Allocate child services if any */ for (i = 0, nr_serv = 0; i < PCIE_PORT_DEVICE_MAXSERVICES; i++) { struct pcie_device *child; - int service = 1 << i; + int irq, service = 1 << i; if (!(capabilities & service)) continue; @@ -242,11 +307,23 @@ int pcie_port_device_register(struct pci && service != PCIE_PORT_SERVICE_VC) continue; + switch (service) { + case PCIE_PORT_SERVICE_PME: + case PCIE_PORT_SERVICE_HP: + irq = vectors[0]; + break; + case PCIE_PORT_SERVICE_AER: + irq = vectors[1]; + break; + default: + irq = -1; + } + child = alloc_pcie_device( dev, /* parent */ type, /* port type */ service, /* service type */ - vectors[i], /* irq */ + irq, /* interrupt vector */ irq_mode /* interrupt mode */); if (!child) continue; -- To unsubscribe from this list: send the line "unsubscribe linux-pci" in the body of a message to majordomo@xxxxxxxxxxxxxxx More majordomo info at http://vger.kernel.org/majordomo-info.html