qemu-devel
[Top][All Lists]
Advanced

[Date Prev][Date Next][Thread Prev][Thread Next][Date Index][Thread Index]

Re: [Qemu-devel] [PATCH v3] pci: fix pci_requester_id()


From: Michael S. Tsirkin
Subject: Re: [Qemu-devel] [PATCH v3] pci: fix pci_requester_id()
Date: Tue, 17 May 2016 10:46:12 +0300

On Tue, May 17, 2016 at 02:45:07PM +0800, Peter Xu wrote:
> This fix SID verification failure when IOMMU IR is enabled with PCI
> bridges. Existing pci_requester_id() is more like getting BDF info
> only. Renaming it to pci_get_bdf(). Meanwhile, we provide the correct
> implementation to get requester ID. VT-d spec 5.1.1 is a good reference
> to go, though it talks only about interrupt delivery, the rule works
> exactly the same for non-interrupt cases.
> 
> Currently, there are three use cases for pci_requester_id():
> 
> - PCIX status bits: here we need BDF only, not requester ID. Replacing
>   with pci_get_bdf().
> - PCIe Error injection and MSI delivery: for both these cases, we are
>   looking for requester IDs. Here we should use the new impl.
> 
> To avoid a PCI walk every time we send MSI message, one requester_id
> field is added to PCIDevice to cache the result when we use it the first
> time.  Here assumption is made that requester_id will never change
> during device lifecycle.

That's wrong though. It can change if bus number changes.

That's why I said add a pointer to the actual requester,
set it up during initialization, not on first use.


> Signed-off-by: Peter Xu <address@hidden>
> ---
>  hw/i386/kvm/pci-assign.c |  2 +-
>  hw/pci/pci.c             | 46 ++++++++++++++++++++++++++++++++++++++++++++++
>  include/hw/pci/pci.h     | 11 +++++++++--
>  3 files changed, 56 insertions(+), 3 deletions(-)
> 
> diff --git a/hw/i386/kvm/pci-assign.c b/hw/i386/kvm/pci-assign.c
> index bf425a2..c40ab36 100644
> --- a/hw/i386/kvm/pci-assign.c
> +++ b/hw/i386/kvm/pci-assign.c
> @@ -1481,7 +1481,7 @@ static int assigned_device_pci_cap_init(PCIDevice 
> *pci_dev, Error **errp)
>           * error bits, leave the rest. */
>          status = pci_get_long(pci_dev->config + pos + PCI_X_STATUS);
>          status &= ~(PCI_X_STATUS_BUS | PCI_X_STATUS_DEVFN);
> -        status |= pci_requester_id(pci_dev);
> +        status |= pci_get_bdf(pci_dev);
>          status &= ~(PCI_X_STATUS_SPL_DISC | PCI_X_STATUS_UNX_SPL |
>                      PCI_X_STATUS_SPL_ERR);
>          pci_set_long(pci_dev->config + pos + PCI_X_STATUS, status);
> diff --git a/hw/pci/pci.c b/hw/pci/pci.c
> index bb605ef..0a35255 100644
> --- a/hw/pci/pci.c
> +++ b/hw/pci/pci.c
> @@ -885,6 +885,7 @@ static PCIDevice *do_pci_register_device(PCIDevice 
> *pci_dev, PCIBus *bus,
>      }
>  
>      pci_dev->devfn = devfn;
> +    pci_dev->requester_id = 0;  /* Not cached */
>      dma_as = pci_device_iommu_address_space(pci_dev);
>  
>      memory_region_init_alias(&pci_dev->bus_master_enable_region,
> @@ -2498,6 +2499,51 @@ PCIDevice *pci_get_function_0(PCIDevice *pci_dev)
>      }
>  }
>  
> +/* Parse bridges up to the root complex and get final Requester ID
> + * for this device.  For full PCIe topology, this works exactly as
> + * what pci_get_bdf() does. However, several tricks are required
> + * when mixed up with legacy PCI devices and PCIe-to-PCI bridges. */
> +static uint16_t pci_requester_id_no_cache(PCIDevice *dev)
> +{
> +    uint8_t bus_n;
> +    uint16_t result = pci_get_bdf(dev);
> +
> +    while (!pci_bus_is_root(dev->bus)) {
> +        /* We are under PCI/PCIe bridges, fetch bus number of
> +         * current bus, which is the secondary bus number of
> +         * parent bridge. */
> +        bus_n = pci_bus_num(dev->bus);
> +        dev = dev->bus->parent_dev;
> +        if (pci_is_express(dev)) {
> +            if (pcie_cap_get_type(dev) == PCI_EXP_TYPE_PCI_BRIDGE) {
> +                /* When we pass through PCIe-to-PCI/PCIX bridges, we
> +                 * override the requester ID using secondary bus
> +                 * number of parent bridge with zeroed devfn
> +                 * (pcie-to-pci bridge spec chap 2.3). */
> +                result = PCI_BUILD_BDF(bus_n, 0);
> +            }
> +        } else {
> +            /* Legacy PCI, override requester ID with the bridge's
> +             * BDF upstream.  When the root complex connects to
> +             * legacy PCI devices (including buses), it can only
> +             * obtain requester ID info from directly attached
> +             * devices.  If devices are attached under bridges, only
> +             * the requester ID of the bridge that is directly
> +             * attached to the root complex can be recognized. */
> +            result = pci_get_bdf(dev);
> +        }
> +    }
> +    return result;
> +}
> +
> +uint16_t pci_requester_id(PCIDevice *dev)
> +{
> +    if (unlikely(!dev->requester_id)) {
> +        dev->requester_id = pci_requester_id_no_cache(dev);
> +    }
> +    return dev->requester_id;
> +}
> +
>  static const TypeInfo pci_device_type_info = {
>      .name = TYPE_PCI_DEVICE,
>      .parent = TYPE_DEVICE,
> diff --git a/include/hw/pci/pci.h b/include/hw/pci/pci.h
> index ef6ba51..cb3ab3b 100644
> --- a/include/hw/pci/pci.h
> +++ b/include/hw/pci/pci.h
> @@ -15,6 +15,7 @@
>  #define PCI_DEVFN(slot, func)   ((((slot) & 0x1f) << 3) | ((func) & 0x07))
>  #define PCI_SLOT(devfn)         (((devfn) >> 3) & 0x1f)
>  #define PCI_FUNC(devfn)         ((devfn) & 0x07)
> +#define PCI_BUILD_BDF(bus, devfn)     ((bus << 8) | (devfn))
>  #define PCI_SLOT_MAX            32
>  #define PCI_FUNC_MAX            8
>  
> @@ -252,6 +253,10 @@ struct PCIDevice {
>      /* the following fields are read only */
>      PCIBus *bus;
>      int32_t devfn;
> +    /* Cached requester ID, to avoid the PCI tree walking every time
> +     * we invoke PCI request (e.g., MSI).  For conventional PCI root
> +     * complex, this field is meaningless. */
> +    uint16_t requester_id;
>      char name[64];
>      PCIIORegion io_regions[PCI_NUM_REGIONS];
>      AddressSpace bus_master_as;
> @@ -685,11 +690,13 @@ static inline uint32_t pci_config_size(const PCIDevice 
> *d)
>      return pci_is_express(d) ? PCIE_CONFIG_SPACE_SIZE : 
> PCI_CONFIG_SPACE_SIZE;
>  }
>  
> -static inline uint16_t pci_requester_id(PCIDevice *dev)
> +static inline uint16_t pci_get_bdf(PCIDevice *dev)
>  {
> -    return (pci_bus_num(dev->bus) << 8) | dev->devfn;
> +    return PCI_BUILD_BDF(pci_bus_num(dev->bus), dev->devfn);
>  }
>  
> +uint16_t pci_requester_id(PCIDevice *dev);
> +
>  /* DMA access functions */
>  static inline AddressSpace *pci_get_address_space(PCIDevice *dev)
>  {
> -- 
> 2.4.11



reply via email to

[Prev in Thread] Current Thread [Next in Thread]