When vpci fails to initialize a capability of a device, it just return error instead of catching and processing exception. That makes the entire device unusable.
So, refactor REGISTER_VPCI_INIT to contain more capability specific information, and use new functions to hide capability when initialization fails in vpci_assign_device(). Those new functions remove the failed legacy/extended capability from the emulated legacy/extended capability list. What's more, change the definition of init_header() since it is not a capability and it is needed for all devices' PCI config space. Note: call vpci_make_msix_hole() in the end of init_msix() since the change of sequence of init_header() and init_msix(). Signed-off-by: Jiqian Chen <jiqian.c...@amd.com> --- cc: "Roger Pau Monné" <roger....@citrix.com> cc: Andrew Cooper <andrew.coop...@citrix.com> cc: Anthony PERARD <anthony.per...@vates.tech> cc: Michal Orzel <michal.or...@amd.com> cc: Jan Beulich <jbeul...@suse.com> cc: Julien Grall <jul...@xen.org> cc: Stefano Stabellini <sstabell...@kernel.org> --- v1->v2 changes: * Removed the "priorities" of initializing capabilities since it isn't used anymore. * Added new function vpci_capability_mask() and vpci_ext_capability_mask() to remove failed capability from list. * Called vpci_make_msix_hole() in the end of init_msix(). Best regards, Jiqian Chen. --- xen/drivers/vpci/header.c | 3 +- xen/drivers/vpci/msi.c | 2 +- xen/drivers/vpci/msix.c | 8 +- xen/drivers/vpci/rebar.c | 2 +- xen/drivers/vpci/vpci.c | 175 +++++++++++++++++++++++++++++++------ xen/include/xen/pci_regs.h | 1 + xen/include/xen/vpci.h | 26 ++++-- xen/include/xen/xen.lds.h | 2 +- 8 files changed, 179 insertions(+), 40 deletions(-) diff --git a/xen/drivers/vpci/header.c b/xen/drivers/vpci/header.c index 6833d456566b..51a67d76ad8a 100644 --- a/xen/drivers/vpci/header.c +++ b/xen/drivers/vpci/header.c @@ -848,7 +848,7 @@ static int vpci_init_ext_capability_list(struct pci_dev *pdev) return 0; } -static int cf_check init_header(struct pci_dev *pdev) +int vpci_init_header(struct pci_dev *pdev) { uint16_t cmd; uint64_t addr, size; @@ -1044,7 +1044,6 @@ static int cf_check init_header(struct pci_dev *pdev) pci_conf_write16(pdev->sbdf, PCI_COMMAND, cmd); return rc; } -REGISTER_VPCI_INIT(init_header, VPCI_PRIORITY_MIDDLE); /* * Local variables: diff --git a/xen/drivers/vpci/msi.c b/xen/drivers/vpci/msi.c index 66e5a8a116be..ca89ae9b9c22 100644 --- a/xen/drivers/vpci/msi.c +++ b/xen/drivers/vpci/msi.c @@ -270,7 +270,7 @@ static int cf_check init_msi(struct pci_dev *pdev) return 0; } -REGISTER_VPCI_INIT(init_msi, VPCI_PRIORITY_LOW); +REGISTER_VPCI_LEGACY_CAP(PCI_CAP_ID_MSI, init_msi); void vpci_dump_msi(void) { diff --git a/xen/drivers/vpci/msix.c b/xen/drivers/vpci/msix.c index 6bd8c55bb48e..6537374c79a0 100644 --- a/xen/drivers/vpci/msix.c +++ b/xen/drivers/vpci/msix.c @@ -751,9 +751,13 @@ static int cf_check init_msix(struct pci_dev *pdev) pdev->vpci->msix = msix; list_add(&msix->next, &d->arch.hvm.msix_tables); - return 0; + spin_lock(&pdev->vpci->lock); + rc = vpci_make_msix_hole(pdev); + spin_unlock(&pdev->vpci->lock); + + return rc } -REGISTER_VPCI_INIT(init_msix, VPCI_PRIORITY_HIGH); +REGISTER_VPCI_LEGACY_CAP(PCI_CAP_ID_MSIX, init_msix); /* * Local variables: diff --git a/xen/drivers/vpci/rebar.c b/xen/drivers/vpci/rebar.c index 793937449af7..79858e5dc92f 100644 --- a/xen/drivers/vpci/rebar.c +++ b/xen/drivers/vpci/rebar.c @@ -118,7 +118,7 @@ static int cf_check init_rebar(struct pci_dev *pdev) return 0; } -REGISTER_VPCI_INIT(init_rebar, VPCI_PRIORITY_LOW); +REGISTER_VPCI_EXTEND_CAP(PCI_EXT_CAP_ID_REBAR, init_rebar); /* * Local variables: diff --git a/xen/drivers/vpci/vpci.c b/xen/drivers/vpci/vpci.c index 1e6aa5d799b9..f1f125bfdab1 100644 --- a/xen/drivers/vpci/vpci.c +++ b/xen/drivers/vpci/vpci.c @@ -35,9 +35,25 @@ struct vpci_register { uint32_t rsvdz_mask; }; +static int vpci_register_cmp(const struct vpci_register *r1, + const struct vpci_register *r2) +{ + /* Return 0 if registers overlap. */ + if ( r1->offset < r2->offset + r2->size && + r2->offset < r1->offset + r1->size ) + return 0; + if ( r1->offset < r2->offset ) + return -1; + if ( r1->offset > r2->offset ) + return 1; + + ASSERT_UNREACHABLE(); + return 0; +} + #ifdef __XEN__ -extern vpci_register_init_t *const __start_vpci_array[]; -extern vpci_register_init_t *const __end_vpci_array[]; +extern vpci_capability_t *const __start_vpci_array[]; +extern vpci_capability_t *const __end_vpci_array[]; #define NUM_VPCI_INIT (__end_vpci_array - __start_vpci_array) #ifdef CONFIG_HAS_VPCI_GUEST_SUPPORT @@ -83,6 +99,133 @@ static int assign_virtual_sbdf(struct pci_dev *pdev) #endif /* CONFIG_HAS_VPCI_GUEST_SUPPORT */ +static void vpci_capability_mask(struct pci_dev *pdev, + const unsigned int cap) +{ + const unsigned int size = 1; + const unsigned int offset = pci_find_cap_offset(pdev->sbdf, cap); + const struct vpci_register r = { .offset = offset, .size = size }; + struct vpci_register *rm; + struct vpci *vpci = pdev->vpci; + + spin_lock(&vpci->lock); + list_for_each_entry ( rm, &vpci->handlers, node ) + { + int cmp = vpci_register_cmp(&r, rm); + + if ( !cmp && rm->offset == offset && rm->size == size ) + { + struct vpci_register *pre = list_entry(rm->node.prev, + struct vpci_register, + node); + struct vpci_register *next = list_entry(rm->node.next, + struct vpci_register, + node); + + pre->private = next->private; + + /* PCI_CAP_LIST_ID register of current capability */ + list_del(&rm->node); + /* PCI_CAP_LIST_NEXT register of current capability */ + list_del(&next->node); + spin_unlock(&vpci->lock); + + xfree(rm); + xfree(next); + return; + } + if ( cmp <= 0 ) + break; + } + spin_unlock(&vpci->lock); +} + +static void vpci_ext_capability_mask(struct pci_dev *pdev, + const unsigned int cap) +{ + const unsigned int size = 4; + const unsigned int offset = pci_find_ext_capability(pdev->sbdf, cap); + const struct vpci_register r = { .offset = offset, .size = size }; + struct vpci_register *rm; + struct vpci *vpci = pdev->vpci; + + spin_lock(&vpci->lock); + list_for_each_entry ( rm, &vpci->handlers, node ) + { + int cmp = vpci_register_cmp(&r, rm); + + if ( !cmp && rm->offset == offset && rm->size == size ) + { + struct vpci_register *pre; + u32 pre_header, header = (u32)(uintptr_t)rm->private; + + if ( offset == 0x100U && PCI_EXT_CAP_NEXT(header) == 0 ) + { + rm->private = (void *)(uintptr_t)0; + spin_unlock(&vpci->lock); + return; + } + else if ( offset == 0x100U ) + { + pre = rm; + rm = list_entry(rm->node.next, struct vpci_register, node); + pre->private = rm->private; + } + else + { + pre = list_entry(rm->node.prev, struct vpci_register, node); + pre_header = (u32)(uintptr_t)pre->private; + pre->private = + (void *)(uintptr_t)((pre_header & !PCI_EXT_CAP_NEXT_MASK) | + (header & PCI_EXT_CAP_NEXT_MASK)); + } + list_del(&rm->node); + spin_unlock(&vpci->lock); + xfree(rm); + return; + } + if ( cmp <= 0 ) + break; + } + spin_unlock(&vpci->lock); +} + +static void vpci_init_capabilities(struct pci_dev *pdev) +{ + for ( unsigned int i = 0; i < NUM_VPCI_INIT; i++ ) + { + const vpci_capability_t *capability = __start_vpci_array[i]; + const unsigned int cap = capability->id; + const bool is_ext = capability->is_ext; + unsigned int pos; + int rc; + + if ( !is_hardware_domain(pdev->domain) && is_ext ) + continue; + + if ( is_ext ) + pos = pci_find_ext_capability(pdev->sbdf, cap); + else + pos = pci_find_cap_offset(pdev->sbdf, cap); + + if ( !pos ) + continue; + + rc = capability->init(pdev); + + if ( rc ) + { + printk(XENLOG_WARNING "%pd %pp: %s cap %u init fail rc=%d, mask it\n", + pdev->domain, &pdev->sbdf, + is_ext ? "extended" : "legacy", cap, rc); + if ( is_ext ) + vpci_ext_capability_mask(pdev, cap); + else + vpci_capability_mask(pdev, cap); + } + } +} + void vpci_deassign_device(struct pci_dev *pdev) { unsigned int i; @@ -128,7 +271,6 @@ void vpci_deassign_device(struct pci_dev *pdev) int vpci_assign_device(struct pci_dev *pdev) { - unsigned int i; const unsigned long *ro_map; int rc = 0; @@ -159,12 +301,11 @@ int vpci_assign_device(struct pci_dev *pdev) goto out; #endif - for ( i = 0; i < NUM_VPCI_INIT; i++ ) - { - rc = __start_vpci_array[i](pdev); - if ( rc ) - break; - } + rc = vpci_init_header(pdev); + if ( rc ) + goto out; + + vpci_init_capabilities(pdev); out: __maybe_unused; if ( rc ) @@ -174,22 +315,6 @@ int vpci_assign_device(struct pci_dev *pdev) } #endif /* __XEN__ */ -static int vpci_register_cmp(const struct vpci_register *r1, - const struct vpci_register *r2) -{ - /* Return 0 if registers overlap. */ - if ( r1->offset < r2->offset + r2->size && - r2->offset < r1->offset + r1->size ) - return 0; - if ( r1->offset < r2->offset ) - return -1; - if ( r1->offset > r2->offset ) - return 1; - - ASSERT_UNREACHABLE(); - return 0; -} - /* Dummy hooks, writes are ignored, reads return 1's */ static uint32_t cf_check vpci_ignored_read( const struct pci_dev *pdev, unsigned int reg, void *data) diff --git a/xen/include/xen/pci_regs.h b/xen/include/xen/pci_regs.h index 27b4f44eedf3..5fe6653fded4 100644 --- a/xen/include/xen/pci_regs.h +++ b/xen/include/xen/pci_regs.h @@ -449,6 +449,7 @@ #define PCI_EXT_CAP_ID(header) ((header) & 0x0000ffff) #define PCI_EXT_CAP_VER(header) (((header) >> 16) & 0xf) #define PCI_EXT_CAP_NEXT(header) (((header) >> 20) & 0xffc) +#define PCI_EXT_CAP_NEXT_MASK 0xFFC00000U #define PCI_EXT_CAP_ID_ERR 1 #define PCI_EXT_CAP_ID_VC 2 diff --git a/xen/include/xen/vpci.h b/xen/include/xen/vpci.h index 807401b2eaa2..5016ded64d89 100644 --- a/xen/include/xen/vpci.h +++ b/xen/include/xen/vpci.h @@ -13,11 +13,11 @@ typedef uint32_t vpci_read_t(const struct pci_dev *pdev, unsigned int reg, typedef void vpci_write_t(const struct pci_dev *pdev, unsigned int reg, uint32_t val, void *data); -typedef int vpci_register_init_t(struct pci_dev *dev); - -#define VPCI_PRIORITY_HIGH "1" -#define VPCI_PRIORITY_MIDDLE "5" -#define VPCI_PRIORITY_LOW "9" +typedef struct { + unsigned int id; + bool is_ext; + int (*init)(struct pci_dev *pdev); +} vpci_capability_t; #define VPCI_ECAM_BDF(addr) (((addr) & 0x0ffff000) >> 12) @@ -29,9 +29,19 @@ typedef int vpci_register_init_t(struct pci_dev *dev); */ #define VPCI_MAX_VIRT_DEV (PCI_SLOT(~0) + 1) -#define REGISTER_VPCI_INIT(x, p) \ - static vpci_register_init_t *const x##_entry \ - __used_section(".data.vpci." p) = (x) +#define REGISTER_VPCI_CAP(cap, x, ext) \ + static vpci_capability_t x##_t = { \ + .id = (cap), \ + .init = (x), \ + .is_ext = (ext), \ + }; \ + static vpci_capability_t *const x##_entry \ + __used_section(".data.vpci.") = &(x##_t) + +#define REGISTER_VPCI_LEGACY_CAP(cap, x) REGISTER_VPCI_CAP(cap, x, false) +#define REGISTER_VPCI_EXTEND_CAP(cap, x) REGISTER_VPCI_CAP(cap, x, true) + +int __must_check vpci_init_header(struct pci_dev *pdev); /* Assign vPCI to device by adding handlers. */ int __must_check vpci_assign_device(struct pci_dev *pdev); diff --git a/xen/include/xen/xen.lds.h b/xen/include/xen/xen.lds.h index 16a9b1ba03db..c73222112dd3 100644 --- a/xen/include/xen/xen.lds.h +++ b/xen/include/xen/xen.lds.h @@ -187,7 +187,7 @@ #define VPCI_ARRAY \ . = ALIGN(POINTER_ALIGN); \ __start_vpci_array = .; \ - *(SORT(.data.vpci.*)) \ + *(.data.vpci.*) \ __end_vpci_array = .; #else #define VPCI_ARRAY -- 2.34.1