On Mon, May 22, 2023 at 11:31:57PM +0700, Bui Quang Minh wrote: > This commit adds XTSup configuration to let user choose to whether enable > this feature or not. When XTSup is enabled, additional bytes in IRTE with > enabled guest virtual VAPIC are used to support 32-bit destination id. > > Additionally, this commit exports IVHD type 0x11 besides the old IVHD type > 0x10 in ACPI table. IVHD type 0x10 does not report full set of IOMMU > features only the legacy ones, so operating system (e.g. Linux) may only > detects x2APIC support if IVHD type 0x11 is available. The IVHD type 0x10 > is kept so that old operating system that only parses type 0x10 can detect > the IOMMU device. > > Signed-off-by: Bui Quang Minh <minhquangbu...@gmail.com> > --- > hw/i386/acpi-build.c | 127 ++++++++++++++++++++++++++----------------- > hw/i386/amd_iommu.c | 21 ++++++- > hw/i386/amd_iommu.h | 16 ++++-- > 3 files changed, 108 insertions(+), 56 deletions(-) > > diff --git a/hw/i386/acpi-build.c b/hw/i386/acpi-build.c > index 512162003b..4459122e56 100644 > --- a/hw/i386/acpi-build.c > +++ b/hw/i386/acpi-build.c > @@ -2339,30 +2339,23 @@ static void > build_amd_iommu(GArray *table_data, BIOSLinker *linker, const char *oem_id, > const char *oem_table_id) > { > - int ivhd_table_len = 24; > AMDVIState *s = AMD_IOMMU_DEVICE(x86_iommu_get_default()); > GArray *ivhd_blob = g_array_new(false, true, 1); > AcpiTable table = { .sig = "IVRS", .rev = 1, .oem_id = oem_id, > .oem_table_id = oem_table_id }; > + uint64_t feature_report; > > acpi_table_begin(&table, table_data); > /* IVinfo - IO virtualization information common to all > * IOMMU units in a system > */ > - build_append_int_noprefix(table_data, 40UL << 8/* PASize */, 4); > + build_append_int_noprefix(table_data, > + (1UL << 0) | /* EFRSup */ > + (40UL << 8), /* PASize */ > + 4); > /* reserved */ > build_append_int_noprefix(table_data, 0, 8); > > - /* IVHD definition - type 10h */ > - build_append_int_noprefix(table_data, 0x10, 1); > - /* virtualization flags */ > - build_append_int_noprefix(table_data, > - (1UL << 0) | /* HtTunEn */ > - (1UL << 4) | /* iotblSup */ > - (1UL << 6) | /* PrefSup */ > - (1UL << 7), /* PPRSup */ > - 1); > - > /* > * A PCI bus walk, for each PCI host bridge, is necessary to create a > * complete set of IVHD entries. Do this into a separate blob so that we > @@ -2382,56 +2375,92 @@ build_amd_iommu(GArray *table_data, BIOSLinker > *linker, const char *oem_id, > build_append_int_noprefix(ivhd_blob, 0x0000001, 4); > } > > - ivhd_table_len += ivhd_blob->len; > - > /* > * When interrupt remapping is supported, we add a special IVHD device > - * for type IO-APIC. > - */ > - if (x86_iommu_ir_supported(x86_iommu_get_default())) { > - ivhd_table_len += 8; > - } > - > - /* IVHD length */ > - build_append_int_noprefix(table_data, ivhd_table_len, 2); > - /* DeviceID */ > - build_append_int_noprefix(table_data, > - object_property_get_int(OBJECT(&s->pci), > "addr", > - &error_abort), 2); > - /* Capability offset */ > - build_append_int_noprefix(table_data, s->pci.capab_offset, 2); > - /* IOMMU base address */ > - build_append_int_noprefix(table_data, s->mmio.addr, 8); > - /* PCI Segment Group */ > - build_append_int_noprefix(table_data, 0, 2); > - /* IOMMU info */ > - build_append_int_noprefix(table_data, 0, 2); > - /* IOMMU Feature Reporting */ > - build_append_int_noprefix(table_data, > - (48UL << 30) | /* HATS */ > - (48UL << 28) | /* GATS */ > - (1UL << 2) | /* GTSup */ > - (1UL << 6), /* GASup */ > - 4); > - > - /* IVHD entries as found above */ > - g_array_append_vals(table_data, ivhd_blob->data, ivhd_blob->len); > - g_array_free(ivhd_blob, TRUE); > - > - /* > - * Add a special IVHD device type. > + * for type IO-APIC > * Refer to spec - Table 95: IVHD device entry type codes > * > * Linux IOMMU driver checks for the special IVHD device (type IO-APIC). > * See Linux kernel commit 'c2ff5cf5294bcbd7fa50f7d860e90a66db7e5059' > */ > if (x86_iommu_ir_supported(x86_iommu_get_default())) { > - build_append_int_noprefix(table_data, > + build_append_int_noprefix(ivhd_blob, > (0x1ull << 56) | /* type IOAPIC */ > (IOAPIC_SB_DEVID << 40) | /* IOAPIC devid > */ > 0x48, /* special > device */ > 8); > } > + > + /* IVHD definition - type 10h */ > + build_append_int_noprefix(table_data, 0x10, 1); > + /* virtualization flags */ > + build_append_int_noprefix(table_data, > + (1UL << 0) | /* HtTunEn */ > + (1UL << 4) | /* iotblSup */ > + (1UL << 6) | /* PrefSup */ > + (1UL << 7), /* PPRSup */ > + 1); > + > + /* IVHD length */ > + build_append_int_noprefix(table_data, ivhd_blob->len + 24, 2); > + /* DeviceID */ > + build_append_int_noprefix(table_data, > + object_property_get_int(OBJECT(&s->pci), > "addr", > + &error_abort), 2); > + /* Capability offset */ > + build_append_int_noprefix(table_data, s->pci.capab_offset, 2); > + /* IOMMU base address */ > + build_append_int_noprefix(table_data, s->mmio.addr, 8); > + /* PCI Segment Group */ > + build_append_int_noprefix(table_data, 0, 2); > + /* IOMMU info */ > + build_append_int_noprefix(table_data, 0, 2); > + /* IOMMU Feature Reporting */ > + feature_report = (48UL << 30) | /* HATS */ > + (48UL << 28) | /* GATS */ > + (1UL << 2) | /* GTSup */ > + (1UL << 6); /* GASup */ > + if (s->xtsup) { > + feature_report |= (1UL << 0); /* XTSup */ > + } > + build_append_int_noprefix(table_data, feature_report, 4); > + > + /* IVHD entries as found above */ > + g_array_append_vals(table_data, ivhd_blob->data, ivhd_blob->len); > + > + /* IVHD definition - type 11h */ > + build_append_int_noprefix(table_data, 0x11, 1); > + /* virtualization flags */ > + build_append_int_noprefix(table_data, > + (1UL << 0) | /* HtTunEn */ > + (1UL << 4), /* iotblSup */ > + 1); > + > + /* IVHD length */ > + build_append_int_noprefix(table_data, ivhd_blob->len + 40, 2); > + /* DeviceID */ > + build_append_int_noprefix(table_data, > + object_property_get_int(OBJECT(&s->pci), > "addr", > + &error_abort), 2); > + /* Capability offset */ > + build_append_int_noprefix(table_data, s->pci.capab_offset, 2); > + /* IOMMU base address */ > + build_append_int_noprefix(table_data, s->mmio.addr, 8); > + /* PCI Segment Group */ > + build_append_int_noprefix(table_data, 0, 2); > + /* IOMMU info */ > + build_append_int_noprefix(table_data, 0, 2); > + /* IOMMU Attributes */ > + build_append_int_noprefix(table_data, 0, 4); > + /* EFR Register Image */ > + build_append_int_noprefix(table_data, s->efr_reg, 8); > + /* EFR Register Image 2 */ > + build_append_int_noprefix(table_data, 0, 8); > + > + /* IVHD entries as found above */ > + g_array_append_vals(table_data, ivhd_blob->data, ivhd_blob->len); > + > + g_array_free(ivhd_blob, TRUE); > acpi_table_end(linker, &table); > } > > diff --git a/hw/i386/amd_iommu.c b/hw/i386/amd_iommu.c > index 9c77304438..0e308184d7 100644 > --- a/hw/i386/amd_iommu.c > +++ b/hw/i386/amd_iommu.c > @@ -31,6 +31,7 @@ > #include "hw/i386/apic_internal.h" > #include "trace.h" > #include "hw/i386/apic-msidef.h" > +#include "hw/qdev-properties.h" > > /* used AMD-Vi MMIO registers */ > const char *amdvi_mmio_low[] = { > @@ -1155,7 +1156,12 @@ static int amdvi_int_remap_ga(AMDVIState *iommu, > irq->vector = irte.hi.fields.vector; > irq->dest_mode = irte.lo.fields_remap.dm; > irq->redir_hint = irte.lo.fields_remap.rq_eoi; > - irq->dest = irte.lo.fields_remap.destination; > + if (iommu->xtsup) { > + irq->dest = irte.lo.fields_remap.destination | > + (irte.hi.fields.destination_hi << 24); > + } else { > + irq->dest = irte.lo.fields_remap.destination & 0xff; > + } > > return 0; > } > @@ -1503,10 +1509,15 @@ static void amdvi_init(AMDVIState *s) > s->enabled = false; > s->ats_enabled = false; > s->cmdbuf_enabled = false; > + s->efr_reg = AMDVI_DEFAULT_EXT_FEATURES; > + > + if (s->xtsup) { > + s->efr_reg |= AMDVI_FEATURE_XT; > + } > > /* reset MMIO */ > memset(s->mmior, 0, AMDVI_MMIO_SIZE); > - amdvi_set_quad(s, AMDVI_MMIO_EXT_FEATURES, AMDVI_EXT_FEATURES, > + amdvi_set_quad(s, AMDVI_MMIO_EXT_FEATURES, s->efr_reg, > 0xffffffffffffffef, 0); > amdvi_set_quad(s, AMDVI_MMIO_STATUS, 0, 0x98, 0x67); > } > @@ -1591,6 +1602,11 @@ static void amdvi_sysbus_realize(DeviceState *dev, > Error **errp) > amdvi_init(s); > } > > +static Property amdvi_properties[] = { > + DEFINE_PROP_BOOL("xtsup", AMDVIState, xtsup, false), > + DEFINE_PROP_END_OF_LIST(), > +}; > + > static const VMStateDescription vmstate_amdvi_sysbus = { > .name = "amd-iommu", > .unmigratable = 1 > @@ -1617,6 +1633,7 @@ static void amdvi_sysbus_class_init(ObjectClass *klass, > void *data) > dc->user_creatable = true; > set_bit(DEVICE_CATEGORY_MISC, dc->categories); > dc->desc = "AMD IOMMU (AMD-Vi) DMA Remapping device"; > + device_class_set_props(dc, amdvi_properties); > } > > static const TypeInfo amdvi_sysbus = { > diff --git a/hw/i386/amd_iommu.h b/hw/i386/amd_iommu.h > index 6da893ee57..f3730db990 100644 > --- a/hw/i386/amd_iommu.h > +++ b/hw/i386/amd_iommu.h > @@ -154,6 +154,7 @@ > > #define AMDVI_FEATURE_PREFETCH (1ULL << 0) /* page prefetch > */ > #define AMDVI_FEATURE_PPR (1ULL << 1) /* PPR Support > */ > +#define AMDVI_FEATURE_XT (1ULL << 2) /* x2APIC Support > */ > #define AMDVI_FEATURE_GT (1ULL << 4) /* Guest Translation > */ > #define AMDVI_FEATURE_IA (1ULL << 6) /* inval all support > */ > #define AMDVI_FEATURE_GA (1ULL << 7) /* guest VAPIC support > */ > @@ -173,8 +174,9 @@ > #define AMDVI_IOTLB_MAX_SIZE 1024 > #define AMDVI_DEVID_SHIFT 36 > > -/* extended feature support */ > -#define AMDVI_EXT_FEATURES (AMDVI_FEATURE_PREFETCH | AMDVI_FEATURE_PPR | \ > +/* default extended feature */ > +#define AMDVI_DEFAULT_EXT_FEATURES \ > + (AMDVI_FEATURE_PREFETCH | AMDVI_FEATURE_PPR | \ > AMDVI_FEATURE_IA | AMDVI_FEATURE_GT | AMDVI_FEATURE_HE | \ > AMDVI_GATS_MODE | AMDVI_HATS_MODE | AMDVI_FEATURE_GA) > > @@ -278,8 +280,8 @@ union irte_ga_lo { > dm:1, > /* ------ */ > guest_mode:1, > - destination:8, > - rsvd_1:48; > + destination:24, > + rsvd_1:32; > } fields_remap; > }; > > @@ -287,7 +289,8 @@ union irte_ga_hi { > uint64_t val; > struct { > uint64_t vector:8, > - rsvd_2:56; > + rsvd_2:48, > + destination_hi:8; > } fields; > }; > > @@ -366,6 +369,9 @@ struct AMDVIState { > > /* Interrupt remapping */ > bool ga_enabled; > + bool xtsup; > + > + uint64_t efr_reg; /* extended feature register */ > };
It would be cleaner to have efr_reg as a function and just call it when needed. With that addressed: Reviewed-by: Michael S. Tsirkin <m...@redhat.com> > #endif > -- > 2.25.1