On Fri, Jun 23, 2023 at 10:28:43PM +0700, Bui Quang Minh wrote: > On 6/23/23 03:26, Michael S. Tsirkin wrote: > > On Mon, May 22, 2023 at 11:31:57PM +0700, Bui Quang Minh wrote: > > > This commit adds XTSup configuration to let user choose to whether enable > > > this feature or not. When XTSup is enabled, additional bytes in IRTE with > > > enabled guest virtual VAPIC are used to support 32-bit destination id. > > > > > > Additionally, this commit exports IVHD type 0x11 besides the old IVHD type > > > 0x10 in ACPI table. IVHD type 0x10 does not report full set of IOMMU > > > features only the legacy ones, so operating system (e.g. Linux) may only > > > detects x2APIC support if IVHD type 0x11 is available. The IVHD type 0x10 > > > is kept so that old operating system that only parses type 0x10 can detect > > > the IOMMU device. > > > > > > Signed-off-by: Bui Quang Minh <minhquangbu...@gmail.com> > > > --- > > > hw/i386/acpi-build.c | 127 ++++++++++++++++++++++++++----------------- > > > hw/i386/amd_iommu.c | 21 ++++++- > > > hw/i386/amd_iommu.h | 16 ++++-- > > > 3 files changed, 108 insertions(+), 56 deletions(-) > > > > > > diff --git a/hw/i386/acpi-build.c b/hw/i386/acpi-build.c > > > index 512162003b..4459122e56 100644 > > > --- a/hw/i386/acpi-build.c > > > +++ b/hw/i386/acpi-build.c > > > @@ -2339,30 +2339,23 @@ static void > > > build_amd_iommu(GArray *table_data, BIOSLinker *linker, const char > > > *oem_id, > > > const char *oem_table_id) > > > { > > > - int ivhd_table_len = 24; > > > AMDVIState *s = AMD_IOMMU_DEVICE(x86_iommu_get_default()); > > > GArray *ivhd_blob = g_array_new(false, true, 1); > > > AcpiTable table = { .sig = "IVRS", .rev = 1, .oem_id = oem_id, > > > .oem_table_id = oem_table_id }; > > > + uint64_t feature_report; > > > acpi_table_begin(&table, table_data); > > > /* IVinfo - IO virtualization information common to all > > > * IOMMU units in a system > > > */ > > > - build_append_int_noprefix(table_data, 40UL << 8/* PASize */, 4); > > > + build_append_int_noprefix(table_data, > > > + (1UL << 0) | /* EFRSup */ > > > + (40UL << 8), /* PASize */ > > > + 4); > > > /* reserved */ > > > build_append_int_noprefix(table_data, 0, 8); > > > - /* IVHD definition - type 10h */ > > > - build_append_int_noprefix(table_data, 0x10, 1); > > > - /* virtualization flags */ > > > - build_append_int_noprefix(table_data, > > > - (1UL << 0) | /* HtTunEn */ > > > - (1UL << 4) | /* iotblSup */ > > > - (1UL << 6) | /* PrefSup */ > > > - (1UL << 7), /* PPRSup */ > > > - 1); > > > - > > > /* > > > * A PCI bus walk, for each PCI host bridge, is necessary to create > > > a > > > * complete set of IVHD entries. Do this into a separate blob so > > > that we > > > @@ -2382,56 +2375,92 @@ build_amd_iommu(GArray *table_data, BIOSLinker > > > *linker, const char *oem_id, > > > build_append_int_noprefix(ivhd_blob, 0x0000001, 4); > > > } > > > - ivhd_table_len += ivhd_blob->len; > > > - > > > /* > > > * When interrupt remapping is supported, we add a special IVHD > > > device > > > - * for type IO-APIC. > > > - */ > > > - if (x86_iommu_ir_supported(x86_iommu_get_default())) { > > > - ivhd_table_len += 8; > > > - } > > > - > > > - /* IVHD length */ > > > - build_append_int_noprefix(table_data, ivhd_table_len, 2); > > > - /* DeviceID */ > > > - build_append_int_noprefix(table_data, > > > - object_property_get_int(OBJECT(&s->pci), > > > "addr", > > > - &error_abort), 2); > > > - /* Capability offset */ > > > - build_append_int_noprefix(table_data, s->pci.capab_offset, 2); > > > - /* IOMMU base address */ > > > - build_append_int_noprefix(table_data, s->mmio.addr, 8); > > > - /* PCI Segment Group */ > > > - build_append_int_noprefix(table_data, 0, 2); > > > - /* IOMMU info */ > > > - build_append_int_noprefix(table_data, 0, 2); > > > - /* IOMMU Feature Reporting */ > > > - build_append_int_noprefix(table_data, > > > - (48UL << 30) | /* HATS */ > > > - (48UL << 28) | /* GATS */ > > > - (1UL << 2) | /* GTSup */ > > > - (1UL << 6), /* GASup */ > > > - 4); > > > - > > > - /* IVHD entries as found above */ > > > - g_array_append_vals(table_data, ivhd_blob->data, ivhd_blob->len); > > > - g_array_free(ivhd_blob, TRUE); > > > - > > > - /* > > > - * Add a special IVHD device type. > > > + * for type IO-APIC > > > * Refer to spec - Table 95: IVHD device entry type codes > > > * > > > * Linux IOMMU driver checks for the special IVHD device (type > > > IO-APIC). > > > * See Linux kernel commit > > > 'c2ff5cf5294bcbd7fa50f7d860e90a66db7e5059' > > > */ > > > if (x86_iommu_ir_supported(x86_iommu_get_default())) { > > > - build_append_int_noprefix(table_data, > > > + build_append_int_noprefix(ivhd_blob, > > > (0x1ull << 56) | /* type > > > IOAPIC */ > > > (IOAPIC_SB_DEVID << 40) | /* IOAPIC > > > devid */ > > > 0x48, /* special > > > device */ > > > 8); > > > } > > > + > > > + /* IVHD definition - type 10h */ > > > + build_append_int_noprefix(table_data, 0x10, 1); > > > + /* virtualization flags */ > > > + build_append_int_noprefix(table_data, > > > + (1UL << 0) | /* HtTunEn */ > > > + (1UL << 4) | /* iotblSup */ > > > + (1UL << 6) | /* PrefSup */ > > > + (1UL << 7), /* PPRSup */ > > > + 1); > > > + > > > + /* IVHD length */ > > > + build_append_int_noprefix(table_data, ivhd_blob->len + 24, 2); > > > + /* DeviceID */ > > > + build_append_int_noprefix(table_data, > > > + object_property_get_int(OBJECT(&s->pci), > > > "addr", > > > + &error_abort), 2); > > > + /* Capability offset */ > > > + build_append_int_noprefix(table_data, s->pci.capab_offset, 2); > > > + /* IOMMU base address */ > > > + build_append_int_noprefix(table_data, s->mmio.addr, 8); > > > + /* PCI Segment Group */ > > > + build_append_int_noprefix(table_data, 0, 2); > > > + /* IOMMU info */ > > > + build_append_int_noprefix(table_data, 0, 2); > > > + /* IOMMU Feature Reporting */ > > > + feature_report = (48UL << 30) | /* HATS */ > > > + (48UL << 28) | /* GATS */ > > > + (1UL << 2) | /* GTSup */ > > > + (1UL << 6); /* GASup */ > > > + if (s->xtsup) { > > > + feature_report |= (1UL << 0); /* XTSup */ > > > + } > > > + build_append_int_noprefix(table_data, feature_report, 4); > > > + > > > + /* IVHD entries as found above */ > > > + g_array_append_vals(table_data, ivhd_blob->data, ivhd_blob->len); > > > + > > > + /* IVHD definition - type 11h */ > > > + build_append_int_noprefix(table_data, 0x11, 1); > > > + /* virtualization flags */ > > > + build_append_int_noprefix(table_data, > > > + (1UL << 0) | /* HtTunEn */ > > > + (1UL << 4), /* iotblSup */ > > > + 1); > > > + > > > + /* IVHD length */ > > > + build_append_int_noprefix(table_data, ivhd_blob->len + 40, 2); > > > + /* DeviceID */ > > > + build_append_int_noprefix(table_data, > > > + object_property_get_int(OBJECT(&s->pci), > > > "addr", > > > + &error_abort), 2); > > > + /* Capability offset */ > > > + build_append_int_noprefix(table_data, s->pci.capab_offset, 2); > > > + /* IOMMU base address */ > > > + build_append_int_noprefix(table_data, s->mmio.addr, 8); > > > + /* PCI Segment Group */ > > > + build_append_int_noprefix(table_data, 0, 2); > > > + /* IOMMU info */ > > > + build_append_int_noprefix(table_data, 0, 2); > > > + /* IOMMU Attributes */ > > > + build_append_int_noprefix(table_data, 0, 4); > > > + /* EFR Register Image */ > > > + build_append_int_noprefix(table_data, s->efr_reg, 8); > > > + /* EFR Register Image 2 */ > > > + build_append_int_noprefix(table_data, 0, 8); > > > + > > > + /* IVHD entries as found above */ > > > + g_array_append_vals(table_data, ivhd_blob->data, ivhd_blob->len); > > > + > > > + g_array_free(ivhd_blob, TRUE); > > > acpi_table_end(linker, &table); > > > } > > > diff --git a/hw/i386/amd_iommu.c b/hw/i386/amd_iommu.c > > > index 9c77304438..0e308184d7 100644 > > > --- a/hw/i386/amd_iommu.c > > > +++ b/hw/i386/amd_iommu.c > > > @@ -31,6 +31,7 @@ > > > #include "hw/i386/apic_internal.h" > > > #include "trace.h" > > > #include "hw/i386/apic-msidef.h" > > > +#include "hw/qdev-properties.h" > > > /* used AMD-Vi MMIO registers */ > > > const char *amdvi_mmio_low[] = { > > > @@ -1155,7 +1156,12 @@ static int amdvi_int_remap_ga(AMDVIState *iommu, > > > irq->vector = irte.hi.fields.vector; > > > irq->dest_mode = irte.lo.fields_remap.dm; > > > irq->redir_hint = irte.lo.fields_remap.rq_eoi; > > > - irq->dest = irte.lo.fields_remap.destination; > > > + if (iommu->xtsup) { > > > + irq->dest = irte.lo.fields_remap.destination | > > > + (irte.hi.fields.destination_hi << 24); > > > + } else { > > > + irq->dest = irte.lo.fields_remap.destination & 0xff; > > > + } > > > return 0; > > > } > > > @@ -1503,10 +1509,15 @@ static void amdvi_init(AMDVIState *s) > > > s->enabled = false; > > > s->ats_enabled = false; > > > s->cmdbuf_enabled = false; > > > + s->efr_reg = AMDVI_DEFAULT_EXT_FEATURES; > > > + > > > + if (s->xtsup) { > > > + s->efr_reg |= AMDVI_FEATURE_XT; > > > + } > > > /* reset MMIO */ > > > memset(s->mmior, 0, AMDVI_MMIO_SIZE); > > > - amdvi_set_quad(s, AMDVI_MMIO_EXT_FEATURES, AMDVI_EXT_FEATURES, > > > + amdvi_set_quad(s, AMDVI_MMIO_EXT_FEATURES, s->efr_reg, > > > 0xffffffffffffffef, 0); > > > amdvi_set_quad(s, AMDVI_MMIO_STATUS, 0, 0x98, 0x67); > > > } > > > @@ -1591,6 +1602,11 @@ static void amdvi_sysbus_realize(DeviceState *dev, > > > Error **errp) > > > amdvi_init(s); > > > } > > > +static Property amdvi_properties[] = { > > > + DEFINE_PROP_BOOL("xtsup", AMDVIState, xtsup, false), > > > + DEFINE_PROP_END_OF_LIST(), > > > +}; > > > + > > > static const VMStateDescription vmstate_amdvi_sysbus = { > > > .name = "amd-iommu", > > > .unmigratable = 1 > > > @@ -1617,6 +1633,7 @@ static void amdvi_sysbus_class_init(ObjectClass > > > *klass, void *data) > > > dc->user_creatable = true; > > > set_bit(DEVICE_CATEGORY_MISC, dc->categories); > > > dc->desc = "AMD IOMMU (AMD-Vi) DMA Remapping device"; > > > + device_class_set_props(dc, amdvi_properties); > > > } > > > static const TypeInfo amdvi_sysbus = { > > > diff --git a/hw/i386/amd_iommu.h b/hw/i386/amd_iommu.h > > > index 6da893ee57..f3730db990 100644 > > > --- a/hw/i386/amd_iommu.h > > > +++ b/hw/i386/amd_iommu.h > > > @@ -154,6 +154,7 @@ > > > #define AMDVI_FEATURE_PREFETCH (1ULL << 0) /* page prefetch > > > */ > > > #define AMDVI_FEATURE_PPR (1ULL << 1) /* PPR Support > > > */ > > > +#define AMDVI_FEATURE_XT (1ULL << 2) /* x2APIC Support > > > */ > > > #define AMDVI_FEATURE_GT (1ULL << 4) /* Guest > > > Translation */ > > > #define AMDVI_FEATURE_IA (1ULL << 6) /* inval all > > > support */ > > > #define AMDVI_FEATURE_GA (1ULL << 7) /* guest VAPIC > > > support */ > > > @@ -173,8 +174,9 @@ > > > #define AMDVI_IOTLB_MAX_SIZE 1024 > > > #define AMDVI_DEVID_SHIFT 36 > > > -/* extended feature support */ > > > -#define AMDVI_EXT_FEATURES (AMDVI_FEATURE_PREFETCH | AMDVI_FEATURE_PPR | > > > \ > > > +/* default extended feature */ > > > +#define AMDVI_DEFAULT_EXT_FEATURES \ > > > + (AMDVI_FEATURE_PREFETCH | AMDVI_FEATURE_PPR | \ > > > AMDVI_FEATURE_IA | AMDVI_FEATURE_GT | AMDVI_FEATURE_HE | \ > > > AMDVI_GATS_MODE | AMDVI_HATS_MODE | AMDVI_FEATURE_GA) > > > @@ -278,8 +280,8 @@ union irte_ga_lo { > > > dm:1, > > > /* ------ */ > > > guest_mode:1, > > > - destination:8, > > > - rsvd_1:48; > > > + destination:24, > > > + rsvd_1:32; > > > } fields_remap; > > > }; > > > @@ -287,7 +289,8 @@ union irte_ga_hi { > > > uint64_t val; > > > struct { > > > uint64_t vector:8, > > > - rsvd_2:56; > > > + rsvd_2:48, > > > + destination_hi:8; > > > } fields; > > > }; > > > @@ -366,6 +369,9 @@ struct AMDVIState { > > > /* Interrupt remapping */ > > > bool ga_enabled; > > > + bool xtsup; > > > + > > > + uint64_t efr_reg; /* extended feature register */ > > > }; > > > > It would be cleaner to have efr_reg as a function and just call it > > when needed. > > > > With that addressed: > > > > Reviewed-by: Michael S. Tsirkin <m...@redhat.com> > > You mean function like this > > uint64_t amdvi_extended_feature_register(AMDVIState *s) > { > uint64_t feature = AMDVI_DEFAULT_EXT_FEATURES; > if (s->xtsup) > feature |= AMDVI_FEATURE_XT; > > return feature; > }
Yes exactly. going to do that? > > > #endif > > > -- > > > 2.25.1 > >