qemu-devel
[Top][All Lists]
Advanced

[Date Prev][Date Next][Thread Prev][Thread Next][Date Index][Thread Index]

Re: [PATCH v4 5/5] amd_iommu: report x2APIC support to the operating system


From: Bui Quang Minh
Subject: Re: [PATCH v4 5/5] amd_iommu: report x2APIC support to the operating system
Date: Fri, 23 Jun 2023 22:28:43 +0700
User-agent: Mozilla/5.0 (X11; Linux x86_64; rv:102.0) Gecko/20100101 Thunderbird/102.11.0

On 6/23/23 03:26, Michael S. Tsirkin wrote:
On Mon, May 22, 2023 at 11:31:57PM +0700, Bui Quang Minh wrote:
This commit adds an XTSup configuration option to let the user choose whether
to enable this feature. When XTSup is enabled, additional bytes in the IRTE
(with guest VAPIC enabled) are used to support a 32-bit destination ID.

Additionally, this commit exports IVHD type 0x11 alongside the old IVHD type
0x10 in the ACPI table. IVHD type 0x10 does not report the full set of IOMMU
features, only the legacy ones, so an operating system (e.g. Linux) may only
detect x2APIC support if IVHD type 0x11 is available. IVHD type 0x10
is kept so that old operating systems that only parse type 0x10 can still
detect the IOMMU device.

Signed-off-by: Bui Quang Minh <minhquangbui99@gmail.com>
---
  hw/i386/acpi-build.c | 127 ++++++++++++++++++++++++++-----------------
  hw/i386/amd_iommu.c  |  21 ++++++-
  hw/i386/amd_iommu.h  |  16 ++++--
  3 files changed, 108 insertions(+), 56 deletions(-)

diff --git a/hw/i386/acpi-build.c b/hw/i386/acpi-build.c
index 512162003b..4459122e56 100644
--- a/hw/i386/acpi-build.c
+++ b/hw/i386/acpi-build.c
@@ -2339,30 +2339,23 @@ static void
  build_amd_iommu(GArray *table_data, BIOSLinker *linker, const char *oem_id,
                  const char *oem_table_id)
  {
-    int ivhd_table_len = 24;
      AMDVIState *s = AMD_IOMMU_DEVICE(x86_iommu_get_default());
      GArray *ivhd_blob = g_array_new(false, true, 1);
      AcpiTable table = { .sig = "IVRS", .rev = 1, .oem_id = oem_id,
                          .oem_table_id = oem_table_id };
+    uint64_t feature_report;
acpi_table_begin(&table, table_data);
      /* IVinfo - IO virtualization information common to all
       * IOMMU units in a system
       */
-    build_append_int_noprefix(table_data, 40UL << 8/* PASize */, 4);
+    build_append_int_noprefix(table_data,
+                             (1UL << 0) | /* EFRSup */
+                             (40UL << 8), /* PASize */
+                             4);
      /* reserved */
      build_append_int_noprefix(table_data, 0, 8);
- /* IVHD definition - type 10h */
-    build_append_int_noprefix(table_data, 0x10, 1);
-    /* virtualization flags */
-    build_append_int_noprefix(table_data,
-                             (1UL << 0) | /* HtTunEn      */
-                             (1UL << 4) | /* iotblSup     */
-                             (1UL << 6) | /* PrefSup      */
-                             (1UL << 7),  /* PPRSup       */
-                             1);
-
      /*
       * A PCI bus walk, for each PCI host bridge, is necessary to create a
       * complete set of IVHD entries.  Do this into a separate blob so that we
@@ -2382,56 +2375,92 @@ build_amd_iommu(GArray *table_data, BIOSLinker *linker, 
const char *oem_id,
          build_append_int_noprefix(ivhd_blob, 0x0000001, 4);
      }
- ivhd_table_len += ivhd_blob->len;
-
      /*
       * When interrupt remapping is supported, we add a special IVHD device
-     * for type IO-APIC.
-     */
-    if (x86_iommu_ir_supported(x86_iommu_get_default())) {
-        ivhd_table_len += 8;
-    }
-
-    /* IVHD length */
-    build_append_int_noprefix(table_data, ivhd_table_len, 2);
-    /* DeviceID */
-    build_append_int_noprefix(table_data,
-                              object_property_get_int(OBJECT(&s->pci), "addr",
-                                                      &error_abort), 2);
-    /* Capability offset */
-    build_append_int_noprefix(table_data, s->pci.capab_offset, 2);
-    /* IOMMU base address */
-    build_append_int_noprefix(table_data, s->mmio.addr, 8);
-    /* PCI Segment Group */
-    build_append_int_noprefix(table_data, 0, 2);
-    /* IOMMU info */
-    build_append_int_noprefix(table_data, 0, 2);
-    /* IOMMU Feature Reporting */
-    build_append_int_noprefix(table_data,
-                             (48UL << 30) | /* HATS   */
-                             (48UL << 28) | /* GATS   */
-                             (1UL << 2)   | /* GTSup  */
-                             (1UL << 6),    /* GASup  */
-                             4);
-
-    /* IVHD entries as found above */
-    g_array_append_vals(table_data, ivhd_blob->data, ivhd_blob->len);
-    g_array_free(ivhd_blob, TRUE);
-
-    /*
-     * Add a special IVHD device type.
+     * for type IO-APIC
       * Refer to spec - Table 95: IVHD device entry type codes
       *
       * Linux IOMMU driver checks for the special IVHD device (type IO-APIC).
       * See Linux kernel commit 'c2ff5cf5294bcbd7fa50f7d860e90a66db7e5059'
       */
      if (x86_iommu_ir_supported(x86_iommu_get_default())) {
-        build_append_int_noprefix(table_data,
+        build_append_int_noprefix(ivhd_blob,
                                   (0x1ull << 56) |           /* type IOAPIC */
                                   (IOAPIC_SB_DEVID << 40) |  /* IOAPIC devid */
                                   0x48,                      /* special device 
*/
                                   8);
      }
+
+    /* IVHD definition - type 10h */
+    build_append_int_noprefix(table_data, 0x10, 1);
+    /* virtualization flags */
+    build_append_int_noprefix(table_data,
+                             (1UL << 0) | /* HtTunEn      */
+                             (1UL << 4) | /* iotblSup     */
+                             (1UL << 6) | /* PrefSup      */
+                             (1UL << 7),  /* PPRSup       */
+                             1);
+
+    /* IVHD length */
+    build_append_int_noprefix(table_data, ivhd_blob->len + 24, 2);
+    /* DeviceID */
+    build_append_int_noprefix(table_data,
+                              object_property_get_int(OBJECT(&s->pci), "addr",
+                                                      &error_abort), 2);
+    /* Capability offset */
+    build_append_int_noprefix(table_data, s->pci.capab_offset, 2);
+    /* IOMMU base address */
+    build_append_int_noprefix(table_data, s->mmio.addr, 8);
+    /* PCI Segment Group */
+    build_append_int_noprefix(table_data, 0, 2);
+    /* IOMMU info */
+    build_append_int_noprefix(table_data, 0, 2);
+    /* IOMMU Feature Reporting */
+    feature_report = (48UL << 30) | /* HATS   */
+                     (48UL << 28) | /* GATS   */
+                     (1UL << 2)   | /* GTSup  */
+                     (1UL << 6);    /* GASup  */
+    if (s->xtsup) {
+        feature_report |= (1UL << 0); /* XTSup */
+    }
+    build_append_int_noprefix(table_data, feature_report, 4);
+
+    /* IVHD entries as found above */
+    g_array_append_vals(table_data, ivhd_blob->data, ivhd_blob->len);
+
+   /* IVHD definition - type 11h */
+    build_append_int_noprefix(table_data, 0x11, 1);
+    /* virtualization flags */
+    build_append_int_noprefix(table_data,
+                             (1UL << 0) | /* HtTunEn      */
+                             (1UL << 4),  /* iotblSup     */
+                             1);
+
+    /* IVHD length */
+    build_append_int_noprefix(table_data, ivhd_blob->len + 40, 2);
+    /* DeviceID */
+    build_append_int_noprefix(table_data,
+                              object_property_get_int(OBJECT(&s->pci), "addr",
+                                                      &error_abort), 2);
+    /* Capability offset */
+    build_append_int_noprefix(table_data, s->pci.capab_offset, 2);
+    /* IOMMU base address */
+    build_append_int_noprefix(table_data, s->mmio.addr, 8);
+    /* PCI Segment Group */
+    build_append_int_noprefix(table_data, 0, 2);
+    /* IOMMU info */
+    build_append_int_noprefix(table_data, 0, 2);
+    /* IOMMU Attributes */
+    build_append_int_noprefix(table_data, 0, 4);
+    /* EFR Register Image */
+    build_append_int_noprefix(table_data, s->efr_reg, 8);
+    /* EFR Register Image 2 */
+    build_append_int_noprefix(table_data, 0, 8);
+
+    /* IVHD entries as found above */
+    g_array_append_vals(table_data, ivhd_blob->data, ivhd_blob->len);
+
+    g_array_free(ivhd_blob, TRUE);
      acpi_table_end(linker, &table);
  }
diff --git a/hw/i386/amd_iommu.c b/hw/i386/amd_iommu.c
index 9c77304438..0e308184d7 100644
--- a/hw/i386/amd_iommu.c
+++ b/hw/i386/amd_iommu.c
@@ -31,6 +31,7 @@
  #include "hw/i386/apic_internal.h"
  #include "trace.h"
  #include "hw/i386/apic-msidef.h"
+#include "hw/qdev-properties.h"
/* used AMD-Vi MMIO registers */
  const char *amdvi_mmio_low[] = {
@@ -1155,7 +1156,12 @@ static int amdvi_int_remap_ga(AMDVIState *iommu,
      irq->vector = irte.hi.fields.vector;
      irq->dest_mode = irte.lo.fields_remap.dm;
      irq->redir_hint = irte.lo.fields_remap.rq_eoi;
-    irq->dest = irte.lo.fields_remap.destination;
+    if (iommu->xtsup) {
+        irq->dest = irte.lo.fields_remap.destination |
+                    (irte.hi.fields.destination_hi << 24);
+    } else {
+        irq->dest = irte.lo.fields_remap.destination & 0xff;
+    }
return 0;
  }
@@ -1503,10 +1509,15 @@ static void amdvi_init(AMDVIState *s)
      s->enabled = false;
      s->ats_enabled = false;
      s->cmdbuf_enabled = false;
+    s->efr_reg = AMDVI_DEFAULT_EXT_FEATURES;
+
+    if (s->xtsup) {
+        s->efr_reg |= AMDVI_FEATURE_XT;
+    }
/* reset MMIO */
      memset(s->mmior, 0, AMDVI_MMIO_SIZE);
-    amdvi_set_quad(s, AMDVI_MMIO_EXT_FEATURES, AMDVI_EXT_FEATURES,
+    amdvi_set_quad(s, AMDVI_MMIO_EXT_FEATURES, s->efr_reg,
              0xffffffffffffffef, 0);
      amdvi_set_quad(s, AMDVI_MMIO_STATUS, 0, 0x98, 0x67);
  }
@@ -1591,6 +1602,11 @@ static void amdvi_sysbus_realize(DeviceState *dev, Error 
**errp)
      amdvi_init(s);
  }
+static Property amdvi_properties[] = {
+    DEFINE_PROP_BOOL("xtsup", AMDVIState, xtsup, false),
+    DEFINE_PROP_END_OF_LIST(),
+};
+
  static const VMStateDescription vmstate_amdvi_sysbus = {
      .name = "amd-iommu",
      .unmigratable = 1
@@ -1617,6 +1633,7 @@ static void amdvi_sysbus_class_init(ObjectClass *klass, 
void *data)
      dc->user_creatable = true;
      set_bit(DEVICE_CATEGORY_MISC, dc->categories);
      dc->desc = "AMD IOMMU (AMD-Vi) DMA Remapping device";
+    device_class_set_props(dc, amdvi_properties);
  }
static const TypeInfo amdvi_sysbus = {
diff --git a/hw/i386/amd_iommu.h b/hw/i386/amd_iommu.h
index 6da893ee57..f3730db990 100644
--- a/hw/i386/amd_iommu.h
+++ b/hw/i386/amd_iommu.h
@@ -154,6 +154,7 @@
#define AMDVI_FEATURE_PREFETCH (1ULL << 0) /* page prefetch */
  #define AMDVI_FEATURE_PPR                 (1ULL << 1) /* PPR Support         
*/
+#define AMDVI_FEATURE_XT                  (1ULL << 2) /* x2APIC Support      */
  #define AMDVI_FEATURE_GT                  (1ULL << 4) /* Guest Translation   
*/
  #define AMDVI_FEATURE_IA                  (1ULL << 6) /* inval all support   
*/
  #define AMDVI_FEATURE_GA                  (1ULL << 7) /* guest VAPIC support 
*/
@@ -173,8 +174,9 @@
  #define AMDVI_IOTLB_MAX_SIZE 1024
  #define AMDVI_DEVID_SHIFT    36
-/* extended feature support */
-#define AMDVI_EXT_FEATURES (AMDVI_FEATURE_PREFETCH | AMDVI_FEATURE_PPR | \
+/* default extended feature */
+#define AMDVI_DEFAULT_EXT_FEATURES \
+        (AMDVI_FEATURE_PREFETCH | AMDVI_FEATURE_PPR | \
          AMDVI_FEATURE_IA | AMDVI_FEATURE_GT | AMDVI_FEATURE_HE | \
          AMDVI_GATS_MODE | AMDVI_HATS_MODE | AMDVI_FEATURE_GA)
@@ -278,8 +280,8 @@ union irte_ga_lo {
                  dm:1,
                  /* ------ */
                  guest_mode:1,
-                destination:8,
-                rsvd_1:48;
+                destination:24,
+                rsvd_1:32;
    } fields_remap;
  };
@@ -287,7 +289,8 @@ union irte_ga_hi {
    uint64_t val;
    struct {
        uint64_t  vector:8,
-                rsvd_2:56;
+                rsvd_2:48,
+                destination_hi:8;
    } fields;
  };
@@ -366,6 +369,9 @@ struct AMDVIState { /* Interrupt remapping */
      bool ga_enabled;
+    bool xtsup;
+
+    uint64_t efr_reg;            /* extended feature register */
  };

It would be cleaner to have efr_reg as a function and just call it
when needed.

With that addressed:

Reviewed-by: Michael S. Tsirkin <mst@redhat.com>

You mean a function like this?

/*
 * Compute the extended feature register value for the given IOMMU state.
 *
 * Starts from AMDVI_DEFAULT_EXT_FEATURES and additionally sets
 * AMDVI_FEATURE_XT (x2APIC support) when s->xtsup is true.
 *
 * Returns the resulting 64-bit feature mask; @s is not modified.
 */
uint64_t amdvi_extended_feature_register(AMDVIState *s)
{
    return AMDVI_DEFAULT_EXT_FEATURES | (s->xtsup ? AMDVI_FEATURE_XT : 0);
}

  #endif
--
2.25.1




reply via email to

[Prev in Thread] Current Thread [Next in Thread]