qemu-devel
[Top][All Lists]
Advanced

[Date Prev][Date Next][Thread Prev][Thread Next][Date Index][Thread Index]

Re: [Qemu-devel] [RFC v2 2/3] acpi-build: allocate mcfg for pxb-pcie hos


From: Marcel Apfelbaum
Subject: Re: [Qemu-devel] [RFC v2 2/3] acpi-build: allocate mcfg for pxb-pcie host bridges
Date: Wed, 20 Jun 2018 10:41:01 +0300
User-agent: Mozilla/5.0 (X11; Linux x86_64; rv:52.0) Gecko/20100101 Thunderbird/52.7.0



On 06/12/2018 12:13 PM, Zihan Yang wrote:
Allocate new segment for pxb-pcie host bridges in MCFG table, and reserve
corresponding MCFG space for them. This allows user-defined pxb-pcie
host bridges to be placed in different pci domain than q35 host

Signed-off-by: Zihan Yang <address@hidden>
---
  hw/i386/acpi-build.c                        | 97 +++++++++++++++++++++++------
  hw/i386/pc.c                                | 14 ++++-
  hw/pci-bridge/pci_expander_bridge.c         | 52 +++++++++++-----
  hw/pci-host/q35.c                           |  2 +
  include/hw/i386/pc.h                        |  1 +
  include/hw/pci-bridge/pci_expander_bridge.h |  6 ++
  include/hw/pci-host/q35.h                   |  1 +
  7 files changed, 137 insertions(+), 36 deletions(-)
  create mode 100644 include/hw/pci-bridge/pci_expander_bridge.h

diff --git a/hw/i386/acpi-build.c b/hw/i386/acpi-build.c
index 9bc6d97..104e52d 100644
--- a/hw/i386/acpi-build.c
+++ b/hw/i386/acpi-build.c
@@ -89,6 +89,8 @@
  typedef struct AcpiMcfgInfo {
      uint64_t mcfg_base;
      uint32_t mcfg_size;
+    uint32_t domain_nr;
+    struct AcpiMcfgInfo *next;
  } AcpiMcfgInfo;
typedef struct AcpiPmInfo {
@@ -2427,14 +2429,16 @@ build_mcfg_q35(GArray *table_data, BIOSLinker *linker, 
AcpiMcfgInfo *info)
  {
      AcpiTableMcfg *mcfg;
      const char *sig;
-    int len = sizeof(*mcfg) + 1 * sizeof(mcfg->allocation[0]);
+    int len, count = 0;
+    AcpiMcfgInfo *cfg = info;
+
+    while (cfg) {
+        ++count;
+        cfg = cfg->next;
+    }
+    len = sizeof(*mcfg) + count * sizeof(mcfg->allocation[0]);
mcfg = acpi_data_push(table_data, len);
-    mcfg->allocation[0].address = cpu_to_le64(info->mcfg_base);
-    /* Only a single allocation so no need to play with segments */
-    mcfg->allocation[0].pci_segment = cpu_to_le16(0);
-    mcfg->allocation[0].start_bus_number = 0;
-    mcfg->allocation[0].end_bus_number = PCIE_MMCFG_BUS(info->mcfg_size - 1);
/* MCFG is used for ECAM which can be enabled or disabled by guest.
       * To avoid table size changes (which create migration issues),
@@ -2448,6 +2452,15 @@ build_mcfg_q35(GArray *table_data, BIOSLinker *linker, 
AcpiMcfgInfo *info)
      } else {
          sig = "MCFG";
      }
+
+    while (info) {
+        mcfg[count].allocation[0].address = cpu_to_le64(info->mcfg_base);
+        mcfg[count].allocation[0].pci_segment = cpu_to_le16(info->domain_nr);
+        mcfg[count].allocation[0].start_bus_number = 0;
+        mcfg[count++].allocation[0].end_bus_number = 
PCIE_MMCFG_BUS(info->mcfg_size - 1);

I think you want to use here max_bus property defined in the prev patch.

+        info = info->next;
+    }
+
      build_header(linker, table_data, (void *)mcfg, sig, len, 1, NULL, NULL);
  }
@@ -2602,26 +2615,69 @@ struct AcpiBuildState {
      MemoryRegion *linker_mr;
  } AcpiBuildState;
-static bool acpi_get_mcfg(AcpiMcfgInfo *mcfg)
+static inline void cleanup_mcfg(AcpiMcfgInfo *mcfg)
+{
+    AcpiMcfgInfo *tmp;
+    while (mcfg) {
+        tmp = mcfg->next;
+        g_free(mcfg);
+        mcfg = tmp;
+    }
+}
+
+static AcpiMcfgInfo *acpi_get_mcfg(void)
  {
      Object *pci_host;
      QObject *o;
+    uint32_t domain_nr;
+    AcpiMcfgInfo *head = NULL, *tail, *mcfg;
pci_host = acpi_get_i386_pci_host();
      g_assert(pci_host);
- o = object_property_get_qobject(pci_host, PCIE_HOST_MCFG_BASE, NULL);
-    if (!o) {
-        return false;
+    while (pci_host) {
+        o = object_property_get_qobject(pci_host, "domain_nr", NULL);
+        if (!o) {

If every pci_host is supposed to have a domain_nr is better to assert here.

+            cleanup_mcfg(head);
+            return NULL;
+        }
+        domain_nr = qnum_get_uint(qobject_to(QNum, o));
+        qobject_unref(o);
+        /* skip q35 host and bridges that reside in the same domain with it */
+        if (domain_nr == 0) {
+            pci_host = OBJECT(QLIST_NEXT(PCI_HOST_BRIDGE(pci_host), next));
+            continue;

The default q35 pci host will not have a MMCFG?

+        }
+
+        mcfg = g_new0(AcpiMcfgInfo, 1);
+        mcfg->next = NULL;
+        if (!head) {
+            tail = head = mcfg;
+        } else {
+            tail->next = mcfg;
+            tail = mcfg;
+        }
+        mcfg->domain_nr = domain_nr;
+
+        o = object_property_get_qobject(pci_host, PCIE_HOST_MCFG_BASE, NULL);
+        assert(o);
+        mcfg->mcfg_base = qnum_get_uint(qobject_to(QNum, o));
+        qobject_unref(o);
+
+        /* firmware will overwrite it */
+        o = object_property_get_qobject(pci_host, PCIE_HOST_MCFG_SIZE, NULL);
+        assert(o);
+        mcfg->mcfg_size = qnum_get_uint(qobject_to(QNum, o));
+        qobject_unref(o);
+
+        o = object_property_get_qobject(pci_host, "domain_nr", NULL);
+        assert(o);
+        mcfg->domain_nr = qnum_get_uint(qobject_to(QNum, o));

You already have the domain_nr.

+
+        pci_host = OBJECT(QLIST_NEXT(PCI_HOST_BRIDGE(pci_host), next));
      }
-    mcfg->mcfg_base = qnum_get_uint(qobject_to(QNum, o));
-    qobject_unref(o);
- o = object_property_get_qobject(pci_host, PCIE_HOST_MCFG_SIZE, NULL);
-    assert(o);
-    mcfg->mcfg_size = qnum_get_uint(qobject_to(QNum, o));
-    qobject_unref(o);
-    return true;
+    return head;
  }
static
@@ -2633,7 +2689,7 @@ void acpi_build(AcpiBuildTables *tables, MachineState 
*machine)
      unsigned facs, dsdt, rsdt, fadt;
      AcpiPmInfo pm;
      AcpiMiscInfo misc;
-    AcpiMcfgInfo mcfg;
+    AcpiMcfgInfo *mcfg;
      Range pci_hole, pci_hole64;
      uint8_t *u;
      size_t aml_len = 0;
@@ -2714,10 +2770,11 @@ void acpi_build(AcpiBuildTables *tables, MachineState 
*machine)
              build_slit(tables_blob, tables->linker);
          }
      }
-    if (acpi_get_mcfg(&mcfg)) {
+    if ((mcfg = acpi_get_mcfg()) != NULL) {
          acpi_add_table(table_offsets, tables_blob);
-        build_mcfg_q35(tables_blob, tables->linker, &mcfg);
+        build_mcfg_q35(tables_blob, tables->linker, mcfg);
      }
+    cleanup_mcfg(mcfg);
      if (x86_iommu_get_default()) {
          IommuType IOMMUType = x86_iommu_get_type();
          if (IOMMUType == TYPE_AMD) {
diff --git a/hw/i386/pc.c b/hw/i386/pc.c
index f3befe6..95f6c34 100644
--- a/hw/i386/pc.c
+++ b/hw/i386/pc.c
@@ -34,6 +34,7 @@
  #include "hw/ide.h"
  #include "hw/pci/pci.h"
  #include "hw/pci/pci_bus.h"
+#include "hw/pci-bridge/pci_expander_bridge.h"
  #include "hw/nvram/fw_cfg.h"
  #include "hw/timer/hpet.h"
  #include "hw/smbios/smbios.h"
@@ -1469,15 +1470,24 @@ uint64_t pc_pci_hole64_start(void)
      if (pcmc->has_reserved_memory && ms->device_memory->base) {
          hole64_start = ms->device_memory->base;
          if (!pcmc->broken_reserved_end) {
-            hole64_start += memory_region_size(&ms->device_memory->mr);
+            hole64_start += (memory_region_size(&ms->device_memory->mr) + \
+                            pxb_pcie_mcfg_hole());
          }
      } else {
-        hole64_start = 0x100000000ULL + pcms->above_4g_mem_size;
+        /* memory layout [RAM Hotplug][MCFG][..ROUND UP..][PCI HOLE] */
+        hole64_start = pc_pci_mcfg_start() + pxb_pcie_mcfg_hole();
      }
return ROUND_UP(hole64_start, 1ULL << 30);
  }
+uint64_t pc_pci_mcfg_start(void)
+{
+    PCMachineState *pcms = PC_MACHINE(qdev_get_machine());
+
+    return ROUND_UP(0x100000000ULL + pcms->above_4g_mem_size, 1ULL << 12);
+}
+
  qemu_irq pc_allocate_cpu_irq(void)
  {
      return qemu_allocate_irq(pic_irq_request, NULL, 0);
diff --git a/hw/pci-bridge/pci_expander_bridge.c 
b/hw/pci-bridge/pci_expander_bridge.c
index 448b9fb..14f0447 100644
--- a/hw/pci-bridge/pci_expander_bridge.c
+++ b/hw/pci-bridge/pci_expander_bridge.c
@@ -12,11 +12,14 @@
#include "qemu/osdep.h"
  #include "qapi/error.h"
+#include "hw/i386/pc.h"
  #include "hw/pci/pci.h"
  #include "hw/pci/pci_bus.h"
  #include "hw/pci/pci_host.h"
  #include "hw/pci/pcie_host.h"
  #include "hw/pci/pci_bridge.h"
+#include "hw/pci-host/q35.h"
+#include "hw/pci-bridge/pci_expander_bridge.h"
  #include "qemu/range.h"
  #include "qemu/error-report.h"
  #include "sysemu/numa.h"
@@ -118,6 +121,25 @@ static const TypeInfo pxb_pcie_bus_info = {
      .class_init    = pxb_bus_class_init,
  };
+static uint64_t pxb_mcfg_hole_size = 0;
+

No need to initialize a static to 0.

+static void pxb_pcie_foreach(gpointer data, gpointer user_data)
+{
+    PXBDev *pxb = (PXBDev *)data;
+
+    if (pxb->sep_domain && pxb->domain_nr > 0) {
+        // only reserve what users ask for to reduce memory cost
+        pxb_mcfg_hole_size += ((pxb->max_bus + 1ULL) << 20);

Why "+ 1" ?
Please replace 20 with a MACRO explaining it.

+    }
+}
+
+uint64_t pxb_pcie_mcfg_hole(void)
+{
+    /* foreach is necessary as some pxb still reside in domain 0 */
+    g_list_foreach(pxb_dev_list, pxb_pcie_foreach, NULL);
+    return pxb_mcfg_hole_size;
+}
+
  static const char *pxb_host_root_bus_path(PCIHostState *host_bridge,
                                            PCIBus *rootbus)
  {
@@ -145,14 +167,6 @@ static const char 
*pxb_pcie_host_root_bus_path(PCIHostState *host_bridge,
      return bus->bus_path;
  }
-static void pxb_pcie_host_get_mmcfg_size(Object *obj, Visitor *v, const char *name,
-                                    void *opaque, Error **errp)
-{
-    PCIExpressHost *e = PCIE_HOST_BRIDGE(obj);
-
-    visit_type_uint64(v, name, &e->size, errp);
-}
-
  static char *pxb_host_ofw_unit_address(const SysBusDevice *dev)
  {
      const PCIHostState *pxb_host;
@@ -192,16 +206,12 @@ static void pxb_pcie_host_initfn(Object *obj)
                            "pci-conf-idx", 4);
      memory_region_init_io(&phb->data_mem, obj, &pci_host_data_le_ops, phb,
                            "pci-conf-data", 4);
-
-    object_property_add(obj, PCIE_HOST_MCFG_SIZE, "uint64",
-                         pxb_pcie_host_get_mmcfg_size,
-                         NULL, NULL, NULL, NULL);
-
  }
static Property pxb_pcie_host_props[] = {
      DEFINE_PROP_UINT64(PCIE_HOST_MCFG_BASE, PXBPCIEHost, parent_obj.base_addr,
-                        PCIE_BASE_ADDR_UNMAPPED),
+                       PCIE_BASE_ADDR_UNMAPPED),
+    DEFINE_PROP_UINT64(PCIE_HOST_MCFG_SIZE, PXBPCIEHost, parent_obj.size, 0),
      DEFINE_PROP_UINT32("domain_nr", PXBPCIEHost, domain_nr, 0),
      DEFINE_PROP_UINT8("bus_nr", PXBPCIEHost, bus_nr, 0),
      DEFINE_PROP_UINT8("max_bus", PXBPCIEHost, max_bus, 255),
@@ -301,6 +311,8 @@ static gint pxb_compare(gconstpointer a, gconstpointer b)
             0;
  }
+static uint64_t pxb_pcie_mcfg_base = 0;
+
  static void pxb_dev_realize_common(PCIDevice *dev, bool pcie, Error **errp)
  {
      PXBDev *pxb = convert_to_pxb(dev);
@@ -327,6 +339,15 @@ static void pxb_dev_realize_common(PCIDevice *dev, bool 
pcie, Error **errp)
          qdev_prop_set_uint8(ds, "bus_nr", pxb->bus_nr); //TODO.
          qdev_prop_set_uint8(ds, "max_bus", pxb->max_bus);
          qdev_prop_set_uint8(ds, "domain_nr", pxb->domain_nr);
+
+        /* will be overwritten by firmware, but kept for readability */
+        qdev_prop_set_uint64(ds, PCIE_HOST_MCFG_BASE,
+            pxb->domain_nr ? pxb_pcie_mcfg_base : 
MCH_HOST_BRIDGE_PCIEXBAR_DEFAULT);
+        qdev_prop_set_uint64(ds, PCIE_HOST_MCFG_SIZE,
+            pxb->domain_nr ? (pxb->max_bus + 1ULL) << 20 : 0);
+        if (pxb->domain_nr)
+            pxb_pcie_mcfg_base += ((pxb->max_bus + 1ULL) << 20);
+
          bus = pci_root_bus_new(ds, dev_name, NULL, NULL, 0, 
TYPE_PXB_PCIE_BUS);
      } else {
          ds = qdev_create(NULL, TYPE_PXB_HOST);
@@ -438,6 +459,9 @@ static void pxb_pcie_dev_realize(PCIDevice *dev, Error 
**errp)
          return;
      }
+ if (0 == pxb_pcie_mcfg_base)
+        pxb_pcie_mcfg_base = pc_pci_mcfg_start();
+
      pxb_dev_realize_common(dev, true, errp);
  }
diff --git a/hw/pci-host/q35.c b/hw/pci-host/q35.c
index 02f9576..a76029d 100644
--- a/hw/pci-host/q35.c
+++ b/hw/pci-host/q35.c
@@ -178,6 +178,8 @@ static Property q35_host_props[] = {
      DEFINE_PROP_SIZE(PCI_HOST_ABOVE_4G_MEM_SIZE, Q35PCIHost,
                       mch.above_4g_mem_size, 0),
      DEFINE_PROP_BOOL("x-pci-hole64-fix", Q35PCIHost, pci_hole64_fix, true),
+    /* q35 host bridge should always stay in pci domain 0 */
+    DEFINE_PROP_UINT32("domain_nr", Q35PCIHost, domain_nr, 0),
      DEFINE_PROP_END_OF_LIST(),
  };
diff --git a/include/hw/i386/pc.h b/include/hw/i386/pc.h
index 04d1f8c..81ba010 100644
--- a/include/hw/i386/pc.h
+++ b/include/hw/i386/pc.h
@@ -212,6 +212,7 @@ void pc_memory_init(PCMachineState *pcms,
                      MemoryRegion *rom_memory,
                      MemoryRegion **ram_memory);
  uint64_t pc_pci_hole64_start(void);
+uint64_t pc_pci_mcfg_start(void);
  qemu_irq pc_allocate_cpu_irq(void);
  DeviceState *pc_vga_init(ISABus *isa_bus, PCIBus *pci_bus);
  void pc_basic_device_init(ISABus *isa_bus, qemu_irq *gsi,
diff --git a/include/hw/pci-bridge/pci_expander_bridge.h 
b/include/hw/pci-bridge/pci_expander_bridge.h
new file mode 100644
index 0000000..bb1462c
--- /dev/null
+++ b/include/hw/pci-bridge/pci_expander_bridge.h
@@ -0,0 +1,6 @@
+#ifndef HW_PCI_EXPANDER_H
+#define HW_PCI_EXPANDER_H
+
+uint64_t pxb_pcie_mcfg_hole(void);
+
+#endif
diff --git a/include/hw/pci-host/q35.h b/include/hw/pci-host/q35.h
index 8f4ddde..432e569 100644
--- a/include/hw/pci-host/q35.h
+++ b/include/hw/pci-host/q35.h
@@ -69,6 +69,7 @@ typedef struct Q35PCIHost {
      /*< public >*/
bool pci_hole64_fix;
+    uint32_t domain_nr;
      MCHPCIState mch;
  } Q35PCIHost;

Thanks,
Marcel




reply via email to

[Prev in Thread] Current Thread [Next in Thread]