qemu-devel.nongnu.org archive mirror
 help / color / mirror / Atom feed
From: Marcel Apfelbaum <marcel.apfelbaum@gmail.com>
To: Zihan Yang <whois.zihan.yang@gmail.com>, qemu-devel@nongnu.org
Cc: "Michael S. Tsirkin" <mst@redhat.com>,
	Igor Mammedov <imammedo@redhat.com>,
	Paolo Bonzini <pbonzini@redhat.com>,
	Richard Henderson <rth@twiddle.net>,
	Eduardo Habkost <ehabkost@redhat.com>
Subject: Re: [Qemu-devel] [RFC v2 2/3] acpi-build: allocate mcfg for pxb-pcie host bridges
Date: Wed, 20 Jun 2018 10:41:01 +0300	[thread overview]
Message-ID: <a6014b3a-0e1c-47e6-7b10-4873358864c3@gmail.com> (raw)
In-Reply-To: <1528794804-6289-2-git-send-email-whois.zihan.yang@gmail.com>



On 06/12/2018 12:13 PM, Zihan Yang wrote:
> Allocate new segment for pxb-pcie host bridges in MCFG table, and reserve
> corresponding MCFG space for them. This allows user-defined pxb-pcie
> host bridges to be placed in different pci domain than q35 host
>
> Signed-off-by: Zihan Yang <whois.zihan.yang@gmail.com>
> ---
>   hw/i386/acpi-build.c                        | 97 +++++++++++++++++++++++------
>   hw/i386/pc.c                                | 14 ++++-
>   hw/pci-bridge/pci_expander_bridge.c         | 52 +++++++++++-----
>   hw/pci-host/q35.c                           |  2 +
>   include/hw/i386/pc.h                        |  1 +
>   include/hw/pci-bridge/pci_expander_bridge.h |  6 ++
>   include/hw/pci-host/q35.h                   |  1 +
>   7 files changed, 137 insertions(+), 36 deletions(-)
>   create mode 100644 include/hw/pci-bridge/pci_expander_bridge.h
>
> diff --git a/hw/i386/acpi-build.c b/hw/i386/acpi-build.c
> index 9bc6d97..104e52d 100644
> --- a/hw/i386/acpi-build.c
> +++ b/hw/i386/acpi-build.c
> @@ -89,6 +89,8 @@
>   typedef struct AcpiMcfgInfo {
>       uint64_t mcfg_base;
>       uint32_t mcfg_size;
> +    uint32_t domain_nr;
> +    struct AcpiMcfgInfo *next;
>   } AcpiMcfgInfo;
>   
>   typedef struct AcpiPmInfo {
> @@ -2427,14 +2429,16 @@ build_mcfg_q35(GArray *table_data, BIOSLinker *linker, AcpiMcfgInfo *info)
>   {
>       AcpiTableMcfg *mcfg;
>       const char *sig;
> -    int len = sizeof(*mcfg) + 1 * sizeof(mcfg->allocation[0]);
> +    int len, count = 0;
> +    AcpiMcfgInfo *cfg = info;
> +
> +    while (cfg) {
> +        ++count;
> +        cfg = cfg->next;
> +    }
> +    len = sizeof(*mcfg) + count * sizeof(mcfg->allocation[0]);
>   
>       mcfg = acpi_data_push(table_data, len);
> -    mcfg->allocation[0].address = cpu_to_le64(info->mcfg_base);
> -    /* Only a single allocation so no need to play with segments */
> -    mcfg->allocation[0].pci_segment = cpu_to_le16(0);
> -    mcfg->allocation[0].start_bus_number = 0;
> -    mcfg->allocation[0].end_bus_number = PCIE_MMCFG_BUS(info->mcfg_size - 1);
>   
>       /* MCFG is used for ECAM which can be enabled or disabled by guest.
>        * To avoid table size changes (which create migration issues),
> @@ -2448,6 +2452,15 @@ build_mcfg_q35(GArray *table_data, BIOSLinker *linker, AcpiMcfgInfo *info)
>       } else {
>           sig = "MCFG";
>       }
> +
> +    while (info) {
> +        mcfg[count].allocation[0].address = cpu_to_le64(info->mcfg_base);
> +        mcfg[count].allocation[0].pci_segment = cpu_to_le16(info->domain_nr);
> +        mcfg[count].allocation[0].start_bus_number = 0;
> +        mcfg[count++].allocation[0].end_bus_number = PCIE_MMCFG_BUS(info->mcfg_size - 1);

I think you want to use here max_bus property defined in the prev patch.

> +        info = info->next;
> +    }
> +
>       build_header(linker, table_data, (void *)mcfg, sig, len, 1, NULL, NULL);
>   }
>   
> @@ -2602,26 +2615,69 @@ struct AcpiBuildState {
>       MemoryRegion *linker_mr;
>   } AcpiBuildState;
>   
> -static bool acpi_get_mcfg(AcpiMcfgInfo *mcfg)
> +static inline void cleanup_mcfg(AcpiMcfgInfo *mcfg)
> +{
> +    AcpiMcfgInfo *tmp;
> +    while (mcfg) {
> +        tmp = mcfg->next;
> +        g_free(mcfg);
> +        mcfg = tmp;
> +    }
> +}
> +
> +static AcpiMcfgInfo *acpi_get_mcfg(void)
>   {
>       Object *pci_host;
>       QObject *o;
> +    uint32_t domain_nr;
> +    AcpiMcfgInfo *head = NULL, *tail, *mcfg;
>   
>       pci_host = acpi_get_i386_pci_host();
>       g_assert(pci_host);
>   
> -    o = object_property_get_qobject(pci_host, PCIE_HOST_MCFG_BASE, NULL);
> -    if (!o) {
> -        return false;
> +    while (pci_host) {
> +        o = object_property_get_qobject(pci_host, "domain_nr", NULL);
> +        if (!o) {

If every pci_host is supposed to have a domain_nr is better to assert here.

> +            cleanup_mcfg(head);
> +            return NULL;
> +        }
> +        domain_nr = qnum_get_uint(qobject_to(QNum, o));
> +        qobject_unref(o);
> +        /* skip q35 host and bridges that reside in the same domain with it */
> +        if (domain_nr == 0) {
> +            pci_host = OBJECT(QLIST_NEXT(PCI_HOST_BRIDGE(pci_host), next));
> +            continue;

The default q35 pci host will not have a MMCFG?

> +        }
> +
> +        mcfg = g_new0(AcpiMcfgInfo, 1);
> +        mcfg->next = NULL;
> +        if (!head) {
> +            tail = head = mcfg;
> +        } else {
> +            tail->next = mcfg;
> +            tail = mcfg;
> +        }
> +        mcfg->domain_nr = domain_nr;
> +
> +        o = object_property_get_qobject(pci_host, PCIE_HOST_MCFG_BASE, NULL);
> +        assert(o);
> +        mcfg->mcfg_base = qnum_get_uint(qobject_to(QNum, o));
> +        qobject_unref(o);
> +
> +        /* firmware will overwrite it */
> +        o = object_property_get_qobject(pci_host, PCIE_HOST_MCFG_SIZE, NULL);
> +        assert(o);
> +        mcfg->mcfg_size = qnum_get_uint(qobject_to(QNum, o));
> +        qobject_unref(o);
> +
> +        o = object_property_get_qobject(pci_host, "domain_nr", NULL);
> +        assert(o);
> +        mcfg->domain_nr = qnum_get_uint(qobject_to(QNum, o));

You already have the domain_nr.

> +
> +        pci_host = OBJECT(QLIST_NEXT(PCI_HOST_BRIDGE(pci_host), next));
>       }
> -    mcfg->mcfg_base = qnum_get_uint(qobject_to(QNum, o));
> -    qobject_unref(o);
>   
> -    o = object_property_get_qobject(pci_host, PCIE_HOST_MCFG_SIZE, NULL);
> -    assert(o);
> -    mcfg->mcfg_size = qnum_get_uint(qobject_to(QNum, o));
> -    qobject_unref(o);
> -    return true;
> +    return head;
>   }
>   
>   static
> @@ -2633,7 +2689,7 @@ void acpi_build(AcpiBuildTables *tables, MachineState *machine)
>       unsigned facs, dsdt, rsdt, fadt;
>       AcpiPmInfo pm;
>       AcpiMiscInfo misc;
> -    AcpiMcfgInfo mcfg;
> +    AcpiMcfgInfo *mcfg;
>       Range pci_hole, pci_hole64;
>       uint8_t *u;
>       size_t aml_len = 0;
> @@ -2714,10 +2770,11 @@ void acpi_build(AcpiBuildTables *tables, MachineState *machine)
>               build_slit(tables_blob, tables->linker);
>           }
>       }
> -    if (acpi_get_mcfg(&mcfg)) {
> +    if ((mcfg = acpi_get_mcfg()) != NULL) {
>           acpi_add_table(table_offsets, tables_blob);
> -        build_mcfg_q35(tables_blob, tables->linker, &mcfg);
> +        build_mcfg_q35(tables_blob, tables->linker, mcfg);
>       }
> +    cleanup_mcfg(mcfg);
>       if (x86_iommu_get_default()) {
>           IommuType IOMMUType = x86_iommu_get_type();
>           if (IOMMUType == TYPE_AMD) {
> diff --git a/hw/i386/pc.c b/hw/i386/pc.c
> index f3befe6..95f6c34 100644
> --- a/hw/i386/pc.c
> +++ b/hw/i386/pc.c
> @@ -34,6 +34,7 @@
>   #include "hw/ide.h"
>   #include "hw/pci/pci.h"
>   #include "hw/pci/pci_bus.h"
> +#include "hw/pci-bridge/pci_expander_bridge.h"
>   #include "hw/nvram/fw_cfg.h"
>   #include "hw/timer/hpet.h"
>   #include "hw/smbios/smbios.h"
> @@ -1469,15 +1470,24 @@ uint64_t pc_pci_hole64_start(void)
>       if (pcmc->has_reserved_memory && ms->device_memory->base) {
>           hole64_start = ms->device_memory->base;
>           if (!pcmc->broken_reserved_end) {
> -            hole64_start += memory_region_size(&ms->device_memory->mr);
> +            hole64_start += (memory_region_size(&ms->device_memory->mr) + \
> +                            pxb_pcie_mcfg_hole());
>           }
>       } else {
> -        hole64_start = 0x100000000ULL + pcms->above_4g_mem_size;
> +        /* memory layout [RAM Hotplug][MCFG][..ROUND UP..][PCI HOLE] */
> +        hole64_start = pc_pci_mcfg_start() + pxb_pcie_mcfg_hole();
>       }
>   
>       return ROUND_UP(hole64_start, 1ULL << 30);
>   }
>   
> +uint64_t pc_pci_mcfg_start(void)
> +{
> +    PCMachineState *pcms = PC_MACHINE(qdev_get_machine());
> +
> +    return ROUND_UP(0x100000000ULL + pcms->above_4g_mem_size, 1ULL << 12);
> +}
> +
>   qemu_irq pc_allocate_cpu_irq(void)
>   {
>       return qemu_allocate_irq(pic_irq_request, NULL, 0);
> diff --git a/hw/pci-bridge/pci_expander_bridge.c b/hw/pci-bridge/pci_expander_bridge.c
> index 448b9fb..14f0447 100644
> --- a/hw/pci-bridge/pci_expander_bridge.c
> +++ b/hw/pci-bridge/pci_expander_bridge.c
> @@ -12,11 +12,14 @@
>   
>   #include "qemu/osdep.h"
>   #include "qapi/error.h"
> +#include "hw/i386/pc.h"
>   #include "hw/pci/pci.h"
>   #include "hw/pci/pci_bus.h"
>   #include "hw/pci/pci_host.h"
>   #include "hw/pci/pcie_host.h"
>   #include "hw/pci/pci_bridge.h"
> +#include "hw/pci-host/q35.h"
> +#include "hw/pci-bridge/pci_expander_bridge.h"
>   #include "qemu/range.h"
>   #include "qemu/error-report.h"
>   #include "sysemu/numa.h"
> @@ -118,6 +121,25 @@ static const TypeInfo pxb_pcie_bus_info = {
>       .class_init    = pxb_bus_class_init,
>   };
>   
> +static uint64_t pxb_mcfg_hole_size = 0;
> +

No need to initialize a static to 0.

> +static void pxb_pcie_foreach(gpointer data, gpointer user_data)
> +{
> +    PXBDev *pxb = (PXBDev *)data;
> +
> +    if (pxb->sep_domain && pxb->domain_nr > 0) {
> +        // only reserve what users ask for to reduce memory cost
> +        pxb_mcfg_hole_size += ((pxb->max_bus + 1ULL) << 20);

Why "+ 1" ?
Please replace 20 with a MACRO explaining it.

> +    }
> +}
> +
> +uint64_t pxb_pcie_mcfg_hole(void)
> +{
> +    /* foreach is necessary as some pxb still reside in domain 0 */
> +    g_list_foreach(pxb_dev_list, pxb_pcie_foreach, NULL);
> +    return pxb_mcfg_hole_size;
> +}
> +
>   static const char *pxb_host_root_bus_path(PCIHostState *host_bridge,
>                                             PCIBus *rootbus)
>   {
> @@ -145,14 +167,6 @@ static const char *pxb_pcie_host_root_bus_path(PCIHostState *host_bridge,
>       return bus->bus_path;
>   }
>   
> -static void pxb_pcie_host_get_mmcfg_size(Object *obj, Visitor *v, const char *name,
> -                                    void *opaque, Error **errp)
> -{
> -    PCIExpressHost *e = PCIE_HOST_BRIDGE(obj);
> -
> -    visit_type_uint64(v, name, &e->size, errp);
> -}
> -
>   static char *pxb_host_ofw_unit_address(const SysBusDevice *dev)
>   {
>       const PCIHostState *pxb_host;
> @@ -192,16 +206,12 @@ static void pxb_pcie_host_initfn(Object *obj)
>                             "pci-conf-idx", 4);
>       memory_region_init_io(&phb->data_mem, obj, &pci_host_data_le_ops, phb,
>                             "pci-conf-data", 4);
> -
> -    object_property_add(obj, PCIE_HOST_MCFG_SIZE, "uint64",
> -                         pxb_pcie_host_get_mmcfg_size,
> -                         NULL, NULL, NULL, NULL);
> -
>   }
>   
>   static Property pxb_pcie_host_props[] = {
>       DEFINE_PROP_UINT64(PCIE_HOST_MCFG_BASE, PXBPCIEHost, parent_obj.base_addr,
> -                        PCIE_BASE_ADDR_UNMAPPED),
> +                       PCIE_BASE_ADDR_UNMAPPED),
> +    DEFINE_PROP_UINT64(PCIE_HOST_MCFG_SIZE, PXBPCIEHost, parent_obj.size, 0),
>       DEFINE_PROP_UINT32("domain_nr", PXBPCIEHost, domain_nr, 0),
>       DEFINE_PROP_UINT8("bus_nr", PXBPCIEHost, bus_nr, 0),
>       DEFINE_PROP_UINT8("max_bus", PXBPCIEHost, max_bus, 255),
> @@ -301,6 +311,8 @@ static gint pxb_compare(gconstpointer a, gconstpointer b)
>              0;
>   }
>   
> +static uint64_t pxb_pcie_mcfg_base = 0;
> +
>   static void pxb_dev_realize_common(PCIDevice *dev, bool pcie, Error **errp)
>   {
>       PXBDev *pxb = convert_to_pxb(dev);
> @@ -327,6 +339,15 @@ static void pxb_dev_realize_common(PCIDevice *dev, bool pcie, Error **errp)
>           qdev_prop_set_uint8(ds, "bus_nr", pxb->bus_nr); //TODO.
>           qdev_prop_set_uint8(ds, "max_bus", pxb->max_bus);
>           qdev_prop_set_uint8(ds, "domain_nr", pxb->domain_nr);
> +
> +        /* will be overwritten by firmware, but kept for readability */
> +        qdev_prop_set_uint64(ds, PCIE_HOST_MCFG_BASE,
> +            pxb->domain_nr ? pxb_pcie_mcfg_base : MCH_HOST_BRIDGE_PCIEXBAR_DEFAULT);
> +        qdev_prop_set_uint64(ds, PCIE_HOST_MCFG_SIZE,
> +            pxb->domain_nr ? (pxb->max_bus + 1ULL) << 20 : 0);
> +        if (pxb->domain_nr)
> +            pxb_pcie_mcfg_base += ((pxb->max_bus + 1ULL) << 20);
> +
>           bus = pci_root_bus_new(ds, dev_name, NULL, NULL, 0, TYPE_PXB_PCIE_BUS);
>       } else {
>           ds = qdev_create(NULL, TYPE_PXB_HOST);
> @@ -438,6 +459,9 @@ static void pxb_pcie_dev_realize(PCIDevice *dev, Error **errp)
>           return;
>       }
>   
> +    if (0 == pxb_pcie_mcfg_base)
> +        pxb_pcie_mcfg_base = pc_pci_mcfg_start();
> +
>       pxb_dev_realize_common(dev, true, errp);
>   }
>   
> diff --git a/hw/pci-host/q35.c b/hw/pci-host/q35.c
> index 02f9576..a76029d 100644
> --- a/hw/pci-host/q35.c
> +++ b/hw/pci-host/q35.c
> @@ -178,6 +178,8 @@ static Property q35_host_props[] = {
>       DEFINE_PROP_SIZE(PCI_HOST_ABOVE_4G_MEM_SIZE, Q35PCIHost,
>                        mch.above_4g_mem_size, 0),
>       DEFINE_PROP_BOOL("x-pci-hole64-fix", Q35PCIHost, pci_hole64_fix, true),
> +    /* q35 host bridge should always stay in pci domain 0 */
> +    DEFINE_PROP_UINT32("domain_nr", Q35PCIHost, domain_nr, 0),
>       DEFINE_PROP_END_OF_LIST(),
>   };
>   
> diff --git a/include/hw/i386/pc.h b/include/hw/i386/pc.h
> index 04d1f8c..81ba010 100644
> --- a/include/hw/i386/pc.h
> +++ b/include/hw/i386/pc.h
> @@ -212,6 +212,7 @@ void pc_memory_init(PCMachineState *pcms,
>                       MemoryRegion *rom_memory,
>                       MemoryRegion **ram_memory);
>   uint64_t pc_pci_hole64_start(void);
> +uint64_t pc_pci_mcfg_start(void);
>   qemu_irq pc_allocate_cpu_irq(void);
>   DeviceState *pc_vga_init(ISABus *isa_bus, PCIBus *pci_bus);
>   void pc_basic_device_init(ISABus *isa_bus, qemu_irq *gsi,
> diff --git a/include/hw/pci-bridge/pci_expander_bridge.h b/include/hw/pci-bridge/pci_expander_bridge.h
> new file mode 100644
> index 0000000..bb1462c
> --- /dev/null
> +++ b/include/hw/pci-bridge/pci_expander_bridge.h
> @@ -0,0 +1,6 @@
> +#ifndef HW_PCI_EXPANDER_H
> +#define HW_PCI_EXPANDER_H
> +
> +uint64_t pxb_pcie_mcfg_hole(void);
> +
> +#endif
> diff --git a/include/hw/pci-host/q35.h b/include/hw/pci-host/q35.h
> index 8f4ddde..432e569 100644
> --- a/include/hw/pci-host/q35.h
> +++ b/include/hw/pci-host/q35.h
> @@ -69,6 +69,7 @@ typedef struct Q35PCIHost {
>       /*< public >*/
>   
>       bool pci_hole64_fix;
> +    uint32_t domain_nr;
>       MCHPCIState mch;
>   } Q35PCIHost;
>   

Thanks,
Marcel

  parent reply	other threads:[~2018-06-20  7:41 UTC|newest]

Thread overview: 15+ messages / expand[flat|nested]  mbox.gz  Atom feed  top
2018-06-12  9:13 [Qemu-devel] [RFC v2 1/3] pci_expander_bridge: add type TYPE_PXB_PCIE_HOST Zihan Yang
2018-06-12  9:13 ` [Qemu-devel] [RFC v2 3/3] acpi-build: describe new pci domain in AML Zihan Yang
2018-06-20  7:46   ` Marcel Apfelbaum
2018-06-21 16:52     ` Zihan Yang
2018-06-22 16:43       ` Marcel Apfelbaum
2018-06-12 13:43 ` [Qemu-devel] [RFC v2 1/3] pci_expander_bridge: add type TYPE_PXB_PCIE_HOST Michael S. Tsirkin
2018-06-13  8:23   ` Zihan Yang
2018-06-13 14:46     ` Michael S. Tsirkin
2018-06-14  3:29       ` Zihan Yang
2018-06-20  4:31     ` Marcel Apfelbaum
2018-06-20  6:38 ` Marcel Apfelbaum
2018-06-21 16:46   ` Zihan Yang
     [not found] ` <1528794804-6289-2-git-send-email-whois.zihan.yang@gmail.com>
2018-06-20  7:41   ` Marcel Apfelbaum [this message]
2018-06-21 16:49     ` [Qemu-devel] [RFC v2 2/3] acpi-build: allocate mcfg for pxb-pcie host bridges Zihan Yang
2018-06-22 16:37       ` Marcel Apfelbaum

Reply instructions:

You may reply publicly to this message via plain-text email
using any one of the following methods:

* Save the following mbox file, import it into your mail client,
  and reply-to-all from there: mbox

  Avoid top-posting and favor interleaved quoting:
  https://en.wikipedia.org/wiki/Posting_style#Interleaved_style

* Reply using the --to, --cc, and --in-reply-to
  switches of git-send-email(1):

  git send-email \
    --in-reply-to=a6014b3a-0e1c-47e6-7b10-4873358864c3@gmail.com \
    --to=marcel.apfelbaum@gmail.com \
    --cc=ehabkost@redhat.com \
    --cc=imammedo@redhat.com \
    --cc=mst@redhat.com \
    --cc=pbonzini@redhat.com \
    --cc=qemu-devel@nongnu.org \
    --cc=rth@twiddle.net \
    --cc=whois.zihan.yang@gmail.com \
    /path/to/YOUR_REPLY

  https://kernel.org/pub/software/scm/git/docs/git-send-email.html

* If your mail client supports setting the In-Reply-To header
  via mailto: links, try the mailto: link
Be sure your reply has a Subject: header at the top and a blank line before the message body.
This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox;
as well as URLs for NNTP newsgroup(s).