[Date Prev][Date Next][Thread Prev][Thread Next][Date Index][Thread Index]
Re: [Qemu-ppc] [PATCH v2 3/3] spapr: introduce a fixed IRQ number space
From: |
Cédric Le Goater |
Subject: |
Re: [Qemu-ppc] [PATCH v2 3/3] spapr: introduce a fixed IRQ number space |
Date: |
Tue, 19 Jun 2018 12:05:21 +0200 |
User-agent: |
Mozilla/5.0 (X11; Linux x86_64; rv:52.0) Gecko/20100101 Thunderbird/52.5.2 |
On 06/19/2018 03:02 AM, David Gibson wrote:
> On Mon, Jun 18, 2018 at 07:34:02PM +0200, Cédric Le Goater wrote:
>> This proposal introduces a new IRQ number space layout using static
>> numbers for all devices and a bitmap allocator for the MSI numbers
>> which are negotiated by the guest at runtime.
>>
>> The previous layout is kept in machines raising the 'xics_legacy'
>> flag.
>>
>> Signed-off-by: Cédric Le Goater <address@hidden>
>> ---
>> include/hw/ppc/spapr.h | 4 ++++
>> include/hw/ppc/spapr_irq.h | 30 +++++++++++++++++++++++++
>> hw/ppc/spapr.c | 31 +++++++++++++++++++++++++
>> hw/ppc/spapr_events.c | 12 ++++++++--
>> hw/ppc/spapr_irq.c | 56
>> ++++++++++++++++++++++++++++++++++++++++++++++
>> hw/ppc/spapr_pci.c | 28 ++++++++++++++++++-----
>> hw/ppc/spapr_vio.c | 19 ++++++++++++----
>> hw/ppc/Makefile.objs | 2 +-
>> 8 files changed, 169 insertions(+), 13 deletions(-)
>> create mode 100644 include/hw/ppc/spapr_irq.h
>> create mode 100644 hw/ppc/spapr_irq.c
>>
>> diff --git a/include/hw/ppc/spapr.h b/include/hw/ppc/spapr.h
>> index 9decc66a1915..4c63b1fac13b 100644
>> --- a/include/hw/ppc/spapr.h
>> +++ b/include/hw/ppc/spapr.h
>> @@ -7,6 +7,7 @@
>> #include "hw/ppc/spapr_drc.h"
>> #include "hw/mem/pc-dimm.h"
>> #include "hw/ppc/spapr_ovec.h"
>> +#include "hw/ppc/spapr_irq.h"
>>
>> struct VIOsPAPRBus;
>> struct sPAPRPHBState;
>> @@ -164,6 +165,9 @@ struct sPAPRMachineState {
>> char *kvm_type;
>>
>> const char *icp_type;
>> + bool xics_legacy;
>
> This flag can go in the class, rather than the instance.
>
> And maybe call it 'legacy_irq_allocation'. It assumes XICS, but
> otherwise isn't strongly tied to it.
Here's another idea.
Instead of a bool, we could use a find() operation if it is defined
by the spapr_irq backend.
The current XICS spapr_irq backend would have one and the new XICS
and XIVE backends would not.
C.
>
>> + int32_t irq_map_nr;
>> + unsigned long *irq_map;
>
> So, I don't love the fact that the new bitmap duplicates information
> that's also in the intc backend (e.g. via ICS_IRQ_FREE()). However
> leaving the authoritative info in the backend also causes problems
> when we have dynamic switching. Not entirely sure what to do about
> that.
>
>> bool cmd_line_caps[SPAPR_CAP_NUM];
>> sPAPRCapabilities def, eff, mig;
>> diff --git a/include/hw/ppc/spapr_irq.h b/include/hw/ppc/spapr_irq.h
>> new file mode 100644
>> index 000000000000..345a42efd366
>> --- /dev/null
>> +++ b/include/hw/ppc/spapr_irq.h
>> @@ -0,0 +1,30 @@
>> +/*
>> + * QEMU PowerPC sPAPR IRQ backend definitions
>> + *
>> + * Copyright (c) 2018, IBM Corporation.
>> + *
>> + * This code is licensed under the GPL version 2 or later. See the
>> + * COPYING file in the top-level directory.
>> + */
>> +
>> +#ifndef HW_SPAPR_IRQ_H
>> +#define HW_SPAPR_IRQ_H
>> +
>> +/*
>> + * IRQ range offsets per device type
>> + */
>> +#define SPAPR_IRQ_EPOW 0x1000 /* XICS_IRQ_BASE offset */
>> +#define SPAPR_IRQ_HOTPLUG 0x1001
>> +#define SPAPR_IRQ_VIO 0x1100 /* 256 VIO devices */
>> +#define SPAPR_IRQ_PCI_LSI 0x1200 /* 32+ PHBs devices */
>> +
>> +#define SPAPR_IRQ_MSI 0x1300 /* Offset of the dynamic range covered
>> + * by the bitmap allocator */
>
> I'm a little confused by the MSI stuff. It looks like you're going
> for the option of one big pool for all dynamic irqs. Except that I
> thought in our discussion the other day you said each PHB advertised
> its own separate MSI range, so we'd actually need to split this up
> into ranges for each PHB.
>
>> +void spapr_irq_msi_init(sPAPRMachineState *spapr, uint32_t nr_irqs);
>> +int spapr_irq_msi_alloc(sPAPRMachineState *spapr, uint32_t num, bool align,
>> + Error **errp);
>> +void spapr_irq_msi_free(sPAPRMachineState *spapr, int irq, uint32_t num);
>> +void spapr_irq_msi_reset(sPAPRMachineState *spapr);
>> +
>> +#endif
>> diff --git a/hw/ppc/spapr.c b/hw/ppc/spapr.c
>> index 2b6d17056012..b9ba3ae675e5 100644
>> --- a/hw/ppc/spapr.c
>> +++ b/hw/ppc/spapr.c
>> @@ -188,6 +188,11 @@ static void xics_system_init(MachineState *machine, int
>> nr_irqs, Error **errp)
>> sPAPRMachineState *spapr = SPAPR_MACHINE(machine);
>> Error *local_err = NULL;
>>
>> + /* Initialize the MSI IRQ allocator. */
>> + if (!spapr->xics_legacy) {
>> + spapr_irq_msi_init(spapr, nr_irqs);
>> + }
>> +
>> if (kvm_enabled()) {
>> if (machine_kernel_irqchip_allowed(machine) &&
>> !xics_kvm_init(spapr, &local_err)) {
>> @@ -1635,6 +1640,10 @@ static void spapr_machine_reset(void)
>> ppc_set_compat(first_ppc_cpu, spapr->max_compat_pvr, &error_fatal);
>> }
>>
>> + if (!spapr->xics_legacy) {
>> + spapr_irq_msi_reset(spapr);
>> + }
>> +
>> qemu_devices_reset();
>>
>> /* DRC reset may cause a device to be unplugged. This will cause
>> troubles
>> @@ -1909,6 +1918,24 @@ static const VMStateDescription
>> vmstate_spapr_patb_entry = {
>> },
>> };
>>
>> +static bool spapr_irq_map_needed(void *opaque)
>> +{
>> + sPAPRMachineState *spapr = opaque;
>> +
>> + return spapr->irq_map && !bitmap_empty(spapr->irq_map,
>> spapr->irq_map_nr);
>> +}
>> +
>> +static const VMStateDescription vmstate_spapr_irq_map = {
>> + .name = "spapr_irq_map",
>> + .version_id = 1,
>> + .minimum_version_id = 1,
>> + .needed = spapr_irq_map_needed,
>> + .fields = (VMStateField[]) {
>> + VMSTATE_BITMAP(irq_map, sPAPRMachineState, 0, irq_map_nr),
>> + VMSTATE_END_OF_LIST()
>> + },
>> +};
>> +
>> static const VMStateDescription vmstate_spapr = {
>> .name = "spapr",
>> .version_id = 3,
>> @@ -1936,6 +1963,7 @@ static const VMStateDescription vmstate_spapr = {
>> &vmstate_spapr_cap_cfpc,
>> &vmstate_spapr_cap_sbbc,
>> &vmstate_spapr_cap_ibs,
>> + &vmstate_spapr_irq_map,
>> NULL
>> }
>> };
>> @@ -4093,7 +4121,10 @@ DEFINE_SPAPR_MACHINE(3_0, "3.0", true);
>>
>> static void spapr_machine_2_12_instance_options(MachineState *machine)
>> {
>> + sPAPRMachineState *spapr = SPAPR_MACHINE(machine);
>> +
>> spapr_machine_3_0_instance_options(machine);
>> + spapr->xics_legacy = true;
>> }
>>
>> static void spapr_machine_2_12_class_options(MachineClass *mc)
>> diff --git a/hw/ppc/spapr_events.c b/hw/ppc/spapr_events.c
>> index e4f5946a2188..c82dc40be0d5 100644
>> --- a/hw/ppc/spapr_events.c
>> +++ b/hw/ppc/spapr_events.c
>> @@ -709,7 +709,11 @@ void spapr_events_init(sPAPRMachineState *spapr)
>> {
>> int epow_irq;
>>
>> - epow_irq = spapr_irq_findone(spapr, &error_fatal);
>> + if (spapr->xics_legacy) {
>> + epow_irq = spapr_irq_findone(spapr, &error_fatal);
>> + } else {
>> + epow_irq = SPAPR_IRQ_EPOW;
>
> Can slightly improve brevity by just initializing epow_irq to this,
> then overwriting it in the legacy case.
>
>> + }
>>
>> spapr_irq_claim(spapr, epow_irq, false, &error_fatal);
>>
>> @@ -731,7 +735,11 @@ void spapr_events_init(sPAPRMachineState *spapr)
>> if (spapr->use_hotplug_event_source) {
>> int hp_irq;
>>
>> - hp_irq = spapr_irq_findone(spapr, &error_fatal);
>> + if (spapr->xics_legacy) {
>> + hp_irq = spapr_irq_findone(spapr, &error_fatal);
>> + } else {
>> + hp_irq = SPAPR_IRQ_HOTPLUG;
>> + }
>
> Same here.
>
>>
>> spapr_irq_claim(spapr, hp_irq, false, &error_fatal);
>>
>> diff --git a/hw/ppc/spapr_irq.c b/hw/ppc/spapr_irq.c
>> new file mode 100644
>> index 000000000000..4e311023bab2
>> --- /dev/null
>> +++ b/hw/ppc/spapr_irq.c
>> @@ -0,0 +1,56 @@
>> +/*
>> + * QEMU PowerPC sPAPR IRQ interface
>> + *
>> + * Copyright (c) 2018, IBM Corporation.
>> + *
>> + * This code is licensed under the GPL version 2 or later. See the
>> + * COPYING file in the top-level directory.
>> + */
>> +
>> +#include "qemu/osdep.h"
>> +#include "qemu/log.h"
>> +#include "qemu/error-report.h"
>> +#include "qapi/error.h"
>> +#include "hw/ppc/spapr.h"
>> +#include "hw/ppc/xics.h"
>> +
>> +void spapr_irq_msi_init(sPAPRMachineState *spapr, uint32_t nr_irqs)
>> +{
>> + spapr->irq_map_nr = XICS_IRQ_BASE + nr_irqs - SPAPR_IRQ_MSI;
>> + spapr->irq_map = bitmap_new(spapr->irq_map_nr);
>> +}
>> +
>> +int spapr_irq_msi_alloc(sPAPRMachineState *spapr, uint32_t num, bool align,
>> + Error **errp)
>> +{
>> + int irq;
>> +
>> + /*
>> + * The 'align_mask' parameter of bitmap_find_next_zero_area()
>> + * should be one less than a power of 2; 0 means no
>> + * alignment. Adapt the 'align' value of the former allocator
>> + * to fit the requirements of bitmap_find_next_zero_area()
>> + */
>> + align -= 1;
>> +
>> + irq = bitmap_find_next_zero_area(spapr->irq_map, spapr->irq_map_nr, 0,
>> num,
>> + align);
>> + if (irq == spapr->irq_map_nr) {
>> + error_setg(errp, "can't find a free %d-IRQ block", num);
>> + return -1;
>> + }
>> +
>> + bitmap_set(spapr->irq_map, irq, num);
>> +
>> + return irq + SPAPR_IRQ_MSI;
>> +}
>> +
>> +void spapr_irq_msi_free(sPAPRMachineState *spapr, int irq, uint32_t num)
>> +{
>> + bitmap_clear(spapr->irq_map, irq - SPAPR_IRQ_MSI, num);
>> +}
>> +
>> +void spapr_irq_msi_reset(sPAPRMachineState *spapr)
>> +{
>> + bitmap_clear(spapr->irq_map, 0, spapr->irq_map_nr);
>> +}
>> diff --git a/hw/ppc/spapr_pci.c b/hw/ppc/spapr_pci.c
>> index 497b896c7d24..bbf48fd3503d 100644
>> --- a/hw/ppc/spapr_pci.c
>> +++ b/hw/ppc/spapr_pci.c
>> @@ -334,6 +334,9 @@ static void rtas_ibm_change_msi(PowerPCCPU *cpu,
>> sPAPRMachineState *spapr,
>> return;
>> }
>>
>> + if (!spapr->xics_legacy) {
>> + spapr_irq_msi_free(spapr, msi->first_irq, msi->num);
>> + }
>> spapr_irq_free(spapr, msi->first_irq, msi->num);
>> if (msi_present(pdev)) {
>> spapr_msi_setmsg(pdev, 0, false, 0, 0);
>> @@ -372,7 +375,13 @@ static void rtas_ibm_change_msi(PowerPCCPU *cpu,
>> sPAPRMachineState *spapr,
>> }
>>
>> /* Allocate MSIs */
>> - irq = spapr_irq_find(spapr, req_num, ret_intr_type == RTAS_TYPE_MSI,
>> &err);
>> + if (spapr->xics_legacy) {
>> + irq = spapr_irq_find(spapr, req_num, ret_intr_type == RTAS_TYPE_MSI,
>> + &err);
>> + } else {
>> + irq = spapr_irq_msi_alloc(spapr, req_num,
>> + ret_intr_type == RTAS_TYPE_MSI, &err);
>> + }
>> if (err) {
>> error_reportf_err(err, "Can't allocate MSIs for device %x: ",
>> config_addr);
>> @@ -392,6 +401,9 @@ static void rtas_ibm_change_msi(PowerPCCPU *cpu,
>> sPAPRMachineState *spapr,
>>
>> /* Release previous MSIs */
>> if (msi) {
>> + if (!spapr->xics_legacy) {
>> + spapr_irq_msi_free(spapr, msi->first_irq, msi->num);
>> + }
>> spapr_irq_free(spapr, msi->first_irq, msi->num);
>> g_hash_table_remove(phb->msi, &config_addr);
>> }
>> @@ -1708,11 +1720,15 @@ static void spapr_phb_realize(DeviceState *dev,
>> Error **errp)
>> uint32_t irq;
>> Error *local_err = NULL;
>>
>> - irq = spapr_irq_findone(spapr, &local_err);
>> - if (local_err) {
>> - error_propagate(errp, local_err);
>> - error_prepend(errp, "can't allocate LSIs: ");
>> - return;
>> + if (spapr->xics_legacy) {
>> + irq = spapr_irq_findone(spapr, &local_err);
>> + if (local_err) {
>> + error_propagate(errp, local_err);
>> + error_prepend(errp, "can't allocate LSIs: ");
>> + return;
>> + }
>> + } else {
>> + irq = SPAPR_IRQ_PCI_LSI + sphb->index * PCI_NUM_PINS + i;
>> }
>>
>> spapr_irq_claim(spapr, irq, true, &local_err);
>> diff --git a/hw/ppc/spapr_vio.c b/hw/ppc/spapr_vio.c
>> index daf85130b5ef..ecee4b2d03da 100644
>> --- a/hw/ppc/spapr_vio.c
>> +++ b/hw/ppc/spapr_vio.c
>> @@ -436,6 +436,9 @@ static void spapr_vio_busdev_reset(DeviceState *qdev)
>> }
>> }
>>
>> +/* TODO : poor VIO device indexing ... */
>> +static uint32_t vio_index;
>> +
>> static void spapr_vio_busdev_realize(DeviceState *qdev, Error **errp)
>> {
>> sPAPRMachineState *spapr = SPAPR_MACHINE(qdev_get_machine());
>> @@ -476,10 +479,18 @@ static void spapr_vio_busdev_realize(DeviceState
>> *qdev, Error **errp)
>> }
>>
>> if (!dev->irq) {
>> - dev->irq = spapr_irq_findone(spapr, &local_err);
>> - if (local_err) {
>> - error_propagate(errp, local_err);
>> - return;
>> + if (spapr->xics_legacy) {
>> + dev->irq = spapr_irq_findone(spapr, &local_err);
>> + if (local_err) {
>> + error_propagate(errp, local_err);
>> + return;
>> + }
>> + } else {
>> + dev->irq = SPAPR_IRQ_VIO + vio_index++;
>> + if (dev->irq == SPAPR_IRQ_PCI_LSI) {
>> + error_setg(errp, "Too many VIO devices");
>> + return;
>> + }
>> }
>> }
>>
>> diff --git a/hw/ppc/Makefile.objs b/hw/ppc/Makefile.objs
>> index 86d82a6ec3ac..4fe3b7804d43 100644
>> --- a/hw/ppc/Makefile.objs
>> +++ b/hw/ppc/Makefile.objs
>> @@ -4,7 +4,7 @@ obj-y += ppc.o ppc_booke.o fdt.o
>> obj-$(CONFIG_PSERIES) += spapr.o spapr_caps.o spapr_vio.o spapr_events.o
>> obj-$(CONFIG_PSERIES) += spapr_hcall.o spapr_iommu.o spapr_rtas.o
>> obj-$(CONFIG_PSERIES) += spapr_pci.o spapr_rtc.o spapr_drc.o spapr_rng.o
>> -obj-$(CONFIG_PSERIES) += spapr_cpu_core.o spapr_ovec.o
>> +obj-$(CONFIG_PSERIES) += spapr_cpu_core.o spapr_ovec.o spapr_irq.o
>> # IBM PowerNV
>> obj-$(CONFIG_POWERNV) += pnv.o pnv_xscom.o pnv_core.o pnv_lpc.o pnv_psi.o
>> pnv_occ.o pnv_bmc.o
>> ifeq ($(CONFIG_PCI)$(CONFIG_PSERIES)$(CONFIG_LINUX), yyy)
>