Alexey Kardashevskiy <a...@ozlabs.ru> writes:

> On 05/19/2015 06:26 PM, Nikunj A Dadhania wrote:
>> All the PCI enumeration and device node creation was off-loaded to
>> SLOF. With PCI hotplug support, code needed to be added to add device
>> node. This creates multiple copy of the code one in SLOF and other in
>> hotplug code. To unify this, the patch adds the pci device node
>> creation in Qemu. For backward compatibility, a flag
>> "qemu,phb-enumerated" is added to the phb, suggesting to SLOF to not
>> do device node creation.
>>
>> Signed-off-by: Nikunj A Dadhania <nik...@linux.vnet.ibm.com>
>> [ Squashed Michael's drc_index changes ]
>> Signed-off-by: Michael Roth <mdr...@linux.vnet.ibm.com>
>> Signed-off-by: Nikunj A Dadhania <nik...@linux.vnet.ibm.com>
>> ---
>>   hw/ppc/spapr_pci.c | 188 
>> ++++++++++++++++++++++++++++++++++++++++++-----------
>>   1 file changed, 150 insertions(+), 38 deletions(-)
>>
>> diff --git a/hw/ppc/spapr_pci.c b/hw/ppc/spapr_pci.c
>> index 8b02a3e..12f1b9c 100644
>> --- a/hw/ppc/spapr_pci.c
>> +++ b/hw/ppc/spapr_pci.c
>> @@ -23,6 +23,7 @@
>>    * THE SOFTWARE.
>>    */
>>   #include "hw/hw.h"
>> +#include "hw/sysbus.h"
>>   #include "hw/pci/pci.h"
>>   #include "hw/pci/msi.h"
>>   #include "hw/pci/msix.h"
>> @@ -35,6 +36,7 @@
>>   #include "qemu/error-report.h"
>>   #include "qapi/qmp/qerror.h"
>>
>> +#include "hw/pci/pci_bridge.h"
>>   #include "hw/pci/pci_bus.h"
>>   #include "hw/ppc/spapr_drc.h"
>>   #include "sysemu/device_tree.h"
>> @@ -742,6 +744,31 @@ static AddressSpace *spapr_pci_dma_iommu(PCIBus *bus, 
>> void *opaque, int devfn)
>>       return &phb->iommu_as;
>>   }
>>
>> +
>> +static sPAPRDRConnector *spapr_phb_get_pci_drc(sPAPRPHBState *phb,
>> +                                               PCIDevice *pdev)
>> +{
>> +    uint32_t busnr = 
>> pci_bus_num(PCI_BUS(qdev_get_parent_bus(DEVICE(pdev))));
>> +    return spapr_dr_connector_by_id(SPAPR_DR_CONNECTOR_TYPE_PCI,
>> +                                    (phb->index << 16) |
>> +                                    (busnr << 8) |
>> +                                    pdev->devfn);
>> +}
>> +
>> +static uint32_t spapr_phb_get_pci_drc_index(sPAPRPHBState *phb,
>> +                                            PCIDevice *pdev)
>> +{
>> +    sPAPRDRConnector *drc = spapr_phb_get_pci_drc(phb, pdev);
>> +    sPAPRDRConnectorClass *drck;
>> +
>> +    if (!drc) {
>> +        return 0;
>> +    }
>> +
>> +    drck = SPAPR_DR_CONNECTOR_GET_CLASS(drc);
>> +    return drck->get_index(drc);
>> +}
>> +
>>   /* Macros to operate with address in OF binding to PCI */
>>   #define b_x(x, p, l)    (((x) & ((1<<(l))-1)) << (p))
>>   #define b_n(x)          b_x((x), 31, 1) /* 0 if relocatable */
>> @@ -879,12 +906,13 @@ static void populate_resource_props(PCIDevice *d, 
>> ResourceProps *rp)
>>   }
>>
>>   static int spapr_populate_pci_child_dt(PCIDevice *dev, void *fdt, int 
>> offset,
>> -                                       int phb_index, int drc_index,
>> +                                       sPAPRPHBState *sphb,
>>                                          const char *drc_name)
>>   {
>>       ResourceProps rp;
>>       bool is_bridge = false;
>>       int pci_status;
>> +    uint32_t drc_index = spapr_phb_get_pci_drc_index(sphb, dev);
>
> Is this drc_index any different from the one which used to be passed to 
> this function? If no, then I do not see the point in changing the prototype 
> (or make another "this just makes code easier/nicer" patch).

Its the same, I can have a separate patch. As I was changing this code
the drc_index would need to be read in boot and hotplug code. So brought
over the code here.

> If yes, then it would be nice to see what the patch changed in this
> regard in the commit log.
>
>
>
>>       if (pci_default_read_config(dev, PCI_HEADER_TYPE, 1) ==
>>           PCI_HEADER_TYPE_BRIDGE) {
>> @@ -945,8 +973,13 @@ static int spapr_populate_pci_child_dt(PCIDevice *dev, 
>> void *fdt, int offset,
>>        * processed by OF beforehand
>>        */
>>       _FDT(fdt_setprop_string(fdt, offset, "name", "pci"));
>> -    _FDT(fdt_setprop(fdt, offset, "ibm,loc-code", drc_name, 
>> strlen(drc_name)));
>> -    _FDT(fdt_setprop_cell(fdt, offset, "ibm,my-drc-index", drc_index));
>> +    if (drc_name) {
>> +        _FDT(fdt_setprop(fdt, offset, "ibm,loc-code", drc_name,
>> +                         strlen(drc_name)));
>> +    }
>> +    if (drc_index) {
>> +        _FDT(fdt_setprop_cell(fdt, offset, "ibm,my-drc-index", drc_index));
>> +    }
>>
>>       _FDT(fdt_setprop_cell(fdt, offset, "#address-cells",
>>                             RESOURCE_CELLS_ADDRESS));
>> @@ -963,30 +996,34 @@ static int spapr_populate_pci_child_dt(PCIDevice *dev, 
>> void *fdt, int offset,
>>       return 0;
>>   }
>>
>> +typedef struct sPAPRFDT {
>> +    void *fdt;
>> +    int node_off;
>> +    sPAPRPHBState *sphb;
>> +} sPAPRFDT;
>> +
>>   /* create OF node for pci device and required OF DT properties */
>> -static void *spapr_create_pci_child_dt(sPAPRPHBState *phb, PCIDevice *dev,
>> -                                       int drc_index, const char *drc_name,
>> -                                       int *dt_offset)
>> +static int spapr_create_pci_child_dt(PCIDevice *pdev, sPAPRFDT *p,
>> +                                     const char *drc_name)
>
> Why s/dev/pdev/?

PCIDev thats the only reason.

>
>
>>   {
>> -    void *fdt;
>> -    int offset, ret, fdt_size;
>> -    int slot = PCI_SLOT(dev->devfn);
>> -    int func = PCI_FUNC(dev->devfn);
>> -    char nodename[512];
>> +    int offset, ret;
>> +    char nodename[64];
>
> Why s/512/64/?

Earlier this was called in recursion, so there was a comment in previous
series to reduce this to lesser number.

>
> This change and the one above hide what the patch really does to 
> spapr_create_pci_child_dt.
>
>
>> +    int slot = PCI_SLOT(pdev->devfn);
>> +    int func = PCI_FUNC(pdev->devfn);
>>
>> -    fdt = create_device_tree(&fdt_size);
>>       if (func != 0) {
>>           sprintf(nodename, "pci@%d,%d", slot, func);
>>       } else {
>>           sprintf(nodename, "pci@%d", slot);
>>       }
>> -    offset = fdt_add_subnode(fdt, 0, nodename);
>> -    ret = spapr_populate_pci_child_dt(dev, fdt, offset, phb->index, 
>> drc_index,
>> +    offset = fdt_add_subnode(p->fdt, p->node_off, nodename);
>> +    ret = spapr_populate_pci_child_dt(pdev, p->fdt, offset, p->sphb,
>>                                         drc_name);
>>       g_assert(!ret);
>> -
>> -    *dt_offset = offset;
>> -    return fdt;
>> +    if (ret) {
>> +        return 0;
>> +    }
>> +    return offset;
>>   }
>>
>>   static void spapr_phb_add_pci_device(sPAPRDRConnector *drc,
>> @@ -996,24 +1033,26 @@ static void spapr_phb_add_pci_device(sPAPRDRConnector 
>> *drc,
>>   {
>>       sPAPRDRConnectorClass *drck = SPAPR_DR_CONNECTOR_GET_CLASS(drc);
>>       DeviceState *dev = DEVICE(pdev);
>> -    int drc_index = drck->get_index(drc);
>>       const char *drc_name = drck->get_name(drc);
>> -    void *fdt = NULL;
>> -    int fdt_start_offset = 0;
>> +    int fdt_start_offset = 0, fdt_size;
>> +    sPAPRFDT s_fdt = {NULL, 0, NULL};
>>
>> -    /* boot-time devices get their device tree node created by SLOF, but for
>> -     * hotplugged devices we need QEMU to generate it so the guest can fetch
>> -     * it via RTAS
>> -     */
>>       if (dev->hotplugged) {
>
>
> I understand the patch is not changing this but still while we are here -
> spapr_phb_add_pci_device() is only called from spapr_phb_hot_plug_child(), 
> how can dev->hotplugged be not true in this function (if it cannot, you 
> could get rid of "out:"?

It gets called even when the devices are added during boot.

>
>> -        fdt = spapr_create_pci_child_dt(phb, pdev, drc_index, drc_name,
>> -                                        &fdt_start_offset);
>> +        s_fdt.fdt = create_device_tree(&fdt_size);
>> +        s_fdt.sphb = phb;
>> +        s_fdt.node_off = 0;
>> +        fdt_start_offset = spapr_create_pci_child_dt(pdev, &s_fdt, 
>> drc_name);
>> +        if (!fdt_start_offset) {
>> +            error_setg(errp, "Failed to create pci child device tree node");
>> +            goto out;
>> +        }
>>       }
>>
>>       drck->attach(drc, DEVICE(pdev),
>> -                 fdt, fdt_start_offset, !dev->hotplugged, errp);
>> +                 s_fdt.fdt, fdt_start_offset, !dev->hotplugged, errp);
>> +out:
>>       if (*errp) {
>> -        g_free(fdt);
>> +        g_free(s_fdt.fdt);
>>       }
>>   }
>>
>> @@ -1043,16 +1082,6 @@ static void 
>> spapr_phb_remove_pci_device(sPAPRDRConnector *drc,
>>       drck->detach(drc, DEVICE(pdev), spapr_phb_remove_pci_device_cb, phb, 
>> errp);
>>   }
>>
>> -static sPAPRDRConnector *spapr_phb_get_pci_drc(sPAPRPHBState *phb,
>> -                                               PCIDevice *pdev)
>
> Just adding forward declaration would make the patch shorter.

Yes, I can do that.

>
>> -{
>> -    uint32_t busnr = 
>> pci_bus_num(PCI_BUS(qdev_get_parent_bus(DEVICE(pdev))));
>> -    return spapr_dr_connector_by_id(SPAPR_DR_CONNECTOR_TYPE_PCI,
>> -                                    (phb->index << 16) |
>> -                                    (busnr << 8) |
>> -                                    pdev->devfn);
>> -}
>> -
>>   static void spapr_phb_hot_plug_child(HotplugHandler *plug_handler,
>>                                        DeviceState *plugged_dev, Error 
>> **errp)
>>   {
>> @@ -1482,6 +1511,75 @@ PCIHostState *spapr_create_phb(sPAPREnvironment 
>> *spapr, int index)
>>       return PCI_HOST_BRIDGE(dev);
>>   }
>>
>> +static void spapr_populate_pci_devices_dt(PCIBus *bus, PCIDevice *pdev,
>> +                                          void *opaque)
>> +{
>> +    PCIBus *sec_bus;
>> +    sPAPRFDT *p = opaque;
>> +    int offset;
>> +    sPAPRFDT s_fdt;
>> +
>> +    offset = spapr_create_pci_child_dt(pdev, p, NULL);
>> +    if (!offset) {
>> +        error_report("Failed to create pci child device tree node");
>> +        return;
>> +    }
>> +
>> +    if ((pci_default_read_config(pdev, PCI_HEADER_TYPE, 1) !=
>> +         PCI_HEADER_TYPE_BRIDGE)) {
>> +        return;
>> +    }
>> +
>> +    sec_bus = pci_bridge_get_sec_bus(PCI_BRIDGE(pdev));
>> +    if (!sec_bus) {
>> +        return;
>> +    }
>> +
>> +    s_fdt.fdt = p->fdt;
>> +    s_fdt.node_off = offset;
>> +    s_fdt.sphb = p->sphb;
>> +    pci_for_each_device(sec_bus, pci_bus_num(sec_bus),
>> +                        spapr_populate_pci_devices_dt,
>> +                        &s_fdt);
>> +}
>> +
>> +static void spapr_phb_pci_enumerate_bridge(PCIBus *bus, PCIDevice *pdev,
>> +                                           void *opaque)
>> +{
>> +    unsigned int *bus_no = opaque;
>> +    unsigned int primary = *bus_no;
>> +    unsigned int secondary;
>> +    unsigned int subordinate = 0xff;
>> +
>> +    if ((pci_default_read_config(pdev, PCI_HEADER_TYPE, 1) ==
>> +         PCI_HEADER_TYPE_BRIDGE)) {
>
>
> s/==/!=/ and "return" and no need in extra indent below.

Right.

>
>> +        PCIBus *sec_bus = pci_bridge_get_sec_bus(PCI_BRIDGE(pdev));
>> +        secondary = *bus_no + 1;
>
>
> (*bus_no)++;
> secondary = *bus_no;
>
> and remove "bus_no = *bus_no + 1" below?
> In fact, I do not need much sense in having "secondary" variable in this 
> function.
>
>> +        pci_default_write_config(pdev, PCI_PRIMARY_BUS, primary, 1);
>> +        pci_default_write_config(pdev, PCI_SECONDARY_BUS, secondary, 1);
>> +        pci_default_write_config(pdev, PCI_SUBORDINATE_BUS, secondary, 1);
>> +        *bus_no = *bus_no + 1;
>> +        if (sec_bus) {
>
> same here? Just like you did in spapr_populate_pci_devices_dt(). I do not 
> insist though. But having less scopes just makes it easier/nicer to wrap 
> long lines in QEMU coding style (new line starts under "(").
>
>
>> +            pci_default_write_config(pdev, PCI_SUBORDINATE_BUS, 
>> subordinate, 1);
>> +            pci_for_each_device(sec_bus, pci_bus_num(sec_bus),
>> +                                spapr_phb_pci_enumerate_bridge,
>> +                                bus_no);
>> +            pci_default_write_config(pdev, PCI_SUBORDINATE_BUS, *bus_no, 1);
>> +        }
>> +    }
>> +}
>> +
>> +static void spapr_phb_pci_enumerate(sPAPRPHBState *phb)
>> +{
>> +    PCIBus *bus = PCI_HOST_BRIDGE(phb)->bus;
>> +    unsigned int bus_no = 0;
>> +
>> +    pci_for_each_device(bus, pci_bus_num(bus),
>> +                        spapr_phb_pci_enumerate_bridge,
>> +                        &bus_no);
>> +
>> +}
>> +
>>   int spapr_populate_pci_dt(sPAPRPHBState *phb,
>>                             uint32_t xics_phandle,
>>                             void *fdt)
>> @@ -1521,6 +1619,8 @@ int spapr_populate_pci_dt(sPAPRPHBState *phb,
>>           cpu_to_be32(b_ddddd(-1)|b_fff(0)), 0x0, 0x0, cpu_to_be32(-1)};
>>       uint32_t interrupt_map[PCI_SLOT_MAX * PCI_NUM_PINS][7];
>>       sPAPRTCETable *tcet;
>> +    PCIBus *bus = PCI_HOST_BRIDGE(phb)->bus;
>> +    sPAPRFDT s_fdt;
>>
>>       /* Start populating the FDT */
>>       sprintf(nodename, "pci@%" PRIx64, phb->buid);
>> @@ -1570,6 +1670,18 @@ int spapr_populate_pci_dt(sPAPRPHBState *phb,
>>                    tcet->liobn, tcet->bus_offset,
>>                    tcet->nb_table << tcet->page_shift);
>>
>> +    /* Walk the bridges and program the bus numbers*/
>> +    spapr_phb_pci_enumerate(phb);
>> +    _FDT(fdt_setprop_cell(fdt, bus_off, "qemu,phb-enumerated", 0x1));
>
>
> Can we also add a hack here to scan for the "qemu,phb-enumerated" string in 
> the SLOF bin image?

Really ? That would be ugly.

>
>> +
>> +    /* Populate tree nodes with PCI devices attached */
>> +    s_fdt.fdt = fdt;
>> +    s_fdt.node_off = bus_off;
>> +    s_fdt.sphb = phb;
>> +    pci_for_each_device(bus, pci_bus_num(bus),
>> +                        spapr_populate_pci_devices_dt,
>> +                        &s_fdt);
>> +
>>       ret = spapr_drc_populate_dt(fdt, bus_off, OBJECT(phb),
>>                                   SPAPR_DR_CONNECTOR_TYPE_PCI);
>>       if (ret) {
>>
>
>
> -- 
> Alexey


Reply via email to