All of lore.kernel.org
 help / color / mirror / Atom feed
* [Qemu-devel] [PATCH] spapr/pci: populate PCI DT in reverse order
@ 2015-11-30 10:45 Greg Kurz
  2015-12-01 21:48 ` Thomas Huth
  0 siblings, 1 reply; 9+ messages in thread
From: Greg Kurz @ 2015-11-30 10:45 UTC (permalink / raw)
  To: David Gibson, Michael S. Tsirkin
  Cc: Thomas Huth, qemu-ppc, qemu-devel, Nikunj A Dadhania

Since commit 1d2d974244c6 "spapr_pci: enumerate and add PCI device tree", QEMU
populates the PCI device tree in the opposite order compared to SLOF.

Before 1d2d974244c6:

Populating /pci@800000020000000
                     00 0000 (D) : 1af4 1000    virtio [ net ]
                     00 0800 (D) : 1af4 1001    virtio [ block ]
                     00 1000 (D) : 1af4 1009    virtio [ network ]
Populating /pci@800000020000000/unknown-legacy-device@2


7e5294b8 :  /pci@800000020000000
7e52b998 :  |-- ethernet@0
7e52c0c8 :  |-- scsi@1
7e52c7e8 :  +-- unknown-legacy-device@2 ok

Since 1d2d974244c6:

Populating /pci@800000020000000
                     00 1000 (D) : 1af4 1009    virtio [ network ]
Populating /pci@800000020000000/unknown-legacy-device@2
                     00 0800 (D) : 1af4 1001    virtio [ block ]
                     00 0000 (D) : 1af4 1000    virtio [ net ]


7e5e8118 :  /pci@800000020000000
7e5ea6a0 :  |-- unknown-legacy-device@2
7e5eadb8 :  |-- scsi@1
7e5eb4d8 :  +-- ethernet@0 ok

This behaviour change is not actually a bug since no assumptions should be
made on DT ordering. But it has no real justification either, other than
being the consequence of the way fdt_add_subnode() inserts new elements
to the front of the FDT rather than adding them to the tail.

This patch reverts to the historical SLOF ordering by walking PCI devices in
reverse order.

Signed-off-by: Greg Kurz <gkurz@linux.vnet.ibm.com>
---

Repost with Cc: to qemu-devel and qemu-ppc :)

Michael, David,

I hope it is okay that this is a single patch to be applied by
any of you. Otherwise I can post distinct patches for PCI and
sPAPR.

 hw/pci/pci.c         |   28 ++++++++++++++++++++++++++++
 hw/ppc/spapr_pci.c   |   12 ++++++------
 include/hw/pci/pci.h |    4 ++++
 3 files changed, 38 insertions(+), 6 deletions(-)

diff --git a/hw/pci/pci.c b/hw/pci/pci.c
index 168b9cc56b69..3e95745900fc 100644
--- a/hw/pci/pci.c
+++ b/hw/pci/pci.c
@@ -1420,6 +1420,34 @@ static const pci_class_desc pci_class_descriptions[] =
     { 0, NULL}
 };
 
+static void pci_for_each_device_under_bus_reverse(PCIBus *bus,
+                                                  void (*fn)(PCIBus *b,
+                                                             PCIDevice *d,
+                                                             void *opaque),
+                                                  void *opaque)
+{
+    PCIDevice *d;
+    int devfn;
+
+    for (devfn = 0; devfn < ARRAY_SIZE(bus->devices); devfn++) {
+        d = bus->devices[ARRAY_SIZE(bus->devices) - 1 - devfn];
+        if (d) {
+            fn(bus, d, opaque);
+        }
+    }
+}
+
+void pci_for_each_device_reverse(PCIBus *bus, int bus_num,
+                         void (*fn)(PCIBus *b, PCIDevice *d, void *opaque),
+                         void *opaque)
+{
+    bus = pci_find_bus_nr(bus, bus_num);
+
+    if (bus) {
+        pci_for_each_device_under_bus_reverse(bus, fn, opaque);
+    }
+}
+
 static void pci_for_each_device_under_bus(PCIBus *bus,
                                           void (*fn)(PCIBus *b, PCIDevice *d,
                                                      void *opaque),
diff --git a/hw/ppc/spapr_pci.c b/hw/ppc/spapr_pci.c
index 55fa8db9e290..b3c9294af74d 100644
--- a/hw/ppc/spapr_pci.c
+++ b/hw/ppc/spapr_pci.c
@@ -1612,9 +1612,9 @@ static void spapr_populate_pci_devices_dt(PCIBus *bus, PCIDevice *pdev,
     s_fdt.fdt = p->fdt;
     s_fdt.node_off = offset;
     s_fdt.sphb = p->sphb;
-    pci_for_each_device(sec_bus, pci_bus_num(sec_bus),
-                        spapr_populate_pci_devices_dt,
-                        &s_fdt);
+    pci_for_each_device_reverse(sec_bus, pci_bus_num(sec_bus),
+                                spapr_populate_pci_devices_dt,
+                                &s_fdt);
 }
 
 static void spapr_phb_pci_enumerate_bridge(PCIBus *bus, PCIDevice *pdev,
@@ -1755,9 +1755,9 @@ int spapr_populate_pci_dt(sPAPRPHBState *phb,
     s_fdt.fdt = fdt;
     s_fdt.node_off = bus_off;
     s_fdt.sphb = phb;
-    pci_for_each_device(bus, pci_bus_num(bus),
-                        spapr_populate_pci_devices_dt,
-                        &s_fdt);
+    pci_for_each_device_reverse(bus, pci_bus_num(bus),
+                                spapr_populate_pci_devices_dt,
+                                &s_fdt);
 
     ret = spapr_drc_populate_dt(fdt, bus_off, OBJECT(phb),
                                 SPAPR_DR_CONNECTOR_TYPE_PCI);
diff --git a/include/hw/pci/pci.h b/include/hw/pci/pci.h
index 379b6e1a4561..465483b2ee79 100644
--- a/include/hw/pci/pci.h
+++ b/include/hw/pci/pci.h
@@ -393,6 +393,10 @@ int pci_bus_numa_node(PCIBus *bus);
 void pci_for_each_device(PCIBus *bus, int bus_num,
                          void (*fn)(PCIBus *bus, PCIDevice *d, void *opaque),
                          void *opaque);
+void pci_for_each_device_reverse(PCIBus *bus, int bus_num,
+                                 void (*fn)(PCIBus *bus, PCIDevice *d,
+                                            void *opaque),
+                                 void *opaque);
 void pci_for_each_bus_depth_first(PCIBus *bus,
                                   void *(*begin)(PCIBus *bus, void *parent_state),
                                   void (*end)(PCIBus *bus, void *state),

^ permalink raw reply related	[flat|nested] 9+ messages in thread

* Re: [Qemu-devel] [PATCH] spapr/pci: populate PCI DT in reverse order
  2015-11-30 10:45 [Qemu-devel] [PATCH] spapr/pci: populate PCI DT in reverse order Greg Kurz
@ 2015-12-01 21:48 ` Thomas Huth
  2015-12-03 14:53   ` [Qemu-devel] [Qemu-ppc] " Greg Kurz
  0 siblings, 1 reply; 9+ messages in thread
From: Thomas Huth @ 2015-12-01 21:48 UTC (permalink / raw)
  To: Greg Kurz, David Gibson, Michael S. Tsirkin
  Cc: qemu-ppc, qemu-devel, Nikunj A Dadhania

On 30/11/15 11:45, Greg Kurz wrote:
> Since commit 1d2d974244c6 "spapr_pci: enumerate and add PCI device tree", QEMU
> populates the PCI device tree in the opposite order compared to SLOF.
> 
> Before 1d2d974244c6:
> 
> Populating /pci@800000020000000
>                      00 0000 (D) : 1af4 1000    virtio [ net ]
>                      00 0800 (D) : 1af4 1001    virtio [ block ]
>                      00 1000 (D) : 1af4 1009    virtio [ network ]
> Populating /pci@800000020000000/unknown-legacy-device@2
> 
> 
> 7e5294b8 :  /pci@800000020000000
> 7e52b998 :  |-- ethernet@0
> 7e52c0c8 :  |-- scsi@1
> 7e52c7e8 :  +-- unknown-legacy-device@2 ok
> 
> Since 1d2d974244c6:
> 
> Populating /pci@800000020000000
>                      00 1000 (D) : 1af4 1009    virtio [ network ]
> Populating /pci@800000020000000/unknown-legacy-device@2
>                      00 0800 (D) : 1af4 1001    virtio [ block ]
>                      00 0000 (D) : 1af4 1000    virtio [ net ]
> 
> 
> 7e5e8118 :  /pci@800000020000000
> 7e5ea6a0 :  |-- unknown-legacy-device@2
> 7e5eadb8 :  |-- scsi@1
> 7e5eb4d8 :  +-- ethernet@0 ok
> 
> This behaviour change is not actually a bug since no assumptions should be
> made on DT ordering. But it has no real justification either, other than
> being the consequence of the way fdt_add_subnode() inserts new elements
> to the front of the FDT rather than adding them to the tail.
> 
> This patch reverts to the historical SLOF ordering by walking PCI devices in
> reverse order.

I've applied your patch here locally, and indeed, the device tree looks
nicer to me, too, when the nodes are listed in ascending order.

Tested-by: Thomas Huth <thuth@redhat.com>

^ permalink raw reply	[flat|nested] 9+ messages in thread

* Re: [Qemu-devel] [Qemu-ppc] [PATCH] spapr/pci: populate PCI DT in reverse order
  2015-12-01 21:48 ` Thomas Huth
@ 2015-12-03 14:53   ` Greg Kurz
  2015-12-17  8:43     ` Greg Kurz
  0 siblings, 1 reply; 9+ messages in thread
From: Greg Kurz @ 2015-12-03 14:53 UTC (permalink / raw)
  To: Thomas Huth; +Cc: Michael S. Tsirkin, qemu-ppc, qemu-devel, David Gibson

On Tue, 1 Dec 2015 22:48:38 +0100
Thomas Huth <thuth@redhat.com> wrote:

> On 30/11/15 11:45, Greg Kurz wrote:
> > Since commit 1d2d974244c6 "spapr_pci: enumerate and add PCI device tree", QEMU
> > populates the PCI device tree in the opposite order compared to SLOF.
> > 
> > Before 1d2d974244c6:
> > 
> > Populating /pci@800000020000000
> >                      00 0000 (D) : 1af4 1000    virtio [ net ]
> >                      00 0800 (D) : 1af4 1001    virtio [ block ]
> >                      00 1000 (D) : 1af4 1009    virtio [ network ]
> > Populating /pci@800000020000000/unknown-legacy-device@2
> > 
> > 
> > 7e5294b8 :  /pci@800000020000000
> > 7e52b998 :  |-- ethernet@0
> > 7e52c0c8 :  |-- scsi@1
> > 7e52c7e8 :  +-- unknown-legacy-device@2 ok
> > 
> > Since 1d2d974244c6:
> > 
> > Populating /pci@800000020000000
> >                      00 1000 (D) : 1af4 1009    virtio [ network ]
> > Populating /pci@800000020000000/unknown-legacy-device@2
> >                      00 0800 (D) : 1af4 1001    virtio [ block ]
> >                      00 0000 (D) : 1af4 1000    virtio [ net ]
> > 
> > 
> > 7e5e8118 :  /pci@800000020000000
> > 7e5ea6a0 :  |-- unknown-legacy-device@2
> > 7e5eadb8 :  |-- scsi@1
> > 7e5eb4d8 :  +-- ethernet@0 ok
> > 
> > This behaviour change is not actually a bug since no assumptions should be
> > made on DT ordering. But it has no real justification either, other than
> > being the consequence of the way fdt_add_subnode() inserts new elements
> > to the front of the FDT rather than adding them to the tail.
> > 
> > This patch reverts to the historical SLOF ordering by walking PCI devices in
> > reverse order.
> 
> I've applied your patch here locally, and indeed, the device tree looks
> nicer to me, too, when the nodes are listed in ascending order.
> 
> Tested-by: Thomas Huth <thuth@redhat.com>
> 
> 

Thanks for testing !

Cheers.

--
Greg

^ permalink raw reply	[flat|nested] 9+ messages in thread

* Re: [Qemu-devel] [Qemu-ppc] [PATCH] spapr/pci: populate PCI DT in reverse order
  2015-12-03 14:53   ` [Qemu-devel] [Qemu-ppc] " Greg Kurz
@ 2015-12-17  8:43     ` Greg Kurz
  2015-12-21  1:56       ` David Gibson
  0 siblings, 1 reply; 9+ messages in thread
From: Greg Kurz @ 2015-12-17  8:43 UTC (permalink / raw)
  To: David Gibson, Michael S. Tsirkin; +Cc: Thomas Huth, qemu-ppc, qemu-devel

On Thu, 3 Dec 2015 15:53:17 +0100
Greg Kurz <gkurz@linux.vnet.ibm.com> wrote:

> On Tue, 1 Dec 2015 22:48:38 +0100
> Thomas Huth <thuth@redhat.com> wrote:
> 
> > On 30/11/15 11:45, Greg Kurz wrote:
> > > Since commit 1d2d974244c6 "spapr_pci: enumerate and add PCI device tree", QEMU
> > > populates the PCI device tree in the opposite order compared to SLOF.
> > > 
> > > Before 1d2d974244c6:
> > > 
> > > Populating /pci@800000020000000
> > >                      00 0000 (D) : 1af4 1000    virtio [ net ]
> > >                      00 0800 (D) : 1af4 1001    virtio [ block ]
> > >                      00 1000 (D) : 1af4 1009    virtio [ network ]
> > > Populating /pci@800000020000000/unknown-legacy-device@2
> > > 
> > > 
> > > 7e5294b8 :  /pci@800000020000000
> > > 7e52b998 :  |-- ethernet@0
> > > 7e52c0c8 :  |-- scsi@1
> > > 7e52c7e8 :  +-- unknown-legacy-device@2 ok
> > > 
> > > Since 1d2d974244c6:
> > > 
> > > Populating /pci@800000020000000
> > >                      00 1000 (D) : 1af4 1009    virtio [ network ]
> > > Populating /pci@800000020000000/unknown-legacy-device@2
> > >                      00 0800 (D) : 1af4 1001    virtio [ block ]
> > >                      00 0000 (D) : 1af4 1000    virtio [ net ]
> > > 
> > > 
> > > 7e5e8118 :  /pci@800000020000000
> > > 7e5ea6a0 :  |-- unknown-legacy-device@2
> > > 7e5eadb8 :  |-- scsi@1
> > > 7e5eb4d8 :  +-- ethernet@0 ok
> > > 
> > > This behaviour change is not actually a bug since no assumptions should be
> > > made on DT ordering. But it has no real justification either, other than
> > > being the consequence of the way fdt_add_subnode() inserts new elements
> > > to the front of the FDT rather than adding them to the tail.
> > > 
> > > This patch reverts to the historical SLOF ordering by walking PCI devices in
> > > reverse order.
> > 
> > I've applied your patch here locally, and indeed, the device tree looks
> > nicer to me, too, when the nodes are listed in ascending order.
> > 
> > Tested-by: Thomas Huth <thuth@redhat.com>
> > 
> > 
> 

Ping ?

> Thanks for testing !
> 
> Cheers.
> 
> --
> Greg
> 
> 

^ permalink raw reply	[flat|nested] 9+ messages in thread

* Re: [Qemu-devel] [Qemu-ppc] [PATCH] spapr/pci: populate PCI DT in reverse order
  2015-12-17  8:43     ` Greg Kurz
@ 2015-12-21  1:56       ` David Gibson
  2015-12-21  8:09         ` Greg Kurz
  2015-12-23  5:47         ` Nikunj A Dadhania
  0 siblings, 2 replies; 9+ messages in thread
From: David Gibson @ 2015-12-21  1:56 UTC (permalink / raw)
  To: Greg Kurz; +Cc: Thomas Huth, qemu-ppc, qemu-devel, Michael S. Tsirkin

[-- Attachment #1: Type: text/plain, Size: 2754 bytes --]

On Thu, Dec 17, 2015 at 09:43:29AM +0100, Greg Kurz wrote:
> On Thu, 3 Dec 2015 15:53:17 +0100
> Greg Kurz <gkurz@linux.vnet.ibm.com> wrote:
> 
> > On Tue, 1 Dec 2015 22:48:38 +0100
> > Thomas Huth <thuth@redhat.com> wrote:
> > 
> > > On 30/11/15 11:45, Greg Kurz wrote:
> > > > Since commit 1d2d974244c6 "spapr_pci: enumerate and add PCI device tree", QEMU
> > > > populates the PCI device tree in the opposite order compared to SLOF.
> > > > 
> > > > Before 1d2d974244c6:
> > > > 
> > > > Populating /pci@800000020000000
> > > >                      00 0000 (D) : 1af4 1000    virtio [ net ]
> > > >                      00 0800 (D) : 1af4 1001    virtio [ block ]
> > > >                      00 1000 (D) : 1af4 1009    virtio [ network ]
> > > > Populating /pci@800000020000000/unknown-legacy-device@2
> > > > 
> > > > 
> > > > 7e5294b8 :  /pci@800000020000000
> > > > 7e52b998 :  |-- ethernet@0
> > > > 7e52c0c8 :  |-- scsi@1
> > > > 7e52c7e8 :  +-- unknown-legacy-device@2 ok
> > > > 
> > > > Since 1d2d974244c6:
> > > > 
> > > > Populating /pci@800000020000000
> > > >                      00 1000 (D) : 1af4 1009    virtio [ network ]
> > > > Populating /pci@800000020000000/unknown-legacy-device@2
> > > >                      00 0800 (D) : 1af4 1001    virtio [ block ]
> > > >                      00 0000 (D) : 1af4 1000    virtio [ net ]
> > > > 
> > > > 
> > > > 7e5e8118 :  /pci@800000020000000
> > > > 7e5ea6a0 :  |-- unknown-legacy-device@2
> > > > 7e5eadb8 :  |-- scsi@1
> > > > 7e5eb4d8 :  +-- ethernet@0 ok
> > > > 
> > > > This behaviour change is not actually a bug since no assumptions should be
> > > > made on DT ordering. But it has no real justification either, other than
> > > > being the consequence of the way fdt_add_subnode() inserts new elements
> > > > to the front of the FDT rather than adding them to the tail.
> > > > 
> > > > This patch reverts to the historical SLOF ordering by walking PCI devices in
> > > > reverse order.
> > > 
> > > I've applied your patch here locally, and indeed, the device tree looks
> > > nicer to me, too, when the nodes are listed in ascending order.
> > > 
> > > Tested-by: Thomas Huth <thuth@redhat.com>
> > > 
> > > 
> > 
> 
> Ping ?

Sorry I didn't reply.

I'm still dubious about this.  It seems like a fair bit of effort to
restore a behaviour that the client isn't supposed to be relying on
anyway.

Plus, the version with the changed order is already released, so
applying this will mean a second behaviour change.

-- 
David Gibson			| I'll have my music baroque, and my code
david AT gibson.dropbear.id.au	| minimalist, thank you.  NOT _the_ _other_
				| _way_ _around_!
http://www.ozlabs.org/~dgibson

[-- Attachment #2: signature.asc --]
[-- Type: application/pgp-signature, Size: 819 bytes --]

^ permalink raw reply	[flat|nested] 9+ messages in thread

* Re: [Qemu-devel] [Qemu-ppc] [PATCH] spapr/pci: populate PCI DT in reverse order
  2015-12-21  1:56       ` David Gibson
@ 2015-12-21  8:09         ` Greg Kurz
  2015-12-23  5:47         ` Nikunj A Dadhania
  1 sibling, 0 replies; 9+ messages in thread
From: Greg Kurz @ 2015-12-21  8:09 UTC (permalink / raw)
  To: David Gibson; +Cc: Thomas Huth, qemu-ppc, qemu-devel, Michael S. Tsirkin

On Mon, 21 Dec 2015 12:56:24 +1100
David Gibson <david@gibson.dropbear.id.au> wrote:

> On Thu, Dec 17, 2015 at 09:43:29AM +0100, Greg Kurz wrote:
> > On Thu, 3 Dec 2015 15:53:17 +0100
> > Greg Kurz <gkurz@linux.vnet.ibm.com> wrote:
> > 
> > > On Tue, 1 Dec 2015 22:48:38 +0100
> > > Thomas Huth <thuth@redhat.com> wrote:
> > > 
> > > > On 30/11/15 11:45, Greg Kurz wrote:
> > > > > Since commit 1d2d974244c6 "spapr_pci: enumerate and add PCI device tree", QEMU
> > > > > populates the PCI device tree in the opposite order compared to SLOF.
> > > > > 
> > > > > Before 1d2d974244c6:
> > > > > 
> > > > > Populating /pci@800000020000000
> > > > >                      00 0000 (D) : 1af4 1000    virtio [ net ]
> > > > >                      00 0800 (D) : 1af4 1001    virtio [ block ]
> > > > >                      00 1000 (D) : 1af4 1009    virtio [ network ]
> > > > > Populating /pci@800000020000000/unknown-legacy-device@2
> > > > > 
> > > > > 
> > > > > 7e5294b8 :  /pci@800000020000000
> > > > > 7e52b998 :  |-- ethernet@0
> > > > > 7e52c0c8 :  |-- scsi@1
> > > > > 7e52c7e8 :  +-- unknown-legacy-device@2 ok
> > > > > 
> > > > > Since 1d2d974244c6:
> > > > > 
> > > > > Populating /pci@800000020000000
> > > > >                      00 1000 (D) : 1af4 1009    virtio [ network ]
> > > > > Populating /pci@800000020000000/unknown-legacy-device@2
> > > > >                      00 0800 (D) : 1af4 1001    virtio [ block ]
> > > > >                      00 0000 (D) : 1af4 1000    virtio [ net ]
> > > > > 
> > > > > 
> > > > > 7e5e8118 :  /pci@800000020000000
> > > > > 7e5ea6a0 :  |-- unknown-legacy-device@2
> > > > > 7e5eadb8 :  |-- scsi@1
> > > > > 7e5eb4d8 :  +-- ethernet@0 ok
> > > > > 
> > > > > This behaviour change is not actually a bug since no assumptions should be
> > > > > made on DT ordering. But it has no real justification either, other than
> > > > > being the consequence of the way fdt_add_subnode() inserts new elements
> > > > > to the front of the FDT rather than adding them to the tail.
> > > > > 
> > > > > This patch reverts to the historical SLOF ordering by walking PCI devices in
> > > > > reverse order.
> > > > 
> > > > I've applied your patch here locally, and indeed, the device tree looks
> > > > nicer to me, too, when the nodes are listed in ascending order.
> > > > 
> > > > Tested-by: Thomas Huth <thuth@redhat.com>
> > > > 
> > > > 
> > > 
> > 
> > Ping ?
> 
> Sorry I didn't reply.
> 
> I'm still dubious about this.  It seems like a fair bit of effort to
> restore a behaviour that the client isn't supposed to be relying on
> anyway.
> 
> Plus, the version with the changed order is already released, so
> applying this will mean a second behaviour change.
> 

And since nobody apart from Thomas expressed interest, I guess it is
not something people dearly want. Just forget about this patch. :)

Cheers.

--
Greg

^ permalink raw reply	[flat|nested] 9+ messages in thread

* Re: [Qemu-devel] [Qemu-ppc] [PATCH] spapr/pci: populate PCI DT in reverse order
  2015-12-21  1:56       ` David Gibson
  2015-12-21  8:09         ` Greg Kurz
@ 2015-12-23  5:47         ` Nikunj A Dadhania
  1 sibling, 0 replies; 9+ messages in thread
From: Nikunj A Dadhania @ 2015-12-23  5:47 UTC (permalink / raw)
  To: David Gibson, Greg Kurz
  Cc: Thomas Huth, qemu-ppc, qemu-devel, Michael S. Tsirkin

David Gibson <david@gibson.dropbear.id.au> writes:

> On Thu, Dec 17, 2015 at 09:43:29AM +0100, Greg Kurz wrote:
>> On Thu, 3 Dec 2015 15:53:17 +0100
>> Greg Kurz <gkurz@linux.vnet.ibm.com> wrote:
>> 
>> > On Tue, 1 Dec 2015 22:48:38 +0100
>> > Thomas Huth <thuth@redhat.com> wrote:
>> > 
>> > > On 30/11/15 11:45, Greg Kurz wrote:
>> > > > Since commit 1d2d974244c6 "spapr_pci: enumerate and add PCI device tree", QEMU
>> > > > populates the PCI device tree in the opposite order compared to SLOF.
>> > > > 
>> > > > Before 1d2d974244c6:
>> > > > 
>> > > > Populating /pci@800000020000000
>> > > >                      00 0000 (D) : 1af4 1000    virtio [ net ]
>> > > >                      00 0800 (D) : 1af4 1001    virtio [ block ]
>> > > >                      00 1000 (D) : 1af4 1009    virtio [ network ]
>> > > > Populating /pci@800000020000000/unknown-legacy-device@2
>> > > > 
>> > > > 
>> > > > 7e5294b8 :  /pci@800000020000000
>> > > > 7e52b998 :  |-- ethernet@0
>> > > > 7e52c0c8 :  |-- scsi@1
>> > > > 7e52c7e8 :  +-- unknown-legacy-device@2 ok
>> > > > 
>> > > > Since 1d2d974244c6:
>> > > > 
>> > > > Populating /pci@800000020000000
>> > > >                      00 1000 (D) : 1af4 1009    virtio [ network ]
>> > > > Populating /pci@800000020000000/unknown-legacy-device@2
>> > > >                      00 0800 (D) : 1af4 1001    virtio [ block ]
>> > > >                      00 0000 (D) : 1af4 1000    virtio [ net ]
>> > > > 
>> > > > 
>> > > > 7e5e8118 :  /pci@800000020000000
>> > > > 7e5ea6a0 :  |-- unknown-legacy-device@2
>> > > > 7e5eadb8 :  |-- scsi@1
>> > > > 7e5eb4d8 :  +-- ethernet@0 ok
>> > > > 
>> > > > This behaviour change is not actually a bug since no assumptions should be
>> > > > made on DT ordering. But it has no real justification either, other than
>> > > > being the consequence of the way fdt_add_subnode() inserts new elements
>> > > > to the front of the FDT rather than adding them to the tail.
>> > > > 
>> > > > This patch reverts to the historical SLOF ordering by walking PCI devices in
>> > > > reverse order.
>> > > 
>> > > I've applied your patch here locally, and indeed, the device tree looks
>> > > nicer to me, too, when the nodes are listed in ascending order.
>> > > 
>> > > Tested-by: Thomas Huth <thuth@redhat.com>
>> > > 
>> > > 
>> > 
>> 
>> Ping ?
>
> Sorry I didn't reply.
>
> I'm still dubious about this.  It seems like a fair bit of effort to
> restore a behaviour that the client isn't supposed to be relying on
> anyway.
>
> Plus, the version with the changed order is already released, so
> applying this will mean a second behaviour change.

The behaviour change was not intentional by me, so I would vote for
restoring the old order.

Reviewed-by: Nikunj A Dadhania <nikunj@linux.vnet.ibm.com>

Regards
Nikunj

^ permalink raw reply	[flat|nested] 9+ messages in thread

* Re: [Qemu-devel] [Qemu-ppc] [PATCH] spapr/pci: populate PCI DT in reverse order
  2017-02-27 22:20 ` [Qemu-devel] [Qemu-ppc] " Greg Kurz
@ 2017-03-01  1:07   ` David Gibson
  0 siblings, 0 replies; 9+ messages in thread
From: David Gibson @ 2017-03-01  1:07 UTC (permalink / raw)
  To: Greg Kurz
  Cc: Thomas Huth, Michael S. Tsirkin, qemu-ppc, Marcel Apfelbaum, qemu-devel

[-- Attachment #1: Type: text/plain, Size: 7737 bytes --]

On Mon, Feb 27, 2017 at 11:20:16PM +0100, Greg Kurz wrote:
> David,
> 
> Any chances to have this in 2.9 ?

Yes.  I've put it in my tree and I'm hoping to send a pull request
shortly.  Actually, I was hoping to send it yesterday, but hit a bug
during testing which I'm now chasing.

> 
> On Wed, 22 Feb 2017 11:56:53 +0100
> Greg Kurz <groug@kaod.org> wrote:
> 
> > From: Greg Kurz <gkurz@linux.vnet.ibm.com>
> > 
> > Since commit 1d2d974244c6 "spapr_pci: enumerate and add PCI device tree", QEMU
> > populates the PCI device tree in the opposite order compared to SLOF.
> > 
> > Before 1d2d974244c6:
> > 
> > Populating /pci@800000020000000
> >                      00 0000 (D) : 1af4 1000    virtio [ net ]
> >                      00 0800 (D) : 1af4 1001    virtio [ block ]
> >                      00 1000 (D) : 1af4 1009    virtio [ network ]
> > Populating /pci@800000020000000/unknown-legacy-device@2
> > 
> > 7e5294b8 :  /pci@800000020000000
> > 7e52b998 :  |-- ethernet@0
> > 7e52c0c8 :  |-- scsi@1
> > 7e52c7e8 :  +-- unknown-legacy-device@2 ok
> > 
> > Since 1d2d974244c6:
> > 
> > Populating /pci@800000020000000
> >                      00 1000 (D) : 1af4 1009    virtio [ network ]
> > Populating /pci@800000020000000/unknown-legacy-device@2
> >                      00 0800 (D) : 1af4 1001    virtio [ block ]
> >                      00 0000 (D) : 1af4 1000    virtio [ net ]
> > 
> > 7e5e8118 :  /pci@800000020000000
> > 7e5ea6a0 :  |-- unknown-legacy-device@2
> > 7e5eadb8 :  |-- scsi@1
> > 7e5eb4d8 :  +-- ethernet@0 ok
> > 
> > This behaviour change is not actually a bug since no assumptions should be
> > made on DT ordering. But it has no real justification either, other than
> > being the consequence of the way fdt_add_subnode() inserts new elements
> > to the front of the FDT rather than adding them to the tail.
> > 
> > This patch reverts to the historical SLOF ordering by walking PCI devices
> > in reverse order. This reconciles pseries with x86 machine types behavior.
> > It is expected to make things easier when porting existing applications to
> > power.
> > 
> > Signed-off-by: Greg Kurz <gkurz@linux.vnet.ibm.com>
> > Tested-by: Thomas Huth <thuth@redhat.com>
> > Reviewed-by: Nikunj A Dadhania <nikunj@linux.vnet.ibm.com>
> > (slight update to the changelog)
> > Signed-off-by: Greg Kurz <groug@kaod.org>
> > ---
> >  hw/pci/pci.c         |   28 ++++++++++++++++++++++++++++
> >  hw/ppc/spapr_pci.c   |   12 ++++++------
> >  include/hw/pci/pci.h |    4 ++++
> >  3 files changed, 38 insertions(+), 6 deletions(-)
> > 
> > David,
> > 
> > This patch was posted and already discussed during 2.5 development:
> > 
> > http://patchwork.ozlabs.org/patch/549925/
> > 
> > The "consensus" at the time was that guests should not rely on device
> > ordering (i.e. use persistent naming instead).
> > 
> > I got recently contacted by OpenStack people who had several complaints
> > about the reverse ordering of PCI devices in pseries: different behavior
> > between ppc64 and x86, lots of time spent in debugging when porting
> > applications from x86 to ppc64 before realizing that it is caused by the
> > reverse ordering, necessity to carry hacky workarounds...
> > 
> > One strong argument against handling this properly with persistent naming
> > is that it requires systemd/udev. This option is considered as painful
> > with CirrOS, which aims at remaining as minimal as possible and is widely
> > used in the OpenStack ecosystem.
> > 
> > Would you re-consider your position and apply this patch ?
> > 
> > Cheers.
> > 
> > diff --git a/hw/pci/pci.c b/hw/pci/pci.c
> > index a563555e7da7..273f1e46025a 100644
> > --- a/hw/pci/pci.c
> > +++ b/hw/pci/pci.c
> > @@ -1530,6 +1530,34 @@ static const pci_class_desc pci_class_descriptions[] =
> >      { 0, NULL}
> >  };
> >  
> > +static void pci_for_each_device_under_bus_reverse(PCIBus *bus,
> > +                                                  void (*fn)(PCIBus *b,
> > +                                                             PCIDevice *d,
> > +                                                             void *opaque),
> > +                                                  void *opaque)
> > +{
> > +    PCIDevice *d;
> > +    int devfn;
> > +
> > +    for (devfn = 0; devfn < ARRAY_SIZE(bus->devices); devfn++) {
> > +        d = bus->devices[ARRAY_SIZE(bus->devices) - 1 - devfn];
> > +        if (d) {
> > +            fn(bus, d, opaque);
> > +        }
> > +    }
> > +}
> > +
> > +void pci_for_each_device_reverse(PCIBus *bus, int bus_num,
> > +                         void (*fn)(PCIBus *b, PCIDevice *d, void *opaque),
> > +                         void *opaque)
> > +{
> > +    bus = pci_find_bus_nr(bus, bus_num);
> > +
> > +    if (bus) {
> > +        pci_for_each_device_under_bus_reverse(bus, fn, opaque);
> > +    }
> > +}
> > +
> >  static void pci_for_each_device_under_bus(PCIBus *bus,
> >                                            void (*fn)(PCIBus *b, PCIDevice *d,
> >                                                       void *opaque),
> > diff --git a/hw/ppc/spapr_pci.c b/hw/ppc/spapr_pci.c
> > index fd6fc1d95344..2a20c2a140fc 100644
> > --- a/hw/ppc/spapr_pci.c
> > +++ b/hw/ppc/spapr_pci.c
> > @@ -1782,9 +1782,9 @@ static void spapr_populate_pci_devices_dt(PCIBus *bus, PCIDevice *pdev,
> >      s_fdt.fdt = p->fdt;
> >      s_fdt.node_off = offset;
> >      s_fdt.sphb = p->sphb;
> > -    pci_for_each_device(sec_bus, pci_bus_num(sec_bus),
> > -                        spapr_populate_pci_devices_dt,
> > -                        &s_fdt);
> > +    pci_for_each_device_reverse(sec_bus, pci_bus_num(sec_bus),
> > +                                spapr_populate_pci_devices_dt,
> > +                                &s_fdt);
> >  }
> >  
> >  static void spapr_phb_pci_enumerate_bridge(PCIBus *bus, PCIDevice *pdev,
> > @@ -1953,9 +1953,9 @@ int spapr_populate_pci_dt(sPAPRPHBState *phb,
> >      s_fdt.fdt = fdt;
> >      s_fdt.node_off = bus_off;
> >      s_fdt.sphb = phb;
> > -    pci_for_each_device(bus, pci_bus_num(bus),
> > -                        spapr_populate_pci_devices_dt,
> > -                        &s_fdt);
> > +    pci_for_each_device_reverse(bus, pci_bus_num(bus),
> > +                                spapr_populate_pci_devices_dt,
> > +                                &s_fdt);
> >  
> >      ret = spapr_drc_populate_dt(fdt, bus_off, OBJECT(phb),
> >                                  SPAPR_DR_CONNECTOR_TYPE_PCI);
> > diff --git a/include/hw/pci/pci.h b/include/hw/pci/pci.h
> > index 6983f13745a5..9349acbfb278 100644
> > --- a/include/hw/pci/pci.h
> > +++ b/include/hw/pci/pci.h
> > @@ -429,6 +429,10 @@ int pci_bus_numa_node(PCIBus *bus);
> >  void pci_for_each_device(PCIBus *bus, int bus_num,
> >                           void (*fn)(PCIBus *bus, PCIDevice *d, void *opaque),
> >                           void *opaque);
> > +void pci_for_each_device_reverse(PCIBus *bus, int bus_num,
> > +                                 void (*fn)(PCIBus *bus, PCIDevice *d,
> > +                                            void *opaque),
> > +                                 void *opaque);
> >  void pci_for_each_bus_depth_first(PCIBus *bus,
> >                                    void *(*begin)(PCIBus *bus, void *parent_state),
> >                                    void (*end)(PCIBus *bus, void *state),
> > 
> > 
> 



-- 
David Gibson			| I'll have my music baroque, and my code
david AT gibson.dropbear.id.au	| minimalist, thank you.  NOT _the_ _other_
				| _way_ _around_!
http://www.ozlabs.org/~dgibson

[-- Attachment #2: signature.asc --]
[-- Type: application/pgp-signature, Size: 819 bytes --]

^ permalink raw reply	[flat|nested] 9+ messages in thread

* Re: [Qemu-devel] [Qemu-ppc] [PATCH] spapr/pci: populate PCI DT in reverse order
  2017-02-22 10:56 [Qemu-devel] " Greg Kurz
@ 2017-02-27 22:20 ` Greg Kurz
  2017-03-01  1:07   ` David Gibson
  0 siblings, 1 reply; 9+ messages in thread
From: Greg Kurz @ 2017-02-27 22:20 UTC (permalink / raw)
  To: David Gibson
  Cc: Thomas Huth, Michael S. Tsirkin, qemu-ppc, Marcel Apfelbaum, qemu-devel

[-- Attachment #1: Type: text/plain, Size: 6956 bytes --]

David,

Any chances to have this in 2.9 ?

On Wed, 22 Feb 2017 11:56:53 +0100
Greg Kurz <groug@kaod.org> wrote:

> From: Greg Kurz <gkurz@linux.vnet.ibm.com>
> 
> Since commit 1d2d974244c6 "spapr_pci: enumerate and add PCI device tree", QEMU
> populates the PCI device tree in the opposite order compared to SLOF.
> 
> Before 1d2d974244c6:
> 
> Populating /pci@800000020000000
>                      00 0000 (D) : 1af4 1000    virtio [ net ]
>                      00 0800 (D) : 1af4 1001    virtio [ block ]
>                      00 1000 (D) : 1af4 1009    virtio [ network ]
> Populating /pci@800000020000000/unknown-legacy-device@2
> 
> 7e5294b8 :  /pci@800000020000000
> 7e52b998 :  |-- ethernet@0
> 7e52c0c8 :  |-- scsi@1
> 7e52c7e8 :  +-- unknown-legacy-device@2 ok
> 
> Since 1d2d974244c6:
> 
> Populating /pci@800000020000000
>                      00 1000 (D) : 1af4 1009    virtio [ network ]
> Populating /pci@800000020000000/unknown-legacy-device@2
>                      00 0800 (D) : 1af4 1001    virtio [ block ]
>                      00 0000 (D) : 1af4 1000    virtio [ net ]
> 
> 7e5e8118 :  /pci@800000020000000
> 7e5ea6a0 :  |-- unknown-legacy-device@2
> 7e5eadb8 :  |-- scsi@1
> 7e5eb4d8 :  +-- ethernet@0 ok
> 
> This behaviour change is not actually a bug since no assumptions should be
> made on DT ordering. But it has no real justification either, other than
> being the consequence of the way fdt_add_subnode() inserts new elements
> to the front of the FDT rather than adding them to the tail.
> 
> This patch reverts to the historical SLOF ordering by walking PCI devices
> in reverse order. This reconciles pseries with x86 machine types behavior.
> It is expected to make things easier when porting existing applications to
> power.
> 
> Signed-off-by: Greg Kurz <gkurz@linux.vnet.ibm.com>
> Tested-by: Thomas Huth <thuth@redhat.com>
> Reviewed-by: Nikunj A Dadhania <nikunj@linux.vnet.ibm.com>
> (slight update to the changelog)
> Signed-off-by: Greg Kurz <groug@kaod.org>
> ---
>  hw/pci/pci.c         |   28 ++++++++++++++++++++++++++++
>  hw/ppc/spapr_pci.c   |   12 ++++++------
>  include/hw/pci/pci.h |    4 ++++
>  3 files changed, 38 insertions(+), 6 deletions(-)
> 
> David,
> 
> This patch was posted and already discussed during 2.5 development:
> 
> http://patchwork.ozlabs.org/patch/549925/
> 
> The "consensus" at the time was that guests should not rely on device
> ordering (i.e. use persistent naming instead).
> 
> I got recently contacted by OpenStack people who had several complaints
> about the reverse ordering of PCI devices in pseries: different behavior
> between ppc64 and x86, lots of time spent in debugging when porting
> applications from x86 to ppc64 before realizing that it is caused by the
> reverse ordering, necessity to carry hacky workarounds...
> 
> One strong argument against handling this properly with persistent naming
> is that it requires systemd/udev. This option is considered as painful
> with CirrOS, which aims at remaining as minimal as possible and is widely
> used in the OpenStack ecosystem.
> 
> Would you re-consider your position and apply this patch ?
> 
> Cheers.
> 
> diff --git a/hw/pci/pci.c b/hw/pci/pci.c
> index a563555e7da7..273f1e46025a 100644
> --- a/hw/pci/pci.c
> +++ b/hw/pci/pci.c
> @@ -1530,6 +1530,34 @@ static const pci_class_desc pci_class_descriptions[] =
>      { 0, NULL}
>  };
>  
> +static void pci_for_each_device_under_bus_reverse(PCIBus *bus,
> +                                                  void (*fn)(PCIBus *b,
> +                                                             PCIDevice *d,
> +                                                             void *opaque),
> +                                                  void *opaque)
> +{
> +    PCIDevice *d;
> +    int devfn;
> +
> +    for (devfn = 0; devfn < ARRAY_SIZE(bus->devices); devfn++) {
> +        d = bus->devices[ARRAY_SIZE(bus->devices) - 1 - devfn];
> +        if (d) {
> +            fn(bus, d, opaque);
> +        }
> +    }
> +}
> +
> +void pci_for_each_device_reverse(PCIBus *bus, int bus_num,
> +                         void (*fn)(PCIBus *b, PCIDevice *d, void *opaque),
> +                         void *opaque)
> +{
> +    bus = pci_find_bus_nr(bus, bus_num);
> +
> +    if (bus) {
> +        pci_for_each_device_under_bus_reverse(bus, fn, opaque);
> +    }
> +}
> +
>  static void pci_for_each_device_under_bus(PCIBus *bus,
>                                            void (*fn)(PCIBus *b, PCIDevice *d,
>                                                       void *opaque),
> diff --git a/hw/ppc/spapr_pci.c b/hw/ppc/spapr_pci.c
> index fd6fc1d95344..2a20c2a140fc 100644
> --- a/hw/ppc/spapr_pci.c
> +++ b/hw/ppc/spapr_pci.c
> @@ -1782,9 +1782,9 @@ static void spapr_populate_pci_devices_dt(PCIBus *bus, PCIDevice *pdev,
>      s_fdt.fdt = p->fdt;
>      s_fdt.node_off = offset;
>      s_fdt.sphb = p->sphb;
> -    pci_for_each_device(sec_bus, pci_bus_num(sec_bus),
> -                        spapr_populate_pci_devices_dt,
> -                        &s_fdt);
> +    pci_for_each_device_reverse(sec_bus, pci_bus_num(sec_bus),
> +                                spapr_populate_pci_devices_dt,
> +                                &s_fdt);
>  }
>  
>  static void spapr_phb_pci_enumerate_bridge(PCIBus *bus, PCIDevice *pdev,
> @@ -1953,9 +1953,9 @@ int spapr_populate_pci_dt(sPAPRPHBState *phb,
>      s_fdt.fdt = fdt;
>      s_fdt.node_off = bus_off;
>      s_fdt.sphb = phb;
> -    pci_for_each_device(bus, pci_bus_num(bus),
> -                        spapr_populate_pci_devices_dt,
> -                        &s_fdt);
> +    pci_for_each_device_reverse(bus, pci_bus_num(bus),
> +                                spapr_populate_pci_devices_dt,
> +                                &s_fdt);
>  
>      ret = spapr_drc_populate_dt(fdt, bus_off, OBJECT(phb),
>                                  SPAPR_DR_CONNECTOR_TYPE_PCI);
> diff --git a/include/hw/pci/pci.h b/include/hw/pci/pci.h
> index 6983f13745a5..9349acbfb278 100644
> --- a/include/hw/pci/pci.h
> +++ b/include/hw/pci/pci.h
> @@ -429,6 +429,10 @@ int pci_bus_numa_node(PCIBus *bus);
>  void pci_for_each_device(PCIBus *bus, int bus_num,
>                           void (*fn)(PCIBus *bus, PCIDevice *d, void *opaque),
>                           void *opaque);
> +void pci_for_each_device_reverse(PCIBus *bus, int bus_num,
> +                                 void (*fn)(PCIBus *bus, PCIDevice *d,
> +                                            void *opaque),
> +                                 void *opaque);
>  void pci_for_each_bus_depth_first(PCIBus *bus,
>                                    void *(*begin)(PCIBus *bus, void *parent_state),
>                                    void (*end)(PCIBus *bus, void *state),
> 
> 


[-- Attachment #2: OpenPGP digital signature --]
[-- Type: application/pgp-signature, Size: 181 bytes --]

^ permalink raw reply	[flat|nested] 9+ messages in thread

end of thread, other threads:[~2017-03-01  1:38 UTC | newest]

Thread overview: 9+ messages (download: mbox.gz / follow: Atom feed)
-- links below jump to the message on this page --
2015-11-30 10:45 [Qemu-devel] [PATCH] spapr/pci: populate PCI DT in reverse order Greg Kurz
2015-12-01 21:48 ` Thomas Huth
2015-12-03 14:53   ` [Qemu-devel] [Qemu-ppc] " Greg Kurz
2015-12-17  8:43     ` Greg Kurz
2015-12-21  1:56       ` David Gibson
2015-12-21  8:09         ` Greg Kurz
2015-12-23  5:47         ` Nikunj A Dadhania
2017-02-22 10:56 [Qemu-devel] " Greg Kurz
2017-02-27 22:20 ` [Qemu-devel] [Qemu-ppc] " Greg Kurz
2017-03-01  1:07   ` David Gibson

This is an external index of several public inboxes,
see mirroring instructions on how to clone and mirror
all data and code used by this external index.