from:"Andre Przywara"

[PATCH v5 09/10] arm: add support for supplying GICv3 redistributor addresses

2015-07-03 Thread Andre Przywara

Instead of the GIC virtual CPU interface, an emulated GICv3 needs to
have accesses to its emulated redistributors trapped in the guest.
Add code to tell the kernel about the mapping if a GICv3 emulation was
requested by the user.

This contains some defines which are not (yet) in the (32 bit) header
files to allow compilation for ARM.

Signed-off-by: Andre Przywara andre.przyw...@arm.com
Reviewed-by: Marc Zyngier marc.zyng...@arm.com
---
 arm/gic.c | 36 +++-
 arm/include/arm-common/gic.h  |  1 +
 arm/include/arm-common/kvm-arch.h |  7 +++
 3 files changed, 43 insertions(+), 1 deletion(-)

diff --git a/arm/gic.c b/arm/gic.c
index b6c5868..efe4b42 100644
--- a/arm/gic.c
+++ b/arm/gic.c
@@ -9,7 +9,18 @@
 #include linux/kernel.h
 #include linux/kvm.h
 
+/* Those names are not defined for ARM (yet) */
+#ifndef KVM_VGIC_V3_ADDR_TYPE_DIST
+#define KVM_VGIC_V3_ADDR_TYPE_DIST 2
+#endif
+
+#ifndef KVM_VGIC_V3_ADDR_TYPE_REDIST
+#define KVM_VGIC_V3_ADDR_TYPE_REDIST 3
+#endif
+
 static int gic_fd = -1;
+static u64 gic_redists_base;
+static u64 gic_redists_size;
 
 static int gic__create_device(struct kvm *kvm, enum irqchip_type type)
 {
@@ -28,12 +39,21 @@ static int gic__create_device(struct kvm *kvm, enum 
irqchip_type type)
.group  = KVM_DEV_ARM_VGIC_GRP_ADDR,
.addr   = (u64)(unsigned long)dist_addr,
};
+   struct kvm_device_attr redist_attr = {
+   .group  = KVM_DEV_ARM_VGIC_GRP_ADDR,
+   .attr   = KVM_VGIC_V3_ADDR_TYPE_REDIST,
+   .addr   = (u64)(unsigned long)gic_redists_base,
+   };
 
switch (type) {
case IRQCHIP_GICV2:
gic_device.type = KVM_DEV_TYPE_ARM_VGIC_V2;
dist_attr.attr  = KVM_VGIC_V2_ADDR_TYPE_DIST;
break;
+   case IRQCHIP_GICV3:
+   gic_device.type = KVM_DEV_TYPE_ARM_VGIC_V3;
+   dist_attr.attr  = KVM_VGIC_V3_ADDR_TYPE_DIST;
+   break;
}
 
err = ioctl(kvm-vm_fd, KVM_CREATE_DEVICE, gic_device);
@@ -46,6 +66,9 @@ static int gic__create_device(struct kvm *kvm, enum 
irqchip_type type)
case IRQCHIP_GICV2:
err = ioctl(gic_fd, KVM_SET_DEVICE_ATTR, cpu_if_attr);
break;
+   case IRQCHIP_GICV3:
+   err = ioctl(gic_fd, KVM_SET_DEVICE_ATTR, redist_attr);
+   break;
}
if (err)
goto out_err;
@@ -97,6 +120,10 @@ int gic__create(struct kvm *kvm, enum irqchip_type type)
switch (type) {
case IRQCHIP_GICV2:
break;
+   case IRQCHIP_GICV3:
+   gic_redists_size = kvm-cfg.nrcpus * ARM_GIC_REDIST_SIZE;
+   gic_redists_base = ARM_GIC_DIST_BASE - gic_redists_size;
+   break;
default:
return -ENODEV;
}
@@ -156,12 +183,19 @@ void gic__generate_fdt_nodes(void *fdt, u32 phandle, enum 
irqchip_type type)
const char *compatible;
u64 reg_prop[] = {
cpu_to_fdt64(ARM_GIC_DIST_BASE), 
cpu_to_fdt64(ARM_GIC_DIST_SIZE),
-   cpu_to_fdt64(ARM_GIC_CPUI_BASE), 
cpu_to_fdt64(ARM_GIC_CPUI_SIZE),
+   0, 0,   /* to be filled */
};
 
switch (type) {
case IRQCHIP_GICV2:
compatible = arm,cortex-a15-gic;
+   reg_prop[2] = cpu_to_fdt64(ARM_GIC_CPUI_BASE);
+   reg_prop[3] = cpu_to_fdt64(ARM_GIC_CPUI_SIZE);
+   break;
+   case IRQCHIP_GICV3:
+   compatible = arm,gic-v3;
+   reg_prop[2] = cpu_to_fdt64(gic_redists_base);
+   reg_prop[3] = cpu_to_fdt64(gic_redists_size);
break;
default:
return;
diff --git a/arm/include/arm-common/gic.h b/arm/include/arm-common/gic.h
index d524f55..4fde5ac 100644
--- a/arm/include/arm-common/gic.h
+++ b/arm/include/arm-common/gic.h
@@ -23,6 +23,7 @@
 
 enum irqchip_type {
IRQCHIP_GICV2,
+   IRQCHIP_GICV3,
 };
 
 struct kvm;
diff --git a/arm/include/arm-common/kvm-arch.h 
b/arm/include/arm-common/kvm-arch.h
index 90d6733..0f5fb7f 100644
--- a/arm/include/arm-common/kvm-arch.h
+++ b/arm/include/arm-common/kvm-arch.h
@@ -30,6 +30,13 @@
 #define KVM_PCI_MMIO_AREA  (KVM_PCI_CFG_AREA + ARM_PCI_CFG_SIZE)
 #define KVM_VIRTIO_MMIO_AREA   ARM_MMIO_AREA
 
+/*
+ * On a GICv3 there must be one redistributor per vCPU.
+ * The value here is the size for one, we multiply this at runtime with
+ * the number of requested vCPUs to get the actual size.
+ */
+#define ARM_GIC_REDIST_SIZE0x2
+
 #define KVM_IRQ_OFFSET GIC_SPI_IRQ_BASE
 
 #define KVM_VM_TYPE0
-- 
2.3.5

--
To unsubscribe from this list: send the line unsubscribe kvm in
the body of a message to majord...@vger.kernel.org
More majordomo info at  http://vger.kernel.org/majordomo-info.html

[PATCH v5 04/10] AArch{32,64}: dynamically configure the number of GIC interrupts

2015-07-03 Thread Andre Przywara

From: Marc Zyngier marc.zyng...@arm.com

In order to reduce the memory usage of large guests (as well
as improve performance), tell KVM about the number of interrupts
we require.

To avoid having to synchronize with the creation of the various
devices, use a late_init callback to compute the GIC configuration.
[Andre: rename to gic__init_gic() to ease future expansion]

Signed-off-by: Marc Zyngier marc.zyng...@arm.com
Signed-off-by: Andre Przywara andre.przyw...@arm.com
---
 arm/gic.c | 25 +
 1 file changed, 25 insertions(+)

diff --git a/arm/gic.c b/arm/gic.c
index 1ff3663..8560c9b 100644
--- a/arm/gic.c
+++ b/arm/gic.c
@@ -1,10 +1,12 @@
 #include kvm/fdt.h
+#include kvm/irq.h
 #include kvm/kvm.h
 #include kvm/virtio.h
 
 #include arm-common/gic.h
 
 #include linux/byteorder.h
+#include linux/kernel.h
 #include linux/kvm.h
 
 static int gic_fd = -1;
@@ -96,6 +98,29 @@ int gic__create(struct kvm *kvm)
return err;
 }
 
+static int gic__init_gic(struct kvm *kvm)
+{
+   int lines = irq__get_nr_allocated_lines();
+   u32 nr_irqs = ALIGN(lines, 32) + GIC_SPI_IRQ_BASE;
+   struct kvm_device_attr nr_irqs_attr = {
+   .group  = KVM_DEV_ARM_VGIC_GRP_NR_IRQS,
+   .addr   = (u64)(unsigned long)nr_irqs,
+   };
+
+   /*
+* If we didn't use the KVM_CREATE_DEVICE method, KVM will
+* give us some default number of interrupts.
+*/
+   if (gic_fd  0)
+   return 0;
+
+   if (!ioctl(gic_fd, KVM_HAS_DEVICE_ATTR, nr_irqs_attr))
+   return ioctl(gic_fd, KVM_SET_DEVICE_ATTR, nr_irqs_attr);
+
+   return 0;
+}
+late_init(gic__init_gic)
+
 void gic__generate_fdt_nodes(void *fdt, u32 phandle)
 {
u64 reg_prop[] = {
-- 
2.3.5

--
To unsubscribe from this list: send the line unsubscribe kvm in
the body of a message to majord...@vger.kernel.org
More majordomo info at  http://vger.kernel.org/majordomo-info.html

[PATCH v5 06/10] arm: simplify MMIO dispatching

2015-07-03 Thread Andre Przywara

Currently we separate any incoming MMIO request into one of the ARM
memory map regions and take care to spare the GIC.
It turns out that this is unnecessary, as we only have one special
region (the IO port area in the first 64 KByte). The MMIO rbtree
takes care of unhandled MMIO ranges, so we can simply drop all the
special range checking (except that for the IO range) in
kvm_cpu__emulate_mmio().
As the GIC is handled in the kernel, a GIC MMIO access should never
reach userland (and we don't know what to do with it anyway).
This lets us delete some more code and simplifies future extensions
(like expanding the GIC regions).
To be in line with the other architectures, move the now simpler
code into a header file.

Signed-off-by: Andre Przywara andre.przyw...@arm.com
Reviewed-by: Marc Zyngier marc.zyng...@arm.com
---
 arm/include/arm-common/kvm-arch.h | 12 
 arm/include/arm-common/kvm-cpu-arch.h | 14 --
 arm/kvm-cpu.c | 16 
 3 files changed, 12 insertions(+), 30 deletions(-)

diff --git a/arm/include/arm-common/kvm-arch.h 
b/arm/include/arm-common/kvm-arch.h
index 082131d..90d6733 100644
--- a/arm/include/arm-common/kvm-arch.h
+++ b/arm/include/arm-common/kvm-arch.h
@@ -45,18 +45,6 @@ static inline bool arm_addr_in_ioport_region(u64 phys_addr)
return phys_addr = KVM_IOPORT_AREA  phys_addr  limit;
 }
 
-static inline bool arm_addr_in_virtio_mmio_region(u64 phys_addr)
-{
-   u64 limit = KVM_VIRTIO_MMIO_AREA + ARM_VIRTIO_MMIO_SIZE;
-   return phys_addr = KVM_VIRTIO_MMIO_AREA  phys_addr  limit;
-}
-
-static inline bool arm_addr_in_pci_region(u64 phys_addr)
-{
-   u64 limit = KVM_PCI_CFG_AREA + ARM_PCI_CFG_SIZE + ARM_PCI_MMIO_SIZE;
-   return phys_addr = KVM_PCI_CFG_AREA  phys_addr  limit;
-}
-
 struct kvm_arch {
/*
 * We may have to align the guest memory for virtio, so keep the
diff --git a/arm/include/arm-common/kvm-cpu-arch.h 
b/arm/include/arm-common/kvm-cpu-arch.h
index 36c7872..329979a 100644
--- a/arm/include/arm-common/kvm-cpu-arch.h
+++ b/arm/include/arm-common/kvm-cpu-arch.h
@@ -44,8 +44,18 @@ static inline bool kvm_cpu__emulate_io(struct kvm_cpu *vcpu, 
u16 port, void *dat
return false;
 }
 
-bool kvm_cpu__emulate_mmio(struct kvm_cpu *vcpu, u64 phys_addr, u8 *data,
-  u32 len, u8 is_write);
+static inline bool kvm_cpu__emulate_mmio(struct kvm_cpu *vcpu, u64 phys_addr,
+u8 *data, u32 len, u8 is_write)
+{
+   if (arm_addr_in_ioport_region(phys_addr)) {
+   int direction = is_write ? KVM_EXIT_IO_OUT : KVM_EXIT_IO_IN;
+   u16 port = (phys_addr - KVM_IOPORT_AREA)  USHRT_MAX;
+
+   return kvm__emulate_io(vcpu, port, data, direction, len, 1);
+   }
+
+   return kvm__emulate_mmio(vcpu, phys_addr, data, len, is_write);
+}
 
 unsigned long kvm_cpu__get_vcpu_mpidr(struct kvm_cpu *vcpu);
 
diff --git a/arm/kvm-cpu.c b/arm/kvm-cpu.c
index ab08815..7780251 100644
--- a/arm/kvm-cpu.c
+++ b/arm/kvm-cpu.c
@@ -139,22 +139,6 @@ bool kvm_cpu__handle_exit(struct kvm_cpu *vcpu)
return false;
 }
 
-bool kvm_cpu__emulate_mmio(struct kvm_cpu *vcpu, u64 phys_addr, u8 *data,
-  u32 len, u8 is_write)
-{
-   if (arm_addr_in_virtio_mmio_region(phys_addr)) {
-   return kvm__emulate_mmio(vcpu, phys_addr, data, len, is_write);
-   } else if (arm_addr_in_ioport_region(phys_addr)) {
-   int direction = is_write ? KVM_EXIT_IO_OUT : KVM_EXIT_IO_IN;
-   u16 port = (phys_addr - KVM_IOPORT_AREA)  USHRT_MAX;
-   return kvm__emulate_io(vcpu, port, data, direction, len, 1);
-   } else if (arm_addr_in_pci_region(phys_addr)) {
-   return kvm__emulate_mmio(vcpu, phys_addr, data, len, is_write);
-   }
-
-   return false;
-}
-
 void kvm_cpu__show_page_tables(struct kvm_cpu *vcpu)
 {
 }
-- 
2.3.5

--
To unsubscribe from this list: send the line unsubscribe kvm in
the body of a message to majord...@vger.kernel.org
More majordomo info at  http://vger.kernel.org/majordomo-info.html

[PATCH v5 10/10] arm: use new irqchip parameter to create different vGIC types

2015-07-03 Thread Andre Przywara

Currently we unconditionally create a virtual GICv2 in the guest.
Add a --irqchip= parameter to let the user specify a different GIC
type for the guest. When this parameter is omitted, it still defaults
to --irqchip=gicv2.
For now the only other supported type is --irqchip=gicv3.

Signed-off-by: Andre Przywara andre.przyw...@arm.com
---
 arm/aarch64/arm-cpu.c|  2 +-
 arm/gic.c| 16 
 arm/include/arm-common/kvm-config-arch.h |  9 -
 arm/kvm.c|  2 +-
 4 files changed, 26 insertions(+), 3 deletions(-)

diff --git a/arm/aarch64/arm-cpu.c b/arm/aarch64/arm-cpu.c
index f702b9e..3dc8ea3 100644
--- a/arm/aarch64/arm-cpu.c
+++ b/arm/aarch64/arm-cpu.c
@@ -12,7 +12,7 @@
 static void generate_fdt_nodes(void *fdt, struct kvm *kvm, u32 gic_phandle)
 {
int timer_interrupts[4] = {13, 14, 11, 10};
-   gic__generate_fdt_nodes(fdt, gic_phandle, IRQCHIP_GICV2);
+   gic__generate_fdt_nodes(fdt, gic_phandle, kvm-cfg.arch.irqchip);
timer__generate_fdt_nodes(fdt, kvm, timer_interrupts);
 }
 
diff --git a/arm/gic.c b/arm/gic.c
index efe4b42..1b63074 100644
--- a/arm/gic.c
+++ b/arm/gic.c
@@ -22,6 +22,22 @@ static int gic_fd = -1;
 static u64 gic_redists_base;
 static u64 gic_redists_size;
 
+int irqchip_parser(const struct option *opt, const char *arg, int unset)
+{
+   enum irqchip_type *type = opt-value;
+
+   if (!strcmp(arg, gicv2)) {
+   *type = IRQCHIP_GICV2;
+   } else if (!strcmp(arg, gicv3)) {
+   *type = IRQCHIP_GICV3;
+   } else {
+   fprintf(stderr, irqchip: unknown type \%s\\n, arg);
+   return -1;
+   }
+
+   return 0;
+}
+
 static int gic__create_device(struct kvm *kvm, enum irqchip_type type)
 {
int err;
diff --git a/arm/include/arm-common/kvm-config-arch.h 
b/arm/include/arm-common/kvm-config-arch.h
index a8ebd94..9529881 100644
--- a/arm/include/arm-common/kvm-config-arch.h
+++ b/arm/include/arm-common/kvm-config-arch.h
@@ -8,8 +8,11 @@ struct kvm_config_arch {
unsigned intforce_cntfrq;
boolvirtio_trans_pci;
boolaarch32_guest;
+   enum irqchip_type irqchip;
 };
 
+int irqchip_parser(const struct option *opt, const char *arg, int unset);
+
 #define OPT_ARCH_RUN(pfx, cfg) 
\
pfx,
\
ARM_OPT_ARCH_RUN(cfg)   
\
@@ -21,6 +24,10 @@ struct kvm_config_arch {
 updated to program CNTFRQ correctly*),   
\
OPT_BOOLEAN('\0', force-pci, (cfg)-virtio_trans_pci,
\
Force virtio devices to use PCI as their default  
\
-   transport),
+   transport),   
\
+OPT_CALLBACK('\0', irqchip, (cfg)-irqchip, 
\
+[gicv2|gicv3],   \
+type of interrupt controller to emulate in the guest,
\
+irqchip_parser, NULL),
 
 #endif /* ARM_COMMON__KVM_CONFIG_ARCH_H */
diff --git a/arm/kvm.c b/arm/kvm.c
index f9685c2..d0e4a20 100644
--- a/arm/kvm.c
+++ b/arm/kvm.c
@@ -82,6 +82,6 @@ void kvm__arch_init(struct kvm *kvm, const char 
*hugetlbfs_path, u64 ram_size)
MADV_MERGEABLE | MADV_HUGEPAGE);
 
/* Create the virtual GIC. */
-   if (gic__create(kvm, IRQCHIP_GICV2))
+   if (gic__create(kvm, kvm-cfg.arch.irqchip))
die(Failed to create virtual GIC);
 }
-- 
2.3.5

--
To unsubscribe from this list: send the line unsubscribe kvm in
the body of a message to majord...@vger.kernel.org
More majordomo info at  http://vger.kernel.org/majordomo-info.html

[PATCH v5 07/10] limit number of VCPUs on demand

2015-07-03 Thread Andre Przywara

Currently the ARM GIC checks the number of VCPUs against a fixed
limit, which is GICv2 specific. Don't pretend we know better than the
kernel and let's get rid of that explicit check.
We now fail if the number of requested VCPUs could not be
instantiated instead of limiting the number of VCPUs.

Signed-off-by: Andre Przywara andre.przyw...@arm.com
---
 arm/gic.c | 6 --
 1 file changed, 6 deletions(-)

diff --git a/arm/gic.c b/arm/gic.c
index 99f0d2b..05f85a2 100644
--- a/arm/gic.c
+++ b/arm/gic.c
@@ -84,12 +84,6 @@ int gic__create(struct kvm *kvm)
 {
int err;
 
-   if (kvm-nrcpus  GIC_MAX_CPUS) {
-   pr_warning(%d CPUS greater than maximum of %d -- truncating\n,
-   kvm-nrcpus, GIC_MAX_CPUS);
-   kvm-nrcpus = GIC_MAX_CPUS;
-   }
-
/* Try the new way first, and fallback on legacy method otherwise */
err = gic__create_device(kvm);
if (err)
-- 
2.3.5

--
To unsubscribe from this list: send the line unsubscribe kvm in
the body of a message to majord...@vger.kernel.org
More majordomo info at  http://vger.kernel.org/majordomo-info.html

[PATCH v5 08/10] arm: prepare for instantiating different IRQ chip devices

2015-07-03 Thread Andre Przywara

Extend the vGIC handling code to potentially deal with different IRQ
chip devices instead of hard-coding the GICv2 in.
We extend most vGIC functions to take a type parameter, but still put
GICv2 in at the top for the time being.

Signed-off-by: Andre Przywara andre.przyw...@arm.com
Reviewed-by: Marc Zyngier marc.zyng...@arm.com
---
 arm/aarch32/arm-cpu.c|  2 +-
 arm/aarch64/arm-cpu.c|  2 +-
 arm/gic.c| 44 +++-
 arm/include/arm-common/gic.h |  8 ++--
 arm/kvm.c|  2 +-
 5 files changed, 44 insertions(+), 14 deletions(-)

diff --git a/arm/aarch32/arm-cpu.c b/arm/aarch32/arm-cpu.c
index 946e443..d8d6293 100644
--- a/arm/aarch32/arm-cpu.c
+++ b/arm/aarch32/arm-cpu.c
@@ -12,7 +12,7 @@ static void generate_fdt_nodes(void *fdt, struct kvm *kvm, 
u32 gic_phandle)
 {
int timer_interrupts[4] = {13, 14, 11, 10};
 
-   gic__generate_fdt_nodes(fdt, gic_phandle);
+   gic__generate_fdt_nodes(fdt, gic_phandle, IRQCHIP_GICV2);
timer__generate_fdt_nodes(fdt, kvm, timer_interrupts);
 }
 
diff --git a/arm/aarch64/arm-cpu.c b/arm/aarch64/arm-cpu.c
index 8efe877..f702b9e 100644
--- a/arm/aarch64/arm-cpu.c
+++ b/arm/aarch64/arm-cpu.c
@@ -12,7 +12,7 @@
 static void generate_fdt_nodes(void *fdt, struct kvm *kvm, u32 gic_phandle)
 {
int timer_interrupts[4] = {13, 14, 11, 10};
-   gic__generate_fdt_nodes(fdt, gic_phandle);
+   gic__generate_fdt_nodes(fdt, gic_phandle, IRQCHIP_GICV2);
timer__generate_fdt_nodes(fdt, kvm, timer_interrupts);
 }
 
diff --git a/arm/gic.c b/arm/gic.c
index 05f85a2..b6c5868 100644
--- a/arm/gic.c
+++ b/arm/gic.c
@@ -11,13 +11,13 @@
 
 static int gic_fd = -1;
 
-static int gic__create_device(struct kvm *kvm)
+static int gic__create_device(struct kvm *kvm, enum irqchip_type type)
 {
int err;
u64 cpu_if_addr = ARM_GIC_CPUI_BASE;
u64 dist_addr = ARM_GIC_DIST_BASE;
struct kvm_create_device gic_device = {
-   .type   = KVM_DEV_TYPE_ARM_VGIC_V2,
+   .flags  = 0,
};
struct kvm_device_attr cpu_if_attr = {
.group  = KVM_DEV_ARM_VGIC_GRP_ADDR,
@@ -26,17 +26,27 @@ static int gic__create_device(struct kvm *kvm)
};
struct kvm_device_attr dist_attr = {
.group  = KVM_DEV_ARM_VGIC_GRP_ADDR,
-   .attr   = KVM_VGIC_V2_ADDR_TYPE_DIST,
.addr   = (u64)(unsigned long)dist_addr,
};
 
+   switch (type) {
+   case IRQCHIP_GICV2:
+   gic_device.type = KVM_DEV_TYPE_ARM_VGIC_V2;
+   dist_attr.attr  = KVM_VGIC_V2_ADDR_TYPE_DIST;
+   break;
+   }
+
err = ioctl(kvm-vm_fd, KVM_CREATE_DEVICE, gic_device);
if (err)
return err;
 
gic_fd = gic_device.fd;
 
-   err = ioctl(gic_fd, KVM_SET_DEVICE_ATTR, cpu_if_attr);
+   switch (type) {
+   case IRQCHIP_GICV2:
+   err = ioctl(gic_fd, KVM_SET_DEVICE_ATTR, cpu_if_attr);
+   break;
+   }
if (err)
goto out_err;
 
@@ -80,13 +90,20 @@ static int gic__create_irqchip(struct kvm *kvm)
return err;
 }
 
-int gic__create(struct kvm *kvm)
+int gic__create(struct kvm *kvm, enum irqchip_type type)
 {
int err;
 
+   switch (type) {
+   case IRQCHIP_GICV2:
+   break;
+   default:
+   return -ENODEV;
+   }
+
/* Try the new way first, and fallback on legacy method otherwise */
-   err = gic__create_device(kvm);
-   if (err)
+   err = gic__create_device(kvm, type);
+   if (err  type == IRQCHIP_GICV2)
err = gic__create_irqchip(kvm);
 
return err;
@@ -134,15 +151,24 @@ static int gic__init_gic(struct kvm *kvm)
 }
 late_init(gic__init_gic)
 
-void gic__generate_fdt_nodes(void *fdt, u32 phandle)
+void gic__generate_fdt_nodes(void *fdt, u32 phandle, enum irqchip_type type)
 {
+   const char *compatible;
u64 reg_prop[] = {
cpu_to_fdt64(ARM_GIC_DIST_BASE), 
cpu_to_fdt64(ARM_GIC_DIST_SIZE),
cpu_to_fdt64(ARM_GIC_CPUI_BASE), 
cpu_to_fdt64(ARM_GIC_CPUI_SIZE),
};
 
+   switch (type) {
+   case IRQCHIP_GICV2:
+   compatible = arm,cortex-a15-gic;
+   break;
+   default:
+   return;
+   }
+
_FDT(fdt_begin_node(fdt, intc));
-   _FDT(fdt_property_string(fdt, compatible, arm,cortex-a15-gic));
+   _FDT(fdt_property_string(fdt, compatible, compatible));
_FDT(fdt_property_cell(fdt, #interrupt-cells, GIC_FDT_IRQ_NUM_CELLS));
_FDT(fdt_property(fdt, interrupt-controller, NULL, 0));
_FDT(fdt_property(fdt, reg, reg_prop, sizeof(reg_prop)));
diff --git a/arm/include/arm-common/gic.h b/arm/include/arm-common/gic.h
index 44859f7..d524f55 100644
--- a/arm/include/arm-common/gic.h
+++ b/arm/include/arm-common/gic.h
@@ -21,10 +21,14 @@
 #define GIC_MAX_CPUS

[PATCH v5 05/10] arm: finish VGIC initialisation explicitly

2015-07-03 Thread Andre Przywara

Since Linux 3.19-rc1 there is a new API to explicitly initialise
the in-kernel GIC emulation by a userland KVM device call.
Use that to tell the kernel we are finished with the GIC
initialisation, since the automatic GIC init will only be provided
as a legacy functionality in the future.

Signed-off-by: Andre Przywara andre.przyw...@arm.com
Reviewed-by: Marc Zyngier marc.zyng...@arm.com
---
 arm/gic.c | 25 ++---
 1 file changed, 22 insertions(+), 3 deletions(-)

diff --git a/arm/gic.c b/arm/gic.c
index 8560c9b..99f0d2b 100644
--- a/arm/gic.c
+++ b/arm/gic.c
@@ -98,24 +98,43 @@ int gic__create(struct kvm *kvm)
return err;
 }
 
+/*
+ * Sets the number of used interrupts and finalizes the GIC init explicitly.
+ */
 static int gic__init_gic(struct kvm *kvm)
 {
+   int ret;
+
int lines = irq__get_nr_allocated_lines();
u32 nr_irqs = ALIGN(lines, 32) + GIC_SPI_IRQ_BASE;
struct kvm_device_attr nr_irqs_attr = {
.group  = KVM_DEV_ARM_VGIC_GRP_NR_IRQS,
.addr   = (u64)(unsigned long)nr_irqs,
};
+   struct kvm_device_attr vgic_init_attr = {
+   .group  = KVM_DEV_ARM_VGIC_GRP_CTRL,
+   .attr   = KVM_DEV_ARM_VGIC_CTRL_INIT,
+   };
 
/*
 * If we didn't use the KVM_CREATE_DEVICE method, KVM will
-* give us some default number of interrupts.
+* give us some default number of interrupts. The GIC initialization
+* will be done automatically in this case.
 */
if (gic_fd  0)
return 0;
 
-   if (!ioctl(gic_fd, KVM_HAS_DEVICE_ATTR, nr_irqs_attr))
-   return ioctl(gic_fd, KVM_SET_DEVICE_ATTR, nr_irqs_attr);
+   if (!ioctl(gic_fd, KVM_HAS_DEVICE_ATTR, nr_irqs_attr)) {
+   ret = ioctl(gic_fd, KVM_SET_DEVICE_ATTR, nr_irqs_attr);
+   if (ret)
+   return ret;
+   }
+
+   if (!ioctl(gic_fd, KVM_HAS_DEVICE_ATTR, vgic_init_attr)) {
+   ret = ioctl(gic_fd, KVM_SET_DEVICE_ATTR, vgic_init_attr);
+   if (ret)
+   return ret;
+   }
 
return 0;
 }
-- 
2.3.5

--
To unsubscribe from this list: send the line unsubscribe kvm in
the body of a message to majord...@vger.kernel.org
More majordomo info at  http://vger.kernel.org/majordomo-info.html

Re: [PATCH 1/7] KVM: api: add kvm_irq_routing_extended_msi

2015-07-02 Thread Andre Przywara

Hi Eric,

On 02/07/15 15:49, Eric Auger wrote:
 Hi Pavel,
 On 07/02/2015 09:26 AM, Pavel Fedin wrote:
  Hello!

 -Original Message-
 From: kvm-ow...@vger.kernel.org [mailto:kvm-ow...@vger.kernel.org] On 
 Behalf Of Eric Auger
 Sent: Monday, June 29, 2015 6:37 PM
 To: eric.au...@st.com; eric.au...@linaro.org; 
 linux-arm-ker...@lists.infradead.org;
 marc.zyng...@arm.com; christoffer.d...@linaro.org; andre.przyw...@arm.com;
 kvm...@lists.cs.columbia.edu; kvm@vger.kernel.org
 Cc: linux-ker...@vger.kernel.org; patc...@linaro.org; p.fe...@samsung.com; 
 pbonz...@redhat.com
 Subject: [PATCH 1/7] KVM: api: add kvm_irq_routing_extended_msi

 On ARM, the MSI msg (address and data) comes along with
 out-of-band device ID information. The device ID encodes the device
 that composes the MSI msg. Let's create a new routing entry type,
 dubbed KVM_IRQ_ROUTING_EXTENDED_MSI and use the __u32 pad space
 to convey the device ID.

 Signed-off-by: Eric Auger eric.au...@linaro.org

 ---

 RFC - PATCH
 - remove kvm_irq_routing_extended_msi and use union instead
 ---
  Documentation/virtual/kvm/api.txt | 9 -
  include/uapi/linux/kvm.h  | 6 +-
  2 files changed, 13 insertions(+), 2 deletions(-)

 diff --git a/Documentation/virtual/kvm/api.txt 
 b/Documentation/virtual/kvm/api.txt
 index d20fd94..6426ae9 100644
 --- a/Documentation/virtual/kvm/api.txt
 +++ b/Documentation/virtual/kvm/api.txt
 @@ -1414,7 +1414,10 @@ struct kvm_irq_routing_entry {
 __u32 gsi;
 __u32 type;
 __u32 flags;
 -   __u32 pad;
 +   union {
 +   __u32 pad;
 +   __u32 devid;
 +   };
 union {
 struct kvm_irq_routing_irqchip irqchip;
 struct kvm_irq_routing_msi msi;

  devid is actually a part of MSI bunch. Shouldn't it be a part of struct 
 kvm_irq_routing_msi then?
 It also has reserved pad.
 Well this makes sense to me to associate the devid to the msi and put
 devid in the pad field of struct kvm_irq_routing_msi.
 
 André, Christoffer, would you agree on this change? - I would like to
 avoid doing/undoing things ;-) -

Yes, that makes sense to me. TBH I haven't had a closer look at the
patches yet, but clearly devid belongs in struct kvm_irq_routing_msi.


 @@ -1427,6 +1430,10 @@ struct kvm_irq_routing_entry {
  #define KVM_IRQ_ROUTING_IRQCHIP 1
  #define KVM_IRQ_ROUTING_MSI 2
  #define KVM_IRQ_ROUTING_S390_ADAPTER 3
 +#define KVM_IRQ_ROUTING_EXTENDED_MSI 4
 +
 +In case of KVM_IRQ_ROUTING_EXTENDED_MSI routing type, devid is used to 
 convey
 +the device ID.

  No flags are specified so far, the corresponding field must be set to zero.

 What if we use KVM_MSI_VALID_DEVID flag instead of new 
 KVM_IRQ_ROUTING_EXTENDED_MSI definition? I
 believe this would make an API more consistent and introduce less new 
 definitions.
 do you mean using type == KVM_IRQ_ROUTING_MSI and flag ==
 KVM_MSI_VALID_DEVID? Not sure this is simpler/clearer. s390 paved the
 way for new routing entry types. I add a new one here.

I tend to agree with Pavel's solution. When hacking IRQ routing support
into kvmtool I saw that it's nasty being forced to differentiate between
the two MSI routing types. Actually userland should be able to query the
kernel about what kind of routing it requires. Also there is the issue
that we must _not_ set the flag on x86, since that breaks older kernels
(due to that check that Eric removes in 3/7).
So from my point of view the cleanest solution would be to always use
KVM_IRQ_ROUTING_MSI, and add the device ID if the kernel needs it (true
for ITS guests, false for GICv2M, x86, ...)
I am looking for a clever solution for this now.

Cheers,
Andre.

 
 Another solution may be to use new KVM_IRQ_ROUTING_EXTENDED_MSI type and
 add struct kvm_msi ext_msi in kvm_irq_routing_entry union. It is 8 words
 as well. But most probably this is even uglier.

 
 Let's see if this thread is heading to a consensus...
 
 Best Regards
 
 Eric


 diff --git a/include/uapi/linux/kvm.h b/include/uapi/linux/kvm.h
 index 2a23705..8484681 100644
 --- a/include/uapi/linux/kvm.h
 +++ b/include/uapi/linux/kvm.h
 @@ -841,12 +841,16 @@ struct kvm_irq_routing_s390_adapter {
  #define KVM_IRQ_ROUTING_IRQCHIP 1
  #define KVM_IRQ_ROUTING_MSI 2
  #define KVM_IRQ_ROUTING_S390_ADAPTER 3
 +#define KVM_IRQ_ROUTING_EXTENDED_MSI 4

  struct kvm_irq_routing_entry {
 __u32 gsi;
 __u32 type;
 __u32 flags;
 -   __u32 pad;
 +   union {
 +   __u32 pad;
 +   __u32 devid;
 +   };
 union {
 struct kvm_irq_routing_irqchip irqchip;
 struct kvm_irq_routing_msi msi;
 --
 1.9.1

 --
 To unsubscribe from this list: send the line unsubscribe kvm in
 the body of a message to majord...@vger.kernel.org
 More majordomo info at  http://vger.kernel.org/majordomo-info.html

 Kind regards,
 Pavel Fedin
 Expert Engineer
 Samsung Electronics Research center Russia

 
--
To unsubscribe from this list: send the line unsubscribe kvm in
the body of a message to majord...@vger.kernel.org

Re: [PATCH 7/7] KVM: arm: implement kvm_set_msi by gsi direct mapping

2015-07-02 Thread Andre Przywara

Hi Eric,

On 29/06/15 16:37, Eric Auger wrote:
 If the ITS modality is not available, let's simply support MSI
 injection by transforming the MSI.data into an SPI ID.
 
 This becomes possible to use KVM_SIGNAL_MSI ioctl for arm too.
 
 Signed-off-by: Eric Auger eric.au...@linaro.org
 ---
  arch/arm/kvm/Kconfig | 1 +
  virt/kvm/arm/vgic.c  | 5 +
  2 files changed, 6 insertions(+)
 
 diff --git a/arch/arm/kvm/Kconfig b/arch/arm/kvm/Kconfig
 index 151e710..0f58baf 100644
 --- a/arch/arm/kvm/Kconfig
 +++ b/arch/arm/kvm/Kconfig
 @@ -31,6 +31,7 @@ config KVM
   select KVM_VFIO
   select HAVE_KVM_EVENTFD
   select HAVE_KVM_IRQFD
 + select HAVE_KVM_MSI
   select HAVE_KVM_IRQCHIP
   select HAVE_KVM_IRQ_ROUTING
   depends on ARM_VIRT_EXT  ARM_LPAE  ARM_ARCH_TIMER
 diff --git a/virt/kvm/arm/vgic.c b/virt/kvm/arm/vgic.c
 index 0b4c48c..b3c10dc 100644
 --- a/virt/kvm/arm/vgic.c
 +++ b/virt/kvm/arm/vgic.c
 @@ -2314,6 +2314,11 @@ int kvm_set_msi(struct kvm_kernel_irq_routing_entry *e,
   return kvm-arch.vgic.vm_ops.inject_msi(kvm, msi);
   else
   return -ENODEV;
 + case KVM_IRQ_ROUTING_MSI:
 + if (kvm-arch.vgic.vm_ops.inject_msi)
 + return -EINVAL;
 + else
 + return kvm_vgic_inject_irq(kvm, 0, e-msi.data, level);

If you add:

static int vgic_v2m_inject_msi(struct kvm *kvm, struct kvm_msi *msi)
{
return kvm_vgic_inject_irq(kvm, 0, msi-data, 1);
}

to vgic-v2-emul.c and wire it up accordingly, you can simplify the above
kvm_set_msi, getting rid of all that extra case handling.
This also helps merging KVM_IRQ_ROUTING_MSI and the extended case.

I have hacked this up and it seems to work for me.

Cheers,
Andre.
--
To unsubscribe from this list: send the line unsubscribe kvm in
the body of a message to majord...@vger.kernel.org
More majordomo info at  http://vger.kernel.org/majordomo-info.html

Re: [PATCH 2/7] KVM: kvm_host: add kvm_extended_msi

2015-07-02 Thread Andre Przywara

Hi Eric,

just played a bit with the code and I could make things easier by the
following change:

On 29/06/15 16:37, Eric Auger wrote:
 Add a new kvm_extended_msi struct to store the additional device ID
 specific to ARM. kvm_kernel_irq_routing_entry union now encompasses
 this new struct.
 
 Signed-off-by: Eric Auger eric.au...@linaro.org
 
 ---
 
 RFC - PATCH:
 - reword the commit message after change in first patch (uapi)
 ---
  include/linux/kvm_host.h | 8 
  1 file changed, 8 insertions(+)
 
 diff --git a/include/linux/kvm_host.h b/include/linux/kvm_host.h
 index ad45054..e1c1c0d 100644
 --- a/include/linux/kvm_host.h
 +++ b/include/linux/kvm_host.h
 @@ -304,6 +304,13 @@ struct kvm_s390_adapter_int {
   u32 adapter_id;
  };
  
 +struct kvm_extended_msi {
 + u32 address_lo; /* low 32 bits of msi message address */
 + u32 address_hi; /* high 32 bits of msi message address */
 + u32 data;   /* 16 bits of msi message data */
 + u32 devid;  /* out-of-band device ID */
 +};
 +

I got rid of this structure altogether, instead using:

 @@ -317,6 +324,7 @@ struct kvm_kernel_irq_routing_entry {
} irqchip;
-   struct msi_msg msi;
+   struct {
+   struct msi_msg msi;
+   u32 devid;
+   };
struct kvm_s390_adapter_int adapter;
};
struct hlist_node link;
  };

This re-uses the existing MSI fields in struct msi_msg, so all the extra
code you added in the next patches to set address and data could be
skipped. If needed we can add a flags field here as well to avoid that
extra type.
That simplified a lot for me.

Cheers,
André
--
To unsubscribe from this list: send the line unsubscribe kvm in
the body of a message to majord...@vger.kernel.org
More majordomo info at  http://vger.kernel.org/majordomo-info.html

Re: [PATCH 4/7] KVM: arm/arm64: enable irqchip routing

2015-06-30 Thread Andre Przywara

Hi Eric,

On 29/06/15 16:37, Eric Auger wrote:
 This patch adds compilation and link against irqchip.
 
 On ARM, irqchip routing is not really useful since there is
 a single irqchip. However main motivation behind using irqchip
 code is to enable MSI routing code. With the support of in-kernel
 GICv3 ITS emulation, it now seems to be a MUST HAVE requirement.
 
 Functions previously implemented in vgic.c and substitute
 to more complex irqchip implementation are removed:
 
 - kvm_send_userspace_msi
 - kvm_irq_map_chip_pin
 - kvm_set_irq
 - kvm_irq_map_gsi.
 
 They implemented a kernel default identity GSI routing. This is now
 replaced by user-side provided routing.
 
 Routing standard hooks are now implemented in vgic:
 - kvm_set_routing_entry
 - kvm_set_irq
 - kvm_set_msi
 
 Both HAVE_KVM_IRQCHIP and HAVE_KVM_IRQ_ROUTING are defined.
 KVM_CAP_IRQ_ROUTING is advertised and KVM_SET_GSI_ROUTING is allowed.
 
 MSI routing is not yet allowed.
 
 Signed-off-by: Eric Auger eric.au...@linaro.org
 
...

 diff --git a/virt/kvm/arm/vgic.c b/virt/kvm/arm/vgic.c
 index 09b1f46..212a5ff 100644
 --- a/virt/kvm/arm/vgic.c
 +++ b/virt/kvm/arm/vgic.c
 @@ -2220,47 +2220,67 @@ out_free_irq:
   return ret;
  }
  
 -int kvm_irq_map_gsi(struct kvm *kvm,
 - struct kvm_kernel_irq_routing_entry *entries,
 - int gsi)
 +int vgic_irqfd_set_irq(struct kvm_kernel_irq_routing_entry *e,
 + struct kvm *kvm, int irq_source_id,
 + int level, bool line_status)
  {
 - return 0;
 -}
 -
 -int kvm_irq_map_chip_pin(struct kvm *kvm, unsigned irqchip, unsigned pin)
 -{
 - return pin;
 -}
 -
 -int kvm_set_irq(struct kvm *kvm, int irq_source_id,
 - u32 irq, int level, bool line_status)
 -{
 - unsigned int spi = irq + VGIC_NR_PRIVATE_IRQS;
 + unsigned int spi_id = e-irqchip.pin + VGIC_NR_PRIVATE_IRQS;
  
 - trace_kvm_set_irq(irq, level, irq_source_id);
 + trace_kvm_set_irq(spi_id, level, irq_source_id);
  
   BUG_ON(!vgic_initialized(kvm));
  
 - if (spi  kvm-arch.vgic.nr_irqs)
 + if (spi_id  kvm-arch.vgic.nr_irqs)
   return -EINVAL;
 - return kvm_vgic_inject_irq(kvm, 0, spi, level);
 + return kvm_vgic_inject_irq(kvm, 0, spi_id, level);
  
  }
  
 -/* MSI not implemented yet */
 +/**
 + * Populates a kvm routing entry from a user routing entry
 + * @e: kvm internal formatted entry
 + * @ue: user api formatted entry
 + * return 0 on success, -EINVAL on errors.
 + */
 +int kvm_set_routing_entry(struct kvm_kernel_irq_routing_entry *e,
 +   const struct kvm_irq_routing_entry *ue)
 +{
 + int r = -EINVAL;
 +
 + switch (ue-type) {
 + case KVM_IRQ_ROUTING_IRQCHIP:
 + e-set = vgic_irqfd_set_irq;
 + e-irqchip.irqchip = ue-u.irqchip.irqchip;
 + e-irqchip.pin = ue-u.irqchip.pin;
 + if ((e-irqchip.pin = KVM_IRQCHIP_NUM_PINS) ||
 + (e-irqchip.irqchip = KVM_NR_IRQCHIPS))
 + goto out;
 + break;
 + default:
 + goto out;
 + }
 + r = 0;
 +out:
 + return r;
 +}
 +
  int kvm_set_msi(struct kvm_kernel_irq_routing_entry *e,
   struct kvm *kvm, int irq_source_id,
   int level, bool line_status)
  {
 - return 0;
 -}
 + struct kvm_msi msi;
  
 -#ifdef CONFIG_HAVE_KVM_MSI
 -int kvm_send_userspace_msi(struct kvm *kvm, struct kvm_msi *msi)
 -{
 - if (kvm-arch.vgic.vm_ops.inject_msi)
 - return kvm-arch.vgic.vm_ops.inject_msi(kvm, msi);
 - else
 - return -ENODEV;
 + switch (e-type) {
 + case KVM_IRQ_ROUTING_EXTENDED_MSI:
 + msi.address_lo = e-ext_msi.address_lo;
 + msi.address_hi = e-ext_msi.address_hi;
 + msi.data = e-ext_msi.data;
 + msi.flags = e-ext_msi.devid;

You probably meant to write:
+   msi.flags = KVM_MSI_VALID_DEVID;
+   msi.devid = e-ext_msi.devid;

With this change I could get it (your patches on top of my v1.5) to work
with my hacked kvmtool - at least with vhost=0. On to fixing irqfd now ...

Cheers,
Andre.

 + if (kvm-arch.vgic.vm_ops.inject_msi)
 + return kvm-arch.vgic.vm_ops.inject_msi(kvm, msi);
 + else
 + return -ENODEV;
 + default:
 + return -EINVAL;
 + }
  }
 -#endif
--
To unsubscribe from this list: send the line unsubscribe kvm in
the body of a message to majord...@vger.kernel.org
More majordomo info at  http://vger.kernel.org/majordomo-info.html

Re: [PATCH v4 10/10] arm: use new irqchip parameter to create different vGIC types

2015-06-30 Thread Andre Przywara

On 30/06/15 17:13, Will Deacon wrote:
 On Fri, Jun 26, 2015 at 02:16:18PM +0100, Andre Przywara wrote:
 Currently we unconditionally create a virtual GICv2 in the guest.
 Add a --irqchip= parameter to let the user specify a different GIC
 type for the guest, when omitting this parameter it still defaults to
 --irqchip=gicv2.
 For now the only other supported type is --irqchip=gicv3

 Signed-off-by: Andre Przywara andre.przyw...@arm.com
 ---
  arm/aarch64/arm-cpu.c|  2 +-
  arm/gic.c| 17 +
  arm/include/arm-common/kvm-config-arch.h |  9 -
  arm/kvm.c|  2 +-
  4 files changed, 27 insertions(+), 3 deletions(-)

 diff --git a/arm/aarch64/arm-cpu.c b/arm/aarch64/arm-cpu.c
 index f702b9e..3dc8ea3 100644
 --- a/arm/aarch64/arm-cpu.c
 +++ b/arm/aarch64/arm-cpu.c
 @@ -12,7 +12,7 @@
  static void generate_fdt_nodes(void *fdt, struct kvm *kvm, u32 gic_phandle)
  {
  int timer_interrupts[4] = {13, 14, 11, 10};
 -gic__generate_fdt_nodes(fdt, gic_phandle, IRQCHIP_GICV2);
 +gic__generate_fdt_nodes(fdt, gic_phandle, kvm-cfg.arch.irqchip);
  timer__generate_fdt_nodes(fdt, kvm, timer_interrupts);
  }
  
 diff --git a/arm/gic.c b/arm/gic.c
 index efe4b42..ff56de7 100644
 --- a/arm/gic.c
 +++ b/arm/gic.c
 @@ -22,6 +22,23 @@ static int gic_fd = -1;
  static u64 gic_redists_base;
  static u64 gic_redists_size;
  
 +int irqchip_parser(const struct option *opt, const char *arg, int unset)
 +{
 +enum irqchip_type *type = opt-value;
 +
 +*type = IRQCHIP_GICV2;
 
 Pointless assignment?

Yeah, that's a leftover from some refactoring.

 
 +if (!strcmp(arg, gicv2)) {
 +*type = IRQCHIP_GICV2;
 +} else if (!strcmp(arg, gicv3)) {
 +*type = IRQCHIP_GICV3;
 +} else {
 +fprintf(stderr, irqchip: unknown type \%s\\n, arg);
 +return -1;
 +}
 +
 +return 0;
 +}
 +
  static int gic__create_device(struct kvm *kvm, enum irqchip_type type)
  {
  int err;
 diff --git a/arm/include/arm-common/kvm-config-arch.h 
 b/arm/include/arm-common/kvm-config-arch.h
 index a8ebd94..9529881 100644
 --- a/arm/include/arm-common/kvm-config-arch.h
 +++ b/arm/include/arm-common/kvm-config-arch.h
 @@ -8,8 +8,11 @@ struct kvm_config_arch {
  unsigned intforce_cntfrq;
  boolvirtio_trans_pci;
  boolaarch32_guest;
 +enum irqchip_type irqchip;
  };
  
 +int irqchip_parser(const struct option *opt, const char *arg, int unset);
 +
  #define OPT_ARCH_RUN(pfx, cfg)  
 \
  pfx,
 \
  ARM_OPT_ARCH_RUN(cfg)   
 \
 @@ -21,6 +24,10 @@ struct kvm_config_arch {
   updated to program CNTFRQ correctly*),   
 \
  OPT_BOOLEAN('\0', force-pci, (cfg)-virtio_trans_pci,
 \
  Force virtio devices to use PCI as their default  
 \
 -transport),
 +transport),   
 \
 +OPT_CALLBACK('\0', irqchip, (cfg)-irqchip,  
 \
 + [gicv2|gicv3],   \
 + type of interrupt controller to emulate in the guest,
 \
 + irqchip_parser, NULL),
 
 What happens if I don't pass this option at all?

Then (cfg)->irqchip will be 0 as all the other configuration parameters
because they are part of struct kvm, which is calloc()ed.
So it will be IRQCHIP_GICV2, as that is the first entry in the enum.
Admittedly a bit convoluted, do you want a comment or an explicit
enum { IRQCHIP_GICV2 = 0, ...}?

Cheers,
Andre.
--
To unsubscribe from this list: send the line unsubscribe kvm in
the body of a message to majord...@vger.kernel.org
More majordomo info at  http://vger.kernel.org/majordomo-info.html

Re: [PATCH v4 07/10] limit number of VCPUs on demand

2015-06-30 Thread Andre Przywara

Hi,

On 30/06/15 17:09, Will Deacon wrote:
 On Fri, Jun 26, 2015 at 02:16:15PM +0100, Andre Przywara wrote:
 Currently the ARM GIC checks the number of VCPUs against a fixed
 limit, which is GICv2 specific. Don't pretend we know better than the
 kernel and let's get rid of that explicit check.
 Instead be more relaxed about KVM_CREATE_VCPU failing with EINVAL,
 which is the way the kernel communicates having reached a VCPU limit.
 If we see this and have at least brought up one VCPU already
 successfully, then don't panic, but limit the number of VCPUs instead.

 Signed-off-by: Andre Przywara andre.przyw...@arm.com
 ---
  arm/gic.c | 6 --
  arm/kvm-cpu.c | 7 ++-
  kvm-cpu.c | 7 +++
  3 files changed, 13 insertions(+), 7 deletions(-)

 diff --git a/arm/gic.c b/arm/gic.c
 index 99f0d2b..05f85a2 100644
 --- a/arm/gic.c
 +++ b/arm/gic.c
 @@ -84,12 +84,6 @@ int gic__create(struct kvm *kvm)
  {
  int err;
  
 -if (kvm-nrcpus  GIC_MAX_CPUS) {
 -pr_warning(%d CPUS greater than maximum of %d -- truncating\n,
 -kvm-nrcpus, GIC_MAX_CPUS);
 -kvm-nrcpus = GIC_MAX_CPUS;
 -}
 -
  /* Try the new way first, and fallback on legacy method otherwise */
  err = gic__create_device(kvm);
  if (err)
 diff --git a/arm/kvm-cpu.c b/arm/kvm-cpu.c
 index 7780251..b2fd6ed 100644
 --- a/arm/kvm-cpu.c
 +++ b/arm/kvm-cpu.c
 @@ -51,8 +51,13 @@ struct kvm_cpu *kvm_cpu__arch_init(struct kvm *kvm, 
 unsigned long cpu_id)
  return NULL;
  
  vcpu-vcpu_fd = ioctl(kvm-vm_fd, KVM_CREATE_VCPU, cpu_id);
 -if (vcpu-vcpu_fd  0)
 +if (vcpu-vcpu_fd  0) {
 +if (errno == EINVAL) {
 +free(vcpu);
 +return NULL;
 +}
 
 Hmm, but EINVAL can mean all sorts of other failures too, surely?

Not for ARM, at least not at the moment. I went through all the cases -
I think up to 8 levels deep - and exceeding the number of VCPUs is the
only case where we return EINVAL for KVM_CREATE_VCPU.

 I'm
 not against removing the nrcpus check, but I think we should die if ioctls
 start failing rather than silently ignore them.

I see your point, but at least we don't fail silently: if we exit the
loop prematurely, we print the warning about limiting the number of VCPUs.
I agree that the proper solution would be to just explicitly ask the
kernel about the number of VCPUs, but on ARM this is not reliable at the
moment due to kernel behaviour, and any fix there would still not affect
older kernels.

Cheers,
Andre.
--
To unsubscribe from this list: send the line unsubscribe kvm in
the body of a message to majord...@vger.kernel.org
More majordomo info at  http://vger.kernel.org/majordomo-info.html

Re: [PATCH] kvmtool: don't use PCI config space IRQ line field

2015-06-29 Thread Andre Przywara

Hi Will,

On 29/06/15 11:10, Will Deacon wrote:
 Hi Andre,
 
 On Thu, Jun 18, 2015 at 06:19:53PM +0100, Andre Przywara wrote:
 I am tempted to remove shmem, since it's broken:
 a) there is no upstream driver, only some out-of-tree uio driver module
 in some Github repo
 
 Right, but that's the same for qemu and we've already made the jump of
 merging the driver, so I don't think that's a good argument for throwing
 it out of the tree.

If this driver has some future in the Linux tree, I agree it's worth
keeping it in, though I didn't see any effort to merge it lately.

 b) the PCI device BARs do not match what QEMU implements and what the
 uio driver expects (IO BAR vs. MMIO BAR)
 
 In what way? A quick look suggests that kvmtool is at least aligned with
 said github repo.

The first BAR holds the control registers, QEMU and the UIO driver
require an MMIO region, kvmtool uses PIO :-(

 c) there is (at least one) bug in kvmtool (easily fixed, though)

The size of the control register region in BAR0 is set to the size of
the shared memory region, where it should be some constant size (at
least 16 Bytes, QEMU uses 256, the spec says 1K, pick one ;-)
As PIO on x86 is at most 64K, this BAR gets ignored by the kernel with
any shmem size above that (it defaults to 4M).
As said the fix is easy, but ...

Those two bugs alone make me wonder if that ever worked on kvmtool,
obviously not with that UIO driver (which seems to work on QEMU).
I have fixes for both issues, but I haven't had a chance of testing this
in real action (just the driver loaded and lspci looking sensible). I
may send the patches later, but this doesn't have high priority for me
(unless someone bugs me ;-)

Cheers,
Andre.
--
To unsubscribe from this list: send the line unsubscribe kvm in
the body of a message to majord...@vger.kernel.org
More majordomo info at  http://vger.kernel.org/majordomo-info.html

Re: [PATCH 0/3] KVM: arm: Implement software vGICv2 emulation

2015-06-29 Thread Andre Przywara

Hi,

On 29/06/15 13:52, Christoffer Dall wrote:
 Hi Pavel,
 
 [Please cc the kvm/arm list for such patches according to the
 MAINTAINERS file in the future]
 
 On Mon, Jun 29, 2015 at 12:53:46PM +0300, Pavel Fedin wrote:
 Some hardware (like Raspberry Pi 2) is capable of running KVM, however lacks
 functional vGIC registers. This series introduces software vGIC emulation for
 such machines, allowing to fully use virtualization capabilities
 
 Is this rather esoteric use case really worth the extra code in the
 kernel? 

I wonder if these patches would pave the way to support running GICv2
guests on GICv3s without compat support? Admittedly not a really
compelling use case either, but at least worth discussing, I think.

Also if this will make the hack needed to enable KVM on RPi2 smaller,
I'd rather embrace this one than let any random hacks appear on that
RPi kernel tree (patches which I have seen already on some other repo).
If I get this correctly, there are some efforts currently to get closer
to mainline with the RPi tree.

Pavel, is this broken GIC you are talking about going to appear in a
publicly available SoC? If yes, you could either state this right now or
send it later once you can talk publicly.

Marc, Christoffer:
So is this GICv2 CPU interface emulation totally out of the question for us
or is it worth at least commenting on the patches?

Cheers,
Andre.

 I really feel that pure emulation should happen in userspace
 unless there's a very good reason for doing it in the kernel, such as a
 clearly measureable difference in performance, etc.
 
 I would much rather see a version of this where a userspace provided GIC
 works with the in-kernel arch timers support.
 
 -Christoffer
 
--
To unsubscribe from this list: send the line unsubscribe kvm in
the body of a message to majord...@vger.kernel.org
More majordomo info at  http://vger.kernel.org/majordomo-info.html

Re: [PATCH 02/13] KVM: extend struct kvm_msi to hold a 32-bit device ID

2015-06-29 Thread Andre Przywara

Hi Christoffer,

thanks for taking the time to review this! Was probably no pleasure ;-)

On 28/06/15 20:12, Christoffer Dall wrote:
 On Fri, May 29, 2015 at 10:53:18AM +0100, Andre Przywara wrote:
 The ARM GICv3 ITS MSI controller requires a device ID to be able to
 assign the proper interrupt vector. On real hardware, this ID is
 sampled from the bus. To be able to emulate an ITS controller, extend
 the KVM MSI interface to let userspace provide such a device ID. For
 PCI devices, the device ID is simply the 16-bit bus-device-function
 triplet, which should be easily available to the userland tool.

 Signed-off-by: Andre Przywara andre.przyw...@arm.com
 ---
  Documentation/virtual/kvm/api.txt | 8 ++--
  include/uapi/linux/kvm.h  | 4 +++-
  2 files changed, 9 insertions(+), 3 deletions(-)

 diff --git a/Documentation/virtual/kvm/api.txt 
 b/Documentation/virtual/kvm/api.txt
 index 9fa2bf8..891d64a 100644
 --- a/Documentation/virtual/kvm/api.txt
 +++ b/Documentation/virtual/kvm/api.txt
 @@ -2121,10 +2121,14 @@ struct kvm_msi {
  __u32 address_hi;
  __u32 data;
  __u32 flags;
 -__u8  pad[16];
 +__u32 devid;
 +__u8  pad[12];
  };
  
 -No flags are defined so far. The corresponding field must be 0.
 +flags: KVM_MSI_VALID_DEVID: devid is valid, otherwise ignored.
 
 I don't see what the 'otherwise ignored' part of the sentence here is
 meant to say, that the flags field is otherwise ignored for other value?

No, that the devid field is ignored if this bit isn't set. I can
rephrase this to be more explicit.

 That's not what the current API doc specifies, it specifies that the
 remainder of the field must be 0.
 
 +devid: If KVM_MSI_VALID_DEVID is set, contains a value to identify the 
 device
 +   that wrote the MSI message. For PCI, this is usually a BFD
 +   identifier in the lower 16 bits.
 
 I assume plus something else that uniquely identifies the PCI
 controller?

Well yes, the device ID is a unique device identifier within a system,
the BFD use case was just to illustrate this and give a hint to
userspace what to fill in there. I will explain this better in v2.

So are you OK with that extension of the API in general? Just asking
because there is a lot that depends on it.

Cheers,
Andre.
--
To unsubscribe from this list: send the line unsubscribe kvm in
the body of a message to majord...@vger.kernel.org
More majordomo info at  http://vger.kernel.org/majordomo-info.html

[PATCH] kvmtool: vhost-net: fix ioeventfd registration

2015-06-26 Thread Andre Przywara

On registering the ioeventfds for the virtio-pci device we cover both
the I/O ports and the MMIO BAR.
But as the current code advertises both as PIO, the host kernel gets
the wrong bus number for the MMIO region.
Fix the issue by marking only the actual PIO area as PIO.
This fixes vhost-net on x86.

Signed-off-by: Andre Przywara andre.przyw...@arm.com
---
 virtio/pci.c | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/virtio/pci.c b/virtio/pci.c
index 2dff13b..90fcd64 100644
--- a/virtio/pci.c
+++ b/virtio/pci.c
@@ -25,7 +25,7 @@ static int virtio_pci__init_ioeventfd(struct kvm *kvm, struct 
virtio_device *vde
 {
struct ioevent ioevent;
struct virtio_pci *vpci = vdev-virtio;
-   int i, r, flags = IOEVENTFD_FLAG_PIO;
+   int i, r, flags = 0;
int fds[2];
 
vpci-ioeventfds[vq] = (struct virtio_pci_ioevent_param) {
@@ -51,7 +51,7 @@ static int virtio_pci__init_ioeventfd(struct kvm *kvm, struct 
virtio_device *vde
ioevent.io_addr = vpci-port_addr + VIRTIO_PCI_QUEUE_NOTIFY;
ioevent.io_len  = sizeof(u16);
ioevent.fd  = fds[0] = eventfd(0, 0);
-   r = ioeventfd__add_event(ioevent, flags);
+   r = ioeventfd__add_event(ioevent, flags | IOEVENTFD_FLAG_PIO);
if (r)
return r;
 
-- 
2.3.5

--
To unsubscribe from this list: send the line unsubscribe kvm in
the body of a message to majord...@vger.kernel.org
More majordomo info at  http://vger.kernel.org/majordomo-info.html

[PATCH v4 01/10] AArch64: Reserve two 64k pages for GIC CPU interface

2015-06-26 Thread Andre Przywara

From: Marc Zyngier marc.zyng...@arm.com

On AArch64 system with a GICv2, the GICC range can be aligned
to the last 4k block of a 64k page, ending up straddling two
64k pages. In order not to conflict with the distributor mapping,
allocate two 64k pages to the CPU interface.

Signed-off-by: Marc Zyngier marc.zyng...@arm.com
Signed-off-by: Andre Przywara andre.przyw...@arm.com
---
 arm/aarch64/include/kvm/kvm-arch.h | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/arm/aarch64/include/kvm/kvm-arch.h 
b/arm/aarch64/include/kvm/kvm-arch.h
index 2f08a26..4925736 100644
--- a/arm/aarch64/include/kvm/kvm-arch.h
+++ b/arm/aarch64/include/kvm/kvm-arch.h
@@ -2,7 +2,7 @@
 #define KVM__KVM_ARCH_H
 
 #define ARM_GIC_DIST_SIZE  0x1
-#define ARM_GIC_CPUI_SIZE  0x1
+#define ARM_GIC_CPUI_SIZE  0x2
 
 #define ARM_KERN_OFFSET(kvm)   ((kvm)-cfg.arch.aarch32_guest  ?   \
0x8000  :   \
-- 
2.3.5

--
To unsubscribe from this list: send the line unsubscribe kvm in
the body of a message to majord...@vger.kernel.org
More majordomo info at  http://vger.kernel.org/majordomo-info.html

[PATCH v4 08/10] arm: prepare for instantiating different IRQ chip devices

2015-06-26 Thread Andre Przywara

Extend the vGIC handling code to potentially deal with different IRQ
chip devices instead of hard-coding the GICv2 in.
We extend most vGIC functions to take a type parameter, but still put
GICv2 in at the top for the time being.

Signed-off-by: Andre Przywara andre.przyw...@arm.com
Reviewed-by: Marc Zyngier marc.zyng...@arm.com
---
 arm/aarch32/arm-cpu.c|  2 +-
 arm/aarch64/arm-cpu.c|  2 +-
 arm/gic.c| 44 +++-
 arm/include/arm-common/gic.h |  8 ++--
 arm/kvm.c|  2 +-
 5 files changed, 44 insertions(+), 14 deletions(-)

diff --git a/arm/aarch32/arm-cpu.c b/arm/aarch32/arm-cpu.c
index 946e443..d8d6293 100644
--- a/arm/aarch32/arm-cpu.c
+++ b/arm/aarch32/arm-cpu.c
@@ -12,7 +12,7 @@ static void generate_fdt_nodes(void *fdt, struct kvm *kvm, 
u32 gic_phandle)
 {
int timer_interrupts[4] = {13, 14, 11, 10};
 
-   gic__generate_fdt_nodes(fdt, gic_phandle);
+   gic__generate_fdt_nodes(fdt, gic_phandle, IRQCHIP_GICV2);
timer__generate_fdt_nodes(fdt, kvm, timer_interrupts);
 }
 
diff --git a/arm/aarch64/arm-cpu.c b/arm/aarch64/arm-cpu.c
index 8efe877..f702b9e 100644
--- a/arm/aarch64/arm-cpu.c
+++ b/arm/aarch64/arm-cpu.c
@@ -12,7 +12,7 @@
 static void generate_fdt_nodes(void *fdt, struct kvm *kvm, u32 gic_phandle)
 {
int timer_interrupts[4] = {13, 14, 11, 10};
-   gic__generate_fdt_nodes(fdt, gic_phandle);
+   gic__generate_fdt_nodes(fdt, gic_phandle, IRQCHIP_GICV2);
timer__generate_fdt_nodes(fdt, kvm, timer_interrupts);
 }
 
diff --git a/arm/gic.c b/arm/gic.c
index 05f85a2..b6c5868 100644
--- a/arm/gic.c
+++ b/arm/gic.c
@@ -11,13 +11,13 @@
 
 static int gic_fd = -1;
 
-static int gic__create_device(struct kvm *kvm)
+static int gic__create_device(struct kvm *kvm, enum irqchip_type type)
 {
int err;
u64 cpu_if_addr = ARM_GIC_CPUI_BASE;
u64 dist_addr = ARM_GIC_DIST_BASE;
struct kvm_create_device gic_device = {
-   .type   = KVM_DEV_TYPE_ARM_VGIC_V2,
+   .flags  = 0,
};
struct kvm_device_attr cpu_if_attr = {
.group  = KVM_DEV_ARM_VGIC_GRP_ADDR,
@@ -26,17 +26,27 @@ static int gic__create_device(struct kvm *kvm)
};
struct kvm_device_attr dist_attr = {
.group  = KVM_DEV_ARM_VGIC_GRP_ADDR,
-   .attr   = KVM_VGIC_V2_ADDR_TYPE_DIST,
.addr   = (u64)(unsigned long)dist_addr,
};
 
+   switch (type) {
+   case IRQCHIP_GICV2:
+   gic_device.type = KVM_DEV_TYPE_ARM_VGIC_V2;
+   dist_attr.attr  = KVM_VGIC_V2_ADDR_TYPE_DIST;
+   break;
+   }
+
err = ioctl(kvm-vm_fd, KVM_CREATE_DEVICE, gic_device);
if (err)
return err;
 
gic_fd = gic_device.fd;
 
-   err = ioctl(gic_fd, KVM_SET_DEVICE_ATTR, cpu_if_attr);
+   switch (type) {
+   case IRQCHIP_GICV2:
+   err = ioctl(gic_fd, KVM_SET_DEVICE_ATTR, cpu_if_attr);
+   break;
+   }
if (err)
goto out_err;
 
@@ -80,13 +90,20 @@ static int gic__create_irqchip(struct kvm *kvm)
return err;
 }
 
-int gic__create(struct kvm *kvm)
+int gic__create(struct kvm *kvm, enum irqchip_type type)
 {
int err;
 
+   switch (type) {
+   case IRQCHIP_GICV2:
+   break;
+   default:
+   return -ENODEV;
+   }
+
/* Try the new way first, and fallback on legacy method otherwise */
-   err = gic__create_device(kvm);
-   if (err)
+   err = gic__create_device(kvm, type);
+   if (err  type == IRQCHIP_GICV2)
err = gic__create_irqchip(kvm);
 
return err;
@@ -134,15 +151,24 @@ static int gic__init_gic(struct kvm *kvm)
 }
 late_init(gic__init_gic)
 
-void gic__generate_fdt_nodes(void *fdt, u32 phandle)
+void gic__generate_fdt_nodes(void *fdt, u32 phandle, enum irqchip_type type)
 {
+   const char *compatible;
u64 reg_prop[] = {
cpu_to_fdt64(ARM_GIC_DIST_BASE), 
cpu_to_fdt64(ARM_GIC_DIST_SIZE),
cpu_to_fdt64(ARM_GIC_CPUI_BASE), 
cpu_to_fdt64(ARM_GIC_CPUI_SIZE),
};
 
+   switch (type) {
+   case IRQCHIP_GICV2:
+   compatible = arm,cortex-a15-gic;
+   break;
+   default:
+   return;
+   }
+
_FDT(fdt_begin_node(fdt, intc));
-   _FDT(fdt_property_string(fdt, compatible, arm,cortex-a15-gic));
+   _FDT(fdt_property_string(fdt, compatible, compatible));
_FDT(fdt_property_cell(fdt, #interrupt-cells, GIC_FDT_IRQ_NUM_CELLS));
_FDT(fdt_property(fdt, interrupt-controller, NULL, 0));
_FDT(fdt_property(fdt, reg, reg_prop, sizeof(reg_prop)));
diff --git a/arm/include/arm-common/gic.h b/arm/include/arm-common/gic.h
index 44859f7..d524f55 100644
--- a/arm/include/arm-common/gic.h
+++ b/arm/include/arm-common/gic.h
@@ -21,10 +21,14 @@
 #define GIC_MAX_CPUS

[PATCH v4 00/10] kvmtool: arm64: GICv3 guest support

2015-06-26 Thread Andre Przywara

Hi,

hopefully the final version of the GICv3 support series for kvmtool.
I addressed the remaining comments Marc had on the last four patches
(the first six were left untouched).
The undocumented --irqchip=default is now gone.

Cheers,
Andre.

-
Since Linux 3.19 the kernel can emulate a GICv3 for KVM guests.
This allows more than 8 VCPUs in a guest and enables in-kernel irqchip
for non-backwards-compatible GICv3 implementations.

This series updates kvmtool to support this feature.
The first half of the series is mostly from Marc and supports some
newer features of the virtual GIC which we later depend on. The second
part enables support for a guest GICv3 by adding a new command line
parameter (--irqchip=).

We now use the KVM_CREATE_DEVICE interface to create a virtual GIC
and only fall back to the now legacy KVM_CREATE_IRQCHIP call if the
former is not supported by the kernel.
Also we use two new features the KVM_CREATE_DEVICE interface
introduces:
* We now set the number of actually used interrupts to avoid
  allocating too many of them without ever using them.
* We tell the kernel explicitly that we are finished with the GIC
  initialisation. This is a requirement for future VGIC versions.

The final three patches introduce virtual GICv3 support, so on
supported hardware (and given kernel support) the user can ask KVM to
emulate a GICv3, lifting the 8 VCPU limit of KVM. This is done by
specifying --irqchip=gicv3 on the command line.
For the time being the kernel only supports a virtual GICv3 on ARM64,
but as the GIC is shared in kvmtool, I had to add the macro
definitions to not break the build on ARM.

This series goes on top of the new official stand-alone repo hosted
on Will's kernel.org git [1].
Find a branch with those patches included at my repo [2].

[1] git://git.kernel.org/pub/scm/linux/kernel/git/will/kvmtool.git
[2] git://linux-arm.org/kvmtool.git (branch gicv3/v4)
http://www.linux-arm.org/git?p=kvmtool.git;a=log;h=refs/heads/gicv3/v4

Andre Przywara (6):
  arm: finish VGIC initialisation explicitly
  arm: simplify MMIO dispatching
  limit number of VCPUs on demand
  arm: prepare for instantiating different IRQ chip devices
  arm: add support for supplying GICv3 redistributor addresses
  arm: use new irqchip parameter to create different vGIC types

Marc Zyngier (4):
  AArch64: Reserve two 64k pages for GIC CPU interface
  AArch{32,64}: use KVM_CREATE_DEVICE & co to instanciate the GIC
  irq: add irq__get_nr_allocated_lines
  AArch{32,64}: dynamically configure the number of GIC interrupts

 arm/aarch32/arm-cpu.c|   2 +-
 arm/aarch64/arm-cpu.c|   2 +-
 arm/aarch64/include/kvm/kvm-arch.h   |   2 +-
 arm/gic.c| 190 +--
 arm/include/arm-common/gic.h |   9 +-
 arm/include/arm-common/kvm-arch.h|  19 ++--
 arm/include/arm-common/kvm-config-arch.h |   9 +-
 arm/include/arm-common/kvm-cpu-arch.h|  14 ++-
 arm/kvm-cpu.c|  23 +---
 arm/kvm.c|   6 +-
 include/kvm/irq.h|   1 +
 irq.c|   5 +
 kvm-cpu.c|   7 ++
 13 files changed, 239 insertions(+), 50 deletions(-)

-- 
2.3.5

--
To unsubscribe from this list: send the line unsubscribe kvm in
the body of a message to majord...@vger.kernel.org
More majordomo info at  http://vger.kernel.org/majordomo-info.html

[PATCH v4 09/10] arm: add support for supplying GICv3 redistributor addresses

2015-06-26 Thread Andre Przywara

Instead of the GIC virtual CPU interface an emulated GICv3 needs to
have accesses to its emulated redistributors trapped in the guest.
Add code to tell the kernel about the mapping if a GICv3 emulation was
requested by the user.

This contains some defines which are not (yet) in the (32 bit) header
files to allow compilation for ARM.

Signed-off-by: Andre Przywara andre.przyw...@arm.com
Reviewed-by: Marc Zyngier marc.zyng...@arm.com
---
 arm/gic.c | 36 +++-
 arm/include/arm-common/gic.h  |  1 +
 arm/include/arm-common/kvm-arch.h |  7 +++
 3 files changed, 43 insertions(+), 1 deletion(-)

diff --git a/arm/gic.c b/arm/gic.c
index b6c5868..efe4b42 100644
--- a/arm/gic.c
+++ b/arm/gic.c
@@ -9,7 +9,18 @@
 #include linux/kernel.h
 #include linux/kvm.h
 
+/* Those names are not defined for ARM (yet) */
+#ifndef KVM_VGIC_V3_ADDR_TYPE_DIST
+#define KVM_VGIC_V3_ADDR_TYPE_DIST 2
+#endif
+
+#ifndef KVM_VGIC_V3_ADDR_TYPE_REDIST
+#define KVM_VGIC_V3_ADDR_TYPE_REDIST 3
+#endif
+
 static int gic_fd = -1;
+static u64 gic_redists_base;
+static u64 gic_redists_size;
 
 static int gic__create_device(struct kvm *kvm, enum irqchip_type type)
 {
@@ -28,12 +39,21 @@ static int gic__create_device(struct kvm *kvm, enum 
irqchip_type type)
.group  = KVM_DEV_ARM_VGIC_GRP_ADDR,
.addr   = (u64)(unsigned long)dist_addr,
};
+   struct kvm_device_attr redist_attr = {
+   .group  = KVM_DEV_ARM_VGIC_GRP_ADDR,
+   .attr   = KVM_VGIC_V3_ADDR_TYPE_REDIST,
+   .addr   = (u64)(unsigned long)gic_redists_base,
+   };
 
switch (type) {
case IRQCHIP_GICV2:
gic_device.type = KVM_DEV_TYPE_ARM_VGIC_V2;
dist_attr.attr  = KVM_VGIC_V2_ADDR_TYPE_DIST;
break;
+   case IRQCHIP_GICV3:
+   gic_device.type = KVM_DEV_TYPE_ARM_VGIC_V3;
+   dist_attr.attr  = KVM_VGIC_V3_ADDR_TYPE_DIST;
+   break;
}
 
err = ioctl(kvm-vm_fd, KVM_CREATE_DEVICE, gic_device);
@@ -46,6 +66,9 @@ static int gic__create_device(struct kvm *kvm, enum 
irqchip_type type)
case IRQCHIP_GICV2:
err = ioctl(gic_fd, KVM_SET_DEVICE_ATTR, cpu_if_attr);
break;
+   case IRQCHIP_GICV3:
+   err = ioctl(gic_fd, KVM_SET_DEVICE_ATTR, redist_attr);
+   break;
}
if (err)
goto out_err;
@@ -97,6 +120,10 @@ int gic__create(struct kvm *kvm, enum irqchip_type type)
switch (type) {
case IRQCHIP_GICV2:
break;
+   case IRQCHIP_GICV3:
+   gic_redists_size = kvm-cfg.nrcpus * ARM_GIC_REDIST_SIZE;
+   gic_redists_base = ARM_GIC_DIST_BASE - gic_redists_size;
+   break;
default:
return -ENODEV;
}
@@ -156,12 +183,19 @@ void gic__generate_fdt_nodes(void *fdt, u32 phandle, enum 
irqchip_type type)
const char *compatible;
u64 reg_prop[] = {
cpu_to_fdt64(ARM_GIC_DIST_BASE), 
cpu_to_fdt64(ARM_GIC_DIST_SIZE),
-   cpu_to_fdt64(ARM_GIC_CPUI_BASE), 
cpu_to_fdt64(ARM_GIC_CPUI_SIZE),
+   0, 0,   /* to be filled */
};
 
switch (type) {
case IRQCHIP_GICV2:
compatible = arm,cortex-a15-gic;
+   reg_prop[2] = cpu_to_fdt64(ARM_GIC_CPUI_BASE);
+   reg_prop[3] = cpu_to_fdt64(ARM_GIC_CPUI_SIZE);
+   break;
+   case IRQCHIP_GICV3:
+   compatible = arm,gic-v3;
+   reg_prop[2] = cpu_to_fdt64(gic_redists_base);
+   reg_prop[3] = cpu_to_fdt64(gic_redists_size);
break;
default:
return;
diff --git a/arm/include/arm-common/gic.h b/arm/include/arm-common/gic.h
index d524f55..4fde5ac 100644
--- a/arm/include/arm-common/gic.h
+++ b/arm/include/arm-common/gic.h
@@ -23,6 +23,7 @@
 
 enum irqchip_type {
IRQCHIP_GICV2,
+   IRQCHIP_GICV3,
 };
 
 struct kvm;
diff --git a/arm/include/arm-common/kvm-arch.h 
b/arm/include/arm-common/kvm-arch.h
index 90d6733..0f5fb7f 100644
--- a/arm/include/arm-common/kvm-arch.h
+++ b/arm/include/arm-common/kvm-arch.h
@@ -30,6 +30,13 @@
 #define KVM_PCI_MMIO_AREA  (KVM_PCI_CFG_AREA + ARM_PCI_CFG_SIZE)
 #define KVM_VIRTIO_MMIO_AREA   ARM_MMIO_AREA
 
+/*
+ * On a GICv3 there must be one redistributor per vCPU.
+ * The value here is the size for one, we multiply this at runtime with
+ * the number of requested vCPUs to get the actual size.
+ */
+#define ARM_GIC_REDIST_SIZE0x2
+
 #define KVM_IRQ_OFFSET GIC_SPI_IRQ_BASE
 
 #define KVM_VM_TYPE0
-- 
2.3.5

--
To unsubscribe from this list: send the line unsubscribe kvm in
the body of a message to majord...@vger.kernel.org
More majordomo info at  http://vger.kernel.org/majordomo-info.html

[PATCH v4 06/10] arm: simplify MMIO dispatching

2015-06-26 Thread Andre Przywara

Currently we separate any incoming MMIO request into one of the ARM
memory map regions and take care to spare the GIC.
It turns out that this is unnecessary, as we only have one special
region (the IO port area in the first 64 KByte). The MMIO rbtree
takes care of unhandled MMIO ranges, so we can simply drop all the
special range checking (except that for the IO range) in
kvm_cpu__emulate_mmio().
As the GIC is handled in the kernel, a GIC MMIO access should never
reach userland (and we don't know what to do with it anyway).
This lets us delete some more code and simplifies future extensions
(like expanding the GIC regions).
To be in line with the other architectures, move the now simpler
code into a header file.

Signed-off-by: Andre Przywara andre.przyw...@arm.com
Reviewed-by: Marc Zyngier marc.zyng...@arm.com
---
 arm/include/arm-common/kvm-arch.h | 12 
 arm/include/arm-common/kvm-cpu-arch.h | 14 --
 arm/kvm-cpu.c | 16 
 3 files changed, 12 insertions(+), 30 deletions(-)

diff --git a/arm/include/arm-common/kvm-arch.h 
b/arm/include/arm-common/kvm-arch.h
index 082131d..90d6733 100644
--- a/arm/include/arm-common/kvm-arch.h
+++ b/arm/include/arm-common/kvm-arch.h
@@ -45,18 +45,6 @@ static inline bool arm_addr_in_ioport_region(u64 phys_addr)
return phys_addr = KVM_IOPORT_AREA  phys_addr  limit;
 }
 
-static inline bool arm_addr_in_virtio_mmio_region(u64 phys_addr)
-{
-   u64 limit = KVM_VIRTIO_MMIO_AREA + ARM_VIRTIO_MMIO_SIZE;
-   return phys_addr = KVM_VIRTIO_MMIO_AREA  phys_addr  limit;
-}
-
-static inline bool arm_addr_in_pci_region(u64 phys_addr)
-{
-   u64 limit = KVM_PCI_CFG_AREA + ARM_PCI_CFG_SIZE + ARM_PCI_MMIO_SIZE;
-   return phys_addr = KVM_PCI_CFG_AREA  phys_addr  limit;
-}
-
 struct kvm_arch {
/*
 * We may have to align the guest memory for virtio, so keep the
diff --git a/arm/include/arm-common/kvm-cpu-arch.h 
b/arm/include/arm-common/kvm-cpu-arch.h
index 36c7872..329979a 100644
--- a/arm/include/arm-common/kvm-cpu-arch.h
+++ b/arm/include/arm-common/kvm-cpu-arch.h
@@ -44,8 +44,18 @@ static inline bool kvm_cpu__emulate_io(struct kvm_cpu *vcpu, 
u16 port, void *dat
return false;
 }
 
-bool kvm_cpu__emulate_mmio(struct kvm_cpu *vcpu, u64 phys_addr, u8 *data,
-  u32 len, u8 is_write);
+static inline bool kvm_cpu__emulate_mmio(struct kvm_cpu *vcpu, u64 phys_addr,
+u8 *data, u32 len, u8 is_write)
+{
+   if (arm_addr_in_ioport_region(phys_addr)) {
+   int direction = is_write ? KVM_EXIT_IO_OUT : KVM_EXIT_IO_IN;
+   u16 port = (phys_addr - KVM_IOPORT_AREA)  USHRT_MAX;
+
+   return kvm__emulate_io(vcpu, port, data, direction, len, 1);
+   }
+
+   return kvm__emulate_mmio(vcpu, phys_addr, data, len, is_write);
+}
 
 unsigned long kvm_cpu__get_vcpu_mpidr(struct kvm_cpu *vcpu);
 
diff --git a/arm/kvm-cpu.c b/arm/kvm-cpu.c
index ab08815..7780251 100644
--- a/arm/kvm-cpu.c
+++ b/arm/kvm-cpu.c
@@ -139,22 +139,6 @@ bool kvm_cpu__handle_exit(struct kvm_cpu *vcpu)
return false;
 }
 
-bool kvm_cpu__emulate_mmio(struct kvm_cpu *vcpu, u64 phys_addr, u8 *data,
-  u32 len, u8 is_write)
-{
-   if (arm_addr_in_virtio_mmio_region(phys_addr)) {
-   return kvm__emulate_mmio(vcpu, phys_addr, data, len, is_write);
-   } else if (arm_addr_in_ioport_region(phys_addr)) {
-   int direction = is_write ? KVM_EXIT_IO_OUT : KVM_EXIT_IO_IN;
-   u16 port = (phys_addr - KVM_IOPORT_AREA)  USHRT_MAX;
-   return kvm__emulate_io(vcpu, port, data, direction, len, 1);
-   } else if (arm_addr_in_pci_region(phys_addr)) {
-   return kvm__emulate_mmio(vcpu, phys_addr, data, len, is_write);
-   }
-
-   return false;
-}
-
 void kvm_cpu__show_page_tables(struct kvm_cpu *vcpu)
 {
 }
-- 
2.3.5

--
To unsubscribe from this list: send the line unsubscribe kvm in
the body of a message to majord...@vger.kernel.org
More majordomo info at  http://vger.kernel.org/majordomo-info.html

[PATCH v4 02/10] AArch{32,64}: use KVM_CREATE_DEVICE & co to instantiate the GIC

2015-06-26 Thread Andre Przywara

From: Marc Zyngier marc.zyng...@arm.com

As of 3.14, KVM/arm supports the creation/configuration of the GIC through
a more generic device API, which is now the preferred way to do so.

Plumb the new API in, and allow the old code to be used as a fallback.

[Andre: Rename some functions on the way to differentiate between
creation and initialisation more clearly and fix error path.]

Signed-off-by: Marc Zyngier marc.zyng...@arm.com
Signed-off-by: Andre Przywara andre.przyw...@arm.com
---
 arm/gic.c| 69 +++-
 arm/include/arm-common/gic.h |  2 +-
 arm/kvm.c|  6 ++--
 3 files changed, 66 insertions(+), 11 deletions(-)

diff --git a/arm/gic.c b/arm/gic.c
index 5d8cbe6..1ff3663 100644
--- a/arm/gic.c
+++ b/arm/gic.c
@@ -7,7 +7,50 @@
 #include linux/byteorder.h
 #include linux/kvm.h
 
-int gic__init_irqchip(struct kvm *kvm)
+static int gic_fd = -1;
+
+static int gic__create_device(struct kvm *kvm)
+{
+   int err;
+   u64 cpu_if_addr = ARM_GIC_CPUI_BASE;
+   u64 dist_addr = ARM_GIC_DIST_BASE;
+   struct kvm_create_device gic_device = {
+   .type   = KVM_DEV_TYPE_ARM_VGIC_V2,
+   };
+   struct kvm_device_attr cpu_if_attr = {
+   .group  = KVM_DEV_ARM_VGIC_GRP_ADDR,
+   .attr   = KVM_VGIC_V2_ADDR_TYPE_CPU,
+   .addr   = (u64)(unsigned long)cpu_if_addr,
+   };
+   struct kvm_device_attr dist_attr = {
+   .group  = KVM_DEV_ARM_VGIC_GRP_ADDR,
+   .attr   = KVM_VGIC_V2_ADDR_TYPE_DIST,
+   .addr   = (u64)(unsigned long)dist_addr,
+   };
+
+   err = ioctl(kvm-vm_fd, KVM_CREATE_DEVICE, gic_device);
+   if (err)
+   return err;
+
+   gic_fd = gic_device.fd;
+
+   err = ioctl(gic_fd, KVM_SET_DEVICE_ATTR, cpu_if_attr);
+   if (err)
+   goto out_err;
+
+   err = ioctl(gic_fd, KVM_SET_DEVICE_ATTR, dist_attr);
+   if (err)
+   goto out_err;
+
+   return 0;
+
+out_err:
+   close(gic_fd);
+   gic_fd = -1;
+   return err;
+}
+
+static int gic__create_irqchip(struct kvm *kvm)
 {
int err;
struct kvm_arm_device_addr gic_addr[] = {
@@ -23,12 +66,6 @@ int gic__init_irqchip(struct kvm *kvm)
}
};
 
-   if (kvm-nrcpus  GIC_MAX_CPUS) {
-   pr_warning(%d CPUS greater than maximum of %d -- truncating\n,
-   kvm-nrcpus, GIC_MAX_CPUS);
-   kvm-nrcpus = GIC_MAX_CPUS;
-   }
-
err = ioctl(kvm-vm_fd, KVM_CREATE_IRQCHIP);
if (err)
return err;
@@ -41,6 +78,24 @@ int gic__init_irqchip(struct kvm *kvm)
return err;
 }
 
+int gic__create(struct kvm *kvm)
+{
+   int err;
+
+   if (kvm-nrcpus  GIC_MAX_CPUS) {
+   pr_warning(%d CPUS greater than maximum of %d -- truncating\n,
+   kvm-nrcpus, GIC_MAX_CPUS);
+   kvm-nrcpus = GIC_MAX_CPUS;
+   }
+
+   /* Try the new way first, and fallback on legacy method otherwise */
+   err = gic__create_device(kvm);
+   if (err)
+   err = gic__create_irqchip(kvm);
+
+   return err;
+}
+
 void gic__generate_fdt_nodes(void *fdt, u32 phandle)
 {
u64 reg_prop[] = {
diff --git a/arm/include/arm-common/gic.h b/arm/include/arm-common/gic.h
index 5a36f2c..44859f7 100644
--- a/arm/include/arm-common/gic.h
+++ b/arm/include/arm-common/gic.h
@@ -24,7 +24,7 @@
 struct kvm;
 
 int gic__alloc_irqnum(void);
-int gic__init_irqchip(struct kvm *kvm);
+int gic__create(struct kvm *kvm);
 void gic__generate_fdt_nodes(void *fdt, u32 phandle);
 
 #endif /* ARM_COMMON__GIC_H */
diff --git a/arm/kvm.c b/arm/kvm.c
index 58ad9fa..bcd2533 100644
--- a/arm/kvm.c
+++ b/arm/kvm.c
@@ -81,7 +81,7 @@ void kvm__arch_init(struct kvm *kvm, const char 
*hugetlbfs_path, u64 ram_size)
madvise(kvm-arch.ram_alloc_start, kvm-arch.ram_alloc_size,
MADV_MERGEABLE | MADV_HUGEPAGE);
 
-   /* Initialise the virtual GIC. */
-   if (gic__init_irqchip(kvm))
-   die(Failed to initialise virtual GIC);
+   /* Create the virtual GIC. */
+   if (gic__create(kvm))
+   die(Failed to create virtual GIC);
 }
-- 
2.3.5

--
To unsubscribe from this list: send the line unsubscribe kvm in
the body of a message to majord...@vger.kernel.org
More majordomo info at  http://vger.kernel.org/majordomo-info.html

[PATCH v4 03/10] irq: add irq__get_nr_allocated_lines

2015-06-26 Thread Andre Przywara

From: Marc Zyngier marc.zyng...@arm.com

The ARM GIC emulation needs to be told the number of interrupts
it has to support. As commit 1c262fa1dc7bc ("kvm tools: irq: make
irq__alloc_line generic") made the interrupt counter private,
add a new accessor returning the number of interrupt lines we've
allocated so far.

Signed-off-by: Marc Zyngier marc.zyng...@arm.com
Signed-off-by: Andre Przywara andre.przyw...@arm.com
---
 include/kvm/irq.h | 1 +
 irq.c | 5 +
 2 files changed, 6 insertions(+)

diff --git a/include/kvm/irq.h b/include/kvm/irq.h
index 4cec6f0..8a78e43 100644
--- a/include/kvm/irq.h
+++ b/include/kvm/irq.h
@@ -11,6 +11,7 @@
 struct kvm;
 
 int irq__alloc_line(void);
+int irq__get_nr_allocated_lines(void);
 
 int irq__init(struct kvm *kvm);
 int irq__exit(struct kvm *kvm);
diff --git a/irq.c b/irq.c
index 33ea8d2..71eaa05 100644
--- a/irq.c
+++ b/irq.c
@@ -7,3 +7,8 @@ int irq__alloc_line(void)
 {
return next_line++;
 }
+
+int irq__get_nr_allocated_lines(void)
+{
+   return next_line - KVM_IRQ_OFFSET;
+}
-- 
2.3.5

--
To unsubscribe from this list: send the line unsubscribe kvm in
the body of a message to majord...@vger.kernel.org
More majordomo info at  http://vger.kernel.org/majordomo-info.html

[PATCH v4 07/10] limit number of VCPUs on demand

2015-06-26 Thread Andre Przywara

Currently the ARM GIC checks the number of VCPUs against a fixed
limit, which is GICv2 specific. Don't pretend we know better than the
kernel and let's get rid of that explicit check.
Instead be more relaxed about KVM_CREATE_VCPU failing with EINVAL,
which is the way the kernel communicates having reached a VCPU limit.
If we see this and have at least brought up one VCPU already
successfully, then don't panic, but limit the number of VCPUs instead.

Signed-off-by: Andre Przywara andre.przyw...@arm.com
---
 arm/gic.c | 6 --
 arm/kvm-cpu.c | 7 ++-
 kvm-cpu.c | 7 +++
 3 files changed, 13 insertions(+), 7 deletions(-)

diff --git a/arm/gic.c b/arm/gic.c
index 99f0d2b..05f85a2 100644
--- a/arm/gic.c
+++ b/arm/gic.c
@@ -84,12 +84,6 @@ int gic__create(struct kvm *kvm)
 {
int err;
 
-   if (kvm-nrcpus  GIC_MAX_CPUS) {
-   pr_warning(%d CPUS greater than maximum of %d -- truncating\n,
-   kvm-nrcpus, GIC_MAX_CPUS);
-   kvm-nrcpus = GIC_MAX_CPUS;
-   }
-
/* Try the new way first, and fallback on legacy method otherwise */
err = gic__create_device(kvm);
if (err)
diff --git a/arm/kvm-cpu.c b/arm/kvm-cpu.c
index 7780251..b2fd6ed 100644
--- a/arm/kvm-cpu.c
+++ b/arm/kvm-cpu.c
@@ -51,8 +51,13 @@ struct kvm_cpu *kvm_cpu__arch_init(struct kvm *kvm, unsigned 
long cpu_id)
return NULL;
 
vcpu-vcpu_fd = ioctl(kvm-vm_fd, KVM_CREATE_VCPU, cpu_id);
-   if (vcpu-vcpu_fd  0)
+   if (vcpu-vcpu_fd  0) {
+   if (errno == EINVAL) {
+   free(vcpu);
+   return NULL;
+   }
die_perror(KVM_CREATE_VCPU ioctl);
+   }
 
mmap_size = ioctl(kvm-sys_fd, KVM_GET_VCPU_MMAP_SIZE, 0);
if (mmap_size  0)
diff --git a/kvm-cpu.c b/kvm-cpu.c
index 5d90664..7a9d689 100644
--- a/kvm-cpu.c
+++ b/kvm-cpu.c
@@ -222,11 +222,18 @@ int kvm_cpu__init(struct kvm *kvm)
for (i = 0; i  kvm-nrcpus; i++) {
kvm-cpus[i] = kvm_cpu__arch_init(kvm, i);
if (!kvm-cpus[i]) {
+   if (i  0  errno == EINVAL)
+   break;
pr_warning(unable to initialize KVM VCPU);
goto fail_alloc;
}
}
 
+   if (i  kvm-nrcpus) {
+   kvm-nrcpus = i;
+   printf(  # The kernel limits the number of CPUs to %d\n, i);
+   }
+
return 0;
 
 fail_alloc:
-- 
2.3.5

--
To unsubscribe from this list: send the line unsubscribe kvm in
the body of a message to majord...@vger.kernel.org
More majordomo info at  http://vger.kernel.org/majordomo-info.html

[PATCH v4 05/10] arm: finish VGIC initialisation explicitly

2015-06-26 Thread Andre Przywara

Since Linux 3.19-rc1 there is a new API to explicitly initialise
the in-kernel GIC emulation by a userland KVM device call.
Use that to tell the kernel we are finished with the GIC
initialisation, since the automatic GIC init will only be provided
as a legacy functionality in the future.

Signed-off-by: Andre Przywara andre.przyw...@arm.com
Reviewed-by: Marc Zyngier marc.zyng...@arm.com
---
 arm/gic.c | 25 ++---
 1 file changed, 22 insertions(+), 3 deletions(-)

diff --git a/arm/gic.c b/arm/gic.c
index 8560c9b..99f0d2b 100644
--- a/arm/gic.c
+++ b/arm/gic.c
@@ -98,24 +98,43 @@ int gic__create(struct kvm *kvm)
return err;
 }
 
+/*
+ * Sets the number of used interrupts and finalizes the GIC init explicitly.
+ */
 static int gic__init_gic(struct kvm *kvm)
 {
+   int ret;
+
int lines = irq__get_nr_allocated_lines();
u32 nr_irqs = ALIGN(lines, 32) + GIC_SPI_IRQ_BASE;
struct kvm_device_attr nr_irqs_attr = {
.group  = KVM_DEV_ARM_VGIC_GRP_NR_IRQS,
.addr   = (u64)(unsigned long)nr_irqs,
};
+   struct kvm_device_attr vgic_init_attr = {
+   .group  = KVM_DEV_ARM_VGIC_GRP_CTRL,
+   .attr   = KVM_DEV_ARM_VGIC_CTRL_INIT,
+   };
 
/*
 * If we didn't use the KVM_CREATE_DEVICE method, KVM will
-* give us some default number of interrupts.
+* give us some default number of interrupts. The GIC initialization
+* will be done automatically in this case.
 */
if (gic_fd  0)
return 0;
 
-   if (!ioctl(gic_fd, KVM_HAS_DEVICE_ATTR, nr_irqs_attr))
-   return ioctl(gic_fd, KVM_SET_DEVICE_ATTR, nr_irqs_attr);
+   if (!ioctl(gic_fd, KVM_HAS_DEVICE_ATTR, nr_irqs_attr)) {
+   ret = ioctl(gic_fd, KVM_SET_DEVICE_ATTR, nr_irqs_attr);
+   if (ret)
+   return ret;
+   }
+
+   if (!ioctl(gic_fd, KVM_HAS_DEVICE_ATTR, vgic_init_attr)) {
+   ret = ioctl(gic_fd, KVM_SET_DEVICE_ATTR, vgic_init_attr);
+   if (ret)
+   return ret;
+   }
 
return 0;
 }
-- 
2.3.5

--
To unsubscribe from this list: send the line unsubscribe kvm in
the body of a message to majord...@vger.kernel.org
More majordomo info at  http://vger.kernel.org/majordomo-info.html

[PATCH v4 04/10] AArch{32,64}: dynamically configure the number of GIC interrupts

2015-06-26 Thread Andre Przywara

From: Marc Zyngier marc.zyng...@arm.com

In order to reduce the memory usage of large guests (as well
as improve performance), tell KVM about the number of interrupts
we require.

To avoid synchronization with the various device creation,
use a late_init callback to compute the GIC configuration.
[Andre: rename to gic__init_gic() to ease future expansion]

Signed-off-by: Marc Zyngier marc.zyng...@arm.com
Signed-off-by: Andre Przywara andre.przyw...@arm.com
---
 arm/gic.c | 25 +
 1 file changed, 25 insertions(+)

diff --git a/arm/gic.c b/arm/gic.c
index 1ff3663..8560c9b 100644
--- a/arm/gic.c
+++ b/arm/gic.c
@@ -1,10 +1,12 @@
 #include kvm/fdt.h
+#include kvm/irq.h
 #include kvm/kvm.h
 #include kvm/virtio.h
 
 #include arm-common/gic.h
 
 #include linux/byteorder.h
+#include linux/kernel.h
 #include linux/kvm.h
 
 static int gic_fd = -1;
@@ -96,6 +98,29 @@ int gic__create(struct kvm *kvm)
return err;
 }
 
+static int gic__init_gic(struct kvm *kvm)
+{
+   int lines = irq__get_nr_allocated_lines();
+   u32 nr_irqs = ALIGN(lines, 32) + GIC_SPI_IRQ_BASE;
+   struct kvm_device_attr nr_irqs_attr = {
+   .group  = KVM_DEV_ARM_VGIC_GRP_NR_IRQS,
+   .addr   = (u64)(unsigned long)nr_irqs,
+   };
+
+   /*
+* If we didn't use the KVM_CREATE_DEVICE method, KVM will
+* give us some default number of interrupts.
+*/
+   if (gic_fd  0)
+   return 0;
+
+   if (!ioctl(gic_fd, KVM_HAS_DEVICE_ATTR, nr_irqs_attr))
+   return ioctl(gic_fd, KVM_SET_DEVICE_ATTR, nr_irqs_attr);
+
+   return 0;
+}
+late_init(gic__init_gic)
+
 void gic__generate_fdt_nodes(void *fdt, u32 phandle)
 {
u64 reg_prop[] = {
-- 
2.3.5

--
To unsubscribe from this list: send the line unsubscribe kvm in
the body of a message to majord...@vger.kernel.org
More majordomo info at  http://vger.kernel.org/majordomo-info.html

[PATCH v4 10/10] arm: use new irqchip parameter to create different vGIC types

2015-06-26 Thread Andre Przywara

Currently we unconditionally create a virtual GICv2 in the guest.
Add a --irqchip= parameter to let the user specify a different GIC
type for the guest. When this parameter is omitted, the type still
defaults to --irqchip=gicv2.
For now the only other supported type is --irqchip=gicv3.

Signed-off-by: Andre Przywara andre.przyw...@arm.com
---
 arm/aarch64/arm-cpu.c|  2 +-
 arm/gic.c| 17 +
 arm/include/arm-common/kvm-config-arch.h |  9 -
 arm/kvm.c|  2 +-
 4 files changed, 27 insertions(+), 3 deletions(-)

diff --git a/arm/aarch64/arm-cpu.c b/arm/aarch64/arm-cpu.c
index f702b9e..3dc8ea3 100644
--- a/arm/aarch64/arm-cpu.c
+++ b/arm/aarch64/arm-cpu.c
@@ -12,7 +12,7 @@
 static void generate_fdt_nodes(void *fdt, struct kvm *kvm, u32 gic_phandle)
 {
int timer_interrupts[4] = {13, 14, 11, 10};
-   gic__generate_fdt_nodes(fdt, gic_phandle, IRQCHIP_GICV2);
+   gic__generate_fdt_nodes(fdt, gic_phandle, kvm-cfg.arch.irqchip);
timer__generate_fdt_nodes(fdt, kvm, timer_interrupts);
 }
 
diff --git a/arm/gic.c b/arm/gic.c
index efe4b42..ff56de7 100644
--- a/arm/gic.c
+++ b/arm/gic.c
@@ -22,6 +22,23 @@ static int gic_fd = -1;
 static u64 gic_redists_base;
 static u64 gic_redists_size;
 
+int irqchip_parser(const struct option *opt, const char *arg, int unset)
+{
+   enum irqchip_type *type = opt-value;
+
+   *type = IRQCHIP_GICV2;
+   if (!strcmp(arg, gicv2)) {
+   *type = IRQCHIP_GICV2;
+   } else if (!strcmp(arg, gicv3)) {
+   *type = IRQCHIP_GICV3;
+   } else {
+   fprintf(stderr, irqchip: unknown type \%s\\n, arg);
+   return -1;
+   }
+
+   return 0;
+}
+
 static int gic__create_device(struct kvm *kvm, enum irqchip_type type)
 {
int err;
diff --git a/arm/include/arm-common/kvm-config-arch.h 
b/arm/include/arm-common/kvm-config-arch.h
index a8ebd94..9529881 100644
--- a/arm/include/arm-common/kvm-config-arch.h
+++ b/arm/include/arm-common/kvm-config-arch.h
@@ -8,8 +8,11 @@ struct kvm_config_arch {
unsigned intforce_cntfrq;
boolvirtio_trans_pci;
boolaarch32_guest;
+   enum irqchip_type irqchip;
 };
 
+int irqchip_parser(const struct option *opt, const char *arg, int unset);
+
 #define OPT_ARCH_RUN(pfx, cfg) 
\
pfx,
\
ARM_OPT_ARCH_RUN(cfg)   
\
@@ -21,6 +24,10 @@ struct kvm_config_arch {
 updated to program CNTFRQ correctly*),   
\
OPT_BOOLEAN('\0', force-pci, (cfg)-virtio_trans_pci,
\
Force virtio devices to use PCI as their default  
\
-   transport),
+   transport),   
\
+OPT_CALLBACK('\0', irqchip, (cfg)-irqchip, 
\
+[gicv2|gicv3],   \
+type of interrupt controller to emulate in the guest,
\
+irqchip_parser, NULL),
 
 #endif /* ARM_COMMON__KVM_CONFIG_ARCH_H */
diff --git a/arm/kvm.c b/arm/kvm.c
index f9685c2..d0e4a20 100644
--- a/arm/kvm.c
+++ b/arm/kvm.c
@@ -82,6 +82,6 @@ void kvm__arch_init(struct kvm *kvm, const char 
*hugetlbfs_path, u64 ram_size)
MADV_MERGEABLE | MADV_HUGEPAGE);
 
/* Create the virtual GIC. */
-   if (gic__create(kvm, IRQCHIP_GICV2))
+   if (gic__create(kvm, kvm-cfg.arch.irqchip))
die(Failed to create virtual GIC);
 }
-- 
2.3.5

--
To unsubscribe from this list: send the line unsubscribe kvm in
the body of a message to majord...@vger.kernel.org
More majordomo info at  http://vger.kernel.org/majordomo-info.html

Re: [PATCH v3 06/10] arm: simplify MMIO dispatching

2015-06-24 Thread Andre Przywara

Hi Will,

do you want me to respin the whole series to address the remaining minor
comments in the last four patches or do you want to take patches 01-06
already (which I think Marc has already agreed upon)?
Then I would just send an updated version of the remaining patches.

Cheers,
Andre.




 No, that's fine.
 
 I just wondered what was the rationale behind having the
 arm_addr_in_pci_region() call there. It might have guarded something,
 but if you're absolutely positive that this doesn't cause a regression,
 that's OK with me.
 
 Reviewed-by: Marc Zyngier marc.zyng...@arm.com
 
   M.
 
--
To unsubscribe from this list: send the line unsubscribe kvm in
the body of a message to majord...@vger.kernel.org
More majordomo info at  http://vger.kernel.org/majordomo-info.html

[RFC PATCH 1/2] Makefile: cleanup guest/init generation

2015-06-23 Thread Andre Przywara

The dependencies and targets for the guest userland binary are
currently not correct, some are redundant.
Fix them by splitting up guest/guest_init.o creation into its two
steps and describe the dependencies properly.
On the way use automatic variables in some rules.

Signed-off-by: Andre Przywara andre.przyw...@arm.com
---
 Makefile | 21 -
 1 file changed, 12 insertions(+), 9 deletions(-)

diff --git a/Makefile b/Makefile
index 151fa9d..b9480ff 100644
--- a/Makefile
+++ b/Makefile
@@ -337,7 +337,7 @@ ifneq ($(WERROR),0)
CFLAGS += -Werror
 endif
 
-all: $(PROGRAM) $(PROGRAM_ALIAS) $(GUEST_INIT)
+all: $(PROGRAM) $(PROGRAM_ALIAS)
 
 # CFLAGS used when building objects
 # This is intentionally not assigned using :=
@@ -352,22 +352,25 @@ c_flags   = -Wp,-MD,$(depfile) $(CFLAGS)
 STATIC_OBJS = $(patsubst %.o,%.static.o,$(OBJS) $(OBJS_STATOPT))
 GUEST_OBJS = guest/guest_init.o
 
-$(PROGRAM)-static:  $(STATIC_OBJS) $(OTHEROBJS) $(GUEST_INIT)
+$(PROGRAM)-static:  $(STATIC_OBJS) $(OTHEROBJS) $(GUEST_OBJS)
$(E)   LINK $@
-   $(Q) $(CC) -static $(CFLAGS) $(STATIC_OBJS) $(OTHEROBJS) $(GUEST_OBJS) 
$(LIBS) $(LIBS_STATOPT) -o $@
+   $(Q) $(CC) -static $(CFLAGS) $^ $(LIBS) $(LIBS_STATOPT) -o $@
 
-$(PROGRAM): $(OBJS) $(OBJS_DYNOPT) $(OTHEROBJS) $(GUEST_INIT)
+$(PROGRAM): $(OBJS) $(OBJS_DYNOPT) $(OTHEROBJS) $(GUEST_OBJS)
$(E)   LINK $@
-   $(Q) $(CC) $(CFLAGS) $(OBJS) $(OBJS_DYNOPT) $(OTHEROBJS) $(GUEST_OBJS) 
$(LIBS) $(LIBS_DYNOPT) -o $@
+   $(Q) $(CC) $(CFLAGS) $^ $(LIBS) $(LIBS_DYNOPT) -o $@
 
 $(PROGRAM_ALIAS): $(PROGRAM)
$(E)   LN   $@
-   $(Q) ln -f $(PROGRAM) $@
+   $(Q) ln -f $ $@
 
-$(GUEST_INIT): guest/init.c
+$(GUEST_OBJS): $(GUEST_INIT)
$(E)   LINK $@
-   $(Q) $(CC) -static guest/init.c -o $@
-   $(Q) $(LD) $(LDFLAGS) -r -b binary -o guest/guest_init.o $(GUEST_INIT)
+   $(Q) $(LD) $(LDFLAGS) -r -b binary -o $@ $
+
+$(GUEST_INIT): guest/init.c
+   $(E)   CC   $@
+   $(Q) $(CC) -static $^ -o $@
 
 %.s: %.c
$(Q) $(CC) -o $@ -S $(CFLAGS) -fverbose-asm $
-- 
2.3.5

--
To unsubscribe from this list: send the line unsubscribe kvm in
the body of a message to majord...@vger.kernel.org
More majordomo info at  http://vger.kernel.org/majordomo-info.html

[RFC PATCH 2/2] Makefile: use xxd for converting guest/init

2015-06-23 Thread Andre Przywara

Currently we use ld to convert the static guest/init binary back
into an object file, which we can embed as a binary blob into our
lkvm binary. This works fine as long as compiler and linker use the
same ELF target format, which does not seem to be true for most of the
MIPS toolchains.
Use a different approach instead, which converts the guest/init
binary into a C array, from which the compiler generates an .o
representation. As the compiler is now the same, this naturally links
together fine on all architectures.
We use the xxd tool for generating a C array representation out of
the binary file. If this turns out to be not widely installed (it
seems to be part of the vim package in most distributions), we could
think about switching to a scripted implementation using od or some
printf trickery.

Signed-off-by: Andre Przywara andre.przyw...@arm.com
---
 Makefile| 4 ++--
 builtin-run.c   | 8 
 builtin-setup.c | 8 
 3 files changed, 10 insertions(+), 10 deletions(-)

diff --git a/Makefile b/Makefile
index b9480ff..7f2a0ea 100644
--- a/Makefile
+++ b/Makefile
@@ -365,8 +365,8 @@ $(PROGRAM_ALIAS): $(PROGRAM)
$(Q) ln -f $ $@
 
 $(GUEST_OBJS): $(GUEST_INIT)
-   $(E)   LINK $@
-   $(Q) $(LD) $(LDFLAGS) -r -b binary -o $@ $
+   $(E)   CONVERT  $@
+   $(Q) xxd -i $ | $(CC) -c -x c - -o $@
 
 $(GUEST_INIT): guest/init.c
$(E)   CC   $@
diff --git a/builtin-run.c b/builtin-run.c
index 1ee75ad..0a48663 100644
--- a/builtin-run.c
+++ b/builtin-run.c
@@ -59,8 +59,8 @@ static int  kvm_run_wrapper;
 
 bool do_debug_print = false;
 
-extern char _binary_guest_init_start;
-extern char _binary_guest_init_size;
+extern char guest_init;
+extern char guest_init_len;
 
 static const char * const run_usage[] = {
lkvm run [options] [kernel image],
@@ -354,8 +354,8 @@ static int kvm_setup_guest_init(struct kvm *kvm)
char *data;
 
/* Setup /virt/init */
-   size = (size_t)_binary_guest_init_size;
-   data = (char *)_binary_guest_init_start;
+   size = (size_t)guest_init_len;
+   data = (char *)guest_init;
snprintf(tmp, PATH_MAX, %s%s/virt/init, kvm__get_dir(), rootfs);
remove(tmp);
fd = open(tmp, O_CREAT | O_WRONLY, 0755);
diff --git a/builtin-setup.c b/builtin-setup.c
index 8b45c56..fd7ca54 100644
--- a/builtin-setup.c
+++ b/builtin-setup.c
@@ -16,8 +16,8 @@
 #include sys/mman.h
 #include fcntl.h
 
-extern char _binary_guest_init_start;
-extern char _binary_guest_init_size;
+extern char guest_init;
+extern char guest_init_len;
 
 static const char *instance_name;
 
@@ -131,8 +131,8 @@ static int copy_init(const char *guestfs_name)
int fd, ret;
char *data;
 
-   size = (size_t)_binary_guest_init_size;
-   data = (char *)_binary_guest_init_start;
+   size = (size_t)guest_init;
+   data = (char *)guest_init_len;
snprintf(path, PATH_MAX, %s%s/virt/init, kvm__get_dir(), 
guestfs_name);
remove(path);
fd = open(path, O_CREAT | O_WRONLY, 0755);
-- 
2.3.5

--
To unsubscribe from this list: send the line unsubscribe kvm in
the body of a message to majord...@vger.kernel.org
More majordomo info at  http://vger.kernel.org/majordomo-info.html

[RFC PATCH 0/2] kvmtool: Rework guest/init integration

2015-06-23 Thread Andre Przywara

Hi,

this mini series aims at solving long standing issues with compiling
and linking the guest/init binary for MIPS.
It seems that many MIPS toolchains use different default ELF targets
for the compiler and the linker, rendering the approach of linking
the guest/init executable into the lkvm binary moot.
One could work around this by specifying some magic ELF target
options to the linker so it matches the compiler ones, but I couldn't
find a way of automatically determining those, so this approach is
only valid on a particular toolchain.
Another approach would be to fixup the ELF header, but that sounds
dodgy and fragile to me.

Instead of using ld this series transforms the generated guest
binary into a C file, which gets compiled (with CC) and thus
automatically links fine with the other object files.
Patch 2/2 implements this, patch 1/2 cleans up the rules for the
guest binary generation in the Makefile.

This uses the xxd tool, which has a special command line option
to generate a C array out of a binary blob. On the distributions
I checked, this comes with the vim package, not sure if that is a
restriction.

I compile tested this on PowerPC64, MIPS64, ARM, ARM64, i386 and
x86_64.

Please test whether this works with your toolchain / system!

Cheers,
Andre.

Andre Przywara (2):
  Makefile: cleanup guest/init generation
  Makefile: use xxd for converting guest/init

 Makefile| 21 -
 builtin-run.c   |  8 
 builtin-setup.c |  8 
 3 files changed, 20 insertions(+), 17 deletions(-)

-- 
2.3.5

--
To unsubscribe from this list: send the line unsubscribe kvm in
the body of a message to majord...@vger.kernel.org
More majordomo info at  http://vger.kernel.org/majordomo-info.html

Re: [RFC 0/6] KVM: arm/arm64: gsi routing support

2015-06-23 Thread Andre Przywara

Hi Eric,

I went back reading the code and looked at how the x86 APIC works more
closely to understand the GSI routing better.
See below for more ...

On 22/06/15 10:21, Eric Auger wrote:
 On 06/22/2015 10:40 AM, Andre Przywara wrote:
 Hi Eric,

 I briefly looked over the series; the patches themselves look good overall.
 I have one or two comments on the actual code, but want to discuss the
 general approach first (more a dump of some first thoughts):

 On 18/06/15 18:40, Eric Auger wrote:
 With the advent of GICv3 ITS in-kernel emulation, KVM GSI routing
 appears to be requested. More specifically MSI routing is needed.
 irqchip routing does not sound to be really useful on arm but usage of
 MSI routing also mandates to integrate irqchip routing. The initial
 implementation of irqfd on arm must be upgraded with the integration
 of kvm irqchip.c code and the implementation of its standard hooks
 in the architecture specific part.

 The series therefore allows and mandates the usage of KVM_SET_GSI_ROUTING
 ioctl along with KVM_IRQFD. If the userspace does not define any routing
 table, no irqfd injection can happen. The user-space can use
 KVM_CAP_IRQ_ROUTING to detect whether a routing table is needed.

 for irqchip routing, the convention is, only SPI can be injected and the
 SPI ID corresponds to irqchip.pin + 32. For MSI routing the interrupt ID
 matches the MSI msg data. The API evolves to support associating a device ID
 to a routing entry.

 So if I get this right, in a guest ITS case we have now three different
 IRQ name spaces:
 a) the LPI number, which is guest internal. The ITS driver in the guest
 maintains it. We can track assignments and changes when handling the
 MAPVI command in the host kernel, but this would stay in the kernel, as
 I don't see an efficient way of propagating this to userland.
 b) the GSI number, which is used in communication between userland and
 the host kernel. The guest kernel does not know about this at all. Also
 the ioctl requires us to set the routing for _all_ GSIs, and I read it
 that it assumes starting at GSI 0.
 all injected GSI must effectively have a routing entry in KVM. Starting
 at 0 that's not requested. At qemu level there's just the constraint that gsi
 fits between [0, max route number].

Yeah, you are right, I somehow missed that each routing entry has a gsi
field in it. So we have to allocate all of them at once with one ioctl,
but they can be sparse.

  So we cannot even pretend to have
 LPIs here, because we would need at least 8192 empty entries then, not
 to speak of the possibly sparse allocation above. So we have a
 completely distinct name space here.
 What is done currently at qemu level for other archs -  if I understand
 it correctly -  is there is static GSI routing for standard IRQ. For MSI
 irqfd setup they use spare gsi number not yet used for GSI routing < max
 route number. So this is sparse for MSI but not for standard IRQs.
 Effectively we do not plan to have GSI routing for LPIs but only MSI
 routing.

That seems to make sense to me. Since we already limit the number of
SPIs to something sensible with our KVM_DEV_ARM_VGIC_GRP_NR_IRQS, we
could infer an implicit direct routing for those SPIs. KVM could check
the IRQ number against vgic.nr_irqs to see whether an IRQ is routed or not.
Any GSI beyond that number would be an MSI with your enhanced DevID:EvID
pair in it, which gets injected via the ITS emulation code (or the
respective GICv2m code).

That would be the idea, but if it turns out that not routing SPIs but
only MSIs requires too many changes to the (core) KVM code (haven't
looked yet), we could require routing entries for SPIs as well.
After all that's what for instance kvmtool sets up for x86, creating
default 1:1 mappings for ISA and low APIC IRQs and allocating MSIs on
demand after that.

 c) The DevID:EvID pair, which actually identifies an IRQ in all the
 three regimes and is the only authoritative ID.

 So that means we need to maintain the connection between all the three,
 somehow duplicating the whole ITS mapping again to map GSIs to DevID:EvID.
 Currently the KVM routing table indeed stores GSI/DevID:EvID mapping.

 So I wonder if we could use DevID:EvID directly.
 The KVM_IRQFD ioctl struct has some space, so we could put the DevID
 into the pad area.
 Also (more forward-looking) KVM_CAP_ASSIGN_DEV_IRQ identifies guest IRQs
 by an u32, but again there is quite some padding area available.

 ASSIGN_DEV_IRQ is a deprecated feature. We should not use that API I think.

OK, so do we have other users of the GSI routing beside IRQFD then?

I will go ahead and try to implement some code matching Eric's patches
in kvmtool to test the GSI routing.

Eric, how did you test the irqchip routing on the Midway?

Cheers,
Andre.

 Eric

 In general I am a bit reluctant to introduce just another level of
 complexity to the already quite convoluted way of doing IRQs and MSIs on
 ARM(64), that's why I will investigate if we can use DevID:EvID

Re: [PATCH 1/2] powerpc: Define the hcall opcodes return values we need

2015-06-23 Thread Andre Przywara

Hi,

On 23/06/15 11:05, Michael Ellerman wrote:
 On Tue, 2015-06-23 at 11:33 +0200, Paolo Bonzini wrote:
 On 19/06/2015 09:21, Michael Ellerman wrote:
 diff --git a/powerpc/spapr.h b/powerpc/spapr.h
 index 0537f881c0e4..7a377d093ef4 100644
 --- a/powerpc/spapr.h
 +++ b/powerpc/spapr.h
 @@ -16,17 +16,32 @@
  
  #include inttypes.h
  
 -/* We need some of the H_ hcall defs, but they're __KERNEL__ only. */
 -#define __KERNEL__
 -#include asm/hvcall.h
 -#undef __KERNEL__
 -

 This thing is exactly why I think kvmtool's life in the kernel tree was
 harmful.
 
 Harmful is a bit of an overstatement. Though I agree that was a bit of a hack.
 
 Why wasn't instead H_* just moved to a uapi/ header?!?!?  Can you do
 that now?
 
 Because it's not part of the kernel API, never was, still isn't.

Technically it may not be - if I get this correctly it is more of a platform
API defined by the architecture, like ACPI or PSCI on ARM.
But if I get this correctly Linux re-uses those definitions in the KVM
API, by piggy-backing on the existing hypercalls. Please correct me if I
am wrong here, I am looking at arch/powerpc/kvm/book3s_hv.c, where it
seems to trap those hypercalls.

So I think that - though not originally invented or defined by Linux -
it should export those definitions that KVM (re-)uses.
QEMU also has a header file duplicating those definitions, so I support
the idea of an uapi header.

 It *is* part of the hypervisor API, but it's not Linux's job to export that 
 and
 deal with the fallout if it was ever changed.

Regardless of what happens if that phyp API changes, KVM would still
need to support those hypercalls, so I think it should export them as well.

Cheers,
Andre.
--
To unsubscribe from this list: send the line unsubscribe kvm in
the body of a message to majord...@vger.kernel.org
More majordomo info at  http://vger.kernel.org/majordomo-info.html

Re: [RFC 1/6] KVM: api: add kvm_irq_routing_extended_msi

2015-06-22 Thread Andre Przywara

Hi Eric,

On 18/06/15 18:40, Eric Auger wrote:
 On ARM, the MSI msg (address and data) comes along with
 out-of-band device ID information. The device ID encodes the device
 that composes the MSI msg. Let's create a new routing entry structure
 that allows encoding that information on top of the standard MSI
 message.
 
 Signed-off-by: Eric Auger eric.au...@linaro.org
 ---
  Documentation/virtual/kvm/api.txt | 9 +
  include/uapi/linux/kvm.h  | 9 +
  2 files changed, 18 insertions(+)
 
 diff --git a/Documentation/virtual/kvm/api.txt 
 b/Documentation/virtual/kvm/api.txt
 index d20fd94..bcec91e 100644
 --- a/Documentation/virtual/kvm/api.txt
 +++ b/Documentation/virtual/kvm/api.txt
 @@ -1419,6 +1419,7 @@ struct kvm_irq_routing_entry {
   struct kvm_irq_routing_irqchip irqchip;
   struct kvm_irq_routing_msi msi;
   struct kvm_irq_routing_s390_adapter adapter;
 + struct kvm_irq_routing_extended_msi ext_msi;
   __u32 pad[8];
   } u;
  };
 @@ -1427,6 +1428,7 @@ struct kvm_irq_routing_entry {
  #define KVM_IRQ_ROUTING_IRQCHIP 1
  #define KVM_IRQ_ROUTING_MSI 2
  #define KVM_IRQ_ROUTING_S390_ADAPTER 3
 +#define KVM_IRQ_ROUTING_EXTENDED_MSI 4
  
  No flags are specified so far, the corresponding field must be set to zero.
  
 @@ -1442,6 +1444,13 @@ struct kvm_irq_routing_msi {
   __u32 pad;
  };
  
 +struct kvm_irq_routing_extended_msi {
 + __u32 address_lo;
 + __u32 address_hi;
 + __u32 data;
 + __u32 devid;
 +};
 +

I wonder if we could re-use the existing struct kvm_irq_routing_msi,
which has an u32 pad field already. Since we use a different type
number, this should not break. Admittedly not the nicest thing, but
reduces interface bloat:

struct kvm_irq_routing_msi {
__u32 address_lo;
__u32 address_hi;
__u32 data;
union {
__u32 pad;
__u32 devid;
};
};

to maintain backward compatibility on the userland source level.

Cheers,
Andre.

  struct kvm_irq_routing_s390_adapter {
   __u64 ind_addr;
   __u64 summary_addr;
 diff --git a/include/uapi/linux/kvm.h b/include/uapi/linux/kvm.h
 index 2a23705..e3f65a0 100644
 --- a/include/uapi/linux/kvm.h
 +++ b/include/uapi/linux/kvm.h
 @@ -829,6 +829,13 @@ struct kvm_irq_routing_msi {
   __u32 pad;
  };
  
 +struct kvm_irq_routing_extended_msi {
 + __u32 address_lo;
 + __u32 address_hi;
 + __u32 data;
 + __u32 devid;
 +};
 +
  struct kvm_irq_routing_s390_adapter {
   __u64 ind_addr;
   __u64 summary_addr;
 @@ -841,6 +848,7 @@ struct kvm_irq_routing_s390_adapter {
  #define KVM_IRQ_ROUTING_IRQCHIP 1
  #define KVM_IRQ_ROUTING_MSI 2
  #define KVM_IRQ_ROUTING_S390_ADAPTER 3
 +#define KVM_IRQ_ROUTING_EXTENDED_MSI 4
  
  struct kvm_irq_routing_entry {
   __u32 gsi;
 @@ -851,6 +859,7 @@ struct kvm_irq_routing_entry {
   struct kvm_irq_routing_irqchip irqchip;
   struct kvm_irq_routing_msi msi;
   struct kvm_irq_routing_s390_adapter adapter;
 + struct kvm_irq_routing_extended_msi ext_msi;
   __u32 pad[8];
   } u;
  };
 
--
To unsubscribe from this list: send the line unsubscribe kvm in

Re: [RFC 0/6] KVM: arm/arm64: gsi routing support

2015-06-22 Thread Andre Przywara

Hi Eric,

I briefly looked over the series, the patches themselves look good overall.
I have one or two comments on the actual code, but want to discuss the
general approach first (more a dump of some first thoughts):

On 18/06/15 18:40, Eric Auger wrote:
With the advent of GICv3 ITS in-kernel emulation, KVM GSI routing
appears to be requested. More specifically MSI routing is needed.
irqchip routing does not sound to be really useful on arm but usage of
MSI routing also mandates to integrate irqchip routing. The initial
implementation of irqfd on arm must be upgraded with the integration
of kvm irqchip.c code and the implementation of its standard hooks
in the architecture specific part.

The series therefore allows and mandates the usage of KVM_SET_GSI_ROUTING
ioctl along with KVM_IRQFD. If the userspace does not define any routing
table, no irqfd injection can happen. The user-space can use
KVM_CAP_IRQ_ROUTING to detect whether a routing table is needed.

for irqchip routing, the convention is, only SPI can be injected and the
SPI ID corresponds to irqchip.pin + 32. For MSI routing the interrupt ID
matches the MSI msg data. The API evolves to support associating a device ID
with a routing entry.

So if I get this right, in a guest ITS case we have now three different
IRQ name spaces:
a) the LPI number, which is guest internal. The ITS driver in the guest
maintains it. We can track assignments and changes when handling the
MAPVI command in the host kernel, but this would stay in the kernel, as
I don't see an efficient way of propagating this to userland.
b) the GSI number, which is used in communication between userland and
the host kernel. The guest kernel does not know about this at all. Also
the ioctl requires us to set the routing for _all_ GSIs, and I read it
that it assumes starting at GSI 0. So we cannot even pretend to have
LPIs here, because we would need at least 8192 empty entries then, not
to speak of the possibly sparse allocation above. So we have a
completely distinct name space here.
c) The DevID:EvID pair, which actually identifies an IRQ in all the
three regimes and is the only authoritative ID.

So that means we need to maintain the connection between all the three,
somehow duplicating the whole ITS mapping again to map GSIs to DevID:EvID.

So I wonder if we could use DevID:EvID directly.
The KVM_IRQFD ioctl struct has some space, so we could put the DevID
into the pad area.
Also (more forward-looking) KVM_CAP_ASSIGN_DEV_IRQ identifies guest IRQs
by an u32, but again there is quite some padding area available.

In general I am a bit reluctant to introduce just another level of
complexity to the already quite convoluted way of doing IRQs and MSIs on
ARM(64), that's why I will investigate if we can use DevID:EvID to refer
to an interrupt.

So far,
Andre.

Known Issues of this RFC:

- One of the biggest is the API inconsistencies on ARM. Blame me.
Routing should apply to KVM_IRQ_LINE ioctl which is not the case yet
in this series. It only applies to irqfd.
on x86 typically this KVM_IRQ_LINE is plugged onto irqchip.c kvm_set_irq
whereas on ARM we inject directly through kvm_vgic_inject_irq
x on arm/arm64 gsi has a specific structure:
bits: | 31 ... 24 | 23 ... 16 | 15...0 |
field: | irq_type | vcpu_index | irq_id |
where irq_id matches the Interrupt ID
- for KVM_IRQFD without routing (current implementation) the gsi field
corresponds to an SPI index = irq_id (above) -32.
- as far as I understand qemu integration, gsi is supposed to be within
[0, KVM_MAX_IRQ_ROUTES]. Difficult to use KVM_IRQ_LINE gsi.
- to be defined: what we choose as a convention when irqchip routing is
applied: gsi -> irqchip input pin.
- Or shouldn't we simply rule out any userspace irqchip routing and stick
to MSI routing? we could define a fixed identity in-kernel irqchip mapping
and only offer MSI routing.
- static allocation of chip[KVM_NR_IRQCHIPS][KVM_IRQCHIP_NUM_PINS];
arbitrarily put KVM_IRQCHIP_NUM_PINS = 1020 - 32 (SPI count). On s390
this is even bigger.

Currently tested on irqchip routing only (Calxeda midway only),
ie NOT TESTED on MSI routing yet.

This is a very preliminary RFC to ease the discussion.

Code can be found at
https://git.linaro.org/people/eric.auger/linux.git/shortlog/refs/heads/v4.1-rc8-gsi-routing-rfc

It applies on Andre's [PATCH 00/13] arm64: KVM: GICv3 ITS emulation
(http://www.spinics.net/lists/kvm/msg117402.html)

Eric Auger (6):
KVM: api: add kvm_irq_routing_extended_msi
KVM: kvm_host: add kvm_extended_msi
KVM: irqchip: convey devid to kvm_set_msi
KVM: arm/arm64: enable irqchip routing
KVM: arm/arm64: enable MSI routing
KVM: arm: implement kvm_set_msi by gsi direct mapping

Documentation/virtual/kvm/api.txt | 20 ++--
arch/arm/include/asm/kvm_host.h | 2 +
arch/arm/kvm/Kconfig | 3 ++
arch/arm/kvm/Makefile | 2 +-

[PATCH] kvmtool: avoid casts when initializing structures

2015-06-19 Thread Andre Przywara

Due to our kernel heritage we have code in kvmtool that relies on
the (still) implicit -std=gnu89 compiler switch.
It turns out that this just affects some structure initialization,
where we currently provide a cast to the type, which upsets GCC for
anything beyond -std=gnu89 (for instance gnu99 or gnu11).
We do need the casts when initializing structures that are not
assigned to the same type, so we put it there explicitly.

This allows us to compile with all the three standards GCC currently
supports: gnu89/90, gnu99 and gnu11.
GCC threatens people with moving to gnu11 as the new default standard,
so let's fix this sooner rather than later.

Signed-off-by: Andre Przywara andre.przyw...@arm.com
---
Hi,

TBH I don't know why we had those casts there in the first place,
but it works without them, even for -std=gnu89.
If people agree with this, we can think about dropping the forced
CFLAGS and LDFLAGS reset in the Makefile again, since this patch
should fix compilation on Dave Jones' machine as well ;-)

Cheers,
Andre.
 disk/qcow.c| 6 +++---
 include/kvm/mutex.h| 2 +-
 include/linux/rbtree.h | 2 +-
 virtio/9p.c| 2 +-
 virtio/balloon.c   | 2 +-
 virtio/blk.c   | 2 +-
 virtio/console.c   | 2 +-
 virtio/net.c   | 2 +-
 virtio/rng.c   | 2 +-
 virtio/scsi.c  | 2 +-
 10 files changed, 12 insertions(+), 12 deletions(-)

diff --git a/disk/qcow.c b/disk/qcow.c
index 64a2550..e26c419 100644
--- a/disk/qcow.c
+++ b/disk/qcow.c
@@ -1203,7 +1203,7 @@ static int qcow_read_refcount_table(struct qcow *q)
if (!rft-rf_table)
return -1;
 
-   rft-root = RB_ROOT;
+   rft-root = (struct rb_root) RB_ROOT;
INIT_LIST_HEAD(rft-lru_list);
 
return pread_in_full(q-fd, rft-rf_table, sizeof(u64) * rft-rf_size, 
header-refcount_table_offset);
@@ -1289,7 +1289,7 @@ static struct disk_image *qcow2_probe(int fd, bool 
readonly)
 
l1t = q-table;
 
-   l1t-root = RB_ROOT;
+   l1t-root = (struct rb_root) RB_ROOT;
INIT_LIST_HEAD(l1t-lru_list);
 
h = q-header = qcow2_read_header(fd);
@@ -1435,7 +1435,7 @@ static struct disk_image *qcow1_probe(int fd, bool 
readonly)
 
l1t = q-table;
 
-   l1t-root = RB_ROOT;
+   l1t-root = (struct rb_root)RB_ROOT;
INIT_LIST_HEAD(l1t-lru_list);
 
h = q-header = qcow1_read_header(fd);
diff --git a/include/kvm/mutex.h b/include/kvm/mutex.h
index a90584b..1f7d0f6 100644
--- a/include/kvm/mutex.h
+++ b/include/kvm/mutex.h
@@ -13,7 +13,7 @@
 struct mutex {
pthread_mutex_t mutex;
 };
-#define MUTEX_INITIALIZER (struct mutex) { .mutex = PTHREAD_MUTEX_INITIALIZER }
+#define MUTEX_INITIALIZER { .mutex = PTHREAD_MUTEX_INITIALIZER }
 
 #define DEFINE_MUTEX(mtx) struct mutex mtx = MUTEX_INITIALIZER
 
diff --git a/include/linux/rbtree.h b/include/linux/rbtree.h
index fb31765..33adf78 100644
--- a/include/linux/rbtree.h
+++ b/include/linux/rbtree.h
@@ -46,7 +46,7 @@ struct rb_root {
 
 #define rb_parent(r)   ((struct rb_node *)((r)-__rb_parent_color  ~3))
 
-#define RB_ROOT(struct rb_root) { NULL, }
+#define RB_ROOT{ NULL, }
 #definerb_entry(ptr, type, member) container_of(ptr, type, member)
 
 #define RB_EMPTY_ROOT(root)  ((root)-rb_node == NULL)
diff --git a/virtio/9p.c b/virtio/9p.c
index 66dcc26..49e7c5c 100644
--- a/virtio/9p.c
+++ b/virtio/9p.c
@@ -1320,7 +1320,7 @@ static int set_size_vq(struct kvm *kvm, void *dev, u32 
vq, int size)
return size;
 }
 
-struct virtio_ops p9_dev_virtio_ops = (struct virtio_ops) {
+struct virtio_ops p9_dev_virtio_ops = {
.get_config = get_config,
.get_host_features  = get_host_features,
.set_guest_features = set_guest_features,
diff --git a/virtio/balloon.c b/virtio/balloon.c
index 84c4bb0..9564aa3 100644
--- a/virtio/balloon.c
+++ b/virtio/balloon.c
@@ -239,7 +239,7 @@ static int set_size_vq(struct kvm *kvm, void *dev, u32 vq, 
int size)
return size;
 }
 
-struct virtio_ops bln_dev_virtio_ops = (struct virtio_ops) {
+struct virtio_ops bln_dev_virtio_ops = {
.get_config = get_config,
.get_host_features  = get_host_features,
.set_guest_features = set_guest_features,
diff --git a/virtio/blk.c b/virtio/blk.c
index edfa8e6..c485e4f 100644
--- a/virtio/blk.c
+++ b/virtio/blk.c
@@ -244,7 +244,7 @@ static int set_size_vq(struct kvm *kvm, void *dev, u32 vq, 
int size)
return size;
 }
 
-static struct virtio_ops blk_dev_virtio_ops = (struct virtio_ops) {
+static struct virtio_ops blk_dev_virtio_ops = {
.get_config = get_config,
.get_host_features  = get_host_features,
.set_guest_features = set_guest_features,
diff --git a/virtio/console.c b/virtio/console.c
index 384eac1..f1c0a19 100644
--- a/virtio/console.c
+++ b/virtio/console.c
@@ -197,7 +197,7 @@ static int set_size_vq(struct kvm *kvm, void *dev, u32 vq, 
int size)
return

Re: [PATCH] kvmtool: Makefile: allow overriding CC and LD

2015-06-19 Thread Andre Przywara

Hi Paolo,

On 19/06/15 10:59, Paolo Bonzini wrote:
 
 
 On 18/06/2015 17:50, Andre Przywara wrote:
 Currently we set CC unconditionally to ${CROSS_COMPILE}gcc, the same
 for LD.
 Allow people to override the compiler name by specifying it explicitly
 on the command line or via the environment.
 Beside calling a certain compiler binary this allows to pass in
 options to the compiler, which lets us get rid of the PowerPC
 overrides in the Makefile. Possible uses:
 $ make CC=gcc -m64 LD=ld -melf64ppc
 (build kvmtool on a PowerPC toolchain defaulting to 32-bit)
 $ make CC=gcc -m32 LD=ld -melf_i386
 (build a 32-bit binary on a multilib-enabled x86-64 compiler)

 Signed-off-by: Andre Przywara andre.przyw...@arm.com
 ---
  Makefile | 10 ++
  1 file changed, 6 insertions(+), 4 deletions(-)

 diff --git a/Makefile b/Makefile
 index 6110b8e..888bee5 100644
 --- a/Makefile
 +++ b/Makefile
 @@ -14,9 +14,13 @@ export E Q
  include config/utilities.mak
  include config/feature-tests.mak
  
 -CC  := $(CROSS_COMPILE)gcc
 +ifeq ($(origin CC), default)
 +CC  := $(CROSS_COMPILE)gcc
 +endif
  CFLAGS  :=
 -LD  := $(CROSS_COMPILE)ld
 +ifeq ($(origin LD), default)
 +LD  := $(CROSS_COMPILE)ld
 +endif
 
 I know zero about the kvmtool build system, 

Well, it inherits a lot from the kernel ;-)

 but that ought not to be
 necessary.  The make manual says:
 
 If a variable has been set with a command argument (*note Overriding
 Variables: Overriding.), then ordinary assignments in the makefile are
 ignored.

Right, there was this nasty difference between CC=gcc make and
make CC=gcc. So I agree that the latter works even without that patch.

Guess I was only looking at the environment here.
Paolo, thanks for pointing out!

Will, please ignore this patch then.

Cheers,
Andre.

 
 Paolo
 
  LDFLAGS :=
  
  FIND:= find
 @@ -148,8 +152,6 @@ ifeq ($(ARCH), powerpc)
  OBJS+= powerpc/spapr_pci.o
  OBJS+= powerpc/xics.o
  ARCH_INCLUDE := powerpc/include
 -CFLAGS  += -m64
 -LDFLAGS += -m elf64ppc
  
  ARCH_WANT_LIBFDT := y
  endif

 
--
To unsubscribe from this list: send the line unsubscribe kvm in
the body of a message to majord...@vger.kernel.org
More majordomo info at  http://vger.kernel.org/majordomo-info.html

Re: [PATCH] kvmtool: Makefile: allow overriding CC and LD

2015-06-19 Thread Andre Przywara

Hi Michael,

On 19/06/15 02:14, Michael Ellerman wrote:
 On Thu, 2015-06-18 at 16:50 +0100, Andre Przywara wrote:
 Currently we set CC unconditionally to ${CROSS_COMPILE}gcc, the same
 for LD.
 Allow people to override the compiler name by specifying it explicitly
 on the command line or via the environment.
 Beside calling a certain compiler binary this allows to pass in
 options to the compiler, which lets us get rid of the PowerPC
 overrides in the Makefile. Possible uses:
 $ make CC=gcc -m64 LD=ld -melf64ppc
 (build kvmtool on a PowerPC toolchain defaulting to 32-bit)
 $ make CC=gcc -m32 LD=ld -melf_i386
 (build a 32-bit binary on a multilib-enabled x86-64 compiler)
 
 
 I'm not a big fan of that.
 
 Your examples are all about overriding CFLAGS and LDFLAGS, not CC and LD. So
 if anything you should be allowing that. Adding flags to CC and LD is asking
 for trouble.

Will just disabled overriding CFLAGS and LDFLAGS, I think because
kvmtool inherited some C nastiness from the kernel, which does not
compile with random flags set (CFLAGS=-std=gnu99 was the one that broke it).
Maybe we should revisit that, either fix the code to be more robust to
comply with various standards or document that you should not have
CFLAGS set. Then allow overriding CFLAGS again.

But I thought that overriding CC is common practise - if you want to
select a different compiler, that is. Using a different bitness seems a
lot like a different compiler to me, same with different endianness.
I think I saw quite some examples on the web about using CC=gcc -m32.

I agree that abusing CC to pass optimization options to the compiler is
not good, but for kvmtool's Makefile I don't see how adding flags to CC
would hurt.

Cheers,
Andre.
--
To unsubscribe from this list: send the line unsubscribe kvm-ppc in
the body of a message to majord...@vger.kernel.org
More majordomo info at  http://vger.kernel.org/majordomo-info.html

Re: [PATCH] kvmtool: Makefile: allow overriding CC and LD

2015-06-19 Thread Andre Przywara

Hi Michael,

On 19/06/15 02:14, Michael Ellerman wrote:
 On Thu, 2015-06-18 at 16:50 +0100, Andre Przywara wrote:
 Currently we set CC unconditionally to ${CROSS_COMPILE}gcc, the same
 for LD.
 Allow people to override the compiler name by specifying it explicitly
 on the command line or via the environment.
 Beside calling a certain compiler binary this allows to pass in
 options to the compiler, which lets us get rid of the PowerPC
 overrides in the Makefile. Possible uses:
 $ make CC=gcc -m64 LD=ld -melf64ppc
 (build kvmtool on a PowerPC toolchain defaulting to 32-bit)
 $ make CC=gcc -m32 LD=ld -melf_i386
 (build a 32-bit binary on a multilib-enabled x86-64 compiler)
 
 
 I'm not a big fan of that.
 
 Your examples are all about overriding CFLAGS and LDFLAGS, not CC and LD. So
 if anything you should be allowing that. Adding flags to CC and LD is asking
 for trouble.

Will just disabled overriding CFLAGS and LDFLAGS, I think because
kvmtool inherited some C nastiness from the kernel, which does not
compile with random flags set (CFLAGS=-std=gnu99 was the one that broke it).
Maybe we should revisit that, either fix the code to be more robust to
comply with various standards or document that you should not have
CFLAGS set. Then allow overriding CFLAGS again.

But I thought that overriding CC is common practise - if you want to
select a different compiler, that is. Using a different bitness seems a
lot like a different compiler to me, same with different endianness.
I think I saw quite some examples on the web about using CC=gcc -m32.

I agree that abusing CC to pass optimization options to the compiler is
not good, but for kvmtool's Makefile I don't see how adding flags to CC
would hurt.

Cheers,
Andre.
--
To unsubscribe from this list: send the line unsubscribe kvm in
the body of a message to majord...@vger.kernel.org
More majordomo info at  http://vger.kernel.org/majordomo-info.html

Re: [PATCH 2/3] powerpc: use default endianness for converting guest/init

2015-06-19 Thread Andre Przywara

Hi Michael,

On 19/06/15 02:08, Michael Ellerman wrote:
 On Thu, 2015-06-18 at 15:52 +0100, Andre Przywara wrote:
 Hi,

 On 06/17/2015 10:43 AM, Andre Przywara wrote:
 For converting the guest/init binary into an object file, we call
 the linker binary, setting the endianness to big endian explicitly
 when compiling kvmtool for powerpc.
 This breaks if the compiler is actually targeting little endian
 (which is true for the Debian port, for instance).
 Remove the explicit big endianness switch from the linker call to
 allow linking on little endian PowerPC builds again.

 Signed-off-by: Andre Przywara andre.przyw...@arm.com
 ---
 Hi,

 this fixed the powerpc64le build for me, while still compiling fine
 for big endian. Admittedly this whole init-guest_init.o conversion
 has its issues (with MIPS, for instance), which deserve proper fixing,
 but lets just fix that build for now.

 Will was concerned about breaking toolchains where the linker does not
 default to 64-bit. Is that an issue we care about?
 
 Yeah, that would be Debian & Ubuntu BE at least, and maybe Fedora too? I'm not
 sure how you compiled it big endian?

I have my own cross-compiler built from scratch. This is
powerpc64-linux-gnu, which is big endian. I don't have any distribution
behind it, it's just a cross-compiler with glibc.

 AFAICT LDFLAGS is only used in this dodgy binary-to-object-file
 conversion of guest/init. For this we rely on the resulting .o file to
 have the same ELF target as the other object files to be finally linked
 into the lkvm binary. As we don't compile guest/init with CFLAGS, there
 is a possible mismatch.

 I am looking into a proper fix for this now (compiling guest/init with
 CFLAGS, calling $CC with linker options instead of $LD and allowing CC
 and LD override). Still struggling with MIPS, though :-(
 
 Yeah that's obviously a better solution medium term.
 
 Can you do something like this? Sorry untested:
 
 diff --git a/Makefile b/Makefile
 index 6110b8e..8663d67 100644
 --- a/Makefile
 +++ b/Makefile
 @@ -149,7 +149,11 @@ ifeq ($(ARCH), powerpc)
 OBJS+= powerpc/xics.o
 ARCH_INCLUDE := powerpc/include
 CFLAGS  += -m64
 -   LDFLAGS += -m elf64ppc
 +   ifeq ($(call try-build,$(SOURCE_HELLO),$(CFLAGS),-m elf64ppc),y)
 +   LDFLAGS += -m elf64ppc
 +   else
 +   LDFLAGS += -m elf64leppc
 +   endif
  
 ARCH_WANT_LIBFDT := y
  endif

Nah, actually I want to get rid of those LDFLAGS altogether. For some
reason using ld to convert a random binary file into a C object is
causing trouble on MIPS, because ld uses a slightly different ELF target
than CC there.
I think this conversion should be more a job for objcopy than for ld,
but that does not fix the problem in a generic way (though I was able to
hack it with some magic objcopy options).

What works though is using xxd to convert the binary guest/init into a C
array:
$ xxd -i guest/init | $(CC) -x c -c - -o guest/guest_init.o
This has the nice property of using the same compiler that generates the
other object files and thus automatically matches them (which is a
problem under MIPS atm, as ld seems to default to some different ELF type).
The only issue is that xxd is part of the vim package, which would annoy
Emacs users. Not sure we are in a position to mandate vim for compiling
kvmtool ;-)

Cheers,
Andre.
--
To unsubscribe from this list: send the line unsubscribe kvm-ppc in

Re: [PATCH 2/3] powerpc: use default endianness for converting guest/init

2015-06-19 Thread Andre Przywara

Hi Michael,

On 19/06/15 02:08, Michael Ellerman wrote:
 On Thu, 2015-06-18 at 15:52 +0100, Andre Przywara wrote:
 Hi,

 On 06/17/2015 10:43 AM, Andre Przywara wrote:
 For converting the guest/init binary into an object file, we call
 the linker binary, setting the endianness to big endian explicitly
 when compiling kvmtool for powerpc.
 This breaks if the compiler is actually targeting little endian
 (which is true for the Debian port, for instance).
 Remove the explicit big endianness switch from the linker call to
 allow linking on little endian PowerPC builds again.

 Signed-off-by: Andre Przywara andre.przyw...@arm.com
 ---
 Hi,

 this fixed the powerpc64le build for me, while still compiling fine
 for big endian. Admittedly this whole init-guest_init.o conversion
 has its issues (with MIPS, for instance), which deserve proper fixing,
 but lets just fix that build for now.

 Will was concerned about breaking toolchains where the linker does not
 default to 64-bit. Is that an issue we care about?
 
 Yeah, that would be Debian & Ubuntu BE at least, and maybe Fedora too? I'm not
 sure how you compiled it big endian?

I have my own cross-compiler built from scratch. This is
powerpc64-linux-gnu, which is big endian. I don't have any distribution
behind it, it's just a cross-compiler with glibc.

 AFAICT LDFLAGS is only used in this dodgy binary-to-object-file
 conversion of guest/init. For this we rely on the resulting .o file to
 have the same ELF target as the other object files to be finally linked
 into the lkvm binary. As we don't compile guest/init with CFLAGS, there
 is a possible mismatch.

 I am looking into a proper fix for this now (compiling guest/init with
 CFLAGS, calling $CC with linker options instead of $LD and allowing CC
 and LD override). Still struggling with MIPS, though :-(
 
 Yeah that's obviously a better solution medium term.
 
 Can you do something like this? Sorry untested:
 
 diff --git a/Makefile b/Makefile
 index 6110b8e..8663d67 100644
 --- a/Makefile
 +++ b/Makefile
 @@ -149,7 +149,11 @@ ifeq ($(ARCH), powerpc)
 OBJS+= powerpc/xics.o
 ARCH_INCLUDE := powerpc/include
 CFLAGS  += -m64
 -   LDFLAGS += -m elf64ppc
 +   ifeq ($(call try-build,$(SOURCE_HELLO),$(CFLAGS),-m elf64ppc),y)
 +   LDFLAGS += -m elf64ppc
 +   else
 +   LDFLAGS += -m elf64leppc
 +   endif
  
 ARCH_WANT_LIBFDT := y
  endif

Nah, actually I want to get rid of those LDFLAGS altogether. For some
reason using ld to convert a random binary file into a C object is
causing trouble on MIPS, because ld uses a slightly different ELF target
than CC there.
I think this conversion should be more a job for objcopy than for ld,
but that does not fix the problem in a generic way (though I was able to
hack it with some magic objcopy options).

What works though is using xxd to convert the binary guest/init into a C
array:
$ xxd -i guest/init | $(CC) -x c -c - -o guest/guest_init.o
This has the nice property of using the same compiler that generates the
other object files and thus automatically matches them (which is a
problem under MIPS atm, as ld seems to default to some different ELF type).
The only issue is that xxd is part of the vim package, which would annoy
Emacs users. Not sure we are in a position to mandate vim for compiling
kvmtool ;-)

Cheers,
Andre.
--
To unsubscribe from this list: send the line unsubscribe kvm in

Re: [PATCH 13/13] KVM: arm64: enable ITS emulation as a virtual MSI controller

2015-06-18 Thread Andre Przywara

Hi Eric,

On 06/18/2015 09:43 AM, Eric Auger wrote:
 On 05/29/2015 11:53 AM, Andre Przywara wrote:
 If userspace has provided a base address for the ITS register frame,
 we enable the bits that advertise LPIs in the GICv3.
 When the guest has enabled LPIs and the ITS, we enable the emulation
 part by initializing the ITS data structures and trapping on ITS
 register frame accesses by the guest.
 Also we enable the KVM_SIGNAL_MSI feature to allow userland to inject
 MSIs into the guest. Not having enabled the ITS emulation will lead
 to a -ENODEV when trying to inject a MSI.




 Signed-off-by: Andre Przywara andre.przyw...@arm.com
 diff --git a/virt/kvm/arm/vgic.c b/virt/kvm/arm/vgic.c
 index 9f7b05f..09b1f46 100644
 --- a/virt/kvm/arm/vgic.c
 +++ b/virt/kvm/arm/vgic.c
 @@ -2254,3 +2254,13 @@ int kvm_set_msi(struct kvm_kernel_irq_routing_entry 
 *e,
  {
  return 0;
  }
 +
 +#ifdef CONFIG_HAVE_KVM_MSI
 I don't think the #ifdef is required since the entry is already
 prevented in kvm_main.c, in the KVM_SIGNAL_MSI case.

But that fails compilation on ARM (which uses this file as well),
because we have a dummy fail function in the header if
CONFIG_HAVE_KVM_MSI is not defined.
So you get: error: redefinition of 'kvm_send_userspace_msi'

Cheers,
Andre.

 +int kvm_send_userspace_msi(struct kvm *kvm, struct kvm_msi *msi)
 +{
 +if (kvm-arch.vgic.vm_ops.inject_msi)
 +return kvm-arch.vgic.vm_ops.inject_msi(kvm, msi);
 +else
 +return -ENODEV;
 +}
 +#endif

 
--
To unsubscribe from this list: send the line unsubscribe kvm in
the body of a message to majord...@vger.kernel.org
More majordomo info at  http://vger.kernel.org/majordomo-info.html

Re: [PATCH 2/3] powerpc: use default endianness for converting guest/init

2015-06-18 Thread Andre Przywara

Hi,

On 06/17/2015 10:43 AM, Andre Przywara wrote:
 For converting the guest/init binary into an object file, we call
 the linker binary, setting the endianness to big endian explicitly
 when compiling kvmtool for powerpc.
 This breaks if the compiler is actually targeting little endian
 (which is true for the Debian port, for instance).
 Remove the explicit big endianness switch from the linker call to
 allow linking on little endian PowerPC builds again.
 
 Signed-off-by: Andre Przywara andre.przyw...@arm.com
 ---
 Hi,
 
 this fixed the powerpc64le build for me, while still compiling fine
 for big endian. Admittedly this whole init-guest_init.o conversion
 has its issues (with MIPS, for instance), which deserve proper fixing,
 but lets just fix that build for now.
 

Will was concerned about breaking toolchains where the linker does not
default to 64-bit. Is that an issue we care about?
AFAICT LDFLAGS is only used in this dodgy binary-to-object-file
conversion of guest/init. For this we rely on the resulting .o file to
have the same ELF target as the other object files to be finally linked
into the lkvm binary. As we don't compile guest/init with CFLAGS, there
is a possible mismatch.

I am looking into a proper fix for this now (compiling guest/init with
CFLAGS, calling $CC with linker options instead of $LD and allowing CC
and LD override). Still struggling with MIPS, though :-(

If someone is eager to fix compilation on PowerPC meanwhile, feel free
to use this fix for the time being.

Cheers,
Andre.

 
  Makefile | 1 -
  1 file changed, 1 deletion(-)
 
 diff --git a/Makefile b/Makefile
 index 6110b8e..c118e1a 100644
 --- a/Makefile
 +++ b/Makefile
 @@ -149,7 +149,6 @@ ifeq ($(ARCH), powerpc)
   OBJS+= powerpc/xics.o
   ARCH_INCLUDE := powerpc/include
   CFLAGS  += -m64
 - LDFLAGS += -m elf64ppc
  
   ARCH_WANT_LIBFDT := y
  endif
 
--
To unsubscribe from this list: send the line unsubscribe kvm in
the body of a message to majord...@vger.kernel.org
More majordomo info at  http://vger.kernel.org/majordomo-info.html

Re: [PATCH 2/3] powerpc: use default endianness for converting guest/init

2015-06-18 Thread Andre Przywara

Hi,

On 06/17/2015 10:43 AM, Andre Przywara wrote:
 For converting the guest/init binary into an object file, we call
 the linker binary, setting the endianness to big endian explicitly
 when compiling kvmtool for powerpc.
 This breaks if the compiler is actually targeting little endian
 (which is true for the Debian port, for instance).
 Remove the explicit big endianness switch from the linker call to
 allow linking on little endian PowerPC builds again.
 
 Signed-off-by: Andre Przywara andre.przyw...@arm.com
 ---
 Hi,
 
 this fixed the powerpc64le build for me, while still compiling fine
 for big endian. Admittedly this whole init-guest_init.o conversion
 has its issues (with MIPS, for instance), which deserve proper fixing,
 but lets just fix that build for now.
 

Will was concerned about breaking toolchains where the linker does not
default to 64-bit. Is that an issue we care about?
AFAICT LDFLAGS is only used in this dodgy binary-to-object-file
conversion of guest/init. For this we rely on the resulting .o file to
have the same ELF target as the other object files to be finally linked
into the lkvm binary. As we don't compile guest/init with CFLAGS, there
is a possible mismatch.

I am looking into a proper fix for this now (compiling guest/init with
CFLAGS, calling $CC with linker options instead of $LD and allowing CC
and LD override). Still struggling with MIPS, though :-(

If someone is eager to fix compilation on PowerPC meanwhile, feel free
to use this fix for the time being.

Cheers,
Andre.

 
  Makefile | 1 -
  1 file changed, 1 deletion(-)
 
 diff --git a/Makefile b/Makefile
 index 6110b8e..c118e1a 100644
 --- a/Makefile
 +++ b/Makefile
 @@ -149,7 +149,6 @@ ifeq ($(ARCH), powerpc)
   OBJS+= powerpc/xics.o
   ARCH_INCLUDE := powerpc/include
   CFLAGS  += -m64
 - LDFLAGS += -m elf64ppc
  
   ARCH_WANT_LIBFDT := y
  endif
 
--
To unsubscribe from this list: send the line unsubscribe kvm-ppc in
the body of a message to majord...@vger.kernel.org
More majordomo info at  http://vger.kernel.org/majordomo-info.html

[PATCH] kvmtool: Makefile: allow overriding CC and LD

2015-06-18 Thread Andre Przywara

Currently we set CC unconditionally to ${CROSS_COMPILE}gcc, the same
for LD.
Allow people to override the compiler name by specifying it explicitly
on the command line or via the environment.
Beside calling a certain compiler binary this allows to pass in
options to the compiler, which lets us get rid of the PowerPC
overrides in the Makefile. Possible uses:
$ make CC=gcc -m64 LD=ld -melf64ppc
(build kvmtool on a PowerPC toolchain defaulting to 32-bit)
$ make CC=gcc -m32 LD=ld -melf_i386
(build a 32-bit binary on a multilib-enabled x86-64 compiler)

Signed-off-by: Andre Przywara andre.przyw...@arm.com
---
 Makefile | 10 ++
 1 file changed, 6 insertions(+), 4 deletions(-)

diff --git a/Makefile b/Makefile
index 6110b8e..888bee5 100644
--- a/Makefile
+++ b/Makefile
@@ -14,9 +14,13 @@ export E Q
 include config/utilities.mak
 include config/feature-tests.mak
 
-CC := $(CROSS_COMPILE)gcc
+ifeq ($(origin CC), default)
+   CC  := $(CROSS_COMPILE)gcc
+endif
 CFLAGS :=
-LD := $(CROSS_COMPILE)ld
+ifeq ($(origin LD), default)
+   LD  := $(CROSS_COMPILE)ld
+endif
 LDFLAGS:=
 
 FIND   := find
@@ -148,8 +152,6 @@ ifeq ($(ARCH), powerpc)
OBJS+= powerpc/spapr_pci.o
OBJS+= powerpc/xics.o
ARCH_INCLUDE := powerpc/include
-   CFLAGS  += -m64
-   LDFLAGS += -m elf64ppc
 
ARCH_WANT_LIBFDT := y
 endif
-- 
2.3.5

--
To unsubscribe from this list: send the line unsubscribe kvm in
the body of a message to majord...@vger.kernel.org
More majordomo info at  http://vger.kernel.org/majordomo-info.html

[PATCH] kvmtool: Makefile: allow overriding CC and LD

2015-06-18 Thread Andre Przywara

Currently we set CC unconditionally to ${CROSS_COMPILE}gcc, the same
for LD.
Allow people to override the compiler name by specifying it explicitly
on the command line or via the environment.
Beside calling a certain compiler binary this allows to pass in
options to the compiler, which lets us get rid of the PowerPC
overrides in the Makefile. Possible uses:
$ make CC="gcc -m64" LD="ld -melf64ppc"
(build kvmtool on a PowerPC toolchain defaulting to 32-bit)
$ make CC="gcc -m32" LD="ld -melf_i386"
(build a 32-bit binary on a multilib-enabled x86-64 compiler)

Signed-off-by: Andre Przywara andre.przyw...@arm.com
---
 Makefile | 10 ++
 1 file changed, 6 insertions(+), 4 deletions(-)

diff --git a/Makefile b/Makefile
index 6110b8e..888bee5 100644
--- a/Makefile
+++ b/Makefile
@@ -14,9 +14,13 @@ export E Q
 include config/utilities.mak
 include config/feature-tests.mak
 
-CC := $(CROSS_COMPILE)gcc
+ifeq ($(origin CC), default)
+   CC  := $(CROSS_COMPILE)gcc
+endif
 CFLAGS :=
-LD := $(CROSS_COMPILE)ld
+ifeq ($(origin LD), default)
+   LD  := $(CROSS_COMPILE)ld
+endif
 LDFLAGS:=
 
 FIND   := find
@@ -148,8 +152,6 @@ ifeq ($(ARCH), powerpc)
OBJS+= powerpc/spapr_pci.o
OBJS+= powerpc/xics.o
ARCH_INCLUDE := powerpc/include
-   CFLAGS  += -m64
-   LDFLAGS += -m elf64ppc
 
ARCH_WANT_LIBFDT := y
 endif
-- 
2.3.5

--
To unsubscribe from this list: send the line unsubscribe kvm-ppc in
the body of a message to majord...@vger.kernel.org
More majordomo info at  http://vger.kernel.org/majordomo-info.html

Re: [PATCH] kvmtool: don't use PCI config space IRQ line field

2015-06-18 Thread Andre Przywara

Hi Will,

On 06/16/2015 06:06 PM, Will Deacon wrote:
 On Mon, Jun 15, 2015 at 11:45:38AM +0100, Andre Przywara wrote:
 On 06/05/2015 05:41 PM, Will Deacon wrote:
 On Thu, Jun 04, 2015 at 04:20:45PM +0100, Andre Przywara wrote:
 In PCI config space there is an interrupt line field (offset 0x3f),
 which is used to initially communicate the IRQ line number from
 firmware to the OS. _Hardware_ should never use this information,
 as the OS is free to write any information in there.
 But kvmtool uses this number when it triggers IRQs in the guest,
 which fails starting with Linux 3.19-rc1, where the PCI layer starts
 writing the virtual IRQ number in there.

 Fix that by storing the IRQ number in a separate field in
 struct virtio_pci, which is independent from the PCI config space
 and cannot be influenced by the guest.
 This fixes ARM/ARM64 guests using PCI with newer kernels.

 Signed-off-by: Andre Przywara andre.przyw...@arm.com
 ---
  include/kvm/virtio-pci.h | 8 
  virtio/pci.c | 9 ++---
  2 files changed, 14 insertions(+), 3 deletions(-)

 diff --git a/include/kvm/virtio-pci.h b/include/kvm/virtio-pci.h
 index c795ce7..b70cadd 100644
 --- a/include/kvm/virtio-pci.h
 +++ b/include/kvm/virtio-pci.h
 @@ -30,6 +30,14 @@ struct virtio_pci {
u8  isr;
u32 features;
  
 +  /*
 +   * We cannot rely on the INTERRUPT_LINE byte in the config space once
 +   * we have run guest code, as the OS is allowed to use that field
 +   * as a scratch pad to communicate between driver and PCI layer.
 +   * So store our legacy interrupt line number in here for internal use.
 +   */
 +  u8  legacy_irq_line;
 +
/* MSI-X */
u16 config_vector;
u32 config_gsi;
 diff --git a/virtio/pci.c b/virtio/pci.c
 index 7556239..e17e5a9 100644
 --- a/virtio/pci.c
 +++ b/virtio/pci.c
 @@ -141,7 +141,7 @@ static bool virtio_pci__io_in(struct ioport *ioport, 
 struct kvm_cpu *vcpu, u16 p
break;
case VIRTIO_PCI_ISR:
   ioport__write8(data, vpci->isr);
 -  kvm__irq_line(kvm, vpci->pci_hdr.irq_line, VIRTIO_IRQ_LOW);
 +  kvm__irq_line(kvm, vpci->legacy_irq_line, VIRTIO_IRQ_LOW);
   vpci->isr = VIRTIO_IRQ_LOW;
break;
default:
 @@ -299,7 +299,7 @@ int virtio_pci__signal_vq(struct kvm *kvm, struct 
 virtio_device *vdev, u32 vq)
   kvm__irq_trigger(kvm, vpci->gsis[vq]);
   } else {
   vpci->isr = VIRTIO_IRQ_HIGH;
 -  kvm__irq_trigger(kvm, vpci->pci_hdr.irq_line);
 +  kvm__irq_trigger(kvm, vpci->legacy_irq_line);
}
return 0;
  }
 @@ -323,7 +323,7 @@ int virtio_pci__signal_config(struct kvm *kvm, struct 
 virtio_device *vdev)
   kvm__irq_trigger(kvm, vpci->config_gsi);
   } else {
   vpci->isr = VIRTIO_PCI_ISR_CONFIG;
 -  kvm__irq_trigger(kvm, vpci->pci_hdr.irq_line);
 +  kvm__irq_trigger(kvm, vpci->legacy_irq_line);
}
  
return 0;
 @@ -422,6 +422,9 @@ int virtio_pci__init(struct kvm *kvm, void *dev, 
 struct virtio_device *vdev,
   if (r < 0)
   goto free_msix_mmio;
  
 +  /* save the IRQ that device__register() has allocated */
 +  vpci->legacy_irq_line = vpci->pci_hdr.irq_line;

 I'd rather we used the container_of trick that we do for virtio-mmio
 devices when assigning the irq in device__register. Then we can avoid
 this line completely.

 Not completely sure I get what you mean, I take it you want to assign
 legacy_irq_line in pci__assign_irq() directly (where the IRQ number is
 allocated).
 But this function is PCI generic code and is used by the VESA
 framebuffer and the shmem device on x86 as well. For those devices
 dev_hdr is not part of a struct virtio_pci, so we can't do container_of
 to assign the legacy_irq_line here directly.
 Admittedly this fix should apply to the other two users as well, but
 VESA does not use interrupts and pci-shmem is completely broken anyway,
 so I didn't bother to fix it in this regard.
 Would it be justified to provide an IRQ number field in struct
 device_header to address all users?

 Or what am I missing here?
 
 If VESA and shmem are broken, they should either be fixed or removed.

I am tempted to remove shmem, since it's broken:
a) there is no upstream driver, only some out-of-tree uio driver module
in some Github repo
b) the PCI device BARs do not match what QEMU implements and what the
uio driver expects (IO BAR vs. MMIO BAR)
c) there is (at least one) bug in kvmtool (easily fixed, though)
I haven't completely given up yet fixing it, but that's for another
series ;-)

However ...

 
 If you fix them, then we could have separate virtual buses for virtio-pci
 and emulated-pci (or whatever you want to call it). We could also have
 a separate bus for passthrough-devices too.
 
 However, that's quite a lot of work for a bug-fix, so I guess the easiest
 thing is to extend your current hack to cover VESA and shmem

Re: [PATCH 13/13] KVM: arm64: enable ITS emulation as a virtual MSI controller

2015-06-18 Thread Andre Przywara

On 06/18/2015 04:03 PM, Pavel Fedin wrote:
  Hello!
 
 But that fails compilation on ARM (which uses this file as well),
 because we have a dummy fail function in the header if
 CONFIG_HAVE_KVM_MSI is not defined.
 
  May be then remove that fail function too? Too many #ifdef's are not good...

Yes, that seems to work - now. I think I had more code in there before
that prevented exposure without #ifdef guarding.

Cheers,
Andre.

 
 Kind regards,
 Pavel Fedin
 Expert Engineer
 Samsung Electronics Research center Russia
 
 
--
To unsubscribe from this list: send the line unsubscribe kvm in
the body of a message to majord...@vger.kernel.org
More majordomo info at  http://vger.kernel.org/majordomo-info.html

[PATCH v2] powerpc: add hvcall.h header from Linux

2015-06-18 Thread Andre Przywara

The powerpc code uses some PAPR hypercalls, of which we need the
hypercall number. Copy just the needed macro definitions from the
kernel's (private) hvcall.h file and remove the extra tricks formerly
used to be able to include this header file directly.

Signed-off-by: Andre Przywara andre.przyw...@arm.com
---
Hi,

this version of the header file just contains the definitions we
need, while still being easily diff-able against the original file.
Please consider applying this one.

Cheers,
Andre.

 powerpc/include/asm/hvcall.h | 33 +
 powerpc/spapr.h  |  3 ---
 2 files changed, 33 insertions(+), 3 deletions(-)
 create mode 100644 powerpc/include/asm/hvcall.h

diff --git a/powerpc/include/asm/hvcall.h b/powerpc/include/asm/hvcall.h
new file mode 100644
index 000..9d58f9b
--- /dev/null
+++ b/powerpc/include/asm/hvcall.h
@@ -0,0 +1,33 @@
+#ifndef _ASM_POWERPC_HVCALL_H
+#define _ASM_POWERPC_HVCALL_H
+
+/* This file is a trimmed-down version of arch/powerpc/include/asm/hvcall.h. */
+
+#define H_SUCCESS  0
+
+#define H_HARDWARE -1  /* Hardware error */
+#define H_FUNCTION -2  /* Function not supported */
+#define H_PRIVILEGE -3  /* Caller not privileged */
+#define H_PARAMETER -4  /* Parameter invalid, out-of-range or conflicting */
+
+#define H_SET_DABR 0x28
+#define H_LOGICAL_CI_LOAD  0x3c
+#define H_LOGICAL_CI_STORE 0x40
+#define H_LOGICAL_CACHE_LOAD   0x44
+#define H_LOGICAL_CACHE_STORE  0x48
+#define H_LOGICAL_ICBI 0x4c
+#define H_LOGICAL_DCBF 0x50
+
+#define H_GET_TERM_CHAR  0x54
+#define H_PUT_TERM_CHAR  0x58
+
+#define H_EOI  0x64
+#define H_CPPR 0x68
+#define H_IPI  0x6c
+#define H_IPOLL  0x70
+#define H_XIRR 0x74
+
+#define H_SET_MODE 0x31C
+#define MAX_HCALL_OPCODE   H_SET_MODE
+
+#endif /* _ASM_POWERPC_HVCALL_H */
diff --git a/powerpc/spapr.h b/powerpc/spapr.h
index 0537f88..4c6e349 100644
--- a/powerpc/spapr.h
+++ b/powerpc/spapr.h
@@ -16,10 +16,7 @@
 
 #include <inttypes.h>
 
-/* We need some of the H_ hcall defs, but they're __KERNEL__ only. */
-#define __KERNEL__
 #include <asm/hvcall.h>
-#undef __KERNEL__
 
 #include kvm/kvm.h
 #include kvm/kvm-cpu.h
-- 
2.3.5

--
To unsubscribe from this list: send the line unsubscribe kvm in
the body of a message to majord...@vger.kernel.org
More majordomo info at  http://vger.kernel.org/majordomo-info.html

[PATCH v2] powerpc: add hvcall.h header from Linux

2015-06-18 Thread Andre Przywara

The powerpc code uses some PAPR hypercalls, of which we need the
hypercall number. Copy just the needed macro definitions from the
kernel's (private) hvcall.h file and remove the extra tricks formerly
used to be able to include this header file directly.

Signed-off-by: Andre Przywara andre.przyw...@arm.com
---
Hi,

this version of the header file just contains the definitions we
need, while still being easily diff-able against the original file.
Please consider applying this one.

Cheers,
Andre.

 powerpc/include/asm/hvcall.h | 33 +
 powerpc/spapr.h  |  3 ---
 2 files changed, 33 insertions(+), 3 deletions(-)
 create mode 100644 powerpc/include/asm/hvcall.h

diff --git a/powerpc/include/asm/hvcall.h b/powerpc/include/asm/hvcall.h
new file mode 100644
index 000..9d58f9b
--- /dev/null
+++ b/powerpc/include/asm/hvcall.h
@@ -0,0 +1,33 @@
+#ifndef _ASM_POWERPC_HVCALL_H
+#define _ASM_POWERPC_HVCALL_H
+
+/* This file is a trimmed-down version of arch/powerpc/include/asm/hvcall.h. */
+
+#define H_SUCCESS  0
+
+#define H_HARDWARE -1  /* Hardware error */
+#define H_FUNCTION -2  /* Function not supported */
+#define H_PRIVILEGE -3  /* Caller not privileged */
+#define H_PARAMETER -4  /* Parameter invalid, out-of-range or conflicting */
+
+#define H_SET_DABR 0x28
+#define H_LOGICAL_CI_LOAD  0x3c
+#define H_LOGICAL_CI_STORE 0x40
+#define H_LOGICAL_CACHE_LOAD   0x44
+#define H_LOGICAL_CACHE_STORE  0x48
+#define H_LOGICAL_ICBI 0x4c
+#define H_LOGICAL_DCBF 0x50
+
+#define H_GET_TERM_CHAR  0x54
+#define H_PUT_TERM_CHAR  0x58
+
+#define H_EOI  0x64
+#define H_CPPR 0x68
+#define H_IPI  0x6c
+#define H_IPOLL  0x70
+#define H_XIRR 0x74
+
+#define H_SET_MODE 0x31C
+#define MAX_HCALL_OPCODE   H_SET_MODE
+
+#endif /* _ASM_POWERPC_HVCALL_H */
diff --git a/powerpc/spapr.h b/powerpc/spapr.h
index 0537f88..4c6e349 100644
--- a/powerpc/spapr.h
+++ b/powerpc/spapr.h
@@ -16,10 +16,7 @@
 
 #include <inttypes.h>
 
-/* We need some of the H_ hcall defs, but they're __KERNEL__ only. */
-#define __KERNEL__
 #include <asm/hvcall.h>
-#undef __KERNEL__
 
 #include kvm/kvm.h
 #include kvm/kvm-cpu.h
-- 
2.3.5

--
To unsubscribe from this list: send the line unsubscribe kvm-ppc in
the body of a message to majord...@vger.kernel.org
More majordomo info at  http://vger.kernel.org/majordomo-info.html

< 1 2 3 4 5 6 7 >

201 - 300 of 673 matches

Mail list logo