Message ID | 20180618063606.2513-6-david@gibson.dropbear.id.au |
---|---|
State | New |
Headers | show |
Series | spapr: Clean up pagesize handling | expand |
On 06/18/2018 08:36 AM, David Gibson wrote: > The way the POWER Hash Page Table (HPT) MMU is virtualized by KVM HV means > that every page that the guest puts in the pagetables must be truly > physically contiguous, not just GPA-contiguous. In effect this means that > an HPT guest can't use any pagesizes greater than the host page size used > to back its memory. > > At present we handle this by changing what we advertise to the guest based > on the backing pagesizes. This is pretty bad, because it means the guest > sees a different environment depending on what should be host configuration > details. > > As a start on fixing this, we add a new capability parameter to the pseries > machine type which gives the maximum allowed pagesizes for an HPT guest (as > a shift). For now we just create and validate the parameter without making > it do anything. > > For backwards compatibility, on older machine types we set it to the max > available page size for the host. For the 3.0 machine type, we fix it to > 16, the intention being to only allow HPT pagesizes up to 64kiB by default > in future. > > Signed-off-by: David Gibson <david@gibson.dropbear.id.au> > --- > hw/ppc/spapr.c | 12 +++++++++ > hw/ppc/spapr_caps.c | 56 ++++++++++++++++++++++++++++++++++++++++++ > include/hw/ppc/spapr.h | 4 ++- > 3 files changed, 71 insertions(+), 1 deletion(-) > > diff --git a/hw/ppc/spapr.c b/hw/ppc/spapr.c > index 40858d047c..74a76e7e09 100644 > --- a/hw/ppc/spapr.c > +++ b/hw/ppc/spapr.c > @@ -63,6 +63,7 @@ > #include "hw/virtio/vhost-scsi-common.h" > > #include "exec/address-spaces.h" > +#include "exec/ram_addr.h" > #include "hw/usb.h" > #include "qemu/config-file.h" > #include "qemu/error-report.h" > @@ -4043,6 +4044,7 @@ static void spapr_machine_class_init(ObjectClass *oc, void *data) > smc->default_caps.caps[SPAPR_CAP_CFPC] = SPAPR_CAP_BROKEN; > smc->default_caps.caps[SPAPR_CAP_SBBC] = SPAPR_CAP_BROKEN; > smc->default_caps.caps[SPAPR_CAP_IBS] = SPAPR_CAP_BROKEN; > + smc->default_caps.caps[SPAPR_CAP_HPT_MAXPAGESIZE] = 16; /* 64kiB */ > spapr_caps_add_properties(smc, &error_abort); > } > > @@ -4126,8 +4128,18 @@ static void spapr_machine_2_12_instance_options(MachineState *machine) > > static void spapr_machine_2_12_class_options(MachineClass *mc) > { > + sPAPRMachineClass *smc = SPAPR_MACHINE_CLASS(mc); > + uint8_t mps; > + > spapr_machine_3_0_class_options(mc); > SET_MACHINE_COMPAT(mc, SPAPR_COMPAT_2_12); > + > + if (kvmppc_hpt_needs_host_contiguous_pages()) { > + mps = ctz64(qemu_getrampagesize()); > + } else { > + mps = 34; /* allow everything up to 16GiB, i.e. everything */ > + } > + smc->default_caps.caps[SPAPR_CAP_HPT_MAXPAGESIZE] = mps; > } > > DEFINE_SPAPR_MACHINE(2_12, "2.12", false); > diff --git a/hw/ppc/spapr_caps.c b/hw/ppc/spapr_caps.c > index 68a4243efc..6cdc0c94e7 100644 > --- a/hw/ppc/spapr_caps.c > +++ b/hw/ppc/spapr_caps.c > @@ -27,6 +27,7 @@ > #include "qapi/visitor.h" > #include "sysemu/hw_accel.h" > #include "target/ppc/cpu.h" > +#include "target/ppc/mmu-hash64.h" > #include "cpu-models.h" > #include "kvm_ppc.h" > > @@ -144,6 +145,42 @@ out: > g_free(val); > } > > +static void spapr_cap_get_pagesize(Object *obj, Visitor *v, const char *name, > + void *opaque, Error **errp) > +{ > + sPAPRCapabilityInfo *cap = opaque; > + sPAPRMachineState *spapr = SPAPR_MACHINE(obj); > + uint8_t val = spapr_get_cap(spapr, cap->index); > + uint64_t pagesize = (1ULL << val); > + > + visit_type_size(v, name, &pagesize, errp); > +} > + > +static void spapr_cap_set_pagesize(Object *obj, Visitor *v, const char *name, > + void *opaque, Error **errp) > +{ > + sPAPRCapabilityInfo *cap = opaque; > + sPAPRMachineState *spapr = SPAPR_MACHINE(obj); > + uint64_t pagesize; > + uint8_t val; > + Error *local_err = NULL; > + > + visit_type_size(v, name, &pagesize, &local_err); > + if (local_err) { > + error_propagate(errp, local_err); > + return; > + } > + > + if (!is_power_of_2(pagesize)) { > + error_setg(errp, "cap-%s must be a power of 2", cap->name); > + return; > + } > + > + val = ctz64(pagesize); > + spapr->cmd_line_caps[cap->index] = true; > + spapr->eff.caps[cap->index] = val; > +} > + > static void cap_htm_apply(sPAPRMachineState *spapr, uint8_t val, Error **errp) > { > if (!val) { > @@ -267,6 +304,16 @@ static void cap_safe_indirect_branch_apply(sPAPRMachineState *spapr, > > #define VALUE_DESC_TRISTATE " (broken, workaround, fixed)" > > +static void cap_hpt_maxpagesize_apply(sPAPRMachineState *spapr, > + uint8_t val, Error **errp) > +{ > + if (val < 12) { > + error_setg(errp, "Require at least 4kiB hpt-max-page-size"); > + } else if (val < 16) { > + warn_report("Many guests require at least 64kiB hpt-max-page-size"); > + } > +} > + > sPAPRCapabilityInfo capability_table[SPAPR_CAP_NUM] = { > [SPAPR_CAP_HTM] = { > .name = "htm", > @@ -326,6 +373,15 @@ sPAPRCapabilityInfo capability_table[SPAPR_CAP_NUM] = { > .possible = &cap_ibs_possible, > .apply = cap_safe_indirect_branch_apply, > }, > + [SPAPR_CAP_HPT_MAXPAGESIZE] = { > + .name = "hpt-max-page-size", > + .description = "Maximum page size for Hash Page Table guests", > + .index = SPAPR_CAP_HPT_MAXPAGESIZE, > + .get = spapr_cap_get_pagesize, > + .set = spapr_cap_set_pagesize, > + .type = "int", > + .apply = cap_hpt_maxpagesize_apply, > + }, > }; Why not use a "PAGESHIFT" name instead ? and also simplify 'set_pagesize' by requiring a page shift and not a page size. C. > static sPAPRCapabilities default_caps_with_cpu(sPAPRMachineState *spapr, > diff --git a/include/hw/ppc/spapr.h b/include/hw/ppc/spapr.h > index 9dd46a72f6..c97593d032 100644 > --- a/include/hw/ppc/spapr.h > +++ b/include/hw/ppc/spapr.h > @@ -66,8 +66,10 @@ typedef enum { > #define SPAPR_CAP_SBBC 0x04 > /* Indirect Branch Serialisation */ > #define SPAPR_CAP_IBS 0x05 > +/* HPT Maximum Page Size (encoded as a shift) */ > +#define SPAPR_CAP_HPT_MAXPAGESIZE 0x06 > /* Num Caps */ > -#define SPAPR_CAP_NUM (SPAPR_CAP_IBS + 1) > +#define SPAPR_CAP_NUM (SPAPR_CAP_HPT_MAXPAGESIZE + 1) > > /* > * Capability Values >
On Tue, Jun 19, 2018 at 11:23:04AM +0200, Cédric Le Goater wrote: > On 06/18/2018 08:36 AM, David Gibson wrote: > > The way the POWER Hash Page Table (HPT) MMU is virtualized by KVM HV means > > that every page that the guest puts in the pagetables must be truly > > physically contiguous, not just GPA-contiguous. In effect this means that > > an HPT guest can't use any pagesizes greater than the host page size used > > to back its memory. > > > > At present we handle this by changing what we advertise to the guest based > > on the backing pagesizes. This is pretty bad, because it means the guest > > sees a different environment depending on what should be host configuration > > details. > > > > As a start on fixing this, we add a new capability parameter to the pseries > > machine type which gives the maximum allowed pagesizes for an HPT guest (as > > a shift). For now we just create and validate the parameter without making > > it do anything. > > > > For backwards compatibility, on older machine types we set it to the max > > available page size for the host. For the 3.0 machine type, we fix it to > > 16, the intention being to only allow HPT pagesizes up to 64kiB by default > > in future. > > > > Signed-off-by: David Gibson <david@gibson.dropbear.id.au> > > --- > > hw/ppc/spapr.c | 12 +++++++++ > > hw/ppc/spapr_caps.c | 56 ++++++++++++++++++++++++++++++++++++++++++ > > include/hw/ppc/spapr.h | 4 ++- > > 3 files changed, 71 insertions(+), 1 deletion(-) > > > > diff --git a/hw/ppc/spapr.c b/hw/ppc/spapr.c > > index 40858d047c..74a76e7e09 100644 > > --- a/hw/ppc/spapr.c > > +++ b/hw/ppc/spapr.c > > @@ -63,6 +63,7 @@ > > #include "hw/virtio/vhost-scsi-common.h" > > > > #include "exec/address-spaces.h" > > +#include "exec/ram_addr.h" > > #include "hw/usb.h" > > #include "qemu/config-file.h" > > #include "qemu/error-report.h" > > @@ -4043,6 +4044,7 @@ static void spapr_machine_class_init(ObjectClass *oc, void *data) > > smc->default_caps.caps[SPAPR_CAP_CFPC] = SPAPR_CAP_BROKEN; > > smc->default_caps.caps[SPAPR_CAP_SBBC] = SPAPR_CAP_BROKEN; > > smc->default_caps.caps[SPAPR_CAP_IBS] = SPAPR_CAP_BROKEN; > > + smc->default_caps.caps[SPAPR_CAP_HPT_MAXPAGESIZE] = 16; /* 64kiB */ > > spapr_caps_add_properties(smc, &error_abort); > > } > > > > @@ -4126,8 +4128,18 @@ static void spapr_machine_2_12_instance_options(MachineState *machine) > > > > static void spapr_machine_2_12_class_options(MachineClass *mc) > > { > > + sPAPRMachineClass *smc = SPAPR_MACHINE_CLASS(mc); > > + uint8_t mps; > > + > > spapr_machine_3_0_class_options(mc); > > SET_MACHINE_COMPAT(mc, SPAPR_COMPAT_2_12); > > + > > + if (kvmppc_hpt_needs_host_contiguous_pages()) { > > + mps = ctz64(qemu_getrampagesize()); > > + } else { > > + mps = 34; /* allow everything up to 16GiB, i.e. everything */ > > + } > > + smc->default_caps.caps[SPAPR_CAP_HPT_MAXPAGESIZE] = mps; > > } > > > > DEFINE_SPAPR_MACHINE(2_12, "2.12", false); > > diff --git a/hw/ppc/spapr_caps.c b/hw/ppc/spapr_caps.c > > index 68a4243efc..6cdc0c94e7 100644 > > --- a/hw/ppc/spapr_caps.c > > +++ b/hw/ppc/spapr_caps.c > > @@ -27,6 +27,7 @@ > > #include "qapi/visitor.h" > > #include "sysemu/hw_accel.h" > > #include "target/ppc/cpu.h" > > +#include "target/ppc/mmu-hash64.h" > > #include "cpu-models.h" > > #include "kvm_ppc.h" > > > > @@ -144,6 +145,42 @@ out: > > g_free(val); > > } > > > > +static void spapr_cap_get_pagesize(Object *obj, Visitor *v, const char *name, > > + void *opaque, Error **errp) > > +{ > > + sPAPRCapabilityInfo *cap = opaque; > > + sPAPRMachineState *spapr = SPAPR_MACHINE(obj); > > + uint8_t val = spapr_get_cap(spapr, cap->index); > > + uint64_t pagesize = (1ULL << val); > > + > > + visit_type_size(v, name, &pagesize, errp); > > +} > > + > > +static void spapr_cap_set_pagesize(Object *obj, Visitor *v, const char *name, > > + void *opaque, Error **errp) > > +{ > > + sPAPRCapabilityInfo *cap = opaque; > > + sPAPRMachineState *spapr = SPAPR_MACHINE(obj); > > + uint64_t pagesize; > > + uint8_t val; > > + Error *local_err = NULL; > > + > > + visit_type_size(v, name, &pagesize, &local_err); > > + if (local_err) { > > + error_propagate(errp, local_err); > > + return; > > + } > > + > > + if (!is_power_of_2(pagesize)) { > > + error_setg(errp, "cap-%s must be a power of 2", cap->name); > > + return; > > + } > > + > > + val = ctz64(pagesize); > > + spapr->cmd_line_caps[cap->index] = true; > > + spapr->eff.caps[cap->index] = val; > > +} > > + > > static void cap_htm_apply(sPAPRMachineState *spapr, uint8_t val, Error **errp) > > { > > if (!val) { > > @@ -267,6 +304,16 @@ static void cap_safe_indirect_branch_apply(sPAPRMachineState *spapr, > > > > #define VALUE_DESC_TRISTATE " (broken, workaround, fixed)" > > > > +static void cap_hpt_maxpagesize_apply(sPAPRMachineState *spapr, > > + uint8_t val, Error **errp) > > +{ > > + if (val < 12) { > > + error_setg(errp, "Require at least 4kiB hpt-max-page-size"); > > + } else if (val < 16) { > > + warn_report("Many guests require at least 64kiB hpt-max-page-size"); > > + } > > +} > > + > > sPAPRCapabilityInfo capability_table[SPAPR_CAP_NUM] = { > > [SPAPR_CAP_HTM] = { > > .name = "htm", > > @@ -326,6 +373,15 @@ sPAPRCapabilityInfo capability_table[SPAPR_CAP_NUM] = { > > .possible = &cap_ibs_possible, > > .apply = cap_safe_indirect_branch_apply, > > }, > > + [SPAPR_CAP_HPT_MAXPAGESIZE] = { > > + .name = "hpt-max-page-size", > > + .description = "Maximum page size for Hash Page Table guests", > > + .index = SPAPR_CAP_HPT_MAXPAGESIZE, > > + .get = spapr_cap_get_pagesize, > > + .set = spapr_cap_set_pagesize, > > + .type = "int", > > + .apply = cap_hpt_maxpagesize_apply, > > + }, > > }; > > Why not use a "PAGESHIFT" name instead ? and also simplify 'set_pagesize' > by requiring a page shift and not a page size. I had that in my previous version. Andrew suggested this was a friendlier interface, and on reflection, I agree. > > C. > > > > static sPAPRCapabilities default_caps_with_cpu(sPAPRMachineState *spapr, > > diff --git a/include/hw/ppc/spapr.h b/include/hw/ppc/spapr.h > > index 9dd46a72f6..c97593d032 100644 > > --- a/include/hw/ppc/spapr.h > > +++ b/include/hw/ppc/spapr.h > > @@ -66,8 +66,10 @@ typedef enum { > > #define SPAPR_CAP_SBBC 0x04 > > /* Indirect Branch Serialisation */ > > #define SPAPR_CAP_IBS 0x05 > > +/* HPT Maximum Page Size (encoded as a shift) */ > > +#define SPAPR_CAP_HPT_MAXPAGESIZE 0x06 > > /* Num Caps */ > > -#define SPAPR_CAP_NUM (SPAPR_CAP_IBS + 1) > > +#define SPAPR_CAP_NUM (SPAPR_CAP_HPT_MAXPAGESIZE + 1) > > > > /* > > * Capability Values > > >
On 06/18/2018 08:36 AM, David Gibson wrote: > The way the POWER Hash Page Table (HPT) MMU is virtualized by KVM HV means > that every page that the guest puts in the pagetables must be truly > physically contiguous, not just GPA-contiguous. In effect this means that > an HPT guest can't use any pagesizes greater than the host page size used > to back its memory. > > At present we handle this by changing what we advertise to the guest based > on the backing pagesizes. This is pretty bad, because it means the guest > sees a different environment depending on what should be host configuration > details. > > As a start on fixing this, we add a new capability parameter to the pseries > machine type which gives the maximum allowed pagesizes for an HPT guest (as > a shift). For now we just create and validate the parameter without making > it do anything. > > For backwards compatibility, on older machine types we set it to the max > available page size for the host. For the 3.0 machine type, we fix it to > 16, the intention being to only allow HPT pagesizes up to 64kiB by default > in future. Why not do it now ? I don't think the pseries machine supports 4k pages anyway. so you could change the warn_report() below in an error I think. > Signed-off-by: David Gibson <david@gibson.dropbear.id.au> Reviewed-by: Cédric Le Goater <clg@kaod.org> C. > --- > hw/ppc/spapr.c | 12 +++++++++ > hw/ppc/spapr_caps.c | 56 ++++++++++++++++++++++++++++++++++++++++++ > include/hw/ppc/spapr.h | 4 ++- > 3 files changed, 71 insertions(+), 1 deletion(-) > > diff --git a/hw/ppc/spapr.c b/hw/ppc/spapr.c > index 40858d047c..74a76e7e09 100644 > --- a/hw/ppc/spapr.c > +++ b/hw/ppc/spapr.c > @@ -63,6 +63,7 @@ > #include "hw/virtio/vhost-scsi-common.h" > > #include "exec/address-spaces.h" > +#include "exec/ram_addr.h" > #include "hw/usb.h" > #include "qemu/config-file.h" > #include "qemu/error-report.h" > @@ -4043,6 +4044,7 @@ static void spapr_machine_class_init(ObjectClass *oc, void *data) > smc->default_caps.caps[SPAPR_CAP_CFPC] = SPAPR_CAP_BROKEN; > smc->default_caps.caps[SPAPR_CAP_SBBC] = SPAPR_CAP_BROKEN; > smc->default_caps.caps[SPAPR_CAP_IBS] = SPAPR_CAP_BROKEN; > + smc->default_caps.caps[SPAPR_CAP_HPT_MAXPAGESIZE] = 16; /* 64kiB */ > spapr_caps_add_properties(smc, &error_abort); > } > > @@ -4126,8 +4128,18 @@ static void spapr_machine_2_12_instance_options(MachineState *machine) > > static void spapr_machine_2_12_class_options(MachineClass *mc) > { > + sPAPRMachineClass *smc = SPAPR_MACHINE_CLASS(mc); > + uint8_t mps; > + > spapr_machine_3_0_class_options(mc); > SET_MACHINE_COMPAT(mc, SPAPR_COMPAT_2_12); > + > + if (kvmppc_hpt_needs_host_contiguous_pages()) { > + mps = ctz64(qemu_getrampagesize()); > + } else { > + mps = 34; /* allow everything up to 16GiB, i.e. everything */ > + } > + smc->default_caps.caps[SPAPR_CAP_HPT_MAXPAGESIZE] = mps; > } > > DEFINE_SPAPR_MACHINE(2_12, "2.12", false); > diff --git a/hw/ppc/spapr_caps.c b/hw/ppc/spapr_caps.c > index 68a4243efc..6cdc0c94e7 100644 > --- a/hw/ppc/spapr_caps.c > +++ b/hw/ppc/spapr_caps.c > @@ -27,6 +27,7 @@ > #include "qapi/visitor.h" > #include "sysemu/hw_accel.h" > #include "target/ppc/cpu.h" > +#include "target/ppc/mmu-hash64.h" > #include "cpu-models.h" > #include "kvm_ppc.h" > > @@ -144,6 +145,42 @@ out: > g_free(val); > } > > +static void spapr_cap_get_pagesize(Object *obj, Visitor *v, const char *name, > + void *opaque, Error **errp) > +{ > + sPAPRCapabilityInfo *cap = opaque; > + sPAPRMachineState *spapr = SPAPR_MACHINE(obj); > + uint8_t val = spapr_get_cap(spapr, cap->index); > + uint64_t pagesize = (1ULL << val); > + > + visit_type_size(v, name, &pagesize, errp); > +} > + > +static void spapr_cap_set_pagesize(Object *obj, Visitor *v, const char *name, > + void *opaque, Error **errp) > +{ > + sPAPRCapabilityInfo *cap = opaque; > + sPAPRMachineState *spapr = SPAPR_MACHINE(obj); > + uint64_t pagesize; > + uint8_t val; > + Error *local_err = NULL; > + > + visit_type_size(v, name, &pagesize, &local_err); > + if (local_err) { > + error_propagate(errp, local_err); > + return; > + } > + > + if (!is_power_of_2(pagesize)) { > + error_setg(errp, "cap-%s must be a power of 2", cap->name); > + return; > + } > + > + val = ctz64(pagesize); > + spapr->cmd_line_caps[cap->index] = true; > + spapr->eff.caps[cap->index] = val; > +} > + > static void cap_htm_apply(sPAPRMachineState *spapr, uint8_t val, Error **errp) > { > if (!val) { > @@ -267,6 +304,16 @@ static void cap_safe_indirect_branch_apply(sPAPRMachineState *spapr, > > #define VALUE_DESC_TRISTATE " (broken, workaround, fixed)" > > +static void cap_hpt_maxpagesize_apply(sPAPRMachineState *spapr, > + uint8_t val, Error **errp) > +{ > + if (val < 12) { > + error_setg(errp, "Require at least 4kiB hpt-max-page-size"); > + } else if (val < 16) { > + warn_report("Many guests require at least 64kiB hpt-max-page-size"); > + } > +} > + > sPAPRCapabilityInfo capability_table[SPAPR_CAP_NUM] = { > [SPAPR_CAP_HTM] = { > .name = "htm", > @@ -326,6 +373,15 @@ sPAPRCapabilityInfo capability_table[SPAPR_CAP_NUM] = { > .possible = &cap_ibs_possible, > .apply = cap_safe_indirect_branch_apply, > }, > + [SPAPR_CAP_HPT_MAXPAGESIZE] = { > + .name = "hpt-max-page-size", > + .description = "Maximum page size for Hash Page Table guests", > + .index = SPAPR_CAP_HPT_MAXPAGESIZE, > + .get = spapr_cap_get_pagesize, > + .set = spapr_cap_set_pagesize, > + .type = "int", > + .apply = cap_hpt_maxpagesize_apply, > + }, > }; > > static sPAPRCapabilities default_caps_with_cpu(sPAPRMachineState *spapr, > diff --git a/include/hw/ppc/spapr.h b/include/hw/ppc/spapr.h > index 9dd46a72f6..c97593d032 100644 > --- a/include/hw/ppc/spapr.h > +++ b/include/hw/ppc/spapr.h > @@ -66,8 +66,10 @@ typedef enum { > #define SPAPR_CAP_SBBC 0x04 > /* Indirect Branch Serialisation */ > #define SPAPR_CAP_IBS 0x05 > +/* HPT Maximum Page Size (encoded as a shift) */ > +#define SPAPR_CAP_HPT_MAXPAGESIZE 0x06 > /* Num Caps */ > -#define SPAPR_CAP_NUM (SPAPR_CAP_IBS + 1) > +#define SPAPR_CAP_NUM (SPAPR_CAP_HPT_MAXPAGESIZE + 1) > > /* > * Capability Values >
On Mon, 18 Jun 2018 16:36:02 +1000 David Gibson <david@gibson.dropbear.id.au> wrote: > The way the POWER Hash Page Table (HPT) MMU is virtualized by KVM HV means > that every page that the guest puts in the pagetables must be truly > physically contiguous, not just GPA-contiguous. In effect this means that > an HPT guest can't use any pagesizes greater than the host page size used > to back its memory. > > At present we handle this by changing what we advertise to the guest based > on the backing pagesizes. This is pretty bad, because it means the guest > sees a different environment depending on what should be host configuration > details. > > As a start on fixing this, we add a new capability parameter to the pseries > machine type which gives the maximum allowed pagesizes for an HPT guest (as > a shift). Maybe you can mention that it is exposed to the user as a genuine pagesize, not a shift, because it is a friendlier interface. > For now we just create and validate the parameter without making > it do anything. > > For backwards compatibility, on older machine types we set it to the max > available page size for the host. For the 3.0 machine type, we fix it to > 16, the intention being to only allow HPT pagesizes up to 64kiB by default > in future. > > Signed-off-by: David Gibson <david@gibson.dropbear.id.au> > --- Reviewed-by: Greg Kurz <groug@kaod.org> > hw/ppc/spapr.c | 12 +++++++++ > hw/ppc/spapr_caps.c | 56 ++++++++++++++++++++++++++++++++++++++++++ > include/hw/ppc/spapr.h | 4 ++- > 3 files changed, 71 insertions(+), 1 deletion(-) > > diff --git a/hw/ppc/spapr.c b/hw/ppc/spapr.c > index 40858d047c..74a76e7e09 100644 > --- a/hw/ppc/spapr.c > +++ b/hw/ppc/spapr.c > @@ -63,6 +63,7 @@ > #include "hw/virtio/vhost-scsi-common.h" > > #include "exec/address-spaces.h" > +#include "exec/ram_addr.h" > #include "hw/usb.h" > #include "qemu/config-file.h" > #include "qemu/error-report.h" > @@ -4043,6 +4044,7 @@ static void spapr_machine_class_init(ObjectClass *oc, void *data) > smc->default_caps.caps[SPAPR_CAP_CFPC] = SPAPR_CAP_BROKEN; > smc->default_caps.caps[SPAPR_CAP_SBBC] = SPAPR_CAP_BROKEN; > smc->default_caps.caps[SPAPR_CAP_IBS] = SPAPR_CAP_BROKEN; > + smc->default_caps.caps[SPAPR_CAP_HPT_MAXPAGESIZE] = 16; /* 64kiB */ > spapr_caps_add_properties(smc, &error_abort); > } > > @@ -4126,8 +4128,18 @@ static void spapr_machine_2_12_instance_options(MachineState *machine) > > static void spapr_machine_2_12_class_options(MachineClass *mc) > { > + sPAPRMachineClass *smc = SPAPR_MACHINE_CLASS(mc); > + uint8_t mps; > + > spapr_machine_3_0_class_options(mc); > SET_MACHINE_COMPAT(mc, SPAPR_COMPAT_2_12); > + > + if (kvmppc_hpt_needs_host_contiguous_pages()) { > + mps = ctz64(qemu_getrampagesize()); > + } else { > + mps = 34; /* allow everything up to 16GiB, i.e. everything */ > + } > + smc->default_caps.caps[SPAPR_CAP_HPT_MAXPAGESIZE] = mps; > } > > DEFINE_SPAPR_MACHINE(2_12, "2.12", false); > diff --git a/hw/ppc/spapr_caps.c b/hw/ppc/spapr_caps.c > index 68a4243efc..6cdc0c94e7 100644 > --- a/hw/ppc/spapr_caps.c > +++ b/hw/ppc/spapr_caps.c > @@ -27,6 +27,7 @@ > #include "qapi/visitor.h" > #include "sysemu/hw_accel.h" > #include "target/ppc/cpu.h" > +#include "target/ppc/mmu-hash64.h" > #include "cpu-models.h" > #include "kvm_ppc.h" > > @@ -144,6 +145,42 @@ out: > g_free(val); > } > > +static void spapr_cap_get_pagesize(Object *obj, Visitor *v, const char *name, > + void *opaque, Error **errp) > +{ > + sPAPRCapabilityInfo *cap = opaque; > + sPAPRMachineState *spapr = SPAPR_MACHINE(obj); > + uint8_t val = spapr_get_cap(spapr, cap->index); > + uint64_t pagesize = (1ULL << val); > + > + visit_type_size(v, name, &pagesize, errp); > +} > + > +static void spapr_cap_set_pagesize(Object *obj, Visitor *v, const char *name, > + void *opaque, Error **errp) > +{ > + sPAPRCapabilityInfo *cap = opaque; > + sPAPRMachineState *spapr = SPAPR_MACHINE(obj); > + uint64_t pagesize; > + uint8_t val; > + Error *local_err = NULL; > + > + visit_type_size(v, name, &pagesize, &local_err); > + if (local_err) { > + error_propagate(errp, local_err); > + return; > + } > + > + if (!is_power_of_2(pagesize)) { > + error_setg(errp, "cap-%s must be a power of 2", cap->name); > + return; > + } > + > + val = ctz64(pagesize); > + spapr->cmd_line_caps[cap->index] = true; > + spapr->eff.caps[cap->index] = val; > +} > + > static void cap_htm_apply(sPAPRMachineState *spapr, uint8_t val, Error **errp) > { > if (!val) { > @@ -267,6 +304,16 @@ static void cap_safe_indirect_branch_apply(sPAPRMachineState *spapr, > > #define VALUE_DESC_TRISTATE " (broken, workaround, fixed)" > > +static void cap_hpt_maxpagesize_apply(sPAPRMachineState *spapr, > + uint8_t val, Error **errp) > +{ > + if (val < 12) { > + error_setg(errp, "Require at least 4kiB hpt-max-page-size"); > + } else if (val < 16) { > + warn_report("Many guests require at least 64kiB hpt-max-page-size"); > + } > +} > + > sPAPRCapabilityInfo capability_table[SPAPR_CAP_NUM] = { > [SPAPR_CAP_HTM] = { > .name = "htm", > @@ -326,6 +373,15 @@ sPAPRCapabilityInfo capability_table[SPAPR_CAP_NUM] = { > .possible = &cap_ibs_possible, > .apply = cap_safe_indirect_branch_apply, > }, > + [SPAPR_CAP_HPT_MAXPAGESIZE] = { > + .name = "hpt-max-page-size", > + .description = "Maximum page size for Hash Page Table guests", > + .index = SPAPR_CAP_HPT_MAXPAGESIZE, > + .get = spapr_cap_get_pagesize, > + .set = spapr_cap_set_pagesize, > + .type = "int", > + .apply = cap_hpt_maxpagesize_apply, > + }, > }; > > static sPAPRCapabilities default_caps_with_cpu(sPAPRMachineState *spapr, > diff --git a/include/hw/ppc/spapr.h b/include/hw/ppc/spapr.h > index 9dd46a72f6..c97593d032 100644 > --- a/include/hw/ppc/spapr.h > +++ b/include/hw/ppc/spapr.h > @@ -66,8 +66,10 @@ typedef enum { > #define SPAPR_CAP_SBBC 0x04 > /* Indirect Branch Serialisation */ > #define SPAPR_CAP_IBS 0x05 > +/* HPT Maximum Page Size (encoded as a shift) */ > +#define SPAPR_CAP_HPT_MAXPAGESIZE 0x06 > /* Num Caps */ > -#define SPAPR_CAP_NUM (SPAPR_CAP_IBS + 1) > +#define SPAPR_CAP_NUM (SPAPR_CAP_HPT_MAXPAGESIZE + 1) > > /* > * Capability Values
On Thu, Jun 21, 2018 at 08:22:15AM +0200, Cédric Le Goater wrote: > On 06/18/2018 08:36 AM, David Gibson wrote: > > The way the POWER Hash Page Table (HPT) MMU is virtualized by KVM HV means > > that every page that the guest puts in the pagetables must be truly > > physically contiguous, not just GPA-contiguous. In effect this means that > > an HPT guest can't use any pagesizes greater than the host page size used > > to back its memory. > > > > At present we handle this by changing what we advertise to the guest based > > on the backing pagesizes. This is pretty bad, because it means the guest > > sees a different environment depending on what should be host configuration > > details. > > > > As a start on fixing this, we add a new capability parameter to the pseries > > machine type which gives the maximum allowed pagesizes for an HPT guest (as > > a shift). For now we just create and validate the parameter without making > > it do anything. > > > > For backwards compatibility, on older machine types we set it to the max > > available page size for the host. For the 3.0 machine type, we fix it to > > 16, the intention being to only allow HPT pagesizes up to 64kiB by default > > in future. > > Why not do it now ? Uh.. do what now. Essentially this *is* doing it now, except that we don't have the mechanism to actually enforce it until a couple of patches further in. > I don't think the pseries machine supports 4k pages > anyway. so you could change the warn_report() below in an error I think. Uh.. I think pseries does technically still support 4k pages. Although it might not have been much tested recently, since none of the distros configure it that way. > > Signed-off-by: David Gibson <david@gibson.dropbear.id.au> > > Reviewed-by: Cédric Le Goater <clg@kaod.org> > > C. > > > --- > > hw/ppc/spapr.c | 12 +++++++++ > > hw/ppc/spapr_caps.c | 56 ++++++++++++++++++++++++++++++++++++++++++ > > include/hw/ppc/spapr.h | 4 ++- > > 3 files changed, 71 insertions(+), 1 deletion(-) > > > > diff --git a/hw/ppc/spapr.c b/hw/ppc/spapr.c > > index 40858d047c..74a76e7e09 100644 > > --- a/hw/ppc/spapr.c > > +++ b/hw/ppc/spapr.c > > @@ -63,6 +63,7 @@ > > #include "hw/virtio/vhost-scsi-common.h" > > > > #include "exec/address-spaces.h" > > +#include "exec/ram_addr.h" > > #include "hw/usb.h" > > #include "qemu/config-file.h" > > #include "qemu/error-report.h" > > @@ -4043,6 +4044,7 @@ static void spapr_machine_class_init(ObjectClass *oc, void *data) > > smc->default_caps.caps[SPAPR_CAP_CFPC] = SPAPR_CAP_BROKEN; > > smc->default_caps.caps[SPAPR_CAP_SBBC] = SPAPR_CAP_BROKEN; > > smc->default_caps.caps[SPAPR_CAP_IBS] = SPAPR_CAP_BROKEN; > > + smc->default_caps.caps[SPAPR_CAP_HPT_MAXPAGESIZE] = 16; /* 64kiB */ > > spapr_caps_add_properties(smc, &error_abort); > > } > > > > @@ -4126,8 +4128,18 @@ static void spapr_machine_2_12_instance_options(MachineState *machine) > > > > static void spapr_machine_2_12_class_options(MachineClass *mc) > > { > > + sPAPRMachineClass *smc = SPAPR_MACHINE_CLASS(mc); > > + uint8_t mps; > > + > > spapr_machine_3_0_class_options(mc); > > SET_MACHINE_COMPAT(mc, SPAPR_COMPAT_2_12); > > + > > + if (kvmppc_hpt_needs_host_contiguous_pages()) { > > + mps = ctz64(qemu_getrampagesize()); > > + } else { > > + mps = 34; /* allow everything up to 16GiB, i.e. everything */ > > + } > > + smc->default_caps.caps[SPAPR_CAP_HPT_MAXPAGESIZE] = mps; > > } > > > > DEFINE_SPAPR_MACHINE(2_12, "2.12", false); > > diff --git a/hw/ppc/spapr_caps.c b/hw/ppc/spapr_caps.c > > index 68a4243efc..6cdc0c94e7 100644 > > --- a/hw/ppc/spapr_caps.c > > +++ b/hw/ppc/spapr_caps.c > > @@ -27,6 +27,7 @@ > > #include "qapi/visitor.h" > > #include "sysemu/hw_accel.h" > > #include "target/ppc/cpu.h" > > +#include "target/ppc/mmu-hash64.h" > > #include "cpu-models.h" > > #include "kvm_ppc.h" > > > > @@ -144,6 +145,42 @@ out: > > g_free(val); > > } > > > > +static void spapr_cap_get_pagesize(Object *obj, Visitor *v, const char *name, > > + void *opaque, Error **errp) > > +{ > > + sPAPRCapabilityInfo *cap = opaque; > > + sPAPRMachineState *spapr = SPAPR_MACHINE(obj); > > + uint8_t val = spapr_get_cap(spapr, cap->index); > > + uint64_t pagesize = (1ULL << val); > > + > > + visit_type_size(v, name, &pagesize, errp); > > +} > > + > > +static void spapr_cap_set_pagesize(Object *obj, Visitor *v, const char *name, > > + void *opaque, Error **errp) > > +{ > > + sPAPRCapabilityInfo *cap = opaque; > > + sPAPRMachineState *spapr = SPAPR_MACHINE(obj); > > + uint64_t pagesize; > > + uint8_t val; > > + Error *local_err = NULL; > > + > > + visit_type_size(v, name, &pagesize, &local_err); > > + if (local_err) { > > + error_propagate(errp, local_err); > > + return; > > + } > > + > > + if (!is_power_of_2(pagesize)) { > > + error_setg(errp, "cap-%s must be a power of 2", cap->name); > > + return; > > + } > > + > > + val = ctz64(pagesize); > > + spapr->cmd_line_caps[cap->index] = true; > > + spapr->eff.caps[cap->index] = val; > > +} > > + > > static void cap_htm_apply(sPAPRMachineState *spapr, uint8_t val, Error **errp) > > { > > if (!val) { > > @@ -267,6 +304,16 @@ static void cap_safe_indirect_branch_apply(sPAPRMachineState *spapr, > > > > #define VALUE_DESC_TRISTATE " (broken, workaround, fixed)" > > > > +static void cap_hpt_maxpagesize_apply(sPAPRMachineState *spapr, > > + uint8_t val, Error **errp) > > +{ > > + if (val < 12) { > > + error_setg(errp, "Require at least 4kiB hpt-max-page-size"); > > + } else if (val < 16) { > > + warn_report("Many guests require at least 64kiB hpt-max-page-size"); > > + } > > +} > > + > > sPAPRCapabilityInfo capability_table[SPAPR_CAP_NUM] = { > > [SPAPR_CAP_HTM] = { > > .name = "htm", > > @@ -326,6 +373,15 @@ sPAPRCapabilityInfo capability_table[SPAPR_CAP_NUM] = { > > .possible = &cap_ibs_possible, > > .apply = cap_safe_indirect_branch_apply, > > }, > > + [SPAPR_CAP_HPT_MAXPAGESIZE] = { > > + .name = "hpt-max-page-size", > > + .description = "Maximum page size for Hash Page Table guests", > > + .index = SPAPR_CAP_HPT_MAXPAGESIZE, > > + .get = spapr_cap_get_pagesize, > > + .set = spapr_cap_set_pagesize, > > + .type = "int", > > + .apply = cap_hpt_maxpagesize_apply, > > + }, > > }; > > > > static sPAPRCapabilities default_caps_with_cpu(sPAPRMachineState *spapr, > > diff --git a/include/hw/ppc/spapr.h b/include/hw/ppc/spapr.h > > index 9dd46a72f6..c97593d032 100644 > > --- a/include/hw/ppc/spapr.h > > +++ b/include/hw/ppc/spapr.h > > @@ -66,8 +66,10 @@ typedef enum { > > #define SPAPR_CAP_SBBC 0x04 > > /* Indirect Branch Serialisation */ > > #define SPAPR_CAP_IBS 0x05 > > +/* HPT Maximum Page Size (encoded as a shift) */ > > +#define SPAPR_CAP_HPT_MAXPAGESIZE 0x06 > > /* Num Caps */ > > -#define SPAPR_CAP_NUM (SPAPR_CAP_IBS + 1) > > +#define SPAPR_CAP_NUM (SPAPR_CAP_HPT_MAXPAGESIZE + 1) > > > > /* > > * Capability Values > > >
On Thu, Jun 21, 2018 at 11:19:41AM +0200, Greg Kurz wrote: > On Mon, 18 Jun 2018 16:36:02 +1000 > David Gibson <david@gibson.dropbear.id.au> wrote: > > > The way the POWER Hash Page Table (HPT) MMU is virtualized by KVM HV means > > that every page that the guest puts in the pagetables must be truly > > physically contiguous, not just GPA-contiguous. In effect this means that > > an HPT guest can't use any pagesizes greater than the host page size used > > to back its memory. > > > > At present we handle this by changing what we advertise to the guest based > > on the backing pagesizes. This is pretty bad, because it means the guest > > sees a different environment depending on what should be host configuration > > details. > > > > As a start on fixing this, we add a new capability parameter to the pseries > > machine type which gives the maximum allowed pagesizes for an HPT guest (as > > a shift). > > Maybe you can mention that it is exposed to the user as a genuine pagesize, > not a shift, because it is a friendlier interface. Oops, I fixed most of the shift references in the commit messages, but missed this one. I removed the "as a shift" text. > > For now we just create and validate the parameter without making > > it do anything. > > > > For backwards compatibility, on older machine types we set it to the max > > available page size for the host. For the 3.0 machine type, we fix it to > > 16, the intention being to only allow HPT pagesizes up to 64kiB by default > > in future. > > > > Signed-off-by: David Gibson <david@gibson.dropbear.id.au> > > --- > > Reviewed-by: Greg Kurz <groug@kaod.org> > > > hw/ppc/spapr.c | 12 +++++++++ > > hw/ppc/spapr_caps.c | 56 ++++++++++++++++++++++++++++++++++++++++++ > > include/hw/ppc/spapr.h | 4 ++- > > 3 files changed, 71 insertions(+), 1 deletion(-) > > > > diff --git a/hw/ppc/spapr.c b/hw/ppc/spapr.c > > index 40858d047c..74a76e7e09 100644 > > --- a/hw/ppc/spapr.c > > +++ b/hw/ppc/spapr.c > > @@ -63,6 +63,7 @@ > > #include "hw/virtio/vhost-scsi-common.h" > > > > #include "exec/address-spaces.h" > > +#include "exec/ram_addr.h" > > #include "hw/usb.h" > > #include "qemu/config-file.h" > > #include "qemu/error-report.h" > > @@ -4043,6 +4044,7 @@ static void spapr_machine_class_init(ObjectClass *oc, void *data) > > smc->default_caps.caps[SPAPR_CAP_CFPC] = SPAPR_CAP_BROKEN; > > smc->default_caps.caps[SPAPR_CAP_SBBC] = SPAPR_CAP_BROKEN; > > smc->default_caps.caps[SPAPR_CAP_IBS] = SPAPR_CAP_BROKEN; > > + smc->default_caps.caps[SPAPR_CAP_HPT_MAXPAGESIZE] = 16; /* 64kiB */ > > spapr_caps_add_properties(smc, &error_abort); > > } > > > > @@ -4126,8 +4128,18 @@ static void spapr_machine_2_12_instance_options(MachineState *machine) > > > > static void spapr_machine_2_12_class_options(MachineClass *mc) > > { > > + sPAPRMachineClass *smc = SPAPR_MACHINE_CLASS(mc); > > + uint8_t mps; > > + > > spapr_machine_3_0_class_options(mc); > > SET_MACHINE_COMPAT(mc, SPAPR_COMPAT_2_12); > > + > > + if (kvmppc_hpt_needs_host_contiguous_pages()) { > > + mps = ctz64(qemu_getrampagesize()); > > + } else { > > + mps = 34; /* allow everything up to 16GiB, i.e. everything */ > > + } > > + smc->default_caps.caps[SPAPR_CAP_HPT_MAXPAGESIZE] = mps; > > } > > > > DEFINE_SPAPR_MACHINE(2_12, "2.12", false); > > diff --git a/hw/ppc/spapr_caps.c b/hw/ppc/spapr_caps.c > > index 68a4243efc..6cdc0c94e7 100644 > > --- a/hw/ppc/spapr_caps.c > > +++ b/hw/ppc/spapr_caps.c > > @@ -27,6 +27,7 @@ > > #include "qapi/visitor.h" > > #include "sysemu/hw_accel.h" > > #include "target/ppc/cpu.h" > > +#include "target/ppc/mmu-hash64.h" > > #include "cpu-models.h" > > #include "kvm_ppc.h" > > > > @@ -144,6 +145,42 @@ out: > > g_free(val); > > } > > > > +static void spapr_cap_get_pagesize(Object *obj, Visitor *v, const char *name, > > + void *opaque, Error **errp) > > +{ > > + sPAPRCapabilityInfo *cap = opaque; > > + sPAPRMachineState *spapr = SPAPR_MACHINE(obj); > > + uint8_t val = spapr_get_cap(spapr, cap->index); > > + uint64_t pagesize = (1ULL << val); > > + > > + visit_type_size(v, name, &pagesize, errp); > > +} > > + > > +static void spapr_cap_set_pagesize(Object *obj, Visitor *v, const char *name, > > + void *opaque, Error **errp) > > +{ > > + sPAPRCapabilityInfo *cap = opaque; > > + sPAPRMachineState *spapr = SPAPR_MACHINE(obj); > > + uint64_t pagesize; > > + uint8_t val; > > + Error *local_err = NULL; > > + > > + visit_type_size(v, name, &pagesize, &local_err); > > + if (local_err) { > > + error_propagate(errp, local_err); > > + return; > > + } > > + > > + if (!is_power_of_2(pagesize)) { > > + error_setg(errp, "cap-%s must be a power of 2", cap->name); > > + return; > > + } > > + > > + val = ctz64(pagesize); > > + spapr->cmd_line_caps[cap->index] = true; > > + spapr->eff.caps[cap->index] = val; > > +} > > + > > static void cap_htm_apply(sPAPRMachineState *spapr, uint8_t val, Error **errp) > > { > > if (!val) { > > @@ -267,6 +304,16 @@ static void cap_safe_indirect_branch_apply(sPAPRMachineState *spapr, > > > > #define VALUE_DESC_TRISTATE " (broken, workaround, fixed)" > > > > +static void cap_hpt_maxpagesize_apply(sPAPRMachineState *spapr, > > + uint8_t val, Error **errp) > > +{ > > + if (val < 12) { > > + error_setg(errp, "Require at least 4kiB hpt-max-page-size"); > > + } else if (val < 16) { > > + warn_report("Many guests require at least 64kiB hpt-max-page-size"); > > + } > > +} > > + > > sPAPRCapabilityInfo capability_table[SPAPR_CAP_NUM] = { > > [SPAPR_CAP_HTM] = { > > .name = "htm", > > @@ -326,6 +373,15 @@ sPAPRCapabilityInfo capability_table[SPAPR_CAP_NUM] = { > > .possible = &cap_ibs_possible, > > .apply = cap_safe_indirect_branch_apply, > > }, > > + [SPAPR_CAP_HPT_MAXPAGESIZE] = { > > + .name = "hpt-max-page-size", > > + .description = "Maximum page size for Hash Page Table guests", > > + .index = SPAPR_CAP_HPT_MAXPAGESIZE, > > + .get = spapr_cap_get_pagesize, > > + .set = spapr_cap_set_pagesize, > > + .type = "int", > > + .apply = cap_hpt_maxpagesize_apply, > > + }, > > }; > > > > static sPAPRCapabilities default_caps_with_cpu(sPAPRMachineState *spapr, > > diff --git a/include/hw/ppc/spapr.h b/include/hw/ppc/spapr.h > > index 9dd46a72f6..c97593d032 100644 > > --- a/include/hw/ppc/spapr.h > > +++ b/include/hw/ppc/spapr.h > > @@ -66,8 +66,10 @@ typedef enum { > > #define SPAPR_CAP_SBBC 0x04 > > /* Indirect Branch Serialisation */ > > #define SPAPR_CAP_IBS 0x05 > > +/* HPT Maximum Page Size (encoded as a shift) */ > > +#define SPAPR_CAP_HPT_MAXPAGESIZE 0x06 > > /* Num Caps */ > > -#define SPAPR_CAP_NUM (SPAPR_CAP_IBS + 1) > > +#define SPAPR_CAP_NUM (SPAPR_CAP_HPT_MAXPAGESIZE + 1) > > > > /* > > * Capability Values >
diff --git a/hw/ppc/spapr.c b/hw/ppc/spapr.c index 40858d047c..74a76e7e09 100644 --- a/hw/ppc/spapr.c +++ b/hw/ppc/spapr.c @@ -63,6 +63,7 @@ #include "hw/virtio/vhost-scsi-common.h" #include "exec/address-spaces.h" +#include "exec/ram_addr.h" #include "hw/usb.h" #include "qemu/config-file.h" #include "qemu/error-report.h" @@ -4043,6 +4044,7 @@ static void spapr_machine_class_init(ObjectClass *oc, void *data) smc->default_caps.caps[SPAPR_CAP_CFPC] = SPAPR_CAP_BROKEN; smc->default_caps.caps[SPAPR_CAP_SBBC] = SPAPR_CAP_BROKEN; smc->default_caps.caps[SPAPR_CAP_IBS] = SPAPR_CAP_BROKEN; + smc->default_caps.caps[SPAPR_CAP_HPT_MAXPAGESIZE] = 16; /* 64kiB */ spapr_caps_add_properties(smc, &error_abort); } @@ -4126,8 +4128,18 @@ static void spapr_machine_2_12_instance_options(MachineState *machine) static void spapr_machine_2_12_class_options(MachineClass *mc) { + sPAPRMachineClass *smc = SPAPR_MACHINE_CLASS(mc); + uint8_t mps; + spapr_machine_3_0_class_options(mc); SET_MACHINE_COMPAT(mc, SPAPR_COMPAT_2_12); + + if (kvmppc_hpt_needs_host_contiguous_pages()) { + mps = ctz64(qemu_getrampagesize()); + } else { + mps = 34; /* allow everything up to 16GiB, i.e. everything */ + } + smc->default_caps.caps[SPAPR_CAP_HPT_MAXPAGESIZE] = mps; } DEFINE_SPAPR_MACHINE(2_12, "2.12", false); diff --git a/hw/ppc/spapr_caps.c b/hw/ppc/spapr_caps.c index 68a4243efc..6cdc0c94e7 100644 --- a/hw/ppc/spapr_caps.c +++ b/hw/ppc/spapr_caps.c @@ -27,6 +27,7 @@ #include "qapi/visitor.h" #include "sysemu/hw_accel.h" #include "target/ppc/cpu.h" +#include "target/ppc/mmu-hash64.h" #include "cpu-models.h" #include "kvm_ppc.h" @@ -144,6 +145,42 @@ out: g_free(val); } +static void spapr_cap_get_pagesize(Object *obj, Visitor *v, const char *name, + void *opaque, Error **errp) +{ + sPAPRCapabilityInfo *cap = opaque; + sPAPRMachineState *spapr = SPAPR_MACHINE(obj); + uint8_t val = spapr_get_cap(spapr, cap->index); + uint64_t pagesize = (1ULL << val); + + visit_type_size(v, name, &pagesize, errp); +} + +static void spapr_cap_set_pagesize(Object *obj, Visitor *v, const char *name, + void *opaque, Error **errp) +{ + sPAPRCapabilityInfo *cap = opaque; + sPAPRMachineState *spapr = SPAPR_MACHINE(obj); + uint64_t pagesize; + uint8_t val; + Error *local_err = NULL; + + visit_type_size(v, name, &pagesize, &local_err); + if (local_err) { + error_propagate(errp, local_err); + return; + } + + if (!is_power_of_2(pagesize)) { + error_setg(errp, "cap-%s must be a power of 2", cap->name); + return; + } + + val = ctz64(pagesize); + spapr->cmd_line_caps[cap->index] = true; + spapr->eff.caps[cap->index] = val; +} + static void cap_htm_apply(sPAPRMachineState *spapr, uint8_t val, Error **errp) { if (!val) { @@ -267,6 +304,16 @@ static void cap_safe_indirect_branch_apply(sPAPRMachineState *spapr, #define VALUE_DESC_TRISTATE " (broken, workaround, fixed)" +static void cap_hpt_maxpagesize_apply(sPAPRMachineState *spapr, + uint8_t val, Error **errp) +{ + if (val < 12) { + error_setg(errp, "Require at least 4kiB hpt-max-page-size"); + } else if (val < 16) { + warn_report("Many guests require at least 64kiB hpt-max-page-size"); + } +} + sPAPRCapabilityInfo capability_table[SPAPR_CAP_NUM] = { [SPAPR_CAP_HTM] = { .name = "htm", @@ -326,6 +373,15 @@ sPAPRCapabilityInfo capability_table[SPAPR_CAP_NUM] = { .possible = &cap_ibs_possible, .apply = cap_safe_indirect_branch_apply, }, + [SPAPR_CAP_HPT_MAXPAGESIZE] = { + .name = "hpt-max-page-size", + .description = "Maximum page size for Hash Page Table guests", + .index = SPAPR_CAP_HPT_MAXPAGESIZE, + .get = spapr_cap_get_pagesize, + .set = spapr_cap_set_pagesize, + .type = "int", + .apply = cap_hpt_maxpagesize_apply, + }, }; static sPAPRCapabilities default_caps_with_cpu(sPAPRMachineState *spapr, diff --git a/include/hw/ppc/spapr.h b/include/hw/ppc/spapr.h index 9dd46a72f6..c97593d032 100644 --- a/include/hw/ppc/spapr.h +++ b/include/hw/ppc/spapr.h @@ -66,8 +66,10 @@ typedef enum { #define SPAPR_CAP_SBBC 0x04 /* Indirect Branch Serialisation */ #define SPAPR_CAP_IBS 0x05 +/* HPT Maximum Page Size (encoded as a shift) */ +#define SPAPR_CAP_HPT_MAXPAGESIZE 0x06 /* Num Caps */ -#define SPAPR_CAP_NUM (SPAPR_CAP_IBS + 1) +#define SPAPR_CAP_NUM (SPAPR_CAP_HPT_MAXPAGESIZE + 1) /* * Capability Values
The way the POWER Hash Page Table (HPT) MMU is virtualized by KVM HV means that every page that the guest puts in the pagetables must be truly physically contiguous, not just GPA-contiguous. In effect this means that an HPT guest can't use any pagesizes greater than the host page size used to back its memory. At present we handle this by changing what we advertise to the guest based on the backing pagesizes. This is pretty bad, because it means the guest sees a different environment depending on what should be host configuration details. As a start on fixing this, we add a new capability parameter to the pseries machine type which gives the maximum allowed pagesizes for an HPT guest (as a shift). For now we just create and validate the parameter without making it do anything. For backwards compatibility, on older machine types we set it to the max available page size for the host. For the 3.0 machine type, we fix it to 16, the intention being to only allow HPT pagesizes up to 64kiB by default in future. Signed-off-by: David Gibson <david@gibson.dropbear.id.au> --- hw/ppc/spapr.c | 12 +++++++++ hw/ppc/spapr_caps.c | 56 ++++++++++++++++++++++++++++++++++++++++++ include/hw/ppc/spapr.h | 4 ++- 3 files changed, 71 insertions(+), 1 deletion(-)