On Wed, Dec 14, 2016 at 04:22:19PM +1100, Suraj Jitindar Singh wrote: > On Mon, 2016-12-12 at 15:06 +1100, David Gibson wrote: > > This introduces stub implementations of the H_RESIZE_HPT_PREPARE and > > H_RESIZE_HPT_COMMIT hypercalls which we hope to add in a PAPR > > extension to allow run time resizing of a guest's hash page > > table. It > > also adds a new machine property for controlling whether this new > > facility is available, and logic to check that against availability > > with KVM (only supported with KVM PR for now). > > > > Finally, it adds a new string to the hypertas property in the device > > tree, advertising to the guest the availability of the HPT resizing > > hypercalls. This is a tentative suggested value, and would need to > > be > > standardized by PAPR before being merged. > > > > Signed-off-by: David Gibson <da...@gibson.dropbear.id.au> > > --- > > hw/ppc/spapr.c | 75 > > ++++++++++++++++++++++++++++++++++++++++++++++++++ > > hw/ppc/spapr_hcall.c | 36 ++++++++++++++++++++++++ > > hw/ppc/trace-events | 2 ++ > > include/hw/ppc/spapr.h | 11 ++++++++ > > target-ppc/kvm.c | 25 +++++++++++++++++ > > target-ppc/kvm_ppc.h | 5 ++++ > > 6 files changed, 154 insertions(+) > > > > diff --git a/hw/ppc/spapr.c b/hw/ppc/spapr.c > > index 0f25e83..846ce51 100644 > > --- a/hw/ppc/spapr.c > > +++ b/hw/ppc/spapr.c > > @@ -760,6 +760,11 @@ static void spapr_dt_rtas(sPAPRMachineState > > *spapr, void *fdt) > > if (!kvm_enabled() || kvmppc_spapr_use_multitce()) { > > add_str(hypertas, "hcall-multi-tce"); > > } > > + > > + if (spapr->resize_hpt != SPAPR_RESIZE_HPT_DISABLED) { > > + add_str(hypertas, "hcall-hpt-resize"); > > + } > > + > > _FDT(fdt_setprop(fdt, rtas, "ibm,hypertas-functions", > > hypertas->str, hypertas->len)); > > g_string_free(hypertas, TRUE); > > @@ -1839,11 +1844,40 @@ static void ppc_spapr_init(MachineState > > *machine) > > long load_limit, fw_size; > > char *filename; > > int smt = kvmppc_smt_threads(); > > + Error *resize_hpt_err = NULL; > > > > msi_nonbroken = true; > > > > QLIST_INIT(&spapr->phbs); > > > > + /* Check HPT resizing availability */ > > + kvmppc_check_papr_resize_hpt(&resize_hpt_err); > > + if (spapr->resize_hpt == SPAPR_RESIZE_HPT_DEFAULT) { > > + /* > > + * If the user explicitly requested a mode we should either > > + * supply it, or fail completely (which we do below). But > > if > > + * it's not set explicitly, we reset our mode to something > > + * that works > > + */ > > + if (resize_hpt_err) { > > + spapr->resize_hpt = SPAPR_RESIZE_HPT_DISABLED; > > + error_free(resize_hpt_err); > > + resize_hpt_err = NULL; > > + } else { > > + spapr->resize_hpt = smc->resize_hpt_default; > > + } > > + } > > + > > + assert(spapr->resize_hpt != SPAPR_RESIZE_HPT_DEFAULT); > > + > > + if ((spapr->resize_hpt != SPAPR_RESIZE_HPT_DISABLED) && > > resize_hpt_err) { > > + /* > > + * User requested HPT resize, but this host can't supply > > it. Bail out > > + */ > > + error_report_err(resize_hpt_err); > > + exit(1); > > + } > > + > > /* Allocate RMA if necessary */ > > rma_alloc_size = kvmppc_alloc_rma(&rma); > > > > @@ -2236,6 +2270,40 @@ static void > > spapr_set_modern_hotplug_events(Object *obj, bool value, > > spapr->use_hotplug_event_source = value; > > } > > > > +static char *spapr_get_resize_hpt(Object *obj, Error **errp) > > +{ > > + sPAPRMachineState *spapr = SPAPR_MACHINE(obj); > > + > > + switch (spapr->resize_hpt) { > > + case SPAPR_RESIZE_HPT_DEFAULT: > > + return g_strdup("default"); > > + case SPAPR_RESIZE_HPT_DISABLED: > > + return g_strdup("disabled"); > > + case SPAPR_RESIZE_HPT_ENABLED: > > + return g_strdup("enabled"); > > + case SPAPR_RESIZE_HPT_REQUIRED: > > + return g_strdup("required"); > > + } > > + assert(0); > > +} > > + > > +static void spapr_set_resize_hpt(Object *obj, const char *value, > > Error **errp) > > +{ > > + sPAPRMachineState *spapr = SPAPR_MACHINE(obj); > > + > > + if (strcmp(value, "default") == 0) { > > + spapr->resize_hpt = SPAPR_RESIZE_HPT_DEFAULT; > > + } else if (strcmp(value, "disabled") == 0) { > > + spapr->resize_hpt = SPAPR_RESIZE_HPT_DISABLED; > > + } else if (strcmp(value, "enabled") == 0) { > > + spapr->resize_hpt = SPAPR_RESIZE_HPT_ENABLED; > > + } else if (strcmp(value, "required") == 0) { > > + spapr->resize_hpt = SPAPR_RESIZE_HPT_REQUIRED; > > + } else { > > + error_setg(errp, "Bad value for \"resize-hpt\" property"); > > + } > > +} > > + > > static void spapr_machine_initfn(Object *obj) > > { > > sPAPRMachineState *spapr = SPAPR_MACHINE(obj); > > @@ -2256,6 +2324,12 @@ static void spapr_machine_initfn(Object *obj) > > " place of standard EPOW events > > when possible" > > " (required for memory hot- > > unplug support)", > > NULL); > > + > > + object_property_add_str(obj, "resize-hpt", > > + spapr_get_resize_hpt, > > spapr_set_resize_hpt, NULL); > > + object_property_set_description(obj, "resize-hpt", > > + "Resizing of the Hash Page Table > > (enabled, disabled, required)", > > + NULL); > > } > > > > static void spapr_machine_finalizefn(Object *obj) > > @@ -2707,6 +2781,7 @@ static void > > spapr_machine_class_init(ObjectClass *oc, void *data) > > > > smc->dr_lmb_enabled = true; > > smc->tcg_default_cpu = "POWER8"; > > + smc->resize_hpt_default = SPAPR_RESIZE_HPT_DISABLED; > > mc->query_hotpluggable_cpus = spapr_query_hotpluggable_cpus; > > fwc->get_dev_path = spapr_get_fw_dev_path; > > nc->nmi_monitor_handler = spapr_nmi; > > diff --git a/hw/ppc/spapr_hcall.c b/hw/ppc/spapr_hcall.c > > index fd9f1d4..72a9c4d 100644 > > --- a/hw/ppc/spapr_hcall.c > > +++ b/hw/ppc/spapr_hcall.c > > @@ -355,6 +355,38 @@ static target_ulong h_read(PowerPCCPU *cpu, > > sPAPRMachineState *spapr, > > return H_SUCCESS; > > } > > > > +static target_ulong h_resize_hpt_prepare(PowerPCCPU *cpu, > > + sPAPRMachineState *spapr, > > + target_ulong opcode, > > + target_ulong *args) > > +{ > > + target_ulong flags = args[0]; > > + target_ulong shift = args[1]; > > + > > + if (spapr->resize_hpt == SPAPR_RESIZE_HPT_DISABLED) { > > + return H_AUTHORITY; > > + } > > + > > + trace_spapr_h_resize_hpt_prepare(flags, shift); > > + return H_HARDWARE; > > +} > > + > > +static target_ulong h_resize_hpt_commit(PowerPCCPU *cpu, > > + sPAPRMachineState *spapr, > > + target_ulong opcode, > > + target_ulong *args) > > +{ > > + target_ulong flags = args[0]; > > + target_ulong shift = args[1]; > > + > > + if (spapr->resize_hpt == SPAPR_RESIZE_HPT_DISABLED) { > > + return H_AUTHORITY; > > + } > > + > > + trace_spapr_h_resize_hpt_commit(flags, shift); > > + return H_HARDWARE; > > +} > > + > > static target_ulong h_set_sprg0(PowerPCCPU *cpu, sPAPRMachineState > > *spapr, > > target_ulong opcode, target_ulong > > *args) > > { > > @@ -1134,6 +1166,10 @@ static void hypercall_register_types(void) > > /* hcall-bulk */ > > spapr_register_hypercall(H_BULK_REMOVE, h_bulk_remove); > > > > + /* hcall-hpt-resize */ > > + spapr_register_hypercall(H_RESIZE_HPT_PREPARE, > > h_resize_hpt_prepare); > > + spapr_register_hypercall(H_RESIZE_HPT_COMMIT, > > h_resize_hpt_commit); > > + > > /* hcall-splpar */ > > spapr_register_hypercall(H_REGISTER_VPA, h_register_vpa); > > spapr_register_hypercall(H_CEDE, h_cede); > > diff --git a/hw/ppc/trace-events b/hw/ppc/trace-events > > index 2297ead..bf59a8f 100644 > > --- a/hw/ppc/trace-events > > +++ b/hw/ppc/trace-events > > @@ -16,6 +16,8 @@ spapr_cas_continue(unsigned long n) "Copy changes > > to the guest: %ld bytes" > > # hw/ppc/spapr_hcall.c > > spapr_cas_pvr_try(uint32_t pvr) "%x" > > spapr_cas_pvr(uint32_t cur_pvr, bool cpu_match, uint32_t new_pvr, > > uint64_t pcr) "current=%x, cpu_match=%u, new=%x, compat > > flags=%"PRIx64 > > +spapr_h_resize_hpt_prepare(uint64_t flags, uint64_t shift) > > "flags=0x%"PRIx64", shift=%"PRIu64 > > +spapr_h_resize_hpt_commit(uint64_t flags, uint64_t shift) > > "flags=0x%"PRIx64", shift=%"PRIu64 > > > > # hw/ppc/spapr_iommu.c > > spapr_iommu_put(uint64_t liobn, uint64_t ioba, uint64_t tce, > > uint64_t ret) "liobn=%"PRIx64" ioba=0x%"PRIx64" tce=0x%"PRIx64" > > ret=%"PRId64 > > diff --git a/include/hw/ppc/spapr.h b/include/hw/ppc/spapr.h > > index a2d8964..d2c758b 100644 > > --- a/include/hw/ppc/spapr.h > > +++ b/include/hw/ppc/spapr.h > > @@ -31,6 +31,13 @@ typedef struct sPAPRMachineState > > sPAPRMachineState; > > #define SPAPR_MACHINE_CLASS(klass) \ > > OBJECT_CLASS_CHECK(sPAPRMachineClass, klass, TYPE_SPAPR_MACHINE) > > > > +typedef enum { > > + SPAPR_RESIZE_HPT_DEFAULT = 0, > > + SPAPR_RESIZE_HPT_DISABLED, > > + SPAPR_RESIZE_HPT_ENABLED, > > + SPAPR_RESIZE_HPT_REQUIRED, > > +} sPAPRResizeHPT; > > + > > /** > > * sPAPRMachineClass: > > */ > > @@ -46,6 +53,7 @@ struct sPAPRMachineClass { > > uint64_t *buid, hwaddr *pio, > > hwaddr *mmio32, hwaddr *mmio64, > > unsigned n_dma, uint32_t *liobns, Error > > **errp); > > + sPAPRResizeHPT resize_hpt_default; > > }; > > > > /** > > @@ -61,6 +69,7 @@ struct sPAPRMachineState { > > XICSState *xics; > > DeviceState *rtc; > > > > + sPAPRResizeHPT resize_hpt; > > void *htab; > > uint32_t htab_shift; > > hwaddr rma_size; > > @@ -347,6 +356,8 @@ struct sPAPRMachineState { > > #define H_XIRR_X 0x2FC > > #define H_RANDOM 0x300 > > #define H_SET_MODE 0x31C > > +#define H_RESIZE_HPT_PREPARE 0x36C > > +#define H_RESIZE_HPT_COMMIT 0x370 > > #define H_SIGNAL_SYS_RESET 0x380 > > #define MAX_HCALL_OPCODE H_SIGNAL_SYS_RESET > > > > diff --git a/target-ppc/kvm.c b/target-ppc/kvm.c > > index 15e12f3..39e5753 100644 > > --- a/target-ppc/kvm.c > > +++ b/target-ppc/kvm.c > > @@ -22,6 +22,7 @@ > > #include <linux/kvm.h> > > > > #include "qemu-common.h" > > +#include "qapi/error.h" > > #include "qemu/error-report.h" > > #include "cpu.h" > > #include "qemu/timer.h" > > @@ -2672,3 +2673,27 @@ int kvmppc_enable_hwrng(void) > > > > return kvmppc_enable_hcall(kvm_state, H_RANDOM); > > } > > + > > +void kvmppc_check_papr_resize_hpt(Error **errp) > > +{ > > + if (!kvm_enabled()) { > > + return; > > + } > > + > > + /* TODO: Check specific capabilities for HPT resize aware host > > kernels */ > > + > > + /* > > + * It's tempting to try to check directly if the HPT is under > > our > > + * control or KVM's, which is what's really relevant here. > > + * Unfortunately, in order to correctly size the HPT, we need to > > + * know if we can do resizing, _before_ we attempt to allocate > > it > > + * with KVM. Before that point, we don't officially know > > whether > > + * we'll control the HPT or not. So we have to use a fallback > > + * test for PR vs HV KVM to predict that. > > + */ > > + if (kvmppc_is_pr(kvm_state)) { > > + return; > > + } > > + > > + error_setg(errp, "Hash page table resizing not available with > > this KVM version"); > > +} > > diff --git a/target-ppc/kvm_ppc.h b/target-ppc/kvm_ppc.h > > index 841a29b..3e852ba 100644 > > --- a/target-ppc/kvm_ppc.h > > +++ b/target-ppc/kvm_ppc.h > > @@ -59,6 +59,7 @@ bool kvmppc_has_cap_htm(void); > > int kvmppc_enable_hwrng(void); > > int kvmppc_put_books_sregs(PowerPCCPU *cpu); > > PowerPCCPUClass *kvm_ppc_get_host_cpu_class(void); > > +void kvmppc_check_papr_resize_hpt(Error **errp); > > > > #else > > > > @@ -270,6 +271,10 @@ static inline PowerPCCPUClass > > *kvm_ppc_get_host_cpu_class(void) > > return NULL; > > } > > > > +static inline void kvmppc_check_papr_resize_hpt(Error **errp) > > +{ > > + return; > > +} > > #endif > > > > #ifndef CONFIG_KVM > Since you're adding a new machine option it would be nice if this was > documented in the help message.
Um.. which help message do you mean exactly? I've attached a property description, so we get something in qemu-system-ppc64 -M pseries,? -- David Gibson | I'll have my music baroque, and my code david AT gibson.dropbear.id.au | minimalist, thank you. NOT _the_ _other_ | _way_ _around_! http://www.ozlabs.org/~dgibson
signature.asc
Description: PGP signature