[Date Prev][Date Next][Thread Prev][Thread Next][Date Index][Thread Index]
Re: [Qemu-ppc] [PATCHv3 2/5] pseries: Stubs for HPT resizing
From: David Gibson
Subject: Re: [Qemu-ppc] [PATCHv3 2/5] pseries: Stubs for HPT resizing
Date: Thu, 15 Dec 2016 12:07:47 +1100
User-agent: Mutt/1.7.1 (2016-10-04)
On Wed, Dec 14, 2016 at 04:22:19PM +1100, Suraj Jitindar Singh wrote:
> On Mon, 2016-12-12 at 15:06 +1100, David Gibson wrote:
> > This introduces stub implementations of the H_RESIZE_HPT_PREPARE and
> > H_RESIZE_HPT_COMMIT hypercalls which we hope to add in a PAPR
> > extension to allow run time resizing of a guest's hash page
> > table. It also adds a new machine property for controlling whether
> > this new facility is available, and logic to check that against
> > availability with KVM (only supported with KVM PR for now).
> >
> > Finally, it adds a new string to the hypertas property in the device
> > tree, advertising to the guest the availability of the HPT resizing
> > hypercalls. This is a tentative suggested value, and would need to
> > be standardized by PAPR before being merged.
> >
> > Signed-off-by: David Gibson <address@hidden>
> > ---
> > hw/ppc/spapr.c | 75
> > ++++++++++++++++++++++++++++++++++++++++++++++++++
> > hw/ppc/spapr_hcall.c | 36 ++++++++++++++++++++++++
> > hw/ppc/trace-events | 2 ++
> > include/hw/ppc/spapr.h | 11 ++++++++
> > target-ppc/kvm.c | 25 +++++++++++++++++
> > target-ppc/kvm_ppc.h | 5 ++++
> > 6 files changed, 154 insertions(+)
> >
> > diff --git a/hw/ppc/spapr.c b/hw/ppc/spapr.c
> > index 0f25e83..846ce51 100644
> > --- a/hw/ppc/spapr.c
> > +++ b/hw/ppc/spapr.c
> > @@ -760,6 +760,11 @@ static void spapr_dt_rtas(sPAPRMachineState
> > *spapr, void *fdt)
> > if (!kvm_enabled() || kvmppc_spapr_use_multitce()) {
> > add_str(hypertas, "hcall-multi-tce");
> > }
> > +
> > + if (spapr->resize_hpt != SPAPR_RESIZE_HPT_DISABLED) {
> > + add_str(hypertas, "hcall-hpt-resize");
> > + }
> > +
> > _FDT(fdt_setprop(fdt, rtas, "ibm,hypertas-functions",
> > hypertas->str, hypertas->len));
> > g_string_free(hypertas, TRUE);
> > @@ -1839,11 +1844,40 @@ static void ppc_spapr_init(MachineState
> > *machine)
> > long load_limit, fw_size;
> > char *filename;
> > int smt = kvmppc_smt_threads();
> > + Error *resize_hpt_err = NULL;
> >
> > msi_nonbroken = true;
> >
> > QLIST_INIT(&spapr->phbs);
> >
> > + /* Check HPT resizing availability */
> > + kvmppc_check_papr_resize_hpt(&resize_hpt_err);
> > + if (spapr->resize_hpt == SPAPR_RESIZE_HPT_DEFAULT) {
> > + /*
> > + * If the user explicitly requested a mode we should either
> > + * supply it, or fail completely (which we do below). But
> > if
> > + * it's not set explicitly, we reset our mode to something
> > + * that works
> > + */
> > + if (resize_hpt_err) {
> > + spapr->resize_hpt = SPAPR_RESIZE_HPT_DISABLED;
> > + error_free(resize_hpt_err);
> > + resize_hpt_err = NULL;
> > + } else {
> > + spapr->resize_hpt = smc->resize_hpt_default;
> > + }
> > + }
> > +
> > + assert(spapr->resize_hpt != SPAPR_RESIZE_HPT_DEFAULT);
> > +
> > + if ((spapr->resize_hpt != SPAPR_RESIZE_HPT_DISABLED) &&
> > resize_hpt_err) {
> > + /*
> > + * User requested HPT resize, but this host can't supply
> > it. Bail out
> > + */
> > + error_report_err(resize_hpt_err);
> > + exit(1);
> > + }
> > +
> > /* Allocate RMA if necessary */
> > rma_alloc_size = kvmppc_alloc_rma(&rma);
> >
> > @@ -2236,6 +2270,40 @@ static void
> > spapr_set_modern_hotplug_events(Object *obj, bool value,
> > spapr->use_hotplug_event_source = value;
> > }
> >
> > +static char *spapr_get_resize_hpt(Object *obj, Error **errp)
> > +{
> > + sPAPRMachineState *spapr = SPAPR_MACHINE(obj);
> > +
> > + switch (spapr->resize_hpt) {
> > + case SPAPR_RESIZE_HPT_DEFAULT:
> > + return g_strdup("default");
> > + case SPAPR_RESIZE_HPT_DISABLED:
> > + return g_strdup("disabled");
> > + case SPAPR_RESIZE_HPT_ENABLED:
> > + return g_strdup("enabled");
> > + case SPAPR_RESIZE_HPT_REQUIRED:
> > + return g_strdup("required");
> > + }
> > + assert(0);
> > +}
> > +
> > +static void spapr_set_resize_hpt(Object *obj, const char *value,
> > Error **errp)
> > +{
> > + sPAPRMachineState *spapr = SPAPR_MACHINE(obj);
> > +
> > + if (strcmp(value, "default") == 0) {
> > + spapr->resize_hpt = SPAPR_RESIZE_HPT_DEFAULT;
> > + } else if (strcmp(value, "disabled") == 0) {
> > + spapr->resize_hpt = SPAPR_RESIZE_HPT_DISABLED;
> > + } else if (strcmp(value, "enabled") == 0) {
> > + spapr->resize_hpt = SPAPR_RESIZE_HPT_ENABLED;
> > + } else if (strcmp(value, "required") == 0) {
> > + spapr->resize_hpt = SPAPR_RESIZE_HPT_REQUIRED;
> > + } else {
> > + error_setg(errp, "Bad value for \"resize-hpt\" property");
> > + }
> > +}
> > +
> > static void spapr_machine_initfn(Object *obj)
> > {
> > sPAPRMachineState *spapr = SPAPR_MACHINE(obj);
> > @@ -2256,6 +2324,12 @@ static void spapr_machine_initfn(Object *obj)
> > " place of standard EPOW events
> > when possible"
> > " (required for memory hot-
> > unplug support)",
> > NULL);
> > +
> > + object_property_add_str(obj, "resize-hpt",
> > + spapr_get_resize_hpt,
> > spapr_set_resize_hpt, NULL);
> > + object_property_set_description(obj, "resize-hpt",
> > + "Resizing of the Hash Page Table
> > (enabled, disabled, required)",
> > + NULL);
> > }
> >
> > static void spapr_machine_finalizefn(Object *obj)
> > @@ -2707,6 +2781,7 @@ static void
> > spapr_machine_class_init(ObjectClass *oc, void *data)
> >
> > smc->dr_lmb_enabled = true;
> > smc->tcg_default_cpu = "POWER8";
> > + smc->resize_hpt_default = SPAPR_RESIZE_HPT_DISABLED;
> > mc->query_hotpluggable_cpus = spapr_query_hotpluggable_cpus;
> > fwc->get_dev_path = spapr_get_fw_dev_path;
> > nc->nmi_monitor_handler = spapr_nmi;
> > diff --git a/hw/ppc/spapr_hcall.c b/hw/ppc/spapr_hcall.c
> > index fd9f1d4..72a9c4d 100644
> > --- a/hw/ppc/spapr_hcall.c
> > +++ b/hw/ppc/spapr_hcall.c
> > @@ -355,6 +355,38 @@ static target_ulong h_read(PowerPCCPU *cpu,
> > sPAPRMachineState *spapr,
> > return H_SUCCESS;
> > }
> >
> > +static target_ulong h_resize_hpt_prepare(PowerPCCPU *cpu,
> > + sPAPRMachineState *spapr,
> > + target_ulong opcode,
> > + target_ulong *args)
> > +{
> > + target_ulong flags = args[0];
> > + target_ulong shift = args[1];
> > +
> > + if (spapr->resize_hpt == SPAPR_RESIZE_HPT_DISABLED) {
> > + return H_AUTHORITY;
> > + }
> > +
> > + trace_spapr_h_resize_hpt_prepare(flags, shift);
> > + return H_HARDWARE;
> > +}
> > +
> > +static target_ulong h_resize_hpt_commit(PowerPCCPU *cpu,
> > + sPAPRMachineState *spapr,
> > + target_ulong opcode,
> > + target_ulong *args)
> > +{
> > + target_ulong flags = args[0];
> > + target_ulong shift = args[1];
> > +
> > + if (spapr->resize_hpt == SPAPR_RESIZE_HPT_DISABLED) {
> > + return H_AUTHORITY;
> > + }
> > +
> > + trace_spapr_h_resize_hpt_commit(flags, shift);
> > + return H_HARDWARE;
> > +}
> > +
> > static target_ulong h_set_sprg0(PowerPCCPU *cpu, sPAPRMachineState
> > *spapr,
> > target_ulong opcode, target_ulong
> > *args)
> > {
> > @@ -1134,6 +1166,10 @@ static void hypercall_register_types(void)
> > /* hcall-bulk */
> > spapr_register_hypercall(H_BULK_REMOVE, h_bulk_remove);
> >
> > + /* hcall-hpt-resize */
> > + spapr_register_hypercall(H_RESIZE_HPT_PREPARE,
> > h_resize_hpt_prepare);
> > + spapr_register_hypercall(H_RESIZE_HPT_COMMIT,
> > h_resize_hpt_commit);
> > +
> > /* hcall-splpar */
> > spapr_register_hypercall(H_REGISTER_VPA, h_register_vpa);
> > spapr_register_hypercall(H_CEDE, h_cede);
> > diff --git a/hw/ppc/trace-events b/hw/ppc/trace-events
> > index 2297ead..bf59a8f 100644
> > --- a/hw/ppc/trace-events
> > +++ b/hw/ppc/trace-events
> > @@ -16,6 +16,8 @@ spapr_cas_continue(unsigned long n) "Copy changes
> > to the guest: %ld bytes"
> > # hw/ppc/spapr_hcall.c
> > spapr_cas_pvr_try(uint32_t pvr) "%x"
> > spapr_cas_pvr(uint32_t cur_pvr, bool cpu_match, uint32_t new_pvr,
> > uint64_t pcr) "current=%x, cpu_match=%u, new=%x, compat
> > flags=%"PRIx64
> > +spapr_h_resize_hpt_prepare(uint64_t flags, uint64_t shift)
> > "flags=0x%"PRIx64", shift=%"PRIu64
> > +spapr_h_resize_hpt_commit(uint64_t flags, uint64_t shift)
> > "flags=0x%"PRIx64", shift=%"PRIu64
> >
> > # hw/ppc/spapr_iommu.c
> > spapr_iommu_put(uint64_t liobn, uint64_t ioba, uint64_t tce,
> > uint64_t ret) "liobn=%"PRIx64" ioba=0x%"PRIx64" tce=0x%"PRIx64"
> > ret=%"PRId64
> > diff --git a/include/hw/ppc/spapr.h b/include/hw/ppc/spapr.h
> > index a2d8964..d2c758b 100644
> > --- a/include/hw/ppc/spapr.h
> > +++ b/include/hw/ppc/spapr.h
> > @@ -31,6 +31,13 @@ typedef struct sPAPRMachineState
> > sPAPRMachineState;
> > #define SPAPR_MACHINE_CLASS(klass) \
> > OBJECT_CLASS_CHECK(sPAPRMachineClass, klass, TYPE_SPAPR_MACHINE)
> >
> > +typedef enum {
> > + SPAPR_RESIZE_HPT_DEFAULT = 0,
> > + SPAPR_RESIZE_HPT_DISABLED,
> > + SPAPR_RESIZE_HPT_ENABLED,
> > + SPAPR_RESIZE_HPT_REQUIRED,
> > +} sPAPRResizeHPT;
> > +
> > /**
> > * sPAPRMachineClass:
> > */
> > @@ -46,6 +53,7 @@ struct sPAPRMachineClass {
> > uint64_t *buid, hwaddr *pio,
> > hwaddr *mmio32, hwaddr *mmio64,
> > unsigned n_dma, uint32_t *liobns, Error
> > **errp);
> > + sPAPRResizeHPT resize_hpt_default;
> > };
> >
> > /**
> > @@ -61,6 +69,7 @@ struct sPAPRMachineState {
> > XICSState *xics;
> > DeviceState *rtc;
> >
> > + sPAPRResizeHPT resize_hpt;
> > void *htab;
> > uint32_t htab_shift;
> > hwaddr rma_size;
> > @@ -347,6 +356,8 @@ struct sPAPRMachineState {
> > #define H_XIRR_X 0x2FC
> > #define H_RANDOM 0x300
> > #define H_SET_MODE 0x31C
> > +#define H_RESIZE_HPT_PREPARE 0x36C
> > +#define H_RESIZE_HPT_COMMIT 0x370
> > #define H_SIGNAL_SYS_RESET 0x380
> > #define MAX_HCALL_OPCODE H_SIGNAL_SYS_RESET
> >
> > diff --git a/target-ppc/kvm.c b/target-ppc/kvm.c
> > index 15e12f3..39e5753 100644
> > --- a/target-ppc/kvm.c
> > +++ b/target-ppc/kvm.c
> > @@ -22,6 +22,7 @@
> > #include <linux/kvm.h>
> >
> > #include "qemu-common.h"
> > +#include "qapi/error.h"
> > #include "qemu/error-report.h"
> > #include "cpu.h"
> > #include "qemu/timer.h"
> > @@ -2672,3 +2673,27 @@ int kvmppc_enable_hwrng(void)
> >
> > return kvmppc_enable_hcall(kvm_state, H_RANDOM);
> > }
> > +
> > +void kvmppc_check_papr_resize_hpt(Error **errp)
> > +{
> > + if (!kvm_enabled()) {
> > + return;
> > + }
> > +
> > + /* TODO: Check specific capabilities for HPT resize aware host
> > kernels */
> > +
> > + /*
> > + * It's tempting to try to check directly if the HPT is under
> > our
> > + * control or KVM's, which is what's really relevant here.
> > + * Unfortunately, in order to correctly size the HPT, we need to
> > + * know if we can do resizing, _before_ we attempt to allocate
> > it
> > + * with KVM. Before that point, we don't officially know
> > whether
> > + * we'll control the HPT or not. So we have to use a fallback
> > + * test for PR vs HV KVM to predict that.
> > + */
> > + if (kvmppc_is_pr(kvm_state)) {
> > + return;
> > + }
> > +
> > + error_setg(errp, "Hash page table resizing not available with
> > this KVM version");
> > +}
> > diff --git a/target-ppc/kvm_ppc.h b/target-ppc/kvm_ppc.h
> > index 841a29b..3e852ba 100644
> > --- a/target-ppc/kvm_ppc.h
> > +++ b/target-ppc/kvm_ppc.h
> > @@ -59,6 +59,7 @@ bool kvmppc_has_cap_htm(void);
> > int kvmppc_enable_hwrng(void);
> > int kvmppc_put_books_sregs(PowerPCCPU *cpu);
> > PowerPCCPUClass *kvm_ppc_get_host_cpu_class(void);
> > +void kvmppc_check_papr_resize_hpt(Error **errp);
> >
> > #else
> >
> > @@ -270,6 +271,10 @@ static inline PowerPCCPUClass
> > *kvm_ppc_get_host_cpu_class(void)
> > return NULL;
> > }
> >
> > +static inline void kvmppc_check_papr_resize_hpt(Error **errp)
> > +{
> > + return;
> > +}
> > #endif
> >
> > #ifndef CONFIG_KVM
> Since you're adding a new machine option it would be nice if this was
> documented in the help message.
Um.. which help message do you mean exactly? I've attached a property
description, so we get something in qemu-system-ppc64 -M pseries,?
--
David Gibson | I'll have my music baroque, and my code
david AT gibson.dropbear.id.au | minimalist, thank you. NOT _the_ _other_
| _way_ _around_!
http://www.ozlabs.org/~dgibson
signature.asc
Description: PGP signature