[Date Prev][Date Next][Thread Prev][Thread Next][Date Index][Thread Index]
Re: [RFC PATCH v0 1/2] spapr: Add H_REG_SNS hcall
From: |
David Gibson |
Subject: |
Re: [RFC PATCH v0 1/2] spapr: Add H_REG_SNS hcall |
Date: |
Mon, 9 Aug 2021 13:49:54 +1000 |
On Thu, Aug 05, 2021 at 01:02:27PM +0530, Bharata B Rao wrote:
> Add support for H_REG_SNS hcall so that asynchronous page
> fault mechanism can be supported on PowerKVM guests.
>
> This hcall essentially issues KVM_PPC_SET_SNS to let the
> host map and pin the memory containing the Subvention
> Notification Structure. It also claims SPAPR_IRQ_SNS to
> be used as subvention notification interrupt.
>
> Note: Updates to linux-headers/linux/kvm.h are temporary
> pending headers update.
>
> Signed-off-by: Bharata B Rao <bharata@linux.ibm.com>
> ---
> hw/ppc/spapr.c | 3 ++
> hw/ppc/spapr_hcall.c | 56 +++++++++++++++++++++++++++++++++
> include/hw/ppc/spapr.h | 3 ++
> include/hw/ppc/spapr_irq.h | 1 +
> linux-headers/asm-powerpc/kvm.h | 6 ++++
> linux-headers/linux/kvm.h | 1 +
> target/ppc/kvm.c | 14 +++++++++
> target/ppc/kvm_ppc.h | 10 ++++++
> 8 files changed, 94 insertions(+)
>
> diff --git a/hw/ppc/spapr.c b/hw/ppc/spapr.c
> index 81699d4f8b..5f1f75826d 100644
> --- a/hw/ppc/spapr.c
> +++ b/hw/ppc/spapr.c
> @@ -2830,6 +2830,9 @@ static void spapr_machine_init(MachineState *machine)
>
> /* Enable H_PAGE_INIT */
> kvmppc_enable_h_page_init();
> +
> + /* Enable H_REG_SNS */
> + kvmppc_enable_h_reg_sns();
> }
>
> /* map RAM */
> diff --git a/hw/ppc/spapr_hcall.c b/hw/ppc/spapr_hcall.c
> index 0e9a5b2e40..957edecb13 100644
> --- a/hw/ppc/spapr_hcall.c
> +++ b/hw/ppc/spapr_hcall.c
> @@ -1405,6 +1405,59 @@ static target_ulong h_update_dt(PowerPCCPU *cpu,
> SpaprMachineState *spapr,
> return H_SUCCESS;
> }
>
> +static target_ulong deregister_sns(PowerPCCPU *cpu, SpaprMachineState *spapr)
> +{
> + spapr->sns_addr = -1;
> + spapr->sns_len = 0;
> + spapr_irq_free(spapr, SPAPR_IRQ_SNS, 1);
> +
> + return H_SUCCESS;
> +}
> +
> +static target_ulong h_reg_sns(PowerPCCPU *cpu, SpaprMachineState *spapr,
> + target_ulong opcode, target_ulong *args)
> +{
> + target_ulong addr = args[0];
> + target_ulong len = args[1];
> +
> + if (addr == -1) {
> + return deregister_sns(cpu, spapr);
> + }
> +
> + /*
> + * If SNS area is already registered, can't register again before
> + * deregistering it first.
> + */
> + if (spapr->sns_addr == -1) {
As Fabiano says, it looks like the logic is reversed here.
> + return H_PARAMETER;
Also, H_PARAMETER doesn't seem like the right error for this case.
H_BUSY, maybe?
> + }
> +
> + if (!QEMU_IS_ALIGNED(addr, 4096)) {
What's the significance of 4096 here? Should this be one of the page
size defines instead?
> + return H_PARAMETER;
> + }
> +
> + if (len < 256) {
A defined constant (SPAPR_MIN_SNS_SIZE?) would be worthwhile here, I think.
> + return H_P2;
> + }
> +
> + /* TODO: SNS area is not allowed to cross a page boundary */
> +
> + /* KVM_PPC_SET_SNS ioctl */
> + if (kvmppc_set_sns_reg(addr, len)) {
What will happen if you attempt this on a TCG system?
> + return H_PARAMETER;
> + }
> +
> + /* Record SNS addr and len */
> + spapr->sns_addr = addr;
> + spapr->sns_len = len;
> +
> + /* Register irq source for sending ESN notification */
> + spapr_irq_claim(spapr, SPAPR_IRQ_SNS, false, &error_fatal);
I don't think &error_fatal can be right here. AFAICT this must be one
of two cases:
1) This should never fail, no matter what the guest does. If it
does fail, that indicates a qemu bug. In that case &error_abort is
more appropriate
2) This could fail for certain sequences of guest actions. If
that's the case, we shouldn't kill qemu, but should return
H_HARDWARE (or something) instead.
> + args[1] = SPAPR_IRQ_SNS; /* irq no in R5 */
> +
> + return H_SUCCESS;
> +}
> +
> static spapr_hcall_fn papr_hypercall_table[(MAX_HCALL_OPCODE / 4) + 1];
> static spapr_hcall_fn kvmppc_hypercall_table[KVMPPC_HCALL_MAX -
> KVMPPC_HCALL_BASE + 1];
> static spapr_hcall_fn svm_hypercall_table[(SVM_HCALL_MAX - SVM_HCALL_BASE) /
> 4 + 1];
> @@ -1545,6 +1598,9 @@ static void hypercall_register_types(void)
> spapr_register_hypercall(KVMPPC_H_CAS, h_client_architecture_support);
>
> spapr_register_hypercall(KVMPPC_H_UPDATE_DT, h_update_dt);
> +
> + /* SNS memory area registration */
> + spapr_register_hypercall(H_REG_SNS, h_reg_sns);
You definitely need a machine parameter to enable this, and you should
only enable it by default for newer machine types. Otherwise you will
cause migration breakages.
> }
>
> type_init(hypercall_register_types)
> diff --git a/include/hw/ppc/spapr.h b/include/hw/ppc/spapr.h
> index 637652ad16..934f9e066e 100644
> --- a/include/hw/ppc/spapr.h
> +++ b/include/hw/ppc/spapr.h
> @@ -252,6 +252,8 @@ struct SpaprMachineState {
> uint32_t numa_assoc_array[MAX_NODES + NVGPU_MAX_NUM][NUMA_ASSOC_SIZE];
>
> Error *fwnmi_migration_blocker;
> + uint64_t sns_addr;
> + uint64_t sns_len;
> };
>
> #define H_SUCCESS 0
> @@ -549,6 +551,7 @@ struct SpaprMachineState {
> #define H_SCM_UNBIND_MEM 0x3F0
> #define H_SCM_UNBIND_ALL 0x3FC
> #define H_SCM_HEALTH 0x400
> +#define H_REG_SNS 0x41C
> #define H_RPT_INVALIDATE 0x448
>
> #define MAX_HCALL_OPCODE H_RPT_INVALIDATE
> diff --git a/include/hw/ppc/spapr_irq.h b/include/hw/ppc/spapr_irq.h
> index c22a72c9e2..26c680f065 100644
> --- a/include/hw/ppc/spapr_irq.h
> +++ b/include/hw/ppc/spapr_irq.h
> @@ -21,6 +21,7 @@
> #define SPAPR_XIRQ_BASE XICS_IRQ_BASE /* 0x1000 */
> #define SPAPR_IRQ_EPOW (SPAPR_XIRQ_BASE + 0x0000)
> #define SPAPR_IRQ_HOTPLUG (SPAPR_XIRQ_BASE + 0x0001)
> +#define SPAPR_IRQ_SNS (SPAPR_XIRQ_BASE + 0x0002)
> #define SPAPR_IRQ_VIO (SPAPR_XIRQ_BASE + 0x0100) /* 256 VIO devices
> */
> #define SPAPR_IRQ_PCI_LSI (SPAPR_XIRQ_BASE + 0x0200) /* 32+ PHBs devices
> */
>
> diff --git a/linux-headers/asm-powerpc/kvm.h b/linux-headers/asm-powerpc/kvm.h
> index 9f18fa090f..d72739126a 100644
> --- a/linux-headers/asm-powerpc/kvm.h
> +++ b/linux-headers/asm-powerpc/kvm.h
> @@ -470,6 +470,12 @@ struct kvm_ppc_cpu_char {
> #define KVM_PPC_CPU_BEHAV_BNDS_CHK_SPEC_BAR (1ULL << 61)
> #define KVM_PPC_CPU_BEHAV_FLUSH_COUNT_CACHE (1ull << 58)
>
> +/* For KVM_PPC_SET_SNS */
> +struct kvm_ppc_sns_reg {
> + __u64 addr;
> + __u64 len;
> +};
> +
Updates to linux-headers/ should be done as a separate preliminary
patch, listing the specific kernel commit that you're updating too.
> /* Per-vcpu XICS interrupt controller state */
> #define KVM_REG_PPC_ICP_STATE (KVM_REG_PPC | KVM_REG_SIZE_U64 | 0x8c)
>
> diff --git a/linux-headers/linux/kvm.h b/linux-headers/linux/kvm.h
> index bcaf66cc4d..a76945fcbc 100644
> --- a/linux-headers/linux/kvm.h
> +++ b/linux-headers/linux/kvm.h
> @@ -1458,6 +1458,7 @@ struct kvm_s390_ucas_mapping {
> #define KVM_SET_PMU_EVENT_FILTER _IOW(KVMIO, 0xb2, struct
> kvm_pmu_event_filter)
> #define KVM_PPC_SVM_OFF _IO(KVMIO, 0xb3)
> #define KVM_ARM_MTE_COPY_TAGS _IOR(KVMIO, 0xb4, struct
> kvm_arm_copy_mte_tags)
> +#define KVM_PPC_SET_SNS _IOR(KVMIO, 0xb5, struct
> kvm_ppc_sns_reg)
>
> /* ioctl for vm fd */
> #define KVM_CREATE_DEVICE _IOWR(KVMIO, 0xe0, struct kvm_create_device)
> diff --git a/target/ppc/kvm.c b/target/ppc/kvm.c
> index dc93b99189..330985c8a0 100644
> --- a/target/ppc/kvm.c
> +++ b/target/ppc/kvm.c
> @@ -2047,6 +2047,11 @@ void kvmppc_enable_h_rpt_invalidate(void)
> kvmppc_enable_hcall(kvm_state, H_RPT_INVALIDATE);
> }
>
> +void kvmppc_enable_h_reg_sns(void)
> +{
> + kvmppc_enable_hcall(kvm_state, H_REG_SNS);
> +}
> +
> void kvmppc_set_papr(PowerPCCPU *cpu)
> {
> CPUState *cs = CPU(cpu);
> @@ -2959,3 +2964,12 @@ bool kvm_arch_cpu_check_are_resettable(void)
> {
> return true;
> }
> +
> +int kvmppc_set_sns_reg(target_ulong addr, target_ulong len)
> +{
> + struct kvm_ppc_sns_reg sns_reg;
> +
> + sns_reg.addr = addr;
> + sns_reg.len = len;
> + return kvm_vm_ioctl(kvm_state, KVM_PPC_SET_SNS, &sns_reg);
> +}
> diff --git a/target/ppc/kvm_ppc.h b/target/ppc/kvm_ppc.h
> index ee9325bf9a..c22bc3253e 100644
> --- a/target/ppc/kvm_ppc.h
> +++ b/target/ppc/kvm_ppc.h
> @@ -25,6 +25,7 @@ void kvmppc_enable_set_mode_hcall(void);
> void kvmppc_enable_clear_ref_mod_hcalls(void);
> void kvmppc_enable_h_page_init(void);
> void kvmppc_enable_h_rpt_invalidate(void);
> +void kvmppc_enable_h_reg_sns(void);
> void kvmppc_set_papr(PowerPCCPU *cpu);
> int kvmppc_set_compat(PowerPCCPU *cpu, uint32_t compat_pvr);
> void kvmppc_set_mpic_proxy(PowerPCCPU *cpu, int mpic_proxy);
> @@ -87,6 +88,7 @@ void kvmppc_set_reg_ppc_online(PowerPCCPU *cpu, unsigned
> int online);
> void kvmppc_set_reg_tb_offset(PowerPCCPU *cpu, int64_t tb_offset);
>
> int kvm_handle_nmi(PowerPCCPU *cpu, struct kvm_run *run);
> +int kvmppc_set_sns_reg(target_ulong addr, target_ulong len);
>
> #else
>
> @@ -157,6 +159,10 @@ static inline void kvmppc_enable_h_rpt_invalidate(void)
> g_assert_not_reached();
> }
>
> +static inline void kvmppc_enable_h_reg_sns(void)
> +{
> +}
> +
> static inline void kvmppc_set_papr(PowerPCCPU *cpu)
> {
> }
> @@ -430,6 +436,10 @@ static inline bool
> kvmppc_pvr_workaround_required(PowerPCCPU *cpu)
> return false;
> }
>
> +int kvmppc_set_sns_reg(target_ulong addr, target_ulong len)
> +{
> + return -ENOSYS;
> +}
> #endif
>
> #ifndef CONFIG_KVM
--
David Gibson | I'll have my music baroque, and my code
david AT gibson.dropbear.id.au | minimalist, thank you. NOT _the_ _other_
| _way_ _around_!
http://www.ozlabs.org/~dgibson
signature.asc
Description: PGP signature