[PATCH v4 28/40] KVM: arm64: Defer saving/restoring 64-bit sysregs to vcpu load/put on VHE

Marc Zyngier marc.zyngier at arm.com
Wed Feb 21 07:33:47 PST 2018


On Thu, 15 Feb 2018 21:03:20 +0000,
Christoffer Dall wrote:
> 
> Some system registers do not affect the host kernel's execution and can
> therefore be loaded when we are about to run a VCPU and we don't have to
> restore the host state to the hardware before the time when we are
> actually about to return to userspace or schedule out the VCPU thread.
> 
> The EL1 system registers and the userspace state registers only
> affecting EL0 execution do not need to be saved and restored on every
> switch between the VM and the host, because they don't affect the host
> kernel's execution.
> 
> We mark all registers which are now deffered as such in the
> vcpu_{read,write}_sys_reg accessors in sys-regs.c to ensure the most
> up-to-date copy is always accessed.
> 
> Note MPIDR_EL1 (controlled via VMPIDR_EL2) is accessed from other vcpu
> threads, for example via the GIC emulation, and therefore must be
> declared as immediate, which is fine as the guest cannot modify this
> value.
> 
> The 32-bit sysregs can also be deferred but we do this in a separate
> patch as it requires a bit more infrastructure.
> 
> Signed-off-by: Christoffer Dall <christoffer.dall at linaro.org>
> ---
> 
> Notes:
>     Changes since v3:
>      - Changed to switch-based sysreg approach
> 
>  arch/arm64/kvm/hyp/sysreg-sr.c | 39 +++++++++++++++++++++++++++++++--------
>  arch/arm64/kvm/sys_regs.c      | 40 ++++++++++++++++++++++++++++++++++++++++
>  2 files changed, 71 insertions(+), 8 deletions(-)
> 
> diff --git a/arch/arm64/kvm/hyp/sysreg-sr.c b/arch/arm64/kvm/hyp/sysreg-sr.c
> index 906606dc4e2c..9c60b8062724 100644
> --- a/arch/arm64/kvm/hyp/sysreg-sr.c
> +++ b/arch/arm64/kvm/hyp/sysreg-sr.c
> @@ -25,8 +25,12 @@
>  /*
>   * Non-VHE: Both host and guest must save everything.
>   *
> - * VHE: Host must save tpidr*_el0, mdscr_el1, sp_el0,
> - * and guest must save everything.
> + * VHE: Host and guest must save mdscr_el1 and sp_el0 (and the PC and pstate,
> + * which are handled as part of the el2 return state) on every switch.
> + * tpidr_el0 and tpidrro_el0 only need to be switched when going

How about suspend/resume, which saves/restores both of these EL0
registers (see cpu_do_suspend)? We may not need to do anything (either
because vcpu_put will have happened, or because we'll come back
exactly where we were), but I'd like to make sure this hasn't been
overlooked.

> + * to host userspace or a different VCPU.  EL1 registers only need to be
> + * switched when potentially going to run a different VCPU.  The latter two
> + * classes are handled as part of kvm_arch_vcpu_load and kvm_arch_vcpu_put.
>   */
>  
>  static void __hyp_text __sysreg_save_common_state(struct kvm_cpu_context *ctxt)
> @@ -93,14 +97,11 @@ void __hyp_text __sysreg_save_state_nvhe(struct kvm_cpu_context *ctxt)
>  void sysreg_save_host_state_vhe(struct kvm_cpu_context *ctxt)
>  {
>  	__sysreg_save_common_state(ctxt);
> -	__sysreg_save_user_state(ctxt);
>  }
>  
>  void sysreg_save_guest_state_vhe(struct kvm_cpu_context *ctxt)
>  {
> -	__sysreg_save_el1_state(ctxt);
>  	__sysreg_save_common_state(ctxt);
> -	__sysreg_save_user_state(ctxt);
>  	__sysreg_save_el2_return_state(ctxt);
>  }
>  
> @@ -169,14 +170,11 @@ void __hyp_text __sysreg_restore_state_nvhe(struct kvm_cpu_context *ctxt)
>  void sysreg_restore_host_state_vhe(struct kvm_cpu_context *ctxt)
>  {
>  	__sysreg_restore_common_state(ctxt);
> -	__sysreg_restore_user_state(ctxt);
>  }
>  
>  void sysreg_restore_guest_state_vhe(struct kvm_cpu_context *ctxt)
>  {
> -	__sysreg_restore_el1_state(ctxt);
>  	__sysreg_restore_common_state(ctxt);
> -	__sysreg_restore_user_state(ctxt);
>  	__sysreg_restore_el2_return_state(ctxt);
>  }
>  
> @@ -240,6 +238,18 @@ void __hyp_text __sysreg32_restore_state(struct kvm_vcpu *vcpu)
>   */
>  void kvm_vcpu_load_sysregs(struct kvm_vcpu *vcpu)
>  {
> +	struct kvm_cpu_context *host_ctxt = vcpu->arch.host_cpu_context;
> +	struct kvm_cpu_context *guest_ctxt = &vcpu->arch.ctxt;
> +
> +	if (!has_vhe())
> +		return;
> +
> +	__sysreg_save_user_state(host_ctxt);
> +
> +	__sysreg_restore_user_state(guest_ctxt);
> +	__sysreg_restore_el1_state(guest_ctxt);
> +
> +	vcpu->arch.sysregs_loaded_on_cpu = true;
>  }
>  
>  /**
> @@ -255,6 +265,19 @@ void kvm_vcpu_load_sysregs(struct kvm_vcpu *vcpu)
>   */
>  void kvm_vcpu_put_sysregs(struct kvm_vcpu *vcpu)
>  {
> +	struct kvm_cpu_context *host_ctxt = vcpu->arch.host_cpu_context;
> +	struct kvm_cpu_context *guest_ctxt = &vcpu->arch.ctxt;
> +
> +	if (!has_vhe())
> +		return;
> +
> +	__sysreg_save_el1_state(guest_ctxt);
> +	__sysreg_save_user_state(guest_ctxt);
> +
> +	/* Restore host user state */
> +	__sysreg_restore_user_state(host_ctxt);
> +
> +	vcpu->arch.sysregs_loaded_on_cpu = false;
>  }
>  
>  void __hyp_text __kvm_set_tpidr_el2(u64 tpidr_el2)
> diff --git a/arch/arm64/kvm/sys_regs.c b/arch/arm64/kvm/sys_regs.c
> index b3c3f014aa61..f060309337aa 100644
> --- a/arch/arm64/kvm/sys_regs.c
> +++ b/arch/arm64/kvm/sys_regs.c
> @@ -87,6 +87,26 @@ u64 vcpu_read_sys_reg(struct kvm_vcpu *vcpu, int reg)
>  	 * exit from the guest but are only saved on vcpu_put.
>  	 */
>  	switch (reg) {
> +	case CSSELR_EL1:	return read_sysreg_s(SYS_CSSELR_EL1);
> +	case SCTLR_EL1:		return read_sysreg_s(sctlr_EL12);
> +	case ACTLR_EL1:		return read_sysreg_s(SYS_ACTLR_EL1);
> +	case CPACR_EL1:		return read_sysreg_s(cpacr_EL12);
> +	case TTBR0_EL1:		return read_sysreg_s(ttbr0_EL12);
> +	case TTBR1_EL1:		return read_sysreg_s(ttbr1_EL12);
> +	case TCR_EL1:		return read_sysreg_s(tcr_EL12);
> +	case ESR_EL1:		return read_sysreg_s(esr_EL12);
> +	case AFSR0_EL1:		return read_sysreg_s(afsr0_EL12);
> +	case AFSR1_EL1:		return read_sysreg_s(afsr1_EL12);
> +	case FAR_EL1:		return read_sysreg_s(far_EL12);
> +	case MAIR_EL1:		return read_sysreg_s(mair_EL12);
> +	case VBAR_EL1:		return read_sysreg_s(vbar_EL12);
> +	case CONTEXTIDR_EL1:	return read_sysreg_s(contextidr_EL12);
> +	case TPIDR_EL0:		return read_sysreg_s(SYS_TPIDR_EL0);
> +	case TPIDRRO_EL0:	return read_sysreg_s(SYS_TPIDRRO_EL0);
> +	case TPIDR_EL1:		return read_sysreg_s(SYS_TPIDR_EL1);
> +	case AMAIR_EL1:		return read_sysreg_s(amair_EL12);
> +	case CNTKCTL_EL1:	return read_sysreg_s(cntkctl_EL12);
> +	case PAR_EL1:		return read_sysreg_s(SYS_PAR_EL1);
>  	}
>  
>  immediate_read:
> @@ -103,6 +123,26 @@ void vcpu_write_sys_reg(struct kvm_vcpu *vcpu, int reg, u64 val)
>  	 * entry to the guest but are only restored on vcpu_load.
>  	 */
>  	switch (reg) {
> +	case CSSELR_EL1:	write_sysreg_s(val, SYS_CSSELR_EL1);	return;
> +	case SCTLR_EL1:		write_sysreg_s(val, sctlr_EL12);	return;
> +	case ACTLR_EL1:		write_sysreg_s(val, SYS_ACTLR_EL1);	return;
> +	case CPACR_EL1:		write_sysreg_s(val, cpacr_EL12);	return;
> +	case TTBR0_EL1:		write_sysreg_s(val, ttbr0_EL12);	return;
> +	case TTBR1_EL1:		write_sysreg_s(val, ttbr1_EL12);	return;
> +	case TCR_EL1:		write_sysreg_s(val, tcr_EL12);		return;
> +	case ESR_EL1:		write_sysreg_s(val, esr_EL12);		return;
> +	case AFSR0_EL1:		write_sysreg_s(val, afsr0_EL12);	return;
> +	case AFSR1_EL1:		write_sysreg_s(val, afsr1_EL12);	return;
> +	case FAR_EL1:		write_sysreg_s(val, far_EL12);		return;
> +	case MAIR_EL1:		write_sysreg_s(val, mair_EL12);		return;
> +	case VBAR_EL1:		write_sysreg_s(val, vbar_EL12);		return;
> +	case CONTEXTIDR_EL1:	write_sysreg_s(val, contextidr_EL12);	return;
> +	case TPIDR_EL0:		write_sysreg_s(val, SYS_TPIDR_EL0);	return;
> +	case TPIDRRO_EL0:	write_sysreg_s(val, SYS_TPIDRRO_EL0);	return;
> +	case TPIDR_EL1:		write_sysreg_s(val, SYS_TPIDR_EL1);	return;
> +	case AMAIR_EL1:		write_sysreg_s(val, amair_EL12);	return;
> +	case CNTKCTL_EL1:	write_sysreg_s(val, cntkctl_EL12);	return;
> +	case PAR_EL1:		write_sysreg_s(val, SYS_PAR_EL1);	return;
>  	}
>  
>  immediate_write:
> -- 
> 2.14.2
> 

Looks good to me otherwise.

	M.

-- 
Jazz is not dead, it just smell funny.



More information about the linux-arm-kernel mailing list