// SPDX-License-Identifier: GPL-2.0-only
/*
 * Copyright (C) 2015 - ARM Ltd
 * Author: Marc Zyngier <marc.zyngier@arm.com>
 */

#include <linux/irqflags.h>

#include <asm/kvm_hyp.h>
#include <asm/kvm_mmu.h>
#include <asm/tlbflush.h>

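/*
 * Host state saved around a TLB invalidation: interrupt flags, plus
 * TCR_EL1/SCTLR_EL1 for the SPECULATIVE_AT workaround below.
 */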
struct tlb_inv_context {
	unsigned long flags;
	u64 tcr;
	u64 sctlr;
};

static void __tlb_switch_to_guest(struct kvm_s2_mmu *mmu,
				  struct tlb_inv_context *cxt)
{
	u64 val;

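	/* Keep interrupts off while the guest's stage-2 context is loaded. */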
	local_irq_save(cxt->flags);

	if (cpus_have_final_cap(ARM64_WORKAROUND_SPECULATIVE_AT)) {
		/*
		 * For CPUs that are affected by ARM errata 1165522 or 1530923,
		 * we cannot trust stage-1 to be in a correct state at that
		 * point. Since we do not want to force a full load of the
		 * vcpu state, we prevent the EL1 page-table walker from
		 * allocating new TLB entries. This is done by setting the
		 * EPD bits in the TCR_EL1 register. We also need to prevent
		 * it from allocating IPA->PA walks, so we enable the S1 MMU...
		 */
		val = cxt->tcr = read_sysreg_el1(SYS_TCR);
		val |= TCR_EPD1_MASK | TCR_EPD0_MASK;
		write_sysreg_el1(val, SYS_TCR);
		val = cxt->sctlr = read_sysreg_el1(SYS_SCTLR);
		val |= SCTLR_ELx_M;
		write_sysreg_el1(val, SYS_SCTLR);
	}

	/*
	 * With VHE enabled, we have HCR_EL2.{E2H,TGE} = {1,1}, and
	 * most TLB operations target EL2/EL0. In order to affect the
	 * guest TLBs (EL1/EL0), we need to change one of these two
	 * bits. Changing E2H is impossible (goodbye TTBR1_EL2), so
	 * let's flip TGE before executing the TLB operation.
	 *
	 * ARM erratum 1165522 requires some special handling (again),
	 * as we need to make sure both stages of translation are in
	 * place before clearing TGE. __load_guest_stage2() already
	 * has an ISB in order to deal with this.
	 */
	__load_guest_stage2(mmu);
	val = read_sysreg(hcr_el2);
	val &= ~HCR_TGE;
	write_sysreg(val, hcr_el2);
	isb();
}

static void __tlb_switch_to_host(struct tlb_inv_context *cxt)
{
	/*
	 * We're done with the TLB operation, let's restore the host's
	 * view of HCR_EL2 and uninstall the guest's stage-2 context
	 * by clearing VTTBR_EL2.
	 */
	write_sysreg(0, vttbr_el2);
	write_sysreg(HCR_HOST_VHE_FLAGS, hcr_el2);
	isb();

	if (cpus_have_final_cap(ARM64_WORKAROUND_SPECULATIVE_AT)) {
		/* Restore the registers to what they were */
		write_sysreg_el1(cxt->tcr, SYS_TCR);
		write_sysreg_el1(cxt->sctlr, SYS_SCTLR);
	}

	local_irq_restore(cxt->flags);
}

void __kvm_tlb_flush_vmid_ipa(struct kvm_s2_mmu *mmu,
			      phys_addr_t ipa, int level)
{
	struct tlb_inv_context cxt;

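	/* Ensure prior page-table updates are visible before the invalidation. */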
	dsb(ishst);

	/* Switch to requested VMID */
	__tlb_switch_to_guest(mmu, &cxt);

	/*
	 * We could do so much better if we had the VA as well.
	 * Instead, we invalidate Stage-2 for this IPA, and the
	 * whole of Stage-1. Weep...
	 */
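	/* TLBI IPAS2E1IS encodes the IPA in 4kB units, hence the shift. */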
	ipa >>= 12;
	__tlbi_level(ipas2e1is, ipa, level);

	/*
	 * We have to ensure completion of the invalidation at Stage-2,
	 * since a table walk on another CPU could refill a TLB with a
	 * complete (S1 + S2) walk based on the old Stage-2 mapping if
	 * the Stage-1 invalidation happened first.
	 */
	dsb(ish);
	__tlbi(vmalle1is);
	dsb(ish);
	isb();

	__tlb_switch_to_host(&cxt);
}

void __kvm_tlb_flush_vmid(struct kvm_s2_mmu *mmu)
{
	struct tlb_inv_context cxt;

	dsb(ishst);

	/* Switch to requested VMID */
	__tlb_switch_to_guest(mmu, &cxt);

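	/* Invalidate all Stage-1/Stage-2 entries for this VMID, Inner Shareable. */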
	__tlbi(vmalls12e1is);
	dsb(ish);
	isb();

	__tlb_switch_to_host(&cxt);
}

void __kvm_flush_cpu_context(struct kvm_s2_mmu *mmu)
{
	struct tlb_inv_context cxt;

	/* Switch to requested VMID */
	__tlb_switch_to_guest(mmu, &cxt);

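	/*
	 * Local invalidation only: flush this CPU's EL1&0 TLB entries for
	 * the current VMID and the whole I-cache (note the non-shareable
	 * barrier).
	 */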
	__tlbi(vmalle1);
	asm volatile("ic iallu");
	dsb(nsh);
	isb();

	__tlb_switch_to_host(&cxt);
}

void __kvm_flush_vm_context(void)
{
	dsb(ishst);
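	/* Invalidate all EL1&0 TLB entries for all VMIDs, Inner Shareable. */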
	__tlbi(alle1is);

	/*
	 * VIPT and PIPT caches are not affected by VMID, so no maintenance
	 * is necessary across a VMID rollover.
	 *
	 * VPIPT caches constrain lookup and maintenance to the active VMID,
	 * so we need to invalidate lines with a stale VMID to avoid an ABA
	 * race after multiple rollovers.
	 */
	if (icache_is_vpipt())
		asm volatile("ic ialluis");

	dsb(ish);
}