// SPDX-License-Identifier: GPL-2.0-only
/*
 * Copyright (C) 2015 - ARM Ltd
 * Author: Marc Zyngier <marc.zyngier@arm.com>
 */

#include <hyp/adjust_pc.h>
#include <hyp/switch.h>
#include <hyp/sysreg-sr.h>

#include <linux/arm-smccc.h>
#include <linux/kvm_host.h>
#include <linux/types.h>
#include <linux/jump_label.h>
#include <uapi/linux/psci.h>

#include <kvm/arm_psci.h>

#include <asm/barrier.h>
#include <asm/cpufeature.h>
#include <asm/kprobes.h>
#include <asm/kvm_asm.h>
#include <asm/kvm_emulate.h>
#include <asm/kvm_hyp.h>
#include <asm/kvm_mmu.h>
#include <asm/fpsimd.h>
#include <asm/debug-monitors.h>
#include <asm/processor.h>
#include <asm/thread_info.h>

#include <nvhe/mem_protect.h>

/* Non-VHE specific context */
DEFINE_PER_CPU(struct kvm_host_data, kvm_host_data);
DEFINE_PER_CPU(struct kvm_cpu_context, kvm_hyp_ctxt);
DEFINE_PER_CPU(unsigned long, kvm_hyp_vector);

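/*
 * Configure the EL2 trap controls for running the guest: trap trace
 * and AMU accesses, trap FP/SIMD and SVE when the guest's FP state
 * isn't loaded, and install this CPU's hyp vectors.
 */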
static void __activate_traps(struct kvm_vcpu *vcpu)
{
	u64 val;

	___activate_traps(vcpu);
	__activate_traps_common(vcpu);

	val = CPTR_EL2_DEFAULT;
	val |= CPTR_EL2_TTA | CPTR_EL2_TAM;
	if (!update_fp_enabled(vcpu)) {
		val |= CPTR_EL2_TFP | CPTR_EL2_TZ;
		__activate_traps_fpsimd32(vcpu);
	}

	write_sysreg(val, cptr_el2);
	write_sysreg(__this_cpu_read(kvm_hyp_vector), vbar_el2);

	if (cpus_have_final_cap(ARM64_WORKAROUND_SPECULATIVE_AT)) {
		struct kvm_cpu_context *ctxt = &vcpu->arch.ctxt;

		isb();
		/*
		 * At this stage, and thanks to the above isb(), S2 is
		 * configured and enabled. We can now restore the guest's S1
		 * configuration: SCTLR, and only then TCR.
		 */
		write_sysreg_el1(ctxt_sys_reg(ctxt, SCTLR_EL1), SYS_SCTLR);
		isb();
		write_sysreg_el1(ctxt_sys_reg(ctxt, TCR_EL1), SYS_TCR);
	}
}

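/*
 * Undo the EL2 trap configuration installed by __activate_traps and
 * restore the host's: hand the SPE and trace buffers back, reset
 * CPTR_EL2 and point VBAR_EL2 at the host vectors again.
 */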
static void __deactivate_traps(struct kvm_vcpu *vcpu)
{
	extern char __kvm_hyp_host_vector[];
	u64 mdcr_el2, cptr;

	___deactivate_traps(vcpu);

	mdcr_el2 = read_sysreg(mdcr_el2);

	if (cpus_have_final_cap(ARM64_WORKAROUND_SPECULATIVE_AT)) {
		u64 val;

		/*
		 * Set the TCR and SCTLR registers in the exact opposite
		 * sequence as __activate_traps (first prevent walks,
		 * then force the MMU on). A generous sprinkling of isb()
		 * ensures that things happen in this exact order.
		 */
		val = read_sysreg_el1(SYS_TCR);
		write_sysreg_el1(val | TCR_EPD1_MASK | TCR_EPD0_MASK, SYS_TCR);
		isb();
		val = read_sysreg_el1(SYS_SCTLR);
		write_sysreg_el1(val | SCTLR_ELx_M, SYS_SCTLR);
		isb();
	}

	__deactivate_traps_common();

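	/*
	 * Preserve only the HPMN field of MDCR_EL2, and return the SPE
	 * (E2PB) and trace (E2TB) buffer controls to the host.
	 */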
	mdcr_el2 &= MDCR_EL2_HPMN_MASK;
	mdcr_el2 |= MDCR_EL2_E2PB_MASK << MDCR_EL2_E2PB_SHIFT;
	mdcr_el2 |= MDCR_EL2_E2TB_MASK << MDCR_EL2_E2TB_SHIFT;

	write_sysreg(mdcr_el2, mdcr_el2);
	write_sysreg(this_cpu_ptr(&kvm_init_params)->hcr_el2, hcr_el2);

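	/*
	 * Re-enable the SVE trap if the guest's SVE/FP state is still
	 * resident in the registers, so that a host SVE access traps
	 * and can be handled before that state is clobbered.
	 */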
	cptr = CPTR_EL2_DEFAULT;
	if (vcpu_has_sve(vcpu) && (vcpu->arch.flags & KVM_ARM64_FP_ENABLED))
		cptr |= CPTR_EL2_TZ;

	write_sysreg(cptr, cptr_el2);
	write_sysreg(__kvm_hyp_host_vector, vbar_el2);
}

/* Save VGICv3 state on non-VHE systems */
static void __hyp_vgic_save_state(struct kvm_vcpu *vcpu)
{
	if (static_branch_unlikely(&kvm_vgic_global_state.gicv3_cpuif)) {
		__vgic_v3_save_state(&vcpu->arch.vgic_cpu.vgic_v3);
		__vgic_v3_deactivate_traps(&vcpu->arch.vgic_cpu.vgic_v3);
	}
}

/* Restore VGICv3 state on non-VHE systems */
static void __hyp_vgic_restore_state(struct kvm_vcpu *vcpu)
{
	if (static_branch_unlikely(&kvm_vgic_global_state.gicv3_cpuif)) {
		__vgic_v3_activate_traps(&vcpu->arch.vgic_cpu.vgic_v3);
		__vgic_v3_restore_state(&vcpu->arch.vgic_cpu.vgic_v3);
	}
}

/*
 * Disable host events, enable guest events
 */
static bool __pmu_switch_to_guest(struct kvm_cpu_context *host_ctxt)
{
	struct kvm_host_data *host;
	struct kvm_pmu_events *pmu;

	host = container_of(host_ctxt, struct kvm_host_data, host_ctxt);
	pmu = &host->pmu_events;

	if (pmu->events_host)
		write_sysreg(pmu->events_host, pmcntenclr_el0);

	if (pmu->events_guest)
		write_sysreg(pmu->events_guest, pmcntenset_el0);

	return (pmu->events_host || pmu->events_guest);
}

/*
 * Disable guest events, enable host events
 */
static void __pmu_switch_to_host(struct kvm_cpu_context *host_ctxt)
{
	struct kvm_host_data *host;
	struct kvm_pmu_events *pmu;

	host = container_of(host_ctxt, struct kvm_host_data, host_ctxt);
	pmu = &host->pmu_events;

	if (pmu->events_guest)
		write_sysreg(pmu->events_guest, pmcntenclr_el0);

	if (pmu->events_host)
		write_sysreg(pmu->events_host, pmcntenset_el0);
}

/* Switch to the guest for legacy non-VHE systems */
int __kvm_vcpu_run(struct kvm_vcpu *vcpu)
{
	struct kvm_cpu_context *host_ctxt;
	struct kvm_cpu_context *guest_ctxt;
	bool pmu_switch_needed;
	u64 exit_code;

	/*
	 * Having IRQs masked via PMR when entering the guest means the GIC
	 * will not signal the CPU of interrupts of lower priority, and the
	 * only way to get out will be via guest exceptions.
	 * Naturally, we want to avoid this.
	 */
	if (system_uses_irq_prio_masking()) {
		gic_write_pmr(GIC_PRIO_IRQON | GIC_PRIO_PSR_I_SET);
		pmr_sync();
	}

	host_ctxt = &this_cpu_ptr(&kvm_host_data)->host_ctxt;
	host_ctxt->__hyp_running_vcpu = vcpu;
	guest_ctxt = &vcpu->arch.ctxt;

	pmu_switch_needed = __pmu_switch_to_guest(host_ctxt);

	__sysreg_save_state_nvhe(host_ctxt);
	/*
	 * We must flush and disable the SPE buffer for nVHE, as
	 * the translation regime (EL1&0) is going to be loaded with
	 * that of the guest. And we must do this before we change the
	 * translation regime to EL2 (via MDCR_EL2_E2PB == 0) and
	 * before we load guest Stage1.
	 */
	__debug_save_host_buffers_nvhe(vcpu);

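	/*
	 * Apply any PC adjustment queued by earlier emulation (a pending
	 * exception or an instruction-skip increment) before entering
	 * the guest.
	 */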
	__adjust_pc(vcpu);

	/*
	 * We must restore the 32-bit state before the sysregs, thanks
	 * to erratum #852523 (Cortex-A57) or #853709 (Cortex-A72).
	 *
	 * Also, and in order to be able to deal with erratum #1319537 (A57)
	 * and #1319367 (A72), we must ensure that all VM-related sysregs
	 * are restored before we enable S2 translation.
	 */
	__sysreg32_restore_state(vcpu);
	__sysreg_restore_state_nvhe(guest_ctxt);

	__load_guest_stage2(kern_hyp_va(vcpu->arch.hw_mmu));
	__activate_traps(vcpu);

	__hyp_vgic_restore_state(vcpu);
	__timer_enable_traps(vcpu);

	__debug_switch_to_guest(vcpu);

	do {
		/* Jump in the fire! */
		exit_code = __guest_enter(vcpu);

		/* And we're baaack! */
	} while (fixup_guest_exit(vcpu, &exit_code));

	__sysreg_save_state_nvhe(guest_ctxt);
	__sysreg32_save_state(vcpu);
	__timer_disable_traps(vcpu);
	__hyp_vgic_save_state(vcpu);

	__deactivate_traps(vcpu);
	__load_host_stage2();

	__sysreg_restore_state_nvhe(host_ctxt);

	if (vcpu->arch.flags & KVM_ARM64_FP_ENABLED)
		__fpsimd_save_fpexc32(vcpu);

	__debug_switch_to_host(vcpu);
	/*
	 * This must come after restoring the host sysregs, since a non-VHE
	 * system may enable SPE here and make use of the TTBRs.
	 */
	__debug_restore_host_buffers_nvhe(vcpu);

	if (pmu_switch_needed)
		__pmu_switch_to_host(host_ctxt);

	/* Returning to host will clear PSR.I, remask PMR if needed */
	if (system_uses_irq_prio_masking())
		gic_write_pmr(GIC_PRIO_IRQOFF);

	host_ctxt->__hyp_running_vcpu = NULL;

	return exit_code;
}

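/*
 * Unrecoverable hyp failure: restore enough host context to be able
 * to report the panic, then hand control to the host's panic path.
 */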
void __noreturn hyp_panic(void)
{
	u64 spsr = read_sysreg_el2(SYS_SPSR);
	u64 elr = read_sysreg_el2(SYS_ELR);
	u64 par = read_sysreg_par();
	struct kvm_cpu_context *host_ctxt;
	struct kvm_vcpu *vcpu;

	host_ctxt = &this_cpu_ptr(&kvm_host_data)->host_ctxt;
	vcpu = host_ctxt->__hyp_running_vcpu;

	if (vcpu) {
		__timer_disable_traps(vcpu);
		__deactivate_traps(vcpu);
		__load_host_stage2();
		__sysreg_restore_state_nvhe(host_ctxt);
	}

	__hyp_do_panic(host_ctxt, spsr, elr, par);
	unreachable();
}

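/* Called from the EL2 vectors when an exception hyp cannot handle is taken. */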
asmlinkage void kvm_unexpected_el2_exception(void)
{
	__kvm_unexpected_el2_exception();
}