// SPDX-License-Identifier: GPL-2.0-only
/*
 * Copyright (C) 2017 ARM Ltd.
 * Author: Marc Zyngier <marc.zyngier@arm.com>
 */

#include <linux/kvm_host.h>
#include <linux/random.h>
#include <linux/memblock.h>
#include <asm/alternative.h>
#include <asm/debug-monitors.h>
#include <asm/insn.h>
#include <asm/kvm_mmu.h>
#include <asm/memory.h>

/*
 * The LSB of the HYP VA tag
 */
static u8 tag_lsb;
/*
 * The HYP VA tag value with the region bit
 */
static u64 tag_val;
static u64 va_mask;

/*
 * Compute HYP VA by using the same computation as kern_hyp_va().
 */
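/*
 * Worked example (hypothetical values): with tag_lsb == 40 and
 * tag_val == 0x80, addr == 0xffff800012345678 becomes:
 *
 *	addr & va_mask         == 0x0000000012345678
 *	     | (tag_val << 40) == 0x0000800012345678
 */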
static u64 __early_kern_hyp_va(u64 addr)
{
	addr &= va_mask;
	addr |= tag_val << tag_lsb;
	return addr;
}
35*4882a593Smuzhiyun
/*
 * Store a hyp VA <-> PA offset into an EL2-owned variable.
 */
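/*
 * A minimal usage sketch (assuming EL2 helpers built on top of this
 * variable follow the same convention):
 *
 *	pa     = hyp_va + hyp_physvirt_offset;
 *	hyp_va = pa - hyp_physvirt_offset;
 */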
static void init_hyp_physvirt_offset(void)
{
	u64 kern_va, hyp_va;

	/* Compute the offset from the hyp VA and PA of a random symbol. */
	kern_va = (u64)lm_alias(__hyp_text_start);
	hyp_va = __early_kern_hyp_va(kern_va);
	hyp_physvirt_offset = (s64)__pa(kern_va) - (s64)hyp_va;
}
48*4882a593Smuzhiyun
/*
 * We want to generate a hyp VA with the following format (with V ==
 * vabits_actual):
 *
 *  63 ... V |     V-1    | V-2 .. tag_lsb | tag_lsb - 1 .. 0
 *  ---------------------------------------------------------
 * | 0000000 | hyp_va_msb |   random tag   |  kern linear VA |
 *           |--------- tag_val -----------|----- va_mask ---|
 *
 * which does not conflict with the idmap regions.
 */
__init void kvm_compute_layout(void)
{
	phys_addr_t idmap_addr = __pa_symbol(__hyp_idmap_text_start);
	u64 hyp_va_msb;

	/* Where is my RAM region? */
	hyp_va_msb  = idmap_addr & BIT(vabits_actual - 1);
	hyp_va_msb ^= BIT(vabits_actual - 1);

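	/*
	 * Any two linear-map addresses can only differ in bits
	 * [tag_lsb - 1, 0]; everything above is constant across the
	 * linear map and thus free to host the tag.
	 */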
	tag_lsb = fls64((u64)phys_to_virt(memblock_start_of_DRAM()) ^
			(u64)(high_memory - 1));

	va_mask = GENMASK_ULL(tag_lsb - 1, 0);
	tag_val = hyp_va_msb;

	if (IS_ENABLED(CONFIG_RANDOMIZE_BASE) && tag_lsb != (vabits_actual - 1)) {
		/* We have some free bits to insert a random tag. */
		tag_val |= get_random_long() & GENMASK_ULL(vabits_actual - 2, tag_lsb);
	}
	tag_val >>= tag_lsb;

	init_hyp_physvirt_offset();
}
83*4882a593Smuzhiyun
/*
 * The .hyp.reloc ELF section contains a list of kimg positions that
 * contain kimg VAs but will be accessed only in hyp execution context.
 * Convert them to hyp VAs. See gen-hyprel.c for more details.
 */
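/*
 * Example (hypothetical numbers): an entry at kimg address A holding
 * the value 0x1000 points at the word at A + 0x1000; that word holds
 * a kimg VA and is rewritten, via its linear-map alias, to the
 * matching hyp VA.
 */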
__init void kvm_apply_hyp_relocations(void)
{
	int32_t *rel;
	int32_t *begin = (int32_t *)__hyp_reloc_begin;
	int32_t *end = (int32_t *)__hyp_reloc_end;

	for (rel = begin; rel < end; ++rel) {
		uintptr_t *ptr, kimg_va;

		/*
		 * Each entry contains a 32-bit relative offset from itself
		 * to a kimg VA position.
		 */
		ptr = (uintptr_t *)lm_alias((char *)rel + *rel);

		/* Read the kimg VA value at the relocation address. */
		kimg_va = *ptr;

		/* Convert to hyp VA and store back to the relocation address. */
		*ptr = __early_kern_hyp_va((uintptr_t)lm_alias(kimg_va));
	}
}

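/*
 * Generate the n-th instruction of the 5-slot kern_hyp_va patch
 * sequence, which ends up looking roughly like this (rd == rn in
 * practice, since the patched slots use a single register):
 *
 *	and	rd, rn, #va_mask		// keep the linear-map bits
 *	ror	rd, rn, #tag_lsb		// rotate tag area down to bit 0
 *	add	rd, rn, #(tag_val & 0xfff)	// insert tag, low 12 bits
 *	add	rd, rn, #(tag_val & 0xfff000)	// insert tag, high 12 bits
 *	ror	rd, rn, #(64 - tag_lsb)		// rotate back into place
 */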
static u32 compute_instruction(int n, u32 rd, u32 rn)
{
	u32 insn = AARCH64_BREAK_FAULT;

	switch (n) {
	case 0:
		insn = aarch64_insn_gen_logical_immediate(AARCH64_INSN_LOGIC_AND,
							  AARCH64_INSN_VARIANT_64BIT,
							  rn, rd, va_mask);
		break;

	case 1:
		/* ROR is a variant of EXTR with Rm = Rn */
		insn = aarch64_insn_gen_extr(AARCH64_INSN_VARIANT_64BIT,
					     rn, rn, rd,
					     tag_lsb);
		break;

	case 2:
		insn = aarch64_insn_gen_add_sub_imm(rd, rn,
						    tag_val & GENMASK(11, 0),
						    AARCH64_INSN_VARIANT_64BIT,
						    AARCH64_INSN_ADSB_ADD);
		break;

	case 3:
		insn = aarch64_insn_gen_add_sub_imm(rd, rn,
						    tag_val & GENMASK(23, 12),
						    AARCH64_INSN_VARIANT_64BIT,
						    AARCH64_INSN_ADSB_ADD);
		break;

	case 4:
		/* ROR is a variant of EXTR with Rm = Rn */
		insn = aarch64_insn_gen_extr(AARCH64_INSN_VARIANT_64BIT,
					     rn, rn, rd, 64 - tag_lsb);
		break;
	}

	return insn;
}

void __init kvm_update_va_mask(struct alt_instr *alt,
			       __le32 *origptr, __le32 *updptr, int nr_inst)
{
	int i;

	BUG_ON(nr_inst != 5);

	for (i = 0; i < nr_inst; i++) {
		u32 rd, rn, insn, oinsn;

		/*
		 * VHE doesn't need any address translation, let's NOP
		 * everything.
		 *
		 * Alternatively, if the tag is zero (because the layout
		 * dictates it and we don't have any spare bits in the
		 * address), NOP everything after masking the kernel VA.
		 */
		if (has_vhe() || (!tag_val && i > 0)) {
			updptr[i] = cpu_to_le32(aarch64_insn_gen_nop());
			continue;
		}

		oinsn = le32_to_cpu(origptr[i]);
		rd = aarch64_insn_decode_register(AARCH64_INSN_REGTYPE_RD, oinsn);
		rn = aarch64_insn_decode_register(AARCH64_INSN_REGTYPE_RN, oinsn);

		insn = compute_instruction(i, rd, rn);
		BUG_ON(insn == AARCH64_BREAK_FAULT);

		updptr[i] = cpu_to_le32(insn);
	}
}

void kvm_patch_vector_branch(struct alt_instr *alt,
			     __le32 *origptr, __le32 *updptr, int nr_inst)
{
	u64 addr;
	u32 insn;

	BUG_ON(nr_inst != 4);

	if (!cpus_have_const_cap(ARM64_SPECTRE_V3A) || WARN_ON_ONCE(has_vhe()))
		return;

	/*
	 * Compute HYP VA by using the same computation as kern_hyp_va()
	 */
	addr = __early_kern_hyp_va((u64)kvm_ksym_ref(__kvm_hyp_vector));

	/*
	 * Use PC[10:7] to branch to the same vector in KVM: vector
	 * entries are 0x80 bytes apart, so these four bits select one
	 * of the 16 slots of a 2kB-aligned vector table.
	 */
	addr |= ((u64)origptr & GENMASK_ULL(10, 7));

	/*
	 * Branch over the preamble in order to avoid the initial store on
	 * the stack (which we already perform in the hardening vectors).
	 */
	addr += KVM_VECTOR_PREAMBLE;

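	/*
	 * Emit the patched sequence, a sketch of which is:
	 *
	 *	movz	x0, #(addr & 0xffff)
	 *	movk	x0, #((addr >> 16) & 0xffff), lsl #16
	 *	movk	x0, #((addr >> 32) & 0xffff), lsl #32
	 *	br	x0
	 *
	 * i.e. materialize the target, which is only known at runtime,
	 * and branch indirectly, as a direct B might not reach it.
	 */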
	/* movz x0, #(addr & 0xffff) */
	insn = aarch64_insn_gen_movewide(AARCH64_INSN_REG_0,
					 (u16)addr,
					 0,
					 AARCH64_INSN_VARIANT_64BIT,
					 AARCH64_INSN_MOVEWIDE_ZERO);
	*updptr++ = cpu_to_le32(insn);

	/* movk x0, #((addr >> 16) & 0xffff), lsl #16 */
	insn = aarch64_insn_gen_movewide(AARCH64_INSN_REG_0,
					 (u16)(addr >> 16),
					 16,
					 AARCH64_INSN_VARIANT_64BIT,
					 AARCH64_INSN_MOVEWIDE_KEEP);
	*updptr++ = cpu_to_le32(insn);

	/* movk x0, #((addr >> 32) & 0xffff), lsl #32 */
	insn = aarch64_insn_gen_movewide(AARCH64_INSN_REG_0,
					 (u16)(addr >> 32),
					 32,
					 AARCH64_INSN_VARIANT_64BIT,
					 AARCH64_INSN_MOVEWIDE_KEEP);
	*updptr++ = cpu_to_le32(insn);

	/* br x0 */
	insn = aarch64_insn_gen_branch_reg(AARCH64_INSN_REG_0,
					   AARCH64_INSN_BRANCH_NOLINK);
	*updptr++ = cpu_to_le32(insn);
}

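/*
 * Patch a 4-instruction slot with a movz/movk sequence that builds the
 * 64-bit constant @val in the destination register of the original
 * first instruction.
 */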
static void generate_mov_q(u64 val, __le32 *origptr, __le32 *updptr, int nr_inst)
{
	u32 insn, oinsn, rd;

	BUG_ON(nr_inst != 4);

	/* Compute target register */
	oinsn = le32_to_cpu(*origptr);
	rd = aarch64_insn_decode_register(AARCH64_INSN_REGTYPE_RD, oinsn);

	/* movz rd, #(val & 0xffff) */
	insn = aarch64_insn_gen_movewide(rd,
					 (u16)val,
					 0,
					 AARCH64_INSN_VARIANT_64BIT,
					 AARCH64_INSN_MOVEWIDE_ZERO);
	*updptr++ = cpu_to_le32(insn);

	/* movk rd, #((val >> 16) & 0xffff), lsl #16 */
	insn = aarch64_insn_gen_movewide(rd,
					 (u16)(val >> 16),
					 16,
					 AARCH64_INSN_VARIANT_64BIT,
					 AARCH64_INSN_MOVEWIDE_KEEP);
	*updptr++ = cpu_to_le32(insn);

	/* movk rd, #((val >> 32) & 0xffff), lsl #32 */
	insn = aarch64_insn_gen_movewide(rd,
					 (u16)(val >> 32),
					 32,
					 AARCH64_INSN_VARIANT_64BIT,
					 AARCH64_INSN_MOVEWIDE_KEEP);
	*updptr++ = cpu_to_le32(insn);

	/* movk rd, #((val >> 48) & 0xffff), lsl #48 */
	insn = aarch64_insn_gen_movewide(rd,
					 (u16)(val >> 48),
					 48,
					 AARCH64_INSN_VARIANT_64BIT,
					 AARCH64_INSN_MOVEWIDE_KEEP);
	*updptr++ = cpu_to_le32(insn);
}

void kvm_get_kimage_voffset(struct alt_instr *alt,
			    __le32 *origptr, __le32 *updptr, int nr_inst)
{
	generate_mov_q(kimage_voffset, origptr, updptr, nr_inst);
}

void kvm_compute_final_ctr_el0(struct alt_instr *alt,
			       __le32 *origptr, __le32 *updptr, int nr_inst)
{
	generate_mov_q(read_sanitised_ftr_reg(SYS_CTR_EL0),
		       origptr, updptr, nr_inst);
}