xref: /OK3568_Linux_fs/kernel/arch/s390/kvm/gaccess.c (revision 4882a59341e53eb6f0b4789bf948001014eff981)
1*4882a593Smuzhiyun // SPDX-License-Identifier: GPL-2.0
2*4882a593Smuzhiyun /*
3*4882a593Smuzhiyun  * guest access functions
4*4882a593Smuzhiyun  *
5*4882a593Smuzhiyun  * Copyright IBM Corp. 2014
6*4882a593Smuzhiyun  *
7*4882a593Smuzhiyun  */
8*4882a593Smuzhiyun 
9*4882a593Smuzhiyun #include <linux/vmalloc.h>
10*4882a593Smuzhiyun #include <linux/mm_types.h>
11*4882a593Smuzhiyun #include <linux/err.h>
12*4882a593Smuzhiyun #include <linux/pgtable.h>
13*4882a593Smuzhiyun 
14*4882a593Smuzhiyun #include <asm/gmap.h>
15*4882a593Smuzhiyun #include "kvm-s390.h"
16*4882a593Smuzhiyun #include "gaccess.h"
17*4882a593Smuzhiyun #include <asm/switch_to.h>
18*4882a593Smuzhiyun 
19*4882a593Smuzhiyun union asce {
20*4882a593Smuzhiyun 	unsigned long val;
21*4882a593Smuzhiyun 	struct {
22*4882a593Smuzhiyun 		unsigned long origin : 52; /* Region- or Segment-Table Origin */
23*4882a593Smuzhiyun 		unsigned long	 : 2;
24*4882a593Smuzhiyun 		unsigned long g  : 1; /* Subspace Group Control */
25*4882a593Smuzhiyun 		unsigned long p  : 1; /* Private Space Control */
26*4882a593Smuzhiyun 		unsigned long s  : 1; /* Storage-Alteration-Event Control */
27*4882a593Smuzhiyun 		unsigned long x  : 1; /* Space-Switch-Event Control */
28*4882a593Smuzhiyun 		unsigned long r  : 1; /* Real-Space Control */
29*4882a593Smuzhiyun 		unsigned long	 : 1;
30*4882a593Smuzhiyun 		unsigned long dt : 2; /* Designation-Type Control */
31*4882a593Smuzhiyun 		unsigned long tl : 2; /* Region- or Segment-Table Length */
32*4882a593Smuzhiyun 	};
33*4882a593Smuzhiyun };
34*4882a593Smuzhiyun 
35*4882a593Smuzhiyun enum {
36*4882a593Smuzhiyun 	ASCE_TYPE_SEGMENT = 0,
37*4882a593Smuzhiyun 	ASCE_TYPE_REGION3 = 1,
38*4882a593Smuzhiyun 	ASCE_TYPE_REGION2 = 2,
39*4882a593Smuzhiyun 	ASCE_TYPE_REGION1 = 3
40*4882a593Smuzhiyun };
41*4882a593Smuzhiyun 
42*4882a593Smuzhiyun union region1_table_entry {
43*4882a593Smuzhiyun 	unsigned long val;
44*4882a593Smuzhiyun 	struct {
45*4882a593Smuzhiyun 		unsigned long rto: 52;/* Region-Table Origin */
46*4882a593Smuzhiyun 		unsigned long	 : 2;
47*4882a593Smuzhiyun 		unsigned long p  : 1; /* DAT-Protection Bit */
48*4882a593Smuzhiyun 		unsigned long	 : 1;
49*4882a593Smuzhiyun 		unsigned long tf : 2; /* Region-Second-Table Offset */
50*4882a593Smuzhiyun 		unsigned long i  : 1; /* Region-Invalid Bit */
51*4882a593Smuzhiyun 		unsigned long	 : 1;
52*4882a593Smuzhiyun 		unsigned long tt : 2; /* Table-Type Bits */
53*4882a593Smuzhiyun 		unsigned long tl : 2; /* Region-Second-Table Length */
54*4882a593Smuzhiyun 	};
55*4882a593Smuzhiyun };
56*4882a593Smuzhiyun 
57*4882a593Smuzhiyun union region2_table_entry {
58*4882a593Smuzhiyun 	unsigned long val;
59*4882a593Smuzhiyun 	struct {
60*4882a593Smuzhiyun 		unsigned long rto: 52;/* Region-Table Origin */
61*4882a593Smuzhiyun 		unsigned long	 : 2;
62*4882a593Smuzhiyun 		unsigned long p  : 1; /* DAT-Protection Bit */
63*4882a593Smuzhiyun 		unsigned long	 : 1;
64*4882a593Smuzhiyun 		unsigned long tf : 2; /* Region-Third-Table Offset */
65*4882a593Smuzhiyun 		unsigned long i  : 1; /* Region-Invalid Bit */
66*4882a593Smuzhiyun 		unsigned long	 : 1;
67*4882a593Smuzhiyun 		unsigned long tt : 2; /* Table-Type Bits */
68*4882a593Smuzhiyun 		unsigned long tl : 2; /* Region-Third-Table Length */
69*4882a593Smuzhiyun 	};
70*4882a593Smuzhiyun };
71*4882a593Smuzhiyun 
72*4882a593Smuzhiyun struct region3_table_entry_fc0 {
73*4882a593Smuzhiyun 	unsigned long sto: 52;/* Segment-Table Origin */
74*4882a593Smuzhiyun 	unsigned long	 : 1;
75*4882a593Smuzhiyun 	unsigned long fc : 1; /* Format-Control */
76*4882a593Smuzhiyun 	unsigned long p  : 1; /* DAT-Protection Bit */
77*4882a593Smuzhiyun 	unsigned long	 : 1;
78*4882a593Smuzhiyun 	unsigned long tf : 2; /* Segment-Table Offset */
79*4882a593Smuzhiyun 	unsigned long i  : 1; /* Region-Invalid Bit */
80*4882a593Smuzhiyun 	unsigned long cr : 1; /* Common-Region Bit */
81*4882a593Smuzhiyun 	unsigned long tt : 2; /* Table-Type Bits */
82*4882a593Smuzhiyun 	unsigned long tl : 2; /* Segment-Table Length */
83*4882a593Smuzhiyun };
84*4882a593Smuzhiyun 
85*4882a593Smuzhiyun struct region3_table_entry_fc1 {
86*4882a593Smuzhiyun 	unsigned long rfaa : 33; /* Region-Frame Absolute Address */
87*4882a593Smuzhiyun 	unsigned long	 : 14;
88*4882a593Smuzhiyun 	unsigned long av : 1; /* ACCF-Validity Control */
89*4882a593Smuzhiyun 	unsigned long acc: 4; /* Access-Control Bits */
90*4882a593Smuzhiyun 	unsigned long f  : 1; /* Fetch-Protection Bit */
91*4882a593Smuzhiyun 	unsigned long fc : 1; /* Format-Control */
92*4882a593Smuzhiyun 	unsigned long p  : 1; /* DAT-Protection Bit */
93*4882a593Smuzhiyun 	unsigned long iep: 1; /* Instruction-Execution-Protection */
94*4882a593Smuzhiyun 	unsigned long	 : 2;
95*4882a593Smuzhiyun 	unsigned long i  : 1; /* Region-Invalid Bit */
96*4882a593Smuzhiyun 	unsigned long cr : 1; /* Common-Region Bit */
97*4882a593Smuzhiyun 	unsigned long tt : 2; /* Table-Type Bits */
98*4882a593Smuzhiyun 	unsigned long	 : 2;
99*4882a593Smuzhiyun };
100*4882a593Smuzhiyun 
101*4882a593Smuzhiyun union region3_table_entry {
102*4882a593Smuzhiyun 	unsigned long val;
103*4882a593Smuzhiyun 	struct region3_table_entry_fc0 fc0;
104*4882a593Smuzhiyun 	struct region3_table_entry_fc1 fc1;
105*4882a593Smuzhiyun 	struct {
106*4882a593Smuzhiyun 		unsigned long	 : 53;
107*4882a593Smuzhiyun 		unsigned long fc : 1; /* Format-Control */
108*4882a593Smuzhiyun 		unsigned long	 : 4;
109*4882a593Smuzhiyun 		unsigned long i  : 1; /* Region-Invalid Bit */
110*4882a593Smuzhiyun 		unsigned long cr : 1; /* Common-Region Bit */
111*4882a593Smuzhiyun 		unsigned long tt : 2; /* Table-Type Bits */
112*4882a593Smuzhiyun 		unsigned long	 : 2;
113*4882a593Smuzhiyun 	};
114*4882a593Smuzhiyun };
115*4882a593Smuzhiyun 
116*4882a593Smuzhiyun struct segment_entry_fc0 {
117*4882a593Smuzhiyun 	unsigned long pto: 53;/* Page-Table Origin */
118*4882a593Smuzhiyun 	unsigned long fc : 1; /* Format-Control */
119*4882a593Smuzhiyun 	unsigned long p  : 1; /* DAT-Protection Bit */
120*4882a593Smuzhiyun 	unsigned long	 : 3;
121*4882a593Smuzhiyun 	unsigned long i  : 1; /* Segment-Invalid Bit */
122*4882a593Smuzhiyun 	unsigned long cs : 1; /* Common-Segment Bit */
123*4882a593Smuzhiyun 	unsigned long tt : 2; /* Table-Type Bits */
124*4882a593Smuzhiyun 	unsigned long	 : 2;
125*4882a593Smuzhiyun };
126*4882a593Smuzhiyun 
127*4882a593Smuzhiyun struct segment_entry_fc1 {
128*4882a593Smuzhiyun 	unsigned long sfaa : 44; /* Segment-Frame Absolute Address */
129*4882a593Smuzhiyun 	unsigned long	 : 3;
130*4882a593Smuzhiyun 	unsigned long av : 1; /* ACCF-Validity Control */
131*4882a593Smuzhiyun 	unsigned long acc: 4; /* Access-Control Bits */
132*4882a593Smuzhiyun 	unsigned long f  : 1; /* Fetch-Protection Bit */
133*4882a593Smuzhiyun 	unsigned long fc : 1; /* Format-Control */
134*4882a593Smuzhiyun 	unsigned long p  : 1; /* DAT-Protection Bit */
135*4882a593Smuzhiyun 	unsigned long iep: 1; /* Instruction-Execution-Protection */
136*4882a593Smuzhiyun 	unsigned long	 : 2;
137*4882a593Smuzhiyun 	unsigned long i  : 1; /* Segment-Invalid Bit */
138*4882a593Smuzhiyun 	unsigned long cs : 1; /* Common-Segment Bit */
139*4882a593Smuzhiyun 	unsigned long tt : 2; /* Table-Type Bits */
140*4882a593Smuzhiyun 	unsigned long	 : 2;
141*4882a593Smuzhiyun };
142*4882a593Smuzhiyun 
143*4882a593Smuzhiyun union segment_table_entry {
144*4882a593Smuzhiyun 	unsigned long val;
145*4882a593Smuzhiyun 	struct segment_entry_fc0 fc0;
146*4882a593Smuzhiyun 	struct segment_entry_fc1 fc1;
147*4882a593Smuzhiyun 	struct {
148*4882a593Smuzhiyun 		unsigned long	 : 53;
149*4882a593Smuzhiyun 		unsigned long fc : 1; /* Format-Control */
150*4882a593Smuzhiyun 		unsigned long	 : 4;
151*4882a593Smuzhiyun 		unsigned long i  : 1; /* Segment-Invalid Bit */
152*4882a593Smuzhiyun 		unsigned long cs : 1; /* Common-Segment Bit */
153*4882a593Smuzhiyun 		unsigned long tt : 2; /* Table-Type Bits */
154*4882a593Smuzhiyun 		unsigned long	 : 2;
155*4882a593Smuzhiyun 	};
156*4882a593Smuzhiyun };
157*4882a593Smuzhiyun 
158*4882a593Smuzhiyun enum {
159*4882a593Smuzhiyun 	TABLE_TYPE_SEGMENT = 0,
160*4882a593Smuzhiyun 	TABLE_TYPE_REGION3 = 1,
161*4882a593Smuzhiyun 	TABLE_TYPE_REGION2 = 2,
162*4882a593Smuzhiyun 	TABLE_TYPE_REGION1 = 3
163*4882a593Smuzhiyun };
164*4882a593Smuzhiyun 
165*4882a593Smuzhiyun union page_table_entry {
166*4882a593Smuzhiyun 	unsigned long val;
167*4882a593Smuzhiyun 	struct {
168*4882a593Smuzhiyun 		unsigned long pfra : 52; /* Page-Frame Real Address */
169*4882a593Smuzhiyun 		unsigned long z  : 1; /* Zero Bit */
170*4882a593Smuzhiyun 		unsigned long i  : 1; /* Page-Invalid Bit */
171*4882a593Smuzhiyun 		unsigned long p  : 1; /* DAT-Protection Bit */
172*4882a593Smuzhiyun 		unsigned long iep: 1; /* Instruction-Execution-Protection */
173*4882a593Smuzhiyun 		unsigned long	 : 8;
174*4882a593Smuzhiyun 	};
175*4882a593Smuzhiyun };
176*4882a593Smuzhiyun 
177*4882a593Smuzhiyun /*
178*4882a593Smuzhiyun  * vaddress union in order to easily decode a virtual address into its
179*4882a593Smuzhiyun  * region first index, region second index etc. parts.
180*4882a593Smuzhiyun  */
181*4882a593Smuzhiyun union vaddress {
182*4882a593Smuzhiyun 	unsigned long addr;
183*4882a593Smuzhiyun 	struct {
184*4882a593Smuzhiyun 		unsigned long rfx : 11;
185*4882a593Smuzhiyun 		unsigned long rsx : 11;
186*4882a593Smuzhiyun 		unsigned long rtx : 11;
187*4882a593Smuzhiyun 		unsigned long sx  : 11;
188*4882a593Smuzhiyun 		unsigned long px  : 8;
189*4882a593Smuzhiyun 		unsigned long bx  : 12;
190*4882a593Smuzhiyun 	};
191*4882a593Smuzhiyun 	struct {
192*4882a593Smuzhiyun 		unsigned long rfx01 : 2;
193*4882a593Smuzhiyun 		unsigned long	    : 9;
194*4882a593Smuzhiyun 		unsigned long rsx01 : 2;
195*4882a593Smuzhiyun 		unsigned long	    : 9;
196*4882a593Smuzhiyun 		unsigned long rtx01 : 2;
197*4882a593Smuzhiyun 		unsigned long	    : 9;
198*4882a593Smuzhiyun 		unsigned long sx01  : 2;
199*4882a593Smuzhiyun 		unsigned long	    : 29;
200*4882a593Smuzhiyun 	};
201*4882a593Smuzhiyun };
202*4882a593Smuzhiyun 
203*4882a593Smuzhiyun /*
204*4882a593Smuzhiyun  * raddress union which will contain the result (real or absolute address)
205*4882a593Smuzhiyun  * after a page table walk. The rfaa, sfaa and pfra members are used to
206*4882a593Smuzhiyun  * simply assign them the value of a region, segment or page table entry.
207*4882a593Smuzhiyun  */
208*4882a593Smuzhiyun union raddress {
209*4882a593Smuzhiyun 	unsigned long addr;
210*4882a593Smuzhiyun 	unsigned long rfaa : 33; /* Region-Frame Absolute Address */
211*4882a593Smuzhiyun 	unsigned long sfaa : 44; /* Segment-Frame Absolute Address */
212*4882a593Smuzhiyun 	unsigned long pfra : 52; /* Page-Frame Real Address */
213*4882a593Smuzhiyun };
214*4882a593Smuzhiyun 
215*4882a593Smuzhiyun union alet {
216*4882a593Smuzhiyun 	u32 val;
217*4882a593Smuzhiyun 	struct {
218*4882a593Smuzhiyun 		u32 reserved : 7;
219*4882a593Smuzhiyun 		u32 p        : 1;
220*4882a593Smuzhiyun 		u32 alesn    : 8;
221*4882a593Smuzhiyun 		u32 alen     : 16;
222*4882a593Smuzhiyun 	};
223*4882a593Smuzhiyun };
224*4882a593Smuzhiyun 
225*4882a593Smuzhiyun union ald {
226*4882a593Smuzhiyun 	u32 val;
227*4882a593Smuzhiyun 	struct {
228*4882a593Smuzhiyun 		u32     : 1;
229*4882a593Smuzhiyun 		u32 alo : 24;
230*4882a593Smuzhiyun 		u32 all : 7;
231*4882a593Smuzhiyun 	};
232*4882a593Smuzhiyun };
233*4882a593Smuzhiyun 
234*4882a593Smuzhiyun struct ale {
235*4882a593Smuzhiyun 	unsigned long i      : 1; /* ALEN-Invalid Bit */
236*4882a593Smuzhiyun 	unsigned long        : 5;
237*4882a593Smuzhiyun 	unsigned long fo     : 1; /* Fetch-Only Bit */
238*4882a593Smuzhiyun 	unsigned long p      : 1; /* Private Bit */
239*4882a593Smuzhiyun 	unsigned long alesn  : 8; /* Access-List-Entry Sequence Number */
240*4882a593Smuzhiyun 	unsigned long aleax  : 16; /* Access-List-Entry Authorization Index */
241*4882a593Smuzhiyun 	unsigned long        : 32;
242*4882a593Smuzhiyun 	unsigned long        : 1;
243*4882a593Smuzhiyun 	unsigned long asteo  : 25; /* ASN-Second-Table-Entry Origin */
244*4882a593Smuzhiyun 	unsigned long        : 6;
245*4882a593Smuzhiyun 	unsigned long astesn : 32; /* ASTE Sequence Number */
246*4882a593Smuzhiyun };
247*4882a593Smuzhiyun 
248*4882a593Smuzhiyun struct aste {
249*4882a593Smuzhiyun 	unsigned long i      : 1; /* ASX-Invalid Bit */
250*4882a593Smuzhiyun 	unsigned long ato    : 29; /* Authority-Table Origin */
251*4882a593Smuzhiyun 	unsigned long        : 1;
252*4882a593Smuzhiyun 	unsigned long b      : 1; /* Base-Space Bit */
253*4882a593Smuzhiyun 	unsigned long ax     : 16; /* Authorization Index */
254*4882a593Smuzhiyun 	unsigned long atl    : 12; /* Authority-Table Length */
255*4882a593Smuzhiyun 	unsigned long        : 2;
256*4882a593Smuzhiyun 	unsigned long ca     : 1; /* Controlled-ASN Bit */
257*4882a593Smuzhiyun 	unsigned long ra     : 1; /* Reusable-ASN Bit */
258*4882a593Smuzhiyun 	unsigned long asce   : 64; /* Address-Space-Control Element */
259*4882a593Smuzhiyun 	unsigned long ald    : 32;
260*4882a593Smuzhiyun 	unsigned long astesn : 32;
261*4882a593Smuzhiyun 	/* .. more fields there */
262*4882a593Smuzhiyun };
263*4882a593Smuzhiyun 
ipte_lock_held(struct kvm_vcpu * vcpu)264*4882a593Smuzhiyun int ipte_lock_held(struct kvm_vcpu *vcpu)
265*4882a593Smuzhiyun {
266*4882a593Smuzhiyun 	if (vcpu->arch.sie_block->eca & ECA_SII) {
267*4882a593Smuzhiyun 		int rc;
268*4882a593Smuzhiyun 
269*4882a593Smuzhiyun 		read_lock(&vcpu->kvm->arch.sca_lock);
270*4882a593Smuzhiyun 		rc = kvm_s390_get_ipte_control(vcpu->kvm)->kh != 0;
271*4882a593Smuzhiyun 		read_unlock(&vcpu->kvm->arch.sca_lock);
272*4882a593Smuzhiyun 		return rc;
273*4882a593Smuzhiyun 	}
274*4882a593Smuzhiyun 	return vcpu->kvm->arch.ipte_lock_count != 0;
275*4882a593Smuzhiyun }
276*4882a593Smuzhiyun 
ipte_lock_simple(struct kvm_vcpu * vcpu)277*4882a593Smuzhiyun static void ipte_lock_simple(struct kvm_vcpu *vcpu)
278*4882a593Smuzhiyun {
279*4882a593Smuzhiyun 	union ipte_control old, new, *ic;
280*4882a593Smuzhiyun 
281*4882a593Smuzhiyun 	mutex_lock(&vcpu->kvm->arch.ipte_mutex);
282*4882a593Smuzhiyun 	vcpu->kvm->arch.ipte_lock_count++;
283*4882a593Smuzhiyun 	if (vcpu->kvm->arch.ipte_lock_count > 1)
284*4882a593Smuzhiyun 		goto out;
285*4882a593Smuzhiyun retry:
286*4882a593Smuzhiyun 	read_lock(&vcpu->kvm->arch.sca_lock);
287*4882a593Smuzhiyun 	ic = kvm_s390_get_ipte_control(vcpu->kvm);
288*4882a593Smuzhiyun 	do {
289*4882a593Smuzhiyun 		old = READ_ONCE(*ic);
290*4882a593Smuzhiyun 		if (old.k) {
291*4882a593Smuzhiyun 			read_unlock(&vcpu->kvm->arch.sca_lock);
292*4882a593Smuzhiyun 			cond_resched();
293*4882a593Smuzhiyun 			goto retry;
294*4882a593Smuzhiyun 		}
295*4882a593Smuzhiyun 		new = old;
296*4882a593Smuzhiyun 		new.k = 1;
297*4882a593Smuzhiyun 	} while (cmpxchg(&ic->val, old.val, new.val) != old.val);
298*4882a593Smuzhiyun 	read_unlock(&vcpu->kvm->arch.sca_lock);
299*4882a593Smuzhiyun out:
300*4882a593Smuzhiyun 	mutex_unlock(&vcpu->kvm->arch.ipte_mutex);
301*4882a593Smuzhiyun }
302*4882a593Smuzhiyun 
ipte_unlock_simple(struct kvm_vcpu * vcpu)303*4882a593Smuzhiyun static void ipte_unlock_simple(struct kvm_vcpu *vcpu)
304*4882a593Smuzhiyun {
305*4882a593Smuzhiyun 	union ipte_control old, new, *ic;
306*4882a593Smuzhiyun 
307*4882a593Smuzhiyun 	mutex_lock(&vcpu->kvm->arch.ipte_mutex);
308*4882a593Smuzhiyun 	vcpu->kvm->arch.ipte_lock_count--;
309*4882a593Smuzhiyun 	if (vcpu->kvm->arch.ipte_lock_count)
310*4882a593Smuzhiyun 		goto out;
311*4882a593Smuzhiyun 	read_lock(&vcpu->kvm->arch.sca_lock);
312*4882a593Smuzhiyun 	ic = kvm_s390_get_ipte_control(vcpu->kvm);
313*4882a593Smuzhiyun 	do {
314*4882a593Smuzhiyun 		old = READ_ONCE(*ic);
315*4882a593Smuzhiyun 		new = old;
316*4882a593Smuzhiyun 		new.k = 0;
317*4882a593Smuzhiyun 	} while (cmpxchg(&ic->val, old.val, new.val) != old.val);
318*4882a593Smuzhiyun 	read_unlock(&vcpu->kvm->arch.sca_lock);
319*4882a593Smuzhiyun 	wake_up(&vcpu->kvm->arch.ipte_wq);
320*4882a593Smuzhiyun out:
321*4882a593Smuzhiyun 	mutex_unlock(&vcpu->kvm->arch.ipte_mutex);
322*4882a593Smuzhiyun }
323*4882a593Smuzhiyun 
ipte_lock_siif(struct kvm_vcpu * vcpu)324*4882a593Smuzhiyun static void ipte_lock_siif(struct kvm_vcpu *vcpu)
325*4882a593Smuzhiyun {
326*4882a593Smuzhiyun 	union ipte_control old, new, *ic;
327*4882a593Smuzhiyun 
328*4882a593Smuzhiyun retry:
329*4882a593Smuzhiyun 	read_lock(&vcpu->kvm->arch.sca_lock);
330*4882a593Smuzhiyun 	ic = kvm_s390_get_ipte_control(vcpu->kvm);
331*4882a593Smuzhiyun 	do {
332*4882a593Smuzhiyun 		old = READ_ONCE(*ic);
333*4882a593Smuzhiyun 		if (old.kg) {
334*4882a593Smuzhiyun 			read_unlock(&vcpu->kvm->arch.sca_lock);
335*4882a593Smuzhiyun 			cond_resched();
336*4882a593Smuzhiyun 			goto retry;
337*4882a593Smuzhiyun 		}
338*4882a593Smuzhiyun 		new = old;
339*4882a593Smuzhiyun 		new.k = 1;
340*4882a593Smuzhiyun 		new.kh++;
341*4882a593Smuzhiyun 	} while (cmpxchg(&ic->val, old.val, new.val) != old.val);
342*4882a593Smuzhiyun 	read_unlock(&vcpu->kvm->arch.sca_lock);
343*4882a593Smuzhiyun }
344*4882a593Smuzhiyun 
ipte_unlock_siif(struct kvm_vcpu * vcpu)345*4882a593Smuzhiyun static void ipte_unlock_siif(struct kvm_vcpu *vcpu)
346*4882a593Smuzhiyun {
347*4882a593Smuzhiyun 	union ipte_control old, new, *ic;
348*4882a593Smuzhiyun 
349*4882a593Smuzhiyun 	read_lock(&vcpu->kvm->arch.sca_lock);
350*4882a593Smuzhiyun 	ic = kvm_s390_get_ipte_control(vcpu->kvm);
351*4882a593Smuzhiyun 	do {
352*4882a593Smuzhiyun 		old = READ_ONCE(*ic);
353*4882a593Smuzhiyun 		new = old;
354*4882a593Smuzhiyun 		new.kh--;
355*4882a593Smuzhiyun 		if (!new.kh)
356*4882a593Smuzhiyun 			new.k = 0;
357*4882a593Smuzhiyun 	} while (cmpxchg(&ic->val, old.val, new.val) != old.val);
358*4882a593Smuzhiyun 	read_unlock(&vcpu->kvm->arch.sca_lock);
359*4882a593Smuzhiyun 	if (!new.kh)
360*4882a593Smuzhiyun 		wake_up(&vcpu->kvm->arch.ipte_wq);
361*4882a593Smuzhiyun }
362*4882a593Smuzhiyun 
ipte_lock(struct kvm_vcpu * vcpu)363*4882a593Smuzhiyun void ipte_lock(struct kvm_vcpu *vcpu)
364*4882a593Smuzhiyun {
365*4882a593Smuzhiyun 	if (vcpu->arch.sie_block->eca & ECA_SII)
366*4882a593Smuzhiyun 		ipte_lock_siif(vcpu);
367*4882a593Smuzhiyun 	else
368*4882a593Smuzhiyun 		ipte_lock_simple(vcpu);
369*4882a593Smuzhiyun }
370*4882a593Smuzhiyun 
ipte_unlock(struct kvm_vcpu * vcpu)371*4882a593Smuzhiyun void ipte_unlock(struct kvm_vcpu *vcpu)
372*4882a593Smuzhiyun {
373*4882a593Smuzhiyun 	if (vcpu->arch.sie_block->eca & ECA_SII)
374*4882a593Smuzhiyun 		ipte_unlock_siif(vcpu);
375*4882a593Smuzhiyun 	else
376*4882a593Smuzhiyun 		ipte_unlock_simple(vcpu);
377*4882a593Smuzhiyun }
378*4882a593Smuzhiyun 
ar_translation(struct kvm_vcpu * vcpu,union asce * asce,u8 ar,enum gacc_mode mode)379*4882a593Smuzhiyun static int ar_translation(struct kvm_vcpu *vcpu, union asce *asce, u8 ar,
380*4882a593Smuzhiyun 			  enum gacc_mode mode)
381*4882a593Smuzhiyun {
382*4882a593Smuzhiyun 	union alet alet;
383*4882a593Smuzhiyun 	struct ale ale;
384*4882a593Smuzhiyun 	struct aste aste;
385*4882a593Smuzhiyun 	unsigned long ald_addr, authority_table_addr;
386*4882a593Smuzhiyun 	union ald ald;
387*4882a593Smuzhiyun 	int eax, rc;
388*4882a593Smuzhiyun 	u8 authority_table;
389*4882a593Smuzhiyun 
390*4882a593Smuzhiyun 	if (ar >= NUM_ACRS)
391*4882a593Smuzhiyun 		return -EINVAL;
392*4882a593Smuzhiyun 
393*4882a593Smuzhiyun 	save_access_regs(vcpu->run->s.regs.acrs);
394*4882a593Smuzhiyun 	alet.val = vcpu->run->s.regs.acrs[ar];
395*4882a593Smuzhiyun 
396*4882a593Smuzhiyun 	if (ar == 0 || alet.val == 0) {
397*4882a593Smuzhiyun 		asce->val = vcpu->arch.sie_block->gcr[1];
398*4882a593Smuzhiyun 		return 0;
399*4882a593Smuzhiyun 	} else if (alet.val == 1) {
400*4882a593Smuzhiyun 		asce->val = vcpu->arch.sie_block->gcr[7];
401*4882a593Smuzhiyun 		return 0;
402*4882a593Smuzhiyun 	}
403*4882a593Smuzhiyun 
404*4882a593Smuzhiyun 	if (alet.reserved)
405*4882a593Smuzhiyun 		return PGM_ALET_SPECIFICATION;
406*4882a593Smuzhiyun 
407*4882a593Smuzhiyun 	if (alet.p)
408*4882a593Smuzhiyun 		ald_addr = vcpu->arch.sie_block->gcr[5];
409*4882a593Smuzhiyun 	else
410*4882a593Smuzhiyun 		ald_addr = vcpu->arch.sie_block->gcr[2];
411*4882a593Smuzhiyun 	ald_addr &= 0x7fffffc0;
412*4882a593Smuzhiyun 
413*4882a593Smuzhiyun 	rc = read_guest_real(vcpu, ald_addr + 16, &ald.val, sizeof(union ald));
414*4882a593Smuzhiyun 	if (rc)
415*4882a593Smuzhiyun 		return rc;
416*4882a593Smuzhiyun 
417*4882a593Smuzhiyun 	if (alet.alen / 8 > ald.all)
418*4882a593Smuzhiyun 		return PGM_ALEN_TRANSLATION;
419*4882a593Smuzhiyun 
420*4882a593Smuzhiyun 	if (0x7fffffff - ald.alo * 128 < alet.alen * 16)
421*4882a593Smuzhiyun 		return PGM_ADDRESSING;
422*4882a593Smuzhiyun 
423*4882a593Smuzhiyun 	rc = read_guest_real(vcpu, ald.alo * 128 + alet.alen * 16, &ale,
424*4882a593Smuzhiyun 			     sizeof(struct ale));
425*4882a593Smuzhiyun 	if (rc)
426*4882a593Smuzhiyun 		return rc;
427*4882a593Smuzhiyun 
428*4882a593Smuzhiyun 	if (ale.i == 1)
429*4882a593Smuzhiyun 		return PGM_ALEN_TRANSLATION;
430*4882a593Smuzhiyun 	if (ale.alesn != alet.alesn)
431*4882a593Smuzhiyun 		return PGM_ALE_SEQUENCE;
432*4882a593Smuzhiyun 
433*4882a593Smuzhiyun 	rc = read_guest_real(vcpu, ale.asteo * 64, &aste, sizeof(struct aste));
434*4882a593Smuzhiyun 	if (rc)
435*4882a593Smuzhiyun 		return rc;
436*4882a593Smuzhiyun 
437*4882a593Smuzhiyun 	if (aste.i)
438*4882a593Smuzhiyun 		return PGM_ASTE_VALIDITY;
439*4882a593Smuzhiyun 	if (aste.astesn != ale.astesn)
440*4882a593Smuzhiyun 		return PGM_ASTE_SEQUENCE;
441*4882a593Smuzhiyun 
442*4882a593Smuzhiyun 	if (ale.p == 1) {
443*4882a593Smuzhiyun 		eax = (vcpu->arch.sie_block->gcr[8] >> 16) & 0xffff;
444*4882a593Smuzhiyun 		if (ale.aleax != eax) {
445*4882a593Smuzhiyun 			if (eax / 16 > aste.atl)
446*4882a593Smuzhiyun 				return PGM_EXTENDED_AUTHORITY;
447*4882a593Smuzhiyun 
448*4882a593Smuzhiyun 			authority_table_addr = aste.ato * 4 + eax / 4;
449*4882a593Smuzhiyun 
450*4882a593Smuzhiyun 			rc = read_guest_real(vcpu, authority_table_addr,
451*4882a593Smuzhiyun 					     &authority_table,
452*4882a593Smuzhiyun 					     sizeof(u8));
453*4882a593Smuzhiyun 			if (rc)
454*4882a593Smuzhiyun 				return rc;
455*4882a593Smuzhiyun 
456*4882a593Smuzhiyun 			if ((authority_table & (0x40 >> ((eax & 3) * 2))) == 0)
457*4882a593Smuzhiyun 				return PGM_EXTENDED_AUTHORITY;
458*4882a593Smuzhiyun 		}
459*4882a593Smuzhiyun 	}
460*4882a593Smuzhiyun 
461*4882a593Smuzhiyun 	if (ale.fo == 1 && mode == GACC_STORE)
462*4882a593Smuzhiyun 		return PGM_PROTECTION;
463*4882a593Smuzhiyun 
464*4882a593Smuzhiyun 	asce->val = aste.asce;
465*4882a593Smuzhiyun 	return 0;
466*4882a593Smuzhiyun }
467*4882a593Smuzhiyun 
468*4882a593Smuzhiyun struct trans_exc_code_bits {
469*4882a593Smuzhiyun 	unsigned long addr : 52; /* Translation-exception Address */
470*4882a593Smuzhiyun 	unsigned long fsi  : 2;  /* Access Exception Fetch/Store Indication */
471*4882a593Smuzhiyun 	unsigned long	   : 2;
472*4882a593Smuzhiyun 	unsigned long b56  : 1;
473*4882a593Smuzhiyun 	unsigned long	   : 3;
474*4882a593Smuzhiyun 	unsigned long b60  : 1;
475*4882a593Smuzhiyun 	unsigned long b61  : 1;
476*4882a593Smuzhiyun 	unsigned long as   : 2;  /* ASCE Identifier */
477*4882a593Smuzhiyun };
478*4882a593Smuzhiyun 
479*4882a593Smuzhiyun enum {
480*4882a593Smuzhiyun 	FSI_UNKNOWN = 0, /* Unknown wether fetch or store */
481*4882a593Smuzhiyun 	FSI_STORE   = 1, /* Exception was due to store operation */
482*4882a593Smuzhiyun 	FSI_FETCH   = 2  /* Exception was due to fetch operation */
483*4882a593Smuzhiyun };
484*4882a593Smuzhiyun 
485*4882a593Smuzhiyun enum prot_type {
486*4882a593Smuzhiyun 	PROT_TYPE_LA   = 0,
487*4882a593Smuzhiyun 	PROT_TYPE_KEYC = 1,
488*4882a593Smuzhiyun 	PROT_TYPE_ALC  = 2,
489*4882a593Smuzhiyun 	PROT_TYPE_DAT  = 3,
490*4882a593Smuzhiyun 	PROT_TYPE_IEP  = 4,
491*4882a593Smuzhiyun };
492*4882a593Smuzhiyun 
trans_exc(struct kvm_vcpu * vcpu,int code,unsigned long gva,u8 ar,enum gacc_mode mode,enum prot_type prot)493*4882a593Smuzhiyun static int trans_exc(struct kvm_vcpu *vcpu, int code, unsigned long gva,
494*4882a593Smuzhiyun 		     u8 ar, enum gacc_mode mode, enum prot_type prot)
495*4882a593Smuzhiyun {
496*4882a593Smuzhiyun 	struct kvm_s390_pgm_info *pgm = &vcpu->arch.pgm;
497*4882a593Smuzhiyun 	struct trans_exc_code_bits *tec;
498*4882a593Smuzhiyun 
499*4882a593Smuzhiyun 	memset(pgm, 0, sizeof(*pgm));
500*4882a593Smuzhiyun 	pgm->code = code;
501*4882a593Smuzhiyun 	tec = (struct trans_exc_code_bits *)&pgm->trans_exc_code;
502*4882a593Smuzhiyun 
503*4882a593Smuzhiyun 	switch (code) {
504*4882a593Smuzhiyun 	case PGM_PROTECTION:
505*4882a593Smuzhiyun 		switch (prot) {
506*4882a593Smuzhiyun 		case PROT_TYPE_IEP:
507*4882a593Smuzhiyun 			tec->b61 = 1;
508*4882a593Smuzhiyun 			fallthrough;
509*4882a593Smuzhiyun 		case PROT_TYPE_LA:
510*4882a593Smuzhiyun 			tec->b56 = 1;
511*4882a593Smuzhiyun 			break;
512*4882a593Smuzhiyun 		case PROT_TYPE_KEYC:
513*4882a593Smuzhiyun 			tec->b60 = 1;
514*4882a593Smuzhiyun 			break;
515*4882a593Smuzhiyun 		case PROT_TYPE_ALC:
516*4882a593Smuzhiyun 			tec->b60 = 1;
517*4882a593Smuzhiyun 			fallthrough;
518*4882a593Smuzhiyun 		case PROT_TYPE_DAT:
519*4882a593Smuzhiyun 			tec->b61 = 1;
520*4882a593Smuzhiyun 			break;
521*4882a593Smuzhiyun 		}
522*4882a593Smuzhiyun 		fallthrough;
523*4882a593Smuzhiyun 	case PGM_ASCE_TYPE:
524*4882a593Smuzhiyun 	case PGM_PAGE_TRANSLATION:
525*4882a593Smuzhiyun 	case PGM_REGION_FIRST_TRANS:
526*4882a593Smuzhiyun 	case PGM_REGION_SECOND_TRANS:
527*4882a593Smuzhiyun 	case PGM_REGION_THIRD_TRANS:
528*4882a593Smuzhiyun 	case PGM_SEGMENT_TRANSLATION:
529*4882a593Smuzhiyun 		/*
530*4882a593Smuzhiyun 		 * op_access_id only applies to MOVE_PAGE -> set bit 61
531*4882a593Smuzhiyun 		 * exc_access_id has to be set to 0 for some instructions. Both
532*4882a593Smuzhiyun 		 * cases have to be handled by the caller.
533*4882a593Smuzhiyun 		 */
534*4882a593Smuzhiyun 		tec->addr = gva >> PAGE_SHIFT;
535*4882a593Smuzhiyun 		tec->fsi = mode == GACC_STORE ? FSI_STORE : FSI_FETCH;
536*4882a593Smuzhiyun 		tec->as = psw_bits(vcpu->arch.sie_block->gpsw).as;
537*4882a593Smuzhiyun 		fallthrough;
538*4882a593Smuzhiyun 	case PGM_ALEN_TRANSLATION:
539*4882a593Smuzhiyun 	case PGM_ALE_SEQUENCE:
540*4882a593Smuzhiyun 	case PGM_ASTE_VALIDITY:
541*4882a593Smuzhiyun 	case PGM_ASTE_SEQUENCE:
542*4882a593Smuzhiyun 	case PGM_EXTENDED_AUTHORITY:
543*4882a593Smuzhiyun 		/*
544*4882a593Smuzhiyun 		 * We can always store exc_access_id, as it is
545*4882a593Smuzhiyun 		 * undefined for non-ar cases. It is undefined for
546*4882a593Smuzhiyun 		 * most DAT protection exceptions.
547*4882a593Smuzhiyun 		 */
548*4882a593Smuzhiyun 		pgm->exc_access_id = ar;
549*4882a593Smuzhiyun 		break;
550*4882a593Smuzhiyun 	}
551*4882a593Smuzhiyun 	return code;
552*4882a593Smuzhiyun }
553*4882a593Smuzhiyun 
get_vcpu_asce(struct kvm_vcpu * vcpu,union asce * asce,unsigned long ga,u8 ar,enum gacc_mode mode)554*4882a593Smuzhiyun static int get_vcpu_asce(struct kvm_vcpu *vcpu, union asce *asce,
555*4882a593Smuzhiyun 			 unsigned long ga, u8 ar, enum gacc_mode mode)
556*4882a593Smuzhiyun {
557*4882a593Smuzhiyun 	int rc;
558*4882a593Smuzhiyun 	struct psw_bits psw = psw_bits(vcpu->arch.sie_block->gpsw);
559*4882a593Smuzhiyun 
560*4882a593Smuzhiyun 	if (!psw.dat) {
561*4882a593Smuzhiyun 		asce->val = 0;
562*4882a593Smuzhiyun 		asce->r = 1;
563*4882a593Smuzhiyun 		return 0;
564*4882a593Smuzhiyun 	}
565*4882a593Smuzhiyun 
566*4882a593Smuzhiyun 	if ((mode == GACC_IFETCH) && (psw.as != PSW_BITS_AS_HOME))
567*4882a593Smuzhiyun 		psw.as = PSW_BITS_AS_PRIMARY;
568*4882a593Smuzhiyun 
569*4882a593Smuzhiyun 	switch (psw.as) {
570*4882a593Smuzhiyun 	case PSW_BITS_AS_PRIMARY:
571*4882a593Smuzhiyun 		asce->val = vcpu->arch.sie_block->gcr[1];
572*4882a593Smuzhiyun 		return 0;
573*4882a593Smuzhiyun 	case PSW_BITS_AS_SECONDARY:
574*4882a593Smuzhiyun 		asce->val = vcpu->arch.sie_block->gcr[7];
575*4882a593Smuzhiyun 		return 0;
576*4882a593Smuzhiyun 	case PSW_BITS_AS_HOME:
577*4882a593Smuzhiyun 		asce->val = vcpu->arch.sie_block->gcr[13];
578*4882a593Smuzhiyun 		return 0;
579*4882a593Smuzhiyun 	case PSW_BITS_AS_ACCREG:
580*4882a593Smuzhiyun 		rc = ar_translation(vcpu, asce, ar, mode);
581*4882a593Smuzhiyun 		if (rc > 0)
582*4882a593Smuzhiyun 			return trans_exc(vcpu, rc, ga, ar, mode, PROT_TYPE_ALC);
583*4882a593Smuzhiyun 		return rc;
584*4882a593Smuzhiyun 	}
585*4882a593Smuzhiyun 	return 0;
586*4882a593Smuzhiyun }
587*4882a593Smuzhiyun 
deref_table(struct kvm * kvm,unsigned long gpa,unsigned long * val)588*4882a593Smuzhiyun static int deref_table(struct kvm *kvm, unsigned long gpa, unsigned long *val)
589*4882a593Smuzhiyun {
590*4882a593Smuzhiyun 	return kvm_read_guest(kvm, gpa, val, sizeof(*val));
591*4882a593Smuzhiyun }
592*4882a593Smuzhiyun 
593*4882a593Smuzhiyun /**
594*4882a593Smuzhiyun  * guest_translate - translate a guest virtual into a guest absolute address
595*4882a593Smuzhiyun  * @vcpu: virtual cpu
596*4882a593Smuzhiyun  * @gva: guest virtual address
597*4882a593Smuzhiyun  * @gpa: points to where guest physical (absolute) address should be stored
598*4882a593Smuzhiyun  * @asce: effective asce
599*4882a593Smuzhiyun  * @mode: indicates the access mode to be used
600*4882a593Smuzhiyun  * @prot: returns the type for protection exceptions
601*4882a593Smuzhiyun  *
602*4882a593Smuzhiyun  * Translate a guest virtual address into a guest absolute address by means
603*4882a593Smuzhiyun  * of dynamic address translation as specified by the architecture.
604*4882a593Smuzhiyun  * If the resulting absolute address is not available in the configuration
605*4882a593Smuzhiyun  * an addressing exception is indicated and @gpa will not be changed.
606*4882a593Smuzhiyun  *
607*4882a593Smuzhiyun  * Returns: - zero on success; @gpa contains the resulting absolute address
608*4882a593Smuzhiyun  *	    - a negative value if guest access failed due to e.g. broken
609*4882a593Smuzhiyun  *	      guest mapping
610*4882a593Smuzhiyun  *	    - a positve value if an access exception happened. In this case
611*4882a593Smuzhiyun  *	      the returned value is the program interruption code as defined
612*4882a593Smuzhiyun  *	      by the architecture
613*4882a593Smuzhiyun  */
guest_translate(struct kvm_vcpu * vcpu,unsigned long gva,unsigned long * gpa,const union asce asce,enum gacc_mode mode,enum prot_type * prot)614*4882a593Smuzhiyun static unsigned long guest_translate(struct kvm_vcpu *vcpu, unsigned long gva,
615*4882a593Smuzhiyun 				     unsigned long *gpa, const union asce asce,
616*4882a593Smuzhiyun 				     enum gacc_mode mode, enum prot_type *prot)
617*4882a593Smuzhiyun {
618*4882a593Smuzhiyun 	union vaddress vaddr = {.addr = gva};
619*4882a593Smuzhiyun 	union raddress raddr = {.addr = gva};
620*4882a593Smuzhiyun 	union page_table_entry pte;
621*4882a593Smuzhiyun 	int dat_protection = 0;
622*4882a593Smuzhiyun 	int iep_protection = 0;
623*4882a593Smuzhiyun 	union ctlreg0 ctlreg0;
624*4882a593Smuzhiyun 	unsigned long ptr;
625*4882a593Smuzhiyun 	int edat1, edat2, iep;
626*4882a593Smuzhiyun 
627*4882a593Smuzhiyun 	ctlreg0.val = vcpu->arch.sie_block->gcr[0];
628*4882a593Smuzhiyun 	edat1 = ctlreg0.edat && test_kvm_facility(vcpu->kvm, 8);
629*4882a593Smuzhiyun 	edat2 = edat1 && test_kvm_facility(vcpu->kvm, 78);
630*4882a593Smuzhiyun 	iep = ctlreg0.iep && test_kvm_facility(vcpu->kvm, 130);
631*4882a593Smuzhiyun 	if (asce.r)
632*4882a593Smuzhiyun 		goto real_address;
633*4882a593Smuzhiyun 	ptr = asce.origin * PAGE_SIZE;
634*4882a593Smuzhiyun 	switch (asce.dt) {
635*4882a593Smuzhiyun 	case ASCE_TYPE_REGION1:
636*4882a593Smuzhiyun 		if (vaddr.rfx01 > asce.tl)
637*4882a593Smuzhiyun 			return PGM_REGION_FIRST_TRANS;
638*4882a593Smuzhiyun 		ptr += vaddr.rfx * 8;
639*4882a593Smuzhiyun 		break;
640*4882a593Smuzhiyun 	case ASCE_TYPE_REGION2:
641*4882a593Smuzhiyun 		if (vaddr.rfx)
642*4882a593Smuzhiyun 			return PGM_ASCE_TYPE;
643*4882a593Smuzhiyun 		if (vaddr.rsx01 > asce.tl)
644*4882a593Smuzhiyun 			return PGM_REGION_SECOND_TRANS;
645*4882a593Smuzhiyun 		ptr += vaddr.rsx * 8;
646*4882a593Smuzhiyun 		break;
647*4882a593Smuzhiyun 	case ASCE_TYPE_REGION3:
648*4882a593Smuzhiyun 		if (vaddr.rfx || vaddr.rsx)
649*4882a593Smuzhiyun 			return PGM_ASCE_TYPE;
650*4882a593Smuzhiyun 		if (vaddr.rtx01 > asce.tl)
651*4882a593Smuzhiyun 			return PGM_REGION_THIRD_TRANS;
652*4882a593Smuzhiyun 		ptr += vaddr.rtx * 8;
653*4882a593Smuzhiyun 		break;
654*4882a593Smuzhiyun 	case ASCE_TYPE_SEGMENT:
655*4882a593Smuzhiyun 		if (vaddr.rfx || vaddr.rsx || vaddr.rtx)
656*4882a593Smuzhiyun 			return PGM_ASCE_TYPE;
657*4882a593Smuzhiyun 		if (vaddr.sx01 > asce.tl)
658*4882a593Smuzhiyun 			return PGM_SEGMENT_TRANSLATION;
659*4882a593Smuzhiyun 		ptr += vaddr.sx * 8;
660*4882a593Smuzhiyun 		break;
661*4882a593Smuzhiyun 	}
662*4882a593Smuzhiyun 	switch (asce.dt) {
663*4882a593Smuzhiyun 	case ASCE_TYPE_REGION1:	{
664*4882a593Smuzhiyun 		union region1_table_entry rfte;
665*4882a593Smuzhiyun 
666*4882a593Smuzhiyun 		if (kvm_is_error_gpa(vcpu->kvm, ptr))
667*4882a593Smuzhiyun 			return PGM_ADDRESSING;
668*4882a593Smuzhiyun 		if (deref_table(vcpu->kvm, ptr, &rfte.val))
669*4882a593Smuzhiyun 			return -EFAULT;
670*4882a593Smuzhiyun 		if (rfte.i)
671*4882a593Smuzhiyun 			return PGM_REGION_FIRST_TRANS;
672*4882a593Smuzhiyun 		if (rfte.tt != TABLE_TYPE_REGION1)
673*4882a593Smuzhiyun 			return PGM_TRANSLATION_SPEC;
674*4882a593Smuzhiyun 		if (vaddr.rsx01 < rfte.tf || vaddr.rsx01 > rfte.tl)
675*4882a593Smuzhiyun 			return PGM_REGION_SECOND_TRANS;
676*4882a593Smuzhiyun 		if (edat1)
677*4882a593Smuzhiyun 			dat_protection |= rfte.p;
678*4882a593Smuzhiyun 		ptr = rfte.rto * PAGE_SIZE + vaddr.rsx * 8;
679*4882a593Smuzhiyun 	}
680*4882a593Smuzhiyun 		fallthrough;
681*4882a593Smuzhiyun 	case ASCE_TYPE_REGION2: {
682*4882a593Smuzhiyun 		union region2_table_entry rste;
683*4882a593Smuzhiyun 
684*4882a593Smuzhiyun 		if (kvm_is_error_gpa(vcpu->kvm, ptr))
685*4882a593Smuzhiyun 			return PGM_ADDRESSING;
686*4882a593Smuzhiyun 		if (deref_table(vcpu->kvm, ptr, &rste.val))
687*4882a593Smuzhiyun 			return -EFAULT;
688*4882a593Smuzhiyun 		if (rste.i)
689*4882a593Smuzhiyun 			return PGM_REGION_SECOND_TRANS;
690*4882a593Smuzhiyun 		if (rste.tt != TABLE_TYPE_REGION2)
691*4882a593Smuzhiyun 			return PGM_TRANSLATION_SPEC;
692*4882a593Smuzhiyun 		if (vaddr.rtx01 < rste.tf || vaddr.rtx01 > rste.tl)
693*4882a593Smuzhiyun 			return PGM_REGION_THIRD_TRANS;
694*4882a593Smuzhiyun 		if (edat1)
695*4882a593Smuzhiyun 			dat_protection |= rste.p;
696*4882a593Smuzhiyun 		ptr = rste.rto * PAGE_SIZE + vaddr.rtx * 8;
697*4882a593Smuzhiyun 	}
698*4882a593Smuzhiyun 		fallthrough;
699*4882a593Smuzhiyun 	case ASCE_TYPE_REGION3: {
700*4882a593Smuzhiyun 		union region3_table_entry rtte;
701*4882a593Smuzhiyun 
702*4882a593Smuzhiyun 		if (kvm_is_error_gpa(vcpu->kvm, ptr))
703*4882a593Smuzhiyun 			return PGM_ADDRESSING;
704*4882a593Smuzhiyun 		if (deref_table(vcpu->kvm, ptr, &rtte.val))
705*4882a593Smuzhiyun 			return -EFAULT;
706*4882a593Smuzhiyun 		if (rtte.i)
707*4882a593Smuzhiyun 			return PGM_REGION_THIRD_TRANS;
708*4882a593Smuzhiyun 		if (rtte.tt != TABLE_TYPE_REGION3)
709*4882a593Smuzhiyun 			return PGM_TRANSLATION_SPEC;
710*4882a593Smuzhiyun 		if (rtte.cr && asce.p && edat2)
711*4882a593Smuzhiyun 			return PGM_TRANSLATION_SPEC;
712*4882a593Smuzhiyun 		if (rtte.fc && edat2) {
713*4882a593Smuzhiyun 			dat_protection |= rtte.fc1.p;
714*4882a593Smuzhiyun 			iep_protection = rtte.fc1.iep;
715*4882a593Smuzhiyun 			raddr.rfaa = rtte.fc1.rfaa;
716*4882a593Smuzhiyun 			goto absolute_address;
717*4882a593Smuzhiyun 		}
718*4882a593Smuzhiyun 		if (vaddr.sx01 < rtte.fc0.tf)
719*4882a593Smuzhiyun 			return PGM_SEGMENT_TRANSLATION;
720*4882a593Smuzhiyun 		if (vaddr.sx01 > rtte.fc0.tl)
721*4882a593Smuzhiyun 			return PGM_SEGMENT_TRANSLATION;
722*4882a593Smuzhiyun 		if (edat1)
723*4882a593Smuzhiyun 			dat_protection |= rtte.fc0.p;
724*4882a593Smuzhiyun 		ptr = rtte.fc0.sto * PAGE_SIZE + vaddr.sx * 8;
725*4882a593Smuzhiyun 	}
726*4882a593Smuzhiyun 		fallthrough;
727*4882a593Smuzhiyun 	case ASCE_TYPE_SEGMENT: {
728*4882a593Smuzhiyun 		union segment_table_entry ste;
729*4882a593Smuzhiyun 
730*4882a593Smuzhiyun 		if (kvm_is_error_gpa(vcpu->kvm, ptr))
731*4882a593Smuzhiyun 			return PGM_ADDRESSING;
732*4882a593Smuzhiyun 		if (deref_table(vcpu->kvm, ptr, &ste.val))
733*4882a593Smuzhiyun 			return -EFAULT;
734*4882a593Smuzhiyun 		if (ste.i)
735*4882a593Smuzhiyun 			return PGM_SEGMENT_TRANSLATION;
736*4882a593Smuzhiyun 		if (ste.tt != TABLE_TYPE_SEGMENT)
737*4882a593Smuzhiyun 			return PGM_TRANSLATION_SPEC;
738*4882a593Smuzhiyun 		if (ste.cs && asce.p)
739*4882a593Smuzhiyun 			return PGM_TRANSLATION_SPEC;
740*4882a593Smuzhiyun 		if (ste.fc && edat1) {
741*4882a593Smuzhiyun 			dat_protection |= ste.fc1.p;
742*4882a593Smuzhiyun 			iep_protection = ste.fc1.iep;
743*4882a593Smuzhiyun 			raddr.sfaa = ste.fc1.sfaa;
744*4882a593Smuzhiyun 			goto absolute_address;
745*4882a593Smuzhiyun 		}
746*4882a593Smuzhiyun 		dat_protection |= ste.fc0.p;
747*4882a593Smuzhiyun 		ptr = ste.fc0.pto * (PAGE_SIZE / 2) + vaddr.px * 8;
748*4882a593Smuzhiyun 	}
749*4882a593Smuzhiyun 	}
750*4882a593Smuzhiyun 	if (kvm_is_error_gpa(vcpu->kvm, ptr))
751*4882a593Smuzhiyun 		return PGM_ADDRESSING;
752*4882a593Smuzhiyun 	if (deref_table(vcpu->kvm, ptr, &pte.val))
753*4882a593Smuzhiyun 		return -EFAULT;
754*4882a593Smuzhiyun 	if (pte.i)
755*4882a593Smuzhiyun 		return PGM_PAGE_TRANSLATION;
756*4882a593Smuzhiyun 	if (pte.z)
757*4882a593Smuzhiyun 		return PGM_TRANSLATION_SPEC;
758*4882a593Smuzhiyun 	dat_protection |= pte.p;
759*4882a593Smuzhiyun 	iep_protection = pte.iep;
760*4882a593Smuzhiyun 	raddr.pfra = pte.pfra;
761*4882a593Smuzhiyun real_address:
762*4882a593Smuzhiyun 	raddr.addr = kvm_s390_real_to_abs(vcpu, raddr.addr);
763*4882a593Smuzhiyun absolute_address:
764*4882a593Smuzhiyun 	if (mode == GACC_STORE && dat_protection) {
765*4882a593Smuzhiyun 		*prot = PROT_TYPE_DAT;
766*4882a593Smuzhiyun 		return PGM_PROTECTION;
767*4882a593Smuzhiyun 	}
768*4882a593Smuzhiyun 	if (mode == GACC_IFETCH && iep_protection && iep) {
769*4882a593Smuzhiyun 		*prot = PROT_TYPE_IEP;
770*4882a593Smuzhiyun 		return PGM_PROTECTION;
771*4882a593Smuzhiyun 	}
772*4882a593Smuzhiyun 	if (kvm_is_error_gpa(vcpu->kvm, raddr.addr))
773*4882a593Smuzhiyun 		return PGM_ADDRESSING;
774*4882a593Smuzhiyun 	*gpa = raddr.addr;
775*4882a593Smuzhiyun 	return 0;
776*4882a593Smuzhiyun }
777*4882a593Smuzhiyun 
is_low_address(unsigned long ga)778*4882a593Smuzhiyun static inline int is_low_address(unsigned long ga)
779*4882a593Smuzhiyun {
780*4882a593Smuzhiyun 	/* Check for address ranges 0..511 and 4096..4607 */
781*4882a593Smuzhiyun 	return (ga & ~0x11fful) == 0;
782*4882a593Smuzhiyun }
783*4882a593Smuzhiyun 
low_address_protection_enabled(struct kvm_vcpu * vcpu,const union asce asce)784*4882a593Smuzhiyun static int low_address_protection_enabled(struct kvm_vcpu *vcpu,
785*4882a593Smuzhiyun 					  const union asce asce)
786*4882a593Smuzhiyun {
787*4882a593Smuzhiyun 	union ctlreg0 ctlreg0 = {.val = vcpu->arch.sie_block->gcr[0]};
788*4882a593Smuzhiyun 	psw_t *psw = &vcpu->arch.sie_block->gpsw;
789*4882a593Smuzhiyun 
790*4882a593Smuzhiyun 	if (!ctlreg0.lap)
791*4882a593Smuzhiyun 		return 0;
792*4882a593Smuzhiyun 	if (psw_bits(*psw).dat && asce.p)
793*4882a593Smuzhiyun 		return 0;
794*4882a593Smuzhiyun 	return 1;
795*4882a593Smuzhiyun }
796*4882a593Smuzhiyun 
guest_page_range(struct kvm_vcpu * vcpu,unsigned long ga,u8 ar,unsigned long * pages,unsigned long nr_pages,const union asce asce,enum gacc_mode mode)797*4882a593Smuzhiyun static int guest_page_range(struct kvm_vcpu *vcpu, unsigned long ga, u8 ar,
798*4882a593Smuzhiyun 			    unsigned long *pages, unsigned long nr_pages,
799*4882a593Smuzhiyun 			    const union asce asce, enum gacc_mode mode)
800*4882a593Smuzhiyun {
801*4882a593Smuzhiyun 	psw_t *psw = &vcpu->arch.sie_block->gpsw;
802*4882a593Smuzhiyun 	int lap_enabled, rc = 0;
803*4882a593Smuzhiyun 	enum prot_type prot;
804*4882a593Smuzhiyun 
805*4882a593Smuzhiyun 	lap_enabled = low_address_protection_enabled(vcpu, asce);
806*4882a593Smuzhiyun 	while (nr_pages) {
807*4882a593Smuzhiyun 		ga = kvm_s390_logical_to_effective(vcpu, ga);
808*4882a593Smuzhiyun 		if (mode == GACC_STORE && lap_enabled && is_low_address(ga))
809*4882a593Smuzhiyun 			return trans_exc(vcpu, PGM_PROTECTION, ga, ar, mode,
810*4882a593Smuzhiyun 					 PROT_TYPE_LA);
811*4882a593Smuzhiyun 		ga &= PAGE_MASK;
812*4882a593Smuzhiyun 		if (psw_bits(*psw).dat) {
813*4882a593Smuzhiyun 			rc = guest_translate(vcpu, ga, pages, asce, mode, &prot);
814*4882a593Smuzhiyun 			if (rc < 0)
815*4882a593Smuzhiyun 				return rc;
816*4882a593Smuzhiyun 		} else {
817*4882a593Smuzhiyun 			*pages = kvm_s390_real_to_abs(vcpu, ga);
818*4882a593Smuzhiyun 			if (kvm_is_error_gpa(vcpu->kvm, *pages))
819*4882a593Smuzhiyun 				rc = PGM_ADDRESSING;
820*4882a593Smuzhiyun 		}
821*4882a593Smuzhiyun 		if (rc)
822*4882a593Smuzhiyun 			return trans_exc(vcpu, rc, ga, ar, mode, prot);
823*4882a593Smuzhiyun 		ga += PAGE_SIZE;
824*4882a593Smuzhiyun 		pages++;
825*4882a593Smuzhiyun 		nr_pages--;
826*4882a593Smuzhiyun 	}
827*4882a593Smuzhiyun 	return 0;
828*4882a593Smuzhiyun }
829*4882a593Smuzhiyun 
access_guest(struct kvm_vcpu * vcpu,unsigned long ga,u8 ar,void * data,unsigned long len,enum gacc_mode mode)830*4882a593Smuzhiyun int access_guest(struct kvm_vcpu *vcpu, unsigned long ga, u8 ar, void *data,
831*4882a593Smuzhiyun 		 unsigned long len, enum gacc_mode mode)
832*4882a593Smuzhiyun {
833*4882a593Smuzhiyun 	psw_t *psw = &vcpu->arch.sie_block->gpsw;
834*4882a593Smuzhiyun 	unsigned long _len, nr_pages, gpa, idx;
835*4882a593Smuzhiyun 	unsigned long pages_array[2];
836*4882a593Smuzhiyun 	unsigned long *pages;
837*4882a593Smuzhiyun 	int need_ipte_lock;
838*4882a593Smuzhiyun 	union asce asce;
839*4882a593Smuzhiyun 	int rc;
840*4882a593Smuzhiyun 
841*4882a593Smuzhiyun 	if (!len)
842*4882a593Smuzhiyun 		return 0;
843*4882a593Smuzhiyun 	ga = kvm_s390_logical_to_effective(vcpu, ga);
844*4882a593Smuzhiyun 	rc = get_vcpu_asce(vcpu, &asce, ga, ar, mode);
845*4882a593Smuzhiyun 	if (rc)
846*4882a593Smuzhiyun 		return rc;
847*4882a593Smuzhiyun 	nr_pages = (((ga & ~PAGE_MASK) + len - 1) >> PAGE_SHIFT) + 1;
848*4882a593Smuzhiyun 	pages = pages_array;
849*4882a593Smuzhiyun 	if (nr_pages > ARRAY_SIZE(pages_array))
850*4882a593Smuzhiyun 		pages = vmalloc(array_size(nr_pages, sizeof(unsigned long)));
851*4882a593Smuzhiyun 	if (!pages)
852*4882a593Smuzhiyun 		return -ENOMEM;
853*4882a593Smuzhiyun 	need_ipte_lock = psw_bits(*psw).dat && !asce.r;
854*4882a593Smuzhiyun 	if (need_ipte_lock)
855*4882a593Smuzhiyun 		ipte_lock(vcpu);
856*4882a593Smuzhiyun 	rc = guest_page_range(vcpu, ga, ar, pages, nr_pages, asce, mode);
857*4882a593Smuzhiyun 	for (idx = 0; idx < nr_pages && !rc; idx++) {
858*4882a593Smuzhiyun 		gpa = *(pages + idx) + (ga & ~PAGE_MASK);
859*4882a593Smuzhiyun 		_len = min(PAGE_SIZE - (gpa & ~PAGE_MASK), len);
860*4882a593Smuzhiyun 		if (mode == GACC_STORE)
861*4882a593Smuzhiyun 			rc = kvm_write_guest(vcpu->kvm, gpa, data, _len);
862*4882a593Smuzhiyun 		else
863*4882a593Smuzhiyun 			rc = kvm_read_guest(vcpu->kvm, gpa, data, _len);
864*4882a593Smuzhiyun 		len -= _len;
865*4882a593Smuzhiyun 		ga += _len;
866*4882a593Smuzhiyun 		data += _len;
867*4882a593Smuzhiyun 	}
868*4882a593Smuzhiyun 	if (need_ipte_lock)
869*4882a593Smuzhiyun 		ipte_unlock(vcpu);
870*4882a593Smuzhiyun 	if (nr_pages > ARRAY_SIZE(pages_array))
871*4882a593Smuzhiyun 		vfree(pages);
872*4882a593Smuzhiyun 	return rc;
873*4882a593Smuzhiyun }
874*4882a593Smuzhiyun 
access_guest_real(struct kvm_vcpu * vcpu,unsigned long gra,void * data,unsigned long len,enum gacc_mode mode)875*4882a593Smuzhiyun int access_guest_real(struct kvm_vcpu *vcpu, unsigned long gra,
876*4882a593Smuzhiyun 		      void *data, unsigned long len, enum gacc_mode mode)
877*4882a593Smuzhiyun {
878*4882a593Smuzhiyun 	unsigned long _len, gpa;
879*4882a593Smuzhiyun 	int rc = 0;
880*4882a593Smuzhiyun 
881*4882a593Smuzhiyun 	while (len && !rc) {
882*4882a593Smuzhiyun 		gpa = kvm_s390_real_to_abs(vcpu, gra);
883*4882a593Smuzhiyun 		_len = min(PAGE_SIZE - (gpa & ~PAGE_MASK), len);
884*4882a593Smuzhiyun 		if (mode)
885*4882a593Smuzhiyun 			rc = write_guest_abs(vcpu, gpa, data, _len);
886*4882a593Smuzhiyun 		else
887*4882a593Smuzhiyun 			rc = read_guest_abs(vcpu, gpa, data, _len);
888*4882a593Smuzhiyun 		len -= _len;
889*4882a593Smuzhiyun 		gra += _len;
890*4882a593Smuzhiyun 		data += _len;
891*4882a593Smuzhiyun 	}
892*4882a593Smuzhiyun 	return rc;
893*4882a593Smuzhiyun }
894*4882a593Smuzhiyun 
895*4882a593Smuzhiyun /**
896*4882a593Smuzhiyun  * guest_translate_address - translate guest logical into guest absolute address
897*4882a593Smuzhiyun  *
898*4882a593Smuzhiyun  * Parameter semantics are the same as the ones from guest_translate.
899*4882a593Smuzhiyun  * The memory contents at the guest address are not changed.
900*4882a593Smuzhiyun  *
901*4882a593Smuzhiyun  * Note: The IPTE lock is not taken during this function, so the caller
902*4882a593Smuzhiyun  * has to take care of this.
903*4882a593Smuzhiyun  */
guest_translate_address(struct kvm_vcpu * vcpu,unsigned long gva,u8 ar,unsigned long * gpa,enum gacc_mode mode)904*4882a593Smuzhiyun int guest_translate_address(struct kvm_vcpu *vcpu, unsigned long gva, u8 ar,
905*4882a593Smuzhiyun 			    unsigned long *gpa, enum gacc_mode mode)
906*4882a593Smuzhiyun {
907*4882a593Smuzhiyun 	psw_t *psw = &vcpu->arch.sie_block->gpsw;
908*4882a593Smuzhiyun 	enum prot_type prot;
909*4882a593Smuzhiyun 	union asce asce;
910*4882a593Smuzhiyun 	int rc;
911*4882a593Smuzhiyun 
912*4882a593Smuzhiyun 	gva = kvm_s390_logical_to_effective(vcpu, gva);
913*4882a593Smuzhiyun 	rc = get_vcpu_asce(vcpu, &asce, gva, ar, mode);
914*4882a593Smuzhiyun 	if (rc)
915*4882a593Smuzhiyun 		return rc;
916*4882a593Smuzhiyun 	if (is_low_address(gva) && low_address_protection_enabled(vcpu, asce)) {
917*4882a593Smuzhiyun 		if (mode == GACC_STORE)
918*4882a593Smuzhiyun 			return trans_exc(vcpu, PGM_PROTECTION, gva, 0,
919*4882a593Smuzhiyun 					 mode, PROT_TYPE_LA);
920*4882a593Smuzhiyun 	}
921*4882a593Smuzhiyun 
922*4882a593Smuzhiyun 	if (psw_bits(*psw).dat && !asce.r) {	/* Use DAT? */
923*4882a593Smuzhiyun 		rc = guest_translate(vcpu, gva, gpa, asce, mode, &prot);
924*4882a593Smuzhiyun 		if (rc > 0)
925*4882a593Smuzhiyun 			return trans_exc(vcpu, rc, gva, 0, mode, prot);
926*4882a593Smuzhiyun 	} else {
927*4882a593Smuzhiyun 		*gpa = kvm_s390_real_to_abs(vcpu, gva);
928*4882a593Smuzhiyun 		if (kvm_is_error_gpa(vcpu->kvm, *gpa))
929*4882a593Smuzhiyun 			return trans_exc(vcpu, rc, gva, PGM_ADDRESSING, mode, 0);
930*4882a593Smuzhiyun 	}
931*4882a593Smuzhiyun 
932*4882a593Smuzhiyun 	return rc;
933*4882a593Smuzhiyun }
934*4882a593Smuzhiyun 
935*4882a593Smuzhiyun /**
936*4882a593Smuzhiyun  * check_gva_range - test a range of guest virtual addresses for accessibility
937*4882a593Smuzhiyun  */
check_gva_range(struct kvm_vcpu * vcpu,unsigned long gva,u8 ar,unsigned long length,enum gacc_mode mode)938*4882a593Smuzhiyun int check_gva_range(struct kvm_vcpu *vcpu, unsigned long gva, u8 ar,
939*4882a593Smuzhiyun 		    unsigned long length, enum gacc_mode mode)
940*4882a593Smuzhiyun {
941*4882a593Smuzhiyun 	unsigned long gpa;
942*4882a593Smuzhiyun 	unsigned long currlen;
943*4882a593Smuzhiyun 	int rc = 0;
944*4882a593Smuzhiyun 
945*4882a593Smuzhiyun 	ipte_lock(vcpu);
946*4882a593Smuzhiyun 	while (length > 0 && !rc) {
947*4882a593Smuzhiyun 		currlen = min(length, PAGE_SIZE - (gva % PAGE_SIZE));
948*4882a593Smuzhiyun 		rc = guest_translate_address(vcpu, gva, ar, &gpa, mode);
949*4882a593Smuzhiyun 		gva += currlen;
950*4882a593Smuzhiyun 		length -= currlen;
951*4882a593Smuzhiyun 	}
952*4882a593Smuzhiyun 	ipte_unlock(vcpu);
953*4882a593Smuzhiyun 
954*4882a593Smuzhiyun 	return rc;
955*4882a593Smuzhiyun }
956*4882a593Smuzhiyun 
957*4882a593Smuzhiyun /**
958*4882a593Smuzhiyun  * kvm_s390_check_low_addr_prot_real - check for low-address protection
959*4882a593Smuzhiyun  * @gra: Guest real address
960*4882a593Smuzhiyun  *
961*4882a593Smuzhiyun  * Checks whether an address is subject to low-address protection and set
962*4882a593Smuzhiyun  * up vcpu->arch.pgm accordingly if necessary.
963*4882a593Smuzhiyun  *
964*4882a593Smuzhiyun  * Return: 0 if no protection exception, or PGM_PROTECTION if protected.
965*4882a593Smuzhiyun  */
kvm_s390_check_low_addr_prot_real(struct kvm_vcpu * vcpu,unsigned long gra)966*4882a593Smuzhiyun int kvm_s390_check_low_addr_prot_real(struct kvm_vcpu *vcpu, unsigned long gra)
967*4882a593Smuzhiyun {
968*4882a593Smuzhiyun 	union ctlreg0 ctlreg0 = {.val = vcpu->arch.sie_block->gcr[0]};
969*4882a593Smuzhiyun 
970*4882a593Smuzhiyun 	if (!ctlreg0.lap || !is_low_address(gra))
971*4882a593Smuzhiyun 		return 0;
972*4882a593Smuzhiyun 	return trans_exc(vcpu, PGM_PROTECTION, gra, 0, GACC_STORE, PROT_TYPE_LA);
973*4882a593Smuzhiyun }
974*4882a593Smuzhiyun 
975*4882a593Smuzhiyun /**
976*4882a593Smuzhiyun  * kvm_s390_shadow_tables - walk the guest page table and create shadow tables
977*4882a593Smuzhiyun  * @sg: pointer to the shadow guest address space structure
978*4882a593Smuzhiyun  * @saddr: faulting address in the shadow gmap
979*4882a593Smuzhiyun  * @pgt: pointer to the beginning of the page table for the given address if
980*4882a593Smuzhiyun  *	 successful (return value 0), or to the first invalid DAT entry in
981*4882a593Smuzhiyun  *	 case of exceptions (return value > 0)
982*4882a593Smuzhiyun  * @fake: pgt references contiguous guest memory block, not a pgtable
983*4882a593Smuzhiyun  */
kvm_s390_shadow_tables(struct gmap * sg,unsigned long saddr,unsigned long * pgt,int * dat_protection,int * fake)984*4882a593Smuzhiyun static int kvm_s390_shadow_tables(struct gmap *sg, unsigned long saddr,
985*4882a593Smuzhiyun 				  unsigned long *pgt, int *dat_protection,
986*4882a593Smuzhiyun 				  int *fake)
987*4882a593Smuzhiyun {
988*4882a593Smuzhiyun 	struct gmap *parent;
989*4882a593Smuzhiyun 	union asce asce;
990*4882a593Smuzhiyun 	union vaddress vaddr;
991*4882a593Smuzhiyun 	unsigned long ptr;
992*4882a593Smuzhiyun 	int rc;
993*4882a593Smuzhiyun 
994*4882a593Smuzhiyun 	*fake = 0;
995*4882a593Smuzhiyun 	*dat_protection = 0;
996*4882a593Smuzhiyun 	parent = sg->parent;
997*4882a593Smuzhiyun 	vaddr.addr = saddr;
998*4882a593Smuzhiyun 	asce.val = sg->orig_asce;
999*4882a593Smuzhiyun 	ptr = asce.origin * PAGE_SIZE;
1000*4882a593Smuzhiyun 	if (asce.r) {
1001*4882a593Smuzhiyun 		*fake = 1;
1002*4882a593Smuzhiyun 		ptr = 0;
1003*4882a593Smuzhiyun 		asce.dt = ASCE_TYPE_REGION1;
1004*4882a593Smuzhiyun 	}
1005*4882a593Smuzhiyun 	switch (asce.dt) {
1006*4882a593Smuzhiyun 	case ASCE_TYPE_REGION1:
1007*4882a593Smuzhiyun 		if (vaddr.rfx01 > asce.tl && !*fake)
1008*4882a593Smuzhiyun 			return PGM_REGION_FIRST_TRANS;
1009*4882a593Smuzhiyun 		break;
1010*4882a593Smuzhiyun 	case ASCE_TYPE_REGION2:
1011*4882a593Smuzhiyun 		if (vaddr.rfx)
1012*4882a593Smuzhiyun 			return PGM_ASCE_TYPE;
1013*4882a593Smuzhiyun 		if (vaddr.rsx01 > asce.tl)
1014*4882a593Smuzhiyun 			return PGM_REGION_SECOND_TRANS;
1015*4882a593Smuzhiyun 		break;
1016*4882a593Smuzhiyun 	case ASCE_TYPE_REGION3:
1017*4882a593Smuzhiyun 		if (vaddr.rfx || vaddr.rsx)
1018*4882a593Smuzhiyun 			return PGM_ASCE_TYPE;
1019*4882a593Smuzhiyun 		if (vaddr.rtx01 > asce.tl)
1020*4882a593Smuzhiyun 			return PGM_REGION_THIRD_TRANS;
1021*4882a593Smuzhiyun 		break;
1022*4882a593Smuzhiyun 	case ASCE_TYPE_SEGMENT:
1023*4882a593Smuzhiyun 		if (vaddr.rfx || vaddr.rsx || vaddr.rtx)
1024*4882a593Smuzhiyun 			return PGM_ASCE_TYPE;
1025*4882a593Smuzhiyun 		if (vaddr.sx01 > asce.tl)
1026*4882a593Smuzhiyun 			return PGM_SEGMENT_TRANSLATION;
1027*4882a593Smuzhiyun 		break;
1028*4882a593Smuzhiyun 	}
1029*4882a593Smuzhiyun 
1030*4882a593Smuzhiyun 	switch (asce.dt) {
1031*4882a593Smuzhiyun 	case ASCE_TYPE_REGION1: {
1032*4882a593Smuzhiyun 		union region1_table_entry rfte;
1033*4882a593Smuzhiyun 
1034*4882a593Smuzhiyun 		if (*fake) {
1035*4882a593Smuzhiyun 			ptr += vaddr.rfx * _REGION1_SIZE;
1036*4882a593Smuzhiyun 			rfte.val = ptr;
1037*4882a593Smuzhiyun 			goto shadow_r2t;
1038*4882a593Smuzhiyun 		}
1039*4882a593Smuzhiyun 		*pgt = ptr + vaddr.rfx * 8;
1040*4882a593Smuzhiyun 		rc = gmap_read_table(parent, ptr + vaddr.rfx * 8, &rfte.val);
1041*4882a593Smuzhiyun 		if (rc)
1042*4882a593Smuzhiyun 			return rc;
1043*4882a593Smuzhiyun 		if (rfte.i)
1044*4882a593Smuzhiyun 			return PGM_REGION_FIRST_TRANS;
1045*4882a593Smuzhiyun 		if (rfte.tt != TABLE_TYPE_REGION1)
1046*4882a593Smuzhiyun 			return PGM_TRANSLATION_SPEC;
1047*4882a593Smuzhiyun 		if (vaddr.rsx01 < rfte.tf || vaddr.rsx01 > rfte.tl)
1048*4882a593Smuzhiyun 			return PGM_REGION_SECOND_TRANS;
1049*4882a593Smuzhiyun 		if (sg->edat_level >= 1)
1050*4882a593Smuzhiyun 			*dat_protection |= rfte.p;
1051*4882a593Smuzhiyun 		ptr = rfte.rto * PAGE_SIZE;
1052*4882a593Smuzhiyun shadow_r2t:
1053*4882a593Smuzhiyun 		rc = gmap_shadow_r2t(sg, saddr, rfte.val, *fake);
1054*4882a593Smuzhiyun 		if (rc)
1055*4882a593Smuzhiyun 			return rc;
1056*4882a593Smuzhiyun 	}
1057*4882a593Smuzhiyun 		fallthrough;
1058*4882a593Smuzhiyun 	case ASCE_TYPE_REGION2: {
1059*4882a593Smuzhiyun 		union region2_table_entry rste;
1060*4882a593Smuzhiyun 
1061*4882a593Smuzhiyun 		if (*fake) {
1062*4882a593Smuzhiyun 			ptr += vaddr.rsx * _REGION2_SIZE;
1063*4882a593Smuzhiyun 			rste.val = ptr;
1064*4882a593Smuzhiyun 			goto shadow_r3t;
1065*4882a593Smuzhiyun 		}
1066*4882a593Smuzhiyun 		*pgt = ptr + vaddr.rsx * 8;
1067*4882a593Smuzhiyun 		rc = gmap_read_table(parent, ptr + vaddr.rsx * 8, &rste.val);
1068*4882a593Smuzhiyun 		if (rc)
1069*4882a593Smuzhiyun 			return rc;
1070*4882a593Smuzhiyun 		if (rste.i)
1071*4882a593Smuzhiyun 			return PGM_REGION_SECOND_TRANS;
1072*4882a593Smuzhiyun 		if (rste.tt != TABLE_TYPE_REGION2)
1073*4882a593Smuzhiyun 			return PGM_TRANSLATION_SPEC;
1074*4882a593Smuzhiyun 		if (vaddr.rtx01 < rste.tf || vaddr.rtx01 > rste.tl)
1075*4882a593Smuzhiyun 			return PGM_REGION_THIRD_TRANS;
1076*4882a593Smuzhiyun 		if (sg->edat_level >= 1)
1077*4882a593Smuzhiyun 			*dat_protection |= rste.p;
1078*4882a593Smuzhiyun 		ptr = rste.rto * PAGE_SIZE;
1079*4882a593Smuzhiyun shadow_r3t:
1080*4882a593Smuzhiyun 		rste.p |= *dat_protection;
1081*4882a593Smuzhiyun 		rc = gmap_shadow_r3t(sg, saddr, rste.val, *fake);
1082*4882a593Smuzhiyun 		if (rc)
1083*4882a593Smuzhiyun 			return rc;
1084*4882a593Smuzhiyun 	}
1085*4882a593Smuzhiyun 		fallthrough;
1086*4882a593Smuzhiyun 	case ASCE_TYPE_REGION3: {
1087*4882a593Smuzhiyun 		union region3_table_entry rtte;
1088*4882a593Smuzhiyun 
1089*4882a593Smuzhiyun 		if (*fake) {
1090*4882a593Smuzhiyun 			ptr += vaddr.rtx * _REGION3_SIZE;
1091*4882a593Smuzhiyun 			rtte.val = ptr;
1092*4882a593Smuzhiyun 			goto shadow_sgt;
1093*4882a593Smuzhiyun 		}
1094*4882a593Smuzhiyun 		*pgt = ptr + vaddr.rtx * 8;
1095*4882a593Smuzhiyun 		rc = gmap_read_table(parent, ptr + vaddr.rtx * 8, &rtte.val);
1096*4882a593Smuzhiyun 		if (rc)
1097*4882a593Smuzhiyun 			return rc;
1098*4882a593Smuzhiyun 		if (rtte.i)
1099*4882a593Smuzhiyun 			return PGM_REGION_THIRD_TRANS;
1100*4882a593Smuzhiyun 		if (rtte.tt != TABLE_TYPE_REGION3)
1101*4882a593Smuzhiyun 			return PGM_TRANSLATION_SPEC;
1102*4882a593Smuzhiyun 		if (rtte.cr && asce.p && sg->edat_level >= 2)
1103*4882a593Smuzhiyun 			return PGM_TRANSLATION_SPEC;
1104*4882a593Smuzhiyun 		if (rtte.fc && sg->edat_level >= 2) {
1105*4882a593Smuzhiyun 			*dat_protection |= rtte.fc0.p;
1106*4882a593Smuzhiyun 			*fake = 1;
1107*4882a593Smuzhiyun 			ptr = rtte.fc1.rfaa * _REGION3_SIZE;
1108*4882a593Smuzhiyun 			rtte.val = ptr;
1109*4882a593Smuzhiyun 			goto shadow_sgt;
1110*4882a593Smuzhiyun 		}
1111*4882a593Smuzhiyun 		if (vaddr.sx01 < rtte.fc0.tf || vaddr.sx01 > rtte.fc0.tl)
1112*4882a593Smuzhiyun 			return PGM_SEGMENT_TRANSLATION;
1113*4882a593Smuzhiyun 		if (sg->edat_level >= 1)
1114*4882a593Smuzhiyun 			*dat_protection |= rtte.fc0.p;
1115*4882a593Smuzhiyun 		ptr = rtte.fc0.sto * PAGE_SIZE;
1116*4882a593Smuzhiyun shadow_sgt:
1117*4882a593Smuzhiyun 		rtte.fc0.p |= *dat_protection;
1118*4882a593Smuzhiyun 		rc = gmap_shadow_sgt(sg, saddr, rtte.val, *fake);
1119*4882a593Smuzhiyun 		if (rc)
1120*4882a593Smuzhiyun 			return rc;
1121*4882a593Smuzhiyun 	}
1122*4882a593Smuzhiyun 		fallthrough;
1123*4882a593Smuzhiyun 	case ASCE_TYPE_SEGMENT: {
1124*4882a593Smuzhiyun 		union segment_table_entry ste;
1125*4882a593Smuzhiyun 
1126*4882a593Smuzhiyun 		if (*fake) {
1127*4882a593Smuzhiyun 			ptr += vaddr.sx * _SEGMENT_SIZE;
1128*4882a593Smuzhiyun 			ste.val = ptr;
1129*4882a593Smuzhiyun 			goto shadow_pgt;
1130*4882a593Smuzhiyun 		}
1131*4882a593Smuzhiyun 		*pgt = ptr + vaddr.sx * 8;
1132*4882a593Smuzhiyun 		rc = gmap_read_table(parent, ptr + vaddr.sx * 8, &ste.val);
1133*4882a593Smuzhiyun 		if (rc)
1134*4882a593Smuzhiyun 			return rc;
1135*4882a593Smuzhiyun 		if (ste.i)
1136*4882a593Smuzhiyun 			return PGM_SEGMENT_TRANSLATION;
1137*4882a593Smuzhiyun 		if (ste.tt != TABLE_TYPE_SEGMENT)
1138*4882a593Smuzhiyun 			return PGM_TRANSLATION_SPEC;
1139*4882a593Smuzhiyun 		if (ste.cs && asce.p)
1140*4882a593Smuzhiyun 			return PGM_TRANSLATION_SPEC;
1141*4882a593Smuzhiyun 		*dat_protection |= ste.fc0.p;
1142*4882a593Smuzhiyun 		if (ste.fc && sg->edat_level >= 1) {
1143*4882a593Smuzhiyun 			*fake = 1;
1144*4882a593Smuzhiyun 			ptr = ste.fc1.sfaa * _SEGMENT_SIZE;
1145*4882a593Smuzhiyun 			ste.val = ptr;
1146*4882a593Smuzhiyun 			goto shadow_pgt;
1147*4882a593Smuzhiyun 		}
1148*4882a593Smuzhiyun 		ptr = ste.fc0.pto * (PAGE_SIZE / 2);
1149*4882a593Smuzhiyun shadow_pgt:
1150*4882a593Smuzhiyun 		ste.fc0.p |= *dat_protection;
1151*4882a593Smuzhiyun 		rc = gmap_shadow_pgt(sg, saddr, ste.val, *fake);
1152*4882a593Smuzhiyun 		if (rc)
1153*4882a593Smuzhiyun 			return rc;
1154*4882a593Smuzhiyun 	}
1155*4882a593Smuzhiyun 	}
1156*4882a593Smuzhiyun 	/* Return the parent address of the page table */
1157*4882a593Smuzhiyun 	*pgt = ptr;
1158*4882a593Smuzhiyun 	return 0;
1159*4882a593Smuzhiyun }
1160*4882a593Smuzhiyun 
1161*4882a593Smuzhiyun /**
1162*4882a593Smuzhiyun  * kvm_s390_shadow_fault - handle fault on a shadow page table
1163*4882a593Smuzhiyun  * @vcpu: virtual cpu
1164*4882a593Smuzhiyun  * @sg: pointer to the shadow guest address space structure
1165*4882a593Smuzhiyun  * @saddr: faulting address in the shadow gmap
1166*4882a593Smuzhiyun  * @datptr: will contain the address of the faulting DAT table entry, or of
1167*4882a593Smuzhiyun  *	    the valid leaf, plus some flags
1168*4882a593Smuzhiyun  *
1169*4882a593Smuzhiyun  * Returns: - 0 if the shadow fault was successfully resolved
1170*4882a593Smuzhiyun  *	    - > 0 (pgm exception code) on exceptions while faulting
1171*4882a593Smuzhiyun  *	    - -EAGAIN if the caller can retry immediately
1172*4882a593Smuzhiyun  *	    - -EFAULT when accessing invalid guest addresses
1173*4882a593Smuzhiyun  *	    - -ENOMEM if out of memory
1174*4882a593Smuzhiyun  */
kvm_s390_shadow_fault(struct kvm_vcpu * vcpu,struct gmap * sg,unsigned long saddr,unsigned long * datptr)1175*4882a593Smuzhiyun int kvm_s390_shadow_fault(struct kvm_vcpu *vcpu, struct gmap *sg,
1176*4882a593Smuzhiyun 			  unsigned long saddr, unsigned long *datptr)
1177*4882a593Smuzhiyun {
1178*4882a593Smuzhiyun 	union vaddress vaddr;
1179*4882a593Smuzhiyun 	union page_table_entry pte;
1180*4882a593Smuzhiyun 	unsigned long pgt = 0;
1181*4882a593Smuzhiyun 	int dat_protection, fake;
1182*4882a593Smuzhiyun 	int rc;
1183*4882a593Smuzhiyun 
1184*4882a593Smuzhiyun 	mmap_read_lock(sg->mm);
1185*4882a593Smuzhiyun 	/*
1186*4882a593Smuzhiyun 	 * We don't want any guest-2 tables to change - so the parent
1187*4882a593Smuzhiyun 	 * tables/pointers we read stay valid - unshadowing is however
1188*4882a593Smuzhiyun 	 * always possible - only guest_table_lock protects us.
1189*4882a593Smuzhiyun 	 */
1190*4882a593Smuzhiyun 	ipte_lock(vcpu);
1191*4882a593Smuzhiyun 
1192*4882a593Smuzhiyun 	rc = gmap_shadow_pgt_lookup(sg, saddr, &pgt, &dat_protection, &fake);
1193*4882a593Smuzhiyun 	if (rc)
1194*4882a593Smuzhiyun 		rc = kvm_s390_shadow_tables(sg, saddr, &pgt, &dat_protection,
1195*4882a593Smuzhiyun 					    &fake);
1196*4882a593Smuzhiyun 
1197*4882a593Smuzhiyun 	vaddr.addr = saddr;
1198*4882a593Smuzhiyun 	if (fake) {
1199*4882a593Smuzhiyun 		pte.val = pgt + vaddr.px * PAGE_SIZE;
1200*4882a593Smuzhiyun 		goto shadow_page;
1201*4882a593Smuzhiyun 	}
1202*4882a593Smuzhiyun 
1203*4882a593Smuzhiyun 	switch (rc) {
1204*4882a593Smuzhiyun 	case PGM_SEGMENT_TRANSLATION:
1205*4882a593Smuzhiyun 	case PGM_REGION_THIRD_TRANS:
1206*4882a593Smuzhiyun 	case PGM_REGION_SECOND_TRANS:
1207*4882a593Smuzhiyun 	case PGM_REGION_FIRST_TRANS:
1208*4882a593Smuzhiyun 		pgt |= PEI_NOT_PTE;
1209*4882a593Smuzhiyun 		break;
1210*4882a593Smuzhiyun 	case 0:
1211*4882a593Smuzhiyun 		pgt += vaddr.px * 8;
1212*4882a593Smuzhiyun 		rc = gmap_read_table(sg->parent, pgt, &pte.val);
1213*4882a593Smuzhiyun 	}
1214*4882a593Smuzhiyun 	if (datptr)
1215*4882a593Smuzhiyun 		*datptr = pgt | dat_protection * PEI_DAT_PROT;
1216*4882a593Smuzhiyun 	if (!rc && pte.i)
1217*4882a593Smuzhiyun 		rc = PGM_PAGE_TRANSLATION;
1218*4882a593Smuzhiyun 	if (!rc && pte.z)
1219*4882a593Smuzhiyun 		rc = PGM_TRANSLATION_SPEC;
1220*4882a593Smuzhiyun shadow_page:
1221*4882a593Smuzhiyun 	pte.p |= dat_protection;
1222*4882a593Smuzhiyun 	if (!rc)
1223*4882a593Smuzhiyun 		rc = gmap_shadow_page(sg, saddr, __pte(pte.val));
1224*4882a593Smuzhiyun 	ipte_unlock(vcpu);
1225*4882a593Smuzhiyun 	mmap_read_unlock(sg->mm);
1226*4882a593Smuzhiyun 	return rc;
1227*4882a593Smuzhiyun }
1228