xref: /OK3568_Linux_fs/kernel/arch/x86/mm/pkeys.c (revision 4882a59341e53eb6f0b4789bf948001014eff981)
1*4882a593Smuzhiyun // SPDX-License-Identifier: GPL-2.0-only
2*4882a593Smuzhiyun /*
3*4882a593Smuzhiyun  * Intel Memory Protection Keys management
4*4882a593Smuzhiyun  * Copyright (c) 2015, Intel Corporation.
5*4882a593Smuzhiyun  */
6*4882a593Smuzhiyun #include <linux/debugfs.h>		/* debugfs_create_u32()		*/
7*4882a593Smuzhiyun #include <linux/mm_types.h>             /* mm_struct, vma, etc...       */
8*4882a593Smuzhiyun #include <linux/pkeys.h>                /* PKEY_*                       */
9*4882a593Smuzhiyun #include <uapi/asm-generic/mman-common.h>
10*4882a593Smuzhiyun 
11*4882a593Smuzhiyun #include <asm/cpufeature.h>             /* boot_cpu_has, ...            */
12*4882a593Smuzhiyun #include <asm/mmu_context.h>            /* vma_pkey()                   */
13*4882a593Smuzhiyun #include <asm/fpu/internal.h>		/* init_fpstate			*/
14*4882a593Smuzhiyun 
__execute_only_pkey(struct mm_struct * mm)15*4882a593Smuzhiyun int __execute_only_pkey(struct mm_struct *mm)
16*4882a593Smuzhiyun {
17*4882a593Smuzhiyun 	bool need_to_set_mm_pkey = false;
18*4882a593Smuzhiyun 	int execute_only_pkey = mm->context.execute_only_pkey;
19*4882a593Smuzhiyun 	int ret;
20*4882a593Smuzhiyun 
21*4882a593Smuzhiyun 	/* Do we need to assign a pkey for mm's execute-only maps? */
22*4882a593Smuzhiyun 	if (execute_only_pkey == -1) {
23*4882a593Smuzhiyun 		/* Go allocate one to use, which might fail */
24*4882a593Smuzhiyun 		execute_only_pkey = mm_pkey_alloc(mm);
25*4882a593Smuzhiyun 		if (execute_only_pkey < 0)
26*4882a593Smuzhiyun 			return -1;
27*4882a593Smuzhiyun 		need_to_set_mm_pkey = true;
28*4882a593Smuzhiyun 	}
29*4882a593Smuzhiyun 
30*4882a593Smuzhiyun 	/*
31*4882a593Smuzhiyun 	 * We do not want to go through the relatively costly
32*4882a593Smuzhiyun 	 * dance to set PKRU if we do not need to.  Check it
33*4882a593Smuzhiyun 	 * first and assume that if the execute-only pkey is
34*4882a593Smuzhiyun 	 * write-disabled that we do not have to set it
35*4882a593Smuzhiyun 	 * ourselves.
36*4882a593Smuzhiyun 	 */
37*4882a593Smuzhiyun 	if (!need_to_set_mm_pkey &&
38*4882a593Smuzhiyun 	    !__pkru_allows_read(read_pkru(), execute_only_pkey)) {
39*4882a593Smuzhiyun 		return execute_only_pkey;
40*4882a593Smuzhiyun 	}
41*4882a593Smuzhiyun 
42*4882a593Smuzhiyun 	/*
43*4882a593Smuzhiyun 	 * Set up PKRU so that it denies access for everything
44*4882a593Smuzhiyun 	 * other than execution.
45*4882a593Smuzhiyun 	 */
46*4882a593Smuzhiyun 	ret = arch_set_user_pkey_access(current, execute_only_pkey,
47*4882a593Smuzhiyun 			PKEY_DISABLE_ACCESS);
48*4882a593Smuzhiyun 	/*
49*4882a593Smuzhiyun 	 * If the PKRU-set operation failed somehow, just return
50*4882a593Smuzhiyun 	 * 0 and effectively disable execute-only support.
51*4882a593Smuzhiyun 	 */
52*4882a593Smuzhiyun 	if (ret) {
53*4882a593Smuzhiyun 		mm_set_pkey_free(mm, execute_only_pkey);
54*4882a593Smuzhiyun 		return -1;
55*4882a593Smuzhiyun 	}
56*4882a593Smuzhiyun 
57*4882a593Smuzhiyun 	/* We got one, store it and use it from here on out */
58*4882a593Smuzhiyun 	if (need_to_set_mm_pkey)
59*4882a593Smuzhiyun 		mm->context.execute_only_pkey = execute_only_pkey;
60*4882a593Smuzhiyun 	return execute_only_pkey;
61*4882a593Smuzhiyun }
62*4882a593Smuzhiyun 
vma_is_pkey_exec_only(struct vm_area_struct * vma)63*4882a593Smuzhiyun static inline bool vma_is_pkey_exec_only(struct vm_area_struct *vma)
64*4882a593Smuzhiyun {
65*4882a593Smuzhiyun 	/* Do this check first since the vm_flags should be hot */
66*4882a593Smuzhiyun 	if ((vma->vm_flags & VM_ACCESS_FLAGS) != VM_EXEC)
67*4882a593Smuzhiyun 		return false;
68*4882a593Smuzhiyun 	if (vma_pkey(vma) != vma->vm_mm->context.execute_only_pkey)
69*4882a593Smuzhiyun 		return false;
70*4882a593Smuzhiyun 
71*4882a593Smuzhiyun 	return true;
72*4882a593Smuzhiyun }
73*4882a593Smuzhiyun 
74*4882a593Smuzhiyun /*
75*4882a593Smuzhiyun  * This is only called for *plain* mprotect calls.
76*4882a593Smuzhiyun  */
__arch_override_mprotect_pkey(struct vm_area_struct * vma,int prot,int pkey)77*4882a593Smuzhiyun int __arch_override_mprotect_pkey(struct vm_area_struct *vma, int prot, int pkey)
78*4882a593Smuzhiyun {
79*4882a593Smuzhiyun 	/*
80*4882a593Smuzhiyun 	 * Is this an mprotect_pkey() call?  If so, never
81*4882a593Smuzhiyun 	 * override the value that came from the user.
82*4882a593Smuzhiyun 	 */
83*4882a593Smuzhiyun 	if (pkey != -1)
84*4882a593Smuzhiyun 		return pkey;
85*4882a593Smuzhiyun 
86*4882a593Smuzhiyun 	/*
87*4882a593Smuzhiyun 	 * The mapping is execute-only.  Go try to get the
88*4882a593Smuzhiyun 	 * execute-only protection key.  If we fail to do that,
89*4882a593Smuzhiyun 	 * fall through as if we do not have execute-only
90*4882a593Smuzhiyun 	 * support in this mm.
91*4882a593Smuzhiyun 	 */
92*4882a593Smuzhiyun 	if (prot == PROT_EXEC) {
93*4882a593Smuzhiyun 		pkey = execute_only_pkey(vma->vm_mm);
94*4882a593Smuzhiyun 		if (pkey > 0)
95*4882a593Smuzhiyun 			return pkey;
96*4882a593Smuzhiyun 	} else if (vma_is_pkey_exec_only(vma)) {
97*4882a593Smuzhiyun 		/*
98*4882a593Smuzhiyun 		 * Protections are *not* PROT_EXEC, but the mapping
99*4882a593Smuzhiyun 		 * is using the exec-only pkey.  This mapping was
100*4882a593Smuzhiyun 		 * PROT_EXEC and will no longer be.  Move back to
101*4882a593Smuzhiyun 		 * the default pkey.
102*4882a593Smuzhiyun 		 */
103*4882a593Smuzhiyun 		return ARCH_DEFAULT_PKEY;
104*4882a593Smuzhiyun 	}
105*4882a593Smuzhiyun 
106*4882a593Smuzhiyun 	/*
107*4882a593Smuzhiyun 	 * This is a vanilla, non-pkey mprotect (or we failed to
108*4882a593Smuzhiyun 	 * setup execute-only), inherit the pkey from the VMA we
109*4882a593Smuzhiyun 	 * are working on.
110*4882a593Smuzhiyun 	 */
111*4882a593Smuzhiyun 	return vma_pkey(vma);
112*4882a593Smuzhiyun }
113*4882a593Smuzhiyun 
114*4882a593Smuzhiyun #define PKRU_AD_KEY(pkey)	(PKRU_AD_BIT << ((pkey) * PKRU_BITS_PER_PKEY))
115*4882a593Smuzhiyun 
116*4882a593Smuzhiyun /*
117*4882a593Smuzhiyun  * Make the default PKRU value (at execve() time) as restrictive
118*4882a593Smuzhiyun  * as possible.  This ensures that any threads clone()'d early
119*4882a593Smuzhiyun  * in the process's lifetime will not accidentally get access
120*4882a593Smuzhiyun  * to data which is pkey-protected later on.
121*4882a593Smuzhiyun  */
122*4882a593Smuzhiyun u32 init_pkru_value = PKRU_AD_KEY( 1) | PKRU_AD_KEY( 2) | PKRU_AD_KEY( 3) |
123*4882a593Smuzhiyun 		      PKRU_AD_KEY( 4) | PKRU_AD_KEY( 5) | PKRU_AD_KEY( 6) |
124*4882a593Smuzhiyun 		      PKRU_AD_KEY( 7) | PKRU_AD_KEY( 8) | PKRU_AD_KEY( 9) |
125*4882a593Smuzhiyun 		      PKRU_AD_KEY(10) | PKRU_AD_KEY(11) | PKRU_AD_KEY(12) |
126*4882a593Smuzhiyun 		      PKRU_AD_KEY(13) | PKRU_AD_KEY(14) | PKRU_AD_KEY(15);
127*4882a593Smuzhiyun 
128*4882a593Smuzhiyun /*
129*4882a593Smuzhiyun  * Called from the FPU code when creating a fresh set of FPU
130*4882a593Smuzhiyun  * registers.  This is called from a very specific context where
131*4882a593Smuzhiyun  * we know the FPU regstiers are safe for use and we can use PKRU
132*4882a593Smuzhiyun  * directly.
133*4882a593Smuzhiyun  */
copy_init_pkru_to_fpregs(void)134*4882a593Smuzhiyun void copy_init_pkru_to_fpregs(void)
135*4882a593Smuzhiyun {
136*4882a593Smuzhiyun 	u32 init_pkru_value_snapshot = READ_ONCE(init_pkru_value);
137*4882a593Smuzhiyun 	/*
138*4882a593Smuzhiyun 	 * Override the PKRU state that came from 'init_fpstate'
139*4882a593Smuzhiyun 	 * with the baseline from the process.
140*4882a593Smuzhiyun 	 */
141*4882a593Smuzhiyun 	write_pkru(init_pkru_value_snapshot);
142*4882a593Smuzhiyun }
143*4882a593Smuzhiyun 
init_pkru_read_file(struct file * file,char __user * user_buf,size_t count,loff_t * ppos)144*4882a593Smuzhiyun static ssize_t init_pkru_read_file(struct file *file, char __user *user_buf,
145*4882a593Smuzhiyun 			     size_t count, loff_t *ppos)
146*4882a593Smuzhiyun {
147*4882a593Smuzhiyun 	char buf[32];
148*4882a593Smuzhiyun 	unsigned int len;
149*4882a593Smuzhiyun 
150*4882a593Smuzhiyun 	len = sprintf(buf, "0x%x\n", init_pkru_value);
151*4882a593Smuzhiyun 	return simple_read_from_buffer(user_buf, count, ppos, buf, len);
152*4882a593Smuzhiyun }
153*4882a593Smuzhiyun 
init_pkru_write_file(struct file * file,const char __user * user_buf,size_t count,loff_t * ppos)154*4882a593Smuzhiyun static ssize_t init_pkru_write_file(struct file *file,
155*4882a593Smuzhiyun 		 const char __user *user_buf, size_t count, loff_t *ppos)
156*4882a593Smuzhiyun {
157*4882a593Smuzhiyun 	struct pkru_state *pk;
158*4882a593Smuzhiyun 	char buf[32];
159*4882a593Smuzhiyun 	ssize_t len;
160*4882a593Smuzhiyun 	u32 new_init_pkru;
161*4882a593Smuzhiyun 
162*4882a593Smuzhiyun 	len = min(count, sizeof(buf) - 1);
163*4882a593Smuzhiyun 	if (copy_from_user(buf, user_buf, len))
164*4882a593Smuzhiyun 		return -EFAULT;
165*4882a593Smuzhiyun 
166*4882a593Smuzhiyun 	/* Make the buffer a valid string that we can not overrun */
167*4882a593Smuzhiyun 	buf[len] = '\0';
168*4882a593Smuzhiyun 	if (kstrtouint(buf, 0, &new_init_pkru))
169*4882a593Smuzhiyun 		return -EINVAL;
170*4882a593Smuzhiyun 
171*4882a593Smuzhiyun 	/*
172*4882a593Smuzhiyun 	 * Don't allow insane settings that will blow the system
173*4882a593Smuzhiyun 	 * up immediately if someone attempts to disable access
174*4882a593Smuzhiyun 	 * or writes to pkey 0.
175*4882a593Smuzhiyun 	 */
176*4882a593Smuzhiyun 	if (new_init_pkru & (PKRU_AD_BIT|PKRU_WD_BIT))
177*4882a593Smuzhiyun 		return -EINVAL;
178*4882a593Smuzhiyun 
179*4882a593Smuzhiyun 	WRITE_ONCE(init_pkru_value, new_init_pkru);
180*4882a593Smuzhiyun 	pk = get_xsave_addr(&init_fpstate.xsave, XFEATURE_PKRU);
181*4882a593Smuzhiyun 	if (!pk)
182*4882a593Smuzhiyun 		return -EINVAL;
183*4882a593Smuzhiyun 	pk->pkru = new_init_pkru;
184*4882a593Smuzhiyun 	return count;
185*4882a593Smuzhiyun }
186*4882a593Smuzhiyun 
187*4882a593Smuzhiyun static const struct file_operations fops_init_pkru = {
188*4882a593Smuzhiyun 	.read = init_pkru_read_file,
189*4882a593Smuzhiyun 	.write = init_pkru_write_file,
190*4882a593Smuzhiyun 	.llseek = default_llseek,
191*4882a593Smuzhiyun };
192*4882a593Smuzhiyun 
create_init_pkru_value(void)193*4882a593Smuzhiyun static int __init create_init_pkru_value(void)
194*4882a593Smuzhiyun {
195*4882a593Smuzhiyun 	debugfs_create_file("init_pkru", S_IRUSR | S_IWUSR,
196*4882a593Smuzhiyun 			arch_debugfs_dir, NULL, &fops_init_pkru);
197*4882a593Smuzhiyun 	return 0;
198*4882a593Smuzhiyun }
199*4882a593Smuzhiyun late_initcall(create_init_pkru_value);
200*4882a593Smuzhiyun 
setup_init_pkru(char * opt)201*4882a593Smuzhiyun static __init int setup_init_pkru(char *opt)
202*4882a593Smuzhiyun {
203*4882a593Smuzhiyun 	u32 new_init_pkru;
204*4882a593Smuzhiyun 
205*4882a593Smuzhiyun 	if (kstrtouint(opt, 0, &new_init_pkru))
206*4882a593Smuzhiyun 		return 1;
207*4882a593Smuzhiyun 
208*4882a593Smuzhiyun 	WRITE_ONCE(init_pkru_value, new_init_pkru);
209*4882a593Smuzhiyun 
210*4882a593Smuzhiyun 	return 1;
211*4882a593Smuzhiyun }
212*4882a593Smuzhiyun __setup("init_pkru=", setup_init_pkru);
213