xref: /linux/arch/x86/mm/pkeys.c (revision db6d8d5fdf9537641c76ba7f32e02b4bcc600972)
1 /*
2  * Intel Memory Protection Keys management
3  * Copyright (c) 2015, Intel Corporation.
4  *
5  * This program is free software; you can redistribute it and/or modify it
6  * under the terms and conditions of the GNU General Public License,
7  * version 2, as published by the Free Software Foundation.
8  *
9  * This program is distributed in the hope it will be useful, but WITHOUT
10  * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
11  * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License for
12  * more details.
13  */
14 #include <linux/debugfs.h>		/* debugfs_create_u32()		*/
15 #include <linux/mm_types.h>             /* mm_struct, vma, etc...       */
16 #include <linux/pkeys.h>                /* PKEY_*                       */
17 #include <uapi/asm-generic/mman-common.h>
18 
19 #include <asm/cpufeature.h>             /* boot_cpu_has, ...            */
20 #include <asm/mmu_context.h>            /* vma_pkey()                   */
21 #include <asm/fpu/internal.h>           /* fpregs_active()              */
22 
23 int __execute_only_pkey(struct mm_struct *mm)
24 {
25 	bool need_to_set_mm_pkey = false;
26 	int execute_only_pkey = mm->context.execute_only_pkey;
27 	int ret;
28 
29 	/* Do we need to assign a pkey for mm's execute-only maps? */
30 	if (execute_only_pkey == -1) {
31 		/* Go allocate one to use, which might fail */
32 		execute_only_pkey = mm_pkey_alloc(mm);
33 		if (execute_only_pkey < 0)
34 			return -1;
35 		need_to_set_mm_pkey = true;
36 	}
37 
38 	/*
39 	 * We do not want to go through the relatively costly
40 	 * dance to set PKRU if we do not need to.  Check it
41 	 * first and assume that if the execute-only pkey is
42 	 * write-disabled that we do not have to set it
43 	 * ourselves.  We need preempt off so that nobody
44 	 * can make fpregs inactive.
45 	 */
46 	preempt_disable();
47 	if (!need_to_set_mm_pkey &&
48 	    fpregs_active() &&
49 	    !__pkru_allows_read(read_pkru(), execute_only_pkey)) {
50 		preempt_enable();
51 		return execute_only_pkey;
52 	}
53 	preempt_enable();
54 
55 	/*
56 	 * Set up PKRU so that it denies access for everything
57 	 * other than execution.
58 	 */
59 	ret = arch_set_user_pkey_access(current, execute_only_pkey,
60 			PKEY_DISABLE_ACCESS);
61 	/*
62 	 * If the PKRU-set operation failed somehow, just return
63 	 * 0 and effectively disable execute-only support.
64 	 */
65 	if (ret) {
66 		mm_set_pkey_free(mm, execute_only_pkey);
67 		return -1;
68 	}
69 
70 	/* We got one, store it and use it from here on out */
71 	if (need_to_set_mm_pkey)
72 		mm->context.execute_only_pkey = execute_only_pkey;
73 	return execute_only_pkey;
74 }
75 
76 static inline bool vma_is_pkey_exec_only(struct vm_area_struct *vma)
77 {
78 	/* Do this check first since the vm_flags should be hot */
79 	if ((vma->vm_flags & (VM_READ | VM_WRITE | VM_EXEC)) != VM_EXEC)
80 		return false;
81 	if (vma_pkey(vma) != vma->vm_mm->context.execute_only_pkey)
82 		return false;
83 
84 	return true;
85 }
86 
87 /*
88  * This is only called for *plain* mprotect calls.
89  */
90 int __arch_override_mprotect_pkey(struct vm_area_struct *vma, int prot, int pkey)
91 {
92 	/*
93 	 * Is this an mprotect_pkey() call?  If so, never
94 	 * override the value that came from the user.
95 	 */
96 	if (pkey != -1)
97 		return pkey;
98 	/*
99 	 * Look for a protection-key-drive execute-only mapping
100 	 * which is now being given permissions that are not
101 	 * execute-only.  Move it back to the default pkey.
102 	 */
103 	if (vma_is_pkey_exec_only(vma) &&
104 	    (prot & (PROT_READ|PROT_WRITE))) {
105 		return 0;
106 	}
107 	/*
108 	 * The mapping is execute-only.  Go try to get the
109 	 * execute-only protection key.  If we fail to do that,
110 	 * fall through as if we do not have execute-only
111 	 * support.
112 	 */
113 	if (prot == PROT_EXEC) {
114 		pkey = execute_only_pkey(vma->vm_mm);
115 		if (pkey > 0)
116 			return pkey;
117 	}
118 	/*
119 	 * This is a vanilla, non-pkey mprotect (or we failed to
120 	 * setup execute-only), inherit the pkey from the VMA we
121 	 * are working on.
122 	 */
123 	return vma_pkey(vma);
124 }
125 
126 #define PKRU_AD_KEY(pkey)	(PKRU_AD_BIT << ((pkey) * PKRU_BITS_PER_PKEY))
127 
128 /*
129  * Make the default PKRU value (at execve() time) as restrictive
130  * as possible.  This ensures that any threads clone()'d early
131  * in the process's lifetime will not accidentally get access
132  * to data which is pkey-protected later on.
133  */
134 u32 init_pkru_value = PKRU_AD_KEY( 1) | PKRU_AD_KEY( 2) | PKRU_AD_KEY( 3) |
135 		      PKRU_AD_KEY( 4) | PKRU_AD_KEY( 5) | PKRU_AD_KEY( 6) |
136 		      PKRU_AD_KEY( 7) | PKRU_AD_KEY( 8) | PKRU_AD_KEY( 9) |
137 		      PKRU_AD_KEY(10) | PKRU_AD_KEY(11) | PKRU_AD_KEY(12) |
138 		      PKRU_AD_KEY(13) | PKRU_AD_KEY(14) | PKRU_AD_KEY(15);
139 
140 /*
141  * Called from the FPU code when creating a fresh set of FPU
142  * registers.  This is called from a very specific context where
143  * we know the FPU regstiers are safe for use and we can use PKRU
144  * directly.  The fact that PKRU is only available when we are
145  * using eagerfpu mode makes this possible.
146  */
147 void copy_init_pkru_to_fpregs(void)
148 {
149 	u32 init_pkru_value_snapshot = READ_ONCE(init_pkru_value);
150 	/*
151 	 * Any write to PKRU takes it out of the XSAVE 'init
152 	 * state' which increases context switch cost.  Avoid
153 	 * writing 0 when PKRU was already 0.
154 	 */
155 	if (!init_pkru_value_snapshot && !read_pkru())
156 		return;
157 	/*
158 	 * Override the PKRU state that came from 'init_fpstate'
159 	 * with the baseline from the process.
160 	 */
161 	write_pkru(init_pkru_value_snapshot);
162 }
163 
164 static ssize_t init_pkru_read_file(struct file *file, char __user *user_buf,
165 			     size_t count, loff_t *ppos)
166 {
167 	char buf[32];
168 	unsigned int len;
169 
170 	len = sprintf(buf, "0x%x\n", init_pkru_value);
171 	return simple_read_from_buffer(user_buf, count, ppos, buf, len);
172 }
173 
174 static ssize_t init_pkru_write_file(struct file *file,
175 		 const char __user *user_buf, size_t count, loff_t *ppos)
176 {
177 	char buf[32];
178 	ssize_t len;
179 	u32 new_init_pkru;
180 
181 	len = min(count, sizeof(buf) - 1);
182 	if (copy_from_user(buf, user_buf, len))
183 		return -EFAULT;
184 
185 	/* Make the buffer a valid string that we can not overrun */
186 	buf[len] = '\0';
187 	if (kstrtouint(buf, 0, &new_init_pkru))
188 		return -EINVAL;
189 
190 	/*
191 	 * Don't allow insane settings that will blow the system
192 	 * up immediately if someone attempts to disable access
193 	 * or writes to pkey 0.
194 	 */
195 	if (new_init_pkru & (PKRU_AD_BIT|PKRU_WD_BIT))
196 		return -EINVAL;
197 
198 	WRITE_ONCE(init_pkru_value, new_init_pkru);
199 	return count;
200 }
201 
202 static const struct file_operations fops_init_pkru = {
203 	.read = init_pkru_read_file,
204 	.write = init_pkru_write_file,
205 	.llseek = default_llseek,
206 };
207 
208 static int __init create_init_pkru_value(void)
209 {
210 	debugfs_create_file("init_pkru", S_IRUSR | S_IWUSR,
211 			arch_debugfs_dir, NULL, &fops_init_pkru);
212 	return 0;
213 }
214 late_initcall(create_init_pkru_value);
215 
216 static __init int setup_init_pkru(char *opt)
217 {
218 	u32 new_init_pkru;
219 
220 	if (kstrtouint(opt, 0, &new_init_pkru))
221 		return 1;
222 
223 	WRITE_ONCE(init_pkru_value, new_init_pkru);
224 
225 	return 1;
226 }
227 __setup("init_pkru=", setup_init_pkru);
228