xref: /linux/arch/powerpc/mm/book3s64/pkeys.c (revision 8b83369ddcb3fb9cab5c1088987ce477565bb630)
1 // SPDX-License-Identifier: GPL-2.0+
2 /*
3  * PowerPC Memory Protection Keys management
4  *
5  * Copyright 2017, Ram Pai, IBM Corporation.
6  */
7 
8 #include <asm/mman.h>
9 #include <asm/mmu_context.h>
10 #include <asm/mmu.h>
11 #include <asm/setup.h>
12 #include <asm/smp.h>
13 
14 #include <linux/pkeys.h>
15 #include <linux/of_fdt.h>
16 
17 
int  num_pkey;		/* Max number of pkeys supported */
/*
 * Keys marked in the reservation list cannot be allocated by userspace.
 */
u32 reserved_allocation_mask __ro_after_init;

/* Bits set for the initially allocated keys */
static u32 initial_allocation_mask __ro_after_init;

/*
 * Default AMR/IAMR/UAMOR values; adjusted once at boot by
 * pkey_early_init_devtree().
 *
 * The AMR default starts with every bit set and the IAMR default with the
 * low bit of every 2-bit key field set. Even if we allocate keys with
 * sys_pkey_alloc(), we need to make sure other threads still find access
 * denied when using the same keys.
 */
u64 default_amr __ro_after_init  = ~0x0UL;
u64 default_iamr __ro_after_init = 0x5555555555555555UL;
u64 default_uamor __ro_after_init;
EXPORT_SYMBOL(default_amr);
/*
 * Key used to implement PROT_EXEC mmap. Denies READ/WRITE.
 * We pick key 2 because 0 is a special key and 1 is reserved as per the ISA.
 * Set to -1 during early init when an execute-only key cannot be provided.
 */
static int execute_only_key = 2;
/* Set during early init from a PVR check: false on POWER7/POWER7+. */
static bool pkey_execute_disable_supported;
41 
42 
/*
 * Layout of the 64-bit key registers: every pkey owns a field of
 * AMR_BITS_PER_PKEY bits, with pkey 0 in the most significant field.
 * A set RD/WR/EX bit denies the corresponding access for that key.
 */
#define AMR_BITS_PER_PKEY 2
#define AMR_RD_BIT 0x1UL
#define AMR_WR_BIT 0x2UL
#define IAMR_EX_BIT 0x1UL
#define PKEY_REG_BITS (sizeof(u64) * 8)
/*
 * Bit offset of the field belonging to @pkey. The argument is fully
 * parenthesized so that any expression (e.g. a conditional) expands
 * correctly.
 */
#define pkeyshift(pkey) (PKEY_REG_BITS - (((pkey) + 1) * AMR_BITS_PER_PKEY))
49 
50 static int __init dt_scan_storage_keys(unsigned long node,
51 				       const char *uname, int depth,
52 				       void *data)
53 {
54 	const char *type = of_get_flat_dt_prop(node, "device_type", NULL);
55 	const __be32 *prop;
56 	int *pkeys_total = (int *) data;
57 
58 	/* We are scanning "cpu" nodes only */
59 	if (type == NULL || strcmp(type, "cpu") != 0)
60 		return 0;
61 
62 	prop = of_get_flat_dt_prop(node, "ibm,processor-storage-keys", NULL);
63 	if (!prop)
64 		return 0;
65 	*pkeys_total = be32_to_cpu(prop[0]);
66 	return 1;
67 }
68 
69 static int scan_pkey_feature(void)
70 {
71 	int ret;
72 	int pkeys_total = 0;
73 
74 	/*
75 	 * Pkey is not supported with Radix translation.
76 	 */
77 	if (early_radix_enabled())
78 		return 0;
79 
80 	ret = of_scan_flat_dt(dt_scan_storage_keys, &pkeys_total);
81 	if (ret == 0) {
82 		/*
83 		 * Let's assume 32 pkeys on P8/P9 bare metal, if its not defined by device
84 		 * tree. We make this exception since some version of skiboot forgot to
85 		 * expose this property on power8/9.
86 		 */
87 		if (!firmware_has_feature(FW_FEATURE_LPAR)) {
88 			unsigned long pvr = mfspr(SPRN_PVR);
89 
90 			if (PVR_VER(pvr) == PVR_POWER8 || PVR_VER(pvr) == PVR_POWER8E ||
91 			    PVR_VER(pvr) == PVR_POWER8NVL || PVR_VER(pvr) == PVR_POWER9)
92 				pkeys_total = 32;
93 		}
94 	}
95 
96 #ifdef CONFIG_PPC_MEM_KEYS
97 	/*
98 	 * Adjust the upper limit, based on the number of bits supported by
99 	 * arch-neutral code.
100 	 */
101 	pkeys_total = min_t(int, pkeys_total,
102 			    ((ARCH_VM_PKEY_FLAGS >> VM_PKEY_SHIFT) + 1));
103 #endif
104 	return pkeys_total;
105 }
106 
107 void __init pkey_early_init_devtree(void)
108 {
109 	int pkeys_total, i;
110 
111 #ifdef CONFIG_PPC_MEM_KEYS
112 	/*
113 	 * We define PKEY_DISABLE_EXECUTE in addition to the arch-neutral
114 	 * generic defines for PKEY_DISABLE_ACCESS and PKEY_DISABLE_WRITE.
115 	 * Ensure that the bits a distinct.
116 	 */
117 	BUILD_BUG_ON(PKEY_DISABLE_EXECUTE &
118 		     (PKEY_DISABLE_ACCESS | PKEY_DISABLE_WRITE));
119 
120 	/*
121 	 * pkey_to_vmflag_bits() assumes that the pkey bits are contiguous
122 	 * in the vmaflag. Make sure that is really the case.
123 	 */
124 	BUILD_BUG_ON(__builtin_clzl(ARCH_VM_PKEY_FLAGS >> VM_PKEY_SHIFT) +
125 		     __builtin_popcountl(ARCH_VM_PKEY_FLAGS >> VM_PKEY_SHIFT)
126 				!= (sizeof(u64) * BITS_PER_BYTE));
127 #endif
128 	/*
129 	 * Only P7 and above supports SPRN_AMR update with MSR[PR] = 1
130 	 */
131 	if (!early_cpu_has_feature(CPU_FTR_ARCH_206))
132 		return;
133 
134 	/* scan the device tree for pkey feature */
135 	pkeys_total = scan_pkey_feature();
136 	if (!pkeys_total)
137 		goto out;
138 
139 	/* Allow all keys to be modified by default */
140 	default_uamor = ~0x0UL;
141 
142 	cur_cpu_spec->mmu_features |= MMU_FTR_PKEY;
143 
144 	/*
145 	 * The device tree cannot be relied to indicate support for
146 	 * execute_disable support. Instead we use a PVR check.
147 	 */
148 	if (pvr_version_is(PVR_POWER7) || pvr_version_is(PVR_POWER7p))
149 		pkey_execute_disable_supported = false;
150 	else
151 		pkey_execute_disable_supported = true;
152 
153 #ifdef CONFIG_PPC_4K_PAGES
154 	/*
155 	 * The OS can manage only 8 pkeys due to its inability to represent them
156 	 * in the Linux 4K PTE. Mark all other keys reserved.
157 	 */
158 	num_pkey = min(8, pkeys_total);
159 #else
160 	num_pkey = pkeys_total;
161 #endif
162 
163 	if (unlikely(num_pkey <= execute_only_key) || !pkey_execute_disable_supported) {
164 		/*
165 		 * Insufficient number of keys to support
166 		 * execute only key. Mark it unavailable.
167 		 */
168 		execute_only_key = -1;
169 	} else {
170 		/*
171 		 * Mark the execute_only_pkey as not available for
172 		 * user allocation via pkey_alloc.
173 		 */
174 		reserved_allocation_mask |= (0x1 << execute_only_key);
175 
176 		/*
177 		 * Deny READ/WRITE for execute_only_key.
178 		 * Allow execute in IAMR.
179 		 */
180 		default_amr  |= (0x3ul << pkeyshift(execute_only_key));
181 		default_iamr &= ~(0x1ul << pkeyshift(execute_only_key));
182 
183 		/*
184 		 * Clear the uamor bits for this key.
185 		 */
186 		default_uamor &= ~(0x3ul << pkeyshift(execute_only_key));
187 	}
188 
189 	if (unlikely(num_pkey <= 3)) {
190 		/*
191 		 * Insufficient number of keys to support
192 		 * KUAP/KUEP feature.
193 		 */
194 		disable_kuep = true;
195 		disable_kuap = true;
196 		WARN(1, "Disabling kernel user protection due to low (%d) max supported keys\n", num_pkey);
197 	} else {
198 		/*  handle key which is used by kernel for KAUP */
199 		reserved_allocation_mask |= (0x1 << 3);
200 		/*
201 		 * Mark access for kup_key in default amr so that
202 		 * we continue to operate with that AMR in
203 		 * copy_to/from_user().
204 		 */
205 		default_amr   &= ~(0x3ul << pkeyshift(3));
206 		default_iamr  &= ~(0x1ul << pkeyshift(3));
207 		default_uamor &= ~(0x3ul << pkeyshift(3));
208 	}
209 
210 	/*
211 	 * Allow access for only key 0. And prevent any other modification.
212 	 */
213 	default_amr   &= ~(0x3ul << pkeyshift(0));
214 	default_iamr  &= ~(0x1ul << pkeyshift(0));
215 	default_uamor &= ~(0x3ul << pkeyshift(0));
216 	/*
217 	 * key 0 is special in that we want to consider it an allocated
218 	 * key which is preallocated. We don't allow changing AMR bits
219 	 * w.r.t key 0. But one can pkey_free(key0)
220 	 */
221 	initial_allocation_mask |= (0x1 << 0);
222 
223 	/*
224 	 * key 1 is recommended not to be used. PowerISA(3.0) page 1015,
225 	 * programming note.
226 	 */
227 	reserved_allocation_mask |= (0x1 << 1);
228 	default_uamor &= ~(0x3ul << pkeyshift(1));
229 
230 	/*
231 	 * Prevent the usage of OS reserved keys. Update UAMOR
232 	 * for those keys. Also mark the rest of the bits in the
233 	 * 32 bit mask as reserved.
234 	 */
235 	for (i = num_pkey; i < 32 ; i++) {
236 		reserved_allocation_mask |= (0x1 << i);
237 		default_uamor &= ~(0x3ul << pkeyshift(i));
238 	}
239 	/*
240 	 * Prevent the allocation of reserved keys too.
241 	 */
242 	initial_allocation_mask |= reserved_allocation_mask;
243 
244 	pr_info("Enabling pkeys with max key count %d\n", num_pkey);
245 out:
246 	/*
247 	 * Setup uamor on boot cpu
248 	 */
249 	mtspr(SPRN_UAMOR, default_uamor);
250 
251 	return;
252 }
253 
254 #ifdef CONFIG_PPC_KUEP
255 void setup_kuep(bool disabled)
256 {
257 	if (disabled)
258 		return;
259 	/*
260 	 * On hash if PKEY feature is not enabled, disable KUAP too.
261 	 */
262 	if (!early_radix_enabled() && !early_mmu_has_feature(MMU_FTR_PKEY))
263 		return;
264 
265 	if (smp_processor_id() == boot_cpuid) {
266 		pr_info("Activating Kernel Userspace Execution Prevention\n");
267 		cur_cpu_spec->mmu_features |= MMU_FTR_BOOK3S_KUEP;
268 	}
269 
270 	/*
271 	 * Radix always uses key0 of the IAMR to determine if an access is
272 	 * allowed. We set bit 0 (IBM bit 1) of key0, to prevent instruction
273 	 * fetch.
274 	 */
275 	mtspr(SPRN_IAMR, AMR_KUEP_BLOCKED);
276 	isync();
277 }
278 #endif
279 
280 #ifdef CONFIG_PPC_KUAP
281 void setup_kuap(bool disabled)
282 {
283 	if (disabled)
284 		return;
285 	/*
286 	 * On hash if PKEY feature is not enabled, disable KUAP too.
287 	 */
288 	if (!early_radix_enabled() && !early_mmu_has_feature(MMU_FTR_PKEY))
289 		return;
290 
291 	if (smp_processor_id() == boot_cpuid) {
292 		pr_info("Activating Kernel Userspace Access Prevention\n");
293 		cur_cpu_spec->mmu_features |= MMU_FTR_BOOK3S_KUAP;
294 	}
295 
296 	/*
297 	 * Set the default kernel AMR values on all cpus.
298 	 */
299 	mtspr(SPRN_AMR, AMR_KUAP_BLOCKED);
300 	isync();
301 }
302 #endif
303 
304 static inline void update_current_thread_amr(u64 value)
305 {
306 	current->thread.regs->amr = value;
307 }
308 
309 static inline void update_current_thread_iamr(u64 value)
310 {
311 	if (!likely(pkey_execute_disable_supported))
312 		return;
313 
314 	current->thread.regs->iamr = value;
315 }
316 
317 #ifdef CONFIG_PPC_MEM_KEYS
318 void pkey_mm_init(struct mm_struct *mm)
319 {
320 	if (!mmu_has_feature(MMU_FTR_PKEY))
321 		return;
322 	mm_pkey_allocation_map(mm) = initial_allocation_mask;
323 	mm->context.execute_only_pkey = execute_only_key;
324 }
325 
326 static inline void init_amr(int pkey, u8 init_bits)
327 {
328 	u64 new_amr_bits = (((u64)init_bits & 0x3UL) << pkeyshift(pkey));
329 	u64 old_amr = current_thread_amr() & ~((u64)(0x3ul) << pkeyshift(pkey));
330 
331 	update_current_thread_amr(old_amr | new_amr_bits);
332 }
333 
334 static inline void init_iamr(int pkey, u8 init_bits)
335 {
336 	u64 new_iamr_bits = (((u64)init_bits & 0x1UL) << pkeyshift(pkey));
337 	u64 old_iamr = current_thread_iamr() & ~((u64)(0x1ul) << pkeyshift(pkey));
338 
339 	update_current_thread_iamr(old_iamr | new_iamr_bits);
340 }
341 
342 /*
343  * Set the access rights in AMR IAMR and UAMOR registers for @pkey to that
344  * specified in @init_val.
345  */
346 int __arch_set_user_pkey_access(struct task_struct *tsk, int pkey,
347 				unsigned long init_val)
348 {
349 	u64 new_amr_bits = 0x0ul;
350 	u64 new_iamr_bits = 0x0ul;
351 	u64 pkey_bits, uamor_pkey_bits;
352 
353 	/*
354 	 * Check whether the key is disabled by UAMOR.
355 	 */
356 	pkey_bits = 0x3ul << pkeyshift(pkey);
357 	uamor_pkey_bits = (default_uamor & pkey_bits);
358 
359 	/*
360 	 * Both the bits in UAMOR corresponding to the key should be set
361 	 */
362 	if (uamor_pkey_bits != pkey_bits)
363 		return -EINVAL;
364 
365 	if (init_val & PKEY_DISABLE_EXECUTE) {
366 		if (!pkey_execute_disable_supported)
367 			return -EINVAL;
368 		new_iamr_bits |= IAMR_EX_BIT;
369 	}
370 	init_iamr(pkey, new_iamr_bits);
371 
372 	/* Set the bits we need in AMR: */
373 	if (init_val & PKEY_DISABLE_ACCESS)
374 		new_amr_bits |= AMR_RD_BIT | AMR_WR_BIT;
375 	else if (init_val & PKEY_DISABLE_WRITE)
376 		new_amr_bits |= AMR_WR_BIT;
377 
378 	init_amr(pkey, new_amr_bits);
379 	return 0;
380 }
381 
382 int execute_only_pkey(struct mm_struct *mm)
383 {
384 	return mm->context.execute_only_pkey;
385 }
386 
387 static inline bool vma_is_pkey_exec_only(struct vm_area_struct *vma)
388 {
389 	/* Do this check first since the vm_flags should be hot */
390 	if ((vma->vm_flags & VM_ACCESS_FLAGS) != VM_EXEC)
391 		return false;
392 
393 	return (vma_pkey(vma) == vma->vm_mm->context.execute_only_pkey);
394 }
395 
396 /*
397  * This should only be called for *plain* mprotect calls.
398  */
399 int __arch_override_mprotect_pkey(struct vm_area_struct *vma, int prot,
400 				  int pkey)
401 {
402 	/*
403 	 * If the currently associated pkey is execute-only, but the requested
404 	 * protection is not execute-only, move it back to the default pkey.
405 	 */
406 	if (vma_is_pkey_exec_only(vma) && (prot != PROT_EXEC))
407 		return 0;
408 
409 	/*
410 	 * The requested protection is execute-only. Hence let's use an
411 	 * execute-only pkey.
412 	 */
413 	if (prot == PROT_EXEC) {
414 		pkey = execute_only_pkey(vma->vm_mm);
415 		if (pkey > 0)
416 			return pkey;
417 	}
418 
419 	/* Nothing to override. */
420 	return vma_pkey(vma);
421 }
422 
423 static bool pkey_access_permitted(int pkey, bool write, bool execute)
424 {
425 	int pkey_shift;
426 	u64 amr;
427 
428 	pkey_shift = pkeyshift(pkey);
429 	if (execute)
430 		return !(current_thread_iamr() & (IAMR_EX_BIT << pkey_shift));
431 
432 	amr = current_thread_amr();
433 	if (write)
434 		return !(amr & (AMR_WR_BIT << pkey_shift));
435 
436 	return !(amr & (AMR_RD_BIT << pkey_shift));
437 }
438 
439 bool arch_pte_access_permitted(u64 pte, bool write, bool execute)
440 {
441 	if (!mmu_has_feature(MMU_FTR_PKEY))
442 		return true;
443 
444 	return pkey_access_permitted(pte_to_pkey_bits(pte), write, execute);
445 }
446 
447 /*
448  * We only want to enforce protection keys on the current thread because we
449  * effectively have no access to AMR/IAMR for other threads or any way to tell
450  * which AMR/IAMR in a threaded process we could use.
451  *
452  * So do not enforce things if the VMA is not from the current mm, or if we are
453  * in a kernel thread.
454  */
455 bool arch_vma_access_permitted(struct vm_area_struct *vma, bool write,
456 			       bool execute, bool foreign)
457 {
458 	if (!mmu_has_feature(MMU_FTR_PKEY))
459 		return true;
460 	/*
461 	 * Do not enforce our key-permissions on a foreign vma.
462 	 */
463 	if (foreign || vma_is_foreign(vma))
464 		return true;
465 
466 	return pkey_access_permitted(vma_pkey(vma), write, execute);
467 }
468 
469 void arch_dup_pkeys(struct mm_struct *oldmm, struct mm_struct *mm)
470 {
471 	if (!mmu_has_feature(MMU_FTR_PKEY))
472 		return;
473 
474 	/* Duplicate the oldmm pkey state in mm: */
475 	mm_pkey_allocation_map(mm) = mm_pkey_allocation_map(oldmm);
476 	mm->context.execute_only_pkey = oldmm->context.execute_only_pkey;
477 }
478 
479 #endif /* CONFIG_PPC_MEM_KEYS */
480