xref: /linux/arch/powerpc/include/asm/book3s/64/hash.h (revision c94cd9508b1335b949fd13ebd269313c65492df0)
1 /* SPDX-License-Identifier: GPL-2.0 */
2 #ifndef _ASM_POWERPC_BOOK3S_64_HASH_H
3 #define _ASM_POWERPC_BOOK3S_64_HASH_H
4 #ifdef __KERNEL__
5 
6 #include <asm/asm-const.h>
7 #include <asm/book3s/64/slice.h>
8 
9 /*
10  * Common bits between 4K and 64K pages in a linux-style PTE.
11  * Additional bits may be defined in pgtable-hash64-*.h
12  *
13  */
14 #define H_PTE_NONE_MASK		_PAGE_HPTEFLAGS
15 
16 #ifdef CONFIG_PPC_64K_PAGES
17 #include <asm/book3s/64/hash-64k.h>
18 #else
19 #include <asm/book3s/64/hash-4k.h>
20 #endif
21 
22 #define H_PTRS_PER_PTE		(1 << H_PTE_INDEX_SIZE)
23 #define H_PTRS_PER_PMD		(1 << H_PMD_INDEX_SIZE)
24 #define H_PTRS_PER_PUD		(1 << H_PUD_INDEX_SIZE)
25 
26 /* Bits to set in a PMD/PUD/PGD entry valid bit*/
27 #define HASH_PMD_VAL_BITS		(0x8000000000000000UL)
28 #define HASH_PUD_VAL_BITS		(0x8000000000000000UL)
29 #define HASH_PGD_VAL_BITS		(0x8000000000000000UL)
30 
31 /*
32  * Size of EA range mapped by our pagetables.
33  */
34 #define H_PGTABLE_EADDR_SIZE	(H_PTE_INDEX_SIZE + H_PMD_INDEX_SIZE + \
35 				 H_PUD_INDEX_SIZE + H_PGD_INDEX_SIZE + PAGE_SHIFT)
36 #define H_PGTABLE_RANGE		(ASM_CONST(1) << H_PGTABLE_EADDR_SIZE)
37 /*
38  * Top 2 bits are ignored in page table walk.
39  */
40 #define EA_MASK			(~(0xcUL << 60))
41 
42 /*
43  * We store the slot details in the second half of page table.
44  * Increase the pud level table so that hugetlb ptes can be stored
45  * at pud level.
46  */
47 #if defined(CONFIG_HUGETLB_PAGE) &&  defined(CONFIG_PPC_64K_PAGES)
48 #define H_PUD_CACHE_INDEX	(H_PUD_INDEX_SIZE + 1)
49 #else
50 #define H_PUD_CACHE_INDEX	(H_PUD_INDEX_SIZE)
51 #endif
52 
53 /*
54  * +------------------------------+
55  * |                              |
56  * |                              |
57  * |                              |
58  * +------------------------------+  Kernel virtual map end (0xc00e000000000000)
59  * |                              |
60  * |                              |
61  * |      512TB/16TB of vmemmap   |
62  * |                              |
63  * |                              |
64  * +------------------------------+  Kernel vmemmap  start
65  * |                              |
66  * |      512TB/16TB of IO map    |
67  * |                              |
68  * +------------------------------+  Kernel IO map start
69  * |                              |
70  * |      512TB/16TB of vmap      |
71  * |                              |
72  * +------------------------------+  Kernel virt start (0xc008000000000000)
73  * |                              |
74  * |                              |
75  * |                              |
76  * +------------------------------+  Kernel linear (0xc.....)
77  */
78 
79 #define H_VMALLOC_START		H_KERN_VIRT_START
80 #define H_VMALLOC_SIZE		H_KERN_MAP_SIZE
81 #define H_VMALLOC_END		(H_VMALLOC_START + H_VMALLOC_SIZE)
82 
83 #define H_KERN_IO_START		H_VMALLOC_END
84 #define H_KERN_IO_SIZE		H_KERN_MAP_SIZE
85 #define H_KERN_IO_END		(H_KERN_IO_START + H_KERN_IO_SIZE)
86 
87 #define H_VMEMMAP_START		H_KERN_IO_END
88 #define H_VMEMMAP_SIZE		H_KERN_MAP_SIZE
89 #define H_VMEMMAP_END		(H_VMEMMAP_START + H_VMEMMAP_SIZE)
90 
91 #define NON_LINEAR_REGION_ID(ea)	((((unsigned long)ea - H_KERN_VIRT_START) >> REGION_SHIFT) + 2)
92 
93 /*
94  * Region IDs
95  */
96 #define USER_REGION_ID		0
97 #define LINEAR_MAP_REGION_ID	1
98 #define VMALLOC_REGION_ID	NON_LINEAR_REGION_ID(H_VMALLOC_START)
99 #define IO_REGION_ID		NON_LINEAR_REGION_ID(H_KERN_IO_START)
100 #define VMEMMAP_REGION_ID	NON_LINEAR_REGION_ID(H_VMEMMAP_START)
101 #define INVALID_REGION_ID	(VMEMMAP_REGION_ID + 1)
102 
103 /*
104  * Defines the address of the vmemap area, in its own region on
105  * hash table CPUs.
106  */
107 
108 /* PTEIDX nibble */
109 #define _PTEIDX_SECONDARY	0x8
110 #define _PTEIDX_GROUP_IX	0x7
111 
112 #define H_PMD_BAD_BITS		(PTE_TABLE_SIZE-1)
113 #define H_PUD_BAD_BITS		(PMD_TABLE_SIZE-1)
114 
115 #ifndef __ASSEMBLY__
116 static inline int get_region_id(unsigned long ea)
117 {
118 	int region_id;
119 	int id = (ea >> 60UL);
120 
121 	if (id == 0)
122 		return USER_REGION_ID;
123 
124 	if (id != (PAGE_OFFSET >> 60))
125 		return INVALID_REGION_ID;
126 
127 	if (ea < H_KERN_VIRT_START)
128 		return LINEAR_MAP_REGION_ID;
129 
130 	BUILD_BUG_ON(NON_LINEAR_REGION_ID(H_VMALLOC_START) != 2);
131 
132 	region_id = NON_LINEAR_REGION_ID(ea);
133 	return region_id;
134 }
135 
136 static inline int hash__pmd_same(pmd_t pmd_a, pmd_t pmd_b)
137 {
138 	return (((pmd_raw(pmd_a) ^ pmd_raw(pmd_b)) & ~cpu_to_be64(_PAGE_HPTEFLAGS)) == 0);
139 }
140 
141 #define	hash__pmd_bad(pmd)		(pmd_val(pmd) & H_PMD_BAD_BITS)
142 
143 /*
144  * pud comparison that will work with both pte and page table pointer.
145  */
146 static inline int hash__pud_same(pud_t pud_a, pud_t pud_b)
147 {
148 	return (((pud_raw(pud_a) ^ pud_raw(pud_b)) & ~cpu_to_be64(_PAGE_HPTEFLAGS)) == 0);
149 }
150 #define	hash__pud_bad(pud)		(pud_val(pud) & H_PUD_BAD_BITS)
151 
152 static inline int hash__p4d_bad(p4d_t p4d)
153 {
154 	return (p4d_val(p4d) == 0);
155 }
156 #ifdef CONFIG_STRICT_KERNEL_RWX
157 extern void hash__mark_rodata_ro(void);
158 extern void hash__mark_initmem_nx(void);
159 #endif
160 
161 extern void hpte_need_flush(struct mm_struct *mm, unsigned long addr,
162 			    pte_t *ptep, unsigned long pte, int huge);
163 unsigned long htab_convert_pte_flags(unsigned long pteflags, unsigned long flags);
164 /* Atomic PTE updates */
165 static inline unsigned long hash__pte_update_one(pte_t *ptep, unsigned long clr,
166 						 unsigned long set)
167 {
168 	__be64 old_be, tmp_be;
169 
170 	__asm__ __volatile__(
171 	"1:	ldarx	%0,0,%3		# pte_update\n\
172 	and.	%1,%0,%6\n\
173 	bne-	1b \n\
174 	andc	%1,%0,%4 \n\
175 	or	%1,%1,%7\n\
176 	stdcx.	%1,0,%3 \n\
177 	bne-	1b"
178 	: "=&r" (old_be), "=&r" (tmp_be), "=m" (*ptep)
179 	: "r" (ptep), "r" (cpu_to_be64(clr)), "m" (*ptep),
180 	  "r" (cpu_to_be64(H_PAGE_BUSY)), "r" (cpu_to_be64(set))
181 	: "cc" );
182 
183 	return be64_to_cpu(old_be);
184 }
185 
186 static inline unsigned long hash__pte_update(struct mm_struct *mm,
187 					 unsigned long addr,
188 					 pte_t *ptep, unsigned long clr,
189 					 unsigned long set,
190 					 int huge)
191 {
192 	unsigned long old;
193 
194 	old = hash__pte_update_one(ptep, clr, set);
195 
196 	if (IS_ENABLED(CONFIG_PPC_4K_PAGES) && huge) {
197 		unsigned int psize = get_slice_psize(mm, addr);
198 		int nb, i;
199 
200 		if (psize == MMU_PAGE_16M)
201 			nb = SZ_16M / PMD_SIZE;
202 		else if (psize == MMU_PAGE_16G)
203 			nb = SZ_16G / PUD_SIZE;
204 		else
205 			nb = 1;
206 
207 		WARN_ON_ONCE(nb == 1);	/* Should never happen */
208 
209 		for (i = 1; i < nb; i++)
210 			hash__pte_update_one(ptep + i, clr, set);
211 	}
212 	/* huge pages use the old page table lock */
213 	if (!huge)
214 		assert_pte_locked(mm, addr);
215 
216 	if (old & H_PAGE_HASHPTE)
217 		hpte_need_flush(mm, addr, ptep, old, huge);
218 
219 	return old;
220 }
221 
222 /* Set the dirty and/or accessed bits atomically in a linux PTE, this
223  * function doesn't need to flush the hash entry
224  */
225 static inline void hash__ptep_set_access_flags(pte_t *ptep, pte_t entry)
226 {
227 	__be64 old, tmp, val, mask;
228 
229 	mask = cpu_to_be64(_PAGE_DIRTY | _PAGE_ACCESSED | _PAGE_READ | _PAGE_WRITE |
230 			   _PAGE_EXEC | _PAGE_SOFT_DIRTY);
231 
232 	val = pte_raw(entry) & mask;
233 
234 	__asm__ __volatile__(
235 	"1:	ldarx	%0,0,%4\n\
236 		and.	%1,%0,%6\n\
237 		bne-	1b \n\
238 		or	%0,%3,%0\n\
239 		stdcx.	%0,0,%4\n\
240 		bne-	1b"
241 	:"=&r" (old), "=&r" (tmp), "=m" (*ptep)
242 	:"r" (val), "r" (ptep), "m" (*ptep), "r" (cpu_to_be64(H_PAGE_BUSY))
243 	:"cc");
244 }
245 
246 static inline int hash__pte_same(pte_t pte_a, pte_t pte_b)
247 {
248 	return (((pte_raw(pte_a) ^ pte_raw(pte_b)) & ~cpu_to_be64(_PAGE_HPTEFLAGS)) == 0);
249 }
250 
251 static inline int hash__pte_none(pte_t pte)
252 {
253 	return (pte_val(pte) & ~H_PTE_NONE_MASK) == 0;
254 }
255 
256 unsigned long pte_get_hash_gslot(unsigned long vpn, unsigned long shift,
257 		int ssize, real_pte_t rpte, unsigned int subpg_index);
258 
259 /* This low level function performs the actual PTE insertion
260  * Setting the PTE depends on the MMU type and other factors. It's
261  * an horrible mess that I'm not going to try to clean up now but
262  * I'm keeping it in one place rather than spread around
263  */
264 static inline void hash__set_pte_at(struct mm_struct *mm, unsigned long addr,
265 				  pte_t *ptep, pte_t pte, int percpu)
266 {
267 	/*
268 	 * Anything else just stores the PTE normally. That covers all 64-bit
269 	 * cases, and 32-bit non-hash with 32-bit PTEs.
270 	 */
271 	*ptep = pte;
272 }
273 
274 #ifdef CONFIG_TRANSPARENT_HUGEPAGE
275 extern void hpte_do_hugepage_flush(struct mm_struct *mm, unsigned long addr,
276 				   pmd_t *pmdp, unsigned long old_pmd);
277 #else
278 static inline void hpte_do_hugepage_flush(struct mm_struct *mm,
279 					  unsigned long addr, pmd_t *pmdp,
280 					  unsigned long old_pmd)
281 {
282 	WARN(1, "%s called with THP disabled\n", __func__);
283 }
284 #endif /* CONFIG_TRANSPARENT_HUGEPAGE */
285 
286 
287 int hash__map_kernel_page(unsigned long ea, unsigned long pa, pgprot_t prot);
288 extern int __meminit hash__vmemmap_create_mapping(unsigned long start,
289 					      unsigned long page_size,
290 					      unsigned long phys);
291 extern void hash__vmemmap_remove_mapping(unsigned long start,
292 				     unsigned long page_size);
293 
294 int hash__create_section_mapping(unsigned long start, unsigned long end,
295 				 int nid, pgprot_t prot);
296 int hash__remove_section_mapping(unsigned long start, unsigned long end);
297 
298 #endif /* !__ASSEMBLY__ */
299 #endif /* __KERNEL__ */
300 #endif /* _ASM_POWERPC_BOOK3S_64_HASH_H */
301