xref: /titanic_52/usr/src/uts/i86pc/vm/hat_i86.h (revision d2ec54f7875f7e05edd56195adbeb593c947763f)
1 /*
2  * CDDL HEADER START
3  *
4  * The contents of this file are subject to the terms of the
5  * Common Development and Distribution License (the "License").
6  * You may not use this file except in compliance with the License.
7  *
8  * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
9  * or http://www.opensolaris.org/os/licensing.
10  * See the License for the specific language governing permissions
11  * and limitations under the License.
12  *
13  * When distributing Covered Code, include this CDDL HEADER in each
14  * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
15  * If applicable, add the following below this CDDL HEADER, with the
16  * fields enclosed by brackets "[]" replaced with your own identifying
17  * information: Portions Copyright [yyyy] [name of copyright owner]
18  *
19  * CDDL HEADER END
20  */
21 /*
22  * Copyright 2007 Sun Microsystems, Inc.  All rights reserved.
23  * Use is subject to license terms.
24  */
25 
26 #ifndef	_VM_HAT_I86_H
27 #define	_VM_HAT_I86_H
28 
29 #pragma ident	"%Z%%M%	%I%	%E% SMI"
30 
31 #ifdef	__cplusplus
32 extern "C" {
33 #endif
34 
35 /*
36  * VM - Hardware Address Translation management.
37  *
38  * This file describes the contents of the x86_64 HAT data structures.
39  */
40 #include <sys/types.h>
41 #include <sys/t_lock.h>
42 #include <sys/cpuvar.h>
43 #include <sys/x_call.h>
44 #include <vm/seg.h>
45 #include <vm/page.h>
46 #include <sys/vmparam.h>
47 #include <sys/vm_machparam.h>
48 #include <sys/promif.h>
49 #include <vm/hat_pte.h>
50 #include <vm/htable.h>
51 #include <vm/hment.h>
52 
53 /*
54  * The essential data types involved:
55  *
56  * htable_t	- There is one of these for each page table and it is used
57  *		by the HAT to manage the page table.
58  *
59  * hment_t	- Links together multiple PTEs to a single page.
60  */
61 
/*
 * VLP processes have a 32 bit address range, so their top level page table
 * is at level 2 and holds only 4 PTEs.
 *
 * VLP_LEVEL	- level of the top page table of a VLP hat
 * VLP_NUM_PTES	- number of PTEs in that top level table
 * VLP_SIZE	- size in bytes of VLP_NUM_PTES page table entries
 * TOP_LEVEL(h)	- VLP_LEVEL when HAT_VLP is set in h->hat_flags, otherwise
 *		mmu.max_level
 * VLP_COPY(fromptep, toptep) - copies entries 0 through 3 of fromptep into
 *		toptep. Each argument is expanded four times, so it must be
 *		free of side effects. The arguments are parenthesized so that
 *		pointer expressions (e.g. "base + n") can be passed safely.
 *		The expansion is a brace-enclosed block, not an expression.
 */
#define	VLP_LEVEL	(2)
#define	VLP_NUM_PTES	(4)
#define	VLP_SIZE	(VLP_NUM_PTES * sizeof (x86pte_t))
#define	TOP_LEVEL(h)	(((h)->hat_flags & HAT_VLP) ? VLP_LEVEL : mmu.max_level)
#define	VLP_COPY(fromptep, toptep) { \
	(toptep)[0] = (fromptep)[0]; \
	(toptep)[1] = (fromptep)[1]; \
	(toptep)[2] = (fromptep)[2]; \
	(toptep)[3] = (fromptep)[3]; \
}
76 
77 /*
78  * The hat struct exists for each address space.
79  */
80 struct hat {
81 	kmutex_t	hat_mutex;
82 	struct as	*hat_as;
83 	uint_t		hat_stats;
84 	pgcnt_t		hat_pages_mapped[MAX_PAGE_LEVEL + 1];
85 	pgcnt_t		hat_ism_pgcnt;
86 	cpuset_t	hat_cpus;
87 	uint16_t	hat_flags;
88 	htable_t	*hat_htable;	/* top level htable */
89 	struct hat	*hat_next;
90 	struct hat	*hat_prev;
91 	uint_t		hat_num_hash;	/* number of htable hash buckets */
92 	htable_t	**hat_ht_hash;	/* htable hash buckets */
93 	htable_t	*hat_ht_cached;	/* cached free htables */
94 	x86pte_t	hat_vlp_ptes[VLP_NUM_PTES];
95 #if defined(__amd64) && defined(__xpv)
96 	pfn_t		hat_user_ptable; /* alt top ptable for user mode */
97 #endif
98 };
99 typedef struct hat hat_t;
100 
/*
 * Adjust hat->hat_pages_mapped[level] by +1 / -1 using atomic_add_long().
 *
 * Each macro expands to a single expression with no trailing semicolon;
 * the caller supplies it. This keeps the macros usable as the body of an
 * unbraced if/else.
 */
#define	PGCNT_INC(hat, level)	\
	atomic_add_long(&(hat)->hat_pages_mapped[level], 1)
#define	PGCNT_DEC(hat, level)	\
	atomic_add_long(&(hat)->hat_pages_mapped[level], -1)
105 
/*
 * Flags for the hat_flags field
 */

/*
 * HAT_FREEING - set when HAT is being destroyed - mostly used to detect that
 *	demap()s can be avoided.
 */
#define	HAT_FREEING	(1 << 0)	/* 0x0001 */

/*
 * HAT_VLP - indicates a 32 bit process has a virtual address range less than
 *	the hardware's physical address range. (VLP->Virtual Less-than Physical)
 *	Note - never used on the hypervisor.
 */
#define	HAT_VLP		(1 << 1)	/* 0x0002 */

/*
 * HAT_VICTIM - set while a hat is being examined for page table stealing;
 *	prevents it from being freed.
 */
#define	HAT_VICTIM	(1 << 2)	/* 0x0004 */

/*
 * HAT_SHARED - the hat has exported its page tables via hat_share()
 */
#define	HAT_SHARED	(1 << 3)	/* 0x0008 */

/*
 * HAT_PINNED - on the hypervisor, indicates the top page table has been
 *	pinned.
 */
#define	HAT_PINNED	(1 << 4)	/* 0x0010 */
128 
/*
 * Platform specific attribute bit for hat_devload(): force the mapping to
 * be uncached.
 */
#define	HAT_PLAT_NOCACHE	(1 << 20)	/* 0x100000 */
133 
134 /*
135  * Simple statistics for the HAT. These are just counters that are
136  * atomically incremented. They can be reset directly from the kernel
137  * debugger.
138  */
139 struct hatstats {
140 	ulong_t	hs_reap_attempts;
141 	ulong_t	hs_reaped;
142 	ulong_t	hs_steals;
143 	ulong_t	hs_ptable_allocs;
144 	ulong_t	hs_ptable_frees;
145 	ulong_t	hs_htable_rgets;	/* allocs from reserve */
146 	ulong_t	hs_htable_rputs;	/* putbacks to reserve */
147 	ulong_t	hs_htable_shared;	/* number of htables shared */
148 	ulong_t	hs_htable_unshared;	/* number of htables unshared */
149 	ulong_t	hs_hm_alloc;
150 	ulong_t	hs_hm_free;
151 	ulong_t	hs_hm_put_reserve;
152 	ulong_t	hs_hm_get_reserve;
153 	ulong_t	hs_hm_steals;
154 	ulong_t	hs_hm_steal_exam;
155 	ulong_t hs_tlb_inval_delayed;
156 };
157 extern struct hatstats hatstat;
/*
 * HATSTAT_INC(x) - on DEBUG kernels add one to hatstat.x (a plain,
 * non-atomic update) and yield the new value; otherwise it is the
 * constant 0 and x is not evaluated.
 */
#if defined(DEBUG)
#define	HATSTAT_INC(x)	(hatstat.x += 1)
#else	/* !DEBUG */
#define	HATSTAT_INC(x)	(0)
#endif	/* DEBUG */
163 
164 #if defined(_KERNEL)
165 
/*
 * Helpers for aligning hat_XXX() address arguments to a page boundary.
 *
 * ALIGN2PAGE(a)	- a, as a uintptr_t, masked with MMU_PAGEMASK
 * IS_PAGEALIGNED(a)	- 1 if a has no bits set within MMU_PAGEOFFSET,
 *			else 0
 */
#define	ALIGN2PAGE(a)		(((uintptr_t)(a)) & MMU_PAGEMASK)
#define	IS_PAGEALIGNED(a)	(!((uintptr_t)(a) & MMU_PAGEOFFSET))
171 
172 extern uint_t	khat_running;	/* set at end of hat_kern_setup() */
173 extern cpuset_t khat_cpuset;	/* cpuset for kernal address demap Xcalls */
174 extern kmutex_t hat_list_lock;
175 extern kcondvar_t hat_list_cv;
176 
177 
178 
179 /*
180  * Interfaces to setup a cpu private mapping (ie. preemption disabled).
181  * The attr and flags arguments are the same as for hat_devload().
182  * setup() must be called once, then any number of calls to remap(),
183  * followed by a final call to release()
184  *
185  * Used by ppcopy(), page_zero(), the memscrubber, and the kernel debugger.
186  */
187 typedef paddr_t hat_mempte_t;				/* phys addr of PTE */
188 extern hat_mempte_t hat_mempte_setup(caddr_t addr);
189 extern void hat_mempte_remap(pfn_t, caddr_t, hat_mempte_t,
190 	uint_t attr, uint_t flags);
191 extern void hat_mempte_release(caddr_t addr, hat_mempte_t);
192 
193 /*
194  * Interfaces to manage which thread has access to htable and hment reserves.
195  * The USE_HAT_RESERVES macro should always be recomputed in full. Its value
196  * (due to curthread) can change after any call into kmem/vmem.
197  */
198 extern uint_t can_steal_post_boot;
199 extern uint_t use_boot_reserve;
/*
 * The terms are tested left to right and evaluation stops at the first one
 * that is true, so vmem_is_populator() is only called when all of the
 * preceding checks are false. Yields 1 or 0.
 */
#define	USE_HAT_RESERVES()				\
	((use_boot_reserve != 0) ||			\
	(curthread->t_hatdepth > 1) ||			\
	(panicstr != NULL) ||				\
	vmem_is_populator())
203 
/*
 * Initialization routines needed by startup, mp_startup...
 */
extern void hat_cpu_online(struct cpu *cp);
extern void hat_cpu_offline(struct cpu *cp);
extern void setup_vaddr_for_ppcopy(struct cpu *cp);
extern void teardown_vaddr_for_ppcopy(struct cpu *cp);
extern void clear_boot_mappings(uintptr_t low, uintptr_t high);
211 extern void clear_boot_mappings(uintptr_t, uintptr_t);
212 
213 /*
214  * magic value to indicate that all TLB entries should be demapped.
215  */
216 #define	DEMAP_ALL_ADDR	(~(uintptr_t)0)
217 
218 /*
219  * not in any include file???
220  */
221 extern void halt(char *fmt);
222 
223 /*
224  * x86 specific routines for use online in setup or i86pc/vm files
225  */
226 extern void hat_kern_alloc(caddr_t segmap_base, size_t segmap_size,
227 	caddr_t ekernelheap);
228 extern void hat_kern_setup(void);
229 extern void hat_tlb_inval(struct hat *hat, uintptr_t va);
230 extern void hat_pte_unmap(htable_t *ht, uint_t entry, uint_t flags,
231 	x86pte_t old_pte, void *pte_ptr);
232 extern void hat_init_finish(void);
233 extern caddr_t hat_kpm_pfn2va(pfn_t pfn);
234 extern pfn_t hat_kpm_va2pfn(caddr_t);
235 extern page_t *hat_kpm_vaddr2page(caddr_t);
236 extern uintptr_t hat_kernelbase(uintptr_t);
237 extern void hat_kmap_init(uintptr_t base, size_t len);
238 
239 extern hment_t *hati_page_unmap(page_t *pp, htable_t *ht, uint_t entry);
240 
#ifndef __xpv
/*
 * Routines that deal with delayed TLB invalidations for idle CPUs.
 * Not declared when building for the hypervisor (__xpv).
 */
extern void tlb_going_idle(void);
extern void tlb_service(void);
#endif	/* !__xpv */

/*
 * hat_switch() is invoked to load a new context into %cr3.
 */
extern void hat_switch(struct hat *hat);
253 
#if defined(__xpv)

/*
 * Interfaces to use around code that maps/unmaps grant table references.
 */
extern void hat_prepare_mapping(hat_t *hat, caddr_t addr);
extern void hat_release_mapping(hat_t *hat, caddr_t addr);

#define	XPV_DISALLOW_MIGRATE()	xen_block_migrate()
#define	XPV_ALLOW_MIGRATE()	xen_allow_migrate()

#else	/* !__xpv */

/* When not building for the hypervisor these expand to nothing. */
#define	XPV_DISALLOW_MIGRATE()
#define	XPV_ALLOW_MIGRATE()

#define	pfn_is_foreign(pfn)	__lintzero

#endif	/* __xpv */
272 
273 
274 #endif	/* _KERNEL */
275 
276 #ifdef	__cplusplus
277 }
278 #endif
279 
280 #endif	/* _VM_HAT_I86_H */
281