xref: /titanic_51/usr/src/uts/i86pc/vm/hat_i86.h (revision a6a74e0e62d62ff750cd4b790be5eacc99c3bb8c)
17c478bd9Sstevel@tonic-gate /*
27c478bd9Sstevel@tonic-gate  * CDDL HEADER START
37c478bd9Sstevel@tonic-gate  *
47c478bd9Sstevel@tonic-gate  * The contents of this file are subject to the terms of the
5ae115bc7Smrj  * Common Development and Distribution License (the "License").
6ae115bc7Smrj  * You may not use this file except in compliance with the License.
77c478bd9Sstevel@tonic-gate  *
87c478bd9Sstevel@tonic-gate  * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
97c478bd9Sstevel@tonic-gate  * or http://www.opensolaris.org/os/licensing.
107c478bd9Sstevel@tonic-gate  * See the License for the specific language governing permissions
117c478bd9Sstevel@tonic-gate  * and limitations under the License.
127c478bd9Sstevel@tonic-gate  *
137c478bd9Sstevel@tonic-gate  * When distributing Covered Code, include this CDDL HEADER in each
147c478bd9Sstevel@tonic-gate  * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
157c478bd9Sstevel@tonic-gate  * If applicable, add the following below this CDDL HEADER, with the
167c478bd9Sstevel@tonic-gate  * fields enclosed by brackets "[]" replaced with your own identifying
177c478bd9Sstevel@tonic-gate  * information: Portions Copyright [yyyy] [name of copyright owner]
187c478bd9Sstevel@tonic-gate  *
197c478bd9Sstevel@tonic-gate  * CDDL HEADER END
207c478bd9Sstevel@tonic-gate  */
217c478bd9Sstevel@tonic-gate /*
227eea693dSMark Johnson  * Copyright 2008 Sun Microsystems, Inc.  All rights reserved.
237c478bd9Sstevel@tonic-gate  * Use is subject to license terms.
247c478bd9Sstevel@tonic-gate  */
25*a6a74e0eSMatthew Ahrens /*
26*a6a74e0eSMatthew Ahrens  * Copyright (c) 2014 by Delphix. All rights reserved.
27*a6a74e0eSMatthew Ahrens  */
287c478bd9Sstevel@tonic-gate 
297c478bd9Sstevel@tonic-gate #ifndef	_VM_HAT_I86_H
307c478bd9Sstevel@tonic-gate #define	_VM_HAT_I86_H
317c478bd9Sstevel@tonic-gate 
327c478bd9Sstevel@tonic-gate 
337c478bd9Sstevel@tonic-gate #ifdef	__cplusplus
347c478bd9Sstevel@tonic-gate extern "C" {
357c478bd9Sstevel@tonic-gate #endif
367c478bd9Sstevel@tonic-gate 
377c478bd9Sstevel@tonic-gate /*
387c478bd9Sstevel@tonic-gate  * VM - Hardware Address Translation management.
397c478bd9Sstevel@tonic-gate  *
407c478bd9Sstevel@tonic-gate  * This file describes the contents of the x86_64 HAT data structures.
417c478bd9Sstevel@tonic-gate  */
427c478bd9Sstevel@tonic-gate #include <sys/types.h>
437c478bd9Sstevel@tonic-gate #include <sys/t_lock.h>
447c478bd9Sstevel@tonic-gate #include <sys/cpuvar.h>
457c478bd9Sstevel@tonic-gate #include <sys/x_call.h>
467c478bd9Sstevel@tonic-gate #include <vm/seg.h>
477c478bd9Sstevel@tonic-gate #include <vm/page.h>
487c478bd9Sstevel@tonic-gate #include <sys/vmparam.h>
497c478bd9Sstevel@tonic-gate #include <sys/vm_machparam.h>
507c478bd9Sstevel@tonic-gate #include <sys/promif.h>
517c478bd9Sstevel@tonic-gate #include <vm/hat_pte.h>
527c478bd9Sstevel@tonic-gate #include <vm/htable.h>
537c478bd9Sstevel@tonic-gate #include <vm/hment.h>
547c478bd9Sstevel@tonic-gate 
557c478bd9Sstevel@tonic-gate /*
567c478bd9Sstevel@tonic-gate  * The essential data types involved:
577c478bd9Sstevel@tonic-gate  *
587c478bd9Sstevel@tonic-gate  * htable_t	- There is one of these for each page table and it is used
597c478bd9Sstevel@tonic-gate  *		by the HAT to manage the page table.
607c478bd9Sstevel@tonic-gate  *
617c478bd9Sstevel@tonic-gate  * hment_t	- Links together multiple PTEs to a single page.
627c478bd9Sstevel@tonic-gate  */
637c478bd9Sstevel@tonic-gate 
/*
 * VLP processes have a 32 bit address range, so their top level page table
 * is at level 2 and contains only 4 PTEs.
 *
 * VLP_LEVEL	- page table level used as the top level of a VLP hat
 * VLP_NUM_PTES	- number of PTEs in that top level table
 * VLP_SIZE	- size in bytes of an array of VLP_NUM_PTES PTEs
 * TOP_LEVEL(h)	- VLP_LEVEL when hat h has HAT_VLP set, else mmu.max_level
 * VLP_COPY(fromptep, toptep)
 *		- copy the 4 top level PTEs from fromptep[] to toptep[]
 *
 * VLP_COPY() expands to a single statement (do { } while (0)) so that it is
 * safe in an unbraced if/else, and its arguments are parenthesized so that
 * pointer expressions such as "base + n" index correctly. Each argument is
 * evaluated four times, so do not pass expressions with side effects.
 */
#define	VLP_LEVEL	(2)
#define	VLP_NUM_PTES	(4)
#define	VLP_SIZE	(VLP_NUM_PTES * sizeof (x86pte_t))
#define	TOP_LEVEL(h)	(((h)->hat_flags & HAT_VLP) ? VLP_LEVEL : mmu.max_level)
#define	VLP_COPY(fromptep, toptep) do { \
	(toptep)[0] = (fromptep)[0]; \
	(toptep)[1] = (fromptep)[1]; \
	(toptep)[2] = (fromptep)[2]; \
	(toptep)[3] = (fromptep)[3]; \
} while (0)
787c478bd9Sstevel@tonic-gate 
797c478bd9Sstevel@tonic-gate /*
807c478bd9Sstevel@tonic-gate  * The hat struct exists for each address space.
817c478bd9Sstevel@tonic-gate  */
827c478bd9Sstevel@tonic-gate struct hat {
837c478bd9Sstevel@tonic-gate 	kmutex_t	hat_mutex;
847c478bd9Sstevel@tonic-gate 	struct as	*hat_as;
857c478bd9Sstevel@tonic-gate 	uint_t		hat_stats;
867c478bd9Sstevel@tonic-gate 	pgcnt_t		hat_pages_mapped[MAX_PAGE_LEVEL + 1];
87250b7ff9Sjosephb 	pgcnt_t		hat_ism_pgcnt;
887c478bd9Sstevel@tonic-gate 	cpuset_t	hat_cpus;
897c478bd9Sstevel@tonic-gate 	uint16_t	hat_flags;
907c478bd9Sstevel@tonic-gate 	htable_t	*hat_htable;	/* top level htable */
917c478bd9Sstevel@tonic-gate 	struct hat	*hat_next;
927c478bd9Sstevel@tonic-gate 	struct hat	*hat_prev;
937c478bd9Sstevel@tonic-gate 	uint_t		hat_num_hash;	/* number of htable hash buckets */
947c478bd9Sstevel@tonic-gate 	htable_t	**hat_ht_hash;	/* htable hash buckets */
957c478bd9Sstevel@tonic-gate 	htable_t	*hat_ht_cached;	/* cached free htables */
967c478bd9Sstevel@tonic-gate 	x86pte_t	hat_vlp_ptes[VLP_NUM_PTES];
97843e1988Sjohnlev #if defined(__amd64) && defined(__xpv)
98843e1988Sjohnlev 	pfn_t		hat_user_ptable; /* alt top ptable for user mode */
99843e1988Sjohnlev #endif
1007c478bd9Sstevel@tonic-gate };
1017c478bd9Sstevel@tonic-gate typedef struct hat hat_t;
1027c478bd9Sstevel@tonic-gate 
/*
 * Adjust, via atomic_inc_ulong()/atomic_dec_ulong(), the count of pages
 * mapped at page table level "level" in the given hat.
 *
 * The expansions deliberately do not end in a semicolon: the caller supplies
 * it, so "PGCNT_INC(hat, l);" is exactly one statement and the macros can be
 * used as the body of an unbraced if/else.
 */
#define	PGCNT_INC(hat, level)	\
	atomic_inc_ulong(&(hat)->hat_pages_mapped[level])
#define	PGCNT_DEC(hat, level)	\
	atomic_dec_ulong(&(hat)->hat_pages_mapped[level])
1077c478bd9Sstevel@tonic-gate 
/*
 * Bit values for the hat_flags field of struct hat:
 *
 * HAT_FREEING - set while the HAT is being destroyed; mostly used to detect
 *	that demap()s can be avoided.
 *
 * HAT_VLP - indicates a 32 bit process whose virtual address range is smaller
 *	than the hardware's physical address range (VLP -> Virtual Less-than
 *	Physical). Note - never used on the hypervisor.
 *
 * HAT_VICTIM - set while a hat is being examined for page table stealing;
 *	prevents the hat from being freed.
 *
 * HAT_SHARED - the hat has exported its page tables via hat_share().
 *
 * HAT_PINNED - on the hypervisor, indicates the top page table has been
 *	pinned.
 */
#define	HAT_FREEING	(1 << 0)
#define	HAT_VLP		(1 << 1)
#define	HAT_VICTIM	(1 << 2)
#define	HAT_SHARED	(1 << 3)
#define	HAT_PINNED	(1 << 4)
1307c478bd9Sstevel@tonic-gate 
/*
 * Platform specific attribute bit accepted by hat_devload(); it forces the
 * mapping to be uncached.
 */
#define	HAT_PLAT_NOCACHE	(1 << 20)
1357c478bd9Sstevel@tonic-gate 
1367c478bd9Sstevel@tonic-gate /*
1377c478bd9Sstevel@tonic-gate  * Simple statistics for the HAT. These are just counters that are
1387c478bd9Sstevel@tonic-gate  * atomically incremented. They can be reset directly from the kernel
1397c478bd9Sstevel@tonic-gate  * debugger.
1407c478bd9Sstevel@tonic-gate  */
1417c478bd9Sstevel@tonic-gate struct hatstats {
14295c0a3c8Sjosephb 	ulong_t	hs_reap_attempts;
14395c0a3c8Sjosephb 	ulong_t	hs_reaped;
14495c0a3c8Sjosephb 	ulong_t	hs_steals;
14595c0a3c8Sjosephb 	ulong_t	hs_ptable_allocs;
14695c0a3c8Sjosephb 	ulong_t	hs_ptable_frees;
14795c0a3c8Sjosephb 	ulong_t	hs_htable_rgets;	/* allocs from reserve */
14895c0a3c8Sjosephb 	ulong_t	hs_htable_rputs;	/* putbacks to reserve */
14995c0a3c8Sjosephb 	ulong_t	hs_htable_shared;	/* number of htables shared */
15095c0a3c8Sjosephb 	ulong_t	hs_htable_unshared;	/* number of htables unshared */
15195c0a3c8Sjosephb 	ulong_t	hs_hm_alloc;
15295c0a3c8Sjosephb 	ulong_t	hs_hm_free;
15395c0a3c8Sjosephb 	ulong_t	hs_hm_put_reserve;
15495c0a3c8Sjosephb 	ulong_t	hs_hm_get_reserve;
15595c0a3c8Sjosephb 	ulong_t	hs_hm_steals;
15695c0a3c8Sjosephb 	ulong_t	hs_hm_steal_exam;
15795c0a3c8Sjosephb 	ulong_t hs_tlb_inval_delayed;
1587c478bd9Sstevel@tonic-gate };
1597c478bd9Sstevel@tonic-gate extern struct hatstats hatstat;
/*
 * HATSTAT_INC(x) - bump member x of the global hatstat structure.
 * On DEBUG builds this is a plain pre-increment; on non-DEBUG builds it
 * expands to the constant (0) and the member is never touched.
 */
#if defined(DEBUG)
#define	HATSTAT_INC(x)	(++hatstat.x)
#else	/* !DEBUG */
#define	HATSTAT_INC(x)	(0)
#endif	/* DEBUG */
1657c478bd9Sstevel@tonic-gate 
1667c478bd9Sstevel@tonic-gate #if defined(_KERNEL)
1677c478bd9Sstevel@tonic-gate 
/*
 * Helpers for the address arguments of the hat_XXX() routines:
 *
 * ALIGN2PAGE(a)	- the address a masked with MMU_PAGEMASK, as a
 *			  uintptr_t (i.e. aligned to a page boundary)
 * IS_PAGEALIGNED(a)	- non-zero when a has no bits set in MMU_PAGEOFFSET
 */
#define	ALIGN2PAGE(a)		(MMU_PAGEMASK & (uintptr_t)(a))
#define	IS_PAGEALIGNED(a)	(!((uintptr_t)(a) & MMU_PAGEOFFSET))
1737c478bd9Sstevel@tonic-gate 
1747c478bd9Sstevel@tonic-gate extern uint_t	khat_running;	/* set at end of hat_kern_setup() */
1757c478bd9Sstevel@tonic-gate extern cpuset_t khat_cpuset;	/* cpuset for kernal address demap Xcalls */
1767c478bd9Sstevel@tonic-gate extern kmutex_t hat_list_lock;
1777c478bd9Sstevel@tonic-gate extern kcondvar_t hat_list_cv;
1787c478bd9Sstevel@tonic-gate 
1797c478bd9Sstevel@tonic-gate 
1807c478bd9Sstevel@tonic-gate 
1817c478bd9Sstevel@tonic-gate /*
1827c478bd9Sstevel@tonic-gate  * Interfaces to setup a cpu private mapping (ie. preemption disabled).
1837c478bd9Sstevel@tonic-gate  * The attr and flags arguments are the same as for hat_devload().
1847c478bd9Sstevel@tonic-gate  * setup() must be called once, then any number of calls to remap(),
1857c478bd9Sstevel@tonic-gate  * followed by a final call to release()
1867c478bd9Sstevel@tonic-gate  *
1877c478bd9Sstevel@tonic-gate  * Used by ppcopy(), page_zero(), the memscrubber, and the kernel debugger.
1887c478bd9Sstevel@tonic-gate  */
189ae115bc7Smrj typedef paddr_t hat_mempte_t;				/* phys addr of PTE */
190ae115bc7Smrj extern hat_mempte_t hat_mempte_setup(caddr_t addr);
191ae115bc7Smrj extern void hat_mempte_remap(pfn_t, caddr_t, hat_mempte_t,
192ae115bc7Smrj 	uint_t attr, uint_t flags);
193ae115bc7Smrj extern void hat_mempte_release(caddr_t addr, hat_mempte_t);
1947c478bd9Sstevel@tonic-gate 
1957c478bd9Sstevel@tonic-gate /*
19697704650Sjosephb  * Interfaces to manage which thread has access to htable and hment reserves.
19797704650Sjosephb  * The USE_HAT_RESERVES macro should always be recomputed in full. Its value
19897704650Sjosephb  * (due to curthread) can change after any call into kmem/vmem.
1997c478bd9Sstevel@tonic-gate  */
2007c478bd9Sstevel@tonic-gate extern uint_t can_steal_post_boot;
2017c478bd9Sstevel@tonic-gate extern uint_t use_boot_reserve;
20297704650Sjosephb #define	USE_HAT_RESERVES()					\
203aac11643Sjosephb 	(use_boot_reserve || curthread->t_hatdepth > 1 ||	\
20497704650Sjosephb 	panicstr != NULL || vmem_is_populator())
2057c478bd9Sstevel@tonic-gate 
/*
 * Initialization routines needed by startup, mp_startup...
 */
extern void hat_cpu_online(struct cpu *);
extern void hat_cpu_offline(struct cpu *);

extern void setup_vaddr_for_ppcopy(struct cpu *);
extern void teardown_vaddr_for_ppcopy(struct cpu *);

extern void clear_boot_mappings(uintptr_t, uintptr_t);
2147c478bd9Sstevel@tonic-gate 
/*
 * Magic address value (all bits set) meaning that every TLB entry should be
 * demapped rather than a single address.
 */
#define	DEMAP_ALL_ADDR	((uintptr_t)-1)
2197c478bd9Sstevel@tonic-gate 
/*
 * halt() is declared here because it does not appear to be declared in any
 * include file.
 * NOTE(review): confirm whether a shared header now provides this prototype.
 */
extern void halt(char *fmt);
2247c478bd9Sstevel@tonic-gate 
2257c478bd9Sstevel@tonic-gate /*
2267c478bd9Sstevel@tonic-gate  * x86 specific routines for use online in setup or i86pc/vm files
2277c478bd9Sstevel@tonic-gate  */
228ae115bc7Smrj extern void hat_kern_alloc(caddr_t segmap_base, size_t segmap_size,
229ae115bc7Smrj 	caddr_t ekernelheap);
230ae115bc7Smrj extern void hat_kern_setup(void);
231ae115bc7Smrj extern void hat_tlb_inval(struct hat *hat, uintptr_t va);
2327c478bd9Sstevel@tonic-gate extern void hat_pte_unmap(htable_t *ht, uint_t entry, uint_t flags,
233*a6a74e0eSMatthew Ahrens 	x86pte_t old_pte, void *pte_ptr, boolean_t tlb);
2347c478bd9Sstevel@tonic-gate extern void hat_init_finish(void);
2357c478bd9Sstevel@tonic-gate extern caddr_t hat_kpm_pfn2va(pfn_t pfn);
2367c478bd9Sstevel@tonic-gate extern pfn_t hat_kpm_va2pfn(caddr_t);
2377c478bd9Sstevel@tonic-gate extern page_t *hat_kpm_vaddr2page(caddr_t);
2387c478bd9Sstevel@tonic-gate extern uintptr_t hat_kernelbase(uintptr_t);
239ae115bc7Smrj extern void hat_kmap_init(uintptr_t base, size_t len);
2407c478bd9Sstevel@tonic-gate 
2417c478bd9Sstevel@tonic-gate extern hment_t *hati_page_unmap(page_t *pp, htable_t *ht, uint_t entry);
24295c0a3c8Sjosephb 
#ifndef __xpv
/*
 * Routines that deal with delayed TLB invalidations for idle CPUs.
 * They are only declared when not building for the hypervisor (__xpv).
 */
extern void tlb_going_idle(void);
extern void tlb_service(void);
#endif	/* !__xpv */
25095c0a3c8Sjosephb 
/*
 * HAT switch function, invoked to load a new context into %cr3.
 */
extern void hat_switch(struct hat *hat);
2557c478bd9Sstevel@tonic-gate 
#if defined(__xpv)
/*
 * Interfaces to use around code that maps/unmaps grant table references.
 */
extern void hat_prepare_mapping(hat_t *, caddr_t, uint64_t *);
extern void hat_release_mapping(hat_t *, caddr_t);

/* On the hypervisor these call xen_block_migrate()/xen_allow_migrate(). */
#define	XPV_DISALLOW_MIGRATE()	xen_block_migrate()
#define	XPV_ALLOW_MIGRATE()	xen_allow_migrate()

#else	/* !__xpv */

/* Without the hypervisor the migrate hooks expand to nothing. */
#define	XPV_DISALLOW_MIGRATE()	/* nothing */
#define	XPV_ALLOW_MIGRATE()	/* nothing */

/* Without the hypervisor pfn_is_foreign() ignores pfn and is __lintzero. */
#define	pfn_is_foreign(pfn)	__lintzero

#endif	/* __xpv */
274843e1988Sjohnlev 
275843e1988Sjohnlev 
2767c478bd9Sstevel@tonic-gate #endif	/* _KERNEL */
2777c478bd9Sstevel@tonic-gate 
2787c478bd9Sstevel@tonic-gate #ifdef	__cplusplus
2797c478bd9Sstevel@tonic-gate }
2807c478bd9Sstevel@tonic-gate #endif
2817c478bd9Sstevel@tonic-gate 
2827c478bd9Sstevel@tonic-gate #endif	/* _VM_HAT_I86_H */
283