xref: /illumos-gate/usr/src/uts/i86pc/sys/machcpuvar.h (revision 3665ce8aeee26b1a84fb98951ef011e0779e1ae2)
1 /*
2  * CDDL HEADER START
3  *
4  * The contents of this file are subject to the terms of the
5  * Common Development and Distribution License (the "License").
6  * You may not use this file except in compliance with the License.
7  *
8  * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
9  * or http://www.opensolaris.org/os/licensing.
10  * See the License for the specific language governing permissions
11  * and limitations under the License.
12  *
13  * When distributing Covered Code, include this CDDL HEADER in each
14  * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
15  * If applicable, add the following below this CDDL HEADER, with the
16  * fields enclosed by brackets "[]" replaced with your own identifying
17  * information: Portions Copyright [yyyy] [name of copyright owner]
18  *
19  * CDDL HEADER END
20  */
21 /*
22  * Copyright 2009 Sun Microsystems, Inc.  All rights reserved.
23  * Use is subject to license terms.
24  */
25 /*
26  * Copyright 2019 Joyent, Inc.
27  */
28 
29 #ifndef	_SYS_MACHCPUVAR_H
30 #define	_SYS_MACHCPUVAR_H
31 
32 #ifdef	__cplusplus
33 extern "C" {
34 #endif
35 
36 #include <sys/inttypes.h>
37 #include <sys/x_call.h>
38 #include <sys/tss.h>
39 #include <sys/segments.h>
40 #include <sys/rm_platter.h>
41 #include <sys/avintr.h>
42 #include <sys/pte.h>
43 #include <sys/stddef.h>
44 #include <sys/debug.h>
45 #include <sys/cpuvar.h>
46 
47 #ifndef	_ASM
48 /*
49  * On a virtualized platform a virtual cpu (vcpu) may not actually be
50  * running on a physical cpu (pcpu), especially when a configuration has
51  * more vcpus than pcpus.  vcpu_on_pcpu() reports, if it is able to,
52  * whether the specified vcpu is currently running on a pcpu.  If that
53  * is not known or cannot be determined, VCPU_STATE_UNKNOWN is returned.
54  */
55 #define	VCPU_STATE_UNKNOWN	0	/* state could not be determined */
56 #define	VCPU_ON_PCPU		1	/* vcpu is running on a pcpu */
57 #define	VCPU_NOT_ON_PCPU	2	/* vcpu is not running on a pcpu */
58 
59 extern int vcpu_on_pcpu(processorid_t);
60 
61 /*
62  * Machine specific fields of the cpu struct
63  * defined in common/sys/cpuvar.h.
64  *
65  * Note:  This is kinda kludgy but seems to be the best
66  * of our alternatives.
67  */
68 
69 struct cpuid_info;		/* only used via pointer: mcpu_cpi */
70 struct cpu_ucode_info;		/* only used via pointer: mcpu_ucode_info */
71 struct cmi_hdl;			/* only used via pointer: mcpu_cmi_hdl */
72 
73 /*
74  * A note about the hypervisor affinity bits: a one bit in the affinity mask
75  * means the corresponding event channel is allowed to be serviced
76  * by this cpu.
77  */
/*
 * Event bookkeeping that struct machcpu references through mcpu_evt_pend
 * ("hypervisor: pending events").
 *
 * pending_sel and pending_evts have one entry per PIL (0 .. PIL_MAX).
 * Each pending_evts[pil] row, and evt_affinity, holds one ulong_t for every
 * bit of a ulong_t (sizeof (ulong_t) * 8 words).
 *
 * NOTE(review): presumably each bit of pending_sel[pil] selects one word of
 * pending_evts[pil] -- confirm against the event channel code.
 */
78 struct xen_evt_data {
79 	ulong_t		pending_sel[PIL_MAX + 1]; /* event array selectors */
80 	ulong_t		pending_evts[PIL_MAX + 1][sizeof (ulong_t) * 8];
81 	ulong_t		evt_affinity[sizeof (ulong_t) * 8]; /* service on cpu */
82 };
83 
/*
 * Save area used by the trampoline code that switches %cr3 between the
 * kernel and user page tables.  struct machcpu embeds three of these
 * (mcpu_kpti, mcpu_kpti_flt and mcpu_kpti_dbg) at the end of its page-sized
 * tail.
 *
 * The middle of the structure (kf_err through kf_ss) doubles as the frame
 * the CPU pushes when an interrupt is taken on the user page table, so the
 * order and size of the members are significant and must not be changed
 * casually.
 *
 * NOTE(review): the kf_*_redzone members are presumably guard words
 * separating the regions of the frame -- confirm against the trampoline
 * code.
 * NOTE(review): with kf_unused there are 18 members; if greg_t is 64 bits
 * wide that is 144 bytes, a multiple of 16 -- TODO confirm.
 */
84 struct kpti_frame {
85 	uint64_t	kf_lower_redzone;
86 
87 	/* Stashed value of %cr3 when we entered the trampoline. */
88 	greg_t		kf_tr_cr3;
89 
90 	/*
91 	 * We use %r13-r14 as scratch registers in the trampoline code,
92 	 * so stash those here "below" the rest of the stack so they can be
93 	 * pushed/popped if needed.
94 	 */
95 	greg_t		kf_r14;
96 	greg_t		kf_r13;
97 
98 	/*
99 	 * Part of this struct is used as the HW stack frame when taking an
100 	 * interrupt on the user page table. The CPU is going to push a bunch
101 	 * of regs onto the stack pointer set in the TSS/IDT (which we set to
102 	 * &kf_rsp here).
103 	 *
104 	 * This is only a temporary holding area for them (we'll move them over
105 	 * to the real interrupt stack once we've set %cr3).
106 	 *
107 	 * Note that these must be cleared during a process switch on this cpu.
	 *
	 * NOTE(review): the member comments below mark kf_err as the bottom
	 * and kf_tr_rsp as the top of the hardware frame, so the stack
	 * pointer programmed into the TSS/IDT presumably refers to kf_tr_rsp
	 * rather than kf_rsp -- confirm against the code that sets it up.
108 	 */
109 	greg_t		kf_err;		/* Bottom of initial hw stack frame */
110 	greg_t		kf_rip;
111 	greg_t		kf_cs;
112 	greg_t		kf_rflags;
113 	greg_t		kf_rsp;
114 	greg_t		kf_ss;
115 
116 	greg_t		kf_tr_rsp;	/* Top of HW stack frame */
117 	/* We also write this with the %rsp value on tramp entry */
118 
119 	/* Written to 0x1 when this kpti_frame is in use. */
120 	uint64_t	kf_tr_flag;
121 
122 	uint64_t	kf_middle_redzone;
123 
124 	/*
125 	 * The things we need to write to %cr3 to change between page tables.
126 	 * These live "above" the HW stack.
127 	 */
128 	greg_t		kf_kernel_cr3;
129 	greg_t		kf_user_cr3;
130 	greg_t		kf_tr_ret_rsp;
131 
132 	uint64_t	kf_unused;		/* For 16-byte align */
133 
134 	uint64_t	kf_upper_redzone;
135 };
136 
/*
 * Per-CPU SMT state, embedded in struct machcpu as mcpu_smt.
 *
 * NOTE(review): nothing in this header describes the members; the remarks
 * below are inferred from their names and types and should be confirmed
 * against the code that uses them.
 */
137 typedef struct cpu_smt {
138 	lock_t cs_lock;		/* presumably guards the fields below */
139 	char cs_pad[56];	/* presumably keeps cs_lock apart from the rest */
140 	struct cpu *cs_sib;	/* presumably the sibling cpu -- confirm */
141 	volatile uint64_t cs_intr_depth;
142 	volatile uint64_t cs_state;
143 	volatile uint64_t cs_sibstate;
144 } cpu_smt_t;
145 
146 /*
147  * The first value, MACHCPU_SIZE, is the size of all the members in the cpu_t
148  * AND struct machcpu, before we get to the mcpu_pad and the kpti area.
149  * The KPTI area contains per-CPU data that is visible in both sets of
150  * page-tables, and hence must be page-aligned and page-sized. See
151  * hat_pcp_setup().
152  *
153  * There are CTASSERTs in os/intr.c that verify this all works out.
154  */
/*
 * MACHCPU_SIZE is a literal, so it has to be kept in step with the real
 * structure sizes by hand.
 * NOTE(review): which addend belongs to cpu_t and which to struct machcpu
 * is not stated here.
 *
 * MACHCPU_PAD sizes mcpu_pad: whatever is left of one MMU page after
 * MACHCPU_SIZE bytes.
 *
 * MACHCPU_PAD2 sizes mcpu_pad2 so that mcpu_pad2, the three kpti_frames and
 * the 16-byte mcpu_pad3 at the end of struct machcpu add up to exactly
 * MMU_PAGESIZE bytes.
 */
155 #define	MACHCPU_SIZE	(1568 + 696)
156 #define	MACHCPU_PAD	(MMU_PAGESIZE - MACHCPU_SIZE)
157 #define	MACHCPU_PAD2	(MMU_PAGESIZE - 16 - 3 * sizeof (struct kpti_frame))
158 
/*
 * Machine-specific per-CPU state.  The macros later in this header reach it
 * as the cpu_m member of a cpu (for example (cpu)->cpu_m.mcpu_mwait).
 *
 * Layout matters here: MACHCPU_SIZE is a literal describing the size of the
 * members that precede mcpu_pad, and everything from mcpu_pad2 onward is
 * sized to fill exactly one MMU page.  Adding, removing or resizing a member
 * requires revisiting MACHCPU_SIZE.
 */
159 struct	machcpu {
160 	/*
161 	 * x_call fields - used for interprocessor cross calls
162 	 */
163 	struct xc_msg	*xc_msgbox;
164 	struct xc_msg	*xc_curmsg;
165 	struct xc_msg	*xc_free;
166 	xc_data_t	xc_data;
167 	uint32_t	xc_wait_cnt;
168 	volatile uint32_t xc_work_cnt;
169 
170 	int		mcpu_nodeid;		/* node-id */
171 	int		mcpu_pri;		/* CPU priority */
172 
173 	struct hat	*mcpu_current_hat; /* cpu's current hat */
174 
175 	struct hat_cpu_info	*mcpu_hat_info;
176 
177 	volatile ulong_t	mcpu_tlb_info;
178 
179 	/* i86 hardware table addresses that cannot be shared */
180 
181 	user_desc_t	*mcpu_gdt;	/* GDT */
182 	gate_desc_t	*mcpu_idt;	/* current IDT */
183 
184 	tss_t		*mcpu_tss;	/* TSS */
185 	void		*mcpu_ldt;
186 	size_t		mcpu_ldt_len;
187 
188 	kmutex_t	mcpu_ppaddr_mutex;
189 	caddr_t		mcpu_caddr1;	/* per cpu CADDR1 */
190 	caddr_t		mcpu_caddr2;	/* per cpu CADDR2 */
191 	uint64_t	mcpu_caddr1pte;
192 	uint64_t	mcpu_caddr2pte;
193 
194 	struct softint	mcpu_softinfo;
195 	uint64_t	pil_high_start[HIGH_LEVELS];
196 	uint64_t	intrstat[PIL_MAX + 1][2];
197 
198 	struct cpuid_info	 *mcpu_cpi;
199 
200 #if defined(__amd64)
201 	greg_t	mcpu_rtmp_rsp;		/* syscall: temporary %rsp stash */
202 	greg_t	mcpu_rtmp_r15;		/* syscall: temporary %r15 stash */
203 #endif
204 
205 	struct vcpu_info *mcpu_vcpu_info;
206 	uint64_t	mcpu_gdtpa;	/* hypervisor: GDT physical address */
207 
208 	uint16_t mcpu_intr_pending;	/* hypervisor: pending intrpt levels */
209 	uint16_t mcpu_ec_mbox;		/* hypervisor: evtchn_dev mailbox */
210 	struct xen_evt_data *mcpu_evt_pend; /* hypervisor: pending events */
211 
212 	volatile uint32_t *mcpu_mwait;	/* MONITOR/MWAIT buffer */
213 	void (*mcpu_idle_cpu)(void);	/* idle function */
214 	uint16_t mcpu_idle_type;	/* CPU next idle type */
215 	uint16_t max_cstates;		/* supported max cstates */
216 
217 	struct cpu_ucode_info	*mcpu_ucode_info;
218 
219 	void			*mcpu_pm_mach_state;
220 	struct cmi_hdl		*mcpu_cmi_hdl;
221 	void			*mcpu_mach_ctx_ptr;
222 
223 	/*
224 	 * A stamp that is unique per processor and changes
225 	 * whenever an interrupt happens. Useful for detecting
226 	 * if a section of code gets interrupted.
227 	 * The high order 16 bits will hold the cpu->cpu_id.
228 	 * The low order bits will be incremented on every interrupt.
229 	 */
230 	volatile uint32_t	mcpu_istamp;
231 
232 	cpu_smt_t		mcpu_smt;
233 
	/* Filler between the ordinary members above and the page below. */
234 	char			mcpu_pad[MACHCPU_PAD];
235 
236 	/*
	 * This is the start of the page: mcpu_pad2, the three kpti_frames
	 * and mcpu_pad3 together are sized (see MACHCPU_PAD2) to occupy
	 * exactly MMU_PAGESIZE bytes.
	 */
237 	char			mcpu_pad2[MACHCPU_PAD2];
238 	struct kpti_frame	mcpu_kpti;
239 	struct kpti_frame	mcpu_kpti_flt;
240 	struct kpti_frame	mcpu_kpti_dbg;
241 	char			mcpu_pad3[16];	/* the 16 in MACHCPU_PAD2 */
242 };
243 
244 #define	NINTR_THREADS	(LOCK_LEVEL-1)	/* number of interrupt threads */
/*
 * Values stored in the MONITOR/MWAIT buffer that mcpu_mwait points to.
 */
245 #define	MWAIT_HALTED	(1)		/* mcpu_mwait set when halting */
246 #define	MWAIT_RUNNING	(0)		/* mcpu_mwait set to wakeup */
247 #define	MWAIT_WAKEUP_IPI	(2)	/* need IPI to wakeup */
/*
 * Store MWAIT_RUNNING into the given cpu's mwait buffer.  The argument is
 * evaluated once.  mcpu_mwait is dereferenced unconditionally, so it must
 * point at a valid buffer when this is used.
 */
248 #define	MWAIT_WAKEUP(cpu)	(*((cpu)->cpu_m.mcpu_mwait) = MWAIT_RUNNING)
249 
250 #endif	/* _ASM */
251 
252 /* Please DON'T add any more of this namespace-poisoning sewage here */
253 
/*
 * Shorthand for selected struct machcpu members: each macro rewrites the
 * identifier cpu_<x> to cpu_m.mcpu_<x>, so cp->cpu_pri expands to
 * cp->cpu_m.mcpu_pri.
 *
 * These are plain object-like macros defined outside the _ASM guard, so they
 * rewrite every occurrence of these identifiers in any file that includes
 * this header, whether or not it refers to a cpu.  That is the reason for
 * the warning above.
 */
254 #define	cpu_nodeid cpu_m.mcpu_nodeid
255 #define	cpu_pri cpu_m.mcpu_pri
256 #define	cpu_current_hat cpu_m.mcpu_current_hat
257 #define	cpu_hat_info cpu_m.mcpu_hat_info
258 #define	cpu_ppaddr_mutex cpu_m.mcpu_ppaddr_mutex
259 #define	cpu_gdt cpu_m.mcpu_gdt
260 #define	cpu_idt cpu_m.mcpu_idt
261 #define	cpu_tss cpu_m.mcpu_tss
262 #define	cpu_caddr1 cpu_m.mcpu_caddr1
263 #define	cpu_caddr2 cpu_m.mcpu_caddr2
264 #define	cpu_softinfo cpu_m.mcpu_softinfo
265 #define	cpu_caddr1pte cpu_m.mcpu_caddr1pte
266 #define	cpu_caddr2pte cpu_m.mcpu_caddr2pte
267 
268 #ifdef	__cplusplus
269 }
270 #endif
271 
272 #endif	/* _SYS_MACHCPUVAR_H */
273