1 /*
2 * CDDL HEADER START
3 *
4 * The contents of this file are subject to the terms of the
5 * Common Development and Distribution License (the "License").
6 * You may not use this file except in compliance with the License.
7 *
8 * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
9 * or http://www.opensolaris.org/os/licensing.
10 * See the License for the specific language governing permissions
11 * and limitations under the License.
12 *
13 * When distributing Covered Code, include this CDDL HEADER in each
14 * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
15 * If applicable, add the following below this CDDL HEADER, with the
16 * fields enclosed by brackets "[]" replaced with your own identifying
17 * information: Portions Copyright [yyyy] [name of copyright owner]
18 *
19 * CDDL HEADER END
20 */
21 /*
22 * Copyright 2009 Sun Microsystems, Inc. All rights reserved.
23 * Use is subject to license terms.
24 */
25 /*
26 * Copyright 2014 Josef 'Jeff' Sipek <jeffpc@josefsipek.net>
27 * Copyright (c) 2014 by Delphix. All rights reserved.
28 */
29
30 #include <sys/cpuvar.h>
31 #include <sys/psm.h>
32 #include <sys/archsystm.h>
33 #include <sys/apic.h>
34 #include <sys/sunddi.h>
35 #include <sys/ddi_impldefs.h>
36 #include <sys/mach_intr.h>
37 #include <sys/sysmacros.h>
38 #include <sys/trap.h>
39 #include <sys/x86_archext.h>
40 #include <sys/privregs.h>
41 #include <sys/psm_common.h>
42
43 /* Function prototypes of local apic and X2APIC */
44 static uint64_t local_apic_read(uint32_t reg);
45 static void local_apic_write(uint32_t reg, uint64_t value);
46 static int get_local_apic_pri(void);
47 static void local_apic_write_task_reg(uint64_t value);
48 static void local_apic_write_int_cmd(uint32_t cpu_id, uint32_t cmd1);
49 static uint64_t local_x2apic_read(uint32_t msr);
50 static void local_x2apic_write(uint32_t msr, uint64_t value);
51 static int get_local_x2apic_pri(void);
52 static void local_x2apic_write_task_reg(uint64_t value);
53 static void local_x2apic_write_int_cmd(uint32_t cpu_id, uint32_t cmd1);
54
55 /*
56 * According to the X2APIC specification:
57 *
58 * xAPIC global enable X2APIC enable Description
59 * (IA32_APIC_BASE[11]) (IA32_APIC_BASE[10])
60 * -----------------------------------------------------------
61 * 0 0 APIC is disabled
62 * 0 1 Invalid
63 * 1 0 APIC is enabled in xAPIC mode
64 * 1 1 APIC is enabled in X2APIC mode
65 * -----------------------------------------------------------
66 */
67 int x2apic_enable = 1;
68 apic_mode_t apic_mode = LOCAL_APIC; /* Default mode is Local APIC */
69
70 /* See apic_directed_EOI_supported(). Currently 3-state variable. */
71 volatile int apic_directed_eoi_state = 2;
72
73 /* Uses MMIO (Memory Mapped IO) */
74 static apic_reg_ops_t local_apic_regs_ops = {
75 local_apic_read,
76 local_apic_write,
77 get_local_apic_pri,
78 local_apic_write_task_reg,
79 local_apic_write_int_cmd,
80 apic_send_EOI,
81 };
82
83 /* X2APIC : Uses RDMSR/WRMSR instructions to access APIC registers */
84 static apic_reg_ops_t x2apic_regs_ops = {
85 local_x2apic_read,
86 local_x2apic_write,
87 get_local_x2apic_pri,
88 local_x2apic_write_task_reg,
89 local_x2apic_write_int_cmd,
90 apic_send_EOI,
91 };
92
93 int apic_have_32bit_cr8 = 0;
94
95 /* The default ops is local APIC (Memory Mapped IO) */
96 apic_reg_ops_t *apic_reg_ops = &local_apic_regs_ops;
97
98 /*
99 * APIC register ops related data sturctures and functions.
100 */
101 void apic_send_EOI();
102 void apic_send_directed_EOI(uint32_t irq);
103
104 #define X2APIC_ENABLE_BIT 10
105
106 /*
107 * Local APIC Implementation
108 */
109 static uint64_t
local_apic_read(uint32_t reg)110 local_apic_read(uint32_t reg)
111 {
112 return ((uint32_t)apicadr[reg]);
113 }
114
115 static void
local_apic_write(uint32_t reg,uint64_t value)116 local_apic_write(uint32_t reg, uint64_t value)
117 {
118 apicadr[reg] = (uint32_t)value;
119 }
120
121 static int
get_local_apic_pri(void)122 get_local_apic_pri(void)
123 {
124 #if defined(__amd64)
125 return ((int)getcr8());
126 #else
127 if (apic_have_32bit_cr8)
128 return ((int)getcr8());
129 return (apicadr[APIC_TASK_REG]);
130 #endif
131 }
132
133 static void
local_apic_write_task_reg(uint64_t value)134 local_apic_write_task_reg(uint64_t value)
135 {
136 #if defined(__amd64)
137 setcr8((ulong_t)(value >> APIC_IPL_SHIFT));
138 #else
139 if (apic_have_32bit_cr8)
140 setcr8((ulong_t)(value >> APIC_IPL_SHIFT));
141 else
142 apicadr[APIC_TASK_REG] = (uint32_t)value;
143 #endif
144 }
145
146 static void
local_apic_write_int_cmd(uint32_t cpu_id,uint32_t cmd1)147 local_apic_write_int_cmd(uint32_t cpu_id, uint32_t cmd1)
148 {
149 apicadr[APIC_INT_CMD2] = cpu_id << APIC_ICR_ID_BIT_OFFSET;
150 apicadr[APIC_INT_CMD1] = cmd1;
151 }
152
153 /*
154 * X2APIC Implementation.
155 */
156 static uint64_t
local_x2apic_read(uint32_t msr)157 local_x2apic_read(uint32_t msr)
158 {
159 uint64_t i;
160
161 i = (uint64_t)(rdmsr(REG_X2APIC_BASE_MSR + (msr >> 2)) & 0xffffffff);
162 return (i);
163 }
164
165 static void
local_x2apic_write(uint32_t msr,uint64_t value)166 local_x2apic_write(uint32_t msr, uint64_t value)
167 {
168 uint64_t tmp;
169
170 if (msr != APIC_EOI_REG) {
171 tmp = rdmsr(REG_X2APIC_BASE_MSR + (msr >> 2));
172 tmp = (tmp & 0xffffffff00000000) | value;
173 } else {
174 tmp = 0;
175 }
176
177 wrmsr((REG_X2APIC_BASE_MSR + (msr >> 2)), tmp);
178 }
179
180 static int
get_local_x2apic_pri(void)181 get_local_x2apic_pri(void)
182 {
183 return (rdmsr(REG_X2APIC_BASE_MSR + (APIC_TASK_REG >> 2)));
184 }
185
186 static void
local_x2apic_write_task_reg(uint64_t value)187 local_x2apic_write_task_reg(uint64_t value)
188 {
189 X2APIC_WRITE(APIC_TASK_REG, value);
190 }
191
192 static void
local_x2apic_write_int_cmd(uint32_t cpu_id,uint32_t cmd1)193 local_x2apic_write_int_cmd(uint32_t cpu_id, uint32_t cmd1)
194 {
195 wrmsr((REG_X2APIC_BASE_MSR + (APIC_INT_CMD1 >> 2)),
196 (((uint64_t)cpu_id << 32) | cmd1));
197 }
198
199 /*ARGSUSED*/
200 void
apic_send_EOI(uint32_t irq)201 apic_send_EOI(uint32_t irq)
202 {
203 apic_reg_ops->apic_write(APIC_EOI_REG, 0);
204 }
205
206 /*
207 * Support for Directed EOI capability is available in both the xAPIC
208 * and x2APIC mode.
209 */
210 void
apic_send_directed_EOI(uint32_t irq)211 apic_send_directed_EOI(uint32_t irq)
212 {
213 uchar_t ioapicindex;
214 uchar_t vector;
215 apic_irq_t *apic_irq;
216 short intr_index;
217
218 /*
219 * Following the EOI to the local APIC unit, perform a directed
220 * EOI to the IOxAPIC generating the interrupt by writing to its
221 * EOI register.
222 *
223 * A broadcast EOI is not generated.
224 */
225 apic_reg_ops->apic_write(APIC_EOI_REG, 0);
226
227 apic_irq = apic_irq_table[irq];
228 while (apic_irq) {
229 intr_index = apic_irq->airq_mps_intr_index;
230 if (intr_index == ACPI_INDEX || intr_index >= 0) {
231 ioapicindex = apic_irq->airq_ioapicindex;
232 vector = apic_irq->airq_vector;
233 ioapic_write_eoi(ioapicindex, vector);
234 }
235 apic_irq = apic_irq->airq_next;
236 }
237 }
238
239 int
apic_detect_x2apic(void)240 apic_detect_x2apic(void)
241 {
242 if (x2apic_enable == 0)
243 return (0);
244
245 return (is_x86_feature(x86_featureset, X86FSET_X2APIC));
246 }
247
248 void
apic_enable_x2apic(void)249 apic_enable_x2apic(void)
250 {
251 uint64_t apic_base_msr;
252
253 if (apic_local_mode() == LOCAL_X2APIC) {
254 /* BIOS apparently has enabled X2APIC */
255 if (apic_mode != LOCAL_X2APIC)
256 x2apic_update_psm();
257 return;
258 }
259
260 /*
261 * This is the first time we are enabling X2APIC on this CPU
262 */
263 apic_base_msr = rdmsr(REG_APIC_BASE_MSR);
264 apic_base_msr = apic_base_msr | (0x1 << X2APIC_ENABLE_BIT);
265 wrmsr(REG_APIC_BASE_MSR, apic_base_msr);
266
267 if (apic_mode != LOCAL_X2APIC)
268 x2apic_update_psm();
269 }
270
271 /*
272 * Determine which mode the current CPU is in. See the table above.
273 * (IA32_APIC_BASE[11]) (IA32_APIC_BASE[10])
274 */
275 int
apic_local_mode(void)276 apic_local_mode(void)
277 {
278 uint64_t apic_base_msr;
279 int bit = ((0x1 << (X2APIC_ENABLE_BIT + 1)) |
280 (0x1 << X2APIC_ENABLE_BIT));
281
282 apic_base_msr = rdmsr(REG_APIC_BASE_MSR);
283
284 if ((apic_base_msr & bit) == bit)
285 return (LOCAL_X2APIC);
286 else
287 return (LOCAL_APIC);
288 }
289
290 void
apic_set_directed_EOI_handler()291 apic_set_directed_EOI_handler()
292 {
293 apic_reg_ops->apic_send_eoi = apic_send_directed_EOI;
294 }
295
296 int
apic_directed_EOI_supported()297 apic_directed_EOI_supported()
298 {
299 uint32_t ver;
300
301 /*
302 * There are some known issues with some versions of Linux KVM and QEMU
303 * where by directed EOIs do not properly function and instead get
304 * coalesced at the hypervisor, causing the host not to see interrupts.
305 * Thus, when the platform is KVM, we would like to disable it by
306 * default, but keep it available otherwise.
307 *
308 * We use a three-state variable (apic_directed_eoi_state) to determine
309 * how we handle directed EOI.
310 *
311 * 0 --> Don't do directed EOI at all.
312 * 1 --> Do directed EOI if available, no matter the HW environment.
313 * 2 --> Don't do directed EOI on KVM, but do it otherwise if available.
314 *
315 * If some grinning weirdo put something else in there, treat it as '2'
316 * (i.e. the current default).
317 *
318 * Note, at this time illumos KVM does not identify as KVM. If it does,
319 * we'll need to do some work to determine if it should be caught by
320 * this or if it should show up as its own value of platform_type.
321 */
322 switch (apic_directed_eoi_state) {
323 case 0:
324 /* Don't do it at all. */
325 return (0);
326 case 1:
327 break;
328 case 2:
329 default:
330 /* Only do it if we aren't on KVM. */
331 if (get_hwenv() == HW_KVM)
332 return (0);
333 /* FALLTHRU */
334 }
335
336 ver = apic_reg_ops->apic_read(APIC_VERS_REG);
337 if (ver & APIC_DIRECTED_EOI_BIT)
338 return (1);
339
340 return (0);
341 }
342
343 /*
344 * Change apic_reg_ops depending upon the apic_mode.
345 */
346 void
apic_change_ops()347 apic_change_ops()
348 {
349 if (apic_mode == LOCAL_APIC)
350 apic_reg_ops = &local_apic_regs_ops;
351 else if (apic_mode == LOCAL_X2APIC)
352 apic_reg_ops = &x2apic_regs_ops;
353 }
354
355 /*
356 * Generates an interprocessor interrupt to another CPU when X2APIC mode is
357 * enabled.
358 */
359 void
x2apic_send_ipi(int cpun,int ipl)360 x2apic_send_ipi(int cpun, int ipl)
361 {
362 int vector;
363 ulong_t flag;
364
365 ASSERT(apic_mode == LOCAL_X2APIC);
366
367 /*
368 * With X2APIC, Intel relaxed the semantics of the
369 * WRMSR instruction such that references to the X2APIC
370 * MSR registers are no longer serializing instructions.
371 * The code that initiates IPIs assumes that some sort
372 * of memory serialization occurs. The old APIC code
373 * did a write to uncachable memory mapped registers.
374 * Any reference to uncached memory is a serializing
375 * operation. To mimic those semantics here, we do an
376 * atomic operation, which translates to a LOCK OR instruction,
377 * which is serializing.
378 */
379 atomic_or_ulong(&flag, 1);
380
381 vector = apic_resv_vector[ipl];
382
383 flag = intr_clear();
384
385 /*
386 * According to X2APIC specification in section '2.3.5.1' of
387 * Interrupt Command Register Semantics, the semantics of
388 * programming Interrupt Command Register to dispatch an interrupt
389 * is simplified. A single MSR write to the 64-bit ICR is required
390 * for dispatching an interrupt. Specifically with the 64-bit MSR
391 * interface to ICR, system software is not required to check the
392 * status of the delivery status bit prior to writing to the ICR
393 * to send an IPI. With the removal of the Delivery Status bit,
394 * system software no longer has a reason to read the ICR. It remains
395 * readable only to aid in debugging.
396 */
397 #ifdef DEBUG
398 APIC_AV_PENDING_SET();
399 #endif /* DEBUG */
400
401 if ((cpun == psm_get_cpu_id())) {
402 X2APIC_WRITE(X2APIC_SELF_IPI, vector);
403 } else {
404 apic_reg_ops->apic_write_int_cmd(
405 apic_cpus[cpun].aci_local_id, vector);
406 }
407
408 intr_restore(flag);
409 }
410
411 /*
412 * Generates IPI to another CPU depending on the local APIC mode.
413 * apic_send_ipi() and x2apic_send_ipi() depends on the configured
414 * mode of the local APIC, but that may not match the actual mode
415 * early in CPU startup.
416 *
417 * Any changes made to this routine must be accompanied by similar
418 * changes to apic_send_ipi().
419 */
420 void
apic_common_send_ipi(int cpun,int ipl)421 apic_common_send_ipi(int cpun, int ipl)
422 {
423 int vector;
424 ulong_t flag;
425 int mode = apic_local_mode();
426
427 if (mode == LOCAL_X2APIC) {
428 x2apic_send_ipi(cpun, ipl);
429 return;
430 }
431
432 ASSERT(mode == LOCAL_APIC);
433
434 vector = apic_resv_vector[ipl];
435 ASSERT((vector >= APIC_BASE_VECT) && (vector <= APIC_SPUR_INTR));
436 flag = intr_clear();
437 while (local_apic_regs_ops.apic_read(APIC_INT_CMD1) & AV_PENDING)
438 apic_ret();
439 local_apic_regs_ops.apic_write_int_cmd(apic_cpus[cpun].aci_local_id,
440 vector);
441 intr_restore(flag);
442 }
443