xref: /linux/arch/x86/kernel/cpu/common.c (revision ef8813ab280507972bb57e4b1b502811ad4411e9)
1f0fc4affSYinghai Lu #include <linux/bootmem.h>
29766cdbcSJaswinder Singh Rajput #include <linux/linkage.h>
3f0fc4affSYinghai Lu #include <linux/bitops.h>
49766cdbcSJaswinder Singh Rajput #include <linux/kernel.h>
5186f4360SPaul Gortmaker #include <linux/export.h>
6f7627e25SThomas Gleixner #include <linux/percpu.h>
79766cdbcSJaswinder Singh Rajput #include <linux/string.h>
8ee098e1aSBorislav Petkov #include <linux/ctype.h>
99766cdbcSJaswinder Singh Rajput #include <linux/delay.h>
1068e21be2SIngo Molnar #include <linux/sched/mm.h>
11e6017571SIngo Molnar #include <linux/sched/clock.h>
129164bb4aSIngo Molnar #include <linux/sched/task.h>
139766cdbcSJaswinder Singh Rajput #include <linux/init.h>
140f46efebSMasami Hiramatsu #include <linux/kprobes.h>
159766cdbcSJaswinder Singh Rajput #include <linux/kgdb.h>
169766cdbcSJaswinder Singh Rajput #include <linux/smp.h>
179766cdbcSJaswinder Singh Rajput #include <linux/io.h>
18b51ef52dSLaura Abbott #include <linux/syscore_ops.h>
199766cdbcSJaswinder Singh Rajput 
209766cdbcSJaswinder Singh Rajput #include <asm/stackprotector.h>
21cdd6c482SIngo Molnar #include <asm/perf_event.h>
22f7627e25SThomas Gleixner #include <asm/mmu_context.h>
2349d859d7SH. Peter Anvin #include <asm/archrandom.h>
249766cdbcSJaswinder Singh Rajput #include <asm/hypervisor.h>
259766cdbcSJaswinder Singh Rajput #include <asm/processor.h>
261e02ce4cSAndy Lutomirski #include <asm/tlbflush.h>
27f649e938SPaul Gortmaker #include <asm/debugreg.h>
289766cdbcSJaswinder Singh Rajput #include <asm/sections.h>
29f40c3300SAndy Lutomirski #include <asm/vsyscall.h>
308bdbd962SAlan Cox #include <linux/topology.h>
318bdbd962SAlan Cox #include <linux/cpumask.h>
329766cdbcSJaswinder Singh Rajput #include <asm/pgtable.h>
3360063497SArun Sharma #include <linux/atomic.h>
349766cdbcSJaswinder Singh Rajput #include <asm/proto.h>
359766cdbcSJaswinder Singh Rajput #include <asm/setup.h>
36f7627e25SThomas Gleixner #include <asm/apic.h>
379766cdbcSJaswinder Singh Rajput #include <asm/desc.h>
3878f7f1e5SIngo Molnar #include <asm/fpu/internal.h>
399766cdbcSJaswinder Singh Rajput #include <asm/mtrr.h>
400274f955SGrzegorz Andrejczuk #include <asm/hwcap2.h>
418bdbd962SAlan Cox #include <linux/numa.h>
429766cdbcSJaswinder Singh Rajput #include <asm/asm.h>
430f6ff2bcSDave Hansen #include <asm/bugs.h>
449766cdbcSJaswinder Singh Rajput #include <asm/cpu.h>
459766cdbcSJaswinder Singh Rajput #include <asm/mce.h>
469766cdbcSJaswinder Singh Rajput #include <asm/msr.h>
479766cdbcSJaswinder Singh Rajput #include <asm/pat.h>
48d288e1cfSFenghua Yu #include <asm/microcode.h>
49d288e1cfSFenghua Yu #include <asm/microcode_intel.h>
50e641f5f5SIngo Molnar 
51f7627e25SThomas Gleixner #ifdef CONFIG_X86_LOCAL_APIC
52bdbcdd48STejun Heo #include <asm/uv/uv.h>
53f7627e25SThomas Gleixner #endif
54f7627e25SThomas Gleixner 
55f7627e25SThomas Gleixner #include "cpu.h"
56f7627e25SThomas Gleixner 
570274f955SGrzegorz Andrejczuk u32 elf_hwcap2 __read_mostly;
580274f955SGrzegorz Andrejczuk 
59c2d1cec1SMike Travis /* all of these masks are initialized in setup_cpu_local_masks() */
60c2d1cec1SMike Travis cpumask_var_t cpu_initialized_mask;
619766cdbcSJaswinder Singh Rajput cpumask_var_t cpu_callout_mask;
629766cdbcSJaswinder Singh Rajput cpumask_var_t cpu_callin_mask;
63c2d1cec1SMike Travis 
64c2d1cec1SMike Travis /* representing cpus for which sibling maps can be computed */
65c2d1cec1SMike Travis cpumask_var_t cpu_sibling_setup_mask;
66c2d1cec1SMike Travis 
672f2f52baSBrian Gerst /* correctly size the local cpu masks */
684369f1fbSIngo Molnar void __init setup_cpu_local_masks(void)
692f2f52baSBrian Gerst {
702f2f52baSBrian Gerst 	alloc_bootmem_cpumask_var(&cpu_initialized_mask);
712f2f52baSBrian Gerst 	alloc_bootmem_cpumask_var(&cpu_callin_mask);
722f2f52baSBrian Gerst 	alloc_bootmem_cpumask_var(&cpu_callout_mask);
732f2f52baSBrian Gerst 	alloc_bootmem_cpumask_var(&cpu_sibling_setup_mask);
742f2f52baSBrian Gerst }
752f2f52baSBrian Gerst 
76148f9bb8SPaul Gortmaker static void default_init(struct cpuinfo_x86 *c)
77e8055139SOndrej Zary {
78e8055139SOndrej Zary #ifdef CONFIG_X86_64
7927c13eceSBorislav Petkov 	cpu_detect_cache_sizes(c);
80e8055139SOndrej Zary #else
81e8055139SOndrej Zary 	/* Not much we can do here... */
82e8055139SOndrej Zary 	/* Check if at least it has cpuid */
83e8055139SOndrej Zary 	if (c->cpuid_level == -1) {
84e8055139SOndrej Zary 		/* No cpuid. It must be an ancient CPU */
85e8055139SOndrej Zary 		if (c->x86 == 4)
86e8055139SOndrej Zary 			strcpy(c->x86_model_id, "486");
87e8055139SOndrej Zary 		else if (c->x86 == 3)
88e8055139SOndrej Zary 			strcpy(c->x86_model_id, "386");
89e8055139SOndrej Zary 	}
90e8055139SOndrej Zary #endif
91e8055139SOndrej Zary }
92e8055139SOndrej Zary 
93148f9bb8SPaul Gortmaker static const struct cpu_dev default_cpu = {
94e8055139SOndrej Zary 	.c_init		= default_init,
95e8055139SOndrej Zary 	.c_vendor	= "Unknown",
96e8055139SOndrej Zary 	.c_x86_vendor	= X86_VENDOR_UNKNOWN,
97e8055139SOndrej Zary };
98e8055139SOndrej Zary 
99148f9bb8SPaul Gortmaker static const struct cpu_dev *this_cpu = &default_cpu;
1000a488a53SYinghai Lu 
10106deef89SBrian Gerst DEFINE_PER_CPU_PAGE_ALIGNED(struct gdt_page, gdt_page) = { .gdt = {
102950ad7ffSYinghai Lu #ifdef CONFIG_X86_64
10306deef89SBrian Gerst 	/*
10406deef89SBrian Gerst 	 * We need valid kernel segments for data and code in long mode too
105950ad7ffSYinghai Lu 	 * IRET will check the segment types  kkeil 2000/10/28
106950ad7ffSYinghai Lu 	 * Also sysret mandates a special GDT layout
10706deef89SBrian Gerst 	 *
1089766cdbcSJaswinder Singh Rajput 	 * TLS descriptors are currently at a different place compared to i386.
10906deef89SBrian Gerst 	 * Hopefully nobody expects them at a fixed place (Wine?)
110950ad7ffSYinghai Lu 	 */
1111e5de182SAkinobu Mita 	[GDT_ENTRY_KERNEL32_CS]		= GDT_ENTRY_INIT(0xc09b, 0, 0xfffff),
1121e5de182SAkinobu Mita 	[GDT_ENTRY_KERNEL_CS]		= GDT_ENTRY_INIT(0xa09b, 0, 0xfffff),
1131e5de182SAkinobu Mita 	[GDT_ENTRY_KERNEL_DS]		= GDT_ENTRY_INIT(0xc093, 0, 0xfffff),
1141e5de182SAkinobu Mita 	[GDT_ENTRY_DEFAULT_USER32_CS]	= GDT_ENTRY_INIT(0xc0fb, 0, 0xfffff),
1151e5de182SAkinobu Mita 	[GDT_ENTRY_DEFAULT_USER_DS]	= GDT_ENTRY_INIT(0xc0f3, 0, 0xfffff),
1161e5de182SAkinobu Mita 	[GDT_ENTRY_DEFAULT_USER_CS]	= GDT_ENTRY_INIT(0xa0fb, 0, 0xfffff),
117950ad7ffSYinghai Lu #else
1181e5de182SAkinobu Mita 	[GDT_ENTRY_KERNEL_CS]		= GDT_ENTRY_INIT(0xc09a, 0, 0xfffff),
1191e5de182SAkinobu Mita 	[GDT_ENTRY_KERNEL_DS]		= GDT_ENTRY_INIT(0xc092, 0, 0xfffff),
1201e5de182SAkinobu Mita 	[GDT_ENTRY_DEFAULT_USER_CS]	= GDT_ENTRY_INIT(0xc0fa, 0, 0xfffff),
1211e5de182SAkinobu Mita 	[GDT_ENTRY_DEFAULT_USER_DS]	= GDT_ENTRY_INIT(0xc0f2, 0, 0xfffff),
122f7627e25SThomas Gleixner 	/*
123f7627e25SThomas Gleixner 	 * Segments used for calling PnP BIOS have byte granularity.
124f7627e25SThomas Gleixner 	 * They code segments and data segments have fixed 64k limits,
125f7627e25SThomas Gleixner 	 * the transfer segment sizes are set at run time.
126f7627e25SThomas Gleixner 	 */
1276842ef0eSGlauber de Oliveira Costa 	/* 32-bit code */
1281e5de182SAkinobu Mita 	[GDT_ENTRY_PNPBIOS_CS32]	= GDT_ENTRY_INIT(0x409a, 0, 0xffff),
1296842ef0eSGlauber de Oliveira Costa 	/* 16-bit code */
1301e5de182SAkinobu Mita 	[GDT_ENTRY_PNPBIOS_CS16]	= GDT_ENTRY_INIT(0x009a, 0, 0xffff),
1316842ef0eSGlauber de Oliveira Costa 	/* 16-bit data */
1321e5de182SAkinobu Mita 	[GDT_ENTRY_PNPBIOS_DS]		= GDT_ENTRY_INIT(0x0092, 0, 0xffff),
1336842ef0eSGlauber de Oliveira Costa 	/* 16-bit data */
1341e5de182SAkinobu Mita 	[GDT_ENTRY_PNPBIOS_TS1]		= GDT_ENTRY_INIT(0x0092, 0, 0),
1356842ef0eSGlauber de Oliveira Costa 	/* 16-bit data */
1361e5de182SAkinobu Mita 	[GDT_ENTRY_PNPBIOS_TS2]		= GDT_ENTRY_INIT(0x0092, 0, 0),
137f7627e25SThomas Gleixner 	/*
138f7627e25SThomas Gleixner 	 * The APM segments have byte granularity and their bases
139f7627e25SThomas Gleixner 	 * are set at run time.  All have 64k limits.
140f7627e25SThomas Gleixner 	 */
1416842ef0eSGlauber de Oliveira Costa 	/* 32-bit code */
1421e5de182SAkinobu Mita 	[GDT_ENTRY_APMBIOS_BASE]	= GDT_ENTRY_INIT(0x409a, 0, 0xffff),
143f7627e25SThomas Gleixner 	/* 16-bit code */
1441e5de182SAkinobu Mita 	[GDT_ENTRY_APMBIOS_BASE+1]	= GDT_ENTRY_INIT(0x009a, 0, 0xffff),
1456842ef0eSGlauber de Oliveira Costa 	/* data */
14672c4d853SIngo Molnar 	[GDT_ENTRY_APMBIOS_BASE+2]	= GDT_ENTRY_INIT(0x4092, 0, 0xffff),
147f7627e25SThomas Gleixner 
1481e5de182SAkinobu Mita 	[GDT_ENTRY_ESPFIX_SS]		= GDT_ENTRY_INIT(0xc092, 0, 0xfffff),
1491e5de182SAkinobu Mita 	[GDT_ENTRY_PERCPU]		= GDT_ENTRY_INIT(0xc092, 0, 0xfffff),
15060a5317fSTejun Heo 	GDT_STACK_CANARY_INIT
151950ad7ffSYinghai Lu #endif
15206deef89SBrian Gerst } };
153f7627e25SThomas Gleixner EXPORT_PER_CPU_SYMBOL_GPL(gdt_page);
154f7627e25SThomas Gleixner 
1558c3641e9SDave Hansen static int __init x86_mpx_setup(char *s)
1560c752a93SSuresh Siddha {
1578c3641e9SDave Hansen 	/* require an exact match without trailing characters */
1582cd3949fSDave Hansen 	if (strlen(s))
1592cd3949fSDave Hansen 		return 0;
1600c752a93SSuresh Siddha 
1618c3641e9SDave Hansen 	/* do not emit a message if the feature is not present */
1628c3641e9SDave Hansen 	if (!boot_cpu_has(X86_FEATURE_MPX))
1636bad06b7SSuresh Siddha 		return 1;
1646bad06b7SSuresh Siddha 
1658c3641e9SDave Hansen 	setup_clear_cpu_cap(X86_FEATURE_MPX);
1668c3641e9SDave Hansen 	pr_info("nompx: Intel Memory Protection Extensions (MPX) disabled\n");
167b6f42a4aSFenghua Yu 	return 1;
168b6f42a4aSFenghua Yu }
1698c3641e9SDave Hansen __setup("nompx", x86_mpx_setup);
170b6f42a4aSFenghua Yu 
1710790c9aaSAndy Lutomirski #ifdef CONFIG_X86_64
172c7ad5ad2SAndy Lutomirski static int __init x86_nopcid_setup(char *s)
1730790c9aaSAndy Lutomirski {
174c7ad5ad2SAndy Lutomirski 	/* nopcid doesn't accept parameters */
175c7ad5ad2SAndy Lutomirski 	if (s)
176c7ad5ad2SAndy Lutomirski 		return -EINVAL;
1770790c9aaSAndy Lutomirski 
1780790c9aaSAndy Lutomirski 	/* do not emit a message if the feature is not present */
1790790c9aaSAndy Lutomirski 	if (!boot_cpu_has(X86_FEATURE_PCID))
180c7ad5ad2SAndy Lutomirski 		return 0;
1810790c9aaSAndy Lutomirski 
1820790c9aaSAndy Lutomirski 	setup_clear_cpu_cap(X86_FEATURE_PCID);
1830790c9aaSAndy Lutomirski 	pr_info("nopcid: PCID feature disabled\n");
184c7ad5ad2SAndy Lutomirski 	return 0;
1850790c9aaSAndy Lutomirski }
186c7ad5ad2SAndy Lutomirski early_param("nopcid", x86_nopcid_setup);
1870790c9aaSAndy Lutomirski #endif
1880790c9aaSAndy Lutomirski 
189d12a72b8SAndy Lutomirski static int __init x86_noinvpcid_setup(char *s)
190d12a72b8SAndy Lutomirski {
191d12a72b8SAndy Lutomirski 	/* noinvpcid doesn't accept parameters */
192d12a72b8SAndy Lutomirski 	if (s)
193d12a72b8SAndy Lutomirski 		return -EINVAL;
194d12a72b8SAndy Lutomirski 
195d12a72b8SAndy Lutomirski 	/* do not emit a message if the feature is not present */
196d12a72b8SAndy Lutomirski 	if (!boot_cpu_has(X86_FEATURE_INVPCID))
197d12a72b8SAndy Lutomirski 		return 0;
198d12a72b8SAndy Lutomirski 
199d12a72b8SAndy Lutomirski 	setup_clear_cpu_cap(X86_FEATURE_INVPCID);
200d12a72b8SAndy Lutomirski 	pr_info("noinvpcid: INVPCID feature disabled\n");
201d12a72b8SAndy Lutomirski 	return 0;
202d12a72b8SAndy Lutomirski }
203d12a72b8SAndy Lutomirski early_param("noinvpcid", x86_noinvpcid_setup);
204d12a72b8SAndy Lutomirski 
205ba51dcedSYinghai Lu #ifdef CONFIG_X86_32
206148f9bb8SPaul Gortmaker static int cachesize_override = -1;
207148f9bb8SPaul Gortmaker static int disable_x86_serial_nr = 1;
208f7627e25SThomas Gleixner 
209f7627e25SThomas Gleixner static int __init cachesize_setup(char *str)
210f7627e25SThomas Gleixner {
211f7627e25SThomas Gleixner 	get_option(&str, &cachesize_override);
212f7627e25SThomas Gleixner 	return 1;
213f7627e25SThomas Gleixner }
214f7627e25SThomas Gleixner __setup("cachesize=", cachesize_setup);
215f7627e25SThomas Gleixner 
216f7627e25SThomas Gleixner static int __init x86_sep_setup(char *s)
217f7627e25SThomas Gleixner {
21813530257SAndi Kleen 	setup_clear_cpu_cap(X86_FEATURE_SEP);
219f7627e25SThomas Gleixner 	return 1;
220f7627e25SThomas Gleixner }
221f7627e25SThomas Gleixner __setup("nosep", x86_sep_setup);
222f7627e25SThomas Gleixner 
223f7627e25SThomas Gleixner /* Standard macro to see if a specific flag is changeable */
224f7627e25SThomas Gleixner static inline int flag_is_changeable_p(u32 flag)
225f7627e25SThomas Gleixner {
226f7627e25SThomas Gleixner 	u32 f1, f2;
227f7627e25SThomas Gleixner 
22894f6bac1SKrzysztof Helt 	/*
22994f6bac1SKrzysztof Helt 	 * Cyrix and IDT cpus allow disabling of CPUID
23094f6bac1SKrzysztof Helt 	 * so the code below may return different results
23194f6bac1SKrzysztof Helt 	 * when it is executed before and after enabling
23294f6bac1SKrzysztof Helt 	 * the CPUID. Add "volatile" to not allow gcc to
23394f6bac1SKrzysztof Helt 	 * optimize the subsequent calls to this function.
23494f6bac1SKrzysztof Helt 	 */
23594f6bac1SKrzysztof Helt 	asm volatile ("pushfl		\n\t"
236f7627e25SThomas Gleixner 		      "pushfl		\n\t"
237f7627e25SThomas Gleixner 		      "popl %0		\n\t"
238f7627e25SThomas Gleixner 		      "movl %0, %1	\n\t"
239f7627e25SThomas Gleixner 		      "xorl %2, %0	\n\t"
240f7627e25SThomas Gleixner 		      "pushl %0		\n\t"
241f7627e25SThomas Gleixner 		      "popfl		\n\t"
242f7627e25SThomas Gleixner 		      "pushfl		\n\t"
243f7627e25SThomas Gleixner 		      "popl %0		\n\t"
244f7627e25SThomas Gleixner 		      "popfl		\n\t"
2450f3fa48aSIngo Molnar 
246f7627e25SThomas Gleixner 		      : "=&r" (f1), "=&r" (f2)
247f7627e25SThomas Gleixner 		      : "ir" (flag));
248f7627e25SThomas Gleixner 
249f7627e25SThomas Gleixner 	return ((f1^f2) & flag) != 0;
250f7627e25SThomas Gleixner }
251f7627e25SThomas Gleixner 
252f7627e25SThomas Gleixner /* Probe for the CPUID instruction */
253148f9bb8SPaul Gortmaker int have_cpuid_p(void)
254f7627e25SThomas Gleixner {
255f7627e25SThomas Gleixner 	return flag_is_changeable_p(X86_EFLAGS_ID);
256f7627e25SThomas Gleixner }
257f7627e25SThomas Gleixner 
258148f9bb8SPaul Gortmaker static void squash_the_stupid_serial_number(struct cpuinfo_x86 *c)
2590a488a53SYinghai Lu {
2600a488a53SYinghai Lu 	unsigned long lo, hi;
2610f3fa48aSIngo Molnar 
2620f3fa48aSIngo Molnar 	if (!cpu_has(c, X86_FEATURE_PN) || !disable_x86_serial_nr)
2630f3fa48aSIngo Molnar 		return;
2640f3fa48aSIngo Molnar 
2650f3fa48aSIngo Molnar 	/* Disable processor serial number: */
2660f3fa48aSIngo Molnar 
2670a488a53SYinghai Lu 	rdmsr(MSR_IA32_BBL_CR_CTL, lo, hi);
2680a488a53SYinghai Lu 	lo |= 0x200000;
2690a488a53SYinghai Lu 	wrmsr(MSR_IA32_BBL_CR_CTL, lo, hi);
2700f3fa48aSIngo Molnar 
2711b74dde7SChen Yucong 	pr_notice("CPU serial number disabled.\n");
2720a488a53SYinghai Lu 	clear_cpu_cap(c, X86_FEATURE_PN);
2730a488a53SYinghai Lu 
2740a488a53SYinghai Lu 	/* Disabling the serial number may affect the cpuid level */
2750a488a53SYinghai Lu 	c->cpuid_level = cpuid_eax(0);
2760a488a53SYinghai Lu }
2770a488a53SYinghai Lu 
2780a488a53SYinghai Lu static int __init x86_serial_nr_setup(char *s)
2790a488a53SYinghai Lu {
2800a488a53SYinghai Lu 	disable_x86_serial_nr = 0;
2810a488a53SYinghai Lu 	return 1;
2820a488a53SYinghai Lu }
2830a488a53SYinghai Lu __setup("serialnumber", x86_serial_nr_setup);
284ba51dcedSYinghai Lu #else
285102bbe3aSYinghai Lu static inline int flag_is_changeable_p(u32 flag)
286102bbe3aSYinghai Lu {
287102bbe3aSYinghai Lu 	return 1;
288102bbe3aSYinghai Lu }
289102bbe3aSYinghai Lu static inline void squash_the_stupid_serial_number(struct cpuinfo_x86 *c)
290102bbe3aSYinghai Lu {
291102bbe3aSYinghai Lu }
292ba51dcedSYinghai Lu #endif
2930a488a53SYinghai Lu 
294de5397adSFenghua Yu static __init int setup_disable_smep(char *arg)
295de5397adSFenghua Yu {
296b2cc2a07SH. Peter Anvin 	setup_clear_cpu_cap(X86_FEATURE_SMEP);
2970f6ff2bcSDave Hansen 	/* Check for things that depend on SMEP being enabled: */
2980f6ff2bcSDave Hansen 	check_mpx_erratum(&boot_cpu_data);
299de5397adSFenghua Yu 	return 1;
300de5397adSFenghua Yu }
301de5397adSFenghua Yu __setup("nosmep", setup_disable_smep);
302de5397adSFenghua Yu 
303b2cc2a07SH. Peter Anvin static __always_inline void setup_smep(struct cpuinfo_x86 *c)
304de5397adSFenghua Yu {
305b2cc2a07SH. Peter Anvin 	if (cpu_has(c, X86_FEATURE_SMEP))
306375074ccSAndy Lutomirski 		cr4_set_bits(X86_CR4_SMEP);
307de5397adSFenghua Yu }
308de5397adSFenghua Yu 
30952b6179aSH. Peter Anvin static __init int setup_disable_smap(char *arg)
31052b6179aSH. Peter Anvin {
311b2cc2a07SH. Peter Anvin 	setup_clear_cpu_cap(X86_FEATURE_SMAP);
31252b6179aSH. Peter Anvin 	return 1;
31352b6179aSH. Peter Anvin }
31452b6179aSH. Peter Anvin __setup("nosmap", setup_disable_smap);
31552b6179aSH. Peter Anvin 
316b2cc2a07SH. Peter Anvin static __always_inline void setup_smap(struct cpuinfo_x86 *c)
31752b6179aSH. Peter Anvin {
318581b7f15SAndrew Cooper 	unsigned long eflags = native_save_fl();
319b2cc2a07SH. Peter Anvin 
320b2cc2a07SH. Peter Anvin 	/* This should have been cleared long ago */
321b2cc2a07SH. Peter Anvin 	BUG_ON(eflags & X86_EFLAGS_AC);
322b2cc2a07SH. Peter Anvin 
32303bbd596SH. Peter Anvin 	if (cpu_has(c, X86_FEATURE_SMAP)) {
32403bbd596SH. Peter Anvin #ifdef CONFIG_X86_SMAP
325375074ccSAndy Lutomirski 		cr4_set_bits(X86_CR4_SMAP);
32603bbd596SH. Peter Anvin #else
327375074ccSAndy Lutomirski 		cr4_clear_bits(X86_CR4_SMAP);
32803bbd596SH. Peter Anvin #endif
32903bbd596SH. Peter Anvin 	}
330f7627e25SThomas Gleixner }
331f7627e25SThomas Gleixner 
332f7627e25SThomas Gleixner /*
33306976945SDave Hansen  * Protection Keys are not available in 32-bit mode.
33406976945SDave Hansen  */
33506976945SDave Hansen static bool pku_disabled;
33606976945SDave Hansen 
33706976945SDave Hansen static __always_inline void setup_pku(struct cpuinfo_x86 *c)
33806976945SDave Hansen {
339e8df1a95SDave Hansen 	/* check the boot processor, plus compile options for PKU: */
340e8df1a95SDave Hansen 	if (!cpu_feature_enabled(X86_FEATURE_PKU))
341e8df1a95SDave Hansen 		return;
342e8df1a95SDave Hansen 	/* checks the actual processor's cpuid bits: */
34306976945SDave Hansen 	if (!cpu_has(c, X86_FEATURE_PKU))
34406976945SDave Hansen 		return;
34506976945SDave Hansen 	if (pku_disabled)
34606976945SDave Hansen 		return;
34706976945SDave Hansen 
34806976945SDave Hansen 	cr4_set_bits(X86_CR4_PKE);
34906976945SDave Hansen 	/*
35006976945SDave Hansen 	 * Seting X86_CR4_PKE will cause the X86_FEATURE_OSPKE
35106976945SDave Hansen 	 * cpuid bit to be set.  We need to ensure that we
35206976945SDave Hansen 	 * update that bit in this CPU's "cpu_info".
35306976945SDave Hansen 	 */
35406976945SDave Hansen 	get_cpu_cap(c);
35506976945SDave Hansen }
35606976945SDave Hansen 
35706976945SDave Hansen #ifdef CONFIG_X86_INTEL_MEMORY_PROTECTION_KEYS
35806976945SDave Hansen static __init int setup_disable_pku(char *arg)
35906976945SDave Hansen {
36006976945SDave Hansen 	/*
36106976945SDave Hansen 	 * Do not clear the X86_FEATURE_PKU bit.  All of the
36206976945SDave Hansen 	 * runtime checks are against OSPKE so clearing the
36306976945SDave Hansen 	 * bit does nothing.
36406976945SDave Hansen 	 *
36506976945SDave Hansen 	 * This way, we will see "pku" in cpuinfo, but not
36606976945SDave Hansen 	 * "ospke", which is exactly what we want.  It shows
36706976945SDave Hansen 	 * that the CPU has PKU, but the OS has not enabled it.
36806976945SDave Hansen 	 * This happens to be exactly how a system would look
36906976945SDave Hansen 	 * if we disabled the config option.
37006976945SDave Hansen 	 */
37106976945SDave Hansen 	pr_info("x86: 'nopku' specified, disabling Memory Protection Keys\n");
37206976945SDave Hansen 	pku_disabled = true;
37306976945SDave Hansen 	return 1;
37406976945SDave Hansen }
37506976945SDave Hansen __setup("nopku", setup_disable_pku);
37606976945SDave Hansen #endif /* CONFIG_X86_64 */
37706976945SDave Hansen 
37806976945SDave Hansen /*
379b38b0665SH. Peter Anvin  * Some CPU features depend on higher CPUID levels, which may not always
380b38b0665SH. Peter Anvin  * be available due to CPUID level capping or broken virtualization
381b38b0665SH. Peter Anvin  * software.  Add those features to this table to auto-disable them.
382b38b0665SH. Peter Anvin  */
383b38b0665SH. Peter Anvin struct cpuid_dependent_feature {
384b38b0665SH. Peter Anvin 	u32 feature;
385b38b0665SH. Peter Anvin 	u32 level;
386b38b0665SH. Peter Anvin };
3870f3fa48aSIngo Molnar 
388148f9bb8SPaul Gortmaker static const struct cpuid_dependent_feature
389b38b0665SH. Peter Anvin cpuid_dependent_features[] = {
390b38b0665SH. Peter Anvin 	{ X86_FEATURE_MWAIT,		0x00000005 },
391b38b0665SH. Peter Anvin 	{ X86_FEATURE_DCA,		0x00000009 },
392b38b0665SH. Peter Anvin 	{ X86_FEATURE_XSAVE,		0x0000000d },
393b38b0665SH. Peter Anvin 	{ 0, 0 }
394b38b0665SH. Peter Anvin };
395b38b0665SH. Peter Anvin 
396148f9bb8SPaul Gortmaker static void filter_cpuid_features(struct cpuinfo_x86 *c, bool warn)
397b38b0665SH. Peter Anvin {
398b38b0665SH. Peter Anvin 	const struct cpuid_dependent_feature *df;
3999766cdbcSJaswinder Singh Rajput 
400b38b0665SH. Peter Anvin 	for (df = cpuid_dependent_features; df->feature; df++) {
4010f3fa48aSIngo Molnar 
4020f3fa48aSIngo Molnar 		if (!cpu_has(c, df->feature))
4030f3fa48aSIngo Molnar 			continue;
404b38b0665SH. Peter Anvin 		/*
405b38b0665SH. Peter Anvin 		 * Note: cpuid_level is set to -1 if unavailable, but
406b38b0665SH. Peter Anvin 		 * extended_extended_level is set to 0 if unavailable
407b38b0665SH. Peter Anvin 		 * and the legitimate extended levels are all negative
408b38b0665SH. Peter Anvin 		 * when signed; hence the weird messing around with
409b38b0665SH. Peter Anvin 		 * signs here...
410b38b0665SH. Peter Anvin 		 */
4110f3fa48aSIngo Molnar 		if (!((s32)df->level < 0 ?
412f6db44dfSYinghai Lu 		     (u32)df->level > (u32)c->extended_cpuid_level :
4130f3fa48aSIngo Molnar 		     (s32)df->level > (s32)c->cpuid_level))
4140f3fa48aSIngo Molnar 			continue;
4150f3fa48aSIngo Molnar 
416b38b0665SH. Peter Anvin 		clear_cpu_cap(c, df->feature);
4170f3fa48aSIngo Molnar 		if (!warn)
4180f3fa48aSIngo Molnar 			continue;
4190f3fa48aSIngo Molnar 
4201b74dde7SChen Yucong 		pr_warn("CPU: CPU feature " X86_CAP_FMT " disabled, no CPUID level 0x%x\n",
4219def39beSJosh Triplett 			x86_cap_flag(df->feature), df->level);
422b38b0665SH. Peter Anvin 	}
423b38b0665SH. Peter Anvin }
424b38b0665SH. Peter Anvin 
425b38b0665SH. Peter Anvin /*
426f7627e25SThomas Gleixner  * Naming convention should be: <Name> [(<Codename>)]
427f7627e25SThomas Gleixner  * This table only is used unless init_<vendor>() below doesn't set it;
4280f3fa48aSIngo Molnar  * in particular, if CPUID levels 0x80000002..4 are supported, this
4290f3fa48aSIngo Molnar  * isn't used
430f7627e25SThomas Gleixner  */
431f7627e25SThomas Gleixner 
432f7627e25SThomas Gleixner /* Look up CPU names by table lookup. */
433148f9bb8SPaul Gortmaker static const char *table_lookup_model(struct cpuinfo_x86 *c)
434f7627e25SThomas Gleixner {
43509dc68d9SJan Beulich #ifdef CONFIG_X86_32
43609dc68d9SJan Beulich 	const struct legacy_cpu_model_info *info;
437f7627e25SThomas Gleixner 
438f7627e25SThomas Gleixner 	if (c->x86_model >= 16)
439f7627e25SThomas Gleixner 		return NULL;	/* Range check */
440f7627e25SThomas Gleixner 
441f7627e25SThomas Gleixner 	if (!this_cpu)
442f7627e25SThomas Gleixner 		return NULL;
443f7627e25SThomas Gleixner 
44409dc68d9SJan Beulich 	info = this_cpu->legacy_models;
445f7627e25SThomas Gleixner 
44609dc68d9SJan Beulich 	while (info->family) {
447f7627e25SThomas Gleixner 		if (info->family == c->x86)
448f7627e25SThomas Gleixner 			return info->model_names[c->x86_model];
449f7627e25SThomas Gleixner 		info++;
450f7627e25SThomas Gleixner 	}
45109dc68d9SJan Beulich #endif
452f7627e25SThomas Gleixner 	return NULL;		/* Not found */
453f7627e25SThomas Gleixner }
454f7627e25SThomas Gleixner 
455148f9bb8SPaul Gortmaker __u32 cpu_caps_cleared[NCAPINTS];
456148f9bb8SPaul Gortmaker __u32 cpu_caps_set[NCAPINTS];
457f7627e25SThomas Gleixner 
45811e3a840SJeremy Fitzhardinge void load_percpu_segment(int cpu)
4599d31d35bSYinghai Lu {
460fab334c1SYinghai Lu #ifdef CONFIG_X86_32
4612697fbd5SBrian Gerst 	loadsegment(fs, __KERNEL_PERCPU);
4622697fbd5SBrian Gerst #else
46345e876f7SAndy Lutomirski 	__loadsegment_simple(gs, 0);
4642697fbd5SBrian Gerst 	wrmsrl(MSR_GS_BASE, (unsigned long)per_cpu(irq_stack_union.gs_base, cpu));
465fab334c1SYinghai Lu #endif
46660a5317fSTejun Heo 	load_stack_canary_segment();
4679d31d35bSYinghai Lu }
4689d31d35bSYinghai Lu 
469*ef8813abSAndy Lutomirski /* Setup the fixmap mappings only once per-processor */
470*ef8813abSAndy Lutomirski static inline void setup_cpu_entry_area(int cpu)
47169218e47SThomas Garnier {
472b23adb7dSAndy Lutomirski #ifdef CONFIG_X86_64
473b23adb7dSAndy Lutomirski 	/* On 64-bit systems, we use a read-only fixmap GDT. */
474*ef8813abSAndy Lutomirski 	pgprot_t gdt_prot = PAGE_KERNEL_RO;
475b23adb7dSAndy Lutomirski #else
476b23adb7dSAndy Lutomirski 	/*
477b23adb7dSAndy Lutomirski 	 * On native 32-bit systems, the GDT cannot be read-only because
478b23adb7dSAndy Lutomirski 	 * our double fault handler uses a task gate, and entering through
479b23adb7dSAndy Lutomirski 	 * a task gate needs to change an available TSS to busy.  If the GDT
480b23adb7dSAndy Lutomirski 	 * is read-only, that will triple fault.
481b23adb7dSAndy Lutomirski 	 *
482b23adb7dSAndy Lutomirski 	 * On Xen PV, the GDT must be read-only because the hypervisor requires
483b23adb7dSAndy Lutomirski 	 * it.
484b23adb7dSAndy Lutomirski 	 */
485*ef8813abSAndy Lutomirski 	pgprot_t gdt_prot = boot_cpu_has(X86_FEATURE_XENPV) ?
486b23adb7dSAndy Lutomirski 		PAGE_KERNEL_RO : PAGE_KERNEL;
487b23adb7dSAndy Lutomirski #endif
488b23adb7dSAndy Lutomirski 
489*ef8813abSAndy Lutomirski 	__set_fixmap(get_cpu_entry_area_index(cpu, gdt), get_cpu_gdt_paddr(cpu), gdt_prot);
49069218e47SThomas Garnier }
49169218e47SThomas Garnier 
49245fc8757SThomas Garnier /* Load the original GDT from the per-cpu structure */
49345fc8757SThomas Garnier void load_direct_gdt(int cpu)
49445fc8757SThomas Garnier {
49545fc8757SThomas Garnier 	struct desc_ptr gdt_descr;
49645fc8757SThomas Garnier 
49745fc8757SThomas Garnier 	gdt_descr.address = (long)get_cpu_gdt_rw(cpu);
49845fc8757SThomas Garnier 	gdt_descr.size = GDT_SIZE - 1;
49945fc8757SThomas Garnier 	load_gdt(&gdt_descr);
50045fc8757SThomas Garnier }
50145fc8757SThomas Garnier EXPORT_SYMBOL_GPL(load_direct_gdt);
50245fc8757SThomas Garnier 
50369218e47SThomas Garnier /* Load a fixmap remapping of the per-cpu GDT */
50469218e47SThomas Garnier void load_fixmap_gdt(int cpu)
50569218e47SThomas Garnier {
50669218e47SThomas Garnier 	struct desc_ptr gdt_descr;
50769218e47SThomas Garnier 
50869218e47SThomas Garnier 	gdt_descr.address = (long)get_cpu_gdt_ro(cpu);
50969218e47SThomas Garnier 	gdt_descr.size = GDT_SIZE - 1;
51069218e47SThomas Garnier 	load_gdt(&gdt_descr);
51169218e47SThomas Garnier }
51245fc8757SThomas Garnier EXPORT_SYMBOL_GPL(load_fixmap_gdt);
51369218e47SThomas Garnier 
5140f3fa48aSIngo Molnar /*
5150f3fa48aSIngo Molnar  * Current gdt points %fs at the "master" per-cpu area: after this,
5160f3fa48aSIngo Molnar  * it's on the real one.
5170f3fa48aSIngo Molnar  */
518552be871SBrian Gerst void switch_to_new_gdt(int cpu)
519f7627e25SThomas Gleixner {
52045fc8757SThomas Garnier 	/* Load the original GDT */
52145fc8757SThomas Garnier 	load_direct_gdt(cpu);
522f7627e25SThomas Gleixner 	/* Reload the per-cpu base */
52311e3a840SJeremy Fitzhardinge 	load_percpu_segment(cpu);
524f7627e25SThomas Gleixner }
525f7627e25SThomas Gleixner 
526148f9bb8SPaul Gortmaker static const struct cpu_dev *cpu_devs[X86_VENDOR_NUM] = {};
527f7627e25SThomas Gleixner 
528148f9bb8SPaul Gortmaker static void get_model_name(struct cpuinfo_x86 *c)
529f7627e25SThomas Gleixner {
530f7627e25SThomas Gleixner 	unsigned int *v;
531ee098e1aSBorislav Petkov 	char *p, *q, *s;
532f7627e25SThomas Gleixner 
5333da99c97SYinghai Lu 	if (c->extended_cpuid_level < 0x80000004)
5341b05d60dSYinghai Lu 		return;
535f7627e25SThomas Gleixner 
536f7627e25SThomas Gleixner 	v = (unsigned int *)c->x86_model_id;
537f7627e25SThomas Gleixner 	cpuid(0x80000002, &v[0], &v[1], &v[2], &v[3]);
538f7627e25SThomas Gleixner 	cpuid(0x80000003, &v[4], &v[5], &v[6], &v[7]);
539f7627e25SThomas Gleixner 	cpuid(0x80000004, &v[8], &v[9], &v[10], &v[11]);
540f7627e25SThomas Gleixner 	c->x86_model_id[48] = 0;
541f7627e25SThomas Gleixner 
542ee098e1aSBorislav Petkov 	/* Trim whitespace */
543ee098e1aSBorislav Petkov 	p = q = s = &c->x86_model_id[0];
544ee098e1aSBorislav Petkov 
545ee098e1aSBorislav Petkov 	while (*p == ' ')
546ee098e1aSBorislav Petkov 		p++;
547ee098e1aSBorislav Petkov 
548ee098e1aSBorislav Petkov 	while (*p) {
549ee098e1aSBorislav Petkov 		/* Note the last non-whitespace index */
550ee098e1aSBorislav Petkov 		if (!isspace(*p))
551ee098e1aSBorislav Petkov 			s = q;
552ee098e1aSBorislav Petkov 
553ee098e1aSBorislav Petkov 		*q++ = *p++;
554ee098e1aSBorislav Petkov 	}
555ee098e1aSBorislav Petkov 
556ee098e1aSBorislav Petkov 	*(s + 1) = '\0';
557f7627e25SThomas Gleixner }
558f7627e25SThomas Gleixner 
559148f9bb8SPaul Gortmaker void cpu_detect_cache_sizes(struct cpuinfo_x86 *c)
560f7627e25SThomas Gleixner {
5619d31d35bSYinghai Lu 	unsigned int n, dummy, ebx, ecx, edx, l2size;
562f7627e25SThomas Gleixner 
5633da99c97SYinghai Lu 	n = c->extended_cpuid_level;
564f7627e25SThomas Gleixner 
565f7627e25SThomas Gleixner 	if (n >= 0x80000005) {
5669d31d35bSYinghai Lu 		cpuid(0x80000005, &dummy, &ebx, &ecx, &edx);
567f7627e25SThomas Gleixner 		c->x86_cache_size = (ecx>>24) + (edx>>24);
568140fc727SYinghai Lu #ifdef CONFIG_X86_64
569140fc727SYinghai Lu 		/* On K8 L1 TLB is inclusive, so don't count it */
570140fc727SYinghai Lu 		c->x86_tlbsize = 0;
571140fc727SYinghai Lu #endif
572f7627e25SThomas Gleixner 	}
573f7627e25SThomas Gleixner 
574f7627e25SThomas Gleixner 	if (n < 0x80000006)	/* Some chips just has a large L1. */
575f7627e25SThomas Gleixner 		return;
576f7627e25SThomas Gleixner 
5770a488a53SYinghai Lu 	cpuid(0x80000006, &dummy, &ebx, &ecx, &edx);
578f7627e25SThomas Gleixner 	l2size = ecx >> 16;
579f7627e25SThomas Gleixner 
580140fc727SYinghai Lu #ifdef CONFIG_X86_64
581140fc727SYinghai Lu 	c->x86_tlbsize += ((ebx >> 16) & 0xfff) + (ebx & 0xfff);
582140fc727SYinghai Lu #else
583f7627e25SThomas Gleixner 	/* do processor-specific cache resizing */
58409dc68d9SJan Beulich 	if (this_cpu->legacy_cache_size)
58509dc68d9SJan Beulich 		l2size = this_cpu->legacy_cache_size(c, l2size);
586f7627e25SThomas Gleixner 
587f7627e25SThomas Gleixner 	/* Allow user to override all this if necessary. */
588f7627e25SThomas Gleixner 	if (cachesize_override != -1)
589f7627e25SThomas Gleixner 		l2size = cachesize_override;
590f7627e25SThomas Gleixner 
591f7627e25SThomas Gleixner 	if (l2size == 0)
592f7627e25SThomas Gleixner 		return;		/* Again, no L2 cache is possible */
593140fc727SYinghai Lu #endif
594f7627e25SThomas Gleixner 
595f7627e25SThomas Gleixner 	c->x86_cache_size = l2size;
596f7627e25SThomas Gleixner }
597f7627e25SThomas Gleixner 
598e0ba94f1SAlex Shi u16 __read_mostly tlb_lli_4k[NR_INFO];
599e0ba94f1SAlex Shi u16 __read_mostly tlb_lli_2m[NR_INFO];
600e0ba94f1SAlex Shi u16 __read_mostly tlb_lli_4m[NR_INFO];
601e0ba94f1SAlex Shi u16 __read_mostly tlb_lld_4k[NR_INFO];
602e0ba94f1SAlex Shi u16 __read_mostly tlb_lld_2m[NR_INFO];
603e0ba94f1SAlex Shi u16 __read_mostly tlb_lld_4m[NR_INFO];
604dd360393SKirill A. Shutemov u16 __read_mostly tlb_lld_1g[NR_INFO];
605e0ba94f1SAlex Shi 
606f94fe119SSteven Honeyman static void cpu_detect_tlb(struct cpuinfo_x86 *c)
607e0ba94f1SAlex Shi {
608e0ba94f1SAlex Shi 	if (this_cpu->c_detect_tlb)
609e0ba94f1SAlex Shi 		this_cpu->c_detect_tlb(c);
610e0ba94f1SAlex Shi 
611f94fe119SSteven Honeyman 	pr_info("Last level iTLB entries: 4KB %d, 2MB %d, 4MB %d\n",
612e0ba94f1SAlex Shi 		tlb_lli_4k[ENTRIES], tlb_lli_2m[ENTRIES],
613f94fe119SSteven Honeyman 		tlb_lli_4m[ENTRIES]);
614f94fe119SSteven Honeyman 
615f94fe119SSteven Honeyman 	pr_info("Last level dTLB entries: 4KB %d, 2MB %d, 4MB %d, 1GB %d\n",
616f94fe119SSteven Honeyman 		tlb_lld_4k[ENTRIES], tlb_lld_2m[ENTRIES],
617f94fe119SSteven Honeyman 		tlb_lld_4m[ENTRIES], tlb_lld_1g[ENTRIES]);
618e0ba94f1SAlex Shi }
619e0ba94f1SAlex Shi 
620148f9bb8SPaul Gortmaker void detect_ht(struct cpuinfo_x86 *c)
6219d31d35bSYinghai Lu {
622c8e56d20SBorislav Petkov #ifdef CONFIG_SMP
6239d31d35bSYinghai Lu 	u32 eax, ebx, ecx, edx;
6249d31d35bSYinghai Lu 	int index_msb, core_bits;
6252eaad1fdSMike Travis 	static bool printed;
6269d31d35bSYinghai Lu 
6270a488a53SYinghai Lu 	if (!cpu_has(c, X86_FEATURE_HT))
6289d31d35bSYinghai Lu 		return;
6299d31d35bSYinghai Lu 
6300a488a53SYinghai Lu 	if (cpu_has(c, X86_FEATURE_CMP_LEGACY))
6310a488a53SYinghai Lu 		goto out;
6320a488a53SYinghai Lu 
6331cd78776SYinghai Lu 	if (cpu_has(c, X86_FEATURE_XTOPOLOGY))
6341cd78776SYinghai Lu 		return;
6351cd78776SYinghai Lu 
6360a488a53SYinghai Lu 	cpuid(1, &eax, &ebx, &ecx, &edx);
6370a488a53SYinghai Lu 
6389d31d35bSYinghai Lu 	smp_num_siblings = (ebx & 0xff0000) >> 16;
6399d31d35bSYinghai Lu 
6409d31d35bSYinghai Lu 	if (smp_num_siblings == 1) {
6411b74dde7SChen Yucong 		pr_info_once("CPU0: Hyper-Threading is disabled\n");
6420f3fa48aSIngo Molnar 		goto out;
6430f3fa48aSIngo Molnar 	}
6440f3fa48aSIngo Molnar 
6450f3fa48aSIngo Molnar 	if (smp_num_siblings <= 1)
6460f3fa48aSIngo Molnar 		goto out;
6479d31d35bSYinghai Lu 
6489d31d35bSYinghai Lu 	index_msb = get_count_order(smp_num_siblings);
649cb8cc442SIngo Molnar 	c->phys_proc_id = apic->phys_pkg_id(c->initial_apicid, index_msb);
6509d31d35bSYinghai Lu 
6519d31d35bSYinghai Lu 	smp_num_siblings = smp_num_siblings / c->x86_max_cores;
6529d31d35bSYinghai Lu 
6539d31d35bSYinghai Lu 	index_msb = get_count_order(smp_num_siblings);
6549d31d35bSYinghai Lu 
6559d31d35bSYinghai Lu 	core_bits = get_count_order(c->x86_max_cores);
6569d31d35bSYinghai Lu 
657cb8cc442SIngo Molnar 	c->cpu_core_id = apic->phys_pkg_id(c->initial_apicid, index_msb) &
6581cd78776SYinghai Lu 				       ((1 << core_bits) - 1);
6599d31d35bSYinghai Lu 
6600a488a53SYinghai Lu out:
6612eaad1fdSMike Travis 	if (!printed && (c->x86_max_cores * smp_num_siblings) > 1) {
6621b74dde7SChen Yucong 		pr_info("CPU: Physical Processor ID: %d\n",
6630a488a53SYinghai Lu 			c->phys_proc_id);
6641b74dde7SChen Yucong 		pr_info("CPU: Processor Core ID: %d\n",
6659d31d35bSYinghai Lu 			c->cpu_core_id);
6662eaad1fdSMike Travis 		printed = 1;
6679d31d35bSYinghai Lu 	}
6689d31d35bSYinghai Lu #endif
66997e4db7cSYinghai Lu }
670f7627e25SThomas Gleixner 
671148f9bb8SPaul Gortmaker static void get_cpu_vendor(struct cpuinfo_x86 *c)
672f7627e25SThomas Gleixner {
673f7627e25SThomas Gleixner 	char *v = c->x86_vendor_id;
6740f3fa48aSIngo Molnar 	int i;
675f7627e25SThomas Gleixner 
676f7627e25SThomas Gleixner 	for (i = 0; i < X86_VENDOR_NUM; i++) {
67710a434fcSYinghai Lu 		if (!cpu_devs[i])
67810a434fcSYinghai Lu 			break;
67910a434fcSYinghai Lu 
680f7627e25SThomas Gleixner 		if (!strcmp(v, cpu_devs[i]->c_ident[0]) ||
681f7627e25SThomas Gleixner 		    (cpu_devs[i]->c_ident[1] &&
682f7627e25SThomas Gleixner 		     !strcmp(v, cpu_devs[i]->c_ident[1]))) {
6830f3fa48aSIngo Molnar 
684f7627e25SThomas Gleixner 			this_cpu = cpu_devs[i];
68510a434fcSYinghai Lu 			c->x86_vendor = this_cpu->c_x86_vendor;
686f7627e25SThomas Gleixner 			return;
687f7627e25SThomas Gleixner 		}
688f7627e25SThomas Gleixner 	}
68910a434fcSYinghai Lu 
6901b74dde7SChen Yucong 	pr_err_once("CPU: vendor_id '%s' unknown, using generic init.\n" \
691a9c56953SMinchan Kim 		    "CPU: Your system may be unstable.\n", v);
69210a434fcSYinghai Lu 
693f7627e25SThomas Gleixner 	c->x86_vendor = X86_VENDOR_UNKNOWN;
694f7627e25SThomas Gleixner 	this_cpu = &default_cpu;
695f7627e25SThomas Gleixner }
696f7627e25SThomas Gleixner 
697148f9bb8SPaul Gortmaker void cpu_detect(struct cpuinfo_x86 *c)
698f7627e25SThomas Gleixner {
699f7627e25SThomas Gleixner 	/* Get vendor name */
7004a148513SHarvey Harrison 	cpuid(0x00000000, (unsigned int *)&c->cpuid_level,
7014a148513SHarvey Harrison 	      (unsigned int *)&c->x86_vendor_id[0],
7024a148513SHarvey Harrison 	      (unsigned int *)&c->x86_vendor_id[8],
7034a148513SHarvey Harrison 	      (unsigned int *)&c->x86_vendor_id[4]);
704f7627e25SThomas Gleixner 
705f7627e25SThomas Gleixner 	c->x86 = 4;
7069d31d35bSYinghai Lu 	/* Intel-defined flags: level 0x00000001 */
707f7627e25SThomas Gleixner 	if (c->cpuid_level >= 0x00000001) {
708f7627e25SThomas Gleixner 		u32 junk, tfms, cap0, misc;
7090f3fa48aSIngo Molnar 
710f7627e25SThomas Gleixner 		cpuid(0x00000001, &tfms, &misc, &junk, &cap0);
71199f925ceSBorislav Petkov 		c->x86		= x86_family(tfms);
71299f925ceSBorislav Petkov 		c->x86_model	= x86_model(tfms);
71399f925ceSBorislav Petkov 		c->x86_mask	= x86_stepping(tfms);
7140f3fa48aSIngo Molnar 
715d4387bd3SHuang, Ying 		if (cap0 & (1<<19)) {
716d4387bd3SHuang, Ying 			c->x86_clflush_size = ((misc >> 8) & 0xff) * 8;
7179d31d35bSYinghai Lu 			c->x86_cache_alignment = c->x86_clflush_size;
718d4387bd3SHuang, Ying 		}
719f7627e25SThomas Gleixner 	}
720f7627e25SThomas Gleixner }
7213da99c97SYinghai Lu 
7228bf1ebcaSAndy Lutomirski static void apply_forced_caps(struct cpuinfo_x86 *c)
7238bf1ebcaSAndy Lutomirski {
7248bf1ebcaSAndy Lutomirski 	int i;
7258bf1ebcaSAndy Lutomirski 
7268bf1ebcaSAndy Lutomirski 	for (i = 0; i < NCAPINTS; i++) {
7278bf1ebcaSAndy Lutomirski 		c->x86_capability[i] &= ~cpu_caps_cleared[i];
7288bf1ebcaSAndy Lutomirski 		c->x86_capability[i] |= cpu_caps_set[i];
7298bf1ebcaSAndy Lutomirski 	}
7308bf1ebcaSAndy Lutomirski }
7318bf1ebcaSAndy Lutomirski 
732148f9bb8SPaul Gortmaker void get_cpu_cap(struct cpuinfo_x86 *c)
733093af8d7SYinghai Lu {
73439c06df4SBorislav Petkov 	u32 eax, ebx, ecx, edx;
735093af8d7SYinghai Lu 
736093af8d7SYinghai Lu 	/* Intel-defined flags: level 0x00000001 */
737093af8d7SYinghai Lu 	if (c->cpuid_level >= 0x00000001) {
73839c06df4SBorislav Petkov 		cpuid(0x00000001, &eax, &ebx, &ecx, &edx);
7390f3fa48aSIngo Molnar 
74039c06df4SBorislav Petkov 		c->x86_capability[CPUID_1_ECX] = ecx;
74139c06df4SBorislav Petkov 		c->x86_capability[CPUID_1_EDX] = edx;
742093af8d7SYinghai Lu 	}
743093af8d7SYinghai Lu 
7443df8d920SAndy Lutomirski 	/* Thermal and Power Management Leaf: level 0x00000006 (eax) */
7453df8d920SAndy Lutomirski 	if (c->cpuid_level >= 0x00000006)
7463df8d920SAndy Lutomirski 		c->x86_capability[CPUID_6_EAX] = cpuid_eax(0x00000006);
7473df8d920SAndy Lutomirski 
748bdc802dcSH. Peter Anvin 	/* Additional Intel-defined flags: level 0x00000007 */
749bdc802dcSH. Peter Anvin 	if (c->cpuid_level >= 0x00000007) {
750bdc802dcSH. Peter Anvin 		cpuid_count(0x00000007, 0, &eax, &ebx, &ecx, &edx);
75139c06df4SBorislav Petkov 		c->x86_capability[CPUID_7_0_EBX] = ebx;
752dfb4a70fSDave Hansen 		c->x86_capability[CPUID_7_ECX] = ecx;
753bdc802dcSH. Peter Anvin 	}
754bdc802dcSH. Peter Anvin 
7556229ad27SFenghua Yu 	/* Extended state features: level 0x0000000d */
7566229ad27SFenghua Yu 	if (c->cpuid_level >= 0x0000000d) {
7576229ad27SFenghua Yu 		cpuid_count(0x0000000d, 1, &eax, &ebx, &ecx, &edx);
7586229ad27SFenghua Yu 
75939c06df4SBorislav Petkov 		c->x86_capability[CPUID_D_1_EAX] = eax;
7606229ad27SFenghua Yu 	}
7616229ad27SFenghua Yu 
762cbc82b17SPeter P Waskiewicz Jr 	/* Additional Intel-defined flags: level 0x0000000F */
763cbc82b17SPeter P Waskiewicz Jr 	if (c->cpuid_level >= 0x0000000F) {
764cbc82b17SPeter P Waskiewicz Jr 
765cbc82b17SPeter P Waskiewicz Jr 		/* QoS sub-leaf, EAX=0Fh, ECX=0 */
766cbc82b17SPeter P Waskiewicz Jr 		cpuid_count(0x0000000F, 0, &eax, &ebx, &ecx, &edx);
76739c06df4SBorislav Petkov 		c->x86_capability[CPUID_F_0_EDX] = edx;
76839c06df4SBorislav Petkov 
769cbc82b17SPeter P Waskiewicz Jr 		if (cpu_has(c, X86_FEATURE_CQM_LLC)) {
770cbc82b17SPeter P Waskiewicz Jr 			/* will be overridden if occupancy monitoring exists */
771cbc82b17SPeter P Waskiewicz Jr 			c->x86_cache_max_rmid = ebx;
772cbc82b17SPeter P Waskiewicz Jr 
773cbc82b17SPeter P Waskiewicz Jr 			/* QoS sub-leaf, EAX=0Fh, ECX=1 */
774cbc82b17SPeter P Waskiewicz Jr 			cpuid_count(0x0000000F, 1, &eax, &ebx, &ecx, &edx);
77539c06df4SBorislav Petkov 			c->x86_capability[CPUID_F_1_EDX] = edx;
77639c06df4SBorislav Petkov 
77733c3cc7aSVikas Shivappa 			if ((cpu_has(c, X86_FEATURE_CQM_OCCUP_LLC)) ||
77833c3cc7aSVikas Shivappa 			      ((cpu_has(c, X86_FEATURE_CQM_MBM_TOTAL)) ||
77933c3cc7aSVikas Shivappa 			       (cpu_has(c, X86_FEATURE_CQM_MBM_LOCAL)))) {
780cbc82b17SPeter P Waskiewicz Jr 				c->x86_cache_max_rmid = ecx;
781cbc82b17SPeter P Waskiewicz Jr 				c->x86_cache_occ_scale = ebx;
782cbc82b17SPeter P Waskiewicz Jr 			}
783cbc82b17SPeter P Waskiewicz Jr 		} else {
784cbc82b17SPeter P Waskiewicz Jr 			c->x86_cache_max_rmid = -1;
785cbc82b17SPeter P Waskiewicz Jr 			c->x86_cache_occ_scale = -1;
786cbc82b17SPeter P Waskiewicz Jr 		}
787cbc82b17SPeter P Waskiewicz Jr 	}
788cbc82b17SPeter P Waskiewicz Jr 
789093af8d7SYinghai Lu 	/* AMD-defined flags: level 0x80000001 */
79039c06df4SBorislav Petkov 	eax = cpuid_eax(0x80000000);
79139c06df4SBorislav Petkov 	c->extended_cpuid_level = eax;
7920f3fa48aSIngo Molnar 
79339c06df4SBorislav Petkov 	if ((eax & 0xffff0000) == 0x80000000) {
79439c06df4SBorislav Petkov 		if (eax >= 0x80000001) {
79539c06df4SBorislav Petkov 			cpuid(0x80000001, &eax, &ebx, &ecx, &edx);
79639c06df4SBorislav Petkov 
79739c06df4SBorislav Petkov 			c->x86_capability[CPUID_8000_0001_ECX] = ecx;
79839c06df4SBorislav Petkov 			c->x86_capability[CPUID_8000_0001_EDX] = edx;
799093af8d7SYinghai Lu 		}
800093af8d7SYinghai Lu 	}
801093af8d7SYinghai Lu 
80271faad43SYazen Ghannam 	if (c->extended_cpuid_level >= 0x80000007) {
80371faad43SYazen Ghannam 		cpuid(0x80000007, &eax, &ebx, &ecx, &edx);
80471faad43SYazen Ghannam 
80571faad43SYazen Ghannam 		c->x86_capability[CPUID_8000_0007_EBX] = ebx;
80671faad43SYazen Ghannam 		c->x86_power = edx;
80771faad43SYazen Ghannam 	}
80871faad43SYazen Ghannam 
8095122c890SYinghai Lu 	if (c->extended_cpuid_level >= 0x80000008) {
81039c06df4SBorislav Petkov 		cpuid(0x80000008, &eax, &ebx, &ecx, &edx);
8115122c890SYinghai Lu 
8125122c890SYinghai Lu 		c->x86_virt_bits = (eax >> 8) & 0xff;
8135122c890SYinghai Lu 		c->x86_phys_bits = eax & 0xff;
81439c06df4SBorislav Petkov 		c->x86_capability[CPUID_8000_0008_EBX] = ebx;
8155122c890SYinghai Lu 	}
81613c6c532SJan Beulich #ifdef CONFIG_X86_32
81713c6c532SJan Beulich 	else if (cpu_has(c, X86_FEATURE_PAE) || cpu_has(c, X86_FEATURE_PSE36))
81813c6c532SJan Beulich 		c->x86_phys_bits = 36;
8195122c890SYinghai Lu #endif
820e3224234SYinghai Lu 
8212ccd71f1SBorislav Petkov 	if (c->extended_cpuid_level >= 0x8000000a)
82239c06df4SBorislav Petkov 		c->x86_capability[CPUID_8000_000A_EDX] = cpuid_edx(0x8000000a);
8232ccd71f1SBorislav Petkov 
8241dedefd1SJacob Pan 	init_scattered_cpuid_features(c);
82560d34501SAndy Lutomirski 
82660d34501SAndy Lutomirski 	/*
82760d34501SAndy Lutomirski 	 * Clear/Set all flags overridden by options, after probe.
82860d34501SAndy Lutomirski 	 * This needs to happen each time we re-probe, which may happen
82960d34501SAndy Lutomirski 	 * several times during CPU initialization.
83060d34501SAndy Lutomirski 	 */
83160d34501SAndy Lutomirski 	apply_forced_caps(c);
832093af8d7SYinghai Lu }
833093af8d7SYinghai Lu 
834148f9bb8SPaul Gortmaker static void identify_cpu_without_cpuid(struct cpuinfo_x86 *c)
835aef93c8bSYinghai Lu {
836aef93c8bSYinghai Lu #ifdef CONFIG_X86_32
837aef93c8bSYinghai Lu 	int i;
838aef93c8bSYinghai Lu 
839aef93c8bSYinghai Lu 	/*
840aef93c8bSYinghai Lu 	 * First of all, decide if this is a 486 or higher
841aef93c8bSYinghai Lu 	 * It's a 486 if we can modify the AC flag
842aef93c8bSYinghai Lu 	 */
843aef93c8bSYinghai Lu 	if (flag_is_changeable_p(X86_EFLAGS_AC))
844aef93c8bSYinghai Lu 		c->x86 = 4;
845aef93c8bSYinghai Lu 	else
846aef93c8bSYinghai Lu 		c->x86 = 3;
847aef93c8bSYinghai Lu 
848aef93c8bSYinghai Lu 	for (i = 0; i < X86_VENDOR_NUM; i++)
849aef93c8bSYinghai Lu 		if (cpu_devs[i] && cpu_devs[i]->c_identify) {
850aef93c8bSYinghai Lu 			c->x86_vendor_id[0] = 0;
851aef93c8bSYinghai Lu 			cpu_devs[i]->c_identify(c);
852aef93c8bSYinghai Lu 			if (c->x86_vendor_id[0]) {
853aef93c8bSYinghai Lu 				get_cpu_vendor(c);
854aef93c8bSYinghai Lu 				break;
855aef93c8bSYinghai Lu 			}
856aef93c8bSYinghai Lu 		}
857aef93c8bSYinghai Lu #endif
858093af8d7SYinghai Lu }
859f7627e25SThomas Gleixner 
86034048c9eSPaolo Ciarrocchi /*
86134048c9eSPaolo Ciarrocchi  * Do minimum CPU detection early.
86234048c9eSPaolo Ciarrocchi  * Fields really needed: vendor, cpuid_level, family, model, mask,
86334048c9eSPaolo Ciarrocchi  * cache alignment.
86434048c9eSPaolo Ciarrocchi  * The others are not touched to avoid unwanted side effects.
86534048c9eSPaolo Ciarrocchi  *
86634048c9eSPaolo Ciarrocchi  * WARNING: this function is only called on the BP.  Don't add code here
86734048c9eSPaolo Ciarrocchi  * that is supposed to run on all CPUs.
86834048c9eSPaolo Ciarrocchi  */
8693da99c97SYinghai Lu static void __init early_identify_cpu(struct cpuinfo_x86 *c)
870f7627e25SThomas Gleixner {
8716627d242SYinghai Lu #ifdef CONFIG_X86_64
8726627d242SYinghai Lu 	c->x86_clflush_size = 64;
87313c6c532SJan Beulich 	c->x86_phys_bits = 36;
87413c6c532SJan Beulich 	c->x86_virt_bits = 48;
8756627d242SYinghai Lu #else
876d4387bd3SHuang, Ying 	c->x86_clflush_size = 32;
87713c6c532SJan Beulich 	c->x86_phys_bits = 32;
87813c6c532SJan Beulich 	c->x86_virt_bits = 32;
8796627d242SYinghai Lu #endif
8800a488a53SYinghai Lu 	c->x86_cache_alignment = c->x86_clflush_size;
881f7627e25SThomas Gleixner 
8823da99c97SYinghai Lu 	memset(&c->x86_capability, 0, sizeof c->x86_capability);
8830a488a53SYinghai Lu 	c->extended_cpuid_level = 0;
8840a488a53SYinghai Lu 
885aef93c8bSYinghai Lu 	/* cyrix could have cpuid enabled via c_identify()*/
88605fb3c19SAndy Lutomirski 	if (have_cpuid_p()) {
887f7627e25SThomas Gleixner 		cpu_detect(c);
8883da99c97SYinghai Lu 		get_cpu_vendor(c);
8893da99c97SYinghai Lu 		get_cpu_cap(c);
89078d1b296SBorislav Petkov 		setup_force_cpu_cap(X86_FEATURE_CPUID);
89112cf105cSKrzysztof Helt 
89210a434fcSYinghai Lu 		if (this_cpu->c_early_init)
89310a434fcSYinghai Lu 			this_cpu->c_early_init(c);
8943da99c97SYinghai Lu 
895f6e9456cSRobert Richter 		c->cpu_index = 0;
896b38b0665SH. Peter Anvin 		filter_cpuid_features(c, false);
897de5397adSFenghua Yu 
898a110b5ecSBorislav Petkov 		if (this_cpu->c_bsp_init)
899a110b5ecSBorislav Petkov 			this_cpu->c_bsp_init(c);
90078d1b296SBorislav Petkov 	} else {
90178d1b296SBorislav Petkov 		identify_cpu_without_cpuid(c);
90278d1b296SBorislav Petkov 		setup_clear_cpu_cap(X86_FEATURE_CPUID);
90305fb3c19SAndy Lutomirski 	}
904c3b83598SBorislav Petkov 
905c3b83598SBorislav Petkov 	setup_force_cpu_cap(X86_FEATURE_ALWAYS);
906db52ef74SIngo Molnar 	fpu__init_system(c);
907b8b7abaeSAndy Lutomirski 
908b8b7abaeSAndy Lutomirski #ifdef CONFIG_X86_32
909b8b7abaeSAndy Lutomirski 	/*
910b8b7abaeSAndy Lutomirski 	 * Regardless of whether PCID is enumerated, the SDM says
911b8b7abaeSAndy Lutomirski 	 * that it can't be enabled in 32-bit mode.
912b8b7abaeSAndy Lutomirski 	 */
913b8b7abaeSAndy Lutomirski 	setup_clear_cpu_cap(X86_FEATURE_PCID);
914b8b7abaeSAndy Lutomirski #endif
915f7627e25SThomas Gleixner }
916f7627e25SThomas Gleixner 
9179d31d35bSYinghai Lu void __init early_cpu_init(void)
9189d31d35bSYinghai Lu {
91902dde8b4SJan Beulich 	const struct cpu_dev *const *cdev;
92010a434fcSYinghai Lu 	int count = 0;
9219d31d35bSYinghai Lu 
922ac23f253SJan Beulich #ifdef CONFIG_PROCESSOR_SELECT
9231b74dde7SChen Yucong 	pr_info("KERNEL supported cpus:\n");
92431c997caSIngo Molnar #endif
92531c997caSIngo Molnar 
92610a434fcSYinghai Lu 	for (cdev = __x86_cpu_dev_start; cdev < __x86_cpu_dev_end; cdev++) {
92702dde8b4SJan Beulich 		const struct cpu_dev *cpudev = *cdev;
9289d31d35bSYinghai Lu 
92910a434fcSYinghai Lu 		if (count >= X86_VENDOR_NUM)
93010a434fcSYinghai Lu 			break;
93110a434fcSYinghai Lu 		cpu_devs[count] = cpudev;
93210a434fcSYinghai Lu 		count++;
93310a434fcSYinghai Lu 
934ac23f253SJan Beulich #ifdef CONFIG_PROCESSOR_SELECT
93531c997caSIngo Molnar 		{
93631c997caSIngo Molnar 			unsigned int j;
93731c997caSIngo Molnar 
93810a434fcSYinghai Lu 			for (j = 0; j < 2; j++) {
93910a434fcSYinghai Lu 				if (!cpudev->c_ident[j])
94010a434fcSYinghai Lu 					continue;
9411b74dde7SChen Yucong 				pr_info("  %s %s\n", cpudev->c_vendor,
94210a434fcSYinghai Lu 					cpudev->c_ident[j]);
94310a434fcSYinghai Lu 			}
94410a434fcSYinghai Lu 		}
9450388423dSDave Jones #endif
94631c997caSIngo Molnar 	}
9479d31d35bSYinghai Lu 	early_identify_cpu(&boot_cpu_data);
948f7627e25SThomas Gleixner }
949f7627e25SThomas Gleixner 
950b6734c35SH. Peter Anvin /*
951366d4a43SBorislav Petkov  * The NOPL instruction is supposed to exist on all CPUs of family >= 6;
952366d4a43SBorislav Petkov  * unfortunately, that's not true in practice because of early VIA
953366d4a43SBorislav Petkov  * chips and (more importantly) broken virtualizers that are not easy
954366d4a43SBorislav Petkov  * to detect. In the latter case it doesn't even *fail* reliably, so
955366d4a43SBorislav Petkov  * probing for it doesn't even work. Disable it completely on 32-bit
956ba0593bfSH. Peter Anvin  * unless we can find a reliable way to detect all the broken cases.
957366d4a43SBorislav Petkov  * Enable it explicitly on 64-bit for non-constant inputs of cpu_has().
958b6734c35SH. Peter Anvin  */
959148f9bb8SPaul Gortmaker static void detect_nopl(struct cpuinfo_x86 *c)
960b6734c35SH. Peter Anvin {
961366d4a43SBorislav Petkov #ifdef CONFIG_X86_32
962b6734c35SH. Peter Anvin 	clear_cpu_cap(c, X86_FEATURE_NOPL);
963366d4a43SBorislav Petkov #else
964366d4a43SBorislav Petkov 	set_cpu_cap(c, X86_FEATURE_NOPL);
965366d4a43SBorislav Petkov #endif
966f7627e25SThomas Gleixner }
967f7627e25SThomas Gleixner 
9687a5d6704SAndy Lutomirski static void detect_null_seg_behavior(struct cpuinfo_x86 *c)
9697a5d6704SAndy Lutomirski {
9707a5d6704SAndy Lutomirski #ifdef CONFIG_X86_64
971f7627e25SThomas Gleixner 	/*
9727a5d6704SAndy Lutomirski 	 * Empirically, writing zero to a segment selector on AMD does
9737a5d6704SAndy Lutomirski 	 * not clear the base, whereas writing zero to a segment
9747a5d6704SAndy Lutomirski 	 * selector on Intel does clear the base.  Intel's behavior
9757a5d6704SAndy Lutomirski 	 * allows slightly faster context switches in the common case
9767a5d6704SAndy Lutomirski 	 * where GS is unused by the prev and next threads.
977f7627e25SThomas Gleixner 	 *
9787a5d6704SAndy Lutomirski 	 * Since neither vendor documents this anywhere that I can see,
9797a5d6704SAndy Lutomirski 	 * detect it directly instead of hardcoding the choice by
9807a5d6704SAndy Lutomirski 	 * vendor.
9817a5d6704SAndy Lutomirski 	 *
9827a5d6704SAndy Lutomirski 	 * I've designated AMD's behavior as the "bug" because it's
9837a5d6704SAndy Lutomirski 	 * counterintuitive and less friendly.
984f7627e25SThomas Gleixner 	 */
9857a5d6704SAndy Lutomirski 
9867a5d6704SAndy Lutomirski 	unsigned long old_base, tmp;
9877a5d6704SAndy Lutomirski 	rdmsrl(MSR_FS_BASE, old_base);
9887a5d6704SAndy Lutomirski 	wrmsrl(MSR_FS_BASE, 1);
9897a5d6704SAndy Lutomirski 	loadsegment(fs, 0);
9907a5d6704SAndy Lutomirski 	rdmsrl(MSR_FS_BASE, tmp);
9917a5d6704SAndy Lutomirski 	if (tmp != 0)
9927a5d6704SAndy Lutomirski 		set_cpu_bug(c, X86_BUG_NULL_SEG);
9937a5d6704SAndy Lutomirski 	wrmsrl(MSR_FS_BASE, old_base);
9943da99c97SYinghai Lu #endif
995f7627e25SThomas Gleixner }
996aef93c8bSYinghai Lu 
997148f9bb8SPaul Gortmaker static void generic_identify(struct cpuinfo_x86 *c)
998f7627e25SThomas Gleixner {
999f7627e25SThomas Gleixner 	c->extended_cpuid_level = 0;
1000f7627e25SThomas Gleixner 
1001aef93c8bSYinghai Lu 	if (!have_cpuid_p())
1002aef93c8bSYinghai Lu 		identify_cpu_without_cpuid(c);
1003f7627e25SThomas Gleixner 
1004aef93c8bSYinghai Lu 	/* cyrix could have cpuid enabled via c_identify()*/
1005a9853dd6SIngo Molnar 	if (!have_cpuid_p())
1006aef93c8bSYinghai Lu 		return;
1007aef93c8bSYinghai Lu 
10083da99c97SYinghai Lu 	cpu_detect(c);
10093da99c97SYinghai Lu 
10103da99c97SYinghai Lu 	get_cpu_vendor(c);
10113da99c97SYinghai Lu 
10123da99c97SYinghai Lu 	get_cpu_cap(c);
10133da99c97SYinghai Lu 
1014f7627e25SThomas Gleixner 	if (c->cpuid_level >= 0x00000001) {
10153da99c97SYinghai Lu 		c->initial_apicid = (cpuid_ebx(1) >> 24) & 0xFF;
1016b89d3b3eSYinghai Lu #ifdef CONFIG_X86_32
1017c8e56d20SBorislav Petkov # ifdef CONFIG_SMP
1018cb8cc442SIngo Molnar 		c->apicid = apic->phys_pkg_id(c->initial_apicid, 0);
1019f7627e25SThomas Gleixner # else
102001aaea1aSYinghai Lu 		c->apicid = c->initial_apicid;
1021f7627e25SThomas Gleixner # endif
1022b89d3b3eSYinghai Lu #endif
1023b89d3b3eSYinghai Lu 		c->phys_proc_id = c->initial_apicid;
1024f7627e25SThomas Gleixner 	}
1025f7627e25SThomas Gleixner 
1026f7627e25SThomas Gleixner 	get_model_name(c); /* Default name */
1027f7627e25SThomas Gleixner 
1028b6734c35SH. Peter Anvin 	detect_nopl(c);
10297a5d6704SAndy Lutomirski 
10307a5d6704SAndy Lutomirski 	detect_null_seg_behavior(c);
10310230bb03SAndy Lutomirski 
10320230bb03SAndy Lutomirski 	/*
10330230bb03SAndy Lutomirski 	 * ESPFIX is a strange bug.  All real CPUs have it.  Paravirt
10340230bb03SAndy Lutomirski 	 * systems that run Linux at CPL > 0 may or may not have the
10350230bb03SAndy Lutomirski 	 * issue, but, even if they have the issue, there's absolutely
10360230bb03SAndy Lutomirski 	 * nothing we can do about it because we can't use the real IRET
10370230bb03SAndy Lutomirski 	 * instruction.
10380230bb03SAndy Lutomirski 	 *
10390230bb03SAndy Lutomirski 	 * NB: For the time being, only 32-bit kernels support
10400230bb03SAndy Lutomirski 	 * X86_BUG_ESPFIX as such.  64-bit kernels directly choose
10410230bb03SAndy Lutomirski 	 * whether to apply espfix using paravirt hooks.  If any
10420230bb03SAndy Lutomirski 	 * non-paravirt system ever shows up that does *not* have the
10430230bb03SAndy Lutomirski 	 * ESPFIX issue, we can change this.
10440230bb03SAndy Lutomirski 	 */
10450230bb03SAndy Lutomirski #ifdef CONFIG_X86_32
10460230bb03SAndy Lutomirski # ifdef CONFIG_PARAVIRT
10470230bb03SAndy Lutomirski 	do {
10480230bb03SAndy Lutomirski 		extern void native_iret(void);
10490230bb03SAndy Lutomirski 		if (pv_cpu_ops.iret == native_iret)
10500230bb03SAndy Lutomirski 			set_cpu_bug(c, X86_BUG_ESPFIX);
10510230bb03SAndy Lutomirski 	} while (0);
10520230bb03SAndy Lutomirski # else
10530230bb03SAndy Lutomirski 	set_cpu_bug(c, X86_BUG_ESPFIX);
10540230bb03SAndy Lutomirski # endif
10550230bb03SAndy Lutomirski #endif
1056f7627e25SThomas Gleixner }
1057f7627e25SThomas Gleixner 
1058cbc82b17SPeter P Waskiewicz Jr static void x86_init_cache_qos(struct cpuinfo_x86 *c)
1059cbc82b17SPeter P Waskiewicz Jr {
1060cbc82b17SPeter P Waskiewicz Jr 	/*
1061cbc82b17SPeter P Waskiewicz Jr 	 * The heavy lifting of max_rmid and cache_occ_scale are handled
1062cbc82b17SPeter P Waskiewicz Jr 	 * in get_cpu_cap().  Here we just set the max_rmid for the boot_cpu
1063cbc82b17SPeter P Waskiewicz Jr 	 * in case CQM bits really aren't there in this CPU.
1064cbc82b17SPeter P Waskiewicz Jr 	 */
1065cbc82b17SPeter P Waskiewicz Jr 	if (c != &boot_cpu_data) {
1066cbc82b17SPeter P Waskiewicz Jr 		boot_cpu_data.x86_cache_max_rmid =
1067cbc82b17SPeter P Waskiewicz Jr 			min(boot_cpu_data.x86_cache_max_rmid,
1068cbc82b17SPeter P Waskiewicz Jr 			    c->x86_cache_max_rmid);
1069cbc82b17SPeter P Waskiewicz Jr 	}
1070cbc82b17SPeter P Waskiewicz Jr }
1071cbc82b17SPeter P Waskiewicz Jr 
1072f7627e25SThomas Gleixner /*
10739d85eb91SThomas Gleixner  * Validate that ACPI/mptables have the same information about the
10749d85eb91SThomas Gleixner  * effective APIC id and update the package map.
1075d49597fdSThomas Gleixner  */
10769d85eb91SThomas Gleixner static void validate_apic_and_package_id(struct cpuinfo_x86 *c)
1077d49597fdSThomas Gleixner {
1078d49597fdSThomas Gleixner #ifdef CONFIG_SMP
10799d85eb91SThomas Gleixner 	unsigned int apicid, cpu = smp_processor_id();
1080d49597fdSThomas Gleixner 
1081d49597fdSThomas Gleixner 	apicid = apic->cpu_present_to_apicid(cpu);
1082d49597fdSThomas Gleixner 
10839d85eb91SThomas Gleixner 	if (apicid != c->apicid) {
10849d85eb91SThomas Gleixner 		pr_err(FW_BUG "CPU%u: APIC id mismatch. Firmware: %x APIC: %x\n",
1085d49597fdSThomas Gleixner 		       cpu, apicid, c->initial_apicid);
1086d49597fdSThomas Gleixner 	}
10879d85eb91SThomas Gleixner 	BUG_ON(topology_update_package_map(c->phys_proc_id, cpu));
1088d49597fdSThomas Gleixner #else
1089d49597fdSThomas Gleixner 	c->logical_proc_id = 0;
1090d49597fdSThomas Gleixner #endif
1091d49597fdSThomas Gleixner }
1092d49597fdSThomas Gleixner 
1093d49597fdSThomas Gleixner /*
1094f7627e25SThomas Gleixner  * This does the hard work of actually picking apart the CPU stuff...
1095f7627e25SThomas Gleixner  */
1096148f9bb8SPaul Gortmaker static void identify_cpu(struct cpuinfo_x86 *c)
1097f7627e25SThomas Gleixner {
1098f7627e25SThomas Gleixner 	int i;
1099f7627e25SThomas Gleixner 
1100f7627e25SThomas Gleixner 	c->loops_per_jiffy = loops_per_jiffy;
1101f7627e25SThomas Gleixner 	c->x86_cache_size = -1;
1102f7627e25SThomas Gleixner 	c->x86_vendor = X86_VENDOR_UNKNOWN;
1103f7627e25SThomas Gleixner 	c->x86_model = c->x86_mask = 0;	/* So far unknown... */
1104f7627e25SThomas Gleixner 	c->x86_vendor_id[0] = '\0'; /* Unset */
1105f7627e25SThomas Gleixner 	c->x86_model_id[0] = '\0';  /* Unset */
1106f7627e25SThomas Gleixner 	c->x86_max_cores = 1;
1107102bbe3aSYinghai Lu 	c->x86_coreid_bits = 0;
110879a8b9aaSBorislav Petkov 	c->cu_id = 0xff;
110911fdd252SYinghai Lu #ifdef CONFIG_X86_64
1110102bbe3aSYinghai Lu 	c->x86_clflush_size = 64;
111113c6c532SJan Beulich 	c->x86_phys_bits = 36;
111213c6c532SJan Beulich 	c->x86_virt_bits = 48;
1113102bbe3aSYinghai Lu #else
1114102bbe3aSYinghai Lu 	c->cpuid_level = -1;	/* CPUID not detected */
1115f7627e25SThomas Gleixner 	c->x86_clflush_size = 32;
111613c6c532SJan Beulich 	c->x86_phys_bits = 32;
111713c6c532SJan Beulich 	c->x86_virt_bits = 32;
1118102bbe3aSYinghai Lu #endif
1119102bbe3aSYinghai Lu 	c->x86_cache_alignment = c->x86_clflush_size;
1120f7627e25SThomas Gleixner 	memset(&c->x86_capability, 0, sizeof c->x86_capability);
1121f7627e25SThomas Gleixner 
1122f7627e25SThomas Gleixner 	generic_identify(c);
1123f7627e25SThomas Gleixner 
11243898534dSAndi Kleen 	if (this_cpu->c_identify)
1125f7627e25SThomas Gleixner 		this_cpu->c_identify(c);
1126f7627e25SThomas Gleixner 
11276a6256f9SAdam Buchbinder 	/* Clear/Set all flags overridden by options, after probe */
11288bf1ebcaSAndy Lutomirski 	apply_forced_caps(c);
11292759c328SYinghai Lu 
1130102bbe3aSYinghai Lu #ifdef CONFIG_X86_64
1131cb8cc442SIngo Molnar 	c->apicid = apic->phys_pkg_id(c->initial_apicid, 0);
1132102bbe3aSYinghai Lu #endif
1133102bbe3aSYinghai Lu 
1134f7627e25SThomas Gleixner 	/*
1135f7627e25SThomas Gleixner 	 * Vendor-specific initialization.  In this section we
1136f7627e25SThomas Gleixner 	 * canonicalize the feature flags, meaning if there are
1137f7627e25SThomas Gleixner 	 * features a certain CPU supports which CPUID doesn't
1138f7627e25SThomas Gleixner 	 * tell us, CPUID claiming incorrect flags, or other bugs,
1139f7627e25SThomas Gleixner 	 * we handle them here.
1140f7627e25SThomas Gleixner 	 *
1141f7627e25SThomas Gleixner 	 * At the end of this section, c->x86_capability better
1142f7627e25SThomas Gleixner 	 * indicate the features this CPU genuinely supports!
1143f7627e25SThomas Gleixner 	 */
1144f7627e25SThomas Gleixner 	if (this_cpu->c_init)
1145f7627e25SThomas Gleixner 		this_cpu->c_init(c);
1146f7627e25SThomas Gleixner 
1147f7627e25SThomas Gleixner 	/* Disable the PN if appropriate */
1148f7627e25SThomas Gleixner 	squash_the_stupid_serial_number(c);
1149f7627e25SThomas Gleixner 
1150b2cc2a07SH. Peter Anvin 	/* Set up SMEP/SMAP */
1151b2cc2a07SH. Peter Anvin 	setup_smep(c);
1152b2cc2a07SH. Peter Anvin 	setup_smap(c);
1153b2cc2a07SH. Peter Anvin 
1154f7627e25SThomas Gleixner 	/*
11550f3fa48aSIngo Molnar 	 * The vendor-specific functions might have changed features.
11560f3fa48aSIngo Molnar 	 * Now we do "generic changes."
1157f7627e25SThomas Gleixner 	 */
1158f7627e25SThomas Gleixner 
1159b38b0665SH. Peter Anvin 	/* Filter out anything that depends on CPUID levels we don't have */
1160b38b0665SH. Peter Anvin 	filter_cpuid_features(c, true);
1161b38b0665SH. Peter Anvin 
1162f7627e25SThomas Gleixner 	/* If the model name is still unset, do table lookup. */
1163f7627e25SThomas Gleixner 	if (!c->x86_model_id[0]) {
116402dde8b4SJan Beulich 		const char *p;
1165f7627e25SThomas Gleixner 		p = table_lookup_model(c);
1166f7627e25SThomas Gleixner 		if (p)
1167f7627e25SThomas Gleixner 			strcpy(c->x86_model_id, p);
1168f7627e25SThomas Gleixner 		else
1169f7627e25SThomas Gleixner 			/* Last resort... */
1170f7627e25SThomas Gleixner 			sprintf(c->x86_model_id, "%02x/%02x",
1171f7627e25SThomas Gleixner 				c->x86, c->x86_model);
1172f7627e25SThomas Gleixner 	}
1173f7627e25SThomas Gleixner 
1174102bbe3aSYinghai Lu #ifdef CONFIG_X86_64
1175102bbe3aSYinghai Lu 	detect_ht(c);
1176102bbe3aSYinghai Lu #endif
1177102bbe3aSYinghai Lu 
117849d859d7SH. Peter Anvin 	x86_init_rdrand(c);
1179cbc82b17SPeter P Waskiewicz Jr 	x86_init_cache_qos(c);
118006976945SDave Hansen 	setup_pku(c);
11813e0c3737SYinghai Lu 
11823e0c3737SYinghai Lu 	/*
11836a6256f9SAdam Buchbinder 	 * Clear/Set all flags overridden by options, need do it
11843e0c3737SYinghai Lu 	 * before following smp all cpus cap AND.
11853e0c3737SYinghai Lu 	 */
11868bf1ebcaSAndy Lutomirski 	apply_forced_caps(c);
11873e0c3737SYinghai Lu 
1188f7627e25SThomas Gleixner 	/*
1189f7627e25SThomas Gleixner 	 * On SMP, boot_cpu_data holds the common feature set between
1190f7627e25SThomas Gleixner 	 * all CPUs; so make sure that we indicate which features are
1191f7627e25SThomas Gleixner 	 * common between the CPUs.  The first time this routine gets
1192f7627e25SThomas Gleixner 	 * executed, c == &boot_cpu_data.
1193f7627e25SThomas Gleixner 	 */
1194f7627e25SThomas Gleixner 	if (c != &boot_cpu_data) {
1195f7627e25SThomas Gleixner 		/* AND the already accumulated flags with these */
1196f7627e25SThomas Gleixner 		for (i = 0; i < NCAPINTS; i++)
1197f7627e25SThomas Gleixner 			boot_cpu_data.x86_capability[i] &= c->x86_capability[i];
119865fc985bSBorislav Petkov 
119965fc985bSBorislav Petkov 		/* OR, i.e. replicate the bug flags */
120065fc985bSBorislav Petkov 		for (i = NCAPINTS; i < NCAPINTS + NBUGINTS; i++)
120165fc985bSBorislav Petkov 			c->x86_capability[i] |= boot_cpu_data.x86_capability[i];
1202f7627e25SThomas Gleixner 	}
1203f7627e25SThomas Gleixner 
1204f7627e25SThomas Gleixner 	/* Init Machine Check Exception if available. */
12055e09954aSBorislav Petkov 	mcheck_cpu_init(c);
120630d432dfSAndi Kleen 
120730d432dfSAndi Kleen 	select_idle_routine(c);
1208102bbe3aSYinghai Lu 
1209de2d9445STejun Heo #ifdef CONFIG_NUMA
1210102bbe3aSYinghai Lu 	numa_add_cpu(smp_processor_id());
1211102bbe3aSYinghai Lu #endif
1212f7627e25SThomas Gleixner }
1213f7627e25SThomas Gleixner 
12148b6c0ab1SIngo Molnar /*
12158b6c0ab1SIngo Molnar  * Set up the CPU state needed to execute SYSENTER/SYSEXIT instructions
12168b6c0ab1SIngo Molnar  * on 32-bit kernels:
12178b6c0ab1SIngo Molnar  */
1218cfda7bb9SAndy Lutomirski #ifdef CONFIG_X86_32
1219cfda7bb9SAndy Lutomirski void enable_sep_cpu(void)
1220cfda7bb9SAndy Lutomirski {
12218b6c0ab1SIngo Molnar 	struct tss_struct *tss;
12228b6c0ab1SIngo Molnar 	int cpu;
1223cfda7bb9SAndy Lutomirski 
1224b3edfda4SBorislav Petkov 	if (!boot_cpu_has(X86_FEATURE_SEP))
1225b3edfda4SBorislav Petkov 		return;
1226b3edfda4SBorislav Petkov 
12278b6c0ab1SIngo Molnar 	cpu = get_cpu();
12288b6c0ab1SIngo Molnar 	tss = &per_cpu(cpu_tss, cpu);
12298b6c0ab1SIngo Molnar 
12308b6c0ab1SIngo Molnar 	/*
1231cf9328ccSAndy Lutomirski 	 * We cache MSR_IA32_SYSENTER_CS's value in the TSS's ss1 field --
1232cf9328ccSAndy Lutomirski 	 * see the big comment in struct x86_hw_tss's definition.
12338b6c0ab1SIngo Molnar 	 */
1234cfda7bb9SAndy Lutomirski 
1235cfda7bb9SAndy Lutomirski 	tss->x86_tss.ss1 = __KERNEL_CS;
12368b6c0ab1SIngo Molnar 	wrmsr(MSR_IA32_SYSENTER_CS, tss->x86_tss.ss1, 0);
12378b6c0ab1SIngo Molnar 
1238cf9328ccSAndy Lutomirski 	wrmsr(MSR_IA32_SYSENTER_ESP,
1239cf9328ccSAndy Lutomirski 	      (unsigned long)tss + offsetofend(struct tss_struct, SYSENTER_stack),
1240cf9328ccSAndy Lutomirski 	      0);
12418b6c0ab1SIngo Molnar 
12424c8cd0c5SIngo Molnar 	wrmsr(MSR_IA32_SYSENTER_EIP, (unsigned long)entry_SYSENTER_32, 0);
12438b6c0ab1SIngo Molnar 
1244cfda7bb9SAndy Lutomirski 	put_cpu();
1245cfda7bb9SAndy Lutomirski }
1246e04d645fSGlauber Costa #endif
1247e04d645fSGlauber Costa 
1248f7627e25SThomas Gleixner void __init identify_boot_cpu(void)
1249f7627e25SThomas Gleixner {
1250f7627e25SThomas Gleixner 	identify_cpu(&boot_cpu_data);
1251102bbe3aSYinghai Lu #ifdef CONFIG_X86_32
1252f7627e25SThomas Gleixner 	sysenter_setup();
1253f7627e25SThomas Gleixner 	enable_sep_cpu();
1254102bbe3aSYinghai Lu #endif
1255e0ba94f1SAlex Shi 	cpu_detect_tlb(&boot_cpu_data);
1256f7627e25SThomas Gleixner }
1257f7627e25SThomas Gleixner 
1258148f9bb8SPaul Gortmaker void identify_secondary_cpu(struct cpuinfo_x86 *c)
1259f7627e25SThomas Gleixner {
1260f7627e25SThomas Gleixner 	BUG_ON(c == &boot_cpu_data);
1261f7627e25SThomas Gleixner 	identify_cpu(c);
1262102bbe3aSYinghai Lu #ifdef CONFIG_X86_32
1263f7627e25SThomas Gleixner 	enable_sep_cpu();
1264102bbe3aSYinghai Lu #endif
1265f7627e25SThomas Gleixner 	mtrr_ap_init();
12669d85eb91SThomas Gleixner 	validate_apic_and_package_id(c);
1267f7627e25SThomas Gleixner }
1268f7627e25SThomas Gleixner 
1269191679fdSAndi Kleen static __init int setup_noclflush(char *arg)
1270191679fdSAndi Kleen {
1271840d2830SH. Peter Anvin 	setup_clear_cpu_cap(X86_FEATURE_CLFLUSH);
1272da4aaa7dSH. Peter Anvin 	setup_clear_cpu_cap(X86_FEATURE_CLFLUSHOPT);
1273191679fdSAndi Kleen 	return 1;
1274191679fdSAndi Kleen }
1275191679fdSAndi Kleen __setup("noclflush", setup_noclflush);
1276191679fdSAndi Kleen 
1277148f9bb8SPaul Gortmaker void print_cpu_info(struct cpuinfo_x86 *c)
1278f7627e25SThomas Gleixner {
127902dde8b4SJan Beulich 	const char *vendor = NULL;
1280f7627e25SThomas Gleixner 
12810f3fa48aSIngo Molnar 	if (c->x86_vendor < X86_VENDOR_NUM) {
1282f7627e25SThomas Gleixner 		vendor = this_cpu->c_vendor;
12830f3fa48aSIngo Molnar 	} else {
12840f3fa48aSIngo Molnar 		if (c->cpuid_level >= 0)
1285f7627e25SThomas Gleixner 			vendor = c->x86_vendor_id;
12860f3fa48aSIngo Molnar 	}
1287f7627e25SThomas Gleixner 
1288bd32a8cfSYinghai Lu 	if (vendor && !strstr(c->x86_model_id, vendor))
12891b74dde7SChen Yucong 		pr_cont("%s ", vendor);
1290f7627e25SThomas Gleixner 
12919d31d35bSYinghai Lu 	if (c->x86_model_id[0])
12921b74dde7SChen Yucong 		pr_cont("%s", c->x86_model_id);
1293f7627e25SThomas Gleixner 	else
12941b74dde7SChen Yucong 		pr_cont("%d86", c->x86);
1295f7627e25SThomas Gleixner 
12961b74dde7SChen Yucong 	pr_cont(" (family: 0x%x, model: 0x%x", c->x86, c->x86_model);
1297924e101aSBorislav Petkov 
1298f7627e25SThomas Gleixner 	if (c->x86_mask || c->cpuid_level >= 0)
12991b74dde7SChen Yucong 		pr_cont(", stepping: 0x%x)\n", c->x86_mask);
1300f7627e25SThomas Gleixner 	else
13011b74dde7SChen Yucong 		pr_cont(")\n");
1302f7627e25SThomas Gleixner }
1303f7627e25SThomas Gleixner 
13040c2a3913SAndi Kleen /*
13050c2a3913SAndi Kleen  * clearcpuid= was already parsed in fpu__init_parse_early_param.
13060c2a3913SAndi Kleen  * But we need to keep a dummy __setup around otherwise it would
13070c2a3913SAndi Kleen  * show up as an environment variable for init.
13080c2a3913SAndi Kleen  */
13090c2a3913SAndi Kleen static __init int setup_clearcpuid(char *arg)
1310ac72e788SAndi Kleen {
1311ac72e788SAndi Kleen 	return 1;
1312ac72e788SAndi Kleen }
13130c2a3913SAndi Kleen __setup("clearcpuid=", setup_clearcpuid);
1314ac72e788SAndi Kleen 
1315d5494d4fSYinghai Lu #ifdef CONFIG_X86_64
1316947e76cdSBrian Gerst DEFINE_PER_CPU_FIRST(union irq_stack_union,
1317277d5b40SAndi Kleen 		     irq_stack_union) __aligned(PAGE_SIZE) __visible;
13180f3fa48aSIngo Molnar 
1319bdf977b3STejun Heo /*
1320a7fcf28dSAndy Lutomirski  * The following percpu variables are hot.  Align current_task to
1321a7fcf28dSAndy Lutomirski  * cacheline size such that they fall in the same cacheline.
1322bdf977b3STejun Heo  */
1323bdf977b3STejun Heo DEFINE_PER_CPU(struct task_struct *, current_task) ____cacheline_aligned =
1324bdf977b3STejun Heo 	&init_task;
1325bdf977b3STejun Heo EXPORT_PER_CPU_SYMBOL(current_task);
1326d5494d4fSYinghai Lu 
1327bdf977b3STejun Heo DEFINE_PER_CPU(char *, irq_stack_ptr) =
13284950d6d4SJosh Poimboeuf 	init_per_cpu_var(irq_stack_union.irq_stack) + IRQ_STACK_SIZE;
1329bdf977b3STejun Heo 
1330277d5b40SAndi Kleen DEFINE_PER_CPU(unsigned int, irq_count) __visible = -1;
1331d5494d4fSYinghai Lu 
1332c2daa3beSPeter Zijlstra DEFINE_PER_CPU(int, __preempt_count) = INIT_PREEMPT_COUNT;
1333c2daa3beSPeter Zijlstra EXPORT_PER_CPU_SYMBOL(__preempt_count);
1334c2daa3beSPeter Zijlstra 
13350f3fa48aSIngo Molnar /*
13360f3fa48aSIngo Molnar  * Special IST stacks which the CPU switches to when it calls
13370f3fa48aSIngo Molnar  * an IST-marked descriptor entry. Up to 7 stacks (hardware
13380f3fa48aSIngo Molnar  * limit), all of them are 4K, except the debug stack which
13390f3fa48aSIngo Molnar  * is 8K.
13400f3fa48aSIngo Molnar  */
13410f3fa48aSIngo Molnar static const unsigned int exception_stack_sizes[N_EXCEPTION_STACKS] = {
13420f3fa48aSIngo Molnar 	  [0 ... N_EXCEPTION_STACKS - 1]	= EXCEPTION_STKSZ,
13430f3fa48aSIngo Molnar 	  [DEBUG_STACK - 1]			= DEBUG_STKSZ
13440f3fa48aSIngo Molnar };
13450f3fa48aSIngo Molnar 
134692d65b23SBrian Gerst static DEFINE_PER_CPU_PAGE_ALIGNED(char, exception_stacks
13473e352aa8STejun Heo 	[(N_EXCEPTION_STACKS - 1) * EXCEPTION_STKSZ + DEBUG_STKSZ]);
1348d5494d4fSYinghai Lu 
1349d5494d4fSYinghai Lu /* May not be marked __init: used by software suspend */
1350d5494d4fSYinghai Lu void syscall_init(void)
1351d5494d4fSYinghai Lu {
135231ac34caSBorislav Petkov 	wrmsr(MSR_STAR, 0, (__USER32_CS << 16) | __KERNEL_CS);
135347edb651SAndy Lutomirski 	wrmsrl(MSR_LSTAR, (unsigned long)entry_SYSCALL_64);
1354d56fe4bfSIngo Molnar 
1355d56fe4bfSIngo Molnar #ifdef CONFIG_IA32_EMULATION
135647edb651SAndy Lutomirski 	wrmsrl(MSR_CSTAR, (unsigned long)entry_SYSCALL_compat);
1357a76c7f46SDenys Vlasenko 	/*
1358487d1edbSDenys Vlasenko 	 * This only works on Intel CPUs.
1359487d1edbSDenys Vlasenko 	 * On AMD CPUs these MSRs are 32-bit, CPU truncates MSR_IA32_SYSENTER_EIP.
1360487d1edbSDenys Vlasenko 	 * This does not cause SYSENTER to jump to the wrong location, because
1361487d1edbSDenys Vlasenko 	 * AMD doesn't allow SYSENTER in long mode (either 32- or 64-bit).
1362a76c7f46SDenys Vlasenko 	 */
1363a76c7f46SDenys Vlasenko 	wrmsrl_safe(MSR_IA32_SYSENTER_CS, (u64)__KERNEL_CS);
13641a79797bSAndy Lutomirski 	wrmsrl_safe(MSR_IA32_SYSENTER_ESP,
13651a79797bSAndy Lutomirski 		    (unsigned long)this_cpu_ptr(&cpu_tss) +
13661a79797bSAndy Lutomirski 		    offsetofend(struct tss_struct, SYSENTER_stack));
13674c8cd0c5SIngo Molnar 	wrmsrl_safe(MSR_IA32_SYSENTER_EIP, (u64)entry_SYSENTER_compat);
1368d56fe4bfSIngo Molnar #else
136947edb651SAndy Lutomirski 	wrmsrl(MSR_CSTAR, (unsigned long)ignore_sysret);
13706b51311cSBorislav Petkov 	wrmsrl_safe(MSR_IA32_SYSENTER_CS, (u64)GDT_ENTRY_INVALID_SEG);
1371d56fe4bfSIngo Molnar 	wrmsrl_safe(MSR_IA32_SYSENTER_ESP, 0ULL);
1372d56fe4bfSIngo Molnar 	wrmsrl_safe(MSR_IA32_SYSENTER_EIP, 0ULL);
1373d5494d4fSYinghai Lu #endif
1374d5494d4fSYinghai Lu 
1375d5494d4fSYinghai Lu 	/* Flags to clear on syscall */
1376d5494d4fSYinghai Lu 	wrmsrl(MSR_SYSCALL_MASK,
137763bcff2aSH. Peter Anvin 	       X86_EFLAGS_TF|X86_EFLAGS_DF|X86_EFLAGS_IF|
13788c7aa698SAndy Lutomirski 	       X86_EFLAGS_IOPL|X86_EFLAGS_AC|X86_EFLAGS_NT);
1379d5494d4fSYinghai Lu }
1380d5494d4fSYinghai Lu 
1381d5494d4fSYinghai Lu /*
1382d5494d4fSYinghai Lu  * Copies of the original ist values from the tss are only accessed during
1383d5494d4fSYinghai Lu  * debugging, no special alignment required.
1384d5494d4fSYinghai Lu  */
1385d5494d4fSYinghai Lu DEFINE_PER_CPU(struct orig_ist, orig_ist);
1386d5494d4fSYinghai Lu 
1387228bdaa9SSteven Rostedt static DEFINE_PER_CPU(unsigned long, debug_stack_addr);
138842181186SSteven Rostedt DEFINE_PER_CPU(int, debug_stack_usage);
1389228bdaa9SSteven Rostedt 
1390228bdaa9SSteven Rostedt int is_debug_stack(unsigned long addr)
1391228bdaa9SSteven Rostedt {
139289cbc767SChristoph Lameter 	return __this_cpu_read(debug_stack_usage) ||
139389cbc767SChristoph Lameter 		(addr <= __this_cpu_read(debug_stack_addr) &&
139489cbc767SChristoph Lameter 		 addr > (__this_cpu_read(debug_stack_addr) - DEBUG_STKSZ));
1395228bdaa9SSteven Rostedt }
13960f46efebSMasami Hiramatsu NOKPROBE_SYMBOL(is_debug_stack);
1397228bdaa9SSteven Rostedt 
1398629f4f9dSSeiji Aguchi DEFINE_PER_CPU(u32, debug_idt_ctr);
1399f8988175SSteven Rostedt 
1400228bdaa9SSteven Rostedt void debug_stack_set_zero(void)
1401228bdaa9SSteven Rostedt {
1402629f4f9dSSeiji Aguchi 	this_cpu_inc(debug_idt_ctr);
1403629f4f9dSSeiji Aguchi 	load_current_idt();
1404228bdaa9SSteven Rostedt }
14050f46efebSMasami Hiramatsu NOKPROBE_SYMBOL(debug_stack_set_zero);
1406228bdaa9SSteven Rostedt 
1407228bdaa9SSteven Rostedt void debug_stack_reset(void)
1408228bdaa9SSteven Rostedt {
1409629f4f9dSSeiji Aguchi 	if (WARN_ON(!this_cpu_read(debug_idt_ctr)))
1410f8988175SSteven Rostedt 		return;
1411629f4f9dSSeiji Aguchi 	if (this_cpu_dec_return(debug_idt_ctr) == 0)
1412629f4f9dSSeiji Aguchi 		load_current_idt();
1413228bdaa9SSteven Rostedt }
14140f46efebSMasami Hiramatsu NOKPROBE_SYMBOL(debug_stack_reset);
1415228bdaa9SSteven Rostedt 
14160f3fa48aSIngo Molnar #else	/* CONFIG_X86_64 */
1417d5494d4fSYinghai Lu 
1418bdf977b3STejun Heo DEFINE_PER_CPU(struct task_struct *, current_task) = &init_task;
1419bdf977b3STejun Heo EXPORT_PER_CPU_SYMBOL(current_task);
1420c2daa3beSPeter Zijlstra DEFINE_PER_CPU(int, __preempt_count) = INIT_PREEMPT_COUNT;
1421c2daa3beSPeter Zijlstra EXPORT_PER_CPU_SYMBOL(__preempt_count);
1422bdf977b3STejun Heo 
1423a7fcf28dSAndy Lutomirski /*
1424a7fcf28dSAndy Lutomirski  * On x86_32, vm86 modifies tss.sp0, so sp0 isn't a reliable way to find
1425a7fcf28dSAndy Lutomirski  * the top of the kernel stack.  Use an extra percpu variable to track the
1426a7fcf28dSAndy Lutomirski  * top of the kernel stack directly.
1427a7fcf28dSAndy Lutomirski  */
1428a7fcf28dSAndy Lutomirski DEFINE_PER_CPU(unsigned long, cpu_current_top_of_stack) =
1429a7fcf28dSAndy Lutomirski 	(unsigned long)&init_thread_union + THREAD_SIZE;
1430a7fcf28dSAndy Lutomirski EXPORT_PER_CPU_SYMBOL(cpu_current_top_of_stack);
1431a7fcf28dSAndy Lutomirski 
143260a5317fSTejun Heo #ifdef CONFIG_CC_STACKPROTECTOR
143353f82452SJeremy Fitzhardinge DEFINE_PER_CPU_ALIGNED(struct stack_canary, stack_canary);
143460a5317fSTejun Heo #endif
143560a5317fSTejun Heo 
14360f3fa48aSIngo Molnar #endif	/* CONFIG_X86_64 */
1437f7627e25SThomas Gleixner 
1438f7627e25SThomas Gleixner /*
14399766cdbcSJaswinder Singh Rajput  * Clear all 6 debug registers:
14409766cdbcSJaswinder Singh Rajput  */
14419766cdbcSJaswinder Singh Rajput static void clear_all_debug_regs(void)
14429766cdbcSJaswinder Singh Rajput {
14439766cdbcSJaswinder Singh Rajput 	int i;
14449766cdbcSJaswinder Singh Rajput 
14459766cdbcSJaswinder Singh Rajput 	for (i = 0; i < 8; i++) {
14469766cdbcSJaswinder Singh Rajput 		/* Ignore db4, db5 */
14479766cdbcSJaswinder Singh Rajput 		if ((i == 4) || (i == 5))
14489766cdbcSJaswinder Singh Rajput 			continue;
14499766cdbcSJaswinder Singh Rajput 
14509766cdbcSJaswinder Singh Rajput 		set_debugreg(0, i);
14519766cdbcSJaswinder Singh Rajput 	}
14529766cdbcSJaswinder Singh Rajput }
1453f7627e25SThomas Gleixner 
14540bb9fef9SJason Wessel #ifdef CONFIG_KGDB
14550bb9fef9SJason Wessel /*
14560bb9fef9SJason Wessel  * Restore debug regs if using kgdbwait and you have a kernel debugger
14570bb9fef9SJason Wessel  * connection established.
14580bb9fef9SJason Wessel  */
14590bb9fef9SJason Wessel static void dbg_restore_debug_regs(void)
14600bb9fef9SJason Wessel {
14610bb9fef9SJason Wessel 	if (unlikely(kgdb_connected && arch_kgdb_ops.correct_hw_break))
14620bb9fef9SJason Wessel 		arch_kgdb_ops.correct_hw_break();
14630bb9fef9SJason Wessel }
14640bb9fef9SJason Wessel #else /* ! CONFIG_KGDB */
14650bb9fef9SJason Wessel #define dbg_restore_debug_regs()
14660bb9fef9SJason Wessel #endif /* ! CONFIG_KGDB */
14670bb9fef9SJason Wessel 
1468ce4b1b16SIgor Mammedov static void wait_for_master_cpu(int cpu)
1469ce4b1b16SIgor Mammedov {
1470ce4b1b16SIgor Mammedov #ifdef CONFIG_SMP
1471ce4b1b16SIgor Mammedov 	/*
1472ce4b1b16SIgor Mammedov 	 * wait for ACK from master CPU before continuing
1473ce4b1b16SIgor Mammedov 	 * with AP initialization
1474ce4b1b16SIgor Mammedov 	 */
1475ce4b1b16SIgor Mammedov 	WARN_ON(cpumask_test_and_set_cpu(cpu, cpu_initialized_mask));
1476ce4b1b16SIgor Mammedov 	while (!cpumask_test_cpu(cpu, cpu_callout_mask))
1477ce4b1b16SIgor Mammedov 		cpu_relax();
1478ce4b1b16SIgor Mammedov #endif
1479ce4b1b16SIgor Mammedov }
1480ce4b1b16SIgor Mammedov 
1481f7627e25SThomas Gleixner /*
1482f7627e25SThomas Gleixner  * cpu_init() initializes state that is per-CPU. Some data is already
1483f7627e25SThomas Gleixner  * initialized (naturally) in the bootstrap process, such as the GDT
1484f7627e25SThomas Gleixner  * and IDT. We reload them nevertheless, this function acts as a
1485f7627e25SThomas Gleixner  * 'CPU state barrier', nothing should get across.
14861ba76586SYinghai Lu  * A lot of state is already set up in PDA init for 64 bit
1487f7627e25SThomas Gleixner  */
14881ba76586SYinghai Lu #ifdef CONFIG_X86_64
14890f3fa48aSIngo Molnar 
1490148f9bb8SPaul Gortmaker void cpu_init(void)
14911ba76586SYinghai Lu {
14920fe1e009STejun Heo 	struct orig_ist *oist;
14931ba76586SYinghai Lu 	struct task_struct *me;
14940f3fa48aSIngo Molnar 	struct tss_struct *t;
14950f3fa48aSIngo Molnar 	unsigned long v;
1496fb59831bSAndy Lutomirski 	int cpu = raw_smp_processor_id();
14971ba76586SYinghai Lu 	int i;
14981ba76586SYinghai Lu 
1499ce4b1b16SIgor Mammedov 	wait_for_master_cpu(cpu);
1500ce4b1b16SIgor Mammedov 
1501e6ebf5deSFenghua Yu 	/*
15021e02ce4cSAndy Lutomirski 	 * Initialize the CR4 shadow before doing anything that could
15031e02ce4cSAndy Lutomirski 	 * try to read it.
15041e02ce4cSAndy Lutomirski 	 */
15051e02ce4cSAndy Lutomirski 	cr4_init_shadow();
15061e02ce4cSAndy Lutomirski 
1507777284b6SBorislav Petkov 	if (cpu)
1508e6ebf5deSFenghua Yu 		load_ucode_ap();
1509e6ebf5deSFenghua Yu 
151024933b82SAndy Lutomirski 	t = &per_cpu(cpu_tss, cpu);
15110fe1e009STejun Heo 	oist = &per_cpu(orig_ist, cpu);
15120f3fa48aSIngo Molnar 
1513e7a22c1eSBrian Gerst #ifdef CONFIG_NUMA
151427fd185fSFenghua Yu 	if (this_cpu_read(numa_node) == 0 &&
1515e534c7c5SLee Schermerhorn 	    early_cpu_to_node(cpu) != NUMA_NO_NODE)
1516e534c7c5SLee Schermerhorn 		set_numa_node(early_cpu_to_node(cpu));
1517e7a22c1eSBrian Gerst #endif
15181ba76586SYinghai Lu 
15191ba76586SYinghai Lu 	me = current;
15201ba76586SYinghai Lu 
15212eaad1fdSMike Travis 	pr_debug("Initializing CPU#%d\n", cpu);
15221ba76586SYinghai Lu 
1523375074ccSAndy Lutomirski 	cr4_clear_bits(X86_CR4_VME|X86_CR4_PVI|X86_CR4_TSD|X86_CR4_DE);
15241ba76586SYinghai Lu 
15251ba76586SYinghai Lu 	/*
15261ba76586SYinghai Lu 	 * Initialize the per-CPU GDT with the boot GDT,
15271ba76586SYinghai Lu 	 * and set up the GDT descriptor:
15281ba76586SYinghai Lu 	 */
15291ba76586SYinghai Lu 
1530552be871SBrian Gerst 	switch_to_new_gdt(cpu);
15312697fbd5SBrian Gerst 	loadsegment(fs, 0);
15322697fbd5SBrian Gerst 
1533cf910e83SSeiji Aguchi 	load_current_idt();
15341ba76586SYinghai Lu 
15351ba76586SYinghai Lu 	memset(me->thread.tls_array, 0, GDT_ENTRY_TLS_ENTRIES * 8);
15361ba76586SYinghai Lu 	syscall_init();
15371ba76586SYinghai Lu 
15381ba76586SYinghai Lu 	wrmsrl(MSR_FS_BASE, 0);
15391ba76586SYinghai Lu 	wrmsrl(MSR_KERNEL_GS_BASE, 0);
15401ba76586SYinghai Lu 	barrier();
15411ba76586SYinghai Lu 
15424763ed4dSH. Peter Anvin 	x86_configure_nx();
1543659006bfSThomas Gleixner 	x2apic_setup();
15441ba76586SYinghai Lu 
15451ba76586SYinghai Lu 	/*
15461ba76586SYinghai Lu 	 * set up and load the per-CPU TSS
15471ba76586SYinghai Lu 	 */
15480fe1e009STejun Heo 	if (!oist->ist[0]) {
154992d65b23SBrian Gerst 		char *estacks = per_cpu(exception_stacks, cpu);
15500f3fa48aSIngo Molnar 
15511ba76586SYinghai Lu 		for (v = 0; v < N_EXCEPTION_STACKS; v++) {
15520f3fa48aSIngo Molnar 			estacks += exception_stack_sizes[v];
15530fe1e009STejun Heo 			oist->ist[v] = t->x86_tss.ist[v] =
15541ba76586SYinghai Lu 					(unsigned long)estacks;
1555228bdaa9SSteven Rostedt 			if (v == DEBUG_STACK-1)
1556228bdaa9SSteven Rostedt 				per_cpu(debug_stack_addr, cpu) = (unsigned long)estacks;
15571ba76586SYinghai Lu 		}
15581ba76586SYinghai Lu 	}
15591ba76586SYinghai Lu 
15601ba76586SYinghai Lu 	t->x86_tss.io_bitmap_base = offsetof(struct tss_struct, io_bitmap);
15610f3fa48aSIngo Molnar 
15621ba76586SYinghai Lu 	/*
15631ba76586SYinghai Lu 	 * <= is required because the CPU will access up to
15641ba76586SYinghai Lu 	 * 8 bits beyond the end of the IO permission bitmap.
15651ba76586SYinghai Lu 	 */
15661ba76586SYinghai Lu 	for (i = 0; i <= IO_BITMAP_LONGS; i++)
15671ba76586SYinghai Lu 		t->io_bitmap[i] = ~0UL;
15681ba76586SYinghai Lu 
1569f1f10076SVegard Nossum 	mmgrab(&init_mm);
15701ba76586SYinghai Lu 	me->active_mm = &init_mm;
15718c5dfd25SStoyan Gaydarov 	BUG_ON(me->mm);
157272c0098dSAndy Lutomirski 	initialize_tlbstate_and_flush();
15731ba76586SYinghai Lu 	enter_lazy_tlb(&init_mm, me);
15741ba76586SYinghai Lu 
157520bb8344SAndy Lutomirski 	/*
157620bb8344SAndy Lutomirski 	 * Initialize the TSS.  Don't bother initializing sp0, as the initial
157720bb8344SAndy Lutomirski 	 * task never enters user mode.
157820bb8344SAndy Lutomirski 	 */
15791ba76586SYinghai Lu 	set_tss_desc(cpu, t);
15801ba76586SYinghai Lu 	load_TR_desc();
158120bb8344SAndy Lutomirski 
158237868fe1SAndy Lutomirski 	load_mm_ldt(&init_mm);
15831ba76586SYinghai Lu 
15849766cdbcSJaswinder Singh Rajput 	clear_all_debug_regs();
15850bb9fef9SJason Wessel 	dbg_restore_debug_regs();
15861ba76586SYinghai Lu 
158721c4cd10SIngo Molnar 	fpu__init_cpu();
15881ba76586SYinghai Lu 
15891ba76586SYinghai Lu 	if (is_uv_system())
15901ba76586SYinghai Lu 		uv_cpu_init();
159169218e47SThomas Garnier 
1592*ef8813abSAndy Lutomirski 	setup_cpu_entry_area(cpu);
159369218e47SThomas Garnier 	load_fixmap_gdt(cpu);
15941ba76586SYinghai Lu }
15951ba76586SYinghai Lu 
15961ba76586SYinghai Lu #else
15971ba76586SYinghai Lu 
1598148f9bb8SPaul Gortmaker void cpu_init(void)
1599f7627e25SThomas Gleixner {
1600f7627e25SThomas Gleixner 	int cpu = smp_processor_id();
1601f7627e25SThomas Gleixner 	struct task_struct *curr = current;
160224933b82SAndy Lutomirski 	struct tss_struct *t = &per_cpu(cpu_tss, cpu);
1603f7627e25SThomas Gleixner 
1604ce4b1b16SIgor Mammedov 	wait_for_master_cpu(cpu);
1605e6ebf5deSFenghua Yu 
16065b2bdbc8SSteven Rostedt 	/*
16075b2bdbc8SSteven Rostedt 	 * Initialize the CR4 shadow before doing anything that could
16085b2bdbc8SSteven Rostedt 	 * try to read it.
16095b2bdbc8SSteven Rostedt 	 */
16105b2bdbc8SSteven Rostedt 	cr4_init_shadow();
16115b2bdbc8SSteven Rostedt 
1612ce4b1b16SIgor Mammedov 	show_ucode_info_early();
1613f7627e25SThomas Gleixner 
16141b74dde7SChen Yucong 	pr_info("Initializing CPU#%d\n", cpu);
1615f7627e25SThomas Gleixner 
1616362f924bSBorislav Petkov 	if (cpu_feature_enabled(X86_FEATURE_VME) ||
161759e21e3dSBorislav Petkov 	    boot_cpu_has(X86_FEATURE_TSC) ||
1618362f924bSBorislav Petkov 	    boot_cpu_has(X86_FEATURE_DE))
1619375074ccSAndy Lutomirski 		cr4_clear_bits(X86_CR4_VME|X86_CR4_PVI|X86_CR4_TSD|X86_CR4_DE);
1620f7627e25SThomas Gleixner 
1621cf910e83SSeiji Aguchi 	load_current_idt();
1622552be871SBrian Gerst 	switch_to_new_gdt(cpu);
1623f7627e25SThomas Gleixner 
1624f7627e25SThomas Gleixner 	/*
1625f7627e25SThomas Gleixner 	 * Set up and load the per-CPU TSS and LDT
1626f7627e25SThomas Gleixner 	 */
1627f1f10076SVegard Nossum 	mmgrab(&init_mm);
1628f7627e25SThomas Gleixner 	curr->active_mm = &init_mm;
16298c5dfd25SStoyan Gaydarov 	BUG_ON(curr->mm);
163072c0098dSAndy Lutomirski 	initialize_tlbstate_and_flush();
1631f7627e25SThomas Gleixner 	enter_lazy_tlb(&init_mm, curr);
1632f7627e25SThomas Gleixner 
163320bb8344SAndy Lutomirski 	/*
163420bb8344SAndy Lutomirski 	 * Initialize the TSS.  Don't bother initializing sp0, as the initial
163520bb8344SAndy Lutomirski 	 * task never enters user mode.
163620bb8344SAndy Lutomirski 	 */
1637f7627e25SThomas Gleixner 	set_tss_desc(cpu, t);
1638f7627e25SThomas Gleixner 	load_TR_desc();
163920bb8344SAndy Lutomirski 
164037868fe1SAndy Lutomirski 	load_mm_ldt(&init_mm);
1641f7627e25SThomas Gleixner 
1642f9a196b8SThomas Gleixner 	t->x86_tss.io_bitmap_base = offsetof(struct tss_struct, io_bitmap);
1643f9a196b8SThomas Gleixner 
1644f7627e25SThomas Gleixner #ifdef CONFIG_DOUBLEFAULT
1645f7627e25SThomas Gleixner 	/* Set up doublefault TSS pointer in the GDT */
1646f7627e25SThomas Gleixner 	__set_tss_desc(cpu, GDT_ENTRY_DOUBLEFAULT_TSS, &doublefault_tss);
1647f7627e25SThomas Gleixner #endif
1648f7627e25SThomas Gleixner 
16499766cdbcSJaswinder Singh Rajput 	clear_all_debug_regs();
16500bb9fef9SJason Wessel 	dbg_restore_debug_regs();
1651f7627e25SThomas Gleixner 
165221c4cd10SIngo Molnar 	fpu__init_cpu();
165369218e47SThomas Garnier 
1654*ef8813abSAndy Lutomirski 	setup_cpu_entry_area(cpu);
165569218e47SThomas Garnier 	load_fixmap_gdt(cpu);
1656f7627e25SThomas Gleixner }
16571ba76586SYinghai Lu #endif
16585700f743SBorislav Petkov 
1659b51ef52dSLaura Abbott static void bsp_resume(void)
1660b51ef52dSLaura Abbott {
1661b51ef52dSLaura Abbott 	if (this_cpu->c_bsp_resume)
1662b51ef52dSLaura Abbott 		this_cpu->c_bsp_resume(&boot_cpu_data);
1663b51ef52dSLaura Abbott }
1664b51ef52dSLaura Abbott 
1665b51ef52dSLaura Abbott static struct syscore_ops cpu_syscore_ops = {
1666b51ef52dSLaura Abbott 	.resume		= bsp_resume,
1667b51ef52dSLaura Abbott };
1668b51ef52dSLaura Abbott 
1669b51ef52dSLaura Abbott static int __init init_cpu_syscore(void)
1670b51ef52dSLaura Abbott {
1671b51ef52dSLaura Abbott 	register_syscore_ops(&cpu_syscore_ops);
1672b51ef52dSLaura Abbott 	return 0;
1673b51ef52dSLaura Abbott }
1674b51ef52dSLaura Abbott core_initcall(init_cpu_syscore);
1675