1f0fc4affSYinghai Lu #include <linux/bootmem.h> 29766cdbcSJaswinder Singh Rajput #include <linux/linkage.h> 3f0fc4affSYinghai Lu #include <linux/bitops.h> 49766cdbcSJaswinder Singh Rajput #include <linux/kernel.h> 5186f4360SPaul Gortmaker #include <linux/export.h> 6f7627e25SThomas Gleixner #include <linux/percpu.h> 79766cdbcSJaswinder Singh Rajput #include <linux/string.h> 8ee098e1aSBorislav Petkov #include <linux/ctype.h> 99766cdbcSJaswinder Singh Rajput #include <linux/delay.h> 1068e21be2SIngo Molnar #include <linux/sched/mm.h> 11e6017571SIngo Molnar #include <linux/sched/clock.h> 129164bb4aSIngo Molnar #include <linux/sched/task.h> 139766cdbcSJaswinder Singh Rajput #include <linux/init.h> 140f46efebSMasami Hiramatsu #include <linux/kprobes.h> 159766cdbcSJaswinder Singh Rajput #include <linux/kgdb.h> 169766cdbcSJaswinder Singh Rajput #include <linux/smp.h> 179766cdbcSJaswinder Singh Rajput #include <linux/io.h> 18b51ef52dSLaura Abbott #include <linux/syscore_ops.h> 199766cdbcSJaswinder Singh Rajput 209766cdbcSJaswinder Singh Rajput #include <asm/stackprotector.h> 21cdd6c482SIngo Molnar #include <asm/perf_event.h> 22f7627e25SThomas Gleixner #include <asm/mmu_context.h> 2349d859d7SH. Peter Anvin #include <asm/archrandom.h> 249766cdbcSJaswinder Singh Rajput #include <asm/hypervisor.h> 259766cdbcSJaswinder Singh Rajput #include <asm/processor.h> 261e02ce4cSAndy Lutomirski #include <asm/tlbflush.h> 27f649e938SPaul Gortmaker #include <asm/debugreg.h> 289766cdbcSJaswinder Singh Rajput #include <asm/sections.h> 29f40c3300SAndy Lutomirski #include <asm/vsyscall.h> 308bdbd962SAlan Cox #include <linux/topology.h> 318bdbd962SAlan Cox #include <linux/cpumask.h> 329766cdbcSJaswinder Singh Rajput #include <asm/pgtable.h> 3360063497SArun Sharma #include <linux/atomic.h> 349766cdbcSJaswinder Singh Rajput #include <asm/proto.h> 359766cdbcSJaswinder Singh Rajput #include <asm/setup.h> 36f7627e25SThomas Gleixner #include <asm/apic.h> 379766cdbcSJaswinder Singh Rajput #include <asm/desc.h> 3878f7f1e5SIngo Molnar #include <asm/fpu/internal.h> 399766cdbcSJaswinder Singh Rajput #include <asm/mtrr.h> 400274f955SGrzegorz Andrejczuk #include <asm/hwcap2.h> 418bdbd962SAlan Cox #include <linux/numa.h> 429766cdbcSJaswinder Singh Rajput #include <asm/asm.h> 430f6ff2bcSDave Hansen #include <asm/bugs.h> 449766cdbcSJaswinder Singh Rajput #include <asm/cpu.h> 459766cdbcSJaswinder Singh Rajput #include <asm/mce.h> 469766cdbcSJaswinder Singh Rajput #include <asm/msr.h> 479766cdbcSJaswinder Singh Rajput #include <asm/pat.h> 48d288e1cfSFenghua Yu #include <asm/microcode.h> 49d288e1cfSFenghua Yu #include <asm/microcode_intel.h> 50e641f5f5SIngo Molnar 51f7627e25SThomas Gleixner #ifdef CONFIG_X86_LOCAL_APIC 52bdbcdd48STejun Heo #include <asm/uv/uv.h> 53f7627e25SThomas Gleixner #endif 54f7627e25SThomas Gleixner 55f7627e25SThomas Gleixner #include "cpu.h" 56f7627e25SThomas Gleixner 570274f955SGrzegorz Andrejczuk u32 elf_hwcap2 __read_mostly; 580274f955SGrzegorz Andrejczuk 59c2d1cec1SMike Travis /* all of these masks are initialized in setup_cpu_local_masks() */ 60c2d1cec1SMike Travis cpumask_var_t cpu_initialized_mask; 619766cdbcSJaswinder Singh Rajput cpumask_var_t cpu_callout_mask; 629766cdbcSJaswinder Singh Rajput cpumask_var_t cpu_callin_mask; 63c2d1cec1SMike Travis 64c2d1cec1SMike Travis /* representing cpus for which sibling maps can be computed */ 65c2d1cec1SMike Travis cpumask_var_t cpu_sibling_setup_mask; 66c2d1cec1SMike Travis 672f2f52baSBrian Gerst /* correctly size the local cpu masks */ 684369f1fbSIngo Molnar void __init setup_cpu_local_masks(void) 692f2f52baSBrian Gerst { 702f2f52baSBrian Gerst alloc_bootmem_cpumask_var(&cpu_initialized_mask); 712f2f52baSBrian Gerst alloc_bootmem_cpumask_var(&cpu_callin_mask); 722f2f52baSBrian Gerst alloc_bootmem_cpumask_var(&cpu_callout_mask); 732f2f52baSBrian Gerst alloc_bootmem_cpumask_var(&cpu_sibling_setup_mask); 742f2f52baSBrian Gerst } 752f2f52baSBrian Gerst 76148f9bb8SPaul Gortmaker static void default_init(struct cpuinfo_x86 *c) 77e8055139SOndrej Zary { 78e8055139SOndrej Zary #ifdef CONFIG_X86_64 7927c13eceSBorislav Petkov cpu_detect_cache_sizes(c); 80e8055139SOndrej Zary #else 81e8055139SOndrej Zary /* Not much we can do here... */ 82e8055139SOndrej Zary /* Check if at least it has cpuid */ 83e8055139SOndrej Zary if (c->cpuid_level == -1) { 84e8055139SOndrej Zary /* No cpuid. It must be an ancient CPU */ 85e8055139SOndrej Zary if (c->x86 == 4) 86e8055139SOndrej Zary strcpy(c->x86_model_id, "486"); 87e8055139SOndrej Zary else if (c->x86 == 3) 88e8055139SOndrej Zary strcpy(c->x86_model_id, "386"); 89e8055139SOndrej Zary } 90e8055139SOndrej Zary #endif 91e8055139SOndrej Zary } 92e8055139SOndrej Zary 93148f9bb8SPaul Gortmaker static const struct cpu_dev default_cpu = { 94e8055139SOndrej Zary .c_init = default_init, 95e8055139SOndrej Zary .c_vendor = "Unknown", 96e8055139SOndrej Zary .c_x86_vendor = X86_VENDOR_UNKNOWN, 97e8055139SOndrej Zary }; 98e8055139SOndrej Zary 99148f9bb8SPaul Gortmaker static const struct cpu_dev *this_cpu = &default_cpu; 1000a488a53SYinghai Lu 10106deef89SBrian Gerst DEFINE_PER_CPU_PAGE_ALIGNED(struct gdt_page, gdt_page) = { .gdt = { 102950ad7ffSYinghai Lu #ifdef CONFIG_X86_64 10306deef89SBrian Gerst /* 10406deef89SBrian Gerst * We need valid kernel segments for data and code in long mode too 105950ad7ffSYinghai Lu * IRET will check the segment types kkeil 2000/10/28 106950ad7ffSYinghai Lu * Also sysret mandates a special GDT layout 10706deef89SBrian Gerst * 1089766cdbcSJaswinder Singh Rajput * TLS descriptors are currently at a different place compared to i386. 10906deef89SBrian Gerst * Hopefully nobody expects them at a fixed place (Wine?) 110950ad7ffSYinghai Lu */ 1111e5de182SAkinobu Mita [GDT_ENTRY_KERNEL32_CS] = GDT_ENTRY_INIT(0xc09b, 0, 0xfffff), 1121e5de182SAkinobu Mita [GDT_ENTRY_KERNEL_CS] = GDT_ENTRY_INIT(0xa09b, 0, 0xfffff), 1131e5de182SAkinobu Mita [GDT_ENTRY_KERNEL_DS] = GDT_ENTRY_INIT(0xc093, 0, 0xfffff), 1141e5de182SAkinobu Mita [GDT_ENTRY_DEFAULT_USER32_CS] = GDT_ENTRY_INIT(0xc0fb, 0, 0xfffff), 1151e5de182SAkinobu Mita [GDT_ENTRY_DEFAULT_USER_DS] = GDT_ENTRY_INIT(0xc0f3, 0, 0xfffff), 1161e5de182SAkinobu Mita [GDT_ENTRY_DEFAULT_USER_CS] = GDT_ENTRY_INIT(0xa0fb, 0, 0xfffff), 117950ad7ffSYinghai Lu #else 1181e5de182SAkinobu Mita [GDT_ENTRY_KERNEL_CS] = GDT_ENTRY_INIT(0xc09a, 0, 0xfffff), 1191e5de182SAkinobu Mita [GDT_ENTRY_KERNEL_DS] = GDT_ENTRY_INIT(0xc092, 0, 0xfffff), 1201e5de182SAkinobu Mita [GDT_ENTRY_DEFAULT_USER_CS] = GDT_ENTRY_INIT(0xc0fa, 0, 0xfffff), 1211e5de182SAkinobu Mita [GDT_ENTRY_DEFAULT_USER_DS] = GDT_ENTRY_INIT(0xc0f2, 0, 0xfffff), 122f7627e25SThomas Gleixner /* 123f7627e25SThomas Gleixner * Segments used for calling PnP BIOS have byte granularity. 124f7627e25SThomas Gleixner * They code segments and data segments have fixed 64k limits, 125f7627e25SThomas Gleixner * the transfer segment sizes are set at run time. 126f7627e25SThomas Gleixner */ 1276842ef0eSGlauber de Oliveira Costa /* 32-bit code */ 1281e5de182SAkinobu Mita [GDT_ENTRY_PNPBIOS_CS32] = GDT_ENTRY_INIT(0x409a, 0, 0xffff), 1296842ef0eSGlauber de Oliveira Costa /* 16-bit code */ 1301e5de182SAkinobu Mita [GDT_ENTRY_PNPBIOS_CS16] = GDT_ENTRY_INIT(0x009a, 0, 0xffff), 1316842ef0eSGlauber de Oliveira Costa /* 16-bit data */ 1321e5de182SAkinobu Mita [GDT_ENTRY_PNPBIOS_DS] = GDT_ENTRY_INIT(0x0092, 0, 0xffff), 1336842ef0eSGlauber de Oliveira Costa /* 16-bit data */ 1341e5de182SAkinobu Mita [GDT_ENTRY_PNPBIOS_TS1] = GDT_ENTRY_INIT(0x0092, 0, 0), 1356842ef0eSGlauber de Oliveira Costa /* 16-bit data */ 1361e5de182SAkinobu Mita [GDT_ENTRY_PNPBIOS_TS2] = GDT_ENTRY_INIT(0x0092, 0, 0), 137f7627e25SThomas Gleixner /* 138f7627e25SThomas Gleixner * The APM segments have byte granularity and their bases 139f7627e25SThomas Gleixner * are set at run time. All have 64k limits. 140f7627e25SThomas Gleixner */ 1416842ef0eSGlauber de Oliveira Costa /* 32-bit code */ 1421e5de182SAkinobu Mita [GDT_ENTRY_APMBIOS_BASE] = GDT_ENTRY_INIT(0x409a, 0, 0xffff), 143f7627e25SThomas Gleixner /* 16-bit code */ 1441e5de182SAkinobu Mita [GDT_ENTRY_APMBIOS_BASE+1] = GDT_ENTRY_INIT(0x009a, 0, 0xffff), 1456842ef0eSGlauber de Oliveira Costa /* data */ 14672c4d853SIngo Molnar [GDT_ENTRY_APMBIOS_BASE+2] = GDT_ENTRY_INIT(0x4092, 0, 0xffff), 147f7627e25SThomas Gleixner 1481e5de182SAkinobu Mita [GDT_ENTRY_ESPFIX_SS] = GDT_ENTRY_INIT(0xc092, 0, 0xfffff), 1491e5de182SAkinobu Mita [GDT_ENTRY_PERCPU] = GDT_ENTRY_INIT(0xc092, 0, 0xfffff), 15060a5317fSTejun Heo GDT_STACK_CANARY_INIT 151950ad7ffSYinghai Lu #endif 15206deef89SBrian Gerst } }; 153f7627e25SThomas Gleixner EXPORT_PER_CPU_SYMBOL_GPL(gdt_page); 154f7627e25SThomas Gleixner 1558c3641e9SDave Hansen static int __init x86_mpx_setup(char *s) 1560c752a93SSuresh Siddha { 1578c3641e9SDave Hansen /* require an exact match without trailing characters */ 1582cd3949fSDave Hansen if (strlen(s)) 1592cd3949fSDave Hansen return 0; 1600c752a93SSuresh Siddha 1618c3641e9SDave Hansen /* do not emit a message if the feature is not present */ 1628c3641e9SDave Hansen if (!boot_cpu_has(X86_FEATURE_MPX)) 1636bad06b7SSuresh Siddha return 1; 1646bad06b7SSuresh Siddha 1658c3641e9SDave Hansen setup_clear_cpu_cap(X86_FEATURE_MPX); 1668c3641e9SDave Hansen pr_info("nompx: Intel Memory Protection Extensions (MPX) disabled\n"); 167b6f42a4aSFenghua Yu return 1; 168b6f42a4aSFenghua Yu } 1698c3641e9SDave Hansen __setup("nompx", x86_mpx_setup); 170b6f42a4aSFenghua Yu 1710790c9aaSAndy Lutomirski #ifdef CONFIG_X86_64 172c7ad5ad2SAndy Lutomirski static int __init x86_nopcid_setup(char *s) 1730790c9aaSAndy Lutomirski { 174c7ad5ad2SAndy Lutomirski /* nopcid doesn't accept parameters */ 175c7ad5ad2SAndy Lutomirski if (s) 176c7ad5ad2SAndy Lutomirski return -EINVAL; 1770790c9aaSAndy Lutomirski 1780790c9aaSAndy Lutomirski /* do not emit a message if the feature is not present */ 1790790c9aaSAndy Lutomirski if (!boot_cpu_has(X86_FEATURE_PCID)) 180c7ad5ad2SAndy Lutomirski return 0; 1810790c9aaSAndy Lutomirski 1820790c9aaSAndy Lutomirski setup_clear_cpu_cap(X86_FEATURE_PCID); 1830790c9aaSAndy Lutomirski pr_info("nopcid: PCID feature disabled\n"); 184c7ad5ad2SAndy Lutomirski return 0; 1850790c9aaSAndy Lutomirski } 186c7ad5ad2SAndy Lutomirski early_param("nopcid", x86_nopcid_setup); 1870790c9aaSAndy Lutomirski #endif 1880790c9aaSAndy Lutomirski 189d12a72b8SAndy Lutomirski static int __init x86_noinvpcid_setup(char *s) 190d12a72b8SAndy Lutomirski { 191d12a72b8SAndy Lutomirski /* noinvpcid doesn't accept parameters */ 192d12a72b8SAndy Lutomirski if (s) 193d12a72b8SAndy Lutomirski return -EINVAL; 194d12a72b8SAndy Lutomirski 195d12a72b8SAndy Lutomirski /* do not emit a message if the feature is not present */ 196d12a72b8SAndy Lutomirski if (!boot_cpu_has(X86_FEATURE_INVPCID)) 197d12a72b8SAndy Lutomirski return 0; 198d12a72b8SAndy Lutomirski 199d12a72b8SAndy Lutomirski setup_clear_cpu_cap(X86_FEATURE_INVPCID); 200d12a72b8SAndy Lutomirski pr_info("noinvpcid: INVPCID feature disabled\n"); 201d12a72b8SAndy Lutomirski return 0; 202d12a72b8SAndy Lutomirski } 203d12a72b8SAndy Lutomirski early_param("noinvpcid", x86_noinvpcid_setup); 204d12a72b8SAndy Lutomirski 205ba51dcedSYinghai Lu #ifdef CONFIG_X86_32 206148f9bb8SPaul Gortmaker static int cachesize_override = -1; 207148f9bb8SPaul Gortmaker static int disable_x86_serial_nr = 1; 208f7627e25SThomas Gleixner 209f7627e25SThomas Gleixner static int __init cachesize_setup(char *str) 210f7627e25SThomas Gleixner { 211f7627e25SThomas Gleixner get_option(&str, &cachesize_override); 212f7627e25SThomas Gleixner return 1; 213f7627e25SThomas Gleixner } 214f7627e25SThomas Gleixner __setup("cachesize=", cachesize_setup); 215f7627e25SThomas Gleixner 216f7627e25SThomas Gleixner static int __init x86_sep_setup(char *s) 217f7627e25SThomas Gleixner { 21813530257SAndi Kleen setup_clear_cpu_cap(X86_FEATURE_SEP); 219f7627e25SThomas Gleixner return 1; 220f7627e25SThomas Gleixner } 221f7627e25SThomas Gleixner __setup("nosep", x86_sep_setup); 222f7627e25SThomas Gleixner 223f7627e25SThomas Gleixner /* Standard macro to see if a specific flag is changeable */ 224f7627e25SThomas Gleixner static inline int flag_is_changeable_p(u32 flag) 225f7627e25SThomas Gleixner { 226f7627e25SThomas Gleixner u32 f1, f2; 227f7627e25SThomas Gleixner 22894f6bac1SKrzysztof Helt /* 22994f6bac1SKrzysztof Helt * Cyrix and IDT cpus allow disabling of CPUID 23094f6bac1SKrzysztof Helt * so the code below may return different results 23194f6bac1SKrzysztof Helt * when it is executed before and after enabling 23294f6bac1SKrzysztof Helt * the CPUID. Add "volatile" to not allow gcc to 23394f6bac1SKrzysztof Helt * optimize the subsequent calls to this function. 23494f6bac1SKrzysztof Helt */ 23594f6bac1SKrzysztof Helt asm volatile ("pushfl \n\t" 236f7627e25SThomas Gleixner "pushfl \n\t" 237f7627e25SThomas Gleixner "popl %0 \n\t" 238f7627e25SThomas Gleixner "movl %0, %1 \n\t" 239f7627e25SThomas Gleixner "xorl %2, %0 \n\t" 240f7627e25SThomas Gleixner "pushl %0 \n\t" 241f7627e25SThomas Gleixner "popfl \n\t" 242f7627e25SThomas Gleixner "pushfl \n\t" 243f7627e25SThomas Gleixner "popl %0 \n\t" 244f7627e25SThomas Gleixner "popfl \n\t" 2450f3fa48aSIngo Molnar 246f7627e25SThomas Gleixner : "=&r" (f1), "=&r" (f2) 247f7627e25SThomas Gleixner : "ir" (flag)); 248f7627e25SThomas Gleixner 249f7627e25SThomas Gleixner return ((f1^f2) & flag) != 0; 250f7627e25SThomas Gleixner } 251f7627e25SThomas Gleixner 252f7627e25SThomas Gleixner /* Probe for the CPUID instruction */ 253148f9bb8SPaul Gortmaker int have_cpuid_p(void) 254f7627e25SThomas Gleixner { 255f7627e25SThomas Gleixner return flag_is_changeable_p(X86_EFLAGS_ID); 256f7627e25SThomas Gleixner } 257f7627e25SThomas Gleixner 258148f9bb8SPaul Gortmaker static void squash_the_stupid_serial_number(struct cpuinfo_x86 *c) 2590a488a53SYinghai Lu { 2600a488a53SYinghai Lu unsigned long lo, hi; 2610f3fa48aSIngo Molnar 2620f3fa48aSIngo Molnar if (!cpu_has(c, X86_FEATURE_PN) || !disable_x86_serial_nr) 2630f3fa48aSIngo Molnar return; 2640f3fa48aSIngo Molnar 2650f3fa48aSIngo Molnar /* Disable processor serial number: */ 2660f3fa48aSIngo Molnar 2670a488a53SYinghai Lu rdmsr(MSR_IA32_BBL_CR_CTL, lo, hi); 2680a488a53SYinghai Lu lo |= 0x200000; 2690a488a53SYinghai Lu wrmsr(MSR_IA32_BBL_CR_CTL, lo, hi); 2700f3fa48aSIngo Molnar 2711b74dde7SChen Yucong pr_notice("CPU serial number disabled.\n"); 2720a488a53SYinghai Lu clear_cpu_cap(c, X86_FEATURE_PN); 2730a488a53SYinghai Lu 2740a488a53SYinghai Lu /* Disabling the serial number may affect the cpuid level */ 2750a488a53SYinghai Lu c->cpuid_level = cpuid_eax(0); 2760a488a53SYinghai Lu } 2770a488a53SYinghai Lu 2780a488a53SYinghai Lu static int __init x86_serial_nr_setup(char *s) 2790a488a53SYinghai Lu { 2800a488a53SYinghai Lu disable_x86_serial_nr = 0; 2810a488a53SYinghai Lu return 1; 2820a488a53SYinghai Lu } 2830a488a53SYinghai Lu __setup("serialnumber", x86_serial_nr_setup); 284ba51dcedSYinghai Lu #else 285102bbe3aSYinghai Lu static inline int flag_is_changeable_p(u32 flag) 286102bbe3aSYinghai Lu { 287102bbe3aSYinghai Lu return 1; 288102bbe3aSYinghai Lu } 289102bbe3aSYinghai Lu static inline void squash_the_stupid_serial_number(struct cpuinfo_x86 *c) 290102bbe3aSYinghai Lu { 291102bbe3aSYinghai Lu } 292ba51dcedSYinghai Lu #endif 2930a488a53SYinghai Lu 294de5397adSFenghua Yu static __init int setup_disable_smep(char *arg) 295de5397adSFenghua Yu { 296b2cc2a07SH. Peter Anvin setup_clear_cpu_cap(X86_FEATURE_SMEP); 2970f6ff2bcSDave Hansen /* Check for things that depend on SMEP being enabled: */ 2980f6ff2bcSDave Hansen check_mpx_erratum(&boot_cpu_data); 299de5397adSFenghua Yu return 1; 300de5397adSFenghua Yu } 301de5397adSFenghua Yu __setup("nosmep", setup_disable_smep); 302de5397adSFenghua Yu 303b2cc2a07SH. Peter Anvin static __always_inline void setup_smep(struct cpuinfo_x86 *c) 304de5397adSFenghua Yu { 305b2cc2a07SH. Peter Anvin if (cpu_has(c, X86_FEATURE_SMEP)) 306375074ccSAndy Lutomirski cr4_set_bits(X86_CR4_SMEP); 307de5397adSFenghua Yu } 308de5397adSFenghua Yu 30952b6179aSH. Peter Anvin static __init int setup_disable_smap(char *arg) 31052b6179aSH. Peter Anvin { 311b2cc2a07SH. Peter Anvin setup_clear_cpu_cap(X86_FEATURE_SMAP); 31252b6179aSH. Peter Anvin return 1; 31352b6179aSH. Peter Anvin } 31452b6179aSH. Peter Anvin __setup("nosmap", setup_disable_smap); 31552b6179aSH. Peter Anvin 316b2cc2a07SH. Peter Anvin static __always_inline void setup_smap(struct cpuinfo_x86 *c) 31752b6179aSH. Peter Anvin { 318581b7f15SAndrew Cooper unsigned long eflags = native_save_fl(); 319b2cc2a07SH. Peter Anvin 320b2cc2a07SH. Peter Anvin /* This should have been cleared long ago */ 321b2cc2a07SH. Peter Anvin BUG_ON(eflags & X86_EFLAGS_AC); 322b2cc2a07SH. Peter Anvin 32303bbd596SH. Peter Anvin if (cpu_has(c, X86_FEATURE_SMAP)) { 32403bbd596SH. Peter Anvin #ifdef CONFIG_X86_SMAP 325375074ccSAndy Lutomirski cr4_set_bits(X86_CR4_SMAP); 32603bbd596SH. Peter Anvin #else 327375074ccSAndy Lutomirski cr4_clear_bits(X86_CR4_SMAP); 32803bbd596SH. Peter Anvin #endif 32903bbd596SH. Peter Anvin } 330f7627e25SThomas Gleixner } 331f7627e25SThomas Gleixner 332f7627e25SThomas Gleixner /* 33306976945SDave Hansen * Protection Keys are not available in 32-bit mode. 33406976945SDave Hansen */ 33506976945SDave Hansen static bool pku_disabled; 33606976945SDave Hansen 33706976945SDave Hansen static __always_inline void setup_pku(struct cpuinfo_x86 *c) 33806976945SDave Hansen { 339e8df1a95SDave Hansen /* check the boot processor, plus compile options for PKU: */ 340e8df1a95SDave Hansen if (!cpu_feature_enabled(X86_FEATURE_PKU)) 341e8df1a95SDave Hansen return; 342e8df1a95SDave Hansen /* checks the actual processor's cpuid bits: */ 34306976945SDave Hansen if (!cpu_has(c, X86_FEATURE_PKU)) 34406976945SDave Hansen return; 34506976945SDave Hansen if (pku_disabled) 34606976945SDave Hansen return; 34706976945SDave Hansen 34806976945SDave Hansen cr4_set_bits(X86_CR4_PKE); 34906976945SDave Hansen /* 35006976945SDave Hansen * Seting X86_CR4_PKE will cause the X86_FEATURE_OSPKE 35106976945SDave Hansen * cpuid bit to be set. We need to ensure that we 35206976945SDave Hansen * update that bit in this CPU's "cpu_info". 35306976945SDave Hansen */ 35406976945SDave Hansen get_cpu_cap(c); 35506976945SDave Hansen } 35606976945SDave Hansen 35706976945SDave Hansen #ifdef CONFIG_X86_INTEL_MEMORY_PROTECTION_KEYS 35806976945SDave Hansen static __init int setup_disable_pku(char *arg) 35906976945SDave Hansen { 36006976945SDave Hansen /* 36106976945SDave Hansen * Do not clear the X86_FEATURE_PKU bit. All of the 36206976945SDave Hansen * runtime checks are against OSPKE so clearing the 36306976945SDave Hansen * bit does nothing. 36406976945SDave Hansen * 36506976945SDave Hansen * This way, we will see "pku" in cpuinfo, but not 36606976945SDave Hansen * "ospke", which is exactly what we want. It shows 36706976945SDave Hansen * that the CPU has PKU, but the OS has not enabled it. 36806976945SDave Hansen * This happens to be exactly how a system would look 36906976945SDave Hansen * if we disabled the config option. 37006976945SDave Hansen */ 37106976945SDave Hansen pr_info("x86: 'nopku' specified, disabling Memory Protection Keys\n"); 37206976945SDave Hansen pku_disabled = true; 37306976945SDave Hansen return 1; 37406976945SDave Hansen } 37506976945SDave Hansen __setup("nopku", setup_disable_pku); 37606976945SDave Hansen #endif /* CONFIG_X86_64 */ 37706976945SDave Hansen 37806976945SDave Hansen /* 379b38b0665SH. Peter Anvin * Some CPU features depend on higher CPUID levels, which may not always 380b38b0665SH. Peter Anvin * be available due to CPUID level capping or broken virtualization 381b38b0665SH. Peter Anvin * software. Add those features to this table to auto-disable them. 382b38b0665SH. Peter Anvin */ 383b38b0665SH. Peter Anvin struct cpuid_dependent_feature { 384b38b0665SH. Peter Anvin u32 feature; 385b38b0665SH. Peter Anvin u32 level; 386b38b0665SH. Peter Anvin }; 3870f3fa48aSIngo Molnar 388148f9bb8SPaul Gortmaker static const struct cpuid_dependent_feature 389b38b0665SH. Peter Anvin cpuid_dependent_features[] = { 390b38b0665SH. Peter Anvin { X86_FEATURE_MWAIT, 0x00000005 }, 391b38b0665SH. Peter Anvin { X86_FEATURE_DCA, 0x00000009 }, 392b38b0665SH. Peter Anvin { X86_FEATURE_XSAVE, 0x0000000d }, 393b38b0665SH. Peter Anvin { 0, 0 } 394b38b0665SH. Peter Anvin }; 395b38b0665SH. Peter Anvin 396148f9bb8SPaul Gortmaker static void filter_cpuid_features(struct cpuinfo_x86 *c, bool warn) 397b38b0665SH. Peter Anvin { 398b38b0665SH. Peter Anvin const struct cpuid_dependent_feature *df; 3999766cdbcSJaswinder Singh Rajput 400b38b0665SH. Peter Anvin for (df = cpuid_dependent_features; df->feature; df++) { 4010f3fa48aSIngo Molnar 4020f3fa48aSIngo Molnar if (!cpu_has(c, df->feature)) 4030f3fa48aSIngo Molnar continue; 404b38b0665SH. Peter Anvin /* 405b38b0665SH. Peter Anvin * Note: cpuid_level is set to -1 if unavailable, but 406b38b0665SH. Peter Anvin * extended_extended_level is set to 0 if unavailable 407b38b0665SH. Peter Anvin * and the legitimate extended levels are all negative 408b38b0665SH. Peter Anvin * when signed; hence the weird messing around with 409b38b0665SH. Peter Anvin * signs here... 410b38b0665SH. Peter Anvin */ 4110f3fa48aSIngo Molnar if (!((s32)df->level < 0 ? 412f6db44dfSYinghai Lu (u32)df->level > (u32)c->extended_cpuid_level : 4130f3fa48aSIngo Molnar (s32)df->level > (s32)c->cpuid_level)) 4140f3fa48aSIngo Molnar continue; 4150f3fa48aSIngo Molnar 416b38b0665SH. Peter Anvin clear_cpu_cap(c, df->feature); 4170f3fa48aSIngo Molnar if (!warn) 4180f3fa48aSIngo Molnar continue; 4190f3fa48aSIngo Molnar 4201b74dde7SChen Yucong pr_warn("CPU: CPU feature " X86_CAP_FMT " disabled, no CPUID level 0x%x\n", 4219def39beSJosh Triplett x86_cap_flag(df->feature), df->level); 422b38b0665SH. Peter Anvin } 423b38b0665SH. Peter Anvin } 424b38b0665SH. Peter Anvin 425b38b0665SH. Peter Anvin /* 426f7627e25SThomas Gleixner * Naming convention should be: <Name> [(<Codename>)] 427f7627e25SThomas Gleixner * This table only is used unless init_<vendor>() below doesn't set it; 4280f3fa48aSIngo Molnar * in particular, if CPUID levels 0x80000002..4 are supported, this 4290f3fa48aSIngo Molnar * isn't used 430f7627e25SThomas Gleixner */ 431f7627e25SThomas Gleixner 432f7627e25SThomas Gleixner /* Look up CPU names by table lookup. */ 433148f9bb8SPaul Gortmaker static const char *table_lookup_model(struct cpuinfo_x86 *c) 434f7627e25SThomas Gleixner { 43509dc68d9SJan Beulich #ifdef CONFIG_X86_32 43609dc68d9SJan Beulich const struct legacy_cpu_model_info *info; 437f7627e25SThomas Gleixner 438f7627e25SThomas Gleixner if (c->x86_model >= 16) 439f7627e25SThomas Gleixner return NULL; /* Range check */ 440f7627e25SThomas Gleixner 441f7627e25SThomas Gleixner if (!this_cpu) 442f7627e25SThomas Gleixner return NULL; 443f7627e25SThomas Gleixner 44409dc68d9SJan Beulich info = this_cpu->legacy_models; 445f7627e25SThomas Gleixner 44609dc68d9SJan Beulich while (info->family) { 447f7627e25SThomas Gleixner if (info->family == c->x86) 448f7627e25SThomas Gleixner return info->model_names[c->x86_model]; 449f7627e25SThomas Gleixner info++; 450f7627e25SThomas Gleixner } 45109dc68d9SJan Beulich #endif 452f7627e25SThomas Gleixner return NULL; /* Not found */ 453f7627e25SThomas Gleixner } 454f7627e25SThomas Gleixner 455148f9bb8SPaul Gortmaker __u32 cpu_caps_cleared[NCAPINTS]; 456148f9bb8SPaul Gortmaker __u32 cpu_caps_set[NCAPINTS]; 457f7627e25SThomas Gleixner 45811e3a840SJeremy Fitzhardinge void load_percpu_segment(int cpu) 4599d31d35bSYinghai Lu { 460fab334c1SYinghai Lu #ifdef CONFIG_X86_32 4612697fbd5SBrian Gerst loadsegment(fs, __KERNEL_PERCPU); 4622697fbd5SBrian Gerst #else 46345e876f7SAndy Lutomirski __loadsegment_simple(gs, 0); 4642697fbd5SBrian Gerst wrmsrl(MSR_GS_BASE, (unsigned long)per_cpu(irq_stack_union.gs_base, cpu)); 465fab334c1SYinghai Lu #endif 46660a5317fSTejun Heo load_stack_canary_segment(); 4679d31d35bSYinghai Lu } 4689d31d35bSYinghai Lu 469*ef8813abSAndy Lutomirski /* Setup the fixmap mappings only once per-processor */ 470*ef8813abSAndy Lutomirski static inline void setup_cpu_entry_area(int cpu) 47169218e47SThomas Garnier { 472b23adb7dSAndy Lutomirski #ifdef CONFIG_X86_64 473b23adb7dSAndy Lutomirski /* On 64-bit systems, we use a read-only fixmap GDT. */ 474*ef8813abSAndy Lutomirski pgprot_t gdt_prot = PAGE_KERNEL_RO; 475b23adb7dSAndy Lutomirski #else 476b23adb7dSAndy Lutomirski /* 477b23adb7dSAndy Lutomirski * On native 32-bit systems, the GDT cannot be read-only because 478b23adb7dSAndy Lutomirski * our double fault handler uses a task gate, and entering through 479b23adb7dSAndy Lutomirski * a task gate needs to change an available TSS to busy. If the GDT 480b23adb7dSAndy Lutomirski * is read-only, that will triple fault. 481b23adb7dSAndy Lutomirski * 482b23adb7dSAndy Lutomirski * On Xen PV, the GDT must be read-only because the hypervisor requires 483b23adb7dSAndy Lutomirski * it. 484b23adb7dSAndy Lutomirski */ 485*ef8813abSAndy Lutomirski pgprot_t gdt_prot = boot_cpu_has(X86_FEATURE_XENPV) ? 486b23adb7dSAndy Lutomirski PAGE_KERNEL_RO : PAGE_KERNEL; 487b23adb7dSAndy Lutomirski #endif 488b23adb7dSAndy Lutomirski 489*ef8813abSAndy Lutomirski __set_fixmap(get_cpu_entry_area_index(cpu, gdt), get_cpu_gdt_paddr(cpu), gdt_prot); 49069218e47SThomas Garnier } 49169218e47SThomas Garnier 49245fc8757SThomas Garnier /* Load the original GDT from the per-cpu structure */ 49345fc8757SThomas Garnier void load_direct_gdt(int cpu) 49445fc8757SThomas Garnier { 49545fc8757SThomas Garnier struct desc_ptr gdt_descr; 49645fc8757SThomas Garnier 49745fc8757SThomas Garnier gdt_descr.address = (long)get_cpu_gdt_rw(cpu); 49845fc8757SThomas Garnier gdt_descr.size = GDT_SIZE - 1; 49945fc8757SThomas Garnier load_gdt(&gdt_descr); 50045fc8757SThomas Garnier } 50145fc8757SThomas Garnier EXPORT_SYMBOL_GPL(load_direct_gdt); 50245fc8757SThomas Garnier 50369218e47SThomas Garnier /* Load a fixmap remapping of the per-cpu GDT */ 50469218e47SThomas Garnier void load_fixmap_gdt(int cpu) 50569218e47SThomas Garnier { 50669218e47SThomas Garnier struct desc_ptr gdt_descr; 50769218e47SThomas Garnier 50869218e47SThomas Garnier gdt_descr.address = (long)get_cpu_gdt_ro(cpu); 50969218e47SThomas Garnier gdt_descr.size = GDT_SIZE - 1; 51069218e47SThomas Garnier load_gdt(&gdt_descr); 51169218e47SThomas Garnier } 51245fc8757SThomas Garnier EXPORT_SYMBOL_GPL(load_fixmap_gdt); 51369218e47SThomas Garnier 5140f3fa48aSIngo Molnar /* 5150f3fa48aSIngo Molnar * Current gdt points %fs at the "master" per-cpu area: after this, 5160f3fa48aSIngo Molnar * it's on the real one. 5170f3fa48aSIngo Molnar */ 518552be871SBrian Gerst void switch_to_new_gdt(int cpu) 519f7627e25SThomas Gleixner { 52045fc8757SThomas Garnier /* Load the original GDT */ 52145fc8757SThomas Garnier load_direct_gdt(cpu); 522f7627e25SThomas Gleixner /* Reload the per-cpu base */ 52311e3a840SJeremy Fitzhardinge load_percpu_segment(cpu); 524f7627e25SThomas Gleixner } 525f7627e25SThomas Gleixner 526148f9bb8SPaul Gortmaker static const struct cpu_dev *cpu_devs[X86_VENDOR_NUM] = {}; 527f7627e25SThomas Gleixner 528148f9bb8SPaul Gortmaker static void get_model_name(struct cpuinfo_x86 *c) 529f7627e25SThomas Gleixner { 530f7627e25SThomas Gleixner unsigned int *v; 531ee098e1aSBorislav Petkov char *p, *q, *s; 532f7627e25SThomas Gleixner 5333da99c97SYinghai Lu if (c->extended_cpuid_level < 0x80000004) 5341b05d60dSYinghai Lu return; 535f7627e25SThomas Gleixner 536f7627e25SThomas Gleixner v = (unsigned int *)c->x86_model_id; 537f7627e25SThomas Gleixner cpuid(0x80000002, &v[0], &v[1], &v[2], &v[3]); 538f7627e25SThomas Gleixner cpuid(0x80000003, &v[4], &v[5], &v[6], &v[7]); 539f7627e25SThomas Gleixner cpuid(0x80000004, &v[8], &v[9], &v[10], &v[11]); 540f7627e25SThomas Gleixner c->x86_model_id[48] = 0; 541f7627e25SThomas Gleixner 542ee098e1aSBorislav Petkov /* Trim whitespace */ 543ee098e1aSBorislav Petkov p = q = s = &c->x86_model_id[0]; 544ee098e1aSBorislav Petkov 545ee098e1aSBorislav Petkov while (*p == ' ') 546ee098e1aSBorislav Petkov p++; 547ee098e1aSBorislav Petkov 548ee098e1aSBorislav Petkov while (*p) { 549ee098e1aSBorislav Petkov /* Note the last non-whitespace index */ 550ee098e1aSBorislav Petkov if (!isspace(*p)) 551ee098e1aSBorislav Petkov s = q; 552ee098e1aSBorislav Petkov 553ee098e1aSBorislav Petkov *q++ = *p++; 554ee098e1aSBorislav Petkov } 555ee098e1aSBorislav Petkov 556ee098e1aSBorislav Petkov *(s + 1) = '\0'; 557f7627e25SThomas Gleixner } 558f7627e25SThomas Gleixner 559148f9bb8SPaul Gortmaker void cpu_detect_cache_sizes(struct cpuinfo_x86 *c) 560f7627e25SThomas Gleixner { 5619d31d35bSYinghai Lu unsigned int n, dummy, ebx, ecx, edx, l2size; 562f7627e25SThomas Gleixner 5633da99c97SYinghai Lu n = c->extended_cpuid_level; 564f7627e25SThomas Gleixner 565f7627e25SThomas Gleixner if (n >= 0x80000005) { 5669d31d35bSYinghai Lu cpuid(0x80000005, &dummy, &ebx, &ecx, &edx); 567f7627e25SThomas Gleixner c->x86_cache_size = (ecx>>24) + (edx>>24); 568140fc727SYinghai Lu #ifdef CONFIG_X86_64 569140fc727SYinghai Lu /* On K8 L1 TLB is inclusive, so don't count it */ 570140fc727SYinghai Lu c->x86_tlbsize = 0; 571140fc727SYinghai Lu #endif 572f7627e25SThomas Gleixner } 573f7627e25SThomas Gleixner 574f7627e25SThomas Gleixner if (n < 0x80000006) /* Some chips just has a large L1. */ 575f7627e25SThomas Gleixner return; 576f7627e25SThomas Gleixner 5770a488a53SYinghai Lu cpuid(0x80000006, &dummy, &ebx, &ecx, &edx); 578f7627e25SThomas Gleixner l2size = ecx >> 16; 579f7627e25SThomas Gleixner 580140fc727SYinghai Lu #ifdef CONFIG_X86_64 581140fc727SYinghai Lu c->x86_tlbsize += ((ebx >> 16) & 0xfff) + (ebx & 0xfff); 582140fc727SYinghai Lu #else 583f7627e25SThomas Gleixner /* do processor-specific cache resizing */ 58409dc68d9SJan Beulich if (this_cpu->legacy_cache_size) 58509dc68d9SJan Beulich l2size = this_cpu->legacy_cache_size(c, l2size); 586f7627e25SThomas Gleixner 587f7627e25SThomas Gleixner /* Allow user to override all this if necessary. */ 588f7627e25SThomas Gleixner if (cachesize_override != -1) 589f7627e25SThomas Gleixner l2size = cachesize_override; 590f7627e25SThomas Gleixner 591f7627e25SThomas Gleixner if (l2size == 0) 592f7627e25SThomas Gleixner return; /* Again, no L2 cache is possible */ 593140fc727SYinghai Lu #endif 594f7627e25SThomas Gleixner 595f7627e25SThomas Gleixner c->x86_cache_size = l2size; 596f7627e25SThomas Gleixner } 597f7627e25SThomas Gleixner 598e0ba94f1SAlex Shi u16 __read_mostly tlb_lli_4k[NR_INFO]; 599e0ba94f1SAlex Shi u16 __read_mostly tlb_lli_2m[NR_INFO]; 600e0ba94f1SAlex Shi u16 __read_mostly tlb_lli_4m[NR_INFO]; 601e0ba94f1SAlex Shi u16 __read_mostly tlb_lld_4k[NR_INFO]; 602e0ba94f1SAlex Shi u16 __read_mostly tlb_lld_2m[NR_INFO]; 603e0ba94f1SAlex Shi u16 __read_mostly tlb_lld_4m[NR_INFO]; 604dd360393SKirill A. Shutemov u16 __read_mostly tlb_lld_1g[NR_INFO]; 605e0ba94f1SAlex Shi 606f94fe119SSteven Honeyman static void cpu_detect_tlb(struct cpuinfo_x86 *c) 607e0ba94f1SAlex Shi { 608e0ba94f1SAlex Shi if (this_cpu->c_detect_tlb) 609e0ba94f1SAlex Shi this_cpu->c_detect_tlb(c); 610e0ba94f1SAlex Shi 611f94fe119SSteven Honeyman pr_info("Last level iTLB entries: 4KB %d, 2MB %d, 4MB %d\n", 612e0ba94f1SAlex Shi tlb_lli_4k[ENTRIES], tlb_lli_2m[ENTRIES], 613f94fe119SSteven Honeyman tlb_lli_4m[ENTRIES]); 614f94fe119SSteven Honeyman 615f94fe119SSteven Honeyman pr_info("Last level dTLB entries: 4KB %d, 2MB %d, 4MB %d, 1GB %d\n", 616f94fe119SSteven Honeyman tlb_lld_4k[ENTRIES], tlb_lld_2m[ENTRIES], 617f94fe119SSteven Honeyman tlb_lld_4m[ENTRIES], tlb_lld_1g[ENTRIES]); 618e0ba94f1SAlex Shi } 619e0ba94f1SAlex Shi 620148f9bb8SPaul Gortmaker void detect_ht(struct cpuinfo_x86 *c) 6219d31d35bSYinghai Lu { 622c8e56d20SBorislav Petkov #ifdef CONFIG_SMP 6239d31d35bSYinghai Lu u32 eax, ebx, ecx, edx; 6249d31d35bSYinghai Lu int index_msb, core_bits; 6252eaad1fdSMike Travis static bool printed; 6269d31d35bSYinghai Lu 6270a488a53SYinghai Lu if (!cpu_has(c, X86_FEATURE_HT)) 6289d31d35bSYinghai Lu return; 6299d31d35bSYinghai Lu 6300a488a53SYinghai Lu if (cpu_has(c, X86_FEATURE_CMP_LEGACY)) 6310a488a53SYinghai Lu goto out; 6320a488a53SYinghai Lu 6331cd78776SYinghai Lu if (cpu_has(c, X86_FEATURE_XTOPOLOGY)) 6341cd78776SYinghai Lu return; 6351cd78776SYinghai Lu 6360a488a53SYinghai Lu cpuid(1, &eax, &ebx, &ecx, &edx); 6370a488a53SYinghai Lu 6389d31d35bSYinghai Lu smp_num_siblings = (ebx & 0xff0000) >> 16; 6399d31d35bSYinghai Lu 6409d31d35bSYinghai Lu if (smp_num_siblings == 1) { 6411b74dde7SChen Yucong pr_info_once("CPU0: Hyper-Threading is disabled\n"); 6420f3fa48aSIngo Molnar goto out; 6430f3fa48aSIngo Molnar } 6440f3fa48aSIngo Molnar 6450f3fa48aSIngo Molnar if (smp_num_siblings <= 1) 6460f3fa48aSIngo Molnar goto out; 6479d31d35bSYinghai Lu 6489d31d35bSYinghai Lu index_msb = get_count_order(smp_num_siblings); 649cb8cc442SIngo Molnar c->phys_proc_id = apic->phys_pkg_id(c->initial_apicid, index_msb); 6509d31d35bSYinghai Lu 6519d31d35bSYinghai Lu smp_num_siblings = smp_num_siblings / c->x86_max_cores; 6529d31d35bSYinghai Lu 6539d31d35bSYinghai Lu index_msb = get_count_order(smp_num_siblings); 6549d31d35bSYinghai Lu 6559d31d35bSYinghai Lu core_bits = get_count_order(c->x86_max_cores); 6569d31d35bSYinghai Lu 657cb8cc442SIngo Molnar c->cpu_core_id = apic->phys_pkg_id(c->initial_apicid, index_msb) & 6581cd78776SYinghai Lu ((1 << core_bits) - 1); 6599d31d35bSYinghai Lu 6600a488a53SYinghai Lu out: 6612eaad1fdSMike Travis if (!printed && (c->x86_max_cores * smp_num_siblings) > 1) { 6621b74dde7SChen Yucong pr_info("CPU: Physical Processor ID: %d\n", 6630a488a53SYinghai Lu c->phys_proc_id); 6641b74dde7SChen Yucong pr_info("CPU: Processor Core ID: %d\n", 6659d31d35bSYinghai Lu c->cpu_core_id); 6662eaad1fdSMike Travis printed = 1; 6679d31d35bSYinghai Lu } 6689d31d35bSYinghai Lu #endif 66997e4db7cSYinghai Lu } 670f7627e25SThomas Gleixner 671148f9bb8SPaul Gortmaker static void get_cpu_vendor(struct cpuinfo_x86 *c) 672f7627e25SThomas Gleixner { 673f7627e25SThomas Gleixner char *v = c->x86_vendor_id; 6740f3fa48aSIngo Molnar int i; 675f7627e25SThomas Gleixner 676f7627e25SThomas Gleixner for (i = 0; i < X86_VENDOR_NUM; i++) { 67710a434fcSYinghai Lu if (!cpu_devs[i]) 67810a434fcSYinghai Lu break; 67910a434fcSYinghai Lu 680f7627e25SThomas Gleixner if (!strcmp(v, cpu_devs[i]->c_ident[0]) || 681f7627e25SThomas Gleixner (cpu_devs[i]->c_ident[1] && 682f7627e25SThomas Gleixner !strcmp(v, cpu_devs[i]->c_ident[1]))) { 6830f3fa48aSIngo Molnar 684f7627e25SThomas Gleixner this_cpu = cpu_devs[i]; 68510a434fcSYinghai Lu c->x86_vendor = this_cpu->c_x86_vendor; 686f7627e25SThomas Gleixner return; 687f7627e25SThomas Gleixner } 688f7627e25SThomas Gleixner } 68910a434fcSYinghai Lu 6901b74dde7SChen Yucong pr_err_once("CPU: vendor_id '%s' unknown, using generic init.\n" \ 691a9c56953SMinchan Kim "CPU: Your system may be unstable.\n", v); 69210a434fcSYinghai Lu 693f7627e25SThomas Gleixner c->x86_vendor = X86_VENDOR_UNKNOWN; 694f7627e25SThomas Gleixner this_cpu = &default_cpu; 695f7627e25SThomas Gleixner } 696f7627e25SThomas Gleixner 697148f9bb8SPaul Gortmaker void cpu_detect(struct cpuinfo_x86 *c) 698f7627e25SThomas Gleixner { 699f7627e25SThomas Gleixner /* Get vendor name */ 7004a148513SHarvey Harrison cpuid(0x00000000, (unsigned int *)&c->cpuid_level, 7014a148513SHarvey Harrison (unsigned int *)&c->x86_vendor_id[0], 7024a148513SHarvey Harrison (unsigned int *)&c->x86_vendor_id[8], 7034a148513SHarvey Harrison (unsigned int *)&c->x86_vendor_id[4]); 704f7627e25SThomas Gleixner 705f7627e25SThomas Gleixner c->x86 = 4; 7069d31d35bSYinghai Lu /* Intel-defined flags: level 0x00000001 */ 707f7627e25SThomas Gleixner if (c->cpuid_level >= 0x00000001) { 708f7627e25SThomas Gleixner u32 junk, tfms, cap0, misc; 7090f3fa48aSIngo Molnar 710f7627e25SThomas Gleixner cpuid(0x00000001, &tfms, &misc, &junk, &cap0); 71199f925ceSBorislav Petkov c->x86 = x86_family(tfms); 71299f925ceSBorislav Petkov c->x86_model = x86_model(tfms); 71399f925ceSBorislav Petkov c->x86_mask = x86_stepping(tfms); 7140f3fa48aSIngo Molnar 715d4387bd3SHuang, Ying if (cap0 & (1<<19)) { 716d4387bd3SHuang, Ying c->x86_clflush_size = ((misc >> 8) & 0xff) * 8; 7179d31d35bSYinghai Lu c->x86_cache_alignment = c->x86_clflush_size; 718d4387bd3SHuang, Ying } 719f7627e25SThomas Gleixner } 720f7627e25SThomas Gleixner } 7213da99c97SYinghai Lu 7228bf1ebcaSAndy Lutomirski static void apply_forced_caps(struct cpuinfo_x86 *c) 7238bf1ebcaSAndy Lutomirski { 7248bf1ebcaSAndy Lutomirski int i; 7258bf1ebcaSAndy Lutomirski 7268bf1ebcaSAndy Lutomirski for (i = 0; i < NCAPINTS; i++) { 7278bf1ebcaSAndy Lutomirski c->x86_capability[i] &= ~cpu_caps_cleared[i]; 7288bf1ebcaSAndy Lutomirski c->x86_capability[i] |= cpu_caps_set[i]; 7298bf1ebcaSAndy Lutomirski } 7308bf1ebcaSAndy Lutomirski } 7318bf1ebcaSAndy Lutomirski 732148f9bb8SPaul Gortmaker void get_cpu_cap(struct cpuinfo_x86 *c) 733093af8d7SYinghai Lu { 73439c06df4SBorislav Petkov u32 eax, ebx, ecx, edx; 735093af8d7SYinghai Lu 736093af8d7SYinghai Lu /* Intel-defined flags: level 0x00000001 */ 737093af8d7SYinghai Lu if (c->cpuid_level >= 0x00000001) { 73839c06df4SBorislav Petkov cpuid(0x00000001, &eax, &ebx, &ecx, &edx); 7390f3fa48aSIngo Molnar 74039c06df4SBorislav Petkov c->x86_capability[CPUID_1_ECX] = ecx; 74139c06df4SBorislav Petkov c->x86_capability[CPUID_1_EDX] = edx; 742093af8d7SYinghai Lu } 743093af8d7SYinghai Lu 7443df8d920SAndy Lutomirski /* Thermal and Power Management Leaf: level 0x00000006 (eax) */ 7453df8d920SAndy Lutomirski if (c->cpuid_level >= 0x00000006) 7463df8d920SAndy Lutomirski c->x86_capability[CPUID_6_EAX] = cpuid_eax(0x00000006); 7473df8d920SAndy Lutomirski 748bdc802dcSH. Peter Anvin /* Additional Intel-defined flags: level 0x00000007 */ 749bdc802dcSH. Peter Anvin if (c->cpuid_level >= 0x00000007) { 750bdc802dcSH. Peter Anvin cpuid_count(0x00000007, 0, &eax, &ebx, &ecx, &edx); 75139c06df4SBorislav Petkov c->x86_capability[CPUID_7_0_EBX] = ebx; 752dfb4a70fSDave Hansen c->x86_capability[CPUID_7_ECX] = ecx; 753bdc802dcSH. Peter Anvin } 754bdc802dcSH. Peter Anvin 7556229ad27SFenghua Yu /* Extended state features: level 0x0000000d */ 7566229ad27SFenghua Yu if (c->cpuid_level >= 0x0000000d) { 7576229ad27SFenghua Yu cpuid_count(0x0000000d, 1, &eax, &ebx, &ecx, &edx); 7586229ad27SFenghua Yu 75939c06df4SBorislav Petkov c->x86_capability[CPUID_D_1_EAX] = eax; 7606229ad27SFenghua Yu } 7616229ad27SFenghua Yu 762cbc82b17SPeter P Waskiewicz Jr /* Additional Intel-defined flags: level 0x0000000F */ 763cbc82b17SPeter P Waskiewicz Jr if (c->cpuid_level >= 0x0000000F) { 764cbc82b17SPeter P Waskiewicz Jr 765cbc82b17SPeter P Waskiewicz Jr /* QoS sub-leaf, EAX=0Fh, ECX=0 */ 766cbc82b17SPeter P Waskiewicz Jr cpuid_count(0x0000000F, 0, &eax, &ebx, &ecx, &edx); 76739c06df4SBorislav Petkov c->x86_capability[CPUID_F_0_EDX] = edx; 76839c06df4SBorislav Petkov 769cbc82b17SPeter P Waskiewicz Jr if (cpu_has(c, X86_FEATURE_CQM_LLC)) { 770cbc82b17SPeter P Waskiewicz Jr /* will be overridden if occupancy monitoring exists */ 771cbc82b17SPeter P Waskiewicz Jr c->x86_cache_max_rmid = ebx; 772cbc82b17SPeter P Waskiewicz Jr 773cbc82b17SPeter P Waskiewicz Jr /* QoS sub-leaf, EAX=0Fh, ECX=1 */ 774cbc82b17SPeter P Waskiewicz Jr cpuid_count(0x0000000F, 1, &eax, &ebx, &ecx, &edx); 77539c06df4SBorislav Petkov c->x86_capability[CPUID_F_1_EDX] = edx; 77639c06df4SBorislav Petkov 77733c3cc7aSVikas Shivappa if ((cpu_has(c, X86_FEATURE_CQM_OCCUP_LLC)) || 77833c3cc7aSVikas Shivappa ((cpu_has(c, X86_FEATURE_CQM_MBM_TOTAL)) || 77933c3cc7aSVikas Shivappa (cpu_has(c, X86_FEATURE_CQM_MBM_LOCAL)))) { 780cbc82b17SPeter P Waskiewicz Jr c->x86_cache_max_rmid = ecx; 781cbc82b17SPeter P Waskiewicz Jr c->x86_cache_occ_scale = ebx; 782cbc82b17SPeter P Waskiewicz Jr } 783cbc82b17SPeter P Waskiewicz Jr } else { 784cbc82b17SPeter P Waskiewicz Jr c->x86_cache_max_rmid = -1; 785cbc82b17SPeter P Waskiewicz Jr c->x86_cache_occ_scale = -1; 786cbc82b17SPeter P Waskiewicz Jr } 787cbc82b17SPeter P Waskiewicz Jr } 788cbc82b17SPeter P Waskiewicz Jr 789093af8d7SYinghai Lu /* AMD-defined flags: level 0x80000001 */ 79039c06df4SBorislav Petkov eax = cpuid_eax(0x80000000); 79139c06df4SBorislav Petkov c->extended_cpuid_level = eax; 7920f3fa48aSIngo Molnar 79339c06df4SBorislav Petkov if ((eax & 0xffff0000) == 0x80000000) { 79439c06df4SBorislav Petkov if (eax >= 0x80000001) { 79539c06df4SBorislav Petkov cpuid(0x80000001, &eax, &ebx, &ecx, &edx); 79639c06df4SBorislav Petkov 79739c06df4SBorislav Petkov c->x86_capability[CPUID_8000_0001_ECX] = ecx; 79839c06df4SBorislav Petkov c->x86_capability[CPUID_8000_0001_EDX] = edx; 799093af8d7SYinghai Lu } 800093af8d7SYinghai Lu } 801093af8d7SYinghai Lu 80271faad43SYazen Ghannam if (c->extended_cpuid_level >= 0x80000007) { 80371faad43SYazen Ghannam cpuid(0x80000007, &eax, &ebx, &ecx, &edx); 80471faad43SYazen Ghannam 80571faad43SYazen Ghannam c->x86_capability[CPUID_8000_0007_EBX] = ebx; 80671faad43SYazen Ghannam c->x86_power = edx; 80771faad43SYazen Ghannam } 80871faad43SYazen Ghannam 8095122c890SYinghai Lu if (c->extended_cpuid_level >= 0x80000008) { 81039c06df4SBorislav Petkov cpuid(0x80000008, &eax, &ebx, &ecx, &edx); 8115122c890SYinghai Lu 8125122c890SYinghai Lu c->x86_virt_bits = (eax >> 8) & 0xff; 8135122c890SYinghai Lu c->x86_phys_bits = eax & 0xff; 81439c06df4SBorislav Petkov c->x86_capability[CPUID_8000_0008_EBX] = ebx; 8155122c890SYinghai Lu } 81613c6c532SJan Beulich #ifdef CONFIG_X86_32 81713c6c532SJan Beulich else if (cpu_has(c, X86_FEATURE_PAE) || cpu_has(c, X86_FEATURE_PSE36)) 81813c6c532SJan Beulich c->x86_phys_bits = 36; 8195122c890SYinghai Lu #endif 820e3224234SYinghai Lu 8212ccd71f1SBorislav Petkov if (c->extended_cpuid_level >= 0x8000000a) 82239c06df4SBorislav Petkov c->x86_capability[CPUID_8000_000A_EDX] = cpuid_edx(0x8000000a); 8232ccd71f1SBorislav Petkov 8241dedefd1SJacob Pan init_scattered_cpuid_features(c); 82560d34501SAndy Lutomirski 82660d34501SAndy Lutomirski /* 82760d34501SAndy Lutomirski * Clear/Set all flags overridden by options, after probe. 82860d34501SAndy Lutomirski * This needs to happen each time we re-probe, which may happen 82960d34501SAndy Lutomirski * several times during CPU initialization. 83060d34501SAndy Lutomirski */ 83160d34501SAndy Lutomirski apply_forced_caps(c); 832093af8d7SYinghai Lu } 833093af8d7SYinghai Lu 834148f9bb8SPaul Gortmaker static void identify_cpu_without_cpuid(struct cpuinfo_x86 *c) 835aef93c8bSYinghai Lu { 836aef93c8bSYinghai Lu #ifdef CONFIG_X86_32 837aef93c8bSYinghai Lu int i; 838aef93c8bSYinghai Lu 839aef93c8bSYinghai Lu /* 840aef93c8bSYinghai Lu * First of all, decide if this is a 486 or higher 841aef93c8bSYinghai Lu * It's a 486 if we can modify the AC flag 842aef93c8bSYinghai Lu */ 843aef93c8bSYinghai Lu if (flag_is_changeable_p(X86_EFLAGS_AC)) 844aef93c8bSYinghai Lu c->x86 = 4; 845aef93c8bSYinghai Lu else 846aef93c8bSYinghai Lu c->x86 = 3; 847aef93c8bSYinghai Lu 848aef93c8bSYinghai Lu for (i = 0; i < X86_VENDOR_NUM; i++) 849aef93c8bSYinghai Lu if (cpu_devs[i] && cpu_devs[i]->c_identify) { 850aef93c8bSYinghai Lu c->x86_vendor_id[0] = 0; 851aef93c8bSYinghai Lu cpu_devs[i]->c_identify(c); 852aef93c8bSYinghai Lu if (c->x86_vendor_id[0]) { 853aef93c8bSYinghai Lu get_cpu_vendor(c); 854aef93c8bSYinghai Lu break; 855aef93c8bSYinghai Lu } 856aef93c8bSYinghai Lu } 857aef93c8bSYinghai Lu #endif 858093af8d7SYinghai Lu } 859f7627e25SThomas Gleixner 86034048c9eSPaolo Ciarrocchi /* 86134048c9eSPaolo Ciarrocchi * Do minimum CPU detection early. 86234048c9eSPaolo Ciarrocchi * Fields really needed: vendor, cpuid_level, family, model, mask, 86334048c9eSPaolo Ciarrocchi * cache alignment. 86434048c9eSPaolo Ciarrocchi * The others are not touched to avoid unwanted side effects. 86534048c9eSPaolo Ciarrocchi * 86634048c9eSPaolo Ciarrocchi * WARNING: this function is only called on the BP. Don't add code here 86734048c9eSPaolo Ciarrocchi * that is supposed to run on all CPUs. 86834048c9eSPaolo Ciarrocchi */ 8693da99c97SYinghai Lu static void __init early_identify_cpu(struct cpuinfo_x86 *c) 870f7627e25SThomas Gleixner { 8716627d242SYinghai Lu #ifdef CONFIG_X86_64 8726627d242SYinghai Lu c->x86_clflush_size = 64; 87313c6c532SJan Beulich c->x86_phys_bits = 36; 87413c6c532SJan Beulich c->x86_virt_bits = 48; 8756627d242SYinghai Lu #else 876d4387bd3SHuang, Ying c->x86_clflush_size = 32; 87713c6c532SJan Beulich c->x86_phys_bits = 32; 87813c6c532SJan Beulich c->x86_virt_bits = 32; 8796627d242SYinghai Lu #endif 8800a488a53SYinghai Lu c->x86_cache_alignment = c->x86_clflush_size; 881f7627e25SThomas Gleixner 8823da99c97SYinghai Lu memset(&c->x86_capability, 0, sizeof c->x86_capability); 8830a488a53SYinghai Lu c->extended_cpuid_level = 0; 8840a488a53SYinghai Lu 885aef93c8bSYinghai Lu /* cyrix could have cpuid enabled via c_identify()*/ 88605fb3c19SAndy Lutomirski if (have_cpuid_p()) { 887f7627e25SThomas Gleixner cpu_detect(c); 8883da99c97SYinghai Lu get_cpu_vendor(c); 8893da99c97SYinghai Lu get_cpu_cap(c); 89078d1b296SBorislav Petkov setup_force_cpu_cap(X86_FEATURE_CPUID); 89112cf105cSKrzysztof Helt 89210a434fcSYinghai Lu if (this_cpu->c_early_init) 89310a434fcSYinghai Lu this_cpu->c_early_init(c); 8943da99c97SYinghai Lu 895f6e9456cSRobert Richter c->cpu_index = 0; 896b38b0665SH. Peter Anvin filter_cpuid_features(c, false); 897de5397adSFenghua Yu 898a110b5ecSBorislav Petkov if (this_cpu->c_bsp_init) 899a110b5ecSBorislav Petkov this_cpu->c_bsp_init(c); 90078d1b296SBorislav Petkov } else { 90178d1b296SBorislav Petkov identify_cpu_without_cpuid(c); 90278d1b296SBorislav Petkov setup_clear_cpu_cap(X86_FEATURE_CPUID); 90305fb3c19SAndy Lutomirski } 904c3b83598SBorislav Petkov 905c3b83598SBorislav Petkov setup_force_cpu_cap(X86_FEATURE_ALWAYS); 906db52ef74SIngo Molnar fpu__init_system(c); 907b8b7abaeSAndy Lutomirski 908b8b7abaeSAndy Lutomirski #ifdef CONFIG_X86_32 909b8b7abaeSAndy Lutomirski /* 910b8b7abaeSAndy Lutomirski * Regardless of whether PCID is enumerated, the SDM says 911b8b7abaeSAndy Lutomirski * that it can't be enabled in 32-bit mode. 912b8b7abaeSAndy Lutomirski */ 913b8b7abaeSAndy Lutomirski setup_clear_cpu_cap(X86_FEATURE_PCID); 914b8b7abaeSAndy Lutomirski #endif 915f7627e25SThomas Gleixner } 916f7627e25SThomas Gleixner 9179d31d35bSYinghai Lu void __init early_cpu_init(void) 9189d31d35bSYinghai Lu { 91902dde8b4SJan Beulich const struct cpu_dev *const *cdev; 92010a434fcSYinghai Lu int count = 0; 9219d31d35bSYinghai Lu 922ac23f253SJan Beulich #ifdef CONFIG_PROCESSOR_SELECT 9231b74dde7SChen Yucong pr_info("KERNEL supported cpus:\n"); 92431c997caSIngo Molnar #endif 92531c997caSIngo Molnar 92610a434fcSYinghai Lu for (cdev = __x86_cpu_dev_start; cdev < __x86_cpu_dev_end; cdev++) { 92702dde8b4SJan Beulich const struct cpu_dev *cpudev = *cdev; 9289d31d35bSYinghai Lu 92910a434fcSYinghai Lu if (count >= X86_VENDOR_NUM) 93010a434fcSYinghai Lu break; 93110a434fcSYinghai Lu cpu_devs[count] = cpudev; 93210a434fcSYinghai Lu count++; 93310a434fcSYinghai Lu 934ac23f253SJan Beulich #ifdef CONFIG_PROCESSOR_SELECT 93531c997caSIngo Molnar { 93631c997caSIngo Molnar unsigned int j; 93731c997caSIngo Molnar 93810a434fcSYinghai Lu for (j = 0; j < 2; j++) { 93910a434fcSYinghai Lu if (!cpudev->c_ident[j]) 94010a434fcSYinghai Lu continue; 9411b74dde7SChen Yucong pr_info(" %s %s\n", cpudev->c_vendor, 94210a434fcSYinghai Lu cpudev->c_ident[j]); 94310a434fcSYinghai Lu } 94410a434fcSYinghai Lu } 9450388423dSDave Jones #endif 94631c997caSIngo Molnar } 9479d31d35bSYinghai Lu early_identify_cpu(&boot_cpu_data); 948f7627e25SThomas Gleixner } 949f7627e25SThomas Gleixner 950b6734c35SH. Peter Anvin /* 951366d4a43SBorislav Petkov * The NOPL instruction is supposed to exist on all CPUs of family >= 6; 952366d4a43SBorislav Petkov * unfortunately, that's not true in practice because of early VIA 953366d4a43SBorislav Petkov * chips and (more importantly) broken virtualizers that are not easy 954366d4a43SBorislav Petkov * to detect. In the latter case it doesn't even *fail* reliably, so 955366d4a43SBorislav Petkov * probing for it doesn't even work. Disable it completely on 32-bit 956ba0593bfSH. Peter Anvin * unless we can find a reliable way to detect all the broken cases. 957366d4a43SBorislav Petkov * Enable it explicitly on 64-bit for non-constant inputs of cpu_has(). 958b6734c35SH. Peter Anvin */ 959148f9bb8SPaul Gortmaker static void detect_nopl(struct cpuinfo_x86 *c) 960b6734c35SH. Peter Anvin { 961366d4a43SBorislav Petkov #ifdef CONFIG_X86_32 962b6734c35SH. Peter Anvin clear_cpu_cap(c, X86_FEATURE_NOPL); 963366d4a43SBorislav Petkov #else 964366d4a43SBorislav Petkov set_cpu_cap(c, X86_FEATURE_NOPL); 965366d4a43SBorislav Petkov #endif 966f7627e25SThomas Gleixner } 967f7627e25SThomas Gleixner 9687a5d6704SAndy Lutomirski static void detect_null_seg_behavior(struct cpuinfo_x86 *c) 9697a5d6704SAndy Lutomirski { 9707a5d6704SAndy Lutomirski #ifdef CONFIG_X86_64 971f7627e25SThomas Gleixner /* 9727a5d6704SAndy Lutomirski * Empirically, writing zero to a segment selector on AMD does 9737a5d6704SAndy Lutomirski * not clear the base, whereas writing zero to a segment 9747a5d6704SAndy Lutomirski * selector on Intel does clear the base. Intel's behavior 9757a5d6704SAndy Lutomirski * allows slightly faster context switches in the common case 9767a5d6704SAndy Lutomirski * where GS is unused by the prev and next threads. 977f7627e25SThomas Gleixner * 9787a5d6704SAndy Lutomirski * Since neither vendor documents this anywhere that I can see, 9797a5d6704SAndy Lutomirski * detect it directly instead of hardcoding the choice by 9807a5d6704SAndy Lutomirski * vendor. 9817a5d6704SAndy Lutomirski * 9827a5d6704SAndy Lutomirski * I've designated AMD's behavior as the "bug" because it's 9837a5d6704SAndy Lutomirski * counterintuitive and less friendly. 984f7627e25SThomas Gleixner */ 9857a5d6704SAndy Lutomirski 9867a5d6704SAndy Lutomirski unsigned long old_base, tmp; 9877a5d6704SAndy Lutomirski rdmsrl(MSR_FS_BASE, old_base); 9887a5d6704SAndy Lutomirski wrmsrl(MSR_FS_BASE, 1); 9897a5d6704SAndy Lutomirski loadsegment(fs, 0); 9907a5d6704SAndy Lutomirski rdmsrl(MSR_FS_BASE, tmp); 9917a5d6704SAndy Lutomirski if (tmp != 0) 9927a5d6704SAndy Lutomirski set_cpu_bug(c, X86_BUG_NULL_SEG); 9937a5d6704SAndy Lutomirski wrmsrl(MSR_FS_BASE, old_base); 9943da99c97SYinghai Lu #endif 995f7627e25SThomas Gleixner } 996aef93c8bSYinghai Lu 997148f9bb8SPaul Gortmaker static void generic_identify(struct cpuinfo_x86 *c) 998f7627e25SThomas Gleixner { 999f7627e25SThomas Gleixner c->extended_cpuid_level = 0; 1000f7627e25SThomas Gleixner 1001aef93c8bSYinghai Lu if (!have_cpuid_p()) 1002aef93c8bSYinghai Lu identify_cpu_without_cpuid(c); 1003f7627e25SThomas Gleixner 1004aef93c8bSYinghai Lu /* cyrix could have cpuid enabled via c_identify()*/ 1005a9853dd6SIngo Molnar if (!have_cpuid_p()) 1006aef93c8bSYinghai Lu return; 1007aef93c8bSYinghai Lu 10083da99c97SYinghai Lu cpu_detect(c); 10093da99c97SYinghai Lu 10103da99c97SYinghai Lu get_cpu_vendor(c); 10113da99c97SYinghai Lu 10123da99c97SYinghai Lu get_cpu_cap(c); 10133da99c97SYinghai Lu 1014f7627e25SThomas Gleixner if (c->cpuid_level >= 0x00000001) { 10153da99c97SYinghai Lu c->initial_apicid = (cpuid_ebx(1) >> 24) & 0xFF; 1016b89d3b3eSYinghai Lu #ifdef CONFIG_X86_32 1017c8e56d20SBorislav Petkov # ifdef CONFIG_SMP 1018cb8cc442SIngo Molnar c->apicid = apic->phys_pkg_id(c->initial_apicid, 0); 1019f7627e25SThomas Gleixner # else 102001aaea1aSYinghai Lu c->apicid = c->initial_apicid; 1021f7627e25SThomas Gleixner # endif 1022b89d3b3eSYinghai Lu #endif 1023b89d3b3eSYinghai Lu c->phys_proc_id = c->initial_apicid; 1024f7627e25SThomas Gleixner } 1025f7627e25SThomas Gleixner 1026f7627e25SThomas Gleixner get_model_name(c); /* Default name */ 1027f7627e25SThomas Gleixner 1028b6734c35SH. Peter Anvin detect_nopl(c); 10297a5d6704SAndy Lutomirski 10307a5d6704SAndy Lutomirski detect_null_seg_behavior(c); 10310230bb03SAndy Lutomirski 10320230bb03SAndy Lutomirski /* 10330230bb03SAndy Lutomirski * ESPFIX is a strange bug. All real CPUs have it. Paravirt 10340230bb03SAndy Lutomirski * systems that run Linux at CPL > 0 may or may not have the 10350230bb03SAndy Lutomirski * issue, but, even if they have the issue, there's absolutely 10360230bb03SAndy Lutomirski * nothing we can do about it because we can't use the real IRET 10370230bb03SAndy Lutomirski * instruction. 10380230bb03SAndy Lutomirski * 10390230bb03SAndy Lutomirski * NB: For the time being, only 32-bit kernels support 10400230bb03SAndy Lutomirski * X86_BUG_ESPFIX as such. 64-bit kernels directly choose 10410230bb03SAndy Lutomirski * whether to apply espfix using paravirt hooks. If any 10420230bb03SAndy Lutomirski * non-paravirt system ever shows up that does *not* have the 10430230bb03SAndy Lutomirski * ESPFIX issue, we can change this. 10440230bb03SAndy Lutomirski */ 10450230bb03SAndy Lutomirski #ifdef CONFIG_X86_32 10460230bb03SAndy Lutomirski # ifdef CONFIG_PARAVIRT 10470230bb03SAndy Lutomirski do { 10480230bb03SAndy Lutomirski extern void native_iret(void); 10490230bb03SAndy Lutomirski if (pv_cpu_ops.iret == native_iret) 10500230bb03SAndy Lutomirski set_cpu_bug(c, X86_BUG_ESPFIX); 10510230bb03SAndy Lutomirski } while (0); 10520230bb03SAndy Lutomirski # else 10530230bb03SAndy Lutomirski set_cpu_bug(c, X86_BUG_ESPFIX); 10540230bb03SAndy Lutomirski # endif 10550230bb03SAndy Lutomirski #endif 1056f7627e25SThomas Gleixner } 1057f7627e25SThomas Gleixner 1058cbc82b17SPeter P Waskiewicz Jr static void x86_init_cache_qos(struct cpuinfo_x86 *c) 1059cbc82b17SPeter P Waskiewicz Jr { 1060cbc82b17SPeter P Waskiewicz Jr /* 1061cbc82b17SPeter P Waskiewicz Jr * The heavy lifting of max_rmid and cache_occ_scale are handled 1062cbc82b17SPeter P Waskiewicz Jr * in get_cpu_cap(). Here we just set the max_rmid for the boot_cpu 1063cbc82b17SPeter P Waskiewicz Jr * in case CQM bits really aren't there in this CPU. 1064cbc82b17SPeter P Waskiewicz Jr */ 1065cbc82b17SPeter P Waskiewicz Jr if (c != &boot_cpu_data) { 1066cbc82b17SPeter P Waskiewicz Jr boot_cpu_data.x86_cache_max_rmid = 1067cbc82b17SPeter P Waskiewicz Jr min(boot_cpu_data.x86_cache_max_rmid, 1068cbc82b17SPeter P Waskiewicz Jr c->x86_cache_max_rmid); 1069cbc82b17SPeter P Waskiewicz Jr } 1070cbc82b17SPeter P Waskiewicz Jr } 1071cbc82b17SPeter P Waskiewicz Jr 1072f7627e25SThomas Gleixner /* 10739d85eb91SThomas Gleixner * Validate that ACPI/mptables have the same information about the 10749d85eb91SThomas Gleixner * effective APIC id and update the package map. 1075d49597fdSThomas Gleixner */ 10769d85eb91SThomas Gleixner static void validate_apic_and_package_id(struct cpuinfo_x86 *c) 1077d49597fdSThomas Gleixner { 1078d49597fdSThomas Gleixner #ifdef CONFIG_SMP 10799d85eb91SThomas Gleixner unsigned int apicid, cpu = smp_processor_id(); 1080d49597fdSThomas Gleixner 1081d49597fdSThomas Gleixner apicid = apic->cpu_present_to_apicid(cpu); 1082d49597fdSThomas Gleixner 10839d85eb91SThomas Gleixner if (apicid != c->apicid) { 10849d85eb91SThomas Gleixner pr_err(FW_BUG "CPU%u: APIC id mismatch. Firmware: %x APIC: %x\n", 1085d49597fdSThomas Gleixner cpu, apicid, c->initial_apicid); 1086d49597fdSThomas Gleixner } 10879d85eb91SThomas Gleixner BUG_ON(topology_update_package_map(c->phys_proc_id, cpu)); 1088d49597fdSThomas Gleixner #else 1089d49597fdSThomas Gleixner c->logical_proc_id = 0; 1090d49597fdSThomas Gleixner #endif 1091d49597fdSThomas Gleixner } 1092d49597fdSThomas Gleixner 1093d49597fdSThomas Gleixner /* 1094f7627e25SThomas Gleixner * This does the hard work of actually picking apart the CPU stuff... 1095f7627e25SThomas Gleixner */ 1096148f9bb8SPaul Gortmaker static void identify_cpu(struct cpuinfo_x86 *c) 1097f7627e25SThomas Gleixner { 1098f7627e25SThomas Gleixner int i; 1099f7627e25SThomas Gleixner 1100f7627e25SThomas Gleixner c->loops_per_jiffy = loops_per_jiffy; 1101f7627e25SThomas Gleixner c->x86_cache_size = -1; 1102f7627e25SThomas Gleixner c->x86_vendor = X86_VENDOR_UNKNOWN; 1103f7627e25SThomas Gleixner c->x86_model = c->x86_mask = 0; /* So far unknown... */ 1104f7627e25SThomas Gleixner c->x86_vendor_id[0] = '\0'; /* Unset */ 1105f7627e25SThomas Gleixner c->x86_model_id[0] = '\0'; /* Unset */ 1106f7627e25SThomas Gleixner c->x86_max_cores = 1; 1107102bbe3aSYinghai Lu c->x86_coreid_bits = 0; 110879a8b9aaSBorislav Petkov c->cu_id = 0xff; 110911fdd252SYinghai Lu #ifdef CONFIG_X86_64 1110102bbe3aSYinghai Lu c->x86_clflush_size = 64; 111113c6c532SJan Beulich c->x86_phys_bits = 36; 111213c6c532SJan Beulich c->x86_virt_bits = 48; 1113102bbe3aSYinghai Lu #else 1114102bbe3aSYinghai Lu c->cpuid_level = -1; /* CPUID not detected */ 1115f7627e25SThomas Gleixner c->x86_clflush_size = 32; 111613c6c532SJan Beulich c->x86_phys_bits = 32; 111713c6c532SJan Beulich c->x86_virt_bits = 32; 1118102bbe3aSYinghai Lu #endif 1119102bbe3aSYinghai Lu c->x86_cache_alignment = c->x86_clflush_size; 1120f7627e25SThomas Gleixner memset(&c->x86_capability, 0, sizeof c->x86_capability); 1121f7627e25SThomas Gleixner 1122f7627e25SThomas Gleixner generic_identify(c); 1123f7627e25SThomas Gleixner 11243898534dSAndi Kleen if (this_cpu->c_identify) 1125f7627e25SThomas Gleixner this_cpu->c_identify(c); 1126f7627e25SThomas Gleixner 11276a6256f9SAdam Buchbinder /* Clear/Set all flags overridden by options, after probe */ 11288bf1ebcaSAndy Lutomirski apply_forced_caps(c); 11292759c328SYinghai Lu 1130102bbe3aSYinghai Lu #ifdef CONFIG_X86_64 1131cb8cc442SIngo Molnar c->apicid = apic->phys_pkg_id(c->initial_apicid, 0); 1132102bbe3aSYinghai Lu #endif 1133102bbe3aSYinghai Lu 1134f7627e25SThomas Gleixner /* 1135f7627e25SThomas Gleixner * Vendor-specific initialization. In this section we 1136f7627e25SThomas Gleixner * canonicalize the feature flags, meaning if there are 1137f7627e25SThomas Gleixner * features a certain CPU supports which CPUID doesn't 1138f7627e25SThomas Gleixner * tell us, CPUID claiming incorrect flags, or other bugs, 1139f7627e25SThomas Gleixner * we handle them here. 1140f7627e25SThomas Gleixner * 1141f7627e25SThomas Gleixner * At the end of this section, c->x86_capability better 1142f7627e25SThomas Gleixner * indicate the features this CPU genuinely supports! 1143f7627e25SThomas Gleixner */ 1144f7627e25SThomas Gleixner if (this_cpu->c_init) 1145f7627e25SThomas Gleixner this_cpu->c_init(c); 1146f7627e25SThomas Gleixner 1147f7627e25SThomas Gleixner /* Disable the PN if appropriate */ 1148f7627e25SThomas Gleixner squash_the_stupid_serial_number(c); 1149f7627e25SThomas Gleixner 1150b2cc2a07SH. Peter Anvin /* Set up SMEP/SMAP */ 1151b2cc2a07SH. Peter Anvin setup_smep(c); 1152b2cc2a07SH. Peter Anvin setup_smap(c); 1153b2cc2a07SH. Peter Anvin 1154f7627e25SThomas Gleixner /* 11550f3fa48aSIngo Molnar * The vendor-specific functions might have changed features. 11560f3fa48aSIngo Molnar * Now we do "generic changes." 1157f7627e25SThomas Gleixner */ 1158f7627e25SThomas Gleixner 1159b38b0665SH. Peter Anvin /* Filter out anything that depends on CPUID levels we don't have */ 1160b38b0665SH. Peter Anvin filter_cpuid_features(c, true); 1161b38b0665SH. Peter Anvin 1162f7627e25SThomas Gleixner /* If the model name is still unset, do table lookup. */ 1163f7627e25SThomas Gleixner if (!c->x86_model_id[0]) { 116402dde8b4SJan Beulich const char *p; 1165f7627e25SThomas Gleixner p = table_lookup_model(c); 1166f7627e25SThomas Gleixner if (p) 1167f7627e25SThomas Gleixner strcpy(c->x86_model_id, p); 1168f7627e25SThomas Gleixner else 1169f7627e25SThomas Gleixner /* Last resort... */ 1170f7627e25SThomas Gleixner sprintf(c->x86_model_id, "%02x/%02x", 1171f7627e25SThomas Gleixner c->x86, c->x86_model); 1172f7627e25SThomas Gleixner } 1173f7627e25SThomas Gleixner 1174102bbe3aSYinghai Lu #ifdef CONFIG_X86_64 1175102bbe3aSYinghai Lu detect_ht(c); 1176102bbe3aSYinghai Lu #endif 1177102bbe3aSYinghai Lu 117849d859d7SH. Peter Anvin x86_init_rdrand(c); 1179cbc82b17SPeter P Waskiewicz Jr x86_init_cache_qos(c); 118006976945SDave Hansen setup_pku(c); 11813e0c3737SYinghai Lu 11823e0c3737SYinghai Lu /* 11836a6256f9SAdam Buchbinder * Clear/Set all flags overridden by options, need do it 11843e0c3737SYinghai Lu * before following smp all cpus cap AND. 11853e0c3737SYinghai Lu */ 11868bf1ebcaSAndy Lutomirski apply_forced_caps(c); 11873e0c3737SYinghai Lu 1188f7627e25SThomas Gleixner /* 1189f7627e25SThomas Gleixner * On SMP, boot_cpu_data holds the common feature set between 1190f7627e25SThomas Gleixner * all CPUs; so make sure that we indicate which features are 1191f7627e25SThomas Gleixner * common between the CPUs. The first time this routine gets 1192f7627e25SThomas Gleixner * executed, c == &boot_cpu_data. 1193f7627e25SThomas Gleixner */ 1194f7627e25SThomas Gleixner if (c != &boot_cpu_data) { 1195f7627e25SThomas Gleixner /* AND the already accumulated flags with these */ 1196f7627e25SThomas Gleixner for (i = 0; i < NCAPINTS; i++) 1197f7627e25SThomas Gleixner boot_cpu_data.x86_capability[i] &= c->x86_capability[i]; 119865fc985bSBorislav Petkov 119965fc985bSBorislav Petkov /* OR, i.e. replicate the bug flags */ 120065fc985bSBorislav Petkov for (i = NCAPINTS; i < NCAPINTS + NBUGINTS; i++) 120165fc985bSBorislav Petkov c->x86_capability[i] |= boot_cpu_data.x86_capability[i]; 1202f7627e25SThomas Gleixner } 1203f7627e25SThomas Gleixner 1204f7627e25SThomas Gleixner /* Init Machine Check Exception if available. */ 12055e09954aSBorislav Petkov mcheck_cpu_init(c); 120630d432dfSAndi Kleen 120730d432dfSAndi Kleen select_idle_routine(c); 1208102bbe3aSYinghai Lu 1209de2d9445STejun Heo #ifdef CONFIG_NUMA 1210102bbe3aSYinghai Lu numa_add_cpu(smp_processor_id()); 1211102bbe3aSYinghai Lu #endif 1212f7627e25SThomas Gleixner } 1213f7627e25SThomas Gleixner 12148b6c0ab1SIngo Molnar /* 12158b6c0ab1SIngo Molnar * Set up the CPU state needed to execute SYSENTER/SYSEXIT instructions 12168b6c0ab1SIngo Molnar * on 32-bit kernels: 12178b6c0ab1SIngo Molnar */ 1218cfda7bb9SAndy Lutomirski #ifdef CONFIG_X86_32 1219cfda7bb9SAndy Lutomirski void enable_sep_cpu(void) 1220cfda7bb9SAndy Lutomirski { 12218b6c0ab1SIngo Molnar struct tss_struct *tss; 12228b6c0ab1SIngo Molnar int cpu; 1223cfda7bb9SAndy Lutomirski 1224b3edfda4SBorislav Petkov if (!boot_cpu_has(X86_FEATURE_SEP)) 1225b3edfda4SBorislav Petkov return; 1226b3edfda4SBorislav Petkov 12278b6c0ab1SIngo Molnar cpu = get_cpu(); 12288b6c0ab1SIngo Molnar tss = &per_cpu(cpu_tss, cpu); 12298b6c0ab1SIngo Molnar 12308b6c0ab1SIngo Molnar /* 1231cf9328ccSAndy Lutomirski * We cache MSR_IA32_SYSENTER_CS's value in the TSS's ss1 field -- 1232cf9328ccSAndy Lutomirski * see the big comment in struct x86_hw_tss's definition. 12338b6c0ab1SIngo Molnar */ 1234cfda7bb9SAndy Lutomirski 1235cfda7bb9SAndy Lutomirski tss->x86_tss.ss1 = __KERNEL_CS; 12368b6c0ab1SIngo Molnar wrmsr(MSR_IA32_SYSENTER_CS, tss->x86_tss.ss1, 0); 12378b6c0ab1SIngo Molnar 1238cf9328ccSAndy Lutomirski wrmsr(MSR_IA32_SYSENTER_ESP, 1239cf9328ccSAndy Lutomirski (unsigned long)tss + offsetofend(struct tss_struct, SYSENTER_stack), 1240cf9328ccSAndy Lutomirski 0); 12418b6c0ab1SIngo Molnar 12424c8cd0c5SIngo Molnar wrmsr(MSR_IA32_SYSENTER_EIP, (unsigned long)entry_SYSENTER_32, 0); 12438b6c0ab1SIngo Molnar 1244cfda7bb9SAndy Lutomirski put_cpu(); 1245cfda7bb9SAndy Lutomirski } 1246e04d645fSGlauber Costa #endif 1247e04d645fSGlauber Costa 1248f7627e25SThomas Gleixner void __init identify_boot_cpu(void) 1249f7627e25SThomas Gleixner { 1250f7627e25SThomas Gleixner identify_cpu(&boot_cpu_data); 1251102bbe3aSYinghai Lu #ifdef CONFIG_X86_32 1252f7627e25SThomas Gleixner sysenter_setup(); 1253f7627e25SThomas Gleixner enable_sep_cpu(); 1254102bbe3aSYinghai Lu #endif 1255e0ba94f1SAlex Shi cpu_detect_tlb(&boot_cpu_data); 1256f7627e25SThomas Gleixner } 1257f7627e25SThomas Gleixner 1258148f9bb8SPaul Gortmaker void identify_secondary_cpu(struct cpuinfo_x86 *c) 1259f7627e25SThomas Gleixner { 1260f7627e25SThomas Gleixner BUG_ON(c == &boot_cpu_data); 1261f7627e25SThomas Gleixner identify_cpu(c); 1262102bbe3aSYinghai Lu #ifdef CONFIG_X86_32 1263f7627e25SThomas Gleixner enable_sep_cpu(); 1264102bbe3aSYinghai Lu #endif 1265f7627e25SThomas Gleixner mtrr_ap_init(); 12669d85eb91SThomas Gleixner validate_apic_and_package_id(c); 1267f7627e25SThomas Gleixner } 1268f7627e25SThomas Gleixner 1269191679fdSAndi Kleen static __init int setup_noclflush(char *arg) 1270191679fdSAndi Kleen { 1271840d2830SH. Peter Anvin setup_clear_cpu_cap(X86_FEATURE_CLFLUSH); 1272da4aaa7dSH. Peter Anvin setup_clear_cpu_cap(X86_FEATURE_CLFLUSHOPT); 1273191679fdSAndi Kleen return 1; 1274191679fdSAndi Kleen } 1275191679fdSAndi Kleen __setup("noclflush", setup_noclflush); 1276191679fdSAndi Kleen 1277148f9bb8SPaul Gortmaker void print_cpu_info(struct cpuinfo_x86 *c) 1278f7627e25SThomas Gleixner { 127902dde8b4SJan Beulich const char *vendor = NULL; 1280f7627e25SThomas Gleixner 12810f3fa48aSIngo Molnar if (c->x86_vendor < X86_VENDOR_NUM) { 1282f7627e25SThomas Gleixner vendor = this_cpu->c_vendor; 12830f3fa48aSIngo Molnar } else { 12840f3fa48aSIngo Molnar if (c->cpuid_level >= 0) 1285f7627e25SThomas Gleixner vendor = c->x86_vendor_id; 12860f3fa48aSIngo Molnar } 1287f7627e25SThomas Gleixner 1288bd32a8cfSYinghai Lu if (vendor && !strstr(c->x86_model_id, vendor)) 12891b74dde7SChen Yucong pr_cont("%s ", vendor); 1290f7627e25SThomas Gleixner 12919d31d35bSYinghai Lu if (c->x86_model_id[0]) 12921b74dde7SChen Yucong pr_cont("%s", c->x86_model_id); 1293f7627e25SThomas Gleixner else 12941b74dde7SChen Yucong pr_cont("%d86", c->x86); 1295f7627e25SThomas Gleixner 12961b74dde7SChen Yucong pr_cont(" (family: 0x%x, model: 0x%x", c->x86, c->x86_model); 1297924e101aSBorislav Petkov 1298f7627e25SThomas Gleixner if (c->x86_mask || c->cpuid_level >= 0) 12991b74dde7SChen Yucong pr_cont(", stepping: 0x%x)\n", c->x86_mask); 1300f7627e25SThomas Gleixner else 13011b74dde7SChen Yucong pr_cont(")\n"); 1302f7627e25SThomas Gleixner } 1303f7627e25SThomas Gleixner 13040c2a3913SAndi Kleen /* 13050c2a3913SAndi Kleen * clearcpuid= was already parsed in fpu__init_parse_early_param. 13060c2a3913SAndi Kleen * But we need to keep a dummy __setup around otherwise it would 13070c2a3913SAndi Kleen * show up as an environment variable for init. 13080c2a3913SAndi Kleen */ 13090c2a3913SAndi Kleen static __init int setup_clearcpuid(char *arg) 1310ac72e788SAndi Kleen { 1311ac72e788SAndi Kleen return 1; 1312ac72e788SAndi Kleen } 13130c2a3913SAndi Kleen __setup("clearcpuid=", setup_clearcpuid); 1314ac72e788SAndi Kleen 1315d5494d4fSYinghai Lu #ifdef CONFIG_X86_64 1316947e76cdSBrian Gerst DEFINE_PER_CPU_FIRST(union irq_stack_union, 1317277d5b40SAndi Kleen irq_stack_union) __aligned(PAGE_SIZE) __visible; 13180f3fa48aSIngo Molnar 1319bdf977b3STejun Heo /* 1320a7fcf28dSAndy Lutomirski * The following percpu variables are hot. Align current_task to 1321a7fcf28dSAndy Lutomirski * cacheline size such that they fall in the same cacheline. 1322bdf977b3STejun Heo */ 1323bdf977b3STejun Heo DEFINE_PER_CPU(struct task_struct *, current_task) ____cacheline_aligned = 1324bdf977b3STejun Heo &init_task; 1325bdf977b3STejun Heo EXPORT_PER_CPU_SYMBOL(current_task); 1326d5494d4fSYinghai Lu 1327bdf977b3STejun Heo DEFINE_PER_CPU(char *, irq_stack_ptr) = 13284950d6d4SJosh Poimboeuf init_per_cpu_var(irq_stack_union.irq_stack) + IRQ_STACK_SIZE; 1329bdf977b3STejun Heo 1330277d5b40SAndi Kleen DEFINE_PER_CPU(unsigned int, irq_count) __visible = -1; 1331d5494d4fSYinghai Lu 1332c2daa3beSPeter Zijlstra DEFINE_PER_CPU(int, __preempt_count) = INIT_PREEMPT_COUNT; 1333c2daa3beSPeter Zijlstra EXPORT_PER_CPU_SYMBOL(__preempt_count); 1334c2daa3beSPeter Zijlstra 13350f3fa48aSIngo Molnar /* 13360f3fa48aSIngo Molnar * Special IST stacks which the CPU switches to when it calls 13370f3fa48aSIngo Molnar * an IST-marked descriptor entry. Up to 7 stacks (hardware 13380f3fa48aSIngo Molnar * limit), all of them are 4K, except the debug stack which 13390f3fa48aSIngo Molnar * is 8K. 13400f3fa48aSIngo Molnar */ 13410f3fa48aSIngo Molnar static const unsigned int exception_stack_sizes[N_EXCEPTION_STACKS] = { 13420f3fa48aSIngo Molnar [0 ... N_EXCEPTION_STACKS - 1] = EXCEPTION_STKSZ, 13430f3fa48aSIngo Molnar [DEBUG_STACK - 1] = DEBUG_STKSZ 13440f3fa48aSIngo Molnar }; 13450f3fa48aSIngo Molnar 134692d65b23SBrian Gerst static DEFINE_PER_CPU_PAGE_ALIGNED(char, exception_stacks 13473e352aa8STejun Heo [(N_EXCEPTION_STACKS - 1) * EXCEPTION_STKSZ + DEBUG_STKSZ]); 1348d5494d4fSYinghai Lu 1349d5494d4fSYinghai Lu /* May not be marked __init: used by software suspend */ 1350d5494d4fSYinghai Lu void syscall_init(void) 1351d5494d4fSYinghai Lu { 135231ac34caSBorislav Petkov wrmsr(MSR_STAR, 0, (__USER32_CS << 16) | __KERNEL_CS); 135347edb651SAndy Lutomirski wrmsrl(MSR_LSTAR, (unsigned long)entry_SYSCALL_64); 1354d56fe4bfSIngo Molnar 1355d56fe4bfSIngo Molnar #ifdef CONFIG_IA32_EMULATION 135647edb651SAndy Lutomirski wrmsrl(MSR_CSTAR, (unsigned long)entry_SYSCALL_compat); 1357a76c7f46SDenys Vlasenko /* 1358487d1edbSDenys Vlasenko * This only works on Intel CPUs. 1359487d1edbSDenys Vlasenko * On AMD CPUs these MSRs are 32-bit, CPU truncates MSR_IA32_SYSENTER_EIP. 1360487d1edbSDenys Vlasenko * This does not cause SYSENTER to jump to the wrong location, because 1361487d1edbSDenys Vlasenko * AMD doesn't allow SYSENTER in long mode (either 32- or 64-bit). 1362a76c7f46SDenys Vlasenko */ 1363a76c7f46SDenys Vlasenko wrmsrl_safe(MSR_IA32_SYSENTER_CS, (u64)__KERNEL_CS); 13641a79797bSAndy Lutomirski wrmsrl_safe(MSR_IA32_SYSENTER_ESP, 13651a79797bSAndy Lutomirski (unsigned long)this_cpu_ptr(&cpu_tss) + 13661a79797bSAndy Lutomirski offsetofend(struct tss_struct, SYSENTER_stack)); 13674c8cd0c5SIngo Molnar wrmsrl_safe(MSR_IA32_SYSENTER_EIP, (u64)entry_SYSENTER_compat); 1368d56fe4bfSIngo Molnar #else 136947edb651SAndy Lutomirski wrmsrl(MSR_CSTAR, (unsigned long)ignore_sysret); 13706b51311cSBorislav Petkov wrmsrl_safe(MSR_IA32_SYSENTER_CS, (u64)GDT_ENTRY_INVALID_SEG); 1371d56fe4bfSIngo Molnar wrmsrl_safe(MSR_IA32_SYSENTER_ESP, 0ULL); 1372d56fe4bfSIngo Molnar wrmsrl_safe(MSR_IA32_SYSENTER_EIP, 0ULL); 1373d5494d4fSYinghai Lu #endif 1374d5494d4fSYinghai Lu 1375d5494d4fSYinghai Lu /* Flags to clear on syscall */ 1376d5494d4fSYinghai Lu wrmsrl(MSR_SYSCALL_MASK, 137763bcff2aSH. Peter Anvin X86_EFLAGS_TF|X86_EFLAGS_DF|X86_EFLAGS_IF| 13788c7aa698SAndy Lutomirski X86_EFLAGS_IOPL|X86_EFLAGS_AC|X86_EFLAGS_NT); 1379d5494d4fSYinghai Lu } 1380d5494d4fSYinghai Lu 1381d5494d4fSYinghai Lu /* 1382d5494d4fSYinghai Lu * Copies of the original ist values from the tss are only accessed during 1383d5494d4fSYinghai Lu * debugging, no special alignment required. 1384d5494d4fSYinghai Lu */ 1385d5494d4fSYinghai Lu DEFINE_PER_CPU(struct orig_ist, orig_ist); 1386d5494d4fSYinghai Lu 1387228bdaa9SSteven Rostedt static DEFINE_PER_CPU(unsigned long, debug_stack_addr); 138842181186SSteven Rostedt DEFINE_PER_CPU(int, debug_stack_usage); 1389228bdaa9SSteven Rostedt 1390228bdaa9SSteven Rostedt int is_debug_stack(unsigned long addr) 1391228bdaa9SSteven Rostedt { 139289cbc767SChristoph Lameter return __this_cpu_read(debug_stack_usage) || 139389cbc767SChristoph Lameter (addr <= __this_cpu_read(debug_stack_addr) && 139489cbc767SChristoph Lameter addr > (__this_cpu_read(debug_stack_addr) - DEBUG_STKSZ)); 1395228bdaa9SSteven Rostedt } 13960f46efebSMasami Hiramatsu NOKPROBE_SYMBOL(is_debug_stack); 1397228bdaa9SSteven Rostedt 1398629f4f9dSSeiji Aguchi DEFINE_PER_CPU(u32, debug_idt_ctr); 1399f8988175SSteven Rostedt 1400228bdaa9SSteven Rostedt void debug_stack_set_zero(void) 1401228bdaa9SSteven Rostedt { 1402629f4f9dSSeiji Aguchi this_cpu_inc(debug_idt_ctr); 1403629f4f9dSSeiji Aguchi load_current_idt(); 1404228bdaa9SSteven Rostedt } 14050f46efebSMasami Hiramatsu NOKPROBE_SYMBOL(debug_stack_set_zero); 1406228bdaa9SSteven Rostedt 1407228bdaa9SSteven Rostedt void debug_stack_reset(void) 1408228bdaa9SSteven Rostedt { 1409629f4f9dSSeiji Aguchi if (WARN_ON(!this_cpu_read(debug_idt_ctr))) 1410f8988175SSteven Rostedt return; 1411629f4f9dSSeiji Aguchi if (this_cpu_dec_return(debug_idt_ctr) == 0) 1412629f4f9dSSeiji Aguchi load_current_idt(); 1413228bdaa9SSteven Rostedt } 14140f46efebSMasami Hiramatsu NOKPROBE_SYMBOL(debug_stack_reset); 1415228bdaa9SSteven Rostedt 14160f3fa48aSIngo Molnar #else /* CONFIG_X86_64 */ 1417d5494d4fSYinghai Lu 1418bdf977b3STejun Heo DEFINE_PER_CPU(struct task_struct *, current_task) = &init_task; 1419bdf977b3STejun Heo EXPORT_PER_CPU_SYMBOL(current_task); 1420c2daa3beSPeter Zijlstra DEFINE_PER_CPU(int, __preempt_count) = INIT_PREEMPT_COUNT; 1421c2daa3beSPeter Zijlstra EXPORT_PER_CPU_SYMBOL(__preempt_count); 1422bdf977b3STejun Heo 1423a7fcf28dSAndy Lutomirski /* 1424a7fcf28dSAndy Lutomirski * On x86_32, vm86 modifies tss.sp0, so sp0 isn't a reliable way to find 1425a7fcf28dSAndy Lutomirski * the top of the kernel stack. Use an extra percpu variable to track the 1426a7fcf28dSAndy Lutomirski * top of the kernel stack directly. 1427a7fcf28dSAndy Lutomirski */ 1428a7fcf28dSAndy Lutomirski DEFINE_PER_CPU(unsigned long, cpu_current_top_of_stack) = 1429a7fcf28dSAndy Lutomirski (unsigned long)&init_thread_union + THREAD_SIZE; 1430a7fcf28dSAndy Lutomirski EXPORT_PER_CPU_SYMBOL(cpu_current_top_of_stack); 1431a7fcf28dSAndy Lutomirski 143260a5317fSTejun Heo #ifdef CONFIG_CC_STACKPROTECTOR 143353f82452SJeremy Fitzhardinge DEFINE_PER_CPU_ALIGNED(struct stack_canary, stack_canary); 143460a5317fSTejun Heo #endif 143560a5317fSTejun Heo 14360f3fa48aSIngo Molnar #endif /* CONFIG_X86_64 */ 1437f7627e25SThomas Gleixner 1438f7627e25SThomas Gleixner /* 14399766cdbcSJaswinder Singh Rajput * Clear all 6 debug registers: 14409766cdbcSJaswinder Singh Rajput */ 14419766cdbcSJaswinder Singh Rajput static void clear_all_debug_regs(void) 14429766cdbcSJaswinder Singh Rajput { 14439766cdbcSJaswinder Singh Rajput int i; 14449766cdbcSJaswinder Singh Rajput 14459766cdbcSJaswinder Singh Rajput for (i = 0; i < 8; i++) { 14469766cdbcSJaswinder Singh Rajput /* Ignore db4, db5 */ 14479766cdbcSJaswinder Singh Rajput if ((i == 4) || (i == 5)) 14489766cdbcSJaswinder Singh Rajput continue; 14499766cdbcSJaswinder Singh Rajput 14509766cdbcSJaswinder Singh Rajput set_debugreg(0, i); 14519766cdbcSJaswinder Singh Rajput } 14529766cdbcSJaswinder Singh Rajput } 1453f7627e25SThomas Gleixner 14540bb9fef9SJason Wessel #ifdef CONFIG_KGDB 14550bb9fef9SJason Wessel /* 14560bb9fef9SJason Wessel * Restore debug regs if using kgdbwait and you have a kernel debugger 14570bb9fef9SJason Wessel * connection established. 14580bb9fef9SJason Wessel */ 14590bb9fef9SJason Wessel static void dbg_restore_debug_regs(void) 14600bb9fef9SJason Wessel { 14610bb9fef9SJason Wessel if (unlikely(kgdb_connected && arch_kgdb_ops.correct_hw_break)) 14620bb9fef9SJason Wessel arch_kgdb_ops.correct_hw_break(); 14630bb9fef9SJason Wessel } 14640bb9fef9SJason Wessel #else /* ! CONFIG_KGDB */ 14650bb9fef9SJason Wessel #define dbg_restore_debug_regs() 14660bb9fef9SJason Wessel #endif /* ! CONFIG_KGDB */ 14670bb9fef9SJason Wessel 1468ce4b1b16SIgor Mammedov static void wait_for_master_cpu(int cpu) 1469ce4b1b16SIgor Mammedov { 1470ce4b1b16SIgor Mammedov #ifdef CONFIG_SMP 1471ce4b1b16SIgor Mammedov /* 1472ce4b1b16SIgor Mammedov * wait for ACK from master CPU before continuing 1473ce4b1b16SIgor Mammedov * with AP initialization 1474ce4b1b16SIgor Mammedov */ 1475ce4b1b16SIgor Mammedov WARN_ON(cpumask_test_and_set_cpu(cpu, cpu_initialized_mask)); 1476ce4b1b16SIgor Mammedov while (!cpumask_test_cpu(cpu, cpu_callout_mask)) 1477ce4b1b16SIgor Mammedov cpu_relax(); 1478ce4b1b16SIgor Mammedov #endif 1479ce4b1b16SIgor Mammedov } 1480ce4b1b16SIgor Mammedov 1481f7627e25SThomas Gleixner /* 1482f7627e25SThomas Gleixner * cpu_init() initializes state that is per-CPU. Some data is already 1483f7627e25SThomas Gleixner * initialized (naturally) in the bootstrap process, such as the GDT 1484f7627e25SThomas Gleixner * and IDT. We reload them nevertheless, this function acts as a 1485f7627e25SThomas Gleixner * 'CPU state barrier', nothing should get across. 14861ba76586SYinghai Lu * A lot of state is already set up in PDA init for 64 bit 1487f7627e25SThomas Gleixner */ 14881ba76586SYinghai Lu #ifdef CONFIG_X86_64 14890f3fa48aSIngo Molnar 1490148f9bb8SPaul Gortmaker void cpu_init(void) 14911ba76586SYinghai Lu { 14920fe1e009STejun Heo struct orig_ist *oist; 14931ba76586SYinghai Lu struct task_struct *me; 14940f3fa48aSIngo Molnar struct tss_struct *t; 14950f3fa48aSIngo Molnar unsigned long v; 1496fb59831bSAndy Lutomirski int cpu = raw_smp_processor_id(); 14971ba76586SYinghai Lu int i; 14981ba76586SYinghai Lu 1499ce4b1b16SIgor Mammedov wait_for_master_cpu(cpu); 1500ce4b1b16SIgor Mammedov 1501e6ebf5deSFenghua Yu /* 15021e02ce4cSAndy Lutomirski * Initialize the CR4 shadow before doing anything that could 15031e02ce4cSAndy Lutomirski * try to read it. 15041e02ce4cSAndy Lutomirski */ 15051e02ce4cSAndy Lutomirski cr4_init_shadow(); 15061e02ce4cSAndy Lutomirski 1507777284b6SBorislav Petkov if (cpu) 1508e6ebf5deSFenghua Yu load_ucode_ap(); 1509e6ebf5deSFenghua Yu 151024933b82SAndy Lutomirski t = &per_cpu(cpu_tss, cpu); 15110fe1e009STejun Heo oist = &per_cpu(orig_ist, cpu); 15120f3fa48aSIngo Molnar 1513e7a22c1eSBrian Gerst #ifdef CONFIG_NUMA 151427fd185fSFenghua Yu if (this_cpu_read(numa_node) == 0 && 1515e534c7c5SLee Schermerhorn early_cpu_to_node(cpu) != NUMA_NO_NODE) 1516e534c7c5SLee Schermerhorn set_numa_node(early_cpu_to_node(cpu)); 1517e7a22c1eSBrian Gerst #endif 15181ba76586SYinghai Lu 15191ba76586SYinghai Lu me = current; 15201ba76586SYinghai Lu 15212eaad1fdSMike Travis pr_debug("Initializing CPU#%d\n", cpu); 15221ba76586SYinghai Lu 1523375074ccSAndy Lutomirski cr4_clear_bits(X86_CR4_VME|X86_CR4_PVI|X86_CR4_TSD|X86_CR4_DE); 15241ba76586SYinghai Lu 15251ba76586SYinghai Lu /* 15261ba76586SYinghai Lu * Initialize the per-CPU GDT with the boot GDT, 15271ba76586SYinghai Lu * and set up the GDT descriptor: 15281ba76586SYinghai Lu */ 15291ba76586SYinghai Lu 1530552be871SBrian Gerst switch_to_new_gdt(cpu); 15312697fbd5SBrian Gerst loadsegment(fs, 0); 15322697fbd5SBrian Gerst 1533cf910e83SSeiji Aguchi load_current_idt(); 15341ba76586SYinghai Lu 15351ba76586SYinghai Lu memset(me->thread.tls_array, 0, GDT_ENTRY_TLS_ENTRIES * 8); 15361ba76586SYinghai Lu syscall_init(); 15371ba76586SYinghai Lu 15381ba76586SYinghai Lu wrmsrl(MSR_FS_BASE, 0); 15391ba76586SYinghai Lu wrmsrl(MSR_KERNEL_GS_BASE, 0); 15401ba76586SYinghai Lu barrier(); 15411ba76586SYinghai Lu 15424763ed4dSH. Peter Anvin x86_configure_nx(); 1543659006bfSThomas Gleixner x2apic_setup(); 15441ba76586SYinghai Lu 15451ba76586SYinghai Lu /* 15461ba76586SYinghai Lu * set up and load the per-CPU TSS 15471ba76586SYinghai Lu */ 15480fe1e009STejun Heo if (!oist->ist[0]) { 154992d65b23SBrian Gerst char *estacks = per_cpu(exception_stacks, cpu); 15500f3fa48aSIngo Molnar 15511ba76586SYinghai Lu for (v = 0; v < N_EXCEPTION_STACKS; v++) { 15520f3fa48aSIngo Molnar estacks += exception_stack_sizes[v]; 15530fe1e009STejun Heo oist->ist[v] = t->x86_tss.ist[v] = 15541ba76586SYinghai Lu (unsigned long)estacks; 1555228bdaa9SSteven Rostedt if (v == DEBUG_STACK-1) 1556228bdaa9SSteven Rostedt per_cpu(debug_stack_addr, cpu) = (unsigned long)estacks; 15571ba76586SYinghai Lu } 15581ba76586SYinghai Lu } 15591ba76586SYinghai Lu 15601ba76586SYinghai Lu t->x86_tss.io_bitmap_base = offsetof(struct tss_struct, io_bitmap); 15610f3fa48aSIngo Molnar 15621ba76586SYinghai Lu /* 15631ba76586SYinghai Lu * <= is required because the CPU will access up to 15641ba76586SYinghai Lu * 8 bits beyond the end of the IO permission bitmap. 15651ba76586SYinghai Lu */ 15661ba76586SYinghai Lu for (i = 0; i <= IO_BITMAP_LONGS; i++) 15671ba76586SYinghai Lu t->io_bitmap[i] = ~0UL; 15681ba76586SYinghai Lu 1569f1f10076SVegard Nossum mmgrab(&init_mm); 15701ba76586SYinghai Lu me->active_mm = &init_mm; 15718c5dfd25SStoyan Gaydarov BUG_ON(me->mm); 157272c0098dSAndy Lutomirski initialize_tlbstate_and_flush(); 15731ba76586SYinghai Lu enter_lazy_tlb(&init_mm, me); 15741ba76586SYinghai Lu 157520bb8344SAndy Lutomirski /* 157620bb8344SAndy Lutomirski * Initialize the TSS. Don't bother initializing sp0, as the initial 157720bb8344SAndy Lutomirski * task never enters user mode. 157820bb8344SAndy Lutomirski */ 15791ba76586SYinghai Lu set_tss_desc(cpu, t); 15801ba76586SYinghai Lu load_TR_desc(); 158120bb8344SAndy Lutomirski 158237868fe1SAndy Lutomirski load_mm_ldt(&init_mm); 15831ba76586SYinghai Lu 15849766cdbcSJaswinder Singh Rajput clear_all_debug_regs(); 15850bb9fef9SJason Wessel dbg_restore_debug_regs(); 15861ba76586SYinghai Lu 158721c4cd10SIngo Molnar fpu__init_cpu(); 15881ba76586SYinghai Lu 15891ba76586SYinghai Lu if (is_uv_system()) 15901ba76586SYinghai Lu uv_cpu_init(); 159169218e47SThomas Garnier 1592*ef8813abSAndy Lutomirski setup_cpu_entry_area(cpu); 159369218e47SThomas Garnier load_fixmap_gdt(cpu); 15941ba76586SYinghai Lu } 15951ba76586SYinghai Lu 15961ba76586SYinghai Lu #else 15971ba76586SYinghai Lu 1598148f9bb8SPaul Gortmaker void cpu_init(void) 1599f7627e25SThomas Gleixner { 1600f7627e25SThomas Gleixner int cpu = smp_processor_id(); 1601f7627e25SThomas Gleixner struct task_struct *curr = current; 160224933b82SAndy Lutomirski struct tss_struct *t = &per_cpu(cpu_tss, cpu); 1603f7627e25SThomas Gleixner 1604ce4b1b16SIgor Mammedov wait_for_master_cpu(cpu); 1605e6ebf5deSFenghua Yu 16065b2bdbc8SSteven Rostedt /* 16075b2bdbc8SSteven Rostedt * Initialize the CR4 shadow before doing anything that could 16085b2bdbc8SSteven Rostedt * try to read it. 16095b2bdbc8SSteven Rostedt */ 16105b2bdbc8SSteven Rostedt cr4_init_shadow(); 16115b2bdbc8SSteven Rostedt 1612ce4b1b16SIgor Mammedov show_ucode_info_early(); 1613f7627e25SThomas Gleixner 16141b74dde7SChen Yucong pr_info("Initializing CPU#%d\n", cpu); 1615f7627e25SThomas Gleixner 1616362f924bSBorislav Petkov if (cpu_feature_enabled(X86_FEATURE_VME) || 161759e21e3dSBorislav Petkov boot_cpu_has(X86_FEATURE_TSC) || 1618362f924bSBorislav Petkov boot_cpu_has(X86_FEATURE_DE)) 1619375074ccSAndy Lutomirski cr4_clear_bits(X86_CR4_VME|X86_CR4_PVI|X86_CR4_TSD|X86_CR4_DE); 1620f7627e25SThomas Gleixner 1621cf910e83SSeiji Aguchi load_current_idt(); 1622552be871SBrian Gerst switch_to_new_gdt(cpu); 1623f7627e25SThomas Gleixner 1624f7627e25SThomas Gleixner /* 1625f7627e25SThomas Gleixner * Set up and load the per-CPU TSS and LDT 1626f7627e25SThomas Gleixner */ 1627f1f10076SVegard Nossum mmgrab(&init_mm); 1628f7627e25SThomas Gleixner curr->active_mm = &init_mm; 16298c5dfd25SStoyan Gaydarov BUG_ON(curr->mm); 163072c0098dSAndy Lutomirski initialize_tlbstate_and_flush(); 1631f7627e25SThomas Gleixner enter_lazy_tlb(&init_mm, curr); 1632f7627e25SThomas Gleixner 163320bb8344SAndy Lutomirski /* 163420bb8344SAndy Lutomirski * Initialize the TSS. Don't bother initializing sp0, as the initial 163520bb8344SAndy Lutomirski * task never enters user mode. 163620bb8344SAndy Lutomirski */ 1637f7627e25SThomas Gleixner set_tss_desc(cpu, t); 1638f7627e25SThomas Gleixner load_TR_desc(); 163920bb8344SAndy Lutomirski 164037868fe1SAndy Lutomirski load_mm_ldt(&init_mm); 1641f7627e25SThomas Gleixner 1642f9a196b8SThomas Gleixner t->x86_tss.io_bitmap_base = offsetof(struct tss_struct, io_bitmap); 1643f9a196b8SThomas Gleixner 1644f7627e25SThomas Gleixner #ifdef CONFIG_DOUBLEFAULT 1645f7627e25SThomas Gleixner /* Set up doublefault TSS pointer in the GDT */ 1646f7627e25SThomas Gleixner __set_tss_desc(cpu, GDT_ENTRY_DOUBLEFAULT_TSS, &doublefault_tss); 1647f7627e25SThomas Gleixner #endif 1648f7627e25SThomas Gleixner 16499766cdbcSJaswinder Singh Rajput clear_all_debug_regs(); 16500bb9fef9SJason Wessel dbg_restore_debug_regs(); 1651f7627e25SThomas Gleixner 165221c4cd10SIngo Molnar fpu__init_cpu(); 165369218e47SThomas Garnier 1654*ef8813abSAndy Lutomirski setup_cpu_entry_area(cpu); 165569218e47SThomas Garnier load_fixmap_gdt(cpu); 1656f7627e25SThomas Gleixner } 16571ba76586SYinghai Lu #endif 16585700f743SBorislav Petkov 1659b51ef52dSLaura Abbott static void bsp_resume(void) 1660b51ef52dSLaura Abbott { 1661b51ef52dSLaura Abbott if (this_cpu->c_bsp_resume) 1662b51ef52dSLaura Abbott this_cpu->c_bsp_resume(&boot_cpu_data); 1663b51ef52dSLaura Abbott } 1664b51ef52dSLaura Abbott 1665b51ef52dSLaura Abbott static struct syscore_ops cpu_syscore_ops = { 1666b51ef52dSLaura Abbott .resume = bsp_resume, 1667b51ef52dSLaura Abbott }; 1668b51ef52dSLaura Abbott 1669b51ef52dSLaura Abbott static int __init init_cpu_syscore(void) 1670b51ef52dSLaura Abbott { 1671b51ef52dSLaura Abbott register_syscore_ops(&cpu_syscore_ops); 1672b51ef52dSLaura Abbott return 0; 1673b51ef52dSLaura Abbott } 1674b51ef52dSLaura Abbott core_initcall(init_cpu_syscore); 1675