1f0fc4affSYinghai Lu #include <linux/bootmem.h> 29766cdbcSJaswinder Singh Rajput #include <linux/linkage.h> 3f0fc4affSYinghai Lu #include <linux/bitops.h> 49766cdbcSJaswinder Singh Rajput #include <linux/kernel.h> 5186f4360SPaul Gortmaker #include <linux/export.h> 6f7627e25SThomas Gleixner #include <linux/percpu.h> 79766cdbcSJaswinder Singh Rajput #include <linux/string.h> 8ee098e1aSBorislav Petkov #include <linux/ctype.h> 99766cdbcSJaswinder Singh Rajput #include <linux/delay.h> 1068e21be2SIngo Molnar #include <linux/sched/mm.h> 11e6017571SIngo Molnar #include <linux/sched/clock.h> 129164bb4aSIngo Molnar #include <linux/sched/task.h> 139766cdbcSJaswinder Singh Rajput #include <linux/init.h> 140f46efebSMasami Hiramatsu #include <linux/kprobes.h> 159766cdbcSJaswinder Singh Rajput #include <linux/kgdb.h> 169766cdbcSJaswinder Singh Rajput #include <linux/smp.h> 179766cdbcSJaswinder Singh Rajput #include <linux/io.h> 18b51ef52dSLaura Abbott #include <linux/syscore_ops.h> 199766cdbcSJaswinder Singh Rajput 209766cdbcSJaswinder Singh Rajput #include <asm/stackprotector.h> 21cdd6c482SIngo Molnar #include <asm/perf_event.h> 22f7627e25SThomas Gleixner #include <asm/mmu_context.h> 2349d859d7SH. Peter Anvin #include <asm/archrandom.h> 249766cdbcSJaswinder Singh Rajput #include <asm/hypervisor.h> 259766cdbcSJaswinder Singh Rajput #include <asm/processor.h> 261e02ce4cSAndy Lutomirski #include <asm/tlbflush.h> 27f649e938SPaul Gortmaker #include <asm/debugreg.h> 289766cdbcSJaswinder Singh Rajput #include <asm/sections.h> 29f40c3300SAndy Lutomirski #include <asm/vsyscall.h> 308bdbd962SAlan Cox #include <linux/topology.h> 318bdbd962SAlan Cox #include <linux/cpumask.h> 329766cdbcSJaswinder Singh Rajput #include <asm/pgtable.h> 3360063497SArun Sharma #include <linux/atomic.h> 349766cdbcSJaswinder Singh Rajput #include <asm/proto.h> 359766cdbcSJaswinder Singh Rajput #include <asm/setup.h> 36f7627e25SThomas Gleixner #include <asm/apic.h> 379766cdbcSJaswinder Singh Rajput #include <asm/desc.h> 3878f7f1e5SIngo Molnar #include <asm/fpu/internal.h> 399766cdbcSJaswinder Singh Rajput #include <asm/mtrr.h> 400274f955SGrzegorz Andrejczuk #include <asm/hwcap2.h> 418bdbd962SAlan Cox #include <linux/numa.h> 429766cdbcSJaswinder Singh Rajput #include <asm/asm.h> 430f6ff2bcSDave Hansen #include <asm/bugs.h> 449766cdbcSJaswinder Singh Rajput #include <asm/cpu.h> 459766cdbcSJaswinder Singh Rajput #include <asm/mce.h> 469766cdbcSJaswinder Singh Rajput #include <asm/msr.h> 479766cdbcSJaswinder Singh Rajput #include <asm/pat.h> 48d288e1cfSFenghua Yu #include <asm/microcode.h> 49d288e1cfSFenghua Yu #include <asm/microcode_intel.h> 50e641f5f5SIngo Molnar 51f7627e25SThomas Gleixner #ifdef CONFIG_X86_LOCAL_APIC 52bdbcdd48STejun Heo #include <asm/uv/uv.h> 53f7627e25SThomas Gleixner #endif 54f7627e25SThomas Gleixner 55f7627e25SThomas Gleixner #include "cpu.h" 56f7627e25SThomas Gleixner 570274f955SGrzegorz Andrejczuk u32 elf_hwcap2 __read_mostly; 580274f955SGrzegorz Andrejczuk 59c2d1cec1SMike Travis /* all of these masks are initialized in setup_cpu_local_masks() */ 60c2d1cec1SMike Travis cpumask_var_t cpu_initialized_mask; 619766cdbcSJaswinder Singh Rajput cpumask_var_t cpu_callout_mask; 629766cdbcSJaswinder Singh Rajput cpumask_var_t cpu_callin_mask; 63c2d1cec1SMike Travis 64c2d1cec1SMike Travis /* representing cpus for which sibling maps can be computed */ 65c2d1cec1SMike Travis cpumask_var_t cpu_sibling_setup_mask; 66c2d1cec1SMike Travis 672f2f52baSBrian Gerst /* correctly size the local cpu masks */ 684369f1fbSIngo Molnar void __init setup_cpu_local_masks(void) 692f2f52baSBrian Gerst { 702f2f52baSBrian Gerst alloc_bootmem_cpumask_var(&cpu_initialized_mask); 712f2f52baSBrian Gerst alloc_bootmem_cpumask_var(&cpu_callin_mask); 722f2f52baSBrian Gerst alloc_bootmem_cpumask_var(&cpu_callout_mask); 732f2f52baSBrian Gerst alloc_bootmem_cpumask_var(&cpu_sibling_setup_mask); 742f2f52baSBrian Gerst } 752f2f52baSBrian Gerst 76148f9bb8SPaul Gortmaker static void default_init(struct cpuinfo_x86 *c) 77e8055139SOndrej Zary { 78e8055139SOndrej Zary #ifdef CONFIG_X86_64 7927c13eceSBorislav Petkov cpu_detect_cache_sizes(c); 80e8055139SOndrej Zary #else 81e8055139SOndrej Zary /* Not much we can do here... */ 82e8055139SOndrej Zary /* Check if at least it has cpuid */ 83e8055139SOndrej Zary if (c->cpuid_level == -1) { 84e8055139SOndrej Zary /* No cpuid. It must be an ancient CPU */ 85e8055139SOndrej Zary if (c->x86 == 4) 86e8055139SOndrej Zary strcpy(c->x86_model_id, "486"); 87e8055139SOndrej Zary else if (c->x86 == 3) 88e8055139SOndrej Zary strcpy(c->x86_model_id, "386"); 89e8055139SOndrej Zary } 90e8055139SOndrej Zary #endif 91e8055139SOndrej Zary } 92e8055139SOndrej Zary 93148f9bb8SPaul Gortmaker static const struct cpu_dev default_cpu = { 94e8055139SOndrej Zary .c_init = default_init, 95e8055139SOndrej Zary .c_vendor = "Unknown", 96e8055139SOndrej Zary .c_x86_vendor = X86_VENDOR_UNKNOWN, 97e8055139SOndrej Zary }; 98e8055139SOndrej Zary 99148f9bb8SPaul Gortmaker static const struct cpu_dev *this_cpu = &default_cpu; 1000a488a53SYinghai Lu 10106deef89SBrian Gerst DEFINE_PER_CPU_PAGE_ALIGNED(struct gdt_page, gdt_page) = { .gdt = { 102950ad7ffSYinghai Lu #ifdef CONFIG_X86_64 10306deef89SBrian Gerst /* 10406deef89SBrian Gerst * We need valid kernel segments for data and code in long mode too 105950ad7ffSYinghai Lu * IRET will check the segment types kkeil 2000/10/28 106950ad7ffSYinghai Lu * Also sysret mandates a special GDT layout 10706deef89SBrian Gerst * 1089766cdbcSJaswinder Singh Rajput * TLS descriptors are currently at a different place compared to i386. 10906deef89SBrian Gerst * Hopefully nobody expects them at a fixed place (Wine?) 110950ad7ffSYinghai Lu */ 1111e5de182SAkinobu Mita [GDT_ENTRY_KERNEL32_CS] = GDT_ENTRY_INIT(0xc09b, 0, 0xfffff), 1121e5de182SAkinobu Mita [GDT_ENTRY_KERNEL_CS] = GDT_ENTRY_INIT(0xa09b, 0, 0xfffff), 1131e5de182SAkinobu Mita [GDT_ENTRY_KERNEL_DS] = GDT_ENTRY_INIT(0xc093, 0, 0xfffff), 1141e5de182SAkinobu Mita [GDT_ENTRY_DEFAULT_USER32_CS] = GDT_ENTRY_INIT(0xc0fb, 0, 0xfffff), 1151e5de182SAkinobu Mita [GDT_ENTRY_DEFAULT_USER_DS] = GDT_ENTRY_INIT(0xc0f3, 0, 0xfffff), 1161e5de182SAkinobu Mita [GDT_ENTRY_DEFAULT_USER_CS] = GDT_ENTRY_INIT(0xa0fb, 0, 0xfffff), 117950ad7ffSYinghai Lu #else 1181e5de182SAkinobu Mita [GDT_ENTRY_KERNEL_CS] = GDT_ENTRY_INIT(0xc09a, 0, 0xfffff), 1191e5de182SAkinobu Mita [GDT_ENTRY_KERNEL_DS] = GDT_ENTRY_INIT(0xc092, 0, 0xfffff), 1201e5de182SAkinobu Mita [GDT_ENTRY_DEFAULT_USER_CS] = GDT_ENTRY_INIT(0xc0fa, 0, 0xfffff), 1211e5de182SAkinobu Mita [GDT_ENTRY_DEFAULT_USER_DS] = GDT_ENTRY_INIT(0xc0f2, 0, 0xfffff), 122f7627e25SThomas Gleixner /* 123f7627e25SThomas Gleixner * Segments used for calling PnP BIOS have byte granularity. 124f7627e25SThomas Gleixner * They code segments and data segments have fixed 64k limits, 125f7627e25SThomas Gleixner * the transfer segment sizes are set at run time. 126f7627e25SThomas Gleixner */ 1276842ef0eSGlauber de Oliveira Costa /* 32-bit code */ 1281e5de182SAkinobu Mita [GDT_ENTRY_PNPBIOS_CS32] = GDT_ENTRY_INIT(0x409a, 0, 0xffff), 1296842ef0eSGlauber de Oliveira Costa /* 16-bit code */ 1301e5de182SAkinobu Mita [GDT_ENTRY_PNPBIOS_CS16] = GDT_ENTRY_INIT(0x009a, 0, 0xffff), 1316842ef0eSGlauber de Oliveira Costa /* 16-bit data */ 1321e5de182SAkinobu Mita [GDT_ENTRY_PNPBIOS_DS] = GDT_ENTRY_INIT(0x0092, 0, 0xffff), 1336842ef0eSGlauber de Oliveira Costa /* 16-bit data */ 1341e5de182SAkinobu Mita [GDT_ENTRY_PNPBIOS_TS1] = GDT_ENTRY_INIT(0x0092, 0, 0), 1356842ef0eSGlauber de Oliveira Costa /* 16-bit data */ 1361e5de182SAkinobu Mita [GDT_ENTRY_PNPBIOS_TS2] = GDT_ENTRY_INIT(0x0092, 0, 0), 137f7627e25SThomas Gleixner /* 138f7627e25SThomas Gleixner * The APM segments have byte granularity and their bases 139f7627e25SThomas Gleixner * are set at run time. All have 64k limits. 140f7627e25SThomas Gleixner */ 1416842ef0eSGlauber de Oliveira Costa /* 32-bit code */ 1421e5de182SAkinobu Mita [GDT_ENTRY_APMBIOS_BASE] = GDT_ENTRY_INIT(0x409a, 0, 0xffff), 143f7627e25SThomas Gleixner /* 16-bit code */ 1441e5de182SAkinobu Mita [GDT_ENTRY_APMBIOS_BASE+1] = GDT_ENTRY_INIT(0x009a, 0, 0xffff), 1456842ef0eSGlauber de Oliveira Costa /* data */ 14672c4d853SIngo Molnar [GDT_ENTRY_APMBIOS_BASE+2] = GDT_ENTRY_INIT(0x4092, 0, 0xffff), 147f7627e25SThomas Gleixner 1481e5de182SAkinobu Mita [GDT_ENTRY_ESPFIX_SS] = GDT_ENTRY_INIT(0xc092, 0, 0xfffff), 1491e5de182SAkinobu Mita [GDT_ENTRY_PERCPU] = GDT_ENTRY_INIT(0xc092, 0, 0xfffff), 15060a5317fSTejun Heo GDT_STACK_CANARY_INIT 151950ad7ffSYinghai Lu #endif 15206deef89SBrian Gerst } }; 153f7627e25SThomas Gleixner EXPORT_PER_CPU_SYMBOL_GPL(gdt_page); 154f7627e25SThomas Gleixner 1558c3641e9SDave Hansen static int __init x86_mpx_setup(char *s) 1560c752a93SSuresh Siddha { 1578c3641e9SDave Hansen /* require an exact match without trailing characters */ 1582cd3949fSDave Hansen if (strlen(s)) 1592cd3949fSDave Hansen return 0; 1600c752a93SSuresh Siddha 1618c3641e9SDave Hansen /* do not emit a message if the feature is not present */ 1628c3641e9SDave Hansen if (!boot_cpu_has(X86_FEATURE_MPX)) 1636bad06b7SSuresh Siddha return 1; 1646bad06b7SSuresh Siddha 1658c3641e9SDave Hansen setup_clear_cpu_cap(X86_FEATURE_MPX); 1668c3641e9SDave Hansen pr_info("nompx: Intel Memory Protection Extensions (MPX) disabled\n"); 167b6f42a4aSFenghua Yu return 1; 168b6f42a4aSFenghua Yu } 1698c3641e9SDave Hansen __setup("nompx", x86_mpx_setup); 170b6f42a4aSFenghua Yu 1710790c9aaSAndy Lutomirski #ifdef CONFIG_X86_64 172*c7ad5ad2SAndy Lutomirski static int __init x86_nopcid_setup(char *s) 1730790c9aaSAndy Lutomirski { 174*c7ad5ad2SAndy Lutomirski /* nopcid doesn't accept parameters */ 175*c7ad5ad2SAndy Lutomirski if (s) 176*c7ad5ad2SAndy Lutomirski return -EINVAL; 1770790c9aaSAndy Lutomirski 1780790c9aaSAndy Lutomirski /* do not emit a message if the feature is not present */ 1790790c9aaSAndy Lutomirski if (!boot_cpu_has(X86_FEATURE_PCID)) 180*c7ad5ad2SAndy Lutomirski return 0; 1810790c9aaSAndy Lutomirski 1820790c9aaSAndy Lutomirski setup_clear_cpu_cap(X86_FEATURE_PCID); 1830790c9aaSAndy Lutomirski pr_info("nopcid: PCID feature disabled\n"); 184*c7ad5ad2SAndy Lutomirski return 0; 1850790c9aaSAndy Lutomirski } 186*c7ad5ad2SAndy Lutomirski early_param("nopcid", x86_nopcid_setup); 1870790c9aaSAndy Lutomirski #endif 1880790c9aaSAndy Lutomirski 189d12a72b8SAndy Lutomirski static int __init x86_noinvpcid_setup(char *s) 190d12a72b8SAndy Lutomirski { 191d12a72b8SAndy Lutomirski /* noinvpcid doesn't accept parameters */ 192d12a72b8SAndy Lutomirski if (s) 193d12a72b8SAndy Lutomirski return -EINVAL; 194d12a72b8SAndy Lutomirski 195d12a72b8SAndy Lutomirski /* do not emit a message if the feature is not present */ 196d12a72b8SAndy Lutomirski if (!boot_cpu_has(X86_FEATURE_INVPCID)) 197d12a72b8SAndy Lutomirski return 0; 198d12a72b8SAndy Lutomirski 199d12a72b8SAndy Lutomirski setup_clear_cpu_cap(X86_FEATURE_INVPCID); 200d12a72b8SAndy Lutomirski pr_info("noinvpcid: INVPCID feature disabled\n"); 201d12a72b8SAndy Lutomirski return 0; 202d12a72b8SAndy Lutomirski } 203d12a72b8SAndy Lutomirski early_param("noinvpcid", x86_noinvpcid_setup); 204d12a72b8SAndy Lutomirski 205ba51dcedSYinghai Lu #ifdef CONFIG_X86_32 206148f9bb8SPaul Gortmaker static int cachesize_override = -1; 207148f9bb8SPaul Gortmaker static int disable_x86_serial_nr = 1; 208f7627e25SThomas Gleixner 209f7627e25SThomas Gleixner static int __init cachesize_setup(char *str) 210f7627e25SThomas Gleixner { 211f7627e25SThomas Gleixner get_option(&str, &cachesize_override); 212f7627e25SThomas Gleixner return 1; 213f7627e25SThomas Gleixner } 214f7627e25SThomas Gleixner __setup("cachesize=", cachesize_setup); 215f7627e25SThomas Gleixner 216f7627e25SThomas Gleixner static int __init x86_sep_setup(char *s) 217f7627e25SThomas Gleixner { 21813530257SAndi Kleen setup_clear_cpu_cap(X86_FEATURE_SEP); 219f7627e25SThomas Gleixner return 1; 220f7627e25SThomas Gleixner } 221f7627e25SThomas Gleixner __setup("nosep", x86_sep_setup); 222f7627e25SThomas Gleixner 223f7627e25SThomas Gleixner /* Standard macro to see if a specific flag is changeable */ 224f7627e25SThomas Gleixner static inline int flag_is_changeable_p(u32 flag) 225f7627e25SThomas Gleixner { 226f7627e25SThomas Gleixner u32 f1, f2; 227f7627e25SThomas Gleixner 22894f6bac1SKrzysztof Helt /* 22994f6bac1SKrzysztof Helt * Cyrix and IDT cpus allow disabling of CPUID 23094f6bac1SKrzysztof Helt * so the code below may return different results 23194f6bac1SKrzysztof Helt * when it is executed before and after enabling 23294f6bac1SKrzysztof Helt * the CPUID. Add "volatile" to not allow gcc to 23394f6bac1SKrzysztof Helt * optimize the subsequent calls to this function. 23494f6bac1SKrzysztof Helt */ 23594f6bac1SKrzysztof Helt asm volatile ("pushfl \n\t" 236f7627e25SThomas Gleixner "pushfl \n\t" 237f7627e25SThomas Gleixner "popl %0 \n\t" 238f7627e25SThomas Gleixner "movl %0, %1 \n\t" 239f7627e25SThomas Gleixner "xorl %2, %0 \n\t" 240f7627e25SThomas Gleixner "pushl %0 \n\t" 241f7627e25SThomas Gleixner "popfl \n\t" 242f7627e25SThomas Gleixner "pushfl \n\t" 243f7627e25SThomas Gleixner "popl %0 \n\t" 244f7627e25SThomas Gleixner "popfl \n\t" 2450f3fa48aSIngo Molnar 246f7627e25SThomas Gleixner : "=&r" (f1), "=&r" (f2) 247f7627e25SThomas Gleixner : "ir" (flag)); 248f7627e25SThomas Gleixner 249f7627e25SThomas Gleixner return ((f1^f2) & flag) != 0; 250f7627e25SThomas Gleixner } 251f7627e25SThomas Gleixner 252f7627e25SThomas Gleixner /* Probe for the CPUID instruction */ 253148f9bb8SPaul Gortmaker int have_cpuid_p(void) 254f7627e25SThomas Gleixner { 255f7627e25SThomas Gleixner return flag_is_changeable_p(X86_EFLAGS_ID); 256f7627e25SThomas Gleixner } 257f7627e25SThomas Gleixner 258148f9bb8SPaul Gortmaker static void squash_the_stupid_serial_number(struct cpuinfo_x86 *c) 2590a488a53SYinghai Lu { 2600a488a53SYinghai Lu unsigned long lo, hi; 2610f3fa48aSIngo Molnar 2620f3fa48aSIngo Molnar if (!cpu_has(c, X86_FEATURE_PN) || !disable_x86_serial_nr) 2630f3fa48aSIngo Molnar return; 2640f3fa48aSIngo Molnar 2650f3fa48aSIngo Molnar /* Disable processor serial number: */ 2660f3fa48aSIngo Molnar 2670a488a53SYinghai Lu rdmsr(MSR_IA32_BBL_CR_CTL, lo, hi); 2680a488a53SYinghai Lu lo |= 0x200000; 2690a488a53SYinghai Lu wrmsr(MSR_IA32_BBL_CR_CTL, lo, hi); 2700f3fa48aSIngo Molnar 2711b74dde7SChen Yucong pr_notice("CPU serial number disabled.\n"); 2720a488a53SYinghai Lu clear_cpu_cap(c, X86_FEATURE_PN); 2730a488a53SYinghai Lu 2740a488a53SYinghai Lu /* Disabling the serial number may affect the cpuid level */ 2750a488a53SYinghai Lu c->cpuid_level = cpuid_eax(0); 2760a488a53SYinghai Lu } 2770a488a53SYinghai Lu 2780a488a53SYinghai Lu static int __init x86_serial_nr_setup(char *s) 2790a488a53SYinghai Lu { 2800a488a53SYinghai Lu disable_x86_serial_nr = 0; 2810a488a53SYinghai Lu return 1; 2820a488a53SYinghai Lu } 2830a488a53SYinghai Lu __setup("serialnumber", x86_serial_nr_setup); 284ba51dcedSYinghai Lu #else 285102bbe3aSYinghai Lu static inline int flag_is_changeable_p(u32 flag) 286102bbe3aSYinghai Lu { 287102bbe3aSYinghai Lu return 1; 288102bbe3aSYinghai Lu } 289102bbe3aSYinghai Lu static inline void squash_the_stupid_serial_number(struct cpuinfo_x86 *c) 290102bbe3aSYinghai Lu { 291102bbe3aSYinghai Lu } 292ba51dcedSYinghai Lu #endif 2930a488a53SYinghai Lu 294de5397adSFenghua Yu static __init int setup_disable_smep(char *arg) 295de5397adSFenghua Yu { 296b2cc2a07SH. Peter Anvin setup_clear_cpu_cap(X86_FEATURE_SMEP); 2970f6ff2bcSDave Hansen /* Check for things that depend on SMEP being enabled: */ 2980f6ff2bcSDave Hansen check_mpx_erratum(&boot_cpu_data); 299de5397adSFenghua Yu return 1; 300de5397adSFenghua Yu } 301de5397adSFenghua Yu __setup("nosmep", setup_disable_smep); 302de5397adSFenghua Yu 303b2cc2a07SH. Peter Anvin static __always_inline void setup_smep(struct cpuinfo_x86 *c) 304de5397adSFenghua Yu { 305b2cc2a07SH. Peter Anvin if (cpu_has(c, X86_FEATURE_SMEP)) 306375074ccSAndy Lutomirski cr4_set_bits(X86_CR4_SMEP); 307de5397adSFenghua Yu } 308de5397adSFenghua Yu 30952b6179aSH. Peter Anvin static __init int setup_disable_smap(char *arg) 31052b6179aSH. Peter Anvin { 311b2cc2a07SH. Peter Anvin setup_clear_cpu_cap(X86_FEATURE_SMAP); 31252b6179aSH. Peter Anvin return 1; 31352b6179aSH. Peter Anvin } 31452b6179aSH. Peter Anvin __setup("nosmap", setup_disable_smap); 31552b6179aSH. Peter Anvin 316b2cc2a07SH. Peter Anvin static __always_inline void setup_smap(struct cpuinfo_x86 *c) 31752b6179aSH. Peter Anvin { 318581b7f15SAndrew Cooper unsigned long eflags = native_save_fl(); 319b2cc2a07SH. Peter Anvin 320b2cc2a07SH. Peter Anvin /* This should have been cleared long ago */ 321b2cc2a07SH. Peter Anvin BUG_ON(eflags & X86_EFLAGS_AC); 322b2cc2a07SH. Peter Anvin 32303bbd596SH. Peter Anvin if (cpu_has(c, X86_FEATURE_SMAP)) { 32403bbd596SH. Peter Anvin #ifdef CONFIG_X86_SMAP 325375074ccSAndy Lutomirski cr4_set_bits(X86_CR4_SMAP); 32603bbd596SH. Peter Anvin #else 327375074ccSAndy Lutomirski cr4_clear_bits(X86_CR4_SMAP); 32803bbd596SH. Peter Anvin #endif 32903bbd596SH. Peter Anvin } 330f7627e25SThomas Gleixner } 331f7627e25SThomas Gleixner 332f7627e25SThomas Gleixner /* 33306976945SDave Hansen * Protection Keys are not available in 32-bit mode. 33406976945SDave Hansen */ 33506976945SDave Hansen static bool pku_disabled; 33606976945SDave Hansen 33706976945SDave Hansen static __always_inline void setup_pku(struct cpuinfo_x86 *c) 33806976945SDave Hansen { 339e8df1a95SDave Hansen /* check the boot processor, plus compile options for PKU: */ 340e8df1a95SDave Hansen if (!cpu_feature_enabled(X86_FEATURE_PKU)) 341e8df1a95SDave Hansen return; 342e8df1a95SDave Hansen /* checks the actual processor's cpuid bits: */ 34306976945SDave Hansen if (!cpu_has(c, X86_FEATURE_PKU)) 34406976945SDave Hansen return; 34506976945SDave Hansen if (pku_disabled) 34606976945SDave Hansen return; 34706976945SDave Hansen 34806976945SDave Hansen cr4_set_bits(X86_CR4_PKE); 34906976945SDave Hansen /* 35006976945SDave Hansen * Seting X86_CR4_PKE will cause the X86_FEATURE_OSPKE 35106976945SDave Hansen * cpuid bit to be set. We need to ensure that we 35206976945SDave Hansen * update that bit in this CPU's "cpu_info". 35306976945SDave Hansen */ 35406976945SDave Hansen get_cpu_cap(c); 35506976945SDave Hansen } 35606976945SDave Hansen 35706976945SDave Hansen #ifdef CONFIG_X86_INTEL_MEMORY_PROTECTION_KEYS 35806976945SDave Hansen static __init int setup_disable_pku(char *arg) 35906976945SDave Hansen { 36006976945SDave Hansen /* 36106976945SDave Hansen * Do not clear the X86_FEATURE_PKU bit. All of the 36206976945SDave Hansen * runtime checks are against OSPKE so clearing the 36306976945SDave Hansen * bit does nothing. 36406976945SDave Hansen * 36506976945SDave Hansen * This way, we will see "pku" in cpuinfo, but not 36606976945SDave Hansen * "ospke", which is exactly what we want. It shows 36706976945SDave Hansen * that the CPU has PKU, but the OS has not enabled it. 36806976945SDave Hansen * This happens to be exactly how a system would look 36906976945SDave Hansen * if we disabled the config option. 37006976945SDave Hansen */ 37106976945SDave Hansen pr_info("x86: 'nopku' specified, disabling Memory Protection Keys\n"); 37206976945SDave Hansen pku_disabled = true; 37306976945SDave Hansen return 1; 37406976945SDave Hansen } 37506976945SDave Hansen __setup("nopku", setup_disable_pku); 37606976945SDave Hansen #endif /* CONFIG_X86_64 */ 37706976945SDave Hansen 37806976945SDave Hansen /* 379b38b0665SH. Peter Anvin * Some CPU features depend on higher CPUID levels, which may not always 380b38b0665SH. Peter Anvin * be available due to CPUID level capping or broken virtualization 381b38b0665SH. Peter Anvin * software. Add those features to this table to auto-disable them. 382b38b0665SH. Peter Anvin */ 383b38b0665SH. Peter Anvin struct cpuid_dependent_feature { 384b38b0665SH. Peter Anvin u32 feature; 385b38b0665SH. Peter Anvin u32 level; 386b38b0665SH. Peter Anvin }; 3870f3fa48aSIngo Molnar 388148f9bb8SPaul Gortmaker static const struct cpuid_dependent_feature 389b38b0665SH. Peter Anvin cpuid_dependent_features[] = { 390b38b0665SH. Peter Anvin { X86_FEATURE_MWAIT, 0x00000005 }, 391b38b0665SH. Peter Anvin { X86_FEATURE_DCA, 0x00000009 }, 392b38b0665SH. Peter Anvin { X86_FEATURE_XSAVE, 0x0000000d }, 393b38b0665SH. Peter Anvin { 0, 0 } 394b38b0665SH. Peter Anvin }; 395b38b0665SH. Peter Anvin 396148f9bb8SPaul Gortmaker static void filter_cpuid_features(struct cpuinfo_x86 *c, bool warn) 397b38b0665SH. Peter Anvin { 398b38b0665SH. Peter Anvin const struct cpuid_dependent_feature *df; 3999766cdbcSJaswinder Singh Rajput 400b38b0665SH. Peter Anvin for (df = cpuid_dependent_features; df->feature; df++) { 4010f3fa48aSIngo Molnar 4020f3fa48aSIngo Molnar if (!cpu_has(c, df->feature)) 4030f3fa48aSIngo Molnar continue; 404b38b0665SH. Peter Anvin /* 405b38b0665SH. Peter Anvin * Note: cpuid_level is set to -1 if unavailable, but 406b38b0665SH. Peter Anvin * extended_extended_level is set to 0 if unavailable 407b38b0665SH. Peter Anvin * and the legitimate extended levels are all negative 408b38b0665SH. Peter Anvin * when signed; hence the weird messing around with 409b38b0665SH. Peter Anvin * signs here... 410b38b0665SH. Peter Anvin */ 4110f3fa48aSIngo Molnar if (!((s32)df->level < 0 ? 412f6db44dfSYinghai Lu (u32)df->level > (u32)c->extended_cpuid_level : 4130f3fa48aSIngo Molnar (s32)df->level > (s32)c->cpuid_level)) 4140f3fa48aSIngo Molnar continue; 4150f3fa48aSIngo Molnar 416b38b0665SH. Peter Anvin clear_cpu_cap(c, df->feature); 4170f3fa48aSIngo Molnar if (!warn) 4180f3fa48aSIngo Molnar continue; 4190f3fa48aSIngo Molnar 4201b74dde7SChen Yucong pr_warn("CPU: CPU feature " X86_CAP_FMT " disabled, no CPUID level 0x%x\n", 4219def39beSJosh Triplett x86_cap_flag(df->feature), df->level); 422b38b0665SH. Peter Anvin } 423b38b0665SH. Peter Anvin } 424b38b0665SH. Peter Anvin 425b38b0665SH. Peter Anvin /* 426f7627e25SThomas Gleixner * Naming convention should be: <Name> [(<Codename>)] 427f7627e25SThomas Gleixner * This table only is used unless init_<vendor>() below doesn't set it; 4280f3fa48aSIngo Molnar * in particular, if CPUID levels 0x80000002..4 are supported, this 4290f3fa48aSIngo Molnar * isn't used 430f7627e25SThomas Gleixner */ 431f7627e25SThomas Gleixner 432f7627e25SThomas Gleixner /* Look up CPU names by table lookup. */ 433148f9bb8SPaul Gortmaker static const char *table_lookup_model(struct cpuinfo_x86 *c) 434f7627e25SThomas Gleixner { 43509dc68d9SJan Beulich #ifdef CONFIG_X86_32 43609dc68d9SJan Beulich const struct legacy_cpu_model_info *info; 437f7627e25SThomas Gleixner 438f7627e25SThomas Gleixner if (c->x86_model >= 16) 439f7627e25SThomas Gleixner return NULL; /* Range check */ 440f7627e25SThomas Gleixner 441f7627e25SThomas Gleixner if (!this_cpu) 442f7627e25SThomas Gleixner return NULL; 443f7627e25SThomas Gleixner 44409dc68d9SJan Beulich info = this_cpu->legacy_models; 445f7627e25SThomas Gleixner 44609dc68d9SJan Beulich while (info->family) { 447f7627e25SThomas Gleixner if (info->family == c->x86) 448f7627e25SThomas Gleixner return info->model_names[c->x86_model]; 449f7627e25SThomas Gleixner info++; 450f7627e25SThomas Gleixner } 45109dc68d9SJan Beulich #endif 452f7627e25SThomas Gleixner return NULL; /* Not found */ 453f7627e25SThomas Gleixner } 454f7627e25SThomas Gleixner 455148f9bb8SPaul Gortmaker __u32 cpu_caps_cleared[NCAPINTS]; 456148f9bb8SPaul Gortmaker __u32 cpu_caps_set[NCAPINTS]; 457f7627e25SThomas Gleixner 45811e3a840SJeremy Fitzhardinge void load_percpu_segment(int cpu) 4599d31d35bSYinghai Lu { 460fab334c1SYinghai Lu #ifdef CONFIG_X86_32 4612697fbd5SBrian Gerst loadsegment(fs, __KERNEL_PERCPU); 4622697fbd5SBrian Gerst #else 46345e876f7SAndy Lutomirski __loadsegment_simple(gs, 0); 4642697fbd5SBrian Gerst wrmsrl(MSR_GS_BASE, (unsigned long)per_cpu(irq_stack_union.gs_base, cpu)); 465fab334c1SYinghai Lu #endif 46660a5317fSTejun Heo load_stack_canary_segment(); 4679d31d35bSYinghai Lu } 4689d31d35bSYinghai Lu 46969218e47SThomas Garnier /* Setup the fixmap mapping only once per-processor */ 47069218e47SThomas Garnier static inline void setup_fixmap_gdt(int cpu) 47169218e47SThomas Garnier { 472b23adb7dSAndy Lutomirski #ifdef CONFIG_X86_64 473b23adb7dSAndy Lutomirski /* On 64-bit systems, we use a read-only fixmap GDT. */ 474b23adb7dSAndy Lutomirski pgprot_t prot = PAGE_KERNEL_RO; 475b23adb7dSAndy Lutomirski #else 476b23adb7dSAndy Lutomirski /* 477b23adb7dSAndy Lutomirski * On native 32-bit systems, the GDT cannot be read-only because 478b23adb7dSAndy Lutomirski * our double fault handler uses a task gate, and entering through 479b23adb7dSAndy Lutomirski * a task gate needs to change an available TSS to busy. If the GDT 480b23adb7dSAndy Lutomirski * is read-only, that will triple fault. 481b23adb7dSAndy Lutomirski * 482b23adb7dSAndy Lutomirski * On Xen PV, the GDT must be read-only because the hypervisor requires 483b23adb7dSAndy Lutomirski * it. 484b23adb7dSAndy Lutomirski */ 485b23adb7dSAndy Lutomirski pgprot_t prot = boot_cpu_has(X86_FEATURE_XENPV) ? 486b23adb7dSAndy Lutomirski PAGE_KERNEL_RO : PAGE_KERNEL; 487b23adb7dSAndy Lutomirski #endif 488b23adb7dSAndy Lutomirski 489b23adb7dSAndy Lutomirski __set_fixmap(get_cpu_gdt_ro_index(cpu), get_cpu_gdt_paddr(cpu), prot); 49069218e47SThomas Garnier } 49169218e47SThomas Garnier 49245fc8757SThomas Garnier /* Load the original GDT from the per-cpu structure */ 49345fc8757SThomas Garnier void load_direct_gdt(int cpu) 49445fc8757SThomas Garnier { 49545fc8757SThomas Garnier struct desc_ptr gdt_descr; 49645fc8757SThomas Garnier 49745fc8757SThomas Garnier gdt_descr.address = (long)get_cpu_gdt_rw(cpu); 49845fc8757SThomas Garnier gdt_descr.size = GDT_SIZE - 1; 49945fc8757SThomas Garnier load_gdt(&gdt_descr); 50045fc8757SThomas Garnier } 50145fc8757SThomas Garnier EXPORT_SYMBOL_GPL(load_direct_gdt); 50245fc8757SThomas Garnier 50369218e47SThomas Garnier /* Load a fixmap remapping of the per-cpu GDT */ 50469218e47SThomas Garnier void load_fixmap_gdt(int cpu) 50569218e47SThomas Garnier { 50669218e47SThomas Garnier struct desc_ptr gdt_descr; 50769218e47SThomas Garnier 50869218e47SThomas Garnier gdt_descr.address = (long)get_cpu_gdt_ro(cpu); 50969218e47SThomas Garnier gdt_descr.size = GDT_SIZE - 1; 51069218e47SThomas Garnier load_gdt(&gdt_descr); 51169218e47SThomas Garnier } 51245fc8757SThomas Garnier EXPORT_SYMBOL_GPL(load_fixmap_gdt); 51369218e47SThomas Garnier 5140f3fa48aSIngo Molnar /* 5150f3fa48aSIngo Molnar * Current gdt points %fs at the "master" per-cpu area: after this, 5160f3fa48aSIngo Molnar * it's on the real one. 5170f3fa48aSIngo Molnar */ 518552be871SBrian Gerst void switch_to_new_gdt(int cpu) 519f7627e25SThomas Gleixner { 52045fc8757SThomas Garnier /* Load the original GDT */ 52145fc8757SThomas Garnier load_direct_gdt(cpu); 522f7627e25SThomas Gleixner /* Reload the per-cpu base */ 52311e3a840SJeremy Fitzhardinge load_percpu_segment(cpu); 524f7627e25SThomas Gleixner } 525f7627e25SThomas Gleixner 526148f9bb8SPaul Gortmaker static const struct cpu_dev *cpu_devs[X86_VENDOR_NUM] = {}; 527f7627e25SThomas Gleixner 528148f9bb8SPaul Gortmaker static void get_model_name(struct cpuinfo_x86 *c) 529f7627e25SThomas Gleixner { 530f7627e25SThomas Gleixner unsigned int *v; 531ee098e1aSBorislav Petkov char *p, *q, *s; 532f7627e25SThomas Gleixner 5333da99c97SYinghai Lu if (c->extended_cpuid_level < 0x80000004) 5341b05d60dSYinghai Lu return; 535f7627e25SThomas Gleixner 536f7627e25SThomas Gleixner v = (unsigned int *)c->x86_model_id; 537f7627e25SThomas Gleixner cpuid(0x80000002, &v[0], &v[1], &v[2], &v[3]); 538f7627e25SThomas Gleixner cpuid(0x80000003, &v[4], &v[5], &v[6], &v[7]); 539f7627e25SThomas Gleixner cpuid(0x80000004, &v[8], &v[9], &v[10], &v[11]); 540f7627e25SThomas Gleixner c->x86_model_id[48] = 0; 541f7627e25SThomas Gleixner 542ee098e1aSBorislav Petkov /* Trim whitespace */ 543ee098e1aSBorislav Petkov p = q = s = &c->x86_model_id[0]; 544ee098e1aSBorislav Petkov 545ee098e1aSBorislav Petkov while (*p == ' ') 546ee098e1aSBorislav Petkov p++; 547ee098e1aSBorislav Petkov 548ee098e1aSBorislav Petkov while (*p) { 549ee098e1aSBorislav Petkov /* Note the last non-whitespace index */ 550ee098e1aSBorislav Petkov if (!isspace(*p)) 551ee098e1aSBorislav Petkov s = q; 552ee098e1aSBorislav Petkov 553ee098e1aSBorislav Petkov *q++ = *p++; 554ee098e1aSBorislav Petkov } 555ee098e1aSBorislav Petkov 556ee098e1aSBorislav Petkov *(s + 1) = '\0'; 557f7627e25SThomas Gleixner } 558f7627e25SThomas Gleixner 559148f9bb8SPaul Gortmaker void cpu_detect_cache_sizes(struct cpuinfo_x86 *c) 560f7627e25SThomas Gleixner { 5619d31d35bSYinghai Lu unsigned int n, dummy, ebx, ecx, edx, l2size; 562f7627e25SThomas Gleixner 5633da99c97SYinghai Lu n = c->extended_cpuid_level; 564f7627e25SThomas Gleixner 565f7627e25SThomas Gleixner if (n >= 0x80000005) { 5669d31d35bSYinghai Lu cpuid(0x80000005, &dummy, &ebx, &ecx, &edx); 567f7627e25SThomas Gleixner c->x86_cache_size = (ecx>>24) + (edx>>24); 568140fc727SYinghai Lu #ifdef CONFIG_X86_64 569140fc727SYinghai Lu /* On K8 L1 TLB is inclusive, so don't count it */ 570140fc727SYinghai Lu c->x86_tlbsize = 0; 571140fc727SYinghai Lu #endif 572f7627e25SThomas Gleixner } 573f7627e25SThomas Gleixner 574f7627e25SThomas Gleixner if (n < 0x80000006) /* Some chips just has a large L1. */ 575f7627e25SThomas Gleixner return; 576f7627e25SThomas Gleixner 5770a488a53SYinghai Lu cpuid(0x80000006, &dummy, &ebx, &ecx, &edx); 578f7627e25SThomas Gleixner l2size = ecx >> 16; 579f7627e25SThomas Gleixner 580140fc727SYinghai Lu #ifdef CONFIG_X86_64 581140fc727SYinghai Lu c->x86_tlbsize += ((ebx >> 16) & 0xfff) + (ebx & 0xfff); 582140fc727SYinghai Lu #else 583f7627e25SThomas Gleixner /* do processor-specific cache resizing */ 58409dc68d9SJan Beulich if (this_cpu->legacy_cache_size) 58509dc68d9SJan Beulich l2size = this_cpu->legacy_cache_size(c, l2size); 586f7627e25SThomas Gleixner 587f7627e25SThomas Gleixner /* Allow user to override all this if necessary. */ 588f7627e25SThomas Gleixner if (cachesize_override != -1) 589f7627e25SThomas Gleixner l2size = cachesize_override; 590f7627e25SThomas Gleixner 591f7627e25SThomas Gleixner if (l2size == 0) 592f7627e25SThomas Gleixner return; /* Again, no L2 cache is possible */ 593140fc727SYinghai Lu #endif 594f7627e25SThomas Gleixner 595f7627e25SThomas Gleixner c->x86_cache_size = l2size; 596f7627e25SThomas Gleixner } 597f7627e25SThomas Gleixner 598e0ba94f1SAlex Shi u16 __read_mostly tlb_lli_4k[NR_INFO]; 599e0ba94f1SAlex Shi u16 __read_mostly tlb_lli_2m[NR_INFO]; 600e0ba94f1SAlex Shi u16 __read_mostly tlb_lli_4m[NR_INFO]; 601e0ba94f1SAlex Shi u16 __read_mostly tlb_lld_4k[NR_INFO]; 602e0ba94f1SAlex Shi u16 __read_mostly tlb_lld_2m[NR_INFO]; 603e0ba94f1SAlex Shi u16 __read_mostly tlb_lld_4m[NR_INFO]; 604dd360393SKirill A. Shutemov u16 __read_mostly tlb_lld_1g[NR_INFO]; 605e0ba94f1SAlex Shi 606f94fe119SSteven Honeyman static void cpu_detect_tlb(struct cpuinfo_x86 *c) 607e0ba94f1SAlex Shi { 608e0ba94f1SAlex Shi if (this_cpu->c_detect_tlb) 609e0ba94f1SAlex Shi this_cpu->c_detect_tlb(c); 610e0ba94f1SAlex Shi 611f94fe119SSteven Honeyman pr_info("Last level iTLB entries: 4KB %d, 2MB %d, 4MB %d\n", 612e0ba94f1SAlex Shi tlb_lli_4k[ENTRIES], tlb_lli_2m[ENTRIES], 613f94fe119SSteven Honeyman tlb_lli_4m[ENTRIES]); 614f94fe119SSteven Honeyman 615f94fe119SSteven Honeyman pr_info("Last level dTLB entries: 4KB %d, 2MB %d, 4MB %d, 1GB %d\n", 616f94fe119SSteven Honeyman tlb_lld_4k[ENTRIES], tlb_lld_2m[ENTRIES], 617f94fe119SSteven Honeyman tlb_lld_4m[ENTRIES], tlb_lld_1g[ENTRIES]); 618e0ba94f1SAlex Shi } 619e0ba94f1SAlex Shi 620148f9bb8SPaul Gortmaker void detect_ht(struct cpuinfo_x86 *c) 6219d31d35bSYinghai Lu { 622c8e56d20SBorislav Petkov #ifdef CONFIG_SMP 6239d31d35bSYinghai Lu u32 eax, ebx, ecx, edx; 6249d31d35bSYinghai Lu int index_msb, core_bits; 6252eaad1fdSMike Travis static bool printed; 6269d31d35bSYinghai Lu 6270a488a53SYinghai Lu if (!cpu_has(c, X86_FEATURE_HT)) 6289d31d35bSYinghai Lu return; 6299d31d35bSYinghai Lu 6300a488a53SYinghai Lu if (cpu_has(c, X86_FEATURE_CMP_LEGACY)) 6310a488a53SYinghai Lu goto out; 6320a488a53SYinghai Lu 6331cd78776SYinghai Lu if (cpu_has(c, X86_FEATURE_XTOPOLOGY)) 6341cd78776SYinghai Lu return; 6351cd78776SYinghai Lu 6360a488a53SYinghai Lu cpuid(1, &eax, &ebx, &ecx, &edx); 6370a488a53SYinghai Lu 6389d31d35bSYinghai Lu smp_num_siblings = (ebx & 0xff0000) >> 16; 6399d31d35bSYinghai Lu 6409d31d35bSYinghai Lu if (smp_num_siblings == 1) { 6411b74dde7SChen Yucong pr_info_once("CPU0: Hyper-Threading is disabled\n"); 6420f3fa48aSIngo Molnar goto out; 6430f3fa48aSIngo Molnar } 6440f3fa48aSIngo Molnar 6450f3fa48aSIngo Molnar if (smp_num_siblings <= 1) 6460f3fa48aSIngo Molnar goto out; 6479d31d35bSYinghai Lu 6489d31d35bSYinghai Lu index_msb = get_count_order(smp_num_siblings); 649cb8cc442SIngo Molnar c->phys_proc_id = apic->phys_pkg_id(c->initial_apicid, index_msb); 6509d31d35bSYinghai Lu 6519d31d35bSYinghai Lu smp_num_siblings = smp_num_siblings / c->x86_max_cores; 6529d31d35bSYinghai Lu 6539d31d35bSYinghai Lu index_msb = get_count_order(smp_num_siblings); 6549d31d35bSYinghai Lu 6559d31d35bSYinghai Lu core_bits = get_count_order(c->x86_max_cores); 6569d31d35bSYinghai Lu 657cb8cc442SIngo Molnar c->cpu_core_id = apic->phys_pkg_id(c->initial_apicid, index_msb) & 6581cd78776SYinghai Lu ((1 << core_bits) - 1); 6599d31d35bSYinghai Lu 6600a488a53SYinghai Lu out: 6612eaad1fdSMike Travis if (!printed && (c->x86_max_cores * smp_num_siblings) > 1) { 6621b74dde7SChen Yucong pr_info("CPU: Physical Processor ID: %d\n", 6630a488a53SYinghai Lu c->phys_proc_id); 6641b74dde7SChen Yucong pr_info("CPU: Processor Core ID: %d\n", 6659d31d35bSYinghai Lu c->cpu_core_id); 6662eaad1fdSMike Travis printed = 1; 6679d31d35bSYinghai Lu } 6689d31d35bSYinghai Lu #endif 66997e4db7cSYinghai Lu } 670f7627e25SThomas Gleixner 671148f9bb8SPaul Gortmaker static void get_cpu_vendor(struct cpuinfo_x86 *c) 672f7627e25SThomas Gleixner { 673f7627e25SThomas Gleixner char *v = c->x86_vendor_id; 6740f3fa48aSIngo Molnar int i; 675f7627e25SThomas Gleixner 676f7627e25SThomas Gleixner for (i = 0; i < X86_VENDOR_NUM; i++) { 67710a434fcSYinghai Lu if (!cpu_devs[i]) 67810a434fcSYinghai Lu break; 67910a434fcSYinghai Lu 680f7627e25SThomas Gleixner if (!strcmp(v, cpu_devs[i]->c_ident[0]) || 681f7627e25SThomas Gleixner (cpu_devs[i]->c_ident[1] && 682f7627e25SThomas Gleixner !strcmp(v, cpu_devs[i]->c_ident[1]))) { 6830f3fa48aSIngo Molnar 684f7627e25SThomas Gleixner this_cpu = cpu_devs[i]; 68510a434fcSYinghai Lu c->x86_vendor = this_cpu->c_x86_vendor; 686f7627e25SThomas Gleixner return; 687f7627e25SThomas Gleixner } 688f7627e25SThomas Gleixner } 68910a434fcSYinghai Lu 6901b74dde7SChen Yucong pr_err_once("CPU: vendor_id '%s' unknown, using generic init.\n" \ 691a9c56953SMinchan Kim "CPU: Your system may be unstable.\n", v); 69210a434fcSYinghai Lu 693f7627e25SThomas Gleixner c->x86_vendor = X86_VENDOR_UNKNOWN; 694f7627e25SThomas Gleixner this_cpu = &default_cpu; 695f7627e25SThomas Gleixner } 696f7627e25SThomas Gleixner 697148f9bb8SPaul Gortmaker void cpu_detect(struct cpuinfo_x86 *c) 698f7627e25SThomas Gleixner { 699f7627e25SThomas Gleixner /* Get vendor name */ 7004a148513SHarvey Harrison cpuid(0x00000000, (unsigned int *)&c->cpuid_level, 7014a148513SHarvey Harrison (unsigned int *)&c->x86_vendor_id[0], 7024a148513SHarvey Harrison (unsigned int *)&c->x86_vendor_id[8], 7034a148513SHarvey Harrison (unsigned int *)&c->x86_vendor_id[4]); 704f7627e25SThomas Gleixner 705f7627e25SThomas Gleixner c->x86 = 4; 7069d31d35bSYinghai Lu /* Intel-defined flags: level 0x00000001 */ 707f7627e25SThomas Gleixner if (c->cpuid_level >= 0x00000001) { 708f7627e25SThomas Gleixner u32 junk, tfms, cap0, misc; 7090f3fa48aSIngo Molnar 710f7627e25SThomas Gleixner cpuid(0x00000001, &tfms, &misc, &junk, &cap0); 71199f925ceSBorislav Petkov c->x86 = x86_family(tfms); 71299f925ceSBorislav Petkov c->x86_model = x86_model(tfms); 71399f925ceSBorislav Petkov c->x86_mask = x86_stepping(tfms); 7140f3fa48aSIngo Molnar 715d4387bd3SHuang, Ying if (cap0 & (1<<19)) { 716d4387bd3SHuang, Ying c->x86_clflush_size = ((misc >> 8) & 0xff) * 8; 7179d31d35bSYinghai Lu c->x86_cache_alignment = c->x86_clflush_size; 718d4387bd3SHuang, Ying } 719f7627e25SThomas Gleixner } 720f7627e25SThomas Gleixner } 7213da99c97SYinghai Lu 7228bf1ebcaSAndy Lutomirski static void apply_forced_caps(struct cpuinfo_x86 *c) 7238bf1ebcaSAndy Lutomirski { 7248bf1ebcaSAndy Lutomirski int i; 7258bf1ebcaSAndy Lutomirski 7268bf1ebcaSAndy Lutomirski for (i = 0; i < NCAPINTS; i++) { 7278bf1ebcaSAndy Lutomirski c->x86_capability[i] &= ~cpu_caps_cleared[i]; 7288bf1ebcaSAndy Lutomirski c->x86_capability[i] |= cpu_caps_set[i]; 7298bf1ebcaSAndy Lutomirski } 7308bf1ebcaSAndy Lutomirski } 7318bf1ebcaSAndy Lutomirski 732148f9bb8SPaul Gortmaker void get_cpu_cap(struct cpuinfo_x86 *c) 733093af8d7SYinghai Lu { 73439c06df4SBorislav Petkov u32 eax, ebx, ecx, edx; 735093af8d7SYinghai Lu 736093af8d7SYinghai Lu /* Intel-defined flags: level 0x00000001 */ 737093af8d7SYinghai Lu if (c->cpuid_level >= 0x00000001) { 73839c06df4SBorislav Petkov cpuid(0x00000001, &eax, &ebx, &ecx, &edx); 7390f3fa48aSIngo Molnar 74039c06df4SBorislav Petkov c->x86_capability[CPUID_1_ECX] = ecx; 74139c06df4SBorislav Petkov c->x86_capability[CPUID_1_EDX] = edx; 742093af8d7SYinghai Lu } 743093af8d7SYinghai Lu 7443df8d920SAndy Lutomirski /* Thermal and Power Management Leaf: level 0x00000006 (eax) */ 7453df8d920SAndy Lutomirski if (c->cpuid_level >= 0x00000006) 7463df8d920SAndy Lutomirski c->x86_capability[CPUID_6_EAX] = cpuid_eax(0x00000006); 7473df8d920SAndy Lutomirski 748bdc802dcSH. Peter Anvin /* Additional Intel-defined flags: level 0x00000007 */ 749bdc802dcSH. Peter Anvin if (c->cpuid_level >= 0x00000007) { 750bdc802dcSH. Peter Anvin cpuid_count(0x00000007, 0, &eax, &ebx, &ecx, &edx); 75139c06df4SBorislav Petkov c->x86_capability[CPUID_7_0_EBX] = ebx; 752dfb4a70fSDave Hansen c->x86_capability[CPUID_7_ECX] = ecx; 753bdc802dcSH. Peter Anvin } 754bdc802dcSH. Peter Anvin 7556229ad27SFenghua Yu /* Extended state features: level 0x0000000d */ 7566229ad27SFenghua Yu if (c->cpuid_level >= 0x0000000d) { 7576229ad27SFenghua Yu cpuid_count(0x0000000d, 1, &eax, &ebx, &ecx, &edx); 7586229ad27SFenghua Yu 75939c06df4SBorislav Petkov c->x86_capability[CPUID_D_1_EAX] = eax; 7606229ad27SFenghua Yu } 7616229ad27SFenghua Yu 762cbc82b17SPeter P Waskiewicz Jr /* Additional Intel-defined flags: level 0x0000000F */ 763cbc82b17SPeter P Waskiewicz Jr if (c->cpuid_level >= 0x0000000F) { 764cbc82b17SPeter P Waskiewicz Jr 765cbc82b17SPeter P Waskiewicz Jr /* QoS sub-leaf, EAX=0Fh, ECX=0 */ 766cbc82b17SPeter P Waskiewicz Jr cpuid_count(0x0000000F, 0, &eax, &ebx, &ecx, &edx); 76739c06df4SBorislav Petkov c->x86_capability[CPUID_F_0_EDX] = edx; 76839c06df4SBorislav Petkov 769cbc82b17SPeter P Waskiewicz Jr if (cpu_has(c, X86_FEATURE_CQM_LLC)) { 770cbc82b17SPeter P Waskiewicz Jr /* will be overridden if occupancy monitoring exists */ 771cbc82b17SPeter P Waskiewicz Jr c->x86_cache_max_rmid = ebx; 772cbc82b17SPeter P Waskiewicz Jr 773cbc82b17SPeter P Waskiewicz Jr /* QoS sub-leaf, EAX=0Fh, ECX=1 */ 774cbc82b17SPeter P Waskiewicz Jr cpuid_count(0x0000000F, 1, &eax, &ebx, &ecx, &edx); 77539c06df4SBorislav Petkov c->x86_capability[CPUID_F_1_EDX] = edx; 77639c06df4SBorislav Petkov 77733c3cc7aSVikas Shivappa if ((cpu_has(c, X86_FEATURE_CQM_OCCUP_LLC)) || 77833c3cc7aSVikas Shivappa ((cpu_has(c, X86_FEATURE_CQM_MBM_TOTAL)) || 77933c3cc7aSVikas Shivappa (cpu_has(c, X86_FEATURE_CQM_MBM_LOCAL)))) { 780cbc82b17SPeter P Waskiewicz Jr c->x86_cache_max_rmid = ecx; 781cbc82b17SPeter P Waskiewicz Jr c->x86_cache_occ_scale = ebx; 782cbc82b17SPeter P Waskiewicz Jr } 783cbc82b17SPeter P Waskiewicz Jr } else { 784cbc82b17SPeter P Waskiewicz Jr c->x86_cache_max_rmid = -1; 785cbc82b17SPeter P Waskiewicz Jr c->x86_cache_occ_scale = -1; 786cbc82b17SPeter P Waskiewicz Jr } 787cbc82b17SPeter P Waskiewicz Jr } 788cbc82b17SPeter P Waskiewicz Jr 789093af8d7SYinghai Lu /* AMD-defined flags: level 0x80000001 */ 79039c06df4SBorislav Petkov eax = cpuid_eax(0x80000000); 79139c06df4SBorislav Petkov c->extended_cpuid_level = eax; 7920f3fa48aSIngo Molnar 79339c06df4SBorislav Petkov if ((eax & 0xffff0000) == 0x80000000) { 79439c06df4SBorislav Petkov if (eax >= 0x80000001) { 79539c06df4SBorislav Petkov cpuid(0x80000001, &eax, &ebx, &ecx, &edx); 79639c06df4SBorislav Petkov 79739c06df4SBorislav Petkov c->x86_capability[CPUID_8000_0001_ECX] = ecx; 79839c06df4SBorislav Petkov c->x86_capability[CPUID_8000_0001_EDX] = edx; 799093af8d7SYinghai Lu } 800093af8d7SYinghai Lu } 801093af8d7SYinghai Lu 80271faad43SYazen Ghannam if (c->extended_cpuid_level >= 0x80000007) { 80371faad43SYazen Ghannam cpuid(0x80000007, &eax, &ebx, &ecx, &edx); 80471faad43SYazen Ghannam 80571faad43SYazen Ghannam c->x86_capability[CPUID_8000_0007_EBX] = ebx; 80671faad43SYazen Ghannam c->x86_power = edx; 80771faad43SYazen Ghannam } 80871faad43SYazen Ghannam 8095122c890SYinghai Lu if (c->extended_cpuid_level >= 0x80000008) { 81039c06df4SBorislav Petkov cpuid(0x80000008, &eax, &ebx, &ecx, &edx); 8115122c890SYinghai Lu 8125122c890SYinghai Lu c->x86_virt_bits = (eax >> 8) & 0xff; 8135122c890SYinghai Lu c->x86_phys_bits = eax & 0xff; 81439c06df4SBorislav Petkov c->x86_capability[CPUID_8000_0008_EBX] = ebx; 8155122c890SYinghai Lu } 81613c6c532SJan Beulich #ifdef CONFIG_X86_32 81713c6c532SJan Beulich else if (cpu_has(c, X86_FEATURE_PAE) || cpu_has(c, X86_FEATURE_PSE36)) 81813c6c532SJan Beulich c->x86_phys_bits = 36; 8195122c890SYinghai Lu #endif 820e3224234SYinghai Lu 8212ccd71f1SBorislav Petkov if (c->extended_cpuid_level >= 0x8000000a) 82239c06df4SBorislav Petkov c->x86_capability[CPUID_8000_000A_EDX] = cpuid_edx(0x8000000a); 8232ccd71f1SBorislav Petkov 8241dedefd1SJacob Pan init_scattered_cpuid_features(c); 82560d34501SAndy Lutomirski 82660d34501SAndy Lutomirski /* 82760d34501SAndy Lutomirski * Clear/Set all flags overridden by options, after probe. 82860d34501SAndy Lutomirski * This needs to happen each time we re-probe, which may happen 82960d34501SAndy Lutomirski * several times during CPU initialization. 83060d34501SAndy Lutomirski */ 83160d34501SAndy Lutomirski apply_forced_caps(c); 832093af8d7SYinghai Lu } 833093af8d7SYinghai Lu 834148f9bb8SPaul Gortmaker static void identify_cpu_without_cpuid(struct cpuinfo_x86 *c) 835aef93c8bSYinghai Lu { 836aef93c8bSYinghai Lu #ifdef CONFIG_X86_32 837aef93c8bSYinghai Lu int i; 838aef93c8bSYinghai Lu 839aef93c8bSYinghai Lu /* 840aef93c8bSYinghai Lu * First of all, decide if this is a 486 or higher 841aef93c8bSYinghai Lu * It's a 486 if we can modify the AC flag 842aef93c8bSYinghai Lu */ 843aef93c8bSYinghai Lu if (flag_is_changeable_p(X86_EFLAGS_AC)) 844aef93c8bSYinghai Lu c->x86 = 4; 845aef93c8bSYinghai Lu else 846aef93c8bSYinghai Lu c->x86 = 3; 847aef93c8bSYinghai Lu 848aef93c8bSYinghai Lu for (i = 0; i < X86_VENDOR_NUM; i++) 849aef93c8bSYinghai Lu if (cpu_devs[i] && cpu_devs[i]->c_identify) { 850aef93c8bSYinghai Lu c->x86_vendor_id[0] = 0; 851aef93c8bSYinghai Lu cpu_devs[i]->c_identify(c); 852aef93c8bSYinghai Lu if (c->x86_vendor_id[0]) { 853aef93c8bSYinghai Lu get_cpu_vendor(c); 854aef93c8bSYinghai Lu break; 855aef93c8bSYinghai Lu } 856aef93c8bSYinghai Lu } 857aef93c8bSYinghai Lu #endif 858093af8d7SYinghai Lu } 859f7627e25SThomas Gleixner 86034048c9eSPaolo Ciarrocchi /* 86134048c9eSPaolo Ciarrocchi * Do minimum CPU detection early. 86234048c9eSPaolo Ciarrocchi * Fields really needed: vendor, cpuid_level, family, model, mask, 86334048c9eSPaolo Ciarrocchi * cache alignment. 86434048c9eSPaolo Ciarrocchi * The others are not touched to avoid unwanted side effects. 86534048c9eSPaolo Ciarrocchi * 86634048c9eSPaolo Ciarrocchi * WARNING: this function is only called on the BP. Don't add code here 86734048c9eSPaolo Ciarrocchi * that is supposed to run on all CPUs. 86834048c9eSPaolo Ciarrocchi */ 8693da99c97SYinghai Lu static void __init early_identify_cpu(struct cpuinfo_x86 *c) 870f7627e25SThomas Gleixner { 8716627d242SYinghai Lu #ifdef CONFIG_X86_64 8726627d242SYinghai Lu c->x86_clflush_size = 64; 87313c6c532SJan Beulich c->x86_phys_bits = 36; 87413c6c532SJan Beulich c->x86_virt_bits = 48; 8756627d242SYinghai Lu #else 876d4387bd3SHuang, Ying c->x86_clflush_size = 32; 87713c6c532SJan Beulich c->x86_phys_bits = 32; 87813c6c532SJan Beulich c->x86_virt_bits = 32; 8796627d242SYinghai Lu #endif 8800a488a53SYinghai Lu c->x86_cache_alignment = c->x86_clflush_size; 881f7627e25SThomas Gleixner 8823da99c97SYinghai Lu memset(&c->x86_capability, 0, sizeof c->x86_capability); 8830a488a53SYinghai Lu c->extended_cpuid_level = 0; 8840a488a53SYinghai Lu 885aef93c8bSYinghai Lu /* cyrix could have cpuid enabled via c_identify()*/ 88605fb3c19SAndy Lutomirski if (have_cpuid_p()) { 887f7627e25SThomas Gleixner cpu_detect(c); 8883da99c97SYinghai Lu get_cpu_vendor(c); 8893da99c97SYinghai Lu get_cpu_cap(c); 89078d1b296SBorislav Petkov setup_force_cpu_cap(X86_FEATURE_CPUID); 89112cf105cSKrzysztof Helt 89210a434fcSYinghai Lu if (this_cpu->c_early_init) 89310a434fcSYinghai Lu this_cpu->c_early_init(c); 8943da99c97SYinghai Lu 895f6e9456cSRobert Richter c->cpu_index = 0; 896b38b0665SH. Peter Anvin filter_cpuid_features(c, false); 897de5397adSFenghua Yu 898a110b5ecSBorislav Petkov if (this_cpu->c_bsp_init) 899a110b5ecSBorislav Petkov this_cpu->c_bsp_init(c); 90078d1b296SBorislav Petkov } else { 90178d1b296SBorislav Petkov identify_cpu_without_cpuid(c); 90278d1b296SBorislav Petkov setup_clear_cpu_cap(X86_FEATURE_CPUID); 90305fb3c19SAndy Lutomirski } 904c3b83598SBorislav Petkov 905c3b83598SBorislav Petkov setup_force_cpu_cap(X86_FEATURE_ALWAYS); 906db52ef74SIngo Molnar fpu__init_system(c); 907f7627e25SThomas Gleixner } 908f7627e25SThomas Gleixner 9099d31d35bSYinghai Lu void __init early_cpu_init(void) 9109d31d35bSYinghai Lu { 91102dde8b4SJan Beulich const struct cpu_dev *const *cdev; 91210a434fcSYinghai Lu int count = 0; 9139d31d35bSYinghai Lu 914ac23f253SJan Beulich #ifdef CONFIG_PROCESSOR_SELECT 9151b74dde7SChen Yucong pr_info("KERNEL supported cpus:\n"); 91631c997caSIngo Molnar #endif 91731c997caSIngo Molnar 91810a434fcSYinghai Lu for (cdev = __x86_cpu_dev_start; cdev < __x86_cpu_dev_end; cdev++) { 91902dde8b4SJan Beulich const struct cpu_dev *cpudev = *cdev; 9209d31d35bSYinghai Lu 92110a434fcSYinghai Lu if (count >= X86_VENDOR_NUM) 92210a434fcSYinghai Lu break; 92310a434fcSYinghai Lu cpu_devs[count] = cpudev; 92410a434fcSYinghai Lu count++; 92510a434fcSYinghai Lu 926ac23f253SJan Beulich #ifdef CONFIG_PROCESSOR_SELECT 92731c997caSIngo Molnar { 92831c997caSIngo Molnar unsigned int j; 92931c997caSIngo Molnar 93010a434fcSYinghai Lu for (j = 0; j < 2; j++) { 93110a434fcSYinghai Lu if (!cpudev->c_ident[j]) 93210a434fcSYinghai Lu continue; 9331b74dde7SChen Yucong pr_info(" %s %s\n", cpudev->c_vendor, 93410a434fcSYinghai Lu cpudev->c_ident[j]); 93510a434fcSYinghai Lu } 93610a434fcSYinghai Lu } 9370388423dSDave Jones #endif 93831c997caSIngo Molnar } 9399d31d35bSYinghai Lu early_identify_cpu(&boot_cpu_data); 940f7627e25SThomas Gleixner } 941f7627e25SThomas Gleixner 942b6734c35SH. Peter Anvin /* 943366d4a43SBorislav Petkov * The NOPL instruction is supposed to exist on all CPUs of family >= 6; 944366d4a43SBorislav Petkov * unfortunately, that's not true in practice because of early VIA 945366d4a43SBorislav Petkov * chips and (more importantly) broken virtualizers that are not easy 946366d4a43SBorislav Petkov * to detect. In the latter case it doesn't even *fail* reliably, so 947366d4a43SBorislav Petkov * probing for it doesn't even work. Disable it completely on 32-bit 948ba0593bfSH. Peter Anvin * unless we can find a reliable way to detect all the broken cases. 949366d4a43SBorislav Petkov * Enable it explicitly on 64-bit for non-constant inputs of cpu_has(). 950b6734c35SH. Peter Anvin */ 951148f9bb8SPaul Gortmaker static void detect_nopl(struct cpuinfo_x86 *c) 952b6734c35SH. Peter Anvin { 953366d4a43SBorislav Petkov #ifdef CONFIG_X86_32 954b6734c35SH. Peter Anvin clear_cpu_cap(c, X86_FEATURE_NOPL); 955366d4a43SBorislav Petkov #else 956366d4a43SBorislav Petkov set_cpu_cap(c, X86_FEATURE_NOPL); 957366d4a43SBorislav Petkov #endif 958f7627e25SThomas Gleixner } 959f7627e25SThomas Gleixner 9607a5d6704SAndy Lutomirski static void detect_null_seg_behavior(struct cpuinfo_x86 *c) 9617a5d6704SAndy Lutomirski { 9627a5d6704SAndy Lutomirski #ifdef CONFIG_X86_64 963f7627e25SThomas Gleixner /* 9647a5d6704SAndy Lutomirski * Empirically, writing zero to a segment selector on AMD does 9657a5d6704SAndy Lutomirski * not clear the base, whereas writing zero to a segment 9667a5d6704SAndy Lutomirski * selector on Intel does clear the base. Intel's behavior 9677a5d6704SAndy Lutomirski * allows slightly faster context switches in the common case 9687a5d6704SAndy Lutomirski * where GS is unused by the prev and next threads. 969f7627e25SThomas Gleixner * 9707a5d6704SAndy Lutomirski * Since neither vendor documents this anywhere that I can see, 9717a5d6704SAndy Lutomirski * detect it directly instead of hardcoding the choice by 9727a5d6704SAndy Lutomirski * vendor. 9737a5d6704SAndy Lutomirski * 9747a5d6704SAndy Lutomirski * I've designated AMD's behavior as the "bug" because it's 9757a5d6704SAndy Lutomirski * counterintuitive and less friendly. 976f7627e25SThomas Gleixner */ 9777a5d6704SAndy Lutomirski 9787a5d6704SAndy Lutomirski unsigned long old_base, tmp; 9797a5d6704SAndy Lutomirski rdmsrl(MSR_FS_BASE, old_base); 9807a5d6704SAndy Lutomirski wrmsrl(MSR_FS_BASE, 1); 9817a5d6704SAndy Lutomirski loadsegment(fs, 0); 9827a5d6704SAndy Lutomirski rdmsrl(MSR_FS_BASE, tmp); 9837a5d6704SAndy Lutomirski if (tmp != 0) 9847a5d6704SAndy Lutomirski set_cpu_bug(c, X86_BUG_NULL_SEG); 9857a5d6704SAndy Lutomirski wrmsrl(MSR_FS_BASE, old_base); 9863da99c97SYinghai Lu #endif 987f7627e25SThomas Gleixner } 988aef93c8bSYinghai Lu 989148f9bb8SPaul Gortmaker static void generic_identify(struct cpuinfo_x86 *c) 990f7627e25SThomas Gleixner { 991f7627e25SThomas Gleixner c->extended_cpuid_level = 0; 992f7627e25SThomas Gleixner 993aef93c8bSYinghai Lu if (!have_cpuid_p()) 994aef93c8bSYinghai Lu identify_cpu_without_cpuid(c); 995f7627e25SThomas Gleixner 996aef93c8bSYinghai Lu /* cyrix could have cpuid enabled via c_identify()*/ 997a9853dd6SIngo Molnar if (!have_cpuid_p()) 998aef93c8bSYinghai Lu return; 999aef93c8bSYinghai Lu 10003da99c97SYinghai Lu cpu_detect(c); 10013da99c97SYinghai Lu 10023da99c97SYinghai Lu get_cpu_vendor(c); 10033da99c97SYinghai Lu 10043da99c97SYinghai Lu get_cpu_cap(c); 10053da99c97SYinghai Lu 1006f7627e25SThomas Gleixner if (c->cpuid_level >= 0x00000001) { 10073da99c97SYinghai Lu c->initial_apicid = (cpuid_ebx(1) >> 24) & 0xFF; 1008b89d3b3eSYinghai Lu #ifdef CONFIG_X86_32 1009c8e56d20SBorislav Petkov # ifdef CONFIG_SMP 1010cb8cc442SIngo Molnar c->apicid = apic->phys_pkg_id(c->initial_apicid, 0); 1011f7627e25SThomas Gleixner # else 101201aaea1aSYinghai Lu c->apicid = c->initial_apicid; 1013f7627e25SThomas Gleixner # endif 1014b89d3b3eSYinghai Lu #endif 1015b89d3b3eSYinghai Lu c->phys_proc_id = c->initial_apicid; 1016f7627e25SThomas Gleixner } 1017f7627e25SThomas Gleixner 1018f7627e25SThomas Gleixner get_model_name(c); /* Default name */ 1019f7627e25SThomas Gleixner 1020b6734c35SH. Peter Anvin detect_nopl(c); 10217a5d6704SAndy Lutomirski 10227a5d6704SAndy Lutomirski detect_null_seg_behavior(c); 10230230bb03SAndy Lutomirski 10240230bb03SAndy Lutomirski /* 10250230bb03SAndy Lutomirski * ESPFIX is a strange bug. All real CPUs have it. Paravirt 10260230bb03SAndy Lutomirski * systems that run Linux at CPL > 0 may or may not have the 10270230bb03SAndy Lutomirski * issue, but, even if they have the issue, there's absolutely 10280230bb03SAndy Lutomirski * nothing we can do about it because we can't use the real IRET 10290230bb03SAndy Lutomirski * instruction. 10300230bb03SAndy Lutomirski * 10310230bb03SAndy Lutomirski * NB: For the time being, only 32-bit kernels support 10320230bb03SAndy Lutomirski * X86_BUG_ESPFIX as such. 64-bit kernels directly choose 10330230bb03SAndy Lutomirski * whether to apply espfix using paravirt hooks. If any 10340230bb03SAndy Lutomirski * non-paravirt system ever shows up that does *not* have the 10350230bb03SAndy Lutomirski * ESPFIX issue, we can change this. 10360230bb03SAndy Lutomirski */ 10370230bb03SAndy Lutomirski #ifdef CONFIG_X86_32 10380230bb03SAndy Lutomirski # ifdef CONFIG_PARAVIRT 10390230bb03SAndy Lutomirski do { 10400230bb03SAndy Lutomirski extern void native_iret(void); 10410230bb03SAndy Lutomirski if (pv_cpu_ops.iret == native_iret) 10420230bb03SAndy Lutomirski set_cpu_bug(c, X86_BUG_ESPFIX); 10430230bb03SAndy Lutomirski } while (0); 10440230bb03SAndy Lutomirski # else 10450230bb03SAndy Lutomirski set_cpu_bug(c, X86_BUG_ESPFIX); 10460230bb03SAndy Lutomirski # endif 10470230bb03SAndy Lutomirski #endif 1048f7627e25SThomas Gleixner } 1049f7627e25SThomas Gleixner 1050cbc82b17SPeter P Waskiewicz Jr static void x86_init_cache_qos(struct cpuinfo_x86 *c) 1051cbc82b17SPeter P Waskiewicz Jr { 1052cbc82b17SPeter P Waskiewicz Jr /* 1053cbc82b17SPeter P Waskiewicz Jr * The heavy lifting of max_rmid and cache_occ_scale are handled 1054cbc82b17SPeter P Waskiewicz Jr * in get_cpu_cap(). Here we just set the max_rmid for the boot_cpu 1055cbc82b17SPeter P Waskiewicz Jr * in case CQM bits really aren't there in this CPU. 1056cbc82b17SPeter P Waskiewicz Jr */ 1057cbc82b17SPeter P Waskiewicz Jr if (c != &boot_cpu_data) { 1058cbc82b17SPeter P Waskiewicz Jr boot_cpu_data.x86_cache_max_rmid = 1059cbc82b17SPeter P Waskiewicz Jr min(boot_cpu_data.x86_cache_max_rmid, 1060cbc82b17SPeter P Waskiewicz Jr c->x86_cache_max_rmid); 1061cbc82b17SPeter P Waskiewicz Jr } 1062cbc82b17SPeter P Waskiewicz Jr } 1063cbc82b17SPeter P Waskiewicz Jr 1064f7627e25SThomas Gleixner /* 10659d85eb91SThomas Gleixner * Validate that ACPI/mptables have the same information about the 10669d85eb91SThomas Gleixner * effective APIC id and update the package map. 1067d49597fdSThomas Gleixner */ 10689d85eb91SThomas Gleixner static void validate_apic_and_package_id(struct cpuinfo_x86 *c) 1069d49597fdSThomas Gleixner { 1070d49597fdSThomas Gleixner #ifdef CONFIG_SMP 10719d85eb91SThomas Gleixner unsigned int apicid, cpu = smp_processor_id(); 1072d49597fdSThomas Gleixner 1073d49597fdSThomas Gleixner apicid = apic->cpu_present_to_apicid(cpu); 1074d49597fdSThomas Gleixner 10759d85eb91SThomas Gleixner if (apicid != c->apicid) { 10769d85eb91SThomas Gleixner pr_err(FW_BUG "CPU%u: APIC id mismatch. Firmware: %x APIC: %x\n", 1077d49597fdSThomas Gleixner cpu, apicid, c->initial_apicid); 1078d49597fdSThomas Gleixner } 10799d85eb91SThomas Gleixner BUG_ON(topology_update_package_map(c->phys_proc_id, cpu)); 1080d49597fdSThomas Gleixner #else 1081d49597fdSThomas Gleixner c->logical_proc_id = 0; 1082d49597fdSThomas Gleixner #endif 1083d49597fdSThomas Gleixner } 1084d49597fdSThomas Gleixner 1085d49597fdSThomas Gleixner /* 1086f7627e25SThomas Gleixner * This does the hard work of actually picking apart the CPU stuff... 1087f7627e25SThomas Gleixner */ 1088148f9bb8SPaul Gortmaker static void identify_cpu(struct cpuinfo_x86 *c) 1089f7627e25SThomas Gleixner { 1090f7627e25SThomas Gleixner int i; 1091f7627e25SThomas Gleixner 1092f7627e25SThomas Gleixner c->loops_per_jiffy = loops_per_jiffy; 1093f7627e25SThomas Gleixner c->x86_cache_size = -1; 1094f7627e25SThomas Gleixner c->x86_vendor = X86_VENDOR_UNKNOWN; 1095f7627e25SThomas Gleixner c->x86_model = c->x86_mask = 0; /* So far unknown... */ 1096f7627e25SThomas Gleixner c->x86_vendor_id[0] = '\0'; /* Unset */ 1097f7627e25SThomas Gleixner c->x86_model_id[0] = '\0'; /* Unset */ 1098f7627e25SThomas Gleixner c->x86_max_cores = 1; 1099102bbe3aSYinghai Lu c->x86_coreid_bits = 0; 110079a8b9aaSBorislav Petkov c->cu_id = 0xff; 110111fdd252SYinghai Lu #ifdef CONFIG_X86_64 1102102bbe3aSYinghai Lu c->x86_clflush_size = 64; 110313c6c532SJan Beulich c->x86_phys_bits = 36; 110413c6c532SJan Beulich c->x86_virt_bits = 48; 1105102bbe3aSYinghai Lu #else 1106102bbe3aSYinghai Lu c->cpuid_level = -1; /* CPUID not detected */ 1107f7627e25SThomas Gleixner c->x86_clflush_size = 32; 110813c6c532SJan Beulich c->x86_phys_bits = 32; 110913c6c532SJan Beulich c->x86_virt_bits = 32; 1110102bbe3aSYinghai Lu #endif 1111102bbe3aSYinghai Lu c->x86_cache_alignment = c->x86_clflush_size; 1112f7627e25SThomas Gleixner memset(&c->x86_capability, 0, sizeof c->x86_capability); 1113f7627e25SThomas Gleixner 1114f7627e25SThomas Gleixner generic_identify(c); 1115f7627e25SThomas Gleixner 11163898534dSAndi Kleen if (this_cpu->c_identify) 1117f7627e25SThomas Gleixner this_cpu->c_identify(c); 1118f7627e25SThomas Gleixner 11196a6256f9SAdam Buchbinder /* Clear/Set all flags overridden by options, after probe */ 11208bf1ebcaSAndy Lutomirski apply_forced_caps(c); 11212759c328SYinghai Lu 1122102bbe3aSYinghai Lu #ifdef CONFIG_X86_64 1123cb8cc442SIngo Molnar c->apicid = apic->phys_pkg_id(c->initial_apicid, 0); 1124102bbe3aSYinghai Lu #endif 1125102bbe3aSYinghai Lu 1126f7627e25SThomas Gleixner /* 1127f7627e25SThomas Gleixner * Vendor-specific initialization. In this section we 1128f7627e25SThomas Gleixner * canonicalize the feature flags, meaning if there are 1129f7627e25SThomas Gleixner * features a certain CPU supports which CPUID doesn't 1130f7627e25SThomas Gleixner * tell us, CPUID claiming incorrect flags, or other bugs, 1131f7627e25SThomas Gleixner * we handle them here. 1132f7627e25SThomas Gleixner * 1133f7627e25SThomas Gleixner * At the end of this section, c->x86_capability better 1134f7627e25SThomas Gleixner * indicate the features this CPU genuinely supports! 1135f7627e25SThomas Gleixner */ 1136f7627e25SThomas Gleixner if (this_cpu->c_init) 1137f7627e25SThomas Gleixner this_cpu->c_init(c); 1138f7627e25SThomas Gleixner 1139f7627e25SThomas Gleixner /* Disable the PN if appropriate */ 1140f7627e25SThomas Gleixner squash_the_stupid_serial_number(c); 1141f7627e25SThomas Gleixner 1142b2cc2a07SH. Peter Anvin /* Set up SMEP/SMAP */ 1143b2cc2a07SH. Peter Anvin setup_smep(c); 1144b2cc2a07SH. Peter Anvin setup_smap(c); 1145b2cc2a07SH. Peter Anvin 1146f7627e25SThomas Gleixner /* 11470f3fa48aSIngo Molnar * The vendor-specific functions might have changed features. 11480f3fa48aSIngo Molnar * Now we do "generic changes." 1149f7627e25SThomas Gleixner */ 1150f7627e25SThomas Gleixner 1151b38b0665SH. Peter Anvin /* Filter out anything that depends on CPUID levels we don't have */ 1152b38b0665SH. Peter Anvin filter_cpuid_features(c, true); 1153b38b0665SH. Peter Anvin 1154f7627e25SThomas Gleixner /* If the model name is still unset, do table lookup. */ 1155f7627e25SThomas Gleixner if (!c->x86_model_id[0]) { 115602dde8b4SJan Beulich const char *p; 1157f7627e25SThomas Gleixner p = table_lookup_model(c); 1158f7627e25SThomas Gleixner if (p) 1159f7627e25SThomas Gleixner strcpy(c->x86_model_id, p); 1160f7627e25SThomas Gleixner else 1161f7627e25SThomas Gleixner /* Last resort... */ 1162f7627e25SThomas Gleixner sprintf(c->x86_model_id, "%02x/%02x", 1163f7627e25SThomas Gleixner c->x86, c->x86_model); 1164f7627e25SThomas Gleixner } 1165f7627e25SThomas Gleixner 1166102bbe3aSYinghai Lu #ifdef CONFIG_X86_64 1167102bbe3aSYinghai Lu detect_ht(c); 1168102bbe3aSYinghai Lu #endif 1169102bbe3aSYinghai Lu 117049d859d7SH. Peter Anvin x86_init_rdrand(c); 1171cbc82b17SPeter P Waskiewicz Jr x86_init_cache_qos(c); 117206976945SDave Hansen setup_pku(c); 11733e0c3737SYinghai Lu 11743e0c3737SYinghai Lu /* 11756a6256f9SAdam Buchbinder * Clear/Set all flags overridden by options, need do it 11763e0c3737SYinghai Lu * before following smp all cpus cap AND. 11773e0c3737SYinghai Lu */ 11788bf1ebcaSAndy Lutomirski apply_forced_caps(c); 11793e0c3737SYinghai Lu 1180f7627e25SThomas Gleixner /* 1181f7627e25SThomas Gleixner * On SMP, boot_cpu_data holds the common feature set between 1182f7627e25SThomas Gleixner * all CPUs; so make sure that we indicate which features are 1183f7627e25SThomas Gleixner * common between the CPUs. The first time this routine gets 1184f7627e25SThomas Gleixner * executed, c == &boot_cpu_data. 1185f7627e25SThomas Gleixner */ 1186f7627e25SThomas Gleixner if (c != &boot_cpu_data) { 1187f7627e25SThomas Gleixner /* AND the already accumulated flags with these */ 1188f7627e25SThomas Gleixner for (i = 0; i < NCAPINTS; i++) 1189f7627e25SThomas Gleixner boot_cpu_data.x86_capability[i] &= c->x86_capability[i]; 119065fc985bSBorislav Petkov 119165fc985bSBorislav Petkov /* OR, i.e. replicate the bug flags */ 119265fc985bSBorislav Petkov for (i = NCAPINTS; i < NCAPINTS + NBUGINTS; i++) 119365fc985bSBorislav Petkov c->x86_capability[i] |= boot_cpu_data.x86_capability[i]; 1194f7627e25SThomas Gleixner } 1195f7627e25SThomas Gleixner 1196f7627e25SThomas Gleixner /* Init Machine Check Exception if available. */ 11975e09954aSBorislav Petkov mcheck_cpu_init(c); 119830d432dfSAndi Kleen 119930d432dfSAndi Kleen select_idle_routine(c); 1200102bbe3aSYinghai Lu 1201de2d9445STejun Heo #ifdef CONFIG_NUMA 1202102bbe3aSYinghai Lu numa_add_cpu(smp_processor_id()); 1203102bbe3aSYinghai Lu #endif 1204f7627e25SThomas Gleixner } 1205f7627e25SThomas Gleixner 12068b6c0ab1SIngo Molnar /* 12078b6c0ab1SIngo Molnar * Set up the CPU state needed to execute SYSENTER/SYSEXIT instructions 12088b6c0ab1SIngo Molnar * on 32-bit kernels: 12098b6c0ab1SIngo Molnar */ 1210cfda7bb9SAndy Lutomirski #ifdef CONFIG_X86_32 1211cfda7bb9SAndy Lutomirski void enable_sep_cpu(void) 1212cfda7bb9SAndy Lutomirski { 12138b6c0ab1SIngo Molnar struct tss_struct *tss; 12148b6c0ab1SIngo Molnar int cpu; 1215cfda7bb9SAndy Lutomirski 1216b3edfda4SBorislav Petkov if (!boot_cpu_has(X86_FEATURE_SEP)) 1217b3edfda4SBorislav Petkov return; 1218b3edfda4SBorislav Petkov 12198b6c0ab1SIngo Molnar cpu = get_cpu(); 12208b6c0ab1SIngo Molnar tss = &per_cpu(cpu_tss, cpu); 12218b6c0ab1SIngo Molnar 12228b6c0ab1SIngo Molnar /* 1223cf9328ccSAndy Lutomirski * We cache MSR_IA32_SYSENTER_CS's value in the TSS's ss1 field -- 1224cf9328ccSAndy Lutomirski * see the big comment in struct x86_hw_tss's definition. 12258b6c0ab1SIngo Molnar */ 1226cfda7bb9SAndy Lutomirski 1227cfda7bb9SAndy Lutomirski tss->x86_tss.ss1 = __KERNEL_CS; 12288b6c0ab1SIngo Molnar wrmsr(MSR_IA32_SYSENTER_CS, tss->x86_tss.ss1, 0); 12298b6c0ab1SIngo Molnar 1230cf9328ccSAndy Lutomirski wrmsr(MSR_IA32_SYSENTER_ESP, 1231cf9328ccSAndy Lutomirski (unsigned long)tss + offsetofend(struct tss_struct, SYSENTER_stack), 1232cf9328ccSAndy Lutomirski 0); 12338b6c0ab1SIngo Molnar 12344c8cd0c5SIngo Molnar wrmsr(MSR_IA32_SYSENTER_EIP, (unsigned long)entry_SYSENTER_32, 0); 12358b6c0ab1SIngo Molnar 1236cfda7bb9SAndy Lutomirski put_cpu(); 1237cfda7bb9SAndy Lutomirski } 1238e04d645fSGlauber Costa #endif 1239e04d645fSGlauber Costa 1240f7627e25SThomas Gleixner void __init identify_boot_cpu(void) 1241f7627e25SThomas Gleixner { 1242f7627e25SThomas Gleixner identify_cpu(&boot_cpu_data); 1243102bbe3aSYinghai Lu #ifdef CONFIG_X86_32 1244f7627e25SThomas Gleixner sysenter_setup(); 1245f7627e25SThomas Gleixner enable_sep_cpu(); 1246102bbe3aSYinghai Lu #endif 1247e0ba94f1SAlex Shi cpu_detect_tlb(&boot_cpu_data); 1248f7627e25SThomas Gleixner } 1249f7627e25SThomas Gleixner 1250148f9bb8SPaul Gortmaker void identify_secondary_cpu(struct cpuinfo_x86 *c) 1251f7627e25SThomas Gleixner { 1252f7627e25SThomas Gleixner BUG_ON(c == &boot_cpu_data); 1253f7627e25SThomas Gleixner identify_cpu(c); 1254102bbe3aSYinghai Lu #ifdef CONFIG_X86_32 1255f7627e25SThomas Gleixner enable_sep_cpu(); 1256102bbe3aSYinghai Lu #endif 1257f7627e25SThomas Gleixner mtrr_ap_init(); 12589d85eb91SThomas Gleixner validate_apic_and_package_id(c); 1259f7627e25SThomas Gleixner } 1260f7627e25SThomas Gleixner 1261191679fdSAndi Kleen static __init int setup_noclflush(char *arg) 1262191679fdSAndi Kleen { 1263840d2830SH. Peter Anvin setup_clear_cpu_cap(X86_FEATURE_CLFLUSH); 1264da4aaa7dSH. Peter Anvin setup_clear_cpu_cap(X86_FEATURE_CLFLUSHOPT); 1265191679fdSAndi Kleen return 1; 1266191679fdSAndi Kleen } 1267191679fdSAndi Kleen __setup("noclflush", setup_noclflush); 1268191679fdSAndi Kleen 1269148f9bb8SPaul Gortmaker void print_cpu_info(struct cpuinfo_x86 *c) 1270f7627e25SThomas Gleixner { 127102dde8b4SJan Beulich const char *vendor = NULL; 1272f7627e25SThomas Gleixner 12730f3fa48aSIngo Molnar if (c->x86_vendor < X86_VENDOR_NUM) { 1274f7627e25SThomas Gleixner vendor = this_cpu->c_vendor; 12750f3fa48aSIngo Molnar } else { 12760f3fa48aSIngo Molnar if (c->cpuid_level >= 0) 1277f7627e25SThomas Gleixner vendor = c->x86_vendor_id; 12780f3fa48aSIngo Molnar } 1279f7627e25SThomas Gleixner 1280bd32a8cfSYinghai Lu if (vendor && !strstr(c->x86_model_id, vendor)) 12811b74dde7SChen Yucong pr_cont("%s ", vendor); 1282f7627e25SThomas Gleixner 12839d31d35bSYinghai Lu if (c->x86_model_id[0]) 12841b74dde7SChen Yucong pr_cont("%s", c->x86_model_id); 1285f7627e25SThomas Gleixner else 12861b74dde7SChen Yucong pr_cont("%d86", c->x86); 1287f7627e25SThomas Gleixner 12881b74dde7SChen Yucong pr_cont(" (family: 0x%x, model: 0x%x", c->x86, c->x86_model); 1289924e101aSBorislav Petkov 1290f7627e25SThomas Gleixner if (c->x86_mask || c->cpuid_level >= 0) 12911b74dde7SChen Yucong pr_cont(", stepping: 0x%x)\n", c->x86_mask); 1292f7627e25SThomas Gleixner else 12931b74dde7SChen Yucong pr_cont(")\n"); 1294f7627e25SThomas Gleixner } 1295f7627e25SThomas Gleixner 1296ac72e788SAndi Kleen static __init int setup_disablecpuid(char *arg) 1297ac72e788SAndi Kleen { 1298ac72e788SAndi Kleen int bit; 12990f3fa48aSIngo Molnar 1300dd853fd2SLukasz Odzioba if (get_option(&arg, &bit) && bit >= 0 && bit < NCAPINTS * 32) 1301ac72e788SAndi Kleen setup_clear_cpu_cap(bit); 1302ac72e788SAndi Kleen else 1303ac72e788SAndi Kleen return 0; 13040f3fa48aSIngo Molnar 1305ac72e788SAndi Kleen return 1; 1306ac72e788SAndi Kleen } 1307ac72e788SAndi Kleen __setup("clearcpuid=", setup_disablecpuid); 1308ac72e788SAndi Kleen 1309d5494d4fSYinghai Lu #ifdef CONFIG_X86_64 1310947e76cdSBrian Gerst DEFINE_PER_CPU_FIRST(union irq_stack_union, 1311277d5b40SAndi Kleen irq_stack_union) __aligned(PAGE_SIZE) __visible; 13120f3fa48aSIngo Molnar 1313bdf977b3STejun Heo /* 1314a7fcf28dSAndy Lutomirski * The following percpu variables are hot. Align current_task to 1315a7fcf28dSAndy Lutomirski * cacheline size such that they fall in the same cacheline. 1316bdf977b3STejun Heo */ 1317bdf977b3STejun Heo DEFINE_PER_CPU(struct task_struct *, current_task) ____cacheline_aligned = 1318bdf977b3STejun Heo &init_task; 1319bdf977b3STejun Heo EXPORT_PER_CPU_SYMBOL(current_task); 1320d5494d4fSYinghai Lu 1321bdf977b3STejun Heo DEFINE_PER_CPU(char *, irq_stack_ptr) = 13224950d6d4SJosh Poimboeuf init_per_cpu_var(irq_stack_union.irq_stack) + IRQ_STACK_SIZE; 1323bdf977b3STejun Heo 1324277d5b40SAndi Kleen DEFINE_PER_CPU(unsigned int, irq_count) __visible = -1; 1325d5494d4fSYinghai Lu 1326c2daa3beSPeter Zijlstra DEFINE_PER_CPU(int, __preempt_count) = INIT_PREEMPT_COUNT; 1327c2daa3beSPeter Zijlstra EXPORT_PER_CPU_SYMBOL(__preempt_count); 1328c2daa3beSPeter Zijlstra 13290f3fa48aSIngo Molnar /* 13300f3fa48aSIngo Molnar * Special IST stacks which the CPU switches to when it calls 13310f3fa48aSIngo Molnar * an IST-marked descriptor entry. Up to 7 stacks (hardware 13320f3fa48aSIngo Molnar * limit), all of them are 4K, except the debug stack which 13330f3fa48aSIngo Molnar * is 8K. 13340f3fa48aSIngo Molnar */ 13350f3fa48aSIngo Molnar static const unsigned int exception_stack_sizes[N_EXCEPTION_STACKS] = { 13360f3fa48aSIngo Molnar [0 ... N_EXCEPTION_STACKS - 1] = EXCEPTION_STKSZ, 13370f3fa48aSIngo Molnar [DEBUG_STACK - 1] = DEBUG_STKSZ 13380f3fa48aSIngo Molnar }; 13390f3fa48aSIngo Molnar 134092d65b23SBrian Gerst static DEFINE_PER_CPU_PAGE_ALIGNED(char, exception_stacks 13413e352aa8STejun Heo [(N_EXCEPTION_STACKS - 1) * EXCEPTION_STKSZ + DEBUG_STKSZ]); 1342d5494d4fSYinghai Lu 1343d5494d4fSYinghai Lu /* May not be marked __init: used by software suspend */ 1344d5494d4fSYinghai Lu void syscall_init(void) 1345d5494d4fSYinghai Lu { 134631ac34caSBorislav Petkov wrmsr(MSR_STAR, 0, (__USER32_CS << 16) | __KERNEL_CS); 134747edb651SAndy Lutomirski wrmsrl(MSR_LSTAR, (unsigned long)entry_SYSCALL_64); 1348d56fe4bfSIngo Molnar 1349d56fe4bfSIngo Molnar #ifdef CONFIG_IA32_EMULATION 135047edb651SAndy Lutomirski wrmsrl(MSR_CSTAR, (unsigned long)entry_SYSCALL_compat); 1351a76c7f46SDenys Vlasenko /* 1352487d1edbSDenys Vlasenko * This only works on Intel CPUs. 1353487d1edbSDenys Vlasenko * On AMD CPUs these MSRs are 32-bit, CPU truncates MSR_IA32_SYSENTER_EIP. 1354487d1edbSDenys Vlasenko * This does not cause SYSENTER to jump to the wrong location, because 1355487d1edbSDenys Vlasenko * AMD doesn't allow SYSENTER in long mode (either 32- or 64-bit). 1356a76c7f46SDenys Vlasenko */ 1357a76c7f46SDenys Vlasenko wrmsrl_safe(MSR_IA32_SYSENTER_CS, (u64)__KERNEL_CS); 1358a76c7f46SDenys Vlasenko wrmsrl_safe(MSR_IA32_SYSENTER_ESP, 0ULL); 13594c8cd0c5SIngo Molnar wrmsrl_safe(MSR_IA32_SYSENTER_EIP, (u64)entry_SYSENTER_compat); 1360d56fe4bfSIngo Molnar #else 136147edb651SAndy Lutomirski wrmsrl(MSR_CSTAR, (unsigned long)ignore_sysret); 13626b51311cSBorislav Petkov wrmsrl_safe(MSR_IA32_SYSENTER_CS, (u64)GDT_ENTRY_INVALID_SEG); 1363d56fe4bfSIngo Molnar wrmsrl_safe(MSR_IA32_SYSENTER_ESP, 0ULL); 1364d56fe4bfSIngo Molnar wrmsrl_safe(MSR_IA32_SYSENTER_EIP, 0ULL); 1365d5494d4fSYinghai Lu #endif 1366d5494d4fSYinghai Lu 1367d5494d4fSYinghai Lu /* Flags to clear on syscall */ 1368d5494d4fSYinghai Lu wrmsrl(MSR_SYSCALL_MASK, 136963bcff2aSH. Peter Anvin X86_EFLAGS_TF|X86_EFLAGS_DF|X86_EFLAGS_IF| 13708c7aa698SAndy Lutomirski X86_EFLAGS_IOPL|X86_EFLAGS_AC|X86_EFLAGS_NT); 1371d5494d4fSYinghai Lu } 1372d5494d4fSYinghai Lu 1373d5494d4fSYinghai Lu /* 1374d5494d4fSYinghai Lu * Copies of the original ist values from the tss are only accessed during 1375d5494d4fSYinghai Lu * debugging, no special alignment required. 1376d5494d4fSYinghai Lu */ 1377d5494d4fSYinghai Lu DEFINE_PER_CPU(struct orig_ist, orig_ist); 1378d5494d4fSYinghai Lu 1379228bdaa9SSteven Rostedt static DEFINE_PER_CPU(unsigned long, debug_stack_addr); 138042181186SSteven Rostedt DEFINE_PER_CPU(int, debug_stack_usage); 1381228bdaa9SSteven Rostedt 1382228bdaa9SSteven Rostedt int is_debug_stack(unsigned long addr) 1383228bdaa9SSteven Rostedt { 138489cbc767SChristoph Lameter return __this_cpu_read(debug_stack_usage) || 138589cbc767SChristoph Lameter (addr <= __this_cpu_read(debug_stack_addr) && 138689cbc767SChristoph Lameter addr > (__this_cpu_read(debug_stack_addr) - DEBUG_STKSZ)); 1387228bdaa9SSteven Rostedt } 13880f46efebSMasami Hiramatsu NOKPROBE_SYMBOL(is_debug_stack); 1389228bdaa9SSteven Rostedt 1390629f4f9dSSeiji Aguchi DEFINE_PER_CPU(u32, debug_idt_ctr); 1391f8988175SSteven Rostedt 1392228bdaa9SSteven Rostedt void debug_stack_set_zero(void) 1393228bdaa9SSteven Rostedt { 1394629f4f9dSSeiji Aguchi this_cpu_inc(debug_idt_ctr); 1395629f4f9dSSeiji Aguchi load_current_idt(); 1396228bdaa9SSteven Rostedt } 13970f46efebSMasami Hiramatsu NOKPROBE_SYMBOL(debug_stack_set_zero); 1398228bdaa9SSteven Rostedt 1399228bdaa9SSteven Rostedt void debug_stack_reset(void) 1400228bdaa9SSteven Rostedt { 1401629f4f9dSSeiji Aguchi if (WARN_ON(!this_cpu_read(debug_idt_ctr))) 1402f8988175SSteven Rostedt return; 1403629f4f9dSSeiji Aguchi if (this_cpu_dec_return(debug_idt_ctr) == 0) 1404629f4f9dSSeiji Aguchi load_current_idt(); 1405228bdaa9SSteven Rostedt } 14060f46efebSMasami Hiramatsu NOKPROBE_SYMBOL(debug_stack_reset); 1407228bdaa9SSteven Rostedt 14080f3fa48aSIngo Molnar #else /* CONFIG_X86_64 */ 1409d5494d4fSYinghai Lu 1410bdf977b3STejun Heo DEFINE_PER_CPU(struct task_struct *, current_task) = &init_task; 1411bdf977b3STejun Heo EXPORT_PER_CPU_SYMBOL(current_task); 1412c2daa3beSPeter Zijlstra DEFINE_PER_CPU(int, __preempt_count) = INIT_PREEMPT_COUNT; 1413c2daa3beSPeter Zijlstra EXPORT_PER_CPU_SYMBOL(__preempt_count); 1414bdf977b3STejun Heo 1415a7fcf28dSAndy Lutomirski /* 1416a7fcf28dSAndy Lutomirski * On x86_32, vm86 modifies tss.sp0, so sp0 isn't a reliable way to find 1417a7fcf28dSAndy Lutomirski * the top of the kernel stack. Use an extra percpu variable to track the 1418a7fcf28dSAndy Lutomirski * top of the kernel stack directly. 1419a7fcf28dSAndy Lutomirski */ 1420a7fcf28dSAndy Lutomirski DEFINE_PER_CPU(unsigned long, cpu_current_top_of_stack) = 1421a7fcf28dSAndy Lutomirski (unsigned long)&init_thread_union + THREAD_SIZE; 1422a7fcf28dSAndy Lutomirski EXPORT_PER_CPU_SYMBOL(cpu_current_top_of_stack); 1423a7fcf28dSAndy Lutomirski 142460a5317fSTejun Heo #ifdef CONFIG_CC_STACKPROTECTOR 142553f82452SJeremy Fitzhardinge DEFINE_PER_CPU_ALIGNED(struct stack_canary, stack_canary); 142660a5317fSTejun Heo #endif 142760a5317fSTejun Heo 14280f3fa48aSIngo Molnar #endif /* CONFIG_X86_64 */ 1429f7627e25SThomas Gleixner 1430f7627e25SThomas Gleixner /* 14319766cdbcSJaswinder Singh Rajput * Clear all 6 debug registers: 14329766cdbcSJaswinder Singh Rajput */ 14339766cdbcSJaswinder Singh Rajput static void clear_all_debug_regs(void) 14349766cdbcSJaswinder Singh Rajput { 14359766cdbcSJaswinder Singh Rajput int i; 14369766cdbcSJaswinder Singh Rajput 14379766cdbcSJaswinder Singh Rajput for (i = 0; i < 8; i++) { 14389766cdbcSJaswinder Singh Rajput /* Ignore db4, db5 */ 14399766cdbcSJaswinder Singh Rajput if ((i == 4) || (i == 5)) 14409766cdbcSJaswinder Singh Rajput continue; 14419766cdbcSJaswinder Singh Rajput 14429766cdbcSJaswinder Singh Rajput set_debugreg(0, i); 14439766cdbcSJaswinder Singh Rajput } 14449766cdbcSJaswinder Singh Rajput } 1445f7627e25SThomas Gleixner 14460bb9fef9SJason Wessel #ifdef CONFIG_KGDB 14470bb9fef9SJason Wessel /* 14480bb9fef9SJason Wessel * Restore debug regs if using kgdbwait and you have a kernel debugger 14490bb9fef9SJason Wessel * connection established. 14500bb9fef9SJason Wessel */ 14510bb9fef9SJason Wessel static void dbg_restore_debug_regs(void) 14520bb9fef9SJason Wessel { 14530bb9fef9SJason Wessel if (unlikely(kgdb_connected && arch_kgdb_ops.correct_hw_break)) 14540bb9fef9SJason Wessel arch_kgdb_ops.correct_hw_break(); 14550bb9fef9SJason Wessel } 14560bb9fef9SJason Wessel #else /* ! CONFIG_KGDB */ 14570bb9fef9SJason Wessel #define dbg_restore_debug_regs() 14580bb9fef9SJason Wessel #endif /* ! CONFIG_KGDB */ 14590bb9fef9SJason Wessel 1460ce4b1b16SIgor Mammedov static void wait_for_master_cpu(int cpu) 1461ce4b1b16SIgor Mammedov { 1462ce4b1b16SIgor Mammedov #ifdef CONFIG_SMP 1463ce4b1b16SIgor Mammedov /* 1464ce4b1b16SIgor Mammedov * wait for ACK from master CPU before continuing 1465ce4b1b16SIgor Mammedov * with AP initialization 1466ce4b1b16SIgor Mammedov */ 1467ce4b1b16SIgor Mammedov WARN_ON(cpumask_test_and_set_cpu(cpu, cpu_initialized_mask)); 1468ce4b1b16SIgor Mammedov while (!cpumask_test_cpu(cpu, cpu_callout_mask)) 1469ce4b1b16SIgor Mammedov cpu_relax(); 1470ce4b1b16SIgor Mammedov #endif 1471ce4b1b16SIgor Mammedov } 1472ce4b1b16SIgor Mammedov 1473f7627e25SThomas Gleixner /* 1474f7627e25SThomas Gleixner * cpu_init() initializes state that is per-CPU. Some data is already 1475f7627e25SThomas Gleixner * initialized (naturally) in the bootstrap process, such as the GDT 1476f7627e25SThomas Gleixner * and IDT. We reload them nevertheless, this function acts as a 1477f7627e25SThomas Gleixner * 'CPU state barrier', nothing should get across. 14781ba76586SYinghai Lu * A lot of state is already set up in PDA init for 64 bit 1479f7627e25SThomas Gleixner */ 14801ba76586SYinghai Lu #ifdef CONFIG_X86_64 14810f3fa48aSIngo Molnar 1482148f9bb8SPaul Gortmaker void cpu_init(void) 14831ba76586SYinghai Lu { 14840fe1e009STejun Heo struct orig_ist *oist; 14851ba76586SYinghai Lu struct task_struct *me; 14860f3fa48aSIngo Molnar struct tss_struct *t; 14870f3fa48aSIngo Molnar unsigned long v; 1488fb59831bSAndy Lutomirski int cpu = raw_smp_processor_id(); 14891ba76586SYinghai Lu int i; 14901ba76586SYinghai Lu 1491ce4b1b16SIgor Mammedov wait_for_master_cpu(cpu); 1492ce4b1b16SIgor Mammedov 1493e6ebf5deSFenghua Yu /* 14941e02ce4cSAndy Lutomirski * Initialize the CR4 shadow before doing anything that could 14951e02ce4cSAndy Lutomirski * try to read it. 14961e02ce4cSAndy Lutomirski */ 14971e02ce4cSAndy Lutomirski cr4_init_shadow(); 14981e02ce4cSAndy Lutomirski 1499777284b6SBorislav Petkov if (cpu) 1500e6ebf5deSFenghua Yu load_ucode_ap(); 1501e6ebf5deSFenghua Yu 150224933b82SAndy Lutomirski t = &per_cpu(cpu_tss, cpu); 15030fe1e009STejun Heo oist = &per_cpu(orig_ist, cpu); 15040f3fa48aSIngo Molnar 1505e7a22c1eSBrian Gerst #ifdef CONFIG_NUMA 150627fd185fSFenghua Yu if (this_cpu_read(numa_node) == 0 && 1507e534c7c5SLee Schermerhorn early_cpu_to_node(cpu) != NUMA_NO_NODE) 1508e534c7c5SLee Schermerhorn set_numa_node(early_cpu_to_node(cpu)); 1509e7a22c1eSBrian Gerst #endif 15101ba76586SYinghai Lu 15111ba76586SYinghai Lu me = current; 15121ba76586SYinghai Lu 15132eaad1fdSMike Travis pr_debug("Initializing CPU#%d\n", cpu); 15141ba76586SYinghai Lu 1515375074ccSAndy Lutomirski cr4_clear_bits(X86_CR4_VME|X86_CR4_PVI|X86_CR4_TSD|X86_CR4_DE); 15161ba76586SYinghai Lu 15171ba76586SYinghai Lu /* 15181ba76586SYinghai Lu * Initialize the per-CPU GDT with the boot GDT, 15191ba76586SYinghai Lu * and set up the GDT descriptor: 15201ba76586SYinghai Lu */ 15211ba76586SYinghai Lu 1522552be871SBrian Gerst switch_to_new_gdt(cpu); 15232697fbd5SBrian Gerst loadsegment(fs, 0); 15242697fbd5SBrian Gerst 1525cf910e83SSeiji Aguchi load_current_idt(); 15261ba76586SYinghai Lu 15271ba76586SYinghai Lu memset(me->thread.tls_array, 0, GDT_ENTRY_TLS_ENTRIES * 8); 15281ba76586SYinghai Lu syscall_init(); 15291ba76586SYinghai Lu 15301ba76586SYinghai Lu wrmsrl(MSR_FS_BASE, 0); 15311ba76586SYinghai Lu wrmsrl(MSR_KERNEL_GS_BASE, 0); 15321ba76586SYinghai Lu barrier(); 15331ba76586SYinghai Lu 15344763ed4dSH. Peter Anvin x86_configure_nx(); 1535659006bfSThomas Gleixner x2apic_setup(); 15361ba76586SYinghai Lu 15371ba76586SYinghai Lu /* 15381ba76586SYinghai Lu * set up and load the per-CPU TSS 15391ba76586SYinghai Lu */ 15400fe1e009STejun Heo if (!oist->ist[0]) { 154192d65b23SBrian Gerst char *estacks = per_cpu(exception_stacks, cpu); 15420f3fa48aSIngo Molnar 15431ba76586SYinghai Lu for (v = 0; v < N_EXCEPTION_STACKS; v++) { 15440f3fa48aSIngo Molnar estacks += exception_stack_sizes[v]; 15450fe1e009STejun Heo oist->ist[v] = t->x86_tss.ist[v] = 15461ba76586SYinghai Lu (unsigned long)estacks; 1547228bdaa9SSteven Rostedt if (v == DEBUG_STACK-1) 1548228bdaa9SSteven Rostedt per_cpu(debug_stack_addr, cpu) = (unsigned long)estacks; 15491ba76586SYinghai Lu } 15501ba76586SYinghai Lu } 15511ba76586SYinghai Lu 15521ba76586SYinghai Lu t->x86_tss.io_bitmap_base = offsetof(struct tss_struct, io_bitmap); 15530f3fa48aSIngo Molnar 15541ba76586SYinghai Lu /* 15551ba76586SYinghai Lu * <= is required because the CPU will access up to 15561ba76586SYinghai Lu * 8 bits beyond the end of the IO permission bitmap. 15571ba76586SYinghai Lu */ 15581ba76586SYinghai Lu for (i = 0; i <= IO_BITMAP_LONGS; i++) 15591ba76586SYinghai Lu t->io_bitmap[i] = ~0UL; 15601ba76586SYinghai Lu 1561f1f10076SVegard Nossum mmgrab(&init_mm); 15621ba76586SYinghai Lu me->active_mm = &init_mm; 15638c5dfd25SStoyan Gaydarov BUG_ON(me->mm); 156472c0098dSAndy Lutomirski initialize_tlbstate_and_flush(); 15651ba76586SYinghai Lu enter_lazy_tlb(&init_mm, me); 15661ba76586SYinghai Lu 15671ba76586SYinghai Lu load_sp0(t, ¤t->thread); 15681ba76586SYinghai Lu set_tss_desc(cpu, t); 15691ba76586SYinghai Lu load_TR_desc(); 157037868fe1SAndy Lutomirski load_mm_ldt(&init_mm); 15711ba76586SYinghai Lu 15729766cdbcSJaswinder Singh Rajput clear_all_debug_regs(); 15730bb9fef9SJason Wessel dbg_restore_debug_regs(); 15741ba76586SYinghai Lu 157521c4cd10SIngo Molnar fpu__init_cpu(); 15761ba76586SYinghai Lu 15771ba76586SYinghai Lu if (is_uv_system()) 15781ba76586SYinghai Lu uv_cpu_init(); 157969218e47SThomas Garnier 158069218e47SThomas Garnier setup_fixmap_gdt(cpu); 158169218e47SThomas Garnier load_fixmap_gdt(cpu); 15821ba76586SYinghai Lu } 15831ba76586SYinghai Lu 15841ba76586SYinghai Lu #else 15851ba76586SYinghai Lu 1586148f9bb8SPaul Gortmaker void cpu_init(void) 1587f7627e25SThomas Gleixner { 1588f7627e25SThomas Gleixner int cpu = smp_processor_id(); 1589f7627e25SThomas Gleixner struct task_struct *curr = current; 159024933b82SAndy Lutomirski struct tss_struct *t = &per_cpu(cpu_tss, cpu); 1591f7627e25SThomas Gleixner struct thread_struct *thread = &curr->thread; 1592f7627e25SThomas Gleixner 1593ce4b1b16SIgor Mammedov wait_for_master_cpu(cpu); 1594e6ebf5deSFenghua Yu 15955b2bdbc8SSteven Rostedt /* 15965b2bdbc8SSteven Rostedt * Initialize the CR4 shadow before doing anything that could 15975b2bdbc8SSteven Rostedt * try to read it. 15985b2bdbc8SSteven Rostedt */ 15995b2bdbc8SSteven Rostedt cr4_init_shadow(); 16005b2bdbc8SSteven Rostedt 1601ce4b1b16SIgor Mammedov show_ucode_info_early(); 1602f7627e25SThomas Gleixner 16031b74dde7SChen Yucong pr_info("Initializing CPU#%d\n", cpu); 1604f7627e25SThomas Gleixner 1605362f924bSBorislav Petkov if (cpu_feature_enabled(X86_FEATURE_VME) || 160659e21e3dSBorislav Petkov boot_cpu_has(X86_FEATURE_TSC) || 1607362f924bSBorislav Petkov boot_cpu_has(X86_FEATURE_DE)) 1608375074ccSAndy Lutomirski cr4_clear_bits(X86_CR4_VME|X86_CR4_PVI|X86_CR4_TSD|X86_CR4_DE); 1609f7627e25SThomas Gleixner 1610cf910e83SSeiji Aguchi load_current_idt(); 1611552be871SBrian Gerst switch_to_new_gdt(cpu); 1612f7627e25SThomas Gleixner 1613f7627e25SThomas Gleixner /* 1614f7627e25SThomas Gleixner * Set up and load the per-CPU TSS and LDT 1615f7627e25SThomas Gleixner */ 1616f1f10076SVegard Nossum mmgrab(&init_mm); 1617f7627e25SThomas Gleixner curr->active_mm = &init_mm; 16188c5dfd25SStoyan Gaydarov BUG_ON(curr->mm); 161972c0098dSAndy Lutomirski initialize_tlbstate_and_flush(); 1620f7627e25SThomas Gleixner enter_lazy_tlb(&init_mm, curr); 1621f7627e25SThomas Gleixner 1622faca6227SH. Peter Anvin load_sp0(t, thread); 1623f7627e25SThomas Gleixner set_tss_desc(cpu, t); 1624f7627e25SThomas Gleixner load_TR_desc(); 162537868fe1SAndy Lutomirski load_mm_ldt(&init_mm); 1626f7627e25SThomas Gleixner 1627f9a196b8SThomas Gleixner t->x86_tss.io_bitmap_base = offsetof(struct tss_struct, io_bitmap); 1628f9a196b8SThomas Gleixner 1629f7627e25SThomas Gleixner #ifdef CONFIG_DOUBLEFAULT 1630f7627e25SThomas Gleixner /* Set up doublefault TSS pointer in the GDT */ 1631f7627e25SThomas Gleixner __set_tss_desc(cpu, GDT_ENTRY_DOUBLEFAULT_TSS, &doublefault_tss); 1632f7627e25SThomas Gleixner #endif 1633f7627e25SThomas Gleixner 16349766cdbcSJaswinder Singh Rajput clear_all_debug_regs(); 16350bb9fef9SJason Wessel dbg_restore_debug_regs(); 1636f7627e25SThomas Gleixner 163721c4cd10SIngo Molnar fpu__init_cpu(); 163869218e47SThomas Garnier 163969218e47SThomas Garnier setup_fixmap_gdt(cpu); 164069218e47SThomas Garnier load_fixmap_gdt(cpu); 1641f7627e25SThomas Gleixner } 16421ba76586SYinghai Lu #endif 16435700f743SBorislav Petkov 1644b51ef52dSLaura Abbott static void bsp_resume(void) 1645b51ef52dSLaura Abbott { 1646b51ef52dSLaura Abbott if (this_cpu->c_bsp_resume) 1647b51ef52dSLaura Abbott this_cpu->c_bsp_resume(&boot_cpu_data); 1648b51ef52dSLaura Abbott } 1649b51ef52dSLaura Abbott 1650b51ef52dSLaura Abbott static struct syscore_ops cpu_syscore_ops = { 1651b51ef52dSLaura Abbott .resume = bsp_resume, 1652b51ef52dSLaura Abbott }; 1653b51ef52dSLaura Abbott 1654b51ef52dSLaura Abbott static int __init init_cpu_syscore(void) 1655b51ef52dSLaura Abbott { 1656b51ef52dSLaura Abbott register_syscore_ops(&cpu_syscore_ops); 1657b51ef52dSLaura Abbott return 0; 1658b51ef52dSLaura Abbott } 1659b51ef52dSLaura Abbott core_initcall(init_cpu_syscore); 1660