1dd7d207dSJung-uk Kim /*- 2ebf5747bSPedro F. Giffuni * SPDX-License-Identifier: BSD-2-Clause-FreeBSD 3ebf5747bSPedro F. Giffuni * 4dd7d207dSJung-uk Kim * Copyright (c) 1998-2003 Poul-Henning Kamp 5dd7d207dSJung-uk Kim * All rights reserved. 6dd7d207dSJung-uk Kim * 7dd7d207dSJung-uk Kim * Redistribution and use in source and binary forms, with or without 8dd7d207dSJung-uk Kim * modification, are permitted provided that the following conditions 9dd7d207dSJung-uk Kim * are met: 10dd7d207dSJung-uk Kim * 1. Redistributions of source code must retain the above copyright 11dd7d207dSJung-uk Kim * notice, this list of conditions and the following disclaimer. 12dd7d207dSJung-uk Kim * 2. Redistributions in binary form must reproduce the above copyright 13dd7d207dSJung-uk Kim * notice, this list of conditions and the following disclaimer in the 14dd7d207dSJung-uk Kim * documentation and/or other materials provided with the distribution. 15dd7d207dSJung-uk Kim * 16dd7d207dSJung-uk Kim * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND 17dd7d207dSJung-uk Kim * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 18dd7d207dSJung-uk Kim * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 19dd7d207dSJung-uk Kim * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE 20dd7d207dSJung-uk Kim * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 21dd7d207dSJung-uk Kim * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 22dd7d207dSJung-uk Kim * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 23dd7d207dSJung-uk Kim * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 24dd7d207dSJung-uk Kim * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 25dd7d207dSJung-uk Kim * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 26dd7d207dSJung-uk Kim * SUCH DAMAGE. 27dd7d207dSJung-uk Kim */ 28dd7d207dSJung-uk Kim 29dd7d207dSJung-uk Kim #include <sys/cdefs.h> 30dd7d207dSJung-uk Kim __FBSDID("$FreeBSD$"); 31dd7d207dSJung-uk Kim 32dd7d207dSJung-uk Kim #include "opt_clock.h" 33dd7d207dSJung-uk Kim 34dd7d207dSJung-uk Kim #include <sys/param.h> 35dd7d207dSJung-uk Kim #include <sys/bus.h> 36dd7d207dSJung-uk Kim #include <sys/cpu.h> 37e2e050c8SConrad Meyer #include <sys/eventhandler.h> 385da5812bSJung-uk Kim #include <sys/limits.h> 39dd7d207dSJung-uk Kim #include <sys/malloc.h> 40dd7d207dSJung-uk Kim #include <sys/systm.h> 41dd7d207dSJung-uk Kim #include <sys/sysctl.h> 42dd7d207dSJung-uk Kim #include <sys/time.h> 43dd7d207dSJung-uk Kim #include <sys/timetc.h> 44dd7d207dSJung-uk Kim #include <sys/kernel.h> 45dd7d207dSJung-uk Kim #include <sys/power.h> 46dd7d207dSJung-uk Kim #include <sys/smp.h> 47aea81038SKonstantin Belousov #include <sys/vdso.h> 48dd7d207dSJung-uk Kim #include <machine/clock.h> 49dd7d207dSJung-uk Kim #include <machine/cputypes.h> 50dd7d207dSJung-uk Kim #include <machine/md_var.h> 51dd7d207dSJung-uk Kim #include <machine/specialreg.h> 5201e1933dSJohn Baldwin #include <x86/vmware.h> 5316808549SKonstantin Belousov #include <dev/acpica/acpi_hpet.h> 54ce3bf750SKonstantin Belousov #include <contrib/dev/acpica/include/acpi.h> 55dd7d207dSJung-uk Kim 56dd7d207dSJung-uk Kim #include "cpufreq_if.h" 57dd7d207dSJung-uk Kim 58dd7d207dSJung-uk Kim uint64_t tsc_freq; 59dd7d207dSJung-uk Kim int tsc_is_invariant; 60155094d7SJung-uk Kim int tsc_perf_stat; 61155094d7SJung-uk Kim 62dd7d207dSJung-uk Kim static eventhandler_tag tsc_levels_tag, tsc_pre_tag, tsc_post_tag; 63dd7d207dSJung-uk Kim 64dd7d207dSJung-uk Kim SYSCTL_INT(_kern_timecounter, OID_AUTO, invariant_tsc, CTLFLAG_RDTUN, 65dd7d207dSJung-uk Kim &tsc_is_invariant, 0, "Indicates whether the TSC is P-state invariant"); 66dd7d207dSJung-uk Kim 67dd7d207dSJung-uk Kim #ifdef SMP 681472b87fSNeel Natu int smp_tsc; 69dd7d207dSJung-uk Kim SYSCTL_INT(_kern_timecounter, OID_AUTO, smp_tsc, CTLFLAG_RDTUN, &smp_tsc, 0, 70dd7d207dSJung-uk Kim "Indicates whether the TSC is safe to use in SMP mode"); 71b2c63698SAlexander Motin 72b2c63698SAlexander Motin int smp_tsc_adjust = 0; 73b2c63698SAlexander Motin SYSCTL_INT(_kern_timecounter, OID_AUTO, smp_tsc_adjust, CTLFLAG_RDTUN, 74b2c63698SAlexander Motin &smp_tsc_adjust, 0, "Try to adjust TSC on APs to match BSP"); 75dd7d207dSJung-uk Kim #endif 76dd7d207dSJung-uk Kim 77e7f1427dSKonstantin Belousov static int tsc_shift = 1; 78e7f1427dSKonstantin Belousov SYSCTL_INT(_kern_timecounter, OID_AUTO, tsc_shift, CTLFLAG_RDTUN, 79e7f1427dSKonstantin Belousov &tsc_shift, 0, "Shift to pre-apply for the maximum TSC frequency"); 80e7f1427dSKonstantin Belousov 8179422085SJung-uk Kim static int tsc_disabled; 8279422085SJung-uk Kim SYSCTL_INT(_machdep, OID_AUTO, disable_tsc, CTLFLAG_RDTUN, &tsc_disabled, 0, 8379422085SJung-uk Kim "Disable x86 Time Stamp Counter"); 8479422085SJung-uk Kim 85a4e4127fSJung-uk Kim static int tsc_skip_calibration; 86ce3bf750SKonstantin Belousov SYSCTL_INT(_machdep, OID_AUTO, disable_tsc_calibration, CTLFLAG_RDTUN | 87ce3bf750SKonstantin Belousov CTLFLAG_NOFETCH, &tsc_skip_calibration, 0, 88ce3bf750SKonstantin Belousov "Disable TSC frequency calibration"); 89a4e4127fSJung-uk Kim 90dd7d207dSJung-uk Kim static void tsc_freq_changed(void *arg, const struct cf_level *level, 91dd7d207dSJung-uk Kim int status); 92dd7d207dSJung-uk Kim static void tsc_freq_changing(void *arg, const struct cf_level *level, 93dd7d207dSJung-uk Kim int *status); 94dd7d207dSJung-uk Kim static unsigned tsc_get_timecount(struct timecounter *tc); 95814124c3SKonstantin Belousov static inline unsigned tsc_get_timecount_low(struct timecounter *tc); 96814124c3SKonstantin Belousov static unsigned tsc_get_timecount_lfence(struct timecounter *tc); 97814124c3SKonstantin Belousov static unsigned tsc_get_timecount_low_lfence(struct timecounter *tc); 98814124c3SKonstantin Belousov static unsigned tsc_get_timecount_mfence(struct timecounter *tc); 99814124c3SKonstantin Belousov static unsigned tsc_get_timecount_low_mfence(struct timecounter *tc); 100dd7d207dSJung-uk Kim static void tsc_levels_changed(void *arg, int unit); 10116808549SKonstantin Belousov static uint32_t x86_tsc_vdso_timehands(struct vdso_timehands *vdso_th, 10216808549SKonstantin Belousov struct timecounter *tc); 10316808549SKonstantin Belousov #ifdef COMPAT_FREEBSD32 10416808549SKonstantin Belousov static uint32_t x86_tsc_vdso_timehands32(struct vdso_timehands32 *vdso_th32, 10516808549SKonstantin Belousov struct timecounter *tc); 10616808549SKonstantin Belousov #endif 107dd7d207dSJung-uk Kim 108dd7d207dSJung-uk Kim static struct timecounter tsc_timecounter = { 10916808549SKonstantin Belousov .tc_get_timecount = tsc_get_timecount, 11016808549SKonstantin Belousov .tc_counter_mask = ~0u, 11116808549SKonstantin Belousov .tc_name = "TSC", 11216808549SKonstantin Belousov .tc_quality = 800, /* adjusted in code */ 11316808549SKonstantin Belousov .tc_fill_vdso_timehands = x86_tsc_vdso_timehands, 11416808549SKonstantin Belousov #ifdef COMPAT_FREEBSD32 11516808549SKonstantin Belousov .tc_fill_vdso_timehands32 = x86_tsc_vdso_timehands32, 11616808549SKonstantin Belousov #endif 117dd7d207dSJung-uk Kim }; 118dd7d207dSJung-uk Kim 11901e1933dSJohn Baldwin static void 1205da5812bSJung-uk Kim tsc_freq_vmware(void) 1215da5812bSJung-uk Kim { 1225da5812bSJung-uk Kim u_int regs[4]; 1235da5812bSJung-uk Kim 1245da5812bSJung-uk Kim if (hv_high >= 0x40000010) { 1255da5812bSJung-uk Kim do_cpuid(0x40000010, regs); 1265da5812bSJung-uk Kim tsc_freq = regs[0] * 1000; 1275da5812bSJung-uk Kim } else { 1285da5812bSJung-uk Kim vmware_hvcall(VMW_HVCMD_GETHZ, regs); 1295da5812bSJung-uk Kim if (regs[1] != UINT_MAX) 1305da5812bSJung-uk Kim tsc_freq = regs[0] | ((uint64_t)regs[1] << 32); 1315da5812bSJung-uk Kim } 1325da5812bSJung-uk Kim tsc_is_invariant = 1; 1335da5812bSJung-uk Kim } 1345da5812bSJung-uk Kim 135506a906cSKonstantin Belousov /* 136506a906cSKonstantin Belousov * Calculate TSC frequency using information from the CPUID leaf 0x15 137*a9d0e007SKonstantin Belousov * 'Time Stamp Counter and Nominal Core Crystal Clock'. If leaf 0x15 138*a9d0e007SKonstantin Belousov * is not functional, as it is on Skylake/Kabylake, try 0x16 'Processor 139*a9d0e007SKonstantin Belousov * Frequency Information'. Leaf 0x16 is described in the SDM as 140*a9d0e007SKonstantin Belousov * informational only, but if 0x15 did not work, and TSC calibration 141*a9d0e007SKonstantin Belousov * is disabled, it is the best we can get at all. It should still be 142506a906cSKonstantin Belousov * an improvement over the parsing of the CPU model name in 143506a906cSKonstantin Belousov * tsc_freq_intel(), when available. 144506a906cSKonstantin Belousov */ 145506a906cSKonstantin Belousov static bool 146506a906cSKonstantin Belousov tsc_freq_cpuid(void) 147506a906cSKonstantin Belousov { 148506a906cSKonstantin Belousov u_int regs[4]; 149506a906cSKonstantin Belousov 150506a906cSKonstantin Belousov if (cpu_high < 0x15) 151506a906cSKonstantin Belousov return (false); 152506a906cSKonstantin Belousov do_cpuid(0x15, regs); 153*a9d0e007SKonstantin Belousov if (regs[0] != 0 && regs[1] != 0 && regs[2] != 0) { 154506a906cSKonstantin Belousov tsc_freq = (uint64_t)regs[2] * regs[1] / regs[0]; 155506a906cSKonstantin Belousov return (true); 156506a906cSKonstantin Belousov } 157506a906cSKonstantin Belousov 158*a9d0e007SKonstantin Belousov if (cpu_high < 0x16) 159*a9d0e007SKonstantin Belousov return (false); 160*a9d0e007SKonstantin Belousov do_cpuid(0x16, regs); 161*a9d0e007SKonstantin Belousov if (regs[0] != 0) { 162*a9d0e007SKonstantin Belousov tsc_freq = (uint64_t)regs[0] * 1000000; 163*a9d0e007SKonstantin Belousov return (true); 164*a9d0e007SKonstantin Belousov } 165*a9d0e007SKonstantin Belousov 166*a9d0e007SKonstantin Belousov return (false); 167*a9d0e007SKonstantin Belousov } 168*a9d0e007SKonstantin Belousov 169a4e4127fSJung-uk Kim static void 170a4e4127fSJung-uk Kim tsc_freq_intel(void) 171dd7d207dSJung-uk Kim { 172a4e4127fSJung-uk Kim char brand[48]; 173a4e4127fSJung-uk Kim u_int regs[4]; 174a4e4127fSJung-uk Kim uint64_t freq; 175a4e4127fSJung-uk Kim char *p; 176a4e4127fSJung-uk Kim u_int i; 177dd7d207dSJung-uk Kim 178a4e4127fSJung-uk Kim /* 179a4e4127fSJung-uk Kim * Intel Processor Identification and the CPUID Instruction 180a4e4127fSJung-uk Kim * Application Note 485. 181a4e4127fSJung-uk Kim * http://www.intel.com/assets/pdf/appnote/241618.pdf 182a4e4127fSJung-uk Kim */ 183a4e4127fSJung-uk Kim if (cpu_exthigh >= 0x80000004) { 184a4e4127fSJung-uk Kim p = brand; 185a4e4127fSJung-uk Kim for (i = 0x80000002; i < 0x80000005; i++) { 186a4e4127fSJung-uk Kim do_cpuid(i, regs); 187a4e4127fSJung-uk Kim memcpy(p, regs, sizeof(regs)); 188a4e4127fSJung-uk Kim p += sizeof(regs); 189a4e4127fSJung-uk Kim } 190a4e4127fSJung-uk Kim p = NULL; 191a4e4127fSJung-uk Kim for (i = 0; i < sizeof(brand) - 1; i++) 192a4e4127fSJung-uk Kim if (brand[i] == 'H' && brand[i + 1] == 'z') 193a4e4127fSJung-uk Kim p = brand + i; 194a4e4127fSJung-uk Kim if (p != NULL) { 195a4e4127fSJung-uk Kim p -= 5; 196a4e4127fSJung-uk Kim switch (p[4]) { 197a4e4127fSJung-uk Kim case 'M': 198a4e4127fSJung-uk Kim i = 1; 199a4e4127fSJung-uk Kim break; 200a4e4127fSJung-uk Kim case 'G': 201a4e4127fSJung-uk Kim i = 1000; 202a4e4127fSJung-uk Kim break; 203a4e4127fSJung-uk Kim case 'T': 204a4e4127fSJung-uk Kim i = 1000000; 205a4e4127fSJung-uk Kim break; 206a4e4127fSJung-uk Kim default: 207dd7d207dSJung-uk Kim return; 208a4e4127fSJung-uk Kim } 209a4e4127fSJung-uk Kim #define C2D(c) ((c) - '0') 210a4e4127fSJung-uk Kim if (p[1] == '.') { 211a4e4127fSJung-uk Kim freq = C2D(p[0]) * 1000; 212a4e4127fSJung-uk Kim freq += C2D(p[2]) * 100; 213a4e4127fSJung-uk Kim freq += C2D(p[3]) * 10; 214a4e4127fSJung-uk Kim freq *= i * 1000; 215a4e4127fSJung-uk Kim } else { 216a4e4127fSJung-uk Kim freq = C2D(p[0]) * 1000; 217a4e4127fSJung-uk Kim freq += C2D(p[1]) * 100; 218a4e4127fSJung-uk Kim freq += C2D(p[2]) * 10; 219a4e4127fSJung-uk Kim freq += C2D(p[3]); 220a4e4127fSJung-uk Kim freq *= i * 1000000; 221a4e4127fSJung-uk Kim } 222a4e4127fSJung-uk Kim #undef C2D 223a4e4127fSJung-uk Kim tsc_freq = freq; 224a4e4127fSJung-uk Kim } 225a4e4127fSJung-uk Kim } 226a4e4127fSJung-uk Kim } 227dd7d207dSJung-uk Kim 228a4e4127fSJung-uk Kim static void 229a4e4127fSJung-uk Kim probe_tsc_freq(void) 230a4e4127fSJung-uk Kim { 231155094d7SJung-uk Kim u_int regs[4]; 232a4e4127fSJung-uk Kim uint64_t tsc1, tsc2; 233ce3bf750SKonstantin Belousov uint16_t bootflags; 234dd7d207dSJung-uk Kim 2355da5812bSJung-uk Kim if (cpu_high >= 6) { 2365da5812bSJung-uk Kim do_cpuid(6, regs); 2375da5812bSJung-uk Kim if ((regs[2] & CPUID_PERF_STAT) != 0) { 2385da5812bSJung-uk Kim /* 2395da5812bSJung-uk Kim * XXX Some emulators expose host CPUID without actual 2405da5812bSJung-uk Kim * support for these MSRs. We must test whether they 2415da5812bSJung-uk Kim * really work. 2425da5812bSJung-uk Kim */ 2435da5812bSJung-uk Kim wrmsr(MSR_MPERF, 0); 2445da5812bSJung-uk Kim wrmsr(MSR_APERF, 0); 2455da5812bSJung-uk Kim DELAY(10); 2465da5812bSJung-uk Kim if (rdmsr(MSR_MPERF) > 0 && rdmsr(MSR_APERF) > 0) 2475da5812bSJung-uk Kim tsc_perf_stat = 1; 2485da5812bSJung-uk Kim } 2495da5812bSJung-uk Kim } 2505da5812bSJung-uk Kim 25101e1933dSJohn Baldwin if (vm_guest == VM_GUEST_VMWARE) { 25201e1933dSJohn Baldwin tsc_freq_vmware(); 2535da5812bSJung-uk Kim return; 25401e1933dSJohn Baldwin } 2555da5812bSJung-uk Kim 256dd7d207dSJung-uk Kim switch (cpu_vendor_id) { 257dd7d207dSJung-uk Kim case CPU_VENDOR_AMD: 258a106a27cSJung-uk Kim if ((amd_pminfo & AMDPM_TSC_INVARIANT) != 0 || 259a106a27cSJung-uk Kim (vm_guest == VM_GUEST_NO && 260a106a27cSJung-uk Kim CPUID_TO_FAMILY(cpu_id) >= 0x10)) 261dd7d207dSJung-uk Kim tsc_is_invariant = 1; 262814124c3SKonstantin Belousov if (cpu_feature & CPUID_SSE2) { 263814124c3SKonstantin Belousov tsc_timecounter.tc_get_timecount = 264814124c3SKonstantin Belousov tsc_get_timecount_mfence; 265814124c3SKonstantin Belousov } 266dd7d207dSJung-uk Kim break; 267dd7d207dSJung-uk Kim case CPU_VENDOR_INTEL: 268a106a27cSJung-uk Kim if ((amd_pminfo & AMDPM_TSC_INVARIANT) != 0 || 269a106a27cSJung-uk Kim (vm_guest == VM_GUEST_NO && 270a106a27cSJung-uk Kim ((CPUID_TO_FAMILY(cpu_id) == 0x6 && 271dd7d207dSJung-uk Kim CPUID_TO_MODEL(cpu_id) >= 0xe) || 272dd7d207dSJung-uk Kim (CPUID_TO_FAMILY(cpu_id) == 0xf && 273a106a27cSJung-uk Kim CPUID_TO_MODEL(cpu_id) >= 0x3)))) 274dd7d207dSJung-uk Kim tsc_is_invariant = 1; 275814124c3SKonstantin Belousov if (cpu_feature & CPUID_SSE2) { 276814124c3SKonstantin Belousov tsc_timecounter.tc_get_timecount = 277814124c3SKonstantin Belousov tsc_get_timecount_lfence; 278814124c3SKonstantin Belousov } 279dd7d207dSJung-uk Kim break; 280dd7d207dSJung-uk Kim case CPU_VENDOR_CENTAUR: 281a106a27cSJung-uk Kim if (vm_guest == VM_GUEST_NO && 282a106a27cSJung-uk Kim CPUID_TO_FAMILY(cpu_id) == 0x6 && 283dd7d207dSJung-uk Kim CPUID_TO_MODEL(cpu_id) >= 0xf && 284dd7d207dSJung-uk Kim (rdmsr(0x1203) & 0x100000000ULL) == 0) 285dd7d207dSJung-uk Kim tsc_is_invariant = 1; 286814124c3SKonstantin Belousov if (cpu_feature & CPUID_SSE2) { 287814124c3SKonstantin Belousov tsc_timecounter.tc_get_timecount = 288814124c3SKonstantin Belousov tsc_get_timecount_lfence; 289814124c3SKonstantin Belousov } 290dd7d207dSJung-uk Kim break; 291dd7d207dSJung-uk Kim } 292dd7d207dSJung-uk Kim 293ce3bf750SKonstantin Belousov if (!TUNABLE_INT_FETCH("machdep.disable_tsc_calibration", 294ce3bf750SKonstantin Belousov &tsc_skip_calibration)) { 295ce3bf750SKonstantin Belousov /* 296ce3bf750SKonstantin Belousov * User did not give the order about calibration. 297ce3bf750SKonstantin Belousov * If he did, we do not try to guess. 298ce3bf750SKonstantin Belousov * 299ce3bf750SKonstantin Belousov * Otherwise, if ACPI FADT reports that the platform 300ce3bf750SKonstantin Belousov * is legacy-free and CPUID provides TSC frequency, 301ce3bf750SKonstantin Belousov * use it. The calibration could fail anyway since 302ce3bf750SKonstantin Belousov * ISA timer can be absent or power gated. 303ce3bf750SKonstantin Belousov */ 304ce3bf750SKonstantin Belousov if (acpi_get_fadt_bootflags(&bootflags) && 305ce3bf750SKonstantin Belousov (bootflags & ACPI_FADT_LEGACY_DEVICES) == 0 && 306ce3bf750SKonstantin Belousov tsc_freq_cpuid()) { 307ce3bf750SKonstantin Belousov printf("Skipping TSC calibration since no legacy " 308ce3bf750SKonstantin Belousov "devices reported by FADT and CPUID works\n"); 309ce3bf750SKonstantin Belousov tsc_skip_calibration = 1; 310ce3bf750SKonstantin Belousov } 311ce3bf750SKonstantin Belousov } 312a4e4127fSJung-uk Kim if (tsc_skip_calibration) { 313506a906cSKonstantin Belousov if (tsc_freq_cpuid()) 314506a906cSKonstantin Belousov ; 315506a906cSKonstantin Belousov else if (cpu_vendor_id == CPU_VENDOR_INTEL) 316a4e4127fSJung-uk Kim tsc_freq_intel(); 317506a906cSKonstantin Belousov } else { 318a4e4127fSJung-uk Kim if (bootverbose) 319a4e4127fSJung-uk Kim printf("Calibrating TSC clock ... "); 320a4e4127fSJung-uk Kim tsc1 = rdtsc(); 321a4e4127fSJung-uk Kim DELAY(1000000); 322a4e4127fSJung-uk Kim tsc2 = rdtsc(); 323a4e4127fSJung-uk Kim tsc_freq = tsc2 - tsc1; 324506a906cSKonstantin Belousov } 325a4e4127fSJung-uk Kim if (bootverbose) 326a4e4127fSJung-uk Kim printf("TSC clock: %ju Hz\n", (intmax_t)tsc_freq); 327a4e4127fSJung-uk Kim } 328a4e4127fSJung-uk Kim 329a4e4127fSJung-uk Kim void 330a4e4127fSJung-uk Kim init_TSC(void) 331a4e4127fSJung-uk Kim { 332a4e4127fSJung-uk Kim 333a4e4127fSJung-uk Kim if ((cpu_feature & CPUID_TSC) == 0 || tsc_disabled) 334a4e4127fSJung-uk Kim return; 335a4e4127fSJung-uk Kim 336fe760cfaSJohn Baldwin #ifdef __i386__ 337fe760cfaSJohn Baldwin /* The TSC is known to be broken on certain CPUs. */ 338fe760cfaSJohn Baldwin switch (cpu_vendor_id) { 339fe760cfaSJohn Baldwin case CPU_VENDOR_AMD: 340fe760cfaSJohn Baldwin switch (cpu_id & 0xFF0) { 341fe760cfaSJohn Baldwin case 0x500: 342fe760cfaSJohn Baldwin /* K5 Model 0 */ 343fe760cfaSJohn Baldwin return; 344fe760cfaSJohn Baldwin } 345fe760cfaSJohn Baldwin break; 346fe760cfaSJohn Baldwin case CPU_VENDOR_CENTAUR: 347fe760cfaSJohn Baldwin switch (cpu_id & 0xff0) { 348fe760cfaSJohn Baldwin case 0x540: 349fe760cfaSJohn Baldwin /* 350fe760cfaSJohn Baldwin * http://www.centtech.com/c6_data_sheet.pdf 351fe760cfaSJohn Baldwin * 352fe760cfaSJohn Baldwin * I-12 RDTSC may return incoherent values in EDX:EAX 353fe760cfaSJohn Baldwin * I-13 RDTSC hangs when certain event counters are used 354fe760cfaSJohn Baldwin */ 355fe760cfaSJohn Baldwin return; 356fe760cfaSJohn Baldwin } 357fe760cfaSJohn Baldwin break; 358fe760cfaSJohn Baldwin case CPU_VENDOR_NSC: 359fe760cfaSJohn Baldwin switch (cpu_id & 0xff0) { 360fe760cfaSJohn Baldwin case 0x540: 361fe760cfaSJohn Baldwin if ((cpu_id & CPUID_STEPPING) == 0) 362fe760cfaSJohn Baldwin return; 363fe760cfaSJohn Baldwin break; 364fe760cfaSJohn Baldwin } 365fe760cfaSJohn Baldwin break; 366fe760cfaSJohn Baldwin } 367fe760cfaSJohn Baldwin #endif 368fe760cfaSJohn Baldwin 369a4e4127fSJung-uk Kim probe_tsc_freq(); 370a4e4127fSJung-uk Kim 371dd7d207dSJung-uk Kim /* 372dd7d207dSJung-uk Kim * Inform CPU accounting about our boot-time clock rate. This will 373dd7d207dSJung-uk Kim * be updated if someone loads a cpufreq driver after boot that 374dd7d207dSJung-uk Kim * discovers a new max frequency. 375dd7d207dSJung-uk Kim */ 376a4e4127fSJung-uk Kim if (tsc_freq != 0) 3775ac44f72SJung-uk Kim set_cputicker(rdtsc, tsc_freq, !tsc_is_invariant); 378dd7d207dSJung-uk Kim 379dd7d207dSJung-uk Kim if (tsc_is_invariant) 380dd7d207dSJung-uk Kim return; 381dd7d207dSJung-uk Kim 382dd7d207dSJung-uk Kim /* Register to find out about changes in CPU frequency. */ 383dd7d207dSJung-uk Kim tsc_pre_tag = EVENTHANDLER_REGISTER(cpufreq_pre_change, 384dd7d207dSJung-uk Kim tsc_freq_changing, NULL, EVENTHANDLER_PRI_FIRST); 385dd7d207dSJung-uk Kim tsc_post_tag = EVENTHANDLER_REGISTER(cpufreq_post_change, 386dd7d207dSJung-uk Kim tsc_freq_changed, NULL, EVENTHANDLER_PRI_FIRST); 387dd7d207dSJung-uk Kim tsc_levels_tag = EVENTHANDLER_REGISTER(cpufreq_levels_changed, 388dd7d207dSJung-uk Kim tsc_levels_changed, NULL, EVENTHANDLER_PRI_ANY); 389dd7d207dSJung-uk Kim } 390dd7d207dSJung-uk Kim 39165e7d70bSJung-uk Kim #ifdef SMP 39265e7d70bSJung-uk Kim 393814124c3SKonstantin Belousov /* 394814124c3SKonstantin Belousov * RDTSC is not a serializing instruction, and does not drain 395814124c3SKonstantin Belousov * instruction stream, so we need to drain the stream before executing 396814124c3SKonstantin Belousov * it. It could be fixed by use of RDTSCP, except the instruction is 397814124c3SKonstantin Belousov * not available everywhere. 398814124c3SKonstantin Belousov * 399814124c3SKonstantin Belousov * Use CPUID for draining in the boot-time SMP constistency test. The 400814124c3SKonstantin Belousov * timecounters use MFENCE for AMD CPUs, and LFENCE for others (Intel 401814124c3SKonstantin Belousov * and VIA) when SSE2 is present, and nothing on older machines which 402814124c3SKonstantin Belousov * also do not issue RDTSC prematurely. There, testing for SSE2 and 403e1a18e46SKonstantin Belousov * vendor is too cumbersome, and we learn about TSC presence from CPUID. 404814124c3SKonstantin Belousov * 405814124c3SKonstantin Belousov * Do not use do_cpuid(), since we do not need CPUID results, which 406814124c3SKonstantin Belousov * have to be written into memory with do_cpuid(). 407814124c3SKonstantin Belousov */ 40865e7d70bSJung-uk Kim #define TSC_READ(x) \ 40965e7d70bSJung-uk Kim static void \ 41065e7d70bSJung-uk Kim tsc_read_##x(void *arg) \ 41165e7d70bSJung-uk Kim { \ 4127bfcb3bbSJim Harris uint64_t *tsc = arg; \ 41365e7d70bSJung-uk Kim u_int cpu = PCPU_GET(cpuid); \ 41465e7d70bSJung-uk Kim \ 415814124c3SKonstantin Belousov __asm __volatile("cpuid" : : : "eax", "ebx", "ecx", "edx"); \ 4167bfcb3bbSJim Harris tsc[cpu * 3 + x] = rdtsc(); \ 41765e7d70bSJung-uk Kim } 41865e7d70bSJung-uk Kim TSC_READ(0) 41965e7d70bSJung-uk Kim TSC_READ(1) 42065e7d70bSJung-uk Kim TSC_READ(2) 42165e7d70bSJung-uk Kim #undef TSC_READ 42265e7d70bSJung-uk Kim 42365e7d70bSJung-uk Kim #define N 1000 42465e7d70bSJung-uk Kim 42565e7d70bSJung-uk Kim static void 42665e7d70bSJung-uk Kim comp_smp_tsc(void *arg) 42765e7d70bSJung-uk Kim { 4287bfcb3bbSJim Harris uint64_t *tsc; 4297bfcb3bbSJim Harris int64_t d1, d2; 43065e7d70bSJung-uk Kim u_int cpu = PCPU_GET(cpuid); 43165e7d70bSJung-uk Kim u_int i, j, size; 43265e7d70bSJung-uk Kim 43365e7d70bSJung-uk Kim size = (mp_maxid + 1) * 3; 43465e7d70bSJung-uk Kim for (i = 0, tsc = arg; i < N; i++, tsc += size) 43565e7d70bSJung-uk Kim CPU_FOREACH(j) { 43665e7d70bSJung-uk Kim if (j == cpu) 43765e7d70bSJung-uk Kim continue; 43865e7d70bSJung-uk Kim d1 = tsc[cpu * 3 + 1] - tsc[j * 3]; 43965e7d70bSJung-uk Kim d2 = tsc[cpu * 3 + 2] - tsc[j * 3 + 1]; 44065e7d70bSJung-uk Kim if (d1 <= 0 || d2 <= 0) { 44165e7d70bSJung-uk Kim smp_tsc = 0; 44265e7d70bSJung-uk Kim return; 44365e7d70bSJung-uk Kim } 44465e7d70bSJung-uk Kim } 44565e7d70bSJung-uk Kim } 44665e7d70bSJung-uk Kim 447b2c63698SAlexander Motin static void 448b2c63698SAlexander Motin adj_smp_tsc(void *arg) 449b2c63698SAlexander Motin { 450b2c63698SAlexander Motin uint64_t *tsc; 451b2c63698SAlexander Motin int64_t d, min, max; 452b2c63698SAlexander Motin u_int cpu = PCPU_GET(cpuid); 453b2c63698SAlexander Motin u_int first, i, size; 454b2c63698SAlexander Motin 455b2c63698SAlexander Motin first = CPU_FIRST(); 456b2c63698SAlexander Motin if (cpu == first) 457b2c63698SAlexander Motin return; 458b2c63698SAlexander Motin min = INT64_MIN; 459b2c63698SAlexander Motin max = INT64_MAX; 460b2c63698SAlexander Motin size = (mp_maxid + 1) * 3; 461b2c63698SAlexander Motin for (i = 0, tsc = arg; i < N; i++, tsc += size) { 462b2c63698SAlexander Motin d = tsc[first * 3] - tsc[cpu * 3 + 1]; 463b2c63698SAlexander Motin if (d > min) 464b2c63698SAlexander Motin min = d; 465b2c63698SAlexander Motin d = tsc[first * 3 + 1] - tsc[cpu * 3 + 2]; 466b2c63698SAlexander Motin if (d > min) 467b2c63698SAlexander Motin min = d; 468b2c63698SAlexander Motin d = tsc[first * 3 + 1] - tsc[cpu * 3]; 469b2c63698SAlexander Motin if (d < max) 470b2c63698SAlexander Motin max = d; 471b2c63698SAlexander Motin d = tsc[first * 3 + 2] - tsc[cpu * 3 + 1]; 472b2c63698SAlexander Motin if (d < max) 473b2c63698SAlexander Motin max = d; 474b2c63698SAlexander Motin } 475b2c63698SAlexander Motin if (min > max) 476b2c63698SAlexander Motin return; 477b2c63698SAlexander Motin d = min / 2 + max / 2; 478b2c63698SAlexander Motin __asm __volatile ( 479b2c63698SAlexander Motin "movl $0x10, %%ecx\n\t" 480b2c63698SAlexander Motin "rdmsr\n\t" 481b2c63698SAlexander Motin "addl %%edi, %%eax\n\t" 482b2c63698SAlexander Motin "adcl %%esi, %%edx\n\t" 483b2c63698SAlexander Motin "wrmsr\n" 484b2c63698SAlexander Motin : /* No output */ 485b2c63698SAlexander Motin : "D" ((uint32_t)d), "S" ((uint32_t)(d >> 32)) 486b2c63698SAlexander Motin : "ax", "cx", "dx", "cc" 487b2c63698SAlexander Motin ); 488b2c63698SAlexander Motin } 489b2c63698SAlexander Motin 49065e7d70bSJung-uk Kim static int 491279be68bSAndriy Gapon test_tsc(int adj_max_count) 49265e7d70bSJung-uk Kim { 4937bfcb3bbSJim Harris uint64_t *data, *tsc; 494b2c63698SAlexander Motin u_int i, size, adj; 49565e7d70bSJung-uk Kim 496e7f1427dSKonstantin Belousov if ((!smp_tsc && !tsc_is_invariant) || vm_guest) 49765e7d70bSJung-uk Kim return (-100); 49865e7d70bSJung-uk Kim size = (mp_maxid + 1) * 3; 49965e7d70bSJung-uk Kim data = malloc(sizeof(*data) * size * N, M_TEMP, M_WAITOK); 500b2c63698SAlexander Motin adj = 0; 501b2c63698SAlexander Motin retry: 50265e7d70bSJung-uk Kim for (i = 0, tsc = data; i < N; i++, tsc += size) 50365e7d70bSJung-uk Kim smp_rendezvous(tsc_read_0, tsc_read_1, tsc_read_2, tsc); 50465e7d70bSJung-uk Kim smp_tsc = 1; /* XXX */ 50567d955aaSPatrick Kelsey smp_rendezvous(smp_no_rendezvous_barrier, comp_smp_tsc, 50667d955aaSPatrick Kelsey smp_no_rendezvous_barrier, data); 507279be68bSAndriy Gapon if (!smp_tsc && adj < adj_max_count) { 508b2c63698SAlexander Motin adj++; 50967d955aaSPatrick Kelsey smp_rendezvous(smp_no_rendezvous_barrier, adj_smp_tsc, 51067d955aaSPatrick Kelsey smp_no_rendezvous_barrier, data); 511b2c63698SAlexander Motin goto retry; 512b2c63698SAlexander Motin } 51365e7d70bSJung-uk Kim free(data, M_TEMP); 51465e7d70bSJung-uk Kim if (bootverbose) 515b2c63698SAlexander Motin printf("SMP: %sed TSC synchronization test%s\n", 516b2c63698SAlexander Motin smp_tsc ? "pass" : "fail", 517b2c63698SAlexander Motin adj > 0 ? " after adjustment" : ""); 51826e6537aSJung-uk Kim if (smp_tsc && tsc_is_invariant) { 51926e6537aSJung-uk Kim switch (cpu_vendor_id) { 52026e6537aSJung-uk Kim case CPU_VENDOR_AMD: 52126e6537aSJung-uk Kim /* 52226e6537aSJung-uk Kim * Starting with Family 15h processors, TSC clock 52326e6537aSJung-uk Kim * source is in the north bridge. Check whether 52426e6537aSJung-uk Kim * we have a single-socket/multi-core platform. 52526e6537aSJung-uk Kim * XXX Need more work for complex cases. 52626e6537aSJung-uk Kim */ 52726e6537aSJung-uk Kim if (CPUID_TO_FAMILY(cpu_id) < 0x15 || 52826e6537aSJung-uk Kim (amd_feature2 & AMDID2_CMP) == 0 || 52926e6537aSJung-uk Kim smp_cpus > (cpu_procinfo2 & AMDID_CMP_CORES) + 1) 53026e6537aSJung-uk Kim break; 53126e6537aSJung-uk Kim return (1000); 53226e6537aSJung-uk Kim case CPU_VENDOR_INTEL: 53326e6537aSJung-uk Kim /* 53426e6537aSJung-uk Kim * XXX Assume Intel platforms have synchronized TSCs. 53526e6537aSJung-uk Kim */ 53626e6537aSJung-uk Kim return (1000); 53726e6537aSJung-uk Kim } 53826e6537aSJung-uk Kim return (800); 53926e6537aSJung-uk Kim } 54026e6537aSJung-uk Kim return (-100); 54165e7d70bSJung-uk Kim } 54265e7d70bSJung-uk Kim 54365e7d70bSJung-uk Kim #undef N 54465e7d70bSJung-uk Kim 54565e7d70bSJung-uk Kim #endif /* SMP */ 54665e7d70bSJung-uk Kim 54765e7d70bSJung-uk Kim static void 548dd7d207dSJung-uk Kim init_TSC_tc(void) 549dd7d207dSJung-uk Kim { 55095f2f098SJung-uk Kim uint64_t max_freq; 55195f2f098SJung-uk Kim int shift; 552dd7d207dSJung-uk Kim 55338b8542cSJung-uk Kim if ((cpu_feature & CPUID_TSC) == 0 || tsc_disabled) 554dd7d207dSJung-uk Kim return; 555dd7d207dSJung-uk Kim 556dd7d207dSJung-uk Kim /* 55795f2f098SJung-uk Kim * Limit timecounter frequency to fit in an int and prevent it from 55895f2f098SJung-uk Kim * overflowing too fast. 55995f2f098SJung-uk Kim */ 56095f2f098SJung-uk Kim max_freq = UINT_MAX; 56195f2f098SJung-uk Kim 56295f2f098SJung-uk Kim /* 563dd7d207dSJung-uk Kim * We can not use the TSC if we support APM. Precise timekeeping 564dd7d207dSJung-uk Kim * on an APM'ed machine is at best a fools pursuit, since 565dd7d207dSJung-uk Kim * any and all of the time spent in various SMM code can't 566dd7d207dSJung-uk Kim * be reliably accounted for. Reading the RTC is your only 567dd7d207dSJung-uk Kim * source of reliable time info. The i8254 loses too, of course, 568dd7d207dSJung-uk Kim * but we need to have some kind of time... 569dd7d207dSJung-uk Kim * We don't know at this point whether APM is going to be used 570dd7d207dSJung-uk Kim * or not, nor when it might be activated. Play it safe. 571dd7d207dSJung-uk Kim */ 572dd7d207dSJung-uk Kim if (power_pm_get_type() == POWER_PM_TYPE_APM) { 573dd7d207dSJung-uk Kim tsc_timecounter.tc_quality = -1000; 574dd7d207dSJung-uk Kim if (bootverbose) 575dd7d207dSJung-uk Kim printf("TSC timecounter disabled: APM enabled.\n"); 57665e7d70bSJung-uk Kim goto init; 577dd7d207dSJung-uk Kim } 578dd7d207dSJung-uk Kim 579a49399a9SJung-uk Kim /* 58092597e06SJohn Baldwin * Intel CPUs without a C-state invariant TSC can stop the TSC 581d1411416SJohn Baldwin * in either C2 or C3. Disable use of C2 and C3 while using 582d1411416SJohn Baldwin * the TSC as the timecounter. The timecounter can be changed 583d1411416SJohn Baldwin * to enable C2 and C3. 584d1411416SJohn Baldwin * 585d1411416SJohn Baldwin * Note that the TSC is used as the cputicker for computing 586d1411416SJohn Baldwin * thread runtime regardless of the timecounter setting, so 587d1411416SJohn Baldwin * using an alternate timecounter and enabling C2 or C3 can 588d1411416SJohn Baldwin * result incorrect runtimes for kernel idle threads (but not 589d1411416SJohn Baldwin * for any non-idle threads). 590a49399a9SJung-uk Kim */ 5918cd59625SKonstantin Belousov if (cpu_vendor_id == CPU_VENDOR_INTEL && 592a49399a9SJung-uk Kim (amd_pminfo & AMDPM_TSC_INVARIANT) == 0) { 59392597e06SJohn Baldwin tsc_timecounter.tc_flags |= TC_FLAGS_C2STOP; 594a49399a9SJung-uk Kim if (bootverbose) 595d1411416SJohn Baldwin printf("TSC timecounter disables C2 and C3.\n"); 596a49399a9SJung-uk Kim } 597a49399a9SJung-uk Kim 598dd7d207dSJung-uk Kim /* 599e7f1427dSKonstantin Belousov * We can not use the TSC in SMP mode unless the TSCs on all CPUs 600e7f1427dSKonstantin Belousov * are synchronized. If the user is sure that the system has 601e7f1427dSKonstantin Belousov * synchronized TSCs, set kern.timecounter.smp_tsc tunable to a 602e7f1427dSKonstantin Belousov * non-zero value. The TSC seems unreliable in virtualized SMP 6035cf8ac1bSMike Silbersack * environments, so it is set to a negative quality in those cases. 604dd7d207dSJung-uk Kim */ 605ba79ab82SAndriy Gapon #ifdef SMP 606e7f1427dSKonstantin Belousov if (mp_ncpus > 1) 607279be68bSAndriy Gapon tsc_timecounter.tc_quality = test_tsc(smp_tsc_adjust); 608ba79ab82SAndriy Gapon else 609ba79ab82SAndriy Gapon #endif /* SMP */ 610ba79ab82SAndriy Gapon if (tsc_is_invariant) 61126e6537aSJung-uk Kim tsc_timecounter.tc_quality = 1000; 612e7f1427dSKonstantin Belousov max_freq >>= tsc_shift; 61326e6537aSJung-uk Kim 61465e7d70bSJung-uk Kim init: 615e7f1427dSKonstantin Belousov for (shift = 0; shift <= 31 && (tsc_freq >> shift) > max_freq; shift++) 61695f2f098SJung-uk Kim ; 617e7f1427dSKonstantin Belousov if ((cpu_feature & CPUID_SSE2) != 0 && mp_ncpus > 1) { 618814124c3SKonstantin Belousov if (cpu_vendor_id == CPU_VENDOR_AMD) { 619e7f1427dSKonstantin Belousov tsc_timecounter.tc_get_timecount = shift > 0 ? 620e7f1427dSKonstantin Belousov tsc_get_timecount_low_mfence : 621e7f1427dSKonstantin Belousov tsc_get_timecount_mfence; 622814124c3SKonstantin Belousov } else { 623e7f1427dSKonstantin Belousov tsc_timecounter.tc_get_timecount = shift > 0 ? 624e7f1427dSKonstantin Belousov tsc_get_timecount_low_lfence : 625e7f1427dSKonstantin Belousov tsc_get_timecount_lfence; 626814124c3SKonstantin Belousov } 627e7f1427dSKonstantin Belousov } else { 628e7f1427dSKonstantin Belousov tsc_timecounter.tc_get_timecount = shift > 0 ? 629e7f1427dSKonstantin Belousov tsc_get_timecount_low : tsc_get_timecount; 630e7f1427dSKonstantin Belousov } 631e7f1427dSKonstantin Belousov if (shift > 0) { 63295f2f098SJung-uk Kim tsc_timecounter.tc_name = "TSC-low"; 63395f2f098SJung-uk Kim if (bootverbose) 634bc8e4ad2SJung-uk Kim printf("TSC timecounter discards lower %d bit(s)\n", 63595f2f098SJung-uk Kim shift); 63695f2f098SJung-uk Kim } 637bc34c87eSJung-uk Kim if (tsc_freq != 0) { 63895f2f098SJung-uk Kim tsc_timecounter.tc_frequency = tsc_freq >> shift; 63995f2f098SJung-uk Kim tsc_timecounter.tc_priv = (void *)(intptr_t)shift; 640dd7d207dSJung-uk Kim tc_init(&tsc_timecounter); 641dd7d207dSJung-uk Kim } 642dd7d207dSJung-uk Kim } 64365e7d70bSJung-uk Kim SYSINIT(tsc_tc, SI_SUB_SMP, SI_ORDER_ANY, init_TSC_tc, NULL); 644dd7d207dSJung-uk Kim 645279be68bSAndriy Gapon void 646279be68bSAndriy Gapon resume_TSC(void) 647279be68bSAndriy Gapon { 648ba79ab82SAndriy Gapon #ifdef SMP 649279be68bSAndriy Gapon int quality; 650279be68bSAndriy Gapon 651279be68bSAndriy Gapon /* If TSC was not good on boot, it is unlikely to become good now. */ 652279be68bSAndriy Gapon if (tsc_timecounter.tc_quality < 0) 653279be68bSAndriy Gapon return; 654279be68bSAndriy Gapon /* Nothing to do with UP. */ 655279be68bSAndriy Gapon if (mp_ncpus < 2) 656279be68bSAndriy Gapon return; 657279be68bSAndriy Gapon 658279be68bSAndriy Gapon /* 659279be68bSAndriy Gapon * If TSC was good, a single synchronization should be enough, 660279be68bSAndriy Gapon * but honour smp_tsc_adjust if it's set. 661279be68bSAndriy Gapon */ 662279be68bSAndriy Gapon quality = test_tsc(MAX(smp_tsc_adjust, 1)); 663279be68bSAndriy Gapon if (quality != tsc_timecounter.tc_quality) { 664279be68bSAndriy Gapon printf("TSC timecounter quality changed: %d -> %d\n", 665279be68bSAndriy Gapon tsc_timecounter.tc_quality, quality); 666279be68bSAndriy Gapon tsc_timecounter.tc_quality = quality; 667279be68bSAndriy Gapon } 668ba79ab82SAndriy Gapon #endif /* SMP */ 669279be68bSAndriy Gapon } 670279be68bSAndriy Gapon 671dd7d207dSJung-uk Kim /* 672dd7d207dSJung-uk Kim * When cpufreq levels change, find out about the (new) max frequency. We 673dd7d207dSJung-uk Kim * use this to update CPU accounting in case it got a lower estimate at boot. 674dd7d207dSJung-uk Kim */ 675dd7d207dSJung-uk Kim static void 676dd7d207dSJung-uk Kim tsc_levels_changed(void *arg, int unit) 677dd7d207dSJung-uk Kim { 678dd7d207dSJung-uk Kim device_t cf_dev; 679dd7d207dSJung-uk Kim struct cf_level *levels; 680dd7d207dSJung-uk Kim int count, error; 681dd7d207dSJung-uk Kim uint64_t max_freq; 682dd7d207dSJung-uk Kim 683dd7d207dSJung-uk Kim /* Only use values from the first CPU, assuming all are equal. */ 684dd7d207dSJung-uk Kim if (unit != 0) 685dd7d207dSJung-uk Kim return; 686dd7d207dSJung-uk Kim 687dd7d207dSJung-uk Kim /* Find the appropriate cpufreq device instance. */ 688dd7d207dSJung-uk Kim cf_dev = devclass_get_device(devclass_find("cpufreq"), unit); 689dd7d207dSJung-uk Kim if (cf_dev == NULL) { 690dd7d207dSJung-uk Kim printf("tsc_levels_changed() called but no cpufreq device?\n"); 691dd7d207dSJung-uk Kim return; 692dd7d207dSJung-uk Kim } 693dd7d207dSJung-uk Kim 694dd7d207dSJung-uk Kim /* Get settings from the device and find the max frequency. */ 695dd7d207dSJung-uk Kim count = 64; 696dd7d207dSJung-uk Kim levels = malloc(count * sizeof(*levels), M_TEMP, M_NOWAIT); 697dd7d207dSJung-uk Kim if (levels == NULL) 698dd7d207dSJung-uk Kim return; 699dd7d207dSJung-uk Kim error = CPUFREQ_LEVELS(cf_dev, levels, &count); 700dd7d207dSJung-uk Kim if (error == 0 && count != 0) { 701dd7d207dSJung-uk Kim max_freq = (uint64_t)levels[0].total_set.freq * 1000000; 702dd7d207dSJung-uk Kim set_cputicker(rdtsc, max_freq, 1); 703dd7d207dSJung-uk Kim } else 704dd7d207dSJung-uk Kim printf("tsc_levels_changed: no max freq found\n"); 705dd7d207dSJung-uk Kim free(levels, M_TEMP); 706dd7d207dSJung-uk Kim } 707dd7d207dSJung-uk Kim 708dd7d207dSJung-uk Kim /* 709dd7d207dSJung-uk Kim * If the TSC timecounter is in use, veto the pending change. It may be 710dd7d207dSJung-uk Kim * possible in the future to handle a dynamically-changing timecounter rate. 711dd7d207dSJung-uk Kim */ 712dd7d207dSJung-uk Kim static void 713dd7d207dSJung-uk Kim tsc_freq_changing(void *arg, const struct cf_level *level, int *status) 714dd7d207dSJung-uk Kim { 715dd7d207dSJung-uk Kim 716dd7d207dSJung-uk Kim if (*status != 0 || timecounter != &tsc_timecounter) 717dd7d207dSJung-uk Kim return; 718dd7d207dSJung-uk Kim 719dd7d207dSJung-uk Kim printf("timecounter TSC must not be in use when " 720dd7d207dSJung-uk Kim "changing frequencies; change denied\n"); 721dd7d207dSJung-uk Kim *status = EBUSY; 722dd7d207dSJung-uk Kim } 723dd7d207dSJung-uk Kim 724dd7d207dSJung-uk Kim /* Update TSC freq with the value indicated by the caller. */ 725dd7d207dSJung-uk Kim static void 726dd7d207dSJung-uk Kim tsc_freq_changed(void *arg, const struct cf_level *level, int status) 727dd7d207dSJung-uk Kim { 7283453537fSJung-uk Kim uint64_t freq; 729dd7d207dSJung-uk Kim 730dd7d207dSJung-uk Kim /* If there was an error during the transition, don't do anything. */ 73179422085SJung-uk Kim if (tsc_disabled || status != 0) 732dd7d207dSJung-uk Kim return; 733dd7d207dSJung-uk Kim 734dd7d207dSJung-uk Kim /* Total setting for this level gives the new frequency in MHz. */ 7353453537fSJung-uk Kim freq = (uint64_t)level->total_set.freq * 1000000; 7363453537fSJung-uk Kim atomic_store_rel_64(&tsc_freq, freq); 73795f2f098SJung-uk Kim tsc_timecounter.tc_frequency = 73895f2f098SJung-uk Kim freq >> (int)(intptr_t)tsc_timecounter.tc_priv; 739dd7d207dSJung-uk Kim } 740dd7d207dSJung-uk Kim 741dd7d207dSJung-uk Kim static int 742dd7d207dSJung-uk Kim sysctl_machdep_tsc_freq(SYSCTL_HANDLER_ARGS) 743dd7d207dSJung-uk Kim { 744dd7d207dSJung-uk Kim int error; 745dd7d207dSJung-uk Kim uint64_t freq; 746dd7d207dSJung-uk Kim 7473453537fSJung-uk Kim freq = atomic_load_acq_64(&tsc_freq); 7483453537fSJung-uk Kim if (freq == 0) 749dd7d207dSJung-uk Kim return (EOPNOTSUPP); 750cbc134adSMatthew D Fleming error = sysctl_handle_64(oidp, &freq, 0, req); 7517ebbcb21SJung-uk Kim if (error == 0 && req->newptr != NULL) { 7523453537fSJung-uk Kim atomic_store_rel_64(&tsc_freq, freq); 753bc8e4ad2SJung-uk Kim atomic_store_rel_64(&tsc_timecounter.tc_frequency, 754bc8e4ad2SJung-uk Kim freq >> (int)(intptr_t)tsc_timecounter.tc_priv); 7557ebbcb21SJung-uk Kim } 756dd7d207dSJung-uk Kim return (error); 757dd7d207dSJung-uk Kim } 758dd7d207dSJung-uk Kim 759cbc134adSMatthew D Fleming SYSCTL_PROC(_machdep, OID_AUTO, tsc_freq, CTLTYPE_U64 | CTLFLAG_RW, 7605331d61dSJung-uk Kim 0, 0, sysctl_machdep_tsc_freq, "QU", "Time Stamp Counter frequency"); 761dd7d207dSJung-uk Kim 762727c7b2dSJung-uk Kim static u_int 76395f2f098SJung-uk Kim tsc_get_timecount(struct timecounter *tc __unused) 764dd7d207dSJung-uk Kim { 765727c7b2dSJung-uk Kim 766727c7b2dSJung-uk Kim return (rdtsc32()); 767dd7d207dSJung-uk Kim } 76895f2f098SJung-uk Kim 769814124c3SKonstantin Belousov static inline u_int 770bc8e4ad2SJung-uk Kim tsc_get_timecount_low(struct timecounter *tc) 77195f2f098SJung-uk Kim { 7725df88f46SJung-uk Kim uint32_t rv; 77395f2f098SJung-uk Kim 7745df88f46SJung-uk Kim __asm __volatile("rdtsc; shrd %%cl, %%edx, %0" 7755df88f46SJung-uk Kim : "=a" (rv) : "c" ((int)(intptr_t)tc->tc_priv) : "edx"); 7765df88f46SJung-uk Kim return (rv); 77795f2f098SJung-uk Kim } 778aea81038SKonstantin Belousov 779814124c3SKonstantin Belousov static u_int 780814124c3SKonstantin Belousov tsc_get_timecount_lfence(struct timecounter *tc __unused) 781814124c3SKonstantin Belousov { 782814124c3SKonstantin Belousov 783814124c3SKonstantin Belousov lfence(); 784814124c3SKonstantin Belousov return (rdtsc32()); 785814124c3SKonstantin Belousov } 786814124c3SKonstantin Belousov 787814124c3SKonstantin Belousov static u_int 788814124c3SKonstantin Belousov tsc_get_timecount_low_lfence(struct timecounter *tc) 789814124c3SKonstantin Belousov { 790814124c3SKonstantin Belousov 791814124c3SKonstantin Belousov lfence(); 792814124c3SKonstantin Belousov return (tsc_get_timecount_low(tc)); 793814124c3SKonstantin Belousov } 794814124c3SKonstantin Belousov 795814124c3SKonstantin Belousov static u_int 796814124c3SKonstantin Belousov tsc_get_timecount_mfence(struct timecounter *tc __unused) 797814124c3SKonstantin Belousov { 798814124c3SKonstantin Belousov 799814124c3SKonstantin Belousov mfence(); 800814124c3SKonstantin Belousov return (rdtsc32()); 801814124c3SKonstantin Belousov } 802814124c3SKonstantin Belousov 803814124c3SKonstantin Belousov static u_int 804814124c3SKonstantin Belousov tsc_get_timecount_low_mfence(struct timecounter *tc) 805814124c3SKonstantin Belousov { 806814124c3SKonstantin Belousov 807814124c3SKonstantin Belousov mfence(); 808814124c3SKonstantin Belousov return (tsc_get_timecount_low(tc)); 809814124c3SKonstantin Belousov } 810814124c3SKonstantin Belousov 81116808549SKonstantin Belousov static uint32_t 81216808549SKonstantin Belousov x86_tsc_vdso_timehands(struct vdso_timehands *vdso_th, struct timecounter *tc) 813aea81038SKonstantin Belousov { 814aea81038SKonstantin Belousov 81516808549SKonstantin Belousov vdso_th->th_algo = VDSO_TH_ALGO_X86_TSC; 816d1b1b600SNeel Natu vdso_th->th_x86_shift = (int)(intptr_t)tc->tc_priv; 81716808549SKonstantin Belousov vdso_th->th_x86_hpet_idx = 0xffffffff; 818aea81038SKonstantin Belousov bzero(vdso_th->th_res, sizeof(vdso_th->th_res)); 81916808549SKonstantin Belousov return (1); 820aea81038SKonstantin Belousov } 821aea81038SKonstantin Belousov 822aea81038SKonstantin Belousov #ifdef COMPAT_FREEBSD32 82316808549SKonstantin Belousov static uint32_t 82416808549SKonstantin Belousov x86_tsc_vdso_timehands32(struct vdso_timehands32 *vdso_th32, 825d1b1b600SNeel Natu struct timecounter *tc) 826aea81038SKonstantin Belousov { 827aea81038SKonstantin Belousov 82816808549SKonstantin Belousov vdso_th32->th_algo = VDSO_TH_ALGO_X86_TSC; 829d1b1b600SNeel Natu vdso_th32->th_x86_shift = (int)(intptr_t)tc->tc_priv; 83016808549SKonstantin Belousov vdso_th32->th_x86_hpet_idx = 0xffffffff; 831aea81038SKonstantin Belousov bzero(vdso_th32->th_res, sizeof(vdso_th32->th_res)); 83216808549SKonstantin Belousov return (1); 833aea81038SKonstantin Belousov } 834aea81038SKonstantin Belousov #endif 835