1dd7d207dSJung-uk Kim /*- 2ebf5747bSPedro F. Giffuni * SPDX-License-Identifier: BSD-2-Clause-FreeBSD 3ebf5747bSPedro F. Giffuni * 4dd7d207dSJung-uk Kim * Copyright (c) 1998-2003 Poul-Henning Kamp 5dd7d207dSJung-uk Kim * All rights reserved. 6dd7d207dSJung-uk Kim * 7dd7d207dSJung-uk Kim * Redistribution and use in source and binary forms, with or without 8dd7d207dSJung-uk Kim * modification, are permitted provided that the following conditions 9dd7d207dSJung-uk Kim * are met: 10dd7d207dSJung-uk Kim * 1. Redistributions of source code must retain the above copyright 11dd7d207dSJung-uk Kim * notice, this list of conditions and the following disclaimer. 12dd7d207dSJung-uk Kim * 2. Redistributions in binary form must reproduce the above copyright 13dd7d207dSJung-uk Kim * notice, this list of conditions and the following disclaimer in the 14dd7d207dSJung-uk Kim * documentation and/or other materials provided with the distribution. 15dd7d207dSJung-uk Kim * 16dd7d207dSJung-uk Kim * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND 17dd7d207dSJung-uk Kim * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 18dd7d207dSJung-uk Kim * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 19dd7d207dSJung-uk Kim * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE 20dd7d207dSJung-uk Kim * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 21dd7d207dSJung-uk Kim * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 22dd7d207dSJung-uk Kim * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 23dd7d207dSJung-uk Kim * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 24dd7d207dSJung-uk Kim * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 25dd7d207dSJung-uk Kim * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 26dd7d207dSJung-uk Kim * SUCH DAMAGE. 27dd7d207dSJung-uk Kim */ 28dd7d207dSJung-uk Kim 29dd7d207dSJung-uk Kim #include <sys/cdefs.h> 30dd7d207dSJung-uk Kim __FBSDID("$FreeBSD$"); 31dd7d207dSJung-uk Kim 32dd7d207dSJung-uk Kim #include "opt_clock.h" 33dd7d207dSJung-uk Kim 34dd7d207dSJung-uk Kim #include <sys/param.h> 35dd7d207dSJung-uk Kim #include <sys/bus.h> 36dd7d207dSJung-uk Kim #include <sys/cpu.h> 375da5812bSJung-uk Kim #include <sys/limits.h> 38dd7d207dSJung-uk Kim #include <sys/malloc.h> 39dd7d207dSJung-uk Kim #include <sys/systm.h> 40dd7d207dSJung-uk Kim #include <sys/sysctl.h> 41dd7d207dSJung-uk Kim #include <sys/time.h> 42dd7d207dSJung-uk Kim #include <sys/timetc.h> 43dd7d207dSJung-uk Kim #include <sys/kernel.h> 44dd7d207dSJung-uk Kim #include <sys/power.h> 45dd7d207dSJung-uk Kim #include <sys/smp.h> 46aea81038SKonstantin Belousov #include <sys/vdso.h> 47dd7d207dSJung-uk Kim #include <machine/clock.h> 48dd7d207dSJung-uk Kim #include <machine/cputypes.h> 49dd7d207dSJung-uk Kim #include <machine/md_var.h> 50dd7d207dSJung-uk Kim #include <machine/specialreg.h> 5101e1933dSJohn Baldwin #include <x86/vmware.h> 5216808549SKonstantin Belousov #include <dev/acpica/acpi_hpet.h> 53*ce3bf750SKonstantin Belousov #include <contrib/dev/acpica/include/acpi.h> 54dd7d207dSJung-uk Kim 55dd7d207dSJung-uk Kim #include "cpufreq_if.h" 56dd7d207dSJung-uk Kim 57dd7d207dSJung-uk Kim uint64_t tsc_freq; 58dd7d207dSJung-uk Kim int tsc_is_invariant; 59155094d7SJung-uk Kim int tsc_perf_stat; 60155094d7SJung-uk Kim 61dd7d207dSJung-uk Kim static eventhandler_tag tsc_levels_tag, tsc_pre_tag, tsc_post_tag; 62dd7d207dSJung-uk Kim 63dd7d207dSJung-uk Kim SYSCTL_INT(_kern_timecounter, OID_AUTO, invariant_tsc, CTLFLAG_RDTUN, 64dd7d207dSJung-uk Kim &tsc_is_invariant, 0, "Indicates whether the TSC is P-state invariant"); 65dd7d207dSJung-uk Kim 66dd7d207dSJung-uk Kim #ifdef SMP 671472b87fSNeel Natu int smp_tsc; 68dd7d207dSJung-uk Kim SYSCTL_INT(_kern_timecounter, OID_AUTO, smp_tsc, CTLFLAG_RDTUN, &smp_tsc, 0, 69dd7d207dSJung-uk Kim "Indicates whether the TSC is safe to use in SMP mode"); 70b2c63698SAlexander Motin 71b2c63698SAlexander Motin int smp_tsc_adjust = 0; 72b2c63698SAlexander Motin SYSCTL_INT(_kern_timecounter, OID_AUTO, smp_tsc_adjust, CTLFLAG_RDTUN, 73b2c63698SAlexander Motin &smp_tsc_adjust, 0, "Try to adjust TSC on APs to match BSP"); 74dd7d207dSJung-uk Kim #endif 75dd7d207dSJung-uk Kim 76e7f1427dSKonstantin Belousov static int tsc_shift = 1; 77e7f1427dSKonstantin Belousov SYSCTL_INT(_kern_timecounter, OID_AUTO, tsc_shift, CTLFLAG_RDTUN, 78e7f1427dSKonstantin Belousov &tsc_shift, 0, "Shift to pre-apply for the maximum TSC frequency"); 79e7f1427dSKonstantin Belousov 8079422085SJung-uk Kim static int tsc_disabled; 8179422085SJung-uk Kim SYSCTL_INT(_machdep, OID_AUTO, disable_tsc, CTLFLAG_RDTUN, &tsc_disabled, 0, 8279422085SJung-uk Kim "Disable x86 Time Stamp Counter"); 8379422085SJung-uk Kim 84a4e4127fSJung-uk Kim static int tsc_skip_calibration; 85*ce3bf750SKonstantin Belousov SYSCTL_INT(_machdep, OID_AUTO, disable_tsc_calibration, CTLFLAG_RDTUN | 86*ce3bf750SKonstantin Belousov CTLFLAG_NOFETCH, &tsc_skip_calibration, 0, 87*ce3bf750SKonstantin Belousov "Disable TSC frequency calibration"); 88a4e4127fSJung-uk Kim 89dd7d207dSJung-uk Kim static void tsc_freq_changed(void *arg, const struct cf_level *level, 90dd7d207dSJung-uk Kim int status); 91dd7d207dSJung-uk Kim static void tsc_freq_changing(void *arg, const struct cf_level *level, 92dd7d207dSJung-uk Kim int *status); 93dd7d207dSJung-uk Kim static unsigned tsc_get_timecount(struct timecounter *tc); 94814124c3SKonstantin Belousov static inline unsigned tsc_get_timecount_low(struct timecounter *tc); 95814124c3SKonstantin Belousov static unsigned tsc_get_timecount_lfence(struct timecounter *tc); 96814124c3SKonstantin Belousov static unsigned tsc_get_timecount_low_lfence(struct timecounter *tc); 97814124c3SKonstantin Belousov static unsigned tsc_get_timecount_mfence(struct timecounter *tc); 98814124c3SKonstantin Belousov static unsigned tsc_get_timecount_low_mfence(struct timecounter *tc); 99dd7d207dSJung-uk Kim static void tsc_levels_changed(void *arg, int unit); 10016808549SKonstantin Belousov static uint32_t x86_tsc_vdso_timehands(struct vdso_timehands *vdso_th, 10116808549SKonstantin Belousov struct timecounter *tc); 10216808549SKonstantin Belousov #ifdef COMPAT_FREEBSD32 10316808549SKonstantin Belousov static uint32_t x86_tsc_vdso_timehands32(struct vdso_timehands32 *vdso_th32, 10416808549SKonstantin Belousov struct timecounter *tc); 10516808549SKonstantin Belousov #endif 106dd7d207dSJung-uk Kim 107dd7d207dSJung-uk Kim static struct timecounter tsc_timecounter = { 10816808549SKonstantin Belousov .tc_get_timecount = tsc_get_timecount, 10916808549SKonstantin Belousov .tc_counter_mask = ~0u, 11016808549SKonstantin Belousov .tc_name = "TSC", 11116808549SKonstantin Belousov .tc_quality = 800, /* adjusted in code */ 11216808549SKonstantin Belousov .tc_fill_vdso_timehands = x86_tsc_vdso_timehands, 11316808549SKonstantin Belousov #ifdef COMPAT_FREEBSD32 11416808549SKonstantin Belousov .tc_fill_vdso_timehands32 = x86_tsc_vdso_timehands32, 11516808549SKonstantin Belousov #endif 116dd7d207dSJung-uk Kim }; 117dd7d207dSJung-uk Kim 11801e1933dSJohn Baldwin static void 1195da5812bSJung-uk Kim tsc_freq_vmware(void) 1205da5812bSJung-uk Kim { 1215da5812bSJung-uk Kim u_int regs[4]; 1225da5812bSJung-uk Kim 1235da5812bSJung-uk Kim if (hv_high >= 0x40000010) { 1245da5812bSJung-uk Kim do_cpuid(0x40000010, regs); 1255da5812bSJung-uk Kim tsc_freq = regs[0] * 1000; 1265da5812bSJung-uk Kim } else { 1275da5812bSJung-uk Kim vmware_hvcall(VMW_HVCMD_GETHZ, regs); 1285da5812bSJung-uk Kim if (regs[1] != UINT_MAX) 1295da5812bSJung-uk Kim tsc_freq = regs[0] | ((uint64_t)regs[1] << 32); 1305da5812bSJung-uk Kim } 1315da5812bSJung-uk Kim tsc_is_invariant = 1; 1325da5812bSJung-uk Kim } 1335da5812bSJung-uk Kim 134506a906cSKonstantin Belousov /* 135506a906cSKonstantin Belousov * Calculate TSC frequency using information from the CPUID leaf 0x15 136506a906cSKonstantin Belousov * 'Time Stamp Counter and Nominal Core Crystal Clock'. It should be 137506a906cSKonstantin Belousov * an improvement over the parsing of the CPU model name in 138506a906cSKonstantin Belousov * tsc_freq_intel(), when available. 139506a906cSKonstantin Belousov */ 140506a906cSKonstantin Belousov static bool 141506a906cSKonstantin Belousov tsc_freq_cpuid(void) 142506a906cSKonstantin Belousov { 143506a906cSKonstantin Belousov u_int regs[4]; 144506a906cSKonstantin Belousov 145506a906cSKonstantin Belousov if (cpu_high < 0x15) 146506a906cSKonstantin Belousov return (false); 147506a906cSKonstantin Belousov do_cpuid(0x15, regs); 148506a906cSKonstantin Belousov if (regs[0] == 0 || regs[1] == 0 || regs[2] == 0) 149506a906cSKonstantin Belousov return (false); 150506a906cSKonstantin Belousov tsc_freq = (uint64_t)regs[2] * regs[1] / regs[0]; 151506a906cSKonstantin Belousov return (true); 152506a906cSKonstantin Belousov } 153506a906cSKonstantin Belousov 154a4e4127fSJung-uk Kim static void 155a4e4127fSJung-uk Kim tsc_freq_intel(void) 156dd7d207dSJung-uk Kim { 157a4e4127fSJung-uk Kim char brand[48]; 158a4e4127fSJung-uk Kim u_int regs[4]; 159a4e4127fSJung-uk Kim uint64_t freq; 160a4e4127fSJung-uk Kim char *p; 161a4e4127fSJung-uk Kim u_int i; 162dd7d207dSJung-uk Kim 163a4e4127fSJung-uk Kim /* 164a4e4127fSJung-uk Kim * Intel Processor Identification and the CPUID Instruction 165a4e4127fSJung-uk Kim * Application Note 485. 166a4e4127fSJung-uk Kim * http://www.intel.com/assets/pdf/appnote/241618.pdf 167a4e4127fSJung-uk Kim */ 168a4e4127fSJung-uk Kim if (cpu_exthigh >= 0x80000004) { 169a4e4127fSJung-uk Kim p = brand; 170a4e4127fSJung-uk Kim for (i = 0x80000002; i < 0x80000005; i++) { 171a4e4127fSJung-uk Kim do_cpuid(i, regs); 172a4e4127fSJung-uk Kim memcpy(p, regs, sizeof(regs)); 173a4e4127fSJung-uk Kim p += sizeof(regs); 174a4e4127fSJung-uk Kim } 175a4e4127fSJung-uk Kim p = NULL; 176a4e4127fSJung-uk Kim for (i = 0; i < sizeof(brand) - 1; i++) 177a4e4127fSJung-uk Kim if (brand[i] == 'H' && brand[i + 1] == 'z') 178a4e4127fSJung-uk Kim p = brand + i; 179a4e4127fSJung-uk Kim if (p != NULL) { 180a4e4127fSJung-uk Kim p -= 5; 181a4e4127fSJung-uk Kim switch (p[4]) { 182a4e4127fSJung-uk Kim case 'M': 183a4e4127fSJung-uk Kim i = 1; 184a4e4127fSJung-uk Kim break; 185a4e4127fSJung-uk Kim case 'G': 186a4e4127fSJung-uk Kim i = 1000; 187a4e4127fSJung-uk Kim break; 188a4e4127fSJung-uk Kim case 'T': 189a4e4127fSJung-uk Kim i = 1000000; 190a4e4127fSJung-uk Kim break; 191a4e4127fSJung-uk Kim default: 192dd7d207dSJung-uk Kim return; 193a4e4127fSJung-uk Kim } 194a4e4127fSJung-uk Kim #define C2D(c) ((c) - '0') 195a4e4127fSJung-uk Kim if (p[1] == '.') { 196a4e4127fSJung-uk Kim freq = C2D(p[0]) * 1000; 197a4e4127fSJung-uk Kim freq += C2D(p[2]) * 100; 198a4e4127fSJung-uk Kim freq += C2D(p[3]) * 10; 199a4e4127fSJung-uk Kim freq *= i * 1000; 200a4e4127fSJung-uk Kim } else { 201a4e4127fSJung-uk Kim freq = C2D(p[0]) * 1000; 202a4e4127fSJung-uk Kim freq += C2D(p[1]) * 100; 203a4e4127fSJung-uk Kim freq += C2D(p[2]) * 10; 204a4e4127fSJung-uk Kim freq += C2D(p[3]); 205a4e4127fSJung-uk Kim freq *= i * 1000000; 206a4e4127fSJung-uk Kim } 207a4e4127fSJung-uk Kim #undef C2D 208a4e4127fSJung-uk Kim tsc_freq = freq; 209a4e4127fSJung-uk Kim } 210a4e4127fSJung-uk Kim } 211a4e4127fSJung-uk Kim } 212dd7d207dSJung-uk Kim 213a4e4127fSJung-uk Kim static void 214a4e4127fSJung-uk Kim probe_tsc_freq(void) 215a4e4127fSJung-uk Kim { 216155094d7SJung-uk Kim u_int regs[4]; 217a4e4127fSJung-uk Kim uint64_t tsc1, tsc2; 218*ce3bf750SKonstantin Belousov uint16_t bootflags; 219dd7d207dSJung-uk Kim 2205da5812bSJung-uk Kim if (cpu_high >= 6) { 2215da5812bSJung-uk Kim do_cpuid(6, regs); 2225da5812bSJung-uk Kim if ((regs[2] & CPUID_PERF_STAT) != 0) { 2235da5812bSJung-uk Kim /* 2245da5812bSJung-uk Kim * XXX Some emulators expose host CPUID without actual 2255da5812bSJung-uk Kim * support for these MSRs. We must test whether they 2265da5812bSJung-uk Kim * really work. 2275da5812bSJung-uk Kim */ 2285da5812bSJung-uk Kim wrmsr(MSR_MPERF, 0); 2295da5812bSJung-uk Kim wrmsr(MSR_APERF, 0); 2305da5812bSJung-uk Kim DELAY(10); 2315da5812bSJung-uk Kim if (rdmsr(MSR_MPERF) > 0 && rdmsr(MSR_APERF) > 0) 2325da5812bSJung-uk Kim tsc_perf_stat = 1; 2335da5812bSJung-uk Kim } 2345da5812bSJung-uk Kim } 2355da5812bSJung-uk Kim 23601e1933dSJohn Baldwin if (vm_guest == VM_GUEST_VMWARE) { 23701e1933dSJohn Baldwin tsc_freq_vmware(); 2385da5812bSJung-uk Kim return; 23901e1933dSJohn Baldwin } 2405da5812bSJung-uk Kim 241dd7d207dSJung-uk Kim switch (cpu_vendor_id) { 242dd7d207dSJung-uk Kim case CPU_VENDOR_AMD: 243a106a27cSJung-uk Kim if ((amd_pminfo & AMDPM_TSC_INVARIANT) != 0 || 244a106a27cSJung-uk Kim (vm_guest == VM_GUEST_NO && 245a106a27cSJung-uk Kim CPUID_TO_FAMILY(cpu_id) >= 0x10)) 246dd7d207dSJung-uk Kim tsc_is_invariant = 1; 247814124c3SKonstantin Belousov if (cpu_feature & CPUID_SSE2) { 248814124c3SKonstantin Belousov tsc_timecounter.tc_get_timecount = 249814124c3SKonstantin Belousov tsc_get_timecount_mfence; 250814124c3SKonstantin Belousov } 251dd7d207dSJung-uk Kim break; 252dd7d207dSJung-uk Kim case CPU_VENDOR_INTEL: 253a106a27cSJung-uk Kim if ((amd_pminfo & AMDPM_TSC_INVARIANT) != 0 || 254a106a27cSJung-uk Kim (vm_guest == VM_GUEST_NO && 255a106a27cSJung-uk Kim ((CPUID_TO_FAMILY(cpu_id) == 0x6 && 256dd7d207dSJung-uk Kim CPUID_TO_MODEL(cpu_id) >= 0xe) || 257dd7d207dSJung-uk Kim (CPUID_TO_FAMILY(cpu_id) == 0xf && 258a106a27cSJung-uk Kim CPUID_TO_MODEL(cpu_id) >= 0x3)))) 259dd7d207dSJung-uk Kim tsc_is_invariant = 1; 260814124c3SKonstantin Belousov if (cpu_feature & CPUID_SSE2) { 261814124c3SKonstantin Belousov tsc_timecounter.tc_get_timecount = 262814124c3SKonstantin Belousov tsc_get_timecount_lfence; 263814124c3SKonstantin Belousov } 264dd7d207dSJung-uk Kim break; 265dd7d207dSJung-uk Kim case CPU_VENDOR_CENTAUR: 266a106a27cSJung-uk Kim if (vm_guest == VM_GUEST_NO && 267a106a27cSJung-uk Kim CPUID_TO_FAMILY(cpu_id) == 0x6 && 268dd7d207dSJung-uk Kim CPUID_TO_MODEL(cpu_id) >= 0xf && 269dd7d207dSJung-uk Kim (rdmsr(0x1203) & 0x100000000ULL) == 0) 270dd7d207dSJung-uk Kim tsc_is_invariant = 1; 271814124c3SKonstantin Belousov if (cpu_feature & CPUID_SSE2) { 272814124c3SKonstantin Belousov tsc_timecounter.tc_get_timecount = 273814124c3SKonstantin Belousov tsc_get_timecount_lfence; 274814124c3SKonstantin Belousov } 275dd7d207dSJung-uk Kim break; 276dd7d207dSJung-uk Kim } 277dd7d207dSJung-uk Kim 278*ce3bf750SKonstantin Belousov if (!TUNABLE_INT_FETCH("machdep.disable_tsc_calibration", 279*ce3bf750SKonstantin Belousov &tsc_skip_calibration)) { 280*ce3bf750SKonstantin Belousov /* 281*ce3bf750SKonstantin Belousov * User did not give the order about calibration. 282*ce3bf750SKonstantin Belousov * If he did, we do not try to guess. 283*ce3bf750SKonstantin Belousov * 284*ce3bf750SKonstantin Belousov * Otherwise, if ACPI FADT reports that the platform 285*ce3bf750SKonstantin Belousov * is legacy-free and CPUID provides TSC frequency, 286*ce3bf750SKonstantin Belousov * use it. The calibration could fail anyway since 287*ce3bf750SKonstantin Belousov * ISA timer can be absent or power gated. 288*ce3bf750SKonstantin Belousov */ 289*ce3bf750SKonstantin Belousov if (acpi_get_fadt_bootflags(&bootflags) && 290*ce3bf750SKonstantin Belousov (bootflags & ACPI_FADT_LEGACY_DEVICES) == 0 && 291*ce3bf750SKonstantin Belousov tsc_freq_cpuid()) { 292*ce3bf750SKonstantin Belousov printf("Skipping TSC calibration since no legacy " 293*ce3bf750SKonstantin Belousov "devices reported by FADT and CPUID works\n"); 294*ce3bf750SKonstantin Belousov tsc_skip_calibration = 1; 295*ce3bf750SKonstantin Belousov } 296*ce3bf750SKonstantin Belousov } 297a4e4127fSJung-uk Kim if (tsc_skip_calibration) { 298506a906cSKonstantin Belousov if (tsc_freq_cpuid()) 299506a906cSKonstantin Belousov ; 300506a906cSKonstantin Belousov else if (cpu_vendor_id == CPU_VENDOR_INTEL) 301a4e4127fSJung-uk Kim tsc_freq_intel(); 302506a906cSKonstantin Belousov } else { 303a4e4127fSJung-uk Kim if (bootverbose) 304a4e4127fSJung-uk Kim printf("Calibrating TSC clock ... "); 305a4e4127fSJung-uk Kim tsc1 = rdtsc(); 306a4e4127fSJung-uk Kim DELAY(1000000); 307a4e4127fSJung-uk Kim tsc2 = rdtsc(); 308a4e4127fSJung-uk Kim tsc_freq = tsc2 - tsc1; 309506a906cSKonstantin Belousov } 310a4e4127fSJung-uk Kim if (bootverbose) 311a4e4127fSJung-uk Kim printf("TSC clock: %ju Hz\n", (intmax_t)tsc_freq); 312a4e4127fSJung-uk Kim } 313a4e4127fSJung-uk Kim 314a4e4127fSJung-uk Kim void 315a4e4127fSJung-uk Kim init_TSC(void) 316a4e4127fSJung-uk Kim { 317a4e4127fSJung-uk Kim 318a4e4127fSJung-uk Kim if ((cpu_feature & CPUID_TSC) == 0 || tsc_disabled) 319a4e4127fSJung-uk Kim return; 320a4e4127fSJung-uk Kim 321fe760cfaSJohn Baldwin #ifdef __i386__ 322fe760cfaSJohn Baldwin /* The TSC is known to be broken on certain CPUs. */ 323fe760cfaSJohn Baldwin switch (cpu_vendor_id) { 324fe760cfaSJohn Baldwin case CPU_VENDOR_AMD: 325fe760cfaSJohn Baldwin switch (cpu_id & 0xFF0) { 326fe760cfaSJohn Baldwin case 0x500: 327fe760cfaSJohn Baldwin /* K5 Model 0 */ 328fe760cfaSJohn Baldwin return; 329fe760cfaSJohn Baldwin } 330fe760cfaSJohn Baldwin break; 331fe760cfaSJohn Baldwin case CPU_VENDOR_CENTAUR: 332fe760cfaSJohn Baldwin switch (cpu_id & 0xff0) { 333fe760cfaSJohn Baldwin case 0x540: 334fe760cfaSJohn Baldwin /* 335fe760cfaSJohn Baldwin * http://www.centtech.com/c6_data_sheet.pdf 336fe760cfaSJohn Baldwin * 337fe760cfaSJohn Baldwin * I-12 RDTSC may return incoherent values in EDX:EAX 338fe760cfaSJohn Baldwin * I-13 RDTSC hangs when certain event counters are used 339fe760cfaSJohn Baldwin */ 340fe760cfaSJohn Baldwin return; 341fe760cfaSJohn Baldwin } 342fe760cfaSJohn Baldwin break; 343fe760cfaSJohn Baldwin case CPU_VENDOR_NSC: 344fe760cfaSJohn Baldwin switch (cpu_id & 0xff0) { 345fe760cfaSJohn Baldwin case 0x540: 346fe760cfaSJohn Baldwin if ((cpu_id & CPUID_STEPPING) == 0) 347fe760cfaSJohn Baldwin return; 348fe760cfaSJohn Baldwin break; 349fe760cfaSJohn Baldwin } 350fe760cfaSJohn Baldwin break; 351fe760cfaSJohn Baldwin } 352fe760cfaSJohn Baldwin #endif 353fe760cfaSJohn Baldwin 354a4e4127fSJung-uk Kim probe_tsc_freq(); 355a4e4127fSJung-uk Kim 356dd7d207dSJung-uk Kim /* 357dd7d207dSJung-uk Kim * Inform CPU accounting about our boot-time clock rate. This will 358dd7d207dSJung-uk Kim * be updated if someone loads a cpufreq driver after boot that 359dd7d207dSJung-uk Kim * discovers a new max frequency. 360dd7d207dSJung-uk Kim */ 361a4e4127fSJung-uk Kim if (tsc_freq != 0) 3625ac44f72SJung-uk Kim set_cputicker(rdtsc, tsc_freq, !tsc_is_invariant); 363dd7d207dSJung-uk Kim 364dd7d207dSJung-uk Kim if (tsc_is_invariant) 365dd7d207dSJung-uk Kim return; 366dd7d207dSJung-uk Kim 367dd7d207dSJung-uk Kim /* Register to find out about changes in CPU frequency. */ 368dd7d207dSJung-uk Kim tsc_pre_tag = EVENTHANDLER_REGISTER(cpufreq_pre_change, 369dd7d207dSJung-uk Kim tsc_freq_changing, NULL, EVENTHANDLER_PRI_FIRST); 370dd7d207dSJung-uk Kim tsc_post_tag = EVENTHANDLER_REGISTER(cpufreq_post_change, 371dd7d207dSJung-uk Kim tsc_freq_changed, NULL, EVENTHANDLER_PRI_FIRST); 372dd7d207dSJung-uk Kim tsc_levels_tag = EVENTHANDLER_REGISTER(cpufreq_levels_changed, 373dd7d207dSJung-uk Kim tsc_levels_changed, NULL, EVENTHANDLER_PRI_ANY); 374dd7d207dSJung-uk Kim } 375dd7d207dSJung-uk Kim 37665e7d70bSJung-uk Kim #ifdef SMP 37765e7d70bSJung-uk Kim 378814124c3SKonstantin Belousov /* 379814124c3SKonstantin Belousov * RDTSC is not a serializing instruction, and does not drain 380814124c3SKonstantin Belousov * instruction stream, so we need to drain the stream before executing 381814124c3SKonstantin Belousov * it. It could be fixed by use of RDTSCP, except the instruction is 382814124c3SKonstantin Belousov * not available everywhere. 383814124c3SKonstantin Belousov * 384814124c3SKonstantin Belousov * Use CPUID for draining in the boot-time SMP constistency test. The 385814124c3SKonstantin Belousov * timecounters use MFENCE for AMD CPUs, and LFENCE for others (Intel 386814124c3SKonstantin Belousov * and VIA) when SSE2 is present, and nothing on older machines which 387814124c3SKonstantin Belousov * also do not issue RDTSC prematurely. There, testing for SSE2 and 388e1a18e46SKonstantin Belousov * vendor is too cumbersome, and we learn about TSC presence from CPUID. 389814124c3SKonstantin Belousov * 390814124c3SKonstantin Belousov * Do not use do_cpuid(), since we do not need CPUID results, which 391814124c3SKonstantin Belousov * have to be written into memory with do_cpuid(). 392814124c3SKonstantin Belousov */ 39365e7d70bSJung-uk Kim #define TSC_READ(x) \ 39465e7d70bSJung-uk Kim static void \ 39565e7d70bSJung-uk Kim tsc_read_##x(void *arg) \ 39665e7d70bSJung-uk Kim { \ 3977bfcb3bbSJim Harris uint64_t *tsc = arg; \ 39865e7d70bSJung-uk Kim u_int cpu = PCPU_GET(cpuid); \ 39965e7d70bSJung-uk Kim \ 400814124c3SKonstantin Belousov __asm __volatile("cpuid" : : : "eax", "ebx", "ecx", "edx"); \ 4017bfcb3bbSJim Harris tsc[cpu * 3 + x] = rdtsc(); \ 40265e7d70bSJung-uk Kim } 40365e7d70bSJung-uk Kim TSC_READ(0) 40465e7d70bSJung-uk Kim TSC_READ(1) 40565e7d70bSJung-uk Kim TSC_READ(2) 40665e7d70bSJung-uk Kim #undef TSC_READ 40765e7d70bSJung-uk Kim 40865e7d70bSJung-uk Kim #define N 1000 40965e7d70bSJung-uk Kim 41065e7d70bSJung-uk Kim static void 41165e7d70bSJung-uk Kim comp_smp_tsc(void *arg) 41265e7d70bSJung-uk Kim { 4137bfcb3bbSJim Harris uint64_t *tsc; 4147bfcb3bbSJim Harris int64_t d1, d2; 41565e7d70bSJung-uk Kim u_int cpu = PCPU_GET(cpuid); 41665e7d70bSJung-uk Kim u_int i, j, size; 41765e7d70bSJung-uk Kim 41865e7d70bSJung-uk Kim size = (mp_maxid + 1) * 3; 41965e7d70bSJung-uk Kim for (i = 0, tsc = arg; i < N; i++, tsc += size) 42065e7d70bSJung-uk Kim CPU_FOREACH(j) { 42165e7d70bSJung-uk Kim if (j == cpu) 42265e7d70bSJung-uk Kim continue; 42365e7d70bSJung-uk Kim d1 = tsc[cpu * 3 + 1] - tsc[j * 3]; 42465e7d70bSJung-uk Kim d2 = tsc[cpu * 3 + 2] - tsc[j * 3 + 1]; 42565e7d70bSJung-uk Kim if (d1 <= 0 || d2 <= 0) { 42665e7d70bSJung-uk Kim smp_tsc = 0; 42765e7d70bSJung-uk Kim return; 42865e7d70bSJung-uk Kim } 42965e7d70bSJung-uk Kim } 43065e7d70bSJung-uk Kim } 43165e7d70bSJung-uk Kim 432b2c63698SAlexander Motin static void 433b2c63698SAlexander Motin adj_smp_tsc(void *arg) 434b2c63698SAlexander Motin { 435b2c63698SAlexander Motin uint64_t *tsc; 436b2c63698SAlexander Motin int64_t d, min, max; 437b2c63698SAlexander Motin u_int cpu = PCPU_GET(cpuid); 438b2c63698SAlexander Motin u_int first, i, size; 439b2c63698SAlexander Motin 440b2c63698SAlexander Motin first = CPU_FIRST(); 441b2c63698SAlexander Motin if (cpu == first) 442b2c63698SAlexander Motin return; 443b2c63698SAlexander Motin min = INT64_MIN; 444b2c63698SAlexander Motin max = INT64_MAX; 445b2c63698SAlexander Motin size = (mp_maxid + 1) * 3; 446b2c63698SAlexander Motin for (i = 0, tsc = arg; i < N; i++, tsc += size) { 447b2c63698SAlexander Motin d = tsc[first * 3] - tsc[cpu * 3 + 1]; 448b2c63698SAlexander Motin if (d > min) 449b2c63698SAlexander Motin min = d; 450b2c63698SAlexander Motin d = tsc[first * 3 + 1] - tsc[cpu * 3 + 2]; 451b2c63698SAlexander Motin if (d > min) 452b2c63698SAlexander Motin min = d; 453b2c63698SAlexander Motin d = tsc[first * 3 + 1] - tsc[cpu * 3]; 454b2c63698SAlexander Motin if (d < max) 455b2c63698SAlexander Motin max = d; 456b2c63698SAlexander Motin d = tsc[first * 3 + 2] - tsc[cpu * 3 + 1]; 457b2c63698SAlexander Motin if (d < max) 458b2c63698SAlexander Motin max = d; 459b2c63698SAlexander Motin } 460b2c63698SAlexander Motin if (min > max) 461b2c63698SAlexander Motin return; 462b2c63698SAlexander Motin d = min / 2 + max / 2; 463b2c63698SAlexander Motin __asm __volatile ( 464b2c63698SAlexander Motin "movl $0x10, %%ecx\n\t" 465b2c63698SAlexander Motin "rdmsr\n\t" 466b2c63698SAlexander Motin "addl %%edi, %%eax\n\t" 467b2c63698SAlexander Motin "adcl %%esi, %%edx\n\t" 468b2c63698SAlexander Motin "wrmsr\n" 469b2c63698SAlexander Motin : /* No output */ 470b2c63698SAlexander Motin : "D" ((uint32_t)d), "S" ((uint32_t)(d >> 32)) 471b2c63698SAlexander Motin : "ax", "cx", "dx", "cc" 472b2c63698SAlexander Motin ); 473b2c63698SAlexander Motin } 474b2c63698SAlexander Motin 47565e7d70bSJung-uk Kim static int 476279be68bSAndriy Gapon test_tsc(int adj_max_count) 47765e7d70bSJung-uk Kim { 4787bfcb3bbSJim Harris uint64_t *data, *tsc; 479b2c63698SAlexander Motin u_int i, size, adj; 48065e7d70bSJung-uk Kim 481e7f1427dSKonstantin Belousov if ((!smp_tsc && !tsc_is_invariant) || vm_guest) 48265e7d70bSJung-uk Kim return (-100); 48365e7d70bSJung-uk Kim size = (mp_maxid + 1) * 3; 48465e7d70bSJung-uk Kim data = malloc(sizeof(*data) * size * N, M_TEMP, M_WAITOK); 485b2c63698SAlexander Motin adj = 0; 486b2c63698SAlexander Motin retry: 48765e7d70bSJung-uk Kim for (i = 0, tsc = data; i < N; i++, tsc += size) 48865e7d70bSJung-uk Kim smp_rendezvous(tsc_read_0, tsc_read_1, tsc_read_2, tsc); 48965e7d70bSJung-uk Kim smp_tsc = 1; /* XXX */ 49067d955aaSPatrick Kelsey smp_rendezvous(smp_no_rendezvous_barrier, comp_smp_tsc, 49167d955aaSPatrick Kelsey smp_no_rendezvous_barrier, data); 492279be68bSAndriy Gapon if (!smp_tsc && adj < adj_max_count) { 493b2c63698SAlexander Motin adj++; 49467d955aaSPatrick Kelsey smp_rendezvous(smp_no_rendezvous_barrier, adj_smp_tsc, 49567d955aaSPatrick Kelsey smp_no_rendezvous_barrier, data); 496b2c63698SAlexander Motin goto retry; 497b2c63698SAlexander Motin } 49865e7d70bSJung-uk Kim free(data, M_TEMP); 49965e7d70bSJung-uk Kim if (bootverbose) 500b2c63698SAlexander Motin printf("SMP: %sed TSC synchronization test%s\n", 501b2c63698SAlexander Motin smp_tsc ? "pass" : "fail", 502b2c63698SAlexander Motin adj > 0 ? " after adjustment" : ""); 50326e6537aSJung-uk Kim if (smp_tsc && tsc_is_invariant) { 50426e6537aSJung-uk Kim switch (cpu_vendor_id) { 50526e6537aSJung-uk Kim case CPU_VENDOR_AMD: 50626e6537aSJung-uk Kim /* 50726e6537aSJung-uk Kim * Starting with Family 15h processors, TSC clock 50826e6537aSJung-uk Kim * source is in the north bridge. Check whether 50926e6537aSJung-uk Kim * we have a single-socket/multi-core platform. 51026e6537aSJung-uk Kim * XXX Need more work for complex cases. 51126e6537aSJung-uk Kim */ 51226e6537aSJung-uk Kim if (CPUID_TO_FAMILY(cpu_id) < 0x15 || 51326e6537aSJung-uk Kim (amd_feature2 & AMDID2_CMP) == 0 || 51426e6537aSJung-uk Kim smp_cpus > (cpu_procinfo2 & AMDID_CMP_CORES) + 1) 51526e6537aSJung-uk Kim break; 51626e6537aSJung-uk Kim return (1000); 51726e6537aSJung-uk Kim case CPU_VENDOR_INTEL: 51826e6537aSJung-uk Kim /* 51926e6537aSJung-uk Kim * XXX Assume Intel platforms have synchronized TSCs. 52026e6537aSJung-uk Kim */ 52126e6537aSJung-uk Kim return (1000); 52226e6537aSJung-uk Kim } 52326e6537aSJung-uk Kim return (800); 52426e6537aSJung-uk Kim } 52526e6537aSJung-uk Kim return (-100); 52665e7d70bSJung-uk Kim } 52765e7d70bSJung-uk Kim 52865e7d70bSJung-uk Kim #undef N 52965e7d70bSJung-uk Kim 53065e7d70bSJung-uk Kim #endif /* SMP */ 53165e7d70bSJung-uk Kim 53265e7d70bSJung-uk Kim static void 533dd7d207dSJung-uk Kim init_TSC_tc(void) 534dd7d207dSJung-uk Kim { 53595f2f098SJung-uk Kim uint64_t max_freq; 53695f2f098SJung-uk Kim int shift; 537dd7d207dSJung-uk Kim 53838b8542cSJung-uk Kim if ((cpu_feature & CPUID_TSC) == 0 || tsc_disabled) 539dd7d207dSJung-uk Kim return; 540dd7d207dSJung-uk Kim 541dd7d207dSJung-uk Kim /* 54295f2f098SJung-uk Kim * Limit timecounter frequency to fit in an int and prevent it from 54395f2f098SJung-uk Kim * overflowing too fast. 54495f2f098SJung-uk Kim */ 54595f2f098SJung-uk Kim max_freq = UINT_MAX; 54695f2f098SJung-uk Kim 54795f2f098SJung-uk Kim /* 548dd7d207dSJung-uk Kim * We can not use the TSC if we support APM. Precise timekeeping 549dd7d207dSJung-uk Kim * on an APM'ed machine is at best a fools pursuit, since 550dd7d207dSJung-uk Kim * any and all of the time spent in various SMM code can't 551dd7d207dSJung-uk Kim * be reliably accounted for. Reading the RTC is your only 552dd7d207dSJung-uk Kim * source of reliable time info. The i8254 loses too, of course, 553dd7d207dSJung-uk Kim * but we need to have some kind of time... 554dd7d207dSJung-uk Kim * We don't know at this point whether APM is going to be used 555dd7d207dSJung-uk Kim * or not, nor when it might be activated. Play it safe. 556dd7d207dSJung-uk Kim */ 557dd7d207dSJung-uk Kim if (power_pm_get_type() == POWER_PM_TYPE_APM) { 558dd7d207dSJung-uk Kim tsc_timecounter.tc_quality = -1000; 559dd7d207dSJung-uk Kim if (bootverbose) 560dd7d207dSJung-uk Kim printf("TSC timecounter disabled: APM enabled.\n"); 56165e7d70bSJung-uk Kim goto init; 562dd7d207dSJung-uk Kim } 563dd7d207dSJung-uk Kim 564a49399a9SJung-uk Kim /* 56592597e06SJohn Baldwin * Intel CPUs without a C-state invariant TSC can stop the TSC 566d1411416SJohn Baldwin * in either C2 or C3. Disable use of C2 and C3 while using 567d1411416SJohn Baldwin * the TSC as the timecounter. The timecounter can be changed 568d1411416SJohn Baldwin * to enable C2 and C3. 569d1411416SJohn Baldwin * 570d1411416SJohn Baldwin * Note that the TSC is used as the cputicker for computing 571d1411416SJohn Baldwin * thread runtime regardless of the timecounter setting, so 572d1411416SJohn Baldwin * using an alternate timecounter and enabling C2 or C3 can 573d1411416SJohn Baldwin * result incorrect runtimes for kernel idle threads (but not 574d1411416SJohn Baldwin * for any non-idle threads). 575a49399a9SJung-uk Kim */ 5768cd59625SKonstantin Belousov if (cpu_vendor_id == CPU_VENDOR_INTEL && 577a49399a9SJung-uk Kim (amd_pminfo & AMDPM_TSC_INVARIANT) == 0) { 57892597e06SJohn Baldwin tsc_timecounter.tc_flags |= TC_FLAGS_C2STOP; 579a49399a9SJung-uk Kim if (bootverbose) 580d1411416SJohn Baldwin printf("TSC timecounter disables C2 and C3.\n"); 581a49399a9SJung-uk Kim } 582a49399a9SJung-uk Kim 583dd7d207dSJung-uk Kim /* 584e7f1427dSKonstantin Belousov * We can not use the TSC in SMP mode unless the TSCs on all CPUs 585e7f1427dSKonstantin Belousov * are synchronized. If the user is sure that the system has 586e7f1427dSKonstantin Belousov * synchronized TSCs, set kern.timecounter.smp_tsc tunable to a 587e7f1427dSKonstantin Belousov * non-zero value. The TSC seems unreliable in virtualized SMP 5885cf8ac1bSMike Silbersack * environments, so it is set to a negative quality in those cases. 589dd7d207dSJung-uk Kim */ 590ba79ab82SAndriy Gapon #ifdef SMP 591e7f1427dSKonstantin Belousov if (mp_ncpus > 1) 592279be68bSAndriy Gapon tsc_timecounter.tc_quality = test_tsc(smp_tsc_adjust); 593ba79ab82SAndriy Gapon else 594ba79ab82SAndriy Gapon #endif /* SMP */ 595ba79ab82SAndriy Gapon if (tsc_is_invariant) 59626e6537aSJung-uk Kim tsc_timecounter.tc_quality = 1000; 597e7f1427dSKonstantin Belousov max_freq >>= tsc_shift; 59826e6537aSJung-uk Kim 59965e7d70bSJung-uk Kim init: 600e7f1427dSKonstantin Belousov for (shift = 0; shift <= 31 && (tsc_freq >> shift) > max_freq; shift++) 60195f2f098SJung-uk Kim ; 602e7f1427dSKonstantin Belousov if ((cpu_feature & CPUID_SSE2) != 0 && mp_ncpus > 1) { 603814124c3SKonstantin Belousov if (cpu_vendor_id == CPU_VENDOR_AMD) { 604e7f1427dSKonstantin Belousov tsc_timecounter.tc_get_timecount = shift > 0 ? 605e7f1427dSKonstantin Belousov tsc_get_timecount_low_mfence : 606e7f1427dSKonstantin Belousov tsc_get_timecount_mfence; 607814124c3SKonstantin Belousov } else { 608e7f1427dSKonstantin Belousov tsc_timecounter.tc_get_timecount = shift > 0 ? 609e7f1427dSKonstantin Belousov tsc_get_timecount_low_lfence : 610e7f1427dSKonstantin Belousov tsc_get_timecount_lfence; 611814124c3SKonstantin Belousov } 612e7f1427dSKonstantin Belousov } else { 613e7f1427dSKonstantin Belousov tsc_timecounter.tc_get_timecount = shift > 0 ? 614e7f1427dSKonstantin Belousov tsc_get_timecount_low : tsc_get_timecount; 615e7f1427dSKonstantin Belousov } 616e7f1427dSKonstantin Belousov if (shift > 0) { 61795f2f098SJung-uk Kim tsc_timecounter.tc_name = "TSC-low"; 61895f2f098SJung-uk Kim if (bootverbose) 619bc8e4ad2SJung-uk Kim printf("TSC timecounter discards lower %d bit(s)\n", 62095f2f098SJung-uk Kim shift); 62195f2f098SJung-uk Kim } 622bc34c87eSJung-uk Kim if (tsc_freq != 0) { 62395f2f098SJung-uk Kim tsc_timecounter.tc_frequency = tsc_freq >> shift; 62495f2f098SJung-uk Kim tsc_timecounter.tc_priv = (void *)(intptr_t)shift; 625dd7d207dSJung-uk Kim tc_init(&tsc_timecounter); 626dd7d207dSJung-uk Kim } 627dd7d207dSJung-uk Kim } 62865e7d70bSJung-uk Kim SYSINIT(tsc_tc, SI_SUB_SMP, SI_ORDER_ANY, init_TSC_tc, NULL); 629dd7d207dSJung-uk Kim 630279be68bSAndriy Gapon void 631279be68bSAndriy Gapon resume_TSC(void) 632279be68bSAndriy Gapon { 633ba79ab82SAndriy Gapon #ifdef SMP 634279be68bSAndriy Gapon int quality; 635279be68bSAndriy Gapon 636279be68bSAndriy Gapon /* If TSC was not good on boot, it is unlikely to become good now. */ 637279be68bSAndriy Gapon if (tsc_timecounter.tc_quality < 0) 638279be68bSAndriy Gapon return; 639279be68bSAndriy Gapon /* Nothing to do with UP. */ 640279be68bSAndriy Gapon if (mp_ncpus < 2) 641279be68bSAndriy Gapon return; 642279be68bSAndriy Gapon 643279be68bSAndriy Gapon /* 644279be68bSAndriy Gapon * If TSC was good, a single synchronization should be enough, 645279be68bSAndriy Gapon * but honour smp_tsc_adjust if it's set. 646279be68bSAndriy Gapon */ 647279be68bSAndriy Gapon quality = test_tsc(MAX(smp_tsc_adjust, 1)); 648279be68bSAndriy Gapon if (quality != tsc_timecounter.tc_quality) { 649279be68bSAndriy Gapon printf("TSC timecounter quality changed: %d -> %d\n", 650279be68bSAndriy Gapon tsc_timecounter.tc_quality, quality); 651279be68bSAndriy Gapon tsc_timecounter.tc_quality = quality; 652279be68bSAndriy Gapon } 653ba79ab82SAndriy Gapon #endif /* SMP */ 654279be68bSAndriy Gapon } 655279be68bSAndriy Gapon 656dd7d207dSJung-uk Kim /* 657dd7d207dSJung-uk Kim * When cpufreq levels change, find out about the (new) max frequency. We 658dd7d207dSJung-uk Kim * use this to update CPU accounting in case it got a lower estimate at boot. 659dd7d207dSJung-uk Kim */ 660dd7d207dSJung-uk Kim static void 661dd7d207dSJung-uk Kim tsc_levels_changed(void *arg, int unit) 662dd7d207dSJung-uk Kim { 663dd7d207dSJung-uk Kim device_t cf_dev; 664dd7d207dSJung-uk Kim struct cf_level *levels; 665dd7d207dSJung-uk Kim int count, error; 666dd7d207dSJung-uk Kim uint64_t max_freq; 667dd7d207dSJung-uk Kim 668dd7d207dSJung-uk Kim /* Only use values from the first CPU, assuming all are equal. */ 669dd7d207dSJung-uk Kim if (unit != 0) 670dd7d207dSJung-uk Kim return; 671dd7d207dSJung-uk Kim 672dd7d207dSJung-uk Kim /* Find the appropriate cpufreq device instance. */ 673dd7d207dSJung-uk Kim cf_dev = devclass_get_device(devclass_find("cpufreq"), unit); 674dd7d207dSJung-uk Kim if (cf_dev == NULL) { 675dd7d207dSJung-uk Kim printf("tsc_levels_changed() called but no cpufreq device?\n"); 676dd7d207dSJung-uk Kim return; 677dd7d207dSJung-uk Kim } 678dd7d207dSJung-uk Kim 679dd7d207dSJung-uk Kim /* Get settings from the device and find the max frequency. */ 680dd7d207dSJung-uk Kim count = 64; 681dd7d207dSJung-uk Kim levels = malloc(count * sizeof(*levels), M_TEMP, M_NOWAIT); 682dd7d207dSJung-uk Kim if (levels == NULL) 683dd7d207dSJung-uk Kim return; 684dd7d207dSJung-uk Kim error = CPUFREQ_LEVELS(cf_dev, levels, &count); 685dd7d207dSJung-uk Kim if (error == 0 && count != 0) { 686dd7d207dSJung-uk Kim max_freq = (uint64_t)levels[0].total_set.freq * 1000000; 687dd7d207dSJung-uk Kim set_cputicker(rdtsc, max_freq, 1); 688dd7d207dSJung-uk Kim } else 689dd7d207dSJung-uk Kim printf("tsc_levels_changed: no max freq found\n"); 690dd7d207dSJung-uk Kim free(levels, M_TEMP); 691dd7d207dSJung-uk Kim } 692dd7d207dSJung-uk Kim 693dd7d207dSJung-uk Kim /* 694dd7d207dSJung-uk Kim * If the TSC timecounter is in use, veto the pending change. It may be 695dd7d207dSJung-uk Kim * possible in the future to handle a dynamically-changing timecounter rate. 696dd7d207dSJung-uk Kim */ 697dd7d207dSJung-uk Kim static void 698dd7d207dSJung-uk Kim tsc_freq_changing(void *arg, const struct cf_level *level, int *status) 699dd7d207dSJung-uk Kim { 700dd7d207dSJung-uk Kim 701dd7d207dSJung-uk Kim if (*status != 0 || timecounter != &tsc_timecounter) 702dd7d207dSJung-uk Kim return; 703dd7d207dSJung-uk Kim 704dd7d207dSJung-uk Kim printf("timecounter TSC must not be in use when " 705dd7d207dSJung-uk Kim "changing frequencies; change denied\n"); 706dd7d207dSJung-uk Kim *status = EBUSY; 707dd7d207dSJung-uk Kim } 708dd7d207dSJung-uk Kim 709dd7d207dSJung-uk Kim /* Update TSC freq with the value indicated by the caller. */ 710dd7d207dSJung-uk Kim static void 711dd7d207dSJung-uk Kim tsc_freq_changed(void *arg, const struct cf_level *level, int status) 712dd7d207dSJung-uk Kim { 7133453537fSJung-uk Kim uint64_t freq; 714dd7d207dSJung-uk Kim 715dd7d207dSJung-uk Kim /* If there was an error during the transition, don't do anything. */ 71679422085SJung-uk Kim if (tsc_disabled || status != 0) 717dd7d207dSJung-uk Kim return; 718dd7d207dSJung-uk Kim 719dd7d207dSJung-uk Kim /* Total setting for this level gives the new frequency in MHz. */ 7203453537fSJung-uk Kim freq = (uint64_t)level->total_set.freq * 1000000; 7213453537fSJung-uk Kim atomic_store_rel_64(&tsc_freq, freq); 72295f2f098SJung-uk Kim tsc_timecounter.tc_frequency = 72395f2f098SJung-uk Kim freq >> (int)(intptr_t)tsc_timecounter.tc_priv; 724dd7d207dSJung-uk Kim } 725dd7d207dSJung-uk Kim 726dd7d207dSJung-uk Kim static int 727dd7d207dSJung-uk Kim sysctl_machdep_tsc_freq(SYSCTL_HANDLER_ARGS) 728dd7d207dSJung-uk Kim { 729dd7d207dSJung-uk Kim int error; 730dd7d207dSJung-uk Kim uint64_t freq; 731dd7d207dSJung-uk Kim 7323453537fSJung-uk Kim freq = atomic_load_acq_64(&tsc_freq); 7333453537fSJung-uk Kim if (freq == 0) 734dd7d207dSJung-uk Kim return (EOPNOTSUPP); 735cbc134adSMatthew D Fleming error = sysctl_handle_64(oidp, &freq, 0, req); 7367ebbcb21SJung-uk Kim if (error == 0 && req->newptr != NULL) { 7373453537fSJung-uk Kim atomic_store_rel_64(&tsc_freq, freq); 738bc8e4ad2SJung-uk Kim atomic_store_rel_64(&tsc_timecounter.tc_frequency, 739bc8e4ad2SJung-uk Kim freq >> (int)(intptr_t)tsc_timecounter.tc_priv); 7407ebbcb21SJung-uk Kim } 741dd7d207dSJung-uk Kim return (error); 742dd7d207dSJung-uk Kim } 743dd7d207dSJung-uk Kim 744cbc134adSMatthew D Fleming SYSCTL_PROC(_machdep, OID_AUTO, tsc_freq, CTLTYPE_U64 | CTLFLAG_RW, 7455331d61dSJung-uk Kim 0, 0, sysctl_machdep_tsc_freq, "QU", "Time Stamp Counter frequency"); 746dd7d207dSJung-uk Kim 747727c7b2dSJung-uk Kim static u_int 74895f2f098SJung-uk Kim tsc_get_timecount(struct timecounter *tc __unused) 749dd7d207dSJung-uk Kim { 750727c7b2dSJung-uk Kim 751727c7b2dSJung-uk Kim return (rdtsc32()); 752dd7d207dSJung-uk Kim } 75395f2f098SJung-uk Kim 754814124c3SKonstantin Belousov static inline u_int 755bc8e4ad2SJung-uk Kim tsc_get_timecount_low(struct timecounter *tc) 75695f2f098SJung-uk Kim { 7575df88f46SJung-uk Kim uint32_t rv; 75895f2f098SJung-uk Kim 7595df88f46SJung-uk Kim __asm __volatile("rdtsc; shrd %%cl, %%edx, %0" 7605df88f46SJung-uk Kim : "=a" (rv) : "c" ((int)(intptr_t)tc->tc_priv) : "edx"); 7615df88f46SJung-uk Kim return (rv); 76295f2f098SJung-uk Kim } 763aea81038SKonstantin Belousov 764814124c3SKonstantin Belousov static u_int 765814124c3SKonstantin Belousov tsc_get_timecount_lfence(struct timecounter *tc __unused) 766814124c3SKonstantin Belousov { 767814124c3SKonstantin Belousov 768814124c3SKonstantin Belousov lfence(); 769814124c3SKonstantin Belousov return (rdtsc32()); 770814124c3SKonstantin Belousov } 771814124c3SKonstantin Belousov 772814124c3SKonstantin Belousov static u_int 773814124c3SKonstantin Belousov tsc_get_timecount_low_lfence(struct timecounter *tc) 774814124c3SKonstantin Belousov { 775814124c3SKonstantin Belousov 776814124c3SKonstantin Belousov lfence(); 777814124c3SKonstantin Belousov return (tsc_get_timecount_low(tc)); 778814124c3SKonstantin Belousov } 779814124c3SKonstantin Belousov 780814124c3SKonstantin Belousov static u_int 781814124c3SKonstantin Belousov tsc_get_timecount_mfence(struct timecounter *tc __unused) 782814124c3SKonstantin Belousov { 783814124c3SKonstantin Belousov 784814124c3SKonstantin Belousov mfence(); 785814124c3SKonstantin Belousov return (rdtsc32()); 786814124c3SKonstantin Belousov } 787814124c3SKonstantin Belousov 788814124c3SKonstantin Belousov static u_int 789814124c3SKonstantin Belousov tsc_get_timecount_low_mfence(struct timecounter *tc) 790814124c3SKonstantin Belousov { 791814124c3SKonstantin Belousov 792814124c3SKonstantin Belousov mfence(); 793814124c3SKonstantin Belousov return (tsc_get_timecount_low(tc)); 794814124c3SKonstantin Belousov } 795814124c3SKonstantin Belousov 79616808549SKonstantin Belousov static uint32_t 79716808549SKonstantin Belousov x86_tsc_vdso_timehands(struct vdso_timehands *vdso_th, struct timecounter *tc) 798aea81038SKonstantin Belousov { 799aea81038SKonstantin Belousov 80016808549SKonstantin Belousov vdso_th->th_algo = VDSO_TH_ALGO_X86_TSC; 801d1b1b600SNeel Natu vdso_th->th_x86_shift = (int)(intptr_t)tc->tc_priv; 80216808549SKonstantin Belousov vdso_th->th_x86_hpet_idx = 0xffffffff; 803aea81038SKonstantin Belousov bzero(vdso_th->th_res, sizeof(vdso_th->th_res)); 80416808549SKonstantin Belousov return (1); 805aea81038SKonstantin Belousov } 806aea81038SKonstantin Belousov 807aea81038SKonstantin Belousov #ifdef COMPAT_FREEBSD32 80816808549SKonstantin Belousov static uint32_t 80916808549SKonstantin Belousov x86_tsc_vdso_timehands32(struct vdso_timehands32 *vdso_th32, 810d1b1b600SNeel Natu struct timecounter *tc) 811aea81038SKonstantin Belousov { 812aea81038SKonstantin Belousov 81316808549SKonstantin Belousov vdso_th32->th_algo = VDSO_TH_ALGO_X86_TSC; 814d1b1b600SNeel Natu vdso_th32->th_x86_shift = (int)(intptr_t)tc->tc_priv; 81516808549SKonstantin Belousov vdso_th32->th_x86_hpet_idx = 0xffffffff; 816aea81038SKonstantin Belousov bzero(vdso_th32->th_res, sizeof(vdso_th32->th_res)); 81716808549SKonstantin Belousov return (1); 818aea81038SKonstantin Belousov } 819aea81038SKonstantin Belousov #endif 820