xref: /freebsd/sys/dev/coretemp/coretemp.c (revision fdafd315ad0d0f28a11b9fb4476a9ab059c62b92)
183d18f22SDag-Erling Smørgrav /*-
2*4d846d26SWarner Losh  * SPDX-License-Identifier: BSD-2-Clause
3718cf2ccSPedro F. Giffuni  *
43684e5b0SRui Paulo  * Copyright (c) 2007, 2008 Rui Paulo <rpaulo@FreeBSD.org>
583d18f22SDag-Erling Smørgrav  * All rights reserved.
683d18f22SDag-Erling Smørgrav  *
783d18f22SDag-Erling Smørgrav  * Redistribution and use in source and binary forms, with or without
883d18f22SDag-Erling Smørgrav  * modification, are permitted provided that the following conditions
983d18f22SDag-Erling Smørgrav  * are met:
1083d18f22SDag-Erling Smørgrav  * 1. Redistributions of source code must retain the above copyright
1183d18f22SDag-Erling Smørgrav  *    notice, this list of conditions and the following disclaimer.
1283d18f22SDag-Erling Smørgrav  * 2. Redistributions in binary form must reproduce the above copyright
1383d18f22SDag-Erling Smørgrav  *    notice, this list of conditions and the following disclaimer in the
1483d18f22SDag-Erling Smørgrav  *    documentation and/or other materials provided with the distribution.
1583d18f22SDag-Erling Smørgrav  *
1683d18f22SDag-Erling Smørgrav  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
1783d18f22SDag-Erling Smørgrav  * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
1883d18f22SDag-Erling Smørgrav  * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
1983d18f22SDag-Erling Smørgrav  * DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT,
2083d18f22SDag-Erling Smørgrav  * INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
2183d18f22SDag-Erling Smørgrav  * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
2283d18f22SDag-Erling Smørgrav  * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
2383d18f22SDag-Erling Smørgrav  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT,
2483d18f22SDag-Erling Smørgrav  * STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN
2583d18f22SDag-Erling Smørgrav  * ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
2683d18f22SDag-Erling Smørgrav  * POSSIBILITY OF SUCH DAMAGE.
2783d18f22SDag-Erling Smørgrav  */
2883d18f22SDag-Erling Smørgrav 
2983d18f22SDag-Erling Smørgrav /*
3083d18f22SDag-Erling Smørgrav  * Device driver for Intel's On Die thermal sensor via MSR.
3183d18f22SDag-Erling Smørgrav  * First introduced in Intel's Core line of processors.
3283d18f22SDag-Erling Smørgrav  */
3383d18f22SDag-Erling Smørgrav 
3483d18f22SDag-Erling Smørgrav #include <sys/param.h>
3583d18f22SDag-Erling Smørgrav #include <sys/bus.h>
3683d18f22SDag-Erling Smørgrav #include <sys/conf.h>
3783d18f22SDag-Erling Smørgrav #include <sys/kernel.h>
38e2e050c8SConrad Meyer #include <sys/lock.h>
39e2e050c8SConrad Meyer #include <sys/module.h>
40e2e050c8SConrad Meyer #include <sys/mutex.h>
4183d18f22SDag-Erling Smørgrav #include <sys/proc.h>	/* for curthread */
4274f80bc1SAlexander Motin #include <sys/smp.h>
43e2e050c8SConrad Meyer #include <sys/sysctl.h>
44e2e050c8SConrad Meyer #include <sys/systm.h>
4583d18f22SDag-Erling Smørgrav 
4683d18f22SDag-Erling Smørgrav #include <machine/specialreg.h>
4783d18f22SDag-Erling Smørgrav #include <machine/cpufunc.h>
485113aa0aSJung-uk Kim #include <machine/cputypes.h>
4983d18f22SDag-Erling Smørgrav #include <machine/md_var.h>
5083d18f22SDag-Erling Smørgrav 
519d6672e1SLuiz Otavio O Souza #define	TZ_ZEROC			2731
523705c384SNorikatsu Shigemura 
538362905cSsadaszewski #define	THERM_CRITICAL_STATUS_LOG       0x20
548362905cSsadaszewski #define	THERM_CRITICAL_STATUS           0x10
55d1f97f76SXin LI #define	THERM_STATUS_LOG		0x02
56d1f97f76SXin LI #define	THERM_STATUS			0x01
57d1f97f76SXin LI #define	THERM_STATUS_TEMP_SHIFT		16
58d1f97f76SXin LI #define	THERM_STATUS_TEMP_MASK		0x7f
59d1f97f76SXin LI #define	THERM_STATUS_RES_SHIFT		27
60d1f97f76SXin LI #define	THERM_STATUS_RES_MASK		0x0f
61d1f97f76SXin LI #define	THERM_STATUS_VALID_SHIFT	31
62d1f97f76SXin LI #define	THERM_STATUS_VALID_MASK		0x01
63d1f97f76SXin LI 
6483d18f22SDag-Erling Smørgrav struct coretemp_softc {
6583d18f22SDag-Erling Smørgrav 	device_t	sc_dev;
6683d18f22SDag-Erling Smørgrav 	int		sc_tjmax;
67d1f97f76SXin LI 	unsigned int	sc_throttle_log;
6883d18f22SDag-Erling Smørgrav };
6983d18f22SDag-Erling Smørgrav 
7083d18f22SDag-Erling Smørgrav /*
7183d18f22SDag-Erling Smørgrav  * Device methods.
7283d18f22SDag-Erling Smørgrav  */
7383d18f22SDag-Erling Smørgrav static void	coretemp_identify(driver_t *driver, device_t parent);
7483d18f22SDag-Erling Smørgrav static int	coretemp_probe(device_t dev);
7583d18f22SDag-Erling Smørgrav static int	coretemp_attach(device_t dev);
7683d18f22SDag-Erling Smørgrav static int	coretemp_detach(device_t dev);
7783d18f22SDag-Erling Smørgrav 
78d1f97f76SXin LI static uint64_t	coretemp_get_thermal_msr(int cpu);
79d1f97f76SXin LI static void	coretemp_clear_thermal_msr(int cpu);
80d1f97f76SXin LI static int	coretemp_get_val_sysctl(SYSCTL_HANDLER_ARGS);
81d1f97f76SXin LI static int	coretemp_throttle_log_sysctl(SYSCTL_HANDLER_ARGS);
8283d18f22SDag-Erling Smørgrav 
8383d18f22SDag-Erling Smørgrav static device_method_t coretemp_methods[] = {
8483d18f22SDag-Erling Smørgrav 	/* Device interface */
8583d18f22SDag-Erling Smørgrav 	DEVMETHOD(device_identify,	coretemp_identify),
8683d18f22SDag-Erling Smørgrav 	DEVMETHOD(device_probe,		coretemp_probe),
8783d18f22SDag-Erling Smørgrav 	DEVMETHOD(device_attach,	coretemp_attach),
8883d18f22SDag-Erling Smørgrav 	DEVMETHOD(device_detach,	coretemp_detach),
8983d18f22SDag-Erling Smørgrav 
9061bfd867SSofian Brabez 	DEVMETHOD_END
9183d18f22SDag-Erling Smørgrav };
9283d18f22SDag-Erling Smørgrav 
9383d18f22SDag-Erling Smørgrav static driver_t coretemp_driver = {
9483d18f22SDag-Erling Smørgrav 	"coretemp",
9583d18f22SDag-Erling Smørgrav 	coretemp_methods,
9683d18f22SDag-Erling Smørgrav 	sizeof(struct coretemp_softc),
9783d18f22SDag-Erling Smørgrav };
9883d18f22SDag-Erling Smørgrav 
99d1f97f76SXin LI enum therm_info {
100d1f97f76SXin LI 	CORETEMP_TEMP,
101d1f97f76SXin LI 	CORETEMP_DELTA,
102d1f97f76SXin LI 	CORETEMP_RESOLUTION,
103d1f97f76SXin LI 	CORETEMP_TJMAX,
104d1f97f76SXin LI };
105d1f97f76SXin LI 
106b3ed7cc5SJohn Baldwin DRIVER_MODULE(coretemp, cpu, coretemp_driver, NULL, NULL);
10783d18f22SDag-Erling Smørgrav 
10883d18f22SDag-Erling Smørgrav static void
coretemp_identify(driver_t * driver,device_t parent)10983d18f22SDag-Erling Smørgrav coretemp_identify(driver_t *driver, device_t parent)
11083d18f22SDag-Erling Smørgrav {
11183d18f22SDag-Erling Smørgrav 	device_t child;
11283d18f22SDag-Erling Smørgrav 	u_int regs[4];
11383d18f22SDag-Erling Smørgrav 
11483d18f22SDag-Erling Smørgrav 	/* Make sure we're not being doubly invoked. */
11583d18f22SDag-Erling Smørgrav 	if (device_find_child(parent, "coretemp", -1) != NULL)
11683d18f22SDag-Erling Smørgrav 		return;
11783d18f22SDag-Erling Smørgrav 
1183684e5b0SRui Paulo 	/* Check that CPUID 0x06 is supported and the vendor is Intel.*/
1195113aa0aSJung-uk Kim 	if (cpu_high < 6 || cpu_vendor_id != CPU_VENDOR_INTEL)
12083d18f22SDag-Erling Smørgrav 		return;
12183d18f22SDag-Erling Smørgrav 	/*
12283d18f22SDag-Erling Smørgrav 	 * CPUID 0x06 returns 1 if the processor has on-die thermal
12383d18f22SDag-Erling Smørgrav 	 * sensors. EBX[0:3] contains the number of sensors.
12483d18f22SDag-Erling Smørgrav 	 */
12583d18f22SDag-Erling Smørgrav 	do_cpuid(0x06, regs);
12683d18f22SDag-Erling Smørgrav 	if ((regs[0] & 0x1) != 1)
12783d18f22SDag-Erling Smørgrav 		return;
12883d18f22SDag-Erling Smørgrav 
12983d18f22SDag-Erling Smørgrav 	/*
13083d18f22SDag-Erling Smørgrav 	 * We add a child for each CPU since settings must be performed
13183d18f22SDag-Erling Smørgrav 	 * on each CPU in the SMP case.
13283d18f22SDag-Erling Smørgrav 	 */
133d3a8f98aSAlexander Motin 	child = device_add_child(parent, "coretemp", device_get_unit(parent));
13483d18f22SDag-Erling Smørgrav 	if (child == NULL)
13583d18f22SDag-Erling Smørgrav 		device_printf(parent, "add coretemp child failed\n");
13683d18f22SDag-Erling Smørgrav }
13783d18f22SDag-Erling Smørgrav 
13883d18f22SDag-Erling Smørgrav static int
coretemp_probe(device_t dev)13983d18f22SDag-Erling Smørgrav coretemp_probe(device_t dev)
14083d18f22SDag-Erling Smørgrav {
141a8de37b0SEitan Adler 	if (resource_disabled("coretemp", 0))
142a8de37b0SEitan Adler 		return (ENXIO);
14383d18f22SDag-Erling Smørgrav 
14483d18f22SDag-Erling Smørgrav 	device_set_desc(dev, "CPU On-Die Thermal Sensors");
14583d18f22SDag-Erling Smørgrav 
1462e3f84e5SMatt Macy 	if (!bootverbose && device_get_unit(dev) != 0)
1472e3f84e5SMatt Macy 		device_quiet(dev);
1482e3f84e5SMatt Macy 
14983d18f22SDag-Erling Smørgrav 	return (BUS_PROBE_GENERIC);
15083d18f22SDag-Erling Smørgrav }
15183d18f22SDag-Erling Smørgrav 
15283d18f22SDag-Erling Smørgrav static int
coretemp_attach(device_t dev)15383d18f22SDag-Erling Smørgrav coretemp_attach(device_t dev)
15483d18f22SDag-Erling Smørgrav {
15583d18f22SDag-Erling Smørgrav 	struct coretemp_softc *sc = device_get_softc(dev);
15683d18f22SDag-Erling Smørgrav 	device_t pdev;
15783d18f22SDag-Erling Smørgrav 	uint64_t msr;
158a3bc0a4eSXin LI 	int cpu_model, cpu_stepping;
159a3bc0a4eSXin LI 	int ret, tjtarget;
160d1f97f76SXin LI 	struct sysctl_oid *oid;
161d1f97f76SXin LI 	struct sysctl_ctx_list *ctx;
16283d18f22SDag-Erling Smørgrav 
1635afb221cSDag-Erling Smørgrav 	sc->sc_dev = dev;
16483d18f22SDag-Erling Smørgrav 	pdev = device_get_parent(dev);
165a3bc0a4eSXin LI 	cpu_model = CPUID_TO_MODEL(cpu_id);
166ef013ceeSRyan Moeller 	cpu_stepping = CPUID_TO_STEPPING(cpu_id);
16783d18f22SDag-Erling Smørgrav 
16818d69021SRui Paulo 	/*
16918d69021SRui Paulo 	 * Some CPUs, namely the PIII, don't have thermal sensors, but
17018d69021SRui Paulo 	 * report them when the CPUID check is performed in
17118d69021SRui Paulo 	 * coretemp_identify(). This leads to a later GPF when the sensor
17218d69021SRui Paulo 	 * is queried via a MSR, so we stop here.
17318d69021SRui Paulo 	 */
17418d69021SRui Paulo 	if (cpu_model < 0xe)
17518d69021SRui Paulo 		return (ENXIO);
17618d69021SRui Paulo 
177ab0b1257SRui Paulo #if 0 /*
178ab0b1257SRui Paulo        * XXXrpaulo: I have this CPU model and when it returns from C3
179ab0b1257SRui Paulo        * coretemp continues to function properly.
180ab0b1257SRui Paulo        */
181ab0b1257SRui Paulo 
18283d18f22SDag-Erling Smørgrav 	/*
18383d18f22SDag-Erling Smørgrav 	 * Check for errata AE18.
18483d18f22SDag-Erling Smørgrav 	 * "Processor Digital Thermal Sensor (DTS) Readout stops
18583d18f22SDag-Erling Smørgrav 	 *  updating upon returning from C3/C4 state."
18683d18f22SDag-Erling Smørgrav 	 *
18783d18f22SDag-Erling Smørgrav 	 * Adapted from the Linux coretemp driver.
18883d18f22SDag-Erling Smørgrav 	 */
189a3bc0a4eSXin LI 	if (cpu_model == 0xe && cpu_stepping < 0xc) {
19083d18f22SDag-Erling Smørgrav 		msr = rdmsr(MSR_BIOS_SIGN);
19183d18f22SDag-Erling Smørgrav 		msr = msr >> 32;
19283d18f22SDag-Erling Smørgrav 		if (msr < 0x39) {
1935afb221cSDag-Erling Smørgrav 			device_printf(dev, "not supported (Intel errata "
1945afb221cSDag-Erling Smørgrav 			    "AE18), try updating your BIOS\n");
19583d18f22SDag-Erling Smørgrav 			return (ENXIO);
19683d18f22SDag-Erling Smørgrav 		}
19783d18f22SDag-Erling Smørgrav 	}
198ab0b1257SRui Paulo #endif
199a3bc0a4eSXin LI 
200a3bc0a4eSXin LI 	/*
201a3bc0a4eSXin LI 	 * Use 100C as the initial value.
202a3bc0a4eSXin LI 	 */
203a3bc0a4eSXin LI 	sc->sc_tjmax = 100;
204a3bc0a4eSXin LI 
205a3bc0a4eSXin LI 	if ((cpu_model == 0xf && cpu_stepping >= 2) || cpu_model == 0xe) {
20683d18f22SDag-Erling Smørgrav 		/*
20783d18f22SDag-Erling Smørgrav 		 * On some Core 2 CPUs, there's an undocumented MSR that
20883d18f22SDag-Erling Smørgrav 		 * can tell us if Tj(max) is 100 or 85.
20983d18f22SDag-Erling Smørgrav 		 *
21083d18f22SDag-Erling Smørgrav 		 * The if-clause for CPUs having the MSR_IA32_EXT_CONFIG was adapted
21183d18f22SDag-Erling Smørgrav 		 * from the Linux coretemp driver.
21283d18f22SDag-Erling Smørgrav 		 */
2135afb221cSDag-Erling Smørgrav 		msr = rdmsr(MSR_IA32_EXT_CONFIG);
2145afb221cSDag-Erling Smørgrav 		if (msr & (1 << 30))
2155afb221cSDag-Erling Smørgrav 			sc->sc_tjmax = 85;
21628a54cacSXin LI 	} else if (cpu_model == 0x17) {
21728a54cacSXin LI 		switch (cpu_stepping) {
21828a54cacSXin LI 		case 0x6:	/* Mobile Core 2 Duo */
219ba95b1e1SXin LI 			sc->sc_tjmax = 105;
22028a54cacSXin LI 			break;
22128a54cacSXin LI 		default:	/* Unknown stepping */
22228a54cacSXin LI 			break;
22328a54cacSXin LI 		}
22489017932SXin LI 	} else if (cpu_model == 0x1c) {
22589017932SXin LI 		switch (cpu_stepping) {
22689017932SXin LI 		case 0xa:	/* 45nm Atom D400, N400 and D500 series */
22789017932SXin LI 			sc->sc_tjmax = 100;
22889017932SXin LI 			break;
22989017932SXin LI 		default:
23089017932SXin LI 			sc->sc_tjmax = 90;
23189017932SXin LI 			break;
23289017932SXin LI 		}
23328a54cacSXin LI 	} else {
23428a54cacSXin LI 		/*
23528a54cacSXin LI 		 * Attempt to get Tj(max) from MSR IA32_TEMPERATURE_TARGET.
23628a54cacSXin LI 		 *
23728a54cacSXin LI 		 * This method is described in Intel white paper "CPU
23828a54cacSXin LI 		 * Monitoring With DTS/PECI". (#322683)
23928a54cacSXin LI 		 */
24028a54cacSXin LI 		ret = rdmsr_safe(MSR_IA32_TEMPERATURE_TARGET, &msr);
24128a54cacSXin LI 		if (ret == 0) {
24228a54cacSXin LI 			tjtarget = (msr >> 16) & 0xff;
24328a54cacSXin LI 
24428a54cacSXin LI 			/*
24528a54cacSXin LI 			 * On earlier generation of processors, the value
24628a54cacSXin LI 			 * obtained from IA32_TEMPERATURE_TARGET register is
24728a54cacSXin LI 			 * an offset that needs to be summed with a model
24828a54cacSXin LI 			 * specific base.  It is however not clear what
24928a54cacSXin LI 			 * these numbers are, with the publicly available
25028a54cacSXin LI 			 * documents from Intel.
25128a54cacSXin LI 			 *
25272dc07ebSAttilio Rao 			 * For now, we consider [70, 110]C range, as
25328a54cacSXin LI 			 * described in #322683, as "reasonable" and accept
25428a54cacSXin LI 			 * these values whenever the MSR is available for
25528a54cacSXin LI 			 * read, regardless the CPU model.
25628a54cacSXin LI 			 */
25772dc07ebSAttilio Rao 			if (tjtarget >= 70 && tjtarget <= 110)
25828a54cacSXin LI 				sc->sc_tjmax = tjtarget;
25928a54cacSXin LI 			else
26028a54cacSXin LI 				device_printf(dev, "Tj(target) value %d "
26128a54cacSXin LI 				    "does not seem right.\n", tjtarget);
26228a54cacSXin LI 		} else
26328a54cacSXin LI 			device_printf(dev, "Can not get Tj(target) "
26428a54cacSXin LI 			    "from your CPU, using 100C.\n");
2655afb221cSDag-Erling Smørgrav 	}
26683d18f22SDag-Erling Smørgrav 
267a3bc0a4eSXin LI 	if (bootverbose)
268a3bc0a4eSXin LI 		device_printf(dev, "Setting TjMax=%d\n", sc->sc_tjmax);
269a3bc0a4eSXin LI 
270d1f97f76SXin LI 	ctx = device_get_sysctl_ctx(dev);
271d1f97f76SXin LI 
272d1f97f76SXin LI 	oid = SYSCTL_ADD_NODE(ctx,
273d1f97f76SXin LI 	    SYSCTL_CHILDREN(device_get_sysctl_tree(pdev)), OID_AUTO,
2747029da5cSPawel Biernacki 	    "coretemp", CTLFLAG_RD | CTLFLAG_MPSAFE, NULL,
2757029da5cSPawel Biernacki 	    "Per-CPU thermal information");
276d1f97f76SXin LI 
27783d18f22SDag-Erling Smørgrav 	/*
278d1f97f76SXin LI 	 * Add the MIBs to dev.cpu.N and dev.cpu.N.coretemp.
27983d18f22SDag-Erling Smørgrav 	 */
280d1f97f76SXin LI 	SYSCTL_ADD_PROC(ctx, SYSCTL_CHILDREN(device_get_sysctl_tree(pdev)),
281e42412a9SMark Johnston 	    OID_AUTO, "temperature", CTLTYPE_INT | CTLFLAG_RD | CTLFLAG_MPSAFE,
282e42412a9SMark Johnston 	    dev, CORETEMP_TEMP, coretemp_get_val_sysctl, "IK",
2833705c384SNorikatsu Shigemura 	    "Current temperature");
284d1f97f76SXin LI 	SYSCTL_ADD_PROC(ctx, SYSCTL_CHILDREN(oid), OID_AUTO, "delta",
285e42412a9SMark Johnston 	    CTLTYPE_INT | CTLFLAG_RD | CTLFLAG_MPSAFE, dev, CORETEMP_DELTA,
286d1f97f76SXin LI 	    coretemp_get_val_sysctl, "I",
287d1f97f76SXin LI 	    "Delta between TCC activation and current temperature");
288d1f97f76SXin LI 	SYSCTL_ADD_PROC(ctx, SYSCTL_CHILDREN(oid), OID_AUTO, "resolution",
289e42412a9SMark Johnston 	    CTLTYPE_INT | CTLFLAG_RD | CTLFLAG_MPSAFE, dev, CORETEMP_RESOLUTION,
290d1f97f76SXin LI 	    coretemp_get_val_sysctl, "I",
291d1f97f76SXin LI 	    "Resolution of CPU thermal sensor");
292d1f97f76SXin LI 	SYSCTL_ADD_PROC(ctx, SYSCTL_CHILDREN(oid), OID_AUTO, "tjmax",
293e42412a9SMark Johnston 	    CTLTYPE_INT | CTLFLAG_RD | CTLFLAG_MPSAFE, dev, CORETEMP_TJMAX,
294d1f97f76SXin LI 	    coretemp_get_val_sysctl, "IK",
295d1f97f76SXin LI 	    "TCC activation temperature");
296d1f97f76SXin LI 	SYSCTL_ADD_PROC(ctx, SYSCTL_CHILDREN(oid), OID_AUTO,
297e42412a9SMark Johnston 	    "throttle_log", CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_MPSAFE, dev, 0,
298d1f97f76SXin LI 	    coretemp_throttle_log_sysctl, "I",
299d1f97f76SXin LI 	    "Set to 1 if the thermal sensor has tripped");
30083d18f22SDag-Erling Smørgrav 
30183d18f22SDag-Erling Smørgrav 	return (0);
30283d18f22SDag-Erling Smørgrav }
30383d18f22SDag-Erling Smørgrav 
30483d18f22SDag-Erling Smørgrav static int
coretemp_detach(device_t dev)30583d18f22SDag-Erling Smørgrav coretemp_detach(device_t dev)
30683d18f22SDag-Erling Smørgrav {
30783d18f22SDag-Erling Smørgrav 	return (0);
30883d18f22SDag-Erling Smørgrav }
30983d18f22SDag-Erling Smørgrav 
31074f80bc1SAlexander Motin struct coretemp_args {
31174f80bc1SAlexander Motin 	u_int		msr;
31274f80bc1SAlexander Motin 	uint64_t	val;
31374f80bc1SAlexander Motin };
31474f80bc1SAlexander Motin 
3159f05d312SAlexander Leidinger /*
3169f05d312SAlexander Leidinger  * The digital temperature reading is located at bit 16
3179f05d312SAlexander Leidinger  * of MSR_THERM_STATUS.
3189f05d312SAlexander Leidinger  *
3199f05d312SAlexander Leidinger  * There is a bit on that MSR that indicates whether the
3209f05d312SAlexander Leidinger  * temperature is valid or not.
3219f05d312SAlexander Leidinger  *
3229f05d312SAlexander Leidinger  * The temperature is computed by subtracting the temperature
3239f05d312SAlexander Leidinger  * reading by Tj(max).
3249f05d312SAlexander Leidinger  */
3254cc6fe1eSKonstantin Belousov static uint64_t
coretemp_get_thermal_msr(int cpu)3264cc6fe1eSKonstantin Belousov coretemp_get_thermal_msr(int cpu)
3274cc6fe1eSKonstantin Belousov {
3284cc6fe1eSKonstantin Belousov 	uint64_t res;
3294cc6fe1eSKonstantin Belousov 
3304cc6fe1eSKonstantin Belousov 	x86_msr_op(MSR_THERM_STATUS, MSR_OP_RENDEZVOUS_ONE | MSR_OP_READ |
3314cc6fe1eSKonstantin Belousov 	    MSR_OP_CPUID(cpu), 0, &res);
3324cc6fe1eSKonstantin Belousov 	return (res);
33383d18f22SDag-Erling Smørgrav }
33483d18f22SDag-Erling Smørgrav 
335d1f97f76SXin LI static void
coretemp_clear_thermal_msr(int cpu)336d1f97f76SXin LI coretemp_clear_thermal_msr(int cpu)
337d1f97f76SXin LI {
3384cc6fe1eSKonstantin Belousov 	x86_msr_op(MSR_THERM_STATUS, MSR_OP_RENDEZVOUS_ONE | MSR_OP_WRITE |
3394cc6fe1eSKonstantin Belousov 	    MSR_OP_CPUID(cpu), 0, NULL);
34083d18f22SDag-Erling Smørgrav }
34183d18f22SDag-Erling Smørgrav 
3429f05d312SAlexander Leidinger static int
coretemp_get_val_sysctl(SYSCTL_HANDLER_ARGS)343d1f97f76SXin LI coretemp_get_val_sysctl(SYSCTL_HANDLER_ARGS)
34483d18f22SDag-Erling Smørgrav {
345d1f97f76SXin LI 	device_t dev;
346d1f97f76SXin LI 	uint64_t msr;
347d1f97f76SXin LI 	int val, tmp;
348d1f97f76SXin LI 	struct coretemp_softc *sc;
349d1f97f76SXin LI 	enum therm_info type;
350d1f97f76SXin LI 	char stemp[16];
35183d18f22SDag-Erling Smørgrav 
352d1f97f76SXin LI 	dev = (device_t) arg1;
353d1f97f76SXin LI 	msr = coretemp_get_thermal_msr(device_get_unit(dev));
354d1f97f76SXin LI 	sc = device_get_softc(dev);
355d1f97f76SXin LI 	type = arg2;
35683d18f22SDag-Erling Smørgrav 
357d1f97f76SXin LI 	if (((msr >> THERM_STATUS_VALID_SHIFT) & THERM_STATUS_VALID_MASK) != 1) {
358d1f97f76SXin LI 		val = -1;
359d1f97f76SXin LI 	} else {
360d1f97f76SXin LI 		switch (type) {
361d1f97f76SXin LI 		case CORETEMP_TEMP:
362d1f97f76SXin LI 			tmp = (msr >> THERM_STATUS_TEMP_SHIFT) &
363d1f97f76SXin LI 			    THERM_STATUS_TEMP_MASK;
364d1f97f76SXin LI 			val = (sc->sc_tjmax - tmp) * 10 + TZ_ZEROC;
365d1f97f76SXin LI 			break;
366d1f97f76SXin LI 		case CORETEMP_DELTA:
367d1f97f76SXin LI 			val = (msr >> THERM_STATUS_TEMP_SHIFT) &
368d1f97f76SXin LI 			    THERM_STATUS_TEMP_MASK;
369d1f97f76SXin LI 			break;
370d1f97f76SXin LI 		case CORETEMP_RESOLUTION:
371d1f97f76SXin LI 			val = (msr >> THERM_STATUS_RES_SHIFT) &
372d1f97f76SXin LI 			    THERM_STATUS_RES_MASK;
373d1f97f76SXin LI 			break;
374d1f97f76SXin LI 		case CORETEMP_TJMAX:
375d1f97f76SXin LI 			val = sc->sc_tjmax * 10 + TZ_ZEROC;
376d1f97f76SXin LI 			break;
377d1f97f76SXin LI 		}
378d1f97f76SXin LI 	}
379d1f97f76SXin LI 
380d1f97f76SXin LI 	if (msr & THERM_STATUS_LOG) {
381c839b5bbSAttilio Rao 		coretemp_clear_thermal_msr(device_get_unit(dev));
382d1f97f76SXin LI 		sc->sc_throttle_log = 1;
383d1f97f76SXin LI 
384d1f97f76SXin LI 		/*
385d1f97f76SXin LI 		 * Check for Critical Temperature Status and Critical
386d1f97f76SXin LI 		 * Temperature Log.  It doesn't really matter if the
387d1f97f76SXin LI 		 * current temperature is invalid because the "Critical
388d1f97f76SXin LI 		 * Temperature Log" bit will tell us if the Critical
389d1f97f76SXin LI 		 * Temperature has * been reached in past. It's not
390d1f97f76SXin LI 		 * directly related to the current temperature.
391d1f97f76SXin LI 		 *
392d1f97f76SXin LI 		 * If we reach a critical level, allow devctl(4)
393d1f97f76SXin LI 		 * to catch this and shutdown the system.
394d1f97f76SXin LI 		 */
3958362905cSsadaszewski 		if (msr & THERM_CRITICAL_STATUS) {
396d1f97f76SXin LI 			tmp = (msr >> THERM_STATUS_TEMP_SHIFT) &
397d1f97f76SXin LI 			    THERM_STATUS_TEMP_MASK;
398d1f97f76SXin LI 			tmp = (sc->sc_tjmax - tmp) * 10 + TZ_ZEROC;
399d1f97f76SXin LI 			device_printf(dev, "critical temperature detected, "
400d1f97f76SXin LI 			    "suggest system shutdown\n");
401d1f97f76SXin LI 			snprintf(stemp, sizeof(stemp), "%d", tmp);
402d1f97f76SXin LI 			devctl_notify("coretemp", "Thermal", stemp,
403d1f97f76SXin LI 			    "notify=0xcc");
404d1f97f76SXin LI 		}
405d1f97f76SXin LI 	}
406d1f97f76SXin LI 
407d1f97f76SXin LI 	return (sysctl_handle_int(oidp, &val, 0, req));
408d1f97f76SXin LI }
409d1f97f76SXin LI 
410d1f97f76SXin LI static int
coretemp_throttle_log_sysctl(SYSCTL_HANDLER_ARGS)411d1f97f76SXin LI coretemp_throttle_log_sysctl(SYSCTL_HANDLER_ARGS)
412d1f97f76SXin LI {
413d1f97f76SXin LI 	device_t dev;
414d1f97f76SXin LI 	uint64_t msr;
415d1f97f76SXin LI 	int error, val;
416d1f97f76SXin LI 	struct coretemp_softc *sc;
417d1f97f76SXin LI 
418d1f97f76SXin LI 	dev = (device_t) arg1;
419d1f97f76SXin LI 	msr = coretemp_get_thermal_msr(device_get_unit(dev));
420d1f97f76SXin LI 	sc = device_get_softc(dev);
421d1f97f76SXin LI 
422c839b5bbSAttilio Rao 	if (msr & THERM_STATUS_LOG) {
423c839b5bbSAttilio Rao 		coretemp_clear_thermal_msr(device_get_unit(dev));
424d1f97f76SXin LI 		sc->sc_throttle_log = 1;
425c839b5bbSAttilio Rao 	}
426d1f97f76SXin LI 
427d1f97f76SXin LI 	val = sc->sc_throttle_log;
428d1f97f76SXin LI 
429d1f97f76SXin LI 	error = sysctl_handle_int(oidp, &val, 0, req);
430d1f97f76SXin LI 
431d1f97f76SXin LI 	if (error || !req->newptr)
432d1f97f76SXin LI 		return (error);
433d1f97f76SXin LI 	else if (val != 0)
434d1f97f76SXin LI 		return (EINVAL);
435d1f97f76SXin LI 
436d1f97f76SXin LI 	coretemp_clear_thermal_msr(device_get_unit(dev));
437d1f97f76SXin LI 	sc->sc_throttle_log = 0;
438d1f97f76SXin LI 
439d1f97f76SXin LI 	return (0);
44083d18f22SDag-Erling Smørgrav }
441