sys/kern/subr_clockcalib.c

/*-
 * Copyright (c) 2022 Colin Percival
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 *
 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 * SUCH DAMAGE.
 */
*c2705ceaSColin Percival
*c2705ceaSColin Percival#include <sys/cdefs.h>
*c2705ceaSColin Percival__FBSDID("$FreeBSD$");
*c2705ceaSColin Percival
*c2705ceaSColin Percival#include <sys/param.h>
*c2705ceaSColin Percival#include <sys/systm.h>
*c2705ceaSColin Percival#include <sys/timetc.h>
*c2705ceaSColin Percival#include <sys/tslog.h>
*c2705ceaSColin Percival#include <machine/cpu.h>
*c2705ceaSColin Percival
*c2705ceaSColin Percival/**
*c2705ceaSColin Percival * clockcalib(clk, clkname):
*c2705ceaSColin Percival * Return the frequency of the provided timer, as calibrated against the
*c2705ceaSColin Percival * current best-available timecounter.
*c2705ceaSColin Percival */
*c2705ceaSColin Percivaluint64_t
*c2705ceaSColin Percivalclockcalib(uint64_t (*clk)(void), const char *clkname)
*c2705ceaSColin Percival{
*c2705ceaSColin Percival	struct timecounter *tc = atomic_load_ptr(&timecounter);
*c2705ceaSColin Percival	uint64_t clk0, clk1, clk_delay, n, passes = 0;
*c2705ceaSColin Percival	uint64_t t0, t1, tadj, tlast;
*c2705ceaSColin Percival	double mu_clk = 0;
*c2705ceaSColin Percival	double mu_t = 0;
*c2705ceaSColin Percival	double va_clk = 0;
*c2705ceaSColin Percival	double va_t = 0;
*c2705ceaSColin Percival	double cva = 0;
*c2705ceaSColin Percival	double d1, d2;
*c2705ceaSColin Percival	double inv_n;
*c2705ceaSColin Percival	uint64_t freq;
*c2705ceaSColin Percival
*c2705ceaSColin Percival	TSENTER();
*c2705ceaSColin Percival	/*-
*c2705ceaSColin Percival	 * The idea here is to compute a best-fit linear regression between
*c2705ceaSColin Percival	 * the clock we're calibrating and the reference clock; the slope of
*c2705ceaSColin Percival	 * that line multiplied by the frequency of the reference clock gives
*c2705ceaSColin Percival	 * us the frequency we're looking for.
*c2705ceaSColin Percival	 *
*c2705ceaSColin Percival	 * To do this, we calculate the
*c2705ceaSColin Percival	 * (a) mean of the target clock measurements,
*c2705ceaSColin Percival	 * (b) variance of the target clock measurements,
*c2705ceaSColin Percival	 * (c) mean of the reference clock measurements,
*c2705ceaSColin Percival	 * (d) variance of the reference clock measurements, and
*c2705ceaSColin Percival	 * (e) covariance of the target clock and reference clock measurements
*c2705ceaSColin Percival	 * on an ongoing basis, updating all five values after each new data
*c2705ceaSColin Percival	 * point arrives, stopping when we're confident that we've accurately
*c2705ceaSColin Percival	 * measured the target clock frequency.
*c2705ceaSColin Percival	 *
*c2705ceaSColin Percival	 * Given those five values, the important formulas to remember from
*c2705ceaSColin Percival	 * introductory statistics are:
*c2705ceaSColin Percival	 * 1. slope of regression line = covariance(x, y) / variance(x)
*c2705ceaSColin Percival	 * 2. (relative uncertainty in slope)^2 =
*c2705ceaSColin Percival	 *    (variance(x) * variance(y) - covariance(x, y)^2)
*c2705ceaSColin Percival	 *    ------------------------------------------------
*c2705ceaSColin Percival	 *              covariance(x, y)^2 * (N - 2)
*c2705ceaSColin Percival	 *
*c2705ceaSColin Percival	 * We adjust the second formula slightly, adding a term to each of
*c2705ceaSColin Percival	 * the variance values to reflect the measurement quantization.
*c2705ceaSColin Percival	 *
*c2705ceaSColin Percival	 * Finally, we need to determine when to stop gathering data.  We
*c2705ceaSColin Percival	 * can't simply stop as soon as the computed uncertainty estimate
*c2705ceaSColin Percival	 * is below our threshold; this would make us overconfident since it
*c2705ceaSColin Percival	 * would introduce a multiple-comparisons problem (cf. sequential
*c2705ceaSColin Percival	 * analysis in clinical trials).  Instead, we stop with N data points
*c2705ceaSColin Percival	 * if the estimated uncertainty of the first k data points meets our
*c2705ceaSColin Percival	 * target for all N/2 < k <= N; this is not theoretically optimal,
*c2705ceaSColin Percival	 * but in practice works well enough.
*c2705ceaSColin Percival	 */
*c2705ceaSColin Percival
*c2705ceaSColin Percival	/*
*c2705ceaSColin Percival	 * Initial values for clocks; we'll subtract these off from values
*c2705ceaSColin Percival	 * we measure later in order to reduce floating-point rounding errors.
*c2705ceaSColin Percival	 * We keep track of an adjustment for values read from the reference
*c2705ceaSColin Percival	 * timecounter, since it can wrap.
*c2705ceaSColin Percival	 */
*c2705ceaSColin Percival	clk0 = clk();
*c2705ceaSColin Percival	t0 = tc->tc_get_timecount(tc) & tc->tc_counter_mask;
*c2705ceaSColin Percival	tadj = 0;
*c2705ceaSColin Percival	tlast = t0;
*c2705ceaSColin Percival
*c2705ceaSColin Percival	/* Loop until we give up or decide that we're calibrated. */
*c2705ceaSColin Percival	for (n = 1; ; n++) {
*c2705ceaSColin Percival		/* Get a new data point. */
*c2705ceaSColin Percival		clk1 = clk() - clk0;
*c2705ceaSColin Percival		t1 = tc->tc_get_timecount(tc) & tc->tc_counter_mask;
*c2705ceaSColin Percival		while (t1 + tadj < tlast)
*c2705ceaSColin Percival			tadj += tc->tc_counter_mask + 1;
*c2705ceaSColin Percival		tlast = t1 + tadj;
*c2705ceaSColin Percival		t1 += tadj - t0;
*c2705ceaSColin Percival
*c2705ceaSColin Percival		/* If we spent too long, bail. */
*c2705ceaSColin Percival		if (t1 > tc->tc_frequency) {
*c2705ceaSColin Percival			printf("Statistical %s calibration failed!  "
*c2705ceaSColin Percival			    "Clocks might be ticking at variable rates.\n",
*c2705ceaSColin Percival			     clkname);
*c2705ceaSColin Percival			printf("Falling back to slow %s calibration.\n",
*c2705ceaSColin Percival			    clkname);
*c2705ceaSColin Percival			freq = (double)(tc->tc_frequency) * clk1 / t1;
*c2705ceaSColin Percival			break;
*c2705ceaSColin Percival		}
*c2705ceaSColin Percival
*c2705ceaSColin Percival		/* Precompute to save on divisions later. */
*c2705ceaSColin Percival		inv_n = 1.0 / n;
*c2705ceaSColin Percival
*c2705ceaSColin Percival		/* Update mean and variance of recorded TSC values. */
*c2705ceaSColin Percival		d1 = clk1 - mu_clk;
*c2705ceaSColin Percival		mu_clk += d1 * inv_n;
*c2705ceaSColin Percival		d2 = d1 * (clk1 - mu_clk);
*c2705ceaSColin Percival		va_clk += (d2 - va_clk) * inv_n;
*c2705ceaSColin Percival
*c2705ceaSColin Percival		/* Update mean and variance of recorded time values. */
*c2705ceaSColin Percival		d1 = t1 - mu_t;
*c2705ceaSColin Percival		mu_t += d1 * inv_n;
*c2705ceaSColin Percival		d2 = d1 * (t1 - mu_t);
*c2705ceaSColin Percival		va_t += (d2 - va_t) * inv_n;
*c2705ceaSColin Percival
*c2705ceaSColin Percival		/* Update covariance. */
*c2705ceaSColin Percival		d2 = d1 * (clk1 - mu_clk);
*c2705ceaSColin Percival		cva += (d2 - cva) * inv_n;
*c2705ceaSColin Percival
*c2705ceaSColin Percival		/*
*c2705ceaSColin Percival		 * Count low-uncertainty iterations.  This is a rearrangement
*c2705ceaSColin Percival		 * of "relative uncertainty < 1 PPM" avoiding division.
*c2705ceaSColin Percival		 */
*c2705ceaSColin Percival#define TSC_PPM_UNCERTAINTY	1
*c2705ceaSColin Percival#define TSC_UNCERTAINTY		TSC_PPM_UNCERTAINTY * 0.000001
*c2705ceaSColin Percival#define TSC_UNCERTAINTY_SQR	TSC_UNCERTAINTY * TSC_UNCERTAINTY
*c2705ceaSColin Percival		if (TSC_UNCERTAINTY_SQR * (n - 2) * cva * cva >
*c2705ceaSColin Percival		    (va_t + 4) * (va_clk + 4) - cva * cva)
*c2705ceaSColin Percival			passes++;
*c2705ceaSColin Percival		else
*c2705ceaSColin Percival			passes = 0;
*c2705ceaSColin Percival
*c2705ceaSColin Percival		/* Break if we're consistently certain. */
*c2705ceaSColin Percival		if (passes * 2 > n) {
*c2705ceaSColin Percival			freq = (double)(tc->tc_frequency) * cva / va_t;
*c2705ceaSColin Percival			if (bootverbose)
*c2705ceaSColin Percival				printf("Statistical %s calibration took"
*c2705ceaSColin Percival				    " %lu us and %lu data points\n",
*c2705ceaSColin Percival				    clkname, (unsigned long)(t1 *
*c2705ceaSColin Percival					1000000.0 / tc->tc_frequency),
*c2705ceaSColin Percival				    (unsigned long)n);
*c2705ceaSColin Percival			break;
*c2705ceaSColin Percival		}
*c2705ceaSColin Percival
*c2705ceaSColin Percival		/*
*c2705ceaSColin Percival		 * Add variable delay to avoid theoretical risk of aliasing
*c2705ceaSColin Percival		 * resulting from this loop synchronizing with the frequency
*c2705ceaSColin Percival		 * of the reference clock.  On the nth iteration, we spend
*c2705ceaSColin Percival		 * O(1 / n) time here -- long enough to avoid aliasing, but
*c2705ceaSColin Percival		 * short enough to be insignificant as n grows.
*c2705ceaSColin Percival		 */
*c2705ceaSColin Percival		clk_delay = clk() + (clk() - clk0) / (n * n);
*c2705ceaSColin Percival		while (clk() < clk_delay)
*c2705ceaSColin Percival			cpu_spinwait(); /* Do nothing. */
*c2705ceaSColin Percival	}
*c2705ceaSColin Percival	TSEXIT();
*c2705ceaSColin Percival	return (freq);
*c2705ceaSColin Percival}