xref: /freebsd/sys/kern/kern_ffclock.c (revision 809922b01004daf627ad4b8d92c7f98eb579043c)
1 /*-
2  * SPDX-License-Identifier: BSD-2-Clause-FreeBSD
3  *
4  * Copyright (c) 2011 The University of Melbourne
5  * All rights reserved.
6  *
7  * This software was developed by Julien Ridoux at the University of Melbourne
8  * under sponsorship from the FreeBSD Foundation.
9  *
10  * Redistribution and use in source and binary forms, with or without
11  * modification, are permitted provided that the following conditions
12  * are met:
13  * 1. Redistributions of source code must retain the above copyright
14  *    notice, this list of conditions and the following disclaimer.
15  * 2. Redistributions in binary form must reproduce the above copyright
16  *    notice, this list of conditions and the following disclaimer in the
17  *    documentation and/or other materials provided with the distribution.
18  *
19  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
20  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
21  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
22  * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
23  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
24  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
25  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
26  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
27  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
28  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
29  * SUCH DAMAGE.
30  */
31 
32 #include <sys/cdefs.h>
33 __FBSDID("$FreeBSD$");
34 
35 #include "opt_ffclock.h"
36 
37 #include <sys/param.h>
38 #include <sys/bus.h>
39 #include <sys/kernel.h>
40 #include <sys/lock.h>
41 #include <sys/module.h>
42 #include <sys/mutex.h>
43 #include <sys/priv.h>
44 #include <sys/proc.h>
45 #include <sys/sbuf.h>
46 #include <sys/sysproto.h>
47 #include <sys/sysctl.h>
48 #include <sys/systm.h>
49 #include <sys/timeffc.h>
50 
51 #ifdef FFCLOCK
52 
/* Advertise feed-forward clock support as a kernel feature. */
FEATURE(ffclock, "Feed-forward clock support");

/*
 * Feed-forward clock state defined outside this file.
 */
/* Current clock estimate; replaced by the setestimate system call. */
extern struct ffclock_estimate ffclock_estimate;
/* Subtracted from absolute time when FFCLOCK_UPTIME is requested. */
extern struct bintime ffclock_boottime;
/* Incremented each time a new estimate is stored. */
extern int8_t ffclock_updated;
/* Held while ffclock_estimate is copied in or out by the system calls. */
extern struct mtx ffclock_mtx;
59 
60 /*
61  * Feed-forward clock absolute time. This should be the preferred way to read
62  * the feed-forward clock for "wall-clock" type time. The flags allow to compose
63  * various flavours of absolute time (e.g. with or without leap seconds taken
64  * into account). If valid pointers are provided, the ffcounter value and an
65  * upper bound on clock error associated with the bintime are provided.
66  * NOTE: use ffclock_convert_abs() to differ the conversion of a ffcounter value
67  * read earlier.
68  */
69 void
70 ffclock_abstime(ffcounter *ffcount, struct bintime *bt,
71     struct bintime *error_bound, uint32_t flags)
72 {
73 	struct ffclock_estimate cest;
74 	ffcounter ffc;
75 	ffcounter update_ffcount;
76 	ffcounter ffdelta_error;
77 
78 	/* Get counter and corresponding time. */
79 	if ((flags & FFCLOCK_FAST) == FFCLOCK_FAST)
80 		ffclock_last_tick(&ffc, bt, flags);
81 	else {
82 		ffclock_read_counter(&ffc);
83 		ffclock_convert_abs(ffc, bt, flags);
84 	}
85 
86 	/* Current ffclock estimate, use update_ffcount as generation number. */
87 	do {
88 		update_ffcount = ffclock_estimate.update_ffcount;
89 		bcopy(&ffclock_estimate, &cest, sizeof(struct ffclock_estimate));
90 	} while (update_ffcount != ffclock_estimate.update_ffcount);
91 
92 	/*
93 	 * Leap second adjustment. Total as seen by synchronisation algorithm
94 	 * since it started. cest.leapsec_next is the ffcounter prediction of
95 	 * when the next leapsecond occurs.
96 	 */
97 	if ((flags & FFCLOCK_LEAPSEC) == FFCLOCK_LEAPSEC) {
98 		bt->sec -= cest.leapsec_total;
99 		if (ffc > cest.leapsec_next)
100 			bt->sec -= cest.leapsec;
101 	}
102 
103 	/* Boot time adjustment, for uptime/monotonic clocks. */
104 	if ((flags & FFCLOCK_UPTIME) == FFCLOCK_UPTIME) {
105 		bintime_sub(bt, &ffclock_boottime);
106 	}
107 
108 	/* Compute error bound if a valid pointer has been passed. */
109 	if (error_bound) {
110 		ffdelta_error = ffc - cest.update_ffcount;
111 		ffclock_convert_diff(ffdelta_error, error_bound);
112 		/* 18446744073709 = int(2^64/1e12), err_bound_rate in [ps/s] */
113 		bintime_mul(error_bound, cest.errb_rate *
114 		    (uint64_t)18446744073709LL);
115 		/* 18446744073 = int(2^64 / 1e9), since err_abs in [ns] */
116 		bintime_addx(error_bound, cest.errb_abs *
117 		    (uint64_t)18446744073LL);
118 	}
119 
120 	if (ffcount)
121 		*ffcount = ffc;
122 }
123 
124 /*
125  * Feed-forward difference clock. This should be the preferred way to convert a
126  * time interval in ffcounter values into a time interval in seconds. If a valid
127  * pointer is passed, an upper bound on the error in computing the time interval
128  * in seconds is provided.
129  */
130 void
131 ffclock_difftime(ffcounter ffdelta, struct bintime *bt,
132     struct bintime *error_bound)
133 {
134 	ffcounter update_ffcount;
135 	uint32_t err_rate;
136 
137 	ffclock_convert_diff(ffdelta, bt);
138 
139 	if (error_bound) {
140 		do {
141 			update_ffcount = ffclock_estimate.update_ffcount;
142 			err_rate = ffclock_estimate.errb_rate;
143 		} while (update_ffcount != ffclock_estimate.update_ffcount);
144 
145 		ffclock_convert_diff(ffdelta, error_bound);
146 		/* 18446744073709 = int(2^64/1e12), err_bound_rate in [ps/s] */
147 		bintime_mul(error_bound, err_rate * (uint64_t)18446744073709LL);
148 	}
149 }
150 
151 /*
152  * Create a new kern.sysclock sysctl node, which will be home to some generic
153  * sysclock configuration variables. Feed-forward clock specific variables will
154  * live under the ffclock subnode.
155  */
156 
157 SYSCTL_NODE(_kern, OID_AUTO, sysclock, CTLFLAG_RW | CTLFLAG_MPSAFE, 0,
158     "System clock related configuration");
159 SYSCTL_NODE(_kern_sysclock, OID_AUTO, ffclock, CTLFLAG_RW | CTLFLAG_MPSAFE, 0,
160     "Feed-forward clock configuration");
161 
162 static char *sysclocks[] = {"feedback", "feed-forward"};
163 #define	MAX_SYSCLOCK_NAME_LEN 16
164 #define	NUM_SYSCLOCKS nitems(sysclocks)
165 
166 static int ffclock_version = 2;
167 SYSCTL_INT(_kern_sysclock_ffclock, OID_AUTO, version, CTLFLAG_RD,
168     &ffclock_version, 0, "Feed-forward clock kernel version");
169 
170 /* List available sysclocks. */
171 static int
172 sysctl_kern_sysclock_available(SYSCTL_HANDLER_ARGS)
173 {
174 	struct sbuf *s;
175 	int clk, error;
176 
177 	s = sbuf_new_for_sysctl(NULL, NULL,
178 	    MAX_SYSCLOCK_NAME_LEN * NUM_SYSCLOCKS, req);
179 	if (s == NULL)
180 		return (ENOMEM);
181 
182 	for (clk = 0; clk < NUM_SYSCLOCKS; clk++) {
183 		sbuf_cat(s, sysclocks[clk]);
184 		if (clk + 1 < NUM_SYSCLOCKS)
185 			sbuf_cat(s, " ");
186 	}
187 	error = sbuf_finish(s);
188 	sbuf_delete(s);
189 
190 	return (error);
191 }
192 
193 SYSCTL_PROC(_kern_sysclock, OID_AUTO, available,
194     CTLTYPE_STRING | CTLFLAG_RD | CTLFLAG_NEEDGIANT, 0, 0,
195     sysctl_kern_sysclock_available, "A",
196     "List of available system clocks");
197 
198 /*
199  * Return the name of the active system clock if read, or attempt to change
200  * the active system clock to the user specified one if written to. The active
201  * system clock is read when calling any of the [get]{bin,nano,micro}[up]time()
202  * functions.
203  */
204 static int
205 sysctl_kern_sysclock_active(SYSCTL_HANDLER_ARGS)
206 {
207 	char newclock[MAX_SYSCLOCK_NAME_LEN];
208 	int error;
209 	int clk;
210 
211 	/* Return the name of the current active sysclock. */
212 	strlcpy(newclock, sysclocks[sysclock_active], sizeof(newclock));
213 	error = sysctl_handle_string(oidp, newclock, sizeof(newclock), req);
214 
215 	/* Check for error or no change */
216 	if (error != 0 || req->newptr == NULL)
217 		goto done;
218 
219 	/* Change the active sysclock to the user specified one: */
220 	error = EINVAL;
221 	for (clk = 0; clk < NUM_SYSCLOCKS; clk++) {
222 		if (strncmp(newclock, sysclocks[clk],
223 		    MAX_SYSCLOCK_NAME_LEN - 1)) {
224 			continue;
225 		}
226 		sysclock_active = clk;
227 		error = 0;
228 		break;
229 	}
230 done:
231 	return (error);
232 }
233 
234 SYSCTL_PROC(_kern_sysclock, OID_AUTO, active,
235     CTLTYPE_STRING | CTLFLAG_RW | CTLFLAG_NEEDGIANT, 0, 0,
236     sysctl_kern_sysclock_active, "A",
237     "Name of the active system clock which is currently serving time");
238 
239 static int sysctl_kern_ffclock_ffcounter_bypass = 0;
240 SYSCTL_INT(_kern_sysclock_ffclock, OID_AUTO, ffcounter_bypass, CTLFLAG_RW,
241     &sysctl_kern_ffclock_ffcounter_bypass, 0,
242     "Use reliable hardware timecounter as the feed-forward counter");
243 
244 /*
245  * High level functions to access the Feed-Forward Clock.
246  */
247 void
248 ffclock_bintime(struct bintime *bt)
249 {
250 
251 	ffclock_abstime(NULL, bt, NULL, FFCLOCK_LERP | FFCLOCK_LEAPSEC);
252 }
253 
254 void
255 ffclock_nanotime(struct timespec *tsp)
256 {
257 	struct bintime bt;
258 
259 	ffclock_abstime(NULL, &bt, NULL, FFCLOCK_LERP | FFCLOCK_LEAPSEC);
260 	bintime2timespec(&bt, tsp);
261 }
262 
263 void
264 ffclock_microtime(struct timeval *tvp)
265 {
266 	struct bintime bt;
267 
268 	ffclock_abstime(NULL, &bt, NULL, FFCLOCK_LERP | FFCLOCK_LEAPSEC);
269 	bintime2timeval(&bt, tvp);
270 }
271 
272 void
273 ffclock_getbintime(struct bintime *bt)
274 {
275 
276 	ffclock_abstime(NULL, bt, NULL,
277 	    FFCLOCK_LERP | FFCLOCK_LEAPSEC | FFCLOCK_FAST);
278 }
279 
280 void
281 ffclock_getnanotime(struct timespec *tsp)
282 {
283 	struct bintime bt;
284 
285 	ffclock_abstime(NULL, &bt, NULL,
286 	    FFCLOCK_LERP | FFCLOCK_LEAPSEC | FFCLOCK_FAST);
287 	bintime2timespec(&bt, tsp);
288 }
289 
290 void
291 ffclock_getmicrotime(struct timeval *tvp)
292 {
293 	struct bintime bt;
294 
295 	ffclock_abstime(NULL, &bt, NULL,
296 	    FFCLOCK_LERP | FFCLOCK_LEAPSEC | FFCLOCK_FAST);
297 	bintime2timeval(&bt, tvp);
298 }
299 
300 void
301 ffclock_binuptime(struct bintime *bt)
302 {
303 
304 	ffclock_abstime(NULL, bt, NULL, FFCLOCK_LERP | FFCLOCK_UPTIME);
305 }
306 
307 void
308 ffclock_nanouptime(struct timespec *tsp)
309 {
310 	struct bintime bt;
311 
312 	ffclock_abstime(NULL, &bt, NULL, FFCLOCK_LERP | FFCLOCK_UPTIME);
313 	bintime2timespec(&bt, tsp);
314 }
315 
316 void
317 ffclock_microuptime(struct timeval *tvp)
318 {
319 	struct bintime bt;
320 
321 	ffclock_abstime(NULL, &bt, NULL, FFCLOCK_LERP | FFCLOCK_UPTIME);
322 	bintime2timeval(&bt, tvp);
323 }
324 
325 void
326 ffclock_getbinuptime(struct bintime *bt)
327 {
328 
329 	ffclock_abstime(NULL, bt, NULL,
330 	    FFCLOCK_LERP | FFCLOCK_UPTIME | FFCLOCK_FAST);
331 }
332 
333 void
334 ffclock_getnanouptime(struct timespec *tsp)
335 {
336 	struct bintime bt;
337 
338 	ffclock_abstime(NULL, &bt, NULL,
339 	    FFCLOCK_LERP | FFCLOCK_UPTIME | FFCLOCK_FAST);
340 	bintime2timespec(&bt, tsp);
341 }
342 
343 void
344 ffclock_getmicrouptime(struct timeval *tvp)
345 {
346 	struct bintime bt;
347 
348 	ffclock_abstime(NULL, &bt, NULL,
349 	    FFCLOCK_LERP | FFCLOCK_UPTIME | FFCLOCK_FAST);
350 	bintime2timeval(&bt, tvp);
351 }
352 
353 void
354 ffclock_bindifftime(ffcounter ffdelta, struct bintime *bt)
355 {
356 
357 	ffclock_difftime(ffdelta, bt, NULL);
358 }
359 
360 void
361 ffclock_nanodifftime(ffcounter ffdelta, struct timespec *tsp)
362 {
363 	struct bintime bt;
364 
365 	ffclock_difftime(ffdelta, &bt, NULL);
366 	bintime2timespec(&bt, tsp);
367 }
368 
369 void
370 ffclock_microdifftime(ffcounter ffdelta, struct timeval *tvp)
371 {
372 	struct bintime bt;
373 
374 	ffclock_difftime(ffdelta, &bt, NULL);
375 	bintime2timeval(&bt, tvp);
376 }
377 
378 /*
379  * System call allowing userland applications to retrieve the current value of
380  * the Feed-Forward Clock counter.
381  */
382 #ifndef _SYS_SYSPROTO_H_
383 struct ffclock_getcounter_args {
384 	ffcounter *ffcount;
385 };
386 #endif
387 /* ARGSUSED */
388 int
389 sys_ffclock_getcounter(struct thread *td, struct ffclock_getcounter_args *uap)
390 {
391 	ffcounter ffcount;
392 	int error;
393 
394 	ffcount = 0;
395 	ffclock_read_counter(&ffcount);
396 	if (ffcount == 0)
397 		return (EAGAIN);
398 	error = copyout(&ffcount, uap->ffcount, sizeof(ffcounter));
399 
400 	return (error);
401 }
402 
403 /*
404  * System call allowing the synchronisation daemon to push new feed-forward clock
405  * estimates to the kernel. Acquire ffclock_mtx to prevent concurrent updates
406  * and ensure data consistency.
407  * NOTE: ffclock_updated signals the fftimehands that new estimates are
408  * available. The updated estimates are picked up by the fftimehands on next
409  * tick, which could take as long as 1/hz seconds (if ticks are not missed).
410  */
411 #ifndef _SYS_SYSPROTO_H_
412 struct ffclock_setestimate_args {
413 	struct ffclock_estimate *cest;
414 };
415 #endif
416 /* ARGSUSED */
417 int
418 sys_ffclock_setestimate(struct thread *td, struct ffclock_setestimate_args *uap)
419 {
420 	struct ffclock_estimate cest;
421 	int error;
422 
423 	/* Reuse of PRIV_CLOCK_SETTIME. */
424 	if ((error = priv_check(td, PRIV_CLOCK_SETTIME)) != 0)
425 		return (error);
426 
427 	if ((error = copyin(uap->cest, &cest, sizeof(struct ffclock_estimate)))
428 	    != 0)
429 		return (error);
430 
431 	mtx_lock(&ffclock_mtx);
432 	memcpy(&ffclock_estimate, &cest, sizeof(struct ffclock_estimate));
433 	ffclock_updated++;
434 	mtx_unlock(&ffclock_mtx);
435 	return (error);
436 }
437 
438 /*
439  * System call allowing userland applications to retrieve the clock estimates
440  * stored within the kernel. It is useful to kickstart the synchronisation
441  * daemon with the kernel's knowledge of hardware timecounter.
442  */
443 #ifndef _SYS_SYSPROTO_H_
444 struct ffclock_getestimate_args {
445 	struct ffclock_estimate *cest;
446 };
447 #endif
448 /* ARGSUSED */
449 int
450 sys_ffclock_getestimate(struct thread *td, struct ffclock_getestimate_args *uap)
451 {
452 	struct ffclock_estimate cest;
453 	int error;
454 
455 	mtx_lock(&ffclock_mtx);
456 	memcpy(&cest, &ffclock_estimate, sizeof(struct ffclock_estimate));
457 	mtx_unlock(&ffclock_mtx);
458 	error = copyout(&cest, uap->cest, sizeof(struct ffclock_estimate));
459 	return (error);
460 }
461 
462 #else /* !FFCLOCK */
463 
/*
 * Stub used when the kernel is built without FFCLOCK: there is no
 * feed-forward counter to read, so the call always fails with ENOSYS.
 */
int
sys_ffclock_getcounter(struct thread *td, struct ffclock_getcounter_args *uap)
{
	return (ENOSYS);
}
470 
/*
 * Stub used when the kernel is built without FFCLOCK: there is no estimate
 * to update, so the call always fails with ENOSYS.
 */
int
sys_ffclock_setestimate(struct thread *td, struct ffclock_setestimate_args *uap)
{
	return (ENOSYS);
}
477 
/*
 * Stub used when the kernel is built without FFCLOCK: there is no estimate
 * to report, so the call always fails with ENOSYS.
 */
int
sys_ffclock_getestimate(struct thread *td, struct ffclock_getestimate_args *uap)
{
	return (ENOSYS);
}
484 
485 #endif /* FFCLOCK */
486