1af93fea7SJake Freeland /*- 2af93fea7SJake Freeland * SPDX-License-Identifier: BSD-2-Clause 3af93fea7SJake Freeland * 4af93fea7SJake Freeland * Copyright (c) 2014 Dmitry Chagin <dchagin@FreeBSD.org> 5af93fea7SJake Freeland * Copyright (c) 2023 Jake Freeland <jfree@FreeBSD.org> 6af93fea7SJake Freeland * 7af93fea7SJake Freeland * Redistribution and use in source and binary forms, with or without 8af93fea7SJake Freeland * modification, are permitted provided that the following conditions 9af93fea7SJake Freeland * are met: 10af93fea7SJake Freeland * 1. Redistributions of source code must retain the above copyright 11af93fea7SJake Freeland * notice, this list of conditions and the following disclaimer. 12af93fea7SJake Freeland * 2. Redistributions in binary form must reproduce the above copyright 13af93fea7SJake Freeland * notice, this list of conditions and the following disclaimer in the 14af93fea7SJake Freeland * documentation and/or other materials provided with the distribution. 15af93fea7SJake Freeland * 16af93fea7SJake Freeland * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND 17af93fea7SJake Freeland * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 18af93fea7SJake Freeland * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 19af93fea7SJake Freeland * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE 20af93fea7SJake Freeland * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 21af93fea7SJake Freeland * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 22af93fea7SJake Freeland * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 23af93fea7SJake Freeland * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 24af93fea7SJake Freeland * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 25af93fea7SJake Freeland * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 26af93fea7SJake Freeland * SUCH DAMAGE. 27af93fea7SJake Freeland */ 28af93fea7SJake Freeland 29af93fea7SJake Freeland #include <sys/param.h> 30af93fea7SJake Freeland #include <sys/systm.h> 31af93fea7SJake Freeland #include <sys/callout.h> 32af93fea7SJake Freeland #include <sys/fcntl.h> 33af93fea7SJake Freeland #include <sys/file.h> 34af93fea7SJake Freeland #include <sys/filedesc.h> 35af93fea7SJake Freeland #include <sys/filio.h> 36af93fea7SJake Freeland #include <sys/kernel.h> 37af93fea7SJake Freeland #include <sys/lock.h> 38af93fea7SJake Freeland #include <sys/malloc.h> 39af93fea7SJake Freeland #include <sys/mount.h> 40af93fea7SJake Freeland #include <sys/mutex.h> 41af93fea7SJake Freeland #include <sys/poll.h> 42af93fea7SJake Freeland #include <sys/proc.h> 43af93fea7SJake Freeland #include <sys/queue.h> 44af93fea7SJake Freeland #include <sys/selinfo.h> 45af93fea7SJake Freeland #include <sys/stat.h> 4602f534b5SMateusz Guzik #include <sys/sx.h> 47af93fea7SJake Freeland #include <sys/sysctl.h> 48af93fea7SJake Freeland #include <sys/sysent.h> 49af93fea7SJake Freeland #include <sys/sysproto.h> 50af93fea7SJake Freeland #include <sys/timerfd.h> 51af93fea7SJake Freeland #include <sys/timespec.h> 52af93fea7SJake Freeland #include <sys/uio.h> 53af93fea7SJake Freeland #include <sys/user.h> 54af93fea7SJake Freeland 55af93fea7SJake Freeland #include <security/audit/audit.h> 56af93fea7SJake Freeland 57af93fea7SJake Freeland static MALLOC_DEFINE(M_TIMERFD, "timerfd", "timerfd structures"); 5802f534b5SMateusz Guzik 59f4296cfbSMateusz Guzik static struct mtx timerfd_list_lock; 6002f534b5SMateusz Guzik static LIST_HEAD(, timerfd) timerfd_list; 61f4296cfbSMateusz Guzik MTX_SYSINIT(timerfd, &timerfd_list_lock, "timerfd_list_lock", MTX_DEF); 6202f534b5SMateusz Guzik 63af93fea7SJake Freeland static struct unrhdr64 tfdino_unr; 64af93fea7SJake Freeland 65af93fea7SJake Freeland #define TFD_NOJUMP 0 /* Realtime clock has not jumped. */ 66af93fea7SJake Freeland #define TFD_READ 1 /* Jumped, tfd has been read since. */ 67af93fea7SJake Freeland #define TFD_ZREAD 2 /* Jumped backwards, CANCEL_ON_SET=false. */ 68af93fea7SJake Freeland #define TFD_CANCELED 4 /* Jumped, CANCEL_ON_SET=true. */ 69af93fea7SJake Freeland #define TFD_JUMPED (TFD_ZREAD | TFD_CANCELED) 70af93fea7SJake Freeland 71a1f50615SJake Freeland /* 72a1f50615SJake Freeland * One structure allocated per timerfd descriptor. 73a1f50615SJake Freeland * 74a1f50615SJake Freeland * Locking semantics: 75a1f50615SJake Freeland * (t) locked by tfd_lock mtx 76a1f50615SJake Freeland * (l) locked by timerfd_list_lock sx 77a1f50615SJake Freeland * (c) const until freeing 78a1f50615SJake Freeland */ 79af93fea7SJake Freeland struct timerfd { 80af93fea7SJake Freeland /* User specified. */ 81a1f50615SJake Freeland struct itimerspec tfd_time; /* (t) tfd timer */ 82a1f50615SJake Freeland clockid_t tfd_clockid; /* (c) timing base */ 83a1f50615SJake Freeland int tfd_flags; /* (c) creation flags */ 84a1f50615SJake Freeland int tfd_timflags; /* (t) timer flags */ 85af93fea7SJake Freeland 86af93fea7SJake Freeland /* Used internally. */ 87a1f50615SJake Freeland timerfd_t tfd_count; /* (t) expiration count since read */ 88a1f50615SJake Freeland bool tfd_expired; /* (t) true upon initial expiration */ 89a1f50615SJake Freeland struct mtx tfd_lock; /* tfd mtx lock */ 90a1f50615SJake Freeland struct callout tfd_callout; /* (t) expiration notification */ 91a1f50615SJake Freeland struct selinfo tfd_sel; /* (t) I/O alerts */ 92a1f50615SJake Freeland struct timespec tfd_boottim; /* (t) cached boottime */ 93a1f50615SJake Freeland int tfd_jumped; /* (t) timer jump status */ 94a1f50615SJake Freeland LIST_ENTRY(timerfd) entry; /* (l) entry in list */ 95af93fea7SJake Freeland 96af93fea7SJake Freeland /* For stat(2). */ 97a1f50615SJake Freeland ino_t tfd_ino; /* (c) inode number */ 98a1f50615SJake Freeland struct timespec tfd_atim; /* (t) time of last read */ 99a1f50615SJake Freeland struct timespec tfd_mtim; /* (t) time of last settime */ 100a1f50615SJake Freeland struct timespec tfd_birthtim; /* (c) creation time */ 101af93fea7SJake Freeland }; 102af93fea7SJake Freeland 103af93fea7SJake Freeland static void 104af93fea7SJake Freeland timerfd_init(void *data) 105af93fea7SJake Freeland { 106af93fea7SJake Freeland new_unrhdr64(&tfdino_unr, 1); 107af93fea7SJake Freeland } 108af93fea7SJake Freeland 109af93fea7SJake Freeland SYSINIT(timerfd, SI_SUB_VFS, SI_ORDER_ANY, timerfd_init, NULL); 110af93fea7SJake Freeland 111af93fea7SJake Freeland static inline void 112af93fea7SJake Freeland timerfd_getboottime(struct timespec *ts) 113af93fea7SJake Freeland { 114af93fea7SJake Freeland struct timeval tv; 115a1f50615SJake Freeland 116af93fea7SJake Freeland getboottime(&tv); 117af93fea7SJake Freeland TIMEVAL_TO_TIMESPEC(&tv, ts); 118af93fea7SJake Freeland } 119af93fea7SJake Freeland 120af93fea7SJake Freeland /* 121af93fea7SJake Freeland * Call when a discontinuous jump has occured in CLOCK_REALTIME and 122af93fea7SJake Freeland * update timerfd's cached boottime. A jump can be triggered using 123af93fea7SJake Freeland * functions like clock_settime(2) or settimeofday(2). 124af93fea7SJake Freeland * 125af93fea7SJake Freeland * Timer is marked TFD_CANCELED if TFD_TIMER_CANCEL_ON_SET is set 126af93fea7SJake Freeland * and the realtime clock jumps. 127af93fea7SJake Freeland * Timer is marked TFD_ZREAD if TFD_TIMER_CANCEL_ON_SET is not set, 128af93fea7SJake Freeland * but the realtime clock jumps backwards. 129af93fea7SJake Freeland */ 130af93fea7SJake Freeland void 131af93fea7SJake Freeland timerfd_jumped(void) 132af93fea7SJake Freeland { 133af93fea7SJake Freeland struct timerfd *tfd; 134af93fea7SJake Freeland struct timespec boottime, diff; 135af93fea7SJake Freeland 1365eab5230SMateusz Guzik if (LIST_EMPTY(&timerfd_list)) 1375eab5230SMateusz Guzik return; 1385eab5230SMateusz Guzik 139af93fea7SJake Freeland timerfd_getboottime(&boottime); 140f4296cfbSMateusz Guzik mtx_lock(&timerfd_list_lock); 14102f534b5SMateusz Guzik LIST_FOREACH(tfd, &timerfd_list, entry) { 142af93fea7SJake Freeland mtx_lock(&tfd->tfd_lock); 143af93fea7SJake Freeland if (tfd->tfd_clockid != CLOCK_REALTIME || 144af93fea7SJake Freeland (tfd->tfd_timflags & TFD_TIMER_ABSTIME) == 0 || 145af93fea7SJake Freeland timespeccmp(&boottime, &tfd->tfd_boottim, ==)) { 146af93fea7SJake Freeland mtx_unlock(&tfd->tfd_lock); 147af93fea7SJake Freeland continue; 148af93fea7SJake Freeland } 149af93fea7SJake Freeland 150af93fea7SJake Freeland if (callout_active(&tfd->tfd_callout)) { 151af93fea7SJake Freeland if ((tfd->tfd_timflags & TFD_TIMER_CANCEL_ON_SET) != 0) 152af93fea7SJake Freeland tfd->tfd_jumped = TFD_CANCELED; 153af93fea7SJake Freeland else if (timespeccmp(&boottime, &tfd->tfd_boottim, <)) 154af93fea7SJake Freeland tfd->tfd_jumped = TFD_ZREAD; 155af93fea7SJake Freeland 156af93fea7SJake Freeland /* 157af93fea7SJake Freeland * Do not reschedule callout when 158af93fea7SJake Freeland * inside interval time loop. 159af93fea7SJake Freeland */ 160af93fea7SJake Freeland if (!tfd->tfd_expired) { 161af93fea7SJake Freeland timespecsub(&boottime, 162af93fea7SJake Freeland &tfd->tfd_boottim, &diff); 163af93fea7SJake Freeland timespecsub(&tfd->tfd_time.it_value, 164af93fea7SJake Freeland &diff, &tfd->tfd_time.it_value); 165af93fea7SJake Freeland if (callout_stop(&tfd->tfd_callout) == 1) { 166af93fea7SJake Freeland callout_schedule_sbt(&tfd->tfd_callout, 167af93fea7SJake Freeland tstosbt(tfd->tfd_time.it_value), 168af93fea7SJake Freeland 0, C_ABSOLUTE); 169af93fea7SJake Freeland } 170af93fea7SJake Freeland } 171af93fea7SJake Freeland } 172af93fea7SJake Freeland 173af93fea7SJake Freeland tfd->tfd_boottim = boottime; 174af93fea7SJake Freeland mtx_unlock(&tfd->tfd_lock); 175af93fea7SJake Freeland } 176f4296cfbSMateusz Guzik mtx_unlock(&timerfd_list_lock); 177af93fea7SJake Freeland } 178af93fea7SJake Freeland 179af93fea7SJake Freeland static int 180af93fea7SJake Freeland timerfd_read(struct file *fp, struct uio *uio, struct ucred *active_cred, 181af93fea7SJake Freeland int flags, struct thread *td) 182af93fea7SJake Freeland { 183af93fea7SJake Freeland struct timerfd *tfd = fp->f_data; 184af93fea7SJake Freeland timerfd_t count; 185af93fea7SJake Freeland int error = 0; 186af93fea7SJake Freeland 187af93fea7SJake Freeland if (uio->uio_resid < sizeof(timerfd_t)) 188af93fea7SJake Freeland return (EINVAL); 189af93fea7SJake Freeland 190af93fea7SJake Freeland mtx_lock(&tfd->tfd_lock); 191af93fea7SJake Freeland retry: 192af93fea7SJake Freeland getnanotime(&tfd->tfd_atim); 193af93fea7SJake Freeland if ((tfd->tfd_jumped & TFD_JUMPED) != 0) { 194af93fea7SJake Freeland if (tfd->tfd_jumped == TFD_CANCELED) 195af93fea7SJake Freeland error = ECANCELED; 196af93fea7SJake Freeland tfd->tfd_jumped = TFD_READ; 197af93fea7SJake Freeland tfd->tfd_count = 0; 198af93fea7SJake Freeland mtx_unlock(&tfd->tfd_lock); 199af93fea7SJake Freeland return (error); 200af93fea7SJake Freeland } else { 201af93fea7SJake Freeland tfd->tfd_jumped = TFD_NOJUMP; 202af93fea7SJake Freeland } 203af93fea7SJake Freeland if (tfd->tfd_count == 0) { 204af93fea7SJake Freeland if ((fp->f_flag & FNONBLOCK) != 0) { 205af93fea7SJake Freeland mtx_unlock(&tfd->tfd_lock); 206af93fea7SJake Freeland return (EAGAIN); 207af93fea7SJake Freeland } 208af93fea7SJake Freeland td->td_rtcgen = atomic_load_acq_int(&rtc_generation); 209af93fea7SJake Freeland error = mtx_sleep(&tfd->tfd_count, &tfd->tfd_lock, 210af93fea7SJake Freeland PCATCH, "tfdrd", 0); 211af93fea7SJake Freeland if (error == 0) { 212af93fea7SJake Freeland goto retry; 213af93fea7SJake Freeland } else { 214af93fea7SJake Freeland mtx_unlock(&tfd->tfd_lock); 215af93fea7SJake Freeland return (error); 216af93fea7SJake Freeland } 217af93fea7SJake Freeland } 218af93fea7SJake Freeland 219af93fea7SJake Freeland count = tfd->tfd_count; 220af93fea7SJake Freeland tfd->tfd_count = 0; 221af93fea7SJake Freeland mtx_unlock(&tfd->tfd_lock); 222af93fea7SJake Freeland error = uiomove(&count, sizeof(timerfd_t), uio); 223af93fea7SJake Freeland 224af93fea7SJake Freeland return (error); 225af93fea7SJake Freeland } 226af93fea7SJake Freeland 227af93fea7SJake Freeland static int 228af93fea7SJake Freeland timerfd_ioctl(struct file *fp, u_long cmd, void *data, 229af93fea7SJake Freeland struct ucred *active_cred, struct thread *td) 230af93fea7SJake Freeland { 231af93fea7SJake Freeland switch (cmd) { 232af93fea7SJake Freeland case FIOASYNC: 233af93fea7SJake Freeland if (*(int *)data != 0) 234af93fea7SJake Freeland atomic_set_int(&fp->f_flag, FASYNC); 235af93fea7SJake Freeland else 236af93fea7SJake Freeland atomic_clear_int(&fp->f_flag, FASYNC); 237af93fea7SJake Freeland return (0); 238af93fea7SJake Freeland case FIONBIO: 239af93fea7SJake Freeland if (*(int *)data != 0) 240af93fea7SJake Freeland atomic_set_int(&fp->f_flag, FNONBLOCK); 241af93fea7SJake Freeland else 242af93fea7SJake Freeland atomic_clear_int(&fp->f_flag, FNONBLOCK); 243af93fea7SJake Freeland return (0); 244af93fea7SJake Freeland } 245af93fea7SJake Freeland return (ENOTTY); 246af93fea7SJake Freeland } 247af93fea7SJake Freeland 248af93fea7SJake Freeland static int 249af93fea7SJake Freeland timerfd_poll(struct file *fp, int events, struct ucred *active_cred, 250af93fea7SJake Freeland struct thread *td) 251af93fea7SJake Freeland { 252af93fea7SJake Freeland struct timerfd *tfd = fp->f_data; 253af93fea7SJake Freeland int revents = 0; 254af93fea7SJake Freeland 255af93fea7SJake Freeland mtx_lock(&tfd->tfd_lock); 256af93fea7SJake Freeland if ((events & (POLLIN | POLLRDNORM)) != 0 && 257af93fea7SJake Freeland tfd->tfd_count > 0 && tfd->tfd_jumped != TFD_READ) 258af93fea7SJake Freeland revents |= events & (POLLIN | POLLRDNORM); 259af93fea7SJake Freeland if (revents == 0) 260af93fea7SJake Freeland selrecord(td, &tfd->tfd_sel); 261af93fea7SJake Freeland mtx_unlock(&tfd->tfd_lock); 262af93fea7SJake Freeland 263af93fea7SJake Freeland return (revents); 264af93fea7SJake Freeland } 265af93fea7SJake Freeland 266af93fea7SJake Freeland static void 267af93fea7SJake Freeland filt_timerfddetach(struct knote *kn) 268af93fea7SJake Freeland { 269af93fea7SJake Freeland struct timerfd *tfd = kn->kn_hook; 270af93fea7SJake Freeland 271af93fea7SJake Freeland mtx_lock(&tfd->tfd_lock); 272af93fea7SJake Freeland knlist_remove(&tfd->tfd_sel.si_note, kn, 1); 273af93fea7SJake Freeland mtx_unlock(&tfd->tfd_lock); 274af93fea7SJake Freeland } 275af93fea7SJake Freeland 276af93fea7SJake Freeland static int 277af93fea7SJake Freeland filt_timerfdread(struct knote *kn, long hint) 278af93fea7SJake Freeland { 279af93fea7SJake Freeland struct timerfd *tfd = kn->kn_hook; 280af93fea7SJake Freeland 281a1f50615SJake Freeland mtx_assert(&tfd->tfd_lock, MA_OWNED); 282a1f50615SJake Freeland kn->kn_data = (int64_t)tfd->tfd_count; 283af93fea7SJake Freeland return (tfd->tfd_count > 0); 284af93fea7SJake Freeland } 285af93fea7SJake Freeland 286af93fea7SJake Freeland static struct filterops timerfd_rfiltops = { 287af93fea7SJake Freeland .f_isfd = 1, 288af93fea7SJake Freeland .f_detach = filt_timerfddetach, 289af93fea7SJake Freeland .f_event = filt_timerfdread, 290af93fea7SJake Freeland }; 291af93fea7SJake Freeland 292af93fea7SJake Freeland static int 293af93fea7SJake Freeland timerfd_kqfilter(struct file *fp, struct knote *kn) 294af93fea7SJake Freeland { 295af93fea7SJake Freeland struct timerfd *tfd = fp->f_data; 296af93fea7SJake Freeland 297af93fea7SJake Freeland if (kn->kn_filter != EVFILT_READ) 298af93fea7SJake Freeland return (EINVAL); 299af93fea7SJake Freeland 300af93fea7SJake Freeland kn->kn_fop = &timerfd_rfiltops; 301af93fea7SJake Freeland kn->kn_hook = tfd; 302af93fea7SJake Freeland knlist_add(&tfd->tfd_sel.si_note, kn, 0); 303af93fea7SJake Freeland 304af93fea7SJake Freeland return (0); 305af93fea7SJake Freeland } 306af93fea7SJake Freeland 307af93fea7SJake Freeland static int 308af93fea7SJake Freeland timerfd_stat(struct file *fp, struct stat *sb, struct ucred *active_cred) 309af93fea7SJake Freeland { 310af93fea7SJake Freeland struct timerfd *tfd = fp->f_data; 311af93fea7SJake Freeland 312af93fea7SJake Freeland bzero(sb, sizeof(*sb)); 313af93fea7SJake Freeland sb->st_nlink = fp->f_count - 1; 314af93fea7SJake Freeland sb->st_uid = fp->f_cred->cr_uid; 315af93fea7SJake Freeland sb->st_gid = fp->f_cred->cr_gid; 316af93fea7SJake Freeland sb->st_blksize = PAGE_SIZE; 317af93fea7SJake Freeland mtx_lock(&tfd->tfd_lock); 318af93fea7SJake Freeland sb->st_atim = tfd->tfd_atim; 319af93fea7SJake Freeland sb->st_mtim = tfd->tfd_mtim; 320af93fea7SJake Freeland mtx_unlock(&tfd->tfd_lock); 321a1f50615SJake Freeland sb->st_ctim = sb->st_mtim; 322a1f50615SJake Freeland sb->st_ino = tfd->tfd_ino; 323a1f50615SJake Freeland sb->st_birthtim = tfd->tfd_birthtim; 324af93fea7SJake Freeland 325af93fea7SJake Freeland return (0); 326af93fea7SJake Freeland } 327af93fea7SJake Freeland 328af93fea7SJake Freeland static int 329af93fea7SJake Freeland timerfd_close(struct file *fp, struct thread *td) 330af93fea7SJake Freeland { 331af93fea7SJake Freeland struct timerfd *tfd = fp->f_data; 332af93fea7SJake Freeland 333f4296cfbSMateusz Guzik mtx_lock(&timerfd_list_lock); 33402f534b5SMateusz Guzik LIST_REMOVE(tfd, entry); 335f4296cfbSMateusz Guzik mtx_unlock(&timerfd_list_lock); 33602f534b5SMateusz Guzik 337af93fea7SJake Freeland callout_drain(&tfd->tfd_callout); 338af93fea7SJake Freeland seldrain(&tfd->tfd_sel); 339af93fea7SJake Freeland knlist_destroy(&tfd->tfd_sel.si_note); 340af93fea7SJake Freeland mtx_destroy(&tfd->tfd_lock); 341af93fea7SJake Freeland free(tfd, M_TIMERFD); 342af93fea7SJake Freeland fp->f_ops = &badfileops; 343af93fea7SJake Freeland 344af93fea7SJake Freeland return (0); 345af93fea7SJake Freeland } 346af93fea7SJake Freeland 347af93fea7SJake Freeland static int 348af93fea7SJake Freeland timerfd_fill_kinfo(struct file *fp, struct kinfo_file *kif, 349af93fea7SJake Freeland struct filedesc *fdp) 350af93fea7SJake Freeland { 351af93fea7SJake Freeland struct timerfd *tfd = fp->f_data; 352af93fea7SJake Freeland 353af93fea7SJake Freeland kif->kf_type = KF_TYPE_TIMERFD; 354af93fea7SJake Freeland kif->kf_un.kf_timerfd.kf_timerfd_clockid = tfd->tfd_clockid; 355af93fea7SJake Freeland kif->kf_un.kf_timerfd.kf_timerfd_flags = tfd->tfd_flags; 356af93fea7SJake Freeland kif->kf_un.kf_timerfd.kf_timerfd_addr = (uintptr_t)tfd; 357af93fea7SJake Freeland 358af93fea7SJake Freeland return (0); 359af93fea7SJake Freeland } 360af93fea7SJake Freeland 361af93fea7SJake Freeland static struct fileops timerfdops = { 362af93fea7SJake Freeland .fo_read = timerfd_read, 363af93fea7SJake Freeland .fo_write = invfo_rdwr, 364af93fea7SJake Freeland .fo_truncate = invfo_truncate, 365af93fea7SJake Freeland .fo_ioctl = timerfd_ioctl, 366af93fea7SJake Freeland .fo_poll = timerfd_poll, 367af93fea7SJake Freeland .fo_kqfilter = timerfd_kqfilter, 368af93fea7SJake Freeland .fo_stat = timerfd_stat, 369af93fea7SJake Freeland .fo_close = timerfd_close, 370af93fea7SJake Freeland .fo_chmod = invfo_chmod, 371af93fea7SJake Freeland .fo_chown = invfo_chown, 372af93fea7SJake Freeland .fo_sendfile = invfo_sendfile, 373af93fea7SJake Freeland .fo_fill_kinfo = timerfd_fill_kinfo, 374*f28526e9SKonstantin Belousov .fo_cmp = file_kcmp_generic, 375af93fea7SJake Freeland .fo_flags = DFLAG_PASSABLE, 376af93fea7SJake Freeland }; 377af93fea7SJake Freeland 378af93fea7SJake Freeland static void 379af93fea7SJake Freeland timerfd_curval(struct timerfd *tfd, struct itimerspec *old_value) 380af93fea7SJake Freeland { 381af93fea7SJake Freeland struct timespec curr_value; 382af93fea7SJake Freeland 383a1f50615SJake Freeland mtx_assert(&tfd->tfd_lock, MA_OWNED); 384af93fea7SJake Freeland *old_value = tfd->tfd_time; 385af93fea7SJake Freeland if (timespecisset(&tfd->tfd_time.it_value)) { 386af93fea7SJake Freeland nanouptime(&curr_value); 387af93fea7SJake Freeland timespecsub(&tfd->tfd_time.it_value, &curr_value, 388af93fea7SJake Freeland &old_value->it_value); 389af93fea7SJake Freeland } 390af93fea7SJake Freeland } 391af93fea7SJake Freeland 392af93fea7SJake Freeland static void 393af93fea7SJake Freeland timerfd_expire(void *arg) 394af93fea7SJake Freeland { 395af93fea7SJake Freeland struct timerfd *tfd = (struct timerfd *)arg; 396af93fea7SJake Freeland struct timespec uptime; 397af93fea7SJake Freeland 398af93fea7SJake Freeland ++tfd->tfd_count; 399af93fea7SJake Freeland tfd->tfd_expired = true; 400af93fea7SJake Freeland if (timespecisset(&tfd->tfd_time.it_interval)) { 401af93fea7SJake Freeland /* Count missed events. */ 402af93fea7SJake Freeland nanouptime(&uptime); 403af93fea7SJake Freeland if (timespeccmp(&uptime, &tfd->tfd_time.it_value, >)) { 404af93fea7SJake Freeland timespecsub(&uptime, &tfd->tfd_time.it_value, &uptime); 405af93fea7SJake Freeland tfd->tfd_count += tstosbt(uptime) / 406af93fea7SJake Freeland tstosbt(tfd->tfd_time.it_interval); 407af93fea7SJake Freeland } 408af93fea7SJake Freeland timespecadd(&tfd->tfd_time.it_value, 409af93fea7SJake Freeland &tfd->tfd_time.it_interval, &tfd->tfd_time.it_value); 410af93fea7SJake Freeland callout_schedule_sbt(&tfd->tfd_callout, 411af93fea7SJake Freeland tstosbt(tfd->tfd_time.it_value), 412af93fea7SJake Freeland 0, C_ABSOLUTE); 413af93fea7SJake Freeland } else { 414af93fea7SJake Freeland /* Single shot timer. */ 415af93fea7SJake Freeland callout_deactivate(&tfd->tfd_callout); 416af93fea7SJake Freeland timespecclear(&tfd->tfd_time.it_value); 417af93fea7SJake Freeland } 418af93fea7SJake Freeland 419af93fea7SJake Freeland wakeup(&tfd->tfd_count); 420af93fea7SJake Freeland selwakeup(&tfd->tfd_sel); 421af93fea7SJake Freeland KNOTE_LOCKED(&tfd->tfd_sel.si_note, 0); 422af93fea7SJake Freeland } 423af93fea7SJake Freeland 424af93fea7SJake Freeland int 425af93fea7SJake Freeland kern_timerfd_create(struct thread *td, int clockid, int flags) 426af93fea7SJake Freeland { 427af93fea7SJake Freeland struct file *fp; 428af93fea7SJake Freeland struct timerfd *tfd; 4295eab5230SMateusz Guzik int error, fd, fflags; 430af93fea7SJake Freeland 431af93fea7SJake Freeland AUDIT_ARG_VALUE(clockid); 432af93fea7SJake Freeland AUDIT_ARG_FFLAGS(flags); 433af93fea7SJake Freeland 434af93fea7SJake Freeland if (clockid != CLOCK_REALTIME && clockid != CLOCK_MONOTONIC) 435af93fea7SJake Freeland return (EINVAL); 436af93fea7SJake Freeland if ((flags & ~(TFD_CLOEXEC | TFD_NONBLOCK)) != 0) 437af93fea7SJake Freeland return (EINVAL); 4385eab5230SMateusz Guzik 4395eab5230SMateusz Guzik fflags = FREAD; 440af93fea7SJake Freeland if ((flags & TFD_CLOEXEC) != 0) 441af93fea7SJake Freeland fflags |= O_CLOEXEC; 4425eab5230SMateusz Guzik if ((flags & TFD_NONBLOCK) != 0) 4435eab5230SMateusz Guzik fflags |= FNONBLOCK; 444af93fea7SJake Freeland 44502f534b5SMateusz Guzik error = falloc(td, &fp, &fd, fflags); 44602f534b5SMateusz Guzik if (error != 0) 44702f534b5SMateusz Guzik return (error); 44802f534b5SMateusz Guzik 449af93fea7SJake Freeland tfd = malloc(sizeof(*tfd), M_TIMERFD, M_WAITOK | M_ZERO); 450af93fea7SJake Freeland tfd->tfd_clockid = (clockid_t)clockid; 451af93fea7SJake Freeland tfd->tfd_flags = flags; 452af93fea7SJake Freeland tfd->tfd_ino = alloc_unr64(&tfdino_unr); 453af93fea7SJake Freeland mtx_init(&tfd->tfd_lock, "timerfd", NULL, MTX_DEF); 454af93fea7SJake Freeland callout_init_mtx(&tfd->tfd_callout, &tfd->tfd_lock, 0); 455af93fea7SJake Freeland knlist_init_mtx(&tfd->tfd_sel.si_note, &tfd->tfd_lock); 456af93fea7SJake Freeland timerfd_getboottime(&tfd->tfd_boottim); 457af93fea7SJake Freeland getnanotime(&tfd->tfd_birthtim); 458f4296cfbSMateusz Guzik mtx_lock(&timerfd_list_lock); 45902f534b5SMateusz Guzik LIST_INSERT_HEAD(&timerfd_list, tfd, entry); 460f4296cfbSMateusz Guzik mtx_unlock(&timerfd_list_lock); 461af93fea7SJake Freeland 462af93fea7SJake Freeland finit(fp, fflags, DTYPE_TIMERFD, tfd, &timerfdops); 46302f534b5SMateusz Guzik 464af93fea7SJake Freeland fdrop(fp, td); 465af93fea7SJake Freeland 466af93fea7SJake Freeland td->td_retval[0] = fd; 467af93fea7SJake Freeland return (0); 468af93fea7SJake Freeland } 469af93fea7SJake Freeland 470af93fea7SJake Freeland int 471af93fea7SJake Freeland kern_timerfd_gettime(struct thread *td, int fd, struct itimerspec *curr_value) 472af93fea7SJake Freeland { 473af93fea7SJake Freeland struct file *fp; 474af93fea7SJake Freeland struct timerfd *tfd; 475af93fea7SJake Freeland int error; 476af93fea7SJake Freeland 477af93fea7SJake Freeland error = fget(td, fd, &cap_write_rights, &fp); 478af93fea7SJake Freeland if (error != 0) 479af93fea7SJake Freeland return (error); 480a1f50615SJake Freeland if (fp->f_type != DTYPE_TIMERFD) { 481af93fea7SJake Freeland fdrop(fp, td); 482af93fea7SJake Freeland return (EINVAL); 483af93fea7SJake Freeland } 484a1f50615SJake Freeland tfd = fp->f_data; 485af93fea7SJake Freeland 486af93fea7SJake Freeland mtx_lock(&tfd->tfd_lock); 487af93fea7SJake Freeland timerfd_curval(tfd, curr_value); 488af93fea7SJake Freeland mtx_unlock(&tfd->tfd_lock); 489af93fea7SJake Freeland 490af93fea7SJake Freeland fdrop(fp, td); 491af93fea7SJake Freeland return (0); 492af93fea7SJake Freeland } 493af93fea7SJake Freeland 494af93fea7SJake Freeland int 495af93fea7SJake Freeland kern_timerfd_settime(struct thread *td, int fd, int flags, 496af93fea7SJake Freeland const struct itimerspec *new_value, struct itimerspec *old_value) 497af93fea7SJake Freeland { 498af93fea7SJake Freeland struct file *fp; 499af93fea7SJake Freeland struct timerfd *tfd; 500af93fea7SJake Freeland struct timespec ts; 501af93fea7SJake Freeland int error = 0; 502af93fea7SJake Freeland 503af93fea7SJake Freeland if ((flags & ~(TFD_TIMER_ABSTIME | TFD_TIMER_CANCEL_ON_SET)) != 0) 504af93fea7SJake Freeland return (EINVAL); 505af93fea7SJake Freeland if (!timespecvalid_interval(&new_value->it_value) || 506af93fea7SJake Freeland !timespecvalid_interval(&new_value->it_interval)) 507af93fea7SJake Freeland return (EINVAL); 508af93fea7SJake Freeland 509af93fea7SJake Freeland error = fget(td, fd, &cap_write_rights, &fp); 510af93fea7SJake Freeland if (error != 0) 511af93fea7SJake Freeland return (error); 512a1f50615SJake Freeland if (fp->f_type != DTYPE_TIMERFD) { 513af93fea7SJake Freeland fdrop(fp, td); 514af93fea7SJake Freeland return (EINVAL); 515af93fea7SJake Freeland } 516a1f50615SJake Freeland tfd = fp->f_data; 517af93fea7SJake Freeland 518af93fea7SJake Freeland mtx_lock(&tfd->tfd_lock); 519af93fea7SJake Freeland getnanotime(&tfd->tfd_mtim); 520af93fea7SJake Freeland tfd->tfd_timflags = flags; 521af93fea7SJake Freeland 522af93fea7SJake Freeland /* Store old itimerspec, if applicable. */ 523af93fea7SJake Freeland if (old_value != NULL) 524af93fea7SJake Freeland timerfd_curval(tfd, old_value); 525af93fea7SJake Freeland 526af93fea7SJake Freeland /* Set new expiration. */ 527af93fea7SJake Freeland tfd->tfd_time = *new_value; 528af93fea7SJake Freeland if (timespecisset(&tfd->tfd_time.it_value)) { 529af93fea7SJake Freeland if ((flags & TFD_TIMER_ABSTIME) == 0) { 530af93fea7SJake Freeland nanouptime(&ts); 531af93fea7SJake Freeland timespecadd(&tfd->tfd_time.it_value, &ts, 532af93fea7SJake Freeland &tfd->tfd_time.it_value); 533af93fea7SJake Freeland } else if (tfd->tfd_clockid == CLOCK_REALTIME) { 534af93fea7SJake Freeland /* ECANCELED if unread jump is pending. */ 535af93fea7SJake Freeland if (tfd->tfd_jumped == TFD_CANCELED) 536af93fea7SJake Freeland error = ECANCELED; 537af93fea7SJake Freeland /* Convert from CLOCK_REALTIME to CLOCK_BOOTTIME. */ 538af93fea7SJake Freeland timespecsub(&tfd->tfd_time.it_value, &tfd->tfd_boottim, 539af93fea7SJake Freeland &tfd->tfd_time.it_value); 540af93fea7SJake Freeland } 541af93fea7SJake Freeland callout_reset_sbt(&tfd->tfd_callout, 542af93fea7SJake Freeland tstosbt(tfd->tfd_time.it_value), 543af93fea7SJake Freeland 0, timerfd_expire, tfd, C_ABSOLUTE); 544af93fea7SJake Freeland } else { 545af93fea7SJake Freeland callout_stop(&tfd->tfd_callout); 546af93fea7SJake Freeland } 547af93fea7SJake Freeland tfd->tfd_count = 0; 548af93fea7SJake Freeland tfd->tfd_expired = false; 549af93fea7SJake Freeland tfd->tfd_jumped = TFD_NOJUMP; 550af93fea7SJake Freeland mtx_unlock(&tfd->tfd_lock); 551af93fea7SJake Freeland 552af93fea7SJake Freeland fdrop(fp, td); 553af93fea7SJake Freeland return (error); 554af93fea7SJake Freeland } 555af93fea7SJake Freeland 556af93fea7SJake Freeland int 557af93fea7SJake Freeland sys_timerfd_create(struct thread *td, struct timerfd_create_args *uap) 558af93fea7SJake Freeland { 559af93fea7SJake Freeland return (kern_timerfd_create(td, uap->clockid, uap->flags)); 560af93fea7SJake Freeland } 561af93fea7SJake Freeland 562af93fea7SJake Freeland int 563af93fea7SJake Freeland sys_timerfd_gettime(struct thread *td, struct timerfd_gettime_args *uap) 564af93fea7SJake Freeland { 565af93fea7SJake Freeland struct itimerspec curr_value; 566af93fea7SJake Freeland int error; 567af93fea7SJake Freeland 568af93fea7SJake Freeland error = kern_timerfd_gettime(td, uap->fd, &curr_value); 569af93fea7SJake Freeland if (error == 0) 570af93fea7SJake Freeland error = copyout(&curr_value, uap->curr_value, 571af93fea7SJake Freeland sizeof(curr_value)); 572af93fea7SJake Freeland 573af93fea7SJake Freeland return (error); 574af93fea7SJake Freeland } 575af93fea7SJake Freeland 576af93fea7SJake Freeland int 577af93fea7SJake Freeland sys_timerfd_settime(struct thread *td, struct timerfd_settime_args *uap) 578af93fea7SJake Freeland { 579af93fea7SJake Freeland struct itimerspec new_value, old_value; 580af93fea7SJake Freeland int error; 581af93fea7SJake Freeland 582af93fea7SJake Freeland error = copyin(uap->new_value, &new_value, sizeof(new_value)); 583af93fea7SJake Freeland if (error != 0) 584af93fea7SJake Freeland return (error); 585af93fea7SJake Freeland if (uap->old_value == NULL) { 586af93fea7SJake Freeland error = kern_timerfd_settime(td, uap->fd, uap->flags, 587af93fea7SJake Freeland &new_value, NULL); 588af93fea7SJake Freeland } else { 589af93fea7SJake Freeland error = kern_timerfd_settime(td, uap->fd, uap->flags, 590af93fea7SJake Freeland &new_value, &old_value); 591af93fea7SJake Freeland if (error == 0) 592af93fea7SJake Freeland error = copyout(&old_value, uap->old_value, 593af93fea7SJake Freeland sizeof(old_value)); 594af93fea7SJake Freeland } 595af93fea7SJake Freeland return (error); 596af93fea7SJake Freeland } 597