1af93fea7SJake Freeland /*- 2af93fea7SJake Freeland * SPDX-License-Identifier: BSD-2-Clause 3af93fea7SJake Freeland * 4af93fea7SJake Freeland * Copyright (c) 2014 Dmitry Chagin <dchagin@FreeBSD.org> 5af93fea7SJake Freeland * Copyright (c) 2023 Jake Freeland <jfree@FreeBSD.org> 6af93fea7SJake Freeland * 7af93fea7SJake Freeland * Redistribution and use in source and binary forms, with or without 8af93fea7SJake Freeland * modification, are permitted provided that the following conditions 9af93fea7SJake Freeland * are met: 10af93fea7SJake Freeland * 1. Redistributions of source code must retain the above copyright 11af93fea7SJake Freeland * notice, this list of conditions and the following disclaimer. 12af93fea7SJake Freeland * 2. Redistributions in binary form must reproduce the above copyright 13af93fea7SJake Freeland * notice, this list of conditions and the following disclaimer in the 14af93fea7SJake Freeland * documentation and/or other materials provided with the distribution. 15af93fea7SJake Freeland * 16af93fea7SJake Freeland * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND 17af93fea7SJake Freeland * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 18af93fea7SJake Freeland * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 19af93fea7SJake Freeland * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE 20af93fea7SJake Freeland * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 21af93fea7SJake Freeland * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 22af93fea7SJake Freeland * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 23af93fea7SJake Freeland * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 24af93fea7SJake Freeland * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 25af93fea7SJake Freeland * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 26af93fea7SJake Freeland * SUCH DAMAGE. 27af93fea7SJake Freeland */ 28af93fea7SJake Freeland 29*cf742faaSBaptiste Daroussin #include <sys/_clock_id.h> 30af93fea7SJake Freeland #include <sys/param.h> 31af93fea7SJake Freeland #include <sys/systm.h> 32af93fea7SJake Freeland #include <sys/callout.h> 33af93fea7SJake Freeland #include <sys/fcntl.h> 34af93fea7SJake Freeland #include <sys/file.h> 35af93fea7SJake Freeland #include <sys/filedesc.h> 36af93fea7SJake Freeland #include <sys/filio.h> 37af93fea7SJake Freeland #include <sys/kernel.h> 38af93fea7SJake Freeland #include <sys/lock.h> 39af93fea7SJake Freeland #include <sys/malloc.h> 40af93fea7SJake Freeland #include <sys/mount.h> 41af93fea7SJake Freeland #include <sys/mutex.h> 42af93fea7SJake Freeland #include <sys/poll.h> 43af93fea7SJake Freeland #include <sys/proc.h> 44af93fea7SJake Freeland #include <sys/queue.h> 45af93fea7SJake Freeland #include <sys/selinfo.h> 46af93fea7SJake Freeland #include <sys/stat.h> 4702f534b5SMateusz Guzik #include <sys/sx.h> 4818cb4223SJohn Baldwin #include <sys/syscallsubr.h> 49af93fea7SJake Freeland #include <sys/sysctl.h> 50af93fea7SJake Freeland #include <sys/sysent.h> 51af93fea7SJake Freeland #include <sys/sysproto.h> 52af93fea7SJake Freeland #include <sys/timerfd.h> 53af93fea7SJake Freeland #include <sys/timespec.h> 54af93fea7SJake Freeland #include <sys/uio.h> 55af93fea7SJake Freeland #include <sys/user.h> 56af93fea7SJake Freeland 57af93fea7SJake Freeland #include <security/audit/audit.h> 58af93fea7SJake Freeland 59af93fea7SJake Freeland static MALLOC_DEFINE(M_TIMERFD, "timerfd", "timerfd structures"); 6002f534b5SMateusz Guzik 61f4296cfbSMateusz Guzik static struct mtx timerfd_list_lock; 6202f534b5SMateusz Guzik static LIST_HEAD(, timerfd) timerfd_list; 63f4296cfbSMateusz Guzik MTX_SYSINIT(timerfd, &timerfd_list_lock, "timerfd_list_lock", MTX_DEF); 6402f534b5SMateusz Guzik 65af93fea7SJake Freeland static struct unrhdr64 tfdino_unr; 66af93fea7SJake Freeland 67af93fea7SJake Freeland #define TFD_NOJUMP 0 /* Realtime clock has not jumped. */ 68af93fea7SJake Freeland #define TFD_READ 1 /* Jumped, tfd has been read since. */ 69af93fea7SJake Freeland #define TFD_ZREAD 2 /* Jumped backwards, CANCEL_ON_SET=false. */ 70af93fea7SJake Freeland #define TFD_CANCELED 4 /* Jumped, CANCEL_ON_SET=true. */ 71af93fea7SJake Freeland #define TFD_JUMPED (TFD_ZREAD | TFD_CANCELED) 72af93fea7SJake Freeland 73a1f50615SJake Freeland /* 74a1f50615SJake Freeland * One structure allocated per timerfd descriptor. 75a1f50615SJake Freeland * 76a1f50615SJake Freeland * Locking semantics: 77a1f50615SJake Freeland * (t) locked by tfd_lock mtx 78a1f50615SJake Freeland * (l) locked by timerfd_list_lock sx 79a1f50615SJake Freeland * (c) const until freeing 80a1f50615SJake Freeland */ 81af93fea7SJake Freeland struct timerfd { 82af93fea7SJake Freeland /* User specified. */ 83a1f50615SJake Freeland struct itimerspec tfd_time; /* (t) tfd timer */ 84a1f50615SJake Freeland clockid_t tfd_clockid; /* (c) timing base */ 85a1f50615SJake Freeland int tfd_flags; /* (c) creation flags */ 86a1f50615SJake Freeland int tfd_timflags; /* (t) timer flags */ 87af93fea7SJake Freeland 88af93fea7SJake Freeland /* Used internally. */ 89a1f50615SJake Freeland timerfd_t tfd_count; /* (t) expiration count since read */ 90a1f50615SJake Freeland bool tfd_expired; /* (t) true upon initial expiration */ 91a1f50615SJake Freeland struct mtx tfd_lock; /* tfd mtx lock */ 92a1f50615SJake Freeland struct callout tfd_callout; /* (t) expiration notification */ 93a1f50615SJake Freeland struct selinfo tfd_sel; /* (t) I/O alerts */ 94a1f50615SJake Freeland struct timespec tfd_boottim; /* (t) cached boottime */ 95a1f50615SJake Freeland int tfd_jumped; /* (t) timer jump status */ 96a1f50615SJake Freeland LIST_ENTRY(timerfd) entry; /* (l) entry in list */ 97af93fea7SJake Freeland 98af93fea7SJake Freeland /* For stat(2). */ 99a1f50615SJake Freeland ino_t tfd_ino; /* (c) inode number */ 100a1f50615SJake Freeland struct timespec tfd_atim; /* (t) time of last read */ 101a1f50615SJake Freeland struct timespec tfd_mtim; /* (t) time of last settime */ 102a1f50615SJake Freeland struct timespec tfd_birthtim; /* (c) creation time */ 103af93fea7SJake Freeland }; 104af93fea7SJake Freeland 105af93fea7SJake Freeland static void 106af93fea7SJake Freeland timerfd_init(void *data) 107af93fea7SJake Freeland { 108af93fea7SJake Freeland new_unrhdr64(&tfdino_unr, 1); 109af93fea7SJake Freeland } 110af93fea7SJake Freeland 111af93fea7SJake Freeland SYSINIT(timerfd, SI_SUB_VFS, SI_ORDER_ANY, timerfd_init, NULL); 112af93fea7SJake Freeland 113af93fea7SJake Freeland static inline void 114af93fea7SJake Freeland timerfd_getboottime(struct timespec *ts) 115af93fea7SJake Freeland { 116af93fea7SJake Freeland struct timeval tv; 117a1f50615SJake Freeland 118af93fea7SJake Freeland getboottime(&tv); 119af93fea7SJake Freeland TIMEVAL_TO_TIMESPEC(&tv, ts); 120af93fea7SJake Freeland } 121af93fea7SJake Freeland 122af93fea7SJake Freeland /* 123af93fea7SJake Freeland * Call when a discontinuous jump has occured in CLOCK_REALTIME and 124af93fea7SJake Freeland * update timerfd's cached boottime. A jump can be triggered using 125af93fea7SJake Freeland * functions like clock_settime(2) or settimeofday(2). 126af93fea7SJake Freeland * 127af93fea7SJake Freeland * Timer is marked TFD_CANCELED if TFD_TIMER_CANCEL_ON_SET is set 128af93fea7SJake Freeland * and the realtime clock jumps. 129af93fea7SJake Freeland * Timer is marked TFD_ZREAD if TFD_TIMER_CANCEL_ON_SET is not set, 130af93fea7SJake Freeland * but the realtime clock jumps backwards. 131af93fea7SJake Freeland */ 132af93fea7SJake Freeland void 133af93fea7SJake Freeland timerfd_jumped(void) 134af93fea7SJake Freeland { 135af93fea7SJake Freeland struct timerfd *tfd; 136af93fea7SJake Freeland struct timespec boottime, diff; 137af93fea7SJake Freeland 1385eab5230SMateusz Guzik if (LIST_EMPTY(&timerfd_list)) 1395eab5230SMateusz Guzik return; 1405eab5230SMateusz Guzik 141af93fea7SJake Freeland timerfd_getboottime(&boottime); 142f4296cfbSMateusz Guzik mtx_lock(&timerfd_list_lock); 14302f534b5SMateusz Guzik LIST_FOREACH(tfd, &timerfd_list, entry) { 144af93fea7SJake Freeland mtx_lock(&tfd->tfd_lock); 145af93fea7SJake Freeland if (tfd->tfd_clockid != CLOCK_REALTIME || 146af93fea7SJake Freeland (tfd->tfd_timflags & TFD_TIMER_ABSTIME) == 0 || 147af93fea7SJake Freeland timespeccmp(&boottime, &tfd->tfd_boottim, ==)) { 148af93fea7SJake Freeland mtx_unlock(&tfd->tfd_lock); 149af93fea7SJake Freeland continue; 150af93fea7SJake Freeland } 151af93fea7SJake Freeland 152af93fea7SJake Freeland if (callout_active(&tfd->tfd_callout)) { 153af93fea7SJake Freeland if ((tfd->tfd_timflags & TFD_TIMER_CANCEL_ON_SET) != 0) 154af93fea7SJake Freeland tfd->tfd_jumped = TFD_CANCELED; 155af93fea7SJake Freeland else if (timespeccmp(&boottime, &tfd->tfd_boottim, <)) 156af93fea7SJake Freeland tfd->tfd_jumped = TFD_ZREAD; 157af93fea7SJake Freeland 158af93fea7SJake Freeland /* 159af93fea7SJake Freeland * Do not reschedule callout when 160af93fea7SJake Freeland * inside interval time loop. 161af93fea7SJake Freeland */ 162af93fea7SJake Freeland if (!tfd->tfd_expired) { 163af93fea7SJake Freeland timespecsub(&boottime, 164af93fea7SJake Freeland &tfd->tfd_boottim, &diff); 165af93fea7SJake Freeland timespecsub(&tfd->tfd_time.it_value, 166af93fea7SJake Freeland &diff, &tfd->tfd_time.it_value); 167af93fea7SJake Freeland if (callout_stop(&tfd->tfd_callout) == 1) { 168af93fea7SJake Freeland callout_schedule_sbt(&tfd->tfd_callout, 169af93fea7SJake Freeland tstosbt(tfd->tfd_time.it_value), 170af93fea7SJake Freeland 0, C_ABSOLUTE); 171af93fea7SJake Freeland } 172af93fea7SJake Freeland } 173af93fea7SJake Freeland } 174af93fea7SJake Freeland 175af93fea7SJake Freeland tfd->tfd_boottim = boottime; 176af93fea7SJake Freeland mtx_unlock(&tfd->tfd_lock); 177af93fea7SJake Freeland } 178f4296cfbSMateusz Guzik mtx_unlock(&timerfd_list_lock); 179af93fea7SJake Freeland } 180af93fea7SJake Freeland 181af93fea7SJake Freeland static int 182af93fea7SJake Freeland timerfd_read(struct file *fp, struct uio *uio, struct ucred *active_cred, 183af93fea7SJake Freeland int flags, struct thread *td) 184af93fea7SJake Freeland { 185af93fea7SJake Freeland struct timerfd *tfd = fp->f_data; 186af93fea7SJake Freeland timerfd_t count; 187af93fea7SJake Freeland int error = 0; 188af93fea7SJake Freeland 189af93fea7SJake Freeland if (uio->uio_resid < sizeof(timerfd_t)) 190af93fea7SJake Freeland return (EINVAL); 191af93fea7SJake Freeland 192af93fea7SJake Freeland mtx_lock(&tfd->tfd_lock); 193af93fea7SJake Freeland retry: 194af93fea7SJake Freeland getnanotime(&tfd->tfd_atim); 195af93fea7SJake Freeland if ((tfd->tfd_jumped & TFD_JUMPED) != 0) { 196af93fea7SJake Freeland if (tfd->tfd_jumped == TFD_CANCELED) 197af93fea7SJake Freeland error = ECANCELED; 198af93fea7SJake Freeland tfd->tfd_jumped = TFD_READ; 199af93fea7SJake Freeland tfd->tfd_count = 0; 200af93fea7SJake Freeland mtx_unlock(&tfd->tfd_lock); 201af93fea7SJake Freeland return (error); 202af93fea7SJake Freeland } else { 203af93fea7SJake Freeland tfd->tfd_jumped = TFD_NOJUMP; 204af93fea7SJake Freeland } 205af93fea7SJake Freeland if (tfd->tfd_count == 0) { 206af93fea7SJake Freeland if ((fp->f_flag & FNONBLOCK) != 0) { 207af93fea7SJake Freeland mtx_unlock(&tfd->tfd_lock); 208af93fea7SJake Freeland return (EAGAIN); 209af93fea7SJake Freeland } 210af93fea7SJake Freeland td->td_rtcgen = atomic_load_acq_int(&rtc_generation); 211af93fea7SJake Freeland error = mtx_sleep(&tfd->tfd_count, &tfd->tfd_lock, 212af93fea7SJake Freeland PCATCH, "tfdrd", 0); 213af93fea7SJake Freeland if (error == 0) { 214af93fea7SJake Freeland goto retry; 215af93fea7SJake Freeland } else { 216af93fea7SJake Freeland mtx_unlock(&tfd->tfd_lock); 217af93fea7SJake Freeland return (error); 218af93fea7SJake Freeland } 219af93fea7SJake Freeland } 220af93fea7SJake Freeland 221af93fea7SJake Freeland count = tfd->tfd_count; 222af93fea7SJake Freeland tfd->tfd_count = 0; 223af93fea7SJake Freeland mtx_unlock(&tfd->tfd_lock); 224af93fea7SJake Freeland error = uiomove(&count, sizeof(timerfd_t), uio); 225af93fea7SJake Freeland 226af93fea7SJake Freeland return (error); 227af93fea7SJake Freeland } 228af93fea7SJake Freeland 229af93fea7SJake Freeland static int 230af93fea7SJake Freeland timerfd_ioctl(struct file *fp, u_long cmd, void *data, 231af93fea7SJake Freeland struct ucred *active_cred, struct thread *td) 232af93fea7SJake Freeland { 233af93fea7SJake Freeland switch (cmd) { 234af93fea7SJake Freeland case FIOASYNC: 235af93fea7SJake Freeland if (*(int *)data != 0) 236af93fea7SJake Freeland atomic_set_int(&fp->f_flag, FASYNC); 237af93fea7SJake Freeland else 238af93fea7SJake Freeland atomic_clear_int(&fp->f_flag, FASYNC); 239af93fea7SJake Freeland return (0); 240af93fea7SJake Freeland case FIONBIO: 241af93fea7SJake Freeland if (*(int *)data != 0) 242af93fea7SJake Freeland atomic_set_int(&fp->f_flag, FNONBLOCK); 243af93fea7SJake Freeland else 244af93fea7SJake Freeland atomic_clear_int(&fp->f_flag, FNONBLOCK); 245af93fea7SJake Freeland return (0); 246af93fea7SJake Freeland } 247af93fea7SJake Freeland return (ENOTTY); 248af93fea7SJake Freeland } 249af93fea7SJake Freeland 250af93fea7SJake Freeland static int 251af93fea7SJake Freeland timerfd_poll(struct file *fp, int events, struct ucred *active_cred, 252af93fea7SJake Freeland struct thread *td) 253af93fea7SJake Freeland { 254af93fea7SJake Freeland struct timerfd *tfd = fp->f_data; 255af93fea7SJake Freeland int revents = 0; 256af93fea7SJake Freeland 257af93fea7SJake Freeland mtx_lock(&tfd->tfd_lock); 258af93fea7SJake Freeland if ((events & (POLLIN | POLLRDNORM)) != 0 && 259af93fea7SJake Freeland tfd->tfd_count > 0 && tfd->tfd_jumped != TFD_READ) 260af93fea7SJake Freeland revents |= events & (POLLIN | POLLRDNORM); 261af93fea7SJake Freeland if (revents == 0) 262af93fea7SJake Freeland selrecord(td, &tfd->tfd_sel); 263af93fea7SJake Freeland mtx_unlock(&tfd->tfd_lock); 264af93fea7SJake Freeland 265af93fea7SJake Freeland return (revents); 266af93fea7SJake Freeland } 267af93fea7SJake Freeland 268af93fea7SJake Freeland static void 269af93fea7SJake Freeland filt_timerfddetach(struct knote *kn) 270af93fea7SJake Freeland { 271af93fea7SJake Freeland struct timerfd *tfd = kn->kn_hook; 272af93fea7SJake Freeland 273af93fea7SJake Freeland mtx_lock(&tfd->tfd_lock); 274af93fea7SJake Freeland knlist_remove(&tfd->tfd_sel.si_note, kn, 1); 275af93fea7SJake Freeland mtx_unlock(&tfd->tfd_lock); 276af93fea7SJake Freeland } 277af93fea7SJake Freeland 278af93fea7SJake Freeland static int 279af93fea7SJake Freeland filt_timerfdread(struct knote *kn, long hint) 280af93fea7SJake Freeland { 281af93fea7SJake Freeland struct timerfd *tfd = kn->kn_hook; 282af93fea7SJake Freeland 283a1f50615SJake Freeland mtx_assert(&tfd->tfd_lock, MA_OWNED); 284a1f50615SJake Freeland kn->kn_data = (int64_t)tfd->tfd_count; 285af93fea7SJake Freeland return (tfd->tfd_count > 0); 286af93fea7SJake Freeland } 287af93fea7SJake Freeland 288af93fea7SJake Freeland static struct filterops timerfd_rfiltops = { 289af93fea7SJake Freeland .f_isfd = 1, 290af93fea7SJake Freeland .f_detach = filt_timerfddetach, 291af93fea7SJake Freeland .f_event = filt_timerfdread, 292af93fea7SJake Freeland }; 293af93fea7SJake Freeland 294af93fea7SJake Freeland static int 295af93fea7SJake Freeland timerfd_kqfilter(struct file *fp, struct knote *kn) 296af93fea7SJake Freeland { 297af93fea7SJake Freeland struct timerfd *tfd = fp->f_data; 298af93fea7SJake Freeland 299af93fea7SJake Freeland if (kn->kn_filter != EVFILT_READ) 300af93fea7SJake Freeland return (EINVAL); 301af93fea7SJake Freeland 302af93fea7SJake Freeland kn->kn_fop = &timerfd_rfiltops; 303af93fea7SJake Freeland kn->kn_hook = tfd; 304af93fea7SJake Freeland knlist_add(&tfd->tfd_sel.si_note, kn, 0); 305af93fea7SJake Freeland 306af93fea7SJake Freeland return (0); 307af93fea7SJake Freeland } 308af93fea7SJake Freeland 309af93fea7SJake Freeland static int 310af93fea7SJake Freeland timerfd_stat(struct file *fp, struct stat *sb, struct ucred *active_cred) 311af93fea7SJake Freeland { 312af93fea7SJake Freeland struct timerfd *tfd = fp->f_data; 313af93fea7SJake Freeland 314af93fea7SJake Freeland bzero(sb, sizeof(*sb)); 315af93fea7SJake Freeland sb->st_nlink = fp->f_count - 1; 316af93fea7SJake Freeland sb->st_uid = fp->f_cred->cr_uid; 317af93fea7SJake Freeland sb->st_gid = fp->f_cred->cr_gid; 318af93fea7SJake Freeland sb->st_blksize = PAGE_SIZE; 319af93fea7SJake Freeland mtx_lock(&tfd->tfd_lock); 320af93fea7SJake Freeland sb->st_atim = tfd->tfd_atim; 321af93fea7SJake Freeland sb->st_mtim = tfd->tfd_mtim; 322af93fea7SJake Freeland mtx_unlock(&tfd->tfd_lock); 323a1f50615SJake Freeland sb->st_ctim = sb->st_mtim; 324a1f50615SJake Freeland sb->st_ino = tfd->tfd_ino; 325a1f50615SJake Freeland sb->st_birthtim = tfd->tfd_birthtim; 326af93fea7SJake Freeland 327af93fea7SJake Freeland return (0); 328af93fea7SJake Freeland } 329af93fea7SJake Freeland 330af93fea7SJake Freeland static int 331af93fea7SJake Freeland timerfd_close(struct file *fp, struct thread *td) 332af93fea7SJake Freeland { 333af93fea7SJake Freeland struct timerfd *tfd = fp->f_data; 334af93fea7SJake Freeland 335f4296cfbSMateusz Guzik mtx_lock(&timerfd_list_lock); 33602f534b5SMateusz Guzik LIST_REMOVE(tfd, entry); 337f4296cfbSMateusz Guzik mtx_unlock(&timerfd_list_lock); 33802f534b5SMateusz Guzik 339af93fea7SJake Freeland callout_drain(&tfd->tfd_callout); 340af93fea7SJake Freeland seldrain(&tfd->tfd_sel); 341af93fea7SJake Freeland knlist_destroy(&tfd->tfd_sel.si_note); 342af93fea7SJake Freeland mtx_destroy(&tfd->tfd_lock); 343af93fea7SJake Freeland free(tfd, M_TIMERFD); 344af93fea7SJake Freeland fp->f_ops = &badfileops; 345af93fea7SJake Freeland 346af93fea7SJake Freeland return (0); 347af93fea7SJake Freeland } 348af93fea7SJake Freeland 349af93fea7SJake Freeland static int 350af93fea7SJake Freeland timerfd_fill_kinfo(struct file *fp, struct kinfo_file *kif, 351af93fea7SJake Freeland struct filedesc *fdp) 352af93fea7SJake Freeland { 353af93fea7SJake Freeland struct timerfd *tfd = fp->f_data; 354af93fea7SJake Freeland 355af93fea7SJake Freeland kif->kf_type = KF_TYPE_TIMERFD; 356af93fea7SJake Freeland kif->kf_un.kf_timerfd.kf_timerfd_clockid = tfd->tfd_clockid; 357af93fea7SJake Freeland kif->kf_un.kf_timerfd.kf_timerfd_flags = tfd->tfd_flags; 358af93fea7SJake Freeland kif->kf_un.kf_timerfd.kf_timerfd_addr = (uintptr_t)tfd; 359af93fea7SJake Freeland 360af93fea7SJake Freeland return (0); 361af93fea7SJake Freeland } 362af93fea7SJake Freeland 363af93fea7SJake Freeland static struct fileops timerfdops = { 364af93fea7SJake Freeland .fo_read = timerfd_read, 365af93fea7SJake Freeland .fo_write = invfo_rdwr, 366af93fea7SJake Freeland .fo_truncate = invfo_truncate, 367af93fea7SJake Freeland .fo_ioctl = timerfd_ioctl, 368af93fea7SJake Freeland .fo_poll = timerfd_poll, 369af93fea7SJake Freeland .fo_kqfilter = timerfd_kqfilter, 370af93fea7SJake Freeland .fo_stat = timerfd_stat, 371af93fea7SJake Freeland .fo_close = timerfd_close, 372af93fea7SJake Freeland .fo_chmod = invfo_chmod, 373af93fea7SJake Freeland .fo_chown = invfo_chown, 374af93fea7SJake Freeland .fo_sendfile = invfo_sendfile, 375af93fea7SJake Freeland .fo_fill_kinfo = timerfd_fill_kinfo, 376f28526e9SKonstantin Belousov .fo_cmp = file_kcmp_generic, 377af93fea7SJake Freeland .fo_flags = DFLAG_PASSABLE, 378af93fea7SJake Freeland }; 379af93fea7SJake Freeland 380af93fea7SJake Freeland static void 381af93fea7SJake Freeland timerfd_curval(struct timerfd *tfd, struct itimerspec *old_value) 382af93fea7SJake Freeland { 383af93fea7SJake Freeland struct timespec curr_value; 384af93fea7SJake Freeland 385a1f50615SJake Freeland mtx_assert(&tfd->tfd_lock, MA_OWNED); 386af93fea7SJake Freeland *old_value = tfd->tfd_time; 387af93fea7SJake Freeland if (timespecisset(&tfd->tfd_time.it_value)) { 388af93fea7SJake Freeland nanouptime(&curr_value); 389af93fea7SJake Freeland timespecsub(&tfd->tfd_time.it_value, &curr_value, 390af93fea7SJake Freeland &old_value->it_value); 391af93fea7SJake Freeland } 392af93fea7SJake Freeland } 393af93fea7SJake Freeland 394af93fea7SJake Freeland static void 395af93fea7SJake Freeland timerfd_expire(void *arg) 396af93fea7SJake Freeland { 397af93fea7SJake Freeland struct timerfd *tfd = (struct timerfd *)arg; 398af93fea7SJake Freeland struct timespec uptime; 399af93fea7SJake Freeland 400af93fea7SJake Freeland ++tfd->tfd_count; 401af93fea7SJake Freeland tfd->tfd_expired = true; 402af93fea7SJake Freeland if (timespecisset(&tfd->tfd_time.it_interval)) { 403af93fea7SJake Freeland /* Count missed events. */ 404af93fea7SJake Freeland nanouptime(&uptime); 405af93fea7SJake Freeland if (timespeccmp(&uptime, &tfd->tfd_time.it_value, >)) { 406af93fea7SJake Freeland timespecsub(&uptime, &tfd->tfd_time.it_value, &uptime); 407af93fea7SJake Freeland tfd->tfd_count += tstosbt(uptime) / 408af93fea7SJake Freeland tstosbt(tfd->tfd_time.it_interval); 409af93fea7SJake Freeland } 410af93fea7SJake Freeland timespecadd(&tfd->tfd_time.it_value, 411af93fea7SJake Freeland &tfd->tfd_time.it_interval, &tfd->tfd_time.it_value); 412af93fea7SJake Freeland callout_schedule_sbt(&tfd->tfd_callout, 413af93fea7SJake Freeland tstosbt(tfd->tfd_time.it_value), 414af93fea7SJake Freeland 0, C_ABSOLUTE); 415af93fea7SJake Freeland } else { 416af93fea7SJake Freeland /* Single shot timer. */ 417af93fea7SJake Freeland callout_deactivate(&tfd->tfd_callout); 418af93fea7SJake Freeland timespecclear(&tfd->tfd_time.it_value); 419af93fea7SJake Freeland } 420af93fea7SJake Freeland 421af93fea7SJake Freeland wakeup(&tfd->tfd_count); 422af93fea7SJake Freeland selwakeup(&tfd->tfd_sel); 423af93fea7SJake Freeland KNOTE_LOCKED(&tfd->tfd_sel.si_note, 0); 424af93fea7SJake Freeland } 425af93fea7SJake Freeland 426af93fea7SJake Freeland int 427af93fea7SJake Freeland kern_timerfd_create(struct thread *td, int clockid, int flags) 428af93fea7SJake Freeland { 429af93fea7SJake Freeland struct file *fp; 430af93fea7SJake Freeland struct timerfd *tfd; 4315eab5230SMateusz Guzik int error, fd, fflags; 432af93fea7SJake Freeland 433af93fea7SJake Freeland AUDIT_ARG_VALUE(clockid); 434af93fea7SJake Freeland AUDIT_ARG_FFLAGS(flags); 435af93fea7SJake Freeland 436*cf742faaSBaptiste Daroussin switch (clockid) { 437*cf742faaSBaptiste Daroussin case CLOCK_REALTIME: 438*cf742faaSBaptiste Daroussin /* FALLTHROUGH */ 439*cf742faaSBaptiste Daroussin case CLOCK_MONOTONIC: 440*cf742faaSBaptiste Daroussin /* FALLTHROUGH */ 441*cf742faaSBaptiste Daroussin case CLOCK_UPTIME: 442*cf742faaSBaptiste Daroussin /* FALLTHROUGH */ 443*cf742faaSBaptiste Daroussin case CLOCK_BOOTTIME: 444*cf742faaSBaptiste Daroussin break; 445*cf742faaSBaptiste Daroussin default: 446af93fea7SJake Freeland return (EINVAL); 447*cf742faaSBaptiste Daroussin } 448af93fea7SJake Freeland if ((flags & ~(TFD_CLOEXEC | TFD_NONBLOCK)) != 0) 449af93fea7SJake Freeland return (EINVAL); 4505eab5230SMateusz Guzik 4515eab5230SMateusz Guzik fflags = FREAD; 452af93fea7SJake Freeland if ((flags & TFD_CLOEXEC) != 0) 453af93fea7SJake Freeland fflags |= O_CLOEXEC; 4545eab5230SMateusz Guzik if ((flags & TFD_NONBLOCK) != 0) 4555eab5230SMateusz Guzik fflags |= FNONBLOCK; 456af93fea7SJake Freeland 45702f534b5SMateusz Guzik error = falloc(td, &fp, &fd, fflags); 45802f534b5SMateusz Guzik if (error != 0) 45902f534b5SMateusz Guzik return (error); 46002f534b5SMateusz Guzik 461af93fea7SJake Freeland tfd = malloc(sizeof(*tfd), M_TIMERFD, M_WAITOK | M_ZERO); 462af93fea7SJake Freeland tfd->tfd_clockid = (clockid_t)clockid; 463af93fea7SJake Freeland tfd->tfd_flags = flags; 464af93fea7SJake Freeland tfd->tfd_ino = alloc_unr64(&tfdino_unr); 465af93fea7SJake Freeland mtx_init(&tfd->tfd_lock, "timerfd", NULL, MTX_DEF); 466af93fea7SJake Freeland callout_init_mtx(&tfd->tfd_callout, &tfd->tfd_lock, 0); 467af93fea7SJake Freeland knlist_init_mtx(&tfd->tfd_sel.si_note, &tfd->tfd_lock); 468af93fea7SJake Freeland timerfd_getboottime(&tfd->tfd_boottim); 469af93fea7SJake Freeland getnanotime(&tfd->tfd_birthtim); 470f4296cfbSMateusz Guzik mtx_lock(&timerfd_list_lock); 47102f534b5SMateusz Guzik LIST_INSERT_HEAD(&timerfd_list, tfd, entry); 472f4296cfbSMateusz Guzik mtx_unlock(&timerfd_list_lock); 473af93fea7SJake Freeland 474af93fea7SJake Freeland finit(fp, fflags, DTYPE_TIMERFD, tfd, &timerfdops); 47502f534b5SMateusz Guzik 476af93fea7SJake Freeland fdrop(fp, td); 477af93fea7SJake Freeland 478af93fea7SJake Freeland td->td_retval[0] = fd; 479af93fea7SJake Freeland return (0); 480af93fea7SJake Freeland } 481af93fea7SJake Freeland 482af93fea7SJake Freeland int 483af93fea7SJake Freeland kern_timerfd_gettime(struct thread *td, int fd, struct itimerspec *curr_value) 484af93fea7SJake Freeland { 485af93fea7SJake Freeland struct file *fp; 486af93fea7SJake Freeland struct timerfd *tfd; 487af93fea7SJake Freeland int error; 488af93fea7SJake Freeland 489af93fea7SJake Freeland error = fget(td, fd, &cap_write_rights, &fp); 490af93fea7SJake Freeland if (error != 0) 491af93fea7SJake Freeland return (error); 492a1f50615SJake Freeland if (fp->f_type != DTYPE_TIMERFD) { 493af93fea7SJake Freeland fdrop(fp, td); 494af93fea7SJake Freeland return (EINVAL); 495af93fea7SJake Freeland } 496a1f50615SJake Freeland tfd = fp->f_data; 497af93fea7SJake Freeland 498af93fea7SJake Freeland mtx_lock(&tfd->tfd_lock); 499af93fea7SJake Freeland timerfd_curval(tfd, curr_value); 500af93fea7SJake Freeland mtx_unlock(&tfd->tfd_lock); 501af93fea7SJake Freeland 502af93fea7SJake Freeland fdrop(fp, td); 503af93fea7SJake Freeland return (0); 504af93fea7SJake Freeland } 505af93fea7SJake Freeland 506af93fea7SJake Freeland int 507af93fea7SJake Freeland kern_timerfd_settime(struct thread *td, int fd, int flags, 508af93fea7SJake Freeland const struct itimerspec *new_value, struct itimerspec *old_value) 509af93fea7SJake Freeland { 510af93fea7SJake Freeland struct file *fp; 511af93fea7SJake Freeland struct timerfd *tfd; 512af93fea7SJake Freeland struct timespec ts; 513af93fea7SJake Freeland int error = 0; 514af93fea7SJake Freeland 515af93fea7SJake Freeland if ((flags & ~(TFD_TIMER_ABSTIME | TFD_TIMER_CANCEL_ON_SET)) != 0) 516af93fea7SJake Freeland return (EINVAL); 517af93fea7SJake Freeland if (!timespecvalid_interval(&new_value->it_value) || 518af93fea7SJake Freeland !timespecvalid_interval(&new_value->it_interval)) 519af93fea7SJake Freeland return (EINVAL); 520af93fea7SJake Freeland 521af93fea7SJake Freeland error = fget(td, fd, &cap_write_rights, &fp); 522af93fea7SJake Freeland if (error != 0) 523af93fea7SJake Freeland return (error); 524a1f50615SJake Freeland if (fp->f_type != DTYPE_TIMERFD) { 525af93fea7SJake Freeland fdrop(fp, td); 526af93fea7SJake Freeland return (EINVAL); 527af93fea7SJake Freeland } 528a1f50615SJake Freeland tfd = fp->f_data; 529af93fea7SJake Freeland 530af93fea7SJake Freeland mtx_lock(&tfd->tfd_lock); 531af93fea7SJake Freeland getnanotime(&tfd->tfd_mtim); 532af93fea7SJake Freeland tfd->tfd_timflags = flags; 533af93fea7SJake Freeland 534af93fea7SJake Freeland /* Store old itimerspec, if applicable. */ 535af93fea7SJake Freeland if (old_value != NULL) 536af93fea7SJake Freeland timerfd_curval(tfd, old_value); 537af93fea7SJake Freeland 538af93fea7SJake Freeland /* Set new expiration. */ 539af93fea7SJake Freeland tfd->tfd_time = *new_value; 540af93fea7SJake Freeland if (timespecisset(&tfd->tfd_time.it_value)) { 541af93fea7SJake Freeland if ((flags & TFD_TIMER_ABSTIME) == 0) { 542af93fea7SJake Freeland nanouptime(&ts); 543af93fea7SJake Freeland timespecadd(&tfd->tfd_time.it_value, &ts, 544af93fea7SJake Freeland &tfd->tfd_time.it_value); 545af93fea7SJake Freeland } else if (tfd->tfd_clockid == CLOCK_REALTIME) { 546af93fea7SJake Freeland /* ECANCELED if unread jump is pending. */ 547af93fea7SJake Freeland if (tfd->tfd_jumped == TFD_CANCELED) 548af93fea7SJake Freeland error = ECANCELED; 549af93fea7SJake Freeland /* Convert from CLOCK_REALTIME to CLOCK_BOOTTIME. */ 550af93fea7SJake Freeland timespecsub(&tfd->tfd_time.it_value, &tfd->tfd_boottim, 551af93fea7SJake Freeland &tfd->tfd_time.it_value); 552af93fea7SJake Freeland } 553af93fea7SJake Freeland callout_reset_sbt(&tfd->tfd_callout, 554af93fea7SJake Freeland tstosbt(tfd->tfd_time.it_value), 555af93fea7SJake Freeland 0, timerfd_expire, tfd, C_ABSOLUTE); 556af93fea7SJake Freeland } else { 557af93fea7SJake Freeland callout_stop(&tfd->tfd_callout); 558af93fea7SJake Freeland } 559af93fea7SJake Freeland tfd->tfd_count = 0; 560af93fea7SJake Freeland tfd->tfd_expired = false; 561af93fea7SJake Freeland tfd->tfd_jumped = TFD_NOJUMP; 562af93fea7SJake Freeland mtx_unlock(&tfd->tfd_lock); 563af93fea7SJake Freeland 564af93fea7SJake Freeland fdrop(fp, td); 565af93fea7SJake Freeland return (error); 566af93fea7SJake Freeland } 567af93fea7SJake Freeland 568af93fea7SJake Freeland int 569af93fea7SJake Freeland sys_timerfd_create(struct thread *td, struct timerfd_create_args *uap) 570af93fea7SJake Freeland { 571af93fea7SJake Freeland return (kern_timerfd_create(td, uap->clockid, uap->flags)); 572af93fea7SJake Freeland } 573af93fea7SJake Freeland 574af93fea7SJake Freeland int 575af93fea7SJake Freeland sys_timerfd_gettime(struct thread *td, struct timerfd_gettime_args *uap) 576af93fea7SJake Freeland { 577af93fea7SJake Freeland struct itimerspec curr_value; 578af93fea7SJake Freeland int error; 579af93fea7SJake Freeland 580af93fea7SJake Freeland error = kern_timerfd_gettime(td, uap->fd, &curr_value); 581af93fea7SJake Freeland if (error == 0) 582af93fea7SJake Freeland error = copyout(&curr_value, uap->curr_value, 583af93fea7SJake Freeland sizeof(curr_value)); 584af93fea7SJake Freeland 585af93fea7SJake Freeland return (error); 586af93fea7SJake Freeland } 587af93fea7SJake Freeland 588af93fea7SJake Freeland int 589af93fea7SJake Freeland sys_timerfd_settime(struct thread *td, struct timerfd_settime_args *uap) 590af93fea7SJake Freeland { 591af93fea7SJake Freeland struct itimerspec new_value, old_value; 592af93fea7SJake Freeland int error; 593af93fea7SJake Freeland 594af93fea7SJake Freeland error = copyin(uap->new_value, &new_value, sizeof(new_value)); 595af93fea7SJake Freeland if (error != 0) 596af93fea7SJake Freeland return (error); 597af93fea7SJake Freeland if (uap->old_value == NULL) { 598af93fea7SJake Freeland error = kern_timerfd_settime(td, uap->fd, uap->flags, 599af93fea7SJake Freeland &new_value, NULL); 600af93fea7SJake Freeland } else { 601af93fea7SJake Freeland error = kern_timerfd_settime(td, uap->fd, uap->flags, 602af93fea7SJake Freeland &new_value, &old_value); 603af93fea7SJake Freeland if (error == 0) 604af93fea7SJake Freeland error = copyout(&old_value, uap->old_value, 605af93fea7SJake Freeland sizeof(old_value)); 606af93fea7SJake Freeland } 607af93fea7SJake Freeland return (error); 608af93fea7SJake Freeland } 609