xref: /freebsd/sys/contrib/openzfs/lib/libzpool/kernel.c (revision 071ab5a1f3cbfd29c8fbec27f7e619418adaf074)
// SPDX-License-Identifier: CDDL-1.0
/*
 * CDDL HEADER START
 *
 * The contents of this file are subject to the terms of the
 * Common Development and Distribution License (the "License").
 * You may not use this file except in compliance with the License.
 *
 * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
 * or https://opensource.org/licenses/CDDL-1.0.
 * See the License for the specific language governing permissions
 * and limitations under the License.
 *
 * When distributing Covered Code, include this CDDL HEADER in each
 * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
 * If applicable, add the following below this CDDL HEADER, with the
 * fields enclosed by brackets "[]" replaced with your own identifying
 * information: Portions Copyright [yyyy] [name of copyright owner]
 *
 * CDDL HEADER END
 */
/*
 * Copyright (c) 2005, 2010, Oracle and/or its affiliates. All rights reserved.
 * Copyright (c) 2012, 2018 by Delphix. All rights reserved.
 * Copyright (c) 2016 Actifio, Inc. All rights reserved.
 */
27eda14cbcSMatt Macy 
28eda14cbcSMatt Macy #include <assert.h>
29eda14cbcSMatt Macy #include <fcntl.h>
30eda14cbcSMatt Macy #include <libgen.h>
31eda14cbcSMatt Macy #include <poll.h>
32eda14cbcSMatt Macy #include <stdio.h>
33eda14cbcSMatt Macy #include <stdlib.h>
34eda14cbcSMatt Macy #include <string.h>
35bb2d13b6SMartin Matuska #include <limits.h>
363ff01b23SMartin Matuska #include <libzutil.h>
37eda14cbcSMatt Macy #include <sys/crypto/icp.h>
38eda14cbcSMatt Macy #include <sys/processor.h>
39eda14cbcSMatt Macy #include <sys/rrwlock.h>
40eda14cbcSMatt Macy #include <sys/spa.h>
41eda14cbcSMatt Macy #include <sys/stat.h>
42eda14cbcSMatt Macy #include <sys/systeminfo.h>
43eda14cbcSMatt Macy #include <sys/time.h>
44eda14cbcSMatt Macy #include <sys/utsname.h>
45eda14cbcSMatt Macy #include <sys/zfs_context.h>
46eda14cbcSMatt Macy #include <sys/zfs_onexit.h>
47eac7052fSMatt Macy #include <sys/zfs_vfsops.h>
48eda14cbcSMatt Macy #include <sys/zstd/zstd.h>
49eda14cbcSMatt Macy #include <sys/zvol.h>
50eda14cbcSMatt Macy #include <zfs_fletcher.h>
51eda14cbcSMatt Macy #include <zlib.h>
52eda14cbcSMatt Macy 
/*
 * Emulation of kernel services in userland.
 */
56eda14cbcSMatt Macy 
57eda14cbcSMatt Macy uint64_t physmem;
58716fd348SMartin Matuska uint32_t hostid;
59eda14cbcSMatt Macy struct utsname hw_utsname;
60eda14cbcSMatt Macy 
61eda14cbcSMatt Macy /* If set, all blocks read will be copied to the specified directory. */
62eda14cbcSMatt Macy char *vn_dumpdir = NULL;
63eda14cbcSMatt Macy 
64eda14cbcSMatt Macy /* this only exists to have its address taken */
65eda14cbcSMatt Macy struct proc p0;
66eda14cbcSMatt Macy 
/*
 * =========================================================================
 * threads
 * =========================================================================
 *
 * TS_STACK_MIN is dictated by the minimum allowed pthread stack size.  While
 * TS_STACK_MAX is somewhat arbitrary, it was selected to be large enough for
 * the expected stack depth while small enough to avoid exhausting address
 * space with high thread counts.
 */
/* Smallest stack ever requested: the pthread minimum, but at least 32 KiB. */
#define	TS_STACK_MIN	MAX(PTHREAD_STACK_MIN, 32768)
/* Stack size used when the caller passes 0 and ZFS_STACK_SIZE is unset. */
#define	TS_STACK_MAX	(256 * 1024)
79eda14cbcSMatt Macy 
/*
 * Record handed to a newly created pthread: the function to run and the
 * argument to pass to it.
 */
struct zk_thread_wrapper {
	void (*func)(void *);
	void *arg;
};

/*
 * pthread start routine.  'arg' points at a malloc()ed
 * struct zk_thread_wrapper; its contents are copied out, the record is
 * freed, and then the wrapped function is invoked.  Always returns NULL.
 */
static void *
zk_thread_wrapper(void *arg)
{
	struct zk_thread_wrapper *rec = arg;
	void (*entry)(void *) = rec->func;
	void *entry_arg = rec->arg;

	/* Release the record first; the wrapped function may never return. */
	free(rec);
	entry(entry_arg);
	return (NULL);
}
94c03c5b1cSMartin Matuska 
95eda14cbcSMatt Macy kthread_t *
zk_thread_create(const char * name,void (* func)(void *),void * arg,size_t stksize,int state)96b985c9caSMartin Matuska zk_thread_create(const char *name, void (*func)(void *), void *arg,
97b985c9caSMartin Matuska     size_t stksize, int state)
98eda14cbcSMatt Macy {
99eda14cbcSMatt Macy 	pthread_attr_t attr;
100eda14cbcSMatt Macy 	pthread_t tid;
101eda14cbcSMatt Macy 	char *stkstr;
102c03c5b1cSMartin Matuska 	struct zk_thread_wrapper *ztw;
103eda14cbcSMatt Macy 	int detachstate = PTHREAD_CREATE_DETACHED;
104eda14cbcSMatt Macy 
105eda14cbcSMatt Macy 	VERIFY0(pthread_attr_init(&attr));
106eda14cbcSMatt Macy 
107eda14cbcSMatt Macy 	if (state & TS_JOINABLE)
108eda14cbcSMatt Macy 		detachstate = PTHREAD_CREATE_JOINABLE;
109eda14cbcSMatt Macy 
110eda14cbcSMatt Macy 	VERIFY0(pthread_attr_setdetachstate(&attr, detachstate));
111eda14cbcSMatt Macy 
112eda14cbcSMatt Macy 	/*
113eda14cbcSMatt Macy 	 * We allow the default stack size in user space to be specified by
114eda14cbcSMatt Macy 	 * setting the ZFS_STACK_SIZE environment variable.  This allows us
115eda14cbcSMatt Macy 	 * the convenience of observing and debugging stack overruns in
116eda14cbcSMatt Macy 	 * user space.  Explicitly specified stack sizes will be honored.
117eda14cbcSMatt Macy 	 * The usage of ZFS_STACK_SIZE is discussed further in the
118eda14cbcSMatt Macy 	 * ENVIRONMENT VARIABLES sections of the ztest(1) man page.
119eda14cbcSMatt Macy 	 */
120eda14cbcSMatt Macy 	if (stksize == 0) {
121eda14cbcSMatt Macy 		stkstr = getenv("ZFS_STACK_SIZE");
122eda14cbcSMatt Macy 
123eda14cbcSMatt Macy 		if (stkstr == NULL)
124eda14cbcSMatt Macy 			stksize = TS_STACK_MAX;
125eda14cbcSMatt Macy 		else
126eda14cbcSMatt Macy 			stksize = MAX(atoi(stkstr), TS_STACK_MIN);
127eda14cbcSMatt Macy 	}
128eda14cbcSMatt Macy 
129eda14cbcSMatt Macy 	VERIFY3S(stksize, >, 0);
130eda14cbcSMatt Macy 	stksize = P2ROUNDUP(MAX(stksize, TS_STACK_MIN), PAGESIZE);
131eda14cbcSMatt Macy 
132eda14cbcSMatt Macy 	/*
133eda14cbcSMatt Macy 	 * If this ever fails, it may be because the stack size is not a
134eda14cbcSMatt Macy 	 * multiple of system page size.
135eda14cbcSMatt Macy 	 */
136eda14cbcSMatt Macy 	VERIFY0(pthread_attr_setstacksize(&attr, stksize));
137eda14cbcSMatt Macy 	VERIFY0(pthread_attr_setguardsize(&attr, PAGESIZE));
138eda14cbcSMatt Macy 
139c03c5b1cSMartin Matuska 	VERIFY(ztw = malloc(sizeof (*ztw)));
140c03c5b1cSMartin Matuska 	ztw->func = func;
141c03c5b1cSMartin Matuska 	ztw->arg = arg;
142c03c5b1cSMartin Matuska 	VERIFY0(pthread_create(&tid, &attr, zk_thread_wrapper, ztw));
143eda14cbcSMatt Macy 	VERIFY0(pthread_attr_destroy(&attr));
144eda14cbcSMatt Macy 
145b985c9caSMartin Matuska 	pthread_setname_np(tid, name);
146b985c9caSMartin Matuska 
147eda14cbcSMatt Macy 	return ((void *)(uintptr_t)tid);
148eda14cbcSMatt Macy }
149eda14cbcSMatt Macy 
/*
 * =========================================================================
 * kstats
 * =========================================================================
 */
155eda14cbcSMatt Macy kstat_t *
kstat_create(const char * module,int instance,const char * name,const char * class,uchar_t type,ulong_t ndata,uchar_t ks_flag)156eda14cbcSMatt Macy kstat_create(const char *module, int instance, const char *name,
157eda14cbcSMatt Macy     const char *class, uchar_t type, ulong_t ndata, uchar_t ks_flag)
158eda14cbcSMatt Macy {
159e92ffd9bSMartin Matuska 	(void) module, (void) instance, (void) name, (void) class, (void) type,
160e92ffd9bSMartin Matuska 	    (void) ndata, (void) ks_flag;
161eda14cbcSMatt Macy 	return (NULL);
162eda14cbcSMatt Macy }
163eda14cbcSMatt Macy 
164eda14cbcSMatt Macy void
kstat_install(kstat_t * ksp)165eda14cbcSMatt Macy kstat_install(kstat_t *ksp)
166e92ffd9bSMartin Matuska {
167e92ffd9bSMartin Matuska 	(void) ksp;
168e92ffd9bSMartin Matuska }
169eda14cbcSMatt Macy 
170eda14cbcSMatt Macy void
kstat_delete(kstat_t * ksp)171eda14cbcSMatt Macy kstat_delete(kstat_t *ksp)
172e92ffd9bSMartin Matuska {
173e92ffd9bSMartin Matuska 	(void) ksp;
174e92ffd9bSMartin Matuska }
175eda14cbcSMatt Macy 
176eda14cbcSMatt Macy void
kstat_set_raw_ops(kstat_t * ksp,int (* headers)(char * buf,size_t size),int (* data)(char * buf,size_t size,void * data),void * (* addr)(kstat_t * ksp,loff_t index))177eda14cbcSMatt Macy kstat_set_raw_ops(kstat_t *ksp,
178eda14cbcSMatt Macy     int (*headers)(char *buf, size_t size),
179eda14cbcSMatt Macy     int (*data)(char *buf, size_t size, void *data),
180eda14cbcSMatt Macy     void *(*addr)(kstat_t *ksp, loff_t index))
181e92ffd9bSMartin Matuska {
182e92ffd9bSMartin Matuska 	(void) ksp, (void) headers, (void) data, (void) addr;
183e92ffd9bSMartin Matuska }
184eda14cbcSMatt Macy 
/*
 * =========================================================================
 * mutexes
 * =========================================================================
 */
190eda14cbcSMatt Macy 
191eda14cbcSMatt Macy void
mutex_init(kmutex_t * mp,char * name,int type,void * cookie)192eda14cbcSMatt Macy mutex_init(kmutex_t *mp, char *name, int type, void *cookie)
193eda14cbcSMatt Macy {
194e92ffd9bSMartin Matuska 	(void) name, (void) type, (void) cookie;
195eda14cbcSMatt Macy 	VERIFY0(pthread_mutex_init(&mp->m_lock, NULL));
196eda14cbcSMatt Macy 	memset(&mp->m_owner, 0, sizeof (pthread_t));
197eda14cbcSMatt Macy }
198eda14cbcSMatt Macy 
199eda14cbcSMatt Macy void
mutex_destroy(kmutex_t * mp)200eda14cbcSMatt Macy mutex_destroy(kmutex_t *mp)
201eda14cbcSMatt Macy {
202eda14cbcSMatt Macy 	VERIFY0(pthread_mutex_destroy(&mp->m_lock));
203eda14cbcSMatt Macy }
204eda14cbcSMatt Macy 
205eda14cbcSMatt Macy void
mutex_enter(kmutex_t * mp)206eda14cbcSMatt Macy mutex_enter(kmutex_t *mp)
207eda14cbcSMatt Macy {
208eda14cbcSMatt Macy 	VERIFY0(pthread_mutex_lock(&mp->m_lock));
209eda14cbcSMatt Macy 	mp->m_owner = pthread_self();
210eda14cbcSMatt Macy }
211eda14cbcSMatt Macy 
212eda14cbcSMatt Macy int
mutex_enter_check_return(kmutex_t * mp)2136c1e79dfSMartin Matuska mutex_enter_check_return(kmutex_t *mp)
2146c1e79dfSMartin Matuska {
2156c1e79dfSMartin Matuska 	int error = pthread_mutex_lock(&mp->m_lock);
2166c1e79dfSMartin Matuska 	if (error == 0)
2176c1e79dfSMartin Matuska 		mp->m_owner = pthread_self();
2186c1e79dfSMartin Matuska 	return (error);
2196c1e79dfSMartin Matuska }
2206c1e79dfSMartin Matuska 
2216c1e79dfSMartin Matuska int
mutex_tryenter(kmutex_t * mp)222eda14cbcSMatt Macy mutex_tryenter(kmutex_t *mp)
223eda14cbcSMatt Macy {
224e92ffd9bSMartin Matuska 	int error = pthread_mutex_trylock(&mp->m_lock);
225eda14cbcSMatt Macy 	if (error == 0) {
226eda14cbcSMatt Macy 		mp->m_owner = pthread_self();
227eda14cbcSMatt Macy 		return (1);
228eda14cbcSMatt Macy 	} else {
229eda14cbcSMatt Macy 		VERIFY3S(error, ==, EBUSY);
230eda14cbcSMatt Macy 		return (0);
231eda14cbcSMatt Macy 	}
232eda14cbcSMatt Macy }
233eda14cbcSMatt Macy 
234eda14cbcSMatt Macy void
mutex_exit(kmutex_t * mp)235eda14cbcSMatt Macy mutex_exit(kmutex_t *mp)
236eda14cbcSMatt Macy {
237eda14cbcSMatt Macy 	memset(&mp->m_owner, 0, sizeof (pthread_t));
238eda14cbcSMatt Macy 	VERIFY0(pthread_mutex_unlock(&mp->m_lock));
239eda14cbcSMatt Macy }
240eda14cbcSMatt Macy 
/*
 * =========================================================================
 * rwlocks
 * =========================================================================
 */
246eda14cbcSMatt Macy 
247eda14cbcSMatt Macy void
rw_init(krwlock_t * rwlp,char * name,int type,void * arg)248eda14cbcSMatt Macy rw_init(krwlock_t *rwlp, char *name, int type, void *arg)
249eda14cbcSMatt Macy {
250e92ffd9bSMartin Matuska 	(void) name, (void) type, (void) arg;
251eda14cbcSMatt Macy 	VERIFY0(pthread_rwlock_init(&rwlp->rw_lock, NULL));
252eda14cbcSMatt Macy 	rwlp->rw_readers = 0;
253eda14cbcSMatt Macy 	rwlp->rw_owner = 0;
254eda14cbcSMatt Macy }
255eda14cbcSMatt Macy 
256eda14cbcSMatt Macy void
rw_destroy(krwlock_t * rwlp)257eda14cbcSMatt Macy rw_destroy(krwlock_t *rwlp)
258eda14cbcSMatt Macy {
259eda14cbcSMatt Macy 	VERIFY0(pthread_rwlock_destroy(&rwlp->rw_lock));
260eda14cbcSMatt Macy }
261eda14cbcSMatt Macy 
262eda14cbcSMatt Macy void
rw_enter(krwlock_t * rwlp,krw_t rw)263eda14cbcSMatt Macy rw_enter(krwlock_t *rwlp, krw_t rw)
264eda14cbcSMatt Macy {
265eda14cbcSMatt Macy 	if (rw == RW_READER) {
266eda14cbcSMatt Macy 		VERIFY0(pthread_rwlock_rdlock(&rwlp->rw_lock));
267eda14cbcSMatt Macy 		atomic_inc_uint(&rwlp->rw_readers);
268eda14cbcSMatt Macy 	} else {
269eda14cbcSMatt Macy 		VERIFY0(pthread_rwlock_wrlock(&rwlp->rw_lock));
270eda14cbcSMatt Macy 		rwlp->rw_owner = pthread_self();
271eda14cbcSMatt Macy 	}
272eda14cbcSMatt Macy }
273eda14cbcSMatt Macy 
274eda14cbcSMatt Macy void
rw_exit(krwlock_t * rwlp)275eda14cbcSMatt Macy rw_exit(krwlock_t *rwlp)
276eda14cbcSMatt Macy {
277eda14cbcSMatt Macy 	if (RW_READ_HELD(rwlp))
278eda14cbcSMatt Macy 		atomic_dec_uint(&rwlp->rw_readers);
279eda14cbcSMatt Macy 	else
280eda14cbcSMatt Macy 		rwlp->rw_owner = 0;
281eda14cbcSMatt Macy 
282eda14cbcSMatt Macy 	VERIFY0(pthread_rwlock_unlock(&rwlp->rw_lock));
283eda14cbcSMatt Macy }
284eda14cbcSMatt Macy 
285eda14cbcSMatt Macy int
rw_tryenter(krwlock_t * rwlp,krw_t rw)286eda14cbcSMatt Macy rw_tryenter(krwlock_t *rwlp, krw_t rw)
287eda14cbcSMatt Macy {
288eda14cbcSMatt Macy 	int error;
289eda14cbcSMatt Macy 
290eda14cbcSMatt Macy 	if (rw == RW_READER)
291eda14cbcSMatt Macy 		error = pthread_rwlock_tryrdlock(&rwlp->rw_lock);
292eda14cbcSMatt Macy 	else
293eda14cbcSMatt Macy 		error = pthread_rwlock_trywrlock(&rwlp->rw_lock);
294eda14cbcSMatt Macy 
295eda14cbcSMatt Macy 	if (error == 0) {
296eda14cbcSMatt Macy 		if (rw == RW_READER)
297eda14cbcSMatt Macy 			atomic_inc_uint(&rwlp->rw_readers);
298eda14cbcSMatt Macy 		else
299eda14cbcSMatt Macy 			rwlp->rw_owner = pthread_self();
300eda14cbcSMatt Macy 
301eda14cbcSMatt Macy 		return (1);
302eda14cbcSMatt Macy 	}
303eda14cbcSMatt Macy 
304eda14cbcSMatt Macy 	VERIFY3S(error, ==, EBUSY);
305eda14cbcSMatt Macy 
306eda14cbcSMatt Macy 	return (0);
307eda14cbcSMatt Macy }
308eda14cbcSMatt Macy 
309eda14cbcSMatt Macy uint32_t
zone_get_hostid(void * zonep)310eda14cbcSMatt Macy zone_get_hostid(void *zonep)
311eda14cbcSMatt Macy {
312eda14cbcSMatt Macy 	/*
313eda14cbcSMatt Macy 	 * We're emulating the system's hostid in userland.
314eda14cbcSMatt Macy 	 */
315e92ffd9bSMartin Matuska 	(void) zonep;
316716fd348SMartin Matuska 	return (hostid);
317eda14cbcSMatt Macy }
318eda14cbcSMatt Macy 
319eda14cbcSMatt Macy int
rw_tryupgrade(krwlock_t * rwlp)320eda14cbcSMatt Macy rw_tryupgrade(krwlock_t *rwlp)
321eda14cbcSMatt Macy {
322e92ffd9bSMartin Matuska 	(void) rwlp;
323eda14cbcSMatt Macy 	return (0);
324eda14cbcSMatt Macy }
325eda14cbcSMatt Macy 
/*
 * =========================================================================
 * condition variables
 * =========================================================================
 */
331eda14cbcSMatt Macy 
332eda14cbcSMatt Macy void
cv_init(kcondvar_t * cv,char * name,int type,void * arg)333eda14cbcSMatt Macy cv_init(kcondvar_t *cv, char *name, int type, void *arg)
334eda14cbcSMatt Macy {
335e92ffd9bSMartin Matuska 	(void) name, (void) type, (void) arg;
336eda14cbcSMatt Macy 	VERIFY0(pthread_cond_init(cv, NULL));
337eda14cbcSMatt Macy }
338eda14cbcSMatt Macy 
339eda14cbcSMatt Macy void
cv_destroy(kcondvar_t * cv)340eda14cbcSMatt Macy cv_destroy(kcondvar_t *cv)
341eda14cbcSMatt Macy {
342eda14cbcSMatt Macy 	VERIFY0(pthread_cond_destroy(cv));
343eda14cbcSMatt Macy }
344eda14cbcSMatt Macy 
345eda14cbcSMatt Macy void
cv_wait(kcondvar_t * cv,kmutex_t * mp)346eda14cbcSMatt Macy cv_wait(kcondvar_t *cv, kmutex_t *mp)
347eda14cbcSMatt Macy {
348eda14cbcSMatt Macy 	memset(&mp->m_owner, 0, sizeof (pthread_t));
349eda14cbcSMatt Macy 	VERIFY0(pthread_cond_wait(cv, &mp->m_lock));
350eda14cbcSMatt Macy 	mp->m_owner = pthread_self();
351eda14cbcSMatt Macy }
352eda14cbcSMatt Macy 
353eda14cbcSMatt Macy int
cv_wait_sig(kcondvar_t * cv,kmutex_t * mp)354eda14cbcSMatt Macy cv_wait_sig(kcondvar_t *cv, kmutex_t *mp)
355eda14cbcSMatt Macy {
356eda14cbcSMatt Macy 	cv_wait(cv, mp);
357eda14cbcSMatt Macy 	return (1);
358eda14cbcSMatt Macy }
359eda14cbcSMatt Macy 
360eda14cbcSMatt Macy int
cv_timedwait(kcondvar_t * cv,kmutex_t * mp,clock_t abstime)361eda14cbcSMatt Macy cv_timedwait(kcondvar_t *cv, kmutex_t *mp, clock_t abstime)
362eda14cbcSMatt Macy {
363eda14cbcSMatt Macy 	int error;
364eda14cbcSMatt Macy 	struct timeval tv;
365eda14cbcSMatt Macy 	struct timespec ts;
366eda14cbcSMatt Macy 	clock_t delta;
367eda14cbcSMatt Macy 
368eda14cbcSMatt Macy 	delta = abstime - ddi_get_lbolt();
369eda14cbcSMatt Macy 	if (delta <= 0)
370eda14cbcSMatt Macy 		return (-1);
371eda14cbcSMatt Macy 
372eda14cbcSMatt Macy 	VERIFY(gettimeofday(&tv, NULL) == 0);
373eda14cbcSMatt Macy 
374eda14cbcSMatt Macy 	ts.tv_sec = tv.tv_sec + delta / hz;
375eda14cbcSMatt Macy 	ts.tv_nsec = tv.tv_usec * NSEC_PER_USEC + (delta % hz) * (NANOSEC / hz);
376eda14cbcSMatt Macy 	if (ts.tv_nsec >= NANOSEC) {
377eda14cbcSMatt Macy 		ts.tv_sec++;
378eda14cbcSMatt Macy 		ts.tv_nsec -= NANOSEC;
379eda14cbcSMatt Macy 	}
380eda14cbcSMatt Macy 
381eda14cbcSMatt Macy 	memset(&mp->m_owner, 0, sizeof (pthread_t));
382eda14cbcSMatt Macy 	error = pthread_cond_timedwait(cv, &mp->m_lock, &ts);
383eda14cbcSMatt Macy 	mp->m_owner = pthread_self();
384eda14cbcSMatt Macy 
385eda14cbcSMatt Macy 	if (error == ETIMEDOUT)
386eda14cbcSMatt Macy 		return (-1);
387eda14cbcSMatt Macy 
388eda14cbcSMatt Macy 	VERIFY0(error);
389eda14cbcSMatt Macy 
390eda14cbcSMatt Macy 	return (1);
391eda14cbcSMatt Macy }
392eda14cbcSMatt Macy 
393eda14cbcSMatt Macy int
cv_timedwait_hires(kcondvar_t * cv,kmutex_t * mp,hrtime_t tim,hrtime_t res,int flag)394eda14cbcSMatt Macy cv_timedwait_hires(kcondvar_t *cv, kmutex_t *mp, hrtime_t tim, hrtime_t res,
395eda14cbcSMatt Macy     int flag)
396eda14cbcSMatt Macy {
397e92ffd9bSMartin Matuska 	(void) res;
398eda14cbcSMatt Macy 	int error;
399eda14cbcSMatt Macy 	struct timeval tv;
400eda14cbcSMatt Macy 	struct timespec ts;
401eda14cbcSMatt Macy 	hrtime_t delta;
402eda14cbcSMatt Macy 
403eda14cbcSMatt Macy 	ASSERT(flag == 0 || flag == CALLOUT_FLAG_ABSOLUTE);
404eda14cbcSMatt Macy 
405eda14cbcSMatt Macy 	delta = tim;
406eda14cbcSMatt Macy 	if (flag & CALLOUT_FLAG_ABSOLUTE)
407eda14cbcSMatt Macy 		delta -= gethrtime();
408eda14cbcSMatt Macy 
409eda14cbcSMatt Macy 	if (delta <= 0)
410eda14cbcSMatt Macy 		return (-1);
411eda14cbcSMatt Macy 
412eda14cbcSMatt Macy 	VERIFY0(gettimeofday(&tv, NULL));
413eda14cbcSMatt Macy 
414eda14cbcSMatt Macy 	ts.tv_sec = tv.tv_sec + delta / NANOSEC;
415eda14cbcSMatt Macy 	ts.tv_nsec = tv.tv_usec * NSEC_PER_USEC + (delta % NANOSEC);
416eda14cbcSMatt Macy 	if (ts.tv_nsec >= NANOSEC) {
417eda14cbcSMatt Macy 		ts.tv_sec++;
418eda14cbcSMatt Macy 		ts.tv_nsec -= NANOSEC;
419eda14cbcSMatt Macy 	}
420eda14cbcSMatt Macy 
421eda14cbcSMatt Macy 	memset(&mp->m_owner, 0, sizeof (pthread_t));
422eda14cbcSMatt Macy 	error = pthread_cond_timedwait(cv, &mp->m_lock, &ts);
423eda14cbcSMatt Macy 	mp->m_owner = pthread_self();
424eda14cbcSMatt Macy 
425eda14cbcSMatt Macy 	if (error == ETIMEDOUT)
426eda14cbcSMatt Macy 		return (-1);
427eda14cbcSMatt Macy 
428eda14cbcSMatt Macy 	VERIFY0(error);
429eda14cbcSMatt Macy 
430eda14cbcSMatt Macy 	return (1);
431eda14cbcSMatt Macy }
432eda14cbcSMatt Macy 
433eda14cbcSMatt Macy void
cv_signal(kcondvar_t * cv)434eda14cbcSMatt Macy cv_signal(kcondvar_t *cv)
435eda14cbcSMatt Macy {
436eda14cbcSMatt Macy 	VERIFY0(pthread_cond_signal(cv));
437eda14cbcSMatt Macy }
438eda14cbcSMatt Macy 
439eda14cbcSMatt Macy void
cv_broadcast(kcondvar_t * cv)440eda14cbcSMatt Macy cv_broadcast(kcondvar_t *cv)
441eda14cbcSMatt Macy {
442eda14cbcSMatt Macy 	VERIFY0(pthread_cond_broadcast(cv));
443eda14cbcSMatt Macy }
444eda14cbcSMatt Macy 
/*
 * =========================================================================
 * procfs list
 * =========================================================================
 */
450eda14cbcSMatt Macy 
/* Stub: nothing is formatted or written; all arguments are ignored. */
void
seq_printf(struct seq_file *m, const char *fmt, ...)
{
	(void) m;
	(void) fmt;
}
456eda14cbcSMatt Macy 
457eda14cbcSMatt Macy void
procfs_list_install(const char * module,const char * submodule,const char * name,mode_t mode,procfs_list_t * procfs_list,int (* show)(struct seq_file * f,void * p),int (* show_header)(struct seq_file * f),int (* clear)(procfs_list_t * procfs_list),size_t procfs_list_node_off)458eda14cbcSMatt Macy procfs_list_install(const char *module,
459c40487d4SMatt Macy     const char *submodule,
460eda14cbcSMatt Macy     const char *name,
461eda14cbcSMatt Macy     mode_t mode,
462eda14cbcSMatt Macy     procfs_list_t *procfs_list,
463eda14cbcSMatt Macy     int (*show)(struct seq_file *f, void *p),
464eda14cbcSMatt Macy     int (*show_header)(struct seq_file *f),
465eda14cbcSMatt Macy     int (*clear)(procfs_list_t *procfs_list),
466eda14cbcSMatt Macy     size_t procfs_list_node_off)
467eda14cbcSMatt Macy {
468e92ffd9bSMartin Matuska 	(void) module, (void) submodule, (void) name, (void) mode, (void) show,
469e92ffd9bSMartin Matuska 	    (void) show_header, (void) clear;
470eda14cbcSMatt Macy 	mutex_init(&procfs_list->pl_lock, NULL, MUTEX_DEFAULT, NULL);
471eda14cbcSMatt Macy 	list_create(&procfs_list->pl_list,
472eda14cbcSMatt Macy 	    procfs_list_node_off + sizeof (procfs_list_node_t),
473eda14cbcSMatt Macy 	    procfs_list_node_off + offsetof(procfs_list_node_t, pln_link));
474eda14cbcSMatt Macy 	procfs_list->pl_next_id = 1;
475eda14cbcSMatt Macy 	procfs_list->pl_node_offset = procfs_list_node_off;
476eda14cbcSMatt Macy }
477eda14cbcSMatt Macy 
478eda14cbcSMatt Macy void
procfs_list_uninstall(procfs_list_t * procfs_list)479eda14cbcSMatt Macy procfs_list_uninstall(procfs_list_t *procfs_list)
480e92ffd9bSMartin Matuska {
481e92ffd9bSMartin Matuska 	(void) procfs_list;
482e92ffd9bSMartin Matuska }
483eda14cbcSMatt Macy 
484eda14cbcSMatt Macy void
procfs_list_destroy(procfs_list_t * procfs_list)485eda14cbcSMatt Macy procfs_list_destroy(procfs_list_t *procfs_list)
486eda14cbcSMatt Macy {
487eda14cbcSMatt Macy 	ASSERT(list_is_empty(&procfs_list->pl_list));
488eda14cbcSMatt Macy 	list_destroy(&procfs_list->pl_list);
489eda14cbcSMatt Macy 	mutex_destroy(&procfs_list->pl_lock);
490eda14cbcSMatt Macy }
491eda14cbcSMatt Macy 
492eda14cbcSMatt Macy #define	NODE_ID(procfs_list, obj) \
493eda14cbcSMatt Macy 		(((procfs_list_node_t *)(((char *)obj) + \
494eda14cbcSMatt Macy 		(procfs_list)->pl_node_offset))->pln_id)
495eda14cbcSMatt Macy 
496eda14cbcSMatt Macy void
procfs_list_add(procfs_list_t * procfs_list,void * p)497eda14cbcSMatt Macy procfs_list_add(procfs_list_t *procfs_list, void *p)
498eda14cbcSMatt Macy {
499eda14cbcSMatt Macy 	ASSERT(MUTEX_HELD(&procfs_list->pl_lock));
500eda14cbcSMatt Macy 	NODE_ID(procfs_list, p) = procfs_list->pl_next_id++;
501eda14cbcSMatt Macy 	list_insert_tail(&procfs_list->pl_list, p);
502eda14cbcSMatt Macy }
503eda14cbcSMatt Macy 
/*
 * =========================================================================
 * vnode operations
 * =========================================================================
 */

/*
 * =========================================================================
 * Figure out which debugging statements to print
 * =========================================================================
 */
515eda14cbcSMatt Macy 
/* Comma-separated debug selector list; NULL when none is configured. */
static char *dprintf_string;
/* Non-zero once the selector list is found to contain "on". */
static int dprintf_print_all;

/*
 * Report whether 'string' appears as a complete entry in dprintf_string.
 * Entries are comma separated, e.g. "file1.c,function_name1,file2.c".
 * Returns 1 on an exact entry match and 0 otherwise, including when no
 * selector list is set.
 */
int
dprintf_find_string(const char *string)
{
	int len = strlen(string);
	const char *entry = dprintf_string;

	while (entry != NULL) {
		const char *comma = strchr(entry, ',');

		/* The entry must end exactly where 'string' ends. */
		if (strncmp(entry, string, len) == 0 &&
		    (entry[len] == ',' || entry[len] == '\0'))
			return (1);

		/* Step past the comma, or stop after the last entry. */
		entry = (comma != NULL) ? comma + 1 : NULL;
	}

	return (0);
}
540eda14cbcSMatt Macy 
541eda14cbcSMatt Macy void
dprintf_setup(int * argc,char ** argv)542eda14cbcSMatt Macy dprintf_setup(int *argc, char **argv)
543eda14cbcSMatt Macy {
544eda14cbcSMatt Macy 	int i, j;
545eda14cbcSMatt Macy 
546eda14cbcSMatt Macy 	/*
547eda14cbcSMatt Macy 	 * Debugging can be specified two ways: by setting the
548eda14cbcSMatt Macy 	 * environment variable ZFS_DEBUG, or by including a
549eda14cbcSMatt Macy 	 * "debug=..."  argument on the command line.  The command
550eda14cbcSMatt Macy 	 * line setting overrides the environment variable.
551eda14cbcSMatt Macy 	 */
552eda14cbcSMatt Macy 
553eda14cbcSMatt Macy 	for (i = 1; i < *argc; i++) {
554eda14cbcSMatt Macy 		int len = strlen("debug=");
555eda14cbcSMatt Macy 		/* First look for a command line argument */
556eda14cbcSMatt Macy 		if (strncmp("debug=", argv[i], len) == 0) {
557eda14cbcSMatt Macy 			dprintf_string = argv[i] + len;
558eda14cbcSMatt Macy 			/* Remove from args */
559eda14cbcSMatt Macy 			for (j = i; j < *argc; j++)
560eda14cbcSMatt Macy 				argv[j] = argv[j+1];
561eda14cbcSMatt Macy 			argv[j] = NULL;
562eda14cbcSMatt Macy 			(*argc)--;
563eda14cbcSMatt Macy 		}
564eda14cbcSMatt Macy 	}
565eda14cbcSMatt Macy 
566eda14cbcSMatt Macy 	if (dprintf_string == NULL) {
567eda14cbcSMatt Macy 		/* Look for ZFS_DEBUG environment variable */
568eda14cbcSMatt Macy 		dprintf_string = getenv("ZFS_DEBUG");
569eda14cbcSMatt Macy 	}
570eda14cbcSMatt Macy 
571eda14cbcSMatt Macy 	/*
572eda14cbcSMatt Macy 	 * Are we just turning on all debugging?
573eda14cbcSMatt Macy 	 */
574eda14cbcSMatt Macy 	if (dprintf_find_string("on"))
575eda14cbcSMatt Macy 		dprintf_print_all = 1;
576eda14cbcSMatt Macy 
577eda14cbcSMatt Macy 	if (dprintf_string != NULL)
578eda14cbcSMatt Macy 		zfs_flags |= ZFS_DEBUG_DPRINTF;
579eda14cbcSMatt Macy }
580eda14cbcSMatt Macy 
/*
 * =========================================================================
 * debug printfs
 * =========================================================================
 */
586eda14cbcSMatt Macy void
__dprintf(boolean_t dprint,const char * file,const char * func,int line,const char * fmt,...)587eda14cbcSMatt Macy __dprintf(boolean_t dprint, const char *file, const char *func,
588eda14cbcSMatt Macy     int line, const char *fmt, ...)
589eda14cbcSMatt Macy {
5903ff01b23SMartin Matuska 	/* Get rid of annoying "../common/" prefix to filename. */
5913ff01b23SMartin Matuska 	const char *newfile = zfs_basename(file);
5923ff01b23SMartin Matuska 
593eda14cbcSMatt Macy 	va_list adx;
594eda14cbcSMatt Macy 	if (dprint) {
595eda14cbcSMatt Macy 		/* dprintf messages are printed immediately */
596eda14cbcSMatt Macy 
597eda14cbcSMatt Macy 		if (!dprintf_print_all &&
598eda14cbcSMatt Macy 		    !dprintf_find_string(newfile) &&
599eda14cbcSMatt Macy 		    !dprintf_find_string(func))
600eda14cbcSMatt Macy 			return;
601eda14cbcSMatt Macy 
602eda14cbcSMatt Macy 		/* Print out just the function name if requested */
603eda14cbcSMatt Macy 		flockfile(stdout);
604eda14cbcSMatt Macy 		if (dprintf_find_string("pid"))
605eda14cbcSMatt Macy 			(void) printf("%d ", getpid());
606eda14cbcSMatt Macy 		if (dprintf_find_string("tid"))
607eda14cbcSMatt Macy 			(void) printf("%ju ",
608eda14cbcSMatt Macy 			    (uintmax_t)(uintptr_t)pthread_self());
609eda14cbcSMatt Macy 		if (dprintf_find_string("cpu"))
610eda14cbcSMatt Macy 			(void) printf("%u ", getcpuid());
611eda14cbcSMatt Macy 		if (dprintf_find_string("time"))
612eda14cbcSMatt Macy 			(void) printf("%llu ", gethrtime());
613eda14cbcSMatt Macy 		if (dprintf_find_string("long"))
614eda14cbcSMatt Macy 			(void) printf("%s, line %d: ", newfile, line);
615eda14cbcSMatt Macy 		(void) printf("dprintf: %s: ", func);
616eda14cbcSMatt Macy 		va_start(adx, fmt);
617eda14cbcSMatt Macy 		(void) vprintf(fmt, adx);
618eda14cbcSMatt Macy 		va_end(adx);
619eda14cbcSMatt Macy 		funlockfile(stdout);
620eda14cbcSMatt Macy 	} else {
621eda14cbcSMatt Macy 		/* zfs_dbgmsg is logged for dumping later */
622eda14cbcSMatt Macy 		size_t size;
623eda14cbcSMatt Macy 		char *buf;
624eda14cbcSMatt Macy 		int i;
625eda14cbcSMatt Macy 
626eda14cbcSMatt Macy 		size = 1024;
627eda14cbcSMatt Macy 		buf = umem_alloc(size, UMEM_NOFAIL);
628eda14cbcSMatt Macy 		i = snprintf(buf, size, "%s:%d:%s(): ", newfile, line, func);
629eda14cbcSMatt Macy 
630eda14cbcSMatt Macy 		if (i < size) {
631eda14cbcSMatt Macy 			va_start(adx, fmt);
632eda14cbcSMatt Macy 			(void) vsnprintf(buf + i, size - i, fmt, adx);
633eda14cbcSMatt Macy 			va_end(adx);
634eda14cbcSMatt Macy 		}
635eda14cbcSMatt Macy 
636eda14cbcSMatt Macy 		__zfs_dbgmsg(buf);
637eda14cbcSMatt Macy 
638eda14cbcSMatt Macy 		umem_free(buf, size);
639eda14cbcSMatt Macy 	}
640eda14cbcSMatt Macy }
641eda14cbcSMatt Macy 
/*
 * =========================================================================
 * cmn_err() and panic()
 * =========================================================================
 */
647eda14cbcSMatt Macy static char ce_prefix[CE_IGNORE][10] = { "", "NOTICE: ", "WARNING: ", "" };
648eda14cbcSMatt Macy static char ce_suffix[CE_IGNORE][2] = { "", "\n", "\n", "" };
649eda14cbcSMatt Macy 
/*
 * Write "error: ", the formatted message and a newline to stderr, then
 * abort().  Does not return.
 */
__attribute__((noreturn)) void
vpanic(const char *fmt, va_list adx)
{
	(void) fputs("error: ", stderr);
	(void) vfprintf(stderr, fmt, adx);
	(void) fputc('\n', stderr);

	abort();	/* think of it as a "user-level crash dump" */
}
659eda14cbcSMatt Macy 
/*
 * Variadic front end for vpanic(): packages the arguments into a va_list
 * and hands them over.  vpanic() does not return.
 */
__attribute__((noreturn)) void
panic(const char *fmt, ...)
{
	va_list args;

	va_start(args, fmt);
	vpanic(fmt, args);
	va_end(args);
}
669eda14cbcSMatt Macy 
670eda14cbcSMatt Macy void
vcmn_err(int ce,const char * fmt,va_list adx)671eda14cbcSMatt Macy vcmn_err(int ce, const char *fmt, va_list adx)
672eda14cbcSMatt Macy {
673eda14cbcSMatt Macy 	if (ce == CE_PANIC)
674eda14cbcSMatt Macy 		vpanic(fmt, adx);
675eda14cbcSMatt Macy 	if (ce != CE_NOTE) {	/* suppress noise in userland stress testing */
676eda14cbcSMatt Macy 		(void) fprintf(stderr, "%s", ce_prefix[ce]);
677eda14cbcSMatt Macy 		(void) vfprintf(stderr, fmt, adx);
678eda14cbcSMatt Macy 		(void) fprintf(stderr, "%s", ce_suffix[ce]);
679eda14cbcSMatt Macy 	}
680eda14cbcSMatt Macy }
681eda14cbcSMatt Macy 
/*
 * Variadic front end for vcmn_err().
 */
void
cmn_err(int ce, const char *fmt, ...)
{
	va_list args;

	va_start(args, fmt);
	vcmn_err(ce, fmt, args);
	va_end(args);
}
691eda14cbcSMatt Macy 
692eda14cbcSMatt Macy /*
693eda14cbcSMatt Macy  * =========================================================================
694eda14cbcSMatt Macy  * misc routines
695eda14cbcSMatt Macy  * =========================================================================
696eda14cbcSMatt Macy  */
697eda14cbcSMatt Macy 
698eda14cbcSMatt Macy void
delay(clock_t ticks)699eda14cbcSMatt Macy delay(clock_t ticks)
700eda14cbcSMatt Macy {
701eda14cbcSMatt Macy 	(void) poll(0, 0, ticks * (1000 / hz));
702eda14cbcSMatt Macy }
703eda14cbcSMatt Macy 
/*
 * Locate the most significant set bit of i.
 * The result is that bit's number plus one, or 0 when no bit is set.
 * Relies on __builtin_clzll(), which both GCC and Clang provide.
 */
int
highbit64(uint64_t i)
{
	int leading_zeros;

	/* guard: no bit is set, and clz is not evaluated for zero */
	if (i == 0)
		return (0);

	leading_zeros = __builtin_clzll(i);
	return (NBBY * sizeof (uint64_t) - leading_zeros);
}
717eda14cbcSMatt Macy 
/*
 * Locate the least significant set bit of i.
 * The result is that bit's number plus one, or 0 when no bit is set.
 * Relies on __builtin_ffsll(), which both GCC and Clang provide.
 */
int
lowbit64(uint64_t i)
{
	return (i != 0 ? __builtin_ffsll(i) : 0);
}
731eda14cbcSMatt Macy 
/* Paths of the two random devices; non-static, so visible to other files. */
const char *random_path = "/dev/random";
const char *urandom_path = "/dev/urandom";

/* Descriptors for the devices above; -1 while not open. */
static int random_fd = -1;
static int urandom_fd = -1;
735eda14cbcSMatt Macy 
736eda14cbcSMatt Macy void
random_init(void)737eda14cbcSMatt Macy random_init(void)
738eda14cbcSMatt Macy {
73916038816SMartin Matuska 	VERIFY((random_fd = open(random_path, O_RDONLY | O_CLOEXEC)) != -1);
74016038816SMartin Matuska 	VERIFY((urandom_fd = open(urandom_path, O_RDONLY | O_CLOEXEC)) != -1);
741eda14cbcSMatt Macy }
742eda14cbcSMatt Macy 
743eda14cbcSMatt Macy void
random_fini(void)744eda14cbcSMatt Macy random_fini(void)
745eda14cbcSMatt Macy {
746eda14cbcSMatt Macy 	close(random_fd);
747eda14cbcSMatt Macy 	close(urandom_fd);
748eda14cbcSMatt Macy 
749eda14cbcSMatt Macy 	random_fd = -1;
750eda14cbcSMatt Macy 	urandom_fd = -1;
751eda14cbcSMatt Macy }
752eda14cbcSMatt Macy 
/*
 * Fill ptr[0 .. len) with bytes read from the already-open descriptor fd.
 *
 * read() may return fewer bytes than requested, so the loop continues
 * until the whole request has been satisfied.  A read interrupted by a
 * signal (EINTR) is retried.  Any other read error, or end-of-file before
 * len bytes were obtained, trips VERIFY(): continuing would either move
 * ptr backwards and grow resid (error) or spin forever (EOF).
 *
 * Always returns 0.
 */
static int
random_get_bytes_common(uint8_t *ptr, size_t len, int fd)
{
	size_t resid = len;
	ssize_t bytes;

	ASSERT(fd != -1);

	while (resid != 0) {
		bytes = read(fd, ptr, resid);

		/* interrupted before any data was transferred: try again */
		if (bytes == -1 && errno == EINTR)
			continue;

		/* checked in every build, not only when ASSERTs are enabled */
		VERIFY(bytes > 0);

		ptr += bytes;
		resid -= bytes;
	}

	return (0);
}
770eda14cbcSMatt Macy 
771eda14cbcSMatt Macy int
random_get_bytes(uint8_t * ptr,size_t len)772eda14cbcSMatt Macy random_get_bytes(uint8_t *ptr, size_t len)
773eda14cbcSMatt Macy {
774eda14cbcSMatt Macy 	return (random_get_bytes_common(ptr, len, random_fd));
775eda14cbcSMatt Macy }
776eda14cbcSMatt Macy 
777eda14cbcSMatt Macy int
random_get_pseudo_bytes(uint8_t * ptr,size_t len)778eda14cbcSMatt Macy random_get_pseudo_bytes(uint8_t *ptr, size_t len)
779eda14cbcSMatt Macy {
780eda14cbcSMatt Macy 	return (random_get_bytes_common(ptr, len, urandom_fd));
781eda14cbcSMatt Macy }
782eda14cbcSMatt Macy 
783eda14cbcSMatt Macy int
ddi_strtoull(const char * str,char ** nptr,int base,u_longlong_t * result)784eda14cbcSMatt Macy ddi_strtoull(const char *str, char **nptr, int base, u_longlong_t *result)
785eda14cbcSMatt Macy {
78615f0b8c3SMartin Matuska 	errno = 0;
78715f0b8c3SMartin Matuska 	*result = strtoull(str, nptr, base);
788eda14cbcSMatt Macy 	if (*result == 0)
789eda14cbcSMatt Macy 		return (errno);
790eda14cbcSMatt Macy 	return (0);
791eda14cbcSMatt Macy }
792eda14cbcSMatt Macy 
793eda14cbcSMatt Macy utsname_t *
utsname(void)794eda14cbcSMatt Macy utsname(void)
795eda14cbcSMatt Macy {
796eda14cbcSMatt Macy 	return (&hw_utsname);
797eda14cbcSMatt Macy }
798eda14cbcSMatt Macy 
799eda14cbcSMatt Macy /*
800eda14cbcSMatt Macy  * =========================================================================
801eda14cbcSMatt Macy  * kernel emulation setup & teardown
802eda14cbcSMatt Macy  * =========================================================================
803eda14cbcSMatt Macy  */
/*
 * Out-of-memory handler: report the condition on stderr and abort().
 */
static int
umem_out_of_memory(void)
{
	(void) fputs("out of memory -- generating core dump\n", stderr);
	abort();
	return (0);	/* not reached */
}
813eda14cbcSMatt Macy 
814eda14cbcSMatt Macy void
kernel_init(int mode)815eda14cbcSMatt Macy kernel_init(int mode)
816eda14cbcSMatt Macy {
817eda14cbcSMatt Macy 	extern uint_t rrw_tsd_key;
818eda14cbcSMatt Macy 
819eda14cbcSMatt Macy 	umem_nofail_callback(umem_out_of_memory);
820eda14cbcSMatt Macy 
821eda14cbcSMatt Macy 	physmem = sysconf(_SC_PHYS_PAGES);
822eda14cbcSMatt Macy 
82333b8c039SMartin Matuska 	dprintf("physmem = %llu pages (%.2f GB)\n", (u_longlong_t)physmem,
824eda14cbcSMatt Macy 	    (double)physmem * sysconf(_SC_PAGE_SIZE) / (1ULL << 30));
825eda14cbcSMatt Macy 
826716fd348SMartin Matuska 	hostid = (mode & SPA_MODE_WRITE) ? get_system_hostid() : 0;
827eda14cbcSMatt Macy 
828eda14cbcSMatt Macy 	random_init();
829eda14cbcSMatt Macy 
830eda14cbcSMatt Macy 	VERIFY0(uname(&hw_utsname));
831eda14cbcSMatt Macy 
832eda14cbcSMatt Macy 	system_taskq_init();
833eda14cbcSMatt Macy 	icp_init();
834eda14cbcSMatt Macy 
835eda14cbcSMatt Macy 	zstd_init();
836eda14cbcSMatt Macy 
837eda14cbcSMatt Macy 	spa_init((spa_mode_t)mode);
838eda14cbcSMatt Macy 
839eda14cbcSMatt Macy 	fletcher_4_init();
840eda14cbcSMatt Macy 
841eda14cbcSMatt Macy 	tsd_create(&rrw_tsd_key, rrw_tsd_destroy);
842eda14cbcSMatt Macy }
843eda14cbcSMatt Macy 
/*
 * Tear down the userland kernel emulation by calling each subsystem's
 * fini routine, ending with the random device descriptors.
 */
void
kernel_fini(void)
{
	fletcher_4_fini();
	spa_fini();

	zstd_fini();

	icp_fini();
	system_taskq_fini();

	/* closes the random device descriptors */
	random_fini();
}
857eda14cbcSMatt Macy 
858eda14cbcSMatt Macy uid_t
crgetuid(cred_t * cr)859eda14cbcSMatt Macy crgetuid(cred_t *cr)
860eda14cbcSMatt Macy {
861e92ffd9bSMartin Matuska 	(void) cr;
862eda14cbcSMatt Macy 	return (0);
863eda14cbcSMatt Macy }
864eda14cbcSMatt Macy 
865eda14cbcSMatt Macy uid_t
crgetruid(cred_t * cr)866eda14cbcSMatt Macy crgetruid(cred_t *cr)
867eda14cbcSMatt Macy {
868e92ffd9bSMartin Matuska 	(void) cr;
869eda14cbcSMatt Macy 	return (0);
870eda14cbcSMatt Macy }
871eda14cbcSMatt Macy 
872eda14cbcSMatt Macy gid_t
crgetgid(cred_t * cr)873eda14cbcSMatt Macy crgetgid(cred_t *cr)
874eda14cbcSMatt Macy {
875e92ffd9bSMartin Matuska 	(void) cr;
876eda14cbcSMatt Macy 	return (0);
877eda14cbcSMatt Macy }
878eda14cbcSMatt Macy 
879eda14cbcSMatt Macy int
crgetngroups(cred_t * cr)880eda14cbcSMatt Macy crgetngroups(cred_t *cr)
881eda14cbcSMatt Macy {
882e92ffd9bSMartin Matuska 	(void) cr;
883eda14cbcSMatt Macy 	return (0);
884eda14cbcSMatt Macy }
885eda14cbcSMatt Macy 
886eda14cbcSMatt Macy gid_t *
crgetgroups(cred_t * cr)887eda14cbcSMatt Macy crgetgroups(cred_t *cr)
888eda14cbcSMatt Macy {
889e92ffd9bSMartin Matuska 	(void) cr;
890eda14cbcSMatt Macy 	return (NULL);
891eda14cbcSMatt Macy }
892eda14cbcSMatt Macy 
893eda14cbcSMatt Macy int
zfs_secpolicy_snapshot_perms(const char * name,cred_t * cr)894eda14cbcSMatt Macy zfs_secpolicy_snapshot_perms(const char *name, cred_t *cr)
895eda14cbcSMatt Macy {
896e92ffd9bSMartin Matuska 	(void) name, (void) cr;
897eda14cbcSMatt Macy 	return (0);
898eda14cbcSMatt Macy }
899eda14cbcSMatt Macy 
900eda14cbcSMatt Macy int
zfs_secpolicy_rename_perms(const char * from,const char * to,cred_t * cr)901eda14cbcSMatt Macy zfs_secpolicy_rename_perms(const char *from, const char *to, cred_t *cr)
902eda14cbcSMatt Macy {
903e92ffd9bSMartin Matuska 	(void) from, (void) to, (void) cr;
904eda14cbcSMatt Macy 	return (0);
905eda14cbcSMatt Macy }
906eda14cbcSMatt Macy 
907eda14cbcSMatt Macy int
zfs_secpolicy_destroy_perms(const char * name,cred_t * cr)908eda14cbcSMatt Macy zfs_secpolicy_destroy_perms(const char *name, cred_t *cr)
909eda14cbcSMatt Macy {
910e92ffd9bSMartin Matuska 	(void) name, (void) cr;
911eda14cbcSMatt Macy 	return (0);
912eda14cbcSMatt Macy }
913eda14cbcSMatt Macy 
914eda14cbcSMatt Macy int
secpolicy_zfs(const cred_t * cr)915eda14cbcSMatt Macy secpolicy_zfs(const cred_t *cr)
916eda14cbcSMatt Macy {
917e92ffd9bSMartin Matuska 	(void) cr;
918eda14cbcSMatt Macy 	return (0);
919eda14cbcSMatt Macy }
920eda14cbcSMatt Macy 
921eda14cbcSMatt Macy ksiddomain_t *
ksid_lookupdomain(const char * dom)922eda14cbcSMatt Macy ksid_lookupdomain(const char *dom)
923eda14cbcSMatt Macy {
924eda14cbcSMatt Macy 	ksiddomain_t *kd;
925eda14cbcSMatt Macy 
926eda14cbcSMatt Macy 	kd = umem_zalloc(sizeof (ksiddomain_t), UMEM_NOFAIL);
927eda14cbcSMatt Macy 	kd->kd_name = spa_strdup(dom);
928eda14cbcSMatt Macy 	return (kd);
929eda14cbcSMatt Macy }
930eda14cbcSMatt Macy 
931eda14cbcSMatt Macy void
ksiddomain_rele(ksiddomain_t * ksid)932eda14cbcSMatt Macy ksiddomain_rele(ksiddomain_t *ksid)
933eda14cbcSMatt Macy {
934eda14cbcSMatt Macy 	spa_strfree(ksid->kd_name);
935eda14cbcSMatt Macy 	umem_free(ksid, sizeof (ksiddomain_t));
936eda14cbcSMatt Macy }
937eda14cbcSMatt Macy 
/*
 * Format into a buffer allocated by vasprintf() and return it.
 *
 * The formatting is done on a copy of adx, so the caller's va_list is not
 * consumed.  A vasprintf() failure trips VERIFY().
 */
char *
kmem_vasprintf(const char *fmt, va_list adx)
{
	va_list adx_copy;
	char *buf = NULL;

	va_copy(adx_copy, adx);
	VERIFY(vasprintf(&buf, fmt, adx_copy) != -1);
	va_end(adx_copy);

	return (buf);
}
950eda14cbcSMatt Macy 
/*
 * Variadic formatter: returns a buffer allocated by vasprintf() holding
 * the formatted text.  A vasprintf() failure trips VERIFY().
 */
char *
kmem_asprintf(const char *fmt, ...)
{
	va_list adx;
	char *buf = NULL;

	va_start(adx, fmt);
	VERIFY(vasprintf(&buf, fmt, adx) != -1);
	va_end(adx);

	return (buf);
}
963eda14cbcSMatt Macy 
/*
 * snprintf() returns the number of characters that it would have printed
 * whenever it is limited by the value of the size variable, rather than
 * the number of characters that it did print. This can cause misbehavior on
 * subsequent uses of the return value, so we define a safe version that
 * returns the number of characters actually stored, not counting the
 * terminating NUL.  Subsequent use of this by the safe string functions is
 * safe whether it is snprintf(), strlcat() or strlcpy().
 *
 * str  - destination buffer
 * size - size of the destination buffer in bytes
 * fmt  - printf-style format, followed by its arguments
 *
 * Returns a value in [0, size - 1], or 0 when size is 0.  If vsnprintf()
 * reports an error, str is set to the empty string and 0 is returned.
 */
int
kmem_scnprintf(char *restrict str, size_t size, const char *restrict fmt, ...)
{
	int n;
	va_list ap;

	/* Make the 0 case a no-op so that we do not return -1 */
	if (size == 0)
		return (0);

	va_start(ap, fmt);
	n = vsnprintf(str, size, fmt, ap);
	va_end(ap);

	/*
	 * Handle failure explicitly instead of relying on the negative
	 * value being converted to a huge size_t in the comparison below:
	 * nothing usable was printed, so report an empty string.
	 */
	if (n < 0) {
		str[0] = '\0';
		return (0);
	}

	/* output was truncated: report what actually fits */
	if ((size_t)n >= size)
		n = (int)(size - 1);

	return (n);
}
992dbd5678dSMartin Matuska 
9935eb61f6cSMartin Matuska zfs_file_t *
zfs_onexit_fd_hold(int fd,minor_t * minorp)994eda14cbcSMatt Macy zfs_onexit_fd_hold(int fd, minor_t *minorp)
995eda14cbcSMatt Macy {
996e92ffd9bSMartin Matuska 	(void) fd;
997eda14cbcSMatt Macy 	*minorp = 0;
9985eb61f6cSMartin Matuska 	return (NULL);
999eda14cbcSMatt Macy }
1000eda14cbcSMatt Macy 
1001eda14cbcSMatt Macy void
zfs_onexit_fd_rele(zfs_file_t * fp)10025eb61f6cSMartin Matuska zfs_onexit_fd_rele(zfs_file_t *fp)
1003eda14cbcSMatt Macy {
1004e92ffd9bSMartin Matuska 	(void) fp;
1005eda14cbcSMatt Macy }
1006eda14cbcSMatt Macy 
1007eda14cbcSMatt Macy int
zfs_onexit_add_cb(minor_t minor,void (* func)(void *),void * data,uintptr_t * action_handle)1008eda14cbcSMatt Macy zfs_onexit_add_cb(minor_t minor, void (*func)(void *), void *data,
1009dbd5678dSMartin Matuska     uintptr_t *action_handle)
1010eda14cbcSMatt Macy {
1011e92ffd9bSMartin Matuska 	(void) minor, (void) func, (void) data, (void) action_handle;
1012eda14cbcSMatt Macy 	return (0);
1013eda14cbcSMatt Macy }
1014eda14cbcSMatt Macy 
1015eda14cbcSMatt Macy fstrans_cookie_t
spl_fstrans_mark(void)1016eda14cbcSMatt Macy spl_fstrans_mark(void)
1017eda14cbcSMatt Macy {
1018eda14cbcSMatt Macy 	return ((fstrans_cookie_t)0);
1019eda14cbcSMatt Macy }
1020eda14cbcSMatt Macy 
1021eda14cbcSMatt Macy void
spl_fstrans_unmark(fstrans_cookie_t cookie)1022eda14cbcSMatt Macy spl_fstrans_unmark(fstrans_cookie_t cookie)
1023eda14cbcSMatt Macy {
1024e92ffd9bSMartin Matuska 	(void) cookie;
1025eda14cbcSMatt Macy }
1026eda14cbcSMatt Macy 
/*
 * Stub: always returns 0.
 */
int
__spl_pf_fstrans_check(void)
{
	const int marked = 0;

	return (marked);
}
1032eda14cbcSMatt Macy 
/*
 * Stub: always returns 0.
 */
int
kmem_cache_reap_active(void)
{
	const int active = 0;

	return (active);
}
1038eda14cbcSMatt Macy 
/*
 * Stub: the name is ignored and nothing is done.
 */
void
zvol_create_minor(const char *name)
{
	(void) name;
}
1044eda14cbcSMatt Macy 
/*
 * Stub: the name is ignored and nothing is done.
 */
void
zvol_create_minors_recursive(const char *name)
{
	(void) name;
}
1050eda14cbcSMatt Macy 
1051eda14cbcSMatt Macy void
zvol_remove_minors(spa_t * spa,const char * name,boolean_t async)1052eda14cbcSMatt Macy zvol_remove_minors(spa_t *spa, const char *name, boolean_t async)
1053eda14cbcSMatt Macy {
1054e92ffd9bSMartin Matuska 	(void) spa, (void) name, (void) async;
1055eda14cbcSMatt Macy }
1056eda14cbcSMatt Macy 
1057eda14cbcSMatt Macy void
zvol_rename_minors(spa_t * spa,const char * oldname,const char * newname,boolean_t async)1058eda14cbcSMatt Macy zvol_rename_minors(spa_t *spa, const char *oldname, const char *newname,
1059eda14cbcSMatt Macy     boolean_t async)
1060eda14cbcSMatt Macy {
1061e92ffd9bSMartin Matuska 	(void) spa, (void) oldname, (void) newname, (void) async;
1062eda14cbcSMatt Macy }
1063eda14cbcSMatt Macy 
1064eda14cbcSMatt Macy /*
1065eda14cbcSMatt Macy  * Open file
1066eda14cbcSMatt Macy  *
1067eda14cbcSMatt Macy  * path - fully qualified path to file
1068eda14cbcSMatt Macy  * flags - file attributes O_READ / O_WRITE / O_EXCL
1069eda14cbcSMatt Macy  * fpp - pointer to return file pointer
1070eda14cbcSMatt Macy  *
1071eda14cbcSMatt Macy  * Returns 0 on success underlying error on failure.
1072eda14cbcSMatt Macy  */
1073eda14cbcSMatt Macy int
zfs_file_open(const char * path,int flags,int mode,zfs_file_t ** fpp)1074eda14cbcSMatt Macy zfs_file_open(const char *path, int flags, int mode, zfs_file_t **fpp)
1075eda14cbcSMatt Macy {
1076eda14cbcSMatt Macy 	int fd = -1;
1077eda14cbcSMatt Macy 	int dump_fd = -1;
1078eda14cbcSMatt Macy 	int err;
1079eda14cbcSMatt Macy 	int old_umask = 0;
1080eda14cbcSMatt Macy 	zfs_file_t *fp;
1081eda14cbcSMatt Macy 	struct stat64 st;
1082eda14cbcSMatt Macy 
1083eda14cbcSMatt Macy 	if (!(flags & O_CREAT) && stat64(path, &st) == -1)
1084eda14cbcSMatt Macy 		return (errno);
1085eda14cbcSMatt Macy 
1086eda14cbcSMatt Macy 	if (!(flags & O_CREAT) && S_ISBLK(st.st_mode))
1087eda14cbcSMatt Macy 		flags |= O_DIRECT;
1088eda14cbcSMatt Macy 
1089eda14cbcSMatt Macy 	if (flags & O_CREAT)
1090eda14cbcSMatt Macy 		old_umask = umask(0);
1091eda14cbcSMatt Macy 
1092eda14cbcSMatt Macy 	fd = open64(path, flags, mode);
1093eda14cbcSMatt Macy 	if (fd == -1)
1094eda14cbcSMatt Macy 		return (errno);
1095eda14cbcSMatt Macy 
1096eda14cbcSMatt Macy 	if (flags & O_CREAT)
1097eda14cbcSMatt Macy 		(void) umask(old_umask);
1098eda14cbcSMatt Macy 
1099eda14cbcSMatt Macy 	if (vn_dumpdir != NULL) {
1100eda14cbcSMatt Macy 		char *dumppath = umem_zalloc(MAXPATHLEN, UMEM_NOFAIL);
11013ff01b23SMartin Matuska 		const char *inpath = zfs_basename(path);
1102eda14cbcSMatt Macy 
1103eda14cbcSMatt Macy 		(void) snprintf(dumppath, MAXPATHLEN,
1104eda14cbcSMatt Macy 		    "%s/%s", vn_dumpdir, inpath);
1105eda14cbcSMatt Macy 		dump_fd = open64(dumppath, O_CREAT | O_WRONLY, 0666);
1106eda14cbcSMatt Macy 		umem_free(dumppath, MAXPATHLEN);
1107eda14cbcSMatt Macy 		if (dump_fd == -1) {
1108eda14cbcSMatt Macy 			err = errno;
1109eda14cbcSMatt Macy 			close(fd);
1110eda14cbcSMatt Macy 			return (err);
1111eda14cbcSMatt Macy 		}
1112eda14cbcSMatt Macy 	} else {
1113eda14cbcSMatt Macy 		dump_fd = -1;
1114eda14cbcSMatt Macy 	}
1115eda14cbcSMatt Macy 
1116eda14cbcSMatt Macy 	(void) fcntl(fd, F_SETFD, FD_CLOEXEC);
1117eda14cbcSMatt Macy 
1118eda14cbcSMatt Macy 	fp = umem_zalloc(sizeof (zfs_file_t), UMEM_NOFAIL);
1119eda14cbcSMatt Macy 	fp->f_fd = fd;
1120eda14cbcSMatt Macy 	fp->f_dump_fd = dump_fd;
1121eda14cbcSMatt Macy 	*fpp = fp;
1122eda14cbcSMatt Macy 
1123eda14cbcSMatt Macy 	return (0);
1124eda14cbcSMatt Macy }
1125eda14cbcSMatt Macy 
1126eda14cbcSMatt Macy void
zfs_file_close(zfs_file_t * fp)1127eda14cbcSMatt Macy zfs_file_close(zfs_file_t *fp)
1128eda14cbcSMatt Macy {
1129eda14cbcSMatt Macy 	close(fp->f_fd);
1130eda14cbcSMatt Macy 	if (fp->f_dump_fd != -1)
1131eda14cbcSMatt Macy 		close(fp->f_dump_fd);
1132eda14cbcSMatt Macy 
1133eda14cbcSMatt Macy 	umem_free(fp, sizeof (zfs_file_t));
1134eda14cbcSMatt Macy }
1135eda14cbcSMatt Macy 
1136eda14cbcSMatt Macy /*
1137eda14cbcSMatt Macy  * Stateful write - use os internal file pointer to determine where to
1138eda14cbcSMatt Macy  * write and update on successful completion.
1139eda14cbcSMatt Macy  *
1140eda14cbcSMatt Macy  * fp -  pointer to file (pipe, socket, etc) to write to
1141eda14cbcSMatt Macy  * buf - buffer to write
1142eda14cbcSMatt Macy  * count - # of bytes to write
1143eda14cbcSMatt Macy  * resid -  pointer to count of unwritten bytes  (if short write)
1144eda14cbcSMatt Macy  *
1145eda14cbcSMatt Macy  * Returns 0 on success errno on failure.
1146eda14cbcSMatt Macy  */
1147eda14cbcSMatt Macy int
zfs_file_write(zfs_file_t * fp,const void * buf,size_t count,ssize_t * resid)1148eda14cbcSMatt Macy zfs_file_write(zfs_file_t *fp, const void *buf, size_t count, ssize_t *resid)
1149eda14cbcSMatt Macy {
1150eda14cbcSMatt Macy 	ssize_t rc;
1151eda14cbcSMatt Macy 
1152eda14cbcSMatt Macy 	rc = write(fp->f_fd, buf, count);
1153eda14cbcSMatt Macy 	if (rc < 0)
1154eda14cbcSMatt Macy 		return (errno);
1155eda14cbcSMatt Macy 
1156eda14cbcSMatt Macy 	if (resid) {
1157eda14cbcSMatt Macy 		*resid = count - rc;
1158eda14cbcSMatt Macy 	} else if (rc != count) {
1159eda14cbcSMatt Macy 		return (EIO);
1160eda14cbcSMatt Macy 	}
1161eda14cbcSMatt Macy 
1162eda14cbcSMatt Macy 	return (0);
1163eda14cbcSMatt Macy }
1164eda14cbcSMatt Macy 
1165eda14cbcSMatt Macy /*
1166eda14cbcSMatt Macy  * Stateless write - os internal file pointer is not updated.
1167eda14cbcSMatt Macy  *
1168eda14cbcSMatt Macy  * fp -  pointer to file (pipe, socket, etc) to write to
1169eda14cbcSMatt Macy  * buf - buffer to write
1170eda14cbcSMatt Macy  * count - # of bytes to write
1171eda14cbcSMatt Macy  * off - file offset to write to (only valid for seekable types)
1172eda14cbcSMatt Macy  * resid -  pointer to count of unwritten bytes
1173eda14cbcSMatt Macy  *
1174eda14cbcSMatt Macy  * Returns 0 on success errno on failure.
1175eda14cbcSMatt Macy  */
1176eda14cbcSMatt Macy int
zfs_file_pwrite(zfs_file_t * fp,const void * buf,size_t count,loff_t pos,ssize_t * resid)1177eda14cbcSMatt Macy zfs_file_pwrite(zfs_file_t *fp, const void *buf,
1178eda14cbcSMatt Macy     size_t count, loff_t pos, ssize_t *resid)
1179eda14cbcSMatt Macy {
1180eda14cbcSMatt Macy 	ssize_t rc, split, done;
1181eda14cbcSMatt Macy 	int sectors;
1182eda14cbcSMatt Macy 
1183eda14cbcSMatt Macy 	/*
1184eda14cbcSMatt Macy 	 * To simulate partial disk writes, we split writes into two
1185eda14cbcSMatt Macy 	 * system calls so that the process can be killed in between.
1186eda14cbcSMatt Macy 	 * This is used by ztest to simulate realistic failure modes.
1187eda14cbcSMatt Macy 	 */
1188eda14cbcSMatt Macy 	sectors = count >> SPA_MINBLOCKSHIFT;
1189eda14cbcSMatt Macy 	split = (sectors > 0 ? rand() % sectors : 0) << SPA_MINBLOCKSHIFT;
1190eda14cbcSMatt Macy 	rc = pwrite64(fp->f_fd, buf, split, pos);
1191eda14cbcSMatt Macy 	if (rc != -1) {
1192eda14cbcSMatt Macy 		done = rc;
1193eda14cbcSMatt Macy 		rc = pwrite64(fp->f_fd, (char *)buf + split,
1194eda14cbcSMatt Macy 		    count - split, pos + split);
1195eda14cbcSMatt Macy 	}
1196eda14cbcSMatt Macy #ifdef __linux__
1197eda14cbcSMatt Macy 	if (rc == -1 && errno == EINVAL) {
1198eda14cbcSMatt Macy 		/*
1199eda14cbcSMatt Macy 		 * Under Linux, this most likely means an alignment issue
1200eda14cbcSMatt Macy 		 * (memory or disk) due to O_DIRECT, so we abort() in order
1201eda14cbcSMatt Macy 		 * to catch the offender.
1202eda14cbcSMatt Macy 		 */
1203eda14cbcSMatt Macy 		abort();
1204eda14cbcSMatt Macy 	}
1205eda14cbcSMatt Macy #endif
1206eda14cbcSMatt Macy 
1207eda14cbcSMatt Macy 	if (rc < 0)
1208eda14cbcSMatt Macy 		return (errno);
1209eda14cbcSMatt Macy 
1210eda14cbcSMatt Macy 	done += rc;
1211eda14cbcSMatt Macy 
1212eda14cbcSMatt Macy 	if (resid) {
1213eda14cbcSMatt Macy 		*resid = count - done;
1214eda14cbcSMatt Macy 	} else if (done != count) {
1215eda14cbcSMatt Macy 		return (EIO);
1216eda14cbcSMatt Macy 	}
1217eda14cbcSMatt Macy 
1218eda14cbcSMatt Macy 	return (0);
1219eda14cbcSMatt Macy }
1220eda14cbcSMatt Macy 
1221eda14cbcSMatt Macy /*
1222eda14cbcSMatt Macy  * Stateful read - use os internal file pointer to determine where to
1223eda14cbcSMatt Macy  * read and update on successful completion.
1224eda14cbcSMatt Macy  *
1225eda14cbcSMatt Macy  * fp -  pointer to file (pipe, socket, etc) to read from
1226eda14cbcSMatt Macy  * buf - buffer to write
1227eda14cbcSMatt Macy  * count - # of bytes to read
1228eda14cbcSMatt Macy  * resid -  pointer to count of unread bytes (if short read)
1229eda14cbcSMatt Macy  *
1230eda14cbcSMatt Macy  * Returns 0 on success errno on failure.
1231eda14cbcSMatt Macy  */
1232eda14cbcSMatt Macy int
zfs_file_read(zfs_file_t * fp,void * buf,size_t count,ssize_t * resid)1233eda14cbcSMatt Macy zfs_file_read(zfs_file_t *fp, void *buf, size_t count, ssize_t *resid)
1234eda14cbcSMatt Macy {
1235eda14cbcSMatt Macy 	int rc;
1236eda14cbcSMatt Macy 
1237eda14cbcSMatt Macy 	rc = read(fp->f_fd, buf, count);
1238eda14cbcSMatt Macy 	if (rc < 0)
1239eda14cbcSMatt Macy 		return (errno);
1240eda14cbcSMatt Macy 
1241eda14cbcSMatt Macy 	if (resid) {
1242eda14cbcSMatt Macy 		*resid = count - rc;
1243eda14cbcSMatt Macy 	} else if (rc != count) {
1244eda14cbcSMatt Macy 		return (EIO);
1245eda14cbcSMatt Macy 	}
1246eda14cbcSMatt Macy 
1247eda14cbcSMatt Macy 	return (0);
1248eda14cbcSMatt Macy }
1249eda14cbcSMatt Macy 
1250eda14cbcSMatt Macy /*
1251eda14cbcSMatt Macy  * Stateless read - os internal file pointer is not updated.
1252eda14cbcSMatt Macy  *
1253eda14cbcSMatt Macy  * fp -  pointer to file (pipe, socket, etc) to read from
1254eda14cbcSMatt Macy  * buf - buffer to write
1255eda14cbcSMatt Macy  * count - # of bytes to write
1256eda14cbcSMatt Macy  * off - file offset to read from (only valid for seekable types)
1257eda14cbcSMatt Macy  * resid -  pointer to count of unwritten bytes (if short write)
1258eda14cbcSMatt Macy  *
1259eda14cbcSMatt Macy  * Returns 0 on success errno on failure.
1260eda14cbcSMatt Macy  */
1261eda14cbcSMatt Macy int
zfs_file_pread(zfs_file_t * fp,void * buf,size_t count,loff_t off,ssize_t * resid)1262eda14cbcSMatt Macy zfs_file_pread(zfs_file_t *fp, void *buf, size_t count, loff_t off,
1263eda14cbcSMatt Macy     ssize_t *resid)
1264eda14cbcSMatt Macy {
1265eda14cbcSMatt Macy 	ssize_t rc;
1266eda14cbcSMatt Macy 
1267eda14cbcSMatt Macy 	rc = pread64(fp->f_fd, buf, count, off);
1268eda14cbcSMatt Macy 	if (rc < 0) {
1269eda14cbcSMatt Macy #ifdef __linux__
1270eda14cbcSMatt Macy 		/*
1271eda14cbcSMatt Macy 		 * Under Linux, this most likely means an alignment issue
1272eda14cbcSMatt Macy 		 * (memory or disk) due to O_DIRECT, so we abort() in order to
1273eda14cbcSMatt Macy 		 * catch the offender.
1274eda14cbcSMatt Macy 		 */
1275eda14cbcSMatt Macy 		if (errno == EINVAL)
1276eda14cbcSMatt Macy 			abort();
1277eda14cbcSMatt Macy #endif
1278eda14cbcSMatt Macy 		return (errno);
1279eda14cbcSMatt Macy 	}
1280eda14cbcSMatt Macy 
1281eda14cbcSMatt Macy 	if (fp->f_dump_fd != -1) {
1282eda14cbcSMatt Macy 		int status;
1283eda14cbcSMatt Macy 
1284eda14cbcSMatt Macy 		status = pwrite64(fp->f_dump_fd, buf, rc, off);
1285eda14cbcSMatt Macy 		ASSERT(status != -1);
1286eda14cbcSMatt Macy 	}
1287eda14cbcSMatt Macy 
1288eda14cbcSMatt Macy 	if (resid) {
1289eda14cbcSMatt Macy 		*resid = count - rc;
1290eda14cbcSMatt Macy 	} else if (rc != count) {
1291eda14cbcSMatt Macy 		return (EIO);
1292eda14cbcSMatt Macy 	}
1293eda14cbcSMatt Macy 
1294eda14cbcSMatt Macy 	return (0);
1295eda14cbcSMatt Macy }
1296eda14cbcSMatt Macy 
1297eda14cbcSMatt Macy /*
1298eda14cbcSMatt Macy  * lseek - set / get file pointer
1299eda14cbcSMatt Macy  *
1300eda14cbcSMatt Macy  * fp -  pointer to file (pipe, socket, etc) to read from
1301eda14cbcSMatt Macy  * offp - value to seek to, returns current value plus passed offset
1302eda14cbcSMatt Macy  * whence - see man pages for standard lseek whence values
1303eda14cbcSMatt Macy  *
1304eda14cbcSMatt Macy  * Returns 0 on success errno on failure (ESPIPE for non seekable types)
1305eda14cbcSMatt Macy  */
1306eda14cbcSMatt Macy int
zfs_file_seek(zfs_file_t * fp,loff_t * offp,int whence)1307eda14cbcSMatt Macy zfs_file_seek(zfs_file_t *fp, loff_t *offp, int whence)
1308eda14cbcSMatt Macy {
1309eda14cbcSMatt Macy 	loff_t rc;
1310eda14cbcSMatt Macy 
1311eda14cbcSMatt Macy 	rc = lseek(fp->f_fd, *offp, whence);
1312eda14cbcSMatt Macy 	if (rc < 0)
1313eda14cbcSMatt Macy 		return (errno);
1314eda14cbcSMatt Macy 
1315eda14cbcSMatt Macy 	*offp = rc;
1316eda14cbcSMatt Macy 
1317eda14cbcSMatt Macy 	return (0);
1318eda14cbcSMatt Macy }
1319eda14cbcSMatt Macy 
1320eda14cbcSMatt Macy /*
1321eda14cbcSMatt Macy  * Get file attributes
1322eda14cbcSMatt Macy  *
1323eda14cbcSMatt Macy  * filp - file pointer
1324eda14cbcSMatt Macy  * zfattr - pointer to file attr structure
1325eda14cbcSMatt Macy  *
1326eda14cbcSMatt Macy  * Currently only used for fetching size and file mode
1327eda14cbcSMatt Macy  *
1328eda14cbcSMatt Macy  * Returns 0 on success or error code of underlying getattr call on failure.
1329eda14cbcSMatt Macy  */
1330eda14cbcSMatt Macy int
zfs_file_getattr(zfs_file_t * fp,zfs_file_attr_t * zfattr)1331eda14cbcSMatt Macy zfs_file_getattr(zfs_file_t *fp, zfs_file_attr_t *zfattr)
1332eda14cbcSMatt Macy {
1333eda14cbcSMatt Macy 	struct stat64 st;
1334eda14cbcSMatt Macy 
1335eda14cbcSMatt Macy 	if (fstat64_blk(fp->f_fd, &st) == -1)
1336eda14cbcSMatt Macy 		return (errno);
1337eda14cbcSMatt Macy 
1338eda14cbcSMatt Macy 	zfattr->zfa_size = st.st_size;
1339eda14cbcSMatt Macy 	zfattr->zfa_mode = st.st_mode;
1340eda14cbcSMatt Macy 
1341eda14cbcSMatt Macy 	return (0);
1342eda14cbcSMatt Macy }
1343eda14cbcSMatt Macy 
1344eda14cbcSMatt Macy /*
1345eda14cbcSMatt Macy  * Sync file to disk
1346eda14cbcSMatt Macy  *
1347eda14cbcSMatt Macy  * filp - file pointer
1348eda14cbcSMatt Macy  * flags - O_SYNC and or O_DSYNC
1349eda14cbcSMatt Macy  *
1350eda14cbcSMatt Macy  * Returns 0 on success or error code of underlying sync call on failure.
1351eda14cbcSMatt Macy  */
1352eda14cbcSMatt Macy int
zfs_file_fsync(zfs_file_t * fp,int flags)1353eda14cbcSMatt Macy zfs_file_fsync(zfs_file_t *fp, int flags)
1354eda14cbcSMatt Macy {
1355e92ffd9bSMartin Matuska 	(void) flags;
1356eda14cbcSMatt Macy 
1357e92ffd9bSMartin Matuska 	if (fsync(fp->f_fd) < 0)
1358eda14cbcSMatt Macy 		return (errno);
1359eda14cbcSMatt Macy 
1360eda14cbcSMatt Macy 	return (0);
1361eda14cbcSMatt Macy }
1362eda14cbcSMatt Macy 
1363eda14cbcSMatt Macy /*
13647a7741afSMartin Matuska  * deallocate - zero and/or deallocate file storage
1365eda14cbcSMatt Macy  *
1366eda14cbcSMatt Macy  * fp - file pointer
13677a7741afSMartin Matuska  * offset - offset to start zeroing or deallocating
13687a7741afSMartin Matuska  * len - length to zero or deallocate
1369eda14cbcSMatt Macy  */
1370eda14cbcSMatt Macy int
zfs_file_deallocate(zfs_file_t * fp,loff_t offset,loff_t len)13717a7741afSMartin Matuska zfs_file_deallocate(zfs_file_t *fp, loff_t offset, loff_t len)
1372eda14cbcSMatt Macy {
13737a7741afSMartin Matuska 	int rc;
13747a7741afSMartin Matuska #if defined(__linux__)
13757a7741afSMartin Matuska 	rc = fallocate(fp->f_fd,
13767a7741afSMartin Matuska 	    FALLOC_FL_PUNCH_HOLE | FALLOC_FL_KEEP_SIZE, offset, len);
13777a7741afSMartin Matuska #elif defined(__FreeBSD__) && (__FreeBSD_version >= 1400029)
13787a7741afSMartin Matuska 	struct spacectl_range rqsr = {
13797a7741afSMartin Matuska 		.r_offset = offset,
13807a7741afSMartin Matuska 		.r_len = len,
13817a7741afSMartin Matuska 	};
13827a7741afSMartin Matuska 	rc = fspacectl(fp->f_fd, SPACECTL_DEALLOC, &rqsr, 0, &rqsr);
1383eda14cbcSMatt Macy #else
13847a7741afSMartin Matuska 	(void) fp, (void) offset, (void) len;
13857a7741afSMartin Matuska 	rc = EOPNOTSUPP;
1386eda14cbcSMatt Macy #endif
13877a7741afSMartin Matuska 	if (rc)
13887a7741afSMartin Matuska 		return (SET_ERROR(rc));
13897a7741afSMartin Matuska 	return (0);
1390eda14cbcSMatt Macy }
1391eda14cbcSMatt Macy 
1392eda14cbcSMatt Macy /*
1393eda14cbcSMatt Macy  * Request current file pointer offset
1394eda14cbcSMatt Macy  *
1395eda14cbcSMatt Macy  * fp - pointer to file
1396eda14cbcSMatt Macy  *
1397eda14cbcSMatt Macy  * Returns current file offset.
1398eda14cbcSMatt Macy  */
1399eda14cbcSMatt Macy loff_t
zfs_file_off(zfs_file_t * fp)1400eda14cbcSMatt Macy zfs_file_off(zfs_file_t *fp)
1401eda14cbcSMatt Macy {
1402eda14cbcSMatt Macy 	return (lseek(fp->f_fd, SEEK_CUR, 0));
1403eda14cbcSMatt Macy }
1404eda14cbcSMatt Macy 
/*
 * Remove the file named by a path.
 *
 * path - fully qualified file path
 *
 * Returns 0 on success; otherwise the result of remove() is passed
 * through unchanged.
 *
 * OPTIONAL
 */
int
zfs_file_unlink(const char *path)
{
	int rc = remove(path);

	return (rc);
}
1419eda14cbcSMatt Macy 
1420eda14cbcSMatt Macy /*
1421eda14cbcSMatt Macy  * Get reference to file pointer
1422eda14cbcSMatt Macy  *
1423eda14cbcSMatt Macy  * fd - input file descriptor
1424eda14cbcSMatt Macy  *
14255eb61f6cSMartin Matuska  * Returns pointer to file struct or NULL.
1426eda14cbcSMatt Macy  * Unsupported in user space.
1427eda14cbcSMatt Macy  */
14285eb61f6cSMartin Matuska zfs_file_t *
zfs_file_get(int fd)14295eb61f6cSMartin Matuska zfs_file_get(int fd)
1430eda14cbcSMatt Macy {
1431e92ffd9bSMartin Matuska 	(void) fd;
1432eda14cbcSMatt Macy 	abort();
14335eb61f6cSMartin Matuska 	return (NULL);
1434eda14cbcSMatt Macy }
1435eda14cbcSMatt Macy /*
1436eda14cbcSMatt Macy  * Drop reference to file pointer
1437eda14cbcSMatt Macy  *
14385eb61f6cSMartin Matuska  * fp - pointer to file struct
1439eda14cbcSMatt Macy  *
1440eda14cbcSMatt Macy  * Unsupported in user space.
1441eda14cbcSMatt Macy  */
1442eda14cbcSMatt Macy void
zfs_file_put(zfs_file_t * fp)14435eb61f6cSMartin Matuska zfs_file_put(zfs_file_t *fp)
1444eda14cbcSMatt Macy {
1445eda14cbcSMatt Macy 	abort();
1446e92ffd9bSMartin Matuska 	(void) fp;
1447eda14cbcSMatt Macy }
1448eac7052fSMatt Macy 
/*
 * Intentionally empty: both names are accepted and ignored.
 */
void
zfsvfs_update_fromname(const char *oldname, const char *newname)
{
	(void) oldname;
	(void) newname;
}
1454c03c5b1cSMartin Matuska 
1455c03c5b1cSMartin Matuska void
spa_import_os(spa_t * spa)1456c03c5b1cSMartin Matuska spa_import_os(spa_t *spa)
1457c03c5b1cSMartin Matuska {
1458c03c5b1cSMartin Matuska 	(void) spa;
1459c03c5b1cSMartin Matuska }
1460c03c5b1cSMartin Matuska 
1461c03c5b1cSMartin Matuska void
spa_export_os(spa_t * spa)1462c03c5b1cSMartin Matuska spa_export_os(spa_t *spa)
1463c03c5b1cSMartin Matuska {
1464c03c5b1cSMartin Matuska 	(void) spa;
1465c03c5b1cSMartin Matuska }
1466c03c5b1cSMartin Matuska 
1467c03c5b1cSMartin Matuska void
spa_activate_os(spa_t * spa)1468c03c5b1cSMartin Matuska spa_activate_os(spa_t *spa)
1469c03c5b1cSMartin Matuska {
1470c03c5b1cSMartin Matuska 	(void) spa;
1471c03c5b1cSMartin Matuska }
1472c03c5b1cSMartin Matuska 
1473c03c5b1cSMartin Matuska void
spa_deactivate_os(spa_t * spa)1474c03c5b1cSMartin Matuska spa_deactivate_os(spa_t *spa)
1475c03c5b1cSMartin Matuska {
1476c03c5b1cSMartin Matuska 	(void) spa;
1477c03c5b1cSMartin Matuska }
1478