xref: /freebsd/sys/ufs/ffs/ffs_suspend.c (revision 1f8b431d185416f70e96f03b8fd69b98442b1913)
1 /*-
2  * SPDX-License-Identifier: BSD-2-Clause-FreeBSD
3  *
4  * Copyright (c) 2012 The FreeBSD Foundation
5  * All rights reserved.
6  *
7  * This software was developed by Edward Tomasz Napierala under sponsorship
8  * from the FreeBSD Foundation.
9  *
10  * Redistribution and use in source and binary forms, with or without
11  * modification, are permitted provided that the following conditions
12  * are met:
13  * 1. Redistributions of source code must retain the above copyright
14  *    notice, this list of conditions and the following disclaimer.
15  * 2. Redistributions in binary form must reproduce the above copyright
16  *    notice, this list of conditions and the following disclaimer in the
17  *    documentation and/or other materials provided with the distribution.
18  *
19  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
20  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
21  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
22  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
23  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
24  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
25  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
26  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
27  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
28  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
29  * SUCH DAMAGE.
30  *
31  * $FreeBSD$
32  */
33 
34 #include <sys/cdefs.h>
35 __FBSDID("$FreeBSD$");
36 
37 #include <sys/param.h>
38 #include <sys/systm.h>
39 #include <sys/buf.h>
40 #include <sys/ioccom.h>
41 #include <sys/mount.h>
42 #include <sys/vnode.h>
43 #include <sys/conf.h>
44 #include <sys/jail.h>
45 #include <sys/sx.h>
46 
47 #include <security/mac/mac_framework.h>
48 
49 #include <ufs/ufs/extattr.h>
50 #include <ufs/ufs/quota.h>
51 #include <ufs/ufs/ufsmount.h>
52 #include <ufs/ufs/inode.h>
53 
54 #include <ufs/ffs/fs.h>
55 #include <ufs/ffs/ffs_extern.h>
56 
57 static d_open_t ffs_susp_open;
58 static d_write_t ffs_susp_rdwr;
59 static d_ioctl_t ffs_susp_ioctl;
60 
61 static struct cdevsw ffs_susp_cdevsw = {
62 	.d_version =	D_VERSION,
63 	.d_open =	ffs_susp_open,
64 	.d_read =	ffs_susp_rdwr,
65 	.d_write =	ffs_susp_rdwr,
66 	.d_ioctl =	ffs_susp_ioctl,
67 	.d_name =	"ffs_susp",
68 };
69 
70 static struct cdev *ffs_susp_dev;
71 static struct sx ffs_susp_lock;
72 
73 static int
74 ffs_susp_suspended(struct mount *mp)
75 {
76 	struct ufsmount *ump;
77 
78 	sx_assert(&ffs_susp_lock, SA_LOCKED);
79 
80 	ump = VFSTOUFS(mp);
81 	if ((ump->um_flags & UM_WRITESUSPENDED) != 0)
82 		return (1);
83 	return (0);
84 }
85 
86 static int
87 ffs_susp_open(struct cdev *dev __unused, int flags __unused,
88     int fmt __unused, struct thread *td __unused)
89 {
90 
91 	return (0);
92 }
93 
94 static int
95 ffs_susp_rdwr(struct cdev *dev, struct uio *uio, int ioflag)
96 {
97 	int error, i;
98 	struct vnode *devvp;
99 	struct mount *mp;
100 	struct ufsmount *ump;
101 	struct buf *bp;
102 	void *base;
103 	size_t len;
104 	ssize_t cnt;
105 	struct fs *fs;
106 
107 	sx_slock(&ffs_susp_lock);
108 
109 	error = devfs_get_cdevpriv((void **)&mp);
110 	if (error != 0) {
111 		sx_sunlock(&ffs_susp_lock);
112 		return (ENXIO);
113 	}
114 
115 	ump = VFSTOUFS(mp);
116 	devvp = ump->um_devvp;
117 	fs = ump->um_fs;
118 
119 	if (ffs_susp_suspended(mp) == 0) {
120 		sx_sunlock(&ffs_susp_lock);
121 		return (ENXIO);
122 	}
123 
124 	KASSERT(uio->uio_rw == UIO_READ || uio->uio_rw == UIO_WRITE,
125 	    ("neither UIO_READ or UIO_WRITE"));
126 	KASSERT(uio->uio_segflg == UIO_USERSPACE,
127 	    ("uio->uio_segflg != UIO_USERSPACE"));
128 
129 	cnt = uio->uio_resid;
130 
131 	for (i = 0; i < uio->uio_iovcnt; i++) {
132 		while (uio->uio_iov[i].iov_len) {
133 			base = uio->uio_iov[i].iov_base;
134 			len = uio->uio_iov[i].iov_len;
135 			if (len > fs->fs_bsize)
136 				len = fs->fs_bsize;
137 			if (fragoff(fs, uio->uio_offset) != 0 ||
138 			    fragoff(fs, len) != 0) {
139 				error = EINVAL;
140 				goto out;
141 			}
142 			error = bread(devvp, btodb(uio->uio_offset), len,
143 			    NOCRED, &bp);
144 			if (error != 0)
145 				goto out;
146 			if (uio->uio_rw == UIO_WRITE) {
147 				error = copyin(base, bp->b_data, len);
148 				if (error != 0) {
149 					bp->b_flags |= B_INVAL | B_NOCACHE;
150 					brelse(bp);
151 					goto out;
152 				}
153 				error = bwrite(bp);
154 				if (error != 0)
155 					goto out;
156 			} else {
157 				error = copyout(bp->b_data, base, len);
158 				brelse(bp);
159 				if (error != 0)
160 					goto out;
161 			}
162 			uio->uio_iov[i].iov_base =
163 			    (char *)uio->uio_iov[i].iov_base + len;
164 			uio->uio_iov[i].iov_len -= len;
165 			uio->uio_resid -= len;
166 			uio->uio_offset += len;
167 		}
168 	}
169 
170 out:
171 	sx_sunlock(&ffs_susp_lock);
172 
173 	if (uio->uio_resid < cnt)
174 		return (0);
175 
176 	return (error);
177 }
178 
179 static int
180 ffs_susp_suspend(struct mount *mp)
181 {
182 	struct ufsmount *ump;
183 	int error;
184 
185 	sx_assert(&ffs_susp_lock, SA_XLOCKED);
186 
187 	if (!ffs_own_mount(mp))
188 		return (EINVAL);
189 	if (ffs_susp_suspended(mp))
190 		return (EBUSY);
191 
192 	ump = VFSTOUFS(mp);
193 
194 	/*
195 	 * Make sure the calling thread is permitted to access the mounted
196 	 * device.  The permissions can change after we unlock the vnode;
197 	 * it's harmless.
198 	 */
199 	vn_lock(ump->um_devvp, LK_EXCLUSIVE | LK_RETRY);
200 	error = VOP_ACCESS(ump->um_devvp, VREAD | VWRITE,
201 	    curthread->td_ucred, curthread);
202 	VOP_UNLOCK(ump->um_devvp, 0);
203 	if (error != 0)
204 		return (error);
205 #ifdef MAC
206 	if (mac_mount_check_stat(curthread->td_ucred, mp) != 0)
207 		return (EPERM);
208 #endif
209 
210 	if ((error = vfs_write_suspend(mp, VS_SKIP_UNMOUNT)) != 0)
211 		return (error);
212 
213 	UFS_LOCK(ump);
214 	ump->um_flags |= UM_WRITESUSPENDED;
215 	UFS_UNLOCK(ump);
216 
217 	return (0);
218 }
219 
220 static void
221 ffs_susp_dtor(void *data)
222 {
223 	struct fs *fs;
224 	struct ufsmount *ump;
225 	struct mount *mp;
226 	int error;
227 
228 	sx_xlock(&ffs_susp_lock);
229 
230 	mp = (struct mount *)data;
231 	ump = VFSTOUFS(mp);
232 	fs = ump->um_fs;
233 
234 	if (ffs_susp_suspended(mp) == 0) {
235 		sx_xunlock(&ffs_susp_lock);
236 		return;
237 	}
238 
239 	KASSERT((mp->mnt_kern_flag & MNTK_SUSPEND) != 0,
240 	    ("MNTK_SUSPEND not set"));
241 
242 	error = ffs_reload(mp, curthread, FFSR_FORCE | FFSR_UNSUSPEND);
243 	if (error != 0)
244 		panic("failed to unsuspend writes on %s", fs->fs_fsmnt);
245 
246 	/*
247 	 * XXX: The status is kept per-process; the vfs_write_resume() routine
248 	 * 	asserts that the resuming thread is the same one that called
249 	 * 	vfs_write_suspend().  The cdevpriv data, however, is attached
250 	 * 	to the file descriptor, e.g. is inherited during fork.  Thus,
251 	 * 	it's possible that the resuming process will be different from
252 	 * 	the one that started the suspension.
253 	 *
254 	 * 	Work around by fooling the check in vfs_write_resume().
255 	 */
256 	mp->mnt_susp_owner = curthread;
257 
258 	vfs_write_resume(mp, 0);
259 	vfs_unbusy(mp);
260 	UFS_LOCK(ump);
261 	ump->um_flags &= ~UM_WRITESUSPENDED;
262 	UFS_UNLOCK(ump);
263 
264 	sx_xunlock(&ffs_susp_lock);
265 }
266 
267 static int
268 ffs_susp_ioctl(struct cdev *dev, u_long cmd, caddr_t addr, int flags,
269     struct thread *td)
270 {
271 	struct mount *mp;
272 	fsid_t *fsidp;
273 	int error;
274 
275 	/*
276 	 * No suspend inside the jail.  Allowing it would require making
277 	 * sure that e.g. the devfs ruleset for that jail permits access
278 	 * to the devvp.
279 	 */
280 	if (jailed(td->td_ucred))
281 		return (EPERM);
282 
283 	sx_xlock(&ffs_susp_lock);
284 
285 	switch (cmd) {
286 	case UFSSUSPEND:
287 		fsidp = (fsid_t *)addr;
288 		mp = vfs_getvfs(fsidp);
289 		if (mp == NULL) {
290 			error = ENOENT;
291 			break;
292 		}
293 		error = vfs_busy(mp, 0);
294 		vfs_rel(mp);
295 		if (error != 0)
296 			break;
297 		error = ffs_susp_suspend(mp);
298 		if (error != 0) {
299 			vfs_unbusy(mp);
300 			break;
301 		}
302 		error = devfs_set_cdevpriv(mp, ffs_susp_dtor);
303 		KASSERT(error == 0, ("devfs_set_cdevpriv failed"));
304 		break;
305 	case UFSRESUME:
306 		error = devfs_get_cdevpriv((void **)&mp);
307 		if (error != 0)
308 			break;
309 		/*
310 		 * This calls ffs_susp_dtor, which in turn unsuspends the fs.
311 		 * The dtor expects to be called without lock held, because
312 		 * sometimes it's called from here, and sometimes due to the
313 		 * file being closed or process exiting.
314 		 */
315 		sx_xunlock(&ffs_susp_lock);
316 		devfs_clear_cdevpriv();
317 		return (0);
318 	default:
319 		error = ENXIO;
320 		break;
321 	}
322 
323 	sx_xunlock(&ffs_susp_lock);
324 
325 	return (error);
326 }
327 
328 void
329 ffs_susp_initialize(void)
330 {
331 
332 	sx_init(&ffs_susp_lock, "ffs_susp");
333 	ffs_susp_dev = make_dev(&ffs_susp_cdevsw, 0, UID_ROOT, GID_WHEEL, 0600,
334 	    "ufssuspend");
335 }
336 
337 void
338 ffs_susp_uninitialize(void)
339 {
340 
341 	destroy_dev(ffs_susp_dev);
342 	sx_destroy(&ffs_susp_lock);
343 }
344