1*61145dc2SMartin Matuska // SPDX-License-Identifier: CDDL-1.0
2eda14cbcSMatt Macy /*
3eda14cbcSMatt Macy * CDDL HEADER START
4eda14cbcSMatt Macy *
5eda14cbcSMatt Macy * The contents of this file are subject to the terms of the
6eda14cbcSMatt Macy * Common Development and Distribution License (the "License").
7eda14cbcSMatt Macy * You may not use this file except in compliance with the License.
8eda14cbcSMatt Macy *
9eda14cbcSMatt Macy * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
10271171e0SMartin Matuska * or https://opensource.org/licenses/CDDL-1.0.
11eda14cbcSMatt Macy * See the License for the specific language governing permissions
12eda14cbcSMatt Macy * and limitations under the License.
13eda14cbcSMatt Macy *
14eda14cbcSMatt Macy * When distributing Covered Code, include this CDDL HEADER in each
15eda14cbcSMatt Macy * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
16eda14cbcSMatt Macy * If applicable, add the following below this CDDL HEADER, with the
17eda14cbcSMatt Macy * fields enclosed by brackets "[]" replaced with your own identifying
18eda14cbcSMatt Macy * information: Portions Copyright [yyyy] [name of copyright owner]
19eda14cbcSMatt Macy *
20eda14cbcSMatt Macy * CDDL HEADER END
21eda14cbcSMatt Macy */
22eda14cbcSMatt Macy /*
23eda14cbcSMatt Macy * Copyright (c) 2005, 2010, Oracle and/or its affiliates. All rights reserved.
24eda14cbcSMatt Macy * Copyright (c) 2015, 2018 by Delphix. All rights reserved.
252a58b312SMartin Matuska * Copyright (c) 2022 by Pawel Jakub Dawidek
26eda14cbcSMatt Macy */
27eda14cbcSMatt Macy
28eda14cbcSMatt Macy
29eda14cbcSMatt Macy #include <sys/types.h>
30eda14cbcSMatt Macy #include <sys/param.h>
31eda14cbcSMatt Macy #include <sys/sysmacros.h>
32eda14cbcSMatt Macy #include <sys/cmn_err.h>
33eda14cbcSMatt Macy #include <sys/kmem.h>
34eda14cbcSMatt Macy #include <sys/thread.h>
35eda14cbcSMatt Macy #include <sys/file.h>
36eda14cbcSMatt Macy #include <sys/vfs.h>
37eda14cbcSMatt Macy #include <sys/zfs_znode.h>
38eda14cbcSMatt Macy #include <sys/zfs_dir.h>
39eda14cbcSMatt Macy #include <sys/zil.h>
40eda14cbcSMatt Macy #include <sys/zil_impl.h>
41eda14cbcSMatt Macy #include <sys/byteorder.h>
42eda14cbcSMatt Macy #include <sys/policy.h>
43eda14cbcSMatt Macy #include <sys/stat.h>
44eda14cbcSMatt Macy #include <sys/acl.h>
45eda14cbcSMatt Macy #include <sys/dmu.h>
46eda14cbcSMatt Macy #include <sys/dbuf.h>
47eda14cbcSMatt Macy #include <sys/spa.h>
48eda14cbcSMatt Macy #include <sys/zfs_fuid.h>
49eda14cbcSMatt Macy #include <sys/dsl_dataset.h>
50eda14cbcSMatt Macy
51eda14cbcSMatt Macy /*
52eda14cbcSMatt Macy * These zfs_log_* functions must be called within a dmu tx, in one
53eda14cbcSMatt Macy * of 2 contexts depending on zilog->z_replay:
54eda14cbcSMatt Macy *
55eda14cbcSMatt Macy * Non replay mode
56eda14cbcSMatt Macy * ---------------
57eda14cbcSMatt Macy * We need to record the transaction so that if it is committed to
58eda14cbcSMatt Macy * the Intent Log then it can be replayed. An intent log transaction
59eda14cbcSMatt Macy * structure (itx_t) is allocated and all the information necessary to
60eda14cbcSMatt Macy * possibly replay the transaction is saved in it. The itx is then assigned
61eda14cbcSMatt Macy * a sequence number and inserted in the in-memory list anchored in the zilog.
62eda14cbcSMatt Macy *
63eda14cbcSMatt Macy * Replay mode
64eda14cbcSMatt Macy * -----------
65eda14cbcSMatt Macy * We need to mark the intent log record as replayed in the log header.
66eda14cbcSMatt Macy * This is done in the same transaction as the replay so that they
67eda14cbcSMatt Macy * commit atomically.
68eda14cbcSMatt Macy */
69eda14cbcSMatt Macy
70eda14cbcSMatt Macy int
zfs_log_create_txtype(zil_create_t type,vsecattr_t * vsecp,vattr_t * vap)71eda14cbcSMatt Macy zfs_log_create_txtype(zil_create_t type, vsecattr_t *vsecp, vattr_t *vap)
72eda14cbcSMatt Macy {
73eda14cbcSMatt Macy int isxvattr = (vap->va_mask & ATTR_XVATTR);
74eda14cbcSMatt Macy switch (type) {
75eda14cbcSMatt Macy case Z_FILE:
76eda14cbcSMatt Macy if (vsecp == NULL && !isxvattr)
77eda14cbcSMatt Macy return (TX_CREATE);
78eda14cbcSMatt Macy if (vsecp && isxvattr)
79eda14cbcSMatt Macy return (TX_CREATE_ACL_ATTR);
80eda14cbcSMatt Macy if (vsecp)
81eda14cbcSMatt Macy return (TX_CREATE_ACL);
82eda14cbcSMatt Macy else
83eda14cbcSMatt Macy return (TX_CREATE_ATTR);
84eda14cbcSMatt Macy case Z_DIR:
85eda14cbcSMatt Macy if (vsecp == NULL && !isxvattr)
86eda14cbcSMatt Macy return (TX_MKDIR);
87eda14cbcSMatt Macy if (vsecp && isxvattr)
88eda14cbcSMatt Macy return (TX_MKDIR_ACL_ATTR);
89eda14cbcSMatt Macy if (vsecp)
90eda14cbcSMatt Macy return (TX_MKDIR_ACL);
91eda14cbcSMatt Macy else
92eda14cbcSMatt Macy return (TX_MKDIR_ATTR);
93eda14cbcSMatt Macy case Z_XATTRDIR:
94eda14cbcSMatt Macy return (TX_MKXATTR);
95eda14cbcSMatt Macy }
96eda14cbcSMatt Macy ASSERT(0);
97eda14cbcSMatt Macy return (TX_MAX_TYPE);
98eda14cbcSMatt Macy }
99eda14cbcSMatt Macy
100eda14cbcSMatt Macy /*
101eda14cbcSMatt Macy * build up the log data necessary for logging xvattr_t
102eda14cbcSMatt Macy * First lr_attr_t is initialized. following the lr_attr_t
103eda14cbcSMatt Macy * is the mapsize and attribute bitmap copied from the xvattr_t.
104eda14cbcSMatt Macy * Following the bitmap and bitmapsize two 64 bit words are reserved
105eda14cbcSMatt Macy * for the create time which may be set. Following the create time
106eda14cbcSMatt Macy * records a single 64 bit integer which has the bits to set on
107eda14cbcSMatt Macy * replay for the xvattr.
108eda14cbcSMatt Macy */
109eda14cbcSMatt Macy static void
zfs_log_xvattr(lr_attr_t * lrattr,xvattr_t * xvap)110eda14cbcSMatt Macy zfs_log_xvattr(lr_attr_t *lrattr, xvattr_t *xvap)
111eda14cbcSMatt Macy {
112eda14cbcSMatt Macy xoptattr_t *xoap;
113eda14cbcSMatt Macy
114eda14cbcSMatt Macy xoap = xva_getxoptattr(xvap);
115eda14cbcSMatt Macy ASSERT(xoap);
116eda14cbcSMatt Macy
117eda14cbcSMatt Macy lrattr->lr_attr_masksize = xvap->xva_mapsize;
118a0b956f5SMartin Matuska uint32_t *bitmap = &lrattr->lr_attr_bitmap;
119a0b956f5SMartin Matuska for (int i = 0; i != xvap->xva_mapsize; i++, bitmap++)
120eda14cbcSMatt Macy *bitmap = xvap->xva_reqattrmap[i];
121eda14cbcSMatt Macy
122a0b956f5SMartin Matuska lr_attr_end_t *end = (lr_attr_end_t *)bitmap;
123a0b956f5SMartin Matuska end->lr_attr_attrs = 0;
124a0b956f5SMartin Matuska end->lr_attr_crtime[0] = 0;
125a0b956f5SMartin Matuska end->lr_attr_crtime[1] = 0;
126a0b956f5SMartin Matuska memset(end->lr_attr_scanstamp, 0, AV_SCANSTAMP_SZ);
127a0b956f5SMartin Matuska
128eda14cbcSMatt Macy if (XVA_ISSET_REQ(xvap, XAT_READONLY))
129a0b956f5SMartin Matuska end->lr_attr_attrs |= (xoap->xoa_readonly == 0) ? 0 :
130eda14cbcSMatt Macy XAT0_READONLY;
131eda14cbcSMatt Macy if (XVA_ISSET_REQ(xvap, XAT_HIDDEN))
132a0b956f5SMartin Matuska end->lr_attr_attrs |= (xoap->xoa_hidden == 0) ? 0 :
133eda14cbcSMatt Macy XAT0_HIDDEN;
134eda14cbcSMatt Macy if (XVA_ISSET_REQ(xvap, XAT_SYSTEM))
135a0b956f5SMartin Matuska end->lr_attr_attrs |= (xoap->xoa_system == 0) ? 0 :
136eda14cbcSMatt Macy XAT0_SYSTEM;
137eda14cbcSMatt Macy if (XVA_ISSET_REQ(xvap, XAT_ARCHIVE))
138a0b956f5SMartin Matuska end->lr_attr_attrs |= (xoap->xoa_archive == 0) ? 0 :
139eda14cbcSMatt Macy XAT0_ARCHIVE;
140eda14cbcSMatt Macy if (XVA_ISSET_REQ(xvap, XAT_IMMUTABLE))
141a0b956f5SMartin Matuska end->lr_attr_attrs |= (xoap->xoa_immutable == 0) ? 0 :
142eda14cbcSMatt Macy XAT0_IMMUTABLE;
143eda14cbcSMatt Macy if (XVA_ISSET_REQ(xvap, XAT_NOUNLINK))
144a0b956f5SMartin Matuska end->lr_attr_attrs |= (xoap->xoa_nounlink == 0) ? 0 :
145eda14cbcSMatt Macy XAT0_NOUNLINK;
146eda14cbcSMatt Macy if (XVA_ISSET_REQ(xvap, XAT_APPENDONLY))
147a0b956f5SMartin Matuska end->lr_attr_attrs |= (xoap->xoa_appendonly == 0) ? 0 :
148eda14cbcSMatt Macy XAT0_APPENDONLY;
149eda14cbcSMatt Macy if (XVA_ISSET_REQ(xvap, XAT_OPAQUE))
150a0b956f5SMartin Matuska end->lr_attr_attrs |= (xoap->xoa_opaque == 0) ? 0 :
151eda14cbcSMatt Macy XAT0_APPENDONLY;
152eda14cbcSMatt Macy if (XVA_ISSET_REQ(xvap, XAT_NODUMP))
153a0b956f5SMartin Matuska end->lr_attr_attrs |= (xoap->xoa_nodump == 0) ? 0 :
154eda14cbcSMatt Macy XAT0_NODUMP;
155eda14cbcSMatt Macy if (XVA_ISSET_REQ(xvap, XAT_AV_QUARANTINED))
156a0b956f5SMartin Matuska end->lr_attr_attrs |= (xoap->xoa_av_quarantined == 0) ? 0 :
157eda14cbcSMatt Macy XAT0_AV_QUARANTINED;
158eda14cbcSMatt Macy if (XVA_ISSET_REQ(xvap, XAT_AV_MODIFIED))
159a0b956f5SMartin Matuska end->lr_attr_attrs |= (xoap->xoa_av_modified == 0) ? 0 :
160eda14cbcSMatt Macy XAT0_AV_MODIFIED;
161eda14cbcSMatt Macy if (XVA_ISSET_REQ(xvap, XAT_CREATETIME))
162a0b956f5SMartin Matuska ZFS_TIME_ENCODE(&xoap->xoa_createtime, end->lr_attr_crtime);
163eda14cbcSMatt Macy if (XVA_ISSET_REQ(xvap, XAT_AV_SCANSTAMP)) {
164eda14cbcSMatt Macy ASSERT(!XVA_ISSET_REQ(xvap, XAT_PROJID));
165eda14cbcSMatt Macy
166a0b956f5SMartin Matuska memcpy(end->lr_attr_scanstamp, xoap->xoa_av_scanstamp,
167a0b956f5SMartin Matuska AV_SCANSTAMP_SZ);
168eda14cbcSMatt Macy } else if (XVA_ISSET_REQ(xvap, XAT_PROJID)) {
169eda14cbcSMatt Macy /*
170eda14cbcSMatt Macy * XAT_PROJID and XAT_AV_SCANSTAMP will never be valid
171eda14cbcSMatt Macy * at the same time, so we can share the same space.
172eda14cbcSMatt Macy */
173a0b956f5SMartin Matuska memcpy(end->lr_attr_scanstamp, &xoap->xoa_projid,
174a0b956f5SMartin Matuska sizeof (uint64_t));
175eda14cbcSMatt Macy }
176eda14cbcSMatt Macy if (XVA_ISSET_REQ(xvap, XAT_REPARSE))
177a0b956f5SMartin Matuska end->lr_attr_attrs |= (xoap->xoa_reparse == 0) ? 0 :
178eda14cbcSMatt Macy XAT0_REPARSE;
179eda14cbcSMatt Macy if (XVA_ISSET_REQ(xvap, XAT_OFFLINE))
180a0b956f5SMartin Matuska end->lr_attr_attrs |= (xoap->xoa_offline == 0) ? 0 :
181eda14cbcSMatt Macy XAT0_OFFLINE;
182eda14cbcSMatt Macy if (XVA_ISSET_REQ(xvap, XAT_SPARSE))
183a0b956f5SMartin Matuska end->lr_attr_attrs |= (xoap->xoa_sparse == 0) ? 0 :
184eda14cbcSMatt Macy XAT0_SPARSE;
185eda14cbcSMatt Macy if (XVA_ISSET_REQ(xvap, XAT_PROJINHERIT))
186a0b956f5SMartin Matuska end->lr_attr_attrs |= (xoap->xoa_projinherit == 0) ? 0 :
187eda14cbcSMatt Macy XAT0_PROJINHERIT;
188eda14cbcSMatt Macy }
189eda14cbcSMatt Macy
190eda14cbcSMatt Macy static void *
zfs_log_fuid_ids(zfs_fuid_info_t * fuidp,void * start)191eda14cbcSMatt Macy zfs_log_fuid_ids(zfs_fuid_info_t *fuidp, void *start)
192eda14cbcSMatt Macy {
193eda14cbcSMatt Macy zfs_fuid_t *zfuid;
194eda14cbcSMatt Macy uint64_t *fuidloc = start;
195eda14cbcSMatt Macy
196eda14cbcSMatt Macy /* First copy in the ACE FUIDs */
197eda14cbcSMatt Macy for (zfuid = list_head(&fuidp->z_fuids); zfuid;
198eda14cbcSMatt Macy zfuid = list_next(&fuidp->z_fuids, zfuid)) {
199eda14cbcSMatt Macy *fuidloc++ = zfuid->z_logfuid;
200eda14cbcSMatt Macy }
201eda14cbcSMatt Macy return (fuidloc);
202eda14cbcSMatt Macy }
203eda14cbcSMatt Macy
204eda14cbcSMatt Macy
205eda14cbcSMatt Macy static void *
zfs_log_fuid_domains(zfs_fuid_info_t * fuidp,void * start)206eda14cbcSMatt Macy zfs_log_fuid_domains(zfs_fuid_info_t *fuidp, void *start)
207eda14cbcSMatt Macy {
208eda14cbcSMatt Macy zfs_fuid_domain_t *zdomain;
209eda14cbcSMatt Macy
210eda14cbcSMatt Macy /* now copy in the domain info, if any */
211eda14cbcSMatt Macy if (fuidp->z_domain_str_sz != 0) {
212eda14cbcSMatt Macy for (zdomain = list_head(&fuidp->z_domains); zdomain;
213eda14cbcSMatt Macy zdomain = list_next(&fuidp->z_domains, zdomain)) {
214da5137abSMartin Matuska memcpy(start, zdomain->z_domain,
215eda14cbcSMatt Macy strlen(zdomain->z_domain) + 1);
216eda14cbcSMatt Macy start = (caddr_t)start +
217eda14cbcSMatt Macy strlen(zdomain->z_domain) + 1;
218eda14cbcSMatt Macy }
219eda14cbcSMatt Macy }
220eda14cbcSMatt Macy return (start);
221eda14cbcSMatt Macy }
222eda14cbcSMatt Macy
223eda14cbcSMatt Macy /*
224eda14cbcSMatt Macy * If zp is an xattr node, check whether the xattr owner is unlinked.
225eda14cbcSMatt Macy * We don't want to log anything if the owner is unlinked.
226eda14cbcSMatt Macy */
227eda14cbcSMatt Macy static int
zfs_xattr_owner_unlinked(znode_t * zp)228eda14cbcSMatt Macy zfs_xattr_owner_unlinked(znode_t *zp)
229eda14cbcSMatt Macy {
230eda14cbcSMatt Macy int unlinked = 0;
231eda14cbcSMatt Macy znode_t *dzp;
232eda14cbcSMatt Macy #ifdef __FreeBSD__
233eda14cbcSMatt Macy znode_t *tzp = zp;
234eda14cbcSMatt Macy
235eda14cbcSMatt Macy /*
236eda14cbcSMatt Macy * zrele drops the vnode lock which violates the VOP locking contract
237eda14cbcSMatt Macy * on FreeBSD. See comment at the top of zfs_replay.c for more detail.
238eda14cbcSMatt Macy */
239eda14cbcSMatt Macy /*
240eda14cbcSMatt Macy * if zp is XATTR node, keep walking up via z_xattr_parent until we
241eda14cbcSMatt Macy * get the owner
242eda14cbcSMatt Macy */
243eda14cbcSMatt Macy while (tzp->z_pflags & ZFS_XATTR) {
244eda14cbcSMatt Macy ASSERT3U(zp->z_xattr_parent, !=, 0);
245eda14cbcSMatt Macy if (zfs_zget(ZTOZSB(tzp), tzp->z_xattr_parent, &dzp) != 0) {
246eda14cbcSMatt Macy unlinked = 1;
247eda14cbcSMatt Macy break;
248eda14cbcSMatt Macy }
249eda14cbcSMatt Macy
250eda14cbcSMatt Macy if (tzp != zp)
251eda14cbcSMatt Macy zrele(tzp);
252eda14cbcSMatt Macy tzp = dzp;
253eda14cbcSMatt Macy unlinked = tzp->z_unlinked;
254eda14cbcSMatt Macy }
255eda14cbcSMatt Macy if (tzp != zp)
256eda14cbcSMatt Macy zrele(tzp);
257eda14cbcSMatt Macy #else
258eda14cbcSMatt Macy zhold(zp);
259eda14cbcSMatt Macy /*
260eda14cbcSMatt Macy * if zp is XATTR node, keep walking up via z_xattr_parent until we
261eda14cbcSMatt Macy * get the owner
262eda14cbcSMatt Macy */
263eda14cbcSMatt Macy while (zp->z_pflags & ZFS_XATTR) {
264eda14cbcSMatt Macy ASSERT3U(zp->z_xattr_parent, !=, 0);
265eda14cbcSMatt Macy if (zfs_zget(ZTOZSB(zp), zp->z_xattr_parent, &dzp) != 0) {
266eda14cbcSMatt Macy unlinked = 1;
267eda14cbcSMatt Macy break;
268eda14cbcSMatt Macy }
269eda14cbcSMatt Macy
270eda14cbcSMatt Macy zrele(zp);
271eda14cbcSMatt Macy zp = dzp;
272eda14cbcSMatt Macy unlinked = zp->z_unlinked;
273eda14cbcSMatt Macy }
274eda14cbcSMatt Macy zrele(zp);
275eda14cbcSMatt Macy #endif
276eda14cbcSMatt Macy return (unlinked);
277eda14cbcSMatt Macy }
278eda14cbcSMatt Macy
279eda14cbcSMatt Macy /*
280eda14cbcSMatt Macy * Handles TX_CREATE, TX_CREATE_ATTR, TX_MKDIR, TX_MKDIR_ATTR and
281eda14cbcSMatt Macy * TK_MKXATTR transactions.
282eda14cbcSMatt Macy *
283eda14cbcSMatt Macy * TX_CREATE and TX_MKDIR are standard creates, but they may have FUID
284eda14cbcSMatt Macy * domain information appended prior to the name. In this case the
285eda14cbcSMatt Macy * uid/gid in the log record will be a log centric FUID.
286eda14cbcSMatt Macy *
287eda14cbcSMatt Macy * TX_CREATE_ACL_ATTR and TX_MKDIR_ACL_ATTR handle special creates that
288eda14cbcSMatt Macy * may contain attributes, ACL and optional fuid information.
289eda14cbcSMatt Macy *
290eda14cbcSMatt Macy * TX_CREATE_ACL and TX_MKDIR_ACL handle special creates that specify
291eda14cbcSMatt Macy * and ACL and normal users/groups in the ACEs.
292eda14cbcSMatt Macy *
293eda14cbcSMatt Macy * There may be an optional xvattr attribute information similar
294eda14cbcSMatt Macy * to zfs_log_setattr.
295eda14cbcSMatt Macy *
296eda14cbcSMatt Macy * Also, after the file name "domain" strings may be appended.
297eda14cbcSMatt Macy */
298eda14cbcSMatt Macy void
zfs_log_create(zilog_t * zilog,dmu_tx_t * tx,uint64_t txtype,znode_t * dzp,znode_t * zp,const char * name,vsecattr_t * vsecp,zfs_fuid_info_t * fuidp,vattr_t * vap)299eda14cbcSMatt Macy zfs_log_create(zilog_t *zilog, dmu_tx_t *tx, uint64_t txtype,
300180f8225SMatt Macy znode_t *dzp, znode_t *zp, const char *name, vsecattr_t *vsecp,
301eda14cbcSMatt Macy zfs_fuid_info_t *fuidp, vattr_t *vap)
302eda14cbcSMatt Macy {
303eda14cbcSMatt Macy itx_t *itx;
3047a7741afSMartin Matuska _lr_create_t *lr;
3057a7741afSMartin Matuska lr_acl_create_t *lracl = NULL;
3067a7741afSMartin Matuska uint8_t *lrdata;
307eda14cbcSMatt Macy size_t aclsize = 0;
308eda14cbcSMatt Macy size_t xvatsize = 0;
309eda14cbcSMatt Macy size_t txsize;
310eda14cbcSMatt Macy xvattr_t *xvap = (xvattr_t *)vap;
311eda14cbcSMatt Macy size_t namesize = strlen(name) + 1;
312eda14cbcSMatt Macy size_t fuidsz = 0;
313eda14cbcSMatt Macy
314eda14cbcSMatt Macy if (zil_replaying(zilog, tx) || zfs_xattr_owner_unlinked(dzp))
315eda14cbcSMatt Macy return;
316eda14cbcSMatt Macy
317eda14cbcSMatt Macy /*
318eda14cbcSMatt Macy * If we have FUIDs present then add in space for
319eda14cbcSMatt Macy * domains and ACE fuid's if any.
320eda14cbcSMatt Macy */
321eda14cbcSMatt Macy if (fuidp) {
322eda14cbcSMatt Macy fuidsz += fuidp->z_domain_str_sz;
323eda14cbcSMatt Macy fuidsz += fuidp->z_fuid_cnt * sizeof (uint64_t);
324eda14cbcSMatt Macy }
325eda14cbcSMatt Macy
326eda14cbcSMatt Macy if (vap->va_mask & ATTR_XVATTR)
327eda14cbcSMatt Macy xvatsize = ZIL_XVAT_SIZE(xvap->xva_mapsize);
328eda14cbcSMatt Macy
329eda14cbcSMatt Macy if ((int)txtype == TX_CREATE_ATTR || (int)txtype == TX_MKDIR_ATTR ||
330eda14cbcSMatt Macy (int)txtype == TX_CREATE || (int)txtype == TX_MKDIR ||
331eda14cbcSMatt Macy (int)txtype == TX_MKXATTR) {
3327a7741afSMartin Matuska txsize = sizeof (lr_create_t) + namesize + fuidsz + xvatsize;
3337a7741afSMartin Matuska itx = zil_itx_create(txtype, txsize);
3347a7741afSMartin Matuska lr_create_t *lrc = (lr_create_t *)&itx->itx_lr;
3357a7741afSMartin Matuska lrdata = &lrc->lr_data[0];
336eda14cbcSMatt Macy } else {
337eda14cbcSMatt Macy txsize =
338eda14cbcSMatt Macy sizeof (lr_acl_create_t) + namesize + fuidsz +
339eda14cbcSMatt Macy ZIL_ACE_LENGTH(aclsize) + xvatsize;
3407a7741afSMartin Matuska itx = zil_itx_create(txtype, txsize);
3417a7741afSMartin Matuska lracl = (lr_acl_create_t *)&itx->itx_lr;
3427a7741afSMartin Matuska lrdata = &lracl->lr_data[0];
343eda14cbcSMatt Macy }
344eda14cbcSMatt Macy
345eda14cbcSMatt Macy
3467a7741afSMartin Matuska lr = (_lr_create_t *)&itx->itx_lr;
347eda14cbcSMatt Macy lr->lr_doid = dzp->z_id;
348eda14cbcSMatt Macy lr->lr_foid = zp->z_id;
349eda14cbcSMatt Macy /* Store dnode slot count in 8 bits above object id. */
350eda14cbcSMatt Macy LR_FOID_SET_SLOTS(lr->lr_foid, zp->z_dnodesize >> DNODE_SHIFT);
351eda14cbcSMatt Macy lr->lr_mode = zp->z_mode;
352eda14cbcSMatt Macy if (!IS_EPHEMERAL(KUID_TO_SUID(ZTOUID(zp)))) {
353eda14cbcSMatt Macy lr->lr_uid = (uint64_t)KUID_TO_SUID(ZTOUID(zp));
354eda14cbcSMatt Macy } else {
355eda14cbcSMatt Macy lr->lr_uid = fuidp->z_fuid_owner;
356eda14cbcSMatt Macy }
357eda14cbcSMatt Macy if (!IS_EPHEMERAL(KGID_TO_SGID(ZTOGID(zp)))) {
358eda14cbcSMatt Macy lr->lr_gid = (uint64_t)KGID_TO_SGID(ZTOGID(zp));
359eda14cbcSMatt Macy } else {
360eda14cbcSMatt Macy lr->lr_gid = fuidp->z_fuid_group;
361eda14cbcSMatt Macy }
362eda14cbcSMatt Macy (void) sa_lookup(zp->z_sa_hdl, SA_ZPL_GEN(ZTOZSB(zp)), &lr->lr_gen,
363eda14cbcSMatt Macy sizeof (uint64_t));
364eda14cbcSMatt Macy (void) sa_lookup(zp->z_sa_hdl, SA_ZPL_CRTIME(ZTOZSB(zp)),
365eda14cbcSMatt Macy lr->lr_crtime, sizeof (uint64_t) * 2);
366eda14cbcSMatt Macy
367eda14cbcSMatt Macy if (sa_lookup(zp->z_sa_hdl, SA_ZPL_RDEV(ZTOZSB(zp)), &lr->lr_rdev,
368eda14cbcSMatt Macy sizeof (lr->lr_rdev)) != 0)
369eda14cbcSMatt Macy lr->lr_rdev = 0;
370eda14cbcSMatt Macy
371eda14cbcSMatt Macy /*
372eda14cbcSMatt Macy * Fill in xvattr info if any
373eda14cbcSMatt Macy */
374eda14cbcSMatt Macy if (vap->va_mask & ATTR_XVATTR) {
3757a7741afSMartin Matuska zfs_log_xvattr((lr_attr_t *)lrdata, xvap);
3767a7741afSMartin Matuska lrdata = &lrdata[xvatsize];
377eda14cbcSMatt Macy }
378eda14cbcSMatt Macy
379eda14cbcSMatt Macy /* Now fill in any ACL info */
380eda14cbcSMatt Macy
381eda14cbcSMatt Macy if (vsecp) {
3827a7741afSMartin Matuska ASSERT3P(lracl, !=, NULL);
383eda14cbcSMatt Macy lracl->lr_aclcnt = vsecp->vsa_aclcnt;
384eda14cbcSMatt Macy lracl->lr_acl_bytes = aclsize;
385eda14cbcSMatt Macy lracl->lr_domcnt = fuidp ? fuidp->z_domain_cnt : 0;
386eda14cbcSMatt Macy lracl->lr_fuidcnt = fuidp ? fuidp->z_fuid_cnt : 0;
387eda14cbcSMatt Macy if (vsecp->vsa_aclflags & VSA_ACE_ACLFLAGS)
388eda14cbcSMatt Macy lracl->lr_acl_flags = (uint64_t)vsecp->vsa_aclflags;
389eda14cbcSMatt Macy else
390eda14cbcSMatt Macy lracl->lr_acl_flags = 0;
391eda14cbcSMatt Macy
3927a7741afSMartin Matuska memcpy(lrdata, vsecp->vsa_aclentp, aclsize);
3937a7741afSMartin Matuska lrdata = &lrdata[ZIL_ACE_LENGTH(aclsize)];
394eda14cbcSMatt Macy }
395eda14cbcSMatt Macy
396eda14cbcSMatt Macy /* drop in FUID info */
397eda14cbcSMatt Macy if (fuidp) {
3987a7741afSMartin Matuska lrdata = zfs_log_fuid_ids(fuidp, lrdata);
3997a7741afSMartin Matuska lrdata = zfs_log_fuid_domains(fuidp, lrdata);
400eda14cbcSMatt Macy }
401eda14cbcSMatt Macy /*
402eda14cbcSMatt Macy * Now place file name in log record
403eda14cbcSMatt Macy */
4047a7741afSMartin Matuska memcpy(lrdata, name, namesize);
405eda14cbcSMatt Macy
406eda14cbcSMatt Macy zil_itx_assign(zilog, itx, tx);
407eda14cbcSMatt Macy }
408eda14cbcSMatt Macy
409eda14cbcSMatt Macy /*
410eda14cbcSMatt Macy * Handles both TX_REMOVE and TX_RMDIR transactions.
411eda14cbcSMatt Macy */
412eda14cbcSMatt Macy void
zfs_log_remove(zilog_t * zilog,dmu_tx_t * tx,uint64_t txtype,znode_t * dzp,const char * name,uint64_t foid,boolean_t unlinked)413eda14cbcSMatt Macy zfs_log_remove(zilog_t *zilog, dmu_tx_t *tx, uint64_t txtype,
414180f8225SMatt Macy znode_t *dzp, const char *name, uint64_t foid, boolean_t unlinked)
415eda14cbcSMatt Macy {
416eda14cbcSMatt Macy itx_t *itx;
417eda14cbcSMatt Macy lr_remove_t *lr;
418eda14cbcSMatt Macy size_t namesize = strlen(name) + 1;
419eda14cbcSMatt Macy
420eda14cbcSMatt Macy if (zil_replaying(zilog, tx) || zfs_xattr_owner_unlinked(dzp))
421eda14cbcSMatt Macy return;
422eda14cbcSMatt Macy
423eda14cbcSMatt Macy itx = zil_itx_create(txtype, sizeof (*lr) + namesize);
424eda14cbcSMatt Macy lr = (lr_remove_t *)&itx->itx_lr;
425eda14cbcSMatt Macy lr->lr_doid = dzp->z_id;
4267a7741afSMartin Matuska memcpy(&lr->lr_data[0], name, namesize);
427eda14cbcSMatt Macy
428eda14cbcSMatt Macy itx->itx_oid = foid;
429eda14cbcSMatt Macy
430eda14cbcSMatt Macy /*
431eda14cbcSMatt Macy * Object ids can be re-instantiated in the next txg so
432eda14cbcSMatt Macy * remove any async transactions to avoid future leaks.
433eda14cbcSMatt Macy * This can happen if a fsync occurs on the re-instantiated
434eda14cbcSMatt Macy * object for a WR_INDIRECT or WR_NEED_COPY write, which gets
435eda14cbcSMatt Macy * the new file data and flushes a write record for the old object.
436eda14cbcSMatt Macy */
437eda14cbcSMatt Macy if (unlinked) {
438eda14cbcSMatt Macy ASSERT((txtype & ~TX_CI) == TX_REMOVE);
439eda14cbcSMatt Macy zil_remove_async(zilog, foid);
440eda14cbcSMatt Macy }
441eda14cbcSMatt Macy zil_itx_assign(zilog, itx, tx);
442eda14cbcSMatt Macy }
443eda14cbcSMatt Macy
444eda14cbcSMatt Macy /*
445eda14cbcSMatt Macy * Handles TX_LINK transactions.
446eda14cbcSMatt Macy */
447eda14cbcSMatt Macy void
zfs_log_link(zilog_t * zilog,dmu_tx_t * tx,uint64_t txtype,znode_t * dzp,znode_t * zp,const char * name)448eda14cbcSMatt Macy zfs_log_link(zilog_t *zilog, dmu_tx_t *tx, uint64_t txtype,
449180f8225SMatt Macy znode_t *dzp, znode_t *zp, const char *name)
450eda14cbcSMatt Macy {
451eda14cbcSMatt Macy itx_t *itx;
452eda14cbcSMatt Macy lr_link_t *lr;
453eda14cbcSMatt Macy size_t namesize = strlen(name) + 1;
454eda14cbcSMatt Macy
455eda14cbcSMatt Macy if (zil_replaying(zilog, tx))
456eda14cbcSMatt Macy return;
457eda14cbcSMatt Macy
458eda14cbcSMatt Macy itx = zil_itx_create(txtype, sizeof (*lr) + namesize);
459eda14cbcSMatt Macy lr = (lr_link_t *)&itx->itx_lr;
460eda14cbcSMatt Macy lr->lr_doid = dzp->z_id;
461eda14cbcSMatt Macy lr->lr_link_obj = zp->z_id;
4627a7741afSMartin Matuska memcpy(&lr->lr_data[0], name, namesize);
463eda14cbcSMatt Macy
464eda14cbcSMatt Macy zil_itx_assign(zilog, itx, tx);
465eda14cbcSMatt Macy }
466eda14cbcSMatt Macy
467eda14cbcSMatt Macy /*
468eda14cbcSMatt Macy * Handles TX_SYMLINK transactions.
469eda14cbcSMatt Macy */
470eda14cbcSMatt Macy void
zfs_log_symlink(zilog_t * zilog,dmu_tx_t * tx,uint64_t txtype,znode_t * dzp,znode_t * zp,const char * name,const char * link)471eda14cbcSMatt Macy zfs_log_symlink(zilog_t *zilog, dmu_tx_t *tx, uint64_t txtype,
472180f8225SMatt Macy znode_t *dzp, znode_t *zp, const char *name, const char *link)
473eda14cbcSMatt Macy {
474eda14cbcSMatt Macy itx_t *itx;
4757a7741afSMartin Matuska _lr_create_t *lr;
4767a7741afSMartin Matuska lr_create_t *lrc;
477eda14cbcSMatt Macy size_t namesize = strlen(name) + 1;
478eda14cbcSMatt Macy size_t linksize = strlen(link) + 1;
479eda14cbcSMatt Macy
480eda14cbcSMatt Macy if (zil_replaying(zilog, tx))
481eda14cbcSMatt Macy return;
482eda14cbcSMatt Macy
4837a7741afSMartin Matuska itx = zil_itx_create(txtype, sizeof (*lrc) + namesize + linksize);
4847a7741afSMartin Matuska lrc = (lr_create_t *)&itx->itx_lr;
4857a7741afSMartin Matuska lr = &lrc->lr_create;
486eda14cbcSMatt Macy lr->lr_doid = dzp->z_id;
487eda14cbcSMatt Macy lr->lr_foid = zp->z_id;
488eda14cbcSMatt Macy lr->lr_uid = KUID_TO_SUID(ZTOUID(zp));
489eda14cbcSMatt Macy lr->lr_gid = KGID_TO_SGID(ZTOGID(zp));
490eda14cbcSMatt Macy lr->lr_mode = zp->z_mode;
491eda14cbcSMatt Macy (void) sa_lookup(zp->z_sa_hdl, SA_ZPL_GEN(ZTOZSB(zp)), &lr->lr_gen,
492eda14cbcSMatt Macy sizeof (uint64_t));
493eda14cbcSMatt Macy (void) sa_lookup(zp->z_sa_hdl, SA_ZPL_CRTIME(ZTOZSB(zp)),
494eda14cbcSMatt Macy lr->lr_crtime, sizeof (uint64_t) * 2);
4957a7741afSMartin Matuska memcpy(&lrc->lr_data[0], name, namesize);
4967a7741afSMartin Matuska memcpy(&lrc->lr_data[namesize], link, linksize);
497eda14cbcSMatt Macy
498eda14cbcSMatt Macy zil_itx_assign(zilog, itx, tx);
499eda14cbcSMatt Macy }
500eda14cbcSMatt Macy
501dbd5678dSMartin Matuska static void
do_zfs_log_rename(zilog_t * zilog,dmu_tx_t * tx,uint64_t txtype,znode_t * sdzp,const char * sname,znode_t * tdzp,const char * dname,znode_t * szp)502dbd5678dSMartin Matuska do_zfs_log_rename(zilog_t *zilog, dmu_tx_t *tx, uint64_t txtype, znode_t *sdzp,
503180f8225SMatt Macy const char *sname, znode_t *tdzp, const char *dname, znode_t *szp)
504eda14cbcSMatt Macy {
505eda14cbcSMatt Macy itx_t *itx;
5067a7741afSMartin Matuska _lr_rename_t *lr;
5077a7741afSMartin Matuska lr_rename_t *lrr;
508eda14cbcSMatt Macy size_t snamesize = strlen(sname) + 1;
509eda14cbcSMatt Macy size_t dnamesize = strlen(dname) + 1;
510eda14cbcSMatt Macy
511eda14cbcSMatt Macy if (zil_replaying(zilog, tx))
512eda14cbcSMatt Macy return;
513eda14cbcSMatt Macy
514eda14cbcSMatt Macy itx = zil_itx_create(txtype, sizeof (*lr) + snamesize + dnamesize);
5157a7741afSMartin Matuska lrr = (lr_rename_t *)&itx->itx_lr;
5167a7741afSMartin Matuska lr = &lrr->lr_rename;
517eda14cbcSMatt Macy lr->lr_sdoid = sdzp->z_id;
518eda14cbcSMatt Macy lr->lr_tdoid = tdzp->z_id;
5197a7741afSMartin Matuska memcpy(&lrr->lr_data[0], sname, snamesize);
5207a7741afSMartin Matuska memcpy(&lrr->lr_data[snamesize], dname, dnamesize);
521eda14cbcSMatt Macy itx->itx_oid = szp->z_id;
522eda14cbcSMatt Macy
523eda14cbcSMatt Macy zil_itx_assign(zilog, itx, tx);
524eda14cbcSMatt Macy }
525eda14cbcSMatt Macy
526eda14cbcSMatt Macy /*
527dbd5678dSMartin Matuska * Handles TX_RENAME transactions.
528dbd5678dSMartin Matuska */
529dbd5678dSMartin Matuska void
zfs_log_rename(zilog_t * zilog,dmu_tx_t * tx,uint64_t txtype,znode_t * sdzp,const char * sname,znode_t * tdzp,const char * dname,znode_t * szp)530dbd5678dSMartin Matuska zfs_log_rename(zilog_t *zilog, dmu_tx_t *tx, uint64_t txtype, znode_t *sdzp,
531dbd5678dSMartin Matuska const char *sname, znode_t *tdzp, const char *dname, znode_t *szp)
532dbd5678dSMartin Matuska {
533dbd5678dSMartin Matuska txtype |= TX_RENAME;
534dbd5678dSMartin Matuska do_zfs_log_rename(zilog, tx, txtype, sdzp, sname, tdzp, dname, szp);
535dbd5678dSMartin Matuska }
536dbd5678dSMartin Matuska
537dbd5678dSMartin Matuska /*
538dbd5678dSMartin Matuska * Handles TX_RENAME_EXCHANGE transactions.
539dbd5678dSMartin Matuska */
540dbd5678dSMartin Matuska void
zfs_log_rename_exchange(zilog_t * zilog,dmu_tx_t * tx,uint64_t txtype,znode_t * sdzp,const char * sname,znode_t * tdzp,const char * dname,znode_t * szp)541dbd5678dSMartin Matuska zfs_log_rename_exchange(zilog_t *zilog, dmu_tx_t *tx, uint64_t txtype,
542dbd5678dSMartin Matuska znode_t *sdzp, const char *sname, znode_t *tdzp, const char *dname,
543dbd5678dSMartin Matuska znode_t *szp)
544dbd5678dSMartin Matuska {
545dbd5678dSMartin Matuska txtype |= TX_RENAME_EXCHANGE;
546dbd5678dSMartin Matuska do_zfs_log_rename(zilog, tx, txtype, sdzp, sname, tdzp, dname, szp);
547dbd5678dSMartin Matuska }
548dbd5678dSMartin Matuska
549dbd5678dSMartin Matuska /*
550dbd5678dSMartin Matuska * Handles TX_RENAME_WHITEOUT transactions.
551dbd5678dSMartin Matuska *
552dbd5678dSMartin Matuska * Unfortunately we cannot reuse do_zfs_log_rename because we we need to call
553dbd5678dSMartin Matuska * zfs_mknode() on replay which requires stashing bits as with TX_CREATE.
554dbd5678dSMartin Matuska */
555dbd5678dSMartin Matuska void
zfs_log_rename_whiteout(zilog_t * zilog,dmu_tx_t * tx,uint64_t txtype,znode_t * sdzp,const char * sname,znode_t * tdzp,const char * dname,znode_t * szp,znode_t * wzp)556dbd5678dSMartin Matuska zfs_log_rename_whiteout(zilog_t *zilog, dmu_tx_t *tx, uint64_t txtype,
557dbd5678dSMartin Matuska znode_t *sdzp, const char *sname, znode_t *tdzp, const char *dname,
558dbd5678dSMartin Matuska znode_t *szp, znode_t *wzp)
559dbd5678dSMartin Matuska {
560dbd5678dSMartin Matuska itx_t *itx;
561dbd5678dSMartin Matuska lr_rename_whiteout_t *lr;
562dbd5678dSMartin Matuska size_t snamesize = strlen(sname) + 1;
563dbd5678dSMartin Matuska size_t dnamesize = strlen(dname) + 1;
564dbd5678dSMartin Matuska
565dbd5678dSMartin Matuska if (zil_replaying(zilog, tx))
566dbd5678dSMartin Matuska return;
567dbd5678dSMartin Matuska
568dbd5678dSMartin Matuska txtype |= TX_RENAME_WHITEOUT;
569dbd5678dSMartin Matuska itx = zil_itx_create(txtype, sizeof (*lr) + snamesize + dnamesize);
570dbd5678dSMartin Matuska lr = (lr_rename_whiteout_t *)&itx->itx_lr;
571dbd5678dSMartin Matuska lr->lr_rename.lr_sdoid = sdzp->z_id;
572dbd5678dSMartin Matuska lr->lr_rename.lr_tdoid = tdzp->z_id;
573dbd5678dSMartin Matuska
574dbd5678dSMartin Matuska /*
575dbd5678dSMartin Matuska * RENAME_WHITEOUT will create an entry at the source znode, so we need
576dbd5678dSMartin Matuska * to store the same data that the equivalent call to zfs_log_create()
577dbd5678dSMartin Matuska * would.
578dbd5678dSMartin Matuska */
579dbd5678dSMartin Matuska lr->lr_wfoid = wzp->z_id;
580dbd5678dSMartin Matuska LR_FOID_SET_SLOTS(lr->lr_wfoid, wzp->z_dnodesize >> DNODE_SHIFT);
581dbd5678dSMartin Matuska (void) sa_lookup(wzp->z_sa_hdl, SA_ZPL_GEN(ZTOZSB(wzp)), &lr->lr_wgen,
582dbd5678dSMartin Matuska sizeof (uint64_t));
583dbd5678dSMartin Matuska (void) sa_lookup(wzp->z_sa_hdl, SA_ZPL_CRTIME(ZTOZSB(wzp)),
584dbd5678dSMartin Matuska lr->lr_wcrtime, sizeof (uint64_t) * 2);
585dbd5678dSMartin Matuska lr->lr_wmode = wzp->z_mode;
586dbd5678dSMartin Matuska lr->lr_wuid = (uint64_t)KUID_TO_SUID(ZTOUID(wzp));
587dbd5678dSMartin Matuska lr->lr_wgid = (uint64_t)KGID_TO_SGID(ZTOGID(wzp));
588dbd5678dSMartin Matuska
589dbd5678dSMartin Matuska /*
590dbd5678dSMartin Matuska * This rdev will always be makdevice(0, 0) but because the ZIL log and
591dbd5678dSMartin Matuska * replay code needs to be platform independent (and there is no
592dbd5678dSMartin Matuska * platform independent makdev()) we need to copy the one created
593dbd5678dSMartin Matuska * during the rename operation.
594dbd5678dSMartin Matuska */
595dbd5678dSMartin Matuska (void) sa_lookup(wzp->z_sa_hdl, SA_ZPL_RDEV(ZTOZSB(wzp)), &lr->lr_wrdev,
596dbd5678dSMartin Matuska sizeof (lr->lr_wrdev));
597dbd5678dSMartin Matuska
5987a7741afSMartin Matuska memcpy(&lr->lr_data[0], sname, snamesize);
5997a7741afSMartin Matuska memcpy(&lr->lr_data[snamesize], dname, dnamesize);
600dbd5678dSMartin Matuska itx->itx_oid = szp->z_id;
601dbd5678dSMartin Matuska
602dbd5678dSMartin Matuska zil_itx_assign(zilog, itx, tx);
603dbd5678dSMartin Matuska }
604dbd5678dSMartin Matuska
605dbd5678dSMartin Matuska /*
606eda14cbcSMatt Macy * zfs_log_write() handles TX_WRITE transactions. The specified callback is
607eda14cbcSMatt Macy * called as soon as the write is on stable storage (be it via a DMU sync or a
608eda14cbcSMatt Macy * ZIL commit).
609eda14cbcSMatt Macy */
610dbd5678dSMartin Matuska static int64_t zfs_immediate_write_sz = 32768;
611eda14cbcSMatt Macy
612eda14cbcSMatt Macy void
zfs_log_write(zilog_t * zilog,dmu_tx_t * tx,int txtype,znode_t * zp,offset_t off,ssize_t resid,boolean_t commit,boolean_t o_direct,zil_callback_t callback,void * callback_data)613eda14cbcSMatt Macy zfs_log_write(zilog_t *zilog, dmu_tx_t *tx, int txtype,
614f8b1db88SMartin Matuska znode_t *zp, offset_t off, ssize_t resid, boolean_t commit,
6157a7741afSMartin Matuska boolean_t o_direct, zil_callback_t callback, void *callback_data)
616eda14cbcSMatt Macy {
617eda14cbcSMatt Macy dmu_buf_impl_t *db = (dmu_buf_impl_t *)sa_get_db(zp->z_sa_hdl);
618eda14cbcSMatt Macy uint32_t blocksize = zp->z_blksz;
619eda14cbcSMatt Macy itx_wr_state_t write_state;
620f9693befSMartin Matuska uint64_t gen = 0;
6213f9d360cSMartin Matuska ssize_t size = resid;
622eda14cbcSMatt Macy
623eda14cbcSMatt Macy if (zil_replaying(zilog, tx) || zp->z_unlinked ||
624eda14cbcSMatt Macy zfs_xattr_owner_unlinked(zp)) {
625eda14cbcSMatt Macy if (callback != NULL)
626eda14cbcSMatt Macy callback(callback_data);
627eda14cbcSMatt Macy return;
628eda14cbcSMatt Macy }
629eda14cbcSMatt Macy
6307a7741afSMartin Matuska if (zilog->zl_logbias == ZFS_LOGBIAS_THROUGHPUT || o_direct)
631eda14cbcSMatt Macy write_state = WR_INDIRECT;
632eda14cbcSMatt Macy else if (!spa_has_slogs(zilog->zl_spa) &&
633eda14cbcSMatt Macy resid >= zfs_immediate_write_sz)
634eda14cbcSMatt Macy write_state = WR_INDIRECT;
635f8b1db88SMartin Matuska else if (commit)
636eda14cbcSMatt Macy write_state = WR_COPIED;
637eda14cbcSMatt Macy else
638eda14cbcSMatt Macy write_state = WR_NEED_COPY;
639eda14cbcSMatt Macy
640f9693befSMartin Matuska (void) sa_lookup(zp->z_sa_hdl, SA_ZPL_GEN(ZTOZSB(zp)), &gen,
641f9693befSMartin Matuska sizeof (gen));
642f9693befSMartin Matuska
643eda14cbcSMatt Macy while (resid) {
644eda14cbcSMatt Macy itx_t *itx;
645eda14cbcSMatt Macy lr_write_t *lr;
646eda14cbcSMatt Macy itx_wr_state_t wr_state = write_state;
647eda14cbcSMatt Macy ssize_t len = resid;
648eda14cbcSMatt Macy
649eda14cbcSMatt Macy /*
650eda14cbcSMatt Macy * A WR_COPIED record must fit entirely in one log block.
651eda14cbcSMatt Macy * Large writes can use WR_NEED_COPY, which the ZIL will
652eda14cbcSMatt Macy * split into multiple records across several log blocks
653eda14cbcSMatt Macy * if necessary.
654eda14cbcSMatt Macy */
655eda14cbcSMatt Macy if (wr_state == WR_COPIED &&
656eda14cbcSMatt Macy resid > zil_max_copied_data(zilog))
657eda14cbcSMatt Macy wr_state = WR_NEED_COPY;
658eda14cbcSMatt Macy else if (wr_state == WR_INDIRECT)
659eda14cbcSMatt Macy len = MIN(blocksize - P2PHASE(off, blocksize), resid);
660eda14cbcSMatt Macy
661eda14cbcSMatt Macy itx = zil_itx_create(txtype, sizeof (*lr) +
662eda14cbcSMatt Macy (wr_state == WR_COPIED ? len : 0));
663eda14cbcSMatt Macy lr = (lr_write_t *)&itx->itx_lr;
664eda14cbcSMatt Macy
665c40487d4SMatt Macy /*
666c40487d4SMatt Macy * For WR_COPIED records, copy the data into the lr_write_t.
667c40487d4SMatt Macy */
668c40487d4SMatt Macy if (wr_state == WR_COPIED) {
669c40487d4SMatt Macy int err;
670eda14cbcSMatt Macy DB_DNODE_ENTER(db);
6717a7741afSMartin Matuska err = dmu_read_by_dnode(DB_DNODE(db), off, len,
6727a7741afSMartin Matuska &lr->lr_data[0], DMU_READ_NO_PREFETCH);
673ce4dcb97SMartin Matuska DB_DNODE_EXIT(db);
674c40487d4SMatt Macy if (err != 0) {
675eda14cbcSMatt Macy zil_itx_destroy(itx);
676eda14cbcSMatt Macy itx = zil_itx_create(txtype, sizeof (*lr));
677eda14cbcSMatt Macy lr = (lr_write_t *)&itx->itx_lr;
678eda14cbcSMatt Macy wr_state = WR_NEED_COPY;
679eda14cbcSMatt Macy }
680c40487d4SMatt Macy }
681eda14cbcSMatt Macy
682eda14cbcSMatt Macy itx->itx_wr_state = wr_state;
683eda14cbcSMatt Macy lr->lr_foid = zp->z_id;
684eda14cbcSMatt Macy lr->lr_offset = off;
685eda14cbcSMatt Macy lr->lr_length = len;
686eda14cbcSMatt Macy lr->lr_blkoff = 0;
687eda14cbcSMatt Macy BP_ZERO(&lr->lr_blkptr);
688eda14cbcSMatt Macy
689eda14cbcSMatt Macy itx->itx_private = ZTOZSB(zp);
690f8b1db88SMartin Matuska itx->itx_sync = (zp->z_sync_cnt != 0);
691f9693befSMartin Matuska itx->itx_gen = gen;
692eda14cbcSMatt Macy
693eda14cbcSMatt Macy itx->itx_callback = callback;
694eda14cbcSMatt Macy itx->itx_callback_data = callback_data;
695eda14cbcSMatt Macy zil_itx_assign(zilog, itx, tx);
696eda14cbcSMatt Macy
697eda14cbcSMatt Macy off += len;
698eda14cbcSMatt Macy resid -= len;
699eda14cbcSMatt Macy }
7003f9d360cSMartin Matuska
7013f9d360cSMartin Matuska if (write_state == WR_COPIED || write_state == WR_NEED_COPY) {
7023f9d360cSMartin Matuska dsl_pool_wrlog_count(zilog->zl_dmu_pool, size, tx->tx_txg);
7033f9d360cSMartin Matuska }
704eda14cbcSMatt Macy }
705eda14cbcSMatt Macy
706eda14cbcSMatt Macy /*
707eda14cbcSMatt Macy * Handles TX_TRUNCATE transactions.
708eda14cbcSMatt Macy */
709eda14cbcSMatt Macy void
zfs_log_truncate(zilog_t * zilog,dmu_tx_t * tx,int txtype,znode_t * zp,uint64_t off,uint64_t len)710eda14cbcSMatt Macy zfs_log_truncate(zilog_t *zilog, dmu_tx_t *tx, int txtype,
711eda14cbcSMatt Macy znode_t *zp, uint64_t off, uint64_t len)
712eda14cbcSMatt Macy {
713eda14cbcSMatt Macy itx_t *itx;
714eda14cbcSMatt Macy lr_truncate_t *lr;
715eda14cbcSMatt Macy
716eda14cbcSMatt Macy if (zil_replaying(zilog, tx) || zp->z_unlinked ||
717eda14cbcSMatt Macy zfs_xattr_owner_unlinked(zp))
718eda14cbcSMatt Macy return;
719eda14cbcSMatt Macy
720eda14cbcSMatt Macy itx = zil_itx_create(txtype, sizeof (*lr));
721eda14cbcSMatt Macy lr = (lr_truncate_t *)&itx->itx_lr;
722eda14cbcSMatt Macy lr->lr_foid = zp->z_id;
723eda14cbcSMatt Macy lr->lr_offset = off;
724eda14cbcSMatt Macy lr->lr_length = len;
725eda14cbcSMatt Macy
726eda14cbcSMatt Macy itx->itx_sync = (zp->z_sync_cnt != 0);
727eda14cbcSMatt Macy zil_itx_assign(zilog, itx, tx);
728eda14cbcSMatt Macy }
729eda14cbcSMatt Macy
730eda14cbcSMatt Macy /*
731eda14cbcSMatt Macy * Handles TX_SETATTR transactions.
732eda14cbcSMatt Macy */
733eda14cbcSMatt Macy void
zfs_log_setattr(zilog_t * zilog,dmu_tx_t * tx,int txtype,znode_t * zp,vattr_t * vap,uint_t mask_applied,zfs_fuid_info_t * fuidp)734eda14cbcSMatt Macy zfs_log_setattr(zilog_t *zilog, dmu_tx_t *tx, int txtype,
735eda14cbcSMatt Macy znode_t *zp, vattr_t *vap, uint_t mask_applied, zfs_fuid_info_t *fuidp)
736eda14cbcSMatt Macy {
737eda14cbcSMatt Macy itx_t *itx;
738eda14cbcSMatt Macy lr_setattr_t *lr;
739eda14cbcSMatt Macy xvattr_t *xvap = (xvattr_t *)vap;
740eda14cbcSMatt Macy size_t recsize = sizeof (lr_setattr_t);
7417a7741afSMartin Matuska uint8_t *start;
742eda14cbcSMatt Macy
743eda14cbcSMatt Macy if (zil_replaying(zilog, tx) || zp->z_unlinked)
744eda14cbcSMatt Macy return;
745eda14cbcSMatt Macy
746eda14cbcSMatt Macy /*
747eda14cbcSMatt Macy * If XVATTR set, then log record size needs to allow
748eda14cbcSMatt Macy * for lr_attr_t + xvattr mask, mapsize and create time
749eda14cbcSMatt Macy * plus actual attribute values
750eda14cbcSMatt Macy */
751eda14cbcSMatt Macy if (vap->va_mask & ATTR_XVATTR)
752eda14cbcSMatt Macy recsize = sizeof (*lr) + ZIL_XVAT_SIZE(xvap->xva_mapsize);
753eda14cbcSMatt Macy
754eda14cbcSMatt Macy if (fuidp)
755eda14cbcSMatt Macy recsize += fuidp->z_domain_str_sz;
756eda14cbcSMatt Macy
757eda14cbcSMatt Macy itx = zil_itx_create(txtype, recsize);
758eda14cbcSMatt Macy lr = (lr_setattr_t *)&itx->itx_lr;
759eda14cbcSMatt Macy lr->lr_foid = zp->z_id;
760eda14cbcSMatt Macy lr->lr_mask = (uint64_t)mask_applied;
761eda14cbcSMatt Macy lr->lr_mode = (uint64_t)vap->va_mode;
762eda14cbcSMatt Macy if ((mask_applied & ATTR_UID) && IS_EPHEMERAL(vap->va_uid))
763eda14cbcSMatt Macy lr->lr_uid = fuidp->z_fuid_owner;
764eda14cbcSMatt Macy else
765eda14cbcSMatt Macy lr->lr_uid = (uint64_t)vap->va_uid;
766eda14cbcSMatt Macy
767eda14cbcSMatt Macy if ((mask_applied & ATTR_GID) && IS_EPHEMERAL(vap->va_gid))
768eda14cbcSMatt Macy lr->lr_gid = fuidp->z_fuid_group;
769eda14cbcSMatt Macy else
770eda14cbcSMatt Macy lr->lr_gid = (uint64_t)vap->va_gid;
771eda14cbcSMatt Macy
772eda14cbcSMatt Macy lr->lr_size = (uint64_t)vap->va_size;
773eda14cbcSMatt Macy ZFS_TIME_ENCODE(&vap->va_atime, lr->lr_atime);
774eda14cbcSMatt Macy ZFS_TIME_ENCODE(&vap->va_mtime, lr->lr_mtime);
7757a7741afSMartin Matuska start = &lr->lr_data[0];
776eda14cbcSMatt Macy if (vap->va_mask & ATTR_XVATTR) {
777eda14cbcSMatt Macy zfs_log_xvattr((lr_attr_t *)start, xvap);
7787a7741afSMartin Matuska start = &lr->lr_data[ZIL_XVAT_SIZE(xvap->xva_mapsize)];
779eda14cbcSMatt Macy }
780eda14cbcSMatt Macy
781eda14cbcSMatt Macy /*
782eda14cbcSMatt Macy * Now stick on domain information if any on end
783eda14cbcSMatt Macy */
784eda14cbcSMatt Macy
785eda14cbcSMatt Macy if (fuidp)
786eda14cbcSMatt Macy (void) zfs_log_fuid_domains(fuidp, start);
787eda14cbcSMatt Macy
788eda14cbcSMatt Macy itx->itx_sync = (zp->z_sync_cnt != 0);
789eda14cbcSMatt Macy zil_itx_assign(zilog, itx, tx);
790eda14cbcSMatt Macy }
791eda14cbcSMatt Macy
792eda14cbcSMatt Macy /*
793c03c5b1cSMartin Matuska * Handles TX_SETSAXATTR transactions.
794c03c5b1cSMartin Matuska */
795c03c5b1cSMartin Matuska void
zfs_log_setsaxattr(zilog_t * zilog,dmu_tx_t * tx,int txtype,znode_t * zp,const char * name,const void * value,size_t size)796c03c5b1cSMartin Matuska zfs_log_setsaxattr(zilog_t *zilog, dmu_tx_t *tx, int txtype,
797c03c5b1cSMartin Matuska znode_t *zp, const char *name, const void *value, size_t size)
798c03c5b1cSMartin Matuska {
799c03c5b1cSMartin Matuska itx_t *itx;
800c03c5b1cSMartin Matuska lr_setsaxattr_t *lr;
801c03c5b1cSMartin Matuska size_t recsize = sizeof (lr_setsaxattr_t);
802c03c5b1cSMartin Matuska int namelen;
803c03c5b1cSMartin Matuska
804c03c5b1cSMartin Matuska if (zil_replaying(zilog, tx) || zp->z_unlinked)
805c03c5b1cSMartin Matuska return;
806c03c5b1cSMartin Matuska
807c03c5b1cSMartin Matuska namelen = strlen(name) + 1;
808c03c5b1cSMartin Matuska recsize += (namelen + size);
809c03c5b1cSMartin Matuska itx = zil_itx_create(txtype, recsize);
810c03c5b1cSMartin Matuska lr = (lr_setsaxattr_t *)&itx->itx_lr;
811c03c5b1cSMartin Matuska lr->lr_foid = zp->z_id;
8127a7741afSMartin Matuska memcpy(&lr->lr_data[0], name, namelen);
813c03c5b1cSMartin Matuska if (value != NULL) {
8147a7741afSMartin Matuska memcpy(&lr->lr_data[namelen], value, size);
815c03c5b1cSMartin Matuska lr->lr_size = size;
816c03c5b1cSMartin Matuska } else {
817c03c5b1cSMartin Matuska lr->lr_size = 0;
818c03c5b1cSMartin Matuska }
819c03c5b1cSMartin Matuska
820c03c5b1cSMartin Matuska itx->itx_sync = (zp->z_sync_cnt != 0);
821c03c5b1cSMartin Matuska zil_itx_assign(zilog, itx, tx);
822c03c5b1cSMartin Matuska }
823c03c5b1cSMartin Matuska
824c03c5b1cSMartin Matuska /*
825eda14cbcSMatt Macy * Handles TX_ACL transactions.
826eda14cbcSMatt Macy */
827eda14cbcSMatt Macy void
zfs_log_acl(zilog_t * zilog,dmu_tx_t * tx,znode_t * zp,vsecattr_t * vsecp,zfs_fuid_info_t * fuidp)828eda14cbcSMatt Macy zfs_log_acl(zilog_t *zilog, dmu_tx_t *tx, znode_t *zp,
829eda14cbcSMatt Macy vsecattr_t *vsecp, zfs_fuid_info_t *fuidp)
830eda14cbcSMatt Macy {
831eda14cbcSMatt Macy itx_t *itx;
832eda14cbcSMatt Macy lr_acl_v0_t *lrv0;
833eda14cbcSMatt Macy lr_acl_t *lr;
834eda14cbcSMatt Macy int txtype;
835eda14cbcSMatt Macy int lrsize;
836eda14cbcSMatt Macy size_t txsize;
837eda14cbcSMatt Macy size_t aclbytes = vsecp->vsa_aclentsz;
838eda14cbcSMatt Macy
839eda14cbcSMatt Macy if (zil_replaying(zilog, tx) || zp->z_unlinked)
840eda14cbcSMatt Macy return;
841eda14cbcSMatt Macy
842eda14cbcSMatt Macy txtype = (ZTOZSB(zp)->z_version < ZPL_VERSION_FUID) ?
843eda14cbcSMatt Macy TX_ACL_V0 : TX_ACL;
844eda14cbcSMatt Macy
845eda14cbcSMatt Macy if (txtype == TX_ACL)
846eda14cbcSMatt Macy lrsize = sizeof (*lr);
847eda14cbcSMatt Macy else
848eda14cbcSMatt Macy lrsize = sizeof (*lrv0);
849eda14cbcSMatt Macy
850eda14cbcSMatt Macy txsize = lrsize +
851eda14cbcSMatt Macy ((txtype == TX_ACL) ? ZIL_ACE_LENGTH(aclbytes) : aclbytes) +
852eda14cbcSMatt Macy (fuidp ? fuidp->z_domain_str_sz : 0) +
853eda14cbcSMatt Macy sizeof (uint64_t) * (fuidp ? fuidp->z_fuid_cnt : 0);
854eda14cbcSMatt Macy
855eda14cbcSMatt Macy itx = zil_itx_create(txtype, txsize);
856eda14cbcSMatt Macy
857eda14cbcSMatt Macy lr = (lr_acl_t *)&itx->itx_lr;
858eda14cbcSMatt Macy lr->lr_foid = zp->z_id;
859eda14cbcSMatt Macy if (txtype == TX_ACL) {
860eda14cbcSMatt Macy lr->lr_acl_bytes = aclbytes;
861eda14cbcSMatt Macy lr->lr_domcnt = fuidp ? fuidp->z_domain_cnt : 0;
862eda14cbcSMatt Macy lr->lr_fuidcnt = fuidp ? fuidp->z_fuid_cnt : 0;
863eda14cbcSMatt Macy if (vsecp->vsa_mask & VSA_ACE_ACLFLAGS)
864eda14cbcSMatt Macy lr->lr_acl_flags = (uint64_t)vsecp->vsa_aclflags;
865eda14cbcSMatt Macy else
866eda14cbcSMatt Macy lr->lr_acl_flags = 0;
867eda14cbcSMatt Macy }
868eda14cbcSMatt Macy lr->lr_aclcnt = (uint64_t)vsecp->vsa_aclcnt;
869eda14cbcSMatt Macy
870eda14cbcSMatt Macy if (txtype == TX_ACL_V0) {
871eda14cbcSMatt Macy lrv0 = (lr_acl_v0_t *)lr;
8727a7741afSMartin Matuska memcpy(&lrv0->lr_data[0], vsecp->vsa_aclentp, aclbytes);
873eda14cbcSMatt Macy } else {
8747a7741afSMartin Matuska uint8_t *start = &lr->lr_data[0];
875eda14cbcSMatt Macy
876da5137abSMartin Matuska memcpy(start, vsecp->vsa_aclentp, aclbytes);
877eda14cbcSMatt Macy
8787a7741afSMartin Matuska start = &lr->lr_data[ZIL_ACE_LENGTH(aclbytes)];
879eda14cbcSMatt Macy
880eda14cbcSMatt Macy if (fuidp) {
881eda14cbcSMatt Macy start = zfs_log_fuid_ids(fuidp, start);
882eda14cbcSMatt Macy (void) zfs_log_fuid_domains(fuidp, start);
883eda14cbcSMatt Macy }
884eda14cbcSMatt Macy }
885eda14cbcSMatt Macy
886eda14cbcSMatt Macy itx->itx_sync = (zp->z_sync_cnt != 0);
887eda14cbcSMatt Macy zil_itx_assign(zilog, itx, tx);
888eda14cbcSMatt Macy }
889eda14cbcSMatt Macy
8902a58b312SMartin Matuska /*
8912a58b312SMartin Matuska * Handles TX_CLONE_RANGE transactions.
8922a58b312SMartin Matuska */
8932a58b312SMartin Matuska void
zfs_log_clone_range(zilog_t * zilog,dmu_tx_t * tx,int txtype,znode_t * zp,uint64_t off,uint64_t len,uint64_t blksz,const blkptr_t * bps,size_t nbps)8942a58b312SMartin Matuska zfs_log_clone_range(zilog_t *zilog, dmu_tx_t *tx, int txtype, znode_t *zp,
8952a58b312SMartin Matuska uint64_t off, uint64_t len, uint64_t blksz, const blkptr_t *bps,
8962a58b312SMartin Matuska size_t nbps)
8972a58b312SMartin Matuska {
8982a58b312SMartin Matuska itx_t *itx;
8992a58b312SMartin Matuska lr_clone_range_t *lr;
9002a58b312SMartin Matuska uint64_t partlen, max_log_data;
901aca928a5SMartin Matuska size_t partnbps;
9022a58b312SMartin Matuska
9031959e122SPawel Jakub Dawidek if (zil_replaying(zilog, tx) || zp->z_unlinked)
9042a58b312SMartin Matuska return;
9052a58b312SMartin Matuska
9062a58b312SMartin Matuska max_log_data = zil_max_log_data(zilog, sizeof (lr_clone_range_t));
9072a58b312SMartin Matuska
9082a58b312SMartin Matuska while (nbps > 0) {
9092a58b312SMartin Matuska partnbps = MIN(nbps, max_log_data / sizeof (bps[0]));
910aca928a5SMartin Matuska partlen = partnbps * blksz;
911aca928a5SMartin Matuska ASSERT3U(partlen, <, len + blksz);
9122a58b312SMartin Matuska partlen = MIN(partlen, len);
9132a58b312SMartin Matuska
9142a58b312SMartin Matuska itx = zil_itx_create(txtype,
9152a58b312SMartin Matuska sizeof (*lr) + sizeof (bps[0]) * partnbps);
9162a58b312SMartin Matuska lr = (lr_clone_range_t *)&itx->itx_lr;
9172a58b312SMartin Matuska lr->lr_foid = zp->z_id;
9182a58b312SMartin Matuska lr->lr_offset = off;
9192a58b312SMartin Matuska lr->lr_length = partlen;
9202a58b312SMartin Matuska lr->lr_blksz = blksz;
9212a58b312SMartin Matuska lr->lr_nbps = partnbps;
9222a58b312SMartin Matuska memcpy(lr->lr_bps, bps, sizeof (bps[0]) * partnbps);
9232a58b312SMartin Matuska
9242a58b312SMartin Matuska itx->itx_sync = (zp->z_sync_cnt != 0);
9252a58b312SMartin Matuska
9262a58b312SMartin Matuska zil_itx_assign(zilog, itx, tx);
9272a58b312SMartin Matuska
9282a58b312SMartin Matuska bps += partnbps;
9292a58b312SMartin Matuska ASSERT3U(nbps, >=, partnbps);
9302a58b312SMartin Matuska nbps -= partnbps;
9312a58b312SMartin Matuska off += partlen;
9322a58b312SMartin Matuska ASSERT3U(len, >=, partlen);
9332a58b312SMartin Matuska len -= partlen;
9342a58b312SMartin Matuska }
9352a58b312SMartin Matuska }
9362a58b312SMartin Matuska
937dbd5678dSMartin Matuska ZFS_MODULE_PARAM(zfs, zfs_, immediate_write_sz, S64, ZMOD_RW,
938eda14cbcSMatt Macy "Largest data block to write to zil");
939