1168404Spjd/* 2168404Spjd * CDDL HEADER START 3168404Spjd * 4168404Spjd * The contents of this file are subject to the terms of the 5168404Spjd * Common Development and Distribution License (the "License"). 6168404Spjd * You may not use this file except in compliance with the License. 7168404Spjd * 8168404Spjd * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE 9168404Spjd * or http://www.opensolaris.org/os/licensing. 10168404Spjd * See the License for the specific language governing permissions 11168404Spjd * and limitations under the License. 12168404Spjd * 13168404Spjd * When distributing Covered Code, include this CDDL HEADER in each 14168404Spjd * file and include the License file at usr/src/OPENSOLARIS.LICENSE. 15168404Spjd * If applicable, add the following below this CDDL HEADER, with the 16168404Spjd * fields enclosed by brackets "[]" replaced with your own identifying 17168404Spjd * information: Portions Copyright [yyyy] [name of copyright owner] 18168404Spjd * 19168404Spjd * CDDL HEADER END 20168404Spjd */ 21168404Spjd/* 22219089Spjd * Copyright (c) 2005, 2010, Oracle and/or its affiliates. All rights reserved. 23290765Smav * Copyright (c) 2015 by Delphix. All rights reserved. 24297112Smav * Copyright (c) 2014 Integros [integros.com] 25168404Spjd */ 26168404Spjd 27168404Spjd#include <sys/types.h> 28168404Spjd#include <sys/param.h> 29168404Spjd#include <sys/systm.h> 30168404Spjd#include <sys/sysmacros.h> 31168404Spjd#include <sys/cmn_err.h> 32168404Spjd#include <sys/kmem.h> 33168404Spjd#include <sys/file.h> 34168404Spjd#include <sys/vfs.h> 35168404Spjd#include <sys/zfs_znode.h> 36168404Spjd#include <sys/zfs_dir.h> 37168404Spjd#include <sys/zil.h> 38185029Spjd#include <sys/zil_impl.h> 39168404Spjd#include <sys/byteorder.h> 40168962Spjd#include <sys/policy.h> 41168404Spjd#include <sys/stat.h> 42168404Spjd#include <sys/acl.h> 43168404Spjd#include <sys/dmu.h> 44168404Spjd#include <sys/spa.h> 45185029Spjd#include <sys/zfs_fuid.h> 46209962Smm#include <sys/dsl_dataset.h> 47168404Spjd 48168404Spjd/* 49209962Smm * These zfs_log_* functions must be called within a dmu tx, in one 50209962Smm * of 2 contexts depending on zilog->z_replay: 51209962Smm * 52209962Smm * Non replay mode 53209962Smm * --------------- 54209962Smm * We need to record the transaction so that if it is committed to 55209962Smm * the Intent Log then it can be replayed. An intent log transaction 56209962Smm * structure (itx_t) is allocated and all the information necessary to 57209962Smm * possibly replay the transaction is saved in it. The itx is then assigned 58209962Smm * a sequence number and inserted in the in-memory list anchored in the zilog. 59209962Smm * 60209962Smm * Replay mode 61209962Smm * ----------- 62209962Smm * We need to mark the intent log record as replayed in the log header. 63209962Smm * This is done in the same transaction as the replay so that they 64209962Smm * commit atomically. 65168404Spjd */ 66168404Spjd 67185029Spjdint 68185029Spjdzfs_log_create_txtype(zil_create_t type, vsecattr_t *vsecp, vattr_t *vap) 69185029Spjd{ 70185029Spjd int isxvattr = (vap->va_mask & AT_XVATTR); 71185029Spjd switch (type) { 72185029Spjd case Z_FILE: 73185029Spjd if (vsecp == NULL && !isxvattr) 74185029Spjd return (TX_CREATE); 75185029Spjd if (vsecp && isxvattr) 76185321Strasz#ifdef TODO 77185029Spjd return (TX_CREATE_ACL_ATTR); 78185321Strasz#else 79185321Strasz panic("%s:%u: unsupported condition", __func__, __LINE__); 80185321Strasz#endif 81185029Spjd if (vsecp) 82185029Spjd return (TX_CREATE_ACL); 83185029Spjd else 84185029Spjd return (TX_CREATE_ATTR); 85185029Spjd /*NOTREACHED*/ 86185029Spjd case Z_DIR: 87185029Spjd if (vsecp == NULL && !isxvattr) 88185029Spjd return (TX_MKDIR); 89185029Spjd if (vsecp && isxvattr) 90185321Strasz#ifdef TODO 91185029Spjd return (TX_MKDIR_ACL_ATTR); 92185321Strasz#else 93185321Strasz panic("%s:%u: unsupported condition", __func__, __LINE__); 94185321Strasz#endif 95185029Spjd if (vsecp) 96185029Spjd return (TX_MKDIR_ACL); 97185029Spjd else 98185029Spjd return (TX_MKDIR_ATTR); 99185029Spjd case Z_XATTRDIR: 100185029Spjd return (TX_MKXATTR); 101185029Spjd } 102185029Spjd ASSERT(0); 103185029Spjd return (TX_MAX_TYPE); 104185029Spjd} 105185029Spjd 106168404Spjd/* 107185029Spjd * build up the log data necessary for logging xvattr_t 108185029Spjd * First lr_attr_t is initialized. following the lr_attr_t 109185029Spjd * is the mapsize and attribute bitmap copied from the xvattr_t. 110185029Spjd * Following the bitmap and bitmapsize two 64 bit words are reserved 111185029Spjd * for the create time which may be set. Following the create time 112185029Spjd * records a single 64 bit integer which has the bits to set on 113185029Spjd * replay for the xvattr. 114185029Spjd */ 115185029Spjdstatic void 116185029Spjdzfs_log_xvattr(lr_attr_t *lrattr, xvattr_t *xvap) 117185029Spjd{ 118185029Spjd uint32_t *bitmap; 119185029Spjd uint64_t *attrs; 120185029Spjd uint64_t *crtime; 121185029Spjd xoptattr_t *xoap; 122185029Spjd void *scanstamp; 123185029Spjd int i; 124185029Spjd 125185029Spjd xoap = xva_getxoptattr(xvap); 126185029Spjd ASSERT(xoap); 127185029Spjd 128185029Spjd lrattr->lr_attr_masksize = xvap->xva_mapsize; 129185029Spjd bitmap = &lrattr->lr_attr_bitmap; 130185029Spjd for (i = 0; i != xvap->xva_mapsize; i++, bitmap++) { 131185029Spjd *bitmap = xvap->xva_reqattrmap[i]; 132185029Spjd } 133185029Spjd 134185029Spjd /* Now pack the attributes up in a single uint64_t */ 135185029Spjd attrs = (uint64_t *)bitmap; 136185029Spjd crtime = attrs + 1; 137185029Spjd scanstamp = (caddr_t)(crtime + 2); 138185029Spjd *attrs = 0; 139185029Spjd if (XVA_ISSET_REQ(xvap, XAT_READONLY)) 140185029Spjd *attrs |= (xoap->xoa_readonly == 0) ? 0 : 141185029Spjd XAT0_READONLY; 142185029Spjd if (XVA_ISSET_REQ(xvap, XAT_HIDDEN)) 143185029Spjd *attrs |= (xoap->xoa_hidden == 0) ? 0 : 144185029Spjd XAT0_HIDDEN; 145185029Spjd if (XVA_ISSET_REQ(xvap, XAT_SYSTEM)) 146185029Spjd *attrs |= (xoap->xoa_system == 0) ? 0 : 147185029Spjd XAT0_SYSTEM; 148185029Spjd if (XVA_ISSET_REQ(xvap, XAT_ARCHIVE)) 149185029Spjd *attrs |= (xoap->xoa_archive == 0) ? 0 : 150185029Spjd XAT0_ARCHIVE; 151185029Spjd if (XVA_ISSET_REQ(xvap, XAT_IMMUTABLE)) 152185029Spjd *attrs |= (xoap->xoa_immutable == 0) ? 0 : 153185029Spjd XAT0_IMMUTABLE; 154185029Spjd if (XVA_ISSET_REQ(xvap, XAT_NOUNLINK)) 155185029Spjd *attrs |= (xoap->xoa_nounlink == 0) ? 0 : 156185029Spjd XAT0_NOUNLINK; 157185029Spjd if (XVA_ISSET_REQ(xvap, XAT_APPENDONLY)) 158185029Spjd *attrs |= (xoap->xoa_appendonly == 0) ? 0 : 159185029Spjd XAT0_APPENDONLY; 160185029Spjd if (XVA_ISSET_REQ(xvap, XAT_OPAQUE)) 161185029Spjd *attrs |= (xoap->xoa_opaque == 0) ? 0 : 162185029Spjd XAT0_APPENDONLY; 163185029Spjd if (XVA_ISSET_REQ(xvap, XAT_NODUMP)) 164185029Spjd *attrs |= (xoap->xoa_nodump == 0) ? 0 : 165185029Spjd XAT0_NODUMP; 166185029Spjd if (XVA_ISSET_REQ(xvap, XAT_AV_QUARANTINED)) 167185029Spjd *attrs |= (xoap->xoa_av_quarantined == 0) ? 0 : 168185029Spjd XAT0_AV_QUARANTINED; 169185029Spjd if (XVA_ISSET_REQ(xvap, XAT_AV_MODIFIED)) 170185029Spjd *attrs |= (xoap->xoa_av_modified == 0) ? 0 : 171185029Spjd XAT0_AV_MODIFIED; 172185029Spjd if (XVA_ISSET_REQ(xvap, XAT_CREATETIME)) 173185029Spjd ZFS_TIME_ENCODE(&xoap->xoa_createtime, crtime); 174185029Spjd if (XVA_ISSET_REQ(xvap, XAT_AV_SCANSTAMP)) 175185029Spjd bcopy(xoap->xoa_av_scanstamp, scanstamp, AV_SCANSTAMP_SZ); 176219089Spjd if (XVA_ISSET_REQ(xvap, XAT_REPARSE)) 177219089Spjd *attrs |= (xoap->xoa_reparse == 0) ? 0 : 178219089Spjd XAT0_REPARSE; 179219089Spjd if (XVA_ISSET_REQ(xvap, XAT_OFFLINE)) 180219089Spjd *attrs |= (xoap->xoa_offline == 0) ? 0 : 181219089Spjd XAT0_OFFLINE; 182219089Spjd if (XVA_ISSET_REQ(xvap, XAT_SPARSE)) 183219089Spjd *attrs |= (xoap->xoa_sparse == 0) ? 0 : 184219089Spjd XAT0_SPARSE; 185185029Spjd} 186185029Spjd 187185029Spjdstatic void * 188185029Spjdzfs_log_fuid_ids(zfs_fuid_info_t *fuidp, void *start) 189185029Spjd{ 190185029Spjd zfs_fuid_t *zfuid; 191185029Spjd uint64_t *fuidloc = start; 192185029Spjd 193185029Spjd /* First copy in the ACE FUIDs */ 194185029Spjd for (zfuid = list_head(&fuidp->z_fuids); zfuid; 195185029Spjd zfuid = list_next(&fuidp->z_fuids, zfuid)) { 196185029Spjd *fuidloc++ = zfuid->z_logfuid; 197185029Spjd } 198185029Spjd return (fuidloc); 199185029Spjd} 200185029Spjd 201185029Spjd 202185029Spjdstatic void * 203185029Spjdzfs_log_fuid_domains(zfs_fuid_info_t *fuidp, void *start) 204185029Spjd{ 205185029Spjd zfs_fuid_domain_t *zdomain; 206185029Spjd 207185029Spjd /* now copy in the domain info, if any */ 208185029Spjd if (fuidp->z_domain_str_sz != 0) { 209185029Spjd for (zdomain = list_head(&fuidp->z_domains); zdomain; 210185029Spjd zdomain = list_next(&fuidp->z_domains, zdomain)) { 211185029Spjd bcopy((void *)zdomain->z_domain, start, 212185029Spjd strlen(zdomain->z_domain) + 1); 213185029Spjd start = (caddr_t)start + 214185029Spjd strlen(zdomain->z_domain) + 1; 215185029Spjd } 216185029Spjd } 217185029Spjd return (start); 218185029Spjd} 219185029Spjd 220185029Spjd/* 221251631Sdelphij * Handles TX_CREATE, TX_CREATE_ATTR, TX_MKDIR, TX_MKDIR_ATTR and 222251631Sdelphij * TK_MKXATTR transactions. 223185029Spjd * 224185029Spjd * TX_CREATE and TX_MKDIR are standard creates, but they may have FUID 225185029Spjd * domain information appended prior to the name. In this case the 226185029Spjd * uid/gid in the log record will be a log centric FUID. 227185029Spjd * 228185029Spjd * TX_CREATE_ACL_ATTR and TX_MKDIR_ACL_ATTR handle special creates that 229185029Spjd * may contain attributes, ACL and optional fuid information. 230185029Spjd * 231185029Spjd * TX_CREATE_ACL and TX_MKDIR_ACL handle special creates that specify 232185029Spjd * and ACL and normal users/groups in the ACEs. 233185029Spjd * 234185029Spjd * There may be an optional xvattr attribute information similar 235185029Spjd * to zfs_log_setattr. 236185029Spjd * 237185029Spjd * Also, after the file name "domain" strings may be appended. 238168404Spjd */ 239168404Spjdvoid 240185029Spjdzfs_log_create(zilog_t *zilog, dmu_tx_t *tx, uint64_t txtype, 241185029Spjd znode_t *dzp, znode_t *zp, char *name, vsecattr_t *vsecp, 242185029Spjd zfs_fuid_info_t *fuidp, vattr_t *vap) 243168404Spjd{ 244168404Spjd itx_t *itx; 245168404Spjd lr_create_t *lr; 246185029Spjd lr_acl_create_t *lracl; 247247187Smm size_t aclsize = (vsecp != NULL) ? vsecp->vsa_aclentsz : 0; 248185029Spjd size_t xvatsize = 0; 249185029Spjd size_t txsize; 250185029Spjd xvattr_t *xvap = (xvattr_t *)vap; 251185029Spjd void *end; 252185029Spjd size_t lrsize; 253168404Spjd size_t namesize = strlen(name) + 1; 254185029Spjd size_t fuidsz = 0; 255168404Spjd 256219089Spjd if (zil_replaying(zilog, tx)) 257168404Spjd return; 258168404Spjd 259185029Spjd /* 260185029Spjd * If we have FUIDs present then add in space for 261185029Spjd * domains and ACE fuid's if any. 262185029Spjd */ 263185029Spjd if (fuidp) { 264185029Spjd fuidsz += fuidp->z_domain_str_sz; 265185029Spjd fuidsz += fuidp->z_fuid_cnt * sizeof (uint64_t); 266185029Spjd } 267185029Spjd 268185029Spjd if (vap->va_mask & AT_XVATTR) 269185029Spjd xvatsize = ZIL_XVAT_SIZE(xvap->xva_mapsize); 270185029Spjd 271185029Spjd if ((int)txtype == TX_CREATE_ATTR || (int)txtype == TX_MKDIR_ATTR || 272185029Spjd (int)txtype == TX_CREATE || (int)txtype == TX_MKDIR || 273185029Spjd (int)txtype == TX_MKXATTR) { 274185029Spjd txsize = sizeof (*lr) + namesize + fuidsz + xvatsize; 275185029Spjd lrsize = sizeof (*lr); 276185029Spjd } else { 277185029Spjd txsize = 278185029Spjd sizeof (lr_acl_create_t) + namesize + fuidsz + 279185029Spjd ZIL_ACE_LENGTH(aclsize) + xvatsize; 280185029Spjd lrsize = sizeof (lr_acl_create_t); 281185029Spjd } 282185029Spjd 283185029Spjd itx = zil_itx_create(txtype, txsize); 284185029Spjd 285168404Spjd lr = (lr_create_t *)&itx->itx_lr; 286168404Spjd lr->lr_doid = dzp->z_id; 287168404Spjd lr->lr_foid = zp->z_id; 288219089Spjd lr->lr_mode = zp->z_mode; 289219089Spjd if (!IS_EPHEMERAL(zp->z_uid)) { 290219089Spjd lr->lr_uid = (uint64_t)zp->z_uid; 291185029Spjd } else { 292185029Spjd lr->lr_uid = fuidp->z_fuid_owner; 293185029Spjd } 294219089Spjd if (!IS_EPHEMERAL(zp->z_gid)) { 295219089Spjd lr->lr_gid = (uint64_t)zp->z_gid; 296185029Spjd } else { 297185029Spjd lr->lr_gid = fuidp->z_fuid_group; 298185029Spjd } 299219089Spjd (void) sa_lookup(zp->z_sa_hdl, SA_ZPL_GEN(zp->z_zfsvfs), &lr->lr_gen, 300219089Spjd sizeof (uint64_t)); 301219089Spjd (void) sa_lookup(zp->z_sa_hdl, SA_ZPL_CRTIME(zp->z_zfsvfs), 302219089Spjd lr->lr_crtime, sizeof (uint64_t) * 2); 303168404Spjd 304219089Spjd if (sa_lookup(zp->z_sa_hdl, SA_ZPL_RDEV(zp->z_zfsvfs), &lr->lr_rdev, 305219089Spjd sizeof (lr->lr_rdev)) != 0) 306219089Spjd lr->lr_rdev = 0; 307219089Spjd 308185029Spjd /* 309185029Spjd * Fill in xvattr info if any 310185029Spjd */ 311185029Spjd if (vap->va_mask & AT_XVATTR) { 312185029Spjd zfs_log_xvattr((lr_attr_t *)((caddr_t)lr + lrsize), xvap); 313185029Spjd end = (caddr_t)lr + lrsize + xvatsize; 314185029Spjd } else { 315185029Spjd end = (caddr_t)lr + lrsize; 316185029Spjd } 317185029Spjd 318185029Spjd /* Now fill in any ACL info */ 319185029Spjd 320185029Spjd if (vsecp) { 321185029Spjd lracl = (lr_acl_create_t *)&itx->itx_lr; 322185029Spjd lracl->lr_aclcnt = vsecp->vsa_aclcnt; 323185029Spjd lracl->lr_acl_bytes = aclsize; 324185029Spjd lracl->lr_domcnt = fuidp ? fuidp->z_domain_cnt : 0; 325185029Spjd lracl->lr_fuidcnt = fuidp ? fuidp->z_fuid_cnt : 0; 326185029Spjd if (vsecp->vsa_aclflags & VSA_ACE_ACLFLAGS) 327185029Spjd lracl->lr_acl_flags = (uint64_t)vsecp->vsa_aclflags; 328185029Spjd else 329185029Spjd lracl->lr_acl_flags = 0; 330185029Spjd 331185029Spjd bcopy(vsecp->vsa_aclentp, end, aclsize); 332185029Spjd end = (caddr_t)end + ZIL_ACE_LENGTH(aclsize); 333185029Spjd } 334185029Spjd 335185029Spjd /* drop in FUID info */ 336185029Spjd if (fuidp) { 337185029Spjd end = zfs_log_fuid_ids(fuidp, end); 338185029Spjd end = zfs_log_fuid_domains(fuidp, end); 339185029Spjd } 340185029Spjd /* 341185029Spjd * Now place file name in log record 342185029Spjd */ 343185029Spjd bcopy(name, end, namesize); 344185029Spjd 345219089Spjd zil_itx_assign(zilog, itx, tx); 346168404Spjd} 347168404Spjd 348168404Spjd/* 349251631Sdelphij * Handles both TX_REMOVE and TX_RMDIR transactions. 350168404Spjd */ 351168404Spjdvoid 352185029Spjdzfs_log_remove(zilog_t *zilog, dmu_tx_t *tx, uint64_t txtype, 353290765Smav znode_t *dzp, char *name, uint64_t foid) 354168404Spjd{ 355168404Spjd itx_t *itx; 356168404Spjd lr_remove_t *lr; 357168404Spjd size_t namesize = strlen(name) + 1; 358168404Spjd 359219089Spjd if (zil_replaying(zilog, tx)) 360168404Spjd return; 361168404Spjd 362168404Spjd itx = zil_itx_create(txtype, sizeof (*lr) + namesize); 363168404Spjd lr = (lr_remove_t *)&itx->itx_lr; 364168404Spjd lr->lr_doid = dzp->z_id; 365168404Spjd bcopy(name, (char *)(lr + 1), namesize); 366168404Spjd 367219089Spjd itx->itx_oid = foid; 368219089Spjd 369219089Spjd zil_itx_assign(zilog, itx, tx); 370168404Spjd} 371168404Spjd 372168404Spjd/* 373251631Sdelphij * Handles TX_LINK transactions. 374168404Spjd */ 375168404Spjdvoid 376185029Spjdzfs_log_link(zilog_t *zilog, dmu_tx_t *tx, uint64_t txtype, 377290765Smav znode_t *dzp, znode_t *zp, char *name) 378168404Spjd{ 379168404Spjd itx_t *itx; 380168404Spjd lr_link_t *lr; 381168404Spjd size_t namesize = strlen(name) + 1; 382168404Spjd 383219089Spjd if (zil_replaying(zilog, tx)) 384168404Spjd return; 385168404Spjd 386168404Spjd itx = zil_itx_create(txtype, sizeof (*lr) + namesize); 387168404Spjd lr = (lr_link_t *)&itx->itx_lr; 388168404Spjd lr->lr_doid = dzp->z_id; 389168404Spjd lr->lr_link_obj = zp->z_id; 390168404Spjd bcopy(name, (char *)(lr + 1), namesize); 391168404Spjd 392219089Spjd zil_itx_assign(zilog, itx, tx); 393168404Spjd} 394168404Spjd 395168404Spjd/* 396251631Sdelphij * Handles TX_SYMLINK transactions. 397168404Spjd */ 398168404Spjdvoid 399185029Spjdzfs_log_symlink(zilog_t *zilog, dmu_tx_t *tx, uint64_t txtype, 400185029Spjd znode_t *dzp, znode_t *zp, char *name, char *link) 401168404Spjd{ 402168404Spjd itx_t *itx; 403168404Spjd lr_create_t *lr; 404168404Spjd size_t namesize = strlen(name) + 1; 405168404Spjd size_t linksize = strlen(link) + 1; 406168404Spjd 407219089Spjd if (zil_replaying(zilog, tx)) 408168404Spjd return; 409168404Spjd 410168404Spjd itx = zil_itx_create(txtype, sizeof (*lr) + namesize + linksize); 411168404Spjd lr = (lr_create_t *)&itx->itx_lr; 412168404Spjd lr->lr_doid = dzp->z_id; 413168404Spjd lr->lr_foid = zp->z_id; 414219089Spjd lr->lr_uid = zp->z_uid; 415219089Spjd lr->lr_gid = zp->z_gid; 416219089Spjd lr->lr_mode = zp->z_mode; 417219089Spjd (void) sa_lookup(zp->z_sa_hdl, SA_ZPL_GEN(zp->z_zfsvfs), &lr->lr_gen, 418219089Spjd sizeof (uint64_t)); 419219089Spjd (void) sa_lookup(zp->z_sa_hdl, SA_ZPL_CRTIME(zp->z_zfsvfs), 420219089Spjd lr->lr_crtime, sizeof (uint64_t) * 2); 421168404Spjd bcopy(name, (char *)(lr + 1), namesize); 422168404Spjd bcopy(link, (char *)(lr + 1) + namesize, linksize); 423168404Spjd 424219089Spjd zil_itx_assign(zilog, itx, tx); 425168404Spjd} 426168404Spjd 427168404Spjd/* 428251631Sdelphij * Handles TX_RENAME transactions. 429168404Spjd */ 430168404Spjdvoid 431185029Spjdzfs_log_rename(zilog_t *zilog, dmu_tx_t *tx, uint64_t txtype, 432290765Smav znode_t *sdzp, char *sname, znode_t *tdzp, char *dname, znode_t *szp) 433168404Spjd{ 434168404Spjd itx_t *itx; 435168404Spjd lr_rename_t *lr; 436168404Spjd size_t snamesize = strlen(sname) + 1; 437168404Spjd size_t dnamesize = strlen(dname) + 1; 438168404Spjd 439219089Spjd if (zil_replaying(zilog, tx)) 440168404Spjd return; 441168404Spjd 442168404Spjd itx = zil_itx_create(txtype, sizeof (*lr) + snamesize + dnamesize); 443168404Spjd lr = (lr_rename_t *)&itx->itx_lr; 444168404Spjd lr->lr_sdoid = sdzp->z_id; 445168404Spjd lr->lr_tdoid = tdzp->z_id; 446168404Spjd bcopy(sname, (char *)(lr + 1), snamesize); 447168404Spjd bcopy(dname, (char *)(lr + 1) + snamesize, dnamesize); 448219089Spjd itx->itx_oid = szp->z_id; 449168404Spjd 450219089Spjd zil_itx_assign(zilog, itx, tx); 451168404Spjd} 452168404Spjd 453168404Spjd/* 454251631Sdelphij * Handles TX_WRITE transactions. 455168404Spjd */ 456168404Spjdssize_t zfs_immediate_write_sz = 32768; 457168404Spjd 458168404Spjdvoid 459168404Spjdzfs_log_write(zilog_t *zilog, dmu_tx_t *tx, int txtype, 460290765Smav znode_t *zp, offset_t off, ssize_t resid, int ioflag) 461168404Spjd{ 462320496Savg uint32_t blocksize = zp->z_blksz; 463168404Spjd itx_wr_state_t write_state; 464185029Spjd uintptr_t fsync_cnt; 465168404Spjd 466219089Spjd if (zil_replaying(zilog, tx) || zp->z_unlinked) 467168404Spjd return; 468168404Spjd 469320496Savg if (zilog->zl_logbias == ZFS_LOGBIAS_THROUGHPUT) 470168404Spjd write_state = WR_INDIRECT; 471320496Savg else if (!spa_has_slogs(zilog->zl_spa) && 472320496Savg resid >= zfs_immediate_write_sz) 473320496Savg write_state = WR_INDIRECT; 474185029Spjd else if (ioflag & (FSYNC | FDSYNC)) 475168404Spjd write_state = WR_COPIED; 476168404Spjd else 477168404Spjd write_state = WR_NEED_COPY; 478168404Spjd 479185029Spjd if ((fsync_cnt = (uintptr_t)tsd_get(zfs_fsyncer_key)) != 0) { 480185029Spjd (void) tsd_set(zfs_fsyncer_key, (void *)(fsync_cnt - 1)); 481185029Spjd } 482185029Spjd 483185029Spjd while (resid) { 484185029Spjd itx_t *itx; 485185029Spjd lr_write_t *lr; 486320496Savg itx_wr_state_t wr_state = write_state; 487320496Savg ssize_t len = resid; 488185029Spjd 489320496Savg if (wr_state == WR_COPIED && resid > ZIL_MAX_COPIED_DATA) 490320496Savg wr_state = WR_NEED_COPY; 491320496Savg else if (wr_state == WR_INDIRECT) 492320496Savg len = MIN(blocksize - P2PHASE(off, blocksize), resid); 493185029Spjd 494185029Spjd itx = zil_itx_create(txtype, sizeof (*lr) + 495320496Savg (wr_state == WR_COPIED ? len : 0)); 496185029Spjd lr = (lr_write_t *)&itx->itx_lr; 497320496Savg if (wr_state == WR_COPIED && dmu_read(zp->z_zfsvfs->z_os, 498209962Smm zp->z_id, off, len, lr + 1, DMU_READ_NO_PREFETCH) != 0) { 499219089Spjd zil_itx_destroy(itx); 500168404Spjd itx = zil_itx_create(txtype, sizeof (*lr)); 501168404Spjd lr = (lr_write_t *)&itx->itx_lr; 502320496Savg wr_state = WR_NEED_COPY; 503168404Spjd } 504168404Spjd 505320496Savg itx->itx_wr_state = wr_state; 506185029Spjd lr->lr_foid = zp->z_id; 507185029Spjd lr->lr_offset = off; 508185029Spjd lr->lr_length = len; 509185029Spjd lr->lr_blkoff = 0; 510185029Spjd BP_ZERO(&lr->lr_blkptr); 511168404Spjd 512185029Spjd itx->itx_private = zp->z_zfsvfs; 513168404Spjd 514219089Spjd if (!(ioflag & (FSYNC | FDSYNC)) && (zp->z_sync_cnt == 0) && 515219089Spjd (fsync_cnt == 0)) 516185029Spjd itx->itx_sync = B_FALSE; 517185029Spjd 518219089Spjd zil_itx_assign(zilog, itx, tx); 519185029Spjd 520185029Spjd off += len; 521185029Spjd resid -= len; 522185029Spjd } 523168404Spjd} 524168404Spjd 525168404Spjd/* 526251631Sdelphij * Handles TX_TRUNCATE transactions. 527168404Spjd */ 528168404Spjdvoid 529168404Spjdzfs_log_truncate(zilog_t *zilog, dmu_tx_t *tx, int txtype, 530290765Smav znode_t *zp, uint64_t off, uint64_t len) 531168404Spjd{ 532168404Spjd itx_t *itx; 533168404Spjd lr_truncate_t *lr; 534168404Spjd 535219089Spjd if (zil_replaying(zilog, tx) || zp->z_unlinked) 536168404Spjd return; 537168404Spjd 538168404Spjd itx = zil_itx_create(txtype, sizeof (*lr)); 539168404Spjd lr = (lr_truncate_t *)&itx->itx_lr; 540168404Spjd lr->lr_foid = zp->z_id; 541168404Spjd lr->lr_offset = off; 542168404Spjd lr->lr_length = len; 543168404Spjd 544168404Spjd itx->itx_sync = (zp->z_sync_cnt != 0); 545219089Spjd zil_itx_assign(zilog, itx, tx); 546168404Spjd} 547168404Spjd 548168404Spjd/* 549251631Sdelphij * Handles TX_SETATTR transactions. 550168404Spjd */ 551168404Spjdvoid 552168404Spjdzfs_log_setattr(zilog_t *zilog, dmu_tx_t *tx, int txtype, 553290765Smav znode_t *zp, vattr_t *vap, uint_t mask_applied, zfs_fuid_info_t *fuidp) 554168404Spjd{ 555185029Spjd itx_t *itx; 556185029Spjd lr_setattr_t *lr; 557185029Spjd xvattr_t *xvap = (xvattr_t *)vap; 558185029Spjd size_t recsize = sizeof (lr_setattr_t); 559185029Spjd void *start; 560168404Spjd 561219089Spjd if (zil_replaying(zilog, tx) || zp->z_unlinked) 562168404Spjd return; 563168404Spjd 564185029Spjd /* 565185029Spjd * If XVATTR set, then log record size needs to allow 566185029Spjd * for lr_attr_t + xvattr mask, mapsize and create time 567185029Spjd * plus actual attribute values 568185029Spjd */ 569185029Spjd if (vap->va_mask & AT_XVATTR) 570185029Spjd recsize = sizeof (*lr) + ZIL_XVAT_SIZE(xvap->xva_mapsize); 571185029Spjd 572185029Spjd if (fuidp) 573185029Spjd recsize += fuidp->z_domain_str_sz; 574185029Spjd 575185029Spjd itx = zil_itx_create(txtype, recsize); 576168404Spjd lr = (lr_setattr_t *)&itx->itx_lr; 577168404Spjd lr->lr_foid = zp->z_id; 578168404Spjd lr->lr_mask = (uint64_t)mask_applied; 579168404Spjd lr->lr_mode = (uint64_t)vap->va_mode; 580185029Spjd if ((mask_applied & AT_UID) && IS_EPHEMERAL(vap->va_uid)) 581185029Spjd lr->lr_uid = fuidp->z_fuid_owner; 582185029Spjd else 583185029Spjd lr->lr_uid = (uint64_t)vap->va_uid; 584185029Spjd 585185029Spjd if ((mask_applied & AT_GID) && IS_EPHEMERAL(vap->va_gid)) 586185029Spjd lr->lr_gid = fuidp->z_fuid_group; 587185029Spjd else 588185029Spjd lr->lr_gid = (uint64_t)vap->va_gid; 589185029Spjd 590168404Spjd lr->lr_size = (uint64_t)vap->va_size; 591168404Spjd ZFS_TIME_ENCODE(&vap->va_atime, lr->lr_atime); 592168404Spjd ZFS_TIME_ENCODE(&vap->va_mtime, lr->lr_mtime); 593185029Spjd start = (lr_setattr_t *)(lr + 1); 594185029Spjd if (vap->va_mask & AT_XVATTR) { 595185029Spjd zfs_log_xvattr((lr_attr_t *)start, xvap); 596185029Spjd start = (caddr_t)start + ZIL_XVAT_SIZE(xvap->xva_mapsize); 597185029Spjd } 598168404Spjd 599185029Spjd /* 600185029Spjd * Now stick on domain information if any on end 601185029Spjd */ 602185029Spjd 603185029Spjd if (fuidp) 604185029Spjd (void) zfs_log_fuid_domains(fuidp, start); 605185029Spjd 606168404Spjd itx->itx_sync = (zp->z_sync_cnt != 0); 607219089Spjd zil_itx_assign(zilog, itx, tx); 608168404Spjd} 609168404Spjd 610168404Spjd/* 611251631Sdelphij * Handles TX_ACL transactions. 612168404Spjd */ 613168404Spjdvoid 614185029Spjdzfs_log_acl(zilog_t *zilog, dmu_tx_t *tx, znode_t *zp, 615185029Spjd vsecattr_t *vsecp, zfs_fuid_info_t *fuidp) 616168404Spjd{ 617168404Spjd itx_t *itx; 618185029Spjd lr_acl_v0_t *lrv0; 619168404Spjd lr_acl_t *lr; 620185029Spjd int txtype; 621185029Spjd int lrsize; 622185029Spjd size_t txsize; 623185029Spjd size_t aclbytes = vsecp->vsa_aclentsz; 624168404Spjd 625219089Spjd if (zil_replaying(zilog, tx) || zp->z_unlinked) 626168404Spjd return; 627168404Spjd 628185029Spjd txtype = (zp->z_zfsvfs->z_version < ZPL_VERSION_FUID) ? 629185029Spjd TX_ACL_V0 : TX_ACL; 630185029Spjd 631185029Spjd if (txtype == TX_ACL) 632185029Spjd lrsize = sizeof (*lr); 633185029Spjd else 634185029Spjd lrsize = sizeof (*lrv0); 635185029Spjd 636185029Spjd txsize = lrsize + 637185029Spjd ((txtype == TX_ACL) ? ZIL_ACE_LENGTH(aclbytes) : aclbytes) + 638185029Spjd (fuidp ? fuidp->z_domain_str_sz : 0) + 639185029Spjd sizeof (uint64_t) * (fuidp ? fuidp->z_fuid_cnt : 0); 640185029Spjd 641185029Spjd itx = zil_itx_create(txtype, txsize); 642185029Spjd 643168404Spjd lr = (lr_acl_t *)&itx->itx_lr; 644168404Spjd lr->lr_foid = zp->z_id; 645185029Spjd if (txtype == TX_ACL) { 646185029Spjd lr->lr_acl_bytes = aclbytes; 647185029Spjd lr->lr_domcnt = fuidp ? fuidp->z_domain_cnt : 0; 648185029Spjd lr->lr_fuidcnt = fuidp ? fuidp->z_fuid_cnt : 0; 649185029Spjd if (vsecp->vsa_mask & VSA_ACE_ACLFLAGS) 650185029Spjd lr->lr_acl_flags = (uint64_t)vsecp->vsa_aclflags; 651185029Spjd else 652185029Spjd lr->lr_acl_flags = 0; 653185029Spjd } 654185029Spjd lr->lr_aclcnt = (uint64_t)vsecp->vsa_aclcnt; 655168404Spjd 656185029Spjd if (txtype == TX_ACL_V0) { 657185029Spjd lrv0 = (lr_acl_v0_t *)lr; 658185029Spjd bcopy(vsecp->vsa_aclentp, (ace_t *)(lrv0 + 1), aclbytes); 659185029Spjd } else { 660185029Spjd void *start = (ace_t *)(lr + 1); 661185029Spjd 662185029Spjd bcopy(vsecp->vsa_aclentp, start, aclbytes); 663185029Spjd 664185029Spjd start = (caddr_t)start + ZIL_ACE_LENGTH(aclbytes); 665185029Spjd 666185029Spjd if (fuidp) { 667185029Spjd start = zfs_log_fuid_ids(fuidp, start); 668185029Spjd (void) zfs_log_fuid_domains(fuidp, start); 669185029Spjd } 670185029Spjd } 671185029Spjd 672168404Spjd itx->itx_sync = (zp->z_sync_cnt != 0); 673219089Spjd zil_itx_assign(zilog, itx, tx); 674168404Spjd} 675