1*7a7741afSMartin Matuska /* 2*7a7741afSMartin Matuska * CDDL HEADER START 3*7a7741afSMartin Matuska * 4*7a7741afSMartin Matuska * The contents of this file are subject to the terms of the 5*7a7741afSMartin Matuska * Common Development and Distribution License (the "License"). 6*7a7741afSMartin Matuska * You may not use this file except in compliance with the License. 7*7a7741afSMartin Matuska * 8*7a7741afSMartin Matuska * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE 9*7a7741afSMartin Matuska * or https://opensource.org/licenses/CDDL-1.0. 10*7a7741afSMartin Matuska * See the License for the specific language governing permissions 11*7a7741afSMartin Matuska * and limitations under the License. 12*7a7741afSMartin Matuska * 13*7a7741afSMartin Matuska * When distributing Covered Code, include this CDDL HEADER in each 14*7a7741afSMartin Matuska * file and include the License file at usr/src/OPENSOLARIS.LICENSE. 15*7a7741afSMartin Matuska * If applicable, add the following below this CDDL HEADER, with the 16*7a7741afSMartin Matuska * fields enclosed by brackets "[]" replaced with your own identifying 17*7a7741afSMartin Matuska * information: Portions Copyright [yyyy] [name of copyright owner] 18*7a7741afSMartin Matuska * 19*7a7741afSMartin Matuska * CDDL HEADER END 20*7a7741afSMartin Matuska */ 21*7a7741afSMartin Matuska /* 22*7a7741afSMartin Matuska * Copyright (c) 2005, 2010, Oracle and/or its affiliates. All rights reserved. 23*7a7741afSMartin Matuska * Copyright (c) 2012, 2014 by Delphix. All rights reserved. 24*7a7741afSMartin Matuska * Copyright (c) 2014 Integros [integros.com] 25*7a7741afSMartin Matuska */ 26*7a7741afSMartin Matuska 27*7a7741afSMartin Matuska /* Portions Copyright 2007 Jeremy Teo */ 28*7a7741afSMartin Matuska /* Portions Copyright 2011 Martin Matuska <mm@FreeBSD.org> */ 29*7a7741afSMartin Matuska 30*7a7741afSMartin Matuska #include <sys/types.h> 31*7a7741afSMartin Matuska #include <sys/param.h> 32*7a7741afSMartin Matuska #include <sys/time.h> 33*7a7741afSMartin Matuska #include <sys/systm.h> 34*7a7741afSMartin Matuska #include <sys/sysmacros.h> 35*7a7741afSMartin Matuska #include <sys/resource.h> 36*7a7741afSMartin Matuska #include <sys/resourcevar.h> 37*7a7741afSMartin Matuska #include <sys/mntent.h> 38*7a7741afSMartin Matuska #include <sys/u8_textprep.h> 39*7a7741afSMartin Matuska #include <sys/dsl_dataset.h> 40*7a7741afSMartin Matuska #include <sys/vfs.h> 41*7a7741afSMartin Matuska #include <sys/vnode.h> 42*7a7741afSMartin Matuska #include <sys/file.h> 43*7a7741afSMartin Matuska #include <sys/kmem.h> 44*7a7741afSMartin Matuska #include <sys/errno.h> 45*7a7741afSMartin Matuska #include <sys/unistd.h> 46*7a7741afSMartin Matuska #include <sys/atomic.h> 47*7a7741afSMartin Matuska #include <sys/zfs_dir.h> 48*7a7741afSMartin Matuska #include <sys/zfs_acl.h> 49*7a7741afSMartin Matuska #include <sys/zfs_ioctl.h> 50*7a7741afSMartin Matuska #include <sys/zfs_rlock.h> 51*7a7741afSMartin Matuska #include <sys/zfs_fuid.h> 52*7a7741afSMartin Matuska #include <sys/dnode.h> 53*7a7741afSMartin Matuska #include <sys/fs/zfs.h> 54*7a7741afSMartin Matuska #include <sys/dmu.h> 55*7a7741afSMartin Matuska #include <sys/dmu_objset.h> 56*7a7741afSMartin Matuska #include <sys/dmu_tx.h> 57*7a7741afSMartin Matuska #include <sys/zfs_refcount.h> 58*7a7741afSMartin Matuska #include <sys/stat.h> 59*7a7741afSMartin Matuska #include <sys/zap.h> 60*7a7741afSMartin Matuska #include <sys/zfs_znode.h> 61*7a7741afSMartin Matuska #include <sys/sa.h> 62*7a7741afSMartin Matuska #include <sys/zfs_sa.h> 63*7a7741afSMartin Matuska #include <sys/zfs_stat.h> 64*7a7741afSMartin Matuska 65*7a7741afSMartin Matuska #include "zfs_prop.h" 66*7a7741afSMartin Matuska #include "zfs_comutil.h" 67*7a7741afSMartin Matuska 68*7a7741afSMartin Matuska /* Used by fstat(1). */ 69*7a7741afSMartin Matuska SYSCTL_INT(_debug_sizeof, OID_AUTO, znode, CTLFLAG_RD, 70*7a7741afSMartin Matuska SYSCTL_NULL_INT_PTR, sizeof (znode_t), "sizeof(znode_t)"); 71*7a7741afSMartin Matuska 72*7a7741afSMartin Matuska /* 73*7a7741afSMartin Matuska * Define ZNODE_STATS to turn on statistic gathering. By default, it is only 74*7a7741afSMartin Matuska * turned on when DEBUG is also defined. 75*7a7741afSMartin Matuska */ 76*7a7741afSMartin Matuska #ifdef ZFS_DEBUG 77*7a7741afSMartin Matuska #define ZNODE_STATS 78*7a7741afSMartin Matuska #endif /* DEBUG */ 79*7a7741afSMartin Matuska 80*7a7741afSMartin Matuska #ifdef ZNODE_STATS 81*7a7741afSMartin Matuska #define ZNODE_STAT_ADD(stat) ((stat)++) 82*7a7741afSMartin Matuska #else 83*7a7741afSMartin Matuska #define ZNODE_STAT_ADD(stat) /* nothing */ 84*7a7741afSMartin Matuska #endif /* ZNODE_STATS */ 85*7a7741afSMartin Matuska 86*7a7741afSMartin Matuska #if !defined(KMEM_DEBUG) 87*7a7741afSMartin Matuska #define _ZFS_USE_SMR 88*7a7741afSMartin Matuska static uma_zone_t znode_uma_zone; 89*7a7741afSMartin Matuska #else 90*7a7741afSMartin Matuska static kmem_cache_t *znode_cache = NULL; 91*7a7741afSMartin Matuska #endif 92*7a7741afSMartin Matuska 93*7a7741afSMartin Matuska extern struct vop_vector zfs_vnodeops; 94*7a7741afSMartin Matuska extern struct vop_vector zfs_fifoops; 95*7a7741afSMartin Matuska extern struct vop_vector zfs_shareops; 96*7a7741afSMartin Matuska 97*7a7741afSMartin Matuska 98*7a7741afSMartin Matuska /* 99*7a7741afSMartin Matuska * This callback is invoked when acquiring a RL_WRITER or RL_APPEND lock on 100*7a7741afSMartin Matuska * z_rangelock. It will modify the offset and length of the lock to reflect 101*7a7741afSMartin Matuska * znode-specific information, and convert RL_APPEND to RL_WRITER. This is 102*7a7741afSMartin Matuska * called with the rangelock_t's rl_lock held, which avoids races. 103*7a7741afSMartin Matuska */ 104*7a7741afSMartin Matuska static void 105*7a7741afSMartin Matuska zfs_rangelock_cb(zfs_locked_range_t *new, void *arg) 106*7a7741afSMartin Matuska { 107*7a7741afSMartin Matuska znode_t *zp = arg; 108*7a7741afSMartin Matuska 109*7a7741afSMartin Matuska /* 110*7a7741afSMartin Matuska * If in append mode, convert to writer and lock starting at the 111*7a7741afSMartin Matuska * current end of file. 112*7a7741afSMartin Matuska */ 113*7a7741afSMartin Matuska if (new->lr_type == RL_APPEND) { 114*7a7741afSMartin Matuska new->lr_offset = zp->z_size; 115*7a7741afSMartin Matuska new->lr_type = RL_WRITER; 116*7a7741afSMartin Matuska } 117*7a7741afSMartin Matuska 118*7a7741afSMartin Matuska /* 119*7a7741afSMartin Matuska * If we need to grow the block size then lock the whole file range. 120*7a7741afSMartin Matuska */ 121*7a7741afSMartin Matuska uint64_t end_size = MAX(zp->z_size, new->lr_offset + new->lr_length); 122*7a7741afSMartin Matuska if (end_size > zp->z_blksz && (!ISP2(zp->z_blksz) || 123*7a7741afSMartin Matuska zp->z_blksz < ZTOZSB(zp)->z_max_blksz)) { 124*7a7741afSMartin Matuska new->lr_offset = 0; 125*7a7741afSMartin Matuska new->lr_length = UINT64_MAX; 126*7a7741afSMartin Matuska } 127*7a7741afSMartin Matuska } 128*7a7741afSMartin Matuska 129*7a7741afSMartin Matuska static int 130*7a7741afSMartin Matuska zfs_znode_cache_constructor(void *buf, void *arg, int kmflags) 131*7a7741afSMartin Matuska { 132*7a7741afSMartin Matuska znode_t *zp = buf; 133*7a7741afSMartin Matuska 134*7a7741afSMartin Matuska POINTER_INVALIDATE(&zp->z_zfsvfs); 135*7a7741afSMartin Matuska 136*7a7741afSMartin Matuska list_link_init(&zp->z_link_node); 137*7a7741afSMartin Matuska 138*7a7741afSMartin Matuska mutex_init(&zp->z_lock, NULL, MUTEX_DEFAULT, NULL); 139*7a7741afSMartin Matuska mutex_init(&zp->z_acl_lock, NULL, MUTEX_DEFAULT, NULL); 140*7a7741afSMartin Matuska rw_init(&zp->z_xattr_lock, NULL, RW_DEFAULT, NULL); 141*7a7741afSMartin Matuska 142*7a7741afSMartin Matuska zfs_rangelock_init(&zp->z_rangelock, zfs_rangelock_cb, zp); 143*7a7741afSMartin Matuska 144*7a7741afSMartin Matuska zp->z_acl_cached = NULL; 145*7a7741afSMartin Matuska zp->z_xattr_cached = NULL; 146*7a7741afSMartin Matuska zp->z_xattr_parent = 0; 147*7a7741afSMartin Matuska zp->z_vnode = NULL; 148*7a7741afSMartin Matuska zp->z_sync_writes_cnt = 0; 149*7a7741afSMartin Matuska zp->z_async_writes_cnt = 0; 150*7a7741afSMartin Matuska 151*7a7741afSMartin Matuska return (0); 152*7a7741afSMartin Matuska } 153*7a7741afSMartin Matuska 154*7a7741afSMartin Matuska static void 155*7a7741afSMartin Matuska zfs_znode_cache_destructor(void *buf, void *arg) 156*7a7741afSMartin Matuska { 157*7a7741afSMartin Matuska (void) arg; 158*7a7741afSMartin Matuska znode_t *zp = buf; 159*7a7741afSMartin Matuska 160*7a7741afSMartin Matuska ASSERT(!POINTER_IS_VALID(zp->z_zfsvfs)); 161*7a7741afSMartin Matuska ASSERT3P(zp->z_vnode, ==, NULL); 162*7a7741afSMartin Matuska ASSERT(!list_link_active(&zp->z_link_node)); 163*7a7741afSMartin Matuska mutex_destroy(&zp->z_lock); 164*7a7741afSMartin Matuska mutex_destroy(&zp->z_acl_lock); 165*7a7741afSMartin Matuska rw_destroy(&zp->z_xattr_lock); 166*7a7741afSMartin Matuska zfs_rangelock_fini(&zp->z_rangelock); 167*7a7741afSMartin Matuska 168*7a7741afSMartin Matuska ASSERT3P(zp->z_acl_cached, ==, NULL); 169*7a7741afSMartin Matuska ASSERT3P(zp->z_xattr_cached, ==, NULL); 170*7a7741afSMartin Matuska 171*7a7741afSMartin Matuska ASSERT0(atomic_load_32(&zp->z_sync_writes_cnt)); 172*7a7741afSMartin Matuska ASSERT0(atomic_load_32(&zp->z_async_writes_cnt)); 173*7a7741afSMartin Matuska } 174*7a7741afSMartin Matuska 175*7a7741afSMartin Matuska 176*7a7741afSMartin Matuska #ifdef _ZFS_USE_SMR 177*7a7741afSMartin Matuska VFS_SMR_DECLARE; 178*7a7741afSMartin Matuska 179*7a7741afSMartin Matuska static int 180*7a7741afSMartin Matuska zfs_znode_cache_constructor_smr(void *mem, int size __unused, void *private, 181*7a7741afSMartin Matuska int flags) 182*7a7741afSMartin Matuska { 183*7a7741afSMartin Matuska return (zfs_znode_cache_constructor(mem, private, flags)); 184*7a7741afSMartin Matuska } 185*7a7741afSMartin Matuska 186*7a7741afSMartin Matuska static void 187*7a7741afSMartin Matuska zfs_znode_cache_destructor_smr(void *mem, int size __unused, void *private) 188*7a7741afSMartin Matuska { 189*7a7741afSMartin Matuska zfs_znode_cache_destructor(mem, private); 190*7a7741afSMartin Matuska } 191*7a7741afSMartin Matuska 192*7a7741afSMartin Matuska void 193*7a7741afSMartin Matuska zfs_znode_init(void) 194*7a7741afSMartin Matuska { 195*7a7741afSMartin Matuska /* 196*7a7741afSMartin Matuska * Initialize zcache 197*7a7741afSMartin Matuska */ 198*7a7741afSMartin Matuska ASSERT3P(znode_uma_zone, ==, NULL); 199*7a7741afSMartin Matuska znode_uma_zone = uma_zcreate("zfs_znode_cache", 200*7a7741afSMartin Matuska sizeof (znode_t), zfs_znode_cache_constructor_smr, 201*7a7741afSMartin Matuska zfs_znode_cache_destructor_smr, NULL, NULL, 0, 0); 202*7a7741afSMartin Matuska VFS_SMR_ZONE_SET(znode_uma_zone); 203*7a7741afSMartin Matuska } 204*7a7741afSMartin Matuska 205*7a7741afSMartin Matuska static znode_t * 206*7a7741afSMartin Matuska zfs_znode_alloc_kmem(int flags) 207*7a7741afSMartin Matuska { 208*7a7741afSMartin Matuska return (uma_zalloc_smr(znode_uma_zone, flags)); 209*7a7741afSMartin Matuska } 210*7a7741afSMartin Matuska 211*7a7741afSMartin Matuska static void 212*7a7741afSMartin Matuska zfs_znode_free_kmem(znode_t *zp) 213*7a7741afSMartin Matuska { 214*7a7741afSMartin Matuska if (zp->z_xattr_cached) { 215*7a7741afSMartin Matuska nvlist_free(zp->z_xattr_cached); 216*7a7741afSMartin Matuska zp->z_xattr_cached = NULL; 217*7a7741afSMartin Matuska } 218*7a7741afSMartin Matuska uma_zfree_smr(znode_uma_zone, zp); 219*7a7741afSMartin Matuska } 220*7a7741afSMartin Matuska #else 221*7a7741afSMartin Matuska void 222*7a7741afSMartin Matuska zfs_znode_init(void) 223*7a7741afSMartin Matuska { 224*7a7741afSMartin Matuska /* 225*7a7741afSMartin Matuska * Initialize zcache 226*7a7741afSMartin Matuska */ 227*7a7741afSMartin Matuska ASSERT3P(znode_cache, ==, NULL); 228*7a7741afSMartin Matuska znode_cache = kmem_cache_create("zfs_znode_cache", 229*7a7741afSMartin Matuska sizeof (znode_t), 0, zfs_znode_cache_constructor, 230*7a7741afSMartin Matuska zfs_znode_cache_destructor, NULL, NULL, NULL, KMC_RECLAIMABLE); 231*7a7741afSMartin Matuska } 232*7a7741afSMartin Matuska 233*7a7741afSMartin Matuska static znode_t * 234*7a7741afSMartin Matuska zfs_znode_alloc_kmem(int flags) 235*7a7741afSMartin Matuska { 236*7a7741afSMartin Matuska return (kmem_cache_alloc(znode_cache, flags)); 237*7a7741afSMartin Matuska } 238*7a7741afSMartin Matuska 239*7a7741afSMartin Matuska static void 240*7a7741afSMartin Matuska zfs_znode_free_kmem(znode_t *zp) 241*7a7741afSMartin Matuska { 242*7a7741afSMartin Matuska if (zp->z_xattr_cached) { 243*7a7741afSMartin Matuska nvlist_free(zp->z_xattr_cached); 244*7a7741afSMartin Matuska zp->z_xattr_cached = NULL; 245*7a7741afSMartin Matuska } 246*7a7741afSMartin Matuska kmem_cache_free(znode_cache, zp); 247*7a7741afSMartin Matuska } 248*7a7741afSMartin Matuska #endif 249*7a7741afSMartin Matuska 250*7a7741afSMartin Matuska void 251*7a7741afSMartin Matuska zfs_znode_fini(void) 252*7a7741afSMartin Matuska { 253*7a7741afSMartin Matuska /* 254*7a7741afSMartin Matuska * Cleanup zcache 255*7a7741afSMartin Matuska */ 256*7a7741afSMartin Matuska #ifdef _ZFS_USE_SMR 257*7a7741afSMartin Matuska if (znode_uma_zone) { 258*7a7741afSMartin Matuska uma_zdestroy(znode_uma_zone); 259*7a7741afSMartin Matuska znode_uma_zone = NULL; 260*7a7741afSMartin Matuska } 261*7a7741afSMartin Matuska #else 262*7a7741afSMartin Matuska if (znode_cache) { 263*7a7741afSMartin Matuska kmem_cache_destroy(znode_cache); 264*7a7741afSMartin Matuska znode_cache = NULL; 265*7a7741afSMartin Matuska } 266*7a7741afSMartin Matuska #endif 267*7a7741afSMartin Matuska } 268*7a7741afSMartin Matuska 269*7a7741afSMartin Matuska 270*7a7741afSMartin Matuska static int 271*7a7741afSMartin Matuska zfs_create_share_dir(zfsvfs_t *zfsvfs, dmu_tx_t *tx) 272*7a7741afSMartin Matuska { 273*7a7741afSMartin Matuska zfs_acl_ids_t acl_ids; 274*7a7741afSMartin Matuska vattr_t vattr; 275*7a7741afSMartin Matuska znode_t *sharezp; 276*7a7741afSMartin Matuska znode_t *zp; 277*7a7741afSMartin Matuska int error; 278*7a7741afSMartin Matuska 279*7a7741afSMartin Matuska vattr.va_mask = AT_MODE|AT_UID|AT_GID; 280*7a7741afSMartin Matuska vattr.va_type = VDIR; 281*7a7741afSMartin Matuska vattr.va_mode = S_IFDIR|0555; 282*7a7741afSMartin Matuska vattr.va_uid = crgetuid(kcred); 283*7a7741afSMartin Matuska vattr.va_gid = crgetgid(kcred); 284*7a7741afSMartin Matuska 285*7a7741afSMartin Matuska sharezp = zfs_znode_alloc_kmem(KM_SLEEP); 286*7a7741afSMartin Matuska ASSERT(!POINTER_IS_VALID(sharezp->z_zfsvfs)); 287*7a7741afSMartin Matuska sharezp->z_unlinked = 0; 288*7a7741afSMartin Matuska sharezp->z_atime_dirty = 0; 289*7a7741afSMartin Matuska sharezp->z_zfsvfs = zfsvfs; 290*7a7741afSMartin Matuska sharezp->z_is_sa = zfsvfs->z_use_sa; 291*7a7741afSMartin Matuska 292*7a7741afSMartin Matuska VERIFY0(zfs_acl_ids_create(sharezp, IS_ROOT_NODE, &vattr, 293*7a7741afSMartin Matuska kcred, NULL, &acl_ids, NULL)); 294*7a7741afSMartin Matuska zfs_mknode(sharezp, &vattr, tx, kcred, IS_ROOT_NODE, &zp, &acl_ids); 295*7a7741afSMartin Matuska ASSERT3P(zp, ==, sharezp); 296*7a7741afSMartin Matuska POINTER_INVALIDATE(&sharezp->z_zfsvfs); 297*7a7741afSMartin Matuska error = zap_add(zfsvfs->z_os, MASTER_NODE_OBJ, 298*7a7741afSMartin Matuska ZFS_SHARES_DIR, 8, 1, &sharezp->z_id, tx); 299*7a7741afSMartin Matuska zfsvfs->z_shares_dir = sharezp->z_id; 300*7a7741afSMartin Matuska 301*7a7741afSMartin Matuska zfs_acl_ids_free(&acl_ids); 302*7a7741afSMartin Matuska sa_handle_destroy(sharezp->z_sa_hdl); 303*7a7741afSMartin Matuska zfs_znode_free_kmem(sharezp); 304*7a7741afSMartin Matuska 305*7a7741afSMartin Matuska return (error); 306*7a7741afSMartin Matuska } 307*7a7741afSMartin Matuska 308*7a7741afSMartin Matuska /* 309*7a7741afSMartin Matuska * define a couple of values we need available 310*7a7741afSMartin Matuska * for both 64 and 32 bit environments. 311*7a7741afSMartin Matuska */ 312*7a7741afSMartin Matuska #ifndef NBITSMINOR64 313*7a7741afSMartin Matuska #define NBITSMINOR64 32 314*7a7741afSMartin Matuska #endif 315*7a7741afSMartin Matuska #ifndef MAXMAJ64 316*7a7741afSMartin Matuska #define MAXMAJ64 0xffffffffUL 317*7a7741afSMartin Matuska #endif 318*7a7741afSMartin Matuska #ifndef MAXMIN64 319*7a7741afSMartin Matuska #define MAXMIN64 0xffffffffUL 320*7a7741afSMartin Matuska #endif 321*7a7741afSMartin Matuska 322*7a7741afSMartin Matuska /* 323*7a7741afSMartin Matuska * Create special expldev for ZFS private use. 324*7a7741afSMartin Matuska * Can't use standard expldev since it doesn't do 325*7a7741afSMartin Matuska * what we want. The standard expldev() takes a 326*7a7741afSMartin Matuska * dev32_t in LP64 and expands it to a long dev_t. 327*7a7741afSMartin Matuska * We need an interface that takes a dev32_t in ILP32 328*7a7741afSMartin Matuska * and expands it to a long dev_t. 329*7a7741afSMartin Matuska */ 330*7a7741afSMartin Matuska static uint64_t 331*7a7741afSMartin Matuska zfs_expldev(dev_t dev) 332*7a7741afSMartin Matuska { 333*7a7741afSMartin Matuska return (((uint64_t)major(dev) << NBITSMINOR64) | minor(dev)); 334*7a7741afSMartin Matuska } 335*7a7741afSMartin Matuska /* 336*7a7741afSMartin Matuska * Special cmpldev for ZFS private use. 337*7a7741afSMartin Matuska * Can't use standard cmpldev since it takes 338*7a7741afSMartin Matuska * a long dev_t and compresses it to dev32_t in 339*7a7741afSMartin Matuska * LP64. We need to do a compaction of a long dev_t 340*7a7741afSMartin Matuska * to a dev32_t in ILP32. 341*7a7741afSMartin Matuska */ 342*7a7741afSMartin Matuska dev_t 343*7a7741afSMartin Matuska zfs_cmpldev(uint64_t dev) 344*7a7741afSMartin Matuska { 345*7a7741afSMartin Matuska return (makedev((dev >> NBITSMINOR64), (dev & MAXMIN64))); 346*7a7741afSMartin Matuska } 347*7a7741afSMartin Matuska 348*7a7741afSMartin Matuska static void 349*7a7741afSMartin Matuska zfs_znode_sa_init(zfsvfs_t *zfsvfs, znode_t *zp, 350*7a7741afSMartin Matuska dmu_buf_t *db, dmu_object_type_t obj_type, sa_handle_t *sa_hdl) 351*7a7741afSMartin Matuska { 352*7a7741afSMartin Matuska ASSERT(!POINTER_IS_VALID(zp->z_zfsvfs) || (zfsvfs == zp->z_zfsvfs)); 353*7a7741afSMartin Matuska ASSERT(MUTEX_HELD(ZFS_OBJ_MUTEX(zfsvfs, zp->z_id))); 354*7a7741afSMartin Matuska 355*7a7741afSMartin Matuska ASSERT3P(zp->z_sa_hdl, ==, NULL); 356*7a7741afSMartin Matuska ASSERT3P(zp->z_acl_cached, ==, NULL); 357*7a7741afSMartin Matuska if (sa_hdl == NULL) { 358*7a7741afSMartin Matuska VERIFY0(sa_handle_get_from_db(zfsvfs->z_os, db, zp, 359*7a7741afSMartin Matuska SA_HDL_SHARED, &zp->z_sa_hdl)); 360*7a7741afSMartin Matuska } else { 361*7a7741afSMartin Matuska zp->z_sa_hdl = sa_hdl; 362*7a7741afSMartin Matuska sa_set_userp(sa_hdl, zp); 363*7a7741afSMartin Matuska } 364*7a7741afSMartin Matuska 365*7a7741afSMartin Matuska zp->z_is_sa = (obj_type == DMU_OT_SA) ? B_TRUE : B_FALSE; 366*7a7741afSMartin Matuska 367*7a7741afSMartin Matuska /* 368*7a7741afSMartin Matuska * Slap on VROOT if we are the root znode unless we are the root 369*7a7741afSMartin Matuska * node of a snapshot mounted under .zfs. 370*7a7741afSMartin Matuska */ 371*7a7741afSMartin Matuska if (zp->z_id == zfsvfs->z_root && zfsvfs->z_parent == zfsvfs) 372*7a7741afSMartin Matuska ZTOV(zp)->v_flag |= VROOT; 373*7a7741afSMartin Matuska } 374*7a7741afSMartin Matuska 375*7a7741afSMartin Matuska void 376*7a7741afSMartin Matuska zfs_znode_dmu_fini(znode_t *zp) 377*7a7741afSMartin Matuska { 378*7a7741afSMartin Matuska ASSERT(MUTEX_HELD(ZFS_OBJ_MUTEX(zp->z_zfsvfs, zp->z_id)) || 379*7a7741afSMartin Matuska ZFS_TEARDOWN_INACTIVE_WRITE_HELD(zp->z_zfsvfs)); 380*7a7741afSMartin Matuska 381*7a7741afSMartin Matuska sa_handle_destroy(zp->z_sa_hdl); 382*7a7741afSMartin Matuska zp->z_sa_hdl = NULL; 383*7a7741afSMartin Matuska } 384*7a7741afSMartin Matuska 385*7a7741afSMartin Matuska static void 386*7a7741afSMartin Matuska zfs_vnode_forget(vnode_t *vp) 387*7a7741afSMartin Matuska { 388*7a7741afSMartin Matuska 389*7a7741afSMartin Matuska /* copied from insmntque_stddtr */ 390*7a7741afSMartin Matuska vp->v_data = NULL; 391*7a7741afSMartin Matuska vp->v_op = &dead_vnodeops; 392*7a7741afSMartin Matuska vgone(vp); 393*7a7741afSMartin Matuska vput(vp); 394*7a7741afSMartin Matuska } 395*7a7741afSMartin Matuska 396*7a7741afSMartin Matuska /* 397*7a7741afSMartin Matuska * Construct a new znode/vnode and initialize. 398*7a7741afSMartin Matuska * 399*7a7741afSMartin Matuska * This does not do a call to dmu_set_user() that is 400*7a7741afSMartin Matuska * up to the caller to do, in case you don't want to 401*7a7741afSMartin Matuska * return the znode 402*7a7741afSMartin Matuska */ 403*7a7741afSMartin Matuska static znode_t * 404*7a7741afSMartin Matuska zfs_znode_alloc(zfsvfs_t *zfsvfs, dmu_buf_t *db, int blksz, 405*7a7741afSMartin Matuska dmu_object_type_t obj_type, sa_handle_t *hdl) 406*7a7741afSMartin Matuska { 407*7a7741afSMartin Matuska znode_t *zp; 408*7a7741afSMartin Matuska vnode_t *vp; 409*7a7741afSMartin Matuska uint64_t mode; 410*7a7741afSMartin Matuska uint64_t parent; 411*7a7741afSMartin Matuska #ifdef notyet 412*7a7741afSMartin Matuska uint64_t mtime[2], ctime[2]; 413*7a7741afSMartin Matuska #endif 414*7a7741afSMartin Matuska uint64_t projid = ZFS_DEFAULT_PROJID; 415*7a7741afSMartin Matuska sa_bulk_attr_t bulk[9]; 416*7a7741afSMartin Matuska int count = 0; 417*7a7741afSMartin Matuska int error; 418*7a7741afSMartin Matuska 419*7a7741afSMartin Matuska zp = zfs_znode_alloc_kmem(KM_SLEEP); 420*7a7741afSMartin Matuska 421*7a7741afSMartin Matuska #ifndef _ZFS_USE_SMR 422*7a7741afSMartin Matuska KASSERT((zfsvfs->z_parent->z_vfs->mnt_kern_flag & MNTK_FPLOOKUP) == 0, 423*7a7741afSMartin Matuska ("%s: fast path lookup enabled without smr", __func__)); 424*7a7741afSMartin Matuska #endif 425*7a7741afSMartin Matuska 426*7a7741afSMartin Matuska KASSERT(curthread->td_vp_reserved != NULL, 427*7a7741afSMartin Matuska ("zfs_znode_alloc: getnewvnode without any vnodes reserved")); 428*7a7741afSMartin Matuska error = getnewvnode("zfs", zfsvfs->z_parent->z_vfs, &zfs_vnodeops, &vp); 429*7a7741afSMartin Matuska if (error != 0) { 430*7a7741afSMartin Matuska zfs_znode_free_kmem(zp); 431*7a7741afSMartin Matuska return (NULL); 432*7a7741afSMartin Matuska } 433*7a7741afSMartin Matuska zp->z_vnode = vp; 434*7a7741afSMartin Matuska vp->v_data = zp; 435*7a7741afSMartin Matuska 436*7a7741afSMartin Matuska /* 437*7a7741afSMartin Matuska * Acquire the vnode lock before any possible interaction with the 438*7a7741afSMartin Matuska * outside world. Specifically, there is an error path that calls 439*7a7741afSMartin Matuska * zfs_vnode_forget() and the vnode should be exclusively locked. 440*7a7741afSMartin Matuska */ 441*7a7741afSMartin Matuska vn_lock(vp, LK_EXCLUSIVE | LK_RETRY); 442*7a7741afSMartin Matuska 443*7a7741afSMartin Matuska ASSERT(!POINTER_IS_VALID(zp->z_zfsvfs)); 444*7a7741afSMartin Matuska 445*7a7741afSMartin Matuska zp->z_sa_hdl = NULL; 446*7a7741afSMartin Matuska zp->z_unlinked = 0; 447*7a7741afSMartin Matuska zp->z_atime_dirty = 0; 448*7a7741afSMartin Matuska zp->z_mapcnt = 0; 449*7a7741afSMartin Matuska zp->z_id = db->db_object; 450*7a7741afSMartin Matuska zp->z_blksz = blksz; 451*7a7741afSMartin Matuska zp->z_seq = 0x7A4653; 452*7a7741afSMartin Matuska zp->z_sync_cnt = 0; 453*7a7741afSMartin Matuska zp->z_sync_writes_cnt = 0; 454*7a7741afSMartin Matuska zp->z_async_writes_cnt = 0; 455*7a7741afSMartin Matuska atomic_store_ptr(&zp->z_cached_symlink, NULL); 456*7a7741afSMartin Matuska 457*7a7741afSMartin Matuska zfs_znode_sa_init(zfsvfs, zp, db, obj_type, hdl); 458*7a7741afSMartin Matuska 459*7a7741afSMartin Matuska SA_ADD_BULK_ATTR(bulk, count, SA_ZPL_MODE(zfsvfs), NULL, &mode, 8); 460*7a7741afSMartin Matuska SA_ADD_BULK_ATTR(bulk, count, SA_ZPL_GEN(zfsvfs), NULL, &zp->z_gen, 8); 461*7a7741afSMartin Matuska SA_ADD_BULK_ATTR(bulk, count, SA_ZPL_SIZE(zfsvfs), NULL, 462*7a7741afSMartin Matuska &zp->z_size, 8); 463*7a7741afSMartin Matuska SA_ADD_BULK_ATTR(bulk, count, SA_ZPL_LINKS(zfsvfs), NULL, 464*7a7741afSMartin Matuska &zp->z_links, 8); 465*7a7741afSMartin Matuska SA_ADD_BULK_ATTR(bulk, count, SA_ZPL_FLAGS(zfsvfs), NULL, 466*7a7741afSMartin Matuska &zp->z_pflags, 8); 467*7a7741afSMartin Matuska SA_ADD_BULK_ATTR(bulk, count, SA_ZPL_PARENT(zfsvfs), NULL, &parent, 8); 468*7a7741afSMartin Matuska SA_ADD_BULK_ATTR(bulk, count, SA_ZPL_ATIME(zfsvfs), NULL, 469*7a7741afSMartin Matuska &zp->z_atime, 16); 470*7a7741afSMartin Matuska #ifdef notyet 471*7a7741afSMartin Matuska SA_ADD_BULK_ATTR(bulk, count, SA_ZPL_MTIME(zfsvfs), NULL, 472*7a7741afSMartin Matuska &mtime, 16); 473*7a7741afSMartin Matuska SA_ADD_BULK_ATTR(bulk, count, SA_ZPL_CTIME(zfsvfs), NULL, 474*7a7741afSMartin Matuska &ctime, 16); 475*7a7741afSMartin Matuska #endif 476*7a7741afSMartin Matuska SA_ADD_BULK_ATTR(bulk, count, SA_ZPL_UID(zfsvfs), NULL, 477*7a7741afSMartin Matuska &zp->z_uid, 8); 478*7a7741afSMartin Matuska SA_ADD_BULK_ATTR(bulk, count, SA_ZPL_GID(zfsvfs), NULL, 479*7a7741afSMartin Matuska &zp->z_gid, 8); 480*7a7741afSMartin Matuska 481*7a7741afSMartin Matuska if (sa_bulk_lookup(zp->z_sa_hdl, bulk, count) != 0 || zp->z_gen == 0 || 482*7a7741afSMartin Matuska (dmu_objset_projectquota_enabled(zfsvfs->z_os) && 483*7a7741afSMartin Matuska (zp->z_pflags & ZFS_PROJID) && 484*7a7741afSMartin Matuska sa_lookup(zp->z_sa_hdl, SA_ZPL_PROJID(zfsvfs), &projid, 8) != 0)) { 485*7a7741afSMartin Matuska if (hdl == NULL) 486*7a7741afSMartin Matuska sa_handle_destroy(zp->z_sa_hdl); 487*7a7741afSMartin Matuska zfs_vnode_forget(vp); 488*7a7741afSMartin Matuska zp->z_vnode = NULL; 489*7a7741afSMartin Matuska zfs_znode_free_kmem(zp); 490*7a7741afSMartin Matuska return (NULL); 491*7a7741afSMartin Matuska } 492*7a7741afSMartin Matuska 493*7a7741afSMartin Matuska zp->z_projid = projid; 494*7a7741afSMartin Matuska zp->z_mode = mode; 495*7a7741afSMartin Matuska 496*7a7741afSMartin Matuska /* Cache the xattr parent id */ 497*7a7741afSMartin Matuska if (zp->z_pflags & ZFS_XATTR) 498*7a7741afSMartin Matuska zp->z_xattr_parent = parent; 499*7a7741afSMartin Matuska 500*7a7741afSMartin Matuska vp->v_type = IFTOVT((mode_t)mode); 501*7a7741afSMartin Matuska 502*7a7741afSMartin Matuska switch (vp->v_type) { 503*7a7741afSMartin Matuska case VDIR: 504*7a7741afSMartin Matuska zp->z_zn_prefetch = B_TRUE; /* z_prefetch default is enabled */ 505*7a7741afSMartin Matuska break; 506*7a7741afSMartin Matuska case VFIFO: 507*7a7741afSMartin Matuska vp->v_op = &zfs_fifoops; 508*7a7741afSMartin Matuska break; 509*7a7741afSMartin Matuska case VREG: 510*7a7741afSMartin Matuska if (parent == zfsvfs->z_shares_dir) { 511*7a7741afSMartin Matuska ASSERT0(zp->z_uid); 512*7a7741afSMartin Matuska ASSERT0(zp->z_gid); 513*7a7741afSMartin Matuska vp->v_op = &zfs_shareops; 514*7a7741afSMartin Matuska } 515*7a7741afSMartin Matuska break; 516*7a7741afSMartin Matuska default: 517*7a7741afSMartin Matuska break; 518*7a7741afSMartin Matuska } 519*7a7741afSMartin Matuska 520*7a7741afSMartin Matuska mutex_enter(&zfsvfs->z_znodes_lock); 521*7a7741afSMartin Matuska list_insert_tail(&zfsvfs->z_all_znodes, zp); 522*7a7741afSMartin Matuska zp->z_zfsvfs = zfsvfs; 523*7a7741afSMartin Matuska mutex_exit(&zfsvfs->z_znodes_lock); 524*7a7741afSMartin Matuska 525*7a7741afSMartin Matuska #if __FreeBSD_version >= 1400077 526*7a7741afSMartin Matuska vn_set_state(vp, VSTATE_CONSTRUCTED); 527*7a7741afSMartin Matuska #endif 528*7a7741afSMartin Matuska VN_LOCK_AREC(vp); 529*7a7741afSMartin Matuska if (vp->v_type != VFIFO) 530*7a7741afSMartin Matuska VN_LOCK_ASHARE(vp); 531*7a7741afSMartin Matuska 532*7a7741afSMartin Matuska return (zp); 533*7a7741afSMartin Matuska } 534*7a7741afSMartin Matuska 535*7a7741afSMartin Matuska static uint64_t empty_xattr; 536*7a7741afSMartin Matuska static uint64_t pad[4]; 537*7a7741afSMartin Matuska static zfs_acl_phys_t acl_phys; 538*7a7741afSMartin Matuska /* 539*7a7741afSMartin Matuska * Create a new DMU object to hold a zfs znode. 540*7a7741afSMartin Matuska * 541*7a7741afSMartin Matuska * IN: dzp - parent directory for new znode 542*7a7741afSMartin Matuska * vap - file attributes for new znode 543*7a7741afSMartin Matuska * tx - dmu transaction id for zap operations 544*7a7741afSMartin Matuska * cr - credentials of caller 545*7a7741afSMartin Matuska * flag - flags: 546*7a7741afSMartin Matuska * IS_ROOT_NODE - new object will be root 547*7a7741afSMartin Matuska * IS_XATTR - new object is an attribute 548*7a7741afSMartin Matuska * bonuslen - length of bonus buffer 549*7a7741afSMartin Matuska * setaclp - File/Dir initial ACL 550*7a7741afSMartin Matuska * fuidp - Tracks fuid allocation. 551*7a7741afSMartin Matuska * 552*7a7741afSMartin Matuska * OUT: zpp - allocated znode 553*7a7741afSMartin Matuska * 554*7a7741afSMartin Matuska */ 555*7a7741afSMartin Matuska void 556*7a7741afSMartin Matuska zfs_mknode(znode_t *dzp, vattr_t *vap, dmu_tx_t *tx, cred_t *cr, 557*7a7741afSMartin Matuska uint_t flag, znode_t **zpp, zfs_acl_ids_t *acl_ids) 558*7a7741afSMartin Matuska { 559*7a7741afSMartin Matuska uint64_t crtime[2], atime[2], mtime[2], ctime[2]; 560*7a7741afSMartin Matuska uint64_t mode, size, links, parent, pflags; 561*7a7741afSMartin Matuska uint64_t dzp_pflags = 0; 562*7a7741afSMartin Matuska uint64_t rdev = 0; 563*7a7741afSMartin Matuska zfsvfs_t *zfsvfs = dzp->z_zfsvfs; 564*7a7741afSMartin Matuska dmu_buf_t *db; 565*7a7741afSMartin Matuska timestruc_t now; 566*7a7741afSMartin Matuska uint64_t gen, obj; 567*7a7741afSMartin Matuska int bonuslen; 568*7a7741afSMartin Matuska int dnodesize; 569*7a7741afSMartin Matuska sa_handle_t *sa_hdl; 570*7a7741afSMartin Matuska dmu_object_type_t obj_type; 571*7a7741afSMartin Matuska sa_bulk_attr_t *sa_attrs; 572*7a7741afSMartin Matuska int cnt = 0; 573*7a7741afSMartin Matuska zfs_acl_locator_cb_t locate = { 0 }; 574*7a7741afSMartin Matuska 575*7a7741afSMartin Matuska ASSERT3P(vap, !=, NULL); 576*7a7741afSMartin Matuska ASSERT3U((vap->va_mask & AT_MODE), ==, AT_MODE); 577*7a7741afSMartin Matuska 578*7a7741afSMartin Matuska if (zfsvfs->z_replay) { 579*7a7741afSMartin Matuska obj = vap->va_nodeid; 580*7a7741afSMartin Matuska now = vap->va_ctime; /* see zfs_replay_create() */ 581*7a7741afSMartin Matuska gen = vap->va_nblocks; /* ditto */ 582*7a7741afSMartin Matuska dnodesize = vap->va_fsid; /* ditto */ 583*7a7741afSMartin Matuska } else { 584*7a7741afSMartin Matuska obj = 0; 585*7a7741afSMartin Matuska vfs_timestamp(&now); 586*7a7741afSMartin Matuska gen = dmu_tx_get_txg(tx); 587*7a7741afSMartin Matuska dnodesize = dmu_objset_dnodesize(zfsvfs->z_os); 588*7a7741afSMartin Matuska } 589*7a7741afSMartin Matuska 590*7a7741afSMartin Matuska if (dnodesize == 0) 591*7a7741afSMartin Matuska dnodesize = DNODE_MIN_SIZE; 592*7a7741afSMartin Matuska 593*7a7741afSMartin Matuska obj_type = zfsvfs->z_use_sa ? DMU_OT_SA : DMU_OT_ZNODE; 594*7a7741afSMartin Matuska bonuslen = (obj_type == DMU_OT_SA) ? 595*7a7741afSMartin Matuska DN_BONUS_SIZE(dnodesize) : ZFS_OLD_ZNODE_PHYS_SIZE; 596*7a7741afSMartin Matuska 597*7a7741afSMartin Matuska /* 598*7a7741afSMartin Matuska * Create a new DMU object. 599*7a7741afSMartin Matuska */ 600*7a7741afSMartin Matuska /* 601*7a7741afSMartin Matuska * There's currently no mechanism for pre-reading the blocks that will 602*7a7741afSMartin Matuska * be needed to allocate a new object, so we accept the small chance 603*7a7741afSMartin Matuska * that there will be an i/o error and we will fail one of the 604*7a7741afSMartin Matuska * assertions below. 605*7a7741afSMartin Matuska */ 606*7a7741afSMartin Matuska if (vap->va_type == VDIR) { 607*7a7741afSMartin Matuska if (zfsvfs->z_replay) { 608*7a7741afSMartin Matuska VERIFY0(zap_create_claim_norm_dnsize(zfsvfs->z_os, obj, 609*7a7741afSMartin Matuska zfsvfs->z_norm, DMU_OT_DIRECTORY_CONTENTS, 610*7a7741afSMartin Matuska obj_type, bonuslen, dnodesize, tx)); 611*7a7741afSMartin Matuska } else { 612*7a7741afSMartin Matuska obj = zap_create_norm_dnsize(zfsvfs->z_os, 613*7a7741afSMartin Matuska zfsvfs->z_norm, DMU_OT_DIRECTORY_CONTENTS, 614*7a7741afSMartin Matuska obj_type, bonuslen, dnodesize, tx); 615*7a7741afSMartin Matuska } 616*7a7741afSMartin Matuska } else { 617*7a7741afSMartin Matuska if (zfsvfs->z_replay) { 618*7a7741afSMartin Matuska VERIFY0(dmu_object_claim_dnsize(zfsvfs->z_os, obj, 619*7a7741afSMartin Matuska DMU_OT_PLAIN_FILE_CONTENTS, 0, 620*7a7741afSMartin Matuska obj_type, bonuslen, dnodesize, tx)); 621*7a7741afSMartin Matuska } else { 622*7a7741afSMartin Matuska obj = dmu_object_alloc_dnsize(zfsvfs->z_os, 623*7a7741afSMartin Matuska DMU_OT_PLAIN_FILE_CONTENTS, 0, 624*7a7741afSMartin Matuska obj_type, bonuslen, dnodesize, tx); 625*7a7741afSMartin Matuska } 626*7a7741afSMartin Matuska } 627*7a7741afSMartin Matuska 628*7a7741afSMartin Matuska ZFS_OBJ_HOLD_ENTER(zfsvfs, obj); 629*7a7741afSMartin Matuska VERIFY0(sa_buf_hold(zfsvfs->z_os, obj, NULL, &db)); 630*7a7741afSMartin Matuska 631*7a7741afSMartin Matuska /* 632*7a7741afSMartin Matuska * If this is the root, fix up the half-initialized parent pointer 633*7a7741afSMartin Matuska * to reference the just-allocated physical data area. 634*7a7741afSMartin Matuska */ 635*7a7741afSMartin Matuska if (flag & IS_ROOT_NODE) { 636*7a7741afSMartin Matuska dzp->z_id = obj; 637*7a7741afSMartin Matuska } else { 638*7a7741afSMartin Matuska dzp_pflags = dzp->z_pflags; 639*7a7741afSMartin Matuska } 640*7a7741afSMartin Matuska 641*7a7741afSMartin Matuska /* 642*7a7741afSMartin Matuska * If parent is an xattr, so am I. 643*7a7741afSMartin Matuska */ 644*7a7741afSMartin Matuska if (dzp_pflags & ZFS_XATTR) { 645*7a7741afSMartin Matuska flag |= IS_XATTR; 646*7a7741afSMartin Matuska } 647*7a7741afSMartin Matuska 648*7a7741afSMartin Matuska if (zfsvfs->z_use_fuids) 649*7a7741afSMartin Matuska pflags = ZFS_ARCHIVE | ZFS_AV_MODIFIED; 650*7a7741afSMartin Matuska else 651*7a7741afSMartin Matuska pflags = 0; 652*7a7741afSMartin Matuska 653*7a7741afSMartin Matuska if (vap->va_type == VDIR) { 654*7a7741afSMartin Matuska size = 2; /* contents ("." and "..") */ 655*7a7741afSMartin Matuska links = (flag & (IS_ROOT_NODE | IS_XATTR)) ? 2 : 1; 656*7a7741afSMartin Matuska } else { 657*7a7741afSMartin Matuska size = links = 0; 658*7a7741afSMartin Matuska } 659*7a7741afSMartin Matuska 660*7a7741afSMartin Matuska if (vap->va_type == VBLK || vap->va_type == VCHR) { 661*7a7741afSMartin Matuska rdev = zfs_expldev(vap->va_rdev); 662*7a7741afSMartin Matuska } 663*7a7741afSMartin Matuska 664*7a7741afSMartin Matuska parent = dzp->z_id; 665*7a7741afSMartin Matuska mode = acl_ids->z_mode; 666*7a7741afSMartin Matuska if (flag & IS_XATTR) 667*7a7741afSMartin Matuska pflags |= ZFS_XATTR; 668*7a7741afSMartin Matuska 669*7a7741afSMartin Matuska /* 670*7a7741afSMartin Matuska * No execs denied will be determined when zfs_mode_compute() is called. 671*7a7741afSMartin Matuska */ 672*7a7741afSMartin Matuska pflags |= acl_ids->z_aclp->z_hints & 673*7a7741afSMartin Matuska (ZFS_ACL_TRIVIAL|ZFS_INHERIT_ACE|ZFS_ACL_AUTO_INHERIT| 674*7a7741afSMartin Matuska ZFS_ACL_DEFAULTED|ZFS_ACL_PROTECTED); 675*7a7741afSMartin Matuska 676*7a7741afSMartin Matuska ZFS_TIME_ENCODE(&now, crtime); 677*7a7741afSMartin Matuska ZFS_TIME_ENCODE(&now, ctime); 678*7a7741afSMartin Matuska 679*7a7741afSMartin Matuska if (vap->va_mask & AT_ATIME) { 680*7a7741afSMartin Matuska ZFS_TIME_ENCODE(&vap->va_atime, atime); 681*7a7741afSMartin Matuska } else { 682*7a7741afSMartin Matuska ZFS_TIME_ENCODE(&now, atime); 683*7a7741afSMartin Matuska } 684*7a7741afSMartin Matuska 685*7a7741afSMartin Matuska if (vap->va_mask & AT_MTIME) { 686*7a7741afSMartin Matuska ZFS_TIME_ENCODE(&vap->va_mtime, mtime); 687*7a7741afSMartin Matuska } else { 688*7a7741afSMartin Matuska ZFS_TIME_ENCODE(&now, mtime); 689*7a7741afSMartin Matuska } 690*7a7741afSMartin Matuska 691*7a7741afSMartin Matuska /* Now add in all of the "SA" attributes */ 692*7a7741afSMartin Matuska VERIFY0(sa_handle_get_from_db(zfsvfs->z_os, db, NULL, SA_HDL_SHARED, 693*7a7741afSMartin Matuska &sa_hdl)); 694*7a7741afSMartin Matuska 695*7a7741afSMartin Matuska /* 696*7a7741afSMartin Matuska * Setup the array of attributes to be replaced/set on the new file 697*7a7741afSMartin Matuska * 698*7a7741afSMartin Matuska * order for DMU_OT_ZNODE is critical since it needs to be constructed 699*7a7741afSMartin Matuska * in the old znode_phys_t format. Don't change this ordering 700*7a7741afSMartin Matuska */ 701*7a7741afSMartin Matuska sa_attrs = kmem_alloc(sizeof (sa_bulk_attr_t) * ZPL_END, KM_SLEEP); 702*7a7741afSMartin Matuska 703*7a7741afSMartin Matuska if (obj_type == DMU_OT_ZNODE) { 704*7a7741afSMartin Matuska SA_ADD_BULK_ATTR(sa_attrs, cnt, SA_ZPL_ATIME(zfsvfs), 705*7a7741afSMartin Matuska NULL, &atime, 16); 706*7a7741afSMartin Matuska SA_ADD_BULK_ATTR(sa_attrs, cnt, SA_ZPL_MTIME(zfsvfs), 707*7a7741afSMartin Matuska NULL, &mtime, 16); 708*7a7741afSMartin Matuska SA_ADD_BULK_ATTR(sa_attrs, cnt, SA_ZPL_CTIME(zfsvfs), 709*7a7741afSMartin Matuska NULL, &ctime, 16); 710*7a7741afSMartin Matuska SA_ADD_BULK_ATTR(sa_attrs, cnt, SA_ZPL_CRTIME(zfsvfs), 711*7a7741afSMartin Matuska NULL, &crtime, 16); 712*7a7741afSMartin Matuska SA_ADD_BULK_ATTR(sa_attrs, cnt, SA_ZPL_GEN(zfsvfs), 713*7a7741afSMartin Matuska NULL, &gen, 8); 714*7a7741afSMartin Matuska SA_ADD_BULK_ATTR(sa_attrs, cnt, SA_ZPL_MODE(zfsvfs), 715*7a7741afSMartin Matuska NULL, &mode, 8); 716*7a7741afSMartin Matuska SA_ADD_BULK_ATTR(sa_attrs, cnt, SA_ZPL_SIZE(zfsvfs), 717*7a7741afSMartin Matuska NULL, &size, 8); 718*7a7741afSMartin Matuska SA_ADD_BULK_ATTR(sa_attrs, cnt, SA_ZPL_PARENT(zfsvfs), 719*7a7741afSMartin Matuska NULL, &parent, 8); 720*7a7741afSMartin Matuska } else { 721*7a7741afSMartin Matuska SA_ADD_BULK_ATTR(sa_attrs, cnt, SA_ZPL_MODE(zfsvfs), 722*7a7741afSMartin Matuska NULL, &mode, 8); 723*7a7741afSMartin Matuska SA_ADD_BULK_ATTR(sa_attrs, cnt, SA_ZPL_SIZE(zfsvfs), 724*7a7741afSMartin Matuska NULL, &size, 8); 725*7a7741afSMartin Matuska SA_ADD_BULK_ATTR(sa_attrs, cnt, SA_ZPL_GEN(zfsvfs), 726*7a7741afSMartin Matuska NULL, &gen, 8); 727*7a7741afSMartin Matuska SA_ADD_BULK_ATTR(sa_attrs, cnt, SA_ZPL_UID(zfsvfs), 728*7a7741afSMartin Matuska NULL, &acl_ids->z_fuid, 8); 729*7a7741afSMartin Matuska SA_ADD_BULK_ATTR(sa_attrs, cnt, SA_ZPL_GID(zfsvfs), 730*7a7741afSMartin Matuska NULL, &acl_ids->z_fgid, 8); 731*7a7741afSMartin Matuska SA_ADD_BULK_ATTR(sa_attrs, cnt, SA_ZPL_PARENT(zfsvfs), 732*7a7741afSMartin Matuska NULL, &parent, 8); 733*7a7741afSMartin Matuska SA_ADD_BULK_ATTR(sa_attrs, cnt, SA_ZPL_FLAGS(zfsvfs), 734*7a7741afSMartin Matuska NULL, &pflags, 8); 735*7a7741afSMartin Matuska SA_ADD_BULK_ATTR(sa_attrs, cnt, SA_ZPL_ATIME(zfsvfs), 736*7a7741afSMartin Matuska NULL, &atime, 16); 737*7a7741afSMartin Matuska SA_ADD_BULK_ATTR(sa_attrs, cnt, SA_ZPL_MTIME(zfsvfs), 738*7a7741afSMartin Matuska NULL, &mtime, 16); 739*7a7741afSMartin Matuska SA_ADD_BULK_ATTR(sa_attrs, cnt, SA_ZPL_CTIME(zfsvfs), 740*7a7741afSMartin Matuska NULL, &ctime, 16); 741*7a7741afSMartin Matuska SA_ADD_BULK_ATTR(sa_attrs, cnt, SA_ZPL_CRTIME(zfsvfs), 742*7a7741afSMartin Matuska NULL, &crtime, 16); 743*7a7741afSMartin Matuska } 744*7a7741afSMartin Matuska 745*7a7741afSMartin Matuska SA_ADD_BULK_ATTR(sa_attrs, cnt, SA_ZPL_LINKS(zfsvfs), NULL, &links, 8); 746*7a7741afSMartin Matuska 747*7a7741afSMartin Matuska if (obj_type == DMU_OT_ZNODE) { 748*7a7741afSMartin Matuska SA_ADD_BULK_ATTR(sa_attrs, cnt, SA_ZPL_XATTR(zfsvfs), NULL, 749*7a7741afSMartin Matuska &empty_xattr, 8); 750*7a7741afSMartin Matuska } 751*7a7741afSMartin Matuska if (obj_type == DMU_OT_ZNODE || 752*7a7741afSMartin Matuska (vap->va_type == VBLK || vap->va_type == VCHR)) { 753*7a7741afSMartin Matuska SA_ADD_BULK_ATTR(sa_attrs, cnt, SA_ZPL_RDEV(zfsvfs), 754*7a7741afSMartin Matuska NULL, &rdev, 8); 755*7a7741afSMartin Matuska 756*7a7741afSMartin Matuska } 757*7a7741afSMartin Matuska if (obj_type == DMU_OT_ZNODE) { 758*7a7741afSMartin Matuska SA_ADD_BULK_ATTR(sa_attrs, cnt, SA_ZPL_FLAGS(zfsvfs), 759*7a7741afSMartin Matuska NULL, &pflags, 8); 760*7a7741afSMartin Matuska SA_ADD_BULK_ATTR(sa_attrs, cnt, SA_ZPL_UID(zfsvfs), NULL, 761*7a7741afSMartin Matuska &acl_ids->z_fuid, 8); 762*7a7741afSMartin Matuska SA_ADD_BULK_ATTR(sa_attrs, cnt, SA_ZPL_GID(zfsvfs), NULL, 763*7a7741afSMartin Matuska &acl_ids->z_fgid, 8); 764*7a7741afSMartin Matuska SA_ADD_BULK_ATTR(sa_attrs, cnt, SA_ZPL_PAD(zfsvfs), NULL, pad, 765*7a7741afSMartin Matuska sizeof (uint64_t) * 4); 766*7a7741afSMartin Matuska SA_ADD_BULK_ATTR(sa_attrs, cnt, SA_ZPL_ZNODE_ACL(zfsvfs), NULL, 767*7a7741afSMartin Matuska &acl_phys, sizeof (zfs_acl_phys_t)); 768*7a7741afSMartin Matuska } else if (acl_ids->z_aclp->z_version >= ZFS_ACL_VERSION_FUID) { 769*7a7741afSMartin Matuska SA_ADD_BULK_ATTR(sa_attrs, cnt, SA_ZPL_DACL_COUNT(zfsvfs), NULL, 770*7a7741afSMartin Matuska &acl_ids->z_aclp->z_acl_count, 8); 771*7a7741afSMartin Matuska locate.cb_aclp = acl_ids->z_aclp; 772*7a7741afSMartin Matuska SA_ADD_BULK_ATTR(sa_attrs, cnt, SA_ZPL_DACL_ACES(zfsvfs), 773*7a7741afSMartin Matuska zfs_acl_data_locator, &locate, 774*7a7741afSMartin Matuska acl_ids->z_aclp->z_acl_bytes); 775*7a7741afSMartin Matuska mode = zfs_mode_compute(mode, acl_ids->z_aclp, &pflags, 776*7a7741afSMartin Matuska acl_ids->z_fuid, acl_ids->z_fgid); 777*7a7741afSMartin Matuska } 778*7a7741afSMartin Matuska 779*7a7741afSMartin Matuska VERIFY0(sa_replace_all_by_template(sa_hdl, sa_attrs, cnt, tx)); 780*7a7741afSMartin Matuska 781*7a7741afSMartin Matuska if (!(flag & IS_ROOT_NODE)) { 782*7a7741afSMartin Matuska *zpp = zfs_znode_alloc(zfsvfs, db, 0, obj_type, sa_hdl); 783*7a7741afSMartin Matuska ASSERT3P(*zpp, !=, NULL); 784*7a7741afSMartin Matuska } else { 785*7a7741afSMartin Matuska /* 786*7a7741afSMartin Matuska * If we are creating the root node, the "parent" we 787*7a7741afSMartin Matuska * passed in is the znode for the root. 788*7a7741afSMartin Matuska */ 789*7a7741afSMartin Matuska *zpp = dzp; 790*7a7741afSMartin Matuska 791*7a7741afSMartin Matuska (*zpp)->z_sa_hdl = sa_hdl; 792*7a7741afSMartin Matuska } 793*7a7741afSMartin Matuska 794*7a7741afSMartin Matuska (*zpp)->z_pflags = pflags; 795*7a7741afSMartin Matuska (*zpp)->z_mode = mode; 796*7a7741afSMartin Matuska (*zpp)->z_dnodesize = dnodesize; 797*7a7741afSMartin Matuska 798*7a7741afSMartin Matuska if (vap->va_mask & AT_XVATTR) 799*7a7741afSMartin Matuska zfs_xvattr_set(*zpp, (xvattr_t *)vap, tx); 800*7a7741afSMartin Matuska 801*7a7741afSMartin Matuska if (obj_type == DMU_OT_ZNODE || 802*7a7741afSMartin Matuska acl_ids->z_aclp->z_version < ZFS_ACL_VERSION_FUID) { 803*7a7741afSMartin Matuska VERIFY0(zfs_aclset_common(*zpp, acl_ids->z_aclp, cr, tx)); 804*7a7741afSMartin Matuska } 805*7a7741afSMartin Matuska if (!(flag & IS_ROOT_NODE)) { 806*7a7741afSMartin Matuska vnode_t *vp = ZTOV(*zpp); 807*7a7741afSMartin Matuska vp->v_vflag |= VV_FORCEINSMQ; 808*7a7741afSMartin Matuska int err = insmntque(vp, zfsvfs->z_vfs); 809*7a7741afSMartin Matuska vp->v_vflag &= ~VV_FORCEINSMQ; 810*7a7741afSMartin Matuska (void) err; 811*7a7741afSMartin Matuska KASSERT(err == 0, ("insmntque() failed: error %d", err)); 812*7a7741afSMartin Matuska } 813*7a7741afSMartin Matuska kmem_free(sa_attrs, sizeof (sa_bulk_attr_t) * ZPL_END); 814*7a7741afSMartin Matuska ZFS_OBJ_HOLD_EXIT(zfsvfs, obj); 815*7a7741afSMartin Matuska } 816*7a7741afSMartin Matuska 817*7a7741afSMartin Matuska /* 818*7a7741afSMartin Matuska * Update in-core attributes. It is assumed the caller will be doing an 819*7a7741afSMartin Matuska * sa_bulk_update to push the changes out. 820*7a7741afSMartin Matuska */ 821*7a7741afSMartin Matuska void 822*7a7741afSMartin Matuska zfs_xvattr_set(znode_t *zp, xvattr_t *xvap, dmu_tx_t *tx) 823*7a7741afSMartin Matuska { 824*7a7741afSMartin Matuska xoptattr_t *xoap; 825*7a7741afSMartin Matuska 826*7a7741afSMartin Matuska xoap = xva_getxoptattr(xvap); 827*7a7741afSMartin Matuska ASSERT3P(xoap, !=, NULL); 828*7a7741afSMartin Matuska 829*7a7741afSMartin Matuska if (zp->z_zfsvfs->z_replay == B_FALSE) { 830*7a7741afSMartin Matuska ASSERT_VOP_IN_SEQC(ZTOV(zp)); 831*7a7741afSMartin Matuska } 832*7a7741afSMartin Matuska 833*7a7741afSMartin Matuska if (XVA_ISSET_REQ(xvap, XAT_CREATETIME)) { 834*7a7741afSMartin Matuska uint64_t times[2]; 835*7a7741afSMartin Matuska ZFS_TIME_ENCODE(&xoap->xoa_createtime, times); 836*7a7741afSMartin Matuska (void) sa_update(zp->z_sa_hdl, SA_ZPL_CRTIME(zp->z_zfsvfs), 837*7a7741afSMartin Matuska ×, sizeof (times), tx); 838*7a7741afSMartin Matuska XVA_SET_RTN(xvap, XAT_CREATETIME); 839*7a7741afSMartin Matuska } 840*7a7741afSMartin Matuska if (XVA_ISSET_REQ(xvap, XAT_READONLY)) { 841*7a7741afSMartin Matuska ZFS_ATTR_SET(zp, ZFS_READONLY, xoap->xoa_readonly, 842*7a7741afSMartin Matuska zp->z_pflags, tx); 843*7a7741afSMartin Matuska XVA_SET_RTN(xvap, XAT_READONLY); 844*7a7741afSMartin Matuska } 845*7a7741afSMartin Matuska if (XVA_ISSET_REQ(xvap, XAT_HIDDEN)) { 846*7a7741afSMartin Matuska ZFS_ATTR_SET(zp, ZFS_HIDDEN, xoap->xoa_hidden, 847*7a7741afSMartin Matuska zp->z_pflags, tx); 848*7a7741afSMartin Matuska XVA_SET_RTN(xvap, XAT_HIDDEN); 849*7a7741afSMartin Matuska } 850*7a7741afSMartin Matuska if (XVA_ISSET_REQ(xvap, XAT_SYSTEM)) { 851*7a7741afSMartin Matuska ZFS_ATTR_SET(zp, ZFS_SYSTEM, xoap->xoa_system, 852*7a7741afSMartin Matuska zp->z_pflags, tx); 853*7a7741afSMartin Matuska XVA_SET_RTN(xvap, XAT_SYSTEM); 854*7a7741afSMartin Matuska } 855*7a7741afSMartin Matuska if (XVA_ISSET_REQ(xvap, XAT_ARCHIVE)) { 856*7a7741afSMartin Matuska ZFS_ATTR_SET(zp, ZFS_ARCHIVE, xoap->xoa_archive, 857*7a7741afSMartin Matuska zp->z_pflags, tx); 858*7a7741afSMartin Matuska XVA_SET_RTN(xvap, XAT_ARCHIVE); 859*7a7741afSMartin Matuska } 860*7a7741afSMartin Matuska if (XVA_ISSET_REQ(xvap, XAT_IMMUTABLE)) { 861*7a7741afSMartin Matuska ZFS_ATTR_SET(zp, ZFS_IMMUTABLE, xoap->xoa_immutable, 862*7a7741afSMartin Matuska zp->z_pflags, tx); 863*7a7741afSMartin Matuska XVA_SET_RTN(xvap, XAT_IMMUTABLE); 864*7a7741afSMartin Matuska } 865*7a7741afSMartin Matuska if (XVA_ISSET_REQ(xvap, XAT_NOUNLINK)) { 866*7a7741afSMartin Matuska ZFS_ATTR_SET(zp, ZFS_NOUNLINK, xoap->xoa_nounlink, 867*7a7741afSMartin Matuska zp->z_pflags, tx); 868*7a7741afSMartin Matuska XVA_SET_RTN(xvap, XAT_NOUNLINK); 869*7a7741afSMartin Matuska } 870*7a7741afSMartin Matuska if (XVA_ISSET_REQ(xvap, XAT_APPENDONLY)) { 871*7a7741afSMartin Matuska ZFS_ATTR_SET(zp, ZFS_APPENDONLY, xoap->xoa_appendonly, 872*7a7741afSMartin Matuska zp->z_pflags, tx); 873*7a7741afSMartin Matuska XVA_SET_RTN(xvap, XAT_APPENDONLY); 874*7a7741afSMartin Matuska } 875*7a7741afSMartin Matuska if (XVA_ISSET_REQ(xvap, XAT_NODUMP)) { 876*7a7741afSMartin Matuska ZFS_ATTR_SET(zp, ZFS_NODUMP, xoap->xoa_nodump, 877*7a7741afSMartin Matuska zp->z_pflags, tx); 878*7a7741afSMartin Matuska XVA_SET_RTN(xvap, XAT_NODUMP); 879*7a7741afSMartin Matuska } 880*7a7741afSMartin Matuska if (XVA_ISSET_REQ(xvap, XAT_OPAQUE)) { 881*7a7741afSMartin Matuska ZFS_ATTR_SET(zp, ZFS_OPAQUE, xoap->xoa_opaque, 882*7a7741afSMartin Matuska zp->z_pflags, tx); 883*7a7741afSMartin Matuska XVA_SET_RTN(xvap, XAT_OPAQUE); 884*7a7741afSMartin Matuska } 885*7a7741afSMartin Matuska if (XVA_ISSET_REQ(xvap, XAT_AV_QUARANTINED)) { 886*7a7741afSMartin Matuska ZFS_ATTR_SET(zp, ZFS_AV_QUARANTINED, 887*7a7741afSMartin Matuska xoap->xoa_av_quarantined, zp->z_pflags, tx); 888*7a7741afSMartin Matuska XVA_SET_RTN(xvap, XAT_AV_QUARANTINED); 889*7a7741afSMartin Matuska } 890*7a7741afSMartin Matuska if (XVA_ISSET_REQ(xvap, XAT_AV_MODIFIED)) { 891*7a7741afSMartin Matuska ZFS_ATTR_SET(zp, ZFS_AV_MODIFIED, xoap->xoa_av_modified, 892*7a7741afSMartin Matuska zp->z_pflags, tx); 893*7a7741afSMartin Matuska XVA_SET_RTN(xvap, XAT_AV_MODIFIED); 894*7a7741afSMartin Matuska } 895*7a7741afSMartin Matuska if (XVA_ISSET_REQ(xvap, XAT_AV_SCANSTAMP)) { 896*7a7741afSMartin Matuska zfs_sa_set_scanstamp(zp, xvap, tx); 897*7a7741afSMartin Matuska XVA_SET_RTN(xvap, XAT_AV_SCANSTAMP); 898*7a7741afSMartin Matuska } 899*7a7741afSMartin Matuska if (XVA_ISSET_REQ(xvap, XAT_REPARSE)) { 900*7a7741afSMartin Matuska ZFS_ATTR_SET(zp, ZFS_REPARSE, xoap->xoa_reparse, 901*7a7741afSMartin Matuska zp->z_pflags, tx); 902*7a7741afSMartin Matuska XVA_SET_RTN(xvap, XAT_REPARSE); 903*7a7741afSMartin Matuska } 904*7a7741afSMartin Matuska if (XVA_ISSET_REQ(xvap, XAT_OFFLINE)) { 905*7a7741afSMartin Matuska ZFS_ATTR_SET(zp, ZFS_OFFLINE, xoap->xoa_offline, 906*7a7741afSMartin Matuska zp->z_pflags, tx); 907*7a7741afSMartin Matuska XVA_SET_RTN(xvap, XAT_OFFLINE); 908*7a7741afSMartin Matuska } 909*7a7741afSMartin Matuska if (XVA_ISSET_REQ(xvap, XAT_SPARSE)) { 910*7a7741afSMartin Matuska ZFS_ATTR_SET(zp, ZFS_SPARSE, xoap->xoa_sparse, 911*7a7741afSMartin Matuska zp->z_pflags, tx); 912*7a7741afSMartin Matuska XVA_SET_RTN(xvap, XAT_SPARSE); 913*7a7741afSMartin Matuska } 914*7a7741afSMartin Matuska } 915*7a7741afSMartin Matuska 916*7a7741afSMartin Matuska int 917*7a7741afSMartin Matuska zfs_zget(zfsvfs_t *zfsvfs, uint64_t obj_num, znode_t **zpp) 918*7a7741afSMartin Matuska { 919*7a7741afSMartin Matuska dmu_object_info_t doi; 920*7a7741afSMartin Matuska dmu_buf_t *db; 921*7a7741afSMartin Matuska znode_t *zp; 922*7a7741afSMartin Matuska vnode_t *vp; 923*7a7741afSMartin Matuska sa_handle_t *hdl; 924*7a7741afSMartin Matuska int locked; 925*7a7741afSMartin Matuska int err; 926*7a7741afSMartin Matuska 927*7a7741afSMartin Matuska getnewvnode_reserve(); 928*7a7741afSMartin Matuska again: 929*7a7741afSMartin Matuska *zpp = NULL; 930*7a7741afSMartin Matuska ZFS_OBJ_HOLD_ENTER(zfsvfs, obj_num); 931*7a7741afSMartin Matuska 932*7a7741afSMartin Matuska err = sa_buf_hold(zfsvfs->z_os, obj_num, NULL, &db); 933*7a7741afSMartin Matuska if (err) { 934*7a7741afSMartin Matuska ZFS_OBJ_HOLD_EXIT(zfsvfs, obj_num); 935*7a7741afSMartin Matuska getnewvnode_drop_reserve(); 936*7a7741afSMartin Matuska return (err); 937*7a7741afSMartin Matuska } 938*7a7741afSMartin Matuska 939*7a7741afSMartin Matuska dmu_object_info_from_db(db, &doi); 940*7a7741afSMartin Matuska if (doi.doi_bonus_type != DMU_OT_SA && 941*7a7741afSMartin Matuska (doi.doi_bonus_type != DMU_OT_ZNODE || 942*7a7741afSMartin Matuska (doi.doi_bonus_type == DMU_OT_ZNODE && 943*7a7741afSMartin Matuska doi.doi_bonus_size < sizeof (znode_phys_t)))) { 944*7a7741afSMartin Matuska sa_buf_rele(db, NULL); 945*7a7741afSMartin Matuska ZFS_OBJ_HOLD_EXIT(zfsvfs, obj_num); 946*7a7741afSMartin Matuska getnewvnode_drop_reserve(); 947*7a7741afSMartin Matuska return (SET_ERROR(EINVAL)); 948*7a7741afSMartin Matuska } 949*7a7741afSMartin Matuska 950*7a7741afSMartin Matuska hdl = dmu_buf_get_user(db); 951*7a7741afSMartin Matuska if (hdl != NULL) { 952*7a7741afSMartin Matuska zp = sa_get_userdata(hdl); 953*7a7741afSMartin Matuska 954*7a7741afSMartin Matuska /* 955*7a7741afSMartin Matuska * Since "SA" does immediate eviction we 956*7a7741afSMartin Matuska * should never find a sa handle that doesn't 957*7a7741afSMartin Matuska * know about the znode. 958*7a7741afSMartin Matuska */ 959*7a7741afSMartin Matuska ASSERT3P(zp, !=, NULL); 960*7a7741afSMartin Matuska ASSERT3U(zp->z_id, ==, obj_num); 961*7a7741afSMartin Matuska if (zp->z_unlinked) { 962*7a7741afSMartin Matuska err = SET_ERROR(ENOENT); 963*7a7741afSMartin Matuska } else { 964*7a7741afSMartin Matuska vp = ZTOV(zp); 965*7a7741afSMartin Matuska /* 966*7a7741afSMartin Matuska * Don't let the vnode disappear after 967*7a7741afSMartin Matuska * ZFS_OBJ_HOLD_EXIT. 968*7a7741afSMartin Matuska */ 969*7a7741afSMartin Matuska VN_HOLD(vp); 970*7a7741afSMartin Matuska *zpp = zp; 971*7a7741afSMartin Matuska err = 0; 972*7a7741afSMartin Matuska } 973*7a7741afSMartin Matuska 974*7a7741afSMartin Matuska sa_buf_rele(db, NULL); 975*7a7741afSMartin Matuska ZFS_OBJ_HOLD_EXIT(zfsvfs, obj_num); 976*7a7741afSMartin Matuska 977*7a7741afSMartin Matuska if (err) { 978*7a7741afSMartin Matuska getnewvnode_drop_reserve(); 979*7a7741afSMartin Matuska return (err); 980*7a7741afSMartin Matuska } 981*7a7741afSMartin Matuska 982*7a7741afSMartin Matuska locked = VOP_ISLOCKED(vp); 983*7a7741afSMartin Matuska VI_LOCK(vp); 984*7a7741afSMartin Matuska if (VN_IS_DOOMED(vp) && locked != LK_EXCLUSIVE) { 985*7a7741afSMartin Matuska /* 986*7a7741afSMartin Matuska * The vnode is doomed and this thread doesn't 987*7a7741afSMartin Matuska * hold the exclusive lock on it, so the vnode 988*7a7741afSMartin Matuska * must be being reclaimed by another thread. 989*7a7741afSMartin Matuska * Otherwise the doomed vnode is being reclaimed 990*7a7741afSMartin Matuska * by this thread and zfs_zget is called from 991*7a7741afSMartin Matuska * ZIL internals. 992*7a7741afSMartin Matuska */ 993*7a7741afSMartin Matuska VI_UNLOCK(vp); 994*7a7741afSMartin Matuska 995*7a7741afSMartin Matuska /* 996*7a7741afSMartin Matuska * XXX vrele() locks the vnode when the last reference 997*7a7741afSMartin Matuska * is dropped. Although in this case the vnode is 998*7a7741afSMartin Matuska * doomed / dead and so no inactivation is required, 999*7a7741afSMartin Matuska * the vnode lock is still acquired. That could result 1000*7a7741afSMartin Matuska * in a LOR with z_teardown_lock if another thread holds 1001*7a7741afSMartin Matuska * the vnode's lock and tries to take z_teardown_lock. 1002*7a7741afSMartin Matuska * But that is only possible if the other thread peforms 1003*7a7741afSMartin Matuska * a ZFS vnode operation on the vnode. That either 1004*7a7741afSMartin Matuska * should not happen if the vnode is dead or the thread 1005*7a7741afSMartin Matuska * should also have a reference to the vnode and thus 1006*7a7741afSMartin Matuska * our reference is not last. 1007*7a7741afSMartin Matuska */ 1008*7a7741afSMartin Matuska VN_RELE(vp); 1009*7a7741afSMartin Matuska goto again; 1010*7a7741afSMartin Matuska } 1011*7a7741afSMartin Matuska VI_UNLOCK(vp); 1012*7a7741afSMartin Matuska getnewvnode_drop_reserve(); 1013*7a7741afSMartin Matuska return (err); 1014*7a7741afSMartin Matuska } 1015*7a7741afSMartin Matuska 1016*7a7741afSMartin Matuska /* 1017*7a7741afSMartin Matuska * Not found create new znode/vnode 1018*7a7741afSMartin Matuska * but only if file exists. 1019*7a7741afSMartin Matuska * 1020*7a7741afSMartin Matuska * There is a small window where zfs_vget() could 1021*7a7741afSMartin Matuska * find this object while a file create is still in 1022*7a7741afSMartin Matuska * progress. This is checked for in zfs_znode_alloc() 1023*7a7741afSMartin Matuska * 1024*7a7741afSMartin Matuska * if zfs_znode_alloc() fails it will drop the hold on the 1025*7a7741afSMartin Matuska * bonus buffer. 1026*7a7741afSMartin Matuska */ 1027*7a7741afSMartin Matuska zp = zfs_znode_alloc(zfsvfs, db, doi.doi_data_block_size, 1028*7a7741afSMartin Matuska doi.doi_bonus_type, NULL); 1029*7a7741afSMartin Matuska if (zp == NULL) { 1030*7a7741afSMartin Matuska err = SET_ERROR(ENOENT); 1031*7a7741afSMartin Matuska } else { 1032*7a7741afSMartin Matuska *zpp = zp; 1033*7a7741afSMartin Matuska } 1034*7a7741afSMartin Matuska if (err == 0) { 1035*7a7741afSMartin Matuska vnode_t *vp = ZTOV(zp); 1036*7a7741afSMartin Matuska 1037*7a7741afSMartin Matuska err = insmntque(vp, zfsvfs->z_vfs); 1038*7a7741afSMartin Matuska if (err == 0) { 1039*7a7741afSMartin Matuska vp->v_hash = obj_num; 1040*7a7741afSMartin Matuska VOP_UNLOCK(vp); 1041*7a7741afSMartin Matuska } else { 1042*7a7741afSMartin Matuska zp->z_vnode = NULL; 1043*7a7741afSMartin Matuska zfs_znode_dmu_fini(zp); 1044*7a7741afSMartin Matuska zfs_znode_free(zp); 1045*7a7741afSMartin Matuska *zpp = NULL; 1046*7a7741afSMartin Matuska } 1047*7a7741afSMartin Matuska } 1048*7a7741afSMartin Matuska ZFS_OBJ_HOLD_EXIT(zfsvfs, obj_num); 1049*7a7741afSMartin Matuska getnewvnode_drop_reserve(); 1050*7a7741afSMartin Matuska return (err); 1051*7a7741afSMartin Matuska } 1052*7a7741afSMartin Matuska 1053*7a7741afSMartin Matuska int 1054*7a7741afSMartin Matuska zfs_rezget(znode_t *zp) 1055*7a7741afSMartin Matuska { 1056*7a7741afSMartin Matuska zfsvfs_t *zfsvfs = zp->z_zfsvfs; 1057*7a7741afSMartin Matuska dmu_object_info_t doi; 1058*7a7741afSMartin Matuska dmu_buf_t *db; 1059*7a7741afSMartin Matuska vnode_t *vp; 1060*7a7741afSMartin Matuska uint64_t obj_num = zp->z_id; 1061*7a7741afSMartin Matuska uint64_t mode, size; 1062*7a7741afSMartin Matuska sa_bulk_attr_t bulk[8]; 1063*7a7741afSMartin Matuska int err; 1064*7a7741afSMartin Matuska int count = 0; 1065*7a7741afSMartin Matuska uint64_t gen; 1066*7a7741afSMartin Matuska 1067*7a7741afSMartin Matuska /* 1068*7a7741afSMartin Matuska * Remove cached pages before reloading the znode, so that they are not 1069*7a7741afSMartin Matuska * lingering after we run into any error. Ideally, we should vgone() 1070*7a7741afSMartin Matuska * the vnode in case of error, but currently we cannot do that 1071*7a7741afSMartin Matuska * because of the LOR between the vnode lock and z_teardown_lock. 1072*7a7741afSMartin Matuska * So, instead, we have to "doom" the znode in the illumos style. 1073*7a7741afSMartin Matuska * 1074*7a7741afSMartin Matuska * Ignore invalid pages during the scan. This is to avoid deadlocks 1075*7a7741afSMartin Matuska * between page busying and the teardown lock, as pages are busied prior 1076*7a7741afSMartin Matuska * to a VOP_GETPAGES operation, which acquires the teardown read lock. 1077*7a7741afSMartin Matuska * Such pages will be invalid and can safely be skipped here. 1078*7a7741afSMartin Matuska */ 1079*7a7741afSMartin Matuska vp = ZTOV(zp); 1080*7a7741afSMartin Matuska #if __FreeBSD_version >= 1400042 1081*7a7741afSMartin Matuska vn_pages_remove_valid(vp, 0, 0); 1082*7a7741afSMartin Matuska #else 1083*7a7741afSMartin Matuska vn_pages_remove(vp, 0, 0); 1084*7a7741afSMartin Matuska #endif 1085*7a7741afSMartin Matuska 1086*7a7741afSMartin Matuska ZFS_OBJ_HOLD_ENTER(zfsvfs, obj_num); 1087*7a7741afSMartin Matuska 1088*7a7741afSMartin Matuska mutex_enter(&zp->z_acl_lock); 1089*7a7741afSMartin Matuska if (zp->z_acl_cached) { 1090*7a7741afSMartin Matuska zfs_acl_free(zp->z_acl_cached); 1091*7a7741afSMartin Matuska zp->z_acl_cached = NULL; 1092*7a7741afSMartin Matuska } 1093*7a7741afSMartin Matuska mutex_exit(&zp->z_acl_lock); 1094*7a7741afSMartin Matuska 1095*7a7741afSMartin Matuska rw_enter(&zp->z_xattr_lock, RW_WRITER); 1096*7a7741afSMartin Matuska if (zp->z_xattr_cached) { 1097*7a7741afSMartin Matuska nvlist_free(zp->z_xattr_cached); 1098*7a7741afSMartin Matuska zp->z_xattr_cached = NULL; 1099*7a7741afSMartin Matuska } 1100*7a7741afSMartin Matuska rw_exit(&zp->z_xattr_lock); 1101*7a7741afSMartin Matuska 1102*7a7741afSMartin Matuska ASSERT3P(zp->z_sa_hdl, ==, NULL); 1103*7a7741afSMartin Matuska err = sa_buf_hold(zfsvfs->z_os, obj_num, NULL, &db); 1104*7a7741afSMartin Matuska if (err) { 1105*7a7741afSMartin Matuska ZFS_OBJ_HOLD_EXIT(zfsvfs, obj_num); 1106*7a7741afSMartin Matuska return (err); 1107*7a7741afSMartin Matuska } 1108*7a7741afSMartin Matuska 1109*7a7741afSMartin Matuska dmu_object_info_from_db(db, &doi); 1110*7a7741afSMartin Matuska if (doi.doi_bonus_type != DMU_OT_SA && 1111*7a7741afSMartin Matuska (doi.doi_bonus_type != DMU_OT_ZNODE || 1112*7a7741afSMartin Matuska (doi.doi_bonus_type == DMU_OT_ZNODE && 1113*7a7741afSMartin Matuska doi.doi_bonus_size < sizeof (znode_phys_t)))) { 1114*7a7741afSMartin Matuska sa_buf_rele(db, NULL); 1115*7a7741afSMartin Matuska ZFS_OBJ_HOLD_EXIT(zfsvfs, obj_num); 1116*7a7741afSMartin Matuska return (SET_ERROR(EINVAL)); 1117*7a7741afSMartin Matuska } 1118*7a7741afSMartin Matuska 1119*7a7741afSMartin Matuska zfs_znode_sa_init(zfsvfs, zp, db, doi.doi_bonus_type, NULL); 1120*7a7741afSMartin Matuska size = zp->z_size; 1121*7a7741afSMartin Matuska 1122*7a7741afSMartin Matuska /* reload cached values */ 1123*7a7741afSMartin Matuska SA_ADD_BULK_ATTR(bulk, count, SA_ZPL_GEN(zfsvfs), NULL, 1124*7a7741afSMartin Matuska &gen, sizeof (gen)); 1125*7a7741afSMartin Matuska SA_ADD_BULK_ATTR(bulk, count, SA_ZPL_SIZE(zfsvfs), NULL, 1126*7a7741afSMartin Matuska &zp->z_size, sizeof (zp->z_size)); 1127*7a7741afSMartin Matuska SA_ADD_BULK_ATTR(bulk, count, SA_ZPL_LINKS(zfsvfs), NULL, 1128*7a7741afSMartin Matuska &zp->z_links, sizeof (zp->z_links)); 1129*7a7741afSMartin Matuska SA_ADD_BULK_ATTR(bulk, count, SA_ZPL_FLAGS(zfsvfs), NULL, 1130*7a7741afSMartin Matuska &zp->z_pflags, sizeof (zp->z_pflags)); 1131*7a7741afSMartin Matuska SA_ADD_BULK_ATTR(bulk, count, SA_ZPL_ATIME(zfsvfs), NULL, 1132*7a7741afSMartin Matuska &zp->z_atime, sizeof (zp->z_atime)); 1133*7a7741afSMartin Matuska SA_ADD_BULK_ATTR(bulk, count, SA_ZPL_UID(zfsvfs), NULL, 1134*7a7741afSMartin Matuska &zp->z_uid, sizeof (zp->z_uid)); 1135*7a7741afSMartin Matuska SA_ADD_BULK_ATTR(bulk, count, SA_ZPL_GID(zfsvfs), NULL, 1136*7a7741afSMartin Matuska &zp->z_gid, sizeof (zp->z_gid)); 1137*7a7741afSMartin Matuska SA_ADD_BULK_ATTR(bulk, count, SA_ZPL_MODE(zfsvfs), NULL, 1138*7a7741afSMartin Matuska &mode, sizeof (mode)); 1139*7a7741afSMartin Matuska 1140*7a7741afSMartin Matuska if (sa_bulk_lookup(zp->z_sa_hdl, bulk, count)) { 1141*7a7741afSMartin Matuska zfs_znode_dmu_fini(zp); 1142*7a7741afSMartin Matuska ZFS_OBJ_HOLD_EXIT(zfsvfs, obj_num); 1143*7a7741afSMartin Matuska return (SET_ERROR(EIO)); 1144*7a7741afSMartin Matuska } 1145*7a7741afSMartin Matuska 1146*7a7741afSMartin Matuska zp->z_mode = mode; 1147*7a7741afSMartin Matuska 1148*7a7741afSMartin Matuska if (gen != zp->z_gen) { 1149*7a7741afSMartin Matuska zfs_znode_dmu_fini(zp); 1150*7a7741afSMartin Matuska ZFS_OBJ_HOLD_EXIT(zfsvfs, obj_num); 1151*7a7741afSMartin Matuska return (SET_ERROR(EIO)); 1152*7a7741afSMartin Matuska } 1153*7a7741afSMartin Matuska 1154*7a7741afSMartin Matuska /* 1155*7a7741afSMartin Matuska * It is highly improbable but still quite possible that two 1156*7a7741afSMartin Matuska * objects in different datasets are created with the same 1157*7a7741afSMartin Matuska * object numbers and in transaction groups with the same 1158*7a7741afSMartin Matuska * numbers. znodes corresponding to those objects would 1159*7a7741afSMartin Matuska * have the same z_id and z_gen, but their other attributes 1160*7a7741afSMartin Matuska * may be different. 1161*7a7741afSMartin Matuska * zfs recv -F may replace one of such objects with the other. 1162*7a7741afSMartin Matuska * As a result file properties recorded in the replaced 1163*7a7741afSMartin Matuska * object's vnode may no longer match the received object's 1164*7a7741afSMartin Matuska * properties. At present the only cached property is the 1165*7a7741afSMartin Matuska * files type recorded in v_type. 1166*7a7741afSMartin Matuska * So, handle this case by leaving the old vnode and znode 1167*7a7741afSMartin Matuska * disassociated from the actual object. A new vnode and a 1168*7a7741afSMartin Matuska * znode will be created if the object is accessed 1169*7a7741afSMartin Matuska * (e.g. via a look-up). The old vnode and znode will be 1170*7a7741afSMartin Matuska * recycled when the last vnode reference is dropped. 1171*7a7741afSMartin Matuska */ 1172*7a7741afSMartin Matuska if (vp->v_type != IFTOVT((mode_t)zp->z_mode)) { 1173*7a7741afSMartin Matuska zfs_znode_dmu_fini(zp); 1174*7a7741afSMartin Matuska ZFS_OBJ_HOLD_EXIT(zfsvfs, obj_num); 1175*7a7741afSMartin Matuska return (SET_ERROR(EIO)); 1176*7a7741afSMartin Matuska } 1177*7a7741afSMartin Matuska 1178*7a7741afSMartin Matuska /* 1179*7a7741afSMartin Matuska * If the file has zero links, then it has been unlinked on the send 1180*7a7741afSMartin Matuska * side and it must be in the received unlinked set. 1181*7a7741afSMartin Matuska * We call zfs_znode_dmu_fini() now to prevent any accesses to the 1182*7a7741afSMartin Matuska * stale data and to prevent automatically removal of the file in 1183*7a7741afSMartin Matuska * zfs_zinactive(). The file will be removed either when it is removed 1184*7a7741afSMartin Matuska * on the send side and the next incremental stream is received or 1185*7a7741afSMartin Matuska * when the unlinked set gets processed. 1186*7a7741afSMartin Matuska */ 1187*7a7741afSMartin Matuska zp->z_unlinked = (zp->z_links == 0); 1188*7a7741afSMartin Matuska if (zp->z_unlinked) { 1189*7a7741afSMartin Matuska zfs_znode_dmu_fini(zp); 1190*7a7741afSMartin Matuska ZFS_OBJ_HOLD_EXIT(zfsvfs, obj_num); 1191*7a7741afSMartin Matuska return (0); 1192*7a7741afSMartin Matuska } 1193*7a7741afSMartin Matuska 1194*7a7741afSMartin Matuska zp->z_blksz = doi.doi_data_block_size; 1195*7a7741afSMartin Matuska if (zp->z_size != size) 1196*7a7741afSMartin Matuska vnode_pager_setsize(vp, zp->z_size); 1197*7a7741afSMartin Matuska 1198*7a7741afSMartin Matuska ZFS_OBJ_HOLD_EXIT(zfsvfs, obj_num); 1199*7a7741afSMartin Matuska 1200*7a7741afSMartin Matuska return (0); 1201*7a7741afSMartin Matuska } 1202*7a7741afSMartin Matuska 1203*7a7741afSMartin Matuska void 1204*7a7741afSMartin Matuska zfs_znode_delete(znode_t *zp, dmu_tx_t *tx) 1205*7a7741afSMartin Matuska { 1206*7a7741afSMartin Matuska zfsvfs_t *zfsvfs = zp->z_zfsvfs; 1207*7a7741afSMartin Matuska objset_t *os = zfsvfs->z_os; 1208*7a7741afSMartin Matuska uint64_t obj = zp->z_id; 1209*7a7741afSMartin Matuska uint64_t acl_obj = zfs_external_acl(zp); 1210*7a7741afSMartin Matuska 1211*7a7741afSMartin Matuska ZFS_OBJ_HOLD_ENTER(zfsvfs, obj); 1212*7a7741afSMartin Matuska if (acl_obj) { 1213*7a7741afSMartin Matuska VERIFY(!zp->z_is_sa); 1214*7a7741afSMartin Matuska VERIFY0(dmu_object_free(os, acl_obj, tx)); 1215*7a7741afSMartin Matuska } 1216*7a7741afSMartin Matuska VERIFY0(dmu_object_free(os, obj, tx)); 1217*7a7741afSMartin Matuska zfs_znode_dmu_fini(zp); 1218*7a7741afSMartin Matuska ZFS_OBJ_HOLD_EXIT(zfsvfs, obj); 1219*7a7741afSMartin Matuska } 1220*7a7741afSMartin Matuska 1221*7a7741afSMartin Matuska void 1222*7a7741afSMartin Matuska zfs_zinactive(znode_t *zp) 1223*7a7741afSMartin Matuska { 1224*7a7741afSMartin Matuska zfsvfs_t *zfsvfs = zp->z_zfsvfs; 1225*7a7741afSMartin Matuska uint64_t z_id = zp->z_id; 1226*7a7741afSMartin Matuska 1227*7a7741afSMartin Matuska ASSERT3P(zp->z_sa_hdl, !=, NULL); 1228*7a7741afSMartin Matuska 1229*7a7741afSMartin Matuska /* 1230*7a7741afSMartin Matuska * Don't allow a zfs_zget() while were trying to release this znode 1231*7a7741afSMartin Matuska */ 1232*7a7741afSMartin Matuska ZFS_OBJ_HOLD_ENTER(zfsvfs, z_id); 1233*7a7741afSMartin Matuska 1234*7a7741afSMartin Matuska /* 1235*7a7741afSMartin Matuska * If this was the last reference to a file with no links, remove 1236*7a7741afSMartin Matuska * the file from the file system unless the file system is mounted 1237*7a7741afSMartin Matuska * read-only. That can happen, for example, if the file system was 1238*7a7741afSMartin Matuska * originally read-write, the file was opened, then unlinked and 1239*7a7741afSMartin Matuska * the file system was made read-only before the file was finally 1240*7a7741afSMartin Matuska * closed. The file will remain in the unlinked set. 1241*7a7741afSMartin Matuska */ 1242*7a7741afSMartin Matuska if (zp->z_unlinked) { 1243*7a7741afSMartin Matuska ASSERT(!zfsvfs->z_issnap); 1244*7a7741afSMartin Matuska if ((zfsvfs->z_vfs->vfs_flag & VFS_RDONLY) == 0) { 1245*7a7741afSMartin Matuska ZFS_OBJ_HOLD_EXIT(zfsvfs, z_id); 1246*7a7741afSMartin Matuska zfs_rmnode(zp); 1247*7a7741afSMartin Matuska return; 1248*7a7741afSMartin Matuska } 1249*7a7741afSMartin Matuska } 1250*7a7741afSMartin Matuska 1251*7a7741afSMartin Matuska zfs_znode_dmu_fini(zp); 1252*7a7741afSMartin Matuska ZFS_OBJ_HOLD_EXIT(zfsvfs, z_id); 1253*7a7741afSMartin Matuska zfs_znode_free(zp); 1254*7a7741afSMartin Matuska } 1255*7a7741afSMartin Matuska 1256*7a7741afSMartin Matuska void 1257*7a7741afSMartin Matuska zfs_znode_free(znode_t *zp) 1258*7a7741afSMartin Matuska { 1259*7a7741afSMartin Matuska zfsvfs_t *zfsvfs = zp->z_zfsvfs; 1260*7a7741afSMartin Matuska char *symlink; 1261*7a7741afSMartin Matuska 1262*7a7741afSMartin Matuska ASSERT3P(zp->z_sa_hdl, ==, NULL); 1263*7a7741afSMartin Matuska zp->z_vnode = NULL; 1264*7a7741afSMartin Matuska mutex_enter(&zfsvfs->z_znodes_lock); 1265*7a7741afSMartin Matuska POINTER_INVALIDATE(&zp->z_zfsvfs); 1266*7a7741afSMartin Matuska list_remove(&zfsvfs->z_all_znodes, zp); 1267*7a7741afSMartin Matuska mutex_exit(&zfsvfs->z_znodes_lock); 1268*7a7741afSMartin Matuska 1269*7a7741afSMartin Matuska symlink = atomic_load_ptr(&zp->z_cached_symlink); 1270*7a7741afSMartin Matuska if (symlink != NULL) { 1271*7a7741afSMartin Matuska atomic_store_rel_ptr((uintptr_t *)&zp->z_cached_symlink, 1272*7a7741afSMartin Matuska (uintptr_t)NULL); 1273*7a7741afSMartin Matuska cache_symlink_free(symlink, strlen(symlink) + 1); 1274*7a7741afSMartin Matuska } 1275*7a7741afSMartin Matuska 1276*7a7741afSMartin Matuska if (zp->z_acl_cached) { 1277*7a7741afSMartin Matuska zfs_acl_free(zp->z_acl_cached); 1278*7a7741afSMartin Matuska zp->z_acl_cached = NULL; 1279*7a7741afSMartin Matuska } 1280*7a7741afSMartin Matuska 1281*7a7741afSMartin Matuska zfs_znode_free_kmem(zp); 1282*7a7741afSMartin Matuska } 1283*7a7741afSMartin Matuska 1284*7a7741afSMartin Matuska void 1285*7a7741afSMartin Matuska zfs_tstamp_update_setup_ext(znode_t *zp, uint_t flag, uint64_t mtime[2], 1286*7a7741afSMartin Matuska uint64_t ctime[2], boolean_t have_tx) 1287*7a7741afSMartin Matuska { 1288*7a7741afSMartin Matuska timestruc_t now; 1289*7a7741afSMartin Matuska 1290*7a7741afSMartin Matuska vfs_timestamp(&now); 1291*7a7741afSMartin Matuska 1292*7a7741afSMartin Matuska if (have_tx) { /* will sa_bulk_update happen really soon? */ 1293*7a7741afSMartin Matuska zp->z_atime_dirty = 0; 1294*7a7741afSMartin Matuska zp->z_seq++; 1295*7a7741afSMartin Matuska } else { 1296*7a7741afSMartin Matuska zp->z_atime_dirty = 1; 1297*7a7741afSMartin Matuska } 1298*7a7741afSMartin Matuska 1299*7a7741afSMartin Matuska if (flag & AT_ATIME) { 1300*7a7741afSMartin Matuska ZFS_TIME_ENCODE(&now, zp->z_atime); 1301*7a7741afSMartin Matuska } 1302*7a7741afSMartin Matuska 1303*7a7741afSMartin Matuska if (flag & AT_MTIME) { 1304*7a7741afSMartin Matuska ZFS_TIME_ENCODE(&now, mtime); 1305*7a7741afSMartin Matuska if (zp->z_zfsvfs->z_use_fuids) { 1306*7a7741afSMartin Matuska zp->z_pflags |= (ZFS_ARCHIVE | 1307*7a7741afSMartin Matuska ZFS_AV_MODIFIED); 1308*7a7741afSMartin Matuska } 1309*7a7741afSMartin Matuska } 1310*7a7741afSMartin Matuska 1311*7a7741afSMartin Matuska if (flag & AT_CTIME) { 1312*7a7741afSMartin Matuska ZFS_TIME_ENCODE(&now, ctime); 1313*7a7741afSMartin Matuska if (zp->z_zfsvfs->z_use_fuids) 1314*7a7741afSMartin Matuska zp->z_pflags |= ZFS_ARCHIVE; 1315*7a7741afSMartin Matuska } 1316*7a7741afSMartin Matuska } 1317*7a7741afSMartin Matuska 1318*7a7741afSMartin Matuska 1319*7a7741afSMartin Matuska void 1320*7a7741afSMartin Matuska zfs_tstamp_update_setup(znode_t *zp, uint_t flag, uint64_t mtime[2], 1321*7a7741afSMartin Matuska uint64_t ctime[2]) 1322*7a7741afSMartin Matuska { 1323*7a7741afSMartin Matuska zfs_tstamp_update_setup_ext(zp, flag, mtime, ctime, B_TRUE); 1324*7a7741afSMartin Matuska } 1325*7a7741afSMartin Matuska /* 1326*7a7741afSMartin Matuska * Grow the block size for a file. 1327*7a7741afSMartin Matuska * 1328*7a7741afSMartin Matuska * IN: zp - znode of file to free data in. 1329*7a7741afSMartin Matuska * size - requested block size 1330*7a7741afSMartin Matuska * tx - open transaction. 1331*7a7741afSMartin Matuska * 1332*7a7741afSMartin Matuska * NOTE: this function assumes that the znode is write locked. 1333*7a7741afSMartin Matuska */ 1334*7a7741afSMartin Matuska void 1335*7a7741afSMartin Matuska zfs_grow_blocksize(znode_t *zp, uint64_t size, dmu_tx_t *tx) 1336*7a7741afSMartin Matuska { 1337*7a7741afSMartin Matuska int error; 1338*7a7741afSMartin Matuska u_longlong_t dummy; 1339*7a7741afSMartin Matuska 1340*7a7741afSMartin Matuska if (size <= zp->z_blksz) 1341*7a7741afSMartin Matuska return; 1342*7a7741afSMartin Matuska /* 1343*7a7741afSMartin Matuska * If the file size is already greater than the current blocksize, 1344*7a7741afSMartin Matuska * we will not grow. If there is more than one block in a file, 1345*7a7741afSMartin Matuska * the blocksize cannot change. 1346*7a7741afSMartin Matuska */ 1347*7a7741afSMartin Matuska if (zp->z_blksz && zp->z_size > zp->z_blksz) 1348*7a7741afSMartin Matuska return; 1349*7a7741afSMartin Matuska 1350*7a7741afSMartin Matuska error = dmu_object_set_blocksize(zp->z_zfsvfs->z_os, zp->z_id, 1351*7a7741afSMartin Matuska size, 0, tx); 1352*7a7741afSMartin Matuska 1353*7a7741afSMartin Matuska if (error == ENOTSUP) 1354*7a7741afSMartin Matuska return; 1355*7a7741afSMartin Matuska ASSERT0(error); 1356*7a7741afSMartin Matuska 1357*7a7741afSMartin Matuska /* What blocksize did we actually get? */ 1358*7a7741afSMartin Matuska dmu_object_size_from_db(sa_get_db(zp->z_sa_hdl), &zp->z_blksz, &dummy); 1359*7a7741afSMartin Matuska } 1360*7a7741afSMartin Matuska 1361*7a7741afSMartin Matuska /* 1362*7a7741afSMartin Matuska * Increase the file length 1363*7a7741afSMartin Matuska * 1364*7a7741afSMartin Matuska * IN: zp - znode of file to free data in. 1365*7a7741afSMartin Matuska * end - new end-of-file 1366*7a7741afSMartin Matuska * 1367*7a7741afSMartin Matuska * RETURN: 0 on success, error code on failure 1368*7a7741afSMartin Matuska */ 1369*7a7741afSMartin Matuska static int 1370*7a7741afSMartin Matuska zfs_extend(znode_t *zp, uint64_t end) 1371*7a7741afSMartin Matuska { 1372*7a7741afSMartin Matuska zfsvfs_t *zfsvfs = zp->z_zfsvfs; 1373*7a7741afSMartin Matuska dmu_tx_t *tx; 1374*7a7741afSMartin Matuska zfs_locked_range_t *lr; 1375*7a7741afSMartin Matuska uint64_t newblksz; 1376*7a7741afSMartin Matuska int error; 1377*7a7741afSMartin Matuska 1378*7a7741afSMartin Matuska /* 1379*7a7741afSMartin Matuska * We will change zp_size, lock the whole file. 1380*7a7741afSMartin Matuska */ 1381*7a7741afSMartin Matuska lr = zfs_rangelock_enter(&zp->z_rangelock, 0, UINT64_MAX, RL_WRITER); 1382*7a7741afSMartin Matuska 1383*7a7741afSMartin Matuska /* 1384*7a7741afSMartin Matuska * Nothing to do if file already at desired length. 1385*7a7741afSMartin Matuska */ 1386*7a7741afSMartin Matuska if (end <= zp->z_size) { 1387*7a7741afSMartin Matuska zfs_rangelock_exit(lr); 1388*7a7741afSMartin Matuska return (0); 1389*7a7741afSMartin Matuska } 1390*7a7741afSMartin Matuska tx = dmu_tx_create(zfsvfs->z_os); 1391*7a7741afSMartin Matuska dmu_tx_hold_sa(tx, zp->z_sa_hdl, B_FALSE); 1392*7a7741afSMartin Matuska zfs_sa_upgrade_txholds(tx, zp); 1393*7a7741afSMartin Matuska if (end > zp->z_blksz && 1394*7a7741afSMartin Matuska (!ISP2(zp->z_blksz) || zp->z_blksz < zfsvfs->z_max_blksz)) { 1395*7a7741afSMartin Matuska /* 1396*7a7741afSMartin Matuska * We are growing the file past the current block size. 1397*7a7741afSMartin Matuska */ 1398*7a7741afSMartin Matuska if (zp->z_blksz > zp->z_zfsvfs->z_max_blksz) { 1399*7a7741afSMartin Matuska /* 1400*7a7741afSMartin Matuska * File's blocksize is already larger than the 1401*7a7741afSMartin Matuska * "recordsize" property. Only let it grow to 1402*7a7741afSMartin Matuska * the next power of 2. 1403*7a7741afSMartin Matuska */ 1404*7a7741afSMartin Matuska ASSERT(!ISP2(zp->z_blksz)); 1405*7a7741afSMartin Matuska newblksz = MIN(end, 1 << highbit64(zp->z_blksz)); 1406*7a7741afSMartin Matuska } else { 1407*7a7741afSMartin Matuska newblksz = MIN(end, zp->z_zfsvfs->z_max_blksz); 1408*7a7741afSMartin Matuska } 1409*7a7741afSMartin Matuska dmu_tx_hold_write(tx, zp->z_id, 0, newblksz); 1410*7a7741afSMartin Matuska } else { 1411*7a7741afSMartin Matuska newblksz = 0; 1412*7a7741afSMartin Matuska } 1413*7a7741afSMartin Matuska 1414*7a7741afSMartin Matuska error = dmu_tx_assign(tx, TXG_WAIT); 1415*7a7741afSMartin Matuska if (error) { 1416*7a7741afSMartin Matuska dmu_tx_abort(tx); 1417*7a7741afSMartin Matuska zfs_rangelock_exit(lr); 1418*7a7741afSMartin Matuska return (error); 1419*7a7741afSMartin Matuska } 1420*7a7741afSMartin Matuska 1421*7a7741afSMartin Matuska if (newblksz) 1422*7a7741afSMartin Matuska zfs_grow_blocksize(zp, newblksz, tx); 1423*7a7741afSMartin Matuska 1424*7a7741afSMartin Matuska zp->z_size = end; 1425*7a7741afSMartin Matuska 1426*7a7741afSMartin Matuska VERIFY0(sa_update(zp->z_sa_hdl, SA_ZPL_SIZE(zp->z_zfsvfs), 1427*7a7741afSMartin Matuska &zp->z_size, sizeof (zp->z_size), tx)); 1428*7a7741afSMartin Matuska 1429*7a7741afSMartin Matuska vnode_pager_setsize(ZTOV(zp), end); 1430*7a7741afSMartin Matuska 1431*7a7741afSMartin Matuska zfs_rangelock_exit(lr); 1432*7a7741afSMartin Matuska 1433*7a7741afSMartin Matuska dmu_tx_commit(tx); 1434*7a7741afSMartin Matuska 1435*7a7741afSMartin Matuska return (0); 1436*7a7741afSMartin Matuska } 1437*7a7741afSMartin Matuska 1438*7a7741afSMartin Matuska /* 1439*7a7741afSMartin Matuska * Free space in a file. 1440*7a7741afSMartin Matuska * 1441*7a7741afSMartin Matuska * IN: zp - znode of file to free data in. 1442*7a7741afSMartin Matuska * off - start of section to free. 1443*7a7741afSMartin Matuska * len - length of section to free. 1444*7a7741afSMartin Matuska * 1445*7a7741afSMartin Matuska * RETURN: 0 on success, error code on failure 1446*7a7741afSMartin Matuska */ 1447*7a7741afSMartin Matuska static int 1448*7a7741afSMartin Matuska zfs_free_range(znode_t *zp, uint64_t off, uint64_t len) 1449*7a7741afSMartin Matuska { 1450*7a7741afSMartin Matuska zfsvfs_t *zfsvfs = zp->z_zfsvfs; 1451*7a7741afSMartin Matuska zfs_locked_range_t *lr; 1452*7a7741afSMartin Matuska int error; 1453*7a7741afSMartin Matuska 1454*7a7741afSMartin Matuska /* 1455*7a7741afSMartin Matuska * Lock the range being freed. 1456*7a7741afSMartin Matuska */ 1457*7a7741afSMartin Matuska lr = zfs_rangelock_enter(&zp->z_rangelock, off, len, RL_WRITER); 1458*7a7741afSMartin Matuska 1459*7a7741afSMartin Matuska /* 1460*7a7741afSMartin Matuska * Nothing to do if file already at desired length. 1461*7a7741afSMartin Matuska */ 1462*7a7741afSMartin Matuska if (off >= zp->z_size) { 1463*7a7741afSMartin Matuska zfs_rangelock_exit(lr); 1464*7a7741afSMartin Matuska return (0); 1465*7a7741afSMartin Matuska } 1466*7a7741afSMartin Matuska 1467*7a7741afSMartin Matuska if (off + len > zp->z_size) 1468*7a7741afSMartin Matuska len = zp->z_size - off; 1469*7a7741afSMartin Matuska 1470*7a7741afSMartin Matuska error = dmu_free_long_range(zfsvfs->z_os, zp->z_id, off, len); 1471*7a7741afSMartin Matuska 1472*7a7741afSMartin Matuska if (error == 0) { 1473*7a7741afSMartin Matuska #if __FreeBSD_version >= 1400032 1474*7a7741afSMartin Matuska vnode_pager_purge_range(ZTOV(zp), off, off + len); 1475*7a7741afSMartin Matuska #else 1476*7a7741afSMartin Matuska /* 1477*7a7741afSMartin Matuska * Before __FreeBSD_version 1400032 we cannot free block in the 1478*7a7741afSMartin Matuska * middle of a file, but only at the end of a file, so this code 1479*7a7741afSMartin Matuska * path should never happen. 1480*7a7741afSMartin Matuska */ 1481*7a7741afSMartin Matuska vnode_pager_setsize(ZTOV(zp), off); 1482*7a7741afSMartin Matuska #endif 1483*7a7741afSMartin Matuska } 1484*7a7741afSMartin Matuska 1485*7a7741afSMartin Matuska zfs_rangelock_exit(lr); 1486*7a7741afSMartin Matuska 1487*7a7741afSMartin Matuska return (error); 1488*7a7741afSMartin Matuska } 1489*7a7741afSMartin Matuska 1490*7a7741afSMartin Matuska /* 1491*7a7741afSMartin Matuska * Truncate a file 1492*7a7741afSMartin Matuska * 1493*7a7741afSMartin Matuska * IN: zp - znode of file to free data in. 1494*7a7741afSMartin Matuska * end - new end-of-file. 1495*7a7741afSMartin Matuska * 1496*7a7741afSMartin Matuska * RETURN: 0 on success, error code on failure 1497*7a7741afSMartin Matuska */ 1498*7a7741afSMartin Matuska static int 1499*7a7741afSMartin Matuska zfs_trunc(znode_t *zp, uint64_t end) 1500*7a7741afSMartin Matuska { 1501*7a7741afSMartin Matuska zfsvfs_t *zfsvfs = zp->z_zfsvfs; 1502*7a7741afSMartin Matuska vnode_t *vp = ZTOV(zp); 1503*7a7741afSMartin Matuska dmu_tx_t *tx; 1504*7a7741afSMartin Matuska zfs_locked_range_t *lr; 1505*7a7741afSMartin Matuska int error; 1506*7a7741afSMartin Matuska sa_bulk_attr_t bulk[2]; 1507*7a7741afSMartin Matuska int count = 0; 1508*7a7741afSMartin Matuska 1509*7a7741afSMartin Matuska /* 1510*7a7741afSMartin Matuska * We will change zp_size, lock the whole file. 1511*7a7741afSMartin Matuska */ 1512*7a7741afSMartin Matuska lr = zfs_rangelock_enter(&zp->z_rangelock, 0, UINT64_MAX, RL_WRITER); 1513*7a7741afSMartin Matuska 1514*7a7741afSMartin Matuska /* 1515*7a7741afSMartin Matuska * Nothing to do if file already at desired length. 1516*7a7741afSMartin Matuska */ 1517*7a7741afSMartin Matuska if (end >= zp->z_size) { 1518*7a7741afSMartin Matuska zfs_rangelock_exit(lr); 1519*7a7741afSMartin Matuska return (0); 1520*7a7741afSMartin Matuska } 1521*7a7741afSMartin Matuska 1522*7a7741afSMartin Matuska error = dmu_free_long_range(zfsvfs->z_os, zp->z_id, end, 1523*7a7741afSMartin Matuska DMU_OBJECT_END); 1524*7a7741afSMartin Matuska if (error) { 1525*7a7741afSMartin Matuska zfs_rangelock_exit(lr); 1526*7a7741afSMartin Matuska return (error); 1527*7a7741afSMartin Matuska } 1528*7a7741afSMartin Matuska tx = dmu_tx_create(zfsvfs->z_os); 1529*7a7741afSMartin Matuska dmu_tx_hold_sa(tx, zp->z_sa_hdl, B_FALSE); 1530*7a7741afSMartin Matuska zfs_sa_upgrade_txholds(tx, zp); 1531*7a7741afSMartin Matuska dmu_tx_mark_netfree(tx); 1532*7a7741afSMartin Matuska error = dmu_tx_assign(tx, TXG_WAIT); 1533*7a7741afSMartin Matuska if (error) { 1534*7a7741afSMartin Matuska dmu_tx_abort(tx); 1535*7a7741afSMartin Matuska zfs_rangelock_exit(lr); 1536*7a7741afSMartin Matuska return (error); 1537*7a7741afSMartin Matuska } 1538*7a7741afSMartin Matuska 1539*7a7741afSMartin Matuska zp->z_size = end; 1540*7a7741afSMartin Matuska SA_ADD_BULK_ATTR(bulk, count, SA_ZPL_SIZE(zfsvfs), 1541*7a7741afSMartin Matuska NULL, &zp->z_size, sizeof (zp->z_size)); 1542*7a7741afSMartin Matuska 1543*7a7741afSMartin Matuska if (end == 0) { 1544*7a7741afSMartin Matuska zp->z_pflags &= ~ZFS_SPARSE; 1545*7a7741afSMartin Matuska SA_ADD_BULK_ATTR(bulk, count, SA_ZPL_FLAGS(zfsvfs), 1546*7a7741afSMartin Matuska NULL, &zp->z_pflags, 8); 1547*7a7741afSMartin Matuska } 1548*7a7741afSMartin Matuska VERIFY0(sa_bulk_update(zp->z_sa_hdl, bulk, count, tx)); 1549*7a7741afSMartin Matuska 1550*7a7741afSMartin Matuska dmu_tx_commit(tx); 1551*7a7741afSMartin Matuska 1552*7a7741afSMartin Matuska /* 1553*7a7741afSMartin Matuska * Clear any mapped pages in the truncated region. This has to 1554*7a7741afSMartin Matuska * happen outside of the transaction to avoid the possibility of 1555*7a7741afSMartin Matuska * a deadlock with someone trying to push a page that we are 1556*7a7741afSMartin Matuska * about to invalidate. 1557*7a7741afSMartin Matuska */ 1558*7a7741afSMartin Matuska vnode_pager_setsize(vp, end); 1559*7a7741afSMartin Matuska 1560*7a7741afSMartin Matuska zfs_rangelock_exit(lr); 1561*7a7741afSMartin Matuska 1562*7a7741afSMartin Matuska return (0); 1563*7a7741afSMartin Matuska } 1564*7a7741afSMartin Matuska 1565*7a7741afSMartin Matuska /* 1566*7a7741afSMartin Matuska * Free space in a file 1567*7a7741afSMartin Matuska * 1568*7a7741afSMartin Matuska * IN: zp - znode of file to free data in. 1569*7a7741afSMartin Matuska * off - start of range 1570*7a7741afSMartin Matuska * len - end of range (0 => EOF) 1571*7a7741afSMartin Matuska * flag - current file open mode flags. 1572*7a7741afSMartin Matuska * log - TRUE if this action should be logged 1573*7a7741afSMartin Matuska * 1574*7a7741afSMartin Matuska * RETURN: 0 on success, error code on failure 1575*7a7741afSMartin Matuska */ 1576*7a7741afSMartin Matuska int 1577*7a7741afSMartin Matuska zfs_freesp(znode_t *zp, uint64_t off, uint64_t len, int flag, boolean_t log) 1578*7a7741afSMartin Matuska { 1579*7a7741afSMartin Matuska dmu_tx_t *tx; 1580*7a7741afSMartin Matuska zfsvfs_t *zfsvfs = zp->z_zfsvfs; 1581*7a7741afSMartin Matuska zilog_t *zilog = zfsvfs->z_log; 1582*7a7741afSMartin Matuska uint64_t mode; 1583*7a7741afSMartin Matuska uint64_t mtime[2], ctime[2]; 1584*7a7741afSMartin Matuska sa_bulk_attr_t bulk[3]; 1585*7a7741afSMartin Matuska int count = 0; 1586*7a7741afSMartin Matuska int error; 1587*7a7741afSMartin Matuska 1588*7a7741afSMartin Matuska if ((error = sa_lookup(zp->z_sa_hdl, SA_ZPL_MODE(zfsvfs), &mode, 1589*7a7741afSMartin Matuska sizeof (mode))) != 0) 1590*7a7741afSMartin Matuska return (error); 1591*7a7741afSMartin Matuska 1592*7a7741afSMartin Matuska if (off > zp->z_size) { 1593*7a7741afSMartin Matuska error = zfs_extend(zp, off+len); 1594*7a7741afSMartin Matuska if (error == 0 && log) 1595*7a7741afSMartin Matuska goto log; 1596*7a7741afSMartin Matuska else 1597*7a7741afSMartin Matuska return (error); 1598*7a7741afSMartin Matuska } 1599*7a7741afSMartin Matuska 1600*7a7741afSMartin Matuska if (len == 0) { 1601*7a7741afSMartin Matuska error = zfs_trunc(zp, off); 1602*7a7741afSMartin Matuska } else { 1603*7a7741afSMartin Matuska if ((error = zfs_free_range(zp, off, len)) == 0 && 1604*7a7741afSMartin Matuska off + len > zp->z_size) 1605*7a7741afSMartin Matuska error = zfs_extend(zp, off+len); 1606*7a7741afSMartin Matuska } 1607*7a7741afSMartin Matuska if (error || !log) 1608*7a7741afSMartin Matuska return (error); 1609*7a7741afSMartin Matuska log: 1610*7a7741afSMartin Matuska tx = dmu_tx_create(zfsvfs->z_os); 1611*7a7741afSMartin Matuska dmu_tx_hold_sa(tx, zp->z_sa_hdl, B_FALSE); 1612*7a7741afSMartin Matuska zfs_sa_upgrade_txholds(tx, zp); 1613*7a7741afSMartin Matuska error = dmu_tx_assign(tx, TXG_WAIT); 1614*7a7741afSMartin Matuska if (error) { 1615*7a7741afSMartin Matuska dmu_tx_abort(tx); 1616*7a7741afSMartin Matuska return (error); 1617*7a7741afSMartin Matuska } 1618*7a7741afSMartin Matuska 1619*7a7741afSMartin Matuska SA_ADD_BULK_ATTR(bulk, count, SA_ZPL_MTIME(zfsvfs), NULL, mtime, 16); 1620*7a7741afSMartin Matuska SA_ADD_BULK_ATTR(bulk, count, SA_ZPL_CTIME(zfsvfs), NULL, ctime, 16); 1621*7a7741afSMartin Matuska SA_ADD_BULK_ATTR(bulk, count, SA_ZPL_FLAGS(zfsvfs), 1622*7a7741afSMartin Matuska NULL, &zp->z_pflags, 8); 1623*7a7741afSMartin Matuska zfs_tstamp_update_setup(zp, CONTENT_MODIFIED, mtime, ctime); 1624*7a7741afSMartin Matuska error = sa_bulk_update(zp->z_sa_hdl, bulk, count, tx); 1625*7a7741afSMartin Matuska ASSERT0(error); 1626*7a7741afSMartin Matuska 1627*7a7741afSMartin Matuska zfs_log_truncate(zilog, tx, TX_TRUNCATE, zp, off, len); 1628*7a7741afSMartin Matuska 1629*7a7741afSMartin Matuska dmu_tx_commit(tx); 1630*7a7741afSMartin Matuska return (0); 1631*7a7741afSMartin Matuska } 1632*7a7741afSMartin Matuska 1633*7a7741afSMartin Matuska void 1634*7a7741afSMartin Matuska zfs_create_fs(objset_t *os, cred_t *cr, nvlist_t *zplprops, dmu_tx_t *tx) 1635*7a7741afSMartin Matuska { 1636*7a7741afSMartin Matuska uint64_t moid, obj, sa_obj, version; 1637*7a7741afSMartin Matuska uint64_t sense = ZFS_CASE_SENSITIVE; 1638*7a7741afSMartin Matuska uint64_t norm = 0; 1639*7a7741afSMartin Matuska nvpair_t *elem; 1640*7a7741afSMartin Matuska int error; 1641*7a7741afSMartin Matuska int i; 1642*7a7741afSMartin Matuska znode_t *rootzp = NULL; 1643*7a7741afSMartin Matuska zfsvfs_t *zfsvfs; 1644*7a7741afSMartin Matuska vattr_t vattr; 1645*7a7741afSMartin Matuska znode_t *zp; 1646*7a7741afSMartin Matuska zfs_acl_ids_t acl_ids; 1647*7a7741afSMartin Matuska 1648*7a7741afSMartin Matuska /* 1649*7a7741afSMartin Matuska * First attempt to create master node. 1650*7a7741afSMartin Matuska */ 1651*7a7741afSMartin Matuska /* 1652*7a7741afSMartin Matuska * In an empty objset, there are no blocks to read and thus 1653*7a7741afSMartin Matuska * there can be no i/o errors (which we assert below). 1654*7a7741afSMartin Matuska */ 1655*7a7741afSMartin Matuska moid = MASTER_NODE_OBJ; 1656*7a7741afSMartin Matuska error = zap_create_claim(os, moid, DMU_OT_MASTER_NODE, 1657*7a7741afSMartin Matuska DMU_OT_NONE, 0, tx); 1658*7a7741afSMartin Matuska ASSERT0(error); 1659*7a7741afSMartin Matuska 1660*7a7741afSMartin Matuska /* 1661*7a7741afSMartin Matuska * Set starting attributes. 1662*7a7741afSMartin Matuska */ 1663*7a7741afSMartin Matuska version = zfs_zpl_version_map(spa_version(dmu_objset_spa(os))); 1664*7a7741afSMartin Matuska elem = NULL; 1665*7a7741afSMartin Matuska while ((elem = nvlist_next_nvpair(zplprops, elem)) != NULL) { 1666*7a7741afSMartin Matuska /* For the moment we expect all zpl props to be uint64_ts */ 1667*7a7741afSMartin Matuska uint64_t val; 1668*7a7741afSMartin Matuska const char *name; 1669*7a7741afSMartin Matuska 1670*7a7741afSMartin Matuska ASSERT3S(nvpair_type(elem), ==, DATA_TYPE_UINT64); 1671*7a7741afSMartin Matuska val = fnvpair_value_uint64(elem); 1672*7a7741afSMartin Matuska name = nvpair_name(elem); 1673*7a7741afSMartin Matuska if (strcmp(name, zfs_prop_to_name(ZFS_PROP_VERSION)) == 0) { 1674*7a7741afSMartin Matuska if (val < version) 1675*7a7741afSMartin Matuska version = val; 1676*7a7741afSMartin Matuska } else { 1677*7a7741afSMartin Matuska error = zap_update(os, moid, name, 8, 1, &val, tx); 1678*7a7741afSMartin Matuska } 1679*7a7741afSMartin Matuska ASSERT0(error); 1680*7a7741afSMartin Matuska if (strcmp(name, zfs_prop_to_name(ZFS_PROP_NORMALIZE)) == 0) 1681*7a7741afSMartin Matuska norm = val; 1682*7a7741afSMartin Matuska else if (strcmp(name, zfs_prop_to_name(ZFS_PROP_CASE)) == 0) 1683*7a7741afSMartin Matuska sense = val; 1684*7a7741afSMartin Matuska } 1685*7a7741afSMartin Matuska ASSERT3U(version, !=, 0); 1686*7a7741afSMartin Matuska error = zap_update(os, moid, ZPL_VERSION_STR, 8, 1, &version, tx); 1687*7a7741afSMartin Matuska ASSERT0(error); 1688*7a7741afSMartin Matuska 1689*7a7741afSMartin Matuska /* 1690*7a7741afSMartin Matuska * Create zap object used for SA attribute registration 1691*7a7741afSMartin Matuska */ 1692*7a7741afSMartin Matuska 1693*7a7741afSMartin Matuska if (version >= ZPL_VERSION_SA) { 1694*7a7741afSMartin Matuska sa_obj = zap_create(os, DMU_OT_SA_MASTER_NODE, 1695*7a7741afSMartin Matuska DMU_OT_NONE, 0, tx); 1696*7a7741afSMartin Matuska error = zap_add(os, moid, ZFS_SA_ATTRS, 8, 1, &sa_obj, tx); 1697*7a7741afSMartin Matuska ASSERT0(error); 1698*7a7741afSMartin Matuska } else { 1699*7a7741afSMartin Matuska sa_obj = 0; 1700*7a7741afSMartin Matuska } 1701*7a7741afSMartin Matuska /* 1702*7a7741afSMartin Matuska * Create a delete queue. 1703*7a7741afSMartin Matuska */ 1704*7a7741afSMartin Matuska obj = zap_create(os, DMU_OT_UNLINKED_SET, DMU_OT_NONE, 0, tx); 1705*7a7741afSMartin Matuska 1706*7a7741afSMartin Matuska error = zap_add(os, moid, ZFS_UNLINKED_SET, 8, 1, &obj, tx); 1707*7a7741afSMartin Matuska ASSERT0(error); 1708*7a7741afSMartin Matuska 1709*7a7741afSMartin Matuska /* 1710*7a7741afSMartin Matuska * Create root znode. Create minimal znode/vnode/zfsvfs 1711*7a7741afSMartin Matuska * to allow zfs_mknode to work. 1712*7a7741afSMartin Matuska */ 1713*7a7741afSMartin Matuska VATTR_NULL(&vattr); 1714*7a7741afSMartin Matuska vattr.va_mask = AT_MODE|AT_UID|AT_GID; 1715*7a7741afSMartin Matuska vattr.va_type = VDIR; 1716*7a7741afSMartin Matuska vattr.va_mode = S_IFDIR|0755; 1717*7a7741afSMartin Matuska vattr.va_uid = crgetuid(cr); 1718*7a7741afSMartin Matuska vattr.va_gid = crgetgid(cr); 1719*7a7741afSMartin Matuska 1720*7a7741afSMartin Matuska zfsvfs = kmem_zalloc(sizeof (zfsvfs_t), KM_SLEEP); 1721*7a7741afSMartin Matuska 1722*7a7741afSMartin Matuska rootzp = zfs_znode_alloc_kmem(KM_SLEEP); 1723*7a7741afSMartin Matuska ASSERT(!POINTER_IS_VALID(rootzp->z_zfsvfs)); 1724*7a7741afSMartin Matuska rootzp->z_unlinked = 0; 1725*7a7741afSMartin Matuska rootzp->z_atime_dirty = 0; 1726*7a7741afSMartin Matuska rootzp->z_is_sa = USE_SA(version, os); 1727*7a7741afSMartin Matuska 1728*7a7741afSMartin Matuska zfsvfs->z_os = os; 1729*7a7741afSMartin Matuska zfsvfs->z_parent = zfsvfs; 1730*7a7741afSMartin Matuska zfsvfs->z_version = version; 1731*7a7741afSMartin Matuska zfsvfs->z_use_fuids = USE_FUIDS(version, os); 1732*7a7741afSMartin Matuska zfsvfs->z_use_sa = USE_SA(version, os); 1733*7a7741afSMartin Matuska zfsvfs->z_norm = norm; 1734*7a7741afSMartin Matuska 1735*7a7741afSMartin Matuska error = sa_setup(os, sa_obj, zfs_attr_table, ZPL_END, 1736*7a7741afSMartin Matuska &zfsvfs->z_attr_table); 1737*7a7741afSMartin Matuska 1738*7a7741afSMartin Matuska ASSERT0(error); 1739*7a7741afSMartin Matuska 1740*7a7741afSMartin Matuska /* 1741*7a7741afSMartin Matuska * Fold case on file systems that are always or sometimes case 1742*7a7741afSMartin Matuska * insensitive. 1743*7a7741afSMartin Matuska */ 1744*7a7741afSMartin Matuska if (sense == ZFS_CASE_INSENSITIVE || sense == ZFS_CASE_MIXED) 1745*7a7741afSMartin Matuska zfsvfs->z_norm |= U8_TEXTPREP_TOUPPER; 1746*7a7741afSMartin Matuska 1747*7a7741afSMartin Matuska mutex_init(&zfsvfs->z_znodes_lock, NULL, MUTEX_DEFAULT, NULL); 1748*7a7741afSMartin Matuska list_create(&zfsvfs->z_all_znodes, sizeof (znode_t), 1749*7a7741afSMartin Matuska offsetof(znode_t, z_link_node)); 1750*7a7741afSMartin Matuska 1751*7a7741afSMartin Matuska for (i = 0; i != ZFS_OBJ_MTX_SZ; i++) 1752*7a7741afSMartin Matuska mutex_init(&zfsvfs->z_hold_mtx[i], NULL, MUTEX_DEFAULT, NULL); 1753*7a7741afSMartin Matuska 1754*7a7741afSMartin Matuska rootzp->z_zfsvfs = zfsvfs; 1755*7a7741afSMartin Matuska VERIFY0(zfs_acl_ids_create(rootzp, IS_ROOT_NODE, &vattr, 1756*7a7741afSMartin Matuska cr, NULL, &acl_ids, NULL)); 1757*7a7741afSMartin Matuska zfs_mknode(rootzp, &vattr, tx, cr, IS_ROOT_NODE, &zp, &acl_ids); 1758*7a7741afSMartin Matuska ASSERT3P(zp, ==, rootzp); 1759*7a7741afSMartin Matuska error = zap_add(os, moid, ZFS_ROOT_OBJ, 8, 1, &rootzp->z_id, tx); 1760*7a7741afSMartin Matuska ASSERT0(error); 1761*7a7741afSMartin Matuska zfs_acl_ids_free(&acl_ids); 1762*7a7741afSMartin Matuska POINTER_INVALIDATE(&rootzp->z_zfsvfs); 1763*7a7741afSMartin Matuska 1764*7a7741afSMartin Matuska sa_handle_destroy(rootzp->z_sa_hdl); 1765*7a7741afSMartin Matuska zfs_znode_free_kmem(rootzp); 1766*7a7741afSMartin Matuska 1767*7a7741afSMartin Matuska /* 1768*7a7741afSMartin Matuska * Create shares directory 1769*7a7741afSMartin Matuska */ 1770*7a7741afSMartin Matuska 1771*7a7741afSMartin Matuska error = zfs_create_share_dir(zfsvfs, tx); 1772*7a7741afSMartin Matuska 1773*7a7741afSMartin Matuska ASSERT0(error); 1774*7a7741afSMartin Matuska 1775*7a7741afSMartin Matuska for (i = 0; i != ZFS_OBJ_MTX_SZ; i++) 1776*7a7741afSMartin Matuska mutex_destroy(&zfsvfs->z_hold_mtx[i]); 1777*7a7741afSMartin Matuska kmem_free(zfsvfs, sizeof (zfsvfs_t)); 1778*7a7741afSMartin Matuska } 1779*7a7741afSMartin Matuska 1780*7a7741afSMartin Matuska void 1781*7a7741afSMartin Matuska zfs_znode_update_vfs(znode_t *zp) 1782*7a7741afSMartin Matuska { 1783*7a7741afSMartin Matuska vm_object_t object; 1784*7a7741afSMartin Matuska 1785*7a7741afSMartin Matuska if ((object = ZTOV(zp)->v_object) == NULL || 1786*7a7741afSMartin Matuska zp->z_size == object->un_pager.vnp.vnp_size) 1787*7a7741afSMartin Matuska return; 1788*7a7741afSMartin Matuska 1789*7a7741afSMartin Matuska vnode_pager_setsize(ZTOV(zp), zp->z_size); 1790*7a7741afSMartin Matuska } 1791*7a7741afSMartin Matuska 1792*7a7741afSMartin Matuska int 1793*7a7741afSMartin Matuska zfs_znode_parent_and_name(znode_t *zp, znode_t **dzpp, char *buf, 1794*7a7741afSMartin Matuska uint64_t buflen) 1795*7a7741afSMartin Matuska { 1796*7a7741afSMartin Matuska zfsvfs_t *zfsvfs = zp->z_zfsvfs; 1797*7a7741afSMartin Matuska uint64_t parent; 1798*7a7741afSMartin Matuska int is_xattrdir; 1799*7a7741afSMartin Matuska int err; 1800*7a7741afSMartin Matuska 1801*7a7741afSMartin Matuska /* Extended attributes should not be visible as regular files. */ 1802*7a7741afSMartin Matuska if ((zp->z_pflags & ZFS_XATTR) != 0) 1803*7a7741afSMartin Matuska return (SET_ERROR(EINVAL)); 1804*7a7741afSMartin Matuska 1805*7a7741afSMartin Matuska err = zfs_obj_to_pobj(zfsvfs->z_os, zp->z_sa_hdl, zfsvfs->z_attr_table, 1806*7a7741afSMartin Matuska &parent, &is_xattrdir); 1807*7a7741afSMartin Matuska if (err != 0) 1808*7a7741afSMartin Matuska return (err); 1809*7a7741afSMartin Matuska ASSERT0(is_xattrdir); 1810*7a7741afSMartin Matuska 1811*7a7741afSMartin Matuska /* No name as this is a root object. */ 1812*7a7741afSMartin Matuska if (parent == zp->z_id) 1813*7a7741afSMartin Matuska return (SET_ERROR(EINVAL)); 1814*7a7741afSMartin Matuska 1815*7a7741afSMartin Matuska err = zap_value_search(zfsvfs->z_os, parent, zp->z_id, 1816*7a7741afSMartin Matuska ZFS_DIRENT_OBJ(-1ULL), buf, buflen); 1817*7a7741afSMartin Matuska if (err != 0) 1818*7a7741afSMartin Matuska return (err); 1819*7a7741afSMartin Matuska err = zfs_zget(zfsvfs, parent, dzpp); 1820*7a7741afSMartin Matuska return (err); 1821*7a7741afSMartin Matuska } 1822*7a7741afSMartin Matuska 1823*7a7741afSMartin Matuska int 1824*7a7741afSMartin Matuska zfs_rlimit_fsize(off_t fsize) 1825*7a7741afSMartin Matuska { 1826*7a7741afSMartin Matuska struct thread *td = curthread; 1827*7a7741afSMartin Matuska off_t lim; 1828*7a7741afSMartin Matuska 1829*7a7741afSMartin Matuska if (td == NULL) 1830*7a7741afSMartin Matuska return (0); 1831*7a7741afSMartin Matuska 1832*7a7741afSMartin Matuska lim = lim_cur(td, RLIMIT_FSIZE); 1833*7a7741afSMartin Matuska if (__predict_true((uoff_t)fsize <= lim)) 1834*7a7741afSMartin Matuska return (0); 1835*7a7741afSMartin Matuska 1836*7a7741afSMartin Matuska /* 1837*7a7741afSMartin Matuska * The limit is reached. 1838*7a7741afSMartin Matuska */ 1839*7a7741afSMartin Matuska PROC_LOCK(td->td_proc); 1840*7a7741afSMartin Matuska kern_psignal(td->td_proc, SIGXFSZ); 1841*7a7741afSMartin Matuska PROC_UNLOCK(td->td_proc); 1842*7a7741afSMartin Matuska 1843*7a7741afSMartin Matuska return (EFBIG); 1844*7a7741afSMartin Matuska } 1845