1789Sahrens /* 2789Sahrens * CDDL HEADER START 3789Sahrens * 4789Sahrens * The contents of this file are subject to the terms of the 51544Seschrock * Common Development and Distribution License (the "License"). 61544Seschrock * You may not use this file except in compliance with the License. 7789Sahrens * 8789Sahrens * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE 9789Sahrens * or http://www.opensolaris.org/os/licensing. 10789Sahrens * See the License for the specific language governing permissions 11789Sahrens * and limitations under the License. 12789Sahrens * 13789Sahrens * When distributing Covered Code, include this CDDL HEADER in each 14789Sahrens * file and include the License file at usr/src/OPENSOLARIS.LICENSE. 15789Sahrens * If applicable, add the following below this CDDL HEADER, with the 16789Sahrens * fields enclosed by brackets "[]" replaced with your own identifying 17789Sahrens * information: Portions Copyright [yyyy] [name of copyright owner] 18789Sahrens * 19789Sahrens * CDDL HEADER END 20789Sahrens */ 21789Sahrens /* 226174Sahrens * Copyright 2008 Sun Microsystems, Inc. All rights reserved. 23789Sahrens * Use is subject to license terms. 24789Sahrens */ 25789Sahrens 26789Sahrens #pragma ident "%Z%%M% %I% %E% SMI" 27789Sahrens 284543Smarks #include <sys/cred.h> 29789Sahrens #include <sys/zfs_context.h> 30789Sahrens #include <sys/dmu_objset.h> 31789Sahrens #include <sys/dsl_dir.h> 32789Sahrens #include <sys/dsl_dataset.h> 33789Sahrens #include <sys/dsl_prop.h> 34789Sahrens #include <sys/dsl_pool.h> 352199Sahrens #include <sys/dsl_synctask.h> 364543Smarks #include <sys/dsl_deleg.h> 37789Sahrens #include <sys/dnode.h> 38789Sahrens #include <sys/dbuf.h> 392885Sahrens #include <sys/zvol.h> 40789Sahrens #include <sys/dmu_tx.h> 41789Sahrens #include <sys/zio_checksum.h> 42789Sahrens #include <sys/zap.h> 43789Sahrens #include <sys/zil.h> 44789Sahrens #include <sys/dmu_impl.h> 454543Smarks #include <sys/zfs_ioctl.h> 46789Sahrens 47789Sahrens spa_t * 48789Sahrens dmu_objset_spa(objset_t *os) 49789Sahrens { 50789Sahrens return (os->os->os_spa); 51789Sahrens } 52789Sahrens 53789Sahrens zilog_t * 54789Sahrens dmu_objset_zil(objset_t *os) 55789Sahrens { 56789Sahrens return (os->os->os_zil); 57789Sahrens } 58789Sahrens 59789Sahrens dsl_pool_t * 60789Sahrens dmu_objset_pool(objset_t *os) 61789Sahrens { 62789Sahrens dsl_dataset_t *ds; 63789Sahrens 64789Sahrens if ((ds = os->os->os_dsl_dataset) != NULL && ds->ds_dir) 65789Sahrens return (ds->ds_dir->dd_pool); 66789Sahrens else 67789Sahrens return (spa_get_dsl(os->os->os_spa)); 68789Sahrens } 69789Sahrens 70789Sahrens dsl_dataset_t * 71789Sahrens dmu_objset_ds(objset_t *os) 72789Sahrens { 73789Sahrens return (os->os->os_dsl_dataset); 74789Sahrens } 75789Sahrens 76789Sahrens dmu_objset_type_t 77789Sahrens dmu_objset_type(objset_t *os) 78789Sahrens { 79789Sahrens return (os->os->os_phys->os_type); 80789Sahrens } 81789Sahrens 82789Sahrens void 83789Sahrens dmu_objset_name(objset_t *os, char *buf) 84789Sahrens { 85789Sahrens dsl_dataset_name(os->os->os_dsl_dataset, buf); 86789Sahrens } 87789Sahrens 88789Sahrens uint64_t 89789Sahrens dmu_objset_id(objset_t *os) 90789Sahrens { 91789Sahrens dsl_dataset_t *ds = os->os->os_dsl_dataset; 92789Sahrens 93789Sahrens return (ds ? ds->ds_object : 0); 94789Sahrens } 95789Sahrens 96789Sahrens static void 97789Sahrens checksum_changed_cb(void *arg, uint64_t newval) 98789Sahrens { 99789Sahrens objset_impl_t *osi = arg; 100789Sahrens 101789Sahrens /* 102789Sahrens * Inheritance should have been done by now. 103789Sahrens */ 104789Sahrens ASSERT(newval != ZIO_CHECKSUM_INHERIT); 105789Sahrens 106789Sahrens osi->os_checksum = zio_checksum_select(newval, ZIO_CHECKSUM_ON_VALUE); 107789Sahrens } 108789Sahrens 109789Sahrens static void 110789Sahrens compression_changed_cb(void *arg, uint64_t newval) 111789Sahrens { 112789Sahrens objset_impl_t *osi = arg; 113789Sahrens 114789Sahrens /* 115789Sahrens * Inheritance and range checking should have been done by now. 116789Sahrens */ 117789Sahrens ASSERT(newval != ZIO_COMPRESS_INHERIT); 118789Sahrens 119789Sahrens osi->os_compress = zio_compress_select(newval, ZIO_COMPRESS_ON_VALUE); 120789Sahrens } 121789Sahrens 1223835Sahrens static void 1233835Sahrens copies_changed_cb(void *arg, uint64_t newval) 1243835Sahrens { 1253835Sahrens objset_impl_t *osi = arg; 1263835Sahrens 1273835Sahrens /* 1283835Sahrens * Inheritance and range checking should have been done by now. 1293835Sahrens */ 1303835Sahrens ASSERT(newval > 0); 1313835Sahrens ASSERT(newval <= spa_max_replication(osi->os_spa)); 1323835Sahrens 1333835Sahrens osi->os_copies = newval; 1343835Sahrens } 1353835Sahrens 136789Sahrens void 137789Sahrens dmu_objset_byteswap(void *buf, size_t size) 138789Sahrens { 139789Sahrens objset_phys_t *osp = buf; 140789Sahrens 141789Sahrens ASSERT(size == sizeof (objset_phys_t)); 142789Sahrens dnode_byteswap(&osp->os_meta_dnode); 143789Sahrens byteswap_uint64_array(&osp->os_zil_header, sizeof (zil_header_t)); 144789Sahrens osp->os_type = BSWAP_64(osp->os_type); 145789Sahrens } 146789Sahrens 1471544Seschrock int 1481544Seschrock dmu_objset_open_impl(spa_t *spa, dsl_dataset_t *ds, blkptr_t *bp, 1491544Seschrock objset_impl_t **osip) 150789Sahrens { 1514787Sahrens objset_impl_t *osi; 152789Sahrens int i, err, checksum; 153789Sahrens 1544787Sahrens ASSERT(ds == NULL || MUTEX_HELD(&ds->ds_opening_lock)); 1554787Sahrens 156789Sahrens osi = kmem_zalloc(sizeof (objset_impl_t), KM_SLEEP); 157789Sahrens osi->os.os = osi; 158789Sahrens osi->os_dsl_dataset = ds; 159789Sahrens osi->os_spa = spa; 1603547Smaybee osi->os_rootbp = bp; 1613547Smaybee if (!BP_IS_HOLE(osi->os_rootbp)) { 1622391Smaybee uint32_t aflags = ARC_WAIT; 1631544Seschrock zbookmark_t zb; 1641544Seschrock zb.zb_objset = ds ? ds->ds_object : 0; 1651544Seschrock zb.zb_object = 0; 1661544Seschrock zb.zb_level = -1; 1671544Seschrock zb.zb_blkid = 0; 1681544Seschrock 1693547Smaybee dprintf_bp(osi->os_rootbp, "reading %s", ""); 1703547Smaybee err = arc_read(NULL, spa, osi->os_rootbp, 171789Sahrens dmu_ot[DMU_OT_OBJSET].ot_byteswap, 1723547Smaybee arc_getbuf_func, &osi->os_phys_buf, 1732391Smaybee ZIO_PRIORITY_SYNC_READ, ZIO_FLAG_CANFAIL, &aflags, &zb); 1741544Seschrock if (err) { 1751544Seschrock kmem_free(osi, sizeof (objset_impl_t)); 1761544Seschrock return (err); 1771544Seschrock } 1783547Smaybee osi->os_phys = osi->os_phys_buf->b_data; 1795147Srm160521 if (ds == NULL || dsl_dataset_is_snapshot(ds) == 0) 1805147Srm160521 arc_release(osi->os_phys_buf, &osi->os_phys_buf); 181789Sahrens } else { 1823547Smaybee osi->os_phys_buf = arc_buf_alloc(spa, sizeof (objset_phys_t), 1833547Smaybee &osi->os_phys_buf, ARC_BUFC_METADATA); 1843547Smaybee osi->os_phys = osi->os_phys_buf->b_data; 185789Sahrens bzero(osi->os_phys, sizeof (objset_phys_t)); 186789Sahrens } 187789Sahrens 188789Sahrens /* 189789Sahrens * Note: the changed_cb will be called once before the register 190789Sahrens * func returns, thus changing the checksum/compression from the 1912082Seschrock * default (fletcher2/off). Snapshots don't need to know, and 1922082Seschrock * registering would complicate clone promotion. 193789Sahrens */ 1942082Seschrock if (ds && ds->ds_phys->ds_num_children == 0) { 195789Sahrens err = dsl_prop_register(ds, "checksum", 196789Sahrens checksum_changed_cb, osi); 1971544Seschrock if (err == 0) 1981544Seschrock err = dsl_prop_register(ds, "compression", 1991544Seschrock compression_changed_cb, osi); 2003835Sahrens if (err == 0) 2013835Sahrens err = dsl_prop_register(ds, "copies", 2023835Sahrens copies_changed_cb, osi); 2031544Seschrock if (err) { 2043547Smaybee VERIFY(arc_buf_remove_ref(osi->os_phys_buf, 2053547Smaybee &osi->os_phys_buf) == 1); 2061544Seschrock kmem_free(osi, sizeof (objset_impl_t)); 2071544Seschrock return (err); 2081544Seschrock } 2092082Seschrock } else if (ds == NULL) { 210789Sahrens /* It's the meta-objset. */ 211789Sahrens osi->os_checksum = ZIO_CHECKSUM_FLETCHER_4; 2121544Seschrock osi->os_compress = ZIO_COMPRESS_LZJB; 2133835Sahrens osi->os_copies = spa_max_replication(spa); 214789Sahrens } 215789Sahrens 2161544Seschrock osi->os_zil = zil_alloc(&osi->os, &osi->os_phys->os_zil_header); 2171544Seschrock 218789Sahrens /* 219789Sahrens * Metadata always gets compressed and checksummed. 220789Sahrens * If the data checksum is multi-bit correctable, and it's not 221789Sahrens * a ZBT-style checksum, then it's suitable for metadata as well. 222789Sahrens * Otherwise, the metadata checksum defaults to fletcher4. 223789Sahrens */ 224789Sahrens checksum = osi->os_checksum; 225789Sahrens 226789Sahrens if (zio_checksum_table[checksum].ci_correctable && 227789Sahrens !zio_checksum_table[checksum].ci_zbt) 228789Sahrens osi->os_md_checksum = checksum; 229789Sahrens else 230789Sahrens osi->os_md_checksum = ZIO_CHECKSUM_FLETCHER_4; 2311544Seschrock osi->os_md_compress = ZIO_COMPRESS_LZJB; 232789Sahrens 233789Sahrens for (i = 0; i < TXG_SIZE; i++) { 234789Sahrens list_create(&osi->os_dirty_dnodes[i], sizeof (dnode_t), 235789Sahrens offsetof(dnode_t, dn_dirty_link[i])); 236789Sahrens list_create(&osi->os_free_dnodes[i], sizeof (dnode_t), 237789Sahrens offsetof(dnode_t, dn_dirty_link[i])); 238789Sahrens } 239789Sahrens list_create(&osi->os_dnodes, sizeof (dnode_t), 240789Sahrens offsetof(dnode_t, dn_link)); 241789Sahrens list_create(&osi->os_downgraded_dbufs, sizeof (dmu_buf_impl_t), 242789Sahrens offsetof(dmu_buf_impl_t, db_link)); 243789Sahrens 2442856Snd150628 mutex_init(&osi->os_lock, NULL, MUTEX_DEFAULT, NULL); 2452856Snd150628 mutex_init(&osi->os_obj_lock, NULL, MUTEX_DEFAULT, NULL); 2465326Sek110237 mutex_init(&osi->os_user_ptr_lock, NULL, MUTEX_DEFAULT, NULL); 2472856Snd150628 248789Sahrens osi->os_meta_dnode = dnode_special_open(osi, 249789Sahrens &osi->os_phys->os_meta_dnode, DMU_META_DNODE_OBJECT); 250789Sahrens 2514787Sahrens /* 2524787Sahrens * We should be the only thread trying to do this because we 2534787Sahrens * have ds_opening_lock 2544787Sahrens */ 2554787Sahrens if (ds) { 2564787Sahrens VERIFY(NULL == dsl_dataset_set_user_ptr(ds, osi, 2574787Sahrens dmu_objset_evict)); 258789Sahrens } 259789Sahrens 2601544Seschrock *osip = osi; 2611544Seschrock return (0); 262789Sahrens } 263789Sahrens 2645367Sahrens static int 2655367Sahrens dmu_objset_open_ds_os(dsl_dataset_t *ds, objset_t *os, dmu_objset_type_t type) 2665367Sahrens { 2675367Sahrens objset_impl_t *osi; 2685367Sahrens 2695367Sahrens mutex_enter(&ds->ds_opening_lock); 2705367Sahrens osi = dsl_dataset_get_user_ptr(ds); 2715367Sahrens if (osi == NULL) { 272*6689Smaybee int err; 273*6689Smaybee 2745367Sahrens err = dmu_objset_open_impl(dsl_dataset_get_spa(ds), 2755367Sahrens ds, &ds->ds_phys->ds_bp, &osi); 276*6689Smaybee if (err) { 277*6689Smaybee mutex_exit(&ds->ds_opening_lock); 2785367Sahrens return (err); 279*6689Smaybee } 2805367Sahrens } 2815367Sahrens mutex_exit(&ds->ds_opening_lock); 2825367Sahrens 2835367Sahrens os->os = osi; 284*6689Smaybee os->os_mode = DS_MODE_NOHOLD; 2855367Sahrens 2865367Sahrens if (type != DMU_OST_ANY && type != os->os->os_phys->os_type) 2875367Sahrens return (EINVAL); 2885367Sahrens return (0); 2895367Sahrens } 2905367Sahrens 2915367Sahrens int 2925367Sahrens dmu_objset_open_ds(dsl_dataset_t *ds, dmu_objset_type_t type, objset_t **osp) 2935367Sahrens { 2945367Sahrens objset_t *os; 2955367Sahrens int err; 2965367Sahrens 2975367Sahrens os = kmem_alloc(sizeof (objset_t), KM_SLEEP); 2985367Sahrens err = dmu_objset_open_ds_os(ds, os, type); 2995367Sahrens if (err) 3005367Sahrens kmem_free(os, sizeof (objset_t)); 3015367Sahrens else 3025367Sahrens *osp = os; 3035367Sahrens return (err); 3045367Sahrens } 3055367Sahrens 306789Sahrens /* called from zpl */ 307789Sahrens int 308789Sahrens dmu_objset_open(const char *name, dmu_objset_type_t type, int mode, 309789Sahrens objset_t **osp) 310789Sahrens { 3115326Sek110237 objset_t *os; 312789Sahrens dsl_dataset_t *ds; 313789Sahrens int err; 314789Sahrens 315*6689Smaybee ASSERT(DS_MODE_TYPE(mode) == DS_MODE_USER || 316*6689Smaybee DS_MODE_TYPE(mode) == DS_MODE_OWNER); 3175367Sahrens 318789Sahrens os = kmem_alloc(sizeof (objset_t), KM_SLEEP); 319*6689Smaybee if (DS_MODE_TYPE(mode) == DS_MODE_USER) 320*6689Smaybee err = dsl_dataset_hold(name, os, &ds); 321*6689Smaybee else 322*6689Smaybee err = dsl_dataset_own(name, mode, os, &ds); 323789Sahrens if (err) { 324789Sahrens kmem_free(os, sizeof (objset_t)); 325789Sahrens return (err); 326789Sahrens } 327789Sahrens 3285367Sahrens err = dmu_objset_open_ds_os(ds, os, type); 3295367Sahrens if (err) { 330*6689Smaybee if (DS_MODE_TYPE(mode) == DS_MODE_USER) 331*6689Smaybee dsl_dataset_rele(ds, os); 332*6689Smaybee else 333*6689Smaybee dsl_dataset_disown(ds, os); 3345367Sahrens kmem_free(os, sizeof (objset_t)); 3355367Sahrens } else { 336*6689Smaybee os->os_mode = mode; 3375367Sahrens *osp = os; 338789Sahrens } 3395367Sahrens return (err); 340789Sahrens } 341789Sahrens 342789Sahrens void 343789Sahrens dmu_objset_close(objset_t *os) 344789Sahrens { 345*6689Smaybee ASSERT(DS_MODE_TYPE(os->os_mode) == DS_MODE_USER || 346*6689Smaybee DS_MODE_TYPE(os->os_mode) == DS_MODE_OWNER || 347*6689Smaybee DS_MODE_TYPE(os->os_mode) == DS_MODE_NOHOLD); 348*6689Smaybee 349*6689Smaybee if (DS_MODE_TYPE(os->os_mode) == DS_MODE_USER) 350*6689Smaybee dsl_dataset_rele(os->os->os_dsl_dataset, os); 351*6689Smaybee else if (DS_MODE_TYPE(os->os_mode) == DS_MODE_OWNER) 352*6689Smaybee dsl_dataset_disown(os->os->os_dsl_dataset, os); 353789Sahrens kmem_free(os, sizeof (objset_t)); 354789Sahrens } 355789Sahrens 3561646Sperrin int 3574944Smaybee dmu_objset_evict_dbufs(objset_t *os) 3581544Seschrock { 3591544Seschrock objset_impl_t *osi = os->os; 3601544Seschrock dnode_t *dn; 3611596Sahrens 3621596Sahrens mutex_enter(&osi->os_lock); 3631596Sahrens 3641596Sahrens /* process the mdn last, since the other dnodes have holds on it */ 3651596Sahrens list_remove(&osi->os_dnodes, osi->os_meta_dnode); 3661596Sahrens list_insert_tail(&osi->os_dnodes, osi->os_meta_dnode); 3671544Seschrock 3681544Seschrock /* 3691596Sahrens * Find the first dnode with holds. We have to do this dance 3701596Sahrens * because dnode_add_ref() only works if you already have a 3711596Sahrens * hold. If there are no holds then it has no dbufs so OK to 3721596Sahrens * skip. 3731544Seschrock */ 3741596Sahrens for (dn = list_head(&osi->os_dnodes); 3754944Smaybee dn && !dnode_add_ref(dn, FTAG); 3761596Sahrens dn = list_next(&osi->os_dnodes, dn)) 3771596Sahrens continue; 3781596Sahrens 3791596Sahrens while (dn) { 3801596Sahrens dnode_t *next_dn = dn; 3811596Sahrens 3821596Sahrens do { 3831596Sahrens next_dn = list_next(&osi->os_dnodes, next_dn); 3844944Smaybee } while (next_dn && !dnode_add_ref(next_dn, FTAG)); 3851596Sahrens 3861596Sahrens mutex_exit(&osi->os_lock); 3874944Smaybee dnode_evict_dbufs(dn); 3881596Sahrens dnode_rele(dn, FTAG); 3891596Sahrens mutex_enter(&osi->os_lock); 3901596Sahrens dn = next_dn; 3911544Seschrock } 3921544Seschrock mutex_exit(&osi->os_lock); 3934944Smaybee return (list_head(&osi->os_dnodes) != osi->os_meta_dnode); 3941544Seschrock } 3951544Seschrock 3961544Seschrock void 397789Sahrens dmu_objset_evict(dsl_dataset_t *ds, void *arg) 398789Sahrens { 399789Sahrens objset_impl_t *osi = arg; 4001544Seschrock objset_t os; 4012082Seschrock int i; 402789Sahrens 403789Sahrens for (i = 0; i < TXG_SIZE; i++) { 404789Sahrens ASSERT(list_head(&osi->os_dirty_dnodes[i]) == NULL); 405789Sahrens ASSERT(list_head(&osi->os_free_dnodes[i]) == NULL); 406789Sahrens } 407789Sahrens 408*6689Smaybee if (ds && ds->ds_phys && ds->ds_phys->ds_num_children == 0) { 4092082Seschrock VERIFY(0 == dsl_prop_unregister(ds, "checksum", 4102082Seschrock checksum_changed_cb, osi)); 4112082Seschrock VERIFY(0 == dsl_prop_unregister(ds, "compression", 4122082Seschrock compression_changed_cb, osi)); 4133835Sahrens VERIFY(0 == dsl_prop_unregister(ds, "copies", 4143835Sahrens copies_changed_cb, osi)); 415789Sahrens } 416789Sahrens 4171544Seschrock /* 4181544Seschrock * We should need only a single pass over the dnode list, since 4191544Seschrock * nothing can be added to the list at this point. 4201544Seschrock */ 4211544Seschrock os.os = osi; 4224944Smaybee (void) dmu_objset_evict_dbufs(&os); 4231544Seschrock 424789Sahrens ASSERT3P(list_head(&osi->os_dnodes), ==, osi->os_meta_dnode); 425789Sahrens ASSERT3P(list_tail(&osi->os_dnodes), ==, osi->os_meta_dnode); 426789Sahrens ASSERT3P(list_head(&osi->os_meta_dnode->dn_dbufs), ==, NULL); 427789Sahrens 428789Sahrens dnode_special_close(osi->os_meta_dnode); 429789Sahrens zil_free(osi->os_zil); 430789Sahrens 4313547Smaybee VERIFY(arc_buf_remove_ref(osi->os_phys_buf, &osi->os_phys_buf) == 1); 4322856Snd150628 mutex_destroy(&osi->os_lock); 4332856Snd150628 mutex_destroy(&osi->os_obj_lock); 4345326Sek110237 mutex_destroy(&osi->os_user_ptr_lock); 435789Sahrens kmem_free(osi, sizeof (objset_impl_t)); 436789Sahrens } 437789Sahrens 438789Sahrens /* called from dsl for meta-objset */ 439789Sahrens objset_impl_t * 4403547Smaybee dmu_objset_create_impl(spa_t *spa, dsl_dataset_t *ds, blkptr_t *bp, 4413547Smaybee dmu_objset_type_t type, dmu_tx_t *tx) 442789Sahrens { 443789Sahrens objset_impl_t *osi; 444789Sahrens dnode_t *mdn; 445789Sahrens 446789Sahrens ASSERT(dmu_tx_is_syncing(tx)); 4474787Sahrens if (ds) 4484787Sahrens mutex_enter(&ds->ds_opening_lock); 4493547Smaybee VERIFY(0 == dmu_objset_open_impl(spa, ds, bp, &osi)); 4504787Sahrens if (ds) 4514787Sahrens mutex_exit(&ds->ds_opening_lock); 452789Sahrens mdn = osi->os_meta_dnode; 453789Sahrens 454789Sahrens dnode_allocate(mdn, DMU_OT_DNODE, 1 << DNODE_BLOCK_SHIFT, 455789Sahrens DN_MAX_INDBLKSHIFT, DMU_OT_NONE, 0, tx); 456789Sahrens 457789Sahrens /* 458789Sahrens * We don't want to have to increase the meta-dnode's nlevels 459789Sahrens * later, because then we could do it in quescing context while 460789Sahrens * we are also accessing it in open context. 461789Sahrens * 462789Sahrens * This precaution is not necessary for the MOS (ds == NULL), 463789Sahrens * because the MOS is only updated in syncing context. 464789Sahrens * This is most fortunate: the MOS is the only objset that 465789Sahrens * needs to be synced multiple times as spa_sync() iterates 466789Sahrens * to convergence, so minimizing its dn_nlevels matters. 467789Sahrens */ 4681544Seschrock if (ds != NULL) { 4691544Seschrock int levels = 1; 4701544Seschrock 4711544Seschrock /* 4721544Seschrock * Determine the number of levels necessary for the meta-dnode 4731544Seschrock * to contain DN_MAX_OBJECT dnodes. 4741544Seschrock */ 4751544Seschrock while ((uint64_t)mdn->dn_nblkptr << (mdn->dn_datablkshift + 4761544Seschrock (levels - 1) * (mdn->dn_indblkshift - SPA_BLKPTRSHIFT)) < 4771544Seschrock DN_MAX_OBJECT * sizeof (dnode_phys_t)) 4781544Seschrock levels++; 4791544Seschrock 480789Sahrens mdn->dn_next_nlevels[tx->tx_txg & TXG_MASK] = 4811544Seschrock mdn->dn_nlevels = levels; 4821544Seschrock } 483789Sahrens 484789Sahrens ASSERT(type != DMU_OST_NONE); 485789Sahrens ASSERT(type != DMU_OST_ANY); 486789Sahrens ASSERT(type < DMU_OST_NUMTYPES); 487789Sahrens osi->os_phys->os_type = type; 488789Sahrens 489789Sahrens dsl_dataset_dirty(ds, tx); 490789Sahrens 491789Sahrens return (osi); 492789Sahrens } 493789Sahrens 494789Sahrens struct oscarg { 4954543Smarks void (*userfunc)(objset_t *os, void *arg, cred_t *cr, dmu_tx_t *tx); 496789Sahrens void *userarg; 497789Sahrens dsl_dataset_t *clone_parent; 498789Sahrens const char *lastname; 499789Sahrens dmu_objset_type_t type; 5006492Stimh uint64_t flags; 501789Sahrens }; 502789Sahrens 5034543Smarks /*ARGSUSED*/ 504789Sahrens static int 5052199Sahrens dmu_objset_create_check(void *arg1, void *arg2, dmu_tx_t *tx) 506789Sahrens { 5072199Sahrens dsl_dir_t *dd = arg1; 5082199Sahrens struct oscarg *oa = arg2; 5092199Sahrens objset_t *mos = dd->dd_pool->dp_meta_objset; 5102199Sahrens int err; 5112199Sahrens uint64_t ddobj; 5122199Sahrens 5132199Sahrens err = zap_lookup(mos, dd->dd_phys->dd_child_dir_zapobj, 5142199Sahrens oa->lastname, sizeof (uint64_t), 1, &ddobj); 5152199Sahrens if (err != ENOENT) 5162199Sahrens return (err ? err : EEXIST); 5172199Sahrens 5182199Sahrens if (oa->clone_parent != NULL) { 5192199Sahrens /* 5202199Sahrens * You can't clone across pools. 5212199Sahrens */ 5222199Sahrens if (oa->clone_parent->ds_dir->dd_pool != dd->dd_pool) 5232199Sahrens return (EXDEV); 5242199Sahrens 5252199Sahrens /* 5262199Sahrens * You can only clone snapshots, not the head datasets. 5272199Sahrens */ 5282199Sahrens if (oa->clone_parent->ds_phys->ds_num_children == 0) 5292199Sahrens return (EINVAL); 5302199Sahrens } 5314543Smarks 5322199Sahrens return (0); 5332199Sahrens } 5342199Sahrens 5352199Sahrens static void 5364543Smarks dmu_objset_create_sync(void *arg1, void *arg2, cred_t *cr, dmu_tx_t *tx) 5372199Sahrens { 5382199Sahrens dsl_dir_t *dd = arg1; 5392199Sahrens struct oscarg *oa = arg2; 540789Sahrens dsl_dataset_t *ds; 5413547Smaybee blkptr_t *bp; 5422199Sahrens uint64_t dsobj; 543789Sahrens 544789Sahrens ASSERT(dmu_tx_is_syncing(tx)); 545789Sahrens 5462199Sahrens dsobj = dsl_dataset_create_sync(dd, oa->lastname, 5476492Stimh oa->clone_parent, oa->flags, cr, tx); 548789Sahrens 549*6689Smaybee VERIFY(0 == dsl_dataset_hold_obj(dd->dd_pool, dsobj, FTAG, &ds)); 5503547Smaybee bp = dsl_dataset_get_blkptr(ds); 5513547Smaybee if (BP_IS_HOLE(bp)) { 552789Sahrens objset_impl_t *osi; 553789Sahrens 554789Sahrens /* This is an empty dmu_objset; not a clone. */ 555789Sahrens osi = dmu_objset_create_impl(dsl_dataset_get_spa(ds), 5563547Smaybee ds, bp, oa->type, tx); 557789Sahrens 558789Sahrens if (oa->userfunc) 5594543Smarks oa->userfunc(&osi->os, oa->userarg, cr, tx); 560789Sahrens } 5614543Smarks 5624543Smarks spa_history_internal_log(LOG_DS_CREATE, dd->dd_pool->dp_spa, 5634543Smarks tx, cr, "dataset = %llu", dsobj); 5644543Smarks 565*6689Smaybee dsl_dataset_rele(ds, FTAG); 566789Sahrens } 567789Sahrens 568789Sahrens int 569789Sahrens dmu_objset_create(const char *name, dmu_objset_type_t type, 5706492Stimh objset_t *clone_parent, uint64_t flags, 5714543Smarks void (*func)(objset_t *os, void *arg, cred_t *cr, dmu_tx_t *tx), void *arg) 572789Sahrens { 5732199Sahrens dsl_dir_t *pdd; 574789Sahrens const char *tail; 575789Sahrens int err = 0; 5762199Sahrens struct oscarg oa = { 0 }; 577789Sahrens 5782199Sahrens ASSERT(strchr(name, '@') == NULL); 5792199Sahrens err = dsl_dir_open(name, FTAG, &pdd, &tail); 5801544Seschrock if (err) 5811544Seschrock return (err); 582789Sahrens if (tail == NULL) { 5832199Sahrens dsl_dir_close(pdd, FTAG); 584789Sahrens return (EEXIST); 585789Sahrens } 586789Sahrens 587789Sahrens dprintf("name=%s\n", name); 588789Sahrens 5892199Sahrens oa.userfunc = func; 5902199Sahrens oa.userarg = arg; 5912199Sahrens oa.lastname = tail; 5922199Sahrens oa.type = type; 5936492Stimh oa.flags = flags; 5944543Smarks 5952199Sahrens if (clone_parent != NULL) { 596789Sahrens /* 5972199Sahrens * You can't clone to a different type. 598789Sahrens */ 5992199Sahrens if (clone_parent->os->os_phys->os_type != type) { 6002199Sahrens dsl_dir_close(pdd, FTAG); 6012199Sahrens return (EINVAL); 602789Sahrens } 6032199Sahrens oa.clone_parent = clone_parent->os->os_dsl_dataset; 604789Sahrens } 6052199Sahrens err = dsl_sync_task_do(pdd->dd_pool, dmu_objset_create_check, 6062199Sahrens dmu_objset_create_sync, pdd, &oa, 5); 6072199Sahrens dsl_dir_close(pdd, FTAG); 608789Sahrens return (err); 609789Sahrens } 610789Sahrens 611789Sahrens int 612789Sahrens dmu_objset_destroy(const char *name) 613789Sahrens { 614789Sahrens objset_t *os; 615789Sahrens int error; 616789Sahrens 617789Sahrens /* 618789Sahrens * If it looks like we'll be able to destroy it, and there's 619789Sahrens * an unplayed replay log sitting around, destroy the log. 620789Sahrens * It would be nicer to do this in dsl_dataset_destroy_sync(), 621789Sahrens * but the replay log objset is modified in open context. 622789Sahrens */ 6235367Sahrens error = dmu_objset_open(name, DMU_OST_ANY, 624*6689Smaybee DS_MODE_OWNER|DS_MODE_READONLY|DS_MODE_INCONSISTENT, &os); 625789Sahrens if (error == 0) { 6265367Sahrens dsl_dataset_t *ds = os->os->os_dsl_dataset; 6271807Sbonwick zil_destroy(dmu_objset_zil(os), B_FALSE); 6285367Sahrens 629*6689Smaybee error = dsl_dataset_destroy(ds, os); 6305367Sahrens /* 6315367Sahrens * dsl_dataset_destroy() closes the ds. 6325367Sahrens */ 6335367Sahrens kmem_free(os, sizeof (objset_t)); 634789Sahrens } 635789Sahrens 6365367Sahrens return (error); 637789Sahrens } 638789Sahrens 6395446Sahrens /* 6405446Sahrens * This will close the objset. 6415446Sahrens */ 642789Sahrens int 6435446Sahrens dmu_objset_rollback(objset_t *os) 644789Sahrens { 645789Sahrens int err; 6465367Sahrens dsl_dataset_t *ds; 647789Sahrens 6485446Sahrens ds = os->os->os_dsl_dataset; 6494935Sperrin 650*6689Smaybee if (!dsl_dataset_tryown(ds, TRUE, os)) { 6515446Sahrens dmu_objset_close(os); 6525446Sahrens return (EBUSY); 6535446Sahrens } 6545446Sahrens 6555367Sahrens err = dsl_dataset_rollback(ds, os->os->os_phys->os_type); 6564935Sperrin 6575367Sahrens /* 6585367Sahrens * NB: we close the objset manually because the rollback 6595367Sahrens * actually implicitly called dmu_objset_evict(), thus freeing 6605367Sahrens * the objset_impl_t. 6615367Sahrens */ 662*6689Smaybee dsl_dataset_disown(ds, os); 6635367Sahrens kmem_free(os, sizeof (objset_t)); 664789Sahrens return (err); 665789Sahrens } 666789Sahrens 6672199Sahrens struct snaparg { 6682199Sahrens dsl_sync_task_group_t *dstg; 6692199Sahrens char *snapname; 6702199Sahrens char failed[MAXPATHLEN]; 6714543Smarks boolean_t checkperms; 6725367Sahrens list_t objsets; 6735367Sahrens }; 6745367Sahrens 6755367Sahrens struct osnode { 6765367Sahrens list_node_t node; 6775367Sahrens objset_t *os; 6782199Sahrens }; 6792199Sahrens 6802199Sahrens static int 6812199Sahrens dmu_objset_snapshot_one(char *name, void *arg) 6822199Sahrens { 6832199Sahrens struct snaparg *sn = arg; 6842199Sahrens objset_t *os; 6852199Sahrens int err; 6862199Sahrens 6872199Sahrens (void) strcpy(sn->failed, name); 6882199Sahrens 6894543Smarks /* 6904543Smarks * Check permissions only when requested. This only applies when 6914543Smarks * doing a recursive snapshot. The permission checks for the starting 6924543Smarks * dataset have already been performed in zfs_secpolicy_snapshot() 6934543Smarks */ 6944543Smarks if (sn->checkperms == B_TRUE && 6954543Smarks (err = zfs_secpolicy_snapshot_perms(name, CRED()))) 6964543Smarks return (err); 6974543Smarks 698*6689Smaybee err = dmu_objset_open(name, DMU_OST_ANY, DS_MODE_USER, &os); 6992199Sahrens if (err != 0) 7002199Sahrens return (err); 7012199Sahrens 702*6689Smaybee /* If the objset is in an inconsistent state, return busy */ 703*6689Smaybee if (os->os->os_dsl_dataset->ds_phys->ds_flags & DS_FLAG_INCONSISTENT) { 7043637Srm160521 dmu_objset_close(os); 7053637Srm160521 return (EBUSY); 7063637Srm160521 } 7073637Srm160521 7083637Srm160521 /* 7092199Sahrens * NB: we need to wait for all in-flight changes to get to disk, 7102199Sahrens * so that we snapshot those changes. zil_suspend does this as 7112199Sahrens * a side effect. 7122199Sahrens */ 7132199Sahrens err = zil_suspend(dmu_objset_zil(os)); 7142199Sahrens if (err == 0) { 7155367Sahrens struct osnode *osn; 7162199Sahrens dsl_sync_task_create(sn->dstg, dsl_dataset_snapshot_check, 7175367Sahrens dsl_dataset_snapshot_sync, os->os->os_dsl_dataset, 7185367Sahrens sn->snapname, 3); 7195367Sahrens osn = kmem_alloc(sizeof (struct osnode), KM_SLEEP); 7205367Sahrens osn->os = os; 7215367Sahrens list_insert_tail(&sn->objsets, osn); 7223637Srm160521 } else { 7233637Srm160521 dmu_objset_close(os); 7242199Sahrens } 7253637Srm160521 7262199Sahrens return (err); 7272199Sahrens } 7282199Sahrens 7292199Sahrens int 7302199Sahrens dmu_objset_snapshot(char *fsname, char *snapname, boolean_t recursive) 7312199Sahrens { 7322199Sahrens dsl_sync_task_t *dst; 7335367Sahrens struct osnode *osn; 7342199Sahrens struct snaparg sn = { 0 }; 7352199Sahrens spa_t *spa; 7362199Sahrens int err; 7372199Sahrens 7382199Sahrens (void) strcpy(sn.failed, fsname); 7392199Sahrens 7404603Sahrens err = spa_open(fsname, &spa, FTAG); 7412199Sahrens if (err) 7422199Sahrens return (err); 7432199Sahrens 7442199Sahrens sn.dstg = dsl_sync_task_group_create(spa_get_dsl(spa)); 7452199Sahrens sn.snapname = snapname; 7465367Sahrens list_create(&sn.objsets, sizeof (struct osnode), 7475367Sahrens offsetof(struct osnode, node)); 7482199Sahrens 7492417Sahrens if (recursive) { 7504543Smarks sn.checkperms = B_TRUE; 7512417Sahrens err = dmu_objset_find(fsname, 7522417Sahrens dmu_objset_snapshot_one, &sn, DS_FIND_CHILDREN); 7532417Sahrens } else { 7544543Smarks sn.checkperms = B_FALSE; 7552199Sahrens err = dmu_objset_snapshot_one(fsname, &sn); 7562417Sahrens } 7572199Sahrens 7582199Sahrens if (err) 7592199Sahrens goto out; 7602199Sahrens 7612199Sahrens err = dsl_sync_task_group_wait(sn.dstg); 7622199Sahrens 7632199Sahrens for (dst = list_head(&sn.dstg->dstg_tasks); dst; 7642199Sahrens dst = list_next(&sn.dstg->dstg_tasks, dst)) { 7655367Sahrens dsl_dataset_t *ds = dst->dst_arg1; 7662199Sahrens if (dst->dst_err) 7675367Sahrens dsl_dataset_name(ds, sn.failed); 7682199Sahrens } 7695367Sahrens 7706174Sahrens out: 7715367Sahrens while (osn = list_head(&sn.objsets)) { 7725367Sahrens list_remove(&sn.objsets, osn); 7735367Sahrens zil_resume(dmu_objset_zil(osn->os)); 7745367Sahrens dmu_objset_close(osn->os); 7755367Sahrens kmem_free(osn, sizeof (struct osnode)); 7765367Sahrens } 7775367Sahrens list_destroy(&sn.objsets); 7786174Sahrens 7792199Sahrens if (err) 7802199Sahrens (void) strcpy(fsname, sn.failed); 7812199Sahrens dsl_sync_task_group_destroy(sn.dstg); 7822199Sahrens spa_close(spa, FTAG); 7832199Sahrens return (err); 7842199Sahrens } 7852199Sahrens 786789Sahrens static void 7873547Smaybee dmu_objset_sync_dnodes(list_t *list, dmu_tx_t *tx) 788789Sahrens { 7893547Smaybee dnode_t *dn; 790789Sahrens 7913547Smaybee while (dn = list_head(list)) { 7923547Smaybee ASSERT(dn->dn_object != DMU_META_DNODE_OBJECT); 7933547Smaybee ASSERT(dn->dn_dbuf->db_data_pending); 7943547Smaybee /* 7953547Smaybee * Initialize dn_zio outside dnode_sync() 7963547Smaybee * to accomodate meta-dnode 7973547Smaybee */ 7983547Smaybee dn->dn_zio = dn->dn_dbuf->db_data_pending->dr_zio; 7993547Smaybee ASSERT(dn->dn_zio); 800789Sahrens 8013547Smaybee ASSERT3U(dn->dn_nlevels, <=, DN_MAX_LEVELS); 8023547Smaybee list_remove(list, dn); 8033547Smaybee dnode_sync(dn, tx); 8043547Smaybee } 8053547Smaybee } 8062981Sahrens 8073547Smaybee /* ARGSUSED */ 8083547Smaybee static void 8093547Smaybee ready(zio_t *zio, arc_buf_t *abuf, void *arg) 8103547Smaybee { 8113547Smaybee objset_impl_t *os = arg; 8123547Smaybee blkptr_t *bp = os->os_rootbp; 8133547Smaybee dnode_phys_t *dnp = &os->os_phys->os_meta_dnode; 8143547Smaybee int i; 8152981Sahrens 8165329Sgw25295 ASSERT(bp == zio->io_bp); 8175329Sgw25295 8183547Smaybee /* 8193547Smaybee * Update rootbp fill count. 8203547Smaybee */ 8213547Smaybee bp->blk_fill = 1; /* count the meta-dnode */ 8223547Smaybee for (i = 0; i < dnp->dn_nblkptr; i++) 8233547Smaybee bp->blk_fill += dnp->dn_blkptr[i].blk_fill; 8245329Sgw25295 8255329Sgw25295 BP_SET_TYPE(bp, DMU_OT_OBJSET); 8265329Sgw25295 BP_SET_LEVEL(bp, 0); 8275329Sgw25295 8285329Sgw25295 /* We must do this after we've set the bp's type and level */ 8295329Sgw25295 if (!DVA_EQUAL(BP_IDENTITY(bp), 8305329Sgw25295 BP_IDENTITY(&zio->io_bp_orig))) { 8315329Sgw25295 if (zio->io_bp_orig.blk_birth == os->os_synctx->tx_txg) 8325329Sgw25295 dsl_dataset_block_kill(os->os_dsl_dataset, 8335329Sgw25295 &zio->io_bp_orig, NULL, os->os_synctx); 8345329Sgw25295 dsl_dataset_block_born(os->os_dsl_dataset, bp, os->os_synctx); 8355329Sgw25295 } 836789Sahrens } 837789Sahrens 838789Sahrens /* ARGSUSED */ 839789Sahrens static void 840789Sahrens killer(zio_t *zio, arc_buf_t *abuf, void *arg) 841789Sahrens { 842789Sahrens objset_impl_t *os = arg; 843789Sahrens 844789Sahrens ASSERT3U(zio->io_error, ==, 0); 8453547Smaybee arc_release(os->os_phys_buf, &os->os_phys_buf); 846789Sahrens } 847789Sahrens 848789Sahrens /* called from dsl */ 849789Sahrens void 8503547Smaybee dmu_objset_sync(objset_impl_t *os, zio_t *pio, dmu_tx_t *tx) 851789Sahrens { 852789Sahrens int txgoff; 8531544Seschrock zbookmark_t zb; 8543547Smaybee zio_t *zio; 8553547Smaybee list_t *list; 8563547Smaybee dbuf_dirty_record_t *dr; 8573547Smaybee 8583547Smaybee dprintf_ds(os->os_dsl_dataset, "txg=%llu\n", tx->tx_txg); 859789Sahrens 860789Sahrens ASSERT(dmu_tx_is_syncing(tx)); 861789Sahrens /* XXX the write_done callback should really give us the tx... */ 862789Sahrens os->os_synctx = tx; 863789Sahrens 8643882Sahrens if (os->os_dsl_dataset == NULL) { 8653882Sahrens /* 8663882Sahrens * This is the MOS. If we have upgraded, 8673882Sahrens * spa_max_replication() could change, so reset 8683882Sahrens * os_copies here. 8693882Sahrens */ 8703882Sahrens os->os_copies = spa_max_replication(os->os_spa); 8713882Sahrens } 8723882Sahrens 8733547Smaybee /* 8743547Smaybee * Create the root block IO 8753547Smaybee */ 8763547Smaybee zb.zb_objset = os->os_dsl_dataset ? os->os_dsl_dataset->ds_object : 0; 8773547Smaybee zb.zb_object = 0; 8783547Smaybee zb.zb_level = -1; 8793547Smaybee zb.zb_blkid = 0; 8804787Sahrens if (BP_IS_OLDER(os->os_rootbp, tx->tx_txg)) { 8813547Smaybee dsl_dataset_block_kill(os->os_dsl_dataset, 8823547Smaybee os->os_rootbp, pio, tx); 8834787Sahrens } 8843547Smaybee zio = arc_write(pio, os->os_spa, os->os_md_checksum, 8853547Smaybee os->os_md_compress, 8863835Sahrens dmu_get_replication_level(os, &zb, DMU_OT_OBJSET), 8873547Smaybee tx->tx_txg, os->os_rootbp, os->os_phys_buf, ready, killer, os, 8884634Sek110237 ZIO_PRIORITY_ASYNC_WRITE, ZIO_FLAG_MUSTSUCCEED | ZIO_FLAG_METADATA, 8894634Sek110237 &zb); 8903547Smaybee 8913547Smaybee /* 8923547Smaybee * Sync meta-dnode - the parent IO for the sync is the root block 8933547Smaybee */ 8943547Smaybee os->os_meta_dnode->dn_zio = zio; 8953547Smaybee dnode_sync(os->os_meta_dnode, tx); 896789Sahrens 897789Sahrens txgoff = tx->tx_txg & TXG_MASK; 898789Sahrens 8993547Smaybee dmu_objset_sync_dnodes(&os->os_free_dnodes[txgoff], tx); 9003547Smaybee dmu_objset_sync_dnodes(&os->os_dirty_dnodes[txgoff], tx); 901789Sahrens 9023547Smaybee list = &os->os_meta_dnode->dn_dirty_records[txgoff]; 9033547Smaybee while (dr = list_head(list)) { 9043547Smaybee ASSERT(dr->dr_dbuf->db_level == 0); 9053547Smaybee list_remove(list, dr); 9063547Smaybee if (dr->dr_zio) 9073547Smaybee zio_nowait(dr->dr_zio); 9083547Smaybee } 909789Sahrens /* 910789Sahrens * Free intent log blocks up to this tx. 911789Sahrens */ 912789Sahrens zil_sync(os->os_zil, tx); 9133547Smaybee zio_nowait(zio); 914789Sahrens } 915789Sahrens 916789Sahrens void 9172885Sahrens dmu_objset_space(objset_t *os, uint64_t *refdbytesp, uint64_t *availbytesp, 9182885Sahrens uint64_t *usedobjsp, uint64_t *availobjsp) 9192885Sahrens { 9202885Sahrens dsl_dataset_space(os->os->os_dsl_dataset, refdbytesp, availbytesp, 9212885Sahrens usedobjsp, availobjsp); 9222885Sahrens } 9232885Sahrens 9242885Sahrens uint64_t 9252885Sahrens dmu_objset_fsid_guid(objset_t *os) 9262885Sahrens { 9272885Sahrens return (dsl_dataset_fsid_guid(os->os->os_dsl_dataset)); 9282885Sahrens } 9292885Sahrens 9302885Sahrens void 9312885Sahrens dmu_objset_fast_stat(objset_t *os, dmu_objset_stats_t *stat) 932789Sahrens { 9332885Sahrens stat->dds_type = os->os->os_phys->os_type; 9342885Sahrens if (os->os->os_dsl_dataset) 9352885Sahrens dsl_dataset_fast_stat(os->os->os_dsl_dataset, stat); 9362885Sahrens } 9372885Sahrens 9382885Sahrens void 9392885Sahrens dmu_objset_stats(objset_t *os, nvlist_t *nv) 9402885Sahrens { 9412885Sahrens ASSERT(os->os->os_dsl_dataset || 9422885Sahrens os->os->os_phys->os_type == DMU_OST_META); 9432885Sahrens 9442885Sahrens if (os->os->os_dsl_dataset != NULL) 9452885Sahrens dsl_dataset_stats(os->os->os_dsl_dataset, nv); 9462885Sahrens 9472885Sahrens dsl_prop_nvlist_add_uint64(nv, ZFS_PROP_TYPE, 9482885Sahrens os->os->os_phys->os_type); 949789Sahrens } 950789Sahrens 951789Sahrens int 952789Sahrens dmu_objset_is_snapshot(objset_t *os) 953789Sahrens { 954789Sahrens if (os->os->os_dsl_dataset != NULL) 955789Sahrens return (dsl_dataset_is_snapshot(os->os->os_dsl_dataset)); 956789Sahrens else 957789Sahrens return (B_FALSE); 958789Sahrens } 959789Sahrens 960789Sahrens int 9616492Stimh dmu_snapshot_realname(objset_t *os, char *name, char *real, int maxlen, 9626492Stimh boolean_t *conflict) 9636492Stimh { 9646492Stimh dsl_dataset_t *ds = os->os->os_dsl_dataset; 9656492Stimh uint64_t ignored; 9666492Stimh 9676492Stimh if (ds->ds_phys->ds_snapnames_zapobj == 0) 9686492Stimh return (ENOENT); 9696492Stimh 9706492Stimh return (zap_lookup_norm(ds->ds_dir->dd_pool->dp_meta_objset, 9716492Stimh ds->ds_phys->ds_snapnames_zapobj, name, 8, 1, &ignored, MT_FIRST, 9726492Stimh real, maxlen, conflict)); 9736492Stimh } 9746492Stimh 9756492Stimh int 976789Sahrens dmu_snapshot_list_next(objset_t *os, int namelen, char *name, 9775663Sck153898 uint64_t *idp, uint64_t *offp, boolean_t *case_conflict) 978789Sahrens { 979789Sahrens dsl_dataset_t *ds = os->os->os_dsl_dataset; 980789Sahrens zap_cursor_t cursor; 981789Sahrens zap_attribute_t attr; 982789Sahrens 983789Sahrens if (ds->ds_phys->ds_snapnames_zapobj == 0) 984789Sahrens return (ENOENT); 985789Sahrens 986789Sahrens zap_cursor_init_serialized(&cursor, 987789Sahrens ds->ds_dir->dd_pool->dp_meta_objset, 988789Sahrens ds->ds_phys->ds_snapnames_zapobj, *offp); 989789Sahrens 990885Sahrens if (zap_cursor_retrieve(&cursor, &attr) != 0) { 991885Sahrens zap_cursor_fini(&cursor); 992885Sahrens return (ENOENT); 993885Sahrens } 994885Sahrens 995885Sahrens if (strlen(attr.za_name) + 1 > namelen) { 996885Sahrens zap_cursor_fini(&cursor); 997885Sahrens return (ENAMETOOLONG); 998885Sahrens } 999885Sahrens 1000885Sahrens (void) strcpy(name, attr.za_name); 1001885Sahrens if (idp) 1002885Sahrens *idp = attr.za_first_integer; 10035663Sck153898 if (case_conflict) 10045663Sck153898 *case_conflict = attr.za_normalization_conflict; 1005885Sahrens zap_cursor_advance(&cursor); 1006885Sahrens *offp = zap_cursor_serialize(&cursor); 1007885Sahrens zap_cursor_fini(&cursor); 1008885Sahrens 1009885Sahrens return (0); 1010885Sahrens } 1011885Sahrens 1012885Sahrens int 1013885Sahrens dmu_dir_list_next(objset_t *os, int namelen, char *name, 1014885Sahrens uint64_t *idp, uint64_t *offp) 1015885Sahrens { 1016885Sahrens dsl_dir_t *dd = os->os->os_dsl_dataset->ds_dir; 1017885Sahrens zap_cursor_t cursor; 1018885Sahrens zap_attribute_t attr; 1019885Sahrens 1020885Sahrens /* there is no next dir on a snapshot! */ 1021885Sahrens if (os->os->os_dsl_dataset->ds_object != 1022885Sahrens dd->dd_phys->dd_head_dataset_obj) 1023885Sahrens return (ENOENT); 1024885Sahrens 1025885Sahrens zap_cursor_init_serialized(&cursor, 1026885Sahrens dd->dd_pool->dp_meta_objset, 1027885Sahrens dd->dd_phys->dd_child_dir_zapobj, *offp); 1028885Sahrens 1029885Sahrens if (zap_cursor_retrieve(&cursor, &attr) != 0) { 1030885Sahrens zap_cursor_fini(&cursor); 1031885Sahrens return (ENOENT); 1032885Sahrens } 1033885Sahrens 1034885Sahrens if (strlen(attr.za_name) + 1 > namelen) { 1035885Sahrens zap_cursor_fini(&cursor); 1036789Sahrens return (ENAMETOOLONG); 1037885Sahrens } 1038789Sahrens 1039789Sahrens (void) strcpy(name, attr.za_name); 1040885Sahrens if (idp) 1041885Sahrens *idp = attr.za_first_integer; 1042789Sahrens zap_cursor_advance(&cursor); 1043789Sahrens *offp = zap_cursor_serialize(&cursor); 1044885Sahrens zap_cursor_fini(&cursor); 1045789Sahrens 1046789Sahrens return (0); 1047789Sahrens } 1048789Sahrens 1049789Sahrens /* 1050789Sahrens * Find all objsets under name, and for each, call 'func(child_name, arg)'. 1051789Sahrens */ 10522199Sahrens int 10532199Sahrens dmu_objset_find(char *name, int func(char *, void *), void *arg, int flags) 1054789Sahrens { 1055789Sahrens dsl_dir_t *dd; 1056789Sahrens objset_t *os; 1057789Sahrens uint64_t snapobj; 1058789Sahrens zap_cursor_t zc; 10593978Smmusante zap_attribute_t *attr; 1060789Sahrens char *child; 10611544Seschrock int do_self, err; 1062789Sahrens 10631544Seschrock err = dsl_dir_open(name, FTAG, &dd, NULL); 10641544Seschrock if (err) 10652199Sahrens return (err); 1066789Sahrens 10672199Sahrens /* NB: the $MOS dir doesn't have a head dataset */ 1068789Sahrens do_self = (dd->dd_phys->dd_head_dataset_obj != 0); 10693978Smmusante attr = kmem_alloc(sizeof (zap_attribute_t), KM_SLEEP); 1070789Sahrens 1071789Sahrens /* 1072789Sahrens * Iterate over all children. 1073789Sahrens */ 10742417Sahrens if (flags & DS_FIND_CHILDREN) { 10752417Sahrens for (zap_cursor_init(&zc, dd->dd_pool->dp_meta_objset, 10762417Sahrens dd->dd_phys->dd_child_dir_zapobj); 10773978Smmusante zap_cursor_retrieve(&zc, attr) == 0; 10782417Sahrens (void) zap_cursor_advance(&zc)) { 10793978Smmusante ASSERT(attr->za_integer_length == sizeof (uint64_t)); 10803978Smmusante ASSERT(attr->za_num_integers == 1); 1081789Sahrens 10822417Sahrens /* 10832417Sahrens * No separating '/' because parent's name ends in /. 10842417Sahrens */ 10852417Sahrens child = kmem_alloc(MAXPATHLEN, KM_SLEEP); 10862417Sahrens /* XXX could probably just use name here */ 10872417Sahrens dsl_dir_name(dd, child); 10882417Sahrens (void) strcat(child, "/"); 10893978Smmusante (void) strcat(child, attr->za_name); 10902417Sahrens err = dmu_objset_find(child, func, arg, flags); 10912417Sahrens kmem_free(child, MAXPATHLEN); 10922417Sahrens if (err) 10932417Sahrens break; 10942417Sahrens } 10952417Sahrens zap_cursor_fini(&zc); 10962199Sahrens 10972417Sahrens if (err) { 10982417Sahrens dsl_dir_close(dd, FTAG); 10993978Smmusante kmem_free(attr, sizeof (zap_attribute_t)); 11002417Sahrens return (err); 11012417Sahrens } 1102789Sahrens } 1103789Sahrens 1104789Sahrens /* 1105789Sahrens * Iterate over all snapshots. 1106789Sahrens */ 1107789Sahrens if ((flags & DS_FIND_SNAPSHOTS) && 1108789Sahrens dmu_objset_open(name, DMU_OST_ANY, 1109*6689Smaybee DS_MODE_USER | DS_MODE_READONLY, &os) == 0) { 1110789Sahrens 1111789Sahrens snapobj = os->os->os_dsl_dataset->ds_phys->ds_snapnames_zapobj; 1112789Sahrens dmu_objset_close(os); 1113789Sahrens 1114789Sahrens for (zap_cursor_init(&zc, dd->dd_pool->dp_meta_objset, snapobj); 11153978Smmusante zap_cursor_retrieve(&zc, attr) == 0; 1116789Sahrens (void) zap_cursor_advance(&zc)) { 11173978Smmusante ASSERT(attr->za_integer_length == sizeof (uint64_t)); 11183978Smmusante ASSERT(attr->za_num_integers == 1); 1119789Sahrens 1120789Sahrens child = kmem_alloc(MAXPATHLEN, KM_SLEEP); 1121789Sahrens /* XXX could probably just use name here */ 1122789Sahrens dsl_dir_name(dd, child); 1123789Sahrens (void) strcat(child, "@"); 11243978Smmusante (void) strcat(child, attr->za_name); 11252199Sahrens err = func(child, arg); 1126789Sahrens kmem_free(child, MAXPATHLEN); 11272199Sahrens if (err) 11282199Sahrens break; 1129789Sahrens } 1130885Sahrens zap_cursor_fini(&zc); 1131789Sahrens } 1132789Sahrens 1133789Sahrens dsl_dir_close(dd, FTAG); 11343978Smmusante kmem_free(attr, sizeof (zap_attribute_t)); 1135789Sahrens 11362199Sahrens if (err) 11372199Sahrens return (err); 11382199Sahrens 1139789Sahrens /* 1140789Sahrens * Apply to self if appropriate. 1141789Sahrens */ 1142789Sahrens if (do_self) 11432199Sahrens err = func(name, arg); 11442199Sahrens return (err); 1145789Sahrens } 11465326Sek110237 11475326Sek110237 void 11485326Sek110237 dmu_objset_set_user(objset_t *os, void *user_ptr) 11495326Sek110237 { 11505326Sek110237 ASSERT(MUTEX_HELD(&os->os->os_user_ptr_lock)); 11515326Sek110237 os->os->os_user_ptr = user_ptr; 11525326Sek110237 } 11535326Sek110237 11545326Sek110237 void * 11555326Sek110237 dmu_objset_get_user(objset_t *os) 11565326Sek110237 { 11575326Sek110237 ASSERT(MUTEX_HELD(&os->os->os_user_ptr_lock)); 11585326Sek110237 return (os->os->os_user_ptr); 11595326Sek110237 } 1160