12743Sahrens /* 22743Sahrens * CDDL HEADER START 32743Sahrens * 42743Sahrens * The contents of this file are subject to the terms of the 52743Sahrens * Common Development and Distribution License (the "License"). 62743Sahrens * You may not use this file except in compliance with the License. 72743Sahrens * 82743Sahrens * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE 92743Sahrens * or http://www.opensolaris.org/os/licensing. 102743Sahrens * See the License for the specific language governing permissions 112743Sahrens * and limitations under the License. 122743Sahrens * 132743Sahrens * When distributing Covered Code, include this CDDL HEADER in each 142743Sahrens * file and include the License file at usr/src/OPENSOLARIS.LICENSE. 152743Sahrens * If applicable, add the following below this CDDL HEADER, with the 162743Sahrens * fields enclosed by brackets "[]" replaced with your own identifying 172743Sahrens * information: Portions Copyright [yyyy] [name of copyright owner] 182743Sahrens * 192743Sahrens * CDDL HEADER END 202743Sahrens */ 212743Sahrens /* 2212070SMark.Shellenbaum@Sun.COM * Copyright (c) 2005, 2010, Oracle and/or its affiliates. All rights reserved. 232743Sahrens */ 242743Sahrens 252743Sahrens #include <sys/dmu.h> 262743Sahrens #include <sys/dmu_impl.h> 272743Sahrens #include <sys/dmu_tx.h> 282743Sahrens #include <sys/dbuf.h> 292743Sahrens #include <sys/dnode.h> 302743Sahrens #include <sys/zfs_context.h> 312743Sahrens #include <sys/dmu_objset.h> 322743Sahrens #include <sys/dmu_traverse.h> 332743Sahrens #include <sys/dsl_dataset.h> 342743Sahrens #include <sys/dsl_dir.h> 3511022STom.Erickson@Sun.COM #include <sys/dsl_prop.h> 362743Sahrens #include <sys/dsl_pool.h> 372743Sahrens #include <sys/dsl_synctask.h> 382743Sahrens #include <sys/zfs_ioctl.h> 392743Sahrens #include <sys/zap.h> 402743Sahrens #include <sys/zio_checksum.h> 4112070SMark.Shellenbaum@Sun.COM #include <sys/zfs_znode.h> 42*12470SMatthew.Ahrens@Sun.COM #include <zfs_fletcher.h> 4311007SLori.Alt@Sun.COM #include <sys/avl.h> 4411381SLori.Alt@Sun.COM #include <sys/ddt.h> 452743Sahrens 465367Sahrens static char *dmu_recv_tag = "dmu_recv_tag"; 475367Sahrens 4811007SLori.Alt@Sun.COM /* 4911007SLori.Alt@Sun.COM * The list of data whose inclusion in a send stream can be pending from 5011007SLori.Alt@Sun.COM * one call to backup_cb to another. Multiple calls to dump_free() and 5111007SLori.Alt@Sun.COM * dump_freeobjects() can be aggregated into a single DRR_FREE or 5211007SLori.Alt@Sun.COM * DRR_FREEOBJECTS replay record. 5311007SLori.Alt@Sun.COM */ 5411007SLori.Alt@Sun.COM typedef enum { 5511007SLori.Alt@Sun.COM PENDING_NONE, 5611007SLori.Alt@Sun.COM PENDING_FREE, 5711007SLori.Alt@Sun.COM PENDING_FREEOBJECTS 5811007SLori.Alt@Sun.COM } pendop_t; 5911007SLori.Alt@Sun.COM 602743Sahrens struct backuparg { 612743Sahrens dmu_replay_record_t *drr; 622743Sahrens vnode_t *vp; 635367Sahrens offset_t *off; 642743Sahrens objset_t *os; 652743Sahrens zio_cksum_t zc; 6611007SLori.Alt@Sun.COM uint64_t toguid; 672743Sahrens int err; 6811007SLori.Alt@Sun.COM pendop_t pending_op; 692743Sahrens }; 702743Sahrens 712743Sahrens static int 722743Sahrens dump_bytes(struct backuparg *ba, void *buf, int len) 732743Sahrens { 742743Sahrens ssize_t resid; /* have to get resid to get detailed errno */ 752743Sahrens ASSERT3U(len % 8, ==, 0); 762743Sahrens 772743Sahrens fletcher_4_incremental_native(buf, len, &ba->zc); 782743Sahrens ba->err = vn_rdwr(UIO_WRITE, ba->vp, 792743Sahrens (caddr_t)buf, len, 802743Sahrens 0, UIO_SYSSPACE, FAPPEND, RLIM64_INFINITY, CRED(), &resid); 815367Sahrens *ba->off += len; 822743Sahrens return (ba->err); 832743Sahrens } 842743Sahrens 852743Sahrens static int 862743Sahrens dump_free(struct backuparg *ba, uint64_t object, uint64_t offset, 872743Sahrens uint64_t length) 882743Sahrens { 8911007SLori.Alt@Sun.COM struct drr_free *drrf = &(ba->drr->drr_u.drr_free); 9011007SLori.Alt@Sun.COM 9111007SLori.Alt@Sun.COM /* 9211007SLori.Alt@Sun.COM * If there is a pending op, but it's not PENDING_FREE, push it out, 9311007SLori.Alt@Sun.COM * since free block aggregation can only be done for blocks of the 9411007SLori.Alt@Sun.COM * same type (i.e., DRR_FREE records can only be aggregated with 9511007SLori.Alt@Sun.COM * other DRR_FREE records. DRR_FREEOBJECTS records can only be 9611007SLori.Alt@Sun.COM * aggregated with other DRR_FREEOBJECTS records. 9711007SLori.Alt@Sun.COM */ 9811007SLori.Alt@Sun.COM if (ba->pending_op != PENDING_NONE && ba->pending_op != PENDING_FREE) { 9911007SLori.Alt@Sun.COM if (dump_bytes(ba, ba->drr, sizeof (dmu_replay_record_t)) != 0) 10011007SLori.Alt@Sun.COM return (EINTR); 10111007SLori.Alt@Sun.COM ba->pending_op = PENDING_NONE; 10211007SLori.Alt@Sun.COM } 10311007SLori.Alt@Sun.COM 10411007SLori.Alt@Sun.COM if (ba->pending_op == PENDING_FREE) { 10511007SLori.Alt@Sun.COM /* 10611007SLori.Alt@Sun.COM * There should never be a PENDING_FREE if length is -1 10711007SLori.Alt@Sun.COM * (because dump_dnode is the only place where this 10811007SLori.Alt@Sun.COM * function is called with a -1, and only after flushing 10911007SLori.Alt@Sun.COM * any pending record). 11011007SLori.Alt@Sun.COM */ 11111007SLori.Alt@Sun.COM ASSERT(length != -1ULL); 11211007SLori.Alt@Sun.COM /* 11311007SLori.Alt@Sun.COM * Check to see whether this free block can be aggregated 11411007SLori.Alt@Sun.COM * with pending one. 11511007SLori.Alt@Sun.COM */ 11611007SLori.Alt@Sun.COM if (drrf->drr_object == object && drrf->drr_offset + 11711007SLori.Alt@Sun.COM drrf->drr_length == offset) { 11811007SLori.Alt@Sun.COM drrf->drr_length += length; 11911007SLori.Alt@Sun.COM return (0); 12011007SLori.Alt@Sun.COM } else { 12111007SLori.Alt@Sun.COM /* not a continuation. Push out pending record */ 12211007SLori.Alt@Sun.COM if (dump_bytes(ba, ba->drr, 12311007SLori.Alt@Sun.COM sizeof (dmu_replay_record_t)) != 0) 12411007SLori.Alt@Sun.COM return (EINTR); 12511007SLori.Alt@Sun.COM ba->pending_op = PENDING_NONE; 12611007SLori.Alt@Sun.COM } 12711007SLori.Alt@Sun.COM } 12811007SLori.Alt@Sun.COM /* create a FREE record and make it pending */ 1292743Sahrens bzero(ba->drr, sizeof (dmu_replay_record_t)); 1302743Sahrens ba->drr->drr_type = DRR_FREE; 13111007SLori.Alt@Sun.COM drrf->drr_object = object; 13211007SLori.Alt@Sun.COM drrf->drr_offset = offset; 13311007SLori.Alt@Sun.COM drrf->drr_length = length; 13411007SLori.Alt@Sun.COM drrf->drr_toguid = ba->toguid; 13511007SLori.Alt@Sun.COM if (length == -1ULL) { 13611007SLori.Alt@Sun.COM if (dump_bytes(ba, ba->drr, sizeof (dmu_replay_record_t)) != 0) 13711007SLori.Alt@Sun.COM return (EINTR); 13811007SLori.Alt@Sun.COM } else { 13911007SLori.Alt@Sun.COM ba->pending_op = PENDING_FREE; 14011007SLori.Alt@Sun.COM } 1412743Sahrens 1422743Sahrens return (0); 1432743Sahrens } 1442743Sahrens 1452743Sahrens static int 1462743Sahrens dump_data(struct backuparg *ba, dmu_object_type_t type, 14711381SLori.Alt@Sun.COM uint64_t object, uint64_t offset, int blksz, const blkptr_t *bp, void *data) 1482743Sahrens { 14911007SLori.Alt@Sun.COM struct drr_write *drrw = &(ba->drr->drr_u.drr_write); 15011007SLori.Alt@Sun.COM 15111381SLori.Alt@Sun.COM 15211007SLori.Alt@Sun.COM /* 15311007SLori.Alt@Sun.COM * If there is any kind of pending aggregation (currently either 15411007SLori.Alt@Sun.COM * a grouping of free objects or free blocks), push it out to 15511007SLori.Alt@Sun.COM * the stream, since aggregation can't be done across operations 15611007SLori.Alt@Sun.COM * of different types. 15711007SLori.Alt@Sun.COM */ 15811007SLori.Alt@Sun.COM if (ba->pending_op != PENDING_NONE) { 15911007SLori.Alt@Sun.COM if (dump_bytes(ba, ba->drr, sizeof (dmu_replay_record_t)) != 0) 16011007SLori.Alt@Sun.COM return (EINTR); 16111007SLori.Alt@Sun.COM ba->pending_op = PENDING_NONE; 16211007SLori.Alt@Sun.COM } 1632743Sahrens /* write a DATA record */ 1642743Sahrens bzero(ba->drr, sizeof (dmu_replay_record_t)); 1652743Sahrens ba->drr->drr_type = DRR_WRITE; 16611007SLori.Alt@Sun.COM drrw->drr_object = object; 16711007SLori.Alt@Sun.COM drrw->drr_type = type; 16811007SLori.Alt@Sun.COM drrw->drr_offset = offset; 16911007SLori.Alt@Sun.COM drrw->drr_length = blksz; 17011007SLori.Alt@Sun.COM drrw->drr_toguid = ba->toguid; 17111381SLori.Alt@Sun.COM drrw->drr_checksumtype = BP_GET_CHECKSUM(bp); 17211381SLori.Alt@Sun.COM if (zio_checksum_table[drrw->drr_checksumtype].ci_dedup) 17311381SLori.Alt@Sun.COM drrw->drr_checksumflags |= DRR_CHECKSUM_DEDUP; 17411381SLori.Alt@Sun.COM DDK_SET_LSIZE(&drrw->drr_key, BP_GET_LSIZE(bp)); 17511381SLori.Alt@Sun.COM DDK_SET_PSIZE(&drrw->drr_key, BP_GET_PSIZE(bp)); 17611381SLori.Alt@Sun.COM DDK_SET_COMPRESS(&drrw->drr_key, BP_GET_COMPRESS(bp)); 17711381SLori.Alt@Sun.COM drrw->drr_key.ddk_cksum = bp->blk_cksum; 1782743Sahrens 17911007SLori.Alt@Sun.COM if (dump_bytes(ba, ba->drr, sizeof (dmu_replay_record_t)) != 0) 1802743Sahrens return (EINTR); 18111007SLori.Alt@Sun.COM if (dump_bytes(ba, data, blksz) != 0) 1822743Sahrens return (EINTR); 1832743Sahrens return (0); 1842743Sahrens } 1852743Sahrens 1862743Sahrens static int 18711935SMark.Shellenbaum@Sun.COM dump_spill(struct backuparg *ba, uint64_t object, int blksz, void *data) 18811935SMark.Shellenbaum@Sun.COM { 18911935SMark.Shellenbaum@Sun.COM struct drr_spill *drrs = &(ba->drr->drr_u.drr_spill); 19011935SMark.Shellenbaum@Sun.COM 19111935SMark.Shellenbaum@Sun.COM if (ba->pending_op != PENDING_NONE) { 19211935SMark.Shellenbaum@Sun.COM if (dump_bytes(ba, ba->drr, sizeof (dmu_replay_record_t)) != 0) 19311935SMark.Shellenbaum@Sun.COM return (EINTR); 19411935SMark.Shellenbaum@Sun.COM ba->pending_op = PENDING_NONE; 19511935SMark.Shellenbaum@Sun.COM } 19611935SMark.Shellenbaum@Sun.COM 19711935SMark.Shellenbaum@Sun.COM /* write a SPILL record */ 19811935SMark.Shellenbaum@Sun.COM bzero(ba->drr, sizeof (dmu_replay_record_t)); 19911935SMark.Shellenbaum@Sun.COM ba->drr->drr_type = DRR_SPILL; 20011935SMark.Shellenbaum@Sun.COM drrs->drr_object = object; 20111935SMark.Shellenbaum@Sun.COM drrs->drr_length = blksz; 20211935SMark.Shellenbaum@Sun.COM drrs->drr_toguid = ba->toguid; 20311935SMark.Shellenbaum@Sun.COM 20411935SMark.Shellenbaum@Sun.COM if (dump_bytes(ba, ba->drr, sizeof (dmu_replay_record_t))) 20511935SMark.Shellenbaum@Sun.COM return (EINTR); 20611935SMark.Shellenbaum@Sun.COM if (dump_bytes(ba, data, blksz)) 20711935SMark.Shellenbaum@Sun.COM return (EINTR); 20811935SMark.Shellenbaum@Sun.COM return (0); 20911935SMark.Shellenbaum@Sun.COM } 21011935SMark.Shellenbaum@Sun.COM 21111935SMark.Shellenbaum@Sun.COM static int 2122743Sahrens dump_freeobjects(struct backuparg *ba, uint64_t firstobj, uint64_t numobjs) 2132743Sahrens { 21411007SLori.Alt@Sun.COM struct drr_freeobjects *drrfo = &(ba->drr->drr_u.drr_freeobjects); 21511007SLori.Alt@Sun.COM 21611007SLori.Alt@Sun.COM /* 21711007SLori.Alt@Sun.COM * If there is a pending op, but it's not PENDING_FREEOBJECTS, 21811007SLori.Alt@Sun.COM * push it out, since free block aggregation can only be done for 21911007SLori.Alt@Sun.COM * blocks of the same type (i.e., DRR_FREE records can only be 22011007SLori.Alt@Sun.COM * aggregated with other DRR_FREE records. DRR_FREEOBJECTS records 22111007SLori.Alt@Sun.COM * can only be aggregated with other DRR_FREEOBJECTS records. 22211007SLori.Alt@Sun.COM */ 22311007SLori.Alt@Sun.COM if (ba->pending_op != PENDING_NONE && 22411007SLori.Alt@Sun.COM ba->pending_op != PENDING_FREEOBJECTS) { 22511007SLori.Alt@Sun.COM if (dump_bytes(ba, ba->drr, sizeof (dmu_replay_record_t)) != 0) 22611007SLori.Alt@Sun.COM return (EINTR); 22711007SLori.Alt@Sun.COM ba->pending_op = PENDING_NONE; 22811007SLori.Alt@Sun.COM } 22911007SLori.Alt@Sun.COM if (ba->pending_op == PENDING_FREEOBJECTS) { 23011007SLori.Alt@Sun.COM /* 23111007SLori.Alt@Sun.COM * See whether this free object array can be aggregated 23211007SLori.Alt@Sun.COM * with pending one 23311007SLori.Alt@Sun.COM */ 23411007SLori.Alt@Sun.COM if (drrfo->drr_firstobj + drrfo->drr_numobjs == firstobj) { 23511007SLori.Alt@Sun.COM drrfo->drr_numobjs += numobjs; 23611007SLori.Alt@Sun.COM return (0); 23711007SLori.Alt@Sun.COM } else { 23811007SLori.Alt@Sun.COM /* can't be aggregated. Push out pending record */ 23911007SLori.Alt@Sun.COM if (dump_bytes(ba, ba->drr, 24011007SLori.Alt@Sun.COM sizeof (dmu_replay_record_t)) != 0) 24111007SLori.Alt@Sun.COM return (EINTR); 24211007SLori.Alt@Sun.COM ba->pending_op = PENDING_NONE; 24311007SLori.Alt@Sun.COM } 24411007SLori.Alt@Sun.COM } 24511007SLori.Alt@Sun.COM 2462743Sahrens /* write a FREEOBJECTS record */ 2472743Sahrens bzero(ba->drr, sizeof (dmu_replay_record_t)); 2482743Sahrens ba->drr->drr_type = DRR_FREEOBJECTS; 24911007SLori.Alt@Sun.COM drrfo->drr_firstobj = firstobj; 25011007SLori.Alt@Sun.COM drrfo->drr_numobjs = numobjs; 25111007SLori.Alt@Sun.COM drrfo->drr_toguid = ba->toguid; 2522743Sahrens 25311007SLori.Alt@Sun.COM ba->pending_op = PENDING_FREEOBJECTS; 25411007SLori.Alt@Sun.COM 2552743Sahrens return (0); 2562743Sahrens } 2572743Sahrens 2582743Sahrens static int 2592743Sahrens dump_dnode(struct backuparg *ba, uint64_t object, dnode_phys_t *dnp) 2602743Sahrens { 26111007SLori.Alt@Sun.COM struct drr_object *drro = &(ba->drr->drr_u.drr_object); 26211007SLori.Alt@Sun.COM 2632743Sahrens if (dnp == NULL || dnp->dn_type == DMU_OT_NONE) 2642743Sahrens return (dump_freeobjects(ba, object, 1)); 2652743Sahrens 26611007SLori.Alt@Sun.COM if (ba->pending_op != PENDING_NONE) { 26711007SLori.Alt@Sun.COM if (dump_bytes(ba, ba->drr, sizeof (dmu_replay_record_t)) != 0) 26811007SLori.Alt@Sun.COM return (EINTR); 26911007SLori.Alt@Sun.COM ba->pending_op = PENDING_NONE; 27011007SLori.Alt@Sun.COM } 27111007SLori.Alt@Sun.COM 2722743Sahrens /* write an OBJECT record */ 2732743Sahrens bzero(ba->drr, sizeof (dmu_replay_record_t)); 2742743Sahrens ba->drr->drr_type = DRR_OBJECT; 27511007SLori.Alt@Sun.COM drro->drr_object = object; 27611007SLori.Alt@Sun.COM drro->drr_type = dnp->dn_type; 27711007SLori.Alt@Sun.COM drro->drr_bonustype = dnp->dn_bonustype; 27811007SLori.Alt@Sun.COM drro->drr_blksz = dnp->dn_datablkszsec << SPA_MINBLOCKSHIFT; 27911007SLori.Alt@Sun.COM drro->drr_bonuslen = dnp->dn_bonuslen; 28011007SLori.Alt@Sun.COM drro->drr_checksumtype = dnp->dn_checksum; 28111007SLori.Alt@Sun.COM drro->drr_compress = dnp->dn_compress; 28211007SLori.Alt@Sun.COM drro->drr_toguid = ba->toguid; 2832743Sahrens 28411007SLori.Alt@Sun.COM if (dump_bytes(ba, ba->drr, sizeof (dmu_replay_record_t)) != 0) 2852743Sahrens return (EINTR); 2862743Sahrens 28711007SLori.Alt@Sun.COM if (dump_bytes(ba, DN_BONUS(dnp), P2ROUNDUP(dnp->dn_bonuslen, 8)) != 0) 2882743Sahrens return (EINTR); 2892743Sahrens 2902743Sahrens /* free anything past the end of the file */ 2912743Sahrens if (dump_free(ba, object, (dnp->dn_maxblkid + 1) * 2922743Sahrens (dnp->dn_datablkszsec << SPA_MINBLOCKSHIFT), -1ULL)) 2932743Sahrens return (EINTR); 2942743Sahrens if (ba->err) 2952743Sahrens return (EINTR); 2962743Sahrens return (0); 2972743Sahrens } 2982743Sahrens 2992743Sahrens #define BP_SPAN(dnp, level) \ 3002743Sahrens (((uint64_t)dnp->dn_datablkszsec) << (SPA_MINBLOCKSHIFT + \ 3012743Sahrens (level) * (dnp->dn_indblkshift - SPA_BLKPTRSHIFT))) 3022743Sahrens 30310922SJeff.Bonwick@Sun.COM /* ARGSUSED */ 3042743Sahrens static int 30512296SLin.Ling@Sun.COM backup_cb(spa_t *spa, zilog_t *zilog, const blkptr_t *bp, arc_buf_t *pbuf, 30610922SJeff.Bonwick@Sun.COM const zbookmark_t *zb, const dnode_phys_t *dnp, void *arg) 3072743Sahrens { 3082743Sahrens struct backuparg *ba = arg; 3092743Sahrens dmu_object_type_t type = bp ? BP_GET_TYPE(bp) : DMU_OT_NONE; 3102743Sahrens int err = 0; 3112743Sahrens 3122743Sahrens if (issig(JUSTLOOKING) && issig(FORREAL)) 3132743Sahrens return (EINTR); 3142743Sahrens 31510922SJeff.Bonwick@Sun.COM if (zb->zb_object != DMU_META_DNODE_OBJECT && 31610922SJeff.Bonwick@Sun.COM DMU_OBJECT_IS_SPECIAL(zb->zb_object)) { 3179396SMatthew.Ahrens@Sun.COM return (0); 31810922SJeff.Bonwick@Sun.COM } else if (bp == NULL && zb->zb_object == DMU_META_DNODE_OBJECT) { 3197837SMatthew.Ahrens@Sun.COM uint64_t span = BP_SPAN(dnp, zb->zb_level); 3207837SMatthew.Ahrens@Sun.COM uint64_t dnobj = (zb->zb_blkid * span) >> DNODE_SHIFT; 3212743Sahrens err = dump_freeobjects(ba, dnobj, span >> DNODE_SHIFT); 3222743Sahrens } else if (bp == NULL) { 3237837SMatthew.Ahrens@Sun.COM uint64_t span = BP_SPAN(dnp, zb->zb_level); 3247837SMatthew.Ahrens@Sun.COM err = dump_free(ba, zb->zb_object, zb->zb_blkid * span, span); 3257837SMatthew.Ahrens@Sun.COM } else if (zb->zb_level > 0 || type == DMU_OT_OBJSET) { 3267837SMatthew.Ahrens@Sun.COM return (0); 3277837SMatthew.Ahrens@Sun.COM } else if (type == DMU_OT_DNODE) { 3287837SMatthew.Ahrens@Sun.COM dnode_phys_t *blk; 3292743Sahrens int i; 3302743Sahrens int blksz = BP_GET_LSIZE(bp); 3317837SMatthew.Ahrens@Sun.COM uint32_t aflags = ARC_WAIT; 3327837SMatthew.Ahrens@Sun.COM arc_buf_t *abuf; 3332743Sahrens 33412296SLin.Ling@Sun.COM if (dsl_read(NULL, spa, bp, pbuf, 3357837SMatthew.Ahrens@Sun.COM arc_getbuf_func, &abuf, ZIO_PRIORITY_ASYNC_READ, 3367837SMatthew.Ahrens@Sun.COM ZIO_FLAG_CANFAIL, &aflags, zb) != 0) 3377837SMatthew.Ahrens@Sun.COM return (EIO); 3387837SMatthew.Ahrens@Sun.COM 3397837SMatthew.Ahrens@Sun.COM blk = abuf->b_data; 3402743Sahrens for (i = 0; i < blksz >> DNODE_SHIFT; i++) { 3417837SMatthew.Ahrens@Sun.COM uint64_t dnobj = (zb->zb_blkid << 3427837SMatthew.Ahrens@Sun.COM (DNODE_BLOCK_SHIFT - DNODE_SHIFT)) + i; 3432743Sahrens err = dump_dnode(ba, dnobj, blk+i); 3442743Sahrens if (err) 3452743Sahrens break; 3462743Sahrens } 3477837SMatthew.Ahrens@Sun.COM (void) arc_buf_remove_ref(abuf, &abuf); 34811935SMark.Shellenbaum@Sun.COM } else if (type == DMU_OT_SA) { 34911935SMark.Shellenbaum@Sun.COM uint32_t aflags = ARC_WAIT; 35011935SMark.Shellenbaum@Sun.COM arc_buf_t *abuf; 35111935SMark.Shellenbaum@Sun.COM int blksz = BP_GET_LSIZE(bp); 35211935SMark.Shellenbaum@Sun.COM 35311935SMark.Shellenbaum@Sun.COM if (arc_read_nolock(NULL, spa, bp, 35411935SMark.Shellenbaum@Sun.COM arc_getbuf_func, &abuf, ZIO_PRIORITY_ASYNC_READ, 35511935SMark.Shellenbaum@Sun.COM ZIO_FLAG_CANFAIL, &aflags, zb) != 0) 35611935SMark.Shellenbaum@Sun.COM return (EIO); 35711935SMark.Shellenbaum@Sun.COM 35811935SMark.Shellenbaum@Sun.COM err = dump_spill(ba, zb->zb_object, blksz, abuf->b_data); 35911935SMark.Shellenbaum@Sun.COM (void) arc_buf_remove_ref(abuf, &abuf); 3607837SMatthew.Ahrens@Sun.COM } else { /* it's a level-0 block of a regular object */ 3617837SMatthew.Ahrens@Sun.COM uint32_t aflags = ARC_WAIT; 3627837SMatthew.Ahrens@Sun.COM arc_buf_t *abuf; 3632743Sahrens int blksz = BP_GET_LSIZE(bp); 3642743Sahrens 36512296SLin.Ling@Sun.COM if (dsl_read(NULL, spa, bp, pbuf, 3667837SMatthew.Ahrens@Sun.COM arc_getbuf_func, &abuf, ZIO_PRIORITY_ASYNC_READ, 3677837SMatthew.Ahrens@Sun.COM ZIO_FLAG_CANFAIL, &aflags, zb) != 0) 3687837SMatthew.Ahrens@Sun.COM return (EIO); 3692743Sahrens 3707837SMatthew.Ahrens@Sun.COM err = dump_data(ba, type, zb->zb_object, zb->zb_blkid * blksz, 37111381SLori.Alt@Sun.COM blksz, bp, abuf->b_data); 3727837SMatthew.Ahrens@Sun.COM (void) arc_buf_remove_ref(abuf, &abuf); 3732743Sahrens } 3742743Sahrens 3752743Sahrens ASSERT(err == 0 || err == EINTR); 3762743Sahrens return (err); 3772743Sahrens } 3782743Sahrens 3792743Sahrens int 3805367Sahrens dmu_sendbackup(objset_t *tosnap, objset_t *fromsnap, boolean_t fromorigin, 3815367Sahrens vnode_t *vp, offset_t *off) 3822743Sahrens { 38310298SMatthew.Ahrens@Sun.COM dsl_dataset_t *ds = tosnap->os_dsl_dataset; 38410298SMatthew.Ahrens@Sun.COM dsl_dataset_t *fromds = fromsnap ? fromsnap->os_dsl_dataset : NULL; 3852743Sahrens dmu_replay_record_t *drr; 3862743Sahrens struct backuparg ba; 3872743Sahrens int err; 3885367Sahrens uint64_t fromtxg = 0; 3892743Sahrens 3902743Sahrens /* tosnap must be a snapshot */ 3912743Sahrens if (ds->ds_phys->ds_next_snap_obj == 0) 3922743Sahrens return (EINVAL); 3932743Sahrens 3942743Sahrens /* fromsnap must be an earlier snapshot from the same fs as tosnap */ 3952743Sahrens if (fromds && (ds->ds_dir != fromds->ds_dir || 3965367Sahrens fromds->ds_phys->ds_creation_txg >= ds->ds_phys->ds_creation_txg)) 3972743Sahrens return (EXDEV); 3982743Sahrens 3995367Sahrens if (fromorigin) { 4007046Sahrens dsl_pool_t *dp = ds->ds_dir->dd_pool; 4017046Sahrens 4025367Sahrens if (fromsnap) 4035367Sahrens return (EINVAL); 4045367Sahrens 4057046Sahrens if (dsl_dir_is_clone(ds->ds_dir)) { 4065367Sahrens rw_enter(&dp->dp_config_rwlock, RW_READER); 4076689Smaybee err = dsl_dataset_hold_obj(dp, 4086689Smaybee ds->ds_dir->dd_phys->dd_origin_obj, FTAG, &fromds); 4095367Sahrens rw_exit(&dp->dp_config_rwlock); 4105367Sahrens if (err) 4115367Sahrens return (err); 4125367Sahrens } else { 4135367Sahrens fromorigin = B_FALSE; 4145367Sahrens } 4155367Sahrens } 4165367Sahrens 4175367Sahrens 4182743Sahrens drr = kmem_zalloc(sizeof (dmu_replay_record_t), KM_SLEEP); 4192743Sahrens drr->drr_type = DRR_BEGIN; 4202743Sahrens drr->drr_u.drr_begin.drr_magic = DMU_BACKUP_MAGIC; 42111007SLori.Alt@Sun.COM DMU_SET_STREAM_HDRTYPE(drr->drr_u.drr_begin.drr_versioninfo, 42211007SLori.Alt@Sun.COM DMU_SUBSTREAM); 42312070SMark.Shellenbaum@Sun.COM 42412070SMark.Shellenbaum@Sun.COM #ifdef _KERNEL 42512070SMark.Shellenbaum@Sun.COM if (dmu_objset_type(tosnap) == DMU_OST_ZFS) { 42612070SMark.Shellenbaum@Sun.COM uint64_t version; 42712070SMark.Shellenbaum@Sun.COM if (zfs_get_zplprop(tosnap, ZFS_PROP_VERSION, &version) != 0) 42812070SMark.Shellenbaum@Sun.COM return (EINVAL); 42912070SMark.Shellenbaum@Sun.COM if (version == ZPL_VERSION_SA) { 43012070SMark.Shellenbaum@Sun.COM DMU_SET_FEATUREFLAGS( 43112070SMark.Shellenbaum@Sun.COM drr->drr_u.drr_begin.drr_versioninfo, 43212070SMark.Shellenbaum@Sun.COM DMU_BACKUP_FEATURE_SA_SPILL); 43312070SMark.Shellenbaum@Sun.COM } 43412070SMark.Shellenbaum@Sun.COM } 43512070SMark.Shellenbaum@Sun.COM #endif 43612070SMark.Shellenbaum@Sun.COM 4372743Sahrens drr->drr_u.drr_begin.drr_creation_time = 4382743Sahrens ds->ds_phys->ds_creation_time; 43910298SMatthew.Ahrens@Sun.COM drr->drr_u.drr_begin.drr_type = tosnap->os_phys->os_type; 4405367Sahrens if (fromorigin) 4415367Sahrens drr->drr_u.drr_begin.drr_flags |= DRR_FLAG_CLONE; 4422743Sahrens drr->drr_u.drr_begin.drr_toguid = ds->ds_phys->ds_guid; 4436492Stimh if (ds->ds_phys->ds_flags & DS_FLAG_CI_DATASET) 4446492Stimh drr->drr_u.drr_begin.drr_flags |= DRR_FLAG_CI_DATA; 4456492Stimh 4462743Sahrens if (fromds) 4472743Sahrens drr->drr_u.drr_begin.drr_fromguid = fromds->ds_phys->ds_guid; 4482743Sahrens dsl_dataset_name(ds, drr->drr_u.drr_begin.drr_toname); 4492743Sahrens 4505367Sahrens if (fromds) 4515367Sahrens fromtxg = fromds->ds_phys->ds_creation_txg; 4525367Sahrens if (fromorigin) 4536689Smaybee dsl_dataset_rele(fromds, FTAG); 4545367Sahrens 4552743Sahrens ba.drr = drr; 4562743Sahrens ba.vp = vp; 4572743Sahrens ba.os = tosnap; 4585367Sahrens ba.off = off; 45911007SLori.Alt@Sun.COM ba.toguid = ds->ds_phys->ds_guid; 4602743Sahrens ZIO_SET_CHECKSUM(&ba.zc, 0, 0, 0, 0); 46111007SLori.Alt@Sun.COM ba.pending_op = PENDING_NONE; 4622743Sahrens 46311007SLori.Alt@Sun.COM if (dump_bytes(&ba, drr, sizeof (dmu_replay_record_t)) != 0) { 4642743Sahrens kmem_free(drr, sizeof (dmu_replay_record_t)); 4652743Sahrens return (ba.err); 4662743Sahrens } 4672743Sahrens 4687837SMatthew.Ahrens@Sun.COM err = traverse_dataset(ds, fromtxg, TRAVERSE_PRE | TRAVERSE_PREFETCH, 4692743Sahrens backup_cb, &ba); 4702743Sahrens 47111007SLori.Alt@Sun.COM if (ba.pending_op != PENDING_NONE) 47211007SLori.Alt@Sun.COM if (dump_bytes(&ba, drr, sizeof (dmu_replay_record_t)) != 0) 47311007SLori.Alt@Sun.COM err = EINTR; 47411007SLori.Alt@Sun.COM 4752743Sahrens if (err) { 4762743Sahrens if (err == EINTR && ba.err) 4772743Sahrens err = ba.err; 4783655Sgw25295 kmem_free(drr, sizeof (dmu_replay_record_t)); 4792743Sahrens return (err); 4802743Sahrens } 4812743Sahrens 4822743Sahrens bzero(drr, sizeof (dmu_replay_record_t)); 4832743Sahrens drr->drr_type = DRR_END; 4842743Sahrens drr->drr_u.drr_end.drr_checksum = ba.zc; 48511007SLori.Alt@Sun.COM drr->drr_u.drr_end.drr_toguid = ba.toguid; 4862743Sahrens 48711007SLori.Alt@Sun.COM if (dump_bytes(&ba, drr, sizeof (dmu_replay_record_t)) != 0) { 4883655Sgw25295 kmem_free(drr, sizeof (dmu_replay_record_t)); 4892743Sahrens return (ba.err); 4903655Sgw25295 } 4912743Sahrens 4922743Sahrens kmem_free(drr, sizeof (dmu_replay_record_t)); 4932743Sahrens 4942743Sahrens return (0); 4952743Sahrens } 4962743Sahrens 4975367Sahrens struct recvbeginsyncarg { 4985367Sahrens const char *tofs; 4995367Sahrens const char *tosnap; 5005367Sahrens dsl_dataset_t *origin; 5015367Sahrens uint64_t fromguid; 5025367Sahrens dmu_objset_type_t type; 5035367Sahrens void *tag; 5045367Sahrens boolean_t force; 5056492Stimh uint64_t dsflags; 5065367Sahrens char clonelastname[MAXNAMELEN]; 5075367Sahrens dsl_dataset_t *ds; /* the ds to recv into; returned from the syncfunc */ 50812296SLin.Ling@Sun.COM cred_t *cr; 5092743Sahrens }; 5102743Sahrens 5115367Sahrens /* ARGSUSED */ 5122743Sahrens static int 51310272SMatthew.Ahrens@Sun.COM recv_new_check(void *arg1, void *arg2, dmu_tx_t *tx) 5145367Sahrens { 5155367Sahrens dsl_dir_t *dd = arg1; 5165367Sahrens struct recvbeginsyncarg *rbsa = arg2; 5175367Sahrens objset_t *mos = dd->dd_pool->dp_meta_objset; 5185367Sahrens uint64_t val; 5195367Sahrens int err; 5205367Sahrens 5215367Sahrens err = zap_lookup(mos, dd->dd_phys->dd_child_dir_zapobj, 5225367Sahrens strrchr(rbsa->tofs, '/') + 1, sizeof (uint64_t), 1, &val); 5235367Sahrens 5245367Sahrens if (err != ENOENT) 5255367Sahrens return (err ? err : EEXIST); 5265367Sahrens 5275367Sahrens if (rbsa->origin) { 5285367Sahrens /* make sure it's a snap in the same pool */ 5295367Sahrens if (rbsa->origin->ds_dir->dd_pool != dd->dd_pool) 5305367Sahrens return (EXDEV); 53110272SMatthew.Ahrens@Sun.COM if (!dsl_dataset_is_snapshot(rbsa->origin)) 5325367Sahrens return (EINVAL); 5335367Sahrens if (rbsa->origin->ds_phys->ds_guid != rbsa->fromguid) 5345367Sahrens return (ENODEV); 5355367Sahrens } 5365367Sahrens 5375367Sahrens return (0); 5385367Sahrens } 5395367Sahrens 5405367Sahrens static void 54112296SLin.Ling@Sun.COM recv_new_sync(void *arg1, void *arg2, dmu_tx_t *tx) 5425367Sahrens { 5435367Sahrens dsl_dir_t *dd = arg1; 5445367Sahrens struct recvbeginsyncarg *rbsa = arg2; 5456689Smaybee uint64_t flags = DS_FLAG_INCONSISTENT | rbsa->dsflags; 5465367Sahrens uint64_t dsobj; 5475367Sahrens 54810272SMatthew.Ahrens@Sun.COM /* Create and open new dataset. */ 5495367Sahrens dsobj = dsl_dataset_create_sync(dd, strrchr(rbsa->tofs, '/') + 1, 55012296SLin.Ling@Sun.COM rbsa->origin, flags, rbsa->cr, tx); 55110272SMatthew.Ahrens@Sun.COM VERIFY(0 == dsl_dataset_own_obj(dd->dd_pool, dsobj, 55210298SMatthew.Ahrens@Sun.COM B_TRUE, dmu_recv_tag, &rbsa->ds)); 5535367Sahrens 55410272SMatthew.Ahrens@Sun.COM if (rbsa->origin == NULL) { 55510272SMatthew.Ahrens@Sun.COM (void) dmu_objset_create_impl(dd->dd_pool->dp_spa, 55610272SMatthew.Ahrens@Sun.COM rbsa->ds, &rbsa->ds->ds_phys->ds_bp, rbsa->type, tx); 5575367Sahrens } 5585367Sahrens 55912296SLin.Ling@Sun.COM spa_history_log_internal(LOG_DS_REPLAY_FULL_SYNC, 56012296SLin.Ling@Sun.COM dd->dd_pool->dp_spa, tx, "dataset = %lld", dsobj); 5615367Sahrens } 5625367Sahrens 5635367Sahrens /* ARGSUSED */ 5645367Sahrens static int 56510272SMatthew.Ahrens@Sun.COM recv_existing_check(void *arg1, void *arg2, dmu_tx_t *tx) 5665367Sahrens { 5675367Sahrens dsl_dataset_t *ds = arg1; 5685367Sahrens struct recvbeginsyncarg *rbsa = arg2; 5692743Sahrens int err; 5702743Sahrens uint64_t val; 5712743Sahrens 5725367Sahrens /* must not have any changes since most recent snapshot */ 5735367Sahrens if (!rbsa->force && dsl_dataset_modified_since_lastsnap(ds)) 5745367Sahrens return (ETXTBSY); 5755367Sahrens 57610272SMatthew.Ahrens@Sun.COM if (rbsa->fromguid) { 57710272SMatthew.Ahrens@Sun.COM /* if incremental, most recent snapshot must match fromguid */ 57810272SMatthew.Ahrens@Sun.COM if (ds->ds_prev == NULL) 57910272SMatthew.Ahrens@Sun.COM return (ENODEV); 58011022STom.Erickson@Sun.COM 58111022STom.Erickson@Sun.COM /* 58211022STom.Erickson@Sun.COM * most recent snapshot must match fromguid, or there are no 58311022STom.Erickson@Sun.COM * changes since the fromguid one 58411022STom.Erickson@Sun.COM */ 58511022STom.Erickson@Sun.COM if (ds->ds_prev->ds_phys->ds_guid != rbsa->fromguid) { 58611022STom.Erickson@Sun.COM uint64_t birth = ds->ds_prev->ds_phys->ds_bp.blk_birth; 58711022STom.Erickson@Sun.COM uint64_t obj = ds->ds_prev->ds_phys->ds_prev_snap_obj; 58811022STom.Erickson@Sun.COM while (obj != 0) { 58911022STom.Erickson@Sun.COM dsl_dataset_t *snap; 59011022STom.Erickson@Sun.COM err = dsl_dataset_hold_obj(ds->ds_dir->dd_pool, 59111022STom.Erickson@Sun.COM obj, FTAG, &snap); 59211022STom.Erickson@Sun.COM if (err) 59311022STom.Erickson@Sun.COM return (ENODEV); 59411022STom.Erickson@Sun.COM if (snap->ds_phys->ds_creation_txg < birth) { 59511022STom.Erickson@Sun.COM dsl_dataset_rele(snap, FTAG); 59611022STom.Erickson@Sun.COM return (ENODEV); 59711022STom.Erickson@Sun.COM } 59811022STom.Erickson@Sun.COM if (snap->ds_phys->ds_guid == rbsa->fromguid) { 59911022STom.Erickson@Sun.COM dsl_dataset_rele(snap, FTAG); 60011022STom.Erickson@Sun.COM break; /* it's ok */ 60111022STom.Erickson@Sun.COM } 60211022STom.Erickson@Sun.COM obj = snap->ds_phys->ds_prev_snap_obj; 60311022STom.Erickson@Sun.COM dsl_dataset_rele(snap, FTAG); 60411022STom.Erickson@Sun.COM } 60511022STom.Erickson@Sun.COM if (obj == 0) 60611022STom.Erickson@Sun.COM return (ENODEV); 60711022STom.Erickson@Sun.COM } 60810272SMatthew.Ahrens@Sun.COM } else { 60910272SMatthew.Ahrens@Sun.COM /* if full, most recent snapshot must be $ORIGIN */ 61010272SMatthew.Ahrens@Sun.COM if (ds->ds_phys->ds_prev_snap_txg >= TXG_INITIAL) 61110272SMatthew.Ahrens@Sun.COM return (ENODEV); 61210272SMatthew.Ahrens@Sun.COM } 6132743Sahrens 6146083Sek110237 /* temporary clone name must not exist */ 6156083Sek110237 err = zap_lookup(ds->ds_dir->dd_pool->dp_meta_objset, 6166083Sek110237 ds->ds_dir->dd_phys->dd_child_dir_zapobj, 6176083Sek110237 rbsa->clonelastname, 8, 1, &val); 6186083Sek110237 if (err == 0) 6196083Sek110237 return (EEXIST); 6206083Sek110237 if (err != ENOENT) 6216083Sek110237 return (err); 6226083Sek110237 6232743Sahrens /* new snapshot name must not exist */ 6245367Sahrens err = zap_lookup(ds->ds_dir->dd_pool->dp_meta_objset, 6255367Sahrens ds->ds_phys->ds_snapnames_zapobj, rbsa->tosnap, 8, 1, &val); 6265367Sahrens if (err == 0) 6272743Sahrens return (EEXIST); 6282743Sahrens if (err != ENOENT) 6295367Sahrens return (err); 6302743Sahrens return (0); 6312743Sahrens } 6322743Sahrens 6332743Sahrens /* ARGSUSED */ 6345367Sahrens static void 63512296SLin.Ling@Sun.COM recv_existing_sync(void *arg1, void *arg2, dmu_tx_t *tx) 6365326Sek110237 { 6375367Sahrens dsl_dataset_t *ohds = arg1; 6385367Sahrens struct recvbeginsyncarg *rbsa = arg2; 6395367Sahrens dsl_pool_t *dp = ohds->ds_dir->dd_pool; 64010272SMatthew.Ahrens@Sun.COM dsl_dataset_t *cds; 6416689Smaybee uint64_t flags = DS_FLAG_INCONSISTENT | rbsa->dsflags; 6425367Sahrens uint64_t dsobj; 6435326Sek110237 64410272SMatthew.Ahrens@Sun.COM /* create and open the temporary clone */ 64510272SMatthew.Ahrens@Sun.COM dsobj = dsl_dataset_create_sync(ohds->ds_dir, rbsa->clonelastname, 64612296SLin.Ling@Sun.COM ohds->ds_prev, flags, rbsa->cr, tx); 64710298SMatthew.Ahrens@Sun.COM VERIFY(0 == dsl_dataset_own_obj(dp, dsobj, B_TRUE, dmu_recv_tag, &cds)); 6485367Sahrens 64910272SMatthew.Ahrens@Sun.COM /* 65010272SMatthew.Ahrens@Sun.COM * If we actually created a non-clone, we need to create the 65110272SMatthew.Ahrens@Sun.COM * objset in our new dataset. 65210272SMatthew.Ahrens@Sun.COM */ 65310272SMatthew.Ahrens@Sun.COM if (BP_IS_HOLE(dsl_dataset_get_blkptr(cds))) { 65410272SMatthew.Ahrens@Sun.COM (void) dmu_objset_create_impl(dp->dp_spa, 65510272SMatthew.Ahrens@Sun.COM cds, dsl_dataset_get_blkptr(cds), rbsa->type, tx); 65610272SMatthew.Ahrens@Sun.COM } 65710272SMatthew.Ahrens@Sun.COM 6585367Sahrens rbsa->ds = cds; 6595367Sahrens 66012296SLin.Ling@Sun.COM spa_history_log_internal(LOG_DS_REPLAY_INC_SYNC, 66112296SLin.Ling@Sun.COM dp->dp_spa, tx, "dataset = %lld", dsobj); 6625326Sek110237 } 6635326Sek110237 66412070SMark.Shellenbaum@Sun.COM 66512070SMark.Shellenbaum@Sun.COM static boolean_t 66612070SMark.Shellenbaum@Sun.COM dmu_recv_verify_features(dsl_dataset_t *ds, struct drr_begin *drrb) 66712070SMark.Shellenbaum@Sun.COM { 66812070SMark.Shellenbaum@Sun.COM int featureflags; 66912070SMark.Shellenbaum@Sun.COM 67012070SMark.Shellenbaum@Sun.COM featureflags = DMU_GET_FEATUREFLAGS(drrb->drr_versioninfo); 67112070SMark.Shellenbaum@Sun.COM 67212070SMark.Shellenbaum@Sun.COM /* Verify pool version supports SA if SA_SPILL feature set */ 67312070SMark.Shellenbaum@Sun.COM return ((featureflags & DMU_BACKUP_FEATURE_SA_SPILL) && 67412070SMark.Shellenbaum@Sun.COM (spa_version(dsl_dataset_get_spa(ds)) < SPA_VERSION_SA)); 67512070SMark.Shellenbaum@Sun.COM } 67612070SMark.Shellenbaum@Sun.COM 6775367Sahrens /* 6785367Sahrens * NB: callers *MUST* call dmu_recv_stream() if dmu_recv_begin() 6795367Sahrens * succeeds; otherwise we will leak the holds on the datasets. 6805367Sahrens */ 6815367Sahrens int 68211007SLori.Alt@Sun.COM dmu_recv_begin(char *tofs, char *tosnap, char *top_ds, struct drr_begin *drrb, 68310204SMatthew.Ahrens@Sun.COM boolean_t force, objset_t *origin, dmu_recv_cookie_t *drc) 6842743Sahrens { 6855367Sahrens int err = 0; 6865367Sahrens boolean_t byteswap; 68710272SMatthew.Ahrens@Sun.COM struct recvbeginsyncarg rbsa = { 0 }; 68811007SLori.Alt@Sun.COM uint64_t versioninfo; 6895367Sahrens int flags; 6905367Sahrens dsl_dataset_t *ds; 6915367Sahrens 6925367Sahrens if (drrb->drr_magic == DMU_BACKUP_MAGIC) 6935367Sahrens byteswap = FALSE; 6945367Sahrens else if (drrb->drr_magic == BSWAP_64(DMU_BACKUP_MAGIC)) 6955367Sahrens byteswap = TRUE; 6965367Sahrens else 6975367Sahrens return (EINVAL); 6985367Sahrens 6995367Sahrens rbsa.tofs = tofs; 7005367Sahrens rbsa.tosnap = tosnap; 70110298SMatthew.Ahrens@Sun.COM rbsa.origin = origin ? origin->os_dsl_dataset : NULL; 7025367Sahrens rbsa.fromguid = drrb->drr_fromguid; 7035367Sahrens rbsa.type = drrb->drr_type; 7045367Sahrens rbsa.tag = FTAG; 7056492Stimh rbsa.dsflags = 0; 70612296SLin.Ling@Sun.COM rbsa.cr = CRED(); 70711007SLori.Alt@Sun.COM versioninfo = drrb->drr_versioninfo; 7085367Sahrens flags = drrb->drr_flags; 7095367Sahrens 7105367Sahrens if (byteswap) { 7115367Sahrens rbsa.type = BSWAP_32(rbsa.type); 7125367Sahrens rbsa.fromguid = BSWAP_64(rbsa.fromguid); 71311007SLori.Alt@Sun.COM versioninfo = BSWAP_64(versioninfo); 7145367Sahrens flags = BSWAP_32(flags); 7155367Sahrens } 7165367Sahrens 71711007SLori.Alt@Sun.COM if (DMU_GET_STREAM_HDRTYPE(versioninfo) == DMU_COMPOUNDSTREAM || 7185367Sahrens rbsa.type >= DMU_OST_NUMTYPES || 7195367Sahrens ((flags & DRR_FLAG_CLONE) && origin == NULL)) 7205367Sahrens return (EINVAL); 7215367Sahrens 7226492Stimh if (flags & DRR_FLAG_CI_DATA) 7236492Stimh rbsa.dsflags = DS_FLAG_CI_DATASET; 7246492Stimh 7255367Sahrens bzero(drc, sizeof (dmu_recv_cookie_t)); 7265367Sahrens drc->drc_drrb = drrb; 7275367Sahrens drc->drc_tosnap = tosnap; 72811007SLori.Alt@Sun.COM drc->drc_top_ds = top_ds; 7295367Sahrens drc->drc_force = force; 7305367Sahrens 7315367Sahrens /* 7325367Sahrens * Process the begin in syncing context. 7335367Sahrens */ 73410272SMatthew.Ahrens@Sun.COM 73510272SMatthew.Ahrens@Sun.COM /* open the dataset we are logically receiving into */ 73610272SMatthew.Ahrens@Sun.COM err = dsl_dataset_hold(tofs, dmu_recv_tag, &ds); 73710272SMatthew.Ahrens@Sun.COM if (err == 0) { 73812070SMark.Shellenbaum@Sun.COM if (dmu_recv_verify_features(ds, drrb)) { 73912070SMark.Shellenbaum@Sun.COM dsl_dataset_rele(ds, dmu_recv_tag); 74012070SMark.Shellenbaum@Sun.COM return (ENOTSUP); 74112070SMark.Shellenbaum@Sun.COM } 74210272SMatthew.Ahrens@Sun.COM /* target fs already exists; recv into temp clone */ 7435367Sahrens 74410272SMatthew.Ahrens@Sun.COM /* Can't recv a clone into an existing fs */ 74510272SMatthew.Ahrens@Sun.COM if (flags & DRR_FLAG_CLONE) { 74610272SMatthew.Ahrens@Sun.COM dsl_dataset_rele(ds, dmu_recv_tag); 74710272SMatthew.Ahrens@Sun.COM return (EINVAL); 74810272SMatthew.Ahrens@Sun.COM } 7492743Sahrens 75010204SMatthew.Ahrens@Sun.COM /* must not have an incremental recv already in progress */ 75110204SMatthew.Ahrens@Sun.COM if (!mutex_tryenter(&ds->ds_recvlock)) { 75210204SMatthew.Ahrens@Sun.COM dsl_dataset_rele(ds, dmu_recv_tag); 75310204SMatthew.Ahrens@Sun.COM return (EBUSY); 75410204SMatthew.Ahrens@Sun.COM } 75510204SMatthew.Ahrens@Sun.COM 75610272SMatthew.Ahrens@Sun.COM /* tmp clone name is: tofs/%tosnap" */ 75710272SMatthew.Ahrens@Sun.COM (void) snprintf(rbsa.clonelastname, sizeof (rbsa.clonelastname), 75810272SMatthew.Ahrens@Sun.COM "%%%s", tosnap); 7595367Sahrens rbsa.force = force; 7605367Sahrens err = dsl_sync_task_do(ds->ds_dir->dd_pool, 76110272SMatthew.Ahrens@Sun.COM recv_existing_check, recv_existing_sync, ds, &rbsa, 5); 7625367Sahrens if (err) { 76310204SMatthew.Ahrens@Sun.COM mutex_exit(&ds->ds_recvlock); 7646689Smaybee dsl_dataset_rele(ds, dmu_recv_tag); 7655367Sahrens return (err); 7665367Sahrens } 7675367Sahrens drc->drc_logical_ds = ds; 7685367Sahrens drc->drc_real_ds = rbsa.ds; 76910272SMatthew.Ahrens@Sun.COM } else if (err == ENOENT) { 77010272SMatthew.Ahrens@Sun.COM /* target fs does not exist; must be a full backup or clone */ 77110272SMatthew.Ahrens@Sun.COM char *cp; 7725367Sahrens 77310272SMatthew.Ahrens@Sun.COM /* 77410272SMatthew.Ahrens@Sun.COM * If it's a non-clone incremental, we are missing the 77510272SMatthew.Ahrens@Sun.COM * target fs, so fail the recv. 77610272SMatthew.Ahrens@Sun.COM */ 77710272SMatthew.Ahrens@Sun.COM if (rbsa.fromguid && !(flags & DRR_FLAG_CLONE)) 77810272SMatthew.Ahrens@Sun.COM return (ENOENT); 77910272SMatthew.Ahrens@Sun.COM 78010272SMatthew.Ahrens@Sun.COM /* Open the parent of tofs */ 78110272SMatthew.Ahrens@Sun.COM cp = strrchr(tofs, '/'); 78210272SMatthew.Ahrens@Sun.COM *cp = '\0'; 78310819SChris.Kirby@sun.com err = dsl_dataset_hold(tofs, FTAG, &ds); 78410272SMatthew.Ahrens@Sun.COM *cp = '/'; 7855367Sahrens if (err) 7865367Sahrens return (err); 7875367Sahrens 78812070SMark.Shellenbaum@Sun.COM if (dmu_recv_verify_features(ds, drrb)) { 78912070SMark.Shellenbaum@Sun.COM dsl_dataset_rele(ds, dmu_recv_tag); 79012070SMark.Shellenbaum@Sun.COM return (ENOTSUP); 79112070SMark.Shellenbaum@Sun.COM } 79212070SMark.Shellenbaum@Sun.COM 79310272SMatthew.Ahrens@Sun.COM err = dsl_sync_task_do(ds->ds_dir->dd_pool, 79410272SMatthew.Ahrens@Sun.COM recv_new_check, recv_new_sync, ds->ds_dir, &rbsa, 5); 79510819SChris.Kirby@sun.com dsl_dataset_rele(ds, FTAG); 7965367Sahrens if (err) 7975367Sahrens return (err); 7985367Sahrens drc->drc_logical_ds = drc->drc_real_ds = rbsa.ds; 7995367Sahrens drc->drc_newfs = B_TRUE; 8005367Sahrens } 8015367Sahrens 80210272SMatthew.Ahrens@Sun.COM return (err); 8032743Sahrens } 8042743Sahrens 8055367Sahrens struct restorearg { 8065367Sahrens int err; 8075367Sahrens int byteswap; 8085367Sahrens vnode_t *vp; 8095367Sahrens char *buf; 8105367Sahrens uint64_t voff; 8115367Sahrens int bufsize; /* amount of memory allocated for buf */ 8125367Sahrens zio_cksum_t cksum; 81311007SLori.Alt@Sun.COM avl_tree_t guid_to_ds_map; 8145326Sek110237 }; 8155326Sek110237 81611007SLori.Alt@Sun.COM typedef struct guid_map_entry { 81711007SLori.Alt@Sun.COM uint64_t guid; 81811007SLori.Alt@Sun.COM dsl_dataset_t *gme_ds; 81911007SLori.Alt@Sun.COM avl_node_t avlnode; 82011007SLori.Alt@Sun.COM } guid_map_entry_t; 82111007SLori.Alt@Sun.COM 82211007SLori.Alt@Sun.COM static int 82311007SLori.Alt@Sun.COM guid_compare(const void *arg1, const void *arg2) 82411007SLori.Alt@Sun.COM { 82511007SLori.Alt@Sun.COM const guid_map_entry_t *gmep1 = arg1; 82611007SLori.Alt@Sun.COM const guid_map_entry_t *gmep2 = arg2; 82711007SLori.Alt@Sun.COM 82811007SLori.Alt@Sun.COM if (gmep1->guid < gmep2->guid) 82911007SLori.Alt@Sun.COM return (-1); 83011007SLori.Alt@Sun.COM else if (gmep1->guid > gmep2->guid) 83111007SLori.Alt@Sun.COM return (1); 83211007SLori.Alt@Sun.COM return (0); 83311007SLori.Alt@Sun.COM } 83411007SLori.Alt@Sun.COM 83511007SLori.Alt@Sun.COM /* 83611007SLori.Alt@Sun.COM * This function is a callback used by dmu_objset_find() (which 83711007SLori.Alt@Sun.COM * enumerates the object sets) to build an avl tree that maps guids 83811007SLori.Alt@Sun.COM * to datasets. The resulting table is used when processing DRR_WRITE_BYREF 83911007SLori.Alt@Sun.COM * send stream records. These records, which are used in dedup'ed 84011007SLori.Alt@Sun.COM * streams, do not contain data themselves, but refer to a copy 84111007SLori.Alt@Sun.COM * of the data block that has already been written because it was 84211007SLori.Alt@Sun.COM * earlier in the stream. That previous copy is identified by the 84311007SLori.Alt@Sun.COM * guid of the dataset with the referenced data. 84411007SLori.Alt@Sun.COM */ 84511007SLori.Alt@Sun.COM int 84611209SMatthew.Ahrens@Sun.COM find_ds_by_guid(const char *name, void *arg) 84711007SLori.Alt@Sun.COM { 84811209SMatthew.Ahrens@Sun.COM avl_tree_t *guid_map = arg; 84911007SLori.Alt@Sun.COM dsl_dataset_t *ds, *snapds; 85011007SLori.Alt@Sun.COM guid_map_entry_t *gmep; 85111209SMatthew.Ahrens@Sun.COM dsl_pool_t *dp; 85211007SLori.Alt@Sun.COM int err; 85311007SLori.Alt@Sun.COM uint64_t lastobj, firstobj; 85411007SLori.Alt@Sun.COM 85511007SLori.Alt@Sun.COM if (dsl_dataset_hold(name, FTAG, &ds) != 0) 85611007SLori.Alt@Sun.COM return (0); 85711007SLori.Alt@Sun.COM 85811007SLori.Alt@Sun.COM dp = ds->ds_dir->dd_pool; 85911007SLori.Alt@Sun.COM rw_enter(&dp->dp_config_rwlock, RW_READER); 86011007SLori.Alt@Sun.COM firstobj = ds->ds_dir->dd_phys->dd_origin_obj; 86111007SLori.Alt@Sun.COM lastobj = ds->ds_phys->ds_prev_snap_obj; 86211007SLori.Alt@Sun.COM 86311007SLori.Alt@Sun.COM while (lastobj != firstobj) { 86411007SLori.Alt@Sun.COM err = dsl_dataset_hold_obj(dp, lastobj, guid_map, &snapds); 86511007SLori.Alt@Sun.COM if (err) { 86611007SLori.Alt@Sun.COM /* 86711007SLori.Alt@Sun.COM * Skip this snapshot and move on. It's not 86811007SLori.Alt@Sun.COM * clear why this would ever happen, but the 86911007SLori.Alt@Sun.COM * remainder of the snapshot streadm can be 87011007SLori.Alt@Sun.COM * processed. 87111007SLori.Alt@Sun.COM */ 87211007SLori.Alt@Sun.COM rw_exit(&dp->dp_config_rwlock); 87311007SLori.Alt@Sun.COM dsl_dataset_rele(ds, FTAG); 87411007SLori.Alt@Sun.COM return (0); 87511007SLori.Alt@Sun.COM } 87611007SLori.Alt@Sun.COM 87711007SLori.Alt@Sun.COM gmep = kmem_alloc(sizeof (guid_map_entry_t), KM_SLEEP); 87811007SLori.Alt@Sun.COM gmep->guid = snapds->ds_phys->ds_guid; 87911007SLori.Alt@Sun.COM gmep->gme_ds = snapds; 88011007SLori.Alt@Sun.COM avl_add(guid_map, gmep); 88111007SLori.Alt@Sun.COM lastobj = snapds->ds_phys->ds_prev_snap_obj; 88211007SLori.Alt@Sun.COM } 88311007SLori.Alt@Sun.COM 88411007SLori.Alt@Sun.COM rw_exit(&dp->dp_config_rwlock); 88511007SLori.Alt@Sun.COM dsl_dataset_rele(ds, FTAG); 88611007SLori.Alt@Sun.COM 88711007SLori.Alt@Sun.COM return (0); 88811007SLori.Alt@Sun.COM } 88911007SLori.Alt@Sun.COM 8902743Sahrens static void * 8912743Sahrens restore_read(struct restorearg *ra, int len) 8922743Sahrens { 8932743Sahrens void *rv; 8945367Sahrens int done = 0; 8952743Sahrens 8962743Sahrens /* some things will require 8-byte alignment, so everything must */ 8972743Sahrens ASSERT3U(len % 8, ==, 0); 8982743Sahrens 8995367Sahrens while (done < len) { 9002743Sahrens ssize_t resid; 9012743Sahrens 9022743Sahrens ra->err = vn_rdwr(UIO_READ, ra->vp, 9035367Sahrens (caddr_t)ra->buf + done, len - done, 9042743Sahrens ra->voff, UIO_SYSSPACE, FAPPEND, 9052743Sahrens RLIM64_INFINITY, CRED(), &resid); 9062743Sahrens 9075367Sahrens if (resid == len - done) 9082743Sahrens ra->err = EINVAL; 9095367Sahrens ra->voff += len - done - resid; 9105367Sahrens done = len - resid; 9112743Sahrens if (ra->err) 9122743Sahrens return (NULL); 9132743Sahrens } 9142743Sahrens 9155367Sahrens ASSERT3U(done, ==, len); 9165367Sahrens rv = ra->buf; 9172743Sahrens if (ra->byteswap) 9185367Sahrens fletcher_4_incremental_byteswap(rv, len, &ra->cksum); 9192743Sahrens else 9205367Sahrens fletcher_4_incremental_native(rv, len, &ra->cksum); 9212743Sahrens return (rv); 9222743Sahrens } 9232743Sahrens 9242743Sahrens static void 9252743Sahrens backup_byteswap(dmu_replay_record_t *drr) 9262743Sahrens { 9272743Sahrens #define DO64(X) (drr->drr_u.X = BSWAP_64(drr->drr_u.X)) 9282743Sahrens #define DO32(X) (drr->drr_u.X = BSWAP_32(drr->drr_u.X)) 9292743Sahrens drr->drr_type = BSWAP_32(drr->drr_type); 9305367Sahrens drr->drr_payloadlen = BSWAP_32(drr->drr_payloadlen); 9312743Sahrens switch (drr->drr_type) { 9322743Sahrens case DRR_BEGIN: 9332743Sahrens DO64(drr_begin.drr_magic); 93411007SLori.Alt@Sun.COM DO64(drr_begin.drr_versioninfo); 9352743Sahrens DO64(drr_begin.drr_creation_time); 9362743Sahrens DO32(drr_begin.drr_type); 9375367Sahrens DO32(drr_begin.drr_flags); 9382743Sahrens DO64(drr_begin.drr_toguid); 9392743Sahrens DO64(drr_begin.drr_fromguid); 9402743Sahrens break; 9412743Sahrens case DRR_OBJECT: 9422743Sahrens DO64(drr_object.drr_object); 9432743Sahrens /* DO64(drr_object.drr_allocation_txg); */ 9442743Sahrens DO32(drr_object.drr_type); 9452743Sahrens DO32(drr_object.drr_bonustype); 9462743Sahrens DO32(drr_object.drr_blksz); 9472743Sahrens DO32(drr_object.drr_bonuslen); 94811007SLori.Alt@Sun.COM DO64(drr_object.drr_toguid); 9492743Sahrens break; 9502743Sahrens case DRR_FREEOBJECTS: 9512743Sahrens DO64(drr_freeobjects.drr_firstobj); 9522743Sahrens DO64(drr_freeobjects.drr_numobjs); 95311007SLori.Alt@Sun.COM DO64(drr_freeobjects.drr_toguid); 9542743Sahrens break; 9552743Sahrens case DRR_WRITE: 9562743Sahrens DO64(drr_write.drr_object); 9572743Sahrens DO32(drr_write.drr_type); 9582743Sahrens DO64(drr_write.drr_offset); 9592743Sahrens DO64(drr_write.drr_length); 96011007SLori.Alt@Sun.COM DO64(drr_write.drr_toguid); 96111381SLori.Alt@Sun.COM DO64(drr_write.drr_key.ddk_cksum.zc_word[0]); 96211381SLori.Alt@Sun.COM DO64(drr_write.drr_key.ddk_cksum.zc_word[1]); 96311381SLori.Alt@Sun.COM DO64(drr_write.drr_key.ddk_cksum.zc_word[2]); 96411381SLori.Alt@Sun.COM DO64(drr_write.drr_key.ddk_cksum.zc_word[3]); 96511381SLori.Alt@Sun.COM DO64(drr_write.drr_key.ddk_prop); 96611007SLori.Alt@Sun.COM break; 96711007SLori.Alt@Sun.COM case DRR_WRITE_BYREF: 96811007SLori.Alt@Sun.COM DO64(drr_write_byref.drr_object); 96911007SLori.Alt@Sun.COM DO64(drr_write_byref.drr_offset); 97011007SLori.Alt@Sun.COM DO64(drr_write_byref.drr_length); 97111007SLori.Alt@Sun.COM DO64(drr_write_byref.drr_toguid); 97211007SLori.Alt@Sun.COM DO64(drr_write_byref.drr_refguid); 97311007SLori.Alt@Sun.COM DO64(drr_write_byref.drr_refobject); 97411007SLori.Alt@Sun.COM DO64(drr_write_byref.drr_refoffset); 97511381SLori.Alt@Sun.COM DO64(drr_write_byref.drr_key.ddk_cksum.zc_word[0]); 97611381SLori.Alt@Sun.COM DO64(drr_write_byref.drr_key.ddk_cksum.zc_word[1]); 97711381SLori.Alt@Sun.COM DO64(drr_write_byref.drr_key.ddk_cksum.zc_word[2]); 97811381SLori.Alt@Sun.COM DO64(drr_write_byref.drr_key.ddk_cksum.zc_word[3]); 97911381SLori.Alt@Sun.COM DO64(drr_write_byref.drr_key.ddk_prop); 9802743Sahrens break; 9812743Sahrens case DRR_FREE: 9822743Sahrens DO64(drr_free.drr_object); 9832743Sahrens DO64(drr_free.drr_offset); 9842743Sahrens DO64(drr_free.drr_length); 98511007SLori.Alt@Sun.COM DO64(drr_free.drr_toguid); 9862743Sahrens break; 98711935SMark.Shellenbaum@Sun.COM case DRR_SPILL: 98811935SMark.Shellenbaum@Sun.COM DO64(drr_spill.drr_object); 98911935SMark.Shellenbaum@Sun.COM DO64(drr_spill.drr_length); 99011935SMark.Shellenbaum@Sun.COM DO64(drr_spill.drr_toguid); 99111935SMark.Shellenbaum@Sun.COM break; 9922743Sahrens case DRR_END: 9932743Sahrens DO64(drr_end.drr_checksum.zc_word[0]); 9942743Sahrens DO64(drr_end.drr_checksum.zc_word[1]); 9952743Sahrens DO64(drr_end.drr_checksum.zc_word[2]); 9962743Sahrens DO64(drr_end.drr_checksum.zc_word[3]); 99711007SLori.Alt@Sun.COM DO64(drr_end.drr_toguid); 9982743Sahrens break; 9992743Sahrens } 10002743Sahrens #undef DO64 10012743Sahrens #undef DO32 10022743Sahrens } 10032743Sahrens 10042743Sahrens static int 10052743Sahrens restore_object(struct restorearg *ra, objset_t *os, struct drr_object *drro) 10062743Sahrens { 10072743Sahrens int err; 10082743Sahrens dmu_tx_t *tx; 10097994STim.Haley@Sun.COM void *data = NULL; 10102743Sahrens 10112743Sahrens if (drro->drr_type == DMU_OT_NONE || 10122743Sahrens drro->drr_type >= DMU_OT_NUMTYPES || 10132743Sahrens drro->drr_bonustype >= DMU_OT_NUMTYPES || 101411007SLori.Alt@Sun.COM drro->drr_checksumtype >= ZIO_CHECKSUM_FUNCTIONS || 10152743Sahrens drro->drr_compress >= ZIO_COMPRESS_FUNCTIONS || 10162743Sahrens P2PHASE(drro->drr_blksz, SPA_MINBLOCKSIZE) || 10172743Sahrens drro->drr_blksz < SPA_MINBLOCKSIZE || 10182743Sahrens drro->drr_blksz > SPA_MAXBLOCKSIZE || 10192743Sahrens drro->drr_bonuslen > DN_MAX_BONUSLEN) { 10202743Sahrens return (EINVAL); 10212743Sahrens } 10222743Sahrens 10238986SMark.Maybee@Sun.COM err = dmu_object_info(os, drro->drr_object, NULL); 10248986SMark.Maybee@Sun.COM 10258986SMark.Maybee@Sun.COM if (err != 0 && err != ENOENT) 10268986SMark.Maybee@Sun.COM return (EINVAL); 10278986SMark.Maybee@Sun.COM 10287994STim.Haley@Sun.COM if (drro->drr_bonuslen) { 10297994STim.Haley@Sun.COM data = restore_read(ra, P2ROUNDUP(drro->drr_bonuslen, 8)); 10307994STim.Haley@Sun.COM if (ra->err) 10317994STim.Haley@Sun.COM return (ra->err); 10327994STim.Haley@Sun.COM } 10337994STim.Haley@Sun.COM 10342743Sahrens if (err == ENOENT) { 10352743Sahrens /* currently free, want to be allocated */ 10368986SMark.Maybee@Sun.COM tx = dmu_tx_create(os); 10372743Sahrens dmu_tx_hold_bonus(tx, DMU_NEW_OBJECT); 10382743Sahrens err = dmu_tx_assign(tx, TXG_WAIT); 10392743Sahrens if (err) { 10402743Sahrens dmu_tx_abort(tx); 10412743Sahrens return (err); 10422743Sahrens } 10432743Sahrens err = dmu_object_claim(os, drro->drr_object, 10442743Sahrens drro->drr_type, drro->drr_blksz, 10452743Sahrens drro->drr_bonustype, drro->drr_bonuslen, tx); 10468986SMark.Maybee@Sun.COM dmu_tx_commit(tx); 10472743Sahrens } else { 10482743Sahrens /* currently allocated, want to be allocated */ 10492743Sahrens err = dmu_object_reclaim(os, drro->drr_object, 10502743Sahrens drro->drr_type, drro->drr_blksz, 10518986SMark.Maybee@Sun.COM drro->drr_bonustype, drro->drr_bonuslen); 10522743Sahrens } 105311935SMark.Shellenbaum@Sun.COM if (err) { 10548986SMark.Maybee@Sun.COM return (EINVAL); 105511935SMark.Shellenbaum@Sun.COM } 10568986SMark.Maybee@Sun.COM 10578986SMark.Maybee@Sun.COM tx = dmu_tx_create(os); 10588986SMark.Maybee@Sun.COM dmu_tx_hold_bonus(tx, drro->drr_object); 10598986SMark.Maybee@Sun.COM err = dmu_tx_assign(tx, TXG_WAIT); 10602743Sahrens if (err) { 10618986SMark.Maybee@Sun.COM dmu_tx_abort(tx); 10628986SMark.Maybee@Sun.COM return (err); 10632743Sahrens } 10642743Sahrens 106511007SLori.Alt@Sun.COM dmu_object_set_checksum(os, drro->drr_object, drro->drr_checksumtype, 106611007SLori.Alt@Sun.COM tx); 10672743Sahrens dmu_object_set_compress(os, drro->drr_object, drro->drr_compress, tx); 10682743Sahrens 10697994STim.Haley@Sun.COM if (data != NULL) { 10702743Sahrens dmu_buf_t *db; 10717994STim.Haley@Sun.COM 10722743Sahrens VERIFY(0 == dmu_bonus_hold(os, drro->drr_object, FTAG, &db)); 10732743Sahrens dmu_buf_will_dirty(db, tx); 10742743Sahrens 10754944Smaybee ASSERT3U(db->db_size, >=, drro->drr_bonuslen); 10764944Smaybee bcopy(data, db->db_data, drro->drr_bonuslen); 10772743Sahrens if (ra->byteswap) { 10782743Sahrens dmu_ot[drro->drr_bonustype].ot_byteswap(db->db_data, 10792743Sahrens drro->drr_bonuslen); 10802743Sahrens } 10812743Sahrens dmu_buf_rele(db, FTAG); 10822743Sahrens } 10832743Sahrens dmu_tx_commit(tx); 10842743Sahrens return (0); 10852743Sahrens } 10862743Sahrens 10872743Sahrens /* ARGSUSED */ 10882743Sahrens static int 10892743Sahrens restore_freeobjects(struct restorearg *ra, objset_t *os, 10902743Sahrens struct drr_freeobjects *drrfo) 10912743Sahrens { 10922743Sahrens uint64_t obj; 10932743Sahrens 10942743Sahrens if (drrfo->drr_firstobj + drrfo->drr_numobjs < drrfo->drr_firstobj) 10952743Sahrens return (EINVAL); 10962743Sahrens 10972743Sahrens for (obj = drrfo->drr_firstobj; 10983087Sahrens obj < drrfo->drr_firstobj + drrfo->drr_numobjs; 10993087Sahrens (void) dmu_object_next(os, &obj, FALSE, 0)) { 11002743Sahrens int err; 11012743Sahrens 11022743Sahrens if (dmu_object_info(os, obj, NULL) != 0) 11032743Sahrens continue; 11042743Sahrens 11056992Smaybee err = dmu_free_object(os, obj); 11066992Smaybee if (err) 11072743Sahrens return (err); 11082743Sahrens } 11092743Sahrens return (0); 11102743Sahrens } 11112743Sahrens 11122743Sahrens static int 11132743Sahrens restore_write(struct restorearg *ra, objset_t *os, 11142743Sahrens struct drr_write *drrw) 11152743Sahrens { 11162743Sahrens dmu_tx_t *tx; 11172743Sahrens void *data; 11182743Sahrens int err; 11192743Sahrens 11202743Sahrens if (drrw->drr_offset + drrw->drr_length < drrw->drr_offset || 11212743Sahrens drrw->drr_type >= DMU_OT_NUMTYPES) 11222743Sahrens return (EINVAL); 11232743Sahrens 11242743Sahrens data = restore_read(ra, drrw->drr_length); 11252743Sahrens if (data == NULL) 11262743Sahrens return (ra->err); 11272743Sahrens 11282743Sahrens if (dmu_object_info(os, drrw->drr_object, NULL) != 0) 11292743Sahrens return (EINVAL); 11302743Sahrens 11312743Sahrens tx = dmu_tx_create(os); 11322743Sahrens 11332743Sahrens dmu_tx_hold_write(tx, drrw->drr_object, 11342743Sahrens drrw->drr_offset, drrw->drr_length); 11352743Sahrens err = dmu_tx_assign(tx, TXG_WAIT); 11362743Sahrens if (err) { 11372743Sahrens dmu_tx_abort(tx); 11382743Sahrens return (err); 11392743Sahrens } 11402743Sahrens if (ra->byteswap) 11412743Sahrens dmu_ot[drrw->drr_type].ot_byteswap(data, drrw->drr_length); 11422743Sahrens dmu_write(os, drrw->drr_object, 11432743Sahrens drrw->drr_offset, drrw->drr_length, data, tx); 11442743Sahrens dmu_tx_commit(tx); 11452743Sahrens return (0); 11462743Sahrens } 11472743Sahrens 114811007SLori.Alt@Sun.COM /* 114911007SLori.Alt@Sun.COM * Handle a DRR_WRITE_BYREF record. This record is used in dedup'ed 115011007SLori.Alt@Sun.COM * streams to refer to a copy of the data that is already on the 115111007SLori.Alt@Sun.COM * system because it came in earlier in the stream. This function 115211007SLori.Alt@Sun.COM * finds the earlier copy of the data, and uses that copy instead of 115311007SLori.Alt@Sun.COM * data from the stream to fulfill this write. 115411007SLori.Alt@Sun.COM */ 115511007SLori.Alt@Sun.COM static int 115611007SLori.Alt@Sun.COM restore_write_byref(struct restorearg *ra, objset_t *os, 115711007SLori.Alt@Sun.COM struct drr_write_byref *drrwbr) 115811007SLori.Alt@Sun.COM { 115911007SLori.Alt@Sun.COM dmu_tx_t *tx; 116011007SLori.Alt@Sun.COM int err; 116111007SLori.Alt@Sun.COM guid_map_entry_t gmesrch; 116211007SLori.Alt@Sun.COM guid_map_entry_t *gmep; 116311007SLori.Alt@Sun.COM avl_index_t where; 116411007SLori.Alt@Sun.COM objset_t *ref_os = NULL; 116511007SLori.Alt@Sun.COM dmu_buf_t *dbp; 116611007SLori.Alt@Sun.COM 116711007SLori.Alt@Sun.COM if (drrwbr->drr_offset + drrwbr->drr_length < drrwbr->drr_offset) 116811007SLori.Alt@Sun.COM return (EINVAL); 116911007SLori.Alt@Sun.COM 117011007SLori.Alt@Sun.COM /* 117111007SLori.Alt@Sun.COM * If the GUID of the referenced dataset is different from the 117211007SLori.Alt@Sun.COM * GUID of the target dataset, find the referenced dataset. 117311007SLori.Alt@Sun.COM */ 117411007SLori.Alt@Sun.COM if (drrwbr->drr_toguid != drrwbr->drr_refguid) { 117511007SLori.Alt@Sun.COM gmesrch.guid = drrwbr->drr_refguid; 117611007SLori.Alt@Sun.COM if ((gmep = avl_find(&ra->guid_to_ds_map, &gmesrch, 117711007SLori.Alt@Sun.COM &where)) == NULL) { 117811007SLori.Alt@Sun.COM return (EINVAL); 117911007SLori.Alt@Sun.COM } 118011007SLori.Alt@Sun.COM if (dmu_objset_from_ds(gmep->gme_ds, &ref_os)) 118111007SLori.Alt@Sun.COM return (EINVAL); 118211007SLori.Alt@Sun.COM } else { 118311007SLori.Alt@Sun.COM ref_os = os; 118411007SLori.Alt@Sun.COM } 118511007SLori.Alt@Sun.COM 118611007SLori.Alt@Sun.COM if (err = dmu_buf_hold(ref_os, drrwbr->drr_refobject, 118712285SJeff.Bonwick@Sun.COM drrwbr->drr_refoffset, FTAG, &dbp, DMU_READ_PREFETCH)) 118811007SLori.Alt@Sun.COM return (err); 118911007SLori.Alt@Sun.COM 119011007SLori.Alt@Sun.COM tx = dmu_tx_create(os); 119111007SLori.Alt@Sun.COM 119211007SLori.Alt@Sun.COM dmu_tx_hold_write(tx, drrwbr->drr_object, 119311007SLori.Alt@Sun.COM drrwbr->drr_offset, drrwbr->drr_length); 119411007SLori.Alt@Sun.COM err = dmu_tx_assign(tx, TXG_WAIT); 119511007SLori.Alt@Sun.COM if (err) { 119611007SLori.Alt@Sun.COM dmu_tx_abort(tx); 119711007SLori.Alt@Sun.COM return (err); 119811007SLori.Alt@Sun.COM } 119911007SLori.Alt@Sun.COM dmu_write(os, drrwbr->drr_object, 120011007SLori.Alt@Sun.COM drrwbr->drr_offset, drrwbr->drr_length, dbp->db_data, tx); 120111007SLori.Alt@Sun.COM dmu_buf_rele(dbp, FTAG); 120211007SLori.Alt@Sun.COM dmu_tx_commit(tx); 120311007SLori.Alt@Sun.COM return (0); 120411007SLori.Alt@Sun.COM } 120511007SLori.Alt@Sun.COM 120611935SMark.Shellenbaum@Sun.COM static int 120711935SMark.Shellenbaum@Sun.COM restore_spill(struct restorearg *ra, objset_t *os, struct drr_spill *drrs) 120811935SMark.Shellenbaum@Sun.COM { 120911935SMark.Shellenbaum@Sun.COM dmu_tx_t *tx; 121011935SMark.Shellenbaum@Sun.COM void *data; 121111935SMark.Shellenbaum@Sun.COM dmu_buf_t *db, *db_spill; 121211935SMark.Shellenbaum@Sun.COM int err; 121311935SMark.Shellenbaum@Sun.COM 121411935SMark.Shellenbaum@Sun.COM if (drrs->drr_length < SPA_MINBLOCKSIZE || 121511935SMark.Shellenbaum@Sun.COM drrs->drr_length > SPA_MAXBLOCKSIZE) 121611935SMark.Shellenbaum@Sun.COM return (EINVAL); 121711935SMark.Shellenbaum@Sun.COM 121811935SMark.Shellenbaum@Sun.COM data = restore_read(ra, drrs->drr_length); 121911935SMark.Shellenbaum@Sun.COM if (data == NULL) 122011935SMark.Shellenbaum@Sun.COM return (ra->err); 122111935SMark.Shellenbaum@Sun.COM 122211935SMark.Shellenbaum@Sun.COM if (dmu_object_info(os, drrs->drr_object, NULL) != 0) 122311935SMark.Shellenbaum@Sun.COM return (EINVAL); 122411935SMark.Shellenbaum@Sun.COM 122511935SMark.Shellenbaum@Sun.COM VERIFY(0 == dmu_bonus_hold(os, drrs->drr_object, FTAG, &db)); 122611935SMark.Shellenbaum@Sun.COM if ((err = dmu_spill_hold_by_bonus(db, FTAG, &db_spill)) != 0) { 122711935SMark.Shellenbaum@Sun.COM dmu_buf_rele(db, FTAG); 122811935SMark.Shellenbaum@Sun.COM return (err); 122911935SMark.Shellenbaum@Sun.COM } 123011935SMark.Shellenbaum@Sun.COM 123111935SMark.Shellenbaum@Sun.COM tx = dmu_tx_create(os); 123211935SMark.Shellenbaum@Sun.COM 123311935SMark.Shellenbaum@Sun.COM dmu_tx_hold_spill(tx, db->db_object); 123411935SMark.Shellenbaum@Sun.COM 123511935SMark.Shellenbaum@Sun.COM err = dmu_tx_assign(tx, TXG_WAIT); 123611935SMark.Shellenbaum@Sun.COM if (err) { 123711935SMark.Shellenbaum@Sun.COM dmu_buf_rele(db, FTAG); 123811935SMark.Shellenbaum@Sun.COM dmu_buf_rele(db_spill, FTAG); 123911935SMark.Shellenbaum@Sun.COM dmu_tx_abort(tx); 124011935SMark.Shellenbaum@Sun.COM return (err); 124111935SMark.Shellenbaum@Sun.COM } 124211935SMark.Shellenbaum@Sun.COM dmu_buf_will_dirty(db_spill, tx); 124311935SMark.Shellenbaum@Sun.COM 124411935SMark.Shellenbaum@Sun.COM if (db_spill->db_size < drrs->drr_length) 124511935SMark.Shellenbaum@Sun.COM VERIFY(0 == dbuf_spill_set_blksz(db_spill, 124611935SMark.Shellenbaum@Sun.COM drrs->drr_length, tx)); 124711935SMark.Shellenbaum@Sun.COM bcopy(data, db_spill->db_data, drrs->drr_length); 124811935SMark.Shellenbaum@Sun.COM 124911935SMark.Shellenbaum@Sun.COM dmu_buf_rele(db, FTAG); 125011935SMark.Shellenbaum@Sun.COM dmu_buf_rele(db_spill, FTAG); 125111935SMark.Shellenbaum@Sun.COM 125211935SMark.Shellenbaum@Sun.COM dmu_tx_commit(tx); 125311935SMark.Shellenbaum@Sun.COM return (0); 125411935SMark.Shellenbaum@Sun.COM } 125511935SMark.Shellenbaum@Sun.COM 12562743Sahrens /* ARGSUSED */ 12572743Sahrens static int 12582743Sahrens restore_free(struct restorearg *ra, objset_t *os, 12592743Sahrens struct drr_free *drrf) 12602743Sahrens { 12612743Sahrens int err; 12622743Sahrens 12632743Sahrens if (drrf->drr_length != -1ULL && 12642743Sahrens drrf->drr_offset + drrf->drr_length < drrf->drr_offset) 12652743Sahrens return (EINVAL); 12662743Sahrens 12672743Sahrens if (dmu_object_info(os, drrf->drr_object, NULL) != 0) 12682743Sahrens return (EINVAL); 12692743Sahrens 12706992Smaybee err = dmu_free_long_range(os, drrf->drr_object, 12712743Sahrens drrf->drr_offset, drrf->drr_length); 12722743Sahrens return (err); 12732743Sahrens } 12742743Sahrens 12755367Sahrens /* 12765367Sahrens * NB: callers *must* call dmu_recv_end() if this succeeds. 12775367Sahrens */ 12785367Sahrens int 12795367Sahrens dmu_recv_stream(dmu_recv_cookie_t *drc, vnode_t *vp, offset_t *voffp) 12805367Sahrens { 12815367Sahrens struct restorearg ra = { 0 }; 12825367Sahrens dmu_replay_record_t *drr; 12835367Sahrens objset_t *os; 12845367Sahrens zio_cksum_t pcksum; 128511007SLori.Alt@Sun.COM guid_map_entry_t *gmep; 128611007SLori.Alt@Sun.COM int featureflags; 12875367Sahrens 12885367Sahrens if (drc->drc_drrb->drr_magic == BSWAP_64(DMU_BACKUP_MAGIC)) 12895367Sahrens ra.byteswap = TRUE; 12902743Sahrens 12915367Sahrens { 12925367Sahrens /* compute checksum of drr_begin record */ 12935367Sahrens dmu_replay_record_t *drr; 12945367Sahrens drr = kmem_zalloc(sizeof (dmu_replay_record_t), KM_SLEEP); 12955367Sahrens 12965367Sahrens drr->drr_type = DRR_BEGIN; 12975367Sahrens drr->drr_u.drr_begin = *drc->drc_drrb; 12985367Sahrens if (ra.byteswap) { 12995367Sahrens fletcher_4_incremental_byteswap(drr, 13005367Sahrens sizeof (dmu_replay_record_t), &ra.cksum); 13015367Sahrens } else { 13025367Sahrens fletcher_4_incremental_native(drr, 13035367Sahrens sizeof (dmu_replay_record_t), &ra.cksum); 13045367Sahrens } 13055367Sahrens kmem_free(drr, sizeof (dmu_replay_record_t)); 13062743Sahrens } 13072743Sahrens 13082743Sahrens if (ra.byteswap) { 13095367Sahrens struct drr_begin *drrb = drc->drc_drrb; 13102743Sahrens drrb->drr_magic = BSWAP_64(drrb->drr_magic); 131111007SLori.Alt@Sun.COM drrb->drr_versioninfo = BSWAP_64(drrb->drr_versioninfo); 13122743Sahrens drrb->drr_creation_time = BSWAP_64(drrb->drr_creation_time); 13132743Sahrens drrb->drr_type = BSWAP_32(drrb->drr_type); 13142743Sahrens drrb->drr_toguid = BSWAP_64(drrb->drr_toguid); 13152743Sahrens drrb->drr_fromguid = BSWAP_64(drrb->drr_fromguid); 13162743Sahrens } 13172743Sahrens 13185367Sahrens ra.vp = vp; 13195367Sahrens ra.voff = *voffp; 13205367Sahrens ra.bufsize = 1<<20; 13215367Sahrens ra.buf = kmem_alloc(ra.bufsize, KM_SLEEP); 13225326Sek110237 13235367Sahrens /* these were verified in dmu_recv_begin */ 132411007SLori.Alt@Sun.COM ASSERT(DMU_GET_STREAM_HDRTYPE(drc->drc_drrb->drr_versioninfo) == 132511007SLori.Alt@Sun.COM DMU_SUBSTREAM); 13265367Sahrens ASSERT(drc->drc_drrb->drr_type < DMU_OST_NUMTYPES); 13272743Sahrens 13282743Sahrens /* 13292743Sahrens * Open the objset we are modifying. 13302743Sahrens */ 133110298SMatthew.Ahrens@Sun.COM VERIFY(dmu_objset_from_ds(drc->drc_real_ds, &os) == 0); 13322743Sahrens 13335367Sahrens ASSERT(drc->drc_real_ds->ds_phys->ds_flags & DS_FLAG_INCONSISTENT); 13342743Sahrens 133511007SLori.Alt@Sun.COM featureflags = DMU_GET_FEATUREFLAGS(drc->drc_drrb->drr_versioninfo); 133611007SLori.Alt@Sun.COM 133711007SLori.Alt@Sun.COM /* if this stream is dedup'ed, set up the avl tree for guid mapping */ 133811007SLori.Alt@Sun.COM if (featureflags & DMU_BACKUP_FEATURE_DEDUP) { 133911007SLori.Alt@Sun.COM avl_create(&ra.guid_to_ds_map, guid_compare, 134011007SLori.Alt@Sun.COM sizeof (guid_map_entry_t), 134111007SLori.Alt@Sun.COM offsetof(guid_map_entry_t, avlnode)); 134211007SLori.Alt@Sun.COM (void) dmu_objset_find(drc->drc_top_ds, find_ds_by_guid, 134311007SLori.Alt@Sun.COM (void *)&ra.guid_to_ds_map, 134411007SLori.Alt@Sun.COM DS_FIND_CHILDREN); 134511007SLori.Alt@Sun.COM } 134611007SLori.Alt@Sun.COM 13472743Sahrens /* 13482743Sahrens * Read records and process them. 13492743Sahrens */ 13505367Sahrens pcksum = ra.cksum; 13512743Sahrens while (ra.err == 0 && 13522743Sahrens NULL != (drr = restore_read(&ra, sizeof (*drr)))) { 13532743Sahrens if (issig(JUSTLOOKING) && issig(FORREAL)) { 13542743Sahrens ra.err = EINTR; 13552743Sahrens goto out; 13562743Sahrens } 13572743Sahrens 13582743Sahrens if (ra.byteswap) 13592743Sahrens backup_byteswap(drr); 13602743Sahrens 13612743Sahrens switch (drr->drr_type) { 13622743Sahrens case DRR_OBJECT: 13632743Sahrens { 13642743Sahrens /* 13652743Sahrens * We need to make a copy of the record header, 13662743Sahrens * because restore_{object,write} may need to 13672743Sahrens * restore_read(), which will invalidate drr. 13682743Sahrens */ 13692743Sahrens struct drr_object drro = drr->drr_u.drr_object; 13702743Sahrens ra.err = restore_object(&ra, os, &drro); 13712743Sahrens break; 13722743Sahrens } 13732743Sahrens case DRR_FREEOBJECTS: 13742743Sahrens { 13752743Sahrens struct drr_freeobjects drrfo = 13762743Sahrens drr->drr_u.drr_freeobjects; 13772743Sahrens ra.err = restore_freeobjects(&ra, os, &drrfo); 13782743Sahrens break; 13792743Sahrens } 13802743Sahrens case DRR_WRITE: 13812743Sahrens { 13822743Sahrens struct drr_write drrw = drr->drr_u.drr_write; 13832743Sahrens ra.err = restore_write(&ra, os, &drrw); 13842743Sahrens break; 13852743Sahrens } 138611007SLori.Alt@Sun.COM case DRR_WRITE_BYREF: 138711007SLori.Alt@Sun.COM { 138811007SLori.Alt@Sun.COM struct drr_write_byref drrwbr = 138911007SLori.Alt@Sun.COM drr->drr_u.drr_write_byref; 139011007SLori.Alt@Sun.COM ra.err = restore_write_byref(&ra, os, &drrwbr); 139111007SLori.Alt@Sun.COM break; 139211007SLori.Alt@Sun.COM } 13932743Sahrens case DRR_FREE: 13942743Sahrens { 13952743Sahrens struct drr_free drrf = drr->drr_u.drr_free; 13962743Sahrens ra.err = restore_free(&ra, os, &drrf); 13972743Sahrens break; 13982743Sahrens } 13992743Sahrens case DRR_END: 14002743Sahrens { 14012743Sahrens struct drr_end drre = drr->drr_u.drr_end; 14022743Sahrens /* 14032743Sahrens * We compare against the *previous* checksum 14042743Sahrens * value, because the stored checksum is of 14052743Sahrens * everything before the DRR_END record. 14062743Sahrens */ 14076479Sahrens if (!ZIO_CHECKSUM_EQUAL(drre.drr_checksum, pcksum)) 14082743Sahrens ra.err = ECKSUM; 14092743Sahrens goto out; 14102743Sahrens } 141111935SMark.Shellenbaum@Sun.COM case DRR_SPILL: 141211935SMark.Shellenbaum@Sun.COM { 141311935SMark.Shellenbaum@Sun.COM struct drr_spill drrs = drr->drr_u.drr_spill; 141411935SMark.Shellenbaum@Sun.COM ra.err = restore_spill(&ra, os, &drrs); 141511935SMark.Shellenbaum@Sun.COM break; 141611935SMark.Shellenbaum@Sun.COM } 14172743Sahrens default: 14182743Sahrens ra.err = EINVAL; 14192743Sahrens goto out; 14202743Sahrens } 14215367Sahrens pcksum = ra.cksum; 14222743Sahrens } 14236479Sahrens ASSERT(ra.err != 0); 14242743Sahrens 14252743Sahrens out: 14265367Sahrens if (ra.err != 0) { 14272743Sahrens /* 142810204SMatthew.Ahrens@Sun.COM * destroy what we created, so we don't leave it in the 142910204SMatthew.Ahrens@Sun.COM * inconsistent restoring state. 14302743Sahrens */ 14315367Sahrens txg_wait_synced(drc->drc_real_ds->ds_dir->dd_pool, 0); 143210204SMatthew.Ahrens@Sun.COM 143310242Schris.kirby@sun.com (void) dsl_dataset_destroy(drc->drc_real_ds, dmu_recv_tag, 143410242Schris.kirby@sun.com B_FALSE); 143510204SMatthew.Ahrens@Sun.COM if (drc->drc_real_ds != drc->drc_logical_ds) { 143610204SMatthew.Ahrens@Sun.COM mutex_exit(&drc->drc_logical_ds->ds_recvlock); 143710204SMatthew.Ahrens@Sun.COM dsl_dataset_rele(drc->drc_logical_ds, dmu_recv_tag); 143810204SMatthew.Ahrens@Sun.COM } 14392743Sahrens } 14402743Sahrens 144111007SLori.Alt@Sun.COM if (featureflags & DMU_BACKUP_FEATURE_DEDUP) { 144211007SLori.Alt@Sun.COM void *cookie = NULL; 144311007SLori.Alt@Sun.COM 144411007SLori.Alt@Sun.COM while (gmep = avl_destroy_nodes(&ra.guid_to_ds_map, &cookie)) { 144511007SLori.Alt@Sun.COM dsl_dataset_rele(gmep->gme_ds, &ra.guid_to_ds_map); 144611007SLori.Alt@Sun.COM kmem_free(gmep, sizeof (guid_map_entry_t)); 144711007SLori.Alt@Sun.COM } 144811007SLori.Alt@Sun.COM avl_destroy(&ra.guid_to_ds_map); 144911007SLori.Alt@Sun.COM } 145011007SLori.Alt@Sun.COM 14512743Sahrens kmem_free(ra.buf, ra.bufsize); 14525367Sahrens *voffp = ra.voff; 14532743Sahrens return (ra.err); 14542743Sahrens } 14555326Sek110237 14565367Sahrens struct recvendsyncarg { 14575367Sahrens char *tosnap; 14585367Sahrens uint64_t creation_time; 14595367Sahrens uint64_t toguid; 14605367Sahrens }; 14615367Sahrens 14625367Sahrens static int 14635367Sahrens recv_end_check(void *arg1, void *arg2, dmu_tx_t *tx) 14645367Sahrens { 14655367Sahrens dsl_dataset_t *ds = arg1; 14665367Sahrens struct recvendsyncarg *resa = arg2; 14675367Sahrens 14685367Sahrens return (dsl_dataset_snapshot_check(ds, resa->tosnap, tx)); 14695367Sahrens } 14705367Sahrens 14715367Sahrens static void 147212296SLin.Ling@Sun.COM recv_end_sync(void *arg1, void *arg2, dmu_tx_t *tx) 14735326Sek110237 { 14745367Sahrens dsl_dataset_t *ds = arg1; 14755367Sahrens struct recvendsyncarg *resa = arg2; 14765367Sahrens 147712296SLin.Ling@Sun.COM dsl_dataset_snapshot_sync(ds, resa->tosnap, tx); 14785367Sahrens 14795367Sahrens /* set snapshot's creation time and guid */ 14805367Sahrens dmu_buf_will_dirty(ds->ds_prev->ds_dbuf, tx); 14815367Sahrens ds->ds_prev->ds_phys->ds_creation_time = resa->creation_time; 14825367Sahrens ds->ds_prev->ds_phys->ds_guid = resa->toguid; 14835367Sahrens ds->ds_prev->ds_phys->ds_flags &= ~DS_FLAG_INCONSISTENT; 14845367Sahrens 14855367Sahrens dmu_buf_will_dirty(ds->ds_dbuf, tx); 14865367Sahrens ds->ds_phys->ds_flags &= ~DS_FLAG_INCONSISTENT; 14875367Sahrens } 14885367Sahrens 148910272SMatthew.Ahrens@Sun.COM static int 149010272SMatthew.Ahrens@Sun.COM dmu_recv_existing_end(dmu_recv_cookie_t *drc) 14915367Sahrens { 14926689Smaybee struct recvendsyncarg resa; 14936689Smaybee dsl_dataset_t *ds = drc->drc_logical_ds; 14946689Smaybee int err; 14955367Sahrens 14965367Sahrens /* 149710272SMatthew.Ahrens@Sun.COM * XXX hack; seems the ds is still dirty and dsl_pool_zil_clean() 149810272SMatthew.Ahrens@Sun.COM * expects it to have a ds_user_ptr (and zil), but clone_swap() 149910272SMatthew.Ahrens@Sun.COM * can close it. 15005367Sahrens */ 15016689Smaybee txg_wait_synced(ds->ds_dir->dd_pool, 0); 15025326Sek110237 150310272SMatthew.Ahrens@Sun.COM if (dsl_dataset_tryown(ds, FALSE, dmu_recv_tag)) { 150410272SMatthew.Ahrens@Sun.COM err = dsl_dataset_clone_swap(drc->drc_real_ds, ds, 150510272SMatthew.Ahrens@Sun.COM drc->drc_force); 150610272SMatthew.Ahrens@Sun.COM if (err) 150710272SMatthew.Ahrens@Sun.COM goto out; 150810272SMatthew.Ahrens@Sun.COM } else { 150910272SMatthew.Ahrens@Sun.COM mutex_exit(&ds->ds_recvlock); 151010272SMatthew.Ahrens@Sun.COM dsl_dataset_rele(ds, dmu_recv_tag); 151110242Schris.kirby@sun.com (void) dsl_dataset_destroy(drc->drc_real_ds, dmu_recv_tag, 151210242Schris.kirby@sun.com B_FALSE); 151310272SMatthew.Ahrens@Sun.COM return (EBUSY); 15145367Sahrens } 15155367Sahrens 15166689Smaybee resa.creation_time = drc->drc_drrb->drr_creation_time; 15176689Smaybee resa.toguid = drc->drc_drrb->drr_toguid; 15186689Smaybee resa.tosnap = drc->drc_tosnap; 15196689Smaybee 15206689Smaybee err = dsl_sync_task_do(ds->ds_dir->dd_pool, 15216689Smaybee recv_end_check, recv_end_sync, ds, &resa, 3); 15226689Smaybee if (err) { 152310272SMatthew.Ahrens@Sun.COM /* swap back */ 152410272SMatthew.Ahrens@Sun.COM (void) dsl_dataset_clone_swap(drc->drc_real_ds, ds, B_TRUE); 15255367Sahrens } 15265367Sahrens 152710272SMatthew.Ahrens@Sun.COM out: 152810272SMatthew.Ahrens@Sun.COM mutex_exit(&ds->ds_recvlock); 15296689Smaybee dsl_dataset_disown(ds, dmu_recv_tag); 153010272SMatthew.Ahrens@Sun.COM (void) dsl_dataset_destroy(drc->drc_real_ds, dmu_recv_tag, B_FALSE); 15315326Sek110237 return (err); 15325326Sek110237 } 153310272SMatthew.Ahrens@Sun.COM 153410272SMatthew.Ahrens@Sun.COM static int 153510272SMatthew.Ahrens@Sun.COM dmu_recv_new_end(dmu_recv_cookie_t *drc) 153610272SMatthew.Ahrens@Sun.COM { 153710272SMatthew.Ahrens@Sun.COM struct recvendsyncarg resa; 153810272SMatthew.Ahrens@Sun.COM dsl_dataset_t *ds = drc->drc_logical_ds; 153910272SMatthew.Ahrens@Sun.COM int err; 154010272SMatthew.Ahrens@Sun.COM 154110272SMatthew.Ahrens@Sun.COM /* 154210272SMatthew.Ahrens@Sun.COM * XXX hack; seems the ds is still dirty and dsl_pool_zil_clean() 154310272SMatthew.Ahrens@Sun.COM * expects it to have a ds_user_ptr (and zil), but clone_swap() 154410272SMatthew.Ahrens@Sun.COM * can close it. 154510272SMatthew.Ahrens@Sun.COM */ 154610272SMatthew.Ahrens@Sun.COM txg_wait_synced(ds->ds_dir->dd_pool, 0); 154710272SMatthew.Ahrens@Sun.COM 154810272SMatthew.Ahrens@Sun.COM resa.creation_time = drc->drc_drrb->drr_creation_time; 154910272SMatthew.Ahrens@Sun.COM resa.toguid = drc->drc_drrb->drr_toguid; 155010272SMatthew.Ahrens@Sun.COM resa.tosnap = drc->drc_tosnap; 155110272SMatthew.Ahrens@Sun.COM 155210272SMatthew.Ahrens@Sun.COM err = dsl_sync_task_do(ds->ds_dir->dd_pool, 155310272SMatthew.Ahrens@Sun.COM recv_end_check, recv_end_sync, ds, &resa, 3); 155410272SMatthew.Ahrens@Sun.COM if (err) { 155510272SMatthew.Ahrens@Sun.COM /* clean up the fs we just recv'd into */ 155610272SMatthew.Ahrens@Sun.COM (void) dsl_dataset_destroy(ds, dmu_recv_tag, B_FALSE); 155710272SMatthew.Ahrens@Sun.COM } else { 155810272SMatthew.Ahrens@Sun.COM /* release the hold from dmu_recv_begin */ 155910272SMatthew.Ahrens@Sun.COM dsl_dataset_disown(ds, dmu_recv_tag); 156010272SMatthew.Ahrens@Sun.COM } 156110272SMatthew.Ahrens@Sun.COM return (err); 156210272SMatthew.Ahrens@Sun.COM } 156310272SMatthew.Ahrens@Sun.COM 156410272SMatthew.Ahrens@Sun.COM int 156510272SMatthew.Ahrens@Sun.COM dmu_recv_end(dmu_recv_cookie_t *drc) 156610272SMatthew.Ahrens@Sun.COM { 156710272SMatthew.Ahrens@Sun.COM if (drc->drc_logical_ds != drc->drc_real_ds) 156810272SMatthew.Ahrens@Sun.COM return (dmu_recv_existing_end(drc)); 156910272SMatthew.Ahrens@Sun.COM else 157010272SMatthew.Ahrens@Sun.COM return (dmu_recv_new_end(drc)); 157110272SMatthew.Ahrens@Sun.COM } 1572