12743Sahrens /* 22743Sahrens * CDDL HEADER START 32743Sahrens * 42743Sahrens * The contents of this file are subject to the terms of the 52743Sahrens * Common Development and Distribution License (the "License"). 62743Sahrens * You may not use this file except in compliance with the License. 72743Sahrens * 82743Sahrens * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE 92743Sahrens * or http://www.opensolaris.org/os/licensing. 102743Sahrens * See the License for the specific language governing permissions 112743Sahrens * and limitations under the License. 122743Sahrens * 132743Sahrens * When distributing Covered Code, include this CDDL HEADER in each 142743Sahrens * file and include the License file at usr/src/OPENSOLARIS.LICENSE. 152743Sahrens * If applicable, add the following below this CDDL HEADER, with the 162743Sahrens * fields enclosed by brackets "[]" replaced with your own identifying 172743Sahrens * information: Portions Copyright [yyyy] [name of copyright owner] 182743Sahrens * 192743Sahrens * CDDL HEADER END 202743Sahrens */ 212743Sahrens /* 2212070SMark.Shellenbaum@Sun.COM * Copyright (c) 2005, 2010, Oracle and/or its affiliates. All rights reserved. 232743Sahrens */ 242743Sahrens 252743Sahrens #include <sys/dmu.h> 262743Sahrens #include <sys/dmu_impl.h> 272743Sahrens #include <sys/dmu_tx.h> 282743Sahrens #include <sys/dbuf.h> 292743Sahrens #include <sys/dnode.h> 302743Sahrens #include <sys/zfs_context.h> 312743Sahrens #include <sys/dmu_objset.h> 322743Sahrens #include <sys/dmu_traverse.h> 332743Sahrens #include <sys/dsl_dataset.h> 342743Sahrens #include <sys/dsl_dir.h> 3511022STom.Erickson@Sun.COM #include <sys/dsl_prop.h> 362743Sahrens #include <sys/dsl_pool.h> 372743Sahrens #include <sys/dsl_synctask.h> 382743Sahrens #include <sys/zfs_ioctl.h> 392743Sahrens #include <sys/zap.h> 402743Sahrens #include <sys/zio_checksum.h> 4112070SMark.Shellenbaum@Sun.COM #include <sys/zfs_znode.h> 4211007SLori.Alt@Sun.COM #include <sys/avl.h> 4311381SLori.Alt@Sun.COM #include <sys/ddt.h> 442743Sahrens 455367Sahrens static char *dmu_recv_tag = "dmu_recv_tag"; 465367Sahrens 4711007SLori.Alt@Sun.COM /* 4811007SLori.Alt@Sun.COM * The list of data whose inclusion in a send stream can be pending from 4911007SLori.Alt@Sun.COM * one call to backup_cb to another. Multiple calls to dump_free() and 5011007SLori.Alt@Sun.COM * dump_freeobjects() can be aggregated into a single DRR_FREE or 5111007SLori.Alt@Sun.COM * DRR_FREEOBJECTS replay record. 5211007SLori.Alt@Sun.COM */ 5311007SLori.Alt@Sun.COM typedef enum { 5411007SLori.Alt@Sun.COM PENDING_NONE, 5511007SLori.Alt@Sun.COM PENDING_FREE, 5611007SLori.Alt@Sun.COM PENDING_FREEOBJECTS 5711007SLori.Alt@Sun.COM } pendop_t; 5811007SLori.Alt@Sun.COM 592743Sahrens struct backuparg { 602743Sahrens dmu_replay_record_t *drr; 612743Sahrens vnode_t *vp; 625367Sahrens offset_t *off; 632743Sahrens objset_t *os; 642743Sahrens zio_cksum_t zc; 6511007SLori.Alt@Sun.COM uint64_t toguid; 662743Sahrens int err; 6711007SLori.Alt@Sun.COM pendop_t pending_op; 682743Sahrens }; 692743Sahrens 702743Sahrens static int 712743Sahrens dump_bytes(struct backuparg *ba, void *buf, int len) 722743Sahrens { 732743Sahrens ssize_t resid; /* have to get resid to get detailed errno */ 742743Sahrens ASSERT3U(len % 8, ==, 0); 752743Sahrens 762743Sahrens fletcher_4_incremental_native(buf, len, &ba->zc); 772743Sahrens ba->err = vn_rdwr(UIO_WRITE, ba->vp, 782743Sahrens (caddr_t)buf, len, 792743Sahrens 0, UIO_SYSSPACE, FAPPEND, RLIM64_INFINITY, CRED(), &resid); 805367Sahrens *ba->off += len; 812743Sahrens return (ba->err); 822743Sahrens } 832743Sahrens 842743Sahrens static int 852743Sahrens dump_free(struct backuparg *ba, uint64_t object, uint64_t offset, 862743Sahrens uint64_t length) 872743Sahrens { 8811007SLori.Alt@Sun.COM struct drr_free *drrf = &(ba->drr->drr_u.drr_free); 8911007SLori.Alt@Sun.COM 9011007SLori.Alt@Sun.COM /* 9111007SLori.Alt@Sun.COM * If there is a pending op, but it's not PENDING_FREE, push it out, 9211007SLori.Alt@Sun.COM * since free block aggregation can only be done for blocks of the 9311007SLori.Alt@Sun.COM * same type (i.e., DRR_FREE records can only be aggregated with 9411007SLori.Alt@Sun.COM * other DRR_FREE records. DRR_FREEOBJECTS records can only be 9511007SLori.Alt@Sun.COM * aggregated with other DRR_FREEOBJECTS records. 9611007SLori.Alt@Sun.COM */ 9711007SLori.Alt@Sun.COM if (ba->pending_op != PENDING_NONE && ba->pending_op != PENDING_FREE) { 9811007SLori.Alt@Sun.COM if (dump_bytes(ba, ba->drr, sizeof (dmu_replay_record_t)) != 0) 9911007SLori.Alt@Sun.COM return (EINTR); 10011007SLori.Alt@Sun.COM ba->pending_op = PENDING_NONE; 10111007SLori.Alt@Sun.COM } 10211007SLori.Alt@Sun.COM 10311007SLori.Alt@Sun.COM if (ba->pending_op == PENDING_FREE) { 10411007SLori.Alt@Sun.COM /* 10511007SLori.Alt@Sun.COM * There should never be a PENDING_FREE if length is -1 10611007SLori.Alt@Sun.COM * (because dump_dnode is the only place where this 10711007SLori.Alt@Sun.COM * function is called with a -1, and only after flushing 10811007SLori.Alt@Sun.COM * any pending record). 10911007SLori.Alt@Sun.COM */ 11011007SLori.Alt@Sun.COM ASSERT(length != -1ULL); 11111007SLori.Alt@Sun.COM /* 11211007SLori.Alt@Sun.COM * Check to see whether this free block can be aggregated 11311007SLori.Alt@Sun.COM * with pending one. 11411007SLori.Alt@Sun.COM */ 11511007SLori.Alt@Sun.COM if (drrf->drr_object == object && drrf->drr_offset + 11611007SLori.Alt@Sun.COM drrf->drr_length == offset) { 11711007SLori.Alt@Sun.COM drrf->drr_length += length; 11811007SLori.Alt@Sun.COM return (0); 11911007SLori.Alt@Sun.COM } else { 12011007SLori.Alt@Sun.COM /* not a continuation. Push out pending record */ 12111007SLori.Alt@Sun.COM if (dump_bytes(ba, ba->drr, 12211007SLori.Alt@Sun.COM sizeof (dmu_replay_record_t)) != 0) 12311007SLori.Alt@Sun.COM return (EINTR); 12411007SLori.Alt@Sun.COM ba->pending_op = PENDING_NONE; 12511007SLori.Alt@Sun.COM } 12611007SLori.Alt@Sun.COM } 12711007SLori.Alt@Sun.COM /* create a FREE record and make it pending */ 1282743Sahrens bzero(ba->drr, sizeof (dmu_replay_record_t)); 1292743Sahrens ba->drr->drr_type = DRR_FREE; 13011007SLori.Alt@Sun.COM drrf->drr_object = object; 13111007SLori.Alt@Sun.COM drrf->drr_offset = offset; 13211007SLori.Alt@Sun.COM drrf->drr_length = length; 13311007SLori.Alt@Sun.COM drrf->drr_toguid = ba->toguid; 13411007SLori.Alt@Sun.COM if (length == -1ULL) { 13511007SLori.Alt@Sun.COM if (dump_bytes(ba, ba->drr, sizeof (dmu_replay_record_t)) != 0) 13611007SLori.Alt@Sun.COM return (EINTR); 13711007SLori.Alt@Sun.COM } else { 13811007SLori.Alt@Sun.COM ba->pending_op = PENDING_FREE; 13911007SLori.Alt@Sun.COM } 1402743Sahrens 1412743Sahrens return (0); 1422743Sahrens } 1432743Sahrens 1442743Sahrens static int 1452743Sahrens dump_data(struct backuparg *ba, dmu_object_type_t type, 14611381SLori.Alt@Sun.COM uint64_t object, uint64_t offset, int blksz, const blkptr_t *bp, void *data) 1472743Sahrens { 14811007SLori.Alt@Sun.COM struct drr_write *drrw = &(ba->drr->drr_u.drr_write); 14911007SLori.Alt@Sun.COM 15011381SLori.Alt@Sun.COM 15111007SLori.Alt@Sun.COM /* 15211007SLori.Alt@Sun.COM * If there is any kind of pending aggregation (currently either 15311007SLori.Alt@Sun.COM * a grouping of free objects or free blocks), push it out to 15411007SLori.Alt@Sun.COM * the stream, since aggregation can't be done across operations 15511007SLori.Alt@Sun.COM * of different types. 15611007SLori.Alt@Sun.COM */ 15711007SLori.Alt@Sun.COM if (ba->pending_op != PENDING_NONE) { 15811007SLori.Alt@Sun.COM if (dump_bytes(ba, ba->drr, sizeof (dmu_replay_record_t)) != 0) 15911007SLori.Alt@Sun.COM return (EINTR); 16011007SLori.Alt@Sun.COM ba->pending_op = PENDING_NONE; 16111007SLori.Alt@Sun.COM } 1622743Sahrens /* write a DATA record */ 1632743Sahrens bzero(ba->drr, sizeof (dmu_replay_record_t)); 1642743Sahrens ba->drr->drr_type = DRR_WRITE; 16511007SLori.Alt@Sun.COM drrw->drr_object = object; 16611007SLori.Alt@Sun.COM drrw->drr_type = type; 16711007SLori.Alt@Sun.COM drrw->drr_offset = offset; 16811007SLori.Alt@Sun.COM drrw->drr_length = blksz; 16911007SLori.Alt@Sun.COM drrw->drr_toguid = ba->toguid; 17011381SLori.Alt@Sun.COM drrw->drr_checksumtype = BP_GET_CHECKSUM(bp); 17111381SLori.Alt@Sun.COM if (zio_checksum_table[drrw->drr_checksumtype].ci_dedup) 17211381SLori.Alt@Sun.COM drrw->drr_checksumflags |= DRR_CHECKSUM_DEDUP; 17311381SLori.Alt@Sun.COM DDK_SET_LSIZE(&drrw->drr_key, BP_GET_LSIZE(bp)); 17411381SLori.Alt@Sun.COM DDK_SET_PSIZE(&drrw->drr_key, BP_GET_PSIZE(bp)); 17511381SLori.Alt@Sun.COM DDK_SET_COMPRESS(&drrw->drr_key, BP_GET_COMPRESS(bp)); 17611381SLori.Alt@Sun.COM drrw->drr_key.ddk_cksum = bp->blk_cksum; 1772743Sahrens 17811007SLori.Alt@Sun.COM if (dump_bytes(ba, ba->drr, sizeof (dmu_replay_record_t)) != 0) 1792743Sahrens return (EINTR); 18011007SLori.Alt@Sun.COM if (dump_bytes(ba, data, blksz) != 0) 1812743Sahrens return (EINTR); 1822743Sahrens return (0); 1832743Sahrens } 1842743Sahrens 1852743Sahrens static int 18611935SMark.Shellenbaum@Sun.COM dump_spill(struct backuparg *ba, uint64_t object, int blksz, void *data) 18711935SMark.Shellenbaum@Sun.COM { 18811935SMark.Shellenbaum@Sun.COM struct drr_spill *drrs = &(ba->drr->drr_u.drr_spill); 18911935SMark.Shellenbaum@Sun.COM 19011935SMark.Shellenbaum@Sun.COM if (ba->pending_op != PENDING_NONE) { 19111935SMark.Shellenbaum@Sun.COM if (dump_bytes(ba, ba->drr, sizeof (dmu_replay_record_t)) != 0) 19211935SMark.Shellenbaum@Sun.COM return (EINTR); 19311935SMark.Shellenbaum@Sun.COM ba->pending_op = PENDING_NONE; 19411935SMark.Shellenbaum@Sun.COM } 19511935SMark.Shellenbaum@Sun.COM 19611935SMark.Shellenbaum@Sun.COM /* write a SPILL record */ 19711935SMark.Shellenbaum@Sun.COM bzero(ba->drr, sizeof (dmu_replay_record_t)); 19811935SMark.Shellenbaum@Sun.COM ba->drr->drr_type = DRR_SPILL; 19911935SMark.Shellenbaum@Sun.COM drrs->drr_object = object; 20011935SMark.Shellenbaum@Sun.COM drrs->drr_length = blksz; 20111935SMark.Shellenbaum@Sun.COM drrs->drr_toguid = ba->toguid; 20211935SMark.Shellenbaum@Sun.COM 20311935SMark.Shellenbaum@Sun.COM if (dump_bytes(ba, ba->drr, sizeof (dmu_replay_record_t))) 20411935SMark.Shellenbaum@Sun.COM return (EINTR); 20511935SMark.Shellenbaum@Sun.COM if (dump_bytes(ba, data, blksz)) 20611935SMark.Shellenbaum@Sun.COM return (EINTR); 20711935SMark.Shellenbaum@Sun.COM return (0); 20811935SMark.Shellenbaum@Sun.COM } 20911935SMark.Shellenbaum@Sun.COM 21011935SMark.Shellenbaum@Sun.COM static int 2112743Sahrens dump_freeobjects(struct backuparg *ba, uint64_t firstobj, uint64_t numobjs) 2122743Sahrens { 21311007SLori.Alt@Sun.COM struct drr_freeobjects *drrfo = &(ba->drr->drr_u.drr_freeobjects); 21411007SLori.Alt@Sun.COM 21511007SLori.Alt@Sun.COM /* 21611007SLori.Alt@Sun.COM * If there is a pending op, but it's not PENDING_FREEOBJECTS, 21711007SLori.Alt@Sun.COM * push it out, since free block aggregation can only be done for 21811007SLori.Alt@Sun.COM * blocks of the same type (i.e., DRR_FREE records can only be 21911007SLori.Alt@Sun.COM * aggregated with other DRR_FREE records. DRR_FREEOBJECTS records 22011007SLori.Alt@Sun.COM * can only be aggregated with other DRR_FREEOBJECTS records. 22111007SLori.Alt@Sun.COM */ 22211007SLori.Alt@Sun.COM if (ba->pending_op != PENDING_NONE && 22311007SLori.Alt@Sun.COM ba->pending_op != PENDING_FREEOBJECTS) { 22411007SLori.Alt@Sun.COM if (dump_bytes(ba, ba->drr, sizeof (dmu_replay_record_t)) != 0) 22511007SLori.Alt@Sun.COM return (EINTR); 22611007SLori.Alt@Sun.COM ba->pending_op = PENDING_NONE; 22711007SLori.Alt@Sun.COM } 22811007SLori.Alt@Sun.COM if (ba->pending_op == PENDING_FREEOBJECTS) { 22911007SLori.Alt@Sun.COM /* 23011007SLori.Alt@Sun.COM * See whether this free object array can be aggregated 23111007SLori.Alt@Sun.COM * with pending one 23211007SLori.Alt@Sun.COM */ 23311007SLori.Alt@Sun.COM if (drrfo->drr_firstobj + drrfo->drr_numobjs == firstobj) { 23411007SLori.Alt@Sun.COM drrfo->drr_numobjs += numobjs; 23511007SLori.Alt@Sun.COM return (0); 23611007SLori.Alt@Sun.COM } else { 23711007SLori.Alt@Sun.COM /* can't be aggregated. Push out pending record */ 23811007SLori.Alt@Sun.COM if (dump_bytes(ba, ba->drr, 23911007SLori.Alt@Sun.COM sizeof (dmu_replay_record_t)) != 0) 24011007SLori.Alt@Sun.COM return (EINTR); 24111007SLori.Alt@Sun.COM ba->pending_op = PENDING_NONE; 24211007SLori.Alt@Sun.COM } 24311007SLori.Alt@Sun.COM } 24411007SLori.Alt@Sun.COM 2452743Sahrens /* write a FREEOBJECTS record */ 2462743Sahrens bzero(ba->drr, sizeof (dmu_replay_record_t)); 2472743Sahrens ba->drr->drr_type = DRR_FREEOBJECTS; 24811007SLori.Alt@Sun.COM drrfo->drr_firstobj = firstobj; 24911007SLori.Alt@Sun.COM drrfo->drr_numobjs = numobjs; 25011007SLori.Alt@Sun.COM drrfo->drr_toguid = ba->toguid; 2512743Sahrens 25211007SLori.Alt@Sun.COM ba->pending_op = PENDING_FREEOBJECTS; 25311007SLori.Alt@Sun.COM 2542743Sahrens return (0); 2552743Sahrens } 2562743Sahrens 2572743Sahrens static int 2582743Sahrens dump_dnode(struct backuparg *ba, uint64_t object, dnode_phys_t *dnp) 2592743Sahrens { 26011007SLori.Alt@Sun.COM struct drr_object *drro = &(ba->drr->drr_u.drr_object); 26111007SLori.Alt@Sun.COM 2622743Sahrens if (dnp == NULL || dnp->dn_type == DMU_OT_NONE) 2632743Sahrens return (dump_freeobjects(ba, object, 1)); 2642743Sahrens 26511007SLori.Alt@Sun.COM if (ba->pending_op != PENDING_NONE) { 26611007SLori.Alt@Sun.COM if (dump_bytes(ba, ba->drr, sizeof (dmu_replay_record_t)) != 0) 26711007SLori.Alt@Sun.COM return (EINTR); 26811007SLori.Alt@Sun.COM ba->pending_op = PENDING_NONE; 26911007SLori.Alt@Sun.COM } 27011007SLori.Alt@Sun.COM 2712743Sahrens /* write an OBJECT record */ 2722743Sahrens bzero(ba->drr, sizeof (dmu_replay_record_t)); 2732743Sahrens ba->drr->drr_type = DRR_OBJECT; 27411007SLori.Alt@Sun.COM drro->drr_object = object; 27511007SLori.Alt@Sun.COM drro->drr_type = dnp->dn_type; 27611007SLori.Alt@Sun.COM drro->drr_bonustype = dnp->dn_bonustype; 27711007SLori.Alt@Sun.COM drro->drr_blksz = dnp->dn_datablkszsec << SPA_MINBLOCKSHIFT; 27811007SLori.Alt@Sun.COM drro->drr_bonuslen = dnp->dn_bonuslen; 27911007SLori.Alt@Sun.COM drro->drr_checksumtype = dnp->dn_checksum; 28011007SLori.Alt@Sun.COM drro->drr_compress = dnp->dn_compress; 28111007SLori.Alt@Sun.COM drro->drr_toguid = ba->toguid; 2822743Sahrens 28311007SLori.Alt@Sun.COM if (dump_bytes(ba, ba->drr, sizeof (dmu_replay_record_t)) != 0) 2842743Sahrens return (EINTR); 2852743Sahrens 28611007SLori.Alt@Sun.COM if (dump_bytes(ba, DN_BONUS(dnp), P2ROUNDUP(dnp->dn_bonuslen, 8)) != 0) 2872743Sahrens return (EINTR); 2882743Sahrens 2892743Sahrens /* free anything past the end of the file */ 2902743Sahrens if (dump_free(ba, object, (dnp->dn_maxblkid + 1) * 2912743Sahrens (dnp->dn_datablkszsec << SPA_MINBLOCKSHIFT), -1ULL)) 2922743Sahrens return (EINTR); 2932743Sahrens if (ba->err) 2942743Sahrens return (EINTR); 2952743Sahrens return (0); 2962743Sahrens } 2972743Sahrens 2982743Sahrens #define BP_SPAN(dnp, level) \ 2992743Sahrens (((uint64_t)dnp->dn_datablkszsec) << (SPA_MINBLOCKSHIFT + \ 3002743Sahrens (level) * (dnp->dn_indblkshift - SPA_BLKPTRSHIFT))) 3012743Sahrens 30210922SJeff.Bonwick@Sun.COM /* ARGSUSED */ 3032743Sahrens static int 30410922SJeff.Bonwick@Sun.COM backup_cb(spa_t *spa, zilog_t *zilog, const blkptr_t *bp, 30510922SJeff.Bonwick@Sun.COM const zbookmark_t *zb, const dnode_phys_t *dnp, void *arg) 3062743Sahrens { 3072743Sahrens struct backuparg *ba = arg; 3082743Sahrens dmu_object_type_t type = bp ? BP_GET_TYPE(bp) : DMU_OT_NONE; 3092743Sahrens int err = 0; 3102743Sahrens 3112743Sahrens if (issig(JUSTLOOKING) && issig(FORREAL)) 3122743Sahrens return (EINTR); 3132743Sahrens 31410922SJeff.Bonwick@Sun.COM if (zb->zb_object != DMU_META_DNODE_OBJECT && 31510922SJeff.Bonwick@Sun.COM DMU_OBJECT_IS_SPECIAL(zb->zb_object)) { 3169396SMatthew.Ahrens@Sun.COM return (0); 31710922SJeff.Bonwick@Sun.COM } else if (bp == NULL && zb->zb_object == DMU_META_DNODE_OBJECT) { 3187837SMatthew.Ahrens@Sun.COM uint64_t span = BP_SPAN(dnp, zb->zb_level); 3197837SMatthew.Ahrens@Sun.COM uint64_t dnobj = (zb->zb_blkid * span) >> DNODE_SHIFT; 3202743Sahrens err = dump_freeobjects(ba, dnobj, span >> DNODE_SHIFT); 3212743Sahrens } else if (bp == NULL) { 3227837SMatthew.Ahrens@Sun.COM uint64_t span = BP_SPAN(dnp, zb->zb_level); 3237837SMatthew.Ahrens@Sun.COM err = dump_free(ba, zb->zb_object, zb->zb_blkid * span, span); 3247837SMatthew.Ahrens@Sun.COM } else if (zb->zb_level > 0 || type == DMU_OT_OBJSET) { 3257837SMatthew.Ahrens@Sun.COM return (0); 3267837SMatthew.Ahrens@Sun.COM } else if (type == DMU_OT_DNODE) { 3277837SMatthew.Ahrens@Sun.COM dnode_phys_t *blk; 3282743Sahrens int i; 3292743Sahrens int blksz = BP_GET_LSIZE(bp); 3307837SMatthew.Ahrens@Sun.COM uint32_t aflags = ARC_WAIT; 3317837SMatthew.Ahrens@Sun.COM arc_buf_t *abuf; 3322743Sahrens 3337837SMatthew.Ahrens@Sun.COM if (arc_read_nolock(NULL, spa, bp, 3347837SMatthew.Ahrens@Sun.COM arc_getbuf_func, &abuf, ZIO_PRIORITY_ASYNC_READ, 3357837SMatthew.Ahrens@Sun.COM ZIO_FLAG_CANFAIL, &aflags, zb) != 0) 3367837SMatthew.Ahrens@Sun.COM return (EIO); 3377837SMatthew.Ahrens@Sun.COM 3387837SMatthew.Ahrens@Sun.COM blk = abuf->b_data; 3392743Sahrens for (i = 0; i < blksz >> DNODE_SHIFT; i++) { 3407837SMatthew.Ahrens@Sun.COM uint64_t dnobj = (zb->zb_blkid << 3417837SMatthew.Ahrens@Sun.COM (DNODE_BLOCK_SHIFT - DNODE_SHIFT)) + i; 3422743Sahrens err = dump_dnode(ba, dnobj, blk+i); 3432743Sahrens if (err) 3442743Sahrens break; 3452743Sahrens } 3467837SMatthew.Ahrens@Sun.COM (void) arc_buf_remove_ref(abuf, &abuf); 34711935SMark.Shellenbaum@Sun.COM } else if (type == DMU_OT_SA) { 34811935SMark.Shellenbaum@Sun.COM uint32_t aflags = ARC_WAIT; 34911935SMark.Shellenbaum@Sun.COM arc_buf_t *abuf; 35011935SMark.Shellenbaum@Sun.COM int blksz = BP_GET_LSIZE(bp); 35111935SMark.Shellenbaum@Sun.COM 35211935SMark.Shellenbaum@Sun.COM if (arc_read_nolock(NULL, spa, bp, 35311935SMark.Shellenbaum@Sun.COM arc_getbuf_func, &abuf, ZIO_PRIORITY_ASYNC_READ, 35411935SMark.Shellenbaum@Sun.COM ZIO_FLAG_CANFAIL, &aflags, zb) != 0) 35511935SMark.Shellenbaum@Sun.COM return (EIO); 35611935SMark.Shellenbaum@Sun.COM 35711935SMark.Shellenbaum@Sun.COM err = dump_spill(ba, zb->zb_object, blksz, abuf->b_data); 35811935SMark.Shellenbaum@Sun.COM (void) arc_buf_remove_ref(abuf, &abuf); 3597837SMatthew.Ahrens@Sun.COM } else { /* it's a level-0 block of a regular object */ 3607837SMatthew.Ahrens@Sun.COM uint32_t aflags = ARC_WAIT; 3617837SMatthew.Ahrens@Sun.COM arc_buf_t *abuf; 3622743Sahrens int blksz = BP_GET_LSIZE(bp); 3632743Sahrens 3647837SMatthew.Ahrens@Sun.COM if (arc_read_nolock(NULL, spa, bp, 3657837SMatthew.Ahrens@Sun.COM arc_getbuf_func, &abuf, ZIO_PRIORITY_ASYNC_READ, 3667837SMatthew.Ahrens@Sun.COM ZIO_FLAG_CANFAIL, &aflags, zb) != 0) 3677837SMatthew.Ahrens@Sun.COM return (EIO); 3682743Sahrens 3697837SMatthew.Ahrens@Sun.COM err = dump_data(ba, type, zb->zb_object, zb->zb_blkid * blksz, 37011381SLori.Alt@Sun.COM blksz, bp, abuf->b_data); 3717837SMatthew.Ahrens@Sun.COM (void) arc_buf_remove_ref(abuf, &abuf); 3722743Sahrens } 3732743Sahrens 3742743Sahrens ASSERT(err == 0 || err == EINTR); 3752743Sahrens return (err); 3762743Sahrens } 3772743Sahrens 3782743Sahrens int 3795367Sahrens dmu_sendbackup(objset_t *tosnap, objset_t *fromsnap, boolean_t fromorigin, 3805367Sahrens vnode_t *vp, offset_t *off) 3812743Sahrens { 38210298SMatthew.Ahrens@Sun.COM dsl_dataset_t *ds = tosnap->os_dsl_dataset; 38310298SMatthew.Ahrens@Sun.COM dsl_dataset_t *fromds = fromsnap ? fromsnap->os_dsl_dataset : NULL; 3842743Sahrens dmu_replay_record_t *drr; 3852743Sahrens struct backuparg ba; 3862743Sahrens int err; 3875367Sahrens uint64_t fromtxg = 0; 3882743Sahrens 3892743Sahrens /* tosnap must be a snapshot */ 3902743Sahrens if (ds->ds_phys->ds_next_snap_obj == 0) 3912743Sahrens return (EINVAL); 3922743Sahrens 3932743Sahrens /* fromsnap must be an earlier snapshot from the same fs as tosnap */ 3942743Sahrens if (fromds && (ds->ds_dir != fromds->ds_dir || 3955367Sahrens fromds->ds_phys->ds_creation_txg >= ds->ds_phys->ds_creation_txg)) 3962743Sahrens return (EXDEV); 3972743Sahrens 3985367Sahrens if (fromorigin) { 3997046Sahrens dsl_pool_t *dp = ds->ds_dir->dd_pool; 4007046Sahrens 4015367Sahrens if (fromsnap) 4025367Sahrens return (EINVAL); 4035367Sahrens 4047046Sahrens if (dsl_dir_is_clone(ds->ds_dir)) { 4055367Sahrens rw_enter(&dp->dp_config_rwlock, RW_READER); 4066689Smaybee err = dsl_dataset_hold_obj(dp, 4076689Smaybee ds->ds_dir->dd_phys->dd_origin_obj, FTAG, &fromds); 4085367Sahrens rw_exit(&dp->dp_config_rwlock); 4095367Sahrens if (err) 4105367Sahrens return (err); 4115367Sahrens } else { 4125367Sahrens fromorigin = B_FALSE; 4135367Sahrens } 4145367Sahrens } 4155367Sahrens 4165367Sahrens 4172743Sahrens drr = kmem_zalloc(sizeof (dmu_replay_record_t), KM_SLEEP); 4182743Sahrens drr->drr_type = DRR_BEGIN; 4192743Sahrens drr->drr_u.drr_begin.drr_magic = DMU_BACKUP_MAGIC; 42011007SLori.Alt@Sun.COM DMU_SET_STREAM_HDRTYPE(drr->drr_u.drr_begin.drr_versioninfo, 42111007SLori.Alt@Sun.COM DMU_SUBSTREAM); 42212070SMark.Shellenbaum@Sun.COM 42312070SMark.Shellenbaum@Sun.COM #ifdef _KERNEL 42412070SMark.Shellenbaum@Sun.COM if (dmu_objset_type(tosnap) == DMU_OST_ZFS) { 42512070SMark.Shellenbaum@Sun.COM uint64_t version; 42612070SMark.Shellenbaum@Sun.COM if (zfs_get_zplprop(tosnap, ZFS_PROP_VERSION, &version) != 0) 42712070SMark.Shellenbaum@Sun.COM return (EINVAL); 42812070SMark.Shellenbaum@Sun.COM if (version == ZPL_VERSION_SA) { 42912070SMark.Shellenbaum@Sun.COM DMU_SET_FEATUREFLAGS( 43012070SMark.Shellenbaum@Sun.COM drr->drr_u.drr_begin.drr_versioninfo, 43112070SMark.Shellenbaum@Sun.COM DMU_BACKUP_FEATURE_SA_SPILL); 43212070SMark.Shellenbaum@Sun.COM } 43312070SMark.Shellenbaum@Sun.COM } 43412070SMark.Shellenbaum@Sun.COM #endif 43512070SMark.Shellenbaum@Sun.COM 4362743Sahrens drr->drr_u.drr_begin.drr_creation_time = 4372743Sahrens ds->ds_phys->ds_creation_time; 43810298SMatthew.Ahrens@Sun.COM drr->drr_u.drr_begin.drr_type = tosnap->os_phys->os_type; 4395367Sahrens if (fromorigin) 4405367Sahrens drr->drr_u.drr_begin.drr_flags |= DRR_FLAG_CLONE; 4412743Sahrens drr->drr_u.drr_begin.drr_toguid = ds->ds_phys->ds_guid; 4426492Stimh if (ds->ds_phys->ds_flags & DS_FLAG_CI_DATASET) 4436492Stimh drr->drr_u.drr_begin.drr_flags |= DRR_FLAG_CI_DATA; 4446492Stimh 4452743Sahrens if (fromds) 4462743Sahrens drr->drr_u.drr_begin.drr_fromguid = fromds->ds_phys->ds_guid; 4472743Sahrens dsl_dataset_name(ds, drr->drr_u.drr_begin.drr_toname); 4482743Sahrens 4495367Sahrens if (fromds) 4505367Sahrens fromtxg = fromds->ds_phys->ds_creation_txg; 4515367Sahrens if (fromorigin) 4526689Smaybee dsl_dataset_rele(fromds, FTAG); 4535367Sahrens 4542743Sahrens ba.drr = drr; 4552743Sahrens ba.vp = vp; 4562743Sahrens ba.os = tosnap; 4575367Sahrens ba.off = off; 45811007SLori.Alt@Sun.COM ba.toguid = ds->ds_phys->ds_guid; 4592743Sahrens ZIO_SET_CHECKSUM(&ba.zc, 0, 0, 0, 0); 46011007SLori.Alt@Sun.COM ba.pending_op = PENDING_NONE; 4612743Sahrens 46211007SLori.Alt@Sun.COM if (dump_bytes(&ba, drr, sizeof (dmu_replay_record_t)) != 0) { 4632743Sahrens kmem_free(drr, sizeof (dmu_replay_record_t)); 4642743Sahrens return (ba.err); 4652743Sahrens } 4662743Sahrens 4677837SMatthew.Ahrens@Sun.COM err = traverse_dataset(ds, fromtxg, TRAVERSE_PRE | TRAVERSE_PREFETCH, 4682743Sahrens backup_cb, &ba); 4692743Sahrens 47011007SLori.Alt@Sun.COM if (ba.pending_op != PENDING_NONE) 47111007SLori.Alt@Sun.COM if (dump_bytes(&ba, drr, sizeof (dmu_replay_record_t)) != 0) 47211007SLori.Alt@Sun.COM err = EINTR; 47311007SLori.Alt@Sun.COM 4742743Sahrens if (err) { 4752743Sahrens if (err == EINTR && ba.err) 4762743Sahrens err = ba.err; 4773655Sgw25295 kmem_free(drr, sizeof (dmu_replay_record_t)); 4782743Sahrens return (err); 4792743Sahrens } 4802743Sahrens 4812743Sahrens bzero(drr, sizeof (dmu_replay_record_t)); 4822743Sahrens drr->drr_type = DRR_END; 4832743Sahrens drr->drr_u.drr_end.drr_checksum = ba.zc; 48411007SLori.Alt@Sun.COM drr->drr_u.drr_end.drr_toguid = ba.toguid; 4852743Sahrens 48611007SLori.Alt@Sun.COM if (dump_bytes(&ba, drr, sizeof (dmu_replay_record_t)) != 0) { 4873655Sgw25295 kmem_free(drr, sizeof (dmu_replay_record_t)); 4882743Sahrens return (ba.err); 4893655Sgw25295 } 4902743Sahrens 4912743Sahrens kmem_free(drr, sizeof (dmu_replay_record_t)); 4922743Sahrens 4932743Sahrens return (0); 4942743Sahrens } 4952743Sahrens 4965367Sahrens struct recvbeginsyncarg { 4975367Sahrens const char *tofs; 4985367Sahrens const char *tosnap; 4995367Sahrens dsl_dataset_t *origin; 5005367Sahrens uint64_t fromguid; 5015367Sahrens dmu_objset_type_t type; 5025367Sahrens void *tag; 5035367Sahrens boolean_t force; 5046492Stimh uint64_t dsflags; 5055367Sahrens char clonelastname[MAXNAMELEN]; 5065367Sahrens dsl_dataset_t *ds; /* the ds to recv into; returned from the syncfunc */ 5072743Sahrens }; 5082743Sahrens 5095367Sahrens /* ARGSUSED */ 5102743Sahrens static int 51110272SMatthew.Ahrens@Sun.COM recv_new_check(void *arg1, void *arg2, dmu_tx_t *tx) 5125367Sahrens { 5135367Sahrens dsl_dir_t *dd = arg1; 5145367Sahrens struct recvbeginsyncarg *rbsa = arg2; 5155367Sahrens objset_t *mos = dd->dd_pool->dp_meta_objset; 5165367Sahrens uint64_t val; 5175367Sahrens int err; 5185367Sahrens 5195367Sahrens err = zap_lookup(mos, dd->dd_phys->dd_child_dir_zapobj, 5205367Sahrens strrchr(rbsa->tofs, '/') + 1, sizeof (uint64_t), 1, &val); 5215367Sahrens 5225367Sahrens if (err != ENOENT) 5235367Sahrens return (err ? err : EEXIST); 5245367Sahrens 5255367Sahrens if (rbsa->origin) { 5265367Sahrens /* make sure it's a snap in the same pool */ 5275367Sahrens if (rbsa->origin->ds_dir->dd_pool != dd->dd_pool) 5285367Sahrens return (EXDEV); 52910272SMatthew.Ahrens@Sun.COM if (!dsl_dataset_is_snapshot(rbsa->origin)) 5305367Sahrens return (EINVAL); 5315367Sahrens if (rbsa->origin->ds_phys->ds_guid != rbsa->fromguid) 5325367Sahrens return (ENODEV); 5335367Sahrens } 5345367Sahrens 5355367Sahrens return (0); 5365367Sahrens } 5375367Sahrens 5385367Sahrens static void 53910272SMatthew.Ahrens@Sun.COM recv_new_sync(void *arg1, void *arg2, cred_t *cr, dmu_tx_t *tx) 5405367Sahrens { 5415367Sahrens dsl_dir_t *dd = arg1; 5425367Sahrens struct recvbeginsyncarg *rbsa = arg2; 5436689Smaybee uint64_t flags = DS_FLAG_INCONSISTENT | rbsa->dsflags; 5445367Sahrens uint64_t dsobj; 5455367Sahrens 54610272SMatthew.Ahrens@Sun.COM /* Create and open new dataset. */ 5475367Sahrens dsobj = dsl_dataset_create_sync(dd, strrchr(rbsa->tofs, '/') + 1, 5486492Stimh rbsa->origin, flags, cr, tx); 54910272SMatthew.Ahrens@Sun.COM VERIFY(0 == dsl_dataset_own_obj(dd->dd_pool, dsobj, 55010298SMatthew.Ahrens@Sun.COM B_TRUE, dmu_recv_tag, &rbsa->ds)); 5515367Sahrens 55210272SMatthew.Ahrens@Sun.COM if (rbsa->origin == NULL) { 55310272SMatthew.Ahrens@Sun.COM (void) dmu_objset_create_impl(dd->dd_pool->dp_spa, 55410272SMatthew.Ahrens@Sun.COM rbsa->ds, &rbsa->ds->ds_phys->ds_bp, rbsa->type, tx); 5555367Sahrens } 5565367Sahrens 55710272SMatthew.Ahrens@Sun.COM spa_history_internal_log(LOG_DS_REPLAY_FULL_SYNC, 55810272SMatthew.Ahrens@Sun.COM dd->dd_pool->dp_spa, tx, cr, "dataset = %lld", dsobj); 5595367Sahrens } 5605367Sahrens 5615367Sahrens /* ARGSUSED */ 5625367Sahrens static int 56310272SMatthew.Ahrens@Sun.COM recv_existing_check(void *arg1, void *arg2, dmu_tx_t *tx) 5645367Sahrens { 5655367Sahrens dsl_dataset_t *ds = arg1; 5665367Sahrens struct recvbeginsyncarg *rbsa = arg2; 5672743Sahrens int err; 5682743Sahrens uint64_t val; 5692743Sahrens 5705367Sahrens /* must not have any changes since most recent snapshot */ 5715367Sahrens if (!rbsa->force && dsl_dataset_modified_since_lastsnap(ds)) 5725367Sahrens return (ETXTBSY); 5735367Sahrens 57410272SMatthew.Ahrens@Sun.COM if (rbsa->fromguid) { 57510272SMatthew.Ahrens@Sun.COM /* if incremental, most recent snapshot must match fromguid */ 57610272SMatthew.Ahrens@Sun.COM if (ds->ds_prev == NULL) 57710272SMatthew.Ahrens@Sun.COM return (ENODEV); 57811022STom.Erickson@Sun.COM 57911022STom.Erickson@Sun.COM /* 58011022STom.Erickson@Sun.COM * most recent snapshot must match fromguid, or there are no 58111022STom.Erickson@Sun.COM * changes since the fromguid one 58211022STom.Erickson@Sun.COM */ 58311022STom.Erickson@Sun.COM if (ds->ds_prev->ds_phys->ds_guid != rbsa->fromguid) { 58411022STom.Erickson@Sun.COM uint64_t birth = ds->ds_prev->ds_phys->ds_bp.blk_birth; 58511022STom.Erickson@Sun.COM uint64_t obj = ds->ds_prev->ds_phys->ds_prev_snap_obj; 58611022STom.Erickson@Sun.COM while (obj != 0) { 58711022STom.Erickson@Sun.COM dsl_dataset_t *snap; 58811022STom.Erickson@Sun.COM err = dsl_dataset_hold_obj(ds->ds_dir->dd_pool, 58911022STom.Erickson@Sun.COM obj, FTAG, &snap); 59011022STom.Erickson@Sun.COM if (err) 59111022STom.Erickson@Sun.COM return (ENODEV); 59211022STom.Erickson@Sun.COM if (snap->ds_phys->ds_creation_txg < birth) { 59311022STom.Erickson@Sun.COM dsl_dataset_rele(snap, FTAG); 59411022STom.Erickson@Sun.COM return (ENODEV); 59511022STom.Erickson@Sun.COM } 59611022STom.Erickson@Sun.COM if (snap->ds_phys->ds_guid == rbsa->fromguid) { 59711022STom.Erickson@Sun.COM dsl_dataset_rele(snap, FTAG); 59811022STom.Erickson@Sun.COM break; /* it's ok */ 59911022STom.Erickson@Sun.COM } 60011022STom.Erickson@Sun.COM obj = snap->ds_phys->ds_prev_snap_obj; 60111022STom.Erickson@Sun.COM dsl_dataset_rele(snap, FTAG); 60211022STom.Erickson@Sun.COM } 60311022STom.Erickson@Sun.COM if (obj == 0) 60411022STom.Erickson@Sun.COM return (ENODEV); 60511022STom.Erickson@Sun.COM } 60610272SMatthew.Ahrens@Sun.COM } else { 60710272SMatthew.Ahrens@Sun.COM /* if full, most recent snapshot must be $ORIGIN */ 60810272SMatthew.Ahrens@Sun.COM if (ds->ds_phys->ds_prev_snap_txg >= TXG_INITIAL) 60910272SMatthew.Ahrens@Sun.COM return (ENODEV); 61010272SMatthew.Ahrens@Sun.COM } 6112743Sahrens 6126083Sek110237 /* temporary clone name must not exist */ 6136083Sek110237 err = zap_lookup(ds->ds_dir->dd_pool->dp_meta_objset, 6146083Sek110237 ds->ds_dir->dd_phys->dd_child_dir_zapobj, 6156083Sek110237 rbsa->clonelastname, 8, 1, &val); 6166083Sek110237 if (err == 0) 6176083Sek110237 return (EEXIST); 6186083Sek110237 if (err != ENOENT) 6196083Sek110237 return (err); 6206083Sek110237 6212743Sahrens /* new snapshot name must not exist */ 6225367Sahrens err = zap_lookup(ds->ds_dir->dd_pool->dp_meta_objset, 6235367Sahrens ds->ds_phys->ds_snapnames_zapobj, rbsa->tosnap, 8, 1, &val); 6245367Sahrens if (err == 0) 6252743Sahrens return (EEXIST); 6262743Sahrens if (err != ENOENT) 6275367Sahrens return (err); 6282743Sahrens return (0); 6292743Sahrens } 6302743Sahrens 6312743Sahrens /* ARGSUSED */ 6325367Sahrens static void 63310272SMatthew.Ahrens@Sun.COM recv_existing_sync(void *arg1, void *arg2, cred_t *cr, dmu_tx_t *tx) 6345326Sek110237 { 6355367Sahrens dsl_dataset_t *ohds = arg1; 6365367Sahrens struct recvbeginsyncarg *rbsa = arg2; 6375367Sahrens dsl_pool_t *dp = ohds->ds_dir->dd_pool; 63810272SMatthew.Ahrens@Sun.COM dsl_dataset_t *cds; 6396689Smaybee uint64_t flags = DS_FLAG_INCONSISTENT | rbsa->dsflags; 6405367Sahrens uint64_t dsobj; 6415326Sek110237 64210272SMatthew.Ahrens@Sun.COM /* create and open the temporary clone */ 64310272SMatthew.Ahrens@Sun.COM dsobj = dsl_dataset_create_sync(ohds->ds_dir, rbsa->clonelastname, 64410272SMatthew.Ahrens@Sun.COM ohds->ds_prev, flags, cr, tx); 64510298SMatthew.Ahrens@Sun.COM VERIFY(0 == dsl_dataset_own_obj(dp, dsobj, B_TRUE, dmu_recv_tag, &cds)); 6465367Sahrens 64710272SMatthew.Ahrens@Sun.COM /* 64810272SMatthew.Ahrens@Sun.COM * If we actually created a non-clone, we need to create the 64910272SMatthew.Ahrens@Sun.COM * objset in our new dataset. 65010272SMatthew.Ahrens@Sun.COM */ 65110272SMatthew.Ahrens@Sun.COM if (BP_IS_HOLE(dsl_dataset_get_blkptr(cds))) { 65210272SMatthew.Ahrens@Sun.COM (void) dmu_objset_create_impl(dp->dp_spa, 65310272SMatthew.Ahrens@Sun.COM cds, dsl_dataset_get_blkptr(cds), rbsa->type, tx); 65410272SMatthew.Ahrens@Sun.COM } 65510272SMatthew.Ahrens@Sun.COM 6565367Sahrens rbsa->ds = cds; 6575367Sahrens 6585367Sahrens spa_history_internal_log(LOG_DS_REPLAY_INC_SYNC, 6596689Smaybee dp->dp_spa, tx, cr, "dataset = %lld", dsobj); 6605326Sek110237 } 6615326Sek110237 66212070SMark.Shellenbaum@Sun.COM 66312070SMark.Shellenbaum@Sun.COM static boolean_t 66412070SMark.Shellenbaum@Sun.COM dmu_recv_verify_features(dsl_dataset_t *ds, struct drr_begin *drrb) 66512070SMark.Shellenbaum@Sun.COM { 66612070SMark.Shellenbaum@Sun.COM int featureflags; 66712070SMark.Shellenbaum@Sun.COM 66812070SMark.Shellenbaum@Sun.COM featureflags = DMU_GET_FEATUREFLAGS(drrb->drr_versioninfo); 66912070SMark.Shellenbaum@Sun.COM 67012070SMark.Shellenbaum@Sun.COM /* Verify pool version supports SA if SA_SPILL feature set */ 67112070SMark.Shellenbaum@Sun.COM return ((featureflags & DMU_BACKUP_FEATURE_SA_SPILL) && 67212070SMark.Shellenbaum@Sun.COM (spa_version(dsl_dataset_get_spa(ds)) < SPA_VERSION_SA)); 67312070SMark.Shellenbaum@Sun.COM } 67412070SMark.Shellenbaum@Sun.COM 6755367Sahrens /* 6765367Sahrens * NB: callers *MUST* call dmu_recv_stream() if dmu_recv_begin() 6775367Sahrens * succeeds; otherwise we will leak the holds on the datasets. 6785367Sahrens */ 6795367Sahrens int 68011007SLori.Alt@Sun.COM dmu_recv_begin(char *tofs, char *tosnap, char *top_ds, struct drr_begin *drrb, 68110204SMatthew.Ahrens@Sun.COM boolean_t force, objset_t *origin, dmu_recv_cookie_t *drc) 6822743Sahrens { 6835367Sahrens int err = 0; 6845367Sahrens boolean_t byteswap; 68510272SMatthew.Ahrens@Sun.COM struct recvbeginsyncarg rbsa = { 0 }; 68611007SLori.Alt@Sun.COM uint64_t versioninfo; 6875367Sahrens int flags; 6885367Sahrens dsl_dataset_t *ds; 6895367Sahrens 6905367Sahrens if (drrb->drr_magic == DMU_BACKUP_MAGIC) 6915367Sahrens byteswap = FALSE; 6925367Sahrens else if (drrb->drr_magic == BSWAP_64(DMU_BACKUP_MAGIC)) 6935367Sahrens byteswap = TRUE; 6945367Sahrens else 6955367Sahrens return (EINVAL); 6965367Sahrens 6975367Sahrens rbsa.tofs = tofs; 6985367Sahrens rbsa.tosnap = tosnap; 69910298SMatthew.Ahrens@Sun.COM rbsa.origin = origin ? origin->os_dsl_dataset : NULL; 7005367Sahrens rbsa.fromguid = drrb->drr_fromguid; 7015367Sahrens rbsa.type = drrb->drr_type; 7025367Sahrens rbsa.tag = FTAG; 7036492Stimh rbsa.dsflags = 0; 70411007SLori.Alt@Sun.COM versioninfo = drrb->drr_versioninfo; 7055367Sahrens flags = drrb->drr_flags; 7065367Sahrens 7075367Sahrens if (byteswap) { 7085367Sahrens rbsa.type = BSWAP_32(rbsa.type); 7095367Sahrens rbsa.fromguid = BSWAP_64(rbsa.fromguid); 71011007SLori.Alt@Sun.COM versioninfo = BSWAP_64(versioninfo); 7115367Sahrens flags = BSWAP_32(flags); 7125367Sahrens } 7135367Sahrens 71411007SLori.Alt@Sun.COM if (DMU_GET_STREAM_HDRTYPE(versioninfo) == DMU_COMPOUNDSTREAM || 7155367Sahrens rbsa.type >= DMU_OST_NUMTYPES || 7165367Sahrens ((flags & DRR_FLAG_CLONE) && origin == NULL)) 7175367Sahrens return (EINVAL); 7185367Sahrens 7196492Stimh if (flags & DRR_FLAG_CI_DATA) 7206492Stimh rbsa.dsflags = DS_FLAG_CI_DATASET; 7216492Stimh 7225367Sahrens bzero(drc, sizeof (dmu_recv_cookie_t)); 7235367Sahrens drc->drc_drrb = drrb; 7245367Sahrens drc->drc_tosnap = tosnap; 72511007SLori.Alt@Sun.COM drc->drc_top_ds = top_ds; 7265367Sahrens drc->drc_force = force; 7275367Sahrens 7285367Sahrens /* 7295367Sahrens * Process the begin in syncing context. 7305367Sahrens */ 73110272SMatthew.Ahrens@Sun.COM 73210272SMatthew.Ahrens@Sun.COM /* open the dataset we are logically receiving into */ 73310272SMatthew.Ahrens@Sun.COM err = dsl_dataset_hold(tofs, dmu_recv_tag, &ds); 73410272SMatthew.Ahrens@Sun.COM if (err == 0) { 73512070SMark.Shellenbaum@Sun.COM if (dmu_recv_verify_features(ds, drrb)) { 73612070SMark.Shellenbaum@Sun.COM dsl_dataset_rele(ds, dmu_recv_tag); 73712070SMark.Shellenbaum@Sun.COM return (ENOTSUP); 73812070SMark.Shellenbaum@Sun.COM } 73910272SMatthew.Ahrens@Sun.COM /* target fs already exists; recv into temp clone */ 7405367Sahrens 74110272SMatthew.Ahrens@Sun.COM /* Can't recv a clone into an existing fs */ 74210272SMatthew.Ahrens@Sun.COM if (flags & DRR_FLAG_CLONE) { 74310272SMatthew.Ahrens@Sun.COM dsl_dataset_rele(ds, dmu_recv_tag); 74410272SMatthew.Ahrens@Sun.COM return (EINVAL); 74510272SMatthew.Ahrens@Sun.COM } 7462743Sahrens 74710204SMatthew.Ahrens@Sun.COM /* must not have an incremental recv already in progress */ 74810204SMatthew.Ahrens@Sun.COM if (!mutex_tryenter(&ds->ds_recvlock)) { 74910204SMatthew.Ahrens@Sun.COM dsl_dataset_rele(ds, dmu_recv_tag); 75010204SMatthew.Ahrens@Sun.COM return (EBUSY); 75110204SMatthew.Ahrens@Sun.COM } 75210204SMatthew.Ahrens@Sun.COM 75310272SMatthew.Ahrens@Sun.COM /* tmp clone name is: tofs/%tosnap" */ 75410272SMatthew.Ahrens@Sun.COM (void) snprintf(rbsa.clonelastname, sizeof (rbsa.clonelastname), 75510272SMatthew.Ahrens@Sun.COM "%%%s", tosnap); 7565367Sahrens rbsa.force = force; 7575367Sahrens err = dsl_sync_task_do(ds->ds_dir->dd_pool, 75810272SMatthew.Ahrens@Sun.COM recv_existing_check, recv_existing_sync, ds, &rbsa, 5); 7595367Sahrens if (err) { 76010204SMatthew.Ahrens@Sun.COM mutex_exit(&ds->ds_recvlock); 7616689Smaybee dsl_dataset_rele(ds, dmu_recv_tag); 7625367Sahrens return (err); 7635367Sahrens } 7645367Sahrens drc->drc_logical_ds = ds; 7655367Sahrens drc->drc_real_ds = rbsa.ds; 76610272SMatthew.Ahrens@Sun.COM } else if (err == ENOENT) { 76710272SMatthew.Ahrens@Sun.COM /* target fs does not exist; must be a full backup or clone */ 76810272SMatthew.Ahrens@Sun.COM char *cp; 7695367Sahrens 77010272SMatthew.Ahrens@Sun.COM /* 77110272SMatthew.Ahrens@Sun.COM * If it's a non-clone incremental, we are missing the 77210272SMatthew.Ahrens@Sun.COM * target fs, so fail the recv. 77310272SMatthew.Ahrens@Sun.COM */ 77410272SMatthew.Ahrens@Sun.COM if (rbsa.fromguid && !(flags & DRR_FLAG_CLONE)) 77510272SMatthew.Ahrens@Sun.COM return (ENOENT); 77610272SMatthew.Ahrens@Sun.COM 77710272SMatthew.Ahrens@Sun.COM /* Open the parent of tofs */ 77810272SMatthew.Ahrens@Sun.COM cp = strrchr(tofs, '/'); 77910272SMatthew.Ahrens@Sun.COM *cp = '\0'; 78010819SChris.Kirby@sun.com err = dsl_dataset_hold(tofs, FTAG, &ds); 78110272SMatthew.Ahrens@Sun.COM *cp = '/'; 7825367Sahrens if (err) 7835367Sahrens return (err); 7845367Sahrens 78512070SMark.Shellenbaum@Sun.COM if (dmu_recv_verify_features(ds, drrb)) { 78612070SMark.Shellenbaum@Sun.COM dsl_dataset_rele(ds, dmu_recv_tag); 78712070SMark.Shellenbaum@Sun.COM return (ENOTSUP); 78812070SMark.Shellenbaum@Sun.COM } 78912070SMark.Shellenbaum@Sun.COM 79010272SMatthew.Ahrens@Sun.COM err = dsl_sync_task_do(ds->ds_dir->dd_pool, 79110272SMatthew.Ahrens@Sun.COM recv_new_check, recv_new_sync, ds->ds_dir, &rbsa, 5); 79210819SChris.Kirby@sun.com dsl_dataset_rele(ds, FTAG); 7935367Sahrens if (err) 7945367Sahrens return (err); 7955367Sahrens drc->drc_logical_ds = drc->drc_real_ds = rbsa.ds; 7965367Sahrens drc->drc_newfs = B_TRUE; 7975367Sahrens } 7985367Sahrens 79910272SMatthew.Ahrens@Sun.COM return (err); 8002743Sahrens } 8012743Sahrens 8025367Sahrens struct restorearg { 8035367Sahrens int err; 8045367Sahrens int byteswap; 8055367Sahrens vnode_t *vp; 8065367Sahrens char *buf; 8075367Sahrens uint64_t voff; 8085367Sahrens int bufsize; /* amount of memory allocated for buf */ 8095367Sahrens zio_cksum_t cksum; 81011007SLori.Alt@Sun.COM avl_tree_t guid_to_ds_map; 8115326Sek110237 }; 8125326Sek110237 81311007SLori.Alt@Sun.COM typedef struct guid_map_entry { 81411007SLori.Alt@Sun.COM uint64_t guid; 81511007SLori.Alt@Sun.COM dsl_dataset_t *gme_ds; 81611007SLori.Alt@Sun.COM avl_node_t avlnode; 81711007SLori.Alt@Sun.COM } guid_map_entry_t; 81811007SLori.Alt@Sun.COM 81911007SLori.Alt@Sun.COM static int 82011007SLori.Alt@Sun.COM guid_compare(const void *arg1, const void *arg2) 82111007SLori.Alt@Sun.COM { 82211007SLori.Alt@Sun.COM const guid_map_entry_t *gmep1 = arg1; 82311007SLori.Alt@Sun.COM const guid_map_entry_t *gmep2 = arg2; 82411007SLori.Alt@Sun.COM 82511007SLori.Alt@Sun.COM if (gmep1->guid < gmep2->guid) 82611007SLori.Alt@Sun.COM return (-1); 82711007SLori.Alt@Sun.COM else if (gmep1->guid > gmep2->guid) 82811007SLori.Alt@Sun.COM return (1); 82911007SLori.Alt@Sun.COM return (0); 83011007SLori.Alt@Sun.COM } 83111007SLori.Alt@Sun.COM 83211007SLori.Alt@Sun.COM /* 83311007SLori.Alt@Sun.COM * This function is a callback used by dmu_objset_find() (which 83411007SLori.Alt@Sun.COM * enumerates the object sets) to build an avl tree that maps guids 83511007SLori.Alt@Sun.COM * to datasets. The resulting table is used when processing DRR_WRITE_BYREF 83611007SLori.Alt@Sun.COM * send stream records. These records, which are used in dedup'ed 83711007SLori.Alt@Sun.COM * streams, do not contain data themselves, but refer to a copy 83811007SLori.Alt@Sun.COM * of the data block that has already been written because it was 83911007SLori.Alt@Sun.COM * earlier in the stream. That previous copy is identified by the 84011007SLori.Alt@Sun.COM * guid of the dataset with the referenced data. 84111007SLori.Alt@Sun.COM */ 84211007SLori.Alt@Sun.COM int 84311209SMatthew.Ahrens@Sun.COM find_ds_by_guid(const char *name, void *arg) 84411007SLori.Alt@Sun.COM { 84511209SMatthew.Ahrens@Sun.COM avl_tree_t *guid_map = arg; 84611007SLori.Alt@Sun.COM dsl_dataset_t *ds, *snapds; 84711007SLori.Alt@Sun.COM guid_map_entry_t *gmep; 84811209SMatthew.Ahrens@Sun.COM dsl_pool_t *dp; 84911007SLori.Alt@Sun.COM int err; 85011007SLori.Alt@Sun.COM uint64_t lastobj, firstobj; 85111007SLori.Alt@Sun.COM 85211007SLori.Alt@Sun.COM if (dsl_dataset_hold(name, FTAG, &ds) != 0) 85311007SLori.Alt@Sun.COM return (0); 85411007SLori.Alt@Sun.COM 85511007SLori.Alt@Sun.COM dp = ds->ds_dir->dd_pool; 85611007SLori.Alt@Sun.COM rw_enter(&dp->dp_config_rwlock, RW_READER); 85711007SLori.Alt@Sun.COM firstobj = ds->ds_dir->dd_phys->dd_origin_obj; 85811007SLori.Alt@Sun.COM lastobj = ds->ds_phys->ds_prev_snap_obj; 85911007SLori.Alt@Sun.COM 86011007SLori.Alt@Sun.COM while (lastobj != firstobj) { 86111007SLori.Alt@Sun.COM err = dsl_dataset_hold_obj(dp, lastobj, guid_map, &snapds); 86211007SLori.Alt@Sun.COM if (err) { 86311007SLori.Alt@Sun.COM /* 86411007SLori.Alt@Sun.COM * Skip this snapshot and move on. It's not 86511007SLori.Alt@Sun.COM * clear why this would ever happen, but the 86611007SLori.Alt@Sun.COM * remainder of the snapshot streadm can be 86711007SLori.Alt@Sun.COM * processed. 86811007SLori.Alt@Sun.COM */ 86911007SLori.Alt@Sun.COM rw_exit(&dp->dp_config_rwlock); 87011007SLori.Alt@Sun.COM dsl_dataset_rele(ds, FTAG); 87111007SLori.Alt@Sun.COM return (0); 87211007SLori.Alt@Sun.COM } 87311007SLori.Alt@Sun.COM 87411007SLori.Alt@Sun.COM gmep = kmem_alloc(sizeof (guid_map_entry_t), KM_SLEEP); 87511007SLori.Alt@Sun.COM gmep->guid = snapds->ds_phys->ds_guid; 87611007SLori.Alt@Sun.COM gmep->gme_ds = snapds; 87711007SLori.Alt@Sun.COM avl_add(guid_map, gmep); 87811007SLori.Alt@Sun.COM lastobj = snapds->ds_phys->ds_prev_snap_obj; 87911007SLori.Alt@Sun.COM } 88011007SLori.Alt@Sun.COM 88111007SLori.Alt@Sun.COM rw_exit(&dp->dp_config_rwlock); 88211007SLori.Alt@Sun.COM dsl_dataset_rele(ds, FTAG); 88311007SLori.Alt@Sun.COM 88411007SLori.Alt@Sun.COM return (0); 88511007SLori.Alt@Sun.COM } 88611007SLori.Alt@Sun.COM 8872743Sahrens static void * 8882743Sahrens restore_read(struct restorearg *ra, int len) 8892743Sahrens { 8902743Sahrens void *rv; 8915367Sahrens int done = 0; 8922743Sahrens 8932743Sahrens /* some things will require 8-byte alignment, so everything must */ 8942743Sahrens ASSERT3U(len % 8, ==, 0); 8952743Sahrens 8965367Sahrens while (done < len) { 8972743Sahrens ssize_t resid; 8982743Sahrens 8992743Sahrens ra->err = vn_rdwr(UIO_READ, ra->vp, 9005367Sahrens (caddr_t)ra->buf + done, len - done, 9012743Sahrens ra->voff, UIO_SYSSPACE, FAPPEND, 9022743Sahrens RLIM64_INFINITY, CRED(), &resid); 9032743Sahrens 9045367Sahrens if (resid == len - done) 9052743Sahrens ra->err = EINVAL; 9065367Sahrens ra->voff += len - done - resid; 9075367Sahrens done = len - resid; 9082743Sahrens if (ra->err) 9092743Sahrens return (NULL); 9102743Sahrens } 9112743Sahrens 9125367Sahrens ASSERT3U(done, ==, len); 9135367Sahrens rv = ra->buf; 9142743Sahrens if (ra->byteswap) 9155367Sahrens fletcher_4_incremental_byteswap(rv, len, &ra->cksum); 9162743Sahrens else 9175367Sahrens fletcher_4_incremental_native(rv, len, &ra->cksum); 9182743Sahrens return (rv); 9192743Sahrens } 9202743Sahrens 9212743Sahrens static void 9222743Sahrens backup_byteswap(dmu_replay_record_t *drr) 9232743Sahrens { 9242743Sahrens #define DO64(X) (drr->drr_u.X = BSWAP_64(drr->drr_u.X)) 9252743Sahrens #define DO32(X) (drr->drr_u.X = BSWAP_32(drr->drr_u.X)) 9262743Sahrens drr->drr_type = BSWAP_32(drr->drr_type); 9275367Sahrens drr->drr_payloadlen = BSWAP_32(drr->drr_payloadlen); 9282743Sahrens switch (drr->drr_type) { 9292743Sahrens case DRR_BEGIN: 9302743Sahrens DO64(drr_begin.drr_magic); 93111007SLori.Alt@Sun.COM DO64(drr_begin.drr_versioninfo); 9322743Sahrens DO64(drr_begin.drr_creation_time); 9332743Sahrens DO32(drr_begin.drr_type); 9345367Sahrens DO32(drr_begin.drr_flags); 9352743Sahrens DO64(drr_begin.drr_toguid); 9362743Sahrens DO64(drr_begin.drr_fromguid); 9372743Sahrens break; 9382743Sahrens case DRR_OBJECT: 9392743Sahrens DO64(drr_object.drr_object); 9402743Sahrens /* DO64(drr_object.drr_allocation_txg); */ 9412743Sahrens DO32(drr_object.drr_type); 9422743Sahrens DO32(drr_object.drr_bonustype); 9432743Sahrens DO32(drr_object.drr_blksz); 9442743Sahrens DO32(drr_object.drr_bonuslen); 94511007SLori.Alt@Sun.COM DO64(drr_object.drr_toguid); 9462743Sahrens break; 9472743Sahrens case DRR_FREEOBJECTS: 9482743Sahrens DO64(drr_freeobjects.drr_firstobj); 9492743Sahrens DO64(drr_freeobjects.drr_numobjs); 95011007SLori.Alt@Sun.COM DO64(drr_freeobjects.drr_toguid); 9512743Sahrens break; 9522743Sahrens case DRR_WRITE: 9532743Sahrens DO64(drr_write.drr_object); 9542743Sahrens DO32(drr_write.drr_type); 9552743Sahrens DO64(drr_write.drr_offset); 9562743Sahrens DO64(drr_write.drr_length); 95711007SLori.Alt@Sun.COM DO64(drr_write.drr_toguid); 95811381SLori.Alt@Sun.COM DO64(drr_write.drr_key.ddk_cksum.zc_word[0]); 95911381SLori.Alt@Sun.COM DO64(drr_write.drr_key.ddk_cksum.zc_word[1]); 96011381SLori.Alt@Sun.COM DO64(drr_write.drr_key.ddk_cksum.zc_word[2]); 96111381SLori.Alt@Sun.COM DO64(drr_write.drr_key.ddk_cksum.zc_word[3]); 96211381SLori.Alt@Sun.COM DO64(drr_write.drr_key.ddk_prop); 96311007SLori.Alt@Sun.COM break; 96411007SLori.Alt@Sun.COM case DRR_WRITE_BYREF: 96511007SLori.Alt@Sun.COM DO64(drr_write_byref.drr_object); 96611007SLori.Alt@Sun.COM DO64(drr_write_byref.drr_offset); 96711007SLori.Alt@Sun.COM DO64(drr_write_byref.drr_length); 96811007SLori.Alt@Sun.COM DO64(drr_write_byref.drr_toguid); 96911007SLori.Alt@Sun.COM DO64(drr_write_byref.drr_refguid); 97011007SLori.Alt@Sun.COM DO64(drr_write_byref.drr_refobject); 97111007SLori.Alt@Sun.COM DO64(drr_write_byref.drr_refoffset); 97211381SLori.Alt@Sun.COM DO64(drr_write_byref.drr_key.ddk_cksum.zc_word[0]); 97311381SLori.Alt@Sun.COM DO64(drr_write_byref.drr_key.ddk_cksum.zc_word[1]); 97411381SLori.Alt@Sun.COM DO64(drr_write_byref.drr_key.ddk_cksum.zc_word[2]); 97511381SLori.Alt@Sun.COM DO64(drr_write_byref.drr_key.ddk_cksum.zc_word[3]); 97611381SLori.Alt@Sun.COM DO64(drr_write_byref.drr_key.ddk_prop); 9772743Sahrens break; 9782743Sahrens case DRR_FREE: 9792743Sahrens DO64(drr_free.drr_object); 9802743Sahrens DO64(drr_free.drr_offset); 9812743Sahrens DO64(drr_free.drr_length); 98211007SLori.Alt@Sun.COM DO64(drr_free.drr_toguid); 9832743Sahrens break; 98411935SMark.Shellenbaum@Sun.COM case DRR_SPILL: 98511935SMark.Shellenbaum@Sun.COM DO64(drr_spill.drr_object); 98611935SMark.Shellenbaum@Sun.COM DO64(drr_spill.drr_length); 98711935SMark.Shellenbaum@Sun.COM DO64(drr_spill.drr_toguid); 98811935SMark.Shellenbaum@Sun.COM break; 9892743Sahrens case DRR_END: 9902743Sahrens DO64(drr_end.drr_checksum.zc_word[0]); 9912743Sahrens DO64(drr_end.drr_checksum.zc_word[1]); 9922743Sahrens DO64(drr_end.drr_checksum.zc_word[2]); 9932743Sahrens DO64(drr_end.drr_checksum.zc_word[3]); 99411007SLori.Alt@Sun.COM DO64(drr_end.drr_toguid); 9952743Sahrens break; 9962743Sahrens } 9972743Sahrens #undef DO64 9982743Sahrens #undef DO32 9992743Sahrens } 10002743Sahrens 10012743Sahrens static int 10022743Sahrens restore_object(struct restorearg *ra, objset_t *os, struct drr_object *drro) 10032743Sahrens { 10042743Sahrens int err; 10052743Sahrens dmu_tx_t *tx; 10067994STim.Haley@Sun.COM void *data = NULL; 10072743Sahrens 10082743Sahrens if (drro->drr_type == DMU_OT_NONE || 10092743Sahrens drro->drr_type >= DMU_OT_NUMTYPES || 10102743Sahrens drro->drr_bonustype >= DMU_OT_NUMTYPES || 101111007SLori.Alt@Sun.COM drro->drr_checksumtype >= ZIO_CHECKSUM_FUNCTIONS || 10122743Sahrens drro->drr_compress >= ZIO_COMPRESS_FUNCTIONS || 10132743Sahrens P2PHASE(drro->drr_blksz, SPA_MINBLOCKSIZE) || 10142743Sahrens drro->drr_blksz < SPA_MINBLOCKSIZE || 10152743Sahrens drro->drr_blksz > SPA_MAXBLOCKSIZE || 10162743Sahrens drro->drr_bonuslen > DN_MAX_BONUSLEN) { 10172743Sahrens return (EINVAL); 10182743Sahrens } 10192743Sahrens 10208986SMark.Maybee@Sun.COM err = dmu_object_info(os, drro->drr_object, NULL); 10218986SMark.Maybee@Sun.COM 10228986SMark.Maybee@Sun.COM if (err != 0 && err != ENOENT) 10238986SMark.Maybee@Sun.COM return (EINVAL); 10248986SMark.Maybee@Sun.COM 10257994STim.Haley@Sun.COM if (drro->drr_bonuslen) { 10267994STim.Haley@Sun.COM data = restore_read(ra, P2ROUNDUP(drro->drr_bonuslen, 8)); 10277994STim.Haley@Sun.COM if (ra->err) 10287994STim.Haley@Sun.COM return (ra->err); 10297994STim.Haley@Sun.COM } 10307994STim.Haley@Sun.COM 10312743Sahrens if (err == ENOENT) { 10322743Sahrens /* currently free, want to be allocated */ 10338986SMark.Maybee@Sun.COM tx = dmu_tx_create(os); 10342743Sahrens dmu_tx_hold_bonus(tx, DMU_NEW_OBJECT); 10352743Sahrens err = dmu_tx_assign(tx, TXG_WAIT); 10362743Sahrens if (err) { 10372743Sahrens dmu_tx_abort(tx); 10382743Sahrens return (err); 10392743Sahrens } 10402743Sahrens err = dmu_object_claim(os, drro->drr_object, 10412743Sahrens drro->drr_type, drro->drr_blksz, 10422743Sahrens drro->drr_bonustype, drro->drr_bonuslen, tx); 10438986SMark.Maybee@Sun.COM dmu_tx_commit(tx); 10442743Sahrens } else { 10452743Sahrens /* currently allocated, want to be allocated */ 10462743Sahrens err = dmu_object_reclaim(os, drro->drr_object, 10472743Sahrens drro->drr_type, drro->drr_blksz, 10488986SMark.Maybee@Sun.COM drro->drr_bonustype, drro->drr_bonuslen); 10492743Sahrens } 105011935SMark.Shellenbaum@Sun.COM if (err) { 10518986SMark.Maybee@Sun.COM return (EINVAL); 105211935SMark.Shellenbaum@Sun.COM } 10538986SMark.Maybee@Sun.COM 10548986SMark.Maybee@Sun.COM tx = dmu_tx_create(os); 10558986SMark.Maybee@Sun.COM dmu_tx_hold_bonus(tx, drro->drr_object); 10568986SMark.Maybee@Sun.COM err = dmu_tx_assign(tx, TXG_WAIT); 10572743Sahrens if (err) { 10588986SMark.Maybee@Sun.COM dmu_tx_abort(tx); 10598986SMark.Maybee@Sun.COM return (err); 10602743Sahrens } 10612743Sahrens 106211007SLori.Alt@Sun.COM dmu_object_set_checksum(os, drro->drr_object, drro->drr_checksumtype, 106311007SLori.Alt@Sun.COM tx); 10642743Sahrens dmu_object_set_compress(os, drro->drr_object, drro->drr_compress, tx); 10652743Sahrens 10667994STim.Haley@Sun.COM if (data != NULL) { 10672743Sahrens dmu_buf_t *db; 10687994STim.Haley@Sun.COM 10692743Sahrens VERIFY(0 == dmu_bonus_hold(os, drro->drr_object, FTAG, &db)); 10702743Sahrens dmu_buf_will_dirty(db, tx); 10712743Sahrens 10724944Smaybee ASSERT3U(db->db_size, >=, drro->drr_bonuslen); 10734944Smaybee bcopy(data, db->db_data, drro->drr_bonuslen); 10742743Sahrens if (ra->byteswap) { 10752743Sahrens dmu_ot[drro->drr_bonustype].ot_byteswap(db->db_data, 10762743Sahrens drro->drr_bonuslen); 10772743Sahrens } 10782743Sahrens dmu_buf_rele(db, FTAG); 10792743Sahrens } 10802743Sahrens dmu_tx_commit(tx); 10812743Sahrens return (0); 10822743Sahrens } 10832743Sahrens 10842743Sahrens /* ARGSUSED */ 10852743Sahrens static int 10862743Sahrens restore_freeobjects(struct restorearg *ra, objset_t *os, 10872743Sahrens struct drr_freeobjects *drrfo) 10882743Sahrens { 10892743Sahrens uint64_t obj; 10902743Sahrens 10912743Sahrens if (drrfo->drr_firstobj + drrfo->drr_numobjs < drrfo->drr_firstobj) 10922743Sahrens return (EINVAL); 10932743Sahrens 10942743Sahrens for (obj = drrfo->drr_firstobj; 10953087Sahrens obj < drrfo->drr_firstobj + drrfo->drr_numobjs; 10963087Sahrens (void) dmu_object_next(os, &obj, FALSE, 0)) { 10972743Sahrens int err; 10982743Sahrens 10992743Sahrens if (dmu_object_info(os, obj, NULL) != 0) 11002743Sahrens continue; 11012743Sahrens 11026992Smaybee err = dmu_free_object(os, obj); 11036992Smaybee if (err) 11042743Sahrens return (err); 11052743Sahrens } 11062743Sahrens return (0); 11072743Sahrens } 11082743Sahrens 11092743Sahrens static int 11102743Sahrens restore_write(struct restorearg *ra, objset_t *os, 11112743Sahrens struct drr_write *drrw) 11122743Sahrens { 11132743Sahrens dmu_tx_t *tx; 11142743Sahrens void *data; 11152743Sahrens int err; 11162743Sahrens 11172743Sahrens if (drrw->drr_offset + drrw->drr_length < drrw->drr_offset || 11182743Sahrens drrw->drr_type >= DMU_OT_NUMTYPES) 11192743Sahrens return (EINVAL); 11202743Sahrens 11212743Sahrens data = restore_read(ra, drrw->drr_length); 11222743Sahrens if (data == NULL) 11232743Sahrens return (ra->err); 11242743Sahrens 11252743Sahrens if (dmu_object_info(os, drrw->drr_object, NULL) != 0) 11262743Sahrens return (EINVAL); 11272743Sahrens 11282743Sahrens tx = dmu_tx_create(os); 11292743Sahrens 11302743Sahrens dmu_tx_hold_write(tx, drrw->drr_object, 11312743Sahrens drrw->drr_offset, drrw->drr_length); 11322743Sahrens err = dmu_tx_assign(tx, TXG_WAIT); 11332743Sahrens if (err) { 11342743Sahrens dmu_tx_abort(tx); 11352743Sahrens return (err); 11362743Sahrens } 11372743Sahrens if (ra->byteswap) 11382743Sahrens dmu_ot[drrw->drr_type].ot_byteswap(data, drrw->drr_length); 11392743Sahrens dmu_write(os, drrw->drr_object, 11402743Sahrens drrw->drr_offset, drrw->drr_length, data, tx); 11412743Sahrens dmu_tx_commit(tx); 11422743Sahrens return (0); 11432743Sahrens } 11442743Sahrens 114511007SLori.Alt@Sun.COM /* 114611007SLori.Alt@Sun.COM * Handle a DRR_WRITE_BYREF record. This record is used in dedup'ed 114711007SLori.Alt@Sun.COM * streams to refer to a copy of the data that is already on the 114811007SLori.Alt@Sun.COM * system because it came in earlier in the stream. This function 114911007SLori.Alt@Sun.COM * finds the earlier copy of the data, and uses that copy instead of 115011007SLori.Alt@Sun.COM * data from the stream to fulfill this write. 115111007SLori.Alt@Sun.COM */ 115211007SLori.Alt@Sun.COM static int 115311007SLori.Alt@Sun.COM restore_write_byref(struct restorearg *ra, objset_t *os, 115411007SLori.Alt@Sun.COM struct drr_write_byref *drrwbr) 115511007SLori.Alt@Sun.COM { 115611007SLori.Alt@Sun.COM dmu_tx_t *tx; 115711007SLori.Alt@Sun.COM int err; 115811007SLori.Alt@Sun.COM guid_map_entry_t gmesrch; 115911007SLori.Alt@Sun.COM guid_map_entry_t *gmep; 116011007SLori.Alt@Sun.COM avl_index_t where; 116111007SLori.Alt@Sun.COM objset_t *ref_os = NULL; 116211007SLori.Alt@Sun.COM dmu_buf_t *dbp; 116311007SLori.Alt@Sun.COM 116411007SLori.Alt@Sun.COM if (drrwbr->drr_offset + drrwbr->drr_length < drrwbr->drr_offset) 116511007SLori.Alt@Sun.COM return (EINVAL); 116611007SLori.Alt@Sun.COM 116711007SLori.Alt@Sun.COM /* 116811007SLori.Alt@Sun.COM * If the GUID of the referenced dataset is different from the 116911007SLori.Alt@Sun.COM * GUID of the target dataset, find the referenced dataset. 117011007SLori.Alt@Sun.COM */ 117111007SLori.Alt@Sun.COM if (drrwbr->drr_toguid != drrwbr->drr_refguid) { 117211007SLori.Alt@Sun.COM gmesrch.guid = drrwbr->drr_refguid; 117311007SLori.Alt@Sun.COM if ((gmep = avl_find(&ra->guid_to_ds_map, &gmesrch, 117411007SLori.Alt@Sun.COM &where)) == NULL) { 117511007SLori.Alt@Sun.COM return (EINVAL); 117611007SLori.Alt@Sun.COM } 117711007SLori.Alt@Sun.COM if (dmu_objset_from_ds(gmep->gme_ds, &ref_os)) 117811007SLori.Alt@Sun.COM return (EINVAL); 117911007SLori.Alt@Sun.COM } else { 118011007SLori.Alt@Sun.COM ref_os = os; 118111007SLori.Alt@Sun.COM } 118211007SLori.Alt@Sun.COM 118311007SLori.Alt@Sun.COM if (err = dmu_buf_hold(ref_os, drrwbr->drr_refobject, 1184*12285SJeff.Bonwick@Sun.COM drrwbr->drr_refoffset, FTAG, &dbp, DMU_READ_PREFETCH)) 118511007SLori.Alt@Sun.COM return (err); 118611007SLori.Alt@Sun.COM 118711007SLori.Alt@Sun.COM tx = dmu_tx_create(os); 118811007SLori.Alt@Sun.COM 118911007SLori.Alt@Sun.COM dmu_tx_hold_write(tx, drrwbr->drr_object, 119011007SLori.Alt@Sun.COM drrwbr->drr_offset, drrwbr->drr_length); 119111007SLori.Alt@Sun.COM err = dmu_tx_assign(tx, TXG_WAIT); 119211007SLori.Alt@Sun.COM if (err) { 119311007SLori.Alt@Sun.COM dmu_tx_abort(tx); 119411007SLori.Alt@Sun.COM return (err); 119511007SLori.Alt@Sun.COM } 119611007SLori.Alt@Sun.COM dmu_write(os, drrwbr->drr_object, 119711007SLori.Alt@Sun.COM drrwbr->drr_offset, drrwbr->drr_length, dbp->db_data, tx); 119811007SLori.Alt@Sun.COM dmu_buf_rele(dbp, FTAG); 119911007SLori.Alt@Sun.COM dmu_tx_commit(tx); 120011007SLori.Alt@Sun.COM return (0); 120111007SLori.Alt@Sun.COM } 120211007SLori.Alt@Sun.COM 120311935SMark.Shellenbaum@Sun.COM static int 120411935SMark.Shellenbaum@Sun.COM restore_spill(struct restorearg *ra, objset_t *os, struct drr_spill *drrs) 120511935SMark.Shellenbaum@Sun.COM { 120611935SMark.Shellenbaum@Sun.COM dmu_tx_t *tx; 120711935SMark.Shellenbaum@Sun.COM void *data; 120811935SMark.Shellenbaum@Sun.COM dmu_buf_t *db, *db_spill; 120911935SMark.Shellenbaum@Sun.COM int err; 121011935SMark.Shellenbaum@Sun.COM 121111935SMark.Shellenbaum@Sun.COM if (drrs->drr_length < SPA_MINBLOCKSIZE || 121211935SMark.Shellenbaum@Sun.COM drrs->drr_length > SPA_MAXBLOCKSIZE) 121311935SMark.Shellenbaum@Sun.COM return (EINVAL); 121411935SMark.Shellenbaum@Sun.COM 121511935SMark.Shellenbaum@Sun.COM data = restore_read(ra, drrs->drr_length); 121611935SMark.Shellenbaum@Sun.COM if (data == NULL) 121711935SMark.Shellenbaum@Sun.COM return (ra->err); 121811935SMark.Shellenbaum@Sun.COM 121911935SMark.Shellenbaum@Sun.COM if (dmu_object_info(os, drrs->drr_object, NULL) != 0) 122011935SMark.Shellenbaum@Sun.COM return (EINVAL); 122111935SMark.Shellenbaum@Sun.COM 122211935SMark.Shellenbaum@Sun.COM VERIFY(0 == dmu_bonus_hold(os, drrs->drr_object, FTAG, &db)); 122311935SMark.Shellenbaum@Sun.COM if ((err = dmu_spill_hold_by_bonus(db, FTAG, &db_spill)) != 0) { 122411935SMark.Shellenbaum@Sun.COM dmu_buf_rele(db, FTAG); 122511935SMark.Shellenbaum@Sun.COM return (err); 122611935SMark.Shellenbaum@Sun.COM } 122711935SMark.Shellenbaum@Sun.COM 122811935SMark.Shellenbaum@Sun.COM tx = dmu_tx_create(os); 122911935SMark.Shellenbaum@Sun.COM 123011935SMark.Shellenbaum@Sun.COM dmu_tx_hold_spill(tx, db->db_object); 123111935SMark.Shellenbaum@Sun.COM 123211935SMark.Shellenbaum@Sun.COM err = dmu_tx_assign(tx, TXG_WAIT); 123311935SMark.Shellenbaum@Sun.COM if (err) { 123411935SMark.Shellenbaum@Sun.COM dmu_buf_rele(db, FTAG); 123511935SMark.Shellenbaum@Sun.COM dmu_buf_rele(db_spill, FTAG); 123611935SMark.Shellenbaum@Sun.COM dmu_tx_abort(tx); 123711935SMark.Shellenbaum@Sun.COM return (err); 123811935SMark.Shellenbaum@Sun.COM } 123911935SMark.Shellenbaum@Sun.COM dmu_buf_will_dirty(db_spill, tx); 124011935SMark.Shellenbaum@Sun.COM 124111935SMark.Shellenbaum@Sun.COM if (db_spill->db_size < drrs->drr_length) 124211935SMark.Shellenbaum@Sun.COM VERIFY(0 == dbuf_spill_set_blksz(db_spill, 124311935SMark.Shellenbaum@Sun.COM drrs->drr_length, tx)); 124411935SMark.Shellenbaum@Sun.COM bcopy(data, db_spill->db_data, drrs->drr_length); 124511935SMark.Shellenbaum@Sun.COM 124611935SMark.Shellenbaum@Sun.COM dmu_buf_rele(db, FTAG); 124711935SMark.Shellenbaum@Sun.COM dmu_buf_rele(db_spill, FTAG); 124811935SMark.Shellenbaum@Sun.COM 124911935SMark.Shellenbaum@Sun.COM dmu_tx_commit(tx); 125011935SMark.Shellenbaum@Sun.COM return (0); 125111935SMark.Shellenbaum@Sun.COM } 125211935SMark.Shellenbaum@Sun.COM 12532743Sahrens /* ARGSUSED */ 12542743Sahrens static int 12552743Sahrens restore_free(struct restorearg *ra, objset_t *os, 12562743Sahrens struct drr_free *drrf) 12572743Sahrens { 12582743Sahrens int err; 12592743Sahrens 12602743Sahrens if (drrf->drr_length != -1ULL && 12612743Sahrens drrf->drr_offset + drrf->drr_length < drrf->drr_offset) 12622743Sahrens return (EINVAL); 12632743Sahrens 12642743Sahrens if (dmu_object_info(os, drrf->drr_object, NULL) != 0) 12652743Sahrens return (EINVAL); 12662743Sahrens 12676992Smaybee err = dmu_free_long_range(os, drrf->drr_object, 12682743Sahrens drrf->drr_offset, drrf->drr_length); 12692743Sahrens return (err); 12702743Sahrens } 12712743Sahrens 12725367Sahrens /* 12735367Sahrens * NB: callers *must* call dmu_recv_end() if this succeeds. 12745367Sahrens */ 12755367Sahrens int 12765367Sahrens dmu_recv_stream(dmu_recv_cookie_t *drc, vnode_t *vp, offset_t *voffp) 12775367Sahrens { 12785367Sahrens struct restorearg ra = { 0 }; 12795367Sahrens dmu_replay_record_t *drr; 12805367Sahrens objset_t *os; 12815367Sahrens zio_cksum_t pcksum; 128211007SLori.Alt@Sun.COM guid_map_entry_t *gmep; 128311007SLori.Alt@Sun.COM int featureflags; 12845367Sahrens 12855367Sahrens if (drc->drc_drrb->drr_magic == BSWAP_64(DMU_BACKUP_MAGIC)) 12865367Sahrens ra.byteswap = TRUE; 12872743Sahrens 12885367Sahrens { 12895367Sahrens /* compute checksum of drr_begin record */ 12905367Sahrens dmu_replay_record_t *drr; 12915367Sahrens drr = kmem_zalloc(sizeof (dmu_replay_record_t), KM_SLEEP); 12925367Sahrens 12935367Sahrens drr->drr_type = DRR_BEGIN; 12945367Sahrens drr->drr_u.drr_begin = *drc->drc_drrb; 12955367Sahrens if (ra.byteswap) { 12965367Sahrens fletcher_4_incremental_byteswap(drr, 12975367Sahrens sizeof (dmu_replay_record_t), &ra.cksum); 12985367Sahrens } else { 12995367Sahrens fletcher_4_incremental_native(drr, 13005367Sahrens sizeof (dmu_replay_record_t), &ra.cksum); 13015367Sahrens } 13025367Sahrens kmem_free(drr, sizeof (dmu_replay_record_t)); 13032743Sahrens } 13042743Sahrens 13052743Sahrens if (ra.byteswap) { 13065367Sahrens struct drr_begin *drrb = drc->drc_drrb; 13072743Sahrens drrb->drr_magic = BSWAP_64(drrb->drr_magic); 130811007SLori.Alt@Sun.COM drrb->drr_versioninfo = BSWAP_64(drrb->drr_versioninfo); 13092743Sahrens drrb->drr_creation_time = BSWAP_64(drrb->drr_creation_time); 13102743Sahrens drrb->drr_type = BSWAP_32(drrb->drr_type); 13112743Sahrens drrb->drr_toguid = BSWAP_64(drrb->drr_toguid); 13122743Sahrens drrb->drr_fromguid = BSWAP_64(drrb->drr_fromguid); 13132743Sahrens } 13142743Sahrens 13155367Sahrens ra.vp = vp; 13165367Sahrens ra.voff = *voffp; 13175367Sahrens ra.bufsize = 1<<20; 13185367Sahrens ra.buf = kmem_alloc(ra.bufsize, KM_SLEEP); 13195326Sek110237 13205367Sahrens /* these were verified in dmu_recv_begin */ 132111007SLori.Alt@Sun.COM ASSERT(DMU_GET_STREAM_HDRTYPE(drc->drc_drrb->drr_versioninfo) == 132211007SLori.Alt@Sun.COM DMU_SUBSTREAM); 13235367Sahrens ASSERT(drc->drc_drrb->drr_type < DMU_OST_NUMTYPES); 13242743Sahrens 13252743Sahrens /* 13262743Sahrens * Open the objset we are modifying. 13272743Sahrens */ 132810298SMatthew.Ahrens@Sun.COM VERIFY(dmu_objset_from_ds(drc->drc_real_ds, &os) == 0); 13292743Sahrens 13305367Sahrens ASSERT(drc->drc_real_ds->ds_phys->ds_flags & DS_FLAG_INCONSISTENT); 13312743Sahrens 133211007SLori.Alt@Sun.COM featureflags = DMU_GET_FEATUREFLAGS(drc->drc_drrb->drr_versioninfo); 133311007SLori.Alt@Sun.COM 133411007SLori.Alt@Sun.COM /* if this stream is dedup'ed, set up the avl tree for guid mapping */ 133511007SLori.Alt@Sun.COM if (featureflags & DMU_BACKUP_FEATURE_DEDUP) { 133611007SLori.Alt@Sun.COM avl_create(&ra.guid_to_ds_map, guid_compare, 133711007SLori.Alt@Sun.COM sizeof (guid_map_entry_t), 133811007SLori.Alt@Sun.COM offsetof(guid_map_entry_t, avlnode)); 133911007SLori.Alt@Sun.COM (void) dmu_objset_find(drc->drc_top_ds, find_ds_by_guid, 134011007SLori.Alt@Sun.COM (void *)&ra.guid_to_ds_map, 134111007SLori.Alt@Sun.COM DS_FIND_CHILDREN); 134211007SLori.Alt@Sun.COM } 134311007SLori.Alt@Sun.COM 13442743Sahrens /* 13452743Sahrens * Read records and process them. 13462743Sahrens */ 13475367Sahrens pcksum = ra.cksum; 13482743Sahrens while (ra.err == 0 && 13492743Sahrens NULL != (drr = restore_read(&ra, sizeof (*drr)))) { 13502743Sahrens if (issig(JUSTLOOKING) && issig(FORREAL)) { 13512743Sahrens ra.err = EINTR; 13522743Sahrens goto out; 13532743Sahrens } 13542743Sahrens 13552743Sahrens if (ra.byteswap) 13562743Sahrens backup_byteswap(drr); 13572743Sahrens 13582743Sahrens switch (drr->drr_type) { 13592743Sahrens case DRR_OBJECT: 13602743Sahrens { 13612743Sahrens /* 13622743Sahrens * We need to make a copy of the record header, 13632743Sahrens * because restore_{object,write} may need to 13642743Sahrens * restore_read(), which will invalidate drr. 13652743Sahrens */ 13662743Sahrens struct drr_object drro = drr->drr_u.drr_object; 13672743Sahrens ra.err = restore_object(&ra, os, &drro); 13682743Sahrens break; 13692743Sahrens } 13702743Sahrens case DRR_FREEOBJECTS: 13712743Sahrens { 13722743Sahrens struct drr_freeobjects drrfo = 13732743Sahrens drr->drr_u.drr_freeobjects; 13742743Sahrens ra.err = restore_freeobjects(&ra, os, &drrfo); 13752743Sahrens break; 13762743Sahrens } 13772743Sahrens case DRR_WRITE: 13782743Sahrens { 13792743Sahrens struct drr_write drrw = drr->drr_u.drr_write; 13802743Sahrens ra.err = restore_write(&ra, os, &drrw); 13812743Sahrens break; 13822743Sahrens } 138311007SLori.Alt@Sun.COM case DRR_WRITE_BYREF: 138411007SLori.Alt@Sun.COM { 138511007SLori.Alt@Sun.COM struct drr_write_byref drrwbr = 138611007SLori.Alt@Sun.COM drr->drr_u.drr_write_byref; 138711007SLori.Alt@Sun.COM ra.err = restore_write_byref(&ra, os, &drrwbr); 138811007SLori.Alt@Sun.COM break; 138911007SLori.Alt@Sun.COM } 13902743Sahrens case DRR_FREE: 13912743Sahrens { 13922743Sahrens struct drr_free drrf = drr->drr_u.drr_free; 13932743Sahrens ra.err = restore_free(&ra, os, &drrf); 13942743Sahrens break; 13952743Sahrens } 13962743Sahrens case DRR_END: 13972743Sahrens { 13982743Sahrens struct drr_end drre = drr->drr_u.drr_end; 13992743Sahrens /* 14002743Sahrens * We compare against the *previous* checksum 14012743Sahrens * value, because the stored checksum is of 14022743Sahrens * everything before the DRR_END record. 14032743Sahrens */ 14046479Sahrens if (!ZIO_CHECKSUM_EQUAL(drre.drr_checksum, pcksum)) 14052743Sahrens ra.err = ECKSUM; 14062743Sahrens goto out; 14072743Sahrens } 140811935SMark.Shellenbaum@Sun.COM case DRR_SPILL: 140911935SMark.Shellenbaum@Sun.COM { 141011935SMark.Shellenbaum@Sun.COM struct drr_spill drrs = drr->drr_u.drr_spill; 141111935SMark.Shellenbaum@Sun.COM ra.err = restore_spill(&ra, os, &drrs); 141211935SMark.Shellenbaum@Sun.COM break; 141311935SMark.Shellenbaum@Sun.COM } 14142743Sahrens default: 14152743Sahrens ra.err = EINVAL; 14162743Sahrens goto out; 14172743Sahrens } 14185367Sahrens pcksum = ra.cksum; 14192743Sahrens } 14206479Sahrens ASSERT(ra.err != 0); 14212743Sahrens 14222743Sahrens out: 14235367Sahrens if (ra.err != 0) { 14242743Sahrens /* 142510204SMatthew.Ahrens@Sun.COM * destroy what we created, so we don't leave it in the 142610204SMatthew.Ahrens@Sun.COM * inconsistent restoring state. 14272743Sahrens */ 14285367Sahrens txg_wait_synced(drc->drc_real_ds->ds_dir->dd_pool, 0); 142910204SMatthew.Ahrens@Sun.COM 143010242Schris.kirby@sun.com (void) dsl_dataset_destroy(drc->drc_real_ds, dmu_recv_tag, 143110242Schris.kirby@sun.com B_FALSE); 143210204SMatthew.Ahrens@Sun.COM if (drc->drc_real_ds != drc->drc_logical_ds) { 143310204SMatthew.Ahrens@Sun.COM mutex_exit(&drc->drc_logical_ds->ds_recvlock); 143410204SMatthew.Ahrens@Sun.COM dsl_dataset_rele(drc->drc_logical_ds, dmu_recv_tag); 143510204SMatthew.Ahrens@Sun.COM } 14362743Sahrens } 14372743Sahrens 143811007SLori.Alt@Sun.COM if (featureflags & DMU_BACKUP_FEATURE_DEDUP) { 143911007SLori.Alt@Sun.COM void *cookie = NULL; 144011007SLori.Alt@Sun.COM 144111007SLori.Alt@Sun.COM while (gmep = avl_destroy_nodes(&ra.guid_to_ds_map, &cookie)) { 144211007SLori.Alt@Sun.COM dsl_dataset_rele(gmep->gme_ds, &ra.guid_to_ds_map); 144311007SLori.Alt@Sun.COM kmem_free(gmep, sizeof (guid_map_entry_t)); 144411007SLori.Alt@Sun.COM } 144511007SLori.Alt@Sun.COM avl_destroy(&ra.guid_to_ds_map); 144611007SLori.Alt@Sun.COM } 144711007SLori.Alt@Sun.COM 14482743Sahrens kmem_free(ra.buf, ra.bufsize); 14495367Sahrens *voffp = ra.voff; 14502743Sahrens return (ra.err); 14512743Sahrens } 14525326Sek110237 14535367Sahrens struct recvendsyncarg { 14545367Sahrens char *tosnap; 14555367Sahrens uint64_t creation_time; 14565367Sahrens uint64_t toguid; 14575367Sahrens }; 14585367Sahrens 14595367Sahrens static int 14605367Sahrens recv_end_check(void *arg1, void *arg2, dmu_tx_t *tx) 14615367Sahrens { 14625367Sahrens dsl_dataset_t *ds = arg1; 14635367Sahrens struct recvendsyncarg *resa = arg2; 14645367Sahrens 14655367Sahrens return (dsl_dataset_snapshot_check(ds, resa->tosnap, tx)); 14665367Sahrens } 14675367Sahrens 14685367Sahrens static void 14695367Sahrens recv_end_sync(void *arg1, void *arg2, cred_t *cr, dmu_tx_t *tx) 14705326Sek110237 { 14715367Sahrens dsl_dataset_t *ds = arg1; 14725367Sahrens struct recvendsyncarg *resa = arg2; 14735367Sahrens 14745367Sahrens dsl_dataset_snapshot_sync(ds, resa->tosnap, cr, tx); 14755367Sahrens 14765367Sahrens /* set snapshot's creation time and guid */ 14775367Sahrens dmu_buf_will_dirty(ds->ds_prev->ds_dbuf, tx); 14785367Sahrens ds->ds_prev->ds_phys->ds_creation_time = resa->creation_time; 14795367Sahrens ds->ds_prev->ds_phys->ds_guid = resa->toguid; 14805367Sahrens ds->ds_prev->ds_phys->ds_flags &= ~DS_FLAG_INCONSISTENT; 14815367Sahrens 14825367Sahrens dmu_buf_will_dirty(ds->ds_dbuf, tx); 14835367Sahrens ds->ds_phys->ds_flags &= ~DS_FLAG_INCONSISTENT; 14845367Sahrens } 14855367Sahrens 148610272SMatthew.Ahrens@Sun.COM static int 148710272SMatthew.Ahrens@Sun.COM dmu_recv_existing_end(dmu_recv_cookie_t *drc) 14885367Sahrens { 14896689Smaybee struct recvendsyncarg resa; 14906689Smaybee dsl_dataset_t *ds = drc->drc_logical_ds; 14916689Smaybee int err; 14925367Sahrens 14935367Sahrens /* 149410272SMatthew.Ahrens@Sun.COM * XXX hack; seems the ds is still dirty and dsl_pool_zil_clean() 149510272SMatthew.Ahrens@Sun.COM * expects it to have a ds_user_ptr (and zil), but clone_swap() 149610272SMatthew.Ahrens@Sun.COM * can close it. 14975367Sahrens */ 14986689Smaybee txg_wait_synced(ds->ds_dir->dd_pool, 0); 14995326Sek110237 150010272SMatthew.Ahrens@Sun.COM if (dsl_dataset_tryown(ds, FALSE, dmu_recv_tag)) { 150110272SMatthew.Ahrens@Sun.COM err = dsl_dataset_clone_swap(drc->drc_real_ds, ds, 150210272SMatthew.Ahrens@Sun.COM drc->drc_force); 150310272SMatthew.Ahrens@Sun.COM if (err) 150410272SMatthew.Ahrens@Sun.COM goto out; 150510272SMatthew.Ahrens@Sun.COM } else { 150610272SMatthew.Ahrens@Sun.COM mutex_exit(&ds->ds_recvlock); 150710272SMatthew.Ahrens@Sun.COM dsl_dataset_rele(ds, dmu_recv_tag); 150810242Schris.kirby@sun.com (void) dsl_dataset_destroy(drc->drc_real_ds, dmu_recv_tag, 150910242Schris.kirby@sun.com B_FALSE); 151010272SMatthew.Ahrens@Sun.COM return (EBUSY); 15115367Sahrens } 15125367Sahrens 15136689Smaybee resa.creation_time = drc->drc_drrb->drr_creation_time; 15146689Smaybee resa.toguid = drc->drc_drrb->drr_toguid; 15156689Smaybee resa.tosnap = drc->drc_tosnap; 15166689Smaybee 15176689Smaybee err = dsl_sync_task_do(ds->ds_dir->dd_pool, 15186689Smaybee recv_end_check, recv_end_sync, ds, &resa, 3); 15196689Smaybee if (err) { 152010272SMatthew.Ahrens@Sun.COM /* swap back */ 152110272SMatthew.Ahrens@Sun.COM (void) dsl_dataset_clone_swap(drc->drc_real_ds, ds, B_TRUE); 15225367Sahrens } 15235367Sahrens 152410272SMatthew.Ahrens@Sun.COM out: 152510272SMatthew.Ahrens@Sun.COM mutex_exit(&ds->ds_recvlock); 15266689Smaybee dsl_dataset_disown(ds, dmu_recv_tag); 152710272SMatthew.Ahrens@Sun.COM (void) dsl_dataset_destroy(drc->drc_real_ds, dmu_recv_tag, B_FALSE); 15285326Sek110237 return (err); 15295326Sek110237 } 153010272SMatthew.Ahrens@Sun.COM 153110272SMatthew.Ahrens@Sun.COM static int 153210272SMatthew.Ahrens@Sun.COM dmu_recv_new_end(dmu_recv_cookie_t *drc) 153310272SMatthew.Ahrens@Sun.COM { 153410272SMatthew.Ahrens@Sun.COM struct recvendsyncarg resa; 153510272SMatthew.Ahrens@Sun.COM dsl_dataset_t *ds = drc->drc_logical_ds; 153610272SMatthew.Ahrens@Sun.COM int err; 153710272SMatthew.Ahrens@Sun.COM 153810272SMatthew.Ahrens@Sun.COM /* 153910272SMatthew.Ahrens@Sun.COM * XXX hack; seems the ds is still dirty and dsl_pool_zil_clean() 154010272SMatthew.Ahrens@Sun.COM * expects it to have a ds_user_ptr (and zil), but clone_swap() 154110272SMatthew.Ahrens@Sun.COM * can close it. 154210272SMatthew.Ahrens@Sun.COM */ 154310272SMatthew.Ahrens@Sun.COM txg_wait_synced(ds->ds_dir->dd_pool, 0); 154410272SMatthew.Ahrens@Sun.COM 154510272SMatthew.Ahrens@Sun.COM resa.creation_time = drc->drc_drrb->drr_creation_time; 154610272SMatthew.Ahrens@Sun.COM resa.toguid = drc->drc_drrb->drr_toguid; 154710272SMatthew.Ahrens@Sun.COM resa.tosnap = drc->drc_tosnap; 154810272SMatthew.Ahrens@Sun.COM 154910272SMatthew.Ahrens@Sun.COM err = dsl_sync_task_do(ds->ds_dir->dd_pool, 155010272SMatthew.Ahrens@Sun.COM recv_end_check, recv_end_sync, ds, &resa, 3); 155110272SMatthew.Ahrens@Sun.COM if (err) { 155210272SMatthew.Ahrens@Sun.COM /* clean up the fs we just recv'd into */ 155310272SMatthew.Ahrens@Sun.COM (void) dsl_dataset_destroy(ds, dmu_recv_tag, B_FALSE); 155410272SMatthew.Ahrens@Sun.COM } else { 155510272SMatthew.Ahrens@Sun.COM /* release the hold from dmu_recv_begin */ 155610272SMatthew.Ahrens@Sun.COM dsl_dataset_disown(ds, dmu_recv_tag); 155710272SMatthew.Ahrens@Sun.COM } 155810272SMatthew.Ahrens@Sun.COM return (err); 155910272SMatthew.Ahrens@Sun.COM } 156010272SMatthew.Ahrens@Sun.COM 156110272SMatthew.Ahrens@Sun.COM int 156210272SMatthew.Ahrens@Sun.COM dmu_recv_end(dmu_recv_cookie_t *drc) 156310272SMatthew.Ahrens@Sun.COM { 156410272SMatthew.Ahrens@Sun.COM if (drc->drc_logical_ds != drc->drc_real_ds) 156510272SMatthew.Ahrens@Sun.COM return (dmu_recv_existing_end(drc)); 156610272SMatthew.Ahrens@Sun.COM else 156710272SMatthew.Ahrens@Sun.COM return (dmu_recv_new_end(drc)); 156810272SMatthew.Ahrens@Sun.COM } 1569