15367Sahrens /* 25367Sahrens * CDDL HEADER START 35367Sahrens * 45367Sahrens * The contents of this file are subject to the terms of the 55367Sahrens * Common Development and Distribution License (the "License"). 65367Sahrens * You may not use this file except in compliance with the License. 75367Sahrens * 85367Sahrens * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE 95367Sahrens * or http://www.opensolaris.org/os/licensing. 105367Sahrens * See the License for the specific language governing permissions 115367Sahrens * and limitations under the License. 125367Sahrens * 135367Sahrens * When distributing Covered Code, include this CDDL HEADER in each 145367Sahrens * file and include the License file at usr/src/OPENSOLARIS.LICENSE. 155367Sahrens * If applicable, add the following below this CDDL HEADER, with the 165367Sahrens * fields enclosed by brackets "[]" replaced with your own identifying 175367Sahrens * information: Portions Copyright [yyyy] [name of copyright owner] 185367Sahrens * 195367Sahrens * CDDL HEADER END 205367Sahrens */ 215367Sahrens 225367Sahrens /* 2311461STom.Erickson@Sun.COM * Copyright 2010 Sun Microsystems, Inc. All rights reserved. 245367Sahrens * Use is subject to license terms. 
255367Sahrens */ 265367Sahrens 275367Sahrens #include <assert.h> 285367Sahrens #include <ctype.h> 295367Sahrens #include <errno.h> 305367Sahrens #include <libintl.h> 315367Sahrens #include <stdio.h> 325367Sahrens #include <stdlib.h> 335367Sahrens #include <strings.h> 345367Sahrens #include <unistd.h> 355367Sahrens #include <stddef.h> 365367Sahrens #include <fcntl.h> 375367Sahrens #include <sys/mount.h> 3811007SLori.Alt@Sun.COM #include <pthread.h> 3911007SLori.Alt@Sun.COM #include <umem.h> 405367Sahrens 415367Sahrens #include <libzfs.h> 425367Sahrens 435367Sahrens #include "zfs_namecheck.h" 445367Sahrens #include "zfs_prop.h" 4510602SLori.Alt@Sun.COM #include "zfs_fletcher.h" 465367Sahrens #include "libzfs_impl.h" 4711007SLori.Alt@Sun.COM #include <sha2.h> 4811381SLori.Alt@Sun.COM #include <sys/zio_checksum.h> 4911381SLori.Alt@Sun.COM #include <sys/ddt.h> 505367Sahrens 5111022STom.Erickson@Sun.COM /* in libzfs_dataset.c */ 5211022STom.Erickson@Sun.COM extern void zfs_setprop_error(libzfs_handle_t *, zfs_prop_t, int, char *); 5311022STom.Erickson@Sun.COM 547366STim.Haley@Sun.COM static int zfs_receive_impl(libzfs_handle_t *, const char *, recvflags_t, 557366STim.Haley@Sun.COM int, avl_tree_t *, char **); 567366STim.Haley@Sun.COM 5711007SLori.Alt@Sun.COM static const zio_cksum_t zero_cksum = { 0 }; 5811007SLori.Alt@Sun.COM 5911007SLori.Alt@Sun.COM typedef struct dedup_arg { 6011007SLori.Alt@Sun.COM int inputfd; 6111007SLori.Alt@Sun.COM int outputfd; 6211007SLori.Alt@Sun.COM libzfs_handle_t *dedup_hdl; 6311007SLori.Alt@Sun.COM } dedup_arg_t; 6411007SLori.Alt@Sun.COM 6511007SLori.Alt@Sun.COM typedef struct dataref { 6611007SLori.Alt@Sun.COM uint64_t ref_guid; 6711007SLori.Alt@Sun.COM uint64_t ref_object; 6811007SLori.Alt@Sun.COM uint64_t ref_offset; 6911007SLori.Alt@Sun.COM } dataref_t; 7011007SLori.Alt@Sun.COM 7111007SLori.Alt@Sun.COM typedef struct dedup_entry { 7211007SLori.Alt@Sun.COM struct dedup_entry *dde_next; 7311007SLori.Alt@Sun.COM zio_cksum_t dde_chksum; 
7411381SLori.Alt@Sun.COM uint64_t dde_prop; 7511007SLori.Alt@Sun.COM dataref_t dde_ref; 7611007SLori.Alt@Sun.COM } dedup_entry_t; 7711007SLori.Alt@Sun.COM 7811007SLori.Alt@Sun.COM #define MAX_DDT_PHYSMEM_PERCENT 20 7911007SLori.Alt@Sun.COM #define SMALLEST_POSSIBLE_MAX_DDT_MB 128 8011007SLori.Alt@Sun.COM 8111007SLori.Alt@Sun.COM typedef struct dedup_table { 8211007SLori.Alt@Sun.COM dedup_entry_t **dedup_hash_array; 8311007SLori.Alt@Sun.COM umem_cache_t *ddecache; 8411007SLori.Alt@Sun.COM uint64_t max_ddt_size; /* max dedup table size in bytes */ 8511007SLori.Alt@Sun.COM uint64_t cur_ddt_size; /* current dedup table size in bytes */ 8611007SLori.Alt@Sun.COM uint64_t ddt_count; 8711007SLori.Alt@Sun.COM int numhashbits; 8811007SLori.Alt@Sun.COM boolean_t ddt_full; 8911007SLori.Alt@Sun.COM } dedup_table_t; 9011007SLori.Alt@Sun.COM 9111007SLori.Alt@Sun.COM static int 9211007SLori.Alt@Sun.COM high_order_bit(uint64_t n) 9311007SLori.Alt@Sun.COM { 9411007SLori.Alt@Sun.COM int count; 9511007SLori.Alt@Sun.COM 9611007SLori.Alt@Sun.COM for (count = 0; n != 0; count++) 9711007SLori.Alt@Sun.COM n >>= 1; 9811007SLori.Alt@Sun.COM return (count); 9911007SLori.Alt@Sun.COM } 10011007SLori.Alt@Sun.COM 10111007SLori.Alt@Sun.COM static size_t 10211007SLori.Alt@Sun.COM ssread(void *buf, size_t len, FILE *stream) 10311007SLori.Alt@Sun.COM { 10411007SLori.Alt@Sun.COM size_t outlen; 10511007SLori.Alt@Sun.COM 10611007SLori.Alt@Sun.COM if ((outlen = fread(buf, len, 1, stream)) == 0) 10711007SLori.Alt@Sun.COM return (0); 10811007SLori.Alt@Sun.COM 10911007SLori.Alt@Sun.COM return (outlen); 11011007SLori.Alt@Sun.COM } 11111007SLori.Alt@Sun.COM 11211007SLori.Alt@Sun.COM static void 11311007SLori.Alt@Sun.COM ddt_hash_append(libzfs_handle_t *hdl, dedup_table_t *ddt, dedup_entry_t **ddepp, 11411381SLori.Alt@Sun.COM zio_cksum_t *cs, uint64_t prop, dataref_t *dr) 11511007SLori.Alt@Sun.COM { 11611007SLori.Alt@Sun.COM dedup_entry_t *dde; 11711007SLori.Alt@Sun.COM 11811007SLori.Alt@Sun.COM if 
(ddt->cur_ddt_size >= ddt->max_ddt_size) { 11911007SLori.Alt@Sun.COM if (ddt->ddt_full == B_FALSE) { 12011007SLori.Alt@Sun.COM zfs_error_aux(hdl, dgettext(TEXT_DOMAIN, 12111007SLori.Alt@Sun.COM "Dedup table full. Deduplication will continue " 12211007SLori.Alt@Sun.COM "with existing table entries")); 12311007SLori.Alt@Sun.COM ddt->ddt_full = B_TRUE; 12411007SLori.Alt@Sun.COM } 12511007SLori.Alt@Sun.COM return; 12611007SLori.Alt@Sun.COM } 12711007SLori.Alt@Sun.COM 12811007SLori.Alt@Sun.COM if ((dde = umem_cache_alloc(ddt->ddecache, UMEM_DEFAULT)) 12911007SLori.Alt@Sun.COM != NULL) { 13011007SLori.Alt@Sun.COM assert(*ddepp == NULL); 13111007SLori.Alt@Sun.COM dde->dde_next = NULL; 13211007SLori.Alt@Sun.COM dde->dde_chksum = *cs; 13311381SLori.Alt@Sun.COM dde->dde_prop = prop; 13411007SLori.Alt@Sun.COM dde->dde_ref = *dr; 13511007SLori.Alt@Sun.COM *ddepp = dde; 13611007SLori.Alt@Sun.COM ddt->cur_ddt_size += sizeof (dedup_entry_t); 13711007SLori.Alt@Sun.COM ddt->ddt_count++; 13811007SLori.Alt@Sun.COM } 13911007SLori.Alt@Sun.COM } 14011007SLori.Alt@Sun.COM 14111007SLori.Alt@Sun.COM /* 14211007SLori.Alt@Sun.COM * Using the specified dedup table, do a lookup for an entry with 14311007SLori.Alt@Sun.COM * the checksum cs. If found, return the block's reference info 14411007SLori.Alt@Sun.COM * in *dr. Otherwise, insert a new entry in the dedup table, using 14511007SLori.Alt@Sun.COM * the reference information specified by *dr. 
14611007SLori.Alt@Sun.COM * 14711007SLori.Alt@Sun.COM * return value: true - entry was found 14811007SLori.Alt@Sun.COM * false - entry was not found 14911007SLori.Alt@Sun.COM */ 15011007SLori.Alt@Sun.COM static boolean_t 15111007SLori.Alt@Sun.COM ddt_update(libzfs_handle_t *hdl, dedup_table_t *ddt, zio_cksum_t *cs, 15211381SLori.Alt@Sun.COM uint64_t prop, dataref_t *dr) 15311007SLori.Alt@Sun.COM { 15411007SLori.Alt@Sun.COM uint32_t hashcode; 15511007SLori.Alt@Sun.COM dedup_entry_t **ddepp; 15611007SLori.Alt@Sun.COM 15711007SLori.Alt@Sun.COM hashcode = BF64_GET(cs->zc_word[0], 0, ddt->numhashbits); 15811007SLori.Alt@Sun.COM 15911007SLori.Alt@Sun.COM for (ddepp = &(ddt->dedup_hash_array[hashcode]); *ddepp != NULL; 16011007SLori.Alt@Sun.COM ddepp = &((*ddepp)->dde_next)) { 16111381SLori.Alt@Sun.COM if (ZIO_CHECKSUM_EQUAL(((*ddepp)->dde_chksum), *cs) && 16211381SLori.Alt@Sun.COM (*ddepp)->dde_prop == prop) { 16311007SLori.Alt@Sun.COM *dr = (*ddepp)->dde_ref; 16411007SLori.Alt@Sun.COM return (B_TRUE); 16511007SLori.Alt@Sun.COM } 16611007SLori.Alt@Sun.COM } 16711381SLori.Alt@Sun.COM ddt_hash_append(hdl, ddt, ddepp, cs, prop, dr); 16811007SLori.Alt@Sun.COM return (B_FALSE); 16911007SLori.Alt@Sun.COM } 17011007SLori.Alt@Sun.COM 17111007SLori.Alt@Sun.COM static int 17211007SLori.Alt@Sun.COM cksum_and_write(const void *buf, uint64_t len, zio_cksum_t *zc, int outfd) 17311007SLori.Alt@Sun.COM { 17411007SLori.Alt@Sun.COM fletcher_4_incremental_native(buf, len, zc); 17511007SLori.Alt@Sun.COM return (write(outfd, buf, len)); 17611007SLori.Alt@Sun.COM } 17711007SLori.Alt@Sun.COM 17811007SLori.Alt@Sun.COM /* 17911007SLori.Alt@Sun.COM * This function is started in a separate thread when the dedup option 18011007SLori.Alt@Sun.COM * has been requested. The main send thread determines the list of 18111007SLori.Alt@Sun.COM * snapshots to be included in the send stream and makes the ioctl calls 18211007SLori.Alt@Sun.COM * for each one. 
But instead of having the ioctl send the output to the 18311007SLori.Alt@Sun.COM * the output fd specified by the caller of zfs_send()), the 18411007SLori.Alt@Sun.COM * ioctl is told to direct the output to a pipe, which is read by the 18511007SLori.Alt@Sun.COM * alternate thread running THIS function. This function does the 18611007SLori.Alt@Sun.COM * dedup'ing by: 18711007SLori.Alt@Sun.COM * 1. building a dedup table (the DDT) 18811007SLori.Alt@Sun.COM * 2. doing checksums on each data block and inserting a record in the DDT 18911007SLori.Alt@Sun.COM * 3. looking for matching checksums, and 19011007SLori.Alt@Sun.COM * 4. sending a DRR_WRITE_BYREF record instead of a write record whenever 19111007SLori.Alt@Sun.COM * a duplicate block is found. 19211007SLori.Alt@Sun.COM * The output of this function then goes to the output fd requested 19311007SLori.Alt@Sun.COM * by the caller of zfs_send(). 19411007SLori.Alt@Sun.COM */ 19511007SLori.Alt@Sun.COM static void * 19611007SLori.Alt@Sun.COM cksummer(void *arg) 19711007SLori.Alt@Sun.COM { 19811007SLori.Alt@Sun.COM dedup_arg_t *dda = arg; 19911007SLori.Alt@Sun.COM char *buf = malloc(1<<20); 20011007SLori.Alt@Sun.COM dmu_replay_record_t thedrr; 20111007SLori.Alt@Sun.COM dmu_replay_record_t *drr = &thedrr; 20211007SLori.Alt@Sun.COM struct drr_begin *drrb = &thedrr.drr_u.drr_begin; 20311007SLori.Alt@Sun.COM struct drr_end *drre = &thedrr.drr_u.drr_end; 20411007SLori.Alt@Sun.COM struct drr_object *drro = &thedrr.drr_u.drr_object; 20511007SLori.Alt@Sun.COM struct drr_write *drrw = &thedrr.drr_u.drr_write; 20611007SLori.Alt@Sun.COM FILE *ofp; 20711007SLori.Alt@Sun.COM int outfd; 20811381SLori.Alt@Sun.COM dmu_replay_record_t wbr_drr = {0}; 20911007SLori.Alt@Sun.COM struct drr_write_byref *wbr_drrr = &wbr_drr.drr_u.drr_write_byref; 21011007SLori.Alt@Sun.COM dedup_table_t ddt; 21111007SLori.Alt@Sun.COM zio_cksum_t stream_cksum; 21211007SLori.Alt@Sun.COM uint64_t physmem = sysconf(_SC_PHYS_PAGES) * sysconf(_SC_PAGESIZE); 
21311007SLori.Alt@Sun.COM uint64_t numbuckets; 21411007SLori.Alt@Sun.COM 21511007SLori.Alt@Sun.COM ddt.max_ddt_size = 21611007SLori.Alt@Sun.COM MAX((physmem * MAX_DDT_PHYSMEM_PERCENT)/100, 21711007SLori.Alt@Sun.COM SMALLEST_POSSIBLE_MAX_DDT_MB<<20); 21811007SLori.Alt@Sun.COM 21911007SLori.Alt@Sun.COM numbuckets = ddt.max_ddt_size/(sizeof (dedup_entry_t)); 22011007SLori.Alt@Sun.COM 22111007SLori.Alt@Sun.COM /* 22211007SLori.Alt@Sun.COM * numbuckets must be a power of 2. Increase number to 22311007SLori.Alt@Sun.COM * a power of 2 if necessary. 22411007SLori.Alt@Sun.COM */ 22511007SLori.Alt@Sun.COM if (!ISP2(numbuckets)) 22611007SLori.Alt@Sun.COM numbuckets = 1 << high_order_bit(numbuckets); 22711007SLori.Alt@Sun.COM 22811007SLori.Alt@Sun.COM ddt.dedup_hash_array = calloc(numbuckets, sizeof (dedup_entry_t *)); 22911007SLori.Alt@Sun.COM ddt.ddecache = umem_cache_create("dde", sizeof (dedup_entry_t), 0, 23011007SLori.Alt@Sun.COM NULL, NULL, NULL, NULL, NULL, 0); 23111007SLori.Alt@Sun.COM ddt.cur_ddt_size = numbuckets * sizeof (dedup_entry_t *); 23211007SLori.Alt@Sun.COM ddt.numhashbits = high_order_bit(numbuckets) - 1; 23311007SLori.Alt@Sun.COM ddt.ddt_full = B_FALSE; 23411007SLori.Alt@Sun.COM 23511007SLori.Alt@Sun.COM /* Initialize the write-by-reference block. 
*/ 23611007SLori.Alt@Sun.COM wbr_drr.drr_type = DRR_WRITE_BYREF; 23711007SLori.Alt@Sun.COM wbr_drr.drr_payloadlen = 0; 23811007SLori.Alt@Sun.COM 23911007SLori.Alt@Sun.COM outfd = dda->outputfd; 24011007SLori.Alt@Sun.COM ofp = fdopen(dda->inputfd, "r"); 24111007SLori.Alt@Sun.COM while (ssread(drr, sizeof (dmu_replay_record_t), ofp) != 0) { 24211007SLori.Alt@Sun.COM 24311007SLori.Alt@Sun.COM switch (drr->drr_type) { 24411007SLori.Alt@Sun.COM case DRR_BEGIN: 24511007SLori.Alt@Sun.COM { 24611007SLori.Alt@Sun.COM int fflags; 24711007SLori.Alt@Sun.COM ZIO_SET_CHECKSUM(&stream_cksum, 0, 0, 0, 0); 24811007SLori.Alt@Sun.COM 24911007SLori.Alt@Sun.COM /* set the DEDUP feature flag for this stream */ 25011007SLori.Alt@Sun.COM fflags = DMU_GET_FEATUREFLAGS(drrb->drr_versioninfo); 25111381SLori.Alt@Sun.COM fflags |= (DMU_BACKUP_FEATURE_DEDUP | 25211381SLori.Alt@Sun.COM DMU_BACKUP_FEATURE_DEDUPPROPS); 25311007SLori.Alt@Sun.COM DMU_SET_FEATUREFLAGS(drrb->drr_versioninfo, fflags); 25411007SLori.Alt@Sun.COM 25511007SLori.Alt@Sun.COM if (cksum_and_write(drr, sizeof (dmu_replay_record_t), 25611007SLori.Alt@Sun.COM &stream_cksum, outfd) == -1) 25711007SLori.Alt@Sun.COM goto out; 25811007SLori.Alt@Sun.COM if (DMU_GET_STREAM_HDRTYPE(drrb->drr_versioninfo) == 25911007SLori.Alt@Sun.COM DMU_COMPOUNDSTREAM && drr->drr_payloadlen != 0) { 26011007SLori.Alt@Sun.COM int sz = drr->drr_payloadlen; 26111007SLori.Alt@Sun.COM 26211007SLori.Alt@Sun.COM if (sz > 1<<20) { 26311007SLori.Alt@Sun.COM free(buf); 26411007SLori.Alt@Sun.COM buf = malloc(sz); 26511007SLori.Alt@Sun.COM } 26611007SLori.Alt@Sun.COM (void) ssread(buf, sz, ofp); 26711007SLori.Alt@Sun.COM if (ferror(stdin)) 26811007SLori.Alt@Sun.COM perror("fread"); 26911007SLori.Alt@Sun.COM if (cksum_and_write(buf, sz, &stream_cksum, 27011007SLori.Alt@Sun.COM outfd) == -1) 27111007SLori.Alt@Sun.COM goto out; 27211007SLori.Alt@Sun.COM } 27311007SLori.Alt@Sun.COM break; 27411007SLori.Alt@Sun.COM } 27511007SLori.Alt@Sun.COM 27611007SLori.Alt@Sun.COM 
case DRR_END: 27711007SLori.Alt@Sun.COM { 27811007SLori.Alt@Sun.COM /* use the recalculated checksum */ 27911007SLori.Alt@Sun.COM ZIO_SET_CHECKSUM(&drre->drr_checksum, 28011007SLori.Alt@Sun.COM stream_cksum.zc_word[0], stream_cksum.zc_word[1], 28111007SLori.Alt@Sun.COM stream_cksum.zc_word[2], stream_cksum.zc_word[3]); 28211007SLori.Alt@Sun.COM if ((write(outfd, drr, 28311007SLori.Alt@Sun.COM sizeof (dmu_replay_record_t))) == -1) 28411007SLori.Alt@Sun.COM goto out; 28511007SLori.Alt@Sun.COM break; 28611007SLori.Alt@Sun.COM } 28711007SLori.Alt@Sun.COM 28811007SLori.Alt@Sun.COM case DRR_OBJECT: 28911007SLori.Alt@Sun.COM { 29011007SLori.Alt@Sun.COM if (cksum_and_write(drr, sizeof (dmu_replay_record_t), 29111007SLori.Alt@Sun.COM &stream_cksum, outfd) == -1) 29211007SLori.Alt@Sun.COM goto out; 29311007SLori.Alt@Sun.COM if (drro->drr_bonuslen > 0) { 29411007SLori.Alt@Sun.COM (void) ssread(buf, 29511007SLori.Alt@Sun.COM P2ROUNDUP((uint64_t)drro->drr_bonuslen, 8), 29611007SLori.Alt@Sun.COM ofp); 29711007SLori.Alt@Sun.COM if (cksum_and_write(buf, 29811007SLori.Alt@Sun.COM P2ROUNDUP((uint64_t)drro->drr_bonuslen, 8), 29911007SLori.Alt@Sun.COM &stream_cksum, outfd) == -1) 30011007SLori.Alt@Sun.COM goto out; 30111007SLori.Alt@Sun.COM } 30211007SLori.Alt@Sun.COM break; 30311007SLori.Alt@Sun.COM } 30411007SLori.Alt@Sun.COM 30511007SLori.Alt@Sun.COM case DRR_FREEOBJECTS: 30611007SLori.Alt@Sun.COM { 30711007SLori.Alt@Sun.COM if (cksum_and_write(drr, sizeof (dmu_replay_record_t), 30811007SLori.Alt@Sun.COM &stream_cksum, outfd) == -1) 30911007SLori.Alt@Sun.COM goto out; 31011007SLori.Alt@Sun.COM break; 31111007SLori.Alt@Sun.COM } 31211007SLori.Alt@Sun.COM 31311007SLori.Alt@Sun.COM case DRR_WRITE: 31411007SLori.Alt@Sun.COM { 31511007SLori.Alt@Sun.COM dataref_t dataref; 31611007SLori.Alt@Sun.COM 31711007SLori.Alt@Sun.COM (void) ssread(buf, drrw->drr_length, ofp); 31811381SLori.Alt@Sun.COM 31911007SLori.Alt@Sun.COM /* 32011381SLori.Alt@Sun.COM * Use the existing checksum if it's 
dedup-capable, 32111381SLori.Alt@Sun.COM * else calculate a SHA256 checksum for it. 32211007SLori.Alt@Sun.COM */ 32311381SLori.Alt@Sun.COM 32411381SLori.Alt@Sun.COM if (ZIO_CHECKSUM_EQUAL(drrw->drr_key.ddk_cksum, 32511381SLori.Alt@Sun.COM zero_cksum) || 32611381SLori.Alt@Sun.COM !DRR_IS_DEDUP_CAPABLE(drrw->drr_checksumflags)) { 32711007SLori.Alt@Sun.COM SHA256_CTX ctx; 32811007SLori.Alt@Sun.COM zio_cksum_t tmpsha256; 32911007SLori.Alt@Sun.COM 33011007SLori.Alt@Sun.COM SHA256Init(&ctx); 33111007SLori.Alt@Sun.COM SHA256Update(&ctx, buf, drrw->drr_length); 33211007SLori.Alt@Sun.COM SHA256Final(&tmpsha256, &ctx); 33311381SLori.Alt@Sun.COM drrw->drr_key.ddk_cksum.zc_word[0] = 33411007SLori.Alt@Sun.COM BE_64(tmpsha256.zc_word[0]); 33511381SLori.Alt@Sun.COM drrw->drr_key.ddk_cksum.zc_word[1] = 33611007SLori.Alt@Sun.COM BE_64(tmpsha256.zc_word[1]); 33711381SLori.Alt@Sun.COM drrw->drr_key.ddk_cksum.zc_word[2] = 33811007SLori.Alt@Sun.COM BE_64(tmpsha256.zc_word[2]); 33911381SLori.Alt@Sun.COM drrw->drr_key.ddk_cksum.zc_word[3] = 34011007SLori.Alt@Sun.COM BE_64(tmpsha256.zc_word[3]); 34111381SLori.Alt@Sun.COM drrw->drr_checksumtype = ZIO_CHECKSUM_SHA256; 34211381SLori.Alt@Sun.COM drrw->drr_checksumflags = DRR_CHECKSUM_DEDUP; 34311007SLori.Alt@Sun.COM } 34411007SLori.Alt@Sun.COM 34511007SLori.Alt@Sun.COM dataref.ref_guid = drrw->drr_toguid; 34611007SLori.Alt@Sun.COM dataref.ref_object = drrw->drr_object; 34711007SLori.Alt@Sun.COM dataref.ref_offset = drrw->drr_offset; 34811007SLori.Alt@Sun.COM 34911007SLori.Alt@Sun.COM if (ddt_update(dda->dedup_hdl, &ddt, 35011381SLori.Alt@Sun.COM &drrw->drr_key.ddk_cksum, drrw->drr_key.ddk_prop, 35111381SLori.Alt@Sun.COM &dataref)) { 35211007SLori.Alt@Sun.COM /* block already present in stream */ 35311007SLori.Alt@Sun.COM wbr_drrr->drr_object = drrw->drr_object; 35411007SLori.Alt@Sun.COM wbr_drrr->drr_offset = drrw->drr_offset; 35511007SLori.Alt@Sun.COM wbr_drrr->drr_length = drrw->drr_length; 35611007SLori.Alt@Sun.COM wbr_drrr->drr_toguid = 
drrw->drr_toguid; 35711007SLori.Alt@Sun.COM wbr_drrr->drr_refguid = dataref.ref_guid; 35811007SLori.Alt@Sun.COM wbr_drrr->drr_refobject = 35911007SLori.Alt@Sun.COM dataref.ref_object; 36011007SLori.Alt@Sun.COM wbr_drrr->drr_refoffset = 36111007SLori.Alt@Sun.COM dataref.ref_offset; 36211007SLori.Alt@Sun.COM 36311381SLori.Alt@Sun.COM wbr_drrr->drr_checksumtype = 36411381SLori.Alt@Sun.COM drrw->drr_checksumtype; 36511381SLori.Alt@Sun.COM wbr_drrr->drr_checksumflags = 36611381SLori.Alt@Sun.COM drrw->drr_checksumtype; 36711381SLori.Alt@Sun.COM wbr_drrr->drr_key.ddk_cksum = 36811381SLori.Alt@Sun.COM drrw->drr_key.ddk_cksum; 36911381SLori.Alt@Sun.COM wbr_drrr->drr_key.ddk_prop = 37011381SLori.Alt@Sun.COM drrw->drr_key.ddk_prop; 37111007SLori.Alt@Sun.COM 37211007SLori.Alt@Sun.COM if (cksum_and_write(&wbr_drr, 37311007SLori.Alt@Sun.COM sizeof (dmu_replay_record_t), &stream_cksum, 37411007SLori.Alt@Sun.COM outfd) == -1) 37511007SLori.Alt@Sun.COM goto out; 37611007SLori.Alt@Sun.COM } else { 37711007SLori.Alt@Sun.COM /* block not previously seen */ 37811007SLori.Alt@Sun.COM if (cksum_and_write(drr, 37911007SLori.Alt@Sun.COM sizeof (dmu_replay_record_t), &stream_cksum, 38011007SLori.Alt@Sun.COM outfd) == -1) 38111007SLori.Alt@Sun.COM goto out; 38211007SLori.Alt@Sun.COM if (cksum_and_write(buf, 38311007SLori.Alt@Sun.COM drrw->drr_length, 38411007SLori.Alt@Sun.COM &stream_cksum, outfd) == -1) 38511007SLori.Alt@Sun.COM goto out; 38611007SLori.Alt@Sun.COM } 38711007SLori.Alt@Sun.COM break; 38811007SLori.Alt@Sun.COM } 38911007SLori.Alt@Sun.COM 39011007SLori.Alt@Sun.COM case DRR_FREE: 39111007SLori.Alt@Sun.COM { 39211007SLori.Alt@Sun.COM if (cksum_and_write(drr, sizeof (dmu_replay_record_t), 39311007SLori.Alt@Sun.COM &stream_cksum, outfd) == -1) 39411007SLori.Alt@Sun.COM goto out; 39511007SLori.Alt@Sun.COM break; 39611007SLori.Alt@Sun.COM } 39711007SLori.Alt@Sun.COM 39811007SLori.Alt@Sun.COM default: 39911007SLori.Alt@Sun.COM (void) printf("INVALID record type 0x%x\n", 
40011007SLori.Alt@Sun.COM drr->drr_type); 40111007SLori.Alt@Sun.COM /* should never happen, so assert */ 40211007SLori.Alt@Sun.COM assert(B_FALSE); 40311007SLori.Alt@Sun.COM } 40411007SLori.Alt@Sun.COM } 40511007SLori.Alt@Sun.COM out: 40611007SLori.Alt@Sun.COM umem_cache_destroy(ddt.ddecache); 40711007SLori.Alt@Sun.COM free(ddt.dedup_hash_array); 40811007SLori.Alt@Sun.COM free(buf); 40911007SLori.Alt@Sun.COM (void) fclose(ofp); 41011007SLori.Alt@Sun.COM 41111007SLori.Alt@Sun.COM return (NULL); 41211007SLori.Alt@Sun.COM } 41311007SLori.Alt@Sun.COM 4145367Sahrens /* 4155367Sahrens * Routines for dealing with the AVL tree of fs-nvlists 4165367Sahrens */ 4175367Sahrens typedef struct fsavl_node { 4185367Sahrens avl_node_t fn_node; 4195367Sahrens nvlist_t *fn_nvfs; 4205367Sahrens char *fn_snapname; 4215367Sahrens uint64_t fn_guid; 4225367Sahrens } fsavl_node_t; 4235367Sahrens 4245367Sahrens static int 4255367Sahrens fsavl_compare(const void *arg1, const void *arg2) 4265367Sahrens { 4275367Sahrens const fsavl_node_t *fn1 = arg1; 4285367Sahrens const fsavl_node_t *fn2 = arg2; 4295367Sahrens 4305367Sahrens if (fn1->fn_guid > fn2->fn_guid) 4315367Sahrens return (+1); 4325367Sahrens else if (fn1->fn_guid < fn2->fn_guid) 4335367Sahrens return (-1); 4345367Sahrens else 4355367Sahrens return (0); 4365367Sahrens } 4375367Sahrens 4385367Sahrens /* 4395367Sahrens * Given the GUID of a snapshot, find its containing filesystem and 4405367Sahrens * (optionally) name. 
4415367Sahrens */ 4425367Sahrens static nvlist_t * 4435367Sahrens fsavl_find(avl_tree_t *avl, uint64_t snapguid, char **snapname) 4445367Sahrens { 4455367Sahrens fsavl_node_t fn_find; 4465367Sahrens fsavl_node_t *fn; 4475367Sahrens 4485367Sahrens fn_find.fn_guid = snapguid; 4495367Sahrens 4505367Sahrens fn = avl_find(avl, &fn_find, NULL); 4515367Sahrens if (fn) { 4525367Sahrens if (snapname) 4535367Sahrens *snapname = fn->fn_snapname; 4545367Sahrens return (fn->fn_nvfs); 4555367Sahrens } 4565367Sahrens return (NULL); 4575367Sahrens } 4585367Sahrens 4595896Sahl static void 4605896Sahl fsavl_destroy(avl_tree_t *avl) 4615896Sahl { 4625896Sahl fsavl_node_t *fn; 4635896Sahl void *cookie; 4645896Sahl 4655896Sahl if (avl == NULL) 4665896Sahl return; 4675896Sahl 4685896Sahl cookie = NULL; 4695896Sahl while ((fn = avl_destroy_nodes(avl, &cookie)) != NULL) 4705896Sahl free(fn); 4715896Sahl avl_destroy(avl); 4725896Sahl free(avl); 4735896Sahl } 4745896Sahl 47510200SLori.Alt@Sun.COM /* 47610200SLori.Alt@Sun.COM * Given an nvlist, produce an avl tree of snapshots, ordered by guid 47710200SLori.Alt@Sun.COM */ 4785367Sahrens static avl_tree_t * 4795367Sahrens fsavl_create(nvlist_t *fss) 4805367Sahrens { 4815367Sahrens avl_tree_t *fsavl; 4825367Sahrens nvpair_t *fselem = NULL; 4835367Sahrens 4845896Sahl if ((fsavl = malloc(sizeof (avl_tree_t))) == NULL) 4855896Sahl return (NULL); 4865896Sahl 4875367Sahrens avl_create(fsavl, fsavl_compare, sizeof (fsavl_node_t), 4885367Sahrens offsetof(fsavl_node_t, fn_node)); 4895367Sahrens 4905367Sahrens while ((fselem = nvlist_next_nvpair(fss, fselem)) != NULL) { 4915367Sahrens nvlist_t *nvfs, *snaps; 4925367Sahrens nvpair_t *snapelem = NULL; 4935367Sahrens 4945367Sahrens VERIFY(0 == nvpair_value_nvlist(fselem, &nvfs)); 4955367Sahrens VERIFY(0 == nvlist_lookup_nvlist(nvfs, "snaps", &snaps)); 4965367Sahrens 4975367Sahrens while ((snapelem = 4985367Sahrens nvlist_next_nvpair(snaps, snapelem)) != NULL) { 4995367Sahrens fsavl_node_t *fn; 
5005367Sahrens uint64_t guid; 5015367Sahrens 5025367Sahrens VERIFY(0 == nvpair_value_uint64(snapelem, &guid)); 5035896Sahl if ((fn = malloc(sizeof (fsavl_node_t))) == NULL) { 5045896Sahl fsavl_destroy(fsavl); 5055896Sahl return (NULL); 5065896Sahl } 5075367Sahrens fn->fn_nvfs = nvfs; 5085367Sahrens fn->fn_snapname = nvpair_name(snapelem); 5095367Sahrens fn->fn_guid = guid; 5105367Sahrens 5115367Sahrens /* 5125367Sahrens * Note: if there are multiple snaps with the 5135367Sahrens * same GUID, we ignore all but one. 5145367Sahrens */ 5155367Sahrens if (avl_find(fsavl, fn, NULL) == NULL) 5165367Sahrens avl_add(fsavl, fn); 5175367Sahrens else 5185367Sahrens free(fn); 5195367Sahrens } 5205367Sahrens } 5215367Sahrens 5225367Sahrens return (fsavl); 5235367Sahrens } 5245367Sahrens 5255367Sahrens /* 5265367Sahrens * Routines for dealing with the giant nvlist of fs-nvlists, etc. 5275367Sahrens */ 5285367Sahrens typedef struct send_data { 5295367Sahrens uint64_t parent_fromsnap_guid; 5305367Sahrens nvlist_t *parent_snaps; 5315367Sahrens nvlist_t *fss; 5327265Sahrens nvlist_t *snapprops; 5335367Sahrens const char *fromsnap; 5345367Sahrens const char *tosnap; 53511022STom.Erickson@Sun.COM boolean_t recursive; 5365367Sahrens 5375367Sahrens /* 5385367Sahrens * The header nvlist is of the following format: 5395367Sahrens * { 5405367Sahrens * "tosnap" -> string 5415367Sahrens * "fromsnap" -> string (if incremental) 5425367Sahrens * "fss" -> { 5435367Sahrens * id -> { 5445367Sahrens * 5455367Sahrens * "name" -> string (full name; for debugging) 5465367Sahrens * "parentfromsnap" -> number (guid of fromsnap in parent) 5475367Sahrens * 5485367Sahrens * "props" -> { name -> value (only if set here) } 5495367Sahrens * "snaps" -> { name (lastname) -> number (guid) } 5507265Sahrens * "snapprops" -> { name (lastname) -> { name -> value } } 5515367Sahrens * 5525367Sahrens * "origin" -> number (guid) (if clone) 5535367Sahrens * "sent" -> boolean (not on-disk) 5545367Sahrens * } 5555367Sahrens 
* } 5565367Sahrens * } 5575367Sahrens * 5585367Sahrens */ 5595367Sahrens } send_data_t; 5605367Sahrens 5617265Sahrens static void send_iterate_prop(zfs_handle_t *zhp, nvlist_t *nv); 5627265Sahrens 5635367Sahrens static int 5645367Sahrens send_iterate_snap(zfs_handle_t *zhp, void *arg) 5655367Sahrens { 5665367Sahrens send_data_t *sd = arg; 5675367Sahrens uint64_t guid = zhp->zfs_dmustats.dds_guid; 5685367Sahrens char *snapname; 5697265Sahrens nvlist_t *nv; 5705367Sahrens 5715367Sahrens snapname = strrchr(zhp->zfs_name, '@')+1; 5725367Sahrens 5735367Sahrens VERIFY(0 == nvlist_add_uint64(sd->parent_snaps, snapname, guid)); 5745367Sahrens /* 5755367Sahrens * NB: if there is no fromsnap here (it's a newly created fs in 5765367Sahrens * an incremental replication), we will substitute the tosnap. 5775367Sahrens */ 5785367Sahrens if ((sd->fromsnap && strcmp(snapname, sd->fromsnap) == 0) || 5795367Sahrens (sd->parent_fromsnap_guid == 0 && sd->tosnap && 5805367Sahrens strcmp(snapname, sd->tosnap) == 0)) { 5815367Sahrens sd->parent_fromsnap_guid = guid; 5825367Sahrens } 5835367Sahrens 5847265Sahrens VERIFY(0 == nvlist_alloc(&nv, NV_UNIQUE_NAME, 0)); 5857265Sahrens send_iterate_prop(zhp, nv); 5867265Sahrens VERIFY(0 == nvlist_add_nvlist(sd->snapprops, snapname, nv)); 5877265Sahrens nvlist_free(nv); 5887265Sahrens 5895367Sahrens zfs_close(zhp); 5905367Sahrens return (0); 5915367Sahrens } 5925367Sahrens 5935367Sahrens static void 5945367Sahrens send_iterate_prop(zfs_handle_t *zhp, nvlist_t *nv) 5955367Sahrens { 5965367Sahrens nvpair_t *elem = NULL; 5975367Sahrens 5985367Sahrens while ((elem = nvlist_next_nvpair(zhp->zfs_props, elem)) != NULL) { 5995367Sahrens char *propname = nvpair_name(elem); 6005367Sahrens zfs_prop_t prop = zfs_name_to_prop(propname); 6015367Sahrens nvlist_t *propnv; 6025367Sahrens 60310960SEric.Schrock@Sun.COM if (!zfs_prop_user(propname)) { 60410960SEric.Schrock@Sun.COM /* 60510960SEric.Schrock@Sun.COM * Realistically, this should never happen. 
However, 60610960SEric.Schrock@Sun.COM * we want the ability to add DSL properties without 60710960SEric.Schrock@Sun.COM * needing to make incompatible version changes. We 60810960SEric.Schrock@Sun.COM * need to ignore unknown properties to allow older 60910960SEric.Schrock@Sun.COM * software to still send datasets containing these 61010960SEric.Schrock@Sun.COM * properties, with the unknown properties elided. 61110960SEric.Schrock@Sun.COM */ 61210960SEric.Schrock@Sun.COM if (prop == ZPROP_INVAL) 61310960SEric.Schrock@Sun.COM continue; 6149396SMatthew.Ahrens@Sun.COM 61510960SEric.Schrock@Sun.COM if (zfs_prop_readonly(prop)) 61610960SEric.Schrock@Sun.COM continue; 61710960SEric.Schrock@Sun.COM } 6185367Sahrens 6195367Sahrens verify(nvpair_value_nvlist(elem, &propnv) == 0); 62010195SSanjeev.Bagewadi@Sun.COM if (prop == ZFS_PROP_QUOTA || prop == ZFS_PROP_RESERVATION || 62110195SSanjeev.Bagewadi@Sun.COM prop == ZFS_PROP_REFQUOTA || 62210195SSanjeev.Bagewadi@Sun.COM prop == ZFS_PROP_REFRESERVATION) { 62311022STom.Erickson@Sun.COM char *source; 6245367Sahrens uint64_t value; 6255367Sahrens verify(nvlist_lookup_uint64(propnv, 6265367Sahrens ZPROP_VALUE, &value) == 0); 6277265Sahrens if (zhp->zfs_type == ZFS_TYPE_SNAPSHOT) 6287265Sahrens continue; 62911022STom.Erickson@Sun.COM /* 63011022STom.Erickson@Sun.COM * May have no source before SPA_VERSION_RECVD_PROPS, 63111022STom.Erickson@Sun.COM * but is still modifiable. 
63211022STom.Erickson@Sun.COM */ 63311022STom.Erickson@Sun.COM if (nvlist_lookup_string(propnv, 63411022STom.Erickson@Sun.COM ZPROP_SOURCE, &source) == 0) { 63511022STom.Erickson@Sun.COM if ((strcmp(source, zhp->zfs_name) != 0) && 63611022STom.Erickson@Sun.COM (strcmp(source, 63711022STom.Erickson@Sun.COM ZPROP_SOURCE_VAL_RECVD) != 0)) 63811022STom.Erickson@Sun.COM continue; 63911022STom.Erickson@Sun.COM } 6405367Sahrens } else { 6415367Sahrens char *source; 6425367Sahrens if (nvlist_lookup_string(propnv, 6435367Sahrens ZPROP_SOURCE, &source) != 0) 6445367Sahrens continue; 64511022STom.Erickson@Sun.COM if ((strcmp(source, zhp->zfs_name) != 0) && 64611022STom.Erickson@Sun.COM (strcmp(source, ZPROP_SOURCE_VAL_RECVD) != 0)) 6475367Sahrens continue; 6485367Sahrens } 6495367Sahrens 6505367Sahrens if (zfs_prop_user(propname) || 6515367Sahrens zfs_prop_get_type(prop) == PROP_TYPE_STRING) { 6525367Sahrens char *value; 6535367Sahrens verify(nvlist_lookup_string(propnv, 6545367Sahrens ZPROP_VALUE, &value) == 0); 6555367Sahrens VERIFY(0 == nvlist_add_string(nv, propname, value)); 6565367Sahrens } else { 6575367Sahrens uint64_t value; 6585367Sahrens verify(nvlist_lookup_uint64(propnv, 6595367Sahrens ZPROP_VALUE, &value) == 0); 6605367Sahrens VERIFY(0 == nvlist_add_uint64(nv, propname, value)); 6615367Sahrens } 6625367Sahrens } 6635367Sahrens } 6645367Sahrens 66510200SLori.Alt@Sun.COM /* 66610200SLori.Alt@Sun.COM * recursively generate nvlists describing datasets. See comment 66710200SLori.Alt@Sun.COM * for the data structure send_data_t above for description of contents 66810200SLori.Alt@Sun.COM * of the nvlist. 
66910200SLori.Alt@Sun.COM */ 6705367Sahrens static int 6715367Sahrens send_iterate_fs(zfs_handle_t *zhp, void *arg) 6725367Sahrens { 6735367Sahrens send_data_t *sd = arg; 6745367Sahrens nvlist_t *nvfs, *nv; 67511022STom.Erickson@Sun.COM int rv = 0; 6765367Sahrens uint64_t parent_fromsnap_guid_save = sd->parent_fromsnap_guid; 6775367Sahrens uint64_t guid = zhp->zfs_dmustats.dds_guid; 6785367Sahrens char guidstring[64]; 6795367Sahrens 6805367Sahrens VERIFY(0 == nvlist_alloc(&nvfs, NV_UNIQUE_NAME, 0)); 6815367Sahrens VERIFY(0 == nvlist_add_string(nvfs, "name", zhp->zfs_name)); 6825367Sahrens VERIFY(0 == nvlist_add_uint64(nvfs, "parentfromsnap", 6835367Sahrens sd->parent_fromsnap_guid)); 6845367Sahrens 6855367Sahrens if (zhp->zfs_dmustats.dds_origin[0]) { 6865367Sahrens zfs_handle_t *origin = zfs_open(zhp->zfs_hdl, 6875367Sahrens zhp->zfs_dmustats.dds_origin, ZFS_TYPE_SNAPSHOT); 6885367Sahrens if (origin == NULL) 6895367Sahrens return (-1); 6905367Sahrens VERIFY(0 == nvlist_add_uint64(nvfs, "origin", 6915367Sahrens origin->zfs_dmustats.dds_guid)); 6925367Sahrens } 6935367Sahrens 6945367Sahrens /* iterate over props */ 6955367Sahrens VERIFY(0 == nvlist_alloc(&nv, NV_UNIQUE_NAME, 0)); 6965367Sahrens send_iterate_prop(zhp, nv); 6975367Sahrens VERIFY(0 == nvlist_add_nvlist(nvfs, "props", nv)); 6985367Sahrens nvlist_free(nv); 6995367Sahrens 7005367Sahrens /* iterate over snaps, and set sd->parent_fromsnap_guid */ 7015367Sahrens sd->parent_fromsnap_guid = 0; 7025367Sahrens VERIFY(0 == nvlist_alloc(&sd->parent_snaps, NV_UNIQUE_NAME, 0)); 7037265Sahrens VERIFY(0 == nvlist_alloc(&sd->snapprops, NV_UNIQUE_NAME, 0)); 7045367Sahrens (void) zfs_iter_snapshots(zhp, send_iterate_snap, sd); 7055367Sahrens VERIFY(0 == nvlist_add_nvlist(nvfs, "snaps", sd->parent_snaps)); 7067265Sahrens VERIFY(0 == nvlist_add_nvlist(nvfs, "snapprops", sd->snapprops)); 7075367Sahrens nvlist_free(sd->parent_snaps); 7087265Sahrens nvlist_free(sd->snapprops); 7095367Sahrens 7105367Sahrens /* add this fs to 
nvlist */ 7115367Sahrens (void) snprintf(guidstring, sizeof (guidstring), 7125367Sahrens "0x%llx", (longlong_t)guid); 7135367Sahrens VERIFY(0 == nvlist_add_nvlist(sd->fss, guidstring, nvfs)); 7145367Sahrens nvlist_free(nvfs); 7155367Sahrens 7165367Sahrens /* iterate over children */ 71711022STom.Erickson@Sun.COM if (sd->recursive) 71811022STom.Erickson@Sun.COM rv = zfs_iter_filesystems(zhp, send_iterate_fs, sd); 7195367Sahrens 7205367Sahrens sd->parent_fromsnap_guid = parent_fromsnap_guid_save; 7215367Sahrens 7225367Sahrens zfs_close(zhp); 7235367Sahrens return (rv); 7245367Sahrens } 7255367Sahrens 7265367Sahrens static int 7275367Sahrens gather_nvlist(libzfs_handle_t *hdl, const char *fsname, const char *fromsnap, 72811022STom.Erickson@Sun.COM const char *tosnap, boolean_t recursive, nvlist_t **nvlp, avl_tree_t **avlp) 7295367Sahrens { 7305367Sahrens zfs_handle_t *zhp; 7315367Sahrens send_data_t sd = { 0 }; 7325367Sahrens int error; 7335367Sahrens 7345367Sahrens zhp = zfs_open(hdl, fsname, ZFS_TYPE_FILESYSTEM | ZFS_TYPE_VOLUME); 7355367Sahrens if (zhp == NULL) 7365367Sahrens return (EZFS_BADTYPE); 7375367Sahrens 7385367Sahrens VERIFY(0 == nvlist_alloc(&sd.fss, NV_UNIQUE_NAME, 0)); 7395367Sahrens sd.fromsnap = fromsnap; 7405367Sahrens sd.tosnap = tosnap; 74111022STom.Erickson@Sun.COM sd.recursive = recursive; 7425896Sahl 7435896Sahl if ((error = send_iterate_fs(zhp, &sd)) != 0) { 7445896Sahl nvlist_free(sd.fss); 7455896Sahl if (avlp != NULL) 7465896Sahl *avlp = NULL; 7475896Sahl *nvlp = NULL; 7485896Sahl return (error); 7495896Sahl } 7505896Sahl 7515896Sahl if (avlp != NULL && (*avlp = fsavl_create(sd.fss)) == NULL) { 7525896Sahl nvlist_free(sd.fss); 7535896Sahl *nvlp = NULL; 7545896Sahl return (EZFS_NOMEM); 7555896Sahl } 7565367Sahrens 7575367Sahrens *nvlp = sd.fss; 7585896Sahl return (0); 7595367Sahrens } 7605367Sahrens 7615367Sahrens /* 7625367Sahrens * Routines for dealing with the sorted snapshot functionality 7635367Sahrens */ 7645367Sahrens typedef struct 
zfs_node { 7655367Sahrens zfs_handle_t *zn_handle; 7665367Sahrens avl_node_t zn_avlnode; 7675367Sahrens } zfs_node_t; 7685367Sahrens 7695367Sahrens static int 7705367Sahrens zfs_sort_snaps(zfs_handle_t *zhp, void *data) 7715367Sahrens { 7725367Sahrens avl_tree_t *avl = data; 7735367Sahrens zfs_node_t *node = zfs_alloc(zhp->zfs_hdl, sizeof (zfs_node_t)); 7745367Sahrens 7755367Sahrens node->zn_handle = zhp; 7765367Sahrens avl_add(avl, node); 7775367Sahrens return (0); 7785367Sahrens } 7795367Sahrens 7805367Sahrens /* ARGSUSED */ 7815367Sahrens static int 7825367Sahrens zfs_snapshot_compare(const void *larg, const void *rarg) 7835367Sahrens { 7845367Sahrens zfs_handle_t *l = ((zfs_node_t *)larg)->zn_handle; 7855367Sahrens zfs_handle_t *r = ((zfs_node_t *)rarg)->zn_handle; 7865367Sahrens uint64_t lcreate, rcreate; 7875367Sahrens 7885367Sahrens /* 7895367Sahrens * Sort them according to creation time. We use the hidden 7905367Sahrens * CREATETXG property to get an absolute ordering of snapshots. 
7915367Sahrens */ 7925367Sahrens lcreate = zfs_prop_get_int(l, ZFS_PROP_CREATETXG); 7935367Sahrens rcreate = zfs_prop_get_int(r, ZFS_PROP_CREATETXG); 7945367Sahrens 7955367Sahrens if (lcreate < rcreate) 7965367Sahrens return (-1); 7975367Sahrens else if (lcreate > rcreate) 7985367Sahrens return (+1); 7995367Sahrens else 8005367Sahrens return (0); 8015367Sahrens } 8025367Sahrens 80310342Schris.kirby@sun.com int 8045367Sahrens zfs_iter_snapshots_sorted(zfs_handle_t *zhp, zfs_iter_f callback, void *data) 8055367Sahrens { 8065367Sahrens int ret = 0; 8075367Sahrens zfs_node_t *node; 8085367Sahrens avl_tree_t avl; 8095367Sahrens void *cookie = NULL; 8105367Sahrens 8115367Sahrens avl_create(&avl, zfs_snapshot_compare, 8125367Sahrens sizeof (zfs_node_t), offsetof(zfs_node_t, zn_avlnode)); 8135367Sahrens 8145367Sahrens ret = zfs_iter_snapshots(zhp, zfs_sort_snaps, &avl); 8155367Sahrens 8165367Sahrens for (node = avl_first(&avl); node != NULL; node = AVL_NEXT(&avl, node)) 8175367Sahrens ret |= callback(node->zn_handle, data); 8185367Sahrens 8195367Sahrens while ((node = avl_destroy_nodes(&avl, &cookie)) != NULL) 8205367Sahrens free(node); 8215367Sahrens 8225367Sahrens avl_destroy(&avl); 8235367Sahrens 8245367Sahrens return (ret); 8255367Sahrens } 8265367Sahrens 8275367Sahrens /* 8285367Sahrens * Routines specific to "zfs send" 8295367Sahrens */ 8305367Sahrens typedef struct send_dump_data { 8315367Sahrens /* these are all just the short snapname (the part after the @) */ 8325367Sahrens const char *fromsnap; 8335367Sahrens const char *tosnap; 83411007SLori.Alt@Sun.COM char prevsnap[ZFS_MAXNAMELEN]; 8355367Sahrens boolean_t seenfrom, seento, replicate, doall, fromorigin; 8365367Sahrens boolean_t verbose; 8375367Sahrens int outfd; 8385367Sahrens boolean_t err; 8395367Sahrens nvlist_t *fss; 8405367Sahrens avl_tree_t *fsavl; 84111007SLori.Alt@Sun.COM snapfilter_cb_t *filter_cb; 84211007SLori.Alt@Sun.COM void *filter_cb_arg; 8435367Sahrens } send_dump_data_t; 8445367Sahrens 
8455367Sahrens /* 8465367Sahrens * Dumps a backup of the given snapshot (incremental from fromsnap if it's not 8475367Sahrens * NULL) to the file descriptor specified by outfd. 8485367Sahrens */ 8495367Sahrens static int 8505367Sahrens dump_ioctl(zfs_handle_t *zhp, const char *fromsnap, boolean_t fromorigin, 85111668SChris.Kirby@sun.com int outfd, boolean_t enoent_ok, boolean_t *got_enoent) 8525367Sahrens { 8535367Sahrens zfs_cmd_t zc = { 0 }; 8545367Sahrens libzfs_handle_t *hdl = zhp->zfs_hdl; 8555367Sahrens 8565367Sahrens assert(zhp->zfs_type == ZFS_TYPE_SNAPSHOT); 8575367Sahrens assert(fromsnap == NULL || fromsnap[0] == '\0' || !fromorigin); 8585367Sahrens 8595367Sahrens (void) strlcpy(zc.zc_name, zhp->zfs_name, sizeof (zc.zc_name)); 8605367Sahrens if (fromsnap) 8615765Sek110237 (void) strlcpy(zc.zc_value, fromsnap, sizeof (zc.zc_value)); 8625367Sahrens zc.zc_cookie = outfd; 8635367Sahrens zc.zc_obj = fromorigin; 8645367Sahrens 86511668SChris.Kirby@sun.com *got_enoent = B_FALSE; 86611668SChris.Kirby@sun.com 8675367Sahrens if (ioctl(zhp->zfs_hdl->libzfs_fd, ZFS_IOC_SEND, &zc) != 0) { 8685367Sahrens char errbuf[1024]; 8695367Sahrens (void) snprintf(errbuf, sizeof (errbuf), dgettext(TEXT_DOMAIN, 8705367Sahrens "warning: cannot send '%s'"), zhp->zfs_name); 8715367Sahrens 8725367Sahrens switch (errno) { 8735367Sahrens 8745367Sahrens case EXDEV: 8755367Sahrens zfs_error_aux(hdl, dgettext(TEXT_DOMAIN, 8765367Sahrens "not an earlier snapshot from the same fs")); 8775367Sahrens return (zfs_error(hdl, EZFS_CROSSTARGET, errbuf)); 8785367Sahrens 8795367Sahrens case ENOENT: 88011668SChris.Kirby@sun.com if (enoent_ok) { 88111668SChris.Kirby@sun.com *got_enoent = B_TRUE; 88211668SChris.Kirby@sun.com return (0); 88311668SChris.Kirby@sun.com } 8845367Sahrens if (zfs_dataset_exists(hdl, zc.zc_name, 8855367Sahrens ZFS_TYPE_SNAPSHOT)) { 8865367Sahrens zfs_error_aux(hdl, dgettext(TEXT_DOMAIN, 8875367Sahrens "incremental source (@%s) does not exist"), 8885367Sahrens zc.zc_value); 
8895367Sahrens } 8905367Sahrens return (zfs_error(hdl, EZFS_NOENT, errbuf)); 8915367Sahrens 8925367Sahrens case EDQUOT: 8935367Sahrens case EFBIG: 8945367Sahrens case EIO: 8955367Sahrens case ENOLINK: 8965367Sahrens case ENOSPC: 8975367Sahrens case ENOSTR: 8985367Sahrens case ENXIO: 8995367Sahrens case EPIPE: 9005367Sahrens case ERANGE: 9015367Sahrens case EFAULT: 9025367Sahrens case EROFS: 9035367Sahrens zfs_error_aux(hdl, strerror(errno)); 9045367Sahrens return (zfs_error(hdl, EZFS_BADBACKUP, errbuf)); 9055367Sahrens 9065367Sahrens default: 9075367Sahrens return (zfs_standard_error(hdl, errno, errbuf)); 9085367Sahrens } 9095367Sahrens } 9105367Sahrens 9115367Sahrens return (0); 9125367Sahrens } 9135367Sahrens 9145367Sahrens static int 9155367Sahrens dump_snapshot(zfs_handle_t *zhp, void *arg) 9165367Sahrens { 9175367Sahrens send_dump_data_t *sdd = arg; 9185367Sahrens const char *thissnap; 9195367Sahrens int err; 92011668SChris.Kirby@sun.com boolean_t got_enoent; 9215367Sahrens 9225367Sahrens thissnap = strchr(zhp->zfs_name, '@') + 1; 9235367Sahrens 9245367Sahrens if (sdd->fromsnap && !sdd->seenfrom && 9255367Sahrens strcmp(sdd->fromsnap, thissnap) == 0) { 9265367Sahrens sdd->seenfrom = B_TRUE; 92711007SLori.Alt@Sun.COM (void) strcpy(sdd->prevsnap, thissnap); 9285367Sahrens zfs_close(zhp); 9295367Sahrens return (0); 9305367Sahrens } 9315367Sahrens 9325367Sahrens if (sdd->seento || !sdd->seenfrom) { 9335367Sahrens zfs_close(zhp); 9345367Sahrens return (0); 9355367Sahrens } 9365367Sahrens 93711007SLori.Alt@Sun.COM if (strcmp(sdd->tosnap, thissnap) == 0) 93811007SLori.Alt@Sun.COM sdd->seento = B_TRUE; 93911007SLori.Alt@Sun.COM 94011007SLori.Alt@Sun.COM /* 94111007SLori.Alt@Sun.COM * If a filter function exists, call it to determine whether 94211007SLori.Alt@Sun.COM * this snapshot will be sent. 
94311007SLori.Alt@Sun.COM */ 94411007SLori.Alt@Sun.COM if (sdd->filter_cb != NULL && 94511007SLori.Alt@Sun.COM sdd->filter_cb(zhp, sdd->filter_cb_arg) == B_FALSE) { 94611007SLori.Alt@Sun.COM /* 94711007SLori.Alt@Sun.COM * This snapshot is filtered out. Don't send it, and don't 94811007SLori.Alt@Sun.COM * set prevsnap, so it will be as if this snapshot didn't 94911007SLori.Alt@Sun.COM * exist, and the next accepted snapshot will be sent as 95011007SLori.Alt@Sun.COM * an incremental from the last accepted one, or as the 95111007SLori.Alt@Sun.COM * first (and full) snapshot in the case of a replication, 95211007SLori.Alt@Sun.COM * non-incremental send. 95311007SLori.Alt@Sun.COM */ 95411007SLori.Alt@Sun.COM zfs_close(zhp); 95511007SLori.Alt@Sun.COM return (0); 95611007SLori.Alt@Sun.COM } 95711007SLori.Alt@Sun.COM 9585367Sahrens /* send it */ 9595367Sahrens if (sdd->verbose) { 9605367Sahrens (void) fprintf(stderr, "sending from @%s to %s\n", 96111007SLori.Alt@Sun.COM sdd->prevsnap, zhp->zfs_name); 9625367Sahrens } 9635367Sahrens 96411007SLori.Alt@Sun.COM err = dump_ioctl(zhp, sdd->prevsnap, 96511007SLori.Alt@Sun.COM sdd->prevsnap[0] == '\0' && (sdd->fromorigin || sdd->replicate), 96611668SChris.Kirby@sun.com sdd->outfd, B_TRUE, &got_enoent); 9675367Sahrens 96811668SChris.Kirby@sun.com if (got_enoent) 96911668SChris.Kirby@sun.com err = 0; 97011668SChris.Kirby@sun.com else 97111668SChris.Kirby@sun.com (void) strcpy(sdd->prevsnap, thissnap); 9725367Sahrens zfs_close(zhp); 9735367Sahrens return (err); 9745367Sahrens } 9755367Sahrens 9765367Sahrens static int 9775367Sahrens dump_filesystem(zfs_handle_t *zhp, void *arg) 9785367Sahrens { 9795367Sahrens int rv = 0; 9805367Sahrens send_dump_data_t *sdd = arg; 9815367Sahrens boolean_t missingfrom = B_FALSE; 9825367Sahrens zfs_cmd_t zc = { 0 }; 9835367Sahrens 9845367Sahrens (void) snprintf(zc.zc_name, sizeof (zc.zc_name), "%s@%s", 9855367Sahrens zhp->zfs_name, sdd->tosnap); 9865367Sahrens if (ioctl(zhp->zfs_hdl->libzfs_fd, 
ZFS_IOC_OBJSET_STATS, &zc) != 0) { 9875367Sahrens (void) fprintf(stderr, "WARNING: " 9885367Sahrens "could not send %s@%s: does not exist\n", 9895367Sahrens zhp->zfs_name, sdd->tosnap); 9905367Sahrens sdd->err = B_TRUE; 9915367Sahrens return (0); 9925367Sahrens } 9935367Sahrens 9945367Sahrens if (sdd->replicate && sdd->fromsnap) { 9955367Sahrens /* 9965367Sahrens * If this fs does not have fromsnap, and we're doing 9975367Sahrens * recursive, we need to send a full stream from the 9985367Sahrens * beginning (or an incremental from the origin if this 9995367Sahrens * is a clone). If we're doing non-recursive, then let 10005367Sahrens * them get the error. 10015367Sahrens */ 10025367Sahrens (void) snprintf(zc.zc_name, sizeof (zc.zc_name), "%s@%s", 10035367Sahrens zhp->zfs_name, sdd->fromsnap); 10045367Sahrens if (ioctl(zhp->zfs_hdl->libzfs_fd, 10055367Sahrens ZFS_IOC_OBJSET_STATS, &zc) != 0) { 10065367Sahrens missingfrom = B_TRUE; 10075367Sahrens } 10085367Sahrens } 10095367Sahrens 10105367Sahrens if (sdd->doall) { 101111007SLori.Alt@Sun.COM sdd->seenfrom = sdd->seento = sdd->prevsnap[0] = 0; 10125367Sahrens if (sdd->fromsnap == NULL || missingfrom) 10135367Sahrens sdd->seenfrom = B_TRUE; 10145367Sahrens 10155367Sahrens rv = zfs_iter_snapshots_sorted(zhp, dump_snapshot, arg); 10165367Sahrens if (!sdd->seenfrom) { 10175367Sahrens (void) fprintf(stderr, 10185367Sahrens "WARNING: could not send %s@%s:\n" 10195367Sahrens "incremental source (%s@%s) does not exist\n", 10205367Sahrens zhp->zfs_name, sdd->tosnap, 10215367Sahrens zhp->zfs_name, sdd->fromsnap); 10225367Sahrens sdd->err = B_TRUE; 10235367Sahrens } else if (!sdd->seento) { 10249396SMatthew.Ahrens@Sun.COM if (sdd->fromsnap) { 10259396SMatthew.Ahrens@Sun.COM (void) fprintf(stderr, 10269396SMatthew.Ahrens@Sun.COM "WARNING: could not send %s@%s:\n" 10279396SMatthew.Ahrens@Sun.COM "incremental source (%s@%s) " 10289396SMatthew.Ahrens@Sun.COM "is not earlier than it\n", 10299396SMatthew.Ahrens@Sun.COM zhp->zfs_name, 
sdd->tosnap, 10309396SMatthew.Ahrens@Sun.COM zhp->zfs_name, sdd->fromsnap); 10319396SMatthew.Ahrens@Sun.COM } else { 10329396SMatthew.Ahrens@Sun.COM (void) fprintf(stderr, "WARNING: " 10339396SMatthew.Ahrens@Sun.COM "could not send %s@%s: does not exist\n", 10349396SMatthew.Ahrens@Sun.COM zhp->zfs_name, sdd->tosnap); 10359396SMatthew.Ahrens@Sun.COM } 10365367Sahrens sdd->err = B_TRUE; 10375367Sahrens } 10385367Sahrens } else { 10395367Sahrens zfs_handle_t *snapzhp; 10405367Sahrens char snapname[ZFS_MAXNAMELEN]; 10415367Sahrens 10425367Sahrens (void) snprintf(snapname, sizeof (snapname), "%s@%s", 10435367Sahrens zfs_get_name(zhp), sdd->tosnap); 10445367Sahrens snapzhp = zfs_open(zhp->zfs_hdl, snapname, ZFS_TYPE_SNAPSHOT); 10456476Sahl if (snapzhp == NULL) { 10466476Sahl rv = -1; 10476476Sahl } else { 104811007SLori.Alt@Sun.COM if (sdd->filter_cb == NULL || 104911007SLori.Alt@Sun.COM sdd->filter_cb(snapzhp, sdd->filter_cb_arg) == 105011007SLori.Alt@Sun.COM B_TRUE) { 105111668SChris.Kirby@sun.com boolean_t got_enoent; 105211668SChris.Kirby@sun.com 105311007SLori.Alt@Sun.COM rv = dump_ioctl(snapzhp, 105411007SLori.Alt@Sun.COM missingfrom ? 
NULL : sdd->fromsnap, 105511007SLori.Alt@Sun.COM sdd->fromorigin || missingfrom, 105611668SChris.Kirby@sun.com sdd->outfd, B_FALSE, &got_enoent); 105711007SLori.Alt@Sun.COM } 10586476Sahl sdd->seento = B_TRUE; 10596476Sahl zfs_close(snapzhp); 10606476Sahl } 10615367Sahrens } 10625367Sahrens 10635367Sahrens return (rv); 10645367Sahrens } 10655367Sahrens 10665367Sahrens static int 10675367Sahrens dump_filesystems(zfs_handle_t *rzhp, void *arg) 10685367Sahrens { 10695367Sahrens send_dump_data_t *sdd = arg; 10705367Sahrens nvpair_t *fspair; 10715367Sahrens boolean_t needagain, progress; 10725367Sahrens 10735367Sahrens if (!sdd->replicate) 10745367Sahrens return (dump_filesystem(rzhp, sdd)); 10755367Sahrens 10765367Sahrens again: 10775367Sahrens needagain = progress = B_FALSE; 10785367Sahrens for (fspair = nvlist_next_nvpair(sdd->fss, NULL); fspair; 10795367Sahrens fspair = nvlist_next_nvpair(sdd->fss, fspair)) { 10805367Sahrens nvlist_t *fslist; 10815367Sahrens char *fsname; 10825367Sahrens zfs_handle_t *zhp; 10835367Sahrens int err; 10845367Sahrens uint64_t origin_guid = 0; 10855367Sahrens nvlist_t *origin_nv; 10865367Sahrens 10875367Sahrens VERIFY(nvpair_value_nvlist(fspair, &fslist) == 0); 10885367Sahrens if (nvlist_lookup_boolean(fslist, "sent") == 0) 10895367Sahrens continue; 10905367Sahrens 10915367Sahrens VERIFY(nvlist_lookup_string(fslist, "name", &fsname) == 0); 10925367Sahrens (void) nvlist_lookup_uint64(fslist, "origin", &origin_guid); 10935367Sahrens 10945367Sahrens origin_nv = fsavl_find(sdd->fsavl, origin_guid, NULL); 10955367Sahrens if (origin_nv && 10965367Sahrens nvlist_lookup_boolean(origin_nv, "sent") == ENOENT) { 109711022STom.Erickson@Sun.COM /* 109811022STom.Erickson@Sun.COM * origin has not been sent yet; 109911022STom.Erickson@Sun.COM * skip this clone. 
110011022STom.Erickson@Sun.COM */ 110111022STom.Erickson@Sun.COM needagain = B_TRUE; 110211022STom.Erickson@Sun.COM continue; 11035367Sahrens } 11045367Sahrens 11055367Sahrens zhp = zfs_open(rzhp->zfs_hdl, fsname, ZFS_TYPE_DATASET); 11066476Sahl if (zhp == NULL) 11076476Sahl return (-1); 11085367Sahrens err = dump_filesystem(zhp, sdd); 11095367Sahrens VERIFY(nvlist_add_boolean(fslist, "sent") == 0); 11105367Sahrens progress = B_TRUE; 11115367Sahrens zfs_close(zhp); 11125367Sahrens if (err) 11135367Sahrens return (err); 11145367Sahrens } 11155367Sahrens if (needagain) { 11165367Sahrens assert(progress); 11175367Sahrens goto again; 11185367Sahrens } 11195367Sahrens return (0); 11205367Sahrens } 11215367Sahrens 11225367Sahrens /* 112310200SLori.Alt@Sun.COM * Generate a send stream for the dataset identified by the argument zhp. 112410200SLori.Alt@Sun.COM * 112510200SLori.Alt@Sun.COM * The content of the send stream is the snapshot identified by 112610200SLori.Alt@Sun.COM * 'tosnap'. Incremental streams are requested in two ways: 112710200SLori.Alt@Sun.COM * - from the snapshot identified by "fromsnap" (if non-null) or 112810200SLori.Alt@Sun.COM * - from the origin of the dataset identified by zhp, which must 112910200SLori.Alt@Sun.COM * be a clone. In this case, "fromsnap" is null and "fromorigin" 113010200SLori.Alt@Sun.COM * is TRUE. 113110200SLori.Alt@Sun.COM * 113210200SLori.Alt@Sun.COM * The send stream is recursive (i.e. dumps a hierarchy of snapshots) and 113311007SLori.Alt@Sun.COM * uses a special header (with a hdrtype field of DMU_COMPOUNDSTREAM) 113410200SLori.Alt@Sun.COM * if "replicate" is set. If "doall" is set, dump all the intermediate 113511007SLori.Alt@Sun.COM * snapshots. The DMU_COMPOUNDSTREAM header is used in the "doall" 113611022STom.Erickson@Sun.COM * case too. If "props" is set, send properties. 
11375367Sahrens */ 11385367Sahrens int 11395367Sahrens zfs_send(zfs_handle_t *zhp, const char *fromsnap, const char *tosnap, 114011007SLori.Alt@Sun.COM sendflags_t flags, int outfd, snapfilter_cb_t filter_func, 114111007SLori.Alt@Sun.COM void *cb_arg) 11425367Sahrens { 11435367Sahrens char errbuf[1024]; 11445367Sahrens send_dump_data_t sdd = { 0 }; 11455367Sahrens int err; 11465367Sahrens nvlist_t *fss = NULL; 11475367Sahrens avl_tree_t *fsavl = NULL; 114810342Schris.kirby@sun.com char holdtag[128]; 114910342Schris.kirby@sun.com static uint64_t holdseq; 115010735Schris.kirby@sun.com int spa_version; 115110735Schris.kirby@sun.com boolean_t holdsnaps = B_FALSE; 115211007SLori.Alt@Sun.COM pthread_t tid; 115311007SLori.Alt@Sun.COM int pipefd[2]; 115411007SLori.Alt@Sun.COM dedup_arg_t dda = { 0 }; 115511007SLori.Alt@Sun.COM int featureflags = 0; 11565367Sahrens 11575367Sahrens (void) snprintf(errbuf, sizeof (errbuf), dgettext(TEXT_DOMAIN, 11585367Sahrens "cannot send '%s'"), zhp->zfs_name); 11595367Sahrens 11605367Sahrens if (fromsnap && fromsnap[0] == '\0') { 11615367Sahrens zfs_error_aux(zhp->zfs_hdl, dgettext(TEXT_DOMAIN, 11625367Sahrens "zero-length incremental source")); 11635367Sahrens return (zfs_error(zhp->zfs_hdl, EZFS_NOENT, errbuf)); 11645367Sahrens } 11655367Sahrens 116610735Schris.kirby@sun.com if (zfs_spa_version(zhp, &spa_version) == 0 && 116710735Schris.kirby@sun.com spa_version >= SPA_VERSION_USERREFS) 116810735Schris.kirby@sun.com holdsnaps = B_TRUE; 116910735Schris.kirby@sun.com 117011007SLori.Alt@Sun.COM if (flags.dedup) { 117111381SLori.Alt@Sun.COM featureflags |= (DMU_BACKUP_FEATURE_DEDUP | 117211381SLori.Alt@Sun.COM DMU_BACKUP_FEATURE_DEDUPPROPS); 117311007SLori.Alt@Sun.COM if (err = pipe(pipefd)) { 117411007SLori.Alt@Sun.COM zfs_error_aux(zhp->zfs_hdl, strerror(errno)); 117511007SLori.Alt@Sun.COM return (zfs_error(zhp->zfs_hdl, EZFS_PIPEFAILED, 117611007SLori.Alt@Sun.COM errbuf)); 117711007SLori.Alt@Sun.COM } 117811007SLori.Alt@Sun.COM 
dda.outputfd = outfd; 117911007SLori.Alt@Sun.COM dda.inputfd = pipefd[1]; 118011007SLori.Alt@Sun.COM dda.dedup_hdl = zhp->zfs_hdl; 118111007SLori.Alt@Sun.COM if (err = pthread_create(&tid, NULL, cksummer, &dda)) { 118211007SLori.Alt@Sun.COM (void) close(pipefd[0]); 118311007SLori.Alt@Sun.COM (void) close(pipefd[1]); 118411007SLori.Alt@Sun.COM zfs_error_aux(zhp->zfs_hdl, strerror(errno)); 118511007SLori.Alt@Sun.COM return (zfs_error(zhp->zfs_hdl, 118611007SLori.Alt@Sun.COM EZFS_THREADCREATEFAILED, errbuf)); 118711007SLori.Alt@Sun.COM } 118811007SLori.Alt@Sun.COM } 118911007SLori.Alt@Sun.COM 119011022STom.Erickson@Sun.COM if (flags.replicate || flags.doall || flags.props) { 11915367Sahrens dmu_replay_record_t drr = { 0 }; 11925367Sahrens char *packbuf = NULL; 11935367Sahrens size_t buflen = 0; 11945367Sahrens zio_cksum_t zc = { 0 }; 11955367Sahrens 119610735Schris.kirby@sun.com if (holdsnaps) { 119710735Schris.kirby@sun.com (void) snprintf(holdtag, sizeof (holdtag), 119810735Schris.kirby@sun.com ".send-%d-%llu", getpid(), (u_longlong_t)holdseq); 119910735Schris.kirby@sun.com ++holdseq; 120010735Schris.kirby@sun.com err = zfs_hold_range(zhp, fromsnap, tosnap, 1201*11814SChris.Kirby@sun.com holdtag, flags.replicate, B_TRUE, filter_func, 1202*11814SChris.Kirby@sun.com cb_arg); 120310735Schris.kirby@sun.com if (err) 120411007SLori.Alt@Sun.COM goto err_out; 120510735Schris.kirby@sun.com } 120611007SLori.Alt@Sun.COM 120711022STom.Erickson@Sun.COM if (flags.replicate || flags.props) { 12085367Sahrens nvlist_t *hdrnv; 12095367Sahrens 12105367Sahrens VERIFY(0 == nvlist_alloc(&hdrnv, NV_UNIQUE_NAME, 0)); 12115367Sahrens if (fromsnap) { 12125367Sahrens VERIFY(0 == nvlist_add_string(hdrnv, 12135367Sahrens "fromsnap", fromsnap)); 12145367Sahrens } 12155367Sahrens VERIFY(0 == nvlist_add_string(hdrnv, "tosnap", tosnap)); 121611022STom.Erickson@Sun.COM if (!flags.replicate) { 121711022STom.Erickson@Sun.COM VERIFY(0 == nvlist_add_boolean(hdrnv, 121811022STom.Erickson@Sun.COM 
"not_recursive")); 121911022STom.Erickson@Sun.COM } 12205367Sahrens 12215367Sahrens err = gather_nvlist(zhp->zfs_hdl, zhp->zfs_name, 122211022STom.Erickson@Sun.COM fromsnap, tosnap, flags.replicate, &fss, &fsavl); 122310342Schris.kirby@sun.com if (err) { 122410735Schris.kirby@sun.com if (holdsnaps) { 122510735Schris.kirby@sun.com (void) zfs_release_range(zhp, fromsnap, 122611546SChris.Kirby@sun.com tosnap, holdtag, flags.replicate); 122710735Schris.kirby@sun.com } 122811007SLori.Alt@Sun.COM goto err_out; 122910342Schris.kirby@sun.com } 12305367Sahrens VERIFY(0 == nvlist_add_nvlist(hdrnv, "fss", fss)); 12315367Sahrens err = nvlist_pack(hdrnv, &packbuf, &buflen, 12325367Sahrens NV_ENCODE_XDR, 0); 12335367Sahrens nvlist_free(hdrnv); 12345367Sahrens if (err) { 12355367Sahrens fsavl_destroy(fsavl); 12365367Sahrens nvlist_free(fss); 123710735Schris.kirby@sun.com if (holdsnaps) { 123810735Schris.kirby@sun.com (void) zfs_release_range(zhp, fromsnap, 123911546SChris.Kirby@sun.com tosnap, holdtag, flags.replicate); 124010735Schris.kirby@sun.com } 124111007SLori.Alt@Sun.COM goto stderr_out; 12425367Sahrens } 12435367Sahrens } 12445367Sahrens 12455367Sahrens /* write first begin record */ 12465367Sahrens drr.drr_type = DRR_BEGIN; 12475367Sahrens drr.drr_u.drr_begin.drr_magic = DMU_BACKUP_MAGIC; 124811007SLori.Alt@Sun.COM DMU_SET_STREAM_HDRTYPE(drr.drr_u.drr_begin.drr_versioninfo, 124911007SLori.Alt@Sun.COM DMU_COMPOUNDSTREAM); 125011007SLori.Alt@Sun.COM DMU_SET_FEATUREFLAGS(drr.drr_u.drr_begin.drr_versioninfo, 125111007SLori.Alt@Sun.COM featureflags); 12525367Sahrens (void) snprintf(drr.drr_u.drr_begin.drr_toname, 12535367Sahrens sizeof (drr.drr_u.drr_begin.drr_toname), 12545367Sahrens "%s@%s", zhp->zfs_name, tosnap); 12555367Sahrens drr.drr_payloadlen = buflen; 125611007SLori.Alt@Sun.COM err = cksum_and_write(&drr, sizeof (drr), &zc, outfd); 12575367Sahrens 12585367Sahrens /* write header nvlist */ 125911022STom.Erickson@Sun.COM if (err != -1 && packbuf != NULL) { 
126011007SLori.Alt@Sun.COM err = cksum_and_write(packbuf, buflen, &zc, outfd); 12615367Sahrens } 12625367Sahrens free(packbuf); 12635367Sahrens if (err == -1) { 12645367Sahrens fsavl_destroy(fsavl); 12655367Sahrens nvlist_free(fss); 126610735Schris.kirby@sun.com if (holdsnaps) { 126710735Schris.kirby@sun.com (void) zfs_release_range(zhp, fromsnap, tosnap, 126811546SChris.Kirby@sun.com holdtag, flags.replicate); 126910735Schris.kirby@sun.com } 127011007SLori.Alt@Sun.COM err = errno; 127111007SLori.Alt@Sun.COM goto stderr_out; 12725367Sahrens } 12735367Sahrens 12745367Sahrens /* write end record */ 12755367Sahrens if (err != -1) { 12765367Sahrens bzero(&drr, sizeof (drr)); 12775367Sahrens drr.drr_type = DRR_END; 12785367Sahrens drr.drr_u.drr_end.drr_checksum = zc; 12795367Sahrens err = write(outfd, &drr, sizeof (drr)); 12805367Sahrens if (err == -1) { 12815367Sahrens fsavl_destroy(fsavl); 12825367Sahrens nvlist_free(fss); 128311668SChris.Kirby@sun.com err = errno; 128410735Schris.kirby@sun.com if (holdsnaps) { 128510735Schris.kirby@sun.com (void) zfs_release_range(zhp, fromsnap, 128611546SChris.Kirby@sun.com tosnap, holdtag, flags.replicate); 128710735Schris.kirby@sun.com } 128811007SLori.Alt@Sun.COM goto stderr_out; 12895367Sahrens } 12905367Sahrens } 12915367Sahrens } 12925367Sahrens 12935367Sahrens /* dump each stream */ 12945367Sahrens sdd.fromsnap = fromsnap; 12955367Sahrens sdd.tosnap = tosnap; 129611007SLori.Alt@Sun.COM if (flags.dedup) 129711007SLori.Alt@Sun.COM sdd.outfd = pipefd[0]; 129811007SLori.Alt@Sun.COM else 129911007SLori.Alt@Sun.COM sdd.outfd = outfd; 130011007SLori.Alt@Sun.COM sdd.replicate = flags.replicate; 130111007SLori.Alt@Sun.COM sdd.doall = flags.doall; 130211007SLori.Alt@Sun.COM sdd.fromorigin = flags.fromorigin; 13035367Sahrens sdd.fss = fss; 13045367Sahrens sdd.fsavl = fsavl; 130511007SLori.Alt@Sun.COM sdd.verbose = flags.verbose; 130611007SLori.Alt@Sun.COM sdd.filter_cb = filter_func; 130711007SLori.Alt@Sun.COM sdd.filter_cb_arg = 
cb_arg; 13085367Sahrens err = dump_filesystems(zhp, &sdd); 13095367Sahrens fsavl_destroy(fsavl); 13105367Sahrens nvlist_free(fss); 13115367Sahrens 131211007SLori.Alt@Sun.COM if (flags.dedup) { 131311007SLori.Alt@Sun.COM (void) close(pipefd[0]); 131411007SLori.Alt@Sun.COM (void) pthread_join(tid, NULL); 131511007SLori.Alt@Sun.COM } 131611022STom.Erickson@Sun.COM 131711022STom.Erickson@Sun.COM if (flags.replicate || flags.doall || flags.props) { 13185367Sahrens /* 13195367Sahrens * write final end record. NB: want to do this even if 13205367Sahrens * there was some error, because it might not be totally 13215367Sahrens * failed. 13225367Sahrens */ 13235367Sahrens dmu_replay_record_t drr = { 0 }; 13245367Sahrens drr.drr_type = DRR_END; 132510735Schris.kirby@sun.com if (holdsnaps) { 132610735Schris.kirby@sun.com (void) zfs_release_range(zhp, fromsnap, tosnap, 132711546SChris.Kirby@sun.com holdtag, flags.replicate); 132810735Schris.kirby@sun.com } 13295367Sahrens if (write(outfd, &drr, sizeof (drr)) == -1) { 13305367Sahrens return (zfs_standard_error(zhp->zfs_hdl, 13315367Sahrens errno, errbuf)); 13325367Sahrens } 13335367Sahrens } 13345367Sahrens 13355367Sahrens return (err || sdd.err); 133611007SLori.Alt@Sun.COM 133711007SLori.Alt@Sun.COM stderr_out: 133811007SLori.Alt@Sun.COM err = zfs_standard_error(zhp->zfs_hdl, err, errbuf); 133911007SLori.Alt@Sun.COM err_out: 134011007SLori.Alt@Sun.COM if (flags.dedup) { 134111007SLori.Alt@Sun.COM (void) pthread_cancel(tid); 134211007SLori.Alt@Sun.COM (void) pthread_join(tid, NULL); 134311007SLori.Alt@Sun.COM (void) close(pipefd[0]); 134411007SLori.Alt@Sun.COM } 134511007SLori.Alt@Sun.COM return (err); 13465367Sahrens } 13475367Sahrens 13485367Sahrens /* 13495367Sahrens * Routines specific to "zfs recv" 13505367Sahrens */ 13515367Sahrens 13525367Sahrens static int 13535367Sahrens recv_read(libzfs_handle_t *hdl, int fd, void *buf, int ilen, 13545367Sahrens boolean_t byteswap, zio_cksum_t *zc) 13555367Sahrens { 13565367Sahrens char 
*cp = buf; 13575367Sahrens int rv; 13585367Sahrens int len = ilen; 13595367Sahrens 13605367Sahrens do { 13615367Sahrens rv = read(fd, cp, len); 13625367Sahrens cp += rv; 13635367Sahrens len -= rv; 13645367Sahrens } while (rv > 0); 13655367Sahrens 13665367Sahrens if (rv < 0 || len != 0) { 13675367Sahrens zfs_error_aux(hdl, dgettext(TEXT_DOMAIN, 13685367Sahrens "failed to read from stream")); 13695367Sahrens return (zfs_error(hdl, EZFS_BADSTREAM, dgettext(TEXT_DOMAIN, 13705367Sahrens "cannot receive"))); 13715367Sahrens } 13725367Sahrens 13735367Sahrens if (zc) { 13745367Sahrens if (byteswap) 13755367Sahrens fletcher_4_incremental_byteswap(buf, ilen, zc); 13765367Sahrens else 13775367Sahrens fletcher_4_incremental_native(buf, ilen, zc); 13785367Sahrens } 13795367Sahrens return (0); 13805367Sahrens } 13815367Sahrens 13825367Sahrens static int 13835367Sahrens recv_read_nvlist(libzfs_handle_t *hdl, int fd, int len, nvlist_t **nvp, 13845367Sahrens boolean_t byteswap, zio_cksum_t *zc) 13855367Sahrens { 13865367Sahrens char *buf; 13875367Sahrens int err; 13885367Sahrens 13895367Sahrens buf = zfs_alloc(hdl, len); 13905367Sahrens if (buf == NULL) 13915367Sahrens return (ENOMEM); 13925367Sahrens 13935367Sahrens err = recv_read(hdl, fd, buf, len, byteswap, zc); 13945367Sahrens if (err != 0) { 13955367Sahrens free(buf); 13965367Sahrens return (err); 13975367Sahrens } 13985367Sahrens 13995367Sahrens err = nvlist_unpack(buf, len, nvp, 0); 14005367Sahrens free(buf); 14015367Sahrens if (err != 0) { 14025367Sahrens zfs_error_aux(hdl, dgettext(TEXT_DOMAIN, "invalid " 14035367Sahrens "stream (malformed nvlist)")); 14045367Sahrens return (EINVAL); 14055367Sahrens } 14065367Sahrens return (0); 14075367Sahrens } 14085367Sahrens 14095367Sahrens static int 14105367Sahrens recv_rename(libzfs_handle_t *hdl, const char *name, const char *tryname, 14115367Sahrens int baselen, char *newname, recvflags_t flags) 14125367Sahrens { 14135367Sahrens static int seq; 14145367Sahrens zfs_cmd_t zc = { 0 
}; 14155367Sahrens int err; 14166047Sahrens prop_changelist_t *clp; 14176047Sahrens zfs_handle_t *zhp; 14185367Sahrens 14196047Sahrens zhp = zfs_open(hdl, name, ZFS_TYPE_DATASET); 14206047Sahrens if (zhp == NULL) 14216047Sahrens return (-1); 14227366STim.Haley@Sun.COM clp = changelist_gather(zhp, ZFS_PROP_NAME, 0, 14237366STim.Haley@Sun.COM flags.force ? MS_FORCE : 0); 14246047Sahrens zfs_close(zhp); 14256047Sahrens if (clp == NULL) 14266047Sahrens return (-1); 14276047Sahrens err = changelist_prefix(clp); 14286047Sahrens if (err) 14296047Sahrens return (err); 14305367Sahrens 143110242Schris.kirby@sun.com zc.zc_objset_type = DMU_OST_ZFS; 143210242Schris.kirby@sun.com (void) strlcpy(zc.zc_name, name, sizeof (zc.zc_name)); 143310242Schris.kirby@sun.com 14345367Sahrens if (tryname) { 14355367Sahrens (void) strcpy(newname, tryname); 14365367Sahrens 14375367Sahrens (void) strlcpy(zc.zc_value, tryname, sizeof (zc.zc_value)); 14385367Sahrens 14395367Sahrens if (flags.verbose) { 14405367Sahrens (void) printf("attempting rename %s to %s\n", 14415367Sahrens zc.zc_name, zc.zc_value); 14425367Sahrens } 14435367Sahrens err = ioctl(hdl->libzfs_fd, ZFS_IOC_RENAME, &zc); 14446047Sahrens if (err == 0) 14455367Sahrens changelist_rename(clp, name, tryname); 14465367Sahrens } else { 14475367Sahrens err = ENOENT; 14485367Sahrens } 14495367Sahrens 14505367Sahrens if (err != 0 && strncmp(name+baselen, "recv-", 5) != 0) { 14515367Sahrens seq++; 14525367Sahrens 14535367Sahrens (void) strncpy(newname, name, baselen); 14545367Sahrens (void) snprintf(newname+baselen, ZFS_MAXNAMELEN-baselen, 14555367Sahrens "recv-%u-%u", getpid(), seq); 14565367Sahrens (void) strlcpy(zc.zc_value, newname, sizeof (zc.zc_value)); 14575367Sahrens 14585367Sahrens if (flags.verbose) { 14595367Sahrens (void) printf("failed - trying rename %s to %s\n", 14605367Sahrens zc.zc_name, zc.zc_value); 14615367Sahrens } 14625367Sahrens err = ioctl(hdl->libzfs_fd, ZFS_IOC_RENAME, &zc); 14636047Sahrens if (err == 0) 
14645367Sahrens changelist_rename(clp, name, newname); 14655367Sahrens if (err && flags.verbose) { 14665367Sahrens (void) printf("failed (%u) - " 14675367Sahrens "will try again on next pass\n", errno); 14685367Sahrens } 14695367Sahrens err = EAGAIN; 14705367Sahrens } else if (flags.verbose) { 14715367Sahrens if (err == 0) 14725367Sahrens (void) printf("success\n"); 14735367Sahrens else 14745367Sahrens (void) printf("failed (%u)\n", errno); 14755367Sahrens } 14765367Sahrens 14776047Sahrens (void) changelist_postfix(clp); 14786047Sahrens changelist_free(clp); 14795367Sahrens 14805367Sahrens return (err); 14815367Sahrens } 14825367Sahrens 14835367Sahrens static int 14845367Sahrens recv_destroy(libzfs_handle_t *hdl, const char *name, int baselen, 14855367Sahrens char *newname, recvflags_t flags) 14865367Sahrens { 14875367Sahrens zfs_cmd_t zc = { 0 }; 14886047Sahrens int err = 0; 14896047Sahrens prop_changelist_t *clp; 14906047Sahrens zfs_handle_t *zhp; 149110242Schris.kirby@sun.com boolean_t defer = B_FALSE; 149210242Schris.kirby@sun.com int spa_version; 14936047Sahrens 14946047Sahrens zhp = zfs_open(hdl, name, ZFS_TYPE_DATASET); 14956047Sahrens if (zhp == NULL) 14966047Sahrens return (-1); 14977366STim.Haley@Sun.COM clp = changelist_gather(zhp, ZFS_PROP_NAME, 0, 14987366STim.Haley@Sun.COM flags.force ? 
MS_FORCE : 0); 149910242Schris.kirby@sun.com if (zfs_get_type(zhp) == ZFS_TYPE_SNAPSHOT && 150010242Schris.kirby@sun.com zfs_spa_version(zhp, &spa_version) == 0 && 150110242Schris.kirby@sun.com spa_version >= SPA_VERSION_USERREFS) 150210242Schris.kirby@sun.com defer = B_TRUE; 15036047Sahrens zfs_close(zhp); 15046047Sahrens if (clp == NULL) 15056047Sahrens return (-1); 15066047Sahrens err = changelist_prefix(clp); 15076047Sahrens if (err) 15086047Sahrens return (err); 15095367Sahrens 15105367Sahrens zc.zc_objset_type = DMU_OST_ZFS; 151110242Schris.kirby@sun.com zc.zc_defer_destroy = defer; 15125367Sahrens (void) strlcpy(zc.zc_name, name, sizeof (zc.zc_name)); 15135367Sahrens 15145367Sahrens if (flags.verbose) 15155367Sahrens (void) printf("attempting destroy %s\n", zc.zc_name); 15165367Sahrens err = ioctl(hdl->libzfs_fd, ZFS_IOC_DESTROY, &zc); 15176047Sahrens if (err == 0) { 15186047Sahrens if (flags.verbose) 15196047Sahrens (void) printf("success\n"); 15206047Sahrens changelist_remove(clp, zc.zc_name); 15215367Sahrens } 15225367Sahrens 15236047Sahrens (void) changelist_postfix(clp); 15246047Sahrens changelist_free(clp); 15256047Sahrens 152610242Schris.kirby@sun.com /* 152711022STom.Erickson@Sun.COM * Deferred destroy might destroy the snapshot or only mark it to be 152811022STom.Erickson@Sun.COM * destroyed later, and it returns success in either case. 
152910242Schris.kirby@sun.com */ 153011022STom.Erickson@Sun.COM if (err != 0 || (defer && zfs_dataset_exists(hdl, name, 153111022STom.Erickson@Sun.COM ZFS_TYPE_SNAPSHOT))) { 15326047Sahrens err = recv_rename(hdl, name, NULL, baselen, newname, flags); 153311022STom.Erickson@Sun.COM } 15345367Sahrens 15355367Sahrens return (err); 15365367Sahrens } 15375367Sahrens 15385367Sahrens typedef struct guid_to_name_data { 15395367Sahrens uint64_t guid; 15405367Sahrens char *name; 15415367Sahrens } guid_to_name_data_t; 15425367Sahrens 15435367Sahrens static int 15445367Sahrens guid_to_name_cb(zfs_handle_t *zhp, void *arg) 15455367Sahrens { 15465367Sahrens guid_to_name_data_t *gtnd = arg; 15475367Sahrens int err; 15485367Sahrens 15495367Sahrens if (zhp->zfs_dmustats.dds_guid == gtnd->guid) { 15505367Sahrens (void) strcpy(gtnd->name, zhp->zfs_name); 155111515STom.Erickson@Sun.COM zfs_close(zhp); 15525367Sahrens return (EEXIST); 15535367Sahrens } 15545367Sahrens err = zfs_iter_children(zhp, guid_to_name_cb, gtnd); 15555367Sahrens zfs_close(zhp); 15565367Sahrens return (err); 15575367Sahrens } 15585367Sahrens 15595367Sahrens static int 15605367Sahrens guid_to_name(libzfs_handle_t *hdl, const char *parent, uint64_t guid, 15615367Sahrens char *name) 15625367Sahrens { 15635367Sahrens /* exhaustive search all local snapshots */ 15645367Sahrens guid_to_name_data_t gtnd; 15655367Sahrens int err = 0; 15665367Sahrens zfs_handle_t *zhp; 15675367Sahrens char *cp; 15685367Sahrens 15695367Sahrens gtnd.guid = guid; 15705367Sahrens gtnd.name = name; 15715367Sahrens 15725367Sahrens if (strchr(parent, '@') == NULL) { 15735367Sahrens zhp = make_dataset_handle(hdl, parent); 15745367Sahrens if (zhp != NULL) { 15755367Sahrens err = zfs_iter_children(zhp, guid_to_name_cb, >nd); 15765367Sahrens zfs_close(zhp); 15775367Sahrens if (err == EEXIST) 15785367Sahrens return (0); 15795367Sahrens } 15805367Sahrens } 15815367Sahrens 15825367Sahrens cp = strchr(parent, '/'); 15835367Sahrens if (cp) 
15845367Sahrens *cp = '\0'; 15855367Sahrens zhp = make_dataset_handle(hdl, parent); 15865367Sahrens if (cp) 15875367Sahrens *cp = '/'; 15885367Sahrens 15895367Sahrens if (zhp) { 15905367Sahrens err = zfs_iter_children(zhp, guid_to_name_cb, >nd); 15915367Sahrens zfs_close(zhp); 15925367Sahrens } 15935367Sahrens 15945367Sahrens return (err == EEXIST ? 0 : ENOENT); 15955367Sahrens 15965367Sahrens } 15975367Sahrens 15985367Sahrens /* 15995367Sahrens * Return true if dataset guid1 is created before guid2. 16005367Sahrens */ 16016476Sahl static int 16025367Sahrens created_before(libzfs_handle_t *hdl, avl_tree_t *avl, 16035367Sahrens uint64_t guid1, uint64_t guid2) 16045367Sahrens { 16055367Sahrens nvlist_t *nvfs; 16065367Sahrens char *fsname, *snapname; 16075367Sahrens char buf[ZFS_MAXNAMELEN]; 16086476Sahl int rv; 16095367Sahrens zfs_node_t zn1, zn2; 16105367Sahrens 16115367Sahrens if (guid2 == 0) 16126476Sahl return (0); 16135367Sahrens if (guid1 == 0) 16146476Sahl return (1); 16155367Sahrens 16165367Sahrens nvfs = fsavl_find(avl, guid1, &snapname); 16175367Sahrens VERIFY(0 == nvlist_lookup_string(nvfs, "name", &fsname)); 16185367Sahrens (void) snprintf(buf, sizeof (buf), "%s@%s", fsname, snapname); 16195367Sahrens zn1.zn_handle = zfs_open(hdl, buf, ZFS_TYPE_SNAPSHOT); 16206476Sahl if (zn1.zn_handle == NULL) 16216476Sahl return (-1); 16225367Sahrens 16235367Sahrens nvfs = fsavl_find(avl, guid2, &snapname); 16245367Sahrens VERIFY(0 == nvlist_lookup_string(nvfs, "name", &fsname)); 16255367Sahrens (void) snprintf(buf, sizeof (buf), "%s@%s", fsname, snapname); 16265367Sahrens zn2.zn_handle = zfs_open(hdl, buf, ZFS_TYPE_SNAPSHOT); 16276476Sahl if (zn2.zn_handle == NULL) { 16286476Sahl zfs_close(zn2.zn_handle); 16296476Sahl return (-1); 16306476Sahl } 16315367Sahrens 16325367Sahrens rv = (zfs_snapshot_compare(&zn1, &zn2) == -1); 16335367Sahrens 16345367Sahrens zfs_close(zn1.zn_handle); 16355367Sahrens zfs_close(zn2.zn_handle); 16365367Sahrens 16375367Sahrens return (rv); 
16385367Sahrens } 16395367Sahrens 16405367Sahrens static int 16415367Sahrens recv_incremental_replication(libzfs_handle_t *hdl, const char *tofs, 16425367Sahrens recvflags_t flags, nvlist_t *stream_nv, avl_tree_t *stream_avl) 16435367Sahrens { 16445367Sahrens nvlist_t *local_nv; 16455367Sahrens avl_tree_t *local_avl; 16465367Sahrens nvpair_t *fselem, *nextfselem; 16475367Sahrens char *tosnap, *fromsnap; 16485367Sahrens char newname[ZFS_MAXNAMELEN]; 16495367Sahrens int error; 165011022STom.Erickson@Sun.COM boolean_t needagain, progress, recursive; 165110299SPrabahar.Jeyaram@Sun.COM char *s1, *s2; 16525367Sahrens 16535367Sahrens VERIFY(0 == nvlist_lookup_string(stream_nv, "fromsnap", &fromsnap)); 16545367Sahrens VERIFY(0 == nvlist_lookup_string(stream_nv, "tosnap", &tosnap)); 16555367Sahrens 165611022STom.Erickson@Sun.COM recursive = (nvlist_lookup_boolean(stream_nv, "not_recursive") == 165711022STom.Erickson@Sun.COM ENOENT); 165811022STom.Erickson@Sun.COM 16595367Sahrens if (flags.dryrun) 16605367Sahrens return (0); 16615367Sahrens 16625367Sahrens again: 16635367Sahrens needagain = progress = B_FALSE; 16645367Sahrens 16655367Sahrens if ((error = gather_nvlist(hdl, tofs, fromsnap, NULL, 166611022STom.Erickson@Sun.COM recursive, &local_nv, &local_avl)) != 0) 16675367Sahrens return (error); 16685367Sahrens 16695367Sahrens /* 16705367Sahrens * Process deletes and renames 16715367Sahrens */ 16725367Sahrens for (fselem = nvlist_next_nvpair(local_nv, NULL); 16735367Sahrens fselem; fselem = nextfselem) { 16745367Sahrens nvlist_t *nvfs, *snaps; 16755367Sahrens nvlist_t *stream_nvfs = NULL; 16765367Sahrens nvpair_t *snapelem, *nextsnapelem; 16775367Sahrens uint64_t fromguid = 0; 16785367Sahrens uint64_t originguid = 0; 16795367Sahrens uint64_t stream_originguid = 0; 16805367Sahrens uint64_t parent_fromsnap_guid, stream_parent_fromsnap_guid; 16815367Sahrens char *fsname, *stream_fsname; 16825367Sahrens 16835367Sahrens nextfselem = nvlist_next_nvpair(local_nv, fselem); 
16845367Sahrens 16855367Sahrens VERIFY(0 == nvpair_value_nvlist(fselem, &nvfs)); 16865367Sahrens VERIFY(0 == nvlist_lookup_nvlist(nvfs, "snaps", &snaps)); 16875367Sahrens VERIFY(0 == nvlist_lookup_string(nvfs, "name", &fsname)); 16885367Sahrens VERIFY(0 == nvlist_lookup_uint64(nvfs, "parentfromsnap", 16895367Sahrens &parent_fromsnap_guid)); 16905367Sahrens (void) nvlist_lookup_uint64(nvfs, "origin", &originguid); 16915367Sahrens 16925367Sahrens /* 16935367Sahrens * First find the stream's fs, so we can check for 16945367Sahrens * a different origin (due to "zfs promote") 16955367Sahrens */ 16965367Sahrens for (snapelem = nvlist_next_nvpair(snaps, NULL); 16975367Sahrens snapelem; snapelem = nvlist_next_nvpair(snaps, snapelem)) { 16985367Sahrens uint64_t thisguid; 16995367Sahrens 17005367Sahrens VERIFY(0 == nvpair_value_uint64(snapelem, &thisguid)); 17015367Sahrens stream_nvfs = fsavl_find(stream_avl, thisguid, NULL); 17025367Sahrens 17035367Sahrens if (stream_nvfs != NULL) 17045367Sahrens break; 17055367Sahrens } 17065367Sahrens 17075367Sahrens /* check for promote */ 17085367Sahrens (void) nvlist_lookup_uint64(stream_nvfs, "origin", 17095367Sahrens &stream_originguid); 17105367Sahrens if (stream_nvfs && originguid != stream_originguid) { 17116476Sahl switch (created_before(hdl, local_avl, 17126476Sahl stream_originguid, originguid)) { 17136476Sahl case 1: { 17145367Sahrens /* promote it! 
*/ 17155367Sahrens zfs_cmd_t zc = { 0 }; 17165367Sahrens nvlist_t *origin_nvfs; 17175367Sahrens char *origin_fsname; 17185367Sahrens 17195367Sahrens if (flags.verbose) 17205367Sahrens (void) printf("promoting %s\n", fsname); 17215367Sahrens 17225367Sahrens origin_nvfs = fsavl_find(local_avl, originguid, 17235367Sahrens NULL); 17245367Sahrens VERIFY(0 == nvlist_lookup_string(origin_nvfs, 17255367Sahrens "name", &origin_fsname)); 17265367Sahrens (void) strlcpy(zc.zc_value, origin_fsname, 17275367Sahrens sizeof (zc.zc_value)); 17285367Sahrens (void) strlcpy(zc.zc_name, fsname, 17295367Sahrens sizeof (zc.zc_name)); 17305367Sahrens error = zfs_ioctl(hdl, ZFS_IOC_PROMOTE, &zc); 17315367Sahrens if (error == 0) 17325367Sahrens progress = B_TRUE; 17336476Sahl break; 17346476Sahl } 17356476Sahl default: 17366476Sahl break; 17376476Sahl case -1: 17386476Sahl fsavl_destroy(local_avl); 17396476Sahl nvlist_free(local_nv); 17406476Sahl return (-1); 17415367Sahrens } 17425367Sahrens /* 17435367Sahrens * We had/have the wrong origin, therefore our 17445367Sahrens * list of snapshots is wrong. Need to handle 17455367Sahrens * them on the next pass. 
17465367Sahrens */ 17475367Sahrens needagain = B_TRUE; 17485367Sahrens continue; 17495367Sahrens } 17505367Sahrens 17515367Sahrens for (snapelem = nvlist_next_nvpair(snaps, NULL); 17525367Sahrens snapelem; snapelem = nextsnapelem) { 17535367Sahrens uint64_t thisguid; 17545367Sahrens char *stream_snapname; 17557265Sahrens nvlist_t *found, *props; 17565367Sahrens 17575367Sahrens nextsnapelem = nvlist_next_nvpair(snaps, snapelem); 17585367Sahrens 17595367Sahrens VERIFY(0 == nvpair_value_uint64(snapelem, &thisguid)); 17605367Sahrens found = fsavl_find(stream_avl, thisguid, 17615367Sahrens &stream_snapname); 17625367Sahrens 17635367Sahrens /* check for delete */ 17645367Sahrens if (found == NULL) { 17655367Sahrens char name[ZFS_MAXNAMELEN]; 17665367Sahrens 17675367Sahrens if (!flags.force) 17685367Sahrens continue; 17695367Sahrens 17705367Sahrens (void) snprintf(name, sizeof (name), "%s@%s", 17715367Sahrens fsname, nvpair_name(snapelem)); 17725367Sahrens 17735367Sahrens error = recv_destroy(hdl, name, 17745367Sahrens strlen(fsname)+1, newname, flags); 17755367Sahrens if (error) 17765367Sahrens needagain = B_TRUE; 17775367Sahrens else 17785367Sahrens progress = B_TRUE; 17795367Sahrens continue; 17805367Sahrens } 17815367Sahrens 17825367Sahrens stream_nvfs = found; 17835367Sahrens 17847265Sahrens if (0 == nvlist_lookup_nvlist(stream_nvfs, "snapprops", 17857265Sahrens &props) && 0 == nvlist_lookup_nvlist(props, 17867265Sahrens stream_snapname, &props)) { 17877265Sahrens zfs_cmd_t zc = { 0 }; 17887265Sahrens 178911022STom.Erickson@Sun.COM zc.zc_cookie = B_TRUE; /* received */ 17907273Sahrens (void) snprintf(zc.zc_name, sizeof (zc.zc_name), 17917265Sahrens "%s@%s", fsname, nvpair_name(snapelem)); 17927265Sahrens if (zcmd_write_src_nvlist(hdl, &zc, 17937265Sahrens props) == 0) { 17947265Sahrens (void) zfs_ioctl(hdl, 17957265Sahrens ZFS_IOC_SET_PROP, &zc); 17967265Sahrens zcmd_free_nvlists(&zc); 17977265Sahrens } 17987265Sahrens } 17997265Sahrens 18005367Sahrens /* check for 
different snapname */ 18015367Sahrens if (strcmp(nvpair_name(snapelem), 18025367Sahrens stream_snapname) != 0) { 18035367Sahrens char name[ZFS_MAXNAMELEN]; 18045367Sahrens char tryname[ZFS_MAXNAMELEN]; 18055367Sahrens 18065367Sahrens (void) snprintf(name, sizeof (name), "%s@%s", 18075367Sahrens fsname, nvpair_name(snapelem)); 18085367Sahrens (void) snprintf(tryname, sizeof (name), "%s@%s", 18095367Sahrens fsname, stream_snapname); 18105367Sahrens 18115367Sahrens error = recv_rename(hdl, name, tryname, 18125367Sahrens strlen(fsname)+1, newname, flags); 18135367Sahrens if (error) 18145367Sahrens needagain = B_TRUE; 18155367Sahrens else 18165367Sahrens progress = B_TRUE; 18175367Sahrens } 18185367Sahrens 18195367Sahrens if (strcmp(stream_snapname, fromsnap) == 0) 18205367Sahrens fromguid = thisguid; 18215367Sahrens } 18225367Sahrens 18235367Sahrens /* check for delete */ 18245367Sahrens if (stream_nvfs == NULL) { 18255367Sahrens if (!flags.force) 18265367Sahrens continue; 18275367Sahrens 18285367Sahrens error = recv_destroy(hdl, fsname, strlen(tofs)+1, 18295367Sahrens newname, flags); 18305367Sahrens if (error) 18315367Sahrens needagain = B_TRUE; 18325367Sahrens else 18335367Sahrens progress = B_TRUE; 18345367Sahrens continue; 18355367Sahrens } 18365367Sahrens 18375367Sahrens if (fromguid == 0 && flags.verbose) { 18385367Sahrens (void) printf("local fs %s does not have fromsnap " 18395367Sahrens "(%s in stream); must have been deleted locally; " 18405367Sahrens "ignoring\n", fsname, fromsnap); 18415367Sahrens continue; 18425367Sahrens } 18435367Sahrens 18445367Sahrens VERIFY(0 == nvlist_lookup_string(stream_nvfs, 18455367Sahrens "name", &stream_fsname)); 18465367Sahrens VERIFY(0 == nvlist_lookup_uint64(stream_nvfs, 18475367Sahrens "parentfromsnap", &stream_parent_fromsnap_guid)); 18485367Sahrens 184910302SPrabahar.Jeyaram@Sun.COM s1 = strrchr(fsname, '/'); 185010302SPrabahar.Jeyaram@Sun.COM s2 = strrchr(stream_fsname, '/'); 185110302SPrabahar.Jeyaram@Sun.COM 
18525367Sahrens /* check for rename */ 18535367Sahrens if ((stream_parent_fromsnap_guid != 0 && 18545367Sahrens stream_parent_fromsnap_guid != parent_fromsnap_guid) || 185510302SPrabahar.Jeyaram@Sun.COM ((s1 != NULL) && (s2 != NULL) && strcmp(s1, s2) != 0)) { 18565367Sahrens nvlist_t *parent; 18575367Sahrens char tryname[ZFS_MAXNAMELEN]; 18585367Sahrens 18595367Sahrens parent = fsavl_find(local_avl, 18605367Sahrens stream_parent_fromsnap_guid, NULL); 18615367Sahrens /* 18625367Sahrens * NB: parent might not be found if we used the 18635367Sahrens * tosnap for stream_parent_fromsnap_guid, 18645367Sahrens * because the parent is a newly-created fs; 18655367Sahrens * we'll be able to rename it after we recv the 18665367Sahrens * new fs. 18675367Sahrens */ 18685367Sahrens if (parent != NULL) { 18695367Sahrens char *pname; 18705367Sahrens 18715367Sahrens VERIFY(0 == nvlist_lookup_string(parent, "name", 18725367Sahrens &pname)); 18735367Sahrens (void) snprintf(tryname, sizeof (tryname), 18745367Sahrens "%s%s", pname, strrchr(stream_fsname, '/')); 18755367Sahrens } else { 18765367Sahrens tryname[0] = '\0'; 18775367Sahrens if (flags.verbose) { 18785367Sahrens (void) printf("local fs %s new parent " 18795367Sahrens "not found\n", fsname); 18805367Sahrens } 18815367Sahrens } 18825367Sahrens 18835367Sahrens error = recv_rename(hdl, fsname, tryname, 18845367Sahrens strlen(tofs)+1, newname, flags); 18855367Sahrens if (error) 18865367Sahrens needagain = B_TRUE; 18875367Sahrens else 18885367Sahrens progress = B_TRUE; 18895367Sahrens } 18905367Sahrens } 18915367Sahrens 18925367Sahrens fsavl_destroy(local_avl); 18935367Sahrens nvlist_free(local_nv); 18945367Sahrens 18955367Sahrens if (needagain && progress) { 18965367Sahrens /* do another pass to fix up temporary names */ 18975367Sahrens if (flags.verbose) 18985367Sahrens (void) printf("another pass:\n"); 18995367Sahrens goto again; 19005367Sahrens } 19015367Sahrens 19025367Sahrens return (needagain); 19035367Sahrens } 
19045367Sahrens 19055367Sahrens static int 19065367Sahrens zfs_receive_package(libzfs_handle_t *hdl, int fd, const char *destname, 19077366STim.Haley@Sun.COM recvflags_t flags, dmu_replay_record_t *drr, zio_cksum_t *zc, 19087366STim.Haley@Sun.COM char **top_zfs) 19095367Sahrens { 19105367Sahrens nvlist_t *stream_nv = NULL; 19115367Sahrens avl_tree_t *stream_avl = NULL; 19125367Sahrens char *fromsnap = NULL; 19135367Sahrens char tofs[ZFS_MAXNAMELEN]; 19145367Sahrens char errbuf[1024]; 19155367Sahrens dmu_replay_record_t drre; 19165367Sahrens int error; 19175367Sahrens boolean_t anyerr = B_FALSE; 19186479Sahrens boolean_t softerr = B_FALSE; 19195367Sahrens 19205367Sahrens (void) snprintf(errbuf, sizeof (errbuf), dgettext(TEXT_DOMAIN, 19215367Sahrens "cannot receive")); 19225367Sahrens 19235367Sahrens if (strchr(destname, '@')) { 19245367Sahrens zfs_error_aux(hdl, dgettext(TEXT_DOMAIN, 19255367Sahrens "can not specify snapshot name for multi-snapshot stream")); 19265367Sahrens return (zfs_error(hdl, EZFS_BADSTREAM, errbuf)); 19275367Sahrens } 19285367Sahrens 19295367Sahrens assert(drr->drr_type == DRR_BEGIN); 19305367Sahrens assert(drr->drr_u.drr_begin.drr_magic == DMU_BACKUP_MAGIC); 193111007SLori.Alt@Sun.COM assert(DMU_GET_STREAM_HDRTYPE(drr->drr_u.drr_begin.drr_versioninfo) == 193211007SLori.Alt@Sun.COM DMU_COMPOUNDSTREAM); 19335367Sahrens 19345367Sahrens /* 19355367Sahrens * Read in the nvlist from the stream. 19365367Sahrens */ 19375367Sahrens if (drr->drr_payloadlen != 0) { 19385367Sahrens error = recv_read_nvlist(hdl, fd, drr->drr_payloadlen, 19395367Sahrens &stream_nv, flags.byteswap, zc); 19405367Sahrens if (error) { 19415367Sahrens error = zfs_error(hdl, EZFS_BADSTREAM, errbuf); 19425367Sahrens goto out; 19435367Sahrens } 19445367Sahrens } 19455367Sahrens 19465367Sahrens /* 19475367Sahrens * Read in the end record and verify checksum. 
19485367Sahrens */ 19495367Sahrens if (0 != (error = recv_read(hdl, fd, &drre, sizeof (drre), 19505367Sahrens flags.byteswap, NULL))) 19515367Sahrens goto out; 19525367Sahrens if (flags.byteswap) { 19535367Sahrens drre.drr_type = BSWAP_32(drre.drr_type); 19545367Sahrens drre.drr_u.drr_end.drr_checksum.zc_word[0] = 19555367Sahrens BSWAP_64(drre.drr_u.drr_end.drr_checksum.zc_word[0]); 19565367Sahrens drre.drr_u.drr_end.drr_checksum.zc_word[1] = 19575367Sahrens BSWAP_64(drre.drr_u.drr_end.drr_checksum.zc_word[1]); 19585367Sahrens drre.drr_u.drr_end.drr_checksum.zc_word[2] = 19595367Sahrens BSWAP_64(drre.drr_u.drr_end.drr_checksum.zc_word[2]); 19605367Sahrens drre.drr_u.drr_end.drr_checksum.zc_word[3] = 19615367Sahrens BSWAP_64(drre.drr_u.drr_end.drr_checksum.zc_word[3]); 19625367Sahrens } 19635367Sahrens if (drre.drr_type != DRR_END) { 19645367Sahrens error = zfs_error(hdl, EZFS_BADSTREAM, errbuf); 19655367Sahrens goto out; 19665367Sahrens } 19675367Sahrens if (!ZIO_CHECKSUM_EQUAL(drre.drr_u.drr_end.drr_checksum, *zc)) { 19685367Sahrens zfs_error_aux(hdl, dgettext(TEXT_DOMAIN, 19695367Sahrens "incorrect header checksum")); 19705367Sahrens error = zfs_error(hdl, EZFS_BADSTREAM, errbuf); 19715367Sahrens goto out; 19725367Sahrens } 19735367Sahrens 19745367Sahrens (void) nvlist_lookup_string(stream_nv, "fromsnap", &fromsnap); 19755367Sahrens 19765367Sahrens if (drr->drr_payloadlen != 0) { 19775367Sahrens nvlist_t *stream_fss; 19785367Sahrens 19795367Sahrens VERIFY(0 == nvlist_lookup_nvlist(stream_nv, "fss", 19805367Sahrens &stream_fss)); 19815896Sahl if ((stream_avl = fsavl_create(stream_fss)) == NULL) { 19825896Sahl zfs_error_aux(hdl, dgettext(TEXT_DOMAIN, 19835896Sahl "couldn't allocate avl tree")); 19845896Sahl error = zfs_error(hdl, EZFS_NOMEM, errbuf); 19855896Sahl goto out; 19865896Sahl } 19875367Sahrens 19885367Sahrens if (fromsnap != NULL) { 19895367Sahrens (void) strlcpy(tofs, destname, ZFS_MAXNAMELEN); 19905367Sahrens if (flags.isprefix) { 19915367Sahrens int i 
= strcspn(drr->drr_u.drr_begin.drr_toname, 19925367Sahrens "/@"); 19935367Sahrens /* zfs_receive_one() will create_parents() */ 19945367Sahrens (void) strlcat(tofs, 19955367Sahrens &drr->drr_u.drr_begin.drr_toname[i], 19965367Sahrens ZFS_MAXNAMELEN); 19975367Sahrens *strchr(tofs, '@') = '\0'; 19985367Sahrens } 19996479Sahrens softerr = recv_incremental_replication(hdl, tofs, 20005367Sahrens flags, stream_nv, stream_avl); 20015367Sahrens } 20025367Sahrens } 20035367Sahrens 20045367Sahrens 20055367Sahrens /* Finally, receive each contained stream */ 20065367Sahrens do { 20075367Sahrens /* 20085367Sahrens * we should figure out if it has a recoverable 20095367Sahrens * error, in which case do a recv_skip() and drive on. 20105367Sahrens * Note, if we fail due to already having this guid, 20115367Sahrens * zfs_receive_one() will take care of it (ie, 20125367Sahrens * recv_skip() and return 0). 20135367Sahrens */ 20147366STim.Haley@Sun.COM error = zfs_receive_impl(hdl, destname, flags, fd, 20157366STim.Haley@Sun.COM stream_avl, top_zfs); 20165367Sahrens if (error == ENODATA) { 20175367Sahrens error = 0; 20185367Sahrens break; 20195367Sahrens } 20205367Sahrens anyerr |= error; 20215367Sahrens } while (error == 0); 20225367Sahrens 20235367Sahrens if (drr->drr_payloadlen != 0 && fromsnap != NULL) { 20245367Sahrens /* 20255367Sahrens * Now that we have the fs's they sent us, try the 20265367Sahrens * renames again. 
20275367Sahrens */ 20286479Sahrens softerr = recv_incremental_replication(hdl, tofs, flags, 20295367Sahrens stream_nv, stream_avl); 20305367Sahrens } 20315367Sahrens 20325367Sahrens out: 20335367Sahrens fsavl_destroy(stream_avl); 20345367Sahrens if (stream_nv) 20355367Sahrens nvlist_free(stream_nv); 20366479Sahrens if (softerr) 20376479Sahrens error = -2; 20385367Sahrens if (anyerr) 20395367Sahrens error = -1; 20405367Sahrens return (error); 20415367Sahrens } 20425367Sahrens 204311022STom.Erickson@Sun.COM static void 204411022STom.Erickson@Sun.COM trunc_prop_errs(int truncated) 204511022STom.Erickson@Sun.COM { 204611022STom.Erickson@Sun.COM ASSERT(truncated != 0); 204711022STom.Erickson@Sun.COM 204811022STom.Erickson@Sun.COM if (truncated == 1) 204911022STom.Erickson@Sun.COM (void) fprintf(stderr, dgettext(TEXT_DOMAIN, 205011022STom.Erickson@Sun.COM "1 more property could not be set\n")); 205111022STom.Erickson@Sun.COM else 205211022STom.Erickson@Sun.COM (void) fprintf(stderr, dgettext(TEXT_DOMAIN, 205311022STom.Erickson@Sun.COM "%d more properties could not be set\n"), truncated); 205411022STom.Erickson@Sun.COM } 205511022STom.Erickson@Sun.COM 20565367Sahrens static int 20575367Sahrens recv_skip(libzfs_handle_t *hdl, int fd, boolean_t byteswap) 20585367Sahrens { 20595367Sahrens dmu_replay_record_t *drr; 20605367Sahrens void *buf = malloc(1<<20); 206111007SLori.Alt@Sun.COM char errbuf[1024]; 206211007SLori.Alt@Sun.COM 206311007SLori.Alt@Sun.COM (void) snprintf(errbuf, sizeof (errbuf), dgettext(TEXT_DOMAIN, 206411007SLori.Alt@Sun.COM "cannot receive:")); 20655367Sahrens 20665367Sahrens /* XXX would be great to use lseek if possible... 
*/ 20675367Sahrens drr = buf; 20685367Sahrens 20695367Sahrens while (recv_read(hdl, fd, drr, sizeof (dmu_replay_record_t), 20705367Sahrens byteswap, NULL) == 0) { 20715367Sahrens if (byteswap) 20725367Sahrens drr->drr_type = BSWAP_32(drr->drr_type); 20735367Sahrens 20745367Sahrens switch (drr->drr_type) { 20755367Sahrens case DRR_BEGIN: 20765367Sahrens /* NB: not to be used on v2 stream packages */ 207711007SLori.Alt@Sun.COM if (drr->drr_payloadlen != 0) { 207811007SLori.Alt@Sun.COM zfs_error_aux(hdl, dgettext(TEXT_DOMAIN, 207911007SLori.Alt@Sun.COM "invalid substream header")); 208011007SLori.Alt@Sun.COM return (zfs_error(hdl, EZFS_BADSTREAM, errbuf)); 208111007SLori.Alt@Sun.COM } 20825367Sahrens break; 20835367Sahrens 20845367Sahrens case DRR_END: 20855367Sahrens free(buf); 20865367Sahrens return (0); 20875367Sahrens 20885367Sahrens case DRR_OBJECT: 20895367Sahrens if (byteswap) { 20905367Sahrens drr->drr_u.drr_object.drr_bonuslen = 20915367Sahrens BSWAP_32(drr->drr_u.drr_object. 20925367Sahrens drr_bonuslen); 20935367Sahrens } 20945367Sahrens (void) recv_read(hdl, fd, buf, 20955367Sahrens P2ROUNDUP(drr->drr_u.drr_object.drr_bonuslen, 8), 20965367Sahrens B_FALSE, NULL); 20975367Sahrens break; 20985367Sahrens 20995367Sahrens case DRR_WRITE: 21005367Sahrens if (byteswap) { 21015367Sahrens drr->drr_u.drr_write.drr_length = 21027366STim.Haley@Sun.COM BSWAP_64(drr->drr_u.drr_write.drr_length); 21035367Sahrens } 21045367Sahrens (void) recv_read(hdl, fd, buf, 21055367Sahrens drr->drr_u.drr_write.drr_length, B_FALSE, NULL); 21065367Sahrens break; 21075367Sahrens 210811007SLori.Alt@Sun.COM case DRR_WRITE_BYREF: 21095367Sahrens case DRR_FREEOBJECTS: 21105367Sahrens case DRR_FREE: 21115367Sahrens break; 21125367Sahrens 21135367Sahrens default: 211411007SLori.Alt@Sun.COM zfs_error_aux(hdl, dgettext(TEXT_DOMAIN, 211511007SLori.Alt@Sun.COM "invalid record type")); 211611007SLori.Alt@Sun.COM return (zfs_error(hdl, EZFS_BADSTREAM, errbuf)); 21175367Sahrens } 21185367Sahrens } 
21195367Sahrens 21205367Sahrens free(buf); 21215367Sahrens return (-1); 21225367Sahrens } 21235367Sahrens 21245367Sahrens /* 21255367Sahrens * Restores a backup of tosnap from the file descriptor specified by infd. 21265367Sahrens */ 21275367Sahrens static int 21285367Sahrens zfs_receive_one(libzfs_handle_t *hdl, int infd, const char *tosnap, 21295367Sahrens recvflags_t flags, dmu_replay_record_t *drr, 21307366STim.Haley@Sun.COM dmu_replay_record_t *drr_noswap, avl_tree_t *stream_avl, 21317366STim.Haley@Sun.COM char **top_zfs) 21325367Sahrens { 21335367Sahrens zfs_cmd_t zc = { 0 }; 21345367Sahrens time_t begin_time; 21355367Sahrens int ioctl_err, ioctl_errno, err, choplen; 21365367Sahrens char *cp; 21375367Sahrens struct drr_begin *drrb = &drr->drr_u.drr_begin; 21385367Sahrens char errbuf[1024]; 213911022STom.Erickson@Sun.COM char prop_errbuf[1024]; 21405367Sahrens char chopprefix[ZFS_MAXNAMELEN]; 21415367Sahrens boolean_t newfs = B_FALSE; 21425367Sahrens boolean_t stream_wantsnewfs; 21435367Sahrens uint64_t parent_snapguid = 0; 21445367Sahrens prop_changelist_t *clp = NULL; 21457265Sahrens nvlist_t *snapprops_nvlist = NULL; 214611022STom.Erickson@Sun.COM zprop_errflags_t prop_errflags; 21475367Sahrens 21485367Sahrens begin_time = time(NULL); 21495367Sahrens 21505367Sahrens (void) snprintf(errbuf, sizeof (errbuf), dgettext(TEXT_DOMAIN, 21515367Sahrens "cannot receive")); 21525367Sahrens 21535367Sahrens if (stream_avl != NULL) { 21547265Sahrens char *snapname; 21557265Sahrens nvlist_t *fs = fsavl_find(stream_avl, drrb->drr_toguid, 21567265Sahrens &snapname); 21575367Sahrens nvlist_t *props; 21585896Sahl int ret; 21595367Sahrens 21605367Sahrens (void) nvlist_lookup_uint64(fs, "parentfromsnap", 21615367Sahrens &parent_snapguid); 21625367Sahrens err = nvlist_lookup_nvlist(fs, "props", &props); 21635367Sahrens if (err) 21645367Sahrens VERIFY(0 == nvlist_alloc(&props, NV_UNIQUE_NAME, 0)); 21655896Sahl 21665367Sahrens if (flags.canmountoff) { 21675367Sahrens VERIFY(0 == 
nvlist_add_uint64(props, 21685367Sahrens zfs_prop_to_name(ZFS_PROP_CANMOUNT), 0)); 21695367Sahrens } 21705896Sahl ret = zcmd_write_src_nvlist(hdl, &zc, props); 21715367Sahrens if (err) 21725367Sahrens nvlist_free(props); 21735896Sahl 21747265Sahrens if (0 == nvlist_lookup_nvlist(fs, "snapprops", &props)) { 21757265Sahrens VERIFY(0 == nvlist_lookup_nvlist(props, 21767265Sahrens snapname, &snapprops_nvlist)); 21777265Sahrens } 21787265Sahrens 21795896Sahl if (ret != 0) 21805896Sahl return (-1); 21815367Sahrens } 21825367Sahrens 21835367Sahrens /* 21845367Sahrens * Determine how much of the snapshot name stored in the stream 21855367Sahrens * we are going to tack on to the name they specified on the 21865367Sahrens * command line, and how much we are going to chop off. 21875367Sahrens * 21885367Sahrens * If they specified a snapshot, chop the entire name stored in 21895367Sahrens * the stream. 21905367Sahrens */ 21915367Sahrens (void) strcpy(chopprefix, drrb->drr_toname); 21925367Sahrens if (flags.isprefix) { 21935367Sahrens /* 219411461STom.Erickson@Sun.COM * They specified a fs with -d or -e. We want to tack on 219511461STom.Erickson@Sun.COM * everything but the first element of the sent snapshot path 219611461STom.Erickson@Sun.COM * (all but the pool name) in the case of -d, or only the tail 219711461STom.Erickson@Sun.COM * of the sent snapshot path in the case of -e. 21985367Sahrens */ 21995367Sahrens if (strchr(tosnap, '@')) { 22005367Sahrens zfs_error_aux(hdl, dgettext(TEXT_DOMAIN, "invalid " 220111461STom.Erickson@Sun.COM "argument - snapshot not allowed with %s"), 220211461STom.Erickson@Sun.COM (flags.istail ? "-e" : "-d")); 22035367Sahrens return (zfs_error(hdl, EZFS_INVALIDNAME, errbuf)); 22045367Sahrens } 220511461STom.Erickson@Sun.COM cp = (flags.istail ? 
strrchr(chopprefix, '/') : 220611461STom.Erickson@Sun.COM strchr(chopprefix, '/')); 22075367Sahrens if (cp == NULL) 22085367Sahrens cp = strchr(chopprefix, '@'); 22095367Sahrens *cp = '\0'; 22105367Sahrens } else if (strchr(tosnap, '@') == NULL) { 22115367Sahrens /* 221211461STom.Erickson@Sun.COM * If they specified a filesystem without -d or -e, we want to 221311461STom.Erickson@Sun.COM * tack on everything after the fs specified in the first name 221411461STom.Erickson@Sun.COM * from the stream. 22155367Sahrens */ 22165367Sahrens cp = strchr(chopprefix, '@'); 22175367Sahrens *cp = '\0'; 22185367Sahrens } 22195367Sahrens choplen = strlen(chopprefix); 22205367Sahrens 22215367Sahrens /* 22225367Sahrens * Determine name of destination snapshot, store in zc_value. 22235367Sahrens */ 222411007SLori.Alt@Sun.COM (void) strcpy(zc.zc_top_ds, tosnap); 22255367Sahrens (void) strcpy(zc.zc_value, tosnap); 22265367Sahrens (void) strncat(zc.zc_value, drrb->drr_toname+choplen, 22275367Sahrens sizeof (zc.zc_value)); 22285896Sahl if (!zfs_name_valid(zc.zc_value, ZFS_TYPE_SNAPSHOT)) { 22295896Sahl zcmd_free_nvlists(&zc); 22305367Sahrens return (zfs_error(hdl, EZFS_INVALIDNAME, errbuf)); 22315896Sahl } 22325367Sahrens 22335367Sahrens /* 22345367Sahrens * Determine the name of the origin snapshot, store in zc_string. 
22355367Sahrens */ 22365367Sahrens if (drrb->drr_flags & DRR_FLAG_CLONE) { 22375367Sahrens if (guid_to_name(hdl, tosnap, 22385367Sahrens drrb->drr_fromguid, zc.zc_string) != 0) { 22395896Sahl zcmd_free_nvlists(&zc); 22405367Sahrens zfs_error_aux(hdl, dgettext(TEXT_DOMAIN, 22415367Sahrens "local origin for clone %s does not exist"), 22425367Sahrens zc.zc_value); 22435367Sahrens return (zfs_error(hdl, EZFS_NOENT, errbuf)); 22445367Sahrens } 22455367Sahrens if (flags.verbose) 22465367Sahrens (void) printf("found clone origin %s\n", zc.zc_string); 22475367Sahrens } 22485367Sahrens 22495367Sahrens stream_wantsnewfs = (drrb->drr_fromguid == NULL || 22505367Sahrens (drrb->drr_flags & DRR_FLAG_CLONE)); 22515367Sahrens 22525367Sahrens if (stream_wantsnewfs) { 22535367Sahrens /* 22545367Sahrens * if the parent fs does not exist, look for it based on 22555367Sahrens * the parent snap GUID 22565367Sahrens */ 22575367Sahrens (void) snprintf(errbuf, sizeof (errbuf), dgettext(TEXT_DOMAIN, 22585367Sahrens "cannot receive new filesystem stream")); 22595367Sahrens 22605367Sahrens (void) strcpy(zc.zc_name, zc.zc_value); 22615367Sahrens cp = strrchr(zc.zc_name, '/'); 22625367Sahrens if (cp) 22635367Sahrens *cp = '\0'; 22645367Sahrens if (cp && 22655367Sahrens !zfs_dataset_exists(hdl, zc.zc_name, ZFS_TYPE_DATASET)) { 22665367Sahrens char suffix[ZFS_MAXNAMELEN]; 22675367Sahrens (void) strcpy(suffix, strrchr(zc.zc_value, '/')); 22685367Sahrens if (guid_to_name(hdl, tosnap, parent_snapguid, 22695367Sahrens zc.zc_value) == 0) { 22705367Sahrens *strchr(zc.zc_value, '@') = '\0'; 22715367Sahrens (void) strcat(zc.zc_value, suffix); 22725367Sahrens } 22735367Sahrens } 22745367Sahrens } else { 22755367Sahrens /* 22765367Sahrens * if the fs does not exist, look for it based on the 22775367Sahrens * fromsnap GUID 22785367Sahrens */ 22795367Sahrens (void) snprintf(errbuf, sizeof (errbuf), dgettext(TEXT_DOMAIN, 22805367Sahrens "cannot receive incremental stream")); 22815367Sahrens 22825367Sahrens 
(void) strcpy(zc.zc_name, zc.zc_value); 22835367Sahrens *strchr(zc.zc_name, '@') = '\0'; 22845367Sahrens 22855367Sahrens if (!zfs_dataset_exists(hdl, zc.zc_name, ZFS_TYPE_DATASET)) { 22865367Sahrens char snap[ZFS_MAXNAMELEN]; 22875367Sahrens (void) strcpy(snap, strchr(zc.zc_value, '@')); 22885367Sahrens if (guid_to_name(hdl, tosnap, drrb->drr_fromguid, 22895367Sahrens zc.zc_value) == 0) { 22905367Sahrens *strchr(zc.zc_value, '@') = '\0'; 22915367Sahrens (void) strcat(zc.zc_value, snap); 22925367Sahrens } 22935367Sahrens } 22945367Sahrens } 22955367Sahrens 22965367Sahrens (void) strcpy(zc.zc_name, zc.zc_value); 22975367Sahrens *strchr(zc.zc_name, '@') = '\0'; 22985367Sahrens 22995367Sahrens if (zfs_dataset_exists(hdl, zc.zc_name, ZFS_TYPE_DATASET)) { 23005367Sahrens zfs_handle_t *zhp; 23015367Sahrens /* 23025367Sahrens * Destination fs exists. Therefore this should either 23035367Sahrens * be an incremental, or the stream specifies a new fs 23045367Sahrens * (full stream or clone) and they want us to blow it 23055367Sahrens * away (and have therefore specified -F and removed any 23065367Sahrens * snapshots). 23075367Sahrens */ 23085367Sahrens 23095367Sahrens if (stream_wantsnewfs) { 23105367Sahrens if (!flags.force) { 23115896Sahl zcmd_free_nvlists(&zc); 23125367Sahrens zfs_error_aux(hdl, dgettext(TEXT_DOMAIN, 23135367Sahrens "destination '%s' exists\n" 23145367Sahrens "must specify -F to overwrite it"), 23155367Sahrens zc.zc_name); 23165367Sahrens return (zfs_error(hdl, EZFS_EXISTS, errbuf)); 23175367Sahrens } 23185367Sahrens if (ioctl(hdl->libzfs_fd, ZFS_IOC_SNAPSHOT_LIST_NEXT, 23195367Sahrens &zc) == 0) { 23205896Sahl zcmd_free_nvlists(&zc); 23215367Sahrens zfs_error_aux(hdl, dgettext(TEXT_DOMAIN, 23225367Sahrens "destination has snapshots (eg. 
%s)\n" 23235367Sahrens "must destroy them to overwrite it"), 23245367Sahrens zc.zc_name); 23255367Sahrens return (zfs_error(hdl, EZFS_EXISTS, errbuf)); 23265367Sahrens } 23275367Sahrens } 23285367Sahrens 23295896Sahl if ((zhp = zfs_open(hdl, zc.zc_name, 23305896Sahl ZFS_TYPE_FILESYSTEM | ZFS_TYPE_VOLUME)) == NULL) { 23315896Sahl zcmd_free_nvlists(&zc); 23325367Sahrens return (-1); 23335896Sahl } 23345896Sahl 23355367Sahrens if (stream_wantsnewfs && 23365367Sahrens zhp->zfs_dmustats.dds_origin[0]) { 23375896Sahl zcmd_free_nvlists(&zc); 23385367Sahrens zfs_close(zhp); 23395367Sahrens zfs_error_aux(hdl, dgettext(TEXT_DOMAIN, 23405367Sahrens "destination '%s' is a clone\n" 23415367Sahrens "must destroy it to overwrite it"), 23425367Sahrens zc.zc_name); 23435367Sahrens return (zfs_error(hdl, EZFS_EXISTS, errbuf)); 23445367Sahrens } 23455367Sahrens 23465367Sahrens if (!flags.dryrun && zhp->zfs_type == ZFS_TYPE_FILESYSTEM && 23475367Sahrens stream_wantsnewfs) { 23485367Sahrens /* We can't do online recv in this case */ 23497366STim.Haley@Sun.COM clp = changelist_gather(zhp, ZFS_PROP_NAME, 0, 0); 23505896Sahl if (clp == NULL) { 235110200SLori.Alt@Sun.COM zfs_close(zhp); 23525896Sahl zcmd_free_nvlists(&zc); 23535367Sahrens return (-1); 23545896Sahl } 23555367Sahrens if (changelist_prefix(clp) != 0) { 23565367Sahrens changelist_free(clp); 235710200SLori.Alt@Sun.COM zfs_close(zhp); 23585896Sahl zcmd_free_nvlists(&zc); 23595367Sahrens return (-1); 23605367Sahrens } 23615367Sahrens } 23625367Sahrens zfs_close(zhp); 23635367Sahrens } else { 23645367Sahrens /* 23655896Sahl * Destination filesystem does not exist. Therefore we better 23665896Sahl * be creating a new filesystem (either from a full backup, or 23675896Sahl * a clone). It would therefore be invalid if the user 23685896Sahl * specified only the pool name (i.e. if the destination name 23695896Sahl * contained no slash character). 
23705367Sahrens */ 23715896Sahl if (!stream_wantsnewfs || 23725896Sahl (cp = strrchr(zc.zc_name, '/')) == NULL) { 23735896Sahl zcmd_free_nvlists(&zc); 23745367Sahrens zfs_error_aux(hdl, dgettext(TEXT_DOMAIN, 23755367Sahrens "destination '%s' does not exist"), zc.zc_name); 23765367Sahrens return (zfs_error(hdl, EZFS_NOENT, errbuf)); 23775367Sahrens } 23785367Sahrens 23795896Sahl /* 23805896Sahl * Trim off the final dataset component so we perform the 23815896Sahl * recvbackup ioctl to the filesystems's parent. 23825896Sahl */ 23835896Sahl *cp = '\0'; 23845367Sahrens 23855896Sahl if (flags.isprefix && !flags.dryrun && 23865896Sahl create_parents(hdl, zc.zc_value, strlen(tosnap)) != 0) { 23875896Sahl zcmd_free_nvlists(&zc); 23885896Sahl return (zfs_error(hdl, EZFS_BADRESTORE, errbuf)); 23895367Sahrens } 23905367Sahrens 23915367Sahrens newfs = B_TRUE; 23925367Sahrens } 23935367Sahrens 23945367Sahrens zc.zc_begin_record = drr_noswap->drr_u.drr_begin; 23955367Sahrens zc.zc_cookie = infd; 23965367Sahrens zc.zc_guid = flags.force; 23975367Sahrens if (flags.verbose) { 23985367Sahrens (void) printf("%s %s stream of %s into %s\n", 23995367Sahrens flags.dryrun ? "would receive" : "receiving", 24005367Sahrens drrb->drr_fromguid ? 
"incremental" : "full", 24015367Sahrens drrb->drr_toname, zc.zc_value); 24025367Sahrens (void) fflush(stdout); 24035367Sahrens } 24045367Sahrens 24055896Sahl if (flags.dryrun) { 24065896Sahl zcmd_free_nvlists(&zc); 24075367Sahrens return (recv_skip(hdl, infd, flags.byteswap)); 24085896Sahl } 24095367Sahrens 241011022STom.Erickson@Sun.COM zc.zc_nvlist_dst = (uint64_t)(uintptr_t)prop_errbuf; 241111022STom.Erickson@Sun.COM zc.zc_nvlist_dst_size = sizeof (prop_errbuf); 241211022STom.Erickson@Sun.COM 24135367Sahrens err = ioctl_err = zfs_ioctl(hdl, ZFS_IOC_RECV, &zc); 24145367Sahrens ioctl_errno = errno; 241511022STom.Erickson@Sun.COM prop_errflags = (zprop_errflags_t)zc.zc_obj; 241611022STom.Erickson@Sun.COM 241711022STom.Erickson@Sun.COM if (err == 0) { 241811022STom.Erickson@Sun.COM nvlist_t *prop_errors; 241911022STom.Erickson@Sun.COM VERIFY(0 == nvlist_unpack((void *)(uintptr_t)zc.zc_nvlist_dst, 242011022STom.Erickson@Sun.COM zc.zc_nvlist_dst_size, &prop_errors, 0)); 242111022STom.Erickson@Sun.COM 242211022STom.Erickson@Sun.COM nvpair_t *prop_err = NULL; 242311022STom.Erickson@Sun.COM 242411022STom.Erickson@Sun.COM while ((prop_err = nvlist_next_nvpair(prop_errors, 242511022STom.Erickson@Sun.COM prop_err)) != NULL) { 242611022STom.Erickson@Sun.COM char tbuf[1024]; 242711022STom.Erickson@Sun.COM zfs_prop_t prop; 242811022STom.Erickson@Sun.COM int intval; 242911022STom.Erickson@Sun.COM 243011022STom.Erickson@Sun.COM prop = zfs_name_to_prop(nvpair_name(prop_err)); 243111022STom.Erickson@Sun.COM (void) nvpair_value_int32(prop_err, &intval); 243211022STom.Erickson@Sun.COM if (strcmp(nvpair_name(prop_err), 243311022STom.Erickson@Sun.COM ZPROP_N_MORE_ERRORS) == 0) { 243411022STom.Erickson@Sun.COM trunc_prop_errs(intval); 243511022STom.Erickson@Sun.COM break; 243611022STom.Erickson@Sun.COM } else { 243711022STom.Erickson@Sun.COM (void) snprintf(tbuf, sizeof (tbuf), 243811022STom.Erickson@Sun.COM dgettext(TEXT_DOMAIN, 243911022STom.Erickson@Sun.COM "cannot receive %s 
property on %s"), 244011022STom.Erickson@Sun.COM nvpair_name(prop_err), zc.zc_name); 244111022STom.Erickson@Sun.COM zfs_setprop_error(hdl, prop, intval, tbuf); 244211022STom.Erickson@Sun.COM } 244311022STom.Erickson@Sun.COM } 244411022STom.Erickson@Sun.COM nvlist_free(prop_errors); 244511022STom.Erickson@Sun.COM } 244611022STom.Erickson@Sun.COM 244711022STom.Erickson@Sun.COM zc.zc_nvlist_dst = 0; 244811022STom.Erickson@Sun.COM zc.zc_nvlist_dst_size = 0; 24497265Sahrens zcmd_free_nvlists(&zc); 24507265Sahrens 24517265Sahrens if (err == 0 && snapprops_nvlist) { 24527265Sahrens zfs_cmd_t zc2 = { 0 }; 24537265Sahrens 24547273Sahrens (void) strcpy(zc2.zc_name, zc.zc_value); 245511022STom.Erickson@Sun.COM zc2.zc_cookie = B_TRUE; /* received */ 24567265Sahrens if (zcmd_write_src_nvlist(hdl, &zc2, snapprops_nvlist) == 0) { 24577265Sahrens (void) zfs_ioctl(hdl, ZFS_IOC_SET_PROP, &zc2); 24587265Sahrens zcmd_free_nvlists(&zc2); 24597265Sahrens } 24607265Sahrens } 24617265Sahrens 24625367Sahrens if (err && (ioctl_errno == ENOENT || ioctl_errno == ENODEV)) { 24635367Sahrens /* 24645367Sahrens * It may be that this snapshot already exists, 24655367Sahrens * in which case we want to consume & ignore it 24665367Sahrens * rather than failing. 24675367Sahrens */ 24685367Sahrens avl_tree_t *local_avl; 24695367Sahrens nvlist_t *local_nv, *fs; 24705367Sahrens char *cp = strchr(zc.zc_value, '@'); 24715367Sahrens 24725367Sahrens /* 24735367Sahrens * XXX Do this faster by just iterating over snaps in 24745367Sahrens * this fs. Also if zc_value does not exist, we will 24755367Sahrens * get a strange "does not exist" error message. 
24765367Sahrens */ 24775367Sahrens *cp = '\0'; 247811022STom.Erickson@Sun.COM if (gather_nvlist(hdl, zc.zc_value, NULL, NULL, B_FALSE, 24795367Sahrens &local_nv, &local_avl) == 0) { 24805367Sahrens *cp = '@'; 24815367Sahrens fs = fsavl_find(local_avl, drrb->drr_toguid, NULL); 24825367Sahrens fsavl_destroy(local_avl); 24835367Sahrens nvlist_free(local_nv); 24845367Sahrens 24855367Sahrens if (fs != NULL) { 24865367Sahrens if (flags.verbose) { 24875367Sahrens (void) printf("snap %s already exists; " 24885367Sahrens "ignoring\n", zc.zc_value); 24895367Sahrens } 249011022STom.Erickson@Sun.COM err = ioctl_err = recv_skip(hdl, infd, 24915367Sahrens flags.byteswap); 24925367Sahrens } 24935367Sahrens } 24945367Sahrens *cp = '@'; 24955367Sahrens } 24965367Sahrens 24975367Sahrens if (ioctl_err != 0) { 24985367Sahrens switch (ioctl_errno) { 24995367Sahrens case ENODEV: 25005367Sahrens cp = strchr(zc.zc_value, '@'); 25015367Sahrens *cp = '\0'; 25025367Sahrens zfs_error_aux(hdl, dgettext(TEXT_DOMAIN, 25035367Sahrens "most recent snapshot of %s does not\n" 25045367Sahrens "match incremental source"), zc.zc_value); 25055367Sahrens (void) zfs_error(hdl, EZFS_BADRESTORE, errbuf); 25065367Sahrens *cp = '@'; 25075367Sahrens break; 25085367Sahrens case ETXTBSY: 25095367Sahrens zfs_error_aux(hdl, dgettext(TEXT_DOMAIN, 25105367Sahrens "destination %s has been modified\n" 25115367Sahrens "since most recent snapshot"), zc.zc_name); 25125367Sahrens (void) zfs_error(hdl, EZFS_BADRESTORE, errbuf); 25135367Sahrens break; 25145367Sahrens case EEXIST: 25155367Sahrens cp = strchr(zc.zc_value, '@'); 25165367Sahrens if (newfs) { 25175367Sahrens /* it's the containing fs that exists */ 25185367Sahrens *cp = '\0'; 25195367Sahrens } 25205367Sahrens zfs_error_aux(hdl, dgettext(TEXT_DOMAIN, 25215367Sahrens "destination already exists")); 25225367Sahrens (void) zfs_error_fmt(hdl, EZFS_EXISTS, 25235367Sahrens dgettext(TEXT_DOMAIN, "cannot restore to %s"), 25245367Sahrens zc.zc_value); 25255367Sahrens *cp 
= '@'; 25265367Sahrens break; 25275367Sahrens case EINVAL: 25285367Sahrens (void) zfs_error(hdl, EZFS_BADSTREAM, errbuf); 25295367Sahrens break; 25305367Sahrens case ECKSUM: 25315367Sahrens zfs_error_aux(hdl, dgettext(TEXT_DOMAIN, 25325367Sahrens "invalid stream (checksum mismatch)")); 25335367Sahrens (void) zfs_error(hdl, EZFS_BADSTREAM, errbuf); 25345367Sahrens break; 25355367Sahrens default: 25365367Sahrens (void) zfs_standard_error(hdl, ioctl_errno, errbuf); 25375367Sahrens } 25385367Sahrens } 25395367Sahrens 25405367Sahrens /* 254110588SEric.Taylor@Sun.COM * Mount the target filesystem (if created). Also mount any 254210588SEric.Taylor@Sun.COM * children of the target filesystem if we did a replication 254310588SEric.Taylor@Sun.COM * receive (indicated by stream_avl being non-NULL). 25445367Sahrens */ 25455367Sahrens cp = strchr(zc.zc_value, '@'); 25465367Sahrens if (cp && (ioctl_err == 0 || !newfs)) { 25475367Sahrens zfs_handle_t *h; 25485367Sahrens 25495367Sahrens *cp = '\0'; 25505367Sahrens h = zfs_open(hdl, zc.zc_value, 25515367Sahrens ZFS_TYPE_FILESYSTEM | ZFS_TYPE_VOLUME); 25526476Sahl if (h != NULL) { 25535367Sahrens if (h->zfs_type == ZFS_TYPE_VOLUME) { 25547366STim.Haley@Sun.COM *cp = '@'; 255510200SLori.Alt@Sun.COM } else if (newfs || stream_avl) { 25567366STim.Haley@Sun.COM /* 25577366STim.Haley@Sun.COM * Track the first/top of hierarchy fs, 25587366STim.Haley@Sun.COM * for mounting and sharing later. 
25597366STim.Haley@Sun.COM */ 25607366STim.Haley@Sun.COM if (top_zfs && *top_zfs == NULL) 25617366STim.Haley@Sun.COM *top_zfs = zfs_strdup(hdl, zc.zc_value); 25625367Sahrens } 25636476Sahl zfs_close(h); 25645367Sahrens } 25657366STim.Haley@Sun.COM *cp = '@'; 25665367Sahrens } 25675367Sahrens 25685367Sahrens if (clp) { 25695367Sahrens err |= changelist_postfix(clp); 25705367Sahrens changelist_free(clp); 25715367Sahrens } 25725367Sahrens 257311022STom.Erickson@Sun.COM if (prop_errflags & ZPROP_ERR_NOCLEAR) { 257411022STom.Erickson@Sun.COM (void) fprintf(stderr, dgettext(TEXT_DOMAIN, "Warning: " 257511022STom.Erickson@Sun.COM "failed to clear unreceived properties on %s"), 257611022STom.Erickson@Sun.COM zc.zc_name); 257711022STom.Erickson@Sun.COM (void) fprintf(stderr, "\n"); 257811022STom.Erickson@Sun.COM } 257911022STom.Erickson@Sun.COM if (prop_errflags & ZPROP_ERR_NORESTORE) { 258011022STom.Erickson@Sun.COM (void) fprintf(stderr, dgettext(TEXT_DOMAIN, "Warning: " 258111022STom.Erickson@Sun.COM "failed to restore original properties on %s"), 258211022STom.Erickson@Sun.COM zc.zc_name); 258311022STom.Erickson@Sun.COM (void) fprintf(stderr, "\n"); 258411022STom.Erickson@Sun.COM } 258511022STom.Erickson@Sun.COM 25865367Sahrens if (err || ioctl_err) 25875367Sahrens return (-1); 25885367Sahrens 25895367Sahrens if (flags.verbose) { 25905367Sahrens char buf1[64]; 25915367Sahrens char buf2[64]; 25925367Sahrens uint64_t bytes = zc.zc_cookie; 25935367Sahrens time_t delta = time(NULL) - begin_time; 25945367Sahrens if (delta == 0) 25955367Sahrens delta = 1; 25965367Sahrens zfs_nicenum(bytes, buf1, sizeof (buf1)); 25975367Sahrens zfs_nicenum(bytes/delta, buf2, sizeof (buf1)); 25985367Sahrens 25995367Sahrens (void) printf("received %sB stream in %lu seconds (%sB/sec)\n", 26005367Sahrens buf1, delta, buf2); 26015367Sahrens } 26025367Sahrens 26035367Sahrens return (0); 26045367Sahrens } 26055367Sahrens 26067366STim.Haley@Sun.COM static int 26077366STim.Haley@Sun.COM 
zfs_receive_impl(libzfs_handle_t *hdl, const char *tosnap, recvflags_t flags,
    int infd, avl_tree_t *stream_avl, char **top_zfs)
{
	/*
	 * Read and validate the BEGIN record of a send stream arriving on
	 * infd, then hand the stream to zfs_receive_one() (DMU_SUBSTREAM) or
	 * zfs_receive_package() (DMU_COMPOUNDSTREAM).
	 *
	 * 'flags' is received by value; flags.byteswap is (re)computed here
	 * from the stream's magic number and passed down to the callee.
	 *
	 * Returns the recv_read() error if the record cannot be read, ENODATA
	 * if the record read is a DRR_END (the second END record terminating
	 * a package), the zfs_error() result for an unusable destination or
	 * malformed stream, and otherwise whatever the selected receive
	 * routine returns.
	 */
	int err;
	dmu_replay_record_t drr, drr_noswap;
	struct drr_begin *drrb = &drr.drr_u.drr_begin;
	char errbuf[1024];
	zio_cksum_t zcksum = { 0 };
	uint64_t featureflags;
	int hdrtype;

	(void) snprintf(errbuf, sizeof (errbuf), dgettext(TEXT_DOMAIN,
	    "cannot receive"));

	if (flags.isprefix &&
	    !zfs_dataset_exists(hdl, tosnap, ZFS_TYPE_DATASET)) {
		zfs_error_aux(hdl, dgettext(TEXT_DOMAIN, "specified fs "
		    "(%s) does not exist"), tosnap);
		return (zfs_error(hdl, EZFS_NOENT, errbuf));
	}

	/* read in the BEGIN record */
	if (0 != (err = recv_read(hdl, infd, &drr, sizeof (drr), B_FALSE,
	    &zcksum)))
		return (err);

	if (drr.drr_type == DRR_END || drr.drr_type == BSWAP_32(DRR_END)) {
		/* It's the double end record at the end of a package */
		return (ENODATA);
	}

	/* the kernel needs the non-byteswapped begin record */
	drr_noswap = drr;

	flags.byteswap = B_FALSE;
	if (drrb->drr_magic == BSWAP_64(DMU_BACKUP_MAGIC)) {
		/*
		 * We computed the checksum in the wrong byteorder in
		 * recv_read() above; do it again correctly.
		 */
		bzero(&zcksum, sizeof (zio_cksum_t));
		fletcher_4_incremental_byteswap(&drr, sizeof (drr), &zcksum);
		flags.byteswap = B_TRUE;

		/* convert the local copy of the header to host byte order */
		drr.drr_type = BSWAP_32(drr.drr_type);
		drr.drr_payloadlen = BSWAP_32(drr.drr_payloadlen);
		drrb->drr_magic = BSWAP_64(drrb->drr_magic);
		drrb->drr_versioninfo = BSWAP_64(drrb->drr_versioninfo);
		drrb->drr_creation_time = BSWAP_64(drrb->drr_creation_time);
		drrb->drr_type = BSWAP_32(drrb->drr_type);
		drrb->drr_flags = BSWAP_32(drrb->drr_flags);
		drrb->drr_toguid = BSWAP_64(drrb->drr_toguid);
		drrb->drr_fromguid = BSWAP_64(drrb->drr_fromguid);
	}

	if (drrb->drr_magic != DMU_BACKUP_MAGIC || drr.drr_type != DRR_BEGIN) {
		zfs_error_aux(hdl, dgettext(TEXT_DOMAIN, "invalid "
		    "stream (bad magic number)"));
		return (zfs_error(hdl, EZFS_BADSTREAM, errbuf));
	}

	featureflags = DMU_GET_FEATUREFLAGS(drrb->drr_versioninfo);
	hdrtype = DMU_GET_STREAM_HDRTYPE(drrb->drr_versioninfo);

	if (!DMU_STREAM_SUPPORTED(featureflags) ||
	    (hdrtype != DMU_SUBSTREAM && hdrtype != DMU_COMPOUNDSTREAM)) {
		/*
		 * featureflags is 64 bits wide; "%lx" only matches it where
		 * long is 64 bits, so format it as unsigned long long.
		 */
		zfs_error_aux(hdl, dgettext(TEXT_DOMAIN,
		    "stream has unsupported feature, feature flags = %llx"),
		    (unsigned long long)featureflags);
		return (zfs_error(hdl, EZFS_BADSTREAM, errbuf));
	}

	if (strchr(drrb->drr_toname, '@') == NULL) {
		zfs_error_aux(hdl, dgettext(TEXT_DOMAIN, "invalid "
		    "stream (bad snapshot name)"));
		return (zfs_error(hdl, EZFS_BADSTREAM, errbuf));
	}

	if (hdrtype == DMU_SUBSTREAM) {
		return (zfs_receive_one(hdl, infd, tosnap, flags,
		    &drr, &drr_noswap, stream_avl, top_zfs));
	}

	/* must be DMU_COMPOUNDSTREAM; anything else was rejected above */
	assert(hdrtype == DMU_COMPOUNDSTREAM);
	return (zfs_receive_package(hdl, infd, tosnap, flags,
	    &drr, &zcksum, top_zfs));
}

/*
 * Restores a backup of tosnap from the file descriptor specified by infd.
 * Return 0 on total success, -2 if some things couldn't be
 * destroyed/renamed/promoted, -1 if some things couldn't be received.
 * (-1 will override -2).
 *
 * After a fully successful receive, and unless flags.nomount is set, the
 * filesystem recorded in top_zfs by the receive path is opened and a
 * changelist gathered on its mountpoint property is post-fixed to mount
 * and share the received datasets; any failure in that step yields -1.
 */
int
zfs_receive(libzfs_handle_t *hdl, const char *tosnap, recvflags_t flags,
    int infd, avl_tree_t *stream_avl)
{
	char *top_zfs = NULL;
	int err;

	err = zfs_receive_impl(hdl, tosnap, flags, infd, stream_avl, &top_zfs);

	if (err == 0 && !flags.nomount && top_zfs != NULL) {
		zfs_handle_t *zhp;
		prop_changelist_t *clp = NULL;

		zhp = zfs_open(hdl, top_zfs, ZFS_TYPE_FILESYSTEM);
		if (zhp != NULL) {
			clp = changelist_gather(zhp, ZFS_PROP_MOUNTPOINT,
			    CL_GATHER_MOUNT_ALWAYS, 0);
			/* the handle is not needed once the list exists */
			zfs_close(zhp);
			if (clp != NULL) {
				/* mount and share received datasets */
				err = changelist_postfix(clp);
				changelist_free(clp);
			}
		}
		if (zhp == NULL || clp == NULL || err != 0)
			err = -1;
	}

	/* top_zfs is owned by this function; free(NULL) is a no-op */
	free(top_zfs);

	return (err);
}