xref: /onnv-gate/usr/src/uts/common/fs/zfs/dmu_diff.c (revision 13043:8c712bbb18ea)
1*13043STim.Haley@Sun.COM /*
2*13043STim.Haley@Sun.COM  * CDDL HEADER START
3*13043STim.Haley@Sun.COM  *
4*13043STim.Haley@Sun.COM  * The contents of this file are subject to the terms of the
5*13043STim.Haley@Sun.COM  * Common Development and Distribution License (the "License").
6*13043STim.Haley@Sun.COM  * You may not use this file except in compliance with the License.
7*13043STim.Haley@Sun.COM  *
8*13043STim.Haley@Sun.COM  * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
9*13043STim.Haley@Sun.COM  * or http://www.opensolaris.org/os/licensing.
10*13043STim.Haley@Sun.COM  * See the License for the specific language governing permissions
11*13043STim.Haley@Sun.COM  * and limitations under the License.
12*13043STim.Haley@Sun.COM  *
13*13043STim.Haley@Sun.COM  * When distributing Covered Code, include this CDDL HEADER in each
14*13043STim.Haley@Sun.COM  * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
15*13043STim.Haley@Sun.COM  * If applicable, add the following below this CDDL HEADER, with the
16*13043STim.Haley@Sun.COM  * fields enclosed by brackets "[]" replaced with your own identifying
17*13043STim.Haley@Sun.COM  * information: Portions Copyright [yyyy] [name of copyright owner]
18*13043STim.Haley@Sun.COM  *
19*13043STim.Haley@Sun.COM  * CDDL HEADER END
20*13043STim.Haley@Sun.COM  */
21*13043STim.Haley@Sun.COM /*
22*13043STim.Haley@Sun.COM  * Copyright (c) 2010, Oracle and/or its affiliates. All rights reserved.
23*13043STim.Haley@Sun.COM  */
24*13043STim.Haley@Sun.COM 
25*13043STim.Haley@Sun.COM #include <sys/dmu.h>
26*13043STim.Haley@Sun.COM #include <sys/dmu_impl.h>
27*13043STim.Haley@Sun.COM #include <sys/dmu_tx.h>
28*13043STim.Haley@Sun.COM #include <sys/dbuf.h>
29*13043STim.Haley@Sun.COM #include <sys/dnode.h>
30*13043STim.Haley@Sun.COM #include <sys/zfs_context.h>
31*13043STim.Haley@Sun.COM #include <sys/dmu_objset.h>
32*13043STim.Haley@Sun.COM #include <sys/dmu_traverse.h>
33*13043STim.Haley@Sun.COM #include <sys/dsl_dataset.h>
34*13043STim.Haley@Sun.COM #include <sys/dsl_dir.h>
35*13043STim.Haley@Sun.COM #include <sys/dsl_pool.h>
36*13043STim.Haley@Sun.COM #include <sys/dsl_synctask.h>
37*13043STim.Haley@Sun.COM #include <sys/zfs_ioctl.h>
38*13043STim.Haley@Sun.COM #include <sys/zap.h>
39*13043STim.Haley@Sun.COM #include <sys/zio_checksum.h>
40*13043STim.Haley@Sun.COM #include <sys/zfs_znode.h>
41*13043STim.Haley@Sun.COM 
42*13043STim.Haley@Sun.COM struct diffarg {
43*13043STim.Haley@Sun.COM 	struct vnode *da_vp;		/* file to which we are reporting */
44*13043STim.Haley@Sun.COM 	offset_t *da_offp;
45*13043STim.Haley@Sun.COM 	int da_err;			/* error that stopped diff search */
46*13043STim.Haley@Sun.COM 	dmu_diff_record_t da_ddr;
47*13043STim.Haley@Sun.COM };
48*13043STim.Haley@Sun.COM 
49*13043STim.Haley@Sun.COM static int
write_record(struct diffarg * da)50*13043STim.Haley@Sun.COM write_record(struct diffarg *da)
51*13043STim.Haley@Sun.COM {
52*13043STim.Haley@Sun.COM 	ssize_t resid; /* have to get resid to get detailed errno */
53*13043STim.Haley@Sun.COM 
54*13043STim.Haley@Sun.COM 	if (da->da_ddr.ddr_type == DDR_NONE) {
55*13043STim.Haley@Sun.COM 		da->da_err = 0;
56*13043STim.Haley@Sun.COM 		return (0);
57*13043STim.Haley@Sun.COM 	}
58*13043STim.Haley@Sun.COM 
59*13043STim.Haley@Sun.COM 	da->da_err = vn_rdwr(UIO_WRITE, da->da_vp, (caddr_t)&da->da_ddr,
60*13043STim.Haley@Sun.COM 	    sizeof (da->da_ddr), 0, UIO_SYSSPACE, FAPPEND,
61*13043STim.Haley@Sun.COM 	    RLIM64_INFINITY, CRED(), &resid);
62*13043STim.Haley@Sun.COM 	*da->da_offp += sizeof (da->da_ddr);
63*13043STim.Haley@Sun.COM 	return (da->da_err);
64*13043STim.Haley@Sun.COM }
65*13043STim.Haley@Sun.COM 
66*13043STim.Haley@Sun.COM static int
report_free_dnode_range(struct diffarg * da,uint64_t first,uint64_t last)67*13043STim.Haley@Sun.COM report_free_dnode_range(struct diffarg *da, uint64_t first, uint64_t last)
68*13043STim.Haley@Sun.COM {
69*13043STim.Haley@Sun.COM 	ASSERT(first <= last);
70*13043STim.Haley@Sun.COM 	if (da->da_ddr.ddr_type != DDR_FREE ||
71*13043STim.Haley@Sun.COM 	    first != da->da_ddr.ddr_last + 1) {
72*13043STim.Haley@Sun.COM 		if (write_record(da) != 0)
73*13043STim.Haley@Sun.COM 			return (da->da_err);
74*13043STim.Haley@Sun.COM 		da->da_ddr.ddr_type = DDR_FREE;
75*13043STim.Haley@Sun.COM 		da->da_ddr.ddr_first = first;
76*13043STim.Haley@Sun.COM 		da->da_ddr.ddr_last = last;
77*13043STim.Haley@Sun.COM 		return (0);
78*13043STim.Haley@Sun.COM 	}
79*13043STim.Haley@Sun.COM 	da->da_ddr.ddr_last = last;
80*13043STim.Haley@Sun.COM 	return (0);
81*13043STim.Haley@Sun.COM }
82*13043STim.Haley@Sun.COM 
83*13043STim.Haley@Sun.COM static int
report_dnode(struct diffarg * da,uint64_t object,dnode_phys_t * dnp)84*13043STim.Haley@Sun.COM report_dnode(struct diffarg *da, uint64_t object, dnode_phys_t *dnp)
85*13043STim.Haley@Sun.COM {
86*13043STim.Haley@Sun.COM 	ASSERT(dnp != NULL);
87*13043STim.Haley@Sun.COM 	if (dnp->dn_type == DMU_OT_NONE)
88*13043STim.Haley@Sun.COM 		return (report_free_dnode_range(da, object, object));
89*13043STim.Haley@Sun.COM 
90*13043STim.Haley@Sun.COM 	if (da->da_ddr.ddr_type != DDR_INUSE ||
91*13043STim.Haley@Sun.COM 	    object != da->da_ddr.ddr_last + 1) {
92*13043STim.Haley@Sun.COM 		if (write_record(da) != 0)
93*13043STim.Haley@Sun.COM 			return (da->da_err);
94*13043STim.Haley@Sun.COM 		da->da_ddr.ddr_type = DDR_INUSE;
95*13043STim.Haley@Sun.COM 		da->da_ddr.ddr_first = da->da_ddr.ddr_last = object;
96*13043STim.Haley@Sun.COM 		return (0);
97*13043STim.Haley@Sun.COM 	}
98*13043STim.Haley@Sun.COM 	da->da_ddr.ddr_last = object;
99*13043STim.Haley@Sun.COM 	return (0);
100*13043STim.Haley@Sun.COM }
101*13043STim.Haley@Sun.COM 
/*
 * Span of one block pointer of dnode 'dnp' at indirection level 'level':
 * the data block size in sectors (dn_datablkszsec) shifted up by
 * SPA_MINBLOCKSHIFT, and by a further (dn_indblkshift - SPA_BLKPTRSHIFT)
 * bits for each level of indirection.  diff_cb() treats the result as a
 * byte count and shifts it by DNODE_SHIFT to get a number of dnodes.
 *
 * Both arguments are parenthesized so that arbitrary expressions (for
 * example "dnp + 1") expand correctly.  Note that 'dnp' is evaluated twice.
 */
#define	DBP_SPAN(dnp, level)				  \
	(((uint64_t)(dnp)->dn_datablkszsec) << (SPA_MINBLOCKSHIFT + \
	(level) * ((dnp)->dn_indblkshift - SPA_BLKPTRSHIFT)))
105*13043STim.Haley@Sun.COM 
106*13043STim.Haley@Sun.COM /* ARGSUSED */
107*13043STim.Haley@Sun.COM static int
diff_cb(spa_t * spa,zilog_t * zilog,const blkptr_t * bp,arc_buf_t * pbuf,const zbookmark_t * zb,const dnode_phys_t * dnp,void * arg)108*13043STim.Haley@Sun.COM diff_cb(spa_t *spa, zilog_t *zilog, const blkptr_t *bp, arc_buf_t *pbuf,
109*13043STim.Haley@Sun.COM     const zbookmark_t *zb, const dnode_phys_t *dnp, void *arg)
110*13043STim.Haley@Sun.COM {
111*13043STim.Haley@Sun.COM 	struct diffarg *da = arg;
112*13043STim.Haley@Sun.COM 	int err = 0;
113*13043STim.Haley@Sun.COM 
114*13043STim.Haley@Sun.COM 	if (issig(JUSTLOOKING) && issig(FORREAL))
115*13043STim.Haley@Sun.COM 		return (EINTR);
116*13043STim.Haley@Sun.COM 
117*13043STim.Haley@Sun.COM 	if (zb->zb_object != DMU_META_DNODE_OBJECT)
118*13043STim.Haley@Sun.COM 		return (0);
119*13043STim.Haley@Sun.COM 
120*13043STim.Haley@Sun.COM 	if (bp == NULL) {
121*13043STim.Haley@Sun.COM 		uint64_t span = DBP_SPAN(dnp, zb->zb_level);
122*13043STim.Haley@Sun.COM 		uint64_t dnobj = (zb->zb_blkid * span) >> DNODE_SHIFT;
123*13043STim.Haley@Sun.COM 
124*13043STim.Haley@Sun.COM 		err = report_free_dnode_range(da, dnobj,
125*13043STim.Haley@Sun.COM 		    dnobj + (span >> DNODE_SHIFT) - 1);
126*13043STim.Haley@Sun.COM 		if (err)
127*13043STim.Haley@Sun.COM 			return (err);
128*13043STim.Haley@Sun.COM 	} else if (zb->zb_level == 0) {
129*13043STim.Haley@Sun.COM 		dnode_phys_t *blk;
130*13043STim.Haley@Sun.COM 		arc_buf_t *abuf;
131*13043STim.Haley@Sun.COM 		uint32_t aflags = ARC_WAIT;
132*13043STim.Haley@Sun.COM 		int blksz = BP_GET_LSIZE(bp);
133*13043STim.Haley@Sun.COM 		int i;
134*13043STim.Haley@Sun.COM 
135*13043STim.Haley@Sun.COM 		if (dsl_read(NULL, spa, bp, pbuf,
136*13043STim.Haley@Sun.COM 		    arc_getbuf_func, &abuf, ZIO_PRIORITY_ASYNC_READ,
137*13043STim.Haley@Sun.COM 		    ZIO_FLAG_CANFAIL, &aflags, zb) != 0)
138*13043STim.Haley@Sun.COM 			return (EIO);
139*13043STim.Haley@Sun.COM 
140*13043STim.Haley@Sun.COM 		blk = abuf->b_data;
141*13043STim.Haley@Sun.COM 		for (i = 0; i < blksz >> DNODE_SHIFT; i++) {
142*13043STim.Haley@Sun.COM 			uint64_t dnobj = (zb->zb_blkid <<
143*13043STim.Haley@Sun.COM 			    (DNODE_BLOCK_SHIFT - DNODE_SHIFT)) + i;
144*13043STim.Haley@Sun.COM 			err = report_dnode(da, dnobj, blk+i);
145*13043STim.Haley@Sun.COM 			if (err)
146*13043STim.Haley@Sun.COM 				break;
147*13043STim.Haley@Sun.COM 		}
148*13043STim.Haley@Sun.COM 		(void) arc_buf_remove_ref(abuf, &abuf);
149*13043STim.Haley@Sun.COM 		if (err)
150*13043STim.Haley@Sun.COM 			return (err);
151*13043STim.Haley@Sun.COM 		/* Don't care about the data blocks */
152*13043STim.Haley@Sun.COM 		return (TRAVERSE_VISIT_NO_CHILDREN);
153*13043STim.Haley@Sun.COM 	}
154*13043STim.Haley@Sun.COM 	return (0);
155*13043STim.Haley@Sun.COM }
156*13043STim.Haley@Sun.COM 
157*13043STim.Haley@Sun.COM int
dmu_diff(objset_t * tosnap,objset_t * fromsnap,struct vnode * vp,offset_t * offp)158*13043STim.Haley@Sun.COM dmu_diff(objset_t *tosnap, objset_t *fromsnap, struct vnode *vp, offset_t *offp)
159*13043STim.Haley@Sun.COM {
160*13043STim.Haley@Sun.COM 	struct diffarg da;
161*13043STim.Haley@Sun.COM 	dsl_dataset_t *ds = tosnap->os_dsl_dataset;
162*13043STim.Haley@Sun.COM 	dsl_dataset_t *fromds = fromsnap->os_dsl_dataset;
163*13043STim.Haley@Sun.COM 	dsl_dataset_t *findds;
164*13043STim.Haley@Sun.COM 	dsl_dataset_t *relds;
165*13043STim.Haley@Sun.COM 	int err = 0;
166*13043STim.Haley@Sun.COM 
167*13043STim.Haley@Sun.COM 	/* make certain we are looking at snapshots */
168*13043STim.Haley@Sun.COM 	if (!dsl_dataset_is_snapshot(ds) || !dsl_dataset_is_snapshot(fromds))
169*13043STim.Haley@Sun.COM 		return (EINVAL);
170*13043STim.Haley@Sun.COM 
171*13043STim.Haley@Sun.COM 	/* fromsnap must be earlier and from the same lineage as tosnap */
172*13043STim.Haley@Sun.COM 	if (fromds->ds_phys->ds_creation_txg >= ds->ds_phys->ds_creation_txg)
173*13043STim.Haley@Sun.COM 		return (EXDEV);
174*13043STim.Haley@Sun.COM 
175*13043STim.Haley@Sun.COM 	relds = NULL;
176*13043STim.Haley@Sun.COM 	findds = ds;
177*13043STim.Haley@Sun.COM 
178*13043STim.Haley@Sun.COM 	while (fromds->ds_dir != findds->ds_dir) {
179*13043STim.Haley@Sun.COM 		dsl_pool_t *dp = ds->ds_dir->dd_pool;
180*13043STim.Haley@Sun.COM 
181*13043STim.Haley@Sun.COM 		if (!dsl_dir_is_clone(findds->ds_dir)) {
182*13043STim.Haley@Sun.COM 			if (relds)
183*13043STim.Haley@Sun.COM 				dsl_dataset_rele(relds, FTAG);
184*13043STim.Haley@Sun.COM 			return (EXDEV);
185*13043STim.Haley@Sun.COM 		}
186*13043STim.Haley@Sun.COM 
187*13043STim.Haley@Sun.COM 		rw_enter(&dp->dp_config_rwlock, RW_READER);
188*13043STim.Haley@Sun.COM 		err = dsl_dataset_hold_obj(dp,
189*13043STim.Haley@Sun.COM 		    findds->ds_dir->dd_phys->dd_origin_obj, FTAG, &findds);
190*13043STim.Haley@Sun.COM 		rw_exit(&dp->dp_config_rwlock);
191*13043STim.Haley@Sun.COM 
192*13043STim.Haley@Sun.COM 		if (relds)
193*13043STim.Haley@Sun.COM 			dsl_dataset_rele(relds, FTAG);
194*13043STim.Haley@Sun.COM 
195*13043STim.Haley@Sun.COM 		if (err)
196*13043STim.Haley@Sun.COM 			return (EXDEV);
197*13043STim.Haley@Sun.COM 
198*13043STim.Haley@Sun.COM 		relds = findds;
199*13043STim.Haley@Sun.COM 	}
200*13043STim.Haley@Sun.COM 
201*13043STim.Haley@Sun.COM 	if (relds)
202*13043STim.Haley@Sun.COM 		dsl_dataset_rele(relds, FTAG);
203*13043STim.Haley@Sun.COM 
204*13043STim.Haley@Sun.COM 	da.da_vp = vp;
205*13043STim.Haley@Sun.COM 	da.da_offp = offp;
206*13043STim.Haley@Sun.COM 	da.da_ddr.ddr_type = DDR_NONE;
207*13043STim.Haley@Sun.COM 	da.da_ddr.ddr_first = da.da_ddr.ddr_last = 0;
208*13043STim.Haley@Sun.COM 	da.da_err = 0;
209*13043STim.Haley@Sun.COM 
210*13043STim.Haley@Sun.COM 	err = traverse_dataset(ds, fromds->ds_phys->ds_creation_txg,
211*13043STim.Haley@Sun.COM 	    TRAVERSE_PRE | TRAVERSE_PREFETCH_METADATA, diff_cb, &da);
212*13043STim.Haley@Sun.COM 
213*13043STim.Haley@Sun.COM 	if (err) {
214*13043STim.Haley@Sun.COM 		da.da_err = err;
215*13043STim.Haley@Sun.COM 	} else {
216*13043STim.Haley@Sun.COM 		/* we set the da.da_err we return as side-effect */
217*13043STim.Haley@Sun.COM 		(void) write_record(&da);
218*13043STim.Haley@Sun.COM 	}
219*13043STim.Haley@Sun.COM 
220*13043STim.Haley@Sun.COM 	return (da.da_err);
221*13043STim.Haley@Sun.COM }
222