xref: /illumos-gate/usr/src/uts/common/fs/zfs/ddt_zap.c (revision 52abb70e073c2a88808c0d66fd810ba8c5080572)
1b24ab676SJeff Bonwick /*
2b24ab676SJeff Bonwick  * CDDL HEADER START
3b24ab676SJeff Bonwick  *
4b24ab676SJeff Bonwick  * The contents of this file are subject to the terms of the
5b24ab676SJeff Bonwick  * Common Development and Distribution License (the "License").
6b24ab676SJeff Bonwick  * You may not use this file except in compliance with the License.
7b24ab676SJeff Bonwick  *
8b24ab676SJeff Bonwick  * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
9b24ab676SJeff Bonwick  * or http://www.opensolaris.org/os/licensing.
10b24ab676SJeff Bonwick  * See the License for the specific language governing permissions
11b24ab676SJeff Bonwick  * and limitations under the License.
12b24ab676SJeff Bonwick  *
13b24ab676SJeff Bonwick  * When distributing Covered Code, include this CDDL HEADER in each
14b24ab676SJeff Bonwick  * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
15b24ab676SJeff Bonwick  * If applicable, add the following below this CDDL HEADER, with the
16b24ab676SJeff Bonwick  * fields enclosed by brackets "[]" replaced with your own identifying
17b24ab676SJeff Bonwick  * information: Portions Copyright [yyyy] [name of copyright owner]
18b24ab676SJeff Bonwick  *
19b24ab676SJeff Bonwick  * CDDL HEADER END
20b24ab676SJeff Bonwick  */
21b24ab676SJeff Bonwick 
22b24ab676SJeff Bonwick /*
23c7cd2421SGeorge Wilson  * Copyright (c) 2009, 2010, Oracle and/or its affiliates. All rights reserved.
24*52abb70eSMatthew Ahrens  * Copyright (c) 2018 by Delphix. All rights reserved.
25b24ab676SJeff Bonwick  */
26b24ab676SJeff Bonwick 
27b24ab676SJeff Bonwick #include <sys/zfs_context.h>
28b24ab676SJeff Bonwick #include <sys/spa.h>
29b24ab676SJeff Bonwick #include <sys/zio.h>
30b24ab676SJeff Bonwick #include <sys/ddt.h>
31b24ab676SJeff Bonwick #include <sys/zap.h>
32b24ab676SJeff Bonwick #include <sys/dmu_tx.h>
33b24ab676SJeff Bonwick #include <util/sscanf.h>
34b24ab676SJeff Bonwick 
/*
 * Block-shift tunables passed to zap_create_flags() by ddt_zap_create()
 * whenever a new DDT ZAP object is created (leaf and indirect block
 * arguments respectively).
 * NOTE(review): presumably log2 of the block size in bytes, i.e. 12 => 4K;
 * confirm against the zap_create_flags() contract.
 */
35b24ab676SJeff Bonwick int ddt_zap_leaf_blockshift = 12;
36b24ab676SJeff Bonwick int ddt_zap_indirect_blockshift = 12;
37b24ab676SJeff Bonwick 
38b24ab676SJeff Bonwick static int
ddt_zap_create(objset_t * os,uint64_t * objectp,dmu_tx_t * tx,boolean_t prehash)39b24ab676SJeff Bonwick ddt_zap_create(objset_t *os, uint64_t *objectp, dmu_tx_t *tx, boolean_t prehash)
40b24ab676SJeff Bonwick {
41b24ab676SJeff Bonwick 	zap_flags_t flags = ZAP_FLAG_HASH64 | ZAP_FLAG_UINT64_KEY;
42b24ab676SJeff Bonwick 
43b24ab676SJeff Bonwick 	if (prehash)
44b24ab676SJeff Bonwick 		flags |= ZAP_FLAG_PRE_HASHED_KEY;
45b24ab676SJeff Bonwick 
46b24ab676SJeff Bonwick 	*objectp = zap_create_flags(os, 0, flags, DMU_OT_DDT_ZAP,
47b24ab676SJeff Bonwick 	    ddt_zap_leaf_blockshift, ddt_zap_indirect_blockshift,
48b24ab676SJeff Bonwick 	    DMU_OT_NONE, 0, tx);
49b24ab676SJeff Bonwick 
50b24ab676SJeff Bonwick 	return (*objectp == 0 ? ENOTSUP : 0);
51b24ab676SJeff Bonwick }
52b24ab676SJeff Bonwick 
53b24ab676SJeff Bonwick static int
ddt_zap_destroy(objset_t * os,uint64_t object,dmu_tx_t * tx)54b24ab676SJeff Bonwick ddt_zap_destroy(objset_t *os, uint64_t object, dmu_tx_t *tx)
55b24ab676SJeff Bonwick {
56b24ab676SJeff Bonwick 	return (zap_destroy(os, object, tx));
57b24ab676SJeff Bonwick }
58b24ab676SJeff Bonwick 
59b24ab676SJeff Bonwick static int
ddt_zap_lookup(objset_t * os,uint64_t object,ddt_entry_t * dde)60b24ab676SJeff Bonwick ddt_zap_lookup(objset_t *os, uint64_t object, ddt_entry_t *dde)
61b24ab676SJeff Bonwick {
62b24ab676SJeff Bonwick 	uchar_t cbuf[sizeof (dde->dde_phys) + 1];
63b24ab676SJeff Bonwick 	uint64_t one, csize;
64b24ab676SJeff Bonwick 	int error;
65b24ab676SJeff Bonwick 
66b24ab676SJeff Bonwick 	error = zap_length_uint64(os, object, (uint64_t *)&dde->dde_key,
67b24ab676SJeff Bonwick 	    DDT_KEY_WORDS, &one, &csize);
68b24ab676SJeff Bonwick 	if (error)
69b24ab676SJeff Bonwick 		return (error);
70b24ab676SJeff Bonwick 
71b24ab676SJeff Bonwick 	ASSERT(one == 1);
72b24ab676SJeff Bonwick 	ASSERT(csize <= sizeof (cbuf));
73b24ab676SJeff Bonwick 
74b24ab676SJeff Bonwick 	error = zap_lookup_uint64(os, object, (uint64_t *)&dde->dde_key,
75b24ab676SJeff Bonwick 	    DDT_KEY_WORDS, 1, csize, cbuf);
76b24ab676SJeff Bonwick 	if (error)
77b24ab676SJeff Bonwick 		return (error);
78b24ab676SJeff Bonwick 
79b24ab676SJeff Bonwick 	ddt_decompress(cbuf, dde->dde_phys, csize, sizeof (dde->dde_phys));
80b24ab676SJeff Bonwick 
81b24ab676SJeff Bonwick 	return (0);
82b24ab676SJeff Bonwick }
83b24ab676SJeff Bonwick 
84c7cd2421SGeorge Wilson static void
ddt_zap_prefetch(objset_t * os,uint64_t object,ddt_entry_t * dde)85c7cd2421SGeorge Wilson ddt_zap_prefetch(objset_t *os, uint64_t object, ddt_entry_t *dde)
86c7cd2421SGeorge Wilson {
87c7cd2421SGeorge Wilson 	(void) zap_prefetch_uint64(os, object, (uint64_t *)&dde->dde_key,
88c7cd2421SGeorge Wilson 	    DDT_KEY_WORDS);
89c7cd2421SGeorge Wilson }
90c7cd2421SGeorge Wilson 
91b24ab676SJeff Bonwick static int
ddt_zap_update(objset_t * os,uint64_t object,ddt_entry_t * dde,dmu_tx_t * tx)92b24ab676SJeff Bonwick ddt_zap_update(objset_t *os, uint64_t object, ddt_entry_t *dde, dmu_tx_t *tx)
93b24ab676SJeff Bonwick {
94b24ab676SJeff Bonwick 	uchar_t cbuf[sizeof (dde->dde_phys) + 1];
95b24ab676SJeff Bonwick 	uint64_t csize;
96b24ab676SJeff Bonwick 
97b24ab676SJeff Bonwick 	csize = ddt_compress(dde->dde_phys, cbuf,
98b24ab676SJeff Bonwick 	    sizeof (dde->dde_phys), sizeof (cbuf));
99b24ab676SJeff Bonwick 
100b24ab676SJeff Bonwick 	return (zap_update_uint64(os, object, (uint64_t *)&dde->dde_key,
101b24ab676SJeff Bonwick 	    DDT_KEY_WORDS, 1, csize, cbuf, tx));
102b24ab676SJeff Bonwick }
103b24ab676SJeff Bonwick 
104b24ab676SJeff Bonwick static int
ddt_zap_remove(objset_t * os,uint64_t object,ddt_entry_t * dde,dmu_tx_t * tx)105b24ab676SJeff Bonwick ddt_zap_remove(objset_t *os, uint64_t object, ddt_entry_t *dde, dmu_tx_t *tx)
106b24ab676SJeff Bonwick {
107b24ab676SJeff Bonwick 	return (zap_remove_uint64(os, object, (uint64_t *)&dde->dde_key,
108b24ab676SJeff Bonwick 	    DDT_KEY_WORDS, tx));
109b24ab676SJeff Bonwick }
110b24ab676SJeff Bonwick 
111b24ab676SJeff Bonwick static int
ddt_zap_walk(objset_t * os,uint64_t object,ddt_entry_t * dde,uint64_t * walk)112b24ab676SJeff Bonwick ddt_zap_walk(objset_t *os, uint64_t object, ddt_entry_t *dde, uint64_t *walk)
113b24ab676SJeff Bonwick {
114b24ab676SJeff Bonwick 	zap_cursor_t zc;
115b24ab676SJeff Bonwick 	zap_attribute_t za;
116b24ab676SJeff Bonwick 	int error;
117b24ab676SJeff Bonwick 
118*52abb70eSMatthew Ahrens 	if (*walk == 0) {
119*52abb70eSMatthew Ahrens 		/*
120*52abb70eSMatthew Ahrens 		 * We don't want to prefetch the entire ZAP object, because
121*52abb70eSMatthew Ahrens 		 * it can be enormous.  Also the primary use of DDT iteration
122*52abb70eSMatthew Ahrens 		 * is for scrubbing, in which case we will be issuing many
123*52abb70eSMatthew Ahrens 		 * scrub i/os for each ZAP block that we read in, so
124*52abb70eSMatthew Ahrens 		 * reading the ZAP is unlikely to be the bottleneck.
125*52abb70eSMatthew Ahrens 		 */
126*52abb70eSMatthew Ahrens 		zap_cursor_init_noprefetch(&zc, os, object);
127*52abb70eSMatthew Ahrens 	} else {
128b24ab676SJeff Bonwick 		zap_cursor_init_serialized(&zc, os, object, *walk);
129*52abb70eSMatthew Ahrens 	}
130b24ab676SJeff Bonwick 	if ((error = zap_cursor_retrieve(&zc, &za)) == 0) {
131b24ab676SJeff Bonwick 		uchar_t cbuf[sizeof (dde->dde_phys) + 1];
132b24ab676SJeff Bonwick 		uint64_t csize = za.za_num_integers;
133b24ab676SJeff Bonwick 		ASSERT(za.za_integer_length == 1);
134b24ab676SJeff Bonwick 		error = zap_lookup_uint64(os, object, (uint64_t *)za.za_name,
135b24ab676SJeff Bonwick 		    DDT_KEY_WORDS, 1, csize, cbuf);
136b24ab676SJeff Bonwick 		ASSERT(error == 0);
137b24ab676SJeff Bonwick 		if (error == 0) {
138b24ab676SJeff Bonwick 			ddt_decompress(cbuf, dde->dde_phys, csize,
139b24ab676SJeff Bonwick 			    sizeof (dde->dde_phys));
140b24ab676SJeff Bonwick 			dde->dde_key = *(ddt_key_t *)za.za_name;
141b24ab676SJeff Bonwick 		}
142b24ab676SJeff Bonwick 		zap_cursor_advance(&zc);
143b24ab676SJeff Bonwick 		*walk = zap_cursor_serialize(&zc);
144b24ab676SJeff Bonwick 	}
145b24ab676SJeff Bonwick 	zap_cursor_fini(&zc);
146b24ab676SJeff Bonwick 	return (error);
147b24ab676SJeff Bonwick }
148b24ab676SJeff Bonwick 
149b24ab676SJeff Bonwick static uint64_t
ddt_zap_count(objset_t * os,uint64_t object)150b24ab676SJeff Bonwick ddt_zap_count(objset_t *os, uint64_t object)
151b24ab676SJeff Bonwick {
152b24ab676SJeff Bonwick 	uint64_t count = 0;
153b24ab676SJeff Bonwick 
154b24ab676SJeff Bonwick 	VERIFY(zap_count(os, object, &count) == 0);
155b24ab676SJeff Bonwick 
156b24ab676SJeff Bonwick 	return (count);
157b24ab676SJeff Bonwick }
158b24ab676SJeff Bonwick 
/*
 * Operations vector for the ZAP-backed DDT implementation.
 *
 * The initializer is positional: the name string "zap" followed by the
 * create, destroy, lookup, prefetch, update, remove, walk and count
 * handlers defined in this file.  The order must match the member order
 * of ddt_ops_t, which is declared outside this file.
 */
159b24ab676SJeff Bonwick const ddt_ops_t ddt_zap_ops = {
160b24ab676SJeff Bonwick 	"zap",
161b24ab676SJeff Bonwick 	ddt_zap_create,
162b24ab676SJeff Bonwick 	ddt_zap_destroy,
163b24ab676SJeff Bonwick 	ddt_zap_lookup,
164c7cd2421SGeorge Wilson 	ddt_zap_prefetch,
165b24ab676SJeff Bonwick 	ddt_zap_update,
166b24ab676SJeff Bonwick 	ddt_zap_remove,
167b24ab676SJeff Bonwick 	ddt_zap_walk,
168b24ab676SJeff Bonwick 	ddt_zap_count,
169b24ab676SJeff Bonwick };
170