]>
Commit | Line | Data |
---|---|---|
428870ff BB |
1 | /* |
2 | * CDDL HEADER START | |
3 | * | |
4 | * The contents of this file are subject to the terms of the | |
5 | * Common Development and Distribution License (the "License"). | |
6 | * You may not use this file except in compliance with the License. | |
7 | * | |
8 | * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE | |
1d3ba0bf | 9 | * or https://opensource.org/licenses/CDDL-1.0. |
428870ff BB |
10 | * See the License for the specific language governing permissions |
11 | * and limitations under the License. | |
12 | * | |
13 | * When distributing Covered Code, include this CDDL HEADER in each | |
14 | * file and include the License file at usr/src/OPENSOLARIS.LICENSE. | |
15 | * If applicable, add the following below this CDDL HEADER, with the | |
16 | * fields enclosed by brackets "[]" replaced with your own identifying | |
17 | * information: Portions Copyright [yyyy] [name of copyright owner] | |
18 | * | |
19 | * CDDL HEADER END | |
20 | */ | |
21 | ||
22 | /* | |
23 | * Copyright (c) 2009, 2010, Oracle and/or its affiliates. All rights reserved. | |
d9b4bf06 | 24 | * Copyright (c) 2018 by Delphix. All rights reserved. |
428870ff BB |
25 | */ |
26 | ||
27 | #include <sys/zfs_context.h> | |
28 | #include <sys/spa.h> | |
29 | #include <sys/zio.h> | |
30 | #include <sys/ddt.h> | |
31 | #include <sys/zap.h> | |
32 | #include <sys/dmu_tx.h> | |
428870ff | 33 | |
2b10e325 RE |
34 | static unsigned int ddt_zap_default_bs = 15; |
35 | static unsigned int ddt_zap_default_ibs = 15; | |
428870ff BB |
36 | |
37 | static int | |
38 | ddt_zap_create(objset_t *os, uint64_t *objectp, dmu_tx_t *tx, boolean_t prehash) | |
39 | { | |
40 | zap_flags_t flags = ZAP_FLAG_HASH64 | ZAP_FLAG_UINT64_KEY; | |
41 | ||
42 | if (prehash) | |
43 | flags |= ZAP_FLAG_PRE_HASHED_KEY; | |
44 | ||
45 | *objectp = zap_create_flags(os, 0, flags, DMU_OT_DDT_ZAP, | |
2b10e325 | 46 | ddt_zap_default_bs, ddt_zap_default_ibs, |
428870ff BB |
47 | DMU_OT_NONE, 0, tx); |
48 | ||
28caa74b | 49 | return (*objectp == 0 ? SET_ERROR(ENOTSUP) : 0); |
428870ff BB |
50 | } |
51 | ||
52 | static int | |
53 | ddt_zap_destroy(objset_t *os, uint64_t object, dmu_tx_t *tx) | |
54 | { | |
55 | return (zap_destroy(os, object, tx)); | |
56 | } | |
57 | ||
58 | static int | |
59 | ddt_zap_lookup(objset_t *os, uint64_t object, ddt_entry_t *dde) | |
60 | { | |
5b8c7bbc | 61 | uchar_t *cbuf; |
428870ff BB |
62 | uint64_t one, csize; |
63 | int error; | |
64 | ||
79c76d5b | 65 | cbuf = kmem_alloc(sizeof (dde->dde_phys) + 1, KM_SLEEP); |
5b8c7bbc | 66 | |
428870ff BB |
67 | error = zap_length_uint64(os, object, (uint64_t *)&dde->dde_key, |
68 | DDT_KEY_WORDS, &one, &csize); | |
69 | if (error) | |
5b8c7bbc | 70 | goto out; |
428870ff BB |
71 | |
72 | ASSERT(one == 1); | |
42d3b990 | 73 | ASSERT(csize <= (sizeof (dde->dde_phys) + 1)); |
428870ff BB |
74 | |
75 | error = zap_lookup_uint64(os, object, (uint64_t *)&dde->dde_key, | |
76 | DDT_KEY_WORDS, 1, csize, cbuf); | |
77 | if (error) | |
5b8c7bbc | 78 | goto out; |
428870ff BB |
79 | |
80 | ddt_decompress(cbuf, dde->dde_phys, csize, sizeof (dde->dde_phys)); | |
5b8c7bbc BB |
81 | out: |
82 | kmem_free(cbuf, sizeof (dde->dde_phys) + 1); | |
428870ff | 83 | |
5b8c7bbc | 84 | return (error); |
428870ff BB |
85 | } |
86 | ||
87 | static void | |
88 | ddt_zap_prefetch(objset_t *os, uint64_t object, ddt_entry_t *dde) | |
89 | { | |
90 | (void) zap_prefetch_uint64(os, object, (uint64_t *)&dde->dde_key, | |
91 | DDT_KEY_WORDS); | |
92 | } | |
93 | ||
94 | static int | |
95 | ddt_zap_update(objset_t *os, uint64_t object, ddt_entry_t *dde, dmu_tx_t *tx) | |
96 | { | |
97 | uchar_t cbuf[sizeof (dde->dde_phys) + 1]; | |
98 | uint64_t csize; | |
99 | ||
100 | csize = ddt_compress(dde->dde_phys, cbuf, | |
101 | sizeof (dde->dde_phys), sizeof (cbuf)); | |
102 | ||
103 | return (zap_update_uint64(os, object, (uint64_t *)&dde->dde_key, | |
104 | DDT_KEY_WORDS, 1, csize, cbuf, tx)); | |
105 | } | |
106 | ||
107 | static int | |
108 | ddt_zap_remove(objset_t *os, uint64_t object, ddt_entry_t *dde, dmu_tx_t *tx) | |
109 | { | |
110 | return (zap_remove_uint64(os, object, (uint64_t *)&dde->dde_key, | |
111 | DDT_KEY_WORDS, tx)); | |
112 | } | |
113 | ||
114 | static int | |
115 | ddt_zap_walk(objset_t *os, uint64_t object, ddt_entry_t *dde, uint64_t *walk) | |
116 | { | |
117 | zap_cursor_t zc; | |
118 | zap_attribute_t za; | |
119 | int error; | |
120 | ||
d9b4bf06 MA |
121 | if (*walk == 0) { |
122 | /* | |
123 | * We don't want to prefetch the entire ZAP object, because | |
124 | * it can be enormous. Also the primary use of DDT iteration | |
125 | * is for scrubbing, in which case we will be issuing many | |
126 | * scrub I/Os for each ZAP block that we read in, so | |
127 | * reading the ZAP is unlikely to be the bottleneck. | |
128 | */ | |
129 | zap_cursor_init_noprefetch(&zc, os, object); | |
130 | } else { | |
131 | zap_cursor_init_serialized(&zc, os, object, *walk); | |
132 | } | |
428870ff BB |
133 | if ((error = zap_cursor_retrieve(&zc, &za)) == 0) { |
134 | uchar_t cbuf[sizeof (dde->dde_phys) + 1]; | |
135 | uint64_t csize = za.za_num_integers; | |
136 | ASSERT(za.za_integer_length == 1); | |
137 | error = zap_lookup_uint64(os, object, (uint64_t *)za.za_name, | |
138 | DDT_KEY_WORDS, 1, csize, cbuf); | |
139 | ASSERT(error == 0); | |
140 | if (error == 0) { | |
141 | ddt_decompress(cbuf, dde->dde_phys, csize, | |
142 | sizeof (dde->dde_phys)); | |
143 | dde->dde_key = *(ddt_key_t *)za.za_name; | |
144 | } | |
145 | zap_cursor_advance(&zc); | |
146 | *walk = zap_cursor_serialize(&zc); | |
147 | } | |
148 | zap_cursor_fini(&zc); | |
149 | return (error); | |
150 | } | |
151 | ||
e8fd45a0 BB |
152 | static int |
153 | ddt_zap_count(objset_t *os, uint64_t object, uint64_t *count) | |
428870ff | 154 | { |
d1d7e268 | 155 | return (zap_count(os, object, count)); |
428870ff BB |
156 | } |
157 | ||
158 | const ddt_ops_t ddt_zap_ops = { | |
159 | "zap", | |
160 | ddt_zap_create, | |
161 | ddt_zap_destroy, | |
162 | ddt_zap_lookup, | |
163 | ddt_zap_prefetch, | |
164 | ddt_zap_update, | |
165 | ddt_zap_remove, | |
166 | ddt_zap_walk, | |
167 | ddt_zap_count, | |
168 | }; | |
2b10e325 RE |
169 | |
170 | /* BEGIN CSTYLED */ | |
171 | ZFS_MODULE_PARAM(zfs_dedup, , ddt_zap_default_bs, UINT, ZMOD_RW, | |
172 | "DDT ZAP leaf blockshift"); | |
173 | ZFS_MODULE_PARAM(zfs_dedup, , ddt_zap_default_ibs, UINT, ZMOD_RW, | |
174 | "DDT ZAP indirect blockshift"); | |
175 | /* END CSTYLED */ |