]> git.proxmox.com Git - mirror_zfs.git/blame - module/zfs/ddt_zap.c
ZIL: Remove 128K into 2x68K LWB split optimization
[mirror_zfs.git] / module / zfs / ddt_zap.c
CommitLineData
428870ff
BB
1/*
2 * CDDL HEADER START
3 *
4 * The contents of this file are subject to the terms of the
5 * Common Development and Distribution License (the "License").
6 * You may not use this file except in compliance with the License.
7 *
8 * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
1d3ba0bf 9 * or https://opensource.org/licenses/CDDL-1.0.
428870ff
BB
10 * See the License for the specific language governing permissions
11 * and limitations under the License.
12 *
13 * When distributing Covered Code, include this CDDL HEADER in each
14 * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
15 * If applicable, add the following below this CDDL HEADER, with the
16 * fields enclosed by brackets "[]" replaced with your own identifying
17 * information: Portions Copyright [yyyy] [name of copyright owner]
18 *
19 * CDDL HEADER END
20 */
21
22/*
23 * Copyright (c) 2009, 2010, Oracle and/or its affiliates. All rights reserved.
d9b4bf06 24 * Copyright (c) 2018 by Delphix. All rights reserved.
428870ff
BB
25 */
26
27#include <sys/zfs_context.h>
28#include <sys/spa.h>
29#include <sys/zio.h>
30#include <sys/ddt.h>
31#include <sys/zap.h>
32#include <sys/dmu_tx.h>
428870ff 33
2b10e325
RE
34static unsigned int ddt_zap_default_bs = 15;
35static unsigned int ddt_zap_default_ibs = 15;
428870ff
BB
36
37static int
38ddt_zap_create(objset_t *os, uint64_t *objectp, dmu_tx_t *tx, boolean_t prehash)
39{
40 zap_flags_t flags = ZAP_FLAG_HASH64 | ZAP_FLAG_UINT64_KEY;
41
42 if (prehash)
43 flags |= ZAP_FLAG_PRE_HASHED_KEY;
44
45 *objectp = zap_create_flags(os, 0, flags, DMU_OT_DDT_ZAP,
2b10e325 46 ddt_zap_default_bs, ddt_zap_default_ibs,
428870ff
BB
47 DMU_OT_NONE, 0, tx);
48
28caa74b 49 return (*objectp == 0 ? SET_ERROR(ENOTSUP) : 0);
428870ff
BB
50}
51
52static int
53ddt_zap_destroy(objset_t *os, uint64_t object, dmu_tx_t *tx)
54{
55 return (zap_destroy(os, object, tx));
56}
57
58static int
59ddt_zap_lookup(objset_t *os, uint64_t object, ddt_entry_t *dde)
60{
5b8c7bbc 61 uchar_t *cbuf;
428870ff
BB
62 uint64_t one, csize;
63 int error;
64
79c76d5b 65 cbuf = kmem_alloc(sizeof (dde->dde_phys) + 1, KM_SLEEP);
5b8c7bbc 66
428870ff
BB
67 error = zap_length_uint64(os, object, (uint64_t *)&dde->dde_key,
68 DDT_KEY_WORDS, &one, &csize);
69 if (error)
5b8c7bbc 70 goto out;
428870ff
BB
71
72 ASSERT(one == 1);
42d3b990 73 ASSERT(csize <= (sizeof (dde->dde_phys) + 1));
428870ff
BB
74
75 error = zap_lookup_uint64(os, object, (uint64_t *)&dde->dde_key,
76 DDT_KEY_WORDS, 1, csize, cbuf);
77 if (error)
5b8c7bbc 78 goto out;
428870ff
BB
79
80 ddt_decompress(cbuf, dde->dde_phys, csize, sizeof (dde->dde_phys));
5b8c7bbc
BB
81out:
82 kmem_free(cbuf, sizeof (dde->dde_phys) + 1);
428870ff 83
5b8c7bbc 84 return (error);
428870ff
BB
85}
86
87static void
88ddt_zap_prefetch(objset_t *os, uint64_t object, ddt_entry_t *dde)
89{
90 (void) zap_prefetch_uint64(os, object, (uint64_t *)&dde->dde_key,
91 DDT_KEY_WORDS);
92}
93
94static int
95ddt_zap_update(objset_t *os, uint64_t object, ddt_entry_t *dde, dmu_tx_t *tx)
96{
97 uchar_t cbuf[sizeof (dde->dde_phys) + 1];
98 uint64_t csize;
99
100 csize = ddt_compress(dde->dde_phys, cbuf,
101 sizeof (dde->dde_phys), sizeof (cbuf));
102
103 return (zap_update_uint64(os, object, (uint64_t *)&dde->dde_key,
104 DDT_KEY_WORDS, 1, csize, cbuf, tx));
105}
106
107static int
108ddt_zap_remove(objset_t *os, uint64_t object, ddt_entry_t *dde, dmu_tx_t *tx)
109{
110 return (zap_remove_uint64(os, object, (uint64_t *)&dde->dde_key,
111 DDT_KEY_WORDS, tx));
112}
113
114static int
115ddt_zap_walk(objset_t *os, uint64_t object, ddt_entry_t *dde, uint64_t *walk)
116{
117 zap_cursor_t zc;
118 zap_attribute_t za;
119 int error;
120
d9b4bf06
MA
121 if (*walk == 0) {
122 /*
123 * We don't want to prefetch the entire ZAP object, because
124 * it can be enormous. Also the primary use of DDT iteration
125 * is for scrubbing, in which case we will be issuing many
126 * scrub I/Os for each ZAP block that we read in, so
127 * reading the ZAP is unlikely to be the bottleneck.
128 */
129 zap_cursor_init_noprefetch(&zc, os, object);
130 } else {
131 zap_cursor_init_serialized(&zc, os, object, *walk);
132 }
428870ff
BB
133 if ((error = zap_cursor_retrieve(&zc, &za)) == 0) {
134 uchar_t cbuf[sizeof (dde->dde_phys) + 1];
135 uint64_t csize = za.za_num_integers;
136 ASSERT(za.za_integer_length == 1);
137 error = zap_lookup_uint64(os, object, (uint64_t *)za.za_name,
138 DDT_KEY_WORDS, 1, csize, cbuf);
139 ASSERT(error == 0);
140 if (error == 0) {
141 ddt_decompress(cbuf, dde->dde_phys, csize,
142 sizeof (dde->dde_phys));
143 dde->dde_key = *(ddt_key_t *)za.za_name;
144 }
145 zap_cursor_advance(&zc);
146 *walk = zap_cursor_serialize(&zc);
147 }
148 zap_cursor_fini(&zc);
149 return (error);
150}
151
e8fd45a0
BB
152static int
153ddt_zap_count(objset_t *os, uint64_t object, uint64_t *count)
428870ff 154{
d1d7e268 155 return (zap_count(os, object, count));
428870ff
BB
156}
157
158const ddt_ops_t ddt_zap_ops = {
159 "zap",
160 ddt_zap_create,
161 ddt_zap_destroy,
162 ddt_zap_lookup,
163 ddt_zap_prefetch,
164 ddt_zap_update,
165 ddt_zap_remove,
166 ddt_zap_walk,
167 ddt_zap_count,
168};
2b10e325
RE
169
170/* BEGIN CSTYLED */
171ZFS_MODULE_PARAM(zfs_dedup, , ddt_zap_default_bs, UINT, ZMOD_RW,
172 "DDT ZAP leaf blockshift");
173ZFS_MODULE_PARAM(zfs_dedup, , ddt_zap_default_ibs, UINT, ZMOD_RW,
174 "DDT ZAP indirect blockshift");
175/* END CSTYLED */