]>
Commit | Line | Data |
---|---|---|
34dc7c2f BB |
1 | /* |
2 | * CDDL HEADER START | |
3 | * | |
4 | * The contents of this file are subject to the terms of the | |
5 | * Common Development and Distribution License (the "License"). | |
6 | * You may not use this file except in compliance with the License. | |
7 | * | |
8 | * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE | |
9 | * or http://www.opensolaris.org/os/licensing. | |
10 | * See the License for the specific language governing permissions | |
11 | * and limitations under the License. | |
12 | * | |
13 | * When distributing Covered Code, include this CDDL HEADER in each | |
14 | * file and include the License file at usr/src/OPENSOLARIS.LICENSE. | |
15 | * If applicable, add the following below this CDDL HEADER, with the | |
16 | * fields enclosed by brackets "[]" replaced with your own identifying | |
17 | * information: Portions Copyright [yyyy] [name of copyright owner] | |
18 | * | |
19 | * CDDL HEADER END | |
20 | */ | |
21 | /* | |
428870ff | 22 | * Copyright 2010 Sun Microsystems, Inc. All rights reserved. |
34dc7c2f | 23 | * Use is subject to license terms. |
ea97f8ce MA |
24 | */ |
25 | /* | |
37abac6d | 26 | * Copyright (c) 2012, Joyent, Inc. All rights reserved. |
e6d3a843 | 27 | * Copyright (c) 2013, 2015 by Delphix. All rights reserved. |
34dc7c2f BB |
28 | */ |
29 | ||
30 | #ifndef _SYS_DMU_IMPL_H | |
31 | #define _SYS_DMU_IMPL_H | |
32 | ||
34dc7c2f BB |
33 | #include <sys/txg_impl.h> |
34 | #include <sys/zio.h> | |
35 | #include <sys/dnode.h> | |
36 | #include <sys/zfs_context.h> | |
37abac6d | 37 | #include <sys/zfs_ioctl.h> |
34dc7c2f BB |
38 | |
39 | #ifdef __cplusplus | |
40 | extern "C" { | |
41 | #endif | |
42 | ||
43 | /* | |
44 | * This is the locking strategy for the DMU. Numbers in parentheses are | |
45 | * cases that use that lock order, referenced below: | |
46 | * | |
47 | * ARC is self-contained | |
48 | * bplist is self-contained | |
49 | * refcount is self-contained | |
50 | * txg is self-contained (hopefully!) | |
51 | * zst_lock | |
52 | * zf_rwlock | |
53 | * | |
54 | * XXX try to improve evicting path? | |
55 | * | |
56 | * dp_config_rwlock > os_obj_lock > dn_struct_rwlock > | |
b128c09f | 57 | * dn_dbufs_mtx > hash_mutexes > db_mtx > dd_lock > leaves |
34dc7c2f BB |
58 | * |
59 | * dp_config_rwlock | |
60 | * must be held before: everything | |
61 | * protects dd namespace changes | |
62 | * protects property changes globally | |
63 | * held from: | |
64 | * dsl_dir_open/r: | |
65 | * dsl_dir_create_sync/w: | |
66 | * dsl_dir_sync_destroy/w: | |
67 | * dsl_dir_rename_sync/w: | |
68 | * dsl_prop_changed_notify/r: | |
69 | * | |
70 | * os_obj_lock | |
71 | * must be held before: | |
72 | * everything except dp_config_rwlock | |
73 | * protects os_obj_next | |
74 | * held from: | |
75 | * dmu_object_alloc: dn_dbufs_mtx, db_mtx, hash_mutexes, dn_struct_rwlock | |
76 | * | |
77 | * dn_struct_rwlock | |
78 | * must be held before: | |
79 | * everything except dp_config_rwlock and os_obj_lock | |
80 | * protects structure of dnode (eg. nlevels) | |
81 | * db_blkptr can change when syncing out change to nlevels | |
82 | * dn_maxblkid | |
83 | * dn_nlevels | |
84 | * dn_*blksz* | |
85 | * phys nlevels, maxblkid, physical blkptr_t's (?) | |
86 | * held from: | |
87 | * callers of dbuf_read_impl, dbuf_hold[_impl], dbuf_prefetch | |
88 | * dmu_object_info_from_dnode: dn_dirty_mtx (dn_datablksz) | |
34dc7c2f BB |
89 | * dbuf_read_impl: db_mtx, dmu_zfetch() |
90 | * dmu_zfetch: zf_rwlock/r, zst_lock, dbuf_prefetch() | |
91 | * dbuf_new_size: db_mtx | |
92 | * dbuf_dirty: db_mtx | |
93 | * dbuf_findbp: (callers, phys? - the real need) | |
94 | * dbuf_create: dn_dbufs_mtx, hash_mutexes, db_mtx (phys?) | |
95 | * dbuf_prefetch: dn_dirty_mtx, hash_mutexes, db_mtx, dn_dbufs_mtx | |
96 | * dbuf_hold_impl: hash_mutexes, db_mtx, dn_dbufs_mtx, dbuf_findbp() | |
97 | * dnode_sync/w (increase_indirection): db_mtx (phys) | |
98 | * dnode_set_blksz/w: dn_dbufs_mtx (dn_*blksz*) | |
99 | * dnode_new_blkid/w: (dn_maxblkid) | |
100 | * dnode_free_range/w: dn_dirty_mtx (dn_maxblkid) | |
101 | * dnode_next_offset: (phys) | |
102 | * | |
103 | * dn_dbufs_mtx | |
104 | * must be held before: | |
105 | * db_mtx, hash_mutexes | |
106 | * protects: | |
107 | * dn_dbufs | |
108 | * dn_evicted | |
109 | * held from: | |
110 | * dmu_evict_user: db_mtx (dn_dbufs) | |
111 | * dbuf_free_range: db_mtx (dn_dbufs) | |
112 | * dbuf_remove_ref: db_mtx, callees: | |
113 | * dbuf_hash_remove: hash_mutexes, db_mtx | |
114 | * dbuf_create: hash_mutexes, db_mtx (dn_dbufs) | |
115 | * dnode_set_blksz: (dn_dbufs) | |
116 | * | |
117 | * hash_mutexes (global) | |
118 | * must be held before: | |
119 | * db_mtx | |
120 | * protects dbuf_hash_table (global) and db_hash_next | |
121 | * held from: | |
122 | * dbuf_find: db_mtx | |
123 | * dbuf_hash_insert: db_mtx | |
124 | * dbuf_hash_remove: db_mtx | |
125 | * | |
126 | * db_mtx (meta-leaf) | |
127 | * must be held before: | |
128 | * dn_mtx, dn_dirty_mtx, dd_lock (leaf mutexes) | |
129 | * protects: | |
130 | * db_state | |
131 | * db_holds | |
132 | * db_buf | |
133 | * db_changed | |
134 | * db_data_pending | |
135 | * db_dirtied | |
136 | * db_link | |
137 | * db_dirty_node (??) | |
138 | * db_dirtycnt | |
139 | * db_d.* | |
140 | * db.* | |
141 | * held from: | |
142 | * dbuf_dirty: dn_mtx, dn_dirty_mtx | |
143 | * dbuf_dirty->dsl_dir_willuse_space: dd_lock | |
144 | * dbuf_dirty->dbuf_new_block->dsl_dataset_block_freeable: dd_lock | |
145 | * dbuf_undirty: dn_dirty_mtx (db_d) | |
146 | * dbuf_write_done: dn_dirty_mtx (db_state) | |
147 | * dbuf_* | |
148 | * dmu_buf_update_user: none (db_d) | |
149 | * dmu_evict_user: none (db_d) (maybe can eliminate) | |
150 | * dbuf_find: none (db_holds) | |
151 | * dbuf_hash_insert: none (db_holds) | |
152 | * dmu_buf_read_array_impl: none (db_state, db_changed) | |
153 | * dmu_sync: none (db_dirty_node, db_d) | |
154 | * dnode_reallocate: none (db) | |
155 | * | |
156 | * dn_mtx (leaf) | |
157 | * protects: | |
158 | * dn_dirty_dbufs | |
159 | * dn_ranges | |
160 | * phys accounting | |
161 | * dn_allocated_txg | |
162 | * dn_free_txg | |
163 | * dn_assigned_txg | |
edc1e713 | 164 | * dn_dirty_txg |
34dc7c2f BB |
165 | * dd_assigned_tx |
166 | * dn_notxholds | |
167 | * dn_dirtyctx | |
168 | * dn_dirtyctx_firstset | |
169 | * (dn_phys copy fields?) | |
170 | * (dn_phys contents?) | |
171 | * held from: | |
172 | * dnode_* | |
173 | * dbuf_dirty: none | |
174 | * dbuf_sync: none (phys accounting) | |
175 | * dbuf_undirty: none (dn_ranges, dn_dirty_dbufs) | |
176 | * dbuf_write_done: none (phys accounting) | |
177 | * dmu_object_info_from_dnode: none (accounting) | |
178 | * dmu_tx_commit: none | |
179 | * dmu_tx_hold_object_impl: none | |
180 | * dmu_tx_try_assign: dn_notxholds(cv) | |
181 | * dmu_tx_unassign: none | |
182 | * | |
b128c09f BB |
183 | * dd_lock |
184 | * must be held before: | |
185 | * ds_lock | |
186 | * ancestors' dd_lock | |
34dc7c2f BB |
187 | * protects: |
188 | * dd_prop_cbs | |
189 | * dd_sync_* | |
190 | * dd_used_bytes | |
191 | * dd_tempreserved | |
192 | * dd_space_towrite | |
193 | * dd_myname | |
194 | * dd_phys accounting? | |
195 | * held from: | |
196 | * dsl_dir_* | |
197 | * dsl_prop_changed_notify: none (dd_prop_cbs) | |
198 | * dsl_prop_register: none (dd_prop_cbs) | |
199 | * dsl_prop_unregister: none (dd_prop_cbs) | |
34dc7c2f BB |
200 | * |
201 | * os_lock (leaf) | |
202 | * protects: | |
203 | * os_dirty_dnodes | |
204 | * os_free_dnodes | |
205 | * os_dnodes | |
206 | * os_downgraded_dbufs | |
207 | * dn_dirtyblksz | |
208 | * dn_dirty_link | |
209 | * held from: | |
210 | * dnode_create: none (os_dnodes) | |
211 | * dnode_destroy: none (os_dnodes) | |
212 | * dnode_setdirty: none (dn_dirtyblksz, os_*_dnodes) | |
213 | * dnode_free: none (dn_dirtyblksz, os_*_dnodes) | |
214 | * | |
b128c09f | 215 | * ds_lock |
34dc7c2f | 216 | * protects: |
428870ff | 217 | * ds_objset |
34dc7c2f BB |
218 | * ds_open_refcount |
219 | * ds_snapname | |
220 | * ds_phys accounting | |
45d1cae3 | 221 | * ds_phys userrefs zapobj |
b128c09f | 222 | * ds_reserved |
34dc7c2f BB |
223 | * held from: |
224 | * dsl_dataset_* | |
225 | * | |
226 | * dr_mtx (leaf) | |
227 | * protects: | |
228 | * dr_children | |
229 | * held from: | |
230 | * dbuf_dirty | |
231 | * dbuf_undirty | |
232 | * dbuf_sync_indirect | |
233 | * dnode_new_blkid | |
234 | */ | |
235 | ||
/*
 * Forward declarations of struct tags.  Only the tags are introduced
 * here; the full definitions are not part of this header.
 */
struct dmu_pool;
struct objset;
238 | ||
428870ff BB |
239 | typedef struct dmu_xuio { |
240 | int next; | |
241 | int cnt; | |
242 | struct arc_buf **bufs; | |
243 | iovec_t *iovp; | |
244 | } dmu_xuio_t; | |
245 | ||
37abac6d BP |
/*
 * Kinds of send-stream data whose emission may still be pending between
 * one call to backup_cb and the next.  Several calls to dump_free() or
 * dump_freeobjects() can be coalesced into a single DRR_FREE or
 * DRR_FREEOBJECTS replay record; this type names which kind, if any,
 * is pending.
 *
 * The enumerator values are written out explicitly; they are the same
 * values the compiler would assign implicitly (0, 1, 2).
 */
typedef enum {
	PENDING_NONE = 0,
	PENDING_FREE = 1,
	PENDING_FREEOBJECTS = 2
} dmu_pendop_t;
257 | ||
258 | typedef struct dmu_sendarg { | |
259 | list_node_t dsa_link; | |
260 | dmu_replay_record_t *dsa_drr; | |
261 | vnode_t *dsa_vp; | |
262 | int dsa_outfd; | |
263 | proc_t *dsa_proc; | |
264 | offset_t *dsa_off; | |
265 | objset_t *dsa_os; | |
266 | zio_cksum_t dsa_zc; | |
267 | uint64_t dsa_toguid; | |
caf9dd20 | 268 | uint64_t dsa_fromtxg; |
37abac6d BP |
269 | int dsa_err; |
270 | dmu_pendop_t dsa_pending_op; | |
9b67f605 | 271 | uint64_t dsa_featureflags; |
ea97f8ce MA |
272 | uint64_t dsa_last_data_object; |
273 | uint64_t dsa_last_data_offset; | |
47dfff3b MA |
274 | uint64_t dsa_resume_object; |
275 | uint64_t dsa_resume_offset; | |
51907a31 K |
276 | boolean_t dsa_sent_begin; |
277 | boolean_t dsa_sent_end; | |
37abac6d BP |
278 | } dmu_sendarg_t; |
279 | ||
fa86b5db MA |
280 | void dmu_object_zapify(objset_t *, uint64_t, dmu_object_type_t, dmu_tx_t *); |
281 | void dmu_object_free_zapified(objset_t *, uint64_t, dmu_tx_t *); | |
9b67f605 MA |
282 | int dmu_buf_hold_noread(objset_t *, uint64_t, uint64_t, |
283 | void *, dmu_buf_t **); | |
fa86b5db | 284 | |
34dc7c2f BB |
285 | #ifdef __cplusplus |
286 | } | |
287 | #endif | |
288 | ||
289 | #endif /* _SYS_DMU_IMPL_H */ |