4 * The contents of this file are subject to the terms of the
5 * Common Development and Distribution License (the "License").
6 * You may not use this file except in compliance with the License.
8 * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
9 * or http://www.opensolaris.org/os/licensing.
10 * See the License for the specific language governing permissions
11 * and limitations under the License.
13 * When distributing Covered Code, include this CDDL HEADER in each
14 * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
15 * If applicable, add the following below this CDDL HEADER, with the
16 * fields enclosed by brackets "[]" replaced with your own identifying
17 * information: Portions Copyright [yyyy] [name of copyright owner]
22 * Copyright 2009 Sun Microsystems, Inc. All rights reserved.
23 * Use is subject to license terms.
27 #include <stdio_ext.h>
30 #include <sys/zfs_context.h>
32 #include <sys/spa_impl.h>
35 #include <sys/fs/zfs.h>
36 #include <sys/zfs_znode.h>
38 #include <sys/vdev_impl.h>
39 #include <sys/metaslab_impl.h>
40 #include <sys/dmu_objset.h>
41 #include <sys/dsl_dir.h>
42 #include <sys/dsl_dataset.h>
43 #include <sys/dsl_pool.h>
46 #include <sys/zil_impl.h>
48 #include <sys/resource.h>
49 #include <sys/dmu_traverse.h>
50 #include <sys/zio_checksum.h>
51 #include <sys/zio_compress.h>
52 #include <sys/zfs_fuid.h>
58 const char cmdname
[] = "zdb";
59 uint8_t dump_opt
[256];
61 typedef void object_viewer_t(objset_t
*, uint64_t, void *data
, size_t size
);
63 extern void dump_intent_log(zilog_t
*);
64 uint64_t *zopt_object
= NULL
;
66 libzfs_handle_t
*g_zfs
;
67 boolean_t zdb_sig_user_data
= B_TRUE
;
68 int zdb_sig_cksumalg
= ZIO_CHECKSUM_SHA256
;
71 * These libumem hooks provide a reasonable set of defaults for the allocator's
72 * debugging facilities.
77 return ("default,verbose"); /* $UMEM_DEBUG setting */
81 _umem_logging_init(void)
83 return ("fail,contents"); /* $UMEM_LOGGING setting */
89 (void) fprintf(stderr
,
90 "Usage: %s [-udibcsvL] [-U cachefile_path] [-t txg]\n"
91 "\t [-S user:cksumalg] "
92 "dataset [object...]\n"
95 " %s -R pool:vdev:offset:size:flags\n"
96 " %s [-p path_to_vdev_dir]\n"
97 " %s -e pool | GUID | devid ...\n",
98 cmdname
, cmdname
, cmdname
, cmdname
, cmdname
, cmdname
);
100 (void) fprintf(stderr
, " -u uberblock\n");
101 (void) fprintf(stderr
, " -d datasets\n");
102 (void) fprintf(stderr
, " -C cached pool configuration\n");
103 (void) fprintf(stderr
, " -i intent logs\n");
104 (void) fprintf(stderr
, " -b block statistics\n");
105 (void) fprintf(stderr
, " -m metaslabs\n");
106 (void) fprintf(stderr
, " -c checksum all metadata (twice for "
107 "all data) blocks\n");
108 (void) fprintf(stderr
, " -s report stats on zdb's I/O\n");
109 (void) fprintf(stderr
, " -S <user|all>:<cksum_alg|all> -- "
110 "dump blkptr signatures\n");
111 (void) fprintf(stderr
, " -v verbose (applies to all others)\n");
112 (void) fprintf(stderr
, " -l dump label contents\n");
113 (void) fprintf(stderr
, " -L disable leak tracking (do not "
114 "load spacemaps)\n");
115 (void) fprintf(stderr
, " -U cachefile_path -- use alternate "
117 (void) fprintf(stderr
, " -R read and display block from a "
119 (void) fprintf(stderr
, " -e Pool is exported/destroyed/"
121 (void) fprintf(stderr
, " -p <Path to vdev dir> (use with -e)\n");
122 (void) fprintf(stderr
, " -t <txg> highest txg to use when "
123 "searching for uberblocks\n");
124 (void) fprintf(stderr
, "Specify an option more than once (e.g. -bb) "
125 "to make only that option verbose\n");
126 (void) fprintf(stderr
, "Default is to dump everything non-verbosely\n");
131 * Called for usage errors that are discovered after a call to spa_open(),
132 * dmu_bonus_hold(), or pool_match(). abort() is called for other errors.
136 fatal(const char *fmt
, ...)
141 (void) fprintf(stderr
, "%s: ", cmdname
);
142 (void) vfprintf(stderr
, fmt
, ap
);
144 (void) fprintf(stderr
, "\n");
150 dump_nvlist(nvlist_t
*list
, int indent
)
152 nvpair_t
*elem
= NULL
;
154 while ((elem
= nvlist_next_nvpair(list
, elem
)) != NULL
) {
155 switch (nvpair_type(elem
)) {
156 case DATA_TYPE_STRING
:
160 VERIFY(nvpair_value_string(elem
, &value
) == 0);
161 (void) printf("%*s%s='%s'\n", indent
, "",
162 nvpair_name(elem
), value
);
166 case DATA_TYPE_UINT64
:
170 VERIFY(nvpair_value_uint64(elem
, &value
) == 0);
171 (void) printf("%*s%s=%llu\n", indent
, "",
172 nvpair_name(elem
), (u_longlong_t
)value
);
176 case DATA_TYPE_NVLIST
:
180 VERIFY(nvpair_value_nvlist(elem
, &value
) == 0);
181 (void) printf("%*s%s\n", indent
, "",
183 dump_nvlist(value
, indent
+ 4);
187 case DATA_TYPE_NVLIST_ARRAY
:
192 VERIFY(nvpair_value_nvlist_array(elem
, &value
,
195 for (c
= 0; c
< count
; c
++) {
196 (void) printf("%*s%s[%u]\n", indent
, "",
197 nvpair_name(elem
), c
);
198 dump_nvlist(value
[c
], indent
+ 8);
205 (void) printf("bad config type %d for %s\n",
206 nvpair_type(elem
), nvpair_name(elem
));
213 dump_packed_nvlist(objset_t
*os
, uint64_t object
, void *data
, size_t size
)
216 size_t nvsize
= *(uint64_t *)data
;
217 char *packed
= umem_alloc(nvsize
, UMEM_NOFAIL
);
219 VERIFY(0 == dmu_read(os
, object
, 0, nvsize
, packed
, DMU_READ_PREFETCH
));
221 VERIFY(nvlist_unpack(packed
, nvsize
, &nv
, 0) == 0);
223 umem_free(packed
, nvsize
);
230 const char dump_zap_stars
[] = "****************************************";
231 const int dump_zap_width
= sizeof (dump_zap_stars
) - 1;
/*
 * Print one row per histogram bucket, from the lowest to the highest
 * non-empty index, as "<index>: <count> <bar of stars>".
 *
 * histo - array of ZAP_HISTOGRAM_SIZE bucket counts.
 *
 * NOTE(review): the declarations of i, maxidx and max and the statements
 * that update them inside the first loop are not visible in this listing;
 * max is presumably the largest bucket value -- confirm against the full
 * source.
 */
234 dump_zap_histogram(uint64_t histo
[ZAP_HISTOGRAM_SIZE
])
237 int minidx
= ZAP_HISTOGRAM_SIZE
- 1;
241 for (i
= 0; i
< ZAP_HISTOGRAM_SIZE
; i
++) {
244 if (histo
[i
] > 0 && i
> maxidx
)
246 if (histo
[i
] > 0 && i
< minidx
)
/*
 * Never scale against less than the bar width: with max clamped up to
 * dump_zap_width the index expression below cannot divide by zero.
 */
250 if (max
< dump_zap_width
)
251 max
= dump_zap_width
;
253 for (i
= minidx
; i
<= maxidx
; i
++)
/*
 * The bar is a suffix of dump_zap_stars: starting further into the string
 * leaves fewer stars, so the visible length grows with histo[i] / max.
 */
254 (void) printf("\t\t\t%u: %6llu %s\n", i
, (u_longlong_t
)histo
[i
],
255 &dump_zap_stars
[(max
- histo
[i
]) * dump_zap_width
/ max
]);
259 dump_zap_stats(objset_t
*os
, uint64_t object
)
264 error
= zap_get_stats(os
, object
, &zs
);
268 if (zs
.zs_ptrtbl_len
== 0) {
269 ASSERT(zs
.zs_num_blocks
== 1);
270 (void) printf("\tmicrozap: %llu bytes, %llu entries\n",
271 (u_longlong_t
)zs
.zs_blocksize
,
272 (u_longlong_t
)zs
.zs_num_entries
);
276 (void) printf("\tFat ZAP stats:\n");
278 (void) printf("\t\tPointer table:\n");
279 (void) printf("\t\t\t%llu elements\n",
280 (u_longlong_t
)zs
.zs_ptrtbl_len
);
281 (void) printf("\t\t\tzt_blk: %llu\n",
282 (u_longlong_t
)zs
.zs_ptrtbl_zt_blk
);
283 (void) printf("\t\t\tzt_numblks: %llu\n",
284 (u_longlong_t
)zs
.zs_ptrtbl_zt_numblks
);
285 (void) printf("\t\t\tzt_shift: %llu\n",
286 (u_longlong_t
)zs
.zs_ptrtbl_zt_shift
);
287 (void) printf("\t\t\tzt_blks_copied: %llu\n",
288 (u_longlong_t
)zs
.zs_ptrtbl_blks_copied
);
289 (void) printf("\t\t\tzt_nextblk: %llu\n",
290 (u_longlong_t
)zs
.zs_ptrtbl_nextblk
);
292 (void) printf("\t\tZAP entries: %llu\n",
293 (u_longlong_t
)zs
.zs_num_entries
);
294 (void) printf("\t\tLeaf blocks: %llu\n",
295 (u_longlong_t
)zs
.zs_num_leafs
);
296 (void) printf("\t\tTotal blocks: %llu\n",
297 (u_longlong_t
)zs
.zs_num_blocks
);
298 (void) printf("\t\tzap_block_type: 0x%llx\n",
299 (u_longlong_t
)zs
.zs_block_type
);
300 (void) printf("\t\tzap_magic: 0x%llx\n",
301 (u_longlong_t
)zs
.zs_magic
);
302 (void) printf("\t\tzap_salt: 0x%llx\n",
303 (u_longlong_t
)zs
.zs_salt
);
305 (void) printf("\t\tLeafs with 2^n pointers:\n");
306 dump_zap_histogram(zs
.zs_leafs_with_2n_pointers
);
308 (void) printf("\t\tBlocks with n*5 entries:\n");
309 dump_zap_histogram(zs
.zs_blocks_with_n5_entries
);
311 (void) printf("\t\tBlocks n/10 full:\n");
312 dump_zap_histogram(zs
.zs_blocks_n_tenths_full
);
314 (void) printf("\t\tEntries with n chunks:\n");
315 dump_zap_histogram(zs
.zs_entries_using_n_chunks
);
317 (void) printf("\t\tBuckets with n entries:\n");
318 dump_zap_histogram(zs
.zs_buckets_with_n_entries
);
323 dump_none(objset_t
*os
, uint64_t object
, void *data
, size_t size
)
329 dump_uint8(objset_t
*os
, uint64_t object
, void *data
, size_t size
)
335 dump_uint64(objset_t
*os
, uint64_t object
, void *data
, size_t size
)
341 dump_zap(objset_t
*os
, uint64_t object
, void *data
, size_t size
)
344 zap_attribute_t attr
;
348 dump_zap_stats(os
, object
);
351 for (zap_cursor_init(&zc
, os
, object
);
352 zap_cursor_retrieve(&zc
, &attr
) == 0;
353 zap_cursor_advance(&zc
)) {
354 (void) printf("\t\t%s = ", attr
.za_name
);
355 if (attr
.za_num_integers
== 0) {
359 prop
= umem_zalloc(attr
.za_num_integers
*
360 attr
.za_integer_length
, UMEM_NOFAIL
);
361 (void) zap_lookup(os
, object
, attr
.za_name
,
362 attr
.za_integer_length
, attr
.za_num_integers
, prop
);
363 if (attr
.za_integer_length
== 1) {
364 (void) printf("%s", (char *)prop
);
366 for (i
= 0; i
< attr
.za_num_integers
; i
++) {
367 switch (attr
.za_integer_length
) {
370 ((uint16_t *)prop
)[i
]);
374 ((uint32_t *)prop
)[i
]);
377 (void) printf("%lld ",
378 (u_longlong_t
)((int64_t *)prop
)[i
]);
384 umem_free(prop
, attr
.za_num_integers
* attr
.za_integer_length
);
386 zap_cursor_fini(&zc
);
391 dump_zpldir(objset_t
*os
, uint64_t object
, void *data
, size_t size
)
394 zap_attribute_t attr
;
395 const char *typenames
[] = {
396 /* 0 */ "not specified",
398 /* 2 */ "Character Device",
399 /* 3 */ "3 (invalid)",
401 /* 5 */ "5 (invalid)",
402 /* 6 */ "Block Device",
403 /* 7 */ "7 (invalid)",
404 /* 8 */ "Regular File",
405 /* 9 */ "9 (invalid)",
406 /* 10 */ "Symbolic Link",
407 /* 11 */ "11 (invalid)",
410 /* 14 */ "Event Port",
411 /* 15 */ "15 (invalid)",
414 dump_zap_stats(os
, object
);
417 for (zap_cursor_init(&zc
, os
, object
);
418 zap_cursor_retrieve(&zc
, &attr
) == 0;
419 zap_cursor_advance(&zc
)) {
420 (void) printf("\t\t%s = %lld (type: %s)\n",
421 attr
.za_name
, ZFS_DIRENT_OBJ(attr
.za_first_integer
),
422 typenames
[ZFS_DIRENT_TYPE(attr
.za_first_integer
)]);
424 zap_cursor_fini(&zc
);
428 dump_spacemap(objset_t
*os
, space_map_obj_t
*smo
, space_map_t
*sm
)
430 uint64_t alloc
, offset
, entry
;
431 uint8_t mapshift
= sm
->sm_shift
;
432 uint64_t mapstart
= sm
->sm_start
;
433 char *ddata
[] = { "ALLOC", "FREE", "CONDENSE", "INVALID",
434 "INVALID", "INVALID", "INVALID", "INVALID" };
436 if (smo
->smo_object
== 0)
440 * Print out the freelist entries in both encoded and decoded form.
443 for (offset
= 0; offset
< smo
->smo_objsize
; offset
+= sizeof (entry
)) {
444 VERIFY(0 == dmu_read(os
, smo
->smo_object
, offset
,
445 sizeof (entry
), &entry
, DMU_READ_PREFETCH
));
446 if (SM_DEBUG_DECODE(entry
)) {
447 (void) printf("\t\t[%4llu] %s: txg %llu, pass %llu\n",
448 (u_longlong_t
)(offset
/ sizeof (entry
)),
449 ddata
[SM_DEBUG_ACTION_DECODE(entry
)],
450 (u_longlong_t
)SM_DEBUG_TXG_DECODE(entry
),
451 (u_longlong_t
)SM_DEBUG_SYNCPASS_DECODE(entry
));
453 (void) printf("\t\t[%4llu] %c range:"
454 " %08llx-%08llx size: %06llx\n",
455 (u_longlong_t
)(offset
/ sizeof (entry
)),
456 SM_TYPE_DECODE(entry
) == SM_ALLOC
? 'A' : 'F',
457 (u_longlong_t
)((SM_OFFSET_DECODE(entry
) <<
458 mapshift
) + mapstart
),
459 (u_longlong_t
)((SM_OFFSET_DECODE(entry
) <<
460 mapshift
) + mapstart
+ (SM_RUN_DECODE(entry
) <<
462 (u_longlong_t
)(SM_RUN_DECODE(entry
) << mapshift
));
463 if (SM_TYPE_DECODE(entry
) == SM_ALLOC
)
464 alloc
+= SM_RUN_DECODE(entry
) << mapshift
;
466 alloc
-= SM_RUN_DECODE(entry
) << mapshift
;
469 if (alloc
!= smo
->smo_alloc
) {
470 (void) printf("space_map_object alloc (%llu) INCONSISTENT "
471 "with space map summary (%llu)\n",
472 (u_longlong_t
)smo
->smo_alloc
, (u_longlong_t
)alloc
);
477 dump_metaslab_stats(metaslab_t
*msp
)
480 space_map_t
*sm
= &msp
->ms_map
;
481 avl_tree_t
*t
= sm
->sm_pp_root
;
482 int free_pct
= sm
->sm_space
* 100 / sm
->sm_size
;
484 nicenum(space_map_maxsize(sm
), maxbuf
);
486 (void) printf("\t %20s %10lu %7s %6s %4s %4d%%\n",
487 "segments", avl_numnodes(t
), "maxsize", maxbuf
,
488 "freepct", free_pct
);
492 dump_metaslab(metaslab_t
*msp
)
495 space_map_obj_t
*smo
= &msp
->ms_smo
;
496 vdev_t
*vd
= msp
->ms_group
->mg_vd
;
497 spa_t
*spa
= vd
->vdev_spa
;
499 nicenum(msp
->ms_map
.sm_size
- smo
->smo_alloc
, freebuf
);
502 "\tvdev %5llu offset %12llx spacemap %6llu free %5s\n",
503 (u_longlong_t
)vd
->vdev_id
, (u_longlong_t
)msp
->ms_map
.sm_start
,
504 (u_longlong_t
)smo
->smo_object
, freebuf
);
506 if (dump_opt
['m'] > 1) {
507 mutex_enter(&msp
->ms_lock
);
508 VERIFY(space_map_load(&msp
->ms_map
, zfs_metaslab_ops
,
509 SM_FREE
, &msp
->ms_smo
, spa
->spa_meta_objset
) == 0);
510 dump_metaslab_stats(msp
);
511 space_map_unload(&msp
->ms_map
);
512 mutex_exit(&msp
->ms_lock
);
515 if (dump_opt
['d'] > 5 || dump_opt
['m'] > 2) {
516 ASSERT(msp
->ms_map
.sm_size
== (1ULL << vd
->vdev_ms_shift
));
518 mutex_enter(&msp
->ms_lock
);
519 dump_spacemap(spa
->spa_meta_objset
, smo
, &msp
->ms_map
);
520 mutex_exit(&msp
->ms_lock
);
526 dump_metaslabs(spa_t
*spa
)
528 vdev_t
*rvd
= spa
->spa_root_vdev
;
532 (void) printf("\nMetaslabs:\n");
534 for (c
= 0; c
< rvd
->vdev_children
; c
++) {
535 vd
= rvd
->vdev_child
[c
];
537 (void) printf("\t%-10s %-19s %-15s %-10s\n",
538 "vdev", "offset", "spacemap", "free");
539 (void) printf("\t%10s %19s %15s %10s\n",
540 "----------", "-------------------",
541 "---------------", "-------------");
543 for (m
= 0; m
< vd
->vdev_ms_count
; m
++)
544 dump_metaslab(vd
->vdev_ms
[m
]);
/*
 * Print one segment in the form "<prefix> [a,b) length n".
 *
 * The first argument is not used as a space map here: it is reinterpreted
 * as the prefix string that is printed ahead of the range (dump_dtl()
 * passes its formatted prefix buffer as the walk argument).
 *
 * start, size - segment start and length; the upper bound printed is
 *               start + size.
 */
550 dump_dtl_seg(space_map_t
*sm
, uint64_t start
, uint64_t size
)
/* Recover the prefix string that was passed through the space_map_t slot. */
552 char *prefix
= (void *)sm
;
554 (void) printf("%s [%llu,%llu) length %llu\n",
557 (u_longlong_t
)(start
+ size
),
558 (u_longlong_t
)(size
));
562 dump_dtl(vdev_t
*vd
, int indent
)
564 spa_t
*spa
= vd
->vdev_spa
;
566 char *name
[DTL_TYPES
] = { "missing", "partial", "scrub", "outage" };
569 spa_vdev_state_enter(spa
);
570 required
= vdev_dtl_required(vd
);
571 (void) spa_vdev_state_exit(spa
, NULL
, 0);
574 (void) printf("\nDirty time logs:\n\n");
576 (void) printf("\t%*s%s [%s]\n", indent
, "",
577 vd
->vdev_path
? vd
->vdev_path
:
578 vd
->vdev_parent
? vd
->vdev_ops
->vdev_op_type
: spa_name(spa
),
579 required
? "DTL-required" : "DTL-expendable");
581 for (int t
= 0; t
< DTL_TYPES
; t
++) {
582 space_map_t
*sm
= &vd
->vdev_dtl
[t
];
583 if (sm
->sm_space
== 0)
585 (void) snprintf(prefix
, sizeof (prefix
), "\t%*s%s",
586 indent
+ 2, "", name
[t
]);
587 mutex_enter(sm
->sm_lock
);
588 space_map_walk(sm
, dump_dtl_seg
, (void *)prefix
);
589 mutex_exit(sm
->sm_lock
);
590 if (dump_opt
['d'] > 5 && vd
->vdev_children
== 0)
591 dump_spacemap(spa
->spa_meta_objset
,
592 &vd
->vdev_dtl_smo
, sm
);
595 for (int c
= 0; c
< vd
->vdev_children
; c
++)
596 dump_dtl(vd
->vdev_child
[c
], indent
+ 4);
601 dump_dnode(objset_t
*os
, uint64_t object
, void *data
, size_t size
)
606 blkid2offset(const dnode_phys_t
*dnp
, int level
, uint64_t blkid
)
611 return ((blkid
<< (level
* (dnp
->dn_indblkshift
- SPA_BLKPTRSHIFT
))) *
612 dnp
->dn_datablkszsec
<< SPA_MINBLOCKSHIFT
);
616 sprintf_blkptr_compact(char *blkbuf
, blkptr_t
*bp
, int alldvas
)
618 dva_t
*dva
= bp
->blk_dva
;
619 int ndvas
= alldvas
? BP_GET_NDVAS(bp
) : 1;
624 for (i
= 0; i
< ndvas
; i
++)
625 (void) sprintf(blkbuf
+ strlen(blkbuf
), "%llu:%llx:%llx ",
626 (u_longlong_t
)DVA_GET_VDEV(&dva
[i
]),
627 (u_longlong_t
)DVA_GET_OFFSET(&dva
[i
]),
628 (u_longlong_t
)DVA_GET_ASIZE(&dva
[i
]));
630 (void) sprintf(blkbuf
+ strlen(blkbuf
), "%llxL/%llxP F=%llu B=%llu",
631 (u_longlong_t
)BP_GET_LSIZE(bp
),
632 (u_longlong_t
)BP_GET_PSIZE(bp
),
633 (u_longlong_t
)bp
->blk_fill
,
634 (u_longlong_t
)bp
->blk_birth
);
638 print_indirect(blkptr_t
*bp
, const zbookmark_t
*zb
,
639 const dnode_phys_t
*dnp
)
641 char blkbuf
[BP_SPRINTF_LEN
];
644 ASSERT3U(BP_GET_TYPE(bp
), ==, dnp
->dn_type
);
645 ASSERT3U(BP_GET_LEVEL(bp
), ==, zb
->zb_level
);
647 (void) printf("%16llx ",
648 (u_longlong_t
)blkid2offset(dnp
, zb
->zb_level
, zb
->zb_blkid
));
650 ASSERT(zb
->zb_level
>= 0);
652 for (l
= dnp
->dn_nlevels
- 1; l
>= -1; l
--) {
653 if (l
== zb
->zb_level
) {
654 (void) printf("L%llx", (u_longlong_t
)zb
->zb_level
);
660 sprintf_blkptr_compact(blkbuf
, bp
, dump_opt
['d'] > 5 ? 1 : 0);
661 (void) printf("%s\n", blkbuf
);
664 #define SET_BOOKMARK(zb, objset, object, level, blkid) \
666 (zb)->zb_objset = objset; \
667 (zb)->zb_object = object; \
668 (zb)->zb_level = level; \
669 (zb)->zb_blkid = blkid; \
673 visit_indirect(spa_t
*spa
, const dnode_phys_t
*dnp
,
674 blkptr_t
*bp
, const zbookmark_t
*zb
)
678 if (bp
->blk_birth
== 0)
681 print_indirect(bp
, zb
, dnp
);
683 if (BP_GET_LEVEL(bp
) > 0) {
684 uint32_t flags
= ARC_WAIT
;
687 int epb
= BP_GET_LSIZE(bp
) >> SPA_BLKPTRSHIFT
;
691 err
= arc_read_nolock(NULL
, spa
, bp
, arc_getbuf_func
, &buf
,
692 ZIO_PRIORITY_ASYNC_READ
, ZIO_FLAG_CANFAIL
, &flags
, zb
);
696 /* recursively visit blocks below this */
698 for (i
= 0; i
< epb
; i
++, cbp
++) {
701 SET_BOOKMARK(&czb
, zb
->zb_objset
, zb
->zb_object
,
703 zb
->zb_blkid
* epb
+ i
);
704 err
= visit_indirect(spa
, dnp
, cbp
, &czb
);
707 fill
+= cbp
->blk_fill
;
710 ASSERT3U(fill
, ==, bp
->blk_fill
);
711 (void) arc_buf_remove_ref(buf
, &buf
);
719 dump_indirect(dnode_t
*dn
)
721 dnode_phys_t
*dnp
= dn
->dn_phys
;
725 (void) printf("Indirect blocks:\n");
727 SET_BOOKMARK(&czb
, dmu_objset_id(&dn
->dn_objset
->os
),
728 dn
->dn_object
, dnp
->dn_nlevels
- 1, 0);
729 for (j
= 0; j
< dnp
->dn_nblkptr
; j
++) {
731 (void) visit_indirect(dmu_objset_spa(&dn
->dn_objset
->os
), dnp
,
732 &dnp
->dn_blkptr
[j
], &czb
);
740 dump_dsl_dir(objset_t
*os
, uint64_t object
, void *data
, size_t size
)
742 dsl_dir_phys_t
*dd
= data
;
749 ASSERT3U(size
, >=, sizeof (dsl_dir_phys_t
));
751 crtime
= dd
->dd_creation_time
;
752 (void) printf("\t\tcreation_time = %s", ctime(&crtime
));
753 (void) printf("\t\thead_dataset_obj = %llu\n",
754 (u_longlong_t
)dd
->dd_head_dataset_obj
);
755 (void) printf("\t\tparent_dir_obj = %llu\n",
756 (u_longlong_t
)dd
->dd_parent_obj
);
757 (void) printf("\t\torigin_obj = %llu\n",
758 (u_longlong_t
)dd
->dd_origin_obj
);
759 (void) printf("\t\tchild_dir_zapobj = %llu\n",
760 (u_longlong_t
)dd
->dd_child_dir_zapobj
);
761 nicenum(dd
->dd_used_bytes
, nice
);
762 (void) printf("\t\tused_bytes = %s\n", nice
);
763 nicenum(dd
->dd_compressed_bytes
, nice
);
764 (void) printf("\t\tcompressed_bytes = %s\n", nice
);
765 nicenum(dd
->dd_uncompressed_bytes
, nice
);
766 (void) printf("\t\tuncompressed_bytes = %s\n", nice
);
767 nicenum(dd
->dd_quota
, nice
);
768 (void) printf("\t\tquota = %s\n", nice
);
769 nicenum(dd
->dd_reserved
, nice
);
770 (void) printf("\t\treserved = %s\n", nice
);
771 (void) printf("\t\tprops_zapobj = %llu\n",
772 (u_longlong_t
)dd
->dd_props_zapobj
);
773 (void) printf("\t\tdeleg_zapobj = %llu\n",
774 (u_longlong_t
)dd
->dd_deleg_zapobj
);
775 (void) printf("\t\tflags = %llx\n",
776 (u_longlong_t
)dd
->dd_flags
);
779 nicenum(dd->dd_used_breakdown[DD_USED_ ## which], nice); \
780 (void) printf("\t\tused_breakdown[" #which "] = %s\n", nice)
791 dump_dsl_dataset(objset_t
*os
, uint64_t object
, void *data
, size_t size
)
793 dsl_dataset_phys_t
*ds
= data
;
795 char used
[6], compressed
[6], uncompressed
[6], unique
[6];
796 char blkbuf
[BP_SPRINTF_LEN
];
801 ASSERT(size
== sizeof (*ds
));
802 crtime
= ds
->ds_creation_time
;
803 nicenum(ds
->ds_used_bytes
, used
);
804 nicenum(ds
->ds_compressed_bytes
, compressed
);
805 nicenum(ds
->ds_uncompressed_bytes
, uncompressed
);
806 nicenum(ds
->ds_unique_bytes
, unique
);
807 sprintf_blkptr(blkbuf
, BP_SPRINTF_LEN
, &ds
->ds_bp
);
809 (void) printf("\t\tdir_obj = %llu\n",
810 (u_longlong_t
)ds
->ds_dir_obj
);
811 (void) printf("\t\tprev_snap_obj = %llu\n",
812 (u_longlong_t
)ds
->ds_prev_snap_obj
);
813 (void) printf("\t\tprev_snap_txg = %llu\n",
814 (u_longlong_t
)ds
->ds_prev_snap_txg
);
815 (void) printf("\t\tnext_snap_obj = %llu\n",
816 (u_longlong_t
)ds
->ds_next_snap_obj
);
817 (void) printf("\t\tsnapnames_zapobj = %llu\n",
818 (u_longlong_t
)ds
->ds_snapnames_zapobj
);
819 (void) printf("\t\tnum_children = %llu\n",
820 (u_longlong_t
)ds
->ds_num_children
);
821 (void) printf("\t\tuserrefs_obj = %llu\n",
822 (u_longlong_t
)ds
->ds_userrefs_obj
);
823 (void) printf("\t\tcreation_time = %s", ctime(&crtime
));
824 (void) printf("\t\tcreation_txg = %llu\n",
825 (u_longlong_t
)ds
->ds_creation_txg
);
826 (void) printf("\t\tdeadlist_obj = %llu\n",
827 (u_longlong_t
)ds
->ds_deadlist_obj
);
828 (void) printf("\t\tused_bytes = %s\n", used
);
829 (void) printf("\t\tcompressed_bytes = %s\n", compressed
);
830 (void) printf("\t\tuncompressed_bytes = %s\n", uncompressed
);
831 (void) printf("\t\tunique = %s\n", unique
);
832 (void) printf("\t\tfsid_guid = %llu\n",
833 (u_longlong_t
)ds
->ds_fsid_guid
);
834 (void) printf("\t\tguid = %llu\n",
835 (u_longlong_t
)ds
->ds_guid
);
836 (void) printf("\t\tflags = %llx\n",
837 (u_longlong_t
)ds
->ds_flags
);
838 (void) printf("\t\tnext_clones_obj = %llu\n",
839 (u_longlong_t
)ds
->ds_next_clones_obj
);
840 (void) printf("\t\tprops_obj = %llu\n",
841 (u_longlong_t
)ds
->ds_props_obj
);
842 (void) printf("\t\tbp = %s\n", blkbuf
);
846 dump_bplist(objset_t
*mos
, uint64_t object
, char *name
)
848 bplist_t bpl
= { 0 };
849 blkptr_t blk
, *bp
= &blk
;
855 if (dump_opt
['d'] < 3)
858 mutex_init(&bpl
.bpl_lock
, NULL
, MUTEX_DEFAULT
, NULL
);
859 VERIFY(0 == bplist_open(&bpl
, mos
, object
));
860 if (bplist_empty(&bpl
)) {
862 mutex_destroy(&bpl
.bpl_lock
);
866 nicenum(bpl
.bpl_phys
->bpl_bytes
, bytes
);
867 if (bpl
.bpl_dbuf
->db_size
== sizeof (bplist_phys_t
)) {
868 nicenum(bpl
.bpl_phys
->bpl_comp
, comp
);
869 nicenum(bpl
.bpl_phys
->bpl_uncomp
, uncomp
);
870 (void) printf("\n %s: %llu entries, %s (%s/%s comp)\n",
871 name
, (u_longlong_t
)bpl
.bpl_phys
->bpl_entries
,
872 bytes
, comp
, uncomp
);
874 (void) printf("\n %s: %llu entries, %s\n",
875 name
, (u_longlong_t
)bpl
.bpl_phys
->bpl_entries
, bytes
);
878 if (dump_opt
['d'] < 5) {
880 mutex_destroy(&bpl
.bpl_lock
);
886 while (bplist_iterate(&bpl
, &itor
, bp
) == 0) {
887 char blkbuf
[BP_SPRINTF_LEN
];
889 ASSERT(bp
->blk_birth
!= 0);
890 sprintf_blkptr_compact(blkbuf
, bp
, dump_opt
['d'] > 5 ? 1 : 0);
891 (void) printf("\tItem %3llu: %s\n",
892 (u_longlong_t
)itor
- 1, blkbuf
);
896 mutex_destroy(&bpl
.bpl_lock
);
899 static avl_tree_t idx_tree
;
900 static avl_tree_t domain_tree
;
901 static boolean_t fuid_table_loaded
;
906 if (fuid_table_loaded
) {
907 zfs_fuid_table_destroy(&idx_tree
, &domain_tree
);
908 fuid_table_loaded
= B_FALSE
;
913 * print uid or gid information.
914 * For normal POSIX id just the id is printed in decimal format.
915 * For CIFS files with FUID the fuid is printed in hex followed by
916 * the domain-rid string.
919 print_idstr(uint64_t id
, const char *id_type
)
921 if (FUID_INDEX(id
)) {
924 domain
= zfs_fuid_idx_domain(&idx_tree
, FUID_INDEX(id
));
925 (void) printf("\t%s %llx [%s-%d]\n", id_type
,
926 (u_longlong_t
)id
, domain
, (int)FUID_RID(id
));
928 (void) printf("\t%s %llu\n", id_type
, (u_longlong_t
)id
);
934 dump_uidgid(objset_t
*os
, znode_phys_t
*zp
)
936 uint32_t uid_idx
, gid_idx
;
938 uid_idx
= FUID_INDEX(zp
->zp_uid
);
939 gid_idx
= FUID_INDEX(zp
->zp_gid
);
941 /* Load domain table, if not already loaded */
942 if (!fuid_table_loaded
&& (uid_idx
|| gid_idx
)) {
945 /* first find the fuid object. It lives in the master node */
946 VERIFY(zap_lookup(os
, MASTER_NODE_OBJ
, ZFS_FUID_TABLES
,
947 8, 1, &fuid_obj
) == 0);
948 zfs_fuid_avl_tree_create(&idx_tree
, &domain_tree
);
949 (void) zfs_fuid_table_load(os
, fuid_obj
,
950 &idx_tree
, &domain_tree
);
951 fuid_table_loaded
= B_TRUE
;
954 print_idstr(zp
->zp_uid
, "uid");
955 print_idstr(zp
->zp_gid
, "gid");
960 dump_znode(objset_t
*os
, uint64_t object
, void *data
, size_t size
)
962 znode_phys_t
*zp
= data
;
963 time_t z_crtime
, z_atime
, z_mtime
, z_ctime
;
964 char path
[MAXPATHLEN
* 2]; /* allow for xattr and failure prefix */
967 ASSERT(size
>= sizeof (znode_phys_t
));
969 error
= zfs_obj_to_path(os
, object
, path
, sizeof (path
));
971 (void) snprintf(path
, sizeof (path
), "\?\?\?<object#%llu>",
972 (u_longlong_t
)object
);
975 if (dump_opt
['d'] < 3) {
976 (void) printf("\t%s\n", path
);
980 z_crtime
= (time_t)zp
->zp_crtime
[0];
981 z_atime
= (time_t)zp
->zp_atime
[0];
982 z_mtime
= (time_t)zp
->zp_mtime
[0];
983 z_ctime
= (time_t)zp
->zp_ctime
[0];
985 (void) printf("\tpath %s\n", path
);
987 (void) printf("\tatime %s", ctime(&z_atime
));
988 (void) printf("\tmtime %s", ctime(&z_mtime
));
989 (void) printf("\tctime %s", ctime(&z_ctime
));
990 (void) printf("\tcrtime %s", ctime(&z_crtime
));
991 (void) printf("\tgen %llu\n", (u_longlong_t
)zp
->zp_gen
);
992 (void) printf("\tmode %llo\n", (u_longlong_t
)zp
->zp_mode
);
993 (void) printf("\tsize %llu\n", (u_longlong_t
)zp
->zp_size
);
994 (void) printf("\tparent %llu\n", (u_longlong_t
)zp
->zp_parent
);
995 (void) printf("\tlinks %llu\n", (u_longlong_t
)zp
->zp_links
);
996 (void) printf("\txattr %llu\n", (u_longlong_t
)zp
->zp_xattr
);
997 (void) printf("\trdev 0x%016llx\n", (u_longlong_t
)zp
->zp_rdev
);
1002 dump_acl(objset_t
*os
, uint64_t object
, void *data
, size_t size
)
1008 dump_dmu_objset(objset_t
*os
, uint64_t object
, void *data
, size_t size
)
1012 static object_viewer_t
*object_viewer
[DMU_OT_NUMTYPES
] = {
1013 dump_none
, /* unallocated */
1014 dump_zap
, /* object directory */
1015 dump_uint64
, /* object array */
1016 dump_none
, /* packed nvlist */
1017 dump_packed_nvlist
, /* packed nvlist size */
1018 dump_none
, /* bplist */
1019 dump_none
, /* bplist header */
1020 dump_none
, /* SPA space map header */
1021 dump_none
, /* SPA space map */
1022 dump_none
, /* ZIL intent log */
1023 dump_dnode
, /* DMU dnode */
1024 dump_dmu_objset
, /* DMU objset */
1025 dump_dsl_dir
, /* DSL directory */
1026 dump_zap
, /* DSL directory child map */
1027 dump_zap
, /* DSL dataset snap map */
1028 dump_zap
, /* DSL props */
1029 dump_dsl_dataset
, /* DSL dataset */
1030 dump_znode
, /* ZFS znode */
1031 dump_acl
, /* ZFS V0 ACL */
1032 dump_uint8
, /* ZFS plain file */
1033 dump_zpldir
, /* ZFS directory */
1034 dump_zap
, /* ZFS master node */
1035 dump_zap
, /* ZFS delete queue */
1036 dump_uint8
, /* zvol object */
1037 dump_zap
, /* zvol prop */
1038 dump_uint8
, /* other uint8[] */
1039 dump_uint64
, /* other uint64[] */
1040 dump_zap
, /* other ZAP */
1041 dump_zap
, /* persistent error log */
1042 dump_uint8
, /* SPA history */
1043 dump_uint64
, /* SPA history offsets */
1044 dump_zap
, /* Pool properties */
1045 dump_zap
, /* DSL permissions */
1046 dump_acl
, /* ZFS ACL */
1047 dump_uint8
, /* ZFS SYSACL */
1048 dump_none
, /* FUID nvlist */
1049 dump_packed_nvlist
, /* FUID nvlist size */
1050 dump_zap
, /* DSL dataset next clones */
1051 dump_zap
, /* DSL scrub queue */
1052 dump_zap
, /* ZFS user/group used */
1053 dump_zap
, /* ZFS user/group quota */
1054 dump_zap
, /* snapshot refcount tags */
/*
 * Print a summary line for one object and, depending on verbosity, more
 * detail about it.
 *
 * os           - objset the object belongs to
 * object       - object number to dump
 * verbosity    - detail level; the thresholds visible here are > 3 (bonus
 *                line), >= 4 (dnode flags and maxblkid), >= 5 (segment
 *                list) and >= 6 (always show checksum/compression names)
 * print_header - a column header is printed when *print_header is non-zero
 *
 * NOTE(review): several lines of this function are not visible in this
 * listing, so the exact nesting of the steps below should be confirmed
 * against the full source.
 */
1058 dump_object(objset_t
*os
, uint64_t object
, int verbosity
, int *print_header
)
1060 dmu_buf_t
*db
= NULL
;
1061 dmu_object_info_t doi
;
1065 char iblk
[6], dblk
[6], lsize
[6], asize
[6], bonus_size
[6], segsize
[6];
1069 if (*print_header
) {
1070 (void) printf("\n Object lvl iblk dblk lsize"
/*
 * Two ways of obtaining the dnode follow: directly from the objset's meta
 * dnode, or through a bonus-buffer hold on the object (the condition that
 * selects between them is not visible here).
 */
1076 dn
= os
->os
->os_meta_dnode
;
1078 error
= dmu_bonus_hold(os
, object
, FTAG
, &db
);
1080 fatal("dmu_bonus_hold(%llu) failed, errno %u",
1082 bonus
= db
->db_data
;
1083 bsize
= db
->db_size
;
1084 dn
= ((dmu_buf_impl_t
*)db
)->db_dnode
;
1086 dmu_object_info_from_dnode(dn
, &doi
);
/* Format the size columns as short human-readable strings. */
1088 nicenum(doi
.doi_metadata_block_size
, iblk
);
1089 nicenum(doi
.doi_data_block_size
, dblk
);
1090 nicenum(doi
.doi_data_block_size
* (doi
.doi_max_block_offset
+ 1),
1092 nicenum(doi
.doi_physical_blks
<< 9, asize
);
1093 nicenum(doi
.doi_bonus_size
, bonus_size
);
/*
 * NOTE(review): both snprintf() calls below start writing at
 * aux + strlen(aux) but pass sizeof (aux) as the limit, so the bound does
 * not account for the bytes already used. The limit should be
 * sizeof (aux) - strlen(aux).
 */
1097 if (doi
.doi_checksum
!= ZIO_CHECKSUM_INHERIT
|| verbosity
>= 6) {
1098 (void) snprintf(aux
+ strlen(aux
), sizeof (aux
), " (K=%s)",
1099 zio_checksum_table
[doi
.doi_checksum
].ci_name
);
1102 if (doi
.doi_compress
!= ZIO_COMPRESS_INHERIT
|| verbosity
>= 6) {
1103 (void) snprintf(aux
+ strlen(aux
), sizeof (aux
), " (Z=%s)",
1104 zio_compress_table
[doi
.doi_compress
].ci_name
);
1107 (void) printf("%10lld %3u %5s %5s %5s %5s %s%s\n",
1108 (u_longlong_t
)object
, doi
.doi_indirection
, iblk
, dblk
, lsize
,
1109 asize
, dmu_ot
[doi
.doi_type
].ot_name
, aux
);
1111 if (doi
.doi_bonus_type
!= DMU_OT_NONE
&& verbosity
> 3) {
1112 (void) printf("%10s %3s %5s %5s %5s %5s %s\n",
1113 "", "", "", "", bonus_size
, "bonus",
1114 dmu_ot
[doi
.doi_bonus_type
].ot_name
);
1117 if (verbosity
>= 4) {
1118 (void) printf("\tdnode flags: %s%s\n",
1119 (dn
->dn_phys
->dn_flags
& DNODE_FLAG_USED_BYTES
) ?
1121 (dn
->dn_phys
->dn_flags
& DNODE_FLAG_USERUSED_ACCOUNTED
) ?
1122 "USERUSED_ACCOUNTED " : "");
1123 (void) printf("\tdnode maxblkid: %llu\n",
1124 (longlong_t
)dn
->dn_phys
->dn_maxblkid
);
/*
 * Dispatch to the per-type viewers: first the bonus buffer (with its data
 * and size), then the object itself (no buffer passed).
 */
1126 object_viewer
[doi
.doi_bonus_type
](os
, object
, bonus
, bsize
);
1127 object_viewer
[doi
.doi_type
](os
, object
, NULL
, 0);
1134 if (verbosity
>= 5) {
1136 * Report the list of segments that comprise the object.
1140 uint64_t blkfill
= 1;
1143 if (dn
->dn_type
== DMU_OT_DNODE
) {
1145 blkfill
= DNODES_PER_BLOCK
;
/*
 * Each segment is bounded by two dnode_next_offset() searches: one with no
 * flags to set start, one with DNODE_FIND_HOLE to set end (presumably the
 * next allocated offset and the next hole -- confirm).
 */
1149 error
= dnode_next_offset(dn
,
1150 0, &start
, minlvl
, blkfill
, 0);
1154 error
= dnode_next_offset(dn
,
1155 DNODE_FIND_HOLE
, &end
, minlvl
, blkfill
, 0);
1156 nicenum(end
- start
, segsize
);
1157 (void) printf("\t\tsegment [%016llx, %016llx)"
1158 " size %5s\n", (u_longlong_t
)start
,
1159 (u_longlong_t
)end
, segsize
);
/* Release db with the same tag that was passed to dmu_bonus_hold(). */
1167 dmu_buf_rele(db
, FTAG
);
1170 static char *objset_types
[DMU_OST_NUMTYPES
] = {
1171 "NONE", "META", "ZPL", "ZVOL", "OTHER", "ANY" };
1174 dump_dir(objset_t
*os
)
1176 dmu_objset_stats_t dds
;
1177 uint64_t object
, object_count
;
1178 uint64_t refdbytes
, usedobjs
, scratch
;
1180 char blkbuf
[BP_SPRINTF_LEN
+ 20];
1181 char osname
[MAXNAMELEN
];
1182 char *type
= "UNKNOWN";
1183 int verbosity
= dump_opt
['d'];
1184 int print_header
= 1;
1187 dmu_objset_fast_stat(os
, &dds
);
1189 if (dds
.dds_type
< DMU_OST_NUMTYPES
)
1190 type
= objset_types
[dds
.dds_type
];
1192 if (dds
.dds_type
== DMU_OST_META
) {
1193 dds
.dds_creation_txg
= TXG_INITIAL
;
1194 usedobjs
= os
->os
->os_rootbp
->blk_fill
;
1195 refdbytes
= os
->os
->os_spa
->spa_dsl_pool
->
1196 dp_mos_dir
->dd_phys
->dd_used_bytes
;
1198 dmu_objset_space(os
, &refdbytes
, &scratch
, &usedobjs
, &scratch
);
1201 ASSERT3U(usedobjs
, ==, os
->os
->os_rootbp
->blk_fill
);
1203 nicenum(refdbytes
, numbuf
);
1205 if (verbosity
>= 4) {
1206 (void) sprintf(blkbuf
+ strlen(blkbuf
), ", rootbp ");
1207 (void) sprintf_blkptr(blkbuf
+ strlen(blkbuf
),
1208 BP_SPRINTF_LEN
- strlen(blkbuf
), os
->os
->os_rootbp
);
1213 dmu_objset_name(os
, osname
);
1215 (void) printf("Dataset %s [%s], ID %llu, cr_txg %llu, "
1216 "%s, %llu objects%s\n",
1217 osname
, type
, (u_longlong_t
)dmu_objset_id(os
),
1218 (u_longlong_t
)dds
.dds_creation_txg
,
1219 numbuf
, (u_longlong_t
)usedobjs
, blkbuf
);
1221 dump_intent_log(dmu_objset_zil(os
));
1223 if (dmu_objset_ds(os
) != NULL
)
1224 dump_bplist(dmu_objset_pool(os
)->dp_meta_objset
,
1225 dmu_objset_ds(os
)->ds_phys
->ds_deadlist_obj
, "Deadlist");
1230 if (os
->os
->os_rootbp
->blk_birth
== 0)
1233 if (zopt_objects
!= 0) {
1234 for (i
= 0; i
< zopt_objects
; i
++)
1235 dump_object(os
, zopt_object
[i
], verbosity
,
1237 (void) printf("\n");
1241 dump_object(os
, 0, verbosity
, &print_header
);
1243 if (os
->os
->os_userused_dnode
&&
1244 os
->os
->os_userused_dnode
->dn_type
!= 0) {
1245 dump_object(os
, DMU_USERUSED_OBJECT
, verbosity
, &print_header
);
1246 dump_object(os
, DMU_GROUPUSED_OBJECT
, verbosity
, &print_header
);
1250 while ((error
= dmu_object_next(os
, &object
, B_FALSE
, 0)) == 0) {
1251 dump_object(os
, object
, verbosity
, &print_header
);
1255 ASSERT3U(object_count
, ==, usedobjs
);
1257 (void) printf("\n");
1259 if (error
!= ESRCH
) {
1260 (void) fprintf(stderr
, "dmu_object_next() = %d\n", error
);
1266 dump_uberblock(uberblock_t
*ub
)
1268 time_t timestamp
= ub
->ub_timestamp
;
1270 (void) printf("Uberblock\n\n");
1271 (void) printf("\tmagic = %016llx\n", (u_longlong_t
)ub
->ub_magic
);
1272 (void) printf("\tversion = %llu\n", (u_longlong_t
)ub
->ub_version
);
1273 (void) printf("\ttxg = %llu\n", (u_longlong_t
)ub
->ub_txg
);
1274 (void) printf("\tguid_sum = %llu\n", (u_longlong_t
)ub
->ub_guid_sum
);
1275 (void) printf("\ttimestamp = %llu UTC = %s",
1276 (u_longlong_t
)ub
->ub_timestamp
, asctime(localtime(×tamp
)));
1277 if (dump_opt
['u'] >= 3) {
1278 char blkbuf
[BP_SPRINTF_LEN
];
1279 sprintf_blkptr(blkbuf
, BP_SPRINTF_LEN
, &ub
->ub_rootbp
);
1280 (void) printf("\trootbp = %s\n", blkbuf
);
1282 (void) printf("\n");
1286 dump_config(const char *pool
)
1290 mutex_enter(&spa_namespace_lock
);
1291 while ((spa
= spa_next(spa
)) != NULL
) {
1293 (void) printf("%s\n", spa_name(spa
));
1294 if (pool
== NULL
|| strcmp(pool
, spa_name(spa
)) == 0)
1295 dump_nvlist(spa
->spa_config
, 4);
1297 mutex_exit(&spa_namespace_lock
);
1301 dump_cachefile(const char *cachefile
)
1304 struct stat64 statbuf
;
1308 if ((fd
= open64(cachefile
, O_RDONLY
)) < 0) {
1309 (void) printf("cannot open '%s': %s\n", cachefile
,
1314 if (fstat64(fd
, &statbuf
) != 0) {
1315 (void) printf("failed to stat '%s': %s\n", cachefile
,
1320 if ((buf
= malloc(statbuf
.st_size
)) == NULL
) {
1321 (void) fprintf(stderr
, "failed to allocate %llu bytes\n",
1322 (u_longlong_t
)statbuf
.st_size
);
1326 if (read(fd
, buf
, statbuf
.st_size
) != statbuf
.st_size
) {
1327 (void) fprintf(stderr
, "failed to read %llu bytes\n",
1328 (u_longlong_t
)statbuf
.st_size
);
1334 if (nvlist_unpack(buf
, statbuf
.st_size
, &config
, 0) != 0) {
1335 (void) fprintf(stderr
, "failed to unpack nvlist\n");
1341 dump_nvlist(config
, 0);
1343 nvlist_free(config
);
1347 dump_label(const char *dev
)
1351 char *buf
= label
.vl_vdev_phys
.vp_nvlist
;
1352 size_t buflen
= sizeof (label
.vl_vdev_phys
.vp_nvlist
);
1353 struct stat64 statbuf
;
1357 if ((fd
= open64(dev
, O_RDONLY
)) < 0) {
1358 (void) printf("cannot open '%s': %s\n", dev
, strerror(errno
));
1362 if (fstat64(fd
, &statbuf
) != 0) {
1363 (void) printf("failed to stat '%s': %s\n", dev
,
1368 psize
= statbuf
.st_size
;
1369 psize
= P2ALIGN(psize
, (uint64_t)sizeof (vdev_label_t
));
1371 for (l
= 0; l
< VDEV_LABELS
; l
++) {
1373 nvlist_t
*config
= NULL
;
1375 (void) printf("--------------------------------------------\n");
1376 (void) printf("LABEL %d\n", l
);
1377 (void) printf("--------------------------------------------\n");
1379 if (pread64(fd
, &label
, sizeof (label
),
1380 vdev_label_offset(psize
, l
, 0)) != sizeof (label
)) {
1381 (void) printf("failed to read label %d\n", l
);
1385 if (nvlist_unpack(buf
, buflen
, &config
, 0) != 0) {
1386 (void) printf("failed to unpack label %d\n", l
);
1389 dump_nvlist(config
, 4);
1390 nvlist_free(config
);
1396 dump_one_dir(char *dsname
, void *arg
)
1401 error
= dmu_objset_open(dsname
, DMU_OST_ANY
,
1402 DS_MODE_USER
| DS_MODE_READONLY
, &os
);
1404 (void) printf("Could not open %s\n", dsname
);
1408 dmu_objset_close(os
);
1409 fuid_table_destroy();
1414 zdb_leak(space_map_t
*sm
, uint64_t start
, uint64_t size
)
1416 vdev_t
*vd
= sm
->sm_ppd
;
1418 (void) printf("leaked space: vdev %llu, offset 0x%llx, size %llu\n",
1419 (u_longlong_t
)vd
->vdev_id
, (u_longlong_t
)start
, (u_longlong_t
)size
);
1424 zdb_space_map_load(space_map_t
*sm
)
1429 zdb_space_map_unload(space_map_t
*sm
)
1431 space_map_vacate(sm
, zdb_leak
, sm
);
1436 zdb_space_map_claim(space_map_t
*sm
, uint64_t start
, uint64_t size
)
1440 static space_map_ops_t zdb_space_map_ops
= {
1442 zdb_space_map_unload
,
1444 zdb_space_map_claim
,
1450 zdb_leak_init(spa_t
*spa
)
1452 vdev_t
*rvd
= spa
->spa_root_vdev
;
1454 for (int c
= 0; c
< rvd
->vdev_children
; c
++) {
1455 vdev_t
*vd
= rvd
->vdev_child
[c
];
1456 for (int m
= 0; m
< vd
->vdev_ms_count
; m
++) {
1457 metaslab_t
*msp
= vd
->vdev_ms
[m
];
1458 mutex_enter(&msp
->ms_lock
);
1459 VERIFY(space_map_load(&msp
->ms_map
, &zdb_space_map_ops
,
1460 SM_ALLOC
, &msp
->ms_smo
, spa
->spa_meta_objset
) == 0);
1461 msp
->ms_map
.sm_ppd
= vd
;
1462 mutex_exit(&msp
->ms_lock
);
1468 zdb_leak_fini(spa_t
*spa
)
1470 vdev_t
*rvd
= spa
->spa_root_vdev
;
1472 for (int c
= 0; c
< rvd
->vdev_children
; c
++) {
1473 vdev_t
*vd
= rvd
->vdev_child
[c
];
1474 for (int m
= 0; m
< vd
->vdev_ms_count
; m
++) {
1475 metaslab_t
*msp
= vd
->vdev_ms
[m
];
1476 mutex_enter(&msp
->ms_lock
);
1477 space_map_unload(&msp
->ms_map
);
1478 mutex_exit(&msp
->ms_lock
);
1484 * Verify that the sum of the sizes of all blocks in the pool adds up
1485 * to the SPA's sa_alloc total.
1487 typedef struct zdb_blkstats
{
1494 #define DMU_OT_DEFERRED DMU_OT_NONE
1495 #define DMU_OT_TOTAL DMU_OT_NUMTYPES
1497 #define ZB_TOTAL DN_MAX_LEVELS
1499 typedef struct zdb_cb
{
1500 zdb_blkstats_t zcb_type
[ZB_TOTAL
+ 1][DMU_OT_TOTAL
+ 1];
1501 uint64_t zcb_errors
[256];
1507 zdb_count_block(spa_t
*spa
, zdb_cb_t
*zcb
, blkptr_t
*bp
, dmu_object_type_t type
)
1509 for (int i
= 0; i
< 4; i
++) {
1510 int l
= (i
< 2) ? BP_GET_LEVEL(bp
) : ZB_TOTAL
;
1511 int t
= (i
& 1) ? type
: DMU_OT_TOTAL
;
1512 zdb_blkstats_t
*zb
= &zcb
->zcb_type
[l
][t
];
1514 zb
->zb_asize
+= BP_GET_ASIZE(bp
);
1515 zb
->zb_lsize
+= BP_GET_LSIZE(bp
);
1516 zb
->zb_psize
+= BP_GET_PSIZE(bp
);
1520 if (dump_opt
['S']) {
1521 boolean_t print_sig
;
1523 print_sig
= !zdb_sig_user_data
|| (BP_GET_LEVEL(bp
) == 0 &&
1524 BP_GET_TYPE(bp
) == DMU_OT_PLAIN_FILE_CONTENTS
);
1526 if (BP_GET_CHECKSUM(bp
) < zdb_sig_cksumalg
)
1527 print_sig
= B_FALSE
;
1530 (void) printf("%llu\t%lld\t%lld\t%s\t%s\t%s\t"
1531 "%llx:%llx:%llx:%llx\n",
1532 (u_longlong_t
)BP_GET_LEVEL(bp
),
1533 (longlong_t
)BP_GET_PSIZE(bp
),
1534 (longlong_t
)BP_GET_NDVAS(bp
),
1535 dmu_ot
[BP_GET_TYPE(bp
)].ot_name
,
1536 zio_checksum_table
[BP_GET_CHECKSUM(bp
)].ci_name
,
1537 zio_compress_table
[BP_GET_COMPRESS(bp
)].ci_name
,
1538 (u_longlong_t
)bp
->blk_cksum
.zc_word
[0],
1539 (u_longlong_t
)bp
->blk_cksum
.zc_word
[1],
1540 (u_longlong_t
)bp
->blk_cksum
.zc_word
[2],
1541 (u_longlong_t
)bp
->blk_cksum
.zc_word
[3]);
1546 VERIFY(zio_wait(zio_claim(NULL
, spa
, spa_first_txg(spa
), bp
,
1547 NULL
, NULL
, ZIO_FLAG_MUSTSUCCEED
)) == 0);
1551 zdb_blkptr_cb(spa_t
*spa
, blkptr_t
*bp
, const zbookmark_t
*zb
,
1552 const dnode_phys_t
*dnp
, void *arg
)
1554 zdb_cb_t
*zcb
= arg
;
1555 char blkbuf
[BP_SPRINTF_LEN
];
1556 dmu_object_type_t type
;
1557 boolean_t is_l0_metadata
;
1562 type
= BP_GET_TYPE(bp
);
1564 zdb_count_block(spa
, zcb
, bp
, type
);
1567 * if we do metadata-only checksumming there's no need to checksum
1568 * indirect blocks here because it is done during traverse
1570 is_l0_metadata
= (BP_GET_LEVEL(bp
) == 0 && type
< DMU_OT_NUMTYPES
&&
1571 dmu_ot
[type
].ot_metadata
);
1573 if (dump_opt
['c'] > 1 || dump_opt
['S'] ||
1574 (dump_opt
['c'] && is_l0_metadata
)) {
1578 size
= BP_GET_LSIZE(bp
);
1579 data
= malloc(size
);
1580 ioerr
= zio_wait(zio_read(NULL
, spa
, bp
, data
, size
,
1581 NULL
, NULL
, ZIO_PRIORITY_ASYNC_READ
,
1582 ZIO_FLAG_CANFAIL
| ZIO_FLAG_SCRUB
, zb
));
1585 /* We expect io errors on intent log */
1586 if (ioerr
&& type
!= DMU_OT_INTENT_LOG
) {
1587 zcb
->zcb_haderrors
= 1;
1588 zcb
->zcb_errors
[ioerr
]++;
1590 if (dump_opt
['b'] >= 2)
1591 sprintf_blkptr(blkbuf
, BP_SPRINTF_LEN
, bp
);
1595 if (!dump_opt
['S']) {
1596 (void) printf("zdb_blkptr_cb: "
1597 "Got error %d reading "
1598 "<%llu, %llu, %lld, %llx> %s -- skipping\n",
1600 (u_longlong_t
)zb
->zb_objset
,
1601 (u_longlong_t
)zb
->zb_object
,
1602 (u_longlong_t
)zb
->zb_level
,
1603 (u_longlong_t
)zb
->zb_blkid
,
1609 zcb
->zcb_readfails
= 0;
1611 if (dump_opt
['b'] >= 4) {
1612 sprintf_blkptr(blkbuf
, BP_SPRINTF_LEN
, bp
);
1613 (void) printf("objset %llu object %llu offset 0x%llx %s\n",
1614 (u_longlong_t
)zb
->zb_objset
,
1615 (u_longlong_t
)zb
->zb_object
,
1616 (u_longlong_t
)blkid2offset(dnp
, zb
->zb_level
, zb
->zb_blkid
),
/*
 * Traverse every block in the pool, accumulate per-level/per-type size
 * statistics in a zdb_cb_t, and print a summary.  Blocks on the
 * deferred-free bplist are counted first, then the rest of the pool via
 * traverse_pool() with zdb_blkptr_cb.  With -S only block signatures are
 * printed and the function returns 3 if errors were seen, else 0.
 * NOTE(review): the other return statements are not visible in this
 * listing; confirm the remaining exit codes against the full source.
 */
1624 dump_block_stats(spa_t
*spa
)
1626 zdb_cb_t zcb
= { 0 };
1627 zdb_blkstats_t
*zb
, *tzb
;
1628 uint64_t alloc
, space
, logalloc
;
1629 vdev_t
*rvd
= spa
->spa_root_vdev
;
/* Announce what this pass verifies; suppressed in signature (-S) mode. */
1633 if (!dump_opt
['S']) {
1634 (void) printf("\nTraversing all blocks %s%s%s%s%s...\n",
1635 (dump_opt
['c'] || !dump_opt
['L']) ? "to verify " : "",
1636 (dump_opt
['c'] == 1) ? "metadata " : "",
1637 dump_opt
['c'] ? "checksums " : "",
1638 (dump_opt
['c'] && !dump_opt
['L']) ? "and verify " : "",
1639 !dump_opt
['L'] ? "nothing leaked " : "");
1643 * Load all space maps as SM_ALLOC maps, then traverse the pool
1644 * claiming each block we discover. If the pool is perfectly
1645 * consistent, the space maps will be empty when we're done.
1646 * Anything left over is a leak; any block we can't claim (because
1647 * it's not part of any space map) is a double allocation,
1648 * reference to a freed block, or an unclaimed log block.
1654 * If there's a deferred-free bplist, process that first.
1656 if (spa
->spa_sync_bplist_obj
!= 0) {
1657 bplist_t
*bpl
= &spa
->spa_sync_bplist
;
1661 VERIFY(0 == bplist_open(bpl
, spa
->spa_meta_objset
,
1662 spa
->spa_sync_bplist_obj
));
1664 while (bplist_iterate(bpl
, &itor
, &blk
) == 0) {
1665 if (dump_opt
['b'] >= 4) {
1666 char blkbuf
[BP_SPRINTF_LEN
];
1667 sprintf_blkptr(blkbuf
, BP_SPRINTF_LEN
, &blk
);
1668 (void) printf("[%s] %s\n",
1669 "deferred free", blkbuf
);
1671 zdb_count_block(spa
, &zcb
, &blk
, DMU_OT_DEFERRED
);
/* Main traversal; its result is OR-ed into the error flag. */
1677 zcb
.zcb_haderrors
|= traverse_pool(spa
, zdb_blkptr_cb
, &zcb
);
/* Print a per-errno histogram of the read errors collected above. */
1679 if (zcb
.zcb_haderrors
&& !dump_opt
['S']) {
1680 (void) printf("\nError counts:\n\n");
1681 (void) printf("\t%5s %s\n", "errno", "count");
1682 for (e
= 0; e
< 256; e
++) {
1683 if (zcb
.zcb_errors
[e
] != 0) {
1684 (void) printf("\t%5d %llu\n",
1685 e
, (u_longlong_t
)zcb
.zcb_errors
[e
]);
1691 * Report any leaked segments.
1697 * If we're interested in printing out the blkptr signatures,
1698 * return now as we don't print out anything else (including
1699 * errors and leaks).
1702 return (zcb
.zcb_haderrors
? 3 : 0);
1704 alloc
= spa_get_alloc(spa
);
1705 space
= spa_get_space(spa
);
1708 * Log blocks allocated from a separate log device don't count
1709 * as part of the normal pool space; factor them in here.
1713 for (c
= 0; c
< rvd
->vdev_children
; c
++)
1714 if (rvd
->vdev_child
[c
]->vdev_islog
)
1715 logalloc
+= rvd
->vdev_child
[c
]->vdev_stat
.vs_alloc
;
/* tzb is the grand-total bucket (all levels, all types). */
1717 tzb
= &zcb
.zcb_type
[ZB_TOTAL
][DMU_OT_TOTAL
];
/* Compare the traversed allocated size with what the SPA reports. */
1719 if (tzb
->zb_asize
== alloc
+ logalloc
) {
1721 (void) printf("\n\tNo leaks (block sum matches space"
1722 " maps exactly)\n");
1724 (void) printf("block traversal size %llu != alloc %llu "
1726 (u_longlong_t
)tzb
->zb_asize
,
1727 (u_longlong_t
)alloc
+ logalloc
,
1728 (dump_opt
['L']) ? "unreachable" : "leaked",
1729 (longlong_t
)(alloc
+ logalloc
- tzb
->zb_asize
));
/* The averages below divide by zb_count, so an empty total is special-cased. */
1733 if (tzb
->zb_count
== 0)
1736 (void) printf("\n");
1737 (void) printf("\tbp count: %10llu\n",
1738 (u_longlong_t
)tzb
->zb_count
);
1739 (void) printf("\tbp logical: %10llu\t avg: %6llu\n",
1740 (u_longlong_t
)tzb
->zb_lsize
,
1741 (u_longlong_t
)(tzb
->zb_lsize
/ tzb
->zb_count
));
1742 (void) printf("\tbp physical: %10llu\t avg:"
1743 " %6llu\tcompression: %6.2f\n",
1744 (u_longlong_t
)tzb
->zb_psize
,
1745 (u_longlong_t
)(tzb
->zb_psize
/ tzb
->zb_count
),
1746 (double)tzb
->zb_lsize
/ tzb
->zb_psize
);
1747 (void) printf("\tbp allocated: %10llu\t avg:"
1748 " %6llu\tcompression: %6.2f\n",
1749 (u_longlong_t
)tzb
->zb_asize
,
1750 (u_longlong_t
)(tzb
->zb_asize
/ tzb
->zb_count
),
1751 (double)tzb
->zb_lsize
/ tzb
->zb_asize
);
1752 (void) printf("\tSPA allocated: %10llu\tused: %5.2f%%\n",
1753 (u_longlong_t
)alloc
, 100.0 * alloc
/ space
);
/* With -bb or more, print a table broken down by object type (and level). */
1755 if (dump_opt
['b'] >= 2) {
1757 (void) printf("\nBlocks\tLSIZE\tPSIZE\tASIZE"
1758 "\t avg\t comp\t%%Total\tType\n");
1760 for (t
= 0; t
<= DMU_OT_NUMTYPES
; t
++) {
1761 char csize
[6], lsize
[6], psize
[6], asize
[6], avg
[6];
1764 typename
= t
== DMU_OT_DEFERRED
? "deferred free" :
1765 t
== DMU_OT_TOTAL
? "Total" : dmu_ot
[t
].ot_name
;
1767 if (zcb
.zcb_type
[ZB_TOTAL
][t
].zb_asize
== 0) {
1768 (void) printf("%6s\t%5s\t%5s\t%5s"
1769 "\t%5s\t%5s\t%6s\t%s\n",
/* Walk levels from highest to lowest; l == -1 selects the all-levels total. */
1781 for (l
= ZB_TOTAL
- 1; l
>= -1; l
--) {
1782 level
= (l
== -1 ? ZB_TOTAL
: l
);
1783 zb
= &zcb
.zcb_type
[level
][t
];
1785 if (zb
->zb_asize
== 0)
1788 if (dump_opt
['b'] < 3 && level
!= ZB_TOTAL
)
1791 if (level
== 0 && zb
->zb_asize
==
1792 zcb
.zcb_type
[ZB_TOTAL
][t
].zb_asize
)
1795 nicenum(zb
->zb_count
, csize
);
1796 nicenum(zb
->zb_lsize
, lsize
);
1797 nicenum(zb
->zb_psize
, psize
);
1798 nicenum(zb
->zb_asize
, asize
);
1799 nicenum(zb
->zb_asize
/ zb
->zb_count
, avg
);
1801 (void) printf("%6s\t%5s\t%5s\t%5s\t%5s"
1803 csize
, lsize
, psize
, asize
, avg
,
1804 (double)zb
->zb_lsize
/ zb
->zb_psize
,
1805 100.0 * zb
->zb_asize
/ tzb
->zb_asize
);
1807 if (level
== ZB_TOTAL
)
1808 (void) printf("%s\n", typename
);
1810 (void) printf(" L%d %s\n",
1816 (void) printf("\n");
1821 if (zcb
.zcb_haderrors
)
1828 dump_zpool(spa_t
*spa
)
1830 dsl_pool_t
*dp
= spa_get_dsl(spa
);
1834 dump_uberblock(&spa
->spa_uberblock
);
1836 if (dump_opt
['d'] || dump_opt
['i'] || dump_opt
['m']) {
1837 dump_dir(dp
->dp_meta_objset
);
1838 if (dump_opt
['d'] >= 3) {
1839 dump_bplist(dp
->dp_meta_objset
,
1840 spa
->spa_sync_bplist_obj
, "Deferred frees");
1841 dump_dtl(spa
->spa_root_vdev
, 0);
1844 if (dump_opt
['d'] >= 3 || dump_opt
['m'])
1845 dump_metaslabs(spa
);
1847 (void) dmu_objset_find(spa_name(spa
), dump_one_dir
, NULL
,
1848 DS_FIND_SNAPSHOTS
| DS_FIND_CHILDREN
);
1851 if (dump_opt
['b'] || dump_opt
['c'] || dump_opt
['S'])
1852 rc
= dump_block_stats(spa
);
1855 show_pool_stats(spa
);
/*
 * Flag bits for the -R block reader.  Each bit corresponds to one flag
 * letter in the block specifier (letter shown on the right).
 */
#define	ZDB_FLAG_CHECKSUM	0x0001	/* c */
#define	ZDB_FLAG_DECOMPRESS	0x0002	/* d */
#define	ZDB_FLAG_BSWAP		0x0004	/* e */
#define	ZDB_FLAG_GBH		0x0008	/* g */
#define	ZDB_FLAG_INDIRECT	0x0010	/* i */
#define	ZDB_FLAG_PHYS		0x0020	/* p */
#define	ZDB_FLAG_RAW		0x0040	/* r */
#define	ZDB_FLAG_PRINT_BLKPTR	0x0080	/* b */
/*
 * Print a decoded block pointer.  If ZDB_FLAG_BSWAP is set in 'flags'
 * the blkptr is byteswapped in place first.  One group of lines is
 * printed per DVA (vdev, offset, gang bit, grid, asize, plus a compact
 * colon-separated form), followed by the sizes, byte order, object type,
 * birth txg, level, fill count, checksum/compression names and the four
 * checksum words.
 */
1873 zdb_print_blkptr(blkptr_t
*bp
, int flags
)
1875 dva_t
*dva
= bp
->blk_dva
;
/* NOTE: this modifies the caller's buffer, not a copy. */
1878 if (flags
& ZDB_FLAG_BSWAP
)
1879 byteswap_uint64_array((void *)bp
, sizeof (blkptr_t
));
1881 * Super-ick warning: This code is also duplicated in
1882 * cmd/mdb/common/modules/zfs/zfs.c . Yeah, I hate code
1885 for (d
= 0; d
< BP_GET_NDVAS(bp
); d
++) {
1886 (void) printf("\tDVA[%d]: vdev_id %lld / %llx\n", d
,
1887 (longlong_t
)DVA_GET_VDEV(&dva
[d
]),
1888 (longlong_t
)DVA_GET_OFFSET(&dva
[d
]));
1889 (void) printf("\tDVA[%d]: GANG: %-5s GRID: %04llx\t"
1891 DVA_GET_GANG(&dva
[d
]) ? "TRUE" : "FALSE",
1892 (longlong_t
)DVA_GET_GRID(&dva
[d
]),
1893 (longlong_t
)DVA_GET_ASIZE(&dva
[d
]));
/* Compact form: vdev:offset:psize followed by up to four flag letters. */
1894 (void) printf("\tDVA[%d]: :%llu:%llx:%llx:%s%s%s%s\n", d
,
1895 (u_longlong_t
)DVA_GET_VDEV(&dva
[d
]),
1896 (longlong_t
)DVA_GET_OFFSET(&dva
[d
]),
1897 (longlong_t
)BP_GET_PSIZE(bp
),
1898 BP_SHOULD_BYTESWAP(bp
) ? "e" : "",
1899 !DVA_GET_GANG(&dva
[d
]) && BP_GET_LEVEL(bp
) != 0 ?
1901 DVA_GET_GANG(&dva
[d
]) ? "g" : "",
1902 BP_GET_COMPRESS(bp
) != 0 ? "d" : "");
1904 (void) printf("\tLSIZE: %-16llx\t\tPSIZE: %llx\n",
1905 (longlong_t
)BP_GET_LSIZE(bp
), (longlong_t
)BP_GET_PSIZE(bp
));
1906 (void) printf("\tENDIAN: %6s\t\t\t\t\tTYPE: %s\n",
1907 BP_GET_BYTEORDER(bp
) ? "LITTLE" : "BIG",
1908 dmu_ot
[BP_GET_TYPE(bp
)].ot_name
);
1909 (void) printf("\tBIRTH: %-16llx LEVEL: %-2llu\tFILL: %llx\n",
1910 (u_longlong_t
)bp
->blk_birth
, (u_longlong_t
)BP_GET_LEVEL(bp
),
1911 (u_longlong_t
)bp
->blk_fill
);
1912 (void) printf("\tCKFUNC: %-16s\t\tCOMP: %s\n",
1913 zio_checksum_table
[BP_GET_CHECKSUM(bp
)].ci_name
,
1914 zio_compress_table
[BP_GET_COMPRESS(bp
)].ci_name
);
1915 (void) printf("\tCKSUM: %llx:%llx:%llx:%llx\n",
1916 (u_longlong_t
)bp
->blk_cksum
.zc_word
[0],
1917 (u_longlong_t
)bp
->blk_cksum
.zc_word
[1],
1918 (u_longlong_t
)bp
->blk_cksum
.zc_word
[2],
1919 (u_longlong_t
)bp
->blk_cksum
.zc_word
[3]);
1923 zdb_dump_indirect(blkptr_t
*bp
, int nbps
, int flags
)
1927 for (i
= 0; i
< nbps
; i
++)
1928 zdb_print_blkptr(&bp
[i
], flags
);
1932 zdb_dump_gbh(void *buf
, int flags
)
1934 zdb_dump_indirect((blkptr_t
*)buf
, SPA_GBH_NBLKPTRS
, flags
);
1938 zdb_dump_block_raw(void *buf
, uint64_t size
, int flags
)
1940 if (flags
& ZDB_FLAG_BSWAP
)
1941 byteswap_uint64_array(buf
, size
);
1942 (void) write(2, buf
, size
);
1946 zdb_dump_block(char *label
, void *buf
, uint64_t size
, int flags
)
1948 uint64_t *d
= (uint64_t *)buf
;
1949 int nwords
= size
/ sizeof (uint64_t);
1950 int do_bswap
= !!(flags
& ZDB_FLAG_BSWAP
);
1956 hdr
= " 7 6 5 4 3 2 1 0 f e d c b a 9 8";
1958 hdr
= " 0 1 2 3 4 5 6 7 8 9 a b c d e f";
1960 (void) printf("\n%s\n%6s %s 0123456789abcdef\n", label
, "", hdr
);
1962 for (i
= 0; i
< nwords
; i
+= 2) {
1963 (void) printf("%06llx: %016llx %016llx ",
1964 (u_longlong_t
)(i
* sizeof (uint64_t)),
1965 (u_longlong_t
)(do_bswap
? BSWAP_64(d
[i
]) : d
[i
]),
1966 (u_longlong_t
)(do_bswap
? BSWAP_64(d
[i
+ 1]) : d
[i
+ 1]));
1969 for (j
= 0; j
< 2 * sizeof (uint64_t); j
++)
1970 (void) printf("%c", isprint(c
[j
]) ? c
[j
] : '.');
1971 (void) printf("\n");
1976 * There are two acceptable formats:
1977 * leaf_name - For example: c1t0d0 or /tmp/ztest.0a
1978 * child[.child]* - For example: 0.1.1
1980 * The second form can be used to specify arbitrary vdevs anywhere
1981 * in the heirarchy. For example, in a pool with a mirror of
1982 * RAID-Zs, you can specify either RAID-Z vdev with 0.0 or 0.1 .
1985 zdb_vdev_lookup(vdev_t
*vdev
, char *path
)
1993 /* First, assume the x.x.x.x format */
1994 i
= (int)strtoul(path
, &s
, 10);
1995 if (s
== path
|| (s
&& *s
!= '.' && *s
!= '\0'))
1997 if (i
< 0 || i
>= vdev
->vdev_children
)
2000 vdev
= vdev
->vdev_child
[i
];
2003 return (zdb_vdev_lookup(vdev
, s
+1));
2006 for (i
= 0; i
< vdev
->vdev_children
; i
++) {
2007 vdev_t
*vc
= vdev
->vdev_child
[i
];
2009 if (vc
->vdev_path
== NULL
) {
2010 vc
= zdb_vdev_lookup(vc
, path
);
2017 p
= strrchr(vc
->vdev_path
, '/');
2018 p
= p
? p
+ 1 : vc
->vdev_path
;
2019 q
= &vc
->vdev_path
[strlen(vc
->vdev_path
) - 2];
2021 if (strcmp(vc
->vdev_path
, path
) == 0)
2023 if (strcmp(p
, path
) == 0)
2025 if (strcmp(q
, "s0") == 0 && strncmp(p
, path
, q
- p
) == 0)
2033 * Read a block from a pool and print it out. The syntax of the
2034 * block descriptor is:
2036 * pool:vdev_specifier:offset:size[:flags]
2038 * pool - The name of the pool you wish to read from
2039 * vdev_specifier - Which vdev (see comment for zdb_vdev_lookup)
2040 * offset - offset, in hex, in bytes
2041 * size - Amount of data to read, in hex, in bytes
2042 * flags - A string of characters specifying options
2043 * b: Decode a blkptr at given offset within block
2044 * *c: Calculate and display checksums
2045 * *d: Decompress data before dumping
2046 * e: Byteswap data before dumping
2047 * *g: Display data as a gang block header
2048 * *i: Display as an indirect block
2049 * p: Do I/O to physical offset
2050 * r: Dump raw data to stdout
2052 * * = not yet implemented
2055 zdb_read_block(char *thing
, spa_t
**spap
)
2059 uint64_t offset
= 0, size
= 0, blkptr_offset
= 0;
2063 char *s
, *p
, *dup
, *pool
, *vdev
, *flagstr
;
2064 int i
, error
, zio_flags
;
2066 dup
= strdup(thing
);
2067 s
= strtok(dup
, ":");
2069 s
= strtok(NULL
, ":");
2071 s
= strtok(NULL
, ":");
2072 offset
= strtoull(s
? s
: "", NULL
, 16);
2073 s
= strtok(NULL
, ":");
2074 size
= strtoull(s
? s
: "", NULL
, 16);
2075 s
= strtok(NULL
, ":");
2076 flagstr
= s
? s
: "";
2080 s
= "size must not be zero";
2081 if (!IS_P2ALIGNED(size
, DEV_BSIZE
))
2082 s
= "size must be a multiple of sector size";
2083 if (!IS_P2ALIGNED(offset
, DEV_BSIZE
))
2084 s
= "offset must be a multiple of sector size";
2086 (void) printf("Invalid block specifier: %s - %s\n", thing
, s
);
2091 for (s
= strtok(flagstr
, ":"); s
; s
= strtok(NULL
, ":")) {
2092 for (i
= 0; flagstr
[i
]; i
++) {
2093 int bit
= flagbits
[(uchar_t
)flagstr
[i
]];
2096 (void) printf("***Invalid flag: %c\n",
2102 /* If it's not something with an argument, keep going */
2103 if ((bit
& (ZDB_FLAG_CHECKSUM
| ZDB_FLAG_DECOMPRESS
|
2104 ZDB_FLAG_PRINT_BLKPTR
)) == 0)
2107 p
= &flagstr
[i
+ 1];
2108 if (bit
== ZDB_FLAG_PRINT_BLKPTR
)
2109 blkptr_offset
= strtoull(p
, &p
, 16);
2110 if (*p
!= ':' && *p
!= '\0') {
2111 (void) printf("***Invalid flag arg: '%s'\n", s
);
2118 if (spa
== NULL
|| strcmp(spa_name(spa
), pool
) != 0) {
2120 spa_close(spa
, (void *)zdb_read_block
);
2121 error
= spa_open(pool
, spap
, (void *)zdb_read_block
);
2123 fatal("Failed to open pool '%s': %s",
2124 pool
, strerror(error
));
2128 vd
= zdb_vdev_lookup(spa
->spa_root_vdev
, vdev
);
2130 (void) printf("***Invalid vdev: %s\n", vdev
);
2135 (void) printf("Found vdev: %s\n", vd
->vdev_path
);
2137 (void) printf("Found vdev type: %s\n",
2138 vd
->vdev_ops
->vdev_op_type
);
2141 buf
= umem_alloc(size
, UMEM_NOFAIL
);
2143 zio_flags
= ZIO_FLAG_DONT_CACHE
| ZIO_FLAG_DONT_QUEUE
|
2144 ZIO_FLAG_DONT_PROPAGATE
| ZIO_FLAG_DONT_RETRY
;
2146 spa_config_enter(spa
, SCL_STATE
, FTAG
, RW_READER
);
2147 zio
= zio_root(spa
, NULL
, NULL
, 0);
2148 /* XXX todo - cons up a BP so RAID-Z will be happy */
2149 zio_nowait(zio_vdev_child_io(zio
, NULL
, vd
, offset
, buf
, size
,
2150 ZIO_TYPE_READ
, ZIO_PRIORITY_SYNC_READ
, zio_flags
, NULL
, NULL
));
2151 error
= zio_wait(zio
);
2152 spa_config_exit(spa
, SCL_STATE
, FTAG
);
2155 (void) printf("Read of %s failed, error: %d\n", thing
, error
);
2159 if (flags
& ZDB_FLAG_PRINT_BLKPTR
)
2160 zdb_print_blkptr((blkptr_t
*)(void *)
2161 ((uintptr_t)buf
+ (uintptr_t)blkptr_offset
), flags
);
2162 else if (flags
& ZDB_FLAG_RAW
)
2163 zdb_dump_block_raw(buf
, size
, flags
);
2164 else if (flags
& ZDB_FLAG_INDIRECT
)
2165 zdb_dump_indirect((blkptr_t
*)buf
, size
/ sizeof (blkptr_t
),
2167 else if (flags
& ZDB_FLAG_GBH
)
2168 zdb_dump_gbh(buf
, flags
);
2170 zdb_dump_block(thing
, buf
, size
, flags
);
2173 umem_free(buf
, size
);
2178 nvlist_string_match(nvlist_t
*config
, char *name
, char *tgt
)
2182 if (nvlist_lookup_string(config
, name
, &s
) != 0)
2185 return (strcmp(s
, tgt
) == 0);
2189 nvlist_uint64_match(nvlist_t
*config
, char *name
, uint64_t tgt
)
2193 if (nvlist_lookup_uint64(config
, name
, &val
) != 0)
2196 return (val
== tgt
);
2200 vdev_child_guid_match(nvlist_t
*vdev
, uint64_t guid
)
2205 verify(nvlist_lookup_nvlist_array(vdev
, ZPOOL_CONFIG_CHILDREN
,
2206 &child
, &children
) == 0);
2207 for (c
= 0; c
< children
; ++c
)
2208 if (nvlist_uint64_match(child
[c
], ZPOOL_CONFIG_GUID
, guid
))
2214 vdev_child_string_match(nvlist_t
*vdev
, char *tgt
)
2219 verify(nvlist_lookup_nvlist_array(vdev
, ZPOOL_CONFIG_CHILDREN
,
2220 &child
, &children
) == 0);
2221 for (c
= 0; c
< children
; ++c
) {
2222 if (nvlist_string_match(child
[c
], ZPOOL_CONFIG_PATH
, tgt
) ||
2223 nvlist_string_match(child
[c
], ZPOOL_CONFIG_DEVID
, tgt
))
2230 vdev_guid_match(nvlist_t
*config
, uint64_t guid
)
2234 verify(nvlist_lookup_nvlist(config
, ZPOOL_CONFIG_VDEV_TREE
,
2237 return (nvlist_uint64_match(nvroot
, ZPOOL_CONFIG_GUID
, guid
) ||
2238 vdev_child_guid_match(nvroot
, guid
));
2242 vdev_string_match(nvlist_t
*config
, char *tgt
)
2246 verify(nvlist_lookup_nvlist(config
, ZPOOL_CONFIG_VDEV_TREE
,
2249 return (vdev_child_string_match(nvroot
, tgt
));
2253 pool_match(nvlist_t
*config
, char *tgt
)
2255 uint64_t guid
= strtoull(tgt
, NULL
, 0);
2259 nvlist_uint64_match(config
, ZPOOL_CONFIG_POOL_GUID
, guid
) ||
2260 vdev_guid_match(config
, guid
));
2263 nvlist_string_match(config
, ZPOOL_CONFIG_POOL_NAME
, tgt
) ||
2264 vdev_string_match(config
, tgt
));
2269 find_exported_zpool(char *pool_id
, nvlist_t
**configp
, char *vdev_dir
)
2273 nvlist_t
*match
= NULL
;
2275 if (vdev_dir
!= NULL
)
2276 pools
= zpool_find_import_activeok(g_zfs
, 1, &vdev_dir
);
2278 pools
= zpool_find_import_activeok(g_zfs
, 0, NULL
);
2280 if (pools
!= NULL
) {
2281 nvpair_t
*elem
= NULL
;
2283 while ((elem
= nvlist_next_nvpair(pools
, elem
)) != NULL
) {
2284 verify(nvpair_value_nvlist(elem
, configp
) == 0);
2285 if (pool_match(*configp
, pool_id
)) {
2286 if (match
!= NULL
) {
2288 "More than one matching pool - "
2289 "specify guid/devid/device path.");
2298 *configp
= error
? NULL
: match
;
2304 main(int argc
, char **argv
)
2307 struct rlimit rl
= { 1024, 1024 };
2309 objset_t
*os
= NULL
;
2315 char *vdev_dir
= NULL
;
2317 (void) setrlimit(RLIMIT_NOFILE
, &rl
);
2318 (void) enable_extended_FILE_stdio(-1, -1);
2320 dprintf_setup(&argc
, argv
);
2322 while ((c
= getopt(argc
, argv
, "udibcmsvCLS:U:lRep:t:")) != -1) {
2344 spa_config_path
= optarg
;
2355 zdb_sig_user_data
= (strncmp(optarg
, "user:", 5) == 0);
2356 if (!zdb_sig_user_data
&& strncmp(optarg
, "all:", 4))
2358 endstr
= strchr(optarg
, ':') + 1;
2359 if (strcmp(endstr
, "fletcher2") == 0)
2360 zdb_sig_cksumalg
= ZIO_CHECKSUM_FLETCHER_2
;
2361 else if (strcmp(endstr
, "fletcher4") == 0)
2362 zdb_sig_cksumalg
= ZIO_CHECKSUM_FLETCHER_4
;
2363 else if (strcmp(endstr
, "sha256") == 0)
2364 zdb_sig_cksumalg
= ZIO_CHECKSUM_SHA256
;
2365 else if (strcmp(endstr
, "all") == 0)
2366 zdb_sig_cksumalg
= ZIO_CHECKSUM_FLETCHER_2
;
2371 ub_max_txg
= strtoull(optarg
, NULL
, 0);
2372 if (ub_max_txg
< TXG_INITIAL
) {
2373 (void) fprintf(stderr
, "incorrect txg "
2374 "specified: %s\n", optarg
);
2384 if (vdev_dir
!= NULL
&& exported
== 0) {
2385 (void) fprintf(stderr
, "-p option requires use of -e\n");
2390 g_zfs
= libzfs_init();
2391 ASSERT(g_zfs
!= NULL
);
2393 for (c
= 0; c
< 256; c
++) {
2394 if (dump_all
&& c
!= 'l' && c
!= 'R')
2397 dump_opt
[c
] += verbose
;
2404 if (dump_opt
['C']) {
2405 dump_cachefile(spa_config_path
);
2411 if (dump_opt
['l']) {
2412 dump_label(argv
[0]);
2416 if (dump_opt
['R']) {
2417 flagbits
['b'] = ZDB_FLAG_PRINT_BLKPTR
;
2418 flagbits
['c'] = ZDB_FLAG_CHECKSUM
;
2419 flagbits
['d'] = ZDB_FLAG_DECOMPRESS
;
2420 flagbits
['e'] = ZDB_FLAG_BSWAP
;
2421 flagbits
['g'] = ZDB_FLAG_GBH
;
2422 flagbits
['i'] = ZDB_FLAG_INDIRECT
;
2423 flagbits
['p'] = ZDB_FLAG_PHYS
;
2424 flagbits
['r'] = ZDB_FLAG_RAW
;
2428 zdb_read_block(argv
[0], &spa
);
2433 spa_close(spa
, (void *)zdb_read_block
);
2438 dump_config(argv
[0]);
2443 * Check to see if the name refers to an exported zpool
2446 nvlist_t
*exported_conf
= NULL
;
2448 if ((slash
= strchr(argv
[0], '/')) != NULL
)
2451 error
= find_exported_zpool(argv
[0], &exported_conf
, vdev_dir
);
2453 nvlist_t
*nvl
= NULL
;
2455 if (vdev_dir
!= NULL
) {
2456 if (nvlist_alloc(&nvl
, NV_UNIQUE_NAME
, 0) != 0)
2458 else if (nvlist_add_string(nvl
,
2459 zpool_prop_to_name(ZPOOL_PROP_ALTROOT
),
2465 error
= spa_import_verbatim(argv
[0],
2466 exported_conf
, nvl
);
2476 if (strchr(argv
[0], '/') != NULL
) {
2477 error
= dmu_objset_open(argv
[0], DMU_OST_ANY
,
2478 DS_MODE_USER
| DS_MODE_READONLY
, &os
);
2480 error
= spa_open(argv
[0], &spa
, FTAG
);
2485 fatal("can't open %s: %s", argv
[0], strerror(error
));
2489 zopt_objects
= argc
;
2490 zopt_object
= calloc(zopt_objects
, sizeof (uint64_t));
2491 for (i
= 0; i
< zopt_objects
; i
++) {
2493 zopt_object
[i
] = strtoull(argv
[i
], NULL
, 0);
2494 if (zopt_object
[i
] == 0 && errno
!= 0)
2495 fatal("bad object number %s: %s",
2496 argv
[i
], strerror(errno
));
2502 dmu_objset_close(os
);
2505 spa_close(spa
, FTAG
);
2508 fuid_table_destroy();