xref: /illumos-gate/usr/src/cmd/zdb/zdb.c (revision 663207adb1669640c01c5ec6949ce78fd806efae)
1fa9e4066Sahrens /*
2fa9e4066Sahrens  * CDDL HEADER START
3fa9e4066Sahrens  *
4fa9e4066Sahrens  * The contents of this file are subject to the terms of the
5ea8dc4b6Seschrock  * Common Development and Distribution License (the "License").
6ea8dc4b6Seschrock  * You may not use this file except in compliance with the License.
7fa9e4066Sahrens  *
8fa9e4066Sahrens  * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
9fa9e4066Sahrens  * or http://www.opensolaris.org/os/licensing.
10fa9e4066Sahrens  * See the License for the specific language governing permissions
11fa9e4066Sahrens  * and limitations under the License.
12fa9e4066Sahrens  *
13fa9e4066Sahrens  * When distributing Covered Code, include this CDDL HEADER in each
14fa9e4066Sahrens  * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
15fa9e4066Sahrens  * If applicable, add the following below this CDDL HEADER, with the
16fa9e4066Sahrens  * fields enclosed by brackets "[]" replaced with your own identifying
17fa9e4066Sahrens  * information: Portions Copyright [yyyy] [name of copyright owner]
18fa9e4066Sahrens  *
19fa9e4066Sahrens  * CDDL HEADER END
20fa9e4066Sahrens  */
21ad135b5dSChristopher Siden 
22fa9e4066Sahrens /*
238f2529deSMark Shellenbaum  * Copyright (c) 2005, 2010, Oracle and/or its affiliates. All rights reserved.
24*663207adSDon Brady  * Copyright (c) 2011, 2018 by Delphix. All rights reserved.
25c3d26abcSMatthew Ahrens  * Copyright (c) 2014 Integros [integros.com]
26ed61ec1dSYuri Pankov  * Copyright 2017 Nexenta Systems, Inc.
27e0f1c0afSOlaf Faaland  * Copyright (c) 2017, 2018 Lawrence Livermore National Security, LLC.
28f06dce2cSAndrew Stormont  * Copyright 2017 RackTop Systems.
29fa9e4066Sahrens  */
30fa9e4066Sahrens 
31fa9e4066Sahrens #include <stdio.h>
32490d05b9SMatthew Ahrens #include <unistd.h>
33004388ebScasper #include <stdio_ext.h>
34fa9e4066Sahrens #include <stdlib.h>
3544cd46caSbillm #include <ctype.h>
36fa9e4066Sahrens #include <sys/zfs_context.h>
37fa9e4066Sahrens #include <sys/spa.h>
38fa9e4066Sahrens #include <sys/spa_impl.h>
39fa9e4066Sahrens #include <sys/dmu.h>
40fa9e4066Sahrens #include <sys/zap.h>
41fa9e4066Sahrens #include <sys/fs/zfs.h>
42fa9e4066Sahrens #include <sys/zfs_znode.h>
430a586ceaSMark Shellenbaum #include <sys/zfs_sa.h>
440a586ceaSMark Shellenbaum #include <sys/sa.h>
450a586ceaSMark Shellenbaum #include <sys/sa_impl.h>
46fa9e4066Sahrens #include <sys/vdev.h>
47fa9e4066Sahrens #include <sys/vdev_impl.h>
48fa9e4066Sahrens #include <sys/metaslab_impl.h>
49fa9e4066Sahrens #include <sys/dmu_objset.h>
50fa9e4066Sahrens #include <sys/dsl_dir.h>
51fa9e4066Sahrens #include <sys/dsl_dataset.h>
52fa9e4066Sahrens #include <sys/dsl_pool.h>
53fa9e4066Sahrens #include <sys/dbuf.h>
54fa9e4066Sahrens #include <sys/zil.h>
55fa9e4066Sahrens #include <sys/zil_impl.h>
56fa9e4066Sahrens #include <sys/stat.h>
57fa9e4066Sahrens #include <sys/resource.h>
58fa9e4066Sahrens #include <sys/dmu_traverse.h>
59fa9e4066Sahrens #include <sys/zio_checksum.h>
60fa9e4066Sahrens #include <sys/zio_compress.h>
61e0d35c44Smarks #include <sys/zfs_fuid.h>
6288b7b0f2SMatthew Ahrens #include <sys/arc.h>
63b24ab676SJeff Bonwick #include <sys/ddt.h>
64ad135b5dSChristopher Siden #include <sys/zfeature.h>
65770499e1SDan Kimmel #include <sys/abd.h>
664923c69fSMatthew Ahrens #include <sys/blkptr.h>
6717fb938fSMatthew Ahrens #include <sys/dsl_scan.h>
684445fffbSMatthew Ahrens #include <zfs_comutil.h>
690a055120SJason King #include <libcmdutils.h>
70de6628f0Sck #undef verify
71de6628f0Sck #include <libzfs.h>
72fa9e4066Sahrens 
733f7978d0SAlan Somers #include "zdb.h"
743f7978d0SAlan Somers 
/*
 * Bounds-checked name lookups.  Each macro yields the name stored in the
 * corresponding table for an in-range index and the literal "UNKNOWN"
 * otherwise.
 */
#define	ZDB_COMPRESS_NAME(idx)						\
	((idx) < ZIO_COMPRESS_FUNCTIONS ?				\
	zio_compress_table[(idx)].ci_name : "UNKNOWN")
#define	ZDB_CHECKSUM_NAME(idx)						\
	((idx) < ZIO_CHECKSUM_FUNCTIONS ?				\
	zio_checksum_table[(idx)].ci_name : "UNKNOWN")

/*
 * Indices below DMU_OT_NUMTYPES are named through dmu_ot[]; any other value
 * accepted by DMU_OT_IS_VALID() is named through dmu_ot_byteswap[].
 */
#define	ZDB_OT_NAME(idx)						\
	((idx) < DMU_OT_NUMTYPES ? dmu_ot[(idx)].ot_name :		\
	(DMU_OT_IS_VALID(idx) ?						\
	dmu_ot_byteswap[DMU_OT_BYTESWAP(idx)].ob_name : "UNKNOWN"))

/*
 * Maps an object type onto a value in the range [0, DMU_OT_NUMTYPES]:
 * indices below DMU_OT_NUMTYPES map to themselves, the DMU_OTN_ZAP_* and
 * DMU_OTN_UINT64_* values map to their "OTHER" counterparts, and anything
 * else maps to DMU_OT_NUMTYPES.
 */
#define	ZDB_OT_TYPE(idx)						\
	((idx) < DMU_OT_NUMTYPES ? (idx) :				\
	((idx) == DMU_OTN_ZAP_DATA || (idx) == DMU_OTN_ZAP_METADATA ?	\
	DMU_OT_ZAP_OTHER :						\
	((idx) == DMU_OTN_UINT64_DATA ||				\
	(idx) == DMU_OTN_UINT64_METADATA ?				\
	DMU_OT_UINT64_OTHER : DMU_OT_NUMTYPES)))
876de8f417SVictor Latushkin 
88feef89cfSVictor Latushkin #ifndef lint
894dd77f9eSMatthew Ahrens extern int reference_tracking_enable;
907fd05ac4SMatthew Ahrens extern boolean_t zfs_recover;
9106be9802SMatthew Ahrens extern uint64_t zfs_arc_max, zfs_arc_meta_limit;
92f7950bf1SMatthew Ahrens extern int zfs_vdev_async_read_max_active;
93f06dce2cSAndrew Stormont extern int aok;
94e144c4e6SPavel Zakharov extern boolean_t spa_load_verify_dryrun;
95feef89cfSVictor Latushkin #else
964dd77f9eSMatthew Ahrens int reference_tracking_enable;
977fd05ac4SMatthew Ahrens boolean_t zfs_recover;
9806be9802SMatthew Ahrens uint64_t zfs_arc_max, zfs_arc_meta_limit;
99f7950bf1SMatthew Ahrens int zfs_vdev_async_read_max_active;
100f06dce2cSAndrew Stormont int aok;
101e144c4e6SPavel Zakharov boolean_t spa_load_verify_dryrun;
102feef89cfSVictor Latushkin #endif
103feef89cfSVictor Latushkin 
1043f7978d0SAlan Somers static const char cmdname[] = "zdb";
105fa9e4066Sahrens uint8_t dump_opt[256];
106fa9e4066Sahrens 
107fa9e4066Sahrens typedef void object_viewer_t(objset_t *, uint64_t, void *data, size_t size);
108fa9e4066Sahrens 
109fa9e4066Sahrens uint64_t *zopt_object = NULL;
1103f7978d0SAlan Somers static unsigned zopt_objects = 0;
111de6628f0Sck libzfs_handle_t *g_zfs;
11206be9802SMatthew Ahrens uint64_t max_inflight = 1000;
11320b5dafbSPaul Dagnelie static int leaked_objects = 0;
114fa9e4066Sahrens 
115732885fcSMatthew Ahrens static void snprintf_blkptr_compact(char *, size_t, const blkptr_t *);
11617fb938fSMatthew Ahrens static void mos_obj_refd(uint64_t);
117732885fcSMatthew Ahrens 
/*
 * These libumem hooks provide a reasonable set of defaults for the allocator's
 * debugging facilities.
 */

/*
 * Returns the string used as the default $UMEM_DEBUG setting.
 */
const char *
_umem_debug_init(void)
{
	return ("default,verbose"); /* $UMEM_DEBUG setting */
}
127fa9e4066Sahrens 
/*
 * Returns the string used as the default $UMEM_LOGGING setting.
 */
const char *
_umem_logging_init(void)
{
	static const char logging_defaults[] = "fail,contents";

	return (logging_defaults);
}
133fa9e4066Sahrens 
134fa9e4066Sahrens static void
135fa9e4066Sahrens usage(void)
136fa9e4066Sahrens {
137fa9e4066Sahrens 	(void) fprintf(stderr,
13886714001SSerapheim Dimitropoulos 	    "Usage:\t%s [-AbcdDFGhikLMPsvX] [-e [-V] [-p <path> ...]] "
139ed61ec1dSYuri Pankov 	    "[-I <inflight I/Os>]\n"
140ed61ec1dSYuri Pankov 	    "\t\t[-o <var>=<value>]... [-t <txg>] [-U <cache>] [-x <dumpdir>]\n"
141ed61ec1dSYuri Pankov 	    "\t\t[<poolname> [<object> ...]]\n"
142dfd5965fSRichard Yao 	    "\t%s [-AdiPv] [-e [-V] [-p <path> ...]] [-U <cache>] <dataset> "
143ed61ec1dSYuri Pankov 	    "[<object> ...]\n"
144ed61ec1dSYuri Pankov 	    "\t%s -C [-A] [-U <cache>]\n"
145ed61ec1dSYuri Pankov 	    "\t%s -l [-Aqu] <device>\n"
146dfd5965fSRichard Yao 	    "\t%s -m [-AFLPX] [-e [-V] [-p <path> ...]] [-t <txg>] "
147dfd5965fSRichard Yao 	    "[-U <cache>]\n\t\t<poolname> [<vdev> [<metaslab> ...]]\n"
148ed61ec1dSYuri Pankov 	    "\t%s -O <dataset> <path>\n"
149dfd5965fSRichard Yao 	    "\t%s -R [-A] [-e [-V] [-p <path> ...]] [-U <cache>]\n"
150ed61ec1dSYuri Pankov 	    "\t\t<poolname> <vdev>:<offset>:<size>[:<flags>]\n"
1514923c69fSMatthew Ahrens 	    "\t%s -E [-A] word0:word1:...:word15\n"
152dfd5965fSRichard Yao 	    "\t%s -S [-AP] [-e [-V] [-p <path> ...]] [-U <cache>] "
153dfd5965fSRichard Yao 	    "<poolname>\n\n",
154ed61ec1dSYuri Pankov 	    cmdname, cmdname, cmdname, cmdname, cmdname, cmdname, cmdname,
1554923c69fSMatthew Ahrens 	    cmdname, cmdname);
1563ad6c7f9SVictor Latushkin 
1573ad6c7f9SVictor Latushkin 	(void) fprintf(stderr, "    Dataset name must include at least one "
1583ad6c7f9SVictor Latushkin 	    "separator character '/' or '@'\n");
1593ad6c7f9SVictor Latushkin 	(void) fprintf(stderr, "    If dataset name is specified, only that "
1603ad6c7f9SVictor Latushkin 	    "dataset is dumped\n");
1613ad6c7f9SVictor Latushkin 	(void) fprintf(stderr, "    If object numbers are specified, only "
1623ad6c7f9SVictor Latushkin 	    "those objects are dumped\n\n");
1633ad6c7f9SVictor Latushkin 	(void) fprintf(stderr, "    Options to control amount of output:\n");
1643ad6c7f9SVictor Latushkin 	(void) fprintf(stderr, "        -b block statistics\n");
1653ad6c7f9SVictor Latushkin 	(void) fprintf(stderr, "        -c checksum all metadata (twice for "
1666365109dSVictor Latushkin 	    "all data) blocks\n");
167ed61ec1dSYuri Pankov 	(void) fprintf(stderr, "        -C config (or cachefile if alone)\n");
168ed61ec1dSYuri Pankov 	(void) fprintf(stderr, "        -d dataset(s)\n");
169f0ba89beSJeff Bonwick 	(void) fprintf(stderr, "        -D dedup statistics\n");
1704923c69fSMatthew Ahrens 	(void) fprintf(stderr, "        -E decode and display block from an "
1714923c69fSMatthew Ahrens 	    "embedded block pointer\n");
172ed61ec1dSYuri Pankov 	(void) fprintf(stderr, "        -h pool history\n");
173ed61ec1dSYuri Pankov 	(void) fprintf(stderr, "        -i intent logs\n");
17464723e36SYuri Pankov 	(void) fprintf(stderr, "        -l read label contents\n");
17586714001SSerapheim Dimitropoulos 	(void) fprintf(stderr, "        -k examine the checkpointed state "
17686714001SSerapheim Dimitropoulos 	    "of the pool\n");
17782a0a985SVictor Latushkin 	(void) fprintf(stderr, "        -L disable leak tracking (do not "
17882a0a985SVictor Latushkin 	    "load spacemaps)\n");
179ed61ec1dSYuri Pankov 	(void) fprintf(stderr, "        -m metaslabs\n");
180ed61ec1dSYuri Pankov 	(void) fprintf(stderr, "        -M metaslab groups\n");
181ed61ec1dSYuri Pankov 	(void) fprintf(stderr, "        -O perform object lookups by path\n");
182d41e7643Sek 	(void) fprintf(stderr, "        -R read and display block from a "
183ed61ec1dSYuri Pankov 	    "device\n");
184ed61ec1dSYuri Pankov 	(void) fprintf(stderr, "        -s report stats on zdb's I/O\n");
185ed61ec1dSYuri Pankov 	(void) fprintf(stderr, "        -S simulate dedup to measure effect\n");
186ed61ec1dSYuri Pankov 	(void) fprintf(stderr, "        -v verbose (applies to all "
187ed61ec1dSYuri Pankov 	    "others)\n\n");
1883ad6c7f9SVictor Latushkin 	(void) fprintf(stderr, "    Below options are intended for use "
189df15e419SMatthew Ahrens 	    "with other options:\n");
190feef89cfSVictor Latushkin 	(void) fprintf(stderr, "        -A ignore assertions (-A), enable "
191feef89cfSVictor Latushkin 	    "panic recovery (-AA) or both (-AAA)\n");
1923ad6c7f9SVictor Latushkin 	(void) fprintf(stderr, "        -e pool is exported/destroyed/"
1933ad6c7f9SVictor Latushkin 	    "has altroot/not in a cachefile\n");
194ed61ec1dSYuri Pankov 	(void) fprintf(stderr, "        -F attempt automatic rewind within "
195ed61ec1dSYuri Pankov 	    "safe range of transaction groups\n");
196ed61ec1dSYuri Pankov 	(void) fprintf(stderr, "        -G dump zfs_dbgmsg buffer before "
197ed61ec1dSYuri Pankov 	    "exiting\n");
1982e4c9986SGeorge Wilson 	(void) fprintf(stderr, "        -I <number of inflight I/Os> -- "
199df15e419SMatthew Ahrens 	    "specify the maximum number of "
200df15e419SMatthew Ahrens 	    "checksumming I/Os [default is 200]\n");
2010e60744cSPavel Zakharov 	(void) fprintf(stderr, "        -o <variable>=<value> set global "
2020e60744cSPavel Zakharov 	    "variable to an unsigned 32-bit integer value\n");
203ed61ec1dSYuri Pankov 	(void) fprintf(stderr, "        -p <path> -- use one or more with "
204ed61ec1dSYuri Pankov 	    "-e to specify path to vdev dir\n");
205ed61ec1dSYuri Pankov 	(void) fprintf(stderr, "        -P print numbers in parseable form\n");
20664723e36SYuri Pankov 	(void) fprintf(stderr, "        -q don't print label contents\n");
207ed61ec1dSYuri Pankov 	(void) fprintf(stderr, "        -t <txg> -- highest txg to use when "
208ed61ec1dSYuri Pankov 	    "searching for uberblocks\n");
20964723e36SYuri Pankov 	(void) fprintf(stderr, "        -u uberblock\n");
210ed61ec1dSYuri Pankov 	(void) fprintf(stderr, "        -U <cachefile_path> -- use alternate "
211ed61ec1dSYuri Pankov 	    "cachefile\n");
212dfd5965fSRichard Yao 	(void) fprintf(stderr, "        -V do verbatim import\n");
213ed61ec1dSYuri Pankov 	(void) fprintf(stderr, "        -x <dumpdir> -- "
214ed61ec1dSYuri Pankov 	    "dump all read blocks into specified directory\n");
215ed61ec1dSYuri Pankov 	(void) fprintf(stderr, "        -X attempt extreme rewind (does not "
216ed61ec1dSYuri Pankov 	    "work with dataset)\n\n");
217fa9e4066Sahrens 	(void) fprintf(stderr, "Specify an option more than once (e.g. -bb) "
218fa9e4066Sahrens 	    "to make only that option verbose\n");
219fa9e4066Sahrens 	(void) fprintf(stderr, "Default is to dump everything non-verbosely\n");
220fa9e4066Sahrens 	exit(1);
221fa9e4066Sahrens }
222fa9e4066Sahrens 
22329bdd2f9SPavel Zakharov static void
22429bdd2f9SPavel Zakharov dump_debug_buffer()
22529bdd2f9SPavel Zakharov {
22629bdd2f9SPavel Zakharov 	if (dump_opt['G']) {
22729bdd2f9SPavel Zakharov 		(void) printf("\n");
22829bdd2f9SPavel Zakharov 		zfs_dbgmsg_print("zdb");
22929bdd2f9SPavel Zakharov 	}
23029bdd2f9SPavel Zakharov }
23129bdd2f9SPavel Zakharov 
232ccba0801SRich Morris /*
233ccba0801SRich Morris  * Called for usage errors that are discovered after a call to spa_open(),
234ccba0801SRich Morris  * dmu_bonus_hold(), or pool_match().  abort() is called for other errors.
235ccba0801SRich Morris  */
236ccba0801SRich Morris 
237fa9e4066Sahrens static void
238fa9e4066Sahrens fatal(const char *fmt, ...)
239fa9e4066Sahrens {
240fa9e4066Sahrens 	va_list ap;
241fa9e4066Sahrens 
242fa9e4066Sahrens 	va_start(ap, fmt);
243fa9e4066Sahrens 	(void) fprintf(stderr, "%s: ", cmdname);
244fa9e4066Sahrens 	(void) vfprintf(stderr, fmt, ap);
245fa9e4066Sahrens 	va_end(ap);
246fa9e4066Sahrens 	(void) fprintf(stderr, "\n");
247fa9e4066Sahrens 
24829bdd2f9SPavel Zakharov 	dump_debug_buffer();
24929bdd2f9SPavel Zakharov 
250ccba0801SRich Morris 	exit(1);
251fa9e4066Sahrens }
252fa9e4066Sahrens 
253fa9e4066Sahrens /* ARGSUSED */
254fa9e4066Sahrens static void
255fa9e4066Sahrens dump_packed_nvlist(objset_t *os, uint64_t object, void *data, size_t size)
256fa9e4066Sahrens {
257fa9e4066Sahrens 	nvlist_t *nv;
258fa9e4066Sahrens 	size_t nvsize = *(uint64_t *)data;
259fa9e4066Sahrens 	char *packed = umem_alloc(nvsize, UMEM_NOFAIL);
260fa9e4066Sahrens 
2617bfdf011SNeil Perrin 	VERIFY(0 == dmu_read(os, object, 0, nvsize, packed, DMU_READ_PREFETCH));
262fa9e4066Sahrens 
263fa9e4066Sahrens 	VERIFY(nvlist_unpack(packed, nvsize, &nv, 0) == 0);
264fa9e4066Sahrens 
265fa9e4066Sahrens 	umem_free(packed, nvsize);
266fa9e4066Sahrens 
267fa9e4066Sahrens 	dump_nvlist(nv, 8);
268fa9e4066Sahrens 
269fa9e4066Sahrens 	nvlist_free(nv);
270fa9e4066Sahrens }
271fa9e4066Sahrens 
2724445fffbSMatthew Ahrens /* ARGSUSED */
2734445fffbSMatthew Ahrens static void
2744445fffbSMatthew Ahrens dump_history_offsets(objset_t *os, uint64_t object, void *data, size_t size)
2754445fffbSMatthew Ahrens {
2764445fffbSMatthew Ahrens 	spa_history_phys_t *shp = data;
2774445fffbSMatthew Ahrens 
2784445fffbSMatthew Ahrens 	if (shp == NULL)
2794445fffbSMatthew Ahrens 		return;
2804445fffbSMatthew Ahrens 
2814445fffbSMatthew Ahrens 	(void) printf("\t\tpool_create_len = %llu\n",
2824445fffbSMatthew Ahrens 	    (u_longlong_t)shp->sh_pool_create_len);
2834445fffbSMatthew Ahrens 	(void) printf("\t\tphys_max_off = %llu\n",
2844445fffbSMatthew Ahrens 	    (u_longlong_t)shp->sh_phys_max_off);
2854445fffbSMatthew Ahrens 	(void) printf("\t\tbof = %llu\n",
2864445fffbSMatthew Ahrens 	    (u_longlong_t)shp->sh_bof);
2874445fffbSMatthew Ahrens 	(void) printf("\t\teof = %llu\n",
2884445fffbSMatthew Ahrens 	    (u_longlong_t)shp->sh_eof);
2894445fffbSMatthew Ahrens 	(void) printf("\t\trecords_lost = %llu\n",
2904445fffbSMatthew Ahrens 	    (u_longlong_t)shp->sh_records_lost);
2914445fffbSMatthew Ahrens }
2924445fffbSMatthew Ahrens 
2933f9d6ad7SLin Ling static void
2940a055120SJason King zdb_nicenum(uint64_t num, char *buf, size_t buflen)
2953f9d6ad7SLin Ling {
2963f9d6ad7SLin Ling 	if (dump_opt['P'])
2970a055120SJason King 		(void) snprintf(buf, buflen, "%llu", (longlong_t)num);
2983f9d6ad7SLin Ling 	else
2990a055120SJason King 		nicenum(num, buf, sizeof (buf));
3003f9d6ad7SLin Ling }
3013f9d6ad7SLin Ling 
3023f7978d0SAlan Somers static const char histo_stars[] = "****************************************";
3033f7978d0SAlan Somers static const uint64_t histo_width = sizeof (histo_stars) - 1;
304fa9e4066Sahrens 
305fa9e4066Sahrens static void
3060713e232SGeorge Wilson dump_histogram(const uint64_t *histo, int size, int offset)
307fa9e4066Sahrens {
308fa9e4066Sahrens 	int i;
309490d05b9SMatthew Ahrens 	int minidx = size - 1;
310fa9e4066Sahrens 	int maxidx = 0;
311fa9e4066Sahrens 	uint64_t max = 0;
312fa9e4066Sahrens 
313490d05b9SMatthew Ahrens 	for (i = 0; i < size; i++) {
314fa9e4066Sahrens 		if (histo[i] > max)
315fa9e4066Sahrens 			max = histo[i];
316fa9e4066Sahrens 		if (histo[i] > 0 && i > maxidx)
317fa9e4066Sahrens 			maxidx = i;
318fa9e4066Sahrens 		if (histo[i] > 0 && i < minidx)
319fa9e4066Sahrens 			minidx = i;
320fa9e4066Sahrens 	}
321fa9e4066Sahrens 
322490d05b9SMatthew Ahrens 	if (max < histo_width)
323490d05b9SMatthew Ahrens 		max = histo_width;
324fa9e4066Sahrens 
325490d05b9SMatthew Ahrens 	for (i = minidx; i <= maxidx; i++) {
326490d05b9SMatthew Ahrens 		(void) printf("\t\t\t%3u: %6llu %s\n",
3270713e232SGeorge Wilson 		    i + offset, (u_longlong_t)histo[i],
328490d05b9SMatthew Ahrens 		    &histo_stars[(max - histo[i]) * histo_width / max]);
329490d05b9SMatthew Ahrens 	}
330fa9e4066Sahrens }
331fa9e4066Sahrens 
332fa9e4066Sahrens static void
333fa9e4066Sahrens dump_zap_stats(objset_t *os, uint64_t object)
334fa9e4066Sahrens {
335fa9e4066Sahrens 	int error;
336fa9e4066Sahrens 	zap_stats_t zs;
337fa9e4066Sahrens 
338fa9e4066Sahrens 	error = zap_get_stats(os, object, &zs);
339fa9e4066Sahrens 	if (error)
340fa9e4066Sahrens 		return;
341fa9e4066Sahrens 
342fa9e4066Sahrens 	if (zs.zs_ptrtbl_len == 0) {
343fa9e4066Sahrens 		ASSERT(zs.zs_num_blocks == 1);
344fa9e4066Sahrens 		(void) printf("\tmicrozap: %llu bytes, %llu entries\n",
345fa9e4066Sahrens 		    (u_longlong_t)zs.zs_blocksize,
346fa9e4066Sahrens 		    (u_longlong_t)zs.zs_num_entries);
347fa9e4066Sahrens 		return;
348fa9e4066Sahrens 	}
349fa9e4066Sahrens 
350fa9e4066Sahrens 	(void) printf("\tFat ZAP stats:\n");
3518248818dSnd 
3528248818dSnd 	(void) printf("\t\tPointer table:\n");
3538248818dSnd 	(void) printf("\t\t\t%llu elements\n",
354fa9e4066Sahrens 	    (u_longlong_t)zs.zs_ptrtbl_len);
3558248818dSnd 	(void) printf("\t\t\tzt_blk: %llu\n",
3568248818dSnd 	    (u_longlong_t)zs.zs_ptrtbl_zt_blk);
3578248818dSnd 	(void) printf("\t\t\tzt_numblks: %llu\n",
3588248818dSnd 	    (u_longlong_t)zs.zs_ptrtbl_zt_numblks);
3598248818dSnd 	(void) printf("\t\t\tzt_shift: %llu\n",
3608248818dSnd 	    (u_longlong_t)zs.zs_ptrtbl_zt_shift);
3618248818dSnd 	(void) printf("\t\t\tzt_blks_copied: %llu\n",
3628248818dSnd 	    (u_longlong_t)zs.zs_ptrtbl_blks_copied);
3638248818dSnd 	(void) printf("\t\t\tzt_nextblk: %llu\n",
3648248818dSnd 	    (u_longlong_t)zs.zs_ptrtbl_nextblk);
3658248818dSnd 
366fa9e4066Sahrens 	(void) printf("\t\tZAP entries: %llu\n",
367fa9e4066Sahrens 	    (u_longlong_t)zs.zs_num_entries);
368fa9e4066Sahrens 	(void) printf("\t\tLeaf blocks: %llu\n",
369fa9e4066Sahrens 	    (u_longlong_t)zs.zs_num_leafs);
370fa9e4066Sahrens 	(void) printf("\t\tTotal blocks: %llu\n",
371fa9e4066Sahrens 	    (u_longlong_t)zs.zs_num_blocks);
3728248818dSnd 	(void) printf("\t\tzap_block_type: 0x%llx\n",
3738248818dSnd 	    (u_longlong_t)zs.zs_block_type);
3748248818dSnd 	(void) printf("\t\tzap_magic: 0x%llx\n",
3758248818dSnd 	    (u_longlong_t)zs.zs_magic);
3768248818dSnd 	(void) printf("\t\tzap_salt: 0x%llx\n",
3778248818dSnd 	    (u_longlong_t)zs.zs_salt);
378fa9e4066Sahrens 
379fa9e4066Sahrens 	(void) printf("\t\tLeafs with 2^n pointers:\n");
3800713e232SGeorge Wilson 	dump_histogram(zs.zs_leafs_with_2n_pointers, ZAP_HISTOGRAM_SIZE, 0);
381fa9e4066Sahrens 
382fa9e4066Sahrens 	(void) printf("\t\tBlocks with n*5 entries:\n");
3830713e232SGeorge Wilson 	dump_histogram(zs.zs_blocks_with_n5_entries, ZAP_HISTOGRAM_SIZE, 0);
384fa9e4066Sahrens 
385fa9e4066Sahrens 	(void) printf("\t\tBlocks n/10 full:\n");
3860713e232SGeorge Wilson 	dump_histogram(zs.zs_blocks_n_tenths_full, ZAP_HISTOGRAM_SIZE, 0);
387fa9e4066Sahrens 
388fa9e4066Sahrens 	(void) printf("\t\tEntries with n chunks:\n");
3890713e232SGeorge Wilson 	dump_histogram(zs.zs_entries_using_n_chunks, ZAP_HISTOGRAM_SIZE, 0);
390fa9e4066Sahrens 
391fa9e4066Sahrens 	(void) printf("\t\tBuckets with n entries:\n");
3920713e232SGeorge Wilson 	dump_histogram(zs.zs_buckets_with_n_entries, ZAP_HISTOGRAM_SIZE, 0);
393fa9e4066Sahrens }
394fa9e4066Sahrens 
395fa9e4066Sahrens /*ARGSUSED*/
396fa9e4066Sahrens static void
397fa9e4066Sahrens dump_none(objset_t *os, uint64_t object, void *data, size_t size)
398fa9e4066Sahrens {
399fa9e4066Sahrens }
400fa9e4066Sahrens 
4016de8f417SVictor Latushkin /*ARGSUSED*/
4026de8f417SVictor Latushkin static void
4036de8f417SVictor Latushkin dump_unknown(objset_t *os, uint64_t object, void *data, size_t size)
4046de8f417SVictor Latushkin {
4056de8f417SVictor Latushkin 	(void) printf("\tUNKNOWN OBJECT TYPE\n");
4066de8f417SVictor Latushkin }
4076de8f417SVictor Latushkin 
408fa9e4066Sahrens /*ARGSUSED*/
4093f7978d0SAlan Somers static void
410fa9e4066Sahrens dump_uint8(objset_t *os, uint64_t object, void *data, size_t size)
411fa9e4066Sahrens {
412fa9e4066Sahrens }
413fa9e4066Sahrens 
414fa9e4066Sahrens /*ARGSUSED*/
415fa9e4066Sahrens static void
416fa9e4066Sahrens dump_uint64(objset_t *os, uint64_t object, void *data, size_t size)
417fa9e4066Sahrens {
418fa9e4066Sahrens }
419fa9e4066Sahrens 
420fa9e4066Sahrens /*ARGSUSED*/
421fa9e4066Sahrens static void
422fa9e4066Sahrens dump_zap(objset_t *os, uint64_t object, void *data, size_t size)
423fa9e4066Sahrens {
424fa9e4066Sahrens 	zap_cursor_t zc;
425fa9e4066Sahrens 	zap_attribute_t attr;
426fa9e4066Sahrens 	void *prop;
4273f7978d0SAlan Somers 	unsigned i;
428fa9e4066Sahrens 
429fa9e4066Sahrens 	dump_zap_stats(os, object);
430fa9e4066Sahrens 	(void) printf("\n");
431fa9e4066Sahrens 
432fa9e4066Sahrens 	for (zap_cursor_init(&zc, os, object);
433fa9e4066Sahrens 	    zap_cursor_retrieve(&zc, &attr) == 0;
434fa9e4066Sahrens 	    zap_cursor_advance(&zc)) {
435fa9e4066Sahrens 		(void) printf("\t\t%s = ", attr.za_name);
436fa9e4066Sahrens 		if (attr.za_num_integers == 0) {
437fa9e4066Sahrens 			(void) printf("\n");
438fa9e4066Sahrens 			continue;
439fa9e4066Sahrens 		}
440fa9e4066Sahrens 		prop = umem_zalloc(attr.za_num_integers *
441fa9e4066Sahrens 		    attr.za_integer_length, UMEM_NOFAIL);
442fa9e4066Sahrens 		(void) zap_lookup(os, object, attr.za_name,
443fa9e4066Sahrens 		    attr.za_integer_length, attr.za_num_integers, prop);
444fa9e4066Sahrens 		if (attr.za_integer_length == 1) {
445fa9e4066Sahrens 			(void) printf("%s", (char *)prop);
446fa9e4066Sahrens 		} else {
447fa9e4066Sahrens 			for (i = 0; i < attr.za_num_integers; i++) {
448fa9e4066Sahrens 				switch (attr.za_integer_length) {
449fa9e4066Sahrens 				case 2:
450fa9e4066Sahrens 					(void) printf("%u ",
451fa9e4066Sahrens 					    ((uint16_t *)prop)[i]);
452fa9e4066Sahrens 					break;
453fa9e4066Sahrens 				case 4:
454fa9e4066Sahrens 					(void) printf("%u ",
455fa9e4066Sahrens 					    ((uint32_t *)prop)[i]);
456fa9e4066Sahrens 					break;
457fa9e4066Sahrens 				case 8:
458fa9e4066Sahrens 					(void) printf("%lld ",
459fa9e4066Sahrens 					    (u_longlong_t)((int64_t *)prop)[i]);
460fa9e4066Sahrens 					break;
461fa9e4066Sahrens 				}
462fa9e4066Sahrens 			}
463fa9e4066Sahrens 		}
464fa9e4066Sahrens 		(void) printf("\n");
465fa9e4066Sahrens 		umem_free(prop, attr.za_num_integers * attr.za_integer_length);
466fa9e4066Sahrens 	}
46787e5029aSahrens 	zap_cursor_fini(&zc);
468fa9e4066Sahrens }
469fa9e4066Sahrens 
470732885fcSMatthew Ahrens static void
471732885fcSMatthew Ahrens dump_bpobj(objset_t *os, uint64_t object, void *data, size_t size)
472732885fcSMatthew Ahrens {
473732885fcSMatthew Ahrens 	bpobj_phys_t *bpop = data;
474732885fcSMatthew Ahrens 	char bytes[32], comp[32], uncomp[32];
475732885fcSMatthew Ahrens 
4760a055120SJason King 	/* make sure the output won't get truncated */
4770a055120SJason King 	CTASSERT(sizeof (bytes) >= NN_NUMBUF_SZ);
4780a055120SJason King 	CTASSERT(sizeof (comp) >= NN_NUMBUF_SZ);
4790a055120SJason King 	CTASSERT(sizeof (uncomp) >= NN_NUMBUF_SZ);
4800a055120SJason King 
481732885fcSMatthew Ahrens 	if (bpop == NULL)
482732885fcSMatthew Ahrens 		return;
483732885fcSMatthew Ahrens 
4840a055120SJason King 	zdb_nicenum(bpop->bpo_bytes, bytes, sizeof (bytes));
4850a055120SJason King 	zdb_nicenum(bpop->bpo_comp, comp, sizeof (comp));
4860a055120SJason King 	zdb_nicenum(bpop->bpo_uncomp, uncomp, sizeof (uncomp));
487732885fcSMatthew Ahrens 
488732885fcSMatthew Ahrens 	(void) printf("\t\tnum_blkptrs = %llu\n",
489732885fcSMatthew Ahrens 	    (u_longlong_t)bpop->bpo_num_blkptrs);
490732885fcSMatthew Ahrens 	(void) printf("\t\tbytes = %s\n", bytes);
491732885fcSMatthew Ahrens 	if (size >= BPOBJ_SIZE_V1) {
492732885fcSMatthew Ahrens 		(void) printf("\t\tcomp = %s\n", comp);
493732885fcSMatthew Ahrens 		(void) printf("\t\tuncomp = %s\n", uncomp);
494732885fcSMatthew Ahrens 	}
495732885fcSMatthew Ahrens 	if (size >= sizeof (*bpop)) {
496732885fcSMatthew Ahrens 		(void) printf("\t\tsubobjs = %llu\n",
497732885fcSMatthew Ahrens 		    (u_longlong_t)bpop->bpo_subobjs);
498732885fcSMatthew Ahrens 		(void) printf("\t\tnum_subobjs = %llu\n",
499732885fcSMatthew Ahrens 		    (u_longlong_t)bpop->bpo_num_subobjs);
500732885fcSMatthew Ahrens 	}
501732885fcSMatthew Ahrens 
502732885fcSMatthew Ahrens 	if (dump_opt['d'] < 5)
503732885fcSMatthew Ahrens 		return;
504732885fcSMatthew Ahrens 
505732885fcSMatthew Ahrens 	for (uint64_t i = 0; i < bpop->bpo_num_blkptrs; i++) {
506732885fcSMatthew Ahrens 		char blkbuf[BP_SPRINTF_LEN];
507732885fcSMatthew Ahrens 		blkptr_t bp;
508732885fcSMatthew Ahrens 
509732885fcSMatthew Ahrens 		int err = dmu_read(os, object,
510732885fcSMatthew Ahrens 		    i * sizeof (bp), sizeof (bp), &bp, 0);
511732885fcSMatthew Ahrens 		if (err != 0) {
512732885fcSMatthew Ahrens 			(void) printf("got error %u from dmu_read\n", err);
513732885fcSMatthew Ahrens 			break;
514732885fcSMatthew Ahrens 		}
515732885fcSMatthew Ahrens 		snprintf_blkptr_compact(blkbuf, sizeof (blkbuf), &bp);
516732885fcSMatthew Ahrens 		(void) printf("\t%s\n", blkbuf);
517732885fcSMatthew Ahrens 	}
518732885fcSMatthew Ahrens }
519732885fcSMatthew Ahrens 
520732885fcSMatthew Ahrens /* ARGSUSED */
521732885fcSMatthew Ahrens static void
522732885fcSMatthew Ahrens dump_bpobj_subobjs(objset_t *os, uint64_t object, void *data, size_t size)
523732885fcSMatthew Ahrens {
524732885fcSMatthew Ahrens 	dmu_object_info_t doi;
525732885fcSMatthew Ahrens 
526732885fcSMatthew Ahrens 	VERIFY0(dmu_object_info(os, object, &doi));
527732885fcSMatthew Ahrens 	uint64_t *subobjs = kmem_alloc(doi.doi_max_offset, KM_SLEEP);
528732885fcSMatthew Ahrens 
529732885fcSMatthew Ahrens 	int err = dmu_read(os, object, 0, doi.doi_max_offset, subobjs, 0);
530732885fcSMatthew Ahrens 	if (err != 0) {
531732885fcSMatthew Ahrens 		(void) printf("got error %u from dmu_read\n", err);
532732885fcSMatthew Ahrens 		kmem_free(subobjs, doi.doi_max_offset);
533732885fcSMatthew Ahrens 		return;
534732885fcSMatthew Ahrens 	}
535732885fcSMatthew Ahrens 
536732885fcSMatthew Ahrens 	int64_t last_nonzero = -1;
537732885fcSMatthew Ahrens 	for (uint64_t i = 0; i < doi.doi_max_offset / 8; i++) {
538732885fcSMatthew Ahrens 		if (subobjs[i] != 0)
539732885fcSMatthew Ahrens 			last_nonzero = i;
540732885fcSMatthew Ahrens 	}
541732885fcSMatthew Ahrens 
542732885fcSMatthew Ahrens 	for (int64_t i = 0; i <= last_nonzero; i++) {
543732885fcSMatthew Ahrens 		(void) printf("\t%llu\n", (longlong_t)subobjs[i]);
544732885fcSMatthew Ahrens 	}
545732885fcSMatthew Ahrens 	kmem_free(subobjs, doi.doi_max_offset);
546732885fcSMatthew Ahrens }
547732885fcSMatthew Ahrens 
548486ae710SMatthew Ahrens /*ARGSUSED*/
549486ae710SMatthew Ahrens static void
550486ae710SMatthew Ahrens dump_ddt_zap(objset_t *os, uint64_t object, void *data, size_t size)
551486ae710SMatthew Ahrens {
552486ae710SMatthew Ahrens 	dump_zap_stats(os, object);
553486ae710SMatthew Ahrens 	/* contents are printed elsewhere, properly decoded */
554486ae710SMatthew Ahrens }
555486ae710SMatthew Ahrens 
5560a586ceaSMark Shellenbaum /*ARGSUSED*/
5570a586ceaSMark Shellenbaum static void
5580a586ceaSMark Shellenbaum dump_sa_attrs(objset_t *os, uint64_t object, void *data, size_t size)
5590a586ceaSMark Shellenbaum {
5600a586ceaSMark Shellenbaum 	zap_cursor_t zc;
5610a586ceaSMark Shellenbaum 	zap_attribute_t attr;
5620a586ceaSMark Shellenbaum 
5630a586ceaSMark Shellenbaum 	dump_zap_stats(os, object);
5640a586ceaSMark Shellenbaum 	(void) printf("\n");
5650a586ceaSMark Shellenbaum 
5660a586ceaSMark Shellenbaum 	for (zap_cursor_init(&zc, os, object);
5670a586ceaSMark Shellenbaum 	    zap_cursor_retrieve(&zc, &attr) == 0;
5680a586ceaSMark Shellenbaum 	    zap_cursor_advance(&zc)) {
5690a586ceaSMark Shellenbaum 		(void) printf("\t\t%s = ", attr.za_name);
5700a586ceaSMark Shellenbaum 		if (attr.za_num_integers == 0) {
5710a586ceaSMark Shellenbaum 			(void) printf("\n");
5720a586ceaSMark Shellenbaum 			continue;
5730a586ceaSMark Shellenbaum 		}
5740a586ceaSMark Shellenbaum 		(void) printf(" %llx : [%d:%d:%d]\n",
5750a586ceaSMark Shellenbaum 		    (u_longlong_t)attr.za_first_integer,
5760a586ceaSMark Shellenbaum 		    (int)ATTR_LENGTH(attr.za_first_integer),
5770a586ceaSMark Shellenbaum 		    (int)ATTR_BSWAP(attr.za_first_integer),
5780a586ceaSMark Shellenbaum 		    (int)ATTR_NUM(attr.za_first_integer));
5790a586ceaSMark Shellenbaum 	}
5800a586ceaSMark Shellenbaum 	zap_cursor_fini(&zc);
5810a586ceaSMark Shellenbaum }
5820a586ceaSMark Shellenbaum 
5830a586ceaSMark Shellenbaum /*ARGSUSED*/
5840a586ceaSMark Shellenbaum static void
5850a586ceaSMark Shellenbaum dump_sa_layouts(objset_t *os, uint64_t object, void *data, size_t size)
5860a586ceaSMark Shellenbaum {
5870a586ceaSMark Shellenbaum 	zap_cursor_t zc;
5880a586ceaSMark Shellenbaum 	zap_attribute_t attr;
5890a586ceaSMark Shellenbaum 	uint16_t *layout_attrs;
5903f7978d0SAlan Somers 	unsigned i;
5910a586ceaSMark Shellenbaum 
5920a586ceaSMark Shellenbaum 	dump_zap_stats(os, object);
5930a586ceaSMark Shellenbaum 	(void) printf("\n");
5940a586ceaSMark Shellenbaum 
5950a586ceaSMark Shellenbaum 	for (zap_cursor_init(&zc, os, object);
5960a586ceaSMark Shellenbaum 	    zap_cursor_retrieve(&zc, &attr) == 0;
5970a586ceaSMark Shellenbaum 	    zap_cursor_advance(&zc)) {
5980a586ceaSMark Shellenbaum 		(void) printf("\t\t%s = [", attr.za_name);
5990a586ceaSMark Shellenbaum 		if (attr.za_num_integers == 0) {
6000a586ceaSMark Shellenbaum 			(void) printf("\n");
6010a586ceaSMark Shellenbaum 			continue;
6020a586ceaSMark Shellenbaum 		}
6030a586ceaSMark Shellenbaum 
6040a586ceaSMark Shellenbaum 		VERIFY(attr.za_integer_length == 2);
6050a586ceaSMark Shellenbaum 		layout_attrs = umem_zalloc(attr.za_num_integers *
6060a586ceaSMark Shellenbaum 		    attr.za_integer_length, UMEM_NOFAIL);
6070a586ceaSMark Shellenbaum 
6080a586ceaSMark Shellenbaum 		VERIFY(zap_lookup(os, object, attr.za_name,
6090a586ceaSMark Shellenbaum 		    attr.za_integer_length,
6100a586ceaSMark Shellenbaum 		    attr.za_num_integers, layout_attrs) == 0);
6110a586ceaSMark Shellenbaum 
6120a586ceaSMark Shellenbaum 		for (i = 0; i != attr.za_num_integers; i++)
6130a586ceaSMark Shellenbaum 			(void) printf(" %d ", (int)layout_attrs[i]);
6140a586ceaSMark Shellenbaum 		(void) printf("]\n");
6150a586ceaSMark Shellenbaum 		umem_free(layout_attrs,
6160a586ceaSMark Shellenbaum 		    attr.za_num_integers * attr.za_integer_length);
6170a586ceaSMark Shellenbaum 	}
6180a586ceaSMark Shellenbaum 	zap_cursor_fini(&zc);
6190a586ceaSMark Shellenbaum }
6200a586ceaSMark Shellenbaum 
621e7437265Sahrens /*ARGSUSED*/
622e7437265Sahrens static void
623e7437265Sahrens dump_zpldir(objset_t *os, uint64_t object, void *data, size_t size)
624e7437265Sahrens {
625e7437265Sahrens 	zap_cursor_t zc;
626e7437265Sahrens 	zap_attribute_t attr;
627e7437265Sahrens 	const char *typenames[] = {
628e7437265Sahrens 		/* 0 */ "not specified",
629e7437265Sahrens 		/* 1 */ "FIFO",
630e7437265Sahrens 		/* 2 */ "Character Device",
631e7437265Sahrens 		/* 3 */ "3 (invalid)",
632e7437265Sahrens 		/* 4 */ "Directory",
633e7437265Sahrens 		/* 5 */ "5 (invalid)",
634e7437265Sahrens 		/* 6 */ "Block Device",
635e7437265Sahrens 		/* 7 */ "7 (invalid)",
636e7437265Sahrens 		/* 8 */ "Regular File",
637e7437265Sahrens 		/* 9 */ "9 (invalid)",
638e7437265Sahrens 		/* 10 */ "Symbolic Link",
639e7437265Sahrens 		/* 11 */ "11 (invalid)",
640e7437265Sahrens 		/* 12 */ "Socket",
641e7437265Sahrens 		/* 13 */ "Door",
642e7437265Sahrens 		/* 14 */ "Event Port",
643e7437265Sahrens 		/* 15 */ "15 (invalid)",
644e7437265Sahrens 	};
645e7437265Sahrens 
646e7437265Sahrens 	dump_zap_stats(os, object);
647e7437265Sahrens 	(void) printf("\n");
648e7437265Sahrens 
649e7437265Sahrens 	for (zap_cursor_init(&zc, os, object);
650e7437265Sahrens 	    zap_cursor_retrieve(&zc, &attr) == 0;
651e7437265Sahrens 	    zap_cursor_advance(&zc)) {
652e7437265Sahrens 		(void) printf("\t\t%s = %lld (type: %s)\n",
653e7437265Sahrens 		    attr.za_name, ZFS_DIRENT_OBJ(attr.za_first_integer),
654e7437265Sahrens 		    typenames[ZFS_DIRENT_TYPE(attr.za_first_integer)]);
655e7437265Sahrens 	}
656e7437265Sahrens 	zap_cursor_fini(&zc);
657e7437265Sahrens }
658e7437265Sahrens 
6593f7978d0SAlan Somers static int
6600713e232SGeorge Wilson get_dtl_refcount(vdev_t *vd)
6610713e232SGeorge Wilson {
6620713e232SGeorge Wilson 	int refcount = 0;
6630713e232SGeorge Wilson 
6640713e232SGeorge Wilson 	if (vd->vdev_ops->vdev_op_leaf) {
6650713e232SGeorge Wilson 		space_map_t *sm = vd->vdev_dtl_sm;
6660713e232SGeorge Wilson 
6670713e232SGeorge Wilson 		if (sm != NULL &&
6680713e232SGeorge Wilson 		    sm->sm_dbuf->db_size == sizeof (space_map_phys_t))
6690713e232SGeorge Wilson 			return (1);
6700713e232SGeorge Wilson 		return (0);
6710713e232SGeorge Wilson 	}
6720713e232SGeorge Wilson 
6733f7978d0SAlan Somers 	for (unsigned c = 0; c < vd->vdev_children; c++)
6740713e232SGeorge Wilson 		refcount += get_dtl_refcount(vd->vdev_child[c]);
6750713e232SGeorge Wilson 	return (refcount);
6760713e232SGeorge Wilson }
6770713e232SGeorge Wilson 
6783f7978d0SAlan Somers static int
6790713e232SGeorge Wilson get_metaslab_refcount(vdev_t *vd)
6800713e232SGeorge Wilson {
6810713e232SGeorge Wilson 	int refcount = 0;
6820713e232SGeorge Wilson 
6835cabbc6bSPrashanth Sreenivasa 	if (vd->vdev_top == vd) {
6845cabbc6bSPrashanth Sreenivasa 		for (uint64_t m = 0; m < vd->vdev_ms_count; m++) {
6850713e232SGeorge Wilson 			space_map_t *sm = vd->vdev_ms[m]->ms_sm;
6860713e232SGeorge Wilson 
6870713e232SGeorge Wilson 			if (sm != NULL &&
6880713e232SGeorge Wilson 			    sm->sm_dbuf->db_size == sizeof (space_map_phys_t))
6890713e232SGeorge Wilson 				refcount++;
6900713e232SGeorge Wilson 		}
6910713e232SGeorge Wilson 	}
6923f7978d0SAlan Somers 	for (unsigned c = 0; c < vd->vdev_children; c++)
6930713e232SGeorge Wilson 		refcount += get_metaslab_refcount(vd->vdev_child[c]);
6940713e232SGeorge Wilson 
6950713e232SGeorge Wilson 	return (refcount);
6960713e232SGeorge Wilson }
6970713e232SGeorge Wilson 
6985cabbc6bSPrashanth Sreenivasa static int
6995cabbc6bSPrashanth Sreenivasa get_obsolete_refcount(vdev_t *vd)
7005cabbc6bSPrashanth Sreenivasa {
7015cabbc6bSPrashanth Sreenivasa 	int refcount = 0;
7025cabbc6bSPrashanth Sreenivasa 
7035cabbc6bSPrashanth Sreenivasa 	uint64_t obsolete_sm_obj = vdev_obsolete_sm_object(vd);
7045cabbc6bSPrashanth Sreenivasa 	if (vd->vdev_top == vd && obsolete_sm_obj != 0) {
7055cabbc6bSPrashanth Sreenivasa 		dmu_object_info_t doi;
7065cabbc6bSPrashanth Sreenivasa 		VERIFY0(dmu_object_info(vd->vdev_spa->spa_meta_objset,
7075cabbc6bSPrashanth Sreenivasa 		    obsolete_sm_obj, &doi));
7085cabbc6bSPrashanth Sreenivasa 		if (doi.doi_bonus_size == sizeof (space_map_phys_t)) {
7095cabbc6bSPrashanth Sreenivasa 			refcount++;
7105cabbc6bSPrashanth Sreenivasa 		}
7115cabbc6bSPrashanth Sreenivasa 	} else {
7125cabbc6bSPrashanth Sreenivasa 		ASSERT3P(vd->vdev_obsolete_sm, ==, NULL);
7135cabbc6bSPrashanth Sreenivasa 		ASSERT3U(obsolete_sm_obj, ==, 0);
7145cabbc6bSPrashanth Sreenivasa 	}
7155cabbc6bSPrashanth Sreenivasa 	for (unsigned c = 0; c < vd->vdev_children; c++) {
7165cabbc6bSPrashanth Sreenivasa 		refcount += get_obsolete_refcount(vd->vdev_child[c]);
7175cabbc6bSPrashanth Sreenivasa 	}
7185cabbc6bSPrashanth Sreenivasa 
7195cabbc6bSPrashanth Sreenivasa 	return (refcount);
7205cabbc6bSPrashanth Sreenivasa }
7215cabbc6bSPrashanth Sreenivasa 
7225cabbc6bSPrashanth Sreenivasa static int
7235cabbc6bSPrashanth Sreenivasa get_prev_obsolete_spacemap_refcount(spa_t *spa)
7245cabbc6bSPrashanth Sreenivasa {
7255cabbc6bSPrashanth Sreenivasa 	uint64_t prev_obj =
7265cabbc6bSPrashanth Sreenivasa 	    spa->spa_condensing_indirect_phys.scip_prev_obsolete_sm_object;
7275cabbc6bSPrashanth Sreenivasa 	if (prev_obj != 0) {
7285cabbc6bSPrashanth Sreenivasa 		dmu_object_info_t doi;
7295cabbc6bSPrashanth Sreenivasa 		VERIFY0(dmu_object_info(spa->spa_meta_objset, prev_obj, &doi));
7305cabbc6bSPrashanth Sreenivasa 		if (doi.doi_bonus_size == sizeof (space_map_phys_t)) {
7315cabbc6bSPrashanth Sreenivasa 			return (1);
7325cabbc6bSPrashanth Sreenivasa 		}
7335cabbc6bSPrashanth Sreenivasa 	}
7345cabbc6bSPrashanth Sreenivasa 	return (0);
7355cabbc6bSPrashanth Sreenivasa }
7365cabbc6bSPrashanth Sreenivasa 
73786714001SSerapheim Dimitropoulos static int
73886714001SSerapheim Dimitropoulos get_checkpoint_refcount(vdev_t *vd)
73986714001SSerapheim Dimitropoulos {
74086714001SSerapheim Dimitropoulos 	int refcount = 0;
74186714001SSerapheim Dimitropoulos 
74286714001SSerapheim Dimitropoulos 	if (vd->vdev_top == vd && vd->vdev_top_zap != 0 &&
74386714001SSerapheim Dimitropoulos 	    zap_contains(spa_meta_objset(vd->vdev_spa),
74486714001SSerapheim Dimitropoulos 	    vd->vdev_top_zap, VDEV_TOP_ZAP_POOL_CHECKPOINT_SM) == 0)
74586714001SSerapheim Dimitropoulos 		refcount++;
74686714001SSerapheim Dimitropoulos 
74786714001SSerapheim Dimitropoulos 	for (uint64_t c = 0; c < vd->vdev_children; c++)
74886714001SSerapheim Dimitropoulos 		refcount += get_checkpoint_refcount(vd->vdev_child[c]);
74986714001SSerapheim Dimitropoulos 
75086714001SSerapheim Dimitropoulos 	return (refcount);
75186714001SSerapheim Dimitropoulos }
75286714001SSerapheim Dimitropoulos 
7530713e232SGeorge Wilson static int
7540713e232SGeorge Wilson verify_spacemap_refcounts(spa_t *spa)
7550713e232SGeorge Wilson {
7562acef22dSMatthew Ahrens 	uint64_t expected_refcount = 0;
7572acef22dSMatthew Ahrens 	uint64_t actual_refcount;
7580713e232SGeorge Wilson 
7592acef22dSMatthew Ahrens 	(void) feature_get_refcount(spa,
7602acef22dSMatthew Ahrens 	    &spa_feature_table[SPA_FEATURE_SPACEMAP_HISTOGRAM],
7612acef22dSMatthew Ahrens 	    &expected_refcount);
7620713e232SGeorge Wilson 	actual_refcount = get_dtl_refcount(spa->spa_root_vdev);
7630713e232SGeorge Wilson 	actual_refcount += get_metaslab_refcount(spa->spa_root_vdev);
7645cabbc6bSPrashanth Sreenivasa 	actual_refcount += get_obsolete_refcount(spa->spa_root_vdev);
7655cabbc6bSPrashanth Sreenivasa 	actual_refcount += get_prev_obsolete_spacemap_refcount(spa);
76686714001SSerapheim Dimitropoulos 	actual_refcount += get_checkpoint_refcount(spa->spa_root_vdev);
7670713e232SGeorge Wilson 
7680713e232SGeorge Wilson 	if (expected_refcount != actual_refcount) {
7692acef22dSMatthew Ahrens 		(void) printf("space map refcount mismatch: expected %lld != "
7702acef22dSMatthew Ahrens 		    "actual %lld\n",
7712acef22dSMatthew Ahrens 		    (longlong_t)expected_refcount,
7722acef22dSMatthew Ahrens 		    (longlong_t)actual_refcount);
7730713e232SGeorge Wilson 		return (2);
7740713e232SGeorge Wilson 	}
7750713e232SGeorge Wilson 	return (0);
7760713e232SGeorge Wilson }
7770713e232SGeorge Wilson 
778fa9e4066Sahrens static void
7790713e232SGeorge Wilson dump_spacemap(objset_t *os, space_map_t *sm)
780fa9e4066Sahrens {
7815cabbc6bSPrashanth Sreenivasa 	char *ddata[] = { "ALLOC", "FREE", "CONDENSE", "INVALID",
7825cabbc6bSPrashanth Sreenivasa 	    "INVALID", "INVALID", "INVALID", "INVALID" };
783fa9e4066Sahrens 
7840713e232SGeorge Wilson 	if (sm == NULL)
785fa9e4066Sahrens 		return;
786fa9e4066Sahrens 
7875cabbc6bSPrashanth Sreenivasa 	(void) printf("space map object %llu:\n",
7885cabbc6bSPrashanth Sreenivasa 	    (longlong_t)sm->sm_phys->smp_object);
7895cabbc6bSPrashanth Sreenivasa 	(void) printf("  smp_objsize = 0x%llx\n",
7905cabbc6bSPrashanth Sreenivasa 	    (longlong_t)sm->sm_phys->smp_objsize);
7915cabbc6bSPrashanth Sreenivasa 	(void) printf("  smp_alloc = 0x%llx\n",
7925cabbc6bSPrashanth Sreenivasa 	    (longlong_t)sm->sm_phys->smp_alloc);
7935cabbc6bSPrashanth Sreenivasa 
794fa9e4066Sahrens 	/*
795fa9e4066Sahrens 	 * Print out the freelist entries in both encoded and decoded form.
796fa9e4066Sahrens 	 */
79717f11284SSerapheim Dimitropoulos 	uint8_t mapshift = sm->sm_shift;
79817f11284SSerapheim Dimitropoulos 	int64_t alloc = 0;
79917f11284SSerapheim Dimitropoulos 	uint64_t word;
80017f11284SSerapheim Dimitropoulos 	for (uint64_t offset = 0; offset < space_map_length(sm);
80117f11284SSerapheim Dimitropoulos 	    offset += sizeof (word)) {
8020713e232SGeorge Wilson 
8030713e232SGeorge Wilson 		VERIFY0(dmu_read(os, space_map_object(sm), offset,
80417f11284SSerapheim Dimitropoulos 		    sizeof (word), &word, DMU_READ_PREFETCH));
8050713e232SGeorge Wilson 
80617f11284SSerapheim Dimitropoulos 		if (sm_entry_is_debug(word)) {
80787219db7SVictor Latushkin 			(void) printf("\t    [%6llu] %s: txg %llu, pass %llu\n",
80817f11284SSerapheim Dimitropoulos 			    (u_longlong_t)(offset / sizeof (word)),
80917f11284SSerapheim Dimitropoulos 			    ddata[SM_DEBUG_ACTION_DECODE(word)],
81017f11284SSerapheim Dimitropoulos 			    (u_longlong_t)SM_DEBUG_TXG_DECODE(word),
81117f11284SSerapheim Dimitropoulos 			    (u_longlong_t)SM_DEBUG_SYNCPASS_DECODE(word));
81217f11284SSerapheim Dimitropoulos 			continue;
81317f11284SSerapheim Dimitropoulos 		}
81417f11284SSerapheim Dimitropoulos 
81517f11284SSerapheim Dimitropoulos 		uint8_t words;
81617f11284SSerapheim Dimitropoulos 		char entry_type;
81717f11284SSerapheim Dimitropoulos 		uint64_t entry_off, entry_run, entry_vdev = SM_NO_VDEVID;
81817f11284SSerapheim Dimitropoulos 
81917f11284SSerapheim Dimitropoulos 		if (sm_entry_is_single_word(word)) {
82017f11284SSerapheim Dimitropoulos 			entry_type = (SM_TYPE_DECODE(word) == SM_ALLOC) ?
82117f11284SSerapheim Dimitropoulos 			    'A' : 'F';
82217f11284SSerapheim Dimitropoulos 			entry_off = (SM_OFFSET_DECODE(word) << mapshift) +
82317f11284SSerapheim Dimitropoulos 			    sm->sm_start;
82417f11284SSerapheim Dimitropoulos 			entry_run = SM_RUN_DECODE(word) << mapshift;
82517f11284SSerapheim Dimitropoulos 			words = 1;
826fa9e4066Sahrens 		} else {
82717f11284SSerapheim Dimitropoulos 			/* it is a two-word entry so we read another word */
82817f11284SSerapheim Dimitropoulos 			ASSERT(sm_entry_is_double_word(word));
82917f11284SSerapheim Dimitropoulos 
83017f11284SSerapheim Dimitropoulos 			uint64_t extra_word;
83117f11284SSerapheim Dimitropoulos 			offset += sizeof (extra_word);
83217f11284SSerapheim Dimitropoulos 			VERIFY0(dmu_read(os, space_map_object(sm), offset,
83317f11284SSerapheim Dimitropoulos 			    sizeof (extra_word), &extra_word,
83417f11284SSerapheim Dimitropoulos 			    DMU_READ_PREFETCH));
83517f11284SSerapheim Dimitropoulos 
83617f11284SSerapheim Dimitropoulos 			ASSERT3U(offset, <=, space_map_length(sm));
83717f11284SSerapheim Dimitropoulos 
83817f11284SSerapheim Dimitropoulos 			entry_run = SM2_RUN_DECODE(word) << mapshift;
83917f11284SSerapheim Dimitropoulos 			entry_vdev = SM2_VDEV_DECODE(word);
84017f11284SSerapheim Dimitropoulos 			entry_type = (SM2_TYPE_DECODE(extra_word) == SM_ALLOC) ?
84117f11284SSerapheim Dimitropoulos 			    'A' : 'F';
84217f11284SSerapheim Dimitropoulos 			entry_off = (SM2_OFFSET_DECODE(extra_word) <<
84317f11284SSerapheim Dimitropoulos 			    mapshift) + sm->sm_start;
84417f11284SSerapheim Dimitropoulos 			words = 2;
845fa9e4066Sahrens 		}
84617f11284SSerapheim Dimitropoulos 
84717f11284SSerapheim Dimitropoulos 		(void) printf("\t    [%6llu]    %c  range:"
84817f11284SSerapheim Dimitropoulos 		    " %010llx-%010llx  size: %06llx vdev: %06llu words: %u\n",
84917f11284SSerapheim Dimitropoulos 		    (u_longlong_t)(offset / sizeof (word)),
85017f11284SSerapheim Dimitropoulos 		    entry_type, (u_longlong_t)entry_off,
85117f11284SSerapheim Dimitropoulos 		    (u_longlong_t)(entry_off + entry_run),
85217f11284SSerapheim Dimitropoulos 		    (u_longlong_t)entry_run,
85317f11284SSerapheim Dimitropoulos 		    (u_longlong_t)entry_vdev, words);
85417f11284SSerapheim Dimitropoulos 
85517f11284SSerapheim Dimitropoulos 		if (entry_type == 'A')
85617f11284SSerapheim Dimitropoulos 			alloc += entry_run;
85717f11284SSerapheim Dimitropoulos 		else
85817f11284SSerapheim Dimitropoulos 			alloc -= entry_run;
859fa9e4066Sahrens 	}
86017f11284SSerapheim Dimitropoulos 	if ((uint64_t)alloc != space_map_allocated(sm)) {
86117f11284SSerapheim Dimitropoulos 		(void) printf("space_map_object alloc (%lld) INCONSISTENT "
86217f11284SSerapheim Dimitropoulos 		    "with space map summary (%lld)\n",
86317f11284SSerapheim Dimitropoulos 		    (longlong_t)space_map_allocated(sm), (longlong_t)alloc);
864fa9e4066Sahrens 	}
865fa9e4066Sahrens }
866fa9e4066Sahrens 
867d6e555bdSGeorge Wilson static void
868d6e555bdSGeorge Wilson dump_metaslab_stats(metaslab_t *msp)
869d6e555bdSGeorge Wilson {
8703f9d6ad7SLin Ling 	char maxbuf[32];
87186714001SSerapheim Dimitropoulos 	range_tree_t *rt = msp->ms_allocatable;
87286714001SSerapheim Dimitropoulos 	avl_tree_t *t = &msp->ms_allocatable_by_size;
8730713e232SGeorge Wilson 	int free_pct = range_tree_space(rt) * 100 / msp->ms_size;
874d6e555bdSGeorge Wilson 
8750a055120SJason King 	/* max sure nicenum has enough space */
8760a055120SJason King 	CTASSERT(sizeof (maxbuf) >= NN_NUMBUF_SZ);
8770a055120SJason King 
8780a055120SJason King 	zdb_nicenum(metaslab_block_maxsize(msp), maxbuf, sizeof (maxbuf));
879d6e555bdSGeorge Wilson 
88087219db7SVictor Latushkin 	(void) printf("\t %25s %10lu   %7s  %6s   %4s %4d%%\n",
881d6e555bdSGeorge Wilson 	    "segments", avl_numnodes(t), "maxsize", maxbuf,
882d6e555bdSGeorge Wilson 	    "freepct", free_pct);
8830713e232SGeorge Wilson 	(void) printf("\tIn-memory histogram:\n");
8840713e232SGeorge Wilson 	dump_histogram(rt->rt_histogram, RANGE_TREE_HISTOGRAM_SIZE, 0);
885d6e555bdSGeorge Wilson }
886d6e555bdSGeorge Wilson 
887fa9e4066Sahrens static void
888fa9e4066Sahrens dump_metaslab(metaslab_t *msp)
889fa9e4066Sahrens {
890fa9e4066Sahrens 	vdev_t *vd = msp->ms_group->mg_vd;
891fa9e4066Sahrens 	spa_t *spa = vd->vdev_spa;
8920713e232SGeorge Wilson 	space_map_t *sm = msp->ms_sm;
8933f9d6ad7SLin Ling 	char freebuf[32];
894fa9e4066Sahrens 
8950a055120SJason King 	zdb_nicenum(msp->ms_size - space_map_allocated(sm), freebuf,
8960a055120SJason King 	    sizeof (freebuf));
897fa9e4066Sahrens 
898fa9e4066Sahrens 	(void) printf(
89987219db7SVictor Latushkin 	    "\tmetaslab %6llu   offset %12llx   spacemap %6llu   free    %5s\n",
9000713e232SGeorge Wilson 	    (u_longlong_t)msp->ms_id, (u_longlong_t)msp->ms_start,
9010713e232SGeorge Wilson 	    (u_longlong_t)space_map_object(sm), freebuf);
902fa9e4066Sahrens 
9030713e232SGeorge Wilson 	if (dump_opt['m'] > 2 && !dump_opt['L']) {
904d6e555bdSGeorge Wilson 		mutex_enter(&msp->ms_lock);
905a0b03b16SSerapheim Dimitropoulos 		VERIFY0(metaslab_load(msp));
906a0b03b16SSerapheim Dimitropoulos 		range_tree_stat_verify(msp->ms_allocatable);
907bc3975b5SVictor Latushkin 		dump_metaslab_stats(msp);
9080713e232SGeorge Wilson 		metaslab_unload(msp);
909d6e555bdSGeorge Wilson 		mutex_exit(&msp->ms_lock);
910d6e555bdSGeorge Wilson 	}
911d6e555bdSGeorge Wilson 
9120713e232SGeorge Wilson 	if (dump_opt['m'] > 1 && sm != NULL &&
9132acef22dSMatthew Ahrens 	    spa_feature_is_active(spa, SPA_FEATURE_SPACEMAP_HISTOGRAM)) {
9140713e232SGeorge Wilson 		/*
9150713e232SGeorge Wilson 		 * The space map histogram represents free space in chunks
9160713e232SGeorge Wilson 		 * of sm_shift (i.e. bucket 0 refers to 2^sm_shift).
9170713e232SGeorge Wilson 		 */
9182e4c9986SGeorge Wilson 		(void) printf("\tOn-disk histogram:\t\tfragmentation %llu\n",
9192e4c9986SGeorge Wilson 		    (u_longlong_t)msp->ms_fragmentation);
9200713e232SGeorge Wilson 		dump_histogram(sm->sm_phys->smp_histogram,
9212e4c9986SGeorge Wilson 		    SPACE_MAP_HISTOGRAM_SIZE, sm->sm_shift);
9220713e232SGeorge Wilson 	}
9230713e232SGeorge Wilson 
9240713e232SGeorge Wilson 	if (dump_opt['d'] > 5 || dump_opt['m'] > 3) {
9250713e232SGeorge Wilson 		ASSERT(msp->ms_size == (1ULL << vd->vdev_ms_shift));
926d6e555bdSGeorge Wilson 
9270713e232SGeorge Wilson 		dump_spacemap(spa->spa_meta_objset, msp->ms_sm);
928d6e555bdSGeorge Wilson 	}
92987219db7SVictor Latushkin }
930fa9e4066Sahrens 
93187219db7SVictor Latushkin static void
93287219db7SVictor Latushkin print_vdev_metaslab_header(vdev_t *vd)
93387219db7SVictor Latushkin {
934*663207adSDon Brady 	vdev_alloc_bias_t alloc_bias = vd->vdev_alloc_bias;
935*663207adSDon Brady 	const char *bias_str;
936*663207adSDon Brady 
937*663207adSDon Brady 	bias_str = (alloc_bias == VDEV_BIAS_LOG || vd->vdev_islog) ?
938*663207adSDon Brady 	    VDEV_ALLOC_BIAS_LOG :
939*663207adSDon Brady 	    (alloc_bias == VDEV_BIAS_SPECIAL) ? VDEV_ALLOC_BIAS_SPECIAL :
940*663207adSDon Brady 	    (alloc_bias == VDEV_BIAS_DEDUP) ? VDEV_ALLOC_BIAS_DEDUP :
941*663207adSDon Brady 	    vd->vdev_islog ? "log" : "";
942*663207adSDon Brady 
943*663207adSDon Brady 	(void) printf("\tvdev %10llu   %s\n"
944*663207adSDon Brady 	    "\t%-10s%5llu   %-19s   %-15s   %-12s\n",
945*663207adSDon Brady 	    (u_longlong_t)vd->vdev_id, bias_str,
94687219db7SVictor Latushkin 	    "metaslabs", (u_longlong_t)vd->vdev_ms_count,
94787219db7SVictor Latushkin 	    "offset", "spacemap", "free");
948*663207adSDon Brady 	(void) printf("\t%15s   %19s   %15s   %12s\n",
94987219db7SVictor Latushkin 	    "---------------", "-------------------",
950*663207adSDon Brady 	    "---------------", "------------");
951fa9e4066Sahrens }
952fa9e4066Sahrens 
9532e4c9986SGeorge Wilson static void
9542e4c9986SGeorge Wilson dump_metaslab_groups(spa_t *spa)
9552e4c9986SGeorge Wilson {
9562e4c9986SGeorge Wilson 	vdev_t *rvd = spa->spa_root_vdev;
9572e4c9986SGeorge Wilson 	metaslab_class_t *mc = spa_normal_class(spa);
9582e4c9986SGeorge Wilson 	uint64_t fragmentation;
9592e4c9986SGeorge Wilson 
9602e4c9986SGeorge Wilson 	metaslab_class_histogram_verify(mc);
9612e4c9986SGeorge Wilson 
9623f7978d0SAlan Somers 	for (unsigned c = 0; c < rvd->vdev_children; c++) {
9632e4c9986SGeorge Wilson 		vdev_t *tvd = rvd->vdev_child[c];
9642e4c9986SGeorge Wilson 		metaslab_group_t *mg = tvd->vdev_mg;
9652e4c9986SGeorge Wilson 
966*663207adSDon Brady 		if (mg == NULL || mg->mg_class != mc)
9672e4c9986SGeorge Wilson 			continue;
9682e4c9986SGeorge Wilson 
9692e4c9986SGeorge Wilson 		metaslab_group_histogram_verify(mg);
9702e4c9986SGeorge Wilson 		mg->mg_fragmentation = metaslab_group_fragmentation(mg);
9712e4c9986SGeorge Wilson 
9722e4c9986SGeorge Wilson 		(void) printf("\tvdev %10llu\t\tmetaslabs%5llu\t\t"
9732e4c9986SGeorge Wilson 		    "fragmentation",
9742e4c9986SGeorge Wilson 		    (u_longlong_t)tvd->vdev_id,
9752e4c9986SGeorge Wilson 		    (u_longlong_t)tvd->vdev_ms_count);
9762e4c9986SGeorge Wilson 		if (mg->mg_fragmentation == ZFS_FRAG_INVALID) {
9772e4c9986SGeorge Wilson 			(void) printf("%3s\n", "-");
9782e4c9986SGeorge Wilson 		} else {
9792e4c9986SGeorge Wilson 			(void) printf("%3llu%%\n",
9802e4c9986SGeorge Wilson 			    (u_longlong_t)mg->mg_fragmentation);
9812e4c9986SGeorge Wilson 		}
9822e4c9986SGeorge Wilson 		dump_histogram(mg->mg_histogram, RANGE_TREE_HISTOGRAM_SIZE, 0);
9832e4c9986SGeorge Wilson 	}
9842e4c9986SGeorge Wilson 
9852e4c9986SGeorge Wilson 	(void) printf("\tpool %s\tfragmentation", spa_name(spa));
9862e4c9986SGeorge Wilson 	fragmentation = metaslab_class_fragmentation(mc);
9872e4c9986SGeorge Wilson 	if (fragmentation == ZFS_FRAG_INVALID)
9882e4c9986SGeorge Wilson 		(void) printf("\t%3s\n", "-");
9892e4c9986SGeorge Wilson 	else
9902e4c9986SGeorge Wilson 		(void) printf("\t%3llu%%\n", (u_longlong_t)fragmentation);
9912e4c9986SGeorge Wilson 	dump_histogram(mc->mc_histogram, RANGE_TREE_HISTOGRAM_SIZE, 0);
9922e4c9986SGeorge Wilson }
9932e4c9986SGeorge Wilson 
9945cabbc6bSPrashanth Sreenivasa static void
9955cabbc6bSPrashanth Sreenivasa print_vdev_indirect(vdev_t *vd)
9965cabbc6bSPrashanth Sreenivasa {
9975cabbc6bSPrashanth Sreenivasa 	vdev_indirect_config_t *vic = &vd->vdev_indirect_config;
9985cabbc6bSPrashanth Sreenivasa 	vdev_indirect_mapping_t *vim = vd->vdev_indirect_mapping;
9995cabbc6bSPrashanth Sreenivasa 	vdev_indirect_births_t *vib = vd->vdev_indirect_births;
10005cabbc6bSPrashanth Sreenivasa 
10015cabbc6bSPrashanth Sreenivasa 	if (vim == NULL) {
10025cabbc6bSPrashanth Sreenivasa 		ASSERT3P(vib, ==, NULL);
10035cabbc6bSPrashanth Sreenivasa 		return;
10045cabbc6bSPrashanth Sreenivasa 	}
10055cabbc6bSPrashanth Sreenivasa 
10065cabbc6bSPrashanth Sreenivasa 	ASSERT3U(vdev_indirect_mapping_object(vim), ==,
10075cabbc6bSPrashanth Sreenivasa 	    vic->vic_mapping_object);
10085cabbc6bSPrashanth Sreenivasa 	ASSERT3U(vdev_indirect_births_object(vib), ==,
10095cabbc6bSPrashanth Sreenivasa 	    vic->vic_births_object);
10105cabbc6bSPrashanth Sreenivasa 
10115cabbc6bSPrashanth Sreenivasa 	(void) printf("indirect births obj %llu:\n",
10125cabbc6bSPrashanth Sreenivasa 	    (longlong_t)vic->vic_births_object);
10135cabbc6bSPrashanth Sreenivasa 	(void) printf("    vib_count = %llu\n",
10145cabbc6bSPrashanth Sreenivasa 	    (longlong_t)vdev_indirect_births_count(vib));
10155cabbc6bSPrashanth Sreenivasa 	for (uint64_t i = 0; i < vdev_indirect_births_count(vib); i++) {
10165cabbc6bSPrashanth Sreenivasa 		vdev_indirect_birth_entry_phys_t *cur_vibe =
10175cabbc6bSPrashanth Sreenivasa 		    &vib->vib_entries[i];
10185cabbc6bSPrashanth Sreenivasa 		(void) printf("\toffset %llx -> txg %llu\n",
10195cabbc6bSPrashanth Sreenivasa 		    (longlong_t)cur_vibe->vibe_offset,
10205cabbc6bSPrashanth Sreenivasa 		    (longlong_t)cur_vibe->vibe_phys_birth_txg);
10215cabbc6bSPrashanth Sreenivasa 	}
10225cabbc6bSPrashanth Sreenivasa 	(void) printf("\n");
10235cabbc6bSPrashanth Sreenivasa 
10245cabbc6bSPrashanth Sreenivasa 	(void) printf("indirect mapping obj %llu:\n",
10255cabbc6bSPrashanth Sreenivasa 	    (longlong_t)vic->vic_mapping_object);
10265cabbc6bSPrashanth Sreenivasa 	(void) printf("    vim_max_offset = 0x%llx\n",
10275cabbc6bSPrashanth Sreenivasa 	    (longlong_t)vdev_indirect_mapping_max_offset(vim));
10285cabbc6bSPrashanth Sreenivasa 	(void) printf("    vim_bytes_mapped = 0x%llx\n",
10295cabbc6bSPrashanth Sreenivasa 	    (longlong_t)vdev_indirect_mapping_bytes_mapped(vim));
10305cabbc6bSPrashanth Sreenivasa 	(void) printf("    vim_count = %llu\n",
10315cabbc6bSPrashanth Sreenivasa 	    (longlong_t)vdev_indirect_mapping_num_entries(vim));
10325cabbc6bSPrashanth Sreenivasa 
10335cabbc6bSPrashanth Sreenivasa 	if (dump_opt['d'] <= 5 && dump_opt['m'] <= 3)
10345cabbc6bSPrashanth Sreenivasa 		return;
10355cabbc6bSPrashanth Sreenivasa 
10365cabbc6bSPrashanth Sreenivasa 	uint32_t *counts = vdev_indirect_mapping_load_obsolete_counts(vim);
10375cabbc6bSPrashanth Sreenivasa 
10385cabbc6bSPrashanth Sreenivasa 	for (uint64_t i = 0; i < vdev_indirect_mapping_num_entries(vim); i++) {
10395cabbc6bSPrashanth Sreenivasa 		vdev_indirect_mapping_entry_phys_t *vimep =
10405cabbc6bSPrashanth Sreenivasa 		    &vim->vim_entries[i];
10415cabbc6bSPrashanth Sreenivasa 		(void) printf("\t<%llx:%llx:%llx> -> "
10425cabbc6bSPrashanth Sreenivasa 		    "<%llx:%llx:%llx> (%x obsolete)\n",
10435cabbc6bSPrashanth Sreenivasa 		    (longlong_t)vd->vdev_id,
10445cabbc6bSPrashanth Sreenivasa 		    (longlong_t)DVA_MAPPING_GET_SRC_OFFSET(vimep),
10455cabbc6bSPrashanth Sreenivasa 		    (longlong_t)DVA_GET_ASIZE(&vimep->vimep_dst),
10465cabbc6bSPrashanth Sreenivasa 		    (longlong_t)DVA_GET_VDEV(&vimep->vimep_dst),
10475cabbc6bSPrashanth Sreenivasa 		    (longlong_t)DVA_GET_OFFSET(&vimep->vimep_dst),
10485cabbc6bSPrashanth Sreenivasa 		    (longlong_t)DVA_GET_ASIZE(&vimep->vimep_dst),
10495cabbc6bSPrashanth Sreenivasa 		    counts[i]);
10505cabbc6bSPrashanth Sreenivasa 	}
10515cabbc6bSPrashanth Sreenivasa 	(void) printf("\n");
10525cabbc6bSPrashanth Sreenivasa 
10535cabbc6bSPrashanth Sreenivasa 	uint64_t obsolete_sm_object = vdev_obsolete_sm_object(vd);
10545cabbc6bSPrashanth Sreenivasa 	if (obsolete_sm_object != 0) {
10555cabbc6bSPrashanth Sreenivasa 		objset_t *mos = vd->vdev_spa->spa_meta_objset;
10565cabbc6bSPrashanth Sreenivasa 		(void) printf("obsolete space map object %llu:\n",
10575cabbc6bSPrashanth Sreenivasa 		    (u_longlong_t)obsolete_sm_object);
10585cabbc6bSPrashanth Sreenivasa 		ASSERT(vd->vdev_obsolete_sm != NULL);
10595cabbc6bSPrashanth Sreenivasa 		ASSERT3U(space_map_object(vd->vdev_obsolete_sm), ==,
10605cabbc6bSPrashanth Sreenivasa 		    obsolete_sm_object);
10615cabbc6bSPrashanth Sreenivasa 		dump_spacemap(mos, vd->vdev_obsolete_sm);
10625cabbc6bSPrashanth Sreenivasa 		(void) printf("\n");
10635cabbc6bSPrashanth Sreenivasa 	}
10645cabbc6bSPrashanth Sreenivasa }
10655cabbc6bSPrashanth Sreenivasa 
1066fa9e4066Sahrens static void
1067fa9e4066Sahrens dump_metaslabs(spa_t *spa)
1068fa9e4066Sahrens {
106987219db7SVictor Latushkin 	vdev_t *vd, *rvd = spa->spa_root_vdev;
107087219db7SVictor Latushkin 	uint64_t m, c = 0, children = rvd->vdev_children;
1071fa9e4066Sahrens 
1072fa9e4066Sahrens 	(void) printf("\nMetaslabs:\n");
1073fa9e4066Sahrens 
107487219db7SVictor Latushkin 	if (!dump_opt['d'] && zopt_objects > 0) {
107587219db7SVictor Latushkin 		c = zopt_object[0];
107687219db7SVictor Latushkin 
107787219db7SVictor Latushkin 		if (c >= children)
107887219db7SVictor Latushkin 			(void) fatal("bad vdev id: %llu", (u_longlong_t)c);
1079fa9e4066Sahrens 
108087219db7SVictor Latushkin 		if (zopt_objects > 1) {
108187219db7SVictor Latushkin 			vd = rvd->vdev_child[c];
108287219db7SVictor Latushkin 			print_vdev_metaslab_header(vd);
108387219db7SVictor Latushkin 
108487219db7SVictor Latushkin 			for (m = 1; m < zopt_objects; m++) {
108587219db7SVictor Latushkin 				if (zopt_object[m] < vd->vdev_ms_count)
108687219db7SVictor Latushkin 					dump_metaslab(
108787219db7SVictor Latushkin 					    vd->vdev_ms[zopt_object[m]]);
108887219db7SVictor Latushkin 				else
108987219db7SVictor Latushkin 					(void) fprintf(stderr, "bad metaslab "
109087219db7SVictor Latushkin 					    "number %llu\n",
109187219db7SVictor Latushkin 					    (u_longlong_t)zopt_object[m]);
109287219db7SVictor Latushkin 			}
109387219db7SVictor Latushkin 			(void) printf("\n");
109487219db7SVictor Latushkin 			return;
109587219db7SVictor Latushkin 		}
109687219db7SVictor Latushkin 		children = c + 1;
109787219db7SVictor Latushkin 	}
109887219db7SVictor Latushkin 	for (; c < children; c++) {
109987219db7SVictor Latushkin 		vd = rvd->vdev_child[c];
110087219db7SVictor Latushkin 		print_vdev_metaslab_header(vd);
1101fa9e4066Sahrens 
11025cabbc6bSPrashanth Sreenivasa 		print_vdev_indirect(vd);
11035cabbc6bSPrashanth Sreenivasa 
1104fa9e4066Sahrens 		for (m = 0; m < vd->vdev_ms_count; m++)
1105fa9e4066Sahrens 			dump_metaslab(vd->vdev_ms[m]);
1106fa9e4066Sahrens 		(void) printf("\n");
1107fa9e4066Sahrens 	}
1108fa9e4066Sahrens }
1109fa9e4066Sahrens 
1110b24ab676SJeff Bonwick static void
1111b24ab676SJeff Bonwick dump_dde(const ddt_t *ddt, const ddt_entry_t *dde, uint64_t index)
1112b24ab676SJeff Bonwick {
1113b24ab676SJeff Bonwick 	const ddt_phys_t *ddp = dde->dde_phys;
1114b24ab676SJeff Bonwick 	const ddt_key_t *ddk = &dde->dde_key;
11153f7978d0SAlan Somers 	const char *types[4] = { "ditto", "single", "double", "triple" };
1116b24ab676SJeff Bonwick 	char blkbuf[BP_SPRINTF_LEN];
1117b24ab676SJeff Bonwick 	blkptr_t blk;
1118b24ab676SJeff Bonwick 
1119b24ab676SJeff Bonwick 	for (int p = 0; p < DDT_PHYS_TYPES; p++, ddp++) {
1120b24ab676SJeff Bonwick 		if (ddp->ddp_phys_birth == 0)
1121b24ab676SJeff Bonwick 			continue;
1122bbfd46c4SJeff Bonwick 		ddt_bp_create(ddt->ddt_checksum, ddk, ddp, &blk);
112343466aaeSMax Grossman 		snprintf_blkptr(blkbuf, sizeof (blkbuf), &blk);
1124b24ab676SJeff Bonwick 		(void) printf("index %llx refcnt %llu %s %s\n",
1125b24ab676SJeff Bonwick 		    (u_longlong_t)index, (u_longlong_t)ddp->ddp_refcnt,
1126b24ab676SJeff Bonwick 		    types[p], blkbuf);
1127b24ab676SJeff Bonwick 	}
1128b24ab676SJeff Bonwick }
1129b24ab676SJeff Bonwick 
1130b24ab676SJeff Bonwick static void
1131b24ab676SJeff Bonwick dump_dedup_ratio(const ddt_stat_t *dds)
1132b24ab676SJeff Bonwick {
1133b24ab676SJeff Bonwick 	double rL, rP, rD, D, dedup, compress, copies;
1134b24ab676SJeff Bonwick 
1135b24ab676SJeff Bonwick 	if (dds->dds_blocks == 0)
1136b24ab676SJeff Bonwick 		return;
1137b24ab676SJeff Bonwick 
1138b24ab676SJeff Bonwick 	rL = (double)dds->dds_ref_lsize;
1139b24ab676SJeff Bonwick 	rP = (double)dds->dds_ref_psize;
1140b24ab676SJeff Bonwick 	rD = (double)dds->dds_ref_dsize;
1141b24ab676SJeff Bonwick 	D = (double)dds->dds_dsize;
1142b24ab676SJeff Bonwick 
1143b24ab676SJeff Bonwick 	dedup = rD / D;
1144b24ab676SJeff Bonwick 	compress = rL / rP;
1145b24ab676SJeff Bonwick 	copies = rD / rP;
1146b24ab676SJeff Bonwick 
1147b24ab676SJeff Bonwick 	(void) printf("dedup = %.2f, compress = %.2f, copies = %.2f, "
1148b24ab676SJeff Bonwick 	    "dedup * compress / copies = %.2f\n\n",
1149b24ab676SJeff Bonwick 	    dedup, compress, copies, dedup * compress / copies);
1150b24ab676SJeff Bonwick }
1151b24ab676SJeff Bonwick 
1152b24ab676SJeff Bonwick static void
1153b24ab676SJeff Bonwick dump_ddt(ddt_t *ddt, enum ddt_type type, enum ddt_class class)
1154b24ab676SJeff Bonwick {
1155b24ab676SJeff Bonwick 	char name[DDT_NAMELEN];
1156b24ab676SJeff Bonwick 	ddt_entry_t dde;
1157b24ab676SJeff Bonwick 	uint64_t walk = 0;
1158b24ab676SJeff Bonwick 	dmu_object_info_t doi;
1159b24ab676SJeff Bonwick 	uint64_t count, dspace, mspace;
1160b24ab676SJeff Bonwick 	int error;
1161b24ab676SJeff Bonwick 
1162b24ab676SJeff Bonwick 	error = ddt_object_info(ddt, type, class, &doi);
1163b24ab676SJeff Bonwick 
1164b24ab676SJeff Bonwick 	if (error == ENOENT)
1165b24ab676SJeff Bonwick 		return;
1166b24ab676SJeff Bonwick 	ASSERT(error == 0);
1167b24ab676SJeff Bonwick 
11687448a079SGeorge Wilson 	if ((count = ddt_object_count(ddt, type, class)) == 0)
11697448a079SGeorge Wilson 		return;
11707448a079SGeorge Wilson 
1171b24ab676SJeff Bonwick 	dspace = doi.doi_physical_blocks_512 << 9;
1172b24ab676SJeff Bonwick 	mspace = doi.doi_fill_count * doi.doi_data_block_size;
1173b24ab676SJeff Bonwick 
1174b24ab676SJeff Bonwick 	ddt_object_name(ddt, type, class, name);
1175b24ab676SJeff Bonwick 
1176b24ab676SJeff Bonwick 	(void) printf("%s: %llu entries, size %llu on disk, %llu in core\n",
1177b24ab676SJeff Bonwick 	    name,
1178b24ab676SJeff Bonwick 	    (u_longlong_t)count,
1179b24ab676SJeff Bonwick 	    (u_longlong_t)(dspace / count),
1180b24ab676SJeff Bonwick 	    (u_longlong_t)(mspace / count));
1181b24ab676SJeff Bonwick 
1182b24ab676SJeff Bonwick 	if (dump_opt['D'] < 3)
1183b24ab676SJeff Bonwick 		return;
1184b24ab676SJeff Bonwick 
11859eb19f4dSGeorge Wilson 	zpool_dump_ddt(NULL, &ddt->ddt_histogram[type][class]);
1186b24ab676SJeff Bonwick 
1187b24ab676SJeff Bonwick 	if (dump_opt['D'] < 4)
1188b24ab676SJeff Bonwick 		return;
1189b24ab676SJeff Bonwick 
1190b24ab676SJeff Bonwick 	if (dump_opt['D'] < 5 && class == DDT_CLASS_UNIQUE)
1191b24ab676SJeff Bonwick 		return;
1192b24ab676SJeff Bonwick 
1193b24ab676SJeff Bonwick 	(void) printf("%s contents:\n\n", name);
1194b24ab676SJeff Bonwick 
1195bbfd46c4SJeff Bonwick 	while ((error = ddt_object_walk(ddt, type, class, &walk, &dde)) == 0)
1196b24ab676SJeff Bonwick 		dump_dde(ddt, &dde, walk);
1197b24ab676SJeff Bonwick 
119817f11284SSerapheim Dimitropoulos 	ASSERT3U(error, ==, ENOENT);
1199b24ab676SJeff Bonwick 
1200b24ab676SJeff Bonwick 	(void) printf("\n");
1201b24ab676SJeff Bonwick }
1202b24ab676SJeff Bonwick 
1203b24ab676SJeff Bonwick static void
1204b24ab676SJeff Bonwick dump_all_ddts(spa_t *spa)
1205b24ab676SJeff Bonwick {
12063f7978d0SAlan Somers 	ddt_histogram_t ddh_total;
12073f7978d0SAlan Somers 	ddt_stat_t dds_total;
12083f7978d0SAlan Somers 
12093f7978d0SAlan Somers 	bzero(&ddh_total, sizeof (ddh_total));
12103f7978d0SAlan Somers 	bzero(&dds_total, sizeof (dds_total));
1211b24ab676SJeff Bonwick 
1212b24ab676SJeff Bonwick 	for (enum zio_checksum c = 0; c < ZIO_CHECKSUM_FUNCTIONS; c++) {
1213b24ab676SJeff Bonwick 		ddt_t *ddt = spa->spa_ddt[c];
1214b24ab676SJeff Bonwick 		for (enum ddt_type type = 0; type < DDT_TYPES; type++) {
1215b24ab676SJeff Bonwick 			for (enum ddt_class class = 0; class < DDT_CLASSES;
1216b24ab676SJeff Bonwick 			    class++) {
1217b24ab676SJeff Bonwick 				dump_ddt(ddt, type, class);
1218b24ab676SJeff Bonwick 			}
1219b24ab676SJeff Bonwick 		}
1220b24ab676SJeff Bonwick 	}
1221b24ab676SJeff Bonwick 
12229eb19f4dSGeorge Wilson 	ddt_get_dedup_stats(spa, &dds_total);
1223b24ab676SJeff Bonwick 
1224b24ab676SJeff Bonwick 	if (dds_total.dds_blocks == 0) {
1225b24ab676SJeff Bonwick 		(void) printf("All DDTs are empty\n");
1226b24ab676SJeff Bonwick 		return;
1227b24ab676SJeff Bonwick 	}
1228b24ab676SJeff Bonwick 
1229b24ab676SJeff Bonwick 	(void) printf("\n");
1230b24ab676SJeff Bonwick 
1231b24ab676SJeff Bonwick 	if (dump_opt['D'] > 1) {
1232b24ab676SJeff Bonwick 		(void) printf("DDT histogram (aggregated over all DDTs):\n");
12339eb19f4dSGeorge Wilson 		ddt_get_dedup_histogram(spa, &ddh_total);
12349eb19f4dSGeorge Wilson 		zpool_dump_ddt(&dds_total, &ddh_total);
1235b24ab676SJeff Bonwick 	}
1236b24ab676SJeff Bonwick 
1237b24ab676SJeff Bonwick 	dump_dedup_ratio(&dds_total);
1238b24ab676SJeff Bonwick }
1239b24ab676SJeff Bonwick 
12408ad4d6ddSJeff Bonwick static void
12410713e232SGeorge Wilson dump_dtl_seg(void *arg, uint64_t start, uint64_t size)
12428ad4d6ddSJeff Bonwick {
12430713e232SGeorge Wilson 	char *prefix = arg;
12448ad4d6ddSJeff Bonwick 
12458ad4d6ddSJeff Bonwick 	(void) printf("%s [%llu,%llu) length %llu\n",
12468ad4d6ddSJeff Bonwick 	    prefix,
12478ad4d6ddSJeff Bonwick 	    (u_longlong_t)start,
12488ad4d6ddSJeff Bonwick 	    (u_longlong_t)(start + size),
12498ad4d6ddSJeff Bonwick 	    (u_longlong_t)(size));
12508ad4d6ddSJeff Bonwick }
12518ad4d6ddSJeff Bonwick 
1252fa9e4066Sahrens static void
1253fa9e4066Sahrens dump_dtl(vdev_t *vd, int indent)
1254fa9e4066Sahrens {
12558ad4d6ddSJeff Bonwick 	spa_t *spa = vd->vdev_spa;
12568ad4d6ddSJeff Bonwick 	boolean_t required;
12573f7978d0SAlan Somers 	const char *name[DTL_TYPES] = { "missing", "partial", "scrub",
12583f7978d0SAlan Somers 		"outage" };
12598ad4d6ddSJeff Bonwick 	char prefix[256];
12608ad4d6ddSJeff Bonwick 
12618f18d1faSGeorge Wilson 	spa_vdev_state_enter(spa, SCL_NONE);
12628ad4d6ddSJeff Bonwick 	required = vdev_dtl_required(vd);
12638ad4d6ddSJeff Bonwick 	(void) spa_vdev_state_exit(spa, NULL, 0);
1264fa9e4066Sahrens 
1265fa9e4066Sahrens 	if (indent == 0)
1266fa9e4066Sahrens 		(void) printf("\nDirty time logs:\n\n");
1267fa9e4066Sahrens 
12688ad4d6ddSJeff Bonwick 	(void) printf("\t%*s%s [%s]\n", indent, "",
1269e14bb325SJeff Bonwick 	    vd->vdev_path ? vd->vdev_path :
12708ad4d6ddSJeff Bonwick 	    vd->vdev_parent ? vd->vdev_ops->vdev_op_type : spa_name(spa),
12718ad4d6ddSJeff Bonwick 	    required ? "DTL-required" : "DTL-expendable");
1272fa9e4066Sahrens 
12738ad4d6ddSJeff Bonwick 	for (int t = 0; t < DTL_TYPES; t++) {
12740713e232SGeorge Wilson 		range_tree_t *rt = vd->vdev_dtl[t];
12750713e232SGeorge Wilson 		if (range_tree_space(rt) == 0)
12768ad4d6ddSJeff Bonwick 			continue;
12778ad4d6ddSJeff Bonwick 		(void) snprintf(prefix, sizeof (prefix), "\t%*s%s",
12788ad4d6ddSJeff Bonwick 		    indent + 2, "", name[t]);
12790713e232SGeorge Wilson 		range_tree_walk(rt, dump_dtl_seg, prefix);
12808ad4d6ddSJeff Bonwick 		if (dump_opt['d'] > 5 && vd->vdev_children == 0)
12810713e232SGeorge Wilson 			dump_spacemap(spa->spa_meta_objset, vd->vdev_dtl_sm);
1282fa9e4066Sahrens 	}
1283fa9e4066Sahrens 
12843f7978d0SAlan Somers 	for (unsigned c = 0; c < vd->vdev_children; c++)
1285fa9e4066Sahrens 		dump_dtl(vd->vdev_child[c], indent + 4);
1286fa9e4066Sahrens }
1287fa9e4066Sahrens 
12888f18d1faSGeorge Wilson static void
12898f18d1faSGeorge Wilson dump_history(spa_t *spa)
12908f18d1faSGeorge Wilson {
12918f18d1faSGeorge Wilson 	nvlist_t **events = NULL;
1292e4161df6SVictor Latushkin 	uint64_t resid, len, off = 0;
12938f18d1faSGeorge Wilson 	uint_t num = 0;
12948f18d1faSGeorge Wilson 	int error;
12958f18d1faSGeorge Wilson 	time_t tsec;
12968f18d1faSGeorge Wilson 	struct tm t;
12978f18d1faSGeorge Wilson 	char tbuf[30];
12988f18d1faSGeorge Wilson 	char internalstr[MAXPATHLEN];
12998f18d1faSGeorge Wilson 
13003f84190cSMatthew Ahrens 	char *buf = umem_alloc(SPA_MAXBLOCKSIZE, UMEM_NOFAIL);
13018f18d1faSGeorge Wilson 	do {
13023f84190cSMatthew Ahrens 		len = SPA_MAXBLOCKSIZE;
1303e4161df6SVictor Latushkin 
13048f18d1faSGeorge Wilson 		if ((error = spa_history_get(spa, &off, &len, buf)) != 0) {
13058f18d1faSGeorge Wilson 			(void) fprintf(stderr, "Unable to read history: "
13068f18d1faSGeorge Wilson 			    "error %d\n", error);
13073f84190cSMatthew Ahrens 			umem_free(buf, SPA_MAXBLOCKSIZE);
13088f18d1faSGeorge Wilson 			return;
13098f18d1faSGeorge Wilson 		}
13108f18d1faSGeorge Wilson 
13118f18d1faSGeorge Wilson 		if (zpool_history_unpack(buf, len, &resid, &events, &num) != 0)
13128f18d1faSGeorge Wilson 			break;
13138f18d1faSGeorge Wilson 
13148f18d1faSGeorge Wilson 		off -= resid;
13158f18d1faSGeorge Wilson 	} while (len != 0);
13163f84190cSMatthew Ahrens 	umem_free(buf, SPA_MAXBLOCKSIZE);
13178f18d1faSGeorge Wilson 
13188f18d1faSGeorge Wilson 	(void) printf("\nHistory:\n");
13193f7978d0SAlan Somers 	for (unsigned i = 0; i < num; i++) {
13208f18d1faSGeorge Wilson 		uint64_t time, txg, ievent;
13218f18d1faSGeorge Wilson 		char *cmd, *intstr;
13224445fffbSMatthew Ahrens 		boolean_t printed = B_FALSE;
13238f18d1faSGeorge Wilson 
13248f18d1faSGeorge Wilson 		if (nvlist_lookup_uint64(events[i], ZPOOL_HIST_TIME,
13258f18d1faSGeorge Wilson 		    &time) != 0)
13264445fffbSMatthew Ahrens 			goto next;
13278f18d1faSGeorge Wilson 		if (nvlist_lookup_string(events[i], ZPOOL_HIST_CMD,
13288f18d1faSGeorge Wilson 		    &cmd) != 0) {
13298f18d1faSGeorge Wilson 			if (nvlist_lookup_uint64(events[i],
13308f18d1faSGeorge Wilson 			    ZPOOL_HIST_INT_EVENT, &ievent) != 0)
13314445fffbSMatthew Ahrens 				goto next;
13328f18d1faSGeorge Wilson 			verify(nvlist_lookup_uint64(events[i],
13338f18d1faSGeorge Wilson 			    ZPOOL_HIST_TXG, &txg) == 0);
13348f18d1faSGeorge Wilson 			verify(nvlist_lookup_string(events[i],
13358f18d1faSGeorge Wilson 			    ZPOOL_HIST_INT_STR, &intstr) == 0);
13364445fffbSMatthew Ahrens 			if (ievent >= ZFS_NUM_LEGACY_HISTORY_EVENTS)
13374445fffbSMatthew Ahrens 				goto next;
13388f18d1faSGeorge Wilson 
13398f18d1faSGeorge Wilson 			(void) snprintf(internalstr,
13408f18d1faSGeorge Wilson 			    sizeof (internalstr),
13413f7978d0SAlan Somers 			    "[internal %s txg:%ju] %s",
13423f7978d0SAlan Somers 			    zfs_history_event_names[ievent], (uintmax_t)txg,
13438f18d1faSGeorge Wilson 			    intstr);
13448f18d1faSGeorge Wilson 			cmd = internalstr;
13458f18d1faSGeorge Wilson 		}
13468f18d1faSGeorge Wilson 		tsec = time;
13478f18d1faSGeorge Wilson 		(void) localtime_r(&tsec, &t);
13488f18d1faSGeorge Wilson 		(void) strftime(tbuf, sizeof (tbuf), "%F.%T", &t);
13498f18d1faSGeorge Wilson 		(void) printf("%s %s\n", tbuf, cmd);
13504445fffbSMatthew Ahrens 		printed = B_TRUE;
13514445fffbSMatthew Ahrens 
13524445fffbSMatthew Ahrens next:
13534445fffbSMatthew Ahrens 		if (dump_opt['h'] > 1) {
13544445fffbSMatthew Ahrens 			if (!printed)
13554445fffbSMatthew Ahrens 				(void) printf("unrecognized record:\n");
13564445fffbSMatthew Ahrens 			dump_nvlist(events[i], 2);
13574445fffbSMatthew Ahrens 		}
13588f18d1faSGeorge Wilson 	}
13598f18d1faSGeorge Wilson }
13608f18d1faSGeorge Wilson 
1361fa9e4066Sahrens /*ARGSUSED*/
1362fa9e4066Sahrens static void
1363fa9e4066Sahrens dump_dnode(objset_t *os, uint64_t object, void *data, size_t size)
1364fa9e4066Sahrens {
1365fa9e4066Sahrens }
1366fa9e4066Sahrens 
1367fa9e4066Sahrens static uint64_t
13687802d7bfSMatthew Ahrens blkid2offset(const dnode_phys_t *dnp, const blkptr_t *bp,
13697802d7bfSMatthew Ahrens     const zbookmark_phys_t *zb)
1370fa9e4066Sahrens {
1371b24ab676SJeff Bonwick 	if (dnp == NULL) {
1372b24ab676SJeff Bonwick 		ASSERT(zb->zb_level < 0);
1373b24ab676SJeff Bonwick 		if (zb->zb_object == 0)
1374b24ab676SJeff Bonwick 			return (zb->zb_blkid);
1375b24ab676SJeff Bonwick 		return (zb->zb_blkid * BP_GET_LSIZE(bp));
1376b24ab676SJeff Bonwick 	}
1377b24ab676SJeff Bonwick 
1378b24ab676SJeff Bonwick 	ASSERT(zb->zb_level >= 0);
1379fa9e4066Sahrens 
1380b24ab676SJeff Bonwick 	return ((zb->zb_blkid <<
1381b24ab676SJeff Bonwick 	    (zb->zb_level * (dnp->dn_indblkshift - SPA_BLKPTRSHIFT))) *
1382fa9e4066Sahrens 	    dnp->dn_datablkszsec << SPA_MINBLOCKSHIFT);
1383fa9e4066Sahrens }
1384fa9e4066Sahrens 
138544cd46caSbillm static void
138643466aaeSMax Grossman snprintf_blkptr_compact(char *blkbuf, size_t buflen, const blkptr_t *bp)
138744cd46caSbillm {
1388cde58dbcSMatthew Ahrens 	const dva_t *dva = bp->blk_dva;
1389b24ab676SJeff Bonwick 	int ndvas = dump_opt['d'] > 5 ? BP_GET_NDVAS(bp) : 1;
1390b24ab676SJeff Bonwick 
1391490d05b9SMatthew Ahrens 	if (dump_opt['b'] >= 6) {
139243466aaeSMax Grossman 		snprintf_blkptr(blkbuf, buflen, bp);
1393b24ab676SJeff Bonwick 		return;
1394b24ab676SJeff Bonwick 	}
139544cd46caSbillm 
13965d7b4d43SMatthew Ahrens 	if (BP_IS_EMBEDDED(bp)) {
13975d7b4d43SMatthew Ahrens 		(void) sprintf(blkbuf,
13985d7b4d43SMatthew Ahrens 		    "EMBEDDED et=%u %llxL/%llxP B=%llu",
13995d7b4d43SMatthew Ahrens 		    (int)BPE_GET_ETYPE(bp),
14005d7b4d43SMatthew Ahrens 		    (u_longlong_t)BPE_GET_LSIZE(bp),
14015d7b4d43SMatthew Ahrens 		    (u_longlong_t)BPE_GET_PSIZE(bp),
14025d7b4d43SMatthew Ahrens 		    (u_longlong_t)bp->blk_birth);
14035d7b4d43SMatthew Ahrens 		return;
14045d7b4d43SMatthew Ahrens 	}
140544cd46caSbillm 
14065d7b4d43SMatthew Ahrens 	blkbuf[0] = '\0';
1407b24ab676SJeff Bonwick 	for (int i = 0; i < ndvas; i++)
140843466aaeSMax Grossman 		(void) snprintf(blkbuf + strlen(blkbuf),
140943466aaeSMax Grossman 		    buflen - strlen(blkbuf), "%llu:%llx:%llx ",
141044cd46caSbillm 		    (u_longlong_t)DVA_GET_VDEV(&dva[i]),
141144cd46caSbillm 		    (u_longlong_t)DVA_GET_OFFSET(&dva[i]),
141244cd46caSbillm 		    (u_longlong_t)DVA_GET_ASIZE(&dva[i]));
141344cd46caSbillm 
141443466aaeSMax Grossman 	if (BP_IS_HOLE(bp)) {
141543466aaeSMax Grossman 		(void) snprintf(blkbuf + strlen(blkbuf),
141670163ac5SPrakash Surya 		    buflen - strlen(blkbuf),
141770163ac5SPrakash Surya 		    "%llxL B=%llu",
141870163ac5SPrakash Surya 		    (u_longlong_t)BP_GET_LSIZE(bp),
141943466aaeSMax Grossman 		    (u_longlong_t)bp->blk_birth);
142043466aaeSMax Grossman 	} else {
142143466aaeSMax Grossman 		(void) snprintf(blkbuf + strlen(blkbuf),
142243466aaeSMax Grossman 		    buflen - strlen(blkbuf),
142343466aaeSMax Grossman 		    "%llxL/%llxP F=%llu B=%llu/%llu",
142443466aaeSMax Grossman 		    (u_longlong_t)BP_GET_LSIZE(bp),
142543466aaeSMax Grossman 		    (u_longlong_t)BP_GET_PSIZE(bp),
14265d7b4d43SMatthew Ahrens 		    (u_longlong_t)BP_GET_FILL(bp),
142743466aaeSMax Grossman 		    (u_longlong_t)bp->blk_birth,
142843466aaeSMax Grossman 		    (u_longlong_t)BP_PHYSICAL_BIRTH(bp));
142943466aaeSMax Grossman 	}
143044cd46caSbillm }
143144cd46caSbillm 
143288b7b0f2SMatthew Ahrens static void
14337802d7bfSMatthew Ahrens print_indirect(blkptr_t *bp, const zbookmark_phys_t *zb,
143488b7b0f2SMatthew Ahrens     const dnode_phys_t *dnp)
1435fa9e4066Sahrens {
143688b7b0f2SMatthew Ahrens 	char blkbuf[BP_SPRINTF_LEN];
1437fa9e4066Sahrens 	int l;
1438fa9e4066Sahrens 
14395d7b4d43SMatthew Ahrens 	if (!BP_IS_EMBEDDED(bp)) {
14405d7b4d43SMatthew Ahrens 		ASSERT3U(BP_GET_TYPE(bp), ==, dnp->dn_type);
14415d7b4d43SMatthew Ahrens 		ASSERT3U(BP_GET_LEVEL(bp), ==, zb->zb_level);
14425d7b4d43SMatthew Ahrens 	}
1443fa9e4066Sahrens 
1444b24ab676SJeff Bonwick 	(void) printf("%16llx ", (u_longlong_t)blkid2offset(dnp, bp, zb));
1445fa9e4066Sahrens 
1446fa9e4066Sahrens 	ASSERT(zb->zb_level >= 0);
1447fa9e4066Sahrens 
1448fa9e4066Sahrens 	for (l = dnp->dn_nlevels - 1; l >= -1; l--) {
1449fa9e4066Sahrens 		if (l == zb->zb_level) {
145088b7b0f2SMatthew Ahrens 			(void) printf("L%llx", (u_longlong_t)zb->zb_level);
1451fa9e4066Sahrens 		} else {
145288b7b0f2SMatthew Ahrens 			(void) printf(" ");
1453fa9e4066Sahrens 		}
1454fa9e4066Sahrens 	}
1455fa9e4066Sahrens 
145643466aaeSMax Grossman 	snprintf_blkptr_compact(blkbuf, sizeof (blkbuf), bp);
145788b7b0f2SMatthew Ahrens 	(void) printf("%s\n", blkbuf);
145888b7b0f2SMatthew Ahrens }
145988b7b0f2SMatthew Ahrens 
146088b7b0f2SMatthew Ahrens static int
146188b7b0f2SMatthew Ahrens visit_indirect(spa_t *spa, const dnode_phys_t *dnp,
14627802d7bfSMatthew Ahrens     blkptr_t *bp, const zbookmark_phys_t *zb)
146388b7b0f2SMatthew Ahrens {
1464e4161df6SVictor Latushkin 	int err = 0;
146588b7b0f2SMatthew Ahrens 
146688b7b0f2SMatthew Ahrens 	if (bp->blk_birth == 0)
146788b7b0f2SMatthew Ahrens 		return (0);
146888b7b0f2SMatthew Ahrens 
146988b7b0f2SMatthew Ahrens 	print_indirect(bp, zb, dnp);
147088b7b0f2SMatthew Ahrens 
147143466aaeSMax Grossman 	if (BP_GET_LEVEL(bp) > 0 && !BP_IS_HOLE(bp)) {
14727adb730bSGeorge Wilson 		arc_flags_t flags = ARC_FLAG_WAIT;
147388b7b0f2SMatthew Ahrens 		int i;
147488b7b0f2SMatthew Ahrens 		blkptr_t *cbp;
147588b7b0f2SMatthew Ahrens 		int epb = BP_GET_LSIZE(bp) >> SPA_BLKPTRSHIFT;
147688b7b0f2SMatthew Ahrens 		arc_buf_t *buf;
147788b7b0f2SMatthew Ahrens 		uint64_t fill = 0;
147888b7b0f2SMatthew Ahrens 
14791b912ec7SGeorge Wilson 		err = arc_read(NULL, spa, bp, arc_getbuf_func, &buf,
148088b7b0f2SMatthew Ahrens 		    ZIO_PRIORITY_ASYNC_READ, ZIO_FLAG_CANFAIL, &flags, zb);
148188b7b0f2SMatthew Ahrens 		if (err)
148288b7b0f2SMatthew Ahrens 			return (err);
14833f9d6ad7SLin Ling 		ASSERT(buf->b_data);
148488b7b0f2SMatthew Ahrens 
148588b7b0f2SMatthew Ahrens 		/* recursively visit blocks below this */
148688b7b0f2SMatthew Ahrens 		cbp = buf->b_data;
148788b7b0f2SMatthew Ahrens 		for (i = 0; i < epb; i++, cbp++) {
14887802d7bfSMatthew Ahrens 			zbookmark_phys_t czb;
148988b7b0f2SMatthew Ahrens 
149088b7b0f2SMatthew Ahrens 			SET_BOOKMARK(&czb, zb->zb_objset, zb->zb_object,
149188b7b0f2SMatthew Ahrens 			    zb->zb_level - 1,
149288b7b0f2SMatthew Ahrens 			    zb->zb_blkid * epb + i);
149388b7b0f2SMatthew Ahrens 			err = visit_indirect(spa, dnp, cbp, &czb);
149488b7b0f2SMatthew Ahrens 			if (err)
149588b7b0f2SMatthew Ahrens 				break;
14965d7b4d43SMatthew Ahrens 			fill += BP_GET_FILL(cbp);
149788b7b0f2SMatthew Ahrens 		}
14988ad4d6ddSJeff Bonwick 		if (!err)
14995d7b4d43SMatthew Ahrens 			ASSERT3U(fill, ==, BP_GET_FILL(bp));
1500dcbf3bd6SGeorge Wilson 		arc_buf_destroy(buf, &buf);
1501fa9e4066Sahrens 	}
1502fa9e4066Sahrens 
150388b7b0f2SMatthew Ahrens 	return (err);
1504fa9e4066Sahrens }
1505fa9e4066Sahrens 
1506fa9e4066Sahrens /*ARGSUSED*/
1507fa9e4066Sahrens static void
150888b7b0f2SMatthew Ahrens dump_indirect(dnode_t *dn)
1509fa9e4066Sahrens {
151088b7b0f2SMatthew Ahrens 	dnode_phys_t *dnp = dn->dn_phys;
151188b7b0f2SMatthew Ahrens 	int j;
15127802d7bfSMatthew Ahrens 	zbookmark_phys_t czb;
1513fa9e4066Sahrens 
1514fa9e4066Sahrens 	(void) printf("Indirect blocks:\n");
1515fa9e4066Sahrens 
1516503ad85cSMatthew Ahrens 	SET_BOOKMARK(&czb, dmu_objset_id(dn->dn_objset),
151788b7b0f2SMatthew Ahrens 	    dn->dn_object, dnp->dn_nlevels - 1, 0);
151888b7b0f2SMatthew Ahrens 	for (j = 0; j < dnp->dn_nblkptr; j++) {
151988b7b0f2SMatthew Ahrens 		czb.zb_blkid = j;
1520503ad85cSMatthew Ahrens 		(void) visit_indirect(dmu_objset_spa(dn->dn_objset), dnp,
152188b7b0f2SMatthew Ahrens 		    &dnp->dn_blkptr[j], &czb);
152288b7b0f2SMatthew Ahrens 	}
1523fa9e4066Sahrens 
1524fa9e4066Sahrens 	(void) printf("\n");
1525fa9e4066Sahrens }
1526fa9e4066Sahrens 
1527fa9e4066Sahrens /*ARGSUSED*/
1528fa9e4066Sahrens static void
1529fa9e4066Sahrens dump_dsl_dir(objset_t *os, uint64_t object, void *data, size_t size)
1530fa9e4066Sahrens {
1531fa9e4066Sahrens 	dsl_dir_phys_t *dd = data;
1532fa9e4066Sahrens 	time_t crtime;
15333f9d6ad7SLin Ling 	char nice[32];
1534fa9e4066Sahrens 
15350a055120SJason King 	/* make sure nicenum has enough space */
15360a055120SJason King 	CTASSERT(sizeof (nice) >= NN_NUMBUF_SZ);
15370a055120SJason King 
1538fa9e4066Sahrens 	if (dd == NULL)
1539fa9e4066Sahrens 		return;
1540fa9e4066Sahrens 
1541da6c28aaSamw 	ASSERT3U(size, >=, sizeof (dsl_dir_phys_t));
1542fa9e4066Sahrens 
1543fa9e4066Sahrens 	crtime = dd->dd_creation_time;
1544fa9e4066Sahrens 	(void) printf("\t\tcreation_time = %s", ctime(&crtime));
1545fa9e4066Sahrens 	(void) printf("\t\thead_dataset_obj = %llu\n",
1546fa9e4066Sahrens 	    (u_longlong_t)dd->dd_head_dataset_obj);
1547fa9e4066Sahrens 	(void) printf("\t\tparent_dir_obj = %llu\n",
1548fa9e4066Sahrens 	    (u_longlong_t)dd->dd_parent_obj);
15493cb34c60Sahrens 	(void) printf("\t\torigin_obj = %llu\n",
15503cb34c60Sahrens 	    (u_longlong_t)dd->dd_origin_obj);
1551fa9e4066Sahrens 	(void) printf("\t\tchild_dir_zapobj = %llu\n",
1552fa9e4066Sahrens 	    (u_longlong_t)dd->dd_child_dir_zapobj);
15530a055120SJason King 	zdb_nicenum(dd->dd_used_bytes, nice, sizeof (nice));
155474e7dc98SMatthew Ahrens 	(void) printf("\t\tused_bytes = %s\n", nice);
15550a055120SJason King 	zdb_nicenum(dd->dd_compressed_bytes, nice, sizeof (nice));
155674e7dc98SMatthew Ahrens 	(void) printf("\t\tcompressed_bytes = %s\n", nice);
15570a055120SJason King 	zdb_nicenum(dd->dd_uncompressed_bytes, nice, sizeof (nice));
155874e7dc98SMatthew Ahrens 	(void) printf("\t\tuncompressed_bytes = %s\n", nice);
15590a055120SJason King 	zdb_nicenum(dd->dd_quota, nice, sizeof (nice));
156074e7dc98SMatthew Ahrens 	(void) printf("\t\tquota = %s\n", nice);
15610a055120SJason King 	zdb_nicenum(dd->dd_reserved, nice, sizeof (nice));
156274e7dc98SMatthew Ahrens 	(void) printf("\t\treserved = %s\n", nice);
1563fa9e4066Sahrens 	(void) printf("\t\tprops_zapobj = %llu\n",
1564fa9e4066Sahrens 	    (u_longlong_t)dd->dd_props_zapobj);
1565ecd6cf80Smarks 	(void) printf("\t\tdeleg_zapobj = %llu\n",
1566ecd6cf80Smarks 	    (u_longlong_t)dd->dd_deleg_zapobj);
156774e7dc98SMatthew Ahrens 	(void) printf("\t\tflags = %llx\n",
156874e7dc98SMatthew Ahrens 	    (u_longlong_t)dd->dd_flags);
156974e7dc98SMatthew Ahrens 
157074e7dc98SMatthew Ahrens #define	DO(which) \
15710a055120SJason King 	zdb_nicenum(dd->dd_used_breakdown[DD_USED_ ## which], nice, \
15720a055120SJason King 	    sizeof (nice)); \
157374e7dc98SMatthew Ahrens 	(void) printf("\t\tused_breakdown[" #which "] = %s\n", nice)
157474e7dc98SMatthew Ahrens 	DO(HEAD);
157574e7dc98SMatthew Ahrens 	DO(SNAP);
157674e7dc98SMatthew Ahrens 	DO(CHILD);
157774e7dc98SMatthew Ahrens 	DO(CHILD_RSRV);
157874e7dc98SMatthew Ahrens 	DO(REFRSRV);
157974e7dc98SMatthew Ahrens #undef DO
158017fb938fSMatthew Ahrens 	(void) printf("\t\tclones = %llu\n",
158117fb938fSMatthew Ahrens 	    (u_longlong_t)dd->dd_clones);
1582fa9e4066Sahrens }
1583fa9e4066Sahrens 
1584fa9e4066Sahrens /*ARGSUSED*/
1585fa9e4066Sahrens static void
1586fa9e4066Sahrens dump_dsl_dataset(objset_t *os, uint64_t object, void *data, size_t size)
1587fa9e4066Sahrens {
1588fa9e4066Sahrens 	dsl_dataset_phys_t *ds = data;
1589fa9e4066Sahrens 	time_t crtime;
15903f9d6ad7SLin Ling 	char used[32], compressed[32], uncompressed[32], unique[32];
1591fbabab8fSmaybee 	char blkbuf[BP_SPRINTF_LEN];
1592fa9e4066Sahrens 
15930a055120SJason King 	/* make sure nicenum has enough space */
15940a055120SJason King 	CTASSERT(sizeof (used) >= NN_NUMBUF_SZ);
15950a055120SJason King 	CTASSERT(sizeof (compressed) >= NN_NUMBUF_SZ);
15960a055120SJason King 	CTASSERT(sizeof (uncompressed) >= NN_NUMBUF_SZ);
15970a055120SJason King 	CTASSERT(sizeof (unique) >= NN_NUMBUF_SZ);
15980a055120SJason King 
1599fa9e4066Sahrens 	if (ds == NULL)
1600fa9e4066Sahrens 		return;
1601fa9e4066Sahrens 
1602fa9e4066Sahrens 	ASSERT(size == sizeof (*ds));
1603fa9e4066Sahrens 	crtime = ds->ds_creation_time;
16040a055120SJason King 	zdb_nicenum(ds->ds_referenced_bytes, used, sizeof (used));
16050a055120SJason King 	zdb_nicenum(ds->ds_compressed_bytes, compressed, sizeof (compressed));
16060a055120SJason King 	zdb_nicenum(ds->ds_uncompressed_bytes, uncompressed,
16070a055120SJason King 	    sizeof (uncompressed));
16080a055120SJason King 	zdb_nicenum(ds->ds_unique_bytes, unique, sizeof (unique));
160943466aaeSMax Grossman 	snprintf_blkptr(blkbuf, sizeof (blkbuf), &ds->ds_bp);
1610fa9e4066Sahrens 
1611088f3894Sahrens 	(void) printf("\t\tdir_obj = %llu\n",
1612fa9e4066Sahrens 	    (u_longlong_t)ds->ds_dir_obj);
1613fa9e4066Sahrens 	(void) printf("\t\tprev_snap_obj = %llu\n",
1614fa9e4066Sahrens 	    (u_longlong_t)ds->ds_prev_snap_obj);
1615fa9e4066Sahrens 	(void) printf("\t\tprev_snap_txg = %llu\n",
1616fa9e4066Sahrens 	    (u_longlong_t)ds->ds_prev_snap_txg);
1617fa9e4066Sahrens 	(void) printf("\t\tnext_snap_obj = %llu\n",
1618fa9e4066Sahrens 	    (u_longlong_t)ds->ds_next_snap_obj);
1619fa9e4066Sahrens 	(void) printf("\t\tsnapnames_zapobj = %llu\n",
1620fa9e4066Sahrens 	    (u_longlong_t)ds->ds_snapnames_zapobj);
1621fa9e4066Sahrens 	(void) printf("\t\tnum_children = %llu\n",
1622fa9e4066Sahrens 	    (u_longlong_t)ds->ds_num_children);
1623842727c2SChris Kirby 	(void) printf("\t\tuserrefs_obj = %llu\n",
1624842727c2SChris Kirby 	    (u_longlong_t)ds->ds_userrefs_obj);
1625fa9e4066Sahrens 	(void) printf("\t\tcreation_time = %s", ctime(&crtime));
1626fa9e4066Sahrens 	(void) printf("\t\tcreation_txg = %llu\n",
1627fa9e4066Sahrens 	    (u_longlong_t)ds->ds_creation_txg);
1628fa9e4066Sahrens 	(void) printf("\t\tdeadlist_obj = %llu\n",
1629fa9e4066Sahrens 	    (u_longlong_t)ds->ds_deadlist_obj);
1630fa9e4066Sahrens 	(void) printf("\t\tused_bytes = %s\n", used);
1631fa9e4066Sahrens 	(void) printf("\t\tcompressed_bytes = %s\n", compressed);
1632fa9e4066Sahrens 	(void) printf("\t\tuncompressed_bytes = %s\n", uncompressed);
1633fa9e4066Sahrens 	(void) printf("\t\tunique = %s\n", unique);
1634fa9e4066Sahrens 	(void) printf("\t\tfsid_guid = %llu\n",
1635fa9e4066Sahrens 	    (u_longlong_t)ds->ds_fsid_guid);
1636fa9e4066Sahrens 	(void) printf("\t\tguid = %llu\n",
1637fa9e4066Sahrens 	    (u_longlong_t)ds->ds_guid);
163899653d4eSeschrock 	(void) printf("\t\tflags = %llx\n",
163999653d4eSeschrock 	    (u_longlong_t)ds->ds_flags);
1640088f3894Sahrens 	(void) printf("\t\tnext_clones_obj = %llu\n",
1641088f3894Sahrens 	    (u_longlong_t)ds->ds_next_clones_obj);
1642bb0ade09Sahrens 	(void) printf("\t\tprops_obj = %llu\n",
1643bb0ade09Sahrens 	    (u_longlong_t)ds->ds_props_obj);
1644fa9e4066Sahrens 	(void) printf("\t\tbp = %s\n", blkbuf);
1645fa9e4066Sahrens }
1646fa9e4066Sahrens 
1647ad135b5dSChristopher Siden /* ARGSUSED */
1648ad135b5dSChristopher Siden static int
1649ad135b5dSChristopher Siden dump_bptree_cb(void *arg, const blkptr_t *bp, dmu_tx_t *tx)
1650ad135b5dSChristopher Siden {
1651ad135b5dSChristopher Siden 	char blkbuf[BP_SPRINTF_LEN];
1652ad135b5dSChristopher Siden 
1653ad135b5dSChristopher Siden 	if (bp->blk_birth != 0) {
165443466aaeSMax Grossman 		snprintf_blkptr(blkbuf, sizeof (blkbuf), bp);
1655ad135b5dSChristopher Siden 		(void) printf("\t%s\n", blkbuf);
1656ad135b5dSChristopher Siden 	}
1657ad135b5dSChristopher Siden 	return (0);
1658ad135b5dSChristopher Siden }
1659ad135b5dSChristopher Siden 
1660ad135b5dSChristopher Siden static void
16613f7978d0SAlan Somers dump_bptree(objset_t *os, uint64_t obj, const char *name)
1662ad135b5dSChristopher Siden {
1663ad135b5dSChristopher Siden 	char bytes[32];
1664ad135b5dSChristopher Siden 	bptree_phys_t *bt;
1665ad135b5dSChristopher Siden 	dmu_buf_t *db;
1666ad135b5dSChristopher Siden 
16670a055120SJason King 	/* make sure nicenum has enough space */
16680a055120SJason King 	CTASSERT(sizeof (bytes) >= NN_NUMBUF_SZ);
16690a055120SJason King 
1670ad135b5dSChristopher Siden 	if (dump_opt['d'] < 3)
1671ad135b5dSChristopher Siden 		return;
1672ad135b5dSChristopher Siden 
1673b420f3adSRichard Lowe 	VERIFY3U(0, ==, dmu_bonus_hold(os, obj, FTAG, &db));
1674ad135b5dSChristopher Siden 	bt = db->db_data;
16750a055120SJason King 	zdb_nicenum(bt->bt_bytes, bytes, sizeof (bytes));
1676ad135b5dSChristopher Siden 	(void) printf("\n    %s: %llu datasets, %s\n",
1677ad135b5dSChristopher Siden 	    name, (unsigned long long)(bt->bt_end - bt->bt_begin), bytes);
1678ad135b5dSChristopher Siden 	dmu_buf_rele(db, FTAG);
1679ad135b5dSChristopher Siden 
1680ad135b5dSChristopher Siden 	if (dump_opt['d'] < 5)
1681ad135b5dSChristopher Siden 		return;
1682ad135b5dSChristopher Siden 
1683ad135b5dSChristopher Siden 	(void) printf("\n");
1684ad135b5dSChristopher Siden 
1685ad135b5dSChristopher Siden 	(void) bptree_iterate(os, obj, B_FALSE, dump_bptree_cb, NULL, NULL);
1686ad135b5dSChristopher Siden }
1687ad135b5dSChristopher Siden 
1688cde58dbcSMatthew Ahrens /* ARGSUSED */
1689cde58dbcSMatthew Ahrens static int
1690cde58dbcSMatthew Ahrens dump_bpobj_cb(void *arg, const blkptr_t *bp, dmu_tx_t *tx)
1691cde58dbcSMatthew Ahrens {
1692cde58dbcSMatthew Ahrens 	char blkbuf[BP_SPRINTF_LEN];
1693cde58dbcSMatthew Ahrens 
1694cde58dbcSMatthew Ahrens 	ASSERT(bp->blk_birth != 0);
169543466aaeSMax Grossman 	snprintf_blkptr_compact(blkbuf, sizeof (blkbuf), bp);
1696cde58dbcSMatthew Ahrens 	(void) printf("\t%s\n", blkbuf);
1697cde58dbcSMatthew Ahrens 	return (0);
1698cde58dbcSMatthew Ahrens }
1699cde58dbcSMatthew Ahrens 
1700fa9e4066Sahrens static void
17013f7978d0SAlan Somers dump_full_bpobj(bpobj_t *bpo, const char *name, int indent)
1702fa9e4066Sahrens {
17033f9d6ad7SLin Ling 	char bytes[32];
17043f9d6ad7SLin Ling 	char comp[32];
17053f9d6ad7SLin Ling 	char uncomp[32];
1706fa9e4066Sahrens 
17070a055120SJason King 	/* make sure nicenum has enough space */
17080a055120SJason King 	CTASSERT(sizeof (bytes) >= NN_NUMBUF_SZ);
17090a055120SJason King 	CTASSERT(sizeof (comp) >= NN_NUMBUF_SZ);
17100a055120SJason King 	CTASSERT(sizeof (uncomp) >= NN_NUMBUF_SZ);
17110a055120SJason King 
1712fa9e4066Sahrens 	if (dump_opt['d'] < 3)
1713fa9e4066Sahrens 		return;
1714fa9e4066Sahrens 
17150a055120SJason King 	zdb_nicenum(bpo->bpo_phys->bpo_bytes, bytes, sizeof (bytes));
1716d0475637SMatthew Ahrens 	if (bpo->bpo_havesubobj && bpo->bpo_phys->bpo_subobjs != 0) {
17170a055120SJason King 		zdb_nicenum(bpo->bpo_phys->bpo_comp, comp, sizeof (comp));
17180a055120SJason King 		zdb_nicenum(bpo->bpo_phys->bpo_uncomp, uncomp, sizeof (uncomp));
1719d0475637SMatthew Ahrens 		(void) printf("    %*s: object %llu, %llu local blkptrs, "
1720732885fcSMatthew Ahrens 		    "%llu subobjs in object %llu, %s (%s/%s comp)\n",
1721d0475637SMatthew Ahrens 		    indent * 8, name,
1722d0475637SMatthew Ahrens 		    (u_longlong_t)bpo->bpo_object,
1723d0475637SMatthew Ahrens 		    (u_longlong_t)bpo->bpo_phys->bpo_num_blkptrs,
1724cde58dbcSMatthew Ahrens 		    (u_longlong_t)bpo->bpo_phys->bpo_num_subobjs,
1725732885fcSMatthew Ahrens 		    (u_longlong_t)bpo->bpo_phys->bpo_subobjs,
172699653d4eSeschrock 		    bytes, comp, uncomp);
1727d0475637SMatthew Ahrens 
1728d0475637SMatthew Ahrens 		for (uint64_t i = 0; i < bpo->bpo_phys->bpo_num_subobjs; i++) {
1729d0475637SMatthew Ahrens 			uint64_t subobj;
1730d0475637SMatthew Ahrens 			bpobj_t subbpo;
1731d0475637SMatthew Ahrens 			int error;
1732d0475637SMatthew Ahrens 			VERIFY0(dmu_read(bpo->bpo_os,
1733d0475637SMatthew Ahrens 			    bpo->bpo_phys->bpo_subobjs,
1734d0475637SMatthew Ahrens 			    i * sizeof (subobj), sizeof (subobj), &subobj, 0));
1735d0475637SMatthew Ahrens 			error = bpobj_open(&subbpo, bpo->bpo_os, subobj);
1736d0475637SMatthew Ahrens 			if (error != 0) {
1737d0475637SMatthew Ahrens 				(void) printf("ERROR %u while trying to open "
1738d0475637SMatthew Ahrens 				    "subobj id %llu\n",
1739d0475637SMatthew Ahrens 				    error, (u_longlong_t)subobj);
1740d0475637SMatthew Ahrens 				continue;
1741d0475637SMatthew Ahrens 			}
1742732885fcSMatthew Ahrens 			dump_full_bpobj(&subbpo, "subobj", indent + 1);
174377061867SMatthew Ahrens 			bpobj_close(&subbpo);
1744d0475637SMatthew Ahrens 		}
174599653d4eSeschrock 	} else {
1746d0475637SMatthew Ahrens 		(void) printf("    %*s: object %llu, %llu blkptrs, %s\n",
1747d0475637SMatthew Ahrens 		    indent * 8, name,
1748d0475637SMatthew Ahrens 		    (u_longlong_t)bpo->bpo_object,
1749d0475637SMatthew Ahrens 		    (u_longlong_t)bpo->bpo_phys->bpo_num_blkptrs,
1750d0475637SMatthew Ahrens 		    bytes);
175199653d4eSeschrock 	}
1752fa9e4066Sahrens 
1753cde58dbcSMatthew Ahrens 	if (dump_opt['d'] < 5)
1754fa9e4066Sahrens 		return;
1755fa9e4066Sahrens 
1756fa9e4066Sahrens 
1757d0475637SMatthew Ahrens 	if (indent == 0) {
1758d0475637SMatthew Ahrens 		(void) bpobj_iterate_nofree(bpo, dump_bpobj_cb, NULL, NULL);
1759d0475637SMatthew Ahrens 		(void) printf("\n");
1760d0475637SMatthew Ahrens 	}
1761cde58dbcSMatthew Ahrens }
176244cd46caSbillm 
176317fb938fSMatthew Ahrens static void
176417fb938fSMatthew Ahrens bpobj_count_refd(bpobj_t *bpo)
176517fb938fSMatthew Ahrens {
176617fb938fSMatthew Ahrens 	mos_obj_refd(bpo->bpo_object);
176717fb938fSMatthew Ahrens 
176817fb938fSMatthew Ahrens 	if (bpo->bpo_havesubobj && bpo->bpo_phys->bpo_subobjs != 0) {
176917fb938fSMatthew Ahrens 		mos_obj_refd(bpo->bpo_phys->bpo_subobjs);
177017fb938fSMatthew Ahrens 		for (uint64_t i = 0; i < bpo->bpo_phys->bpo_num_subobjs; i++) {
177117fb938fSMatthew Ahrens 			uint64_t subobj;
177217fb938fSMatthew Ahrens 			bpobj_t subbpo;
177317fb938fSMatthew Ahrens 			int error;
177417fb938fSMatthew Ahrens 			VERIFY0(dmu_read(bpo->bpo_os,
177517fb938fSMatthew Ahrens 			    bpo->bpo_phys->bpo_subobjs,
177617fb938fSMatthew Ahrens 			    i * sizeof (subobj), sizeof (subobj), &subobj, 0));
177717fb938fSMatthew Ahrens 			error = bpobj_open(&subbpo, bpo->bpo_os, subobj);
177817fb938fSMatthew Ahrens 			if (error != 0) {
177917fb938fSMatthew Ahrens 				(void) printf("ERROR %u while trying to open "
178017fb938fSMatthew Ahrens 				    "subobj id %llu\n",
178117fb938fSMatthew Ahrens 				    error, (u_longlong_t)subobj);
178217fb938fSMatthew Ahrens 				continue;
178317fb938fSMatthew Ahrens 			}
178417fb938fSMatthew Ahrens 			bpobj_count_refd(&subbpo);
178517fb938fSMatthew Ahrens 			bpobj_close(&subbpo);
178617fb938fSMatthew Ahrens 		}
178717fb938fSMatthew Ahrens 	}
178817fb938fSMatthew Ahrens }
178917fb938fSMatthew Ahrens 
1790cde58dbcSMatthew Ahrens static void
1791cde58dbcSMatthew Ahrens dump_deadlist(dsl_deadlist_t *dl)
1792cde58dbcSMatthew Ahrens {
1793cde58dbcSMatthew Ahrens 	dsl_deadlist_entry_t *dle;
1794d0475637SMatthew Ahrens 	uint64_t unused;
1795cde58dbcSMatthew Ahrens 	char bytes[32];
1796cde58dbcSMatthew Ahrens 	char comp[32];
1797cde58dbcSMatthew Ahrens 	char uncomp[32];
179817fb938fSMatthew Ahrens 	uint64_t empty_bpobj =
179917fb938fSMatthew Ahrens 	    dmu_objset_spa(dl->dl_os)->spa_dsl_pool->dp_empty_bpobj;
180017fb938fSMatthew Ahrens 
180117fb938fSMatthew Ahrens 	/* force the tree to be loaded */
180217fb938fSMatthew Ahrens 	dsl_deadlist_space_range(dl, 0, UINT64_MAX, &unused, &unused, &unused);
180317fb938fSMatthew Ahrens 
180417fb938fSMatthew Ahrens 	if (dl->dl_oldfmt) {
180517fb938fSMatthew Ahrens 		if (dl->dl_bpobj.bpo_object != empty_bpobj)
180617fb938fSMatthew Ahrens 			bpobj_count_refd(&dl->dl_bpobj);
180717fb938fSMatthew Ahrens 	} else {
180817fb938fSMatthew Ahrens 		mos_obj_refd(dl->dl_object);
180917fb938fSMatthew Ahrens 		for (dle = avl_first(&dl->dl_tree); dle;
181017fb938fSMatthew Ahrens 		    dle = AVL_NEXT(&dl->dl_tree, dle)) {
181117fb938fSMatthew Ahrens 			if (dle->dle_bpobj.bpo_object != empty_bpobj)
181217fb938fSMatthew Ahrens 				bpobj_count_refd(&dle->dle_bpobj);
181317fb938fSMatthew Ahrens 		}
181417fb938fSMatthew Ahrens 	}
1815cde58dbcSMatthew Ahrens 
18160a055120SJason King 	/* make sure nicenum has enough space */
18170a055120SJason King 	CTASSERT(sizeof (bytes) >= NN_NUMBUF_SZ);
18180a055120SJason King 	CTASSERT(sizeof (comp) >= NN_NUMBUF_SZ);
18190a055120SJason King 	CTASSERT(sizeof (uncomp) >= NN_NUMBUF_SZ);
18200a055120SJason King 
1821cde58dbcSMatthew Ahrens 	if (dump_opt['d'] < 3)
1822cde58dbcSMatthew Ahrens 		return;
1823cde58dbcSMatthew Ahrens 
182490c76c66SMatthew Ahrens 	if (dl->dl_oldfmt) {
1825732885fcSMatthew Ahrens 		dump_full_bpobj(&dl->dl_bpobj, "old-format deadlist", 0);
182690c76c66SMatthew Ahrens 		return;
182790c76c66SMatthew Ahrens 	}
182890c76c66SMatthew Ahrens 
18290a055120SJason King 	zdb_nicenum(dl->dl_phys->dl_used, bytes, sizeof (bytes));
18300a055120SJason King 	zdb_nicenum(dl->dl_phys->dl_comp, comp, sizeof (comp));
18310a055120SJason King 	zdb_nicenum(dl->dl_phys->dl_uncomp, uncomp, sizeof (uncomp));
1832cde58dbcSMatthew Ahrens 	(void) printf("\n    Deadlist: %s (%s/%s comp)\n",
1833cde58dbcSMatthew Ahrens 	    bytes, comp, uncomp);
1834cde58dbcSMatthew Ahrens 
1835cde58dbcSMatthew Ahrens 	if (dump_opt['d'] < 4)
1836cde58dbcSMatthew Ahrens 		return;
1837cde58dbcSMatthew Ahrens 
1838cde58dbcSMatthew Ahrens 	(void) printf("\n");
1839cde58dbcSMatthew Ahrens 
1840cde58dbcSMatthew Ahrens 	for (dle = avl_first(&dl->dl_tree); dle;
1841cde58dbcSMatthew Ahrens 	    dle = AVL_NEXT(&dl->dl_tree, dle)) {
1842d0475637SMatthew Ahrens 		if (dump_opt['d'] >= 5) {
1843d0475637SMatthew Ahrens 			char buf[128];
1844de05b588SRichard Yao 			(void) snprintf(buf, sizeof (buf),
1845de05b588SRichard Yao 			    "mintxg %llu -> obj %llu",
1846d0475637SMatthew Ahrens 			    (longlong_t)dle->dle_mintxg,
1847d0475637SMatthew Ahrens 			    (longlong_t)dle->dle_bpobj.bpo_object);
1848fa9e4066Sahrens 
1849732885fcSMatthew Ahrens 			dump_full_bpobj(&dle->dle_bpobj, buf, 0);
1850d0475637SMatthew Ahrens 		} else {
1851d0475637SMatthew Ahrens 			(void) printf("mintxg %llu -> obj %llu\n",
1852d0475637SMatthew Ahrens 			    (longlong_t)dle->dle_mintxg,
1853d0475637SMatthew Ahrens 			    (longlong_t)dle->dle_bpobj.bpo_object);
1854d0475637SMatthew Ahrens 		}
1855cde58dbcSMatthew Ahrens 	}
1856fa9e4066Sahrens }
1857fa9e4066Sahrens 
1858e0d35c44Smarks static avl_tree_t idx_tree;
1859e0d35c44Smarks static avl_tree_t domain_tree;
1860e0d35c44Smarks static boolean_t fuid_table_loaded;
1861ed61ec1dSYuri Pankov static objset_t *sa_os = NULL;
1862ed61ec1dSYuri Pankov static sa_attr_type_t *sa_attr_table = NULL;
1863ed61ec1dSYuri Pankov 
1864ed61ec1dSYuri Pankov static int
1865ed61ec1dSYuri Pankov open_objset(const char *path, dmu_objset_type_t type, void *tag, objset_t **osp)
1866ed61ec1dSYuri Pankov {
1867ed61ec1dSYuri Pankov 	int err;
1868ed61ec1dSYuri Pankov 	uint64_t sa_attrs = 0;
1869ed61ec1dSYuri Pankov 	uint64_t version = 0;
1870ed61ec1dSYuri Pankov 
1871ed61ec1dSYuri Pankov 	VERIFY3P(sa_os, ==, NULL);
1872ed61ec1dSYuri Pankov 	err = dmu_objset_own(path, type, B_TRUE, tag, osp);
1873ed61ec1dSYuri Pankov 	if (err != 0) {
1874ed61ec1dSYuri Pankov 		(void) fprintf(stderr, "failed to own dataset '%s': %s\n", path,
1875ed61ec1dSYuri Pankov 		    strerror(err));
1876ed61ec1dSYuri Pankov 		return (err);
1877ed61ec1dSYuri Pankov 	}
1878ed61ec1dSYuri Pankov 
1879ed61ec1dSYuri Pankov 	if (dmu_objset_type(*osp) == DMU_OST_ZFS) {
1880ed61ec1dSYuri Pankov 		(void) zap_lookup(*osp, MASTER_NODE_OBJ, ZPL_VERSION_STR,
1881ed61ec1dSYuri Pankov 		    8, 1, &version);
1882ed61ec1dSYuri Pankov 		if (version >= ZPL_VERSION_SA) {
1883ed61ec1dSYuri Pankov 			(void) zap_lookup(*osp, MASTER_NODE_OBJ, ZFS_SA_ATTRS,
1884ed61ec1dSYuri Pankov 			    8, 1, &sa_attrs);
1885ed61ec1dSYuri Pankov 		}
1886ed61ec1dSYuri Pankov 		err = sa_setup(*osp, sa_attrs, zfs_attr_table, ZPL_END,
1887ed61ec1dSYuri Pankov 		    &sa_attr_table);
1888ed61ec1dSYuri Pankov 		if (err != 0) {
1889ed61ec1dSYuri Pankov 			(void) fprintf(stderr, "sa_setup failed: %s\n",
1890ed61ec1dSYuri Pankov 			    strerror(err));
1891ed61ec1dSYuri Pankov 			dmu_objset_disown(*osp, tag);
1892ed61ec1dSYuri Pankov 			*osp = NULL;
1893ed61ec1dSYuri Pankov 		}
1894ed61ec1dSYuri Pankov 	}
1895ed61ec1dSYuri Pankov 	sa_os = *osp;
1896ed61ec1dSYuri Pankov 
1897ed61ec1dSYuri Pankov 	return (0);
1898ed61ec1dSYuri Pankov }
1899ed61ec1dSYuri Pankov 
1900ed61ec1dSYuri Pankov static void
1901ed61ec1dSYuri Pankov close_objset(objset_t *os, void *tag)
1902ed61ec1dSYuri Pankov {
1903ed61ec1dSYuri Pankov 	VERIFY3P(os, ==, sa_os);
1904ed61ec1dSYuri Pankov 	if (os->os_sa != NULL)
1905ed61ec1dSYuri Pankov 		sa_tear_down(os);
1906ed61ec1dSYuri Pankov 	dmu_objset_disown(os, tag);
1907ed61ec1dSYuri Pankov 	sa_attr_table = NULL;
1908ed61ec1dSYuri Pankov 	sa_os = NULL;
1909ed61ec1dSYuri Pankov }
1910e0d35c44Smarks 
1911e0d35c44Smarks static void
1912e0d35c44Smarks fuid_table_destroy()
1913e0d35c44Smarks {
1914e0d35c44Smarks 	if (fuid_table_loaded) {
1915e0d35c44Smarks 		zfs_fuid_table_destroy(&idx_tree, &domain_tree);
1916e0d35c44Smarks 		fuid_table_loaded = B_FALSE;
1917e0d35c44Smarks 	}
1918e0d35c44Smarks }
1919e0d35c44Smarks 
1920e0d35c44Smarks /*
1921e0d35c44Smarks  * print uid or gid information.
1922e0d35c44Smarks  * For normal POSIX id just the id is printed in decimal format.
1923e0d35c44Smarks  * For CIFS files with FUID the fuid is printed in hex followed by
1924d0475637SMatthew Ahrens  * the domain-rid string.
1925e0d35c44Smarks  */
1926e0d35c44Smarks static void
1927e0d35c44Smarks print_idstr(uint64_t id, const char *id_type)
1928e0d35c44Smarks {
1929e0d35c44Smarks 	if (FUID_INDEX(id)) {
1930e0d35c44Smarks 		char *domain;
1931e0d35c44Smarks 
1932e0d35c44Smarks 		domain = zfs_fuid_idx_domain(&idx_tree, FUID_INDEX(id));
1933e0d35c44Smarks 		(void) printf("\t%s     %llx [%s-%d]\n", id_type,
1934e0d35c44Smarks 		    (u_longlong_t)id, domain, (int)FUID_RID(id));
1935e0d35c44Smarks 	} else {
1936e0d35c44Smarks 		(void) printf("\t%s     %llu\n", id_type, (u_longlong_t)id);
1937e0d35c44Smarks 	}
1938e0d35c44Smarks 
1939e0d35c44Smarks }
1940e0d35c44Smarks 
1941e0d35c44Smarks static void
19420a586ceaSMark Shellenbaum dump_uidgid(objset_t *os, uint64_t uid, uint64_t gid)
1943e0d35c44Smarks {
1944e0d35c44Smarks 	uint32_t uid_idx, gid_idx;
1945e0d35c44Smarks 
19460a586ceaSMark Shellenbaum 	uid_idx = FUID_INDEX(uid);
19470a586ceaSMark Shellenbaum 	gid_idx = FUID_INDEX(gid);
1948e0d35c44Smarks 
1949e0d35c44Smarks 	/* Load domain table, if not already loaded */
1950e0d35c44Smarks 	if (!fuid_table_loaded && (uid_idx || gid_idx)) {
1951e0d35c44Smarks 		uint64_t fuid_obj;
1952e0d35c44Smarks 
1953e0d35c44Smarks 		/* first find the fuid object.  It lives in the master node */
1954e0d35c44Smarks 		VERIFY(zap_lookup(os, MASTER_NODE_OBJ, ZFS_FUID_TABLES,
1955e0d35c44Smarks 		    8, 1, &fuid_obj) == 0);
195689459e17SMark Shellenbaum 		zfs_fuid_avl_tree_create(&idx_tree, &domain_tree);
1957e0d35c44Smarks 		(void) zfs_fuid_table_load(os, fuid_obj,
1958e0d35c44Smarks 		    &idx_tree, &domain_tree);
1959e0d35c44Smarks 		fuid_table_loaded = B_TRUE;
1960e0d35c44Smarks 	}
1961e0d35c44Smarks 
19620a586ceaSMark Shellenbaum 	print_idstr(uid, "uid");
19630a586ceaSMark Shellenbaum 	print_idstr(gid, "gid");
1964e0d35c44Smarks }
1965e0d35c44Smarks 
1966fa9e4066Sahrens /*ARGSUSED*/
1967fa9e4066Sahrens static void
1968fa9e4066Sahrens dump_znode(objset_t *os, uint64_t object, void *data, size_t size)
1969fa9e4066Sahrens {
1970fa9e4066Sahrens 	char path[MAXPATHLEN * 2];	/* allow for xattr and failure prefix */
19710a586ceaSMark Shellenbaum 	sa_handle_t *hdl;
19720a586ceaSMark Shellenbaum 	uint64_t xattr, rdev, gen;
19730a586ceaSMark Shellenbaum 	uint64_t uid, gid, mode, fsize, parent, links;
19748f2529deSMark Shellenbaum 	uint64_t pflags;
19750a586ceaSMark Shellenbaum 	uint64_t acctm[2], modtm[2], chgtm[2], crtm[2];
19760a586ceaSMark Shellenbaum 	time_t z_crtime, z_atime, z_mtime, z_ctime;
19778f2529deSMark Shellenbaum 	sa_bulk_attr_t bulk[12];
19780a586ceaSMark Shellenbaum 	int idx = 0;
197955434c77Sek 	int error;
1980fa9e4066Sahrens 
1981ed61ec1dSYuri Pankov 	VERIFY3P(os, ==, sa_os);
19820a586ceaSMark Shellenbaum 	if (sa_handle_get(os, object, NULL, SA_HDL_PRIVATE, &hdl)) {
19830a586ceaSMark Shellenbaum 		(void) printf("Failed to get handle for SA znode\n");
19840a586ceaSMark Shellenbaum 		return;
19850a586ceaSMark Shellenbaum 	}
19860a586ceaSMark Shellenbaum 
19870a586ceaSMark Shellenbaum 	SA_ADD_BULK_ATTR(bulk, idx, sa_attr_table[ZPL_UID], NULL, &uid, 8);
19880a586ceaSMark Shellenbaum 	SA_ADD_BULK_ATTR(bulk, idx, sa_attr_table[ZPL_GID], NULL, &gid, 8);
19890a586ceaSMark Shellenbaum 	SA_ADD_BULK_ATTR(bulk, idx, sa_attr_table[ZPL_LINKS], NULL,
19900a586ceaSMark Shellenbaum 	    &links, 8);
19910a586ceaSMark Shellenbaum 	SA_ADD_BULK_ATTR(bulk, idx, sa_attr_table[ZPL_GEN], NULL, &gen, 8);
19920a586ceaSMark Shellenbaum 	SA_ADD_BULK_ATTR(bulk, idx, sa_attr_table[ZPL_MODE], NULL,
19930a586ceaSMark Shellenbaum 	    &mode, 8);
19940a586ceaSMark Shellenbaum 	SA_ADD_BULK_ATTR(bulk, idx, sa_attr_table[ZPL_PARENT],
19950a586ceaSMark Shellenbaum 	    NULL, &parent, 8);
19960a586ceaSMark Shellenbaum 	SA_ADD_BULK_ATTR(bulk, idx, sa_attr_table[ZPL_SIZE], NULL,
19970a586ceaSMark Shellenbaum 	    &fsize, 8);
19980a586ceaSMark Shellenbaum 	SA_ADD_BULK_ATTR(bulk, idx, sa_attr_table[ZPL_ATIME], NULL,
19990a586ceaSMark Shellenbaum 	    acctm, 16);
20000a586ceaSMark Shellenbaum 	SA_ADD_BULK_ATTR(bulk, idx, sa_attr_table[ZPL_MTIME], NULL,
20010a586ceaSMark Shellenbaum 	    modtm, 16);
20020a586ceaSMark Shellenbaum 	SA_ADD_BULK_ATTR(bulk, idx, sa_attr_table[ZPL_CRTIME], NULL,
20030a586ceaSMark Shellenbaum 	    crtm, 16);
20040a586ceaSMark Shellenbaum 	SA_ADD_BULK_ATTR(bulk, idx, sa_attr_table[ZPL_CTIME], NULL,
20050a586ceaSMark Shellenbaum 	    chgtm, 16);
20068f2529deSMark Shellenbaum 	SA_ADD_BULK_ATTR(bulk, idx, sa_attr_table[ZPL_FLAGS], NULL,
20078f2529deSMark Shellenbaum 	    &pflags, 8);
20080a586ceaSMark Shellenbaum 
20090a586ceaSMark Shellenbaum 	if (sa_bulk_lookup(hdl, bulk, idx)) {
20100a586ceaSMark Shellenbaum 		(void) sa_handle_destroy(hdl);
20110a586ceaSMark Shellenbaum 		return;
20120a586ceaSMark Shellenbaum 	}
2013fa9e4066Sahrens 
20140a586ceaSMark Shellenbaum 	z_crtime = (time_t)crtm[0];
20150a586ceaSMark Shellenbaum 	z_atime = (time_t)acctm[0];
20160a586ceaSMark Shellenbaum 	z_mtime = (time_t)modtm[0];
20170a586ceaSMark Shellenbaum 	z_ctime = (time_t)chgtm[0];
2018fa9e4066Sahrens 
2019e548d2faSAlan Somers 	if (dump_opt['d'] > 4) {
2020e548d2faSAlan Somers 		error = zfs_obj_to_path(os, object, path, sizeof (path));
202120b5dafbSPaul Dagnelie 		if (error == ESTALE) {
202220b5dafbSPaul Dagnelie 			(void) snprintf(path, sizeof (path), "on delete queue");
202320b5dafbSPaul Dagnelie 		} else if (error != 0) {
202420b5dafbSPaul Dagnelie 			leaked_objects++;
2025e548d2faSAlan Somers 			(void) snprintf(path, sizeof (path),
202620b5dafbSPaul Dagnelie 			    "path not found, possibly leaked");
2027e548d2faSAlan Somers 		}
2028e548d2faSAlan Somers 		(void) printf("\tpath	%s\n", path);
2029e548d2faSAlan Somers 	}
20300a586ceaSMark Shellenbaum 	dump_uidgid(os, uid, gid);
2031fa9e4066Sahrens 	(void) printf("\tatime	%s", ctime(&z_atime));
2032fa9e4066Sahrens 	(void) printf("\tmtime	%s", ctime(&z_mtime));
2033fa9e4066Sahrens 	(void) printf("\tctime	%s", ctime(&z_ctime));
2034fa9e4066Sahrens 	(void) printf("\tcrtime	%s", ctime(&z_crtime));
20350a586ceaSMark Shellenbaum 	(void) printf("\tgen	%llu\n", (u_longlong_t)gen);
20360a586ceaSMark Shellenbaum 	(void) printf("\tmode	%llo\n", (u_longlong_t)mode);
20370a586ceaSMark Shellenbaum 	(void) printf("\tsize	%llu\n", (u_longlong_t)fsize);
20380a586ceaSMark Shellenbaum 	(void) printf("\tparent	%llu\n", (u_longlong_t)parent);
20390a586ceaSMark Shellenbaum 	(void) printf("\tlinks	%llu\n", (u_longlong_t)links);
20408f2529deSMark Shellenbaum 	(void) printf("\tpflags	%llx\n", (u_longlong_t)pflags);
20410a586ceaSMark Shellenbaum 	if (sa_lookup(hdl, sa_attr_table[ZPL_XATTR], &xattr,
20420a586ceaSMark Shellenbaum 	    sizeof (uint64_t)) == 0)
20430a586ceaSMark Shellenbaum 		(void) printf("\txattr	%llu\n", (u_longlong_t)xattr);
20440a586ceaSMark Shellenbaum 	if (sa_lookup(hdl, sa_attr_table[ZPL_RDEV], &rdev,
20450a586ceaSMark Shellenbaum 	    sizeof (uint64_t)) == 0)
20460a586ceaSMark Shellenbaum 		(void) printf("\trdev	0x%016llx\n", (u_longlong_t)rdev);
20470a586ceaSMark Shellenbaum 	sa_handle_destroy(hdl);
2048fa9e4066Sahrens }
2049fa9e4066Sahrens 
2050fa9e4066Sahrens /*ARGSUSED*/
2051fa9e4066Sahrens static void
2052fa9e4066Sahrens dump_acl(objset_t *os, uint64_t object, void *data, size_t size)
2053fa9e4066Sahrens {
2054fa9e4066Sahrens }
2055fa9e4066Sahrens 
2056fa9e4066Sahrens /*ARGSUSED*/
2057fa9e4066Sahrens static void
2058fa9e4066Sahrens dump_dmu_objset(objset_t *os, uint64_t object, void *data, size_t size)
2059fa9e4066Sahrens {
2060fa9e4066Sahrens }
2061fa9e4066Sahrens 
20626de8f417SVictor Latushkin static object_viewer_t *object_viewer[DMU_OT_NUMTYPES + 1] = {
2063fa9e4066Sahrens 	dump_none,		/* unallocated			*/
2064fa9e4066Sahrens 	dump_zap,		/* object directory		*/
2065fa9e4066Sahrens 	dump_uint64,		/* object array			*/
2066fa9e4066Sahrens 	dump_none,		/* packed nvlist		*/
2067fa9e4066Sahrens 	dump_packed_nvlist,	/* packed nvlist size		*/
2068732885fcSMatthew Ahrens 	dump_none,		/* bpobj			*/
2069732885fcSMatthew Ahrens 	dump_bpobj,		/* bpobj header			*/
2070fa9e4066Sahrens 	dump_none,		/* SPA space map header		*/
2071fa9e4066Sahrens 	dump_none,		/* SPA space map		*/
2072fa9e4066Sahrens 	dump_none,		/* ZIL intent log		*/
2073fa9e4066Sahrens 	dump_dnode,		/* DMU dnode			*/
2074fa9e4066Sahrens 	dump_dmu_objset,	/* DMU objset			*/
2075ea8dc4b6Seschrock 	dump_dsl_dir,		/* DSL directory		*/
2076fa9e4066Sahrens 	dump_zap,		/* DSL directory child map	*/
2077fa9e4066Sahrens 	dump_zap,		/* DSL dataset snap map		*/
2078fa9e4066Sahrens 	dump_zap,		/* DSL props			*/
2079fa9e4066Sahrens 	dump_dsl_dataset,	/* DSL dataset			*/
2080fa9e4066Sahrens 	dump_znode,		/* ZFS znode			*/
2081da6c28aaSamw 	dump_acl,		/* ZFS V0 ACL			*/
2082fa9e4066Sahrens 	dump_uint8,		/* ZFS plain file		*/
2083e7437265Sahrens 	dump_zpldir,		/* ZFS directory		*/
2084fa9e4066Sahrens 	dump_zap,		/* ZFS master node		*/
2085fa9e4066Sahrens 	dump_zap,		/* ZFS delete queue		*/
2086fa9e4066Sahrens 	dump_uint8,		/* zvol object			*/
2087fa9e4066Sahrens 	dump_zap,		/* zvol prop			*/
2088fa9e4066Sahrens 	dump_uint8,		/* other uint8[]		*/
2089fa9e4066Sahrens 	dump_uint64,		/* other uint64[]		*/
2090fa9e4066Sahrens 	dump_zap,		/* other ZAP			*/
2091ea8dc4b6Seschrock 	dump_zap,		/* persistent error log		*/
209206eeb2adSek 	dump_uint8,		/* SPA history			*/
20934445fffbSMatthew Ahrens 	dump_history_offsets,	/* SPA history offsets		*/
2094b1b8ab34Slling 	dump_zap,		/* Pool properties		*/
2095ecd6cf80Smarks 	dump_zap,		/* DSL permissions		*/
2096da6c28aaSamw 	dump_acl,		/* ZFS ACL			*/
2097da6c28aaSamw 	dump_uint8,		/* ZFS SYSACL			*/
2098da6c28aaSamw 	dump_none,		/* FUID nvlist			*/
2099da6c28aaSamw 	dump_packed_nvlist,	/* FUID nvlist size		*/
2100088f3894Sahrens 	dump_zap,		/* DSL dataset next clones	*/
2101088f3894Sahrens 	dump_zap,		/* DSL scrub queue		*/
210214843421SMatthew Ahrens 	dump_zap,		/* ZFS user/group used		*/
210314843421SMatthew Ahrens 	dump_zap,		/* ZFS user/group quota		*/
2104842727c2SChris Kirby 	dump_zap,		/* snapshot refcount tags	*/
2105486ae710SMatthew Ahrens 	dump_ddt_zap,		/* DDT ZAP object		*/
2106b24ab676SJeff Bonwick 	dump_zap,		/* DDT statistics		*/
21070a586ceaSMark Shellenbaum 	dump_znode,		/* SA object			*/
21080a586ceaSMark Shellenbaum 	dump_zap,		/* SA Master Node		*/
21090a586ceaSMark Shellenbaum 	dump_sa_attrs,		/* SA attribute registration	*/
21100a586ceaSMark Shellenbaum 	dump_sa_layouts,	/* SA attribute layouts		*/
21113f9d6ad7SLin Ling 	dump_zap,		/* DSL scrub translations	*/
21123f9d6ad7SLin Ling 	dump_none,		/* fake dedup BP		*/
2113cde58dbcSMatthew Ahrens 	dump_zap,		/* deadlist			*/
2114cde58dbcSMatthew Ahrens 	dump_none,		/* deadlist hdr			*/
2115cde58dbcSMatthew Ahrens 	dump_zap,		/* dsl clones			*/
2116732885fcSMatthew Ahrens 	dump_bpobj_subobjs,	/* bpobj subobjs		*/
21170a586ceaSMark Shellenbaum 	dump_unknown,		/* Unknown type, must be last	*/
2118fa9e4066Sahrens };
2119fa9e4066Sahrens 
2120fa9e4066Sahrens static void
212154811da5SToomas Soome dump_object(objset_t *os, uint64_t object, int verbosity, int *print_header,
212254811da5SToomas Soome     uint64_t *dnode_slots_used)
2123fa9e4066Sahrens {
2124fa9e4066Sahrens 	dmu_buf_t *db = NULL;
2125fa9e4066Sahrens 	dmu_object_info_t doi;
2126fa9e4066Sahrens 	dnode_t *dn;
2127fa9e4066Sahrens 	void *bonus = NULL;
2128fa9e4066Sahrens 	size_t bsize = 0;
212954811da5SToomas Soome 	char iblk[32], dblk[32], lsize[32], asize[32], fill[32], dnsize[32];
21303f9d6ad7SLin Ling 	char bonus_size[32];
2131fa9e4066Sahrens 	char aux[50];
2132fa9e4066Sahrens 	int error;
2133fa9e4066Sahrens 
21340a055120SJason King 	/* make sure nicenum has enough space */
21350a055120SJason King 	CTASSERT(sizeof (iblk) >= NN_NUMBUF_SZ);
21360a055120SJason King 	CTASSERT(sizeof (dblk) >= NN_NUMBUF_SZ);
21370a055120SJason King 	CTASSERT(sizeof (lsize) >= NN_NUMBUF_SZ);
21380a055120SJason King 	CTASSERT(sizeof (asize) >= NN_NUMBUF_SZ);
21390a055120SJason King 	CTASSERT(sizeof (bonus_size) >= NN_NUMBUF_SZ);
21400a055120SJason King 
2141fa9e4066Sahrens 	if (*print_header) {
214254811da5SToomas Soome 		(void) printf("\n%10s  %3s  %5s  %5s  %5s  %6s  %5s  %6s  %s\n",
214354811da5SToomas Soome 		    "Object", "lvl", "iblk", "dblk", "dsize", "dnsize",
214454811da5SToomas Soome 		    "lsize", "%full", "type");
2145fa9e4066Sahrens 		*print_header = 0;
2146fa9e4066Sahrens 	}
2147fa9e4066Sahrens 
2148fa9e4066Sahrens 	if (object == 0) {
2149744947dcSTom Erickson 		dn = DMU_META_DNODE(os);
2150fa9e4066Sahrens 	} else {
2151ea8dc4b6Seschrock 		error = dmu_bonus_hold(os, object, FTAG, &db);
2152ea8dc4b6Seschrock 		if (error)
2153ea8dc4b6Seschrock 			fatal("dmu_bonus_hold(%llu) failed, errno %u",
2154ea8dc4b6Seschrock 			    object, error);
2155fa9e4066Sahrens 		bonus = db->db_data;
2156fa9e4066Sahrens 		bsize = db->db_size;
2157744947dcSTom Erickson 		dn = DB_DNODE((dmu_buf_impl_t *)db);
2158fa9e4066Sahrens 	}
2159fa9e4066Sahrens 	dmu_object_info_from_dnode(dn, &doi);
2160fa9e4066Sahrens 
216154811da5SToomas Soome 	if (dnode_slots_used != NULL)
216254811da5SToomas Soome 		*dnode_slots_used = doi.doi_dnodesize / DNODE_MIN_SIZE;
216354811da5SToomas Soome 
21640a055120SJason King 	zdb_nicenum(doi.doi_metadata_block_size, iblk, sizeof (iblk));
21650a055120SJason King 	zdb_nicenum(doi.doi_data_block_size, dblk, sizeof (dblk));
21660a055120SJason King 	zdb_nicenum(doi.doi_max_offset, lsize, sizeof (lsize));
21670a055120SJason King 	zdb_nicenum(doi.doi_physical_blocks_512 << 9, asize, sizeof (asize));
21680a055120SJason King 	zdb_nicenum(doi.doi_bonus_size, bonus_size, sizeof (bonus_size));
216954811da5SToomas Soome 	zdb_nicenum(doi.doi_dnodesize, dnsize, sizeof (dnsize));
2170b24ab676SJeff Bonwick 	(void) sprintf(fill, "%6.2f", 100.0 * doi.doi_fill_count *
2171bbfd46c4SJeff Bonwick 	    doi.doi_data_block_size / (object == 0 ? DNODES_PER_BLOCK : 1) /
2172bbfd46c4SJeff Bonwick 	    doi.doi_max_offset);
2173fa9e4066Sahrens 
2174fa9e4066Sahrens 	aux[0] = '\0';
2175fa9e4066Sahrens 
2176e7437265Sahrens 	if (doi.doi_checksum != ZIO_CHECKSUM_INHERIT || verbosity >= 6) {
2177fa9e4066Sahrens 		(void) snprintf(aux + strlen(aux), sizeof (aux), " (K=%s)",
21786de8f417SVictor Latushkin 		    ZDB_CHECKSUM_NAME(doi.doi_checksum));
2179e7437265Sahrens 	}
2180fa9e4066Sahrens 
2181e7437265Sahrens 	if (doi.doi_compress != ZIO_COMPRESS_INHERIT || verbosity >= 6) {
2182fa9e4066Sahrens 		(void) snprintf(aux + strlen(aux), sizeof (aux), " (Z=%s)",
21836de8f417SVictor Latushkin 		    ZDB_COMPRESS_NAME(doi.doi_compress));
2184e7437265Sahrens 	}
2185fa9e4066Sahrens 
218654811da5SToomas Soome 	(void) printf("%10" PRIu64
218754811da5SToomas Soome 	    "  %3u  %5s  %5s  %5s  %5s  %5s  %6s  %s%s\n",
218854811da5SToomas Soome 	    object, doi.doi_indirection, iblk, dblk,
218954811da5SToomas Soome 	    asize, dnsize, lsize, fill, ZDB_OT_NAME(doi.doi_type), aux);
2190fa9e4066Sahrens 
2191fa9e4066Sahrens 	if (doi.doi_bonus_type != DMU_OT_NONE && verbosity > 3) {
219254811da5SToomas Soome 		(void) printf("%10s  %3s  %5s  %5s  %5s  %5s  %5s  %6s  %s\n",
219354811da5SToomas Soome 		    "", "", "", "", "", "", bonus_size, "bonus",
21946de8f417SVictor Latushkin 		    ZDB_OT_NAME(doi.doi_bonus_type));
2195fa9e4066Sahrens 	}
2196fa9e4066Sahrens 
2197fa9e4066Sahrens 	if (verbosity >= 4) {
21980a586ceaSMark Shellenbaum 		(void) printf("\tdnode flags: %s%s%s\n",
219914843421SMatthew Ahrens 		    (dn->dn_phys->dn_flags & DNODE_FLAG_USED_BYTES) ?
220014843421SMatthew Ahrens 		    "USED_BYTES " : "",
220114843421SMatthew Ahrens 		    (dn->dn_phys->dn_flags & DNODE_FLAG_USERUSED_ACCOUNTED) ?
22020a586ceaSMark Shellenbaum 		    "USERUSED_ACCOUNTED " : "",
22030a586ceaSMark Shellenbaum 		    (dn->dn_phys->dn_flags & DNODE_FLAG_SPILL_BLKPTR) ?
22040a586ceaSMark Shellenbaum 		    "SPILL_BLKPTR" : "");
220514843421SMatthew Ahrens 		(void) printf("\tdnode maxblkid: %llu\n",
220614843421SMatthew Ahrens 		    (longlong_t)dn->dn_phys->dn_maxblkid);
220714843421SMatthew Ahrens 
22086de8f417SVictor Latushkin 		object_viewer[ZDB_OT_TYPE(doi.doi_bonus_type)](os, object,
22096de8f417SVictor Latushkin 		    bonus, bsize);
22106de8f417SVictor Latushkin 		object_viewer[ZDB_OT_TYPE(doi.doi_type)](os, object, NULL, 0);
2211fa9e4066Sahrens 		*print_header = 1;
2212fa9e4066Sahrens 	}
2213fa9e4066Sahrens 
2214fa9e4066Sahrens 	if (verbosity >= 5)
221588b7b0f2SMatthew Ahrens 		dump_indirect(dn);
2216fa9e4066Sahrens 
2217fa9e4066Sahrens 	if (verbosity >= 5) {
2218fa9e4066Sahrens 		/*
2219fa9e4066Sahrens 		 * Report the list of segments that comprise the object.
2220fa9e4066Sahrens 		 */
2221fa9e4066Sahrens 		uint64_t start = 0;
2222fa9e4066Sahrens 		uint64_t end;
2223fa9e4066Sahrens 		uint64_t blkfill = 1;
2224fa9e4066Sahrens 		int minlvl = 1;
2225fa9e4066Sahrens 
2226fa9e4066Sahrens 		if (dn->dn_type == DMU_OT_DNODE) {
2227fa9e4066Sahrens 			minlvl = 0;
2228fa9e4066Sahrens 			blkfill = DNODES_PER_BLOCK;
2229fa9e4066Sahrens 		}
2230fa9e4066Sahrens 
2231fa9e4066Sahrens 		for (;;) {
22323f9d6ad7SLin Ling 			char segsize[32];
22330a055120SJason King 			/* make sure nicenum has enough space */
22340a055120SJason King 			CTASSERT(sizeof (segsize) >= NN_NUMBUF_SZ);
2235cdb0ab79Smaybee 			error = dnode_next_offset(dn,
2236cdb0ab79Smaybee 			    0, &start, minlvl, blkfill, 0);
2237fa9e4066Sahrens 			if (error)
2238fa9e4066Sahrens 				break;
2239fa9e4066Sahrens 			end = start;
2240cdb0ab79Smaybee 			error = dnode_next_offset(dn,
2241cdb0ab79Smaybee 			    DNODE_FIND_HOLE, &end, minlvl, blkfill, 0);
22420a055120SJason King 			zdb_nicenum(end - start, segsize, sizeof (segsize));
2243fa9e4066Sahrens 			(void) printf("\t\tsegment [%016llx, %016llx)"
2244fa9e4066Sahrens 			    " size %5s\n", (u_longlong_t)start,
2245fa9e4066Sahrens 			    (u_longlong_t)end, segsize);
2246fa9e4066Sahrens 			if (error)
2247fa9e4066Sahrens 				break;
2248fa9e4066Sahrens 			start = end;
2249fa9e4066Sahrens 		}
2250fa9e4066Sahrens 	}
2251fa9e4066Sahrens 
2252fa9e4066Sahrens 	if (db != NULL)
2253ea8dc4b6Seschrock 		dmu_buf_rele(db, FTAG);
2254fa9e4066Sahrens }
2255fa9e4066Sahrens 
225617fb938fSMatthew Ahrens static void
225717fb938fSMatthew Ahrens count_dir_mos_objects(dsl_dir_t *dd)
225817fb938fSMatthew Ahrens {
225917fb938fSMatthew Ahrens 	mos_obj_refd(dd->dd_object);
226017fb938fSMatthew Ahrens 	mos_obj_refd(dsl_dir_phys(dd)->dd_child_dir_zapobj);
226117fb938fSMatthew Ahrens 	mos_obj_refd(dsl_dir_phys(dd)->dd_deleg_zapobj);
226217fb938fSMatthew Ahrens 	mos_obj_refd(dsl_dir_phys(dd)->dd_props_zapobj);
226317fb938fSMatthew Ahrens 	mos_obj_refd(dsl_dir_phys(dd)->dd_clones);
226417fb938fSMatthew Ahrens }
226517fb938fSMatthew Ahrens 
226617fb938fSMatthew Ahrens static void
226717fb938fSMatthew Ahrens count_ds_mos_objects(dsl_dataset_t *ds)
226817fb938fSMatthew Ahrens {
226917fb938fSMatthew Ahrens 	mos_obj_refd(ds->ds_object);
227017fb938fSMatthew Ahrens 	mos_obj_refd(dsl_dataset_phys(ds)->ds_next_clones_obj);
227117fb938fSMatthew Ahrens 	mos_obj_refd(dsl_dataset_phys(ds)->ds_props_obj);
227217fb938fSMatthew Ahrens 	mos_obj_refd(dsl_dataset_phys(ds)->ds_userrefs_obj);
227317fb938fSMatthew Ahrens 	mos_obj_refd(dsl_dataset_phys(ds)->ds_snapnames_zapobj);
227417fb938fSMatthew Ahrens 
227517fb938fSMatthew Ahrens 	if (!dsl_dataset_is_snapshot(ds)) {
227617fb938fSMatthew Ahrens 		count_dir_mos_objects(ds->ds_dir);
227717fb938fSMatthew Ahrens 	}
227817fb938fSMatthew Ahrens }
227917fb938fSMatthew Ahrens 
22803f7978d0SAlan Somers static const char *objset_types[DMU_OST_NUMTYPES] = {
2281fa9e4066Sahrens 	"NONE", "META", "ZPL", "ZVOL", "OTHER", "ANY" };
2282fa9e4066Sahrens 
2283fa9e4066Sahrens static void
2284fa9e4066Sahrens dump_dir(objset_t *os)
2285fa9e4066Sahrens {
2286fa9e4066Sahrens 	dmu_objset_stats_t dds;
2287fa9e4066Sahrens 	uint64_t object, object_count;
2288a2eea2e1Sahrens 	uint64_t refdbytes, usedobjs, scratch;
22893f9d6ad7SLin Ling 	char numbuf[32];
229014843421SMatthew Ahrens 	char blkbuf[BP_SPRINTF_LEN + 20];
22919adfa60dSMatthew Ahrens 	char osname[ZFS_MAX_DATASET_NAME_LEN];
22923f7978d0SAlan Somers 	const char *type = "UNKNOWN";
2293fa9e4066Sahrens 	int verbosity = dump_opt['d'];
2294fa9e4066Sahrens 	int print_header = 1;
22953f7978d0SAlan Somers 	unsigned i;
22963f7978d0SAlan Somers 	int error;
229754811da5SToomas Soome 	uint64_t total_slots_used = 0;
229854811da5SToomas Soome 	uint64_t max_slot_used = 0;
229954811da5SToomas Soome 	uint64_t dnode_slots;
2300fa9e4066Sahrens 
23010a055120SJason King 	/* make sure nicenum has enough space */
23020a055120SJason King 	CTASSERT(sizeof (numbuf) >= NN_NUMBUF_SZ);
23030a055120SJason King 
23043b2aab18SMatthew Ahrens 	dsl_pool_config_enter(dmu_objset_pool(os), FTAG);
2305a2eea2e1Sahrens 	dmu_objset_fast_stat(os, &dds);
23063b2aab18SMatthew Ahrens 	dsl_pool_config_exit(dmu_objset_pool(os), FTAG);
2307fa9e4066Sahrens 
2308fa9e4066Sahrens 	if (dds.dds_type < DMU_OST_NUMTYPES)
2309fa9e4066Sahrens 		type = objset_types[dds.dds_type];
2310fa9e4066Sahrens 
2311fa9e4066Sahrens 	if (dds.dds_type == DMU_OST_META) {
2312fa9e4066Sahrens 		dds.dds_creation_txg = TXG_INITIAL;
23135d7b4d43SMatthew Ahrens 		usedobjs = BP_GET_FILL(os->os_rootbp);
2314c1379625SJustin T. Gibbs 		refdbytes = dsl_dir_phys(os->os_spa->spa_dsl_pool->dp_mos_dir)->
2315c1379625SJustin T. Gibbs 		    dd_used_bytes;
2316a2eea2e1Sahrens 	} else {
2317a2eea2e1Sahrens 		dmu_objset_space(os, &refdbytes, &scratch, &usedobjs, &scratch);
2318fa9e4066Sahrens 	}
2319fa9e4066Sahrens 
23205d7b4d43SMatthew Ahrens 	ASSERT3U(usedobjs, ==, BP_GET_FILL(os->os_rootbp));
2321fa9e4066Sahrens 
23220a055120SJason King 	zdb_nicenum(refdbytes, numbuf, sizeof (numbuf));
2323fa9e4066Sahrens 
2324fa9e4066Sahrens 	if (verbosity >= 4) {
232543466aaeSMax Grossman 		(void) snprintf(blkbuf, sizeof (blkbuf), ", rootbp ");
232643466aaeSMax Grossman 		(void) snprintf_blkptr(blkbuf + strlen(blkbuf),
232743466aaeSMax Grossman 		    sizeof (blkbuf) - strlen(blkbuf), os->os_rootbp);
2328fa9e4066Sahrens 	} else {
2329fa9e4066Sahrens 		blkbuf[0] = '\0';
2330fa9e4066Sahrens 	}
2331fa9e4066Sahrens 
2332fa9e4066Sahrens 	dmu_objset_name(os, osname);
2333fa9e4066Sahrens 
2334a2eea2e1Sahrens 	(void) printf("Dataset %s [%s], ID %llu, cr_txg %llu, "
2335ade2c828SSerapheim Dimitropoulos 	    "%s, %llu objects%s%s\n",
2336fa9e4066Sahrens 	    osname, type, (u_longlong_t)dmu_objset_id(os),
2337fa9e4066Sahrens 	    (u_longlong_t)dds.dds_creation_txg,
2338ade2c828SSerapheim Dimitropoulos 	    numbuf, (u_longlong_t)usedobjs, blkbuf,
2339ade2c828SSerapheim Dimitropoulos 	    (dds.dds_inconsistent) ? " (inconsistent)" : "");
2340fa9e4066Sahrens 
2341b24ab676SJeff Bonwick 	if (zopt_objects != 0) {
2342b24ab676SJeff Bonwick 		for (i = 0; i < zopt_objects; i++)
2343b24ab676SJeff Bonwick 			dump_object(os, zopt_object[i], verbosity,
234454811da5SToomas Soome 			    &print_header, NULL);
2345b24ab676SJeff Bonwick 		(void) printf("\n");
2346b24ab676SJeff Bonwick 		return;
2347b24ab676SJeff Bonwick 	}
2348b24ab676SJeff Bonwick 
2349b24ab676SJeff Bonwick 	if (dump_opt['i'] != 0 || verbosity >= 2)
2350b24ab676SJeff Bonwick 		dump_intent_log(dmu_objset_zil(os));
2351fa9e4066Sahrens 
23525cabbc6bSPrashanth Sreenivasa 	if (dmu_objset_ds(os) != NULL) {
23535cabbc6bSPrashanth Sreenivasa 		dsl_dataset_t *ds = dmu_objset_ds(os);
23545cabbc6bSPrashanth Sreenivasa 		dump_deadlist(&ds->ds_deadlist);
23555cabbc6bSPrashanth Sreenivasa 
23565cabbc6bSPrashanth Sreenivasa 		if (dsl_dataset_remap_deadlist_exists(ds)) {
23575cabbc6bSPrashanth Sreenivasa 			(void) printf("ds_remap_deadlist:\n");
23585cabbc6bSPrashanth Sreenivasa 			dump_deadlist(&ds->ds_remap_deadlist);
23595cabbc6bSPrashanth Sreenivasa 		}
236017fb938fSMatthew Ahrens 		count_ds_mos_objects(ds);
23615cabbc6bSPrashanth Sreenivasa 	}
2362fa9e4066Sahrens 
2363fa9e4066Sahrens 	if (verbosity < 2)
2364fa9e4066Sahrens 		return;
2365fa9e4066Sahrens 
236643466aaeSMax Grossman 	if (BP_IS_HOLE(os->os_rootbp))
2367088f3894Sahrens 		return;
2368088f3894Sahrens 
236954811da5SToomas Soome 	dump_object(os, 0, verbosity, &print_header, NULL);
237014843421SMatthew Ahrens 	object_count = 0;
2371744947dcSTom Erickson 	if (DMU_USERUSED_DNODE(os) != NULL &&
2372744947dcSTom Erickson 	    DMU_USERUSED_DNODE(os)->dn_type != 0) {
237354811da5SToomas Soome 		dump_object(os, DMU_USERUSED_OBJECT, verbosity, &print_header,
237454811da5SToomas Soome 		    NULL);
237554811da5SToomas Soome 		dump_object(os, DMU_GROUPUSED_OBJECT, verbosity, &print_header,
237654811da5SToomas Soome 		    NULL);
237714843421SMatthew Ahrens 	}
2378fa9e4066Sahrens 
2379fa9e4066Sahrens 	object = 0;
23806754306eSahrens 	while ((error = dmu_object_next(os, &object, B_FALSE, 0)) == 0) {
238154811da5SToomas Soome 		dump_object(os, object, verbosity, &print_header, &dnode_slots);
2382fa9e4066Sahrens 		object_count++;
238354811da5SToomas Soome 		total_slots_used += dnode_slots;
238454811da5SToomas Soome 		max_slot_used = object + dnode_slots - 1;
2385fa9e4066Sahrens 	}
2386fa9e4066Sahrens 
2387a2eea2e1Sahrens 	ASSERT3U(object_count, ==, usedobjs);
2388fa9e4066Sahrens 
2389fa9e4066Sahrens 	(void) printf("\n");
2390fa9e4066Sahrens 
239154811da5SToomas Soome 	(void) printf("    Dnode slots:\n");
239254811da5SToomas Soome 	(void) printf("\tTotal used:    %10llu\n",
239354811da5SToomas Soome 	    (u_longlong_t)total_slots_used);
239454811da5SToomas Soome 	(void) printf("\tMax used:      %10llu\n",
239554811da5SToomas Soome 	    (u_longlong_t)max_slot_used);
239654811da5SToomas Soome 	(void) printf("\tPercent empty: %10lf\n",
239754811da5SToomas Soome 	    (double)(max_slot_used - total_slots_used)*100 /
239854811da5SToomas Soome 	    (double)max_slot_used);
239954811da5SToomas Soome 
240054811da5SToomas Soome 	(void) printf("\n");
240154811da5SToomas Soome 
2402ccba0801SRich Morris 	if (error != ESRCH) {
2403ccba0801SRich Morris 		(void) fprintf(stderr, "dmu_object_next() = %d\n", error);
2404ccba0801SRich Morris 		abort();
2405ccba0801SRich Morris 	}
240620b5dafbSPaul Dagnelie 	if (leaked_objects != 0) {
240720b5dafbSPaul Dagnelie 		(void) printf("%d potentially leaked objects detected\n",
240820b5dafbSPaul Dagnelie 		    leaked_objects);
240920b5dafbSPaul Dagnelie 		leaked_objects = 0;
241020b5dafbSPaul Dagnelie 	}
2411fa9e4066Sahrens }
2412fa9e4066Sahrens 
2413fa9e4066Sahrens static void
241453b9a4a9SVictor Latushkin dump_uberblock(uberblock_t *ub, const char *header, const char *footer)
2415fa9e4066Sahrens {
2416fa9e4066Sahrens 	time_t timestamp = ub->ub_timestamp;
2417fa9e4066Sahrens 
24183f7978d0SAlan Somers 	(void) printf("%s", header ? header : "");
2419fa9e4066Sahrens 	(void) printf("\tmagic = %016llx\n", (u_longlong_t)ub->ub_magic);
2420fa9e4066Sahrens 	(void) printf("\tversion = %llu\n", (u_longlong_t)ub->ub_version);
2421fa9e4066Sahrens 	(void) printf("\ttxg = %llu\n", (u_longlong_t)ub->ub_txg);
2422fa9e4066Sahrens 	(void) printf("\tguid_sum = %llu\n", (u_longlong_t)ub->ub_guid_sum);
2423fa9e4066Sahrens 	(void) printf("\ttimestamp = %llu UTC = %s",
2424fa9e4066Sahrens 	    (u_longlong_t)ub->ub_timestamp, asctime(localtime(&timestamp)));
2425e0f1c0afSOlaf Faaland 
2426e0f1c0afSOlaf Faaland 	(void) printf("\tmmp_magic = %016llx\n",
2427e0f1c0afSOlaf Faaland 	    (u_longlong_t)ub->ub_mmp_magic);
2428e0f1c0afSOlaf Faaland 	if (ub->ub_mmp_magic == MMP_MAGIC)
2429e0f1c0afSOlaf Faaland 		(void) printf("\tmmp_delay = %0llu\n",
2430e0f1c0afSOlaf Faaland 		    (u_longlong_t)ub->ub_mmp_delay);
2431e0f1c0afSOlaf Faaland 
2432fa9e4066Sahrens 	if (dump_opt['u'] >= 3) {
2433fbabab8fSmaybee 		char blkbuf[BP_SPRINTF_LEN];
243443466aaeSMax Grossman 		snprintf_blkptr(blkbuf, sizeof (blkbuf), &ub->ub_rootbp);
2435fa9e4066Sahrens 		(void) printf("\trootbp = %s\n", blkbuf);
2436fa9e4066Sahrens 	}
243786714001SSerapheim Dimitropoulos 	(void) printf("\tcheckpoint_txg = %llu\n",
243886714001SSerapheim Dimitropoulos 	    (u_longlong_t)ub->ub_checkpoint_txg);
24393f7978d0SAlan Somers 	(void) printf("%s", footer ? footer : "");
2440fa9e4066Sahrens }
2441fa9e4066Sahrens 
2442fa9e4066Sahrens static void
244307428bdfSVictor Latushkin dump_config(spa_t *spa)
2444fa9e4066Sahrens {
244507428bdfSVictor Latushkin 	dmu_buf_t *db;
244607428bdfSVictor Latushkin 	size_t nvsize = 0;
244707428bdfSVictor Latushkin 	int error = 0;
244807428bdfSVictor Latushkin 
2449fa9e4066Sahrens 
245007428bdfSVictor Latushkin 	error = dmu_bonus_hold(spa->spa_meta_objset,
245107428bdfSVictor Latushkin 	    spa->spa_config_object, FTAG, &db);
245207428bdfSVictor Latushkin 
245307428bdfSVictor Latushkin 	if (error == 0) {
245407428bdfSVictor Latushkin 		nvsize = *(uint64_t *)db->db_data;
245507428bdfSVictor Latushkin 		dmu_buf_rele(db, FTAG);
245607428bdfSVictor Latushkin 
245707428bdfSVictor Latushkin 		(void) printf("\nMOS Configuration:\n");
245807428bdfSVictor Latushkin 		dump_packed_nvlist(spa->spa_meta_objset,
245907428bdfSVictor Latushkin 		    spa->spa_config_object, (void *)&nvsize, 1);
246007428bdfSVictor Latushkin 	} else {
246107428bdfSVictor Latushkin 		(void) fprintf(stderr, "dmu_bonus_hold(%llu) failed, errno %d",
246207428bdfSVictor Latushkin 		    (u_longlong_t)spa->spa_config_object, error);
2463fa9e4066Sahrens 	}
2464fa9e4066Sahrens }
2465fa9e4066Sahrens 
2466c5904d13Seschrock static void
2467c5904d13Seschrock dump_cachefile(const char *cachefile)
2468c5904d13Seschrock {
2469c5904d13Seschrock 	int fd;
2470c5904d13Seschrock 	struct stat64 statbuf;
2471c5904d13Seschrock 	char *buf;
2472c5904d13Seschrock 	nvlist_t *config;
2473c5904d13Seschrock 
2474c5904d13Seschrock 	if ((fd = open64(cachefile, O_RDONLY)) < 0) {
2475c5904d13Seschrock 		(void) printf("cannot open '%s': %s\n", cachefile,
2476c5904d13Seschrock 		    strerror(errno));
2477c5904d13Seschrock 		exit(1);
2478c5904d13Seschrock 	}
2479c5904d13Seschrock 
2480c5904d13Seschrock 	if (fstat64(fd, &statbuf) != 0) {
2481c5904d13Seschrock 		(void) printf("failed to stat '%s': %s\n", cachefile,
2482c5904d13Seschrock 		    strerror(errno));
2483c5904d13Seschrock 		exit(1);
2484c5904d13Seschrock 	}
2485c5904d13Seschrock 
2486c5904d13Seschrock 	if ((buf = malloc(statbuf.st_size)) == NULL) {
2487c5904d13Seschrock 		(void) fprintf(stderr, "failed to allocate %llu bytes\n",
2488c5904d13Seschrock 		    (u_longlong_t)statbuf.st_size);
2489c5904d13Seschrock 		exit(1);
2490c5904d13Seschrock 	}
2491c5904d13Seschrock 
2492c5904d13Seschrock 	if (read(fd, buf, statbuf.st_size) != statbuf.st_size) {
2493c5904d13Seschrock 		(void) fprintf(stderr, "failed to read %llu bytes\n",
2494c5904d13Seschrock 		    (u_longlong_t)statbuf.st_size);
2495c5904d13Seschrock 		exit(1);
2496c5904d13Seschrock 	}
2497c5904d13Seschrock 
2498c5904d13Seschrock 	(void) close(fd);
2499c5904d13Seschrock 
2500c5904d13Seschrock 	if (nvlist_unpack(buf, statbuf.st_size, &config, 0) != 0) {
2501c5904d13Seschrock 		(void) fprintf(stderr, "failed to unpack nvlist\n");
2502c5904d13Seschrock 		exit(1);
2503c5904d13Seschrock 	}
2504c5904d13Seschrock 
2505c5904d13Seschrock 	free(buf);
2506c5904d13Seschrock 
2507c5904d13Seschrock 	dump_nvlist(config, 0);
2508c5904d13Seschrock 
2509c5904d13Seschrock 	nvlist_free(config);
2510c5904d13Seschrock }
2511c5904d13Seschrock 
251253b9a4a9SVictor Latushkin #define	ZDB_MAX_UB_HEADER_SIZE 32
251353b9a4a9SVictor Latushkin 
251453b9a4a9SVictor Latushkin static void
251553b9a4a9SVictor Latushkin dump_label_uberblocks(vdev_label_t *lbl, uint64_t ashift)
251653b9a4a9SVictor Latushkin {
251753b9a4a9SVictor Latushkin 	vdev_t vd;
251853b9a4a9SVictor Latushkin 	vdev_t *vdp = &vd;
251953b9a4a9SVictor Latushkin 	char header[ZDB_MAX_UB_HEADER_SIZE];
252053b9a4a9SVictor Latushkin 
252153b9a4a9SVictor Latushkin 	vd.vdev_ashift = ashift;
252253b9a4a9SVictor Latushkin 	vdp->vdev_top = vdp;
252353b9a4a9SVictor Latushkin 
252453b9a4a9SVictor Latushkin 	for (int i = 0; i < VDEV_UBERBLOCK_COUNT(vdp); i++) {
252553b9a4a9SVictor Latushkin 		uint64_t uoff = VDEV_UBERBLOCK_OFFSET(vdp, i);
252653b9a4a9SVictor Latushkin 		uberblock_t *ub = (void *)((char *)lbl + uoff);
252753b9a4a9SVictor Latushkin 
252853b9a4a9SVictor Latushkin 		if (uberblock_verify(ub))
252953b9a4a9SVictor Latushkin 			continue;
2530e0f1c0afSOlaf Faaland 
2531e0f1c0afSOlaf Faaland 		if ((dump_opt['u'] < 4) &&
2532e0f1c0afSOlaf Faaland 		    (ub->ub_mmp_magic == MMP_MAGIC) && ub->ub_mmp_delay &&
2533e0f1c0afSOlaf Faaland 		    (i >= VDEV_UBERBLOCK_COUNT(&vd) - MMP_BLOCKS_PER_LABEL))
2534e0f1c0afSOlaf Faaland 			continue;
2535e0f1c0afSOlaf Faaland 
253653b9a4a9SVictor Latushkin 		(void) snprintf(header, ZDB_MAX_UB_HEADER_SIZE,
253753b9a4a9SVictor Latushkin 		    "Uberblock[%d]\n", i);
253853b9a4a9SVictor Latushkin 		dump_uberblock(ub, header, "");
253953b9a4a9SVictor Latushkin 	}
254053b9a4a9SVictor Latushkin }
254153b9a4a9SVictor Latushkin 
2542ed61ec1dSYuri Pankov static char curpath[PATH_MAX];
2543ed61ec1dSYuri Pankov 
2544ed61ec1dSYuri Pankov /*
2545ed61ec1dSYuri Pankov  * Iterate through the path components, recursively passing
2546ed61ec1dSYuri Pankov  * current one's obj and remaining path until we find the obj
2547ed61ec1dSYuri Pankov  * for the last one.
2548ed61ec1dSYuri Pankov  */
2549ed61ec1dSYuri Pankov static int
2550ed61ec1dSYuri Pankov dump_path_impl(objset_t *os, uint64_t obj, char *name)
2551ed61ec1dSYuri Pankov {
2552ed61ec1dSYuri Pankov 	int err;
2553ed61ec1dSYuri Pankov 	int header = 1;
2554ed61ec1dSYuri Pankov 	uint64_t child_obj;
2555ed61ec1dSYuri Pankov 	char *s;
2556ed61ec1dSYuri Pankov 	dmu_buf_t *db;
2557ed61ec1dSYuri Pankov 	dmu_object_info_t doi;
2558ed61ec1dSYuri Pankov 
2559ed61ec1dSYuri Pankov 	if ((s = strchr(name, '/')) != NULL)
2560ed61ec1dSYuri Pankov 		*s = '\0';
2561ed61ec1dSYuri Pankov 	err = zap_lookup(os, obj, name, 8, 1, &child_obj);
2562ed61ec1dSYuri Pankov 
2563ed61ec1dSYuri Pankov 	(void) strlcat(curpath, name, sizeof (curpath));
2564ed61ec1dSYuri Pankov 
2565ed61ec1dSYuri Pankov 	if (err != 0) {
2566ed61ec1dSYuri Pankov 		(void) fprintf(stderr, "failed to lookup %s: %s\n",
2567ed61ec1dSYuri Pankov 		    curpath, strerror(err));
2568ed61ec1dSYuri Pankov 		return (err);
2569ed61ec1dSYuri Pankov 	}
2570ed61ec1dSYuri Pankov 
2571ed61ec1dSYuri Pankov 	child_obj = ZFS_DIRENT_OBJ(child_obj);
2572ed61ec1dSYuri Pankov 	err = sa_buf_hold(os, child_obj, FTAG, &db);
2573ed61ec1dSYuri Pankov 	if (err != 0) {
2574ed61ec1dSYuri Pankov 		(void) fprintf(stderr,
2575ed61ec1dSYuri Pankov 		    "failed to get SA dbuf for obj %llu: %s\n",
2576ed61ec1dSYuri Pankov 		    (u_longlong_t)child_obj, strerror(err));
2577ed61ec1dSYuri Pankov 		return (EINVAL);
2578ed61ec1dSYuri Pankov 	}
2579ed61ec1dSYuri Pankov 	dmu_object_info_from_db(db, &doi);
2580ed61ec1dSYuri Pankov 	sa_buf_rele(db, FTAG);
2581ed61ec1dSYuri Pankov 
2582ed61ec1dSYuri Pankov 	if (doi.doi_bonus_type != DMU_OT_SA &&
2583ed61ec1dSYuri Pankov 	    doi.doi_bonus_type != DMU_OT_ZNODE) {
2584ed61ec1dSYuri Pankov 		(void) fprintf(stderr, "invalid bonus type %d for obj %llu\n",
2585ed61ec1dSYuri Pankov 		    doi.doi_bonus_type, (u_longlong_t)child_obj);
2586ed61ec1dSYuri Pankov 		return (EINVAL);
2587ed61ec1dSYuri Pankov 	}
2588ed61ec1dSYuri Pankov 
2589ed61ec1dSYuri Pankov 	if (dump_opt['v'] > 6) {
2590ed61ec1dSYuri Pankov 		(void) printf("obj=%llu %s type=%d bonustype=%d\n",
2591ed61ec1dSYuri Pankov 		    (u_longlong_t)child_obj, curpath, doi.doi_type,
2592ed61ec1dSYuri Pankov 		    doi.doi_bonus_type);
2593ed61ec1dSYuri Pankov 	}
2594ed61ec1dSYuri Pankov 
2595ed61ec1dSYuri Pankov 	(void) strlcat(curpath, "/", sizeof (curpath));
2596ed61ec1dSYuri Pankov 
2597ed61ec1dSYuri Pankov 	switch (doi.doi_type) {
2598ed61ec1dSYuri Pankov 	case DMU_OT_DIRECTORY_CONTENTS:
2599ed61ec1dSYuri Pankov 		if (s != NULL && *(s + 1) != '\0')
2600ed61ec1dSYuri Pankov 			return (dump_path_impl(os, child_obj, s + 1));
2601ed61ec1dSYuri Pankov 		/*FALLTHROUGH*/
2602ed61ec1dSYuri Pankov 	case DMU_OT_PLAIN_FILE_CONTENTS:
260354811da5SToomas Soome 		dump_object(os, child_obj, dump_opt['v'], &header, NULL);
2604ed61ec1dSYuri Pankov 		return (0);
2605ed61ec1dSYuri Pankov 	default:
2606ed61ec1dSYuri Pankov 		(void) fprintf(stderr, "object %llu has non-file/directory "
2607ed61ec1dSYuri Pankov 		    "type %d\n", (u_longlong_t)obj, doi.doi_type);
2608ed61ec1dSYuri Pankov 		break;
2609ed61ec1dSYuri Pankov 	}
2610ed61ec1dSYuri Pankov 
2611ed61ec1dSYuri Pankov 	return (EINVAL);
2612ed61ec1dSYuri Pankov }
2613ed61ec1dSYuri Pankov 
2614ed61ec1dSYuri Pankov /*
2615ed61ec1dSYuri Pankov  * Dump the blocks for the object specified by path inside the dataset.
2616ed61ec1dSYuri Pankov  */
2617ed61ec1dSYuri Pankov static int
2618ed61ec1dSYuri Pankov dump_path(char *ds, char *path)
2619ed61ec1dSYuri Pankov {
2620ed61ec1dSYuri Pankov 	int err;
2621ed61ec1dSYuri Pankov 	objset_t *os;
2622ed61ec1dSYuri Pankov 	uint64_t root_obj;
2623ed61ec1dSYuri Pankov 
2624ed61ec1dSYuri Pankov 	err = open_objset(ds, DMU_OST_ZFS, FTAG, &os);
2625ed61ec1dSYuri Pankov 	if (err != 0)
2626ed61ec1dSYuri Pankov 		return (err);
2627ed61ec1dSYuri Pankov 
2628ed61ec1dSYuri Pankov 	err = zap_lookup(os, MASTER_NODE_OBJ, ZFS_ROOT_OBJ, 8, 1, &root_obj);
2629ed61ec1dSYuri Pankov 	if (err != 0) {
2630ed61ec1dSYuri Pankov 		(void) fprintf(stderr, "can't lookup root znode: %s\n",
2631ed61ec1dSYuri Pankov 		    strerror(err));
2632ed61ec1dSYuri Pankov 		dmu_objset_disown(os, FTAG);
2633ed61ec1dSYuri Pankov 		return (EINVAL);
2634ed61ec1dSYuri Pankov 	}
2635ed61ec1dSYuri Pankov 
2636ed61ec1dSYuri Pankov 	(void) snprintf(curpath, sizeof (curpath), "dataset=%s path=/", ds);
2637ed61ec1dSYuri Pankov 
2638ed61ec1dSYuri Pankov 	err = dump_path_impl(os, root_obj, path);
2639ed61ec1dSYuri Pankov 
2640ed61ec1dSYuri Pankov 	close_objset(os, FTAG);
2641ed61ec1dSYuri Pankov 	return (err);
2642ed61ec1dSYuri Pankov }
2643ed61ec1dSYuri Pankov 
264464723e36SYuri Pankov static int
2645fa9e4066Sahrens dump_label(const char *dev)
2646fa9e4066Sahrens {
2647fa9e4066Sahrens 	int fd;
2648fa9e4066Sahrens 	vdev_label_t label;
264964723e36SYuri Pankov 	char path[MAXPATHLEN];
265064723e36SYuri Pankov 	char *buf = label.vl_vdev_phys.vp_nvlist;
2651fa9e4066Sahrens 	size_t buflen = sizeof (label.vl_vdev_phys.vp_nvlist);
2652fa9e4066Sahrens 	struct stat64 statbuf;
265353b9a4a9SVictor Latushkin 	uint64_t psize, ashift;
265464723e36SYuri Pankov 	boolean_t label_found = B_FALSE;
265564723e36SYuri Pankov 
265664723e36SYuri Pankov 	(void) strlcpy(path, dev, sizeof (path));
265764723e36SYuri Pankov 	if (dev[0] == '/') {
265864723e36SYuri Pankov 		if (strncmp(dev, ZFS_DISK_ROOTD,
265964723e36SYuri Pankov 		    strlen(ZFS_DISK_ROOTD)) == 0) {
266064723e36SYuri Pankov 			(void) snprintf(path, sizeof (path), "%s%s",
266164723e36SYuri Pankov 			    ZFS_RDISK_ROOTD, dev + strlen(ZFS_DISK_ROOTD));
266264723e36SYuri Pankov 		}
266364723e36SYuri Pankov 	} else if (stat64(path, &statbuf) != 0) {
266464723e36SYuri Pankov 		char *s;
2665c6065d0fSGeorge Wilson 
266664723e36SYuri Pankov 		(void) snprintf(path, sizeof (path), "%s%s", ZFS_RDISK_ROOTD,
266764723e36SYuri Pankov 		    dev);
266822c8b958SYuri Pankov 		if (((s = strrchr(dev, 's')) == NULL &&
266922c8b958SYuri Pankov 		    (s = strchr(dev, 'p')) == NULL) ||
267022c8b958SYuri Pankov 		    !isdigit(*(s + 1)))
267164723e36SYuri Pankov 			(void) strlcat(path, "s0", sizeof (path));
2672fa9e4066Sahrens 	}
2673fa9e4066Sahrens 
267422c8b958SYuri Pankov 	if ((fd = open64(path, O_RDONLY)) < 0) {
267522c8b958SYuri Pankov 		(void) fprintf(stderr, "cannot open '%s': %s\n", path,
2676fa9e4066Sahrens 		    strerror(errno));
2677c6065d0fSGeorge Wilson 		exit(1);
2678c6065d0fSGeorge Wilson 	}
2679c6065d0fSGeorge Wilson 
268022c8b958SYuri Pankov 	if (fstat64(fd, &statbuf) != 0) {
268122c8b958SYuri Pankov 		(void) fprintf(stderr, "failed to stat '%s': %s\n", path,
268222c8b958SYuri Pankov 		    strerror(errno));
268322c8b958SYuri Pankov 		(void) close(fd);
268464723e36SYuri Pankov 		exit(1);
268564723e36SYuri Pankov 	}
268664723e36SYuri Pankov 
268722c8b958SYuri Pankov 	if (S_ISBLK(statbuf.st_mode)) {
268822c8b958SYuri Pankov 		(void) fprintf(stderr,
268922c8b958SYuri Pankov 		    "cannot use '%s': character device required\n", path);
269022c8b958SYuri Pankov 		(void) close(fd);
2691c6065d0fSGeorge Wilson 		exit(1);
2692fa9e4066Sahrens 	}
2693fa9e4066Sahrens 
2694fa9e4066Sahrens 	psize = statbuf.st_size;
2695fa9e4066Sahrens 	psize = P2ALIGN(psize, (uint64_t)sizeof (vdev_label_t));
2696fa9e4066Sahrens 
269753b9a4a9SVictor Latushkin 	for (int l = 0; l < VDEV_LABELS; l++) {
2698fa9e4066Sahrens 		nvlist_t *config = NULL;
2699fa9e4066Sahrens 
270064723e36SYuri Pankov 		if (!dump_opt['q']) {
270164723e36SYuri Pankov 			(void) printf("------------------------------------\n");
270264723e36SYuri Pankov 			(void) printf("LABEL %d\n", l);
270364723e36SYuri Pankov 			(void) printf("------------------------------------\n");
270464723e36SYuri Pankov 		}
2705fa9e4066Sahrens 
27060d981225Seschrock 		if (pread64(fd, &label, sizeof (label),
2707fa9e4066Sahrens 		    vdev_label_offset(psize, l, 0)) != sizeof (label)) {
270864723e36SYuri Pankov 			if (!dump_opt['q'])
270964723e36SYuri Pankov 				(void) printf("failed to read label %d\n", l);
2710fa9e4066Sahrens 			continue;
2711fa9e4066Sahrens 		}
2712fa9e4066Sahrens 
2713fa9e4066Sahrens 		if (nvlist_unpack(buf, buflen, &config, 0) != 0) {
271464723e36SYuri Pankov 			if (!dump_opt['q'])
271564723e36SYuri Pankov 				(void) printf("failed to unpack label %d\n", l);
271653b9a4a9SVictor Latushkin 			ashift = SPA_MINBLOCKSHIFT;
271753b9a4a9SVictor Latushkin 		} else {
271853b9a4a9SVictor Latushkin 			nvlist_t *vdev_tree = NULL;
271953b9a4a9SVictor Latushkin 
272064723e36SYuri Pankov 			if (!dump_opt['q'])
272164723e36SYuri Pankov 				dump_nvlist(config, 4);
272253b9a4a9SVictor Latushkin 			if ((nvlist_lookup_nvlist(config,
272353b9a4a9SVictor Latushkin 			    ZPOOL_CONFIG_VDEV_TREE, &vdev_tree) != 0) ||
272453b9a4a9SVictor Latushkin 			    (nvlist_lookup_uint64(vdev_tree,
272553b9a4a9SVictor Latushkin 			    ZPOOL_CONFIG_ASHIFT, &ashift) != 0))
272653b9a4a9SVictor Latushkin 				ashift = SPA_MINBLOCKSHIFT;
272753b9a4a9SVictor Latushkin 			nvlist_free(config);
272864723e36SYuri Pankov 			label_found = B_TRUE;
2729fa9e4066Sahrens 		}
273053b9a4a9SVictor Latushkin 		if (dump_opt['u'])
273153b9a4a9SVictor Latushkin 			dump_label_uberblocks(&label, ashift);
2732fa9e4066Sahrens 	}
2733c6065d0fSGeorge Wilson 
2734c6065d0fSGeorge Wilson 	(void) close(fd);
273564723e36SYuri Pankov 
273664723e36SYuri Pankov 	return (label_found ? 0 : 2);
2737fa9e4066Sahrens }
2738fa9e4066Sahrens 
2739ca0cc391SMatthew Ahrens static uint64_t dataset_feature_count[SPA_FEATURES];
27405cabbc6bSPrashanth Sreenivasa static uint64_t remap_deadlist_count = 0;
2741b5152584SMatthew Ahrens 
2742fa9e4066Sahrens /*ARGSUSED*/
27431d452cf5Sahrens static int
2744fd136879SMatthew Ahrens dump_one_dir(const char *dsname, void *arg)
2745fa9e4066Sahrens {
2746fa9e4066Sahrens 	int error;
2747fa9e4066Sahrens 	objset_t *os;
2748fa9e4066Sahrens 
2749ed61ec1dSYuri Pankov 	error = open_objset(dsname, DMU_OST_ANY, FTAG, &os);
2750ed61ec1dSYuri Pankov 	if (error != 0)
27511d452cf5Sahrens 		return (0);
2752ca0cc391SMatthew Ahrens 
2753ca0cc391SMatthew Ahrens 	for (spa_feature_t f = 0; f < SPA_FEATURES; f++) {
2754ca0cc391SMatthew Ahrens 		if (!dmu_objset_ds(os)->ds_feature_inuse[f])
2755ca0cc391SMatthew Ahrens 			continue;
2756ca0cc391SMatthew Ahrens 		ASSERT(spa_feature_table[f].fi_flags &
2757ca0cc391SMatthew Ahrens 		    ZFEATURE_FLAG_PER_DATASET);
2758ca0cc391SMatthew Ahrens 		dataset_feature_count[f]++;
2759ca0cc391SMatthew Ahrens 	}
2760ca0cc391SMatthew Ahrens 
27615cabbc6bSPrashanth Sreenivasa 	if (dsl_dataset_remap_deadlist_exists(dmu_objset_ds(os))) {
27625cabbc6bSPrashanth Sreenivasa 		remap_deadlist_count++;
27635cabbc6bSPrashanth Sreenivasa 	}
27645cabbc6bSPrashanth Sreenivasa 
2765fa9e4066Sahrens 	dump_dir(os);
2766ed61ec1dSYuri Pankov 	close_objset(os, FTAG);
2767e0d35c44Smarks 	fuid_table_destroy();
27681d452cf5Sahrens 	return (0);
2769fa9e4066Sahrens }
2770fa9e4066Sahrens 
/*
 * Block statistics.
 *
 * One zdb_blkstats_t accumulates totals for a set of block pointers; the
 * fields are updated by zdb_count_block().
 */
/*
 * Number of physical-size histogram buckets: one per SPA_MINBLOCKSIZE
 * step up to SPA_OLD_MAXBLOCKSIZE, with the last bucket collecting all
 * larger blocks.
 */
#define	PSIZE_HISTO_SIZE (SPA_OLD_MAXBLOCKSIZE / SPA_MINBLOCKSIZE + 2)
typedef struct zdb_blkstats {
	uint64_t zb_asize;		/* sum of BP_GET_ASIZE() */
	uint64_t zb_lsize;		/* sum of BP_GET_LSIZE() */
	uint64_t zb_psize;		/* sum of BP_GET_PSIZE() */
	uint64_t zb_count;		/* number of block pointers counted */
	uint64_t zb_gangs;		/* sum of BP_COUNT_GANG() */
	/* blocks with 2 or 3 DVAs of which at least two share a vdev */
	uint64_t zb_ditto_samevdev;
	/* ... and of which two on the same vdev share a metaslab */
	uint64_t zb_ditto_same_ms;
	/* indexed by psize >> SPA_MINBLOCKSHIFT, clamped to the last slot */
	uint64_t zb_psize_histogram[PSIZE_HISTO_SIZE];
} zdb_blkstats_t;
2785fa9e4066Sahrens 
/*
 * Extended object types, numbered immediately after the real DMU object
 * types: deferred frees, dedup auto-ditto blocks, a catch-all "other"
 * bucket (zdb_blkptr_cb() files blocks whose type has DMU_OT_NEWTYPE set
 * there), and the grand total.
 */
#define	ZDB_OT_DEFERRED	(DMU_OT_NUMTYPES + 0)
#define	ZDB_OT_DITTO	(DMU_OT_NUMTYPES + 1)
#define	ZDB_OT_OTHER	(DMU_OT_NUMTYPES + 2)
#define	ZDB_OT_TOTAL	(DMU_OT_NUMTYPES + 3)

/* Display names for the extended types, in the order defined above. */
static const char *zdb_ot_extname[] = {
	"deferred free",
	"dedup ditto",
	"other",
	"Total",
};
2800fa9e4066Sahrens 
280188b7b0f2SMatthew Ahrens #define	ZB_TOTAL	DN_MAX_LEVELS
2802fa9e4066Sahrens 
2803fa9e4066Sahrens typedef struct zdb_cb {
2804b24ab676SJeff Bonwick 	zdb_blkstats_t	zcb_type[ZB_TOTAL + 1][ZDB_OT_TOTAL + 1];
28055cabbc6bSPrashanth Sreenivasa 	uint64_t	zcb_removing_size;
280686714001SSerapheim Dimitropoulos 	uint64_t	zcb_checkpoint_size;
2807b24ab676SJeff Bonwick 	uint64_t	zcb_dedup_asize;
2808b24ab676SJeff Bonwick 	uint64_t	zcb_dedup_blocks;
28095d7b4d43SMatthew Ahrens 	uint64_t	zcb_embedded_blocks[NUM_BP_EMBEDDED_TYPES];
28105d7b4d43SMatthew Ahrens 	uint64_t	zcb_embedded_histogram[NUM_BP_EMBEDDED_TYPES]
28115d7b4d43SMatthew Ahrens 	    [BPE_PAYLOAD_SIZE];
2812490d05b9SMatthew Ahrens 	uint64_t	zcb_start;
28133f7978d0SAlan Somers 	hrtime_t	zcb_lastprint;
2814490d05b9SMatthew Ahrens 	uint64_t	zcb_totalasize;
2815fa9e4066Sahrens 	uint64_t	zcb_errors[256];
2816fa9e4066Sahrens 	int		zcb_readfails;
2817fa9e4066Sahrens 	int		zcb_haderrors;
2818cde58dbcSMatthew Ahrens 	spa_t		*zcb_spa;
28195cabbc6bSPrashanth Sreenivasa 	uint32_t	**zcb_vd_obsolete_counts;
2820fa9e4066Sahrens } zdb_cb_t;
2821fa9e4066Sahrens 
2822*663207adSDon Brady /* test if two DVA offsets from same vdev are within the same metaslab */
2823*663207adSDon Brady static boolean_t
2824*663207adSDon Brady same_metaslab(spa_t *spa, uint64_t vdev, uint64_t off1, uint64_t off2)
2825*663207adSDon Brady {
2826*663207adSDon Brady 	vdev_t *vd = vdev_lookup_top(spa, vdev);
2827*663207adSDon Brady 	uint64_t ms_shift = vd->vdev_ms_shift;
2828*663207adSDon Brady 
2829*663207adSDon Brady 	return ((off1 >> ms_shift) == (off2 >> ms_shift));
2830*663207adSDon Brady }
2831*663207adSDon Brady 
2832fa9e4066Sahrens static void
2833cde58dbcSMatthew Ahrens zdb_count_block(zdb_cb_t *zcb, zilog_t *zilog, const blkptr_t *bp,
2834b24ab676SJeff Bonwick     dmu_object_type_t type)
2835fa9e4066Sahrens {
2836b24ab676SJeff Bonwick 	uint64_t refcnt = 0;
2837b24ab676SJeff Bonwick 
2838b24ab676SJeff Bonwick 	ASSERT(type < ZDB_OT_TOTAL);
2839b24ab676SJeff Bonwick 
2840b24ab676SJeff Bonwick 	if (zilog && zil_bp_tree_add(zilog, bp) != 0)
2841b24ab676SJeff Bonwick 		return;
2842b24ab676SJeff Bonwick 
2843*663207adSDon Brady 	spa_config_enter(zcb->zcb_spa, SCL_CONFIG, FTAG, RW_READER);
2844*663207adSDon Brady 
2845e14bb325SJeff Bonwick 	for (int i = 0; i < 4; i++) {
2846fa9e4066Sahrens 		int l = (i < 2) ? BP_GET_LEVEL(bp) : ZB_TOTAL;
2847b24ab676SJeff Bonwick 		int t = (i & 1) ? type : ZDB_OT_TOTAL;
2848d5ee8a13SMatthew Ahrens 		int equal;
2849fa9e4066Sahrens 		zdb_blkstats_t *zb = &zcb->zcb_type[l][t];
2850fa9e4066Sahrens 
2851fa9e4066Sahrens 		zb->zb_asize += BP_GET_ASIZE(bp);
2852fa9e4066Sahrens 		zb->zb_lsize += BP_GET_LSIZE(bp);
2853fa9e4066Sahrens 		zb->zb_psize += BP_GET_PSIZE(bp);
2854fa9e4066Sahrens 		zb->zb_count++;
2855b5152584SMatthew Ahrens 
2856b5152584SMatthew Ahrens 		/*
2857b5152584SMatthew Ahrens 		 * The histogram is only big enough to record blocks up to
2858b5152584SMatthew Ahrens 		 * SPA_OLD_MAXBLOCKSIZE; larger blocks go into the last,
2859b5152584SMatthew Ahrens 		 * "other", bucket.
2860b5152584SMatthew Ahrens 		 */
28613f7978d0SAlan Somers 		unsigned idx = BP_GET_PSIZE(bp) >> SPA_MINBLOCKSHIFT;
2862b5152584SMatthew Ahrens 		idx = MIN(idx, SPA_OLD_MAXBLOCKSIZE / SPA_MINBLOCKSIZE + 1);
2863b5152584SMatthew Ahrens 		zb->zb_psize_histogram[idx]++;
2864d5ee8a13SMatthew Ahrens 
2865d5ee8a13SMatthew Ahrens 		zb->zb_gangs += BP_COUNT_GANG(bp);
2866d5ee8a13SMatthew Ahrens 
2867d5ee8a13SMatthew Ahrens 		switch (BP_GET_NDVAS(bp)) {
2868d5ee8a13SMatthew Ahrens 		case 2:
2869d5ee8a13SMatthew Ahrens 			if (DVA_GET_VDEV(&bp->blk_dva[0]) ==
2870*663207adSDon Brady 			    DVA_GET_VDEV(&bp->blk_dva[1])) {
2871d5ee8a13SMatthew Ahrens 				zb->zb_ditto_samevdev++;
2872*663207adSDon Brady 
2873*663207adSDon Brady 				if (same_metaslab(zcb->zcb_spa,
2874*663207adSDon Brady 				    DVA_GET_VDEV(&bp->blk_dva[0]),
2875*663207adSDon Brady 				    DVA_GET_OFFSET(&bp->blk_dva[0]),
2876*663207adSDon Brady 				    DVA_GET_OFFSET(&bp->blk_dva[1])))
2877*663207adSDon Brady 					zb->zb_ditto_same_ms++;
2878*663207adSDon Brady 			}
2879d5ee8a13SMatthew Ahrens 			break;
2880d5ee8a13SMatthew Ahrens 		case 3:
2881d5ee8a13SMatthew Ahrens 			equal = (DVA_GET_VDEV(&bp->blk_dva[0]) ==
2882d5ee8a13SMatthew Ahrens 			    DVA_GET_VDEV(&bp->blk_dva[1])) +
2883d5ee8a13SMatthew Ahrens 			    (DVA_GET_VDEV(&bp->blk_dva[0]) ==
2884d5ee8a13SMatthew Ahrens 			    DVA_GET_VDEV(&bp->blk_dva[2])) +
2885d5ee8a13SMatthew Ahrens 			    (DVA_GET_VDEV(&bp->blk_dva[1]) ==
2886d5ee8a13SMatthew Ahrens 			    DVA_GET_VDEV(&bp->blk_dva[2]));
2887*663207adSDon Brady 			if (equal != 0) {
2888d5ee8a13SMatthew Ahrens 				zb->zb_ditto_samevdev++;
2889*663207adSDon Brady 
2890*663207adSDon Brady 				if (DVA_GET_VDEV(&bp->blk_dva[0]) ==
2891*663207adSDon Brady 				    DVA_GET_VDEV(&bp->blk_dva[1]) &&
2892*663207adSDon Brady 				    same_metaslab(zcb->zcb_spa,
2893*663207adSDon Brady 				    DVA_GET_VDEV(&bp->blk_dva[0]),
2894*663207adSDon Brady 				    DVA_GET_OFFSET(&bp->blk_dva[0]),
2895*663207adSDon Brady 				    DVA_GET_OFFSET(&bp->blk_dva[1])))
2896*663207adSDon Brady 					zb->zb_ditto_same_ms++;
2897*663207adSDon Brady 				else if (DVA_GET_VDEV(&bp->blk_dva[0]) ==
2898*663207adSDon Brady 				    DVA_GET_VDEV(&bp->blk_dva[2]) &&
2899*663207adSDon Brady 				    same_metaslab(zcb->zcb_spa,
2900*663207adSDon Brady 				    DVA_GET_VDEV(&bp->blk_dva[0]),
2901*663207adSDon Brady 				    DVA_GET_OFFSET(&bp->blk_dva[0]),
2902*663207adSDon Brady 				    DVA_GET_OFFSET(&bp->blk_dva[2])))
2903*663207adSDon Brady 					zb->zb_ditto_same_ms++;
2904*663207adSDon Brady 				else if (DVA_GET_VDEV(&bp->blk_dva[1]) ==
2905*663207adSDon Brady 				    DVA_GET_VDEV(&bp->blk_dva[2]) &&
2906*663207adSDon Brady 				    same_metaslab(zcb->zcb_spa,
2907*663207adSDon Brady 				    DVA_GET_VDEV(&bp->blk_dva[1]),
2908*663207adSDon Brady 				    DVA_GET_OFFSET(&bp->blk_dva[1]),
2909*663207adSDon Brady 				    DVA_GET_OFFSET(&bp->blk_dva[2])))
2910*663207adSDon Brady 					zb->zb_ditto_same_ms++;
2911*663207adSDon Brady 			}
2912d5ee8a13SMatthew Ahrens 			break;
2913d5ee8a13SMatthew Ahrens 		}
2914fa9e4066Sahrens 	}
2915fa9e4066Sahrens 
2916*663207adSDon Brady 	spa_config_exit(zcb->zcb_spa, SCL_CONFIG, FTAG);
2917*663207adSDon Brady 
29185d7b4d43SMatthew Ahrens 	if (BP_IS_EMBEDDED(bp)) {
29195d7b4d43SMatthew Ahrens 		zcb->zcb_embedded_blocks[BPE_GET_ETYPE(bp)]++;
29205d7b4d43SMatthew Ahrens 		zcb->zcb_embedded_histogram[BPE_GET_ETYPE(bp)]
29215d7b4d43SMatthew Ahrens 		    [BPE_GET_PSIZE(bp)]++;
29225d7b4d43SMatthew Ahrens 		return;
29235d7b4d43SMatthew Ahrens 	}
29245d7b4d43SMatthew Ahrens 
2925b24ab676SJeff Bonwick 	if (dump_opt['L'])
2926b24ab676SJeff Bonwick 		return;
2927b24ab676SJeff Bonwick 
2928b24ab676SJeff Bonwick 	if (BP_GET_DEDUP(bp)) {
2929b24ab676SJeff Bonwick 		ddt_t *ddt;
2930b24ab676SJeff Bonwick 		ddt_entry_t *dde;
2931b24ab676SJeff Bonwick 
2932cde58dbcSMatthew Ahrens 		ddt = ddt_select(zcb->zcb_spa, bp);
2933b24ab676SJeff Bonwick 		ddt_enter(ddt);
2934b24ab676SJeff Bonwick 		dde = ddt_lookup(ddt, bp, B_FALSE);
2935b24ab676SJeff Bonwick 
2936b24ab676SJeff Bonwick 		if (dde == NULL) {
2937b24ab676SJeff Bonwick 			refcnt = 0;
2938b24ab676SJeff Bonwick 		} else {
2939b24ab676SJeff Bonwick 			ddt_phys_t *ddp = ddt_phys_select(dde, bp);
2940b24ab676SJeff Bonwick 			ddt_phys_decref(ddp);
2941b24ab676SJeff Bonwick 			refcnt = ddp->ddp_refcnt;
2942b24ab676SJeff Bonwick 			if (ddt_phys_total_refcnt(dde) == 0)
2943b24ab676SJeff Bonwick 				ddt_remove(ddt, dde);
2944d41e7643Sek 		}
2945b24ab676SJeff Bonwick 		ddt_exit(ddt);
2946d41e7643Sek 	}
2947d41e7643Sek 
2948cde58dbcSMatthew Ahrens 	VERIFY3U(zio_wait(zio_claim(NULL, zcb->zcb_spa,
294986714001SSerapheim Dimitropoulos 	    refcnt ? 0 : spa_min_claim_txg(zcb->zcb_spa),
2950b24ab676SJeff Bonwick 	    bp, NULL, NULL, ZIO_FLAG_CANFAIL)), ==, 0);
2951fa9e4066Sahrens }
2952fa9e4066Sahrens 
295331d7e8faSGeorge Wilson static void
295431d7e8faSGeorge Wilson zdb_blkptr_done(zio_t *zio)
295531d7e8faSGeorge Wilson {
295631d7e8faSGeorge Wilson 	spa_t *spa = zio->io_spa;
295731d7e8faSGeorge Wilson 	blkptr_t *bp = zio->io_bp;
295831d7e8faSGeorge Wilson 	int ioerr = zio->io_error;
295931d7e8faSGeorge Wilson 	zdb_cb_t *zcb = zio->io_private;
29607802d7bfSMatthew Ahrens 	zbookmark_phys_t *zb = &zio->io_bookmark;
296131d7e8faSGeorge Wilson 
2962770499e1SDan Kimmel 	abd_free(zio->io_abd);
296331d7e8faSGeorge Wilson 
296431d7e8faSGeorge Wilson 	mutex_enter(&spa->spa_scrub_lock);
296531d7e8faSGeorge Wilson 	spa->spa_scrub_inflight--;
296631d7e8faSGeorge Wilson 	cv_broadcast(&spa->spa_scrub_io_cv);
296731d7e8faSGeorge Wilson 
296831d7e8faSGeorge Wilson 	if (ioerr && !(zio->io_flags & ZIO_FLAG_SPECULATIVE)) {
296931d7e8faSGeorge Wilson 		char blkbuf[BP_SPRINTF_LEN];
297031d7e8faSGeorge Wilson 
297131d7e8faSGeorge Wilson 		zcb->zcb_haderrors = 1;
297231d7e8faSGeorge Wilson 		zcb->zcb_errors[ioerr]++;
297331d7e8faSGeorge Wilson 
297431d7e8faSGeorge Wilson 		if (dump_opt['b'] >= 2)
297543466aaeSMax Grossman 			snprintf_blkptr(blkbuf, sizeof (blkbuf), bp);
297631d7e8faSGeorge Wilson 		else
297731d7e8faSGeorge Wilson 			blkbuf[0] = '\0';
297831d7e8faSGeorge Wilson 
297931d7e8faSGeorge Wilson 		(void) printf("zdb_blkptr_cb: "
298031d7e8faSGeorge Wilson 		    "Got error %d reading "
298131d7e8faSGeorge Wilson 		    "<%llu, %llu, %lld, %llx> %s -- skipping\n",
298231d7e8faSGeorge Wilson 		    ioerr,
298331d7e8faSGeorge Wilson 		    (u_longlong_t)zb->zb_objset,
298431d7e8faSGeorge Wilson 		    (u_longlong_t)zb->zb_object,
298531d7e8faSGeorge Wilson 		    (u_longlong_t)zb->zb_level,
298631d7e8faSGeorge Wilson 		    (u_longlong_t)zb->zb_blkid,
298731d7e8faSGeorge Wilson 		    blkbuf);
298831d7e8faSGeorge Wilson 	}
298931d7e8faSGeorge Wilson 	mutex_exit(&spa->spa_scrub_lock);
299031d7e8faSGeorge Wilson }
299131d7e8faSGeorge Wilson 
2992fa9e4066Sahrens static int
29931b912ec7SGeorge Wilson zdb_blkptr_cb(spa_t *spa, zilog_t *zilog, const blkptr_t *bp,
29947802d7bfSMatthew Ahrens     const zbookmark_phys_t *zb, const dnode_phys_t *dnp, void *arg)
2995fa9e4066Sahrens {
2996fa9e4066Sahrens 	zdb_cb_t *zcb = arg;
29976365109dSVictor Latushkin 	dmu_object_type_t type;
2998468c413aSTim Haley 	boolean_t is_metadata;
2999fa9e4066Sahrens 
3000a2cdcdd2SPaul Dagnelie 	if (bp == NULL)
3001a2cdcdd2SPaul Dagnelie 		return (0);
3002a2cdcdd2SPaul Dagnelie 
300343466aaeSMax Grossman 	if (dump_opt['b'] >= 5 && bp->blk_birth > 0) {
300443466aaeSMax Grossman 		char blkbuf[BP_SPRINTF_LEN];
300543466aaeSMax Grossman 		snprintf_blkptr(blkbuf, sizeof (blkbuf), bp);
300643466aaeSMax Grossman 		(void) printf("objset %llu object %llu "
300743466aaeSMax Grossman 		    "level %lld offset 0x%llx %s\n",
300843466aaeSMax Grossman 		    (u_longlong_t)zb->zb_objset,
300943466aaeSMax Grossman 		    (u_longlong_t)zb->zb_object,
301043466aaeSMax Grossman 		    (longlong_t)zb->zb_level,
301143466aaeSMax Grossman 		    (u_longlong_t)blkid2offset(dnp, bp, zb),
301243466aaeSMax Grossman 		    blkbuf);
301343466aaeSMax Grossman 	}
301443466aaeSMax Grossman 
301543466aaeSMax Grossman 	if (BP_IS_HOLE(bp))
301688b7b0f2SMatthew Ahrens 		return (0);
3017e14bb325SJeff Bonwick 
30186365109dSVictor Latushkin 	type = BP_GET_TYPE(bp);
3019e14bb325SJeff Bonwick 
3020ad135b5dSChristopher Siden 	zdb_count_block(zcb, zilog, bp,
3021ad135b5dSChristopher Siden 	    (type & DMU_OT_NEWTYPE) ? ZDB_OT_OTHER : type);
30226365109dSVictor Latushkin 
3023ad135b5dSChristopher Siden 	is_metadata = (BP_GET_LEVEL(bp) != 0 || DMU_OT_IS_METADATA(type));
30246365109dSVictor Latushkin 
30255d7b4d43SMatthew Ahrens 	if (!BP_IS_EMBEDDED(bp) &&
30265d7b4d43SMatthew Ahrens 	    (dump_opt['c'] > 1 || (dump_opt['c'] && is_metadata))) {
3027468c413aSTim Haley 		size_t size = BP_GET_PSIZE(bp);
3028770499e1SDan Kimmel 		abd_t *abd = abd_alloc(size, B_FALSE);
3029b24ab676SJeff Bonwick 		int flags = ZIO_FLAG_CANFAIL | ZIO_FLAG_SCRUB | ZIO_FLAG_RAW;
3030b24ab676SJeff Bonwick 
3031b24ab676SJeff Bonwick 		/* If it's an intent log block, failure is expected. */
3032b24ab676SJeff Bonwick 		if (zb->zb_level == ZB_ZIL_LEVEL)
3033b24ab676SJeff Bonwick 			flags |= ZIO_FLAG_SPECULATIVE;
3034b24ab676SJeff Bonwick 
303531d7e8faSGeorge Wilson 		mutex_enter(&spa->spa_scrub_lock);
303631d7e8faSGeorge Wilson 		while (spa->spa_scrub_inflight > max_inflight)
303731d7e8faSGeorge Wilson 			cv_wait(&spa->spa_scrub_io_cv, &spa->spa_scrub_lock);
303831d7e8faSGeorge Wilson 		spa->spa_scrub_inflight++;
303931d7e8faSGeorge Wilson 		mutex_exit(&spa->spa_scrub_lock);
3040b24ab676SJeff Bonwick 
3041770499e1SDan Kimmel 		zio_nowait(zio_read(NULL, spa, bp, abd, size,
304231d7e8faSGeorge Wilson 		    zdb_blkptr_done, zcb, ZIO_PRIORITY_ASYNC_READ, flags, zb));
3043fa9e4066Sahrens 	}
3044fa9e4066Sahrens 
3045fa9e4066Sahrens 	zcb->zcb_readfails = 0;
3046fa9e4066Sahrens 
3047f7950bf1SMatthew Ahrens 	/* only call gethrtime() every 100 blocks */
3048f7950bf1SMatthew Ahrens 	static int iters;
3049f7950bf1SMatthew Ahrens 	if (++iters > 100)
3050f7950bf1SMatthew Ahrens 		iters = 0;
3051f7950bf1SMatthew Ahrens 	else
3052f7950bf1SMatthew Ahrens 		return (0);
3053f7950bf1SMatthew Ahrens 
3054f7950bf1SMatthew Ahrens 	if (dump_opt['b'] < 5 && gethrtime() > zcb->zcb_lastprint + NANOSEC) {
3055490d05b9SMatthew Ahrens 		uint64_t now = gethrtime();
3056490d05b9SMatthew Ahrens 		char buf[10];
3057490d05b9SMatthew Ahrens 		uint64_t bytes = zcb->zcb_type[ZB_TOTAL][ZDB_OT_TOTAL].zb_asize;
3058490d05b9SMatthew Ahrens 		int kb_per_sec =
3059490d05b9SMatthew Ahrens 		    1 + bytes / (1 + ((now - zcb->zcb_start) / 1000 / 1000));
3060490d05b9SMatthew Ahrens 		int sec_remaining =
3061490d05b9SMatthew Ahrens 		    (zcb->zcb_totalasize - bytes) / 1024 / kb_per_sec;
3062490d05b9SMatthew Ahrens 
30630a055120SJason King 		/* make sure nicenum has enough space */
30640a055120SJason King 		CTASSERT(sizeof (buf) >= NN_NUMBUF_SZ);
30650a055120SJason King 
3066490d05b9SMatthew Ahrens 		zfs_nicenum(bytes, buf, sizeof (buf));
3067490d05b9SMatthew Ahrens 		(void) fprintf(stderr,
3068490d05b9SMatthew Ahrens 		    "\r%5s completed (%4dMB/s) "
3069490d05b9SMatthew Ahrens 		    "estimated time remaining: %uhr %02umin %02usec        ",
3070490d05b9SMatthew Ahrens 		    buf, kb_per_sec / 1024,
3071490d05b9SMatthew Ahrens 		    sec_remaining / 60 / 60,
3072490d05b9SMatthew Ahrens 		    sec_remaining / 60 % 60,
3073490d05b9SMatthew Ahrens 		    sec_remaining % 60);
3074490d05b9SMatthew Ahrens 
3075490d05b9SMatthew Ahrens 		zcb->zcb_lastprint = now;
3076490d05b9SMatthew Ahrens 	}
3077490d05b9SMatthew Ahrens 
3078fa9e4066Sahrens 	return (0);
3079fa9e4066Sahrens }
3080fa9e4066Sahrens 
3081b24ab676SJeff Bonwick static void
30820713e232SGeorge Wilson zdb_leak(void *arg, uint64_t start, uint64_t size)
3083b24ab676SJeff Bonwick {
30840713e232SGeorge Wilson 	vdev_t *vd = arg;
3085b24ab676SJeff Bonwick 
3086b24ab676SJeff Bonwick 	(void) printf("leaked space: vdev %llu, offset 0x%llx, size %llu\n",
3087b24ab676SJeff Bonwick 	    (u_longlong_t)vd->vdev_id, (u_longlong_t)start, (u_longlong_t)size);
3088b24ab676SJeff Bonwick }
3089b24ab676SJeff Bonwick 
30900713e232SGeorge Wilson static metaslab_ops_t zdb_metaslab_ops = {
30912e4c9986SGeorge Wilson 	NULL	/* alloc */
3092b24ab676SJeff Bonwick };
3093b24ab676SJeff Bonwick 
3094b24ab676SJeff Bonwick static void
3095bbfd46c4SJeff Bonwick zdb_ddt_leak_init(spa_t *spa, zdb_cb_t *zcb)
3096b24ab676SJeff Bonwick {
30973f7978d0SAlan Somers 	ddt_bookmark_t ddb;
3098b24ab676SJeff Bonwick 	ddt_entry_t dde;
3099b24ab676SJeff Bonwick 	int error;
3100b24ab676SJeff Bonwick 
31013f7978d0SAlan Somers 	bzero(&ddb, sizeof (ddb));
3102bbfd46c4SJeff Bonwick 	while ((error = ddt_walk(spa, &ddb, &dde)) == 0) {
3103b24ab676SJeff Bonwick 		blkptr_t blk;
3104b24ab676SJeff Bonwick 		ddt_phys_t *ddp = dde.dde_phys;
3105bbfd46c4SJeff Bonwick 
3106bbfd46c4SJeff Bonwick 		if (ddb.ddb_class == DDT_CLASS_UNIQUE)
3107bbfd46c4SJeff Bonwick 			return;
3108bbfd46c4SJeff Bonwick 
3109b24ab676SJeff Bonwick 		ASSERT(ddt_phys_total_refcnt(&dde) > 1);
3110bbfd46c4SJeff Bonwick 
3111b24ab676SJeff Bonwick 		for (int p = 0; p < DDT_PHYS_TYPES; p++, ddp++) {
3112b24ab676SJeff Bonwick 			if (ddp->ddp_phys_birth == 0)
3113b24ab676SJeff Bonwick 				continue;
3114bbfd46c4SJeff Bonwick 			ddt_bp_create(ddb.ddb_checksum,
3115bbfd46c4SJeff Bonwick 			    &dde.dde_key, ddp, &blk);
3116b24ab676SJeff Bonwick 			if (p == DDT_PHYS_DITTO) {
3117cde58dbcSMatthew Ahrens 				zdb_count_block(zcb, NULL, &blk, ZDB_OT_DITTO);
3118b24ab676SJeff Bonwick 			} else {
3119b24ab676SJeff Bonwick 				zcb->zcb_dedup_asize +=
3120b24ab676SJeff Bonwick 				    BP_GET_ASIZE(&blk) * (ddp->ddp_refcnt - 1);
3121b24ab676SJeff Bonwick 				zcb->zcb_dedup_blocks++;
3122b24ab676SJeff Bonwick 			}
3123b24ab676SJeff Bonwick 		}
3124b24ab676SJeff Bonwick 		if (!dump_opt['L']) {
3125bbfd46c4SJeff Bonwick 			ddt_t *ddt = spa->spa_ddt[ddb.ddb_checksum];
3126b24ab676SJeff Bonwick 			ddt_enter(ddt);
3127b24ab676SJeff Bonwick 			VERIFY(ddt_lookup(ddt, &blk, B_TRUE) != NULL);
3128b24ab676SJeff Bonwick 			ddt_exit(ddt);
3129b24ab676SJeff Bonwick 		}
3130b24ab676SJeff Bonwick 	}
3131b24ab676SJeff Bonwick 
3132b24ab676SJeff Bonwick 	ASSERT(error == ENOENT);
3133b24ab676SJeff Bonwick }
3134b24ab676SJeff Bonwick 
31355cabbc6bSPrashanth Sreenivasa /* ARGSUSED */
31365cabbc6bSPrashanth Sreenivasa static void
31375cabbc6bSPrashanth Sreenivasa claim_segment_impl_cb(uint64_t inner_offset, vdev_t *vd, uint64_t offset,
31385cabbc6bSPrashanth Sreenivasa     uint64_t size, void *arg)
31395cabbc6bSPrashanth Sreenivasa {
31405cabbc6bSPrashanth Sreenivasa 	/*
31415cabbc6bSPrashanth Sreenivasa 	 * This callback was called through a remap from
31425cabbc6bSPrashanth Sreenivasa 	 * a device being removed. Therefore, the vdev that
31435cabbc6bSPrashanth Sreenivasa 	 * this callback is applied to is a concrete
31445cabbc6bSPrashanth Sreenivasa 	 * vdev.
31455cabbc6bSPrashanth Sreenivasa 	 */
31465cabbc6bSPrashanth Sreenivasa 	ASSERT(vdev_is_concrete(vd));
31475cabbc6bSPrashanth Sreenivasa 
31485cabbc6bSPrashanth Sreenivasa 	VERIFY0(metaslab_claim_impl(vd, offset, size,
314986714001SSerapheim Dimitropoulos 	    spa_min_claim_txg(vd->vdev_spa)));
31505cabbc6bSPrashanth Sreenivasa }
31515cabbc6bSPrashanth Sreenivasa 
31525cabbc6bSPrashanth Sreenivasa static void
31535cabbc6bSPrashanth Sreenivasa claim_segment_cb(void *arg, uint64_t offset, uint64_t size)
31545cabbc6bSPrashanth Sreenivasa {
31555cabbc6bSPrashanth Sreenivasa 	vdev_t *vd = arg;
31565cabbc6bSPrashanth Sreenivasa 
31575cabbc6bSPrashanth Sreenivasa 	vdev_indirect_ops.vdev_op_remap(vd, offset, size,
31585cabbc6bSPrashanth Sreenivasa 	    claim_segment_impl_cb, NULL);
31595cabbc6bSPrashanth Sreenivasa }
31605cabbc6bSPrashanth Sreenivasa 
31615cabbc6bSPrashanth Sreenivasa /*
31625cabbc6bSPrashanth Sreenivasa  * After accounting for all allocated blocks that are directly referenced,
31635cabbc6bSPrashanth Sreenivasa  * we might have missed a reference to a block from a partially complete
31645cabbc6bSPrashanth Sreenivasa  * (and thus unused) indirect mapping object. We perform a secondary pass
31655cabbc6bSPrashanth Sreenivasa  * through the metaslabs we have already mapped and claim the destination
31665cabbc6bSPrashanth Sreenivasa  * blocks.
31675cabbc6bSPrashanth Sreenivasa  */
31685cabbc6bSPrashanth Sreenivasa static void
31695cabbc6bSPrashanth Sreenivasa zdb_claim_removing(spa_t *spa, zdb_cb_t *zcb)
31705cabbc6bSPrashanth Sreenivasa {
31715cabbc6bSPrashanth Sreenivasa 	if (spa->spa_vdev_removal == NULL)
31725cabbc6bSPrashanth Sreenivasa 		return;
31735cabbc6bSPrashanth Sreenivasa 
31745cabbc6bSPrashanth Sreenivasa 	spa_config_enter(spa, SCL_CONFIG, FTAG, RW_READER);
31755cabbc6bSPrashanth Sreenivasa 
31765cabbc6bSPrashanth Sreenivasa 	spa_vdev_removal_t *svr = spa->spa_vdev_removal;
31773a4b1be9SMatthew Ahrens 	vdev_t *vd = vdev_lookup_top(spa, svr->svr_vdev_id);
31785cabbc6bSPrashanth Sreenivasa 	vdev_indirect_mapping_t *vim = vd->vdev_indirect_mapping;
31795cabbc6bSPrashanth Sreenivasa 
31805cabbc6bSPrashanth Sreenivasa 	for (uint64_t msi = 0; msi < vd->vdev_ms_count; msi++) {
31815cabbc6bSPrashanth Sreenivasa 		metaslab_t *msp = vd->vdev_ms[msi];
31825cabbc6bSPrashanth Sreenivasa 
31835cabbc6bSPrashanth Sreenivasa 		if (msp->ms_start >= vdev_indirect_mapping_max_offset(vim))
31845cabbc6bSPrashanth Sreenivasa 			break;
31855cabbc6bSPrashanth Sreenivasa 
31865cabbc6bSPrashanth Sreenivasa 		ASSERT0(range_tree_space(svr->svr_allocd_segs));
31875cabbc6bSPrashanth Sreenivasa 
31885cabbc6bSPrashanth Sreenivasa 		if (msp->ms_sm != NULL) {
31895cabbc6bSPrashanth Sreenivasa 			VERIFY0(space_map_load(msp->ms_sm,
31905cabbc6bSPrashanth Sreenivasa 			    svr->svr_allocd_segs, SM_ALLOC));
31915cabbc6bSPrashanth Sreenivasa 
31925cabbc6bSPrashanth Sreenivasa 			/*
31933a4b1be9SMatthew Ahrens 			 * Clear everything past what has been synced unless
31943a4b1be9SMatthew Ahrens 			 * it's past the spacemap, because we have not allocated
31953a4b1be9SMatthew Ahrens 			 * mappings for it yet.
31965cabbc6bSPrashanth Sreenivasa 			 */
31973a4b1be9SMatthew Ahrens 			uint64_t vim_max_offset =
31983a4b1be9SMatthew Ahrens 			    vdev_indirect_mapping_max_offset(vim);
31993a4b1be9SMatthew Ahrens 			uint64_t sm_end = msp->ms_sm->sm_start +
32003a4b1be9SMatthew Ahrens 			    msp->ms_sm->sm_size;
32013a4b1be9SMatthew Ahrens 			if (sm_end > vim_max_offset)
32023a4b1be9SMatthew Ahrens 				range_tree_clear(svr->svr_allocd_segs,
32033a4b1be9SMatthew Ahrens 				    vim_max_offset, sm_end - vim_max_offset);
32045cabbc6bSPrashanth Sreenivasa 		}
32055cabbc6bSPrashanth Sreenivasa 
32065cabbc6bSPrashanth Sreenivasa 		zcb->zcb_removing_size +=
32075cabbc6bSPrashanth Sreenivasa 		    range_tree_space(svr->svr_allocd_segs);
32085cabbc6bSPrashanth Sreenivasa 		range_tree_vacate(svr->svr_allocd_segs, claim_segment_cb, vd);
32095cabbc6bSPrashanth Sreenivasa 	}
32105cabbc6bSPrashanth Sreenivasa 
32115cabbc6bSPrashanth Sreenivasa 	spa_config_exit(spa, SCL_CONFIG, FTAG);
32125cabbc6bSPrashanth Sreenivasa }
32135cabbc6bSPrashanth Sreenivasa 
32145cabbc6bSPrashanth Sreenivasa /* ARGSUSED */
32155cabbc6bSPrashanth Sreenivasa static int
32165cabbc6bSPrashanth Sreenivasa increment_indirect_mapping_cb(void *arg, const blkptr_t *bp, dmu_tx_t *tx)
32175cabbc6bSPrashanth Sreenivasa {
32185cabbc6bSPrashanth Sreenivasa 	zdb_cb_t *zcb = arg;
32195cabbc6bSPrashanth Sreenivasa 	spa_t *spa = zcb->zcb_spa;
32205cabbc6bSPrashanth Sreenivasa 	vdev_t *vd;
32215cabbc6bSPrashanth Sreenivasa 	const dva_t *dva = &bp->blk_dva[0];
32225cabbc6bSPrashanth Sreenivasa 
32235cabbc6bSPrashanth Sreenivasa 	ASSERT(!dump_opt['L']);
32245cabbc6bSPrashanth Sreenivasa 	ASSERT3U(BP_GET_NDVAS(bp), ==, 1);
32255cabbc6bSPrashanth Sreenivasa 
32265cabbc6bSPrashanth Sreenivasa 	spa_config_enter(spa, SCL_VDEV, FTAG, RW_READER);
32275cabbc6bSPrashanth Sreenivasa 	vd = vdev_lookup_top(zcb->zcb_spa, DVA_GET_VDEV(dva));
32285cabbc6bSPrashanth Sreenivasa 	ASSERT3P(vd, !=, NULL);
32295cabbc6bSPrashanth Sreenivasa 	spa_config_exit(spa, SCL_VDEV, FTAG);
32305cabbc6bSPrashanth Sreenivasa 
32315cabbc6bSPrashanth Sreenivasa 	ASSERT(vd->vdev_indirect_config.vic_mapping_object != 0);
32325cabbc6bSPrashanth Sreenivasa 	ASSERT3P(zcb->zcb_vd_obsolete_counts[vd->vdev_id], !=, NULL);
32335cabbc6bSPrashanth Sreenivasa 
32345cabbc6bSPrashanth Sreenivasa 	vdev_indirect_mapping_increment_obsolete_count(
32355cabbc6bSPrashanth Sreenivasa 	    vd->vdev_indirect_mapping,
32365cabbc6bSPrashanth Sreenivasa 	    DVA_GET_OFFSET(dva), DVA_GET_ASIZE(dva),
32375cabbc6bSPrashanth Sreenivasa 	    zcb->zcb_vd_obsolete_counts[vd->vdev_id]);
32385cabbc6bSPrashanth Sreenivasa 
32395cabbc6bSPrashanth Sreenivasa 	return (0);
32405cabbc6bSPrashanth Sreenivasa }
32415cabbc6bSPrashanth Sreenivasa 
32425cabbc6bSPrashanth Sreenivasa static uint32_t *
32435cabbc6bSPrashanth Sreenivasa zdb_load_obsolete_counts(vdev_t *vd)
32445cabbc6bSPrashanth Sreenivasa {
32455cabbc6bSPrashanth Sreenivasa 	vdev_indirect_mapping_t *vim = vd->vdev_indirect_mapping;
32465cabbc6bSPrashanth Sreenivasa 	spa_t *spa = vd->vdev_spa;
32475cabbc6bSPrashanth Sreenivasa 	spa_condensing_indirect_phys_t *scip =
32485cabbc6bSPrashanth Sreenivasa 	    &spa->spa_condensing_indirect_phys;
32495cabbc6bSPrashanth Sreenivasa 	uint32_t *counts;
32505cabbc6bSPrashanth Sreenivasa 
32515cabbc6bSPrashanth Sreenivasa 	EQUIV(vdev_obsolete_sm_object(vd) != 0, vd->vdev_obsolete_sm != NULL);
32525cabbc6bSPrashanth Sreenivasa 	counts = vdev_indirect_mapping_load_obsolete_counts(vim);
32535cabbc6bSPrashanth Sreenivasa 	if (vd->vdev_obsolete_sm != NULL) {
32545cabbc6bSPrashanth Sreenivasa 		vdev_indirect_mapping_load_obsolete_spacemap(vim, counts,
32555cabbc6bSPrashanth Sreenivasa 		    vd->vdev_obsolete_sm);
32565cabbc6bSPrashanth Sreenivasa 	}
32575cabbc6bSPrashanth Sreenivasa 	if (scip->scip_vdev == vd->vdev_id &&
32585cabbc6bSPrashanth Sreenivasa 	    scip->scip_prev_obsolete_sm_object != 0) {
32595cabbc6bSPrashanth Sreenivasa 		space_map_t *prev_obsolete_sm = NULL;
32605cabbc6bSPrashanth Sreenivasa 		VERIFY0(space_map_open(&prev_obsolete_sm, spa->spa_meta_objset,
32615cabbc6bSPrashanth Sreenivasa 		    scip->scip_prev_obsolete_sm_object, 0, vd->vdev_asize, 0));
32625cabbc6bSPrashanth Sreenivasa 		space_map_update(prev_obsolete_sm);
32635cabbc6bSPrashanth Sreenivasa 		vdev_indirect_mapping_load_obsolete_spacemap(vim, counts,
32645cabbc6bSPrashanth Sreenivasa 		    prev_obsolete_sm);
32655cabbc6bSPrashanth Sreenivasa 		space_map_close(prev_obsolete_sm);
32665cabbc6bSPrashanth Sreenivasa 	}
32675cabbc6bSPrashanth Sreenivasa 	return (counts);
32685cabbc6bSPrashanth Sreenivasa }
32695cabbc6bSPrashanth Sreenivasa 
327086714001SSerapheim Dimitropoulos typedef struct checkpoint_sm_exclude_entry_arg {
327186714001SSerapheim Dimitropoulos 	vdev_t *cseea_vd;
327286714001SSerapheim Dimitropoulos 	uint64_t cseea_checkpoint_size;
327386714001SSerapheim Dimitropoulos } checkpoint_sm_exclude_entry_arg_t;
327486714001SSerapheim Dimitropoulos 
327586714001SSerapheim Dimitropoulos static int
327617f11284SSerapheim Dimitropoulos checkpoint_sm_exclude_entry_cb(space_map_entry_t *sme, void *arg)
327786714001SSerapheim Dimitropoulos {
327886714001SSerapheim Dimitropoulos 	checkpoint_sm_exclude_entry_arg_t *cseea = arg;
327986714001SSerapheim Dimitropoulos 	vdev_t *vd = cseea->cseea_vd;
328017f11284SSerapheim Dimitropoulos 	metaslab_t *ms = vd->vdev_ms[sme->sme_offset >> vd->vdev_ms_shift];
328117f11284SSerapheim Dimitropoulos 	uint64_t end = sme->sme_offset + sme->sme_run;
328286714001SSerapheim Dimitropoulos 
328317f11284SSerapheim Dimitropoulos 	ASSERT(sme->sme_type == SM_FREE);
328486714001SSerapheim Dimitropoulos 
328586714001SSerapheim Dimitropoulos 	/*
328686714001SSerapheim Dimitropoulos 	 * Since the vdev_checkpoint_sm exists in the vdev level
328786714001SSerapheim Dimitropoulos 	 * and the ms_sm space maps exist in the metaslab level,
328886714001SSerapheim Dimitropoulos 	 * an entry in the checkpoint space map could theoretically
328986714001SSerapheim Dimitropoulos 	 * cross the boundaries of the metaslab that it belongs.
329086714001SSerapheim Dimitropoulos 	 *
329186714001SSerapheim Dimitropoulos 	 * In reality, because of the way that we populate and
329286714001SSerapheim Dimitropoulos 	 * manipulate the checkpoint's space maps currently,
329386714001SSerapheim Dimitropoulos 	 * there shouldn't be any entries that cross metaslabs.
329486714001SSerapheim Dimitropoulos 	 * Hence the assertion below.
329586714001SSerapheim Dimitropoulos 	 *
329686714001SSerapheim Dimitropoulos 	 * That said, there is no fundamental requirement that
329786714001SSerapheim Dimitropoulos 	 * the checkpoint's space map entries should not cross
329886714001SSerapheim Dimitropoulos 	 * metaslab boundaries. So if needed we could add code
329986714001SSerapheim Dimitropoulos 	 * that handles metaslab-crossing segments in the future.
330086714001SSerapheim Dimitropoulos 	 */
330117f11284SSerapheim Dimitropoulos 	VERIFY3U(sme->sme_offset, >=, ms->ms_start);
330286714001SSerapheim Dimitropoulos 	VERIFY3U(end, <=, ms->ms_start + ms->ms_size);
330386714001SSerapheim Dimitropoulos 
330486714001SSerapheim Dimitropoulos 	/*
330586714001SSerapheim Dimitropoulos 	 * By removing the entry from the allocated segments we
330686714001SSerapheim Dimitropoulos 	 * also verify that the entry is there to begin with.
330786714001SSerapheim Dimitropoulos 	 */
330886714001SSerapheim Dimitropoulos 	mutex_enter(&ms->ms_lock);
330917f11284SSerapheim Dimitropoulos 	range_tree_remove(ms->ms_allocatable, sme->sme_offset, sme->sme_run);
331086714001SSerapheim Dimitropoulos 	mutex_exit(&ms->ms_lock);
331186714001SSerapheim Dimitropoulos 
331217f11284SSerapheim Dimitropoulos 	cseea->cseea_checkpoint_size += sme->sme_run;
331386714001SSerapheim Dimitropoulos 	return (0);
331486714001SSerapheim Dimitropoulos }
331586714001SSerapheim Dimitropoulos 
331686714001SSerapheim Dimitropoulos static void
331786714001SSerapheim Dimitropoulos zdb_leak_init_vdev_exclude_checkpoint(vdev_t *vd, zdb_cb_t *zcb)
331886714001SSerapheim Dimitropoulos {
331986714001SSerapheim Dimitropoulos 	spa_t *spa = vd->vdev_spa;
332086714001SSerapheim Dimitropoulos 	space_map_t *checkpoint_sm = NULL;
332186714001SSerapheim Dimitropoulos 	uint64_t checkpoint_sm_obj;
332286714001SSerapheim Dimitropoulos 
332386714001SSerapheim Dimitropoulos 	/*
332486714001SSerapheim Dimitropoulos 	 * If there is no vdev_top_zap, we are in a pool whose
332586714001SSerapheim Dimitropoulos 	 * version predates the pool checkpoint feature.
332686714001SSerapheim Dimitropoulos 	 */
332786714001SSerapheim Dimitropoulos 	if (vd->vdev_top_zap == 0)
332886714001SSerapheim Dimitropoulos 		return;
332986714001SSerapheim Dimitropoulos 
333086714001SSerapheim Dimitropoulos 	/*
333186714001SSerapheim Dimitropoulos 	 * If there is no reference of the vdev_checkpoint_sm in
333286714001SSerapheim Dimitropoulos 	 * the vdev_top_zap, then one of the following scenarios
333386714001SSerapheim Dimitropoulos 	 * is true:
333486714001SSerapheim Dimitropoulos 	 *
333586714001SSerapheim Dimitropoulos 	 * 1] There is no checkpoint
333686714001SSerapheim Dimitropoulos 	 * 2] There is a checkpoint, but no checkpointed blocks
333786714001SSerapheim Dimitropoulos 	 *    have been freed yet
333886714001SSerapheim Dimitropoulos 	 * 3] The current vdev is indirect
333986714001SSerapheim Dimitropoulos 	 *
334086714001SSerapheim Dimitropoulos 	 * In these cases we return immediately.
334186714001SSerapheim Dimitropoulos 	 */
334286714001SSerapheim Dimitropoulos 	if (zap_contains(spa_meta_objset(spa), vd->vdev_top_zap,
334386714001SSerapheim Dimitropoulos 	    VDEV_TOP_ZAP_POOL_CHECKPOINT_SM) != 0)
334486714001SSerapheim Dimitropoulos 		return;
334586714001SSerapheim Dimitropoulos 
334686714001SSerapheim Dimitropoulos 	VERIFY0(zap_lookup(spa_meta_objset(spa), vd->vdev_top_zap,
334786714001SSerapheim Dimitropoulos 	    VDEV_TOP_ZAP_POOL_CHECKPOINT_SM, sizeof (uint64_t), 1,
334886714001SSerapheim Dimitropoulos 	    &checkpoint_sm_obj));
334986714001SSerapheim Dimitropoulos 
335086714001SSerapheim Dimitropoulos 	checkpoint_sm_exclude_entry_arg_t cseea;
335186714001SSerapheim Dimitropoulos 	cseea.cseea_vd = vd;
335286714001SSerapheim Dimitropoulos 	cseea.cseea_checkpoint_size = 0;
335386714001SSerapheim Dimitropoulos 
335486714001SSerapheim Dimitropoulos 	VERIFY0(space_map_open(&checkpoint_sm, spa_meta_objset(spa),
335586714001SSerapheim Dimitropoulos 	    checkpoint_sm_obj, 0, vd->vdev_asize, vd->vdev_ashift));
335686714001SSerapheim Dimitropoulos 	space_map_update(checkpoint_sm);
335786714001SSerapheim Dimitropoulos 
335886714001SSerapheim Dimitropoulos 	VERIFY0(space_map_iterate(checkpoint_sm,
335986714001SSerapheim Dimitropoulos 	    checkpoint_sm_exclude_entry_cb, &cseea));
336086714001SSerapheim Dimitropoulos 	space_map_close(checkpoint_sm);
336186714001SSerapheim Dimitropoulos 
336286714001SSerapheim Dimitropoulos 	zcb->zcb_checkpoint_size += cseea.cseea_checkpoint_size;
336386714001SSerapheim Dimitropoulos }
336486714001SSerapheim Dimitropoulos 
336586714001SSerapheim Dimitropoulos static void
336686714001SSerapheim Dimitropoulos zdb_leak_init_exclude_checkpoint(spa_t *spa, zdb_cb_t *zcb)
336786714001SSerapheim Dimitropoulos {
336886714001SSerapheim Dimitropoulos 	vdev_t *rvd = spa->spa_root_vdev;
336986714001SSerapheim Dimitropoulos 	for (uint64_t c = 0; c < rvd->vdev_children; c++) {
337086714001SSerapheim Dimitropoulos 		ASSERT3U(c, ==, rvd->vdev_child[c]->vdev_id);
337186714001SSerapheim Dimitropoulos 		zdb_leak_init_vdev_exclude_checkpoint(rvd->vdev_child[c], zcb);
337286714001SSerapheim Dimitropoulos 	}
337386714001SSerapheim Dimitropoulos }
337486714001SSerapheim Dimitropoulos 
337586714001SSerapheim Dimitropoulos static void
337686714001SSerapheim Dimitropoulos load_concrete_ms_allocatable_trees(spa_t *spa, maptype_t maptype)
337786714001SSerapheim Dimitropoulos {
337886714001SSerapheim Dimitropoulos 	vdev_t *rvd = spa->spa_root_vdev;
337986714001SSerapheim Dimitropoulos 	for (uint64_t i = 0; i < rvd->vdev_children; i++) {
338086714001SSerapheim Dimitropoulos 		vdev_t *vd = rvd->vdev_child[i];
338186714001SSerapheim Dimitropoulos 
338286714001SSerapheim Dimitropoulos 		ASSERT3U(i, ==, vd->vdev_id);
338386714001SSerapheim Dimitropoulos 
338486714001SSerapheim Dimitropoulos 		if (vd->vdev_ops == &vdev_indirect_ops)
338586714001SSerapheim Dimitropoulos 			continue;
338686714001SSerapheim Dimitropoulos 
338786714001SSerapheim Dimitropoulos 		for (uint64_t m = 0; m < vd->vdev_ms_count; m++) {
338886714001SSerapheim Dimitropoulos 			metaslab_t *msp = vd->vdev_ms[m];
338986714001SSerapheim Dimitropoulos 
339086714001SSerapheim Dimitropoulos 			(void) fprintf(stderr,
339186714001SSerapheim Dimitropoulos 			    "\rloading concrete vdev %llu, "
339286714001SSerapheim Dimitropoulos 			    "metaslab %llu of %llu ...",
339386714001SSerapheim Dimitropoulos 			    (longlong_t)vd->vdev_id,
339486714001SSerapheim Dimitropoulos 			    (longlong_t)msp->ms_id,
339586714001SSerapheim Dimitropoulos 			    (longlong_t)vd->vdev_ms_count);
339686714001SSerapheim Dimitropoulos 
339786714001SSerapheim Dimitropoulos 			mutex_enter(&msp->ms_lock);
339886714001SSerapheim Dimitropoulos 			metaslab_unload(msp);
339986714001SSerapheim Dimitropoulos 
340086714001SSerapheim Dimitropoulos 			/*
340186714001SSerapheim Dimitropoulos 			 * We don't want to spend the CPU manipulating the
340286714001SSerapheim Dimitropoulos 			 * size-ordered tree, so clear the range_tree ops.
340386714001SSerapheim Dimitropoulos 			 */
340486714001SSerapheim Dimitropoulos 			msp->ms_allocatable->rt_ops = NULL;
340586714001SSerapheim Dimitropoulos 
340686714001SSerapheim Dimitropoulos 			if (msp->ms_sm != NULL) {
340786714001SSerapheim Dimitropoulos 				VERIFY0(space_map_load(msp->ms_sm,
340886714001SSerapheim Dimitropoulos 				    msp->ms_allocatable, maptype));
340986714001SSerapheim Dimitropoulos 			}
341086714001SSerapheim Dimitropoulos 			if (!msp->ms_loaded)
341186714001SSerapheim Dimitropoulos 				msp->ms_loaded = B_TRUE;
341286714001SSerapheim Dimitropoulos 			mutex_exit(&msp->ms_lock);
341386714001SSerapheim Dimitropoulos 		}
341486714001SSerapheim Dimitropoulos 	}
341586714001SSerapheim Dimitropoulos }
341686714001SSerapheim Dimitropoulos 
/*
 * vim_idxp is an in-out parameter which (for indirect vdevs) is the
 * index in vim_entries that has the first entry in this metaslab.
 * On return, it will be set to the first entry after this metaslab.
 */
342286714001SSerapheim Dimitropoulos static void
342386714001SSerapheim Dimitropoulos load_indirect_ms_allocatable_tree(vdev_t *vd, metaslab_t *msp,
342486714001SSerapheim Dimitropoulos     uint64_t *vim_idxp)
342586714001SSerapheim Dimitropoulos {
342686714001SSerapheim Dimitropoulos 	vdev_indirect_mapping_t *vim = vd->vdev_indirect_mapping;
342786714001SSerapheim Dimitropoulos 
342886714001SSerapheim Dimitropoulos 	mutex_enter(&msp->ms_lock);
342986714001SSerapheim Dimitropoulos 	metaslab_unload(msp);
343086714001SSerapheim Dimitropoulos 
343186714001SSerapheim Dimitropoulos 	/*
343286714001SSerapheim Dimitropoulos 	 * We don't want to spend the CPU manipulating the
343386714001SSerapheim Dimitropoulos 	 * size-ordered tree, so clear the range_tree ops.
343486714001SSerapheim Dimitropoulos 	 */
343586714001SSerapheim Dimitropoulos 	msp->ms_allocatable->rt_ops = NULL;
343686714001SSerapheim Dimitropoulos 
343786714001SSerapheim Dimitropoulos 	for (; *vim_idxp < vdev_indirect_mapping_num_entries(vim);
343886714001SSerapheim Dimitropoulos 	    (*vim_idxp)++) {
343986714001SSerapheim Dimitropoulos 		vdev_indirect_mapping_entry_phys_t *vimep =
344086714001SSerapheim Dimitropoulos 		    &vim->vim_entries[*vim_idxp];
344186714001SSerapheim Dimitropoulos 		uint64_t ent_offset = DVA_MAPPING_GET_SRC_OFFSET(vimep);
344286714001SSerapheim Dimitropoulos 		uint64_t ent_len = DVA_GET_ASIZE(&vimep->vimep_dst);
344386714001SSerapheim Dimitropoulos 		ASSERT3U(ent_offset, >=, msp->ms_start);
344486714001SSerapheim Dimitropoulos 		if (ent_offset >= msp->ms_start + msp->ms_size)
344586714001SSerapheim Dimitropoulos 			break;
344686714001SSerapheim Dimitropoulos 
344786714001SSerapheim Dimitropoulos 		/*
344886714001SSerapheim Dimitropoulos 		 * Mappings do not cross metaslab boundaries,
344986714001SSerapheim Dimitropoulos 		 * because we create them by walking the metaslabs.
345086714001SSerapheim Dimitropoulos 		 */
345186714001SSerapheim Dimitropoulos 		ASSERT3U(ent_offset + ent_len, <=,
345286714001SSerapheim Dimitropoulos 		    msp->ms_start + msp->ms_size);
345386714001SSerapheim Dimitropoulos 		range_tree_add(msp->ms_allocatable, ent_offset, ent_len);
345486714001SSerapheim Dimitropoulos 	}
345586714001SSerapheim Dimitropoulos 
345686714001SSerapheim Dimitropoulos 	if (!msp->ms_loaded)
345786714001SSerapheim Dimitropoulos 		msp->ms_loaded = B_TRUE;
345886714001SSerapheim Dimitropoulos 	mutex_exit(&msp->ms_lock);
345986714001SSerapheim Dimitropoulos }
346086714001SSerapheim Dimitropoulos 
346186714001SSerapheim Dimitropoulos static void
346286714001SSerapheim Dimitropoulos zdb_leak_init_prepare_indirect_vdevs(spa_t *spa, zdb_cb_t *zcb)
346386714001SSerapheim Dimitropoulos {
346486714001SSerapheim Dimitropoulos 	vdev_t *rvd = spa->spa_root_vdev;
346586714001SSerapheim Dimitropoulos 	for (uint64_t c = 0; c < rvd->vdev_children; c++) {
346686714001SSerapheim Dimitropoulos 		vdev_t *vd = rvd->vdev_child[c];
346786714001SSerapheim Dimitropoulos 
346886714001SSerapheim Dimitropoulos 		ASSERT3U(c, ==, vd->vdev_id);
346986714001SSerapheim Dimitropoulos 
347086714001SSerapheim Dimitropoulos 		if (vd->vdev_ops != &vdev_indirect_ops)
347186714001SSerapheim Dimitropoulos 			continue;
347286714001SSerapheim Dimitropoulos 
347386714001SSerapheim Dimitropoulos 		/*
347486714001SSerapheim Dimitropoulos 		 * Note: we don't check for mapping leaks on
347586714001SSerapheim Dimitropoulos 		 * removing vdevs because their ms_allocatable's
347686714001SSerapheim Dimitropoulos 		 * are used to look for leaks in allocated space.
347786714001SSerapheim Dimitropoulos 		 */
347886714001SSerapheim Dimitropoulos 		zcb->zcb_vd_obsolete_counts[c] = zdb_load_obsolete_counts(vd);
347986714001SSerapheim Dimitropoulos 
348086714001SSerapheim Dimitropoulos 		/*
348186714001SSerapheim Dimitropoulos 		 * Normally, indirect vdevs don't have any
348286714001SSerapheim Dimitropoulos 		 * metaslabs.  We want to set them up for
348386714001SSerapheim Dimitropoulos 		 * zio_claim().
348486714001SSerapheim Dimitropoulos 		 */
348586714001SSerapheim Dimitropoulos 		VERIFY0(vdev_metaslab_init(vd, 0));
348686714001SSerapheim Dimitropoulos 
348786714001SSerapheim Dimitropoulos 		vdev_indirect_mapping_t *vim = vd->vdev_indirect_mapping;
348886714001SSerapheim Dimitropoulos 		uint64_t vim_idx = 0;
348986714001SSerapheim Dimitropoulos 		for (uint64_t m = 0; m < vd->vdev_ms_count; m++) {
349086714001SSerapheim Dimitropoulos 
349186714001SSerapheim Dimitropoulos 			(void) fprintf(stderr,
349286714001SSerapheim Dimitropoulos 			    "\rloading indirect vdev %llu, "
349386714001SSerapheim Dimitropoulos 			    "metaslab %llu of %llu ...",
349486714001SSerapheim Dimitropoulos 			    (longlong_t)vd->vdev_id,
349586714001SSerapheim Dimitropoulos 			    (longlong_t)vd->vdev_ms[m]->ms_id,
349686714001SSerapheim Dimitropoulos 			    (longlong_t)vd->vdev_ms_count);
349786714001SSerapheim Dimitropoulos 
349886714001SSerapheim Dimitropoulos 			load_indirect_ms_allocatable_tree(vd, vd->vdev_ms[m],
349986714001SSerapheim Dimitropoulos 			    &vim_idx);
350086714001SSerapheim Dimitropoulos 		}
350186714001SSerapheim Dimitropoulos 		ASSERT3U(vim_idx, ==, vdev_indirect_mapping_num_entries(vim));
350286714001SSerapheim Dimitropoulos 	}
350386714001SSerapheim Dimitropoulos }
350486714001SSerapheim Dimitropoulos 
3505b24ab676SJeff Bonwick static void
3506b24ab676SJeff Bonwick zdb_leak_init(spa_t *spa, zdb_cb_t *zcb)
3507b24ab676SJeff Bonwick {
3508cde58dbcSMatthew Ahrens 	zcb->zcb_spa = spa;
3509cde58dbcSMatthew Ahrens 
3510b24ab676SJeff Bonwick 	if (!dump_opt['L']) {
35115cabbc6bSPrashanth Sreenivasa 		dsl_pool_t *dp = spa->spa_dsl_pool;
3512b24ab676SJeff Bonwick 		vdev_t *rvd = spa->spa_root_vdev;
35138363e80aSGeorge Wilson 
35148363e80aSGeorge Wilson 		/*
35158363e80aSGeorge Wilson 		 * We are going to be changing the meaning of the metaslab's
351686714001SSerapheim Dimitropoulos 		 * ms_allocatable.  Ensure that the allocator doesn't try to
35178363e80aSGeorge Wilson 		 * use the tree.
35188363e80aSGeorge Wilson 		 */
35198363e80aSGeorge Wilson 		spa->spa_normal_class->mc_ops = &zdb_metaslab_ops;
35208363e80aSGeorge Wilson 		spa->spa_log_class->mc_ops = &zdb_metaslab_ops;
35218363e80aSGeorge Wilson 
35225cabbc6bSPrashanth Sreenivasa 		zcb->zcb_vd_obsolete_counts =
35235cabbc6bSPrashanth Sreenivasa 		    umem_zalloc(rvd->vdev_children * sizeof (uint32_t *),
35245cabbc6bSPrashanth Sreenivasa 		    UMEM_NOFAIL);
35255cabbc6bSPrashanth Sreenivasa 
352686714001SSerapheim Dimitropoulos 		/*
352786714001SSerapheim Dimitropoulos 		 * For leak detection, we overload the ms_allocatable trees
352886714001SSerapheim Dimitropoulos 		 * to contain allocated segments instead of free segments.
352986714001SSerapheim Dimitropoulos 		 * As a result, we can't use the normal metaslab_load/unload
353086714001SSerapheim Dimitropoulos 		 * interfaces.
353186714001SSerapheim Dimitropoulos 		 */
353286714001SSerapheim Dimitropoulos 		zdb_leak_init_prepare_indirect_vdevs(spa, zcb);
353386714001SSerapheim Dimitropoulos 		load_concrete_ms_allocatable_trees(spa, SM_ALLOC);
35345cabbc6bSPrashanth Sreenivasa 
353586714001SSerapheim Dimitropoulos 		/*
353686714001SSerapheim Dimitropoulos 		 * On load_concrete_ms_allocatable_trees() we loaded all the
353786714001SSerapheim Dimitropoulos 		 * allocated entries from the ms_sm to the ms_allocatable for
353886714001SSerapheim Dimitropoulos 		 * each metaslab. If the pool has a checkpoint or is in the
353986714001SSerapheim Dimitropoulos 		 * middle of discarding a checkpoint, some of these blocks
354086714001SSerapheim Dimitropoulos 		 * may have been freed but their ms_sm may not have been
354186714001SSerapheim Dimitropoulos 		 * updated because they are referenced by the checkpoint. In
354286714001SSerapheim Dimitropoulos 		 * order to avoid false-positives during leak-detection, we
354386714001SSerapheim Dimitropoulos 		 * go through the vdev's checkpoint space map and exclude all
354486714001SSerapheim Dimitropoulos 		 * its entries from their relevant ms_allocatable.
354586714001SSerapheim Dimitropoulos 		 *
354686714001SSerapheim Dimitropoulos 		 * We also aggregate the space held by the checkpoint and add
354786714001SSerapheim Dimitropoulos 		 * it to zcb_checkpoint_size.
354886714001SSerapheim Dimitropoulos 		 *
354986714001SSerapheim Dimitropoulos 		 * Note that at this point we are also verifying that all the
355086714001SSerapheim Dimitropoulos 		 * entries on the checkpoint_sm are marked as allocated in
355186714001SSerapheim Dimitropoulos 		 * the ms_sm of their relevant metaslab.
355286714001SSerapheim Dimitropoulos 		 * [see comment in checkpoint_sm_exclude_entry_cb()]
355386714001SSerapheim Dimitropoulos 		 */
355486714001SSerapheim Dimitropoulos 		zdb_leak_init_exclude_checkpoint(spa, zcb);
35555cabbc6bSPrashanth Sreenivasa 
355686714001SSerapheim Dimitropoulos 		/* for cleaner progress output */
355706be9802SMatthew Ahrens 		(void) fprintf(stderr, "\n");
35585cabbc6bSPrashanth Sreenivasa 
35595cabbc6bSPrashanth Sreenivasa 		if (bpobj_is_open(&dp->dp_obsolete_bpobj)) {
35605cabbc6bSPrashanth Sreenivasa 			ASSERT(spa_feature_is_enabled(spa,
35615cabbc6bSPrashanth Sreenivasa 			    SPA_FEATURE_DEVICE_REMOVAL));
35625cabbc6bSPrashanth Sreenivasa 			(void) bpobj_iterate_nofree(&dp->dp_obsolete_bpobj,
35635cabbc6bSPrashanth Sreenivasa 			    increment_indirect_mapping_cb, zcb, NULL);
35645cabbc6bSPrashanth Sreenivasa 		}
356586714001SSerapheim Dimitropoulos 	} else {
356686714001SSerapheim Dimitropoulos 		/*
356786714001SSerapheim Dimitropoulos 		 * If leak tracing is disabled, we still need to consider
356886714001SSerapheim Dimitropoulos 		 * any checkpointed space in our space verification.
356986714001SSerapheim Dimitropoulos 		 */
357086714001SSerapheim Dimitropoulos 		zcb->zcb_checkpoint_size += spa_get_checkpoint_space(spa);
3571b24ab676SJeff Bonwick 	}
3572b24ab676SJeff Bonwick 
3573b24ab676SJeff Bonwick 	spa_config_enter(spa, SCL_CONFIG, FTAG, RW_READER);
3574bbfd46c4SJeff Bonwick 	zdb_ddt_leak_init(spa, zcb);
3575b24ab676SJeff Bonwick 	spa_config_exit(spa, SCL_CONFIG, FTAG);
3576b24ab676SJeff Bonwick }
3577b24ab676SJeff Bonwick 
35785cabbc6bSPrashanth Sreenivasa static boolean_t
35795cabbc6bSPrashanth Sreenivasa zdb_check_for_obsolete_leaks(vdev_t *vd, zdb_cb_t *zcb)
35805cabbc6bSPrashanth Sreenivasa {
35815cabbc6bSPrashanth Sreenivasa 	boolean_t leaks = B_FALSE;
35825cabbc6bSPrashanth Sreenivasa 	vdev_indirect_mapping_t *vim = vd->vdev_indirect_mapping;
35835cabbc6bSPrashanth Sreenivasa 	uint64_t total_leaked = 0;
35845cabbc6bSPrashanth Sreenivasa 
35855cabbc6bSPrashanth Sreenivasa 	ASSERT(vim != NULL);
35865cabbc6bSPrashanth Sreenivasa 
35875cabbc6bSPrashanth Sreenivasa 	for (uint64_t i = 0; i < vdev_indirect_mapping_num_entries(vim); i++) {
35885cabbc6bSPrashanth Sreenivasa 		vdev_indirect_mapping_entry_phys_t *vimep =
35895cabbc6bSPrashanth Sreenivasa 		    &vim->vim_entries[i];
35905cabbc6bSPrashanth Sreenivasa 		uint64_t obsolete_bytes = 0;
35915cabbc6bSPrashanth Sreenivasa 		uint64_t offset = DVA_MAPPING_GET_SRC_OFFSET(vimep);
35925cabbc6bSPrashanth Sreenivasa 		metaslab_t *msp = vd->vdev_ms[offset >> vd->vdev_ms_shift];
35935cabbc6bSPrashanth Sreenivasa 
35945cabbc6bSPrashanth Sreenivasa 		/*
35955cabbc6bSPrashanth Sreenivasa 		 * This is not very efficient but it's easy to
35965cabbc6bSPrashanth Sreenivasa 		 * verify correctness.
35975cabbc6bSPrashanth Sreenivasa 		 */
35985cabbc6bSPrashanth Sreenivasa 		for (uint64_t inner_offset = 0;
35995cabbc6bSPrashanth Sreenivasa 		    inner_offset < DVA_GET_ASIZE(&vimep->vimep_dst);
36005cabbc6bSPrashanth Sreenivasa 		    inner_offset += 1 << vd->vdev_ashift) {
360186714001SSerapheim Dimitropoulos 			if (range_tree_contains(msp->ms_allocatable,
36025cabbc6bSPrashanth Sreenivasa 			    offset + inner_offset, 1 << vd->vdev_ashift)) {
36035cabbc6bSPrashanth Sreenivasa 				obsolete_bytes += 1 << vd->vdev_ashift;
36045cabbc6bSPrashanth Sreenivasa 			}
36055cabbc6bSPrashanth Sreenivasa 		}
36065cabbc6bSPrashanth Sreenivasa 
36075cabbc6bSPrashanth Sreenivasa 		int64_t bytes_leaked = obsolete_bytes -
36085cabbc6bSPrashanth Sreenivasa 		    zcb->zcb_vd_obsolete_counts[vd->vdev_id][i];
36095cabbc6bSPrashanth Sreenivasa 		ASSERT3U(DVA_GET_ASIZE(&vimep->vimep_dst), >=,
36105cabbc6bSPrashanth Sreenivasa 		    zcb->zcb_vd_obsolete_counts[vd->vdev_id][i]);
36115cabbc6bSPrashanth Sreenivasa 		if (bytes_leaked != 0 &&
36125cabbc6bSPrashanth Sreenivasa 		    (vdev_obsolete_counts_are_precise(vd) ||
36135cabbc6bSPrashanth Sreenivasa 		    dump_opt['d'] >= 5)) {
36145cabbc6bSPrashanth Sreenivasa 			(void) printf("obsolete indirect mapping count "
36155cabbc6bSPrashanth Sreenivasa 			    "mismatch on %llu:%llx:%llx : %llx bytes leaked\n",
36165cabbc6bSPrashanth Sreenivasa 			    (u_longlong_t)vd->vdev_id,
36175cabbc6bSPrashanth Sreenivasa 			    (u_longlong_t)DVA_MAPPING_GET_SRC_OFFSET(vimep),
36185cabbc6bSPrashanth Sreenivasa 			    (u_longlong_t)DVA_GET_ASIZE(&vimep->vimep_dst),
36195cabbc6bSPrashanth Sreenivasa 			    (u_longlong_t)bytes_leaked);
36205cabbc6bSPrashanth Sreenivasa 		}
36215cabbc6bSPrashanth Sreenivasa 		total_leaked += ABS(bytes_leaked);
36225cabbc6bSPrashanth Sreenivasa 	}
36235cabbc6bSPrashanth Sreenivasa 
36245cabbc6bSPrashanth Sreenivasa 	if (!vdev_obsolete_counts_are_precise(vd) && total_leaked > 0) {
36255cabbc6bSPrashanth Sreenivasa 		int pct_leaked = total_leaked * 100 /
36265cabbc6bSPrashanth Sreenivasa 		    vdev_indirect_mapping_bytes_mapped(vim);
36275cabbc6bSPrashanth Sreenivasa 		(void) printf("cannot verify obsolete indirect mapping "
36285cabbc6bSPrashanth Sreenivasa 		    "counts of vdev %llu because precise feature was not "
36295cabbc6bSPrashanth Sreenivasa 		    "enabled when it was removed: %d%% (%llx bytes) of mapping"
36305cabbc6bSPrashanth Sreenivasa 		    "unreferenced\n",
36315cabbc6bSPrashanth Sreenivasa 		    (u_longlong_t)vd->vdev_id, pct_leaked,
36325cabbc6bSPrashanth Sreenivasa 		    (u_longlong_t)total_leaked);
36335cabbc6bSPrashanth Sreenivasa 	} else if (total_leaked > 0) {
36345cabbc6bSPrashanth Sreenivasa 		(void) printf("obsolete indirect mapping count mismatch "
36355cabbc6bSPrashanth Sreenivasa 		    "for vdev %llu -- %llx total bytes mismatched\n",
36365cabbc6bSPrashanth Sreenivasa 		    (u_longlong_t)vd->vdev_id,
36375cabbc6bSPrashanth Sreenivasa 		    (u_longlong_t)total_leaked);
36385cabbc6bSPrashanth Sreenivasa 		leaks |= B_TRUE;
36395cabbc6bSPrashanth Sreenivasa 	}
36405cabbc6bSPrashanth Sreenivasa 
36415cabbc6bSPrashanth Sreenivasa 	vdev_indirect_mapping_free_obsolete_counts(vim,
36425cabbc6bSPrashanth Sreenivasa 	    zcb->zcb_vd_obsolete_counts[vd->vdev_id]);
36435cabbc6bSPrashanth Sreenivasa 	zcb->zcb_vd_obsolete_counts[vd->vdev_id] = NULL;
36445cabbc6bSPrashanth Sreenivasa 
36455cabbc6bSPrashanth Sreenivasa 	return (leaks);
36465cabbc6bSPrashanth Sreenivasa }
36475cabbc6bSPrashanth Sreenivasa 
36485cabbc6bSPrashanth Sreenivasa static boolean_t
36495cabbc6bSPrashanth Sreenivasa zdb_leak_fini(spa_t *spa, zdb_cb_t *zcb)
3650b24ab676SJeff Bonwick {
36515cabbc6bSPrashanth Sreenivasa 	boolean_t leaks = B_FALSE;
3652b24ab676SJeff Bonwick 	if (!dump_opt['L']) {
3653b24ab676SJeff Bonwick 		vdev_t *rvd = spa->spa_root_vdev;
36543f7978d0SAlan Somers 		for (unsigned c = 0; c < rvd->vdev_children; c++) {
3655b24ab676SJeff Bonwick 			vdev_t *vd = rvd->vdev_child[c];
36568363e80aSGeorge Wilson 			metaslab_group_t *mg = vd->vdev_mg;
36575cabbc6bSPrashanth Sreenivasa 
36585cabbc6bSPrashanth Sreenivasa 			if (zcb->zcb_vd_obsolete_counts[c] != NULL) {
36595cabbc6bSPrashanth Sreenivasa 				leaks |= zdb_check_for_obsolete_leaks(vd, zcb);
36605cabbc6bSPrashanth Sreenivasa 			}
36615cabbc6bSPrashanth Sreenivasa 
36625cabbc6bSPrashanth Sreenivasa 			for (uint64_t m = 0; m < vd->vdev_ms_count; m++) {
3663b24ab676SJeff Bonwick 				metaslab_t *msp = vd->vdev_ms[m];
36648363e80aSGeorge Wilson 				ASSERT3P(mg, ==, msp->ms_group);
36650713e232SGeorge Wilson 
36660713e232SGeorge Wilson 				/*
366786714001SSerapheim Dimitropoulos 				 * ms_allocatable has been overloaded
366886714001SSerapheim Dimitropoulos 				 * to contain allocated segments. Now that
366986714001SSerapheim Dimitropoulos 				 * we finished traversing all blocks, any
367086714001SSerapheim Dimitropoulos 				 * block that remains in the ms_allocatable
36710713e232SGeorge Wilson 				 * represents an allocated block that we
36720713e232SGeorge Wilson 				 * did not claim during the traversal.
36730713e232SGeorge Wilson 				 * Claimed blocks would have been removed
367486714001SSerapheim Dimitropoulos 				 * from the ms_allocatable.  For indirect
367586714001SSerapheim Dimitropoulos 				 * vdevs, space remaining in the tree
367686714001SSerapheim Dimitropoulos 				 * represents parts of the mapping that are
367786714001SSerapheim Dimitropoulos 				 * not referenced, which is not a bug.
36780713e232SGeorge Wilson 				 */
36795cabbc6bSPrashanth Sreenivasa 				if (vd->vdev_ops == &vdev_indirect_ops) {
368086714001SSerapheim Dimitropoulos 					range_tree_vacate(msp->ms_allocatable,
36815cabbc6bSPrashanth Sreenivasa 					    NULL, NULL);
36825cabbc6bSPrashanth Sreenivasa 				} else {
368386714001SSerapheim Dimitropoulos 					range_tree_vacate(msp->ms_allocatable,
36845cabbc6bSPrashanth Sreenivasa 					    zdb_leak, vd);
36855cabbc6bSPrashanth Sreenivasa 				}
36868363e80aSGeorge Wilson 
36878363e80aSGeorge Wilson 				if (msp->ms_loaded) {
36888363e80aSGeorge Wilson 					msp->ms_loaded = B_FALSE;
36898363e80aSGeorge Wilson 				}
3690b24ab676SJeff Bonwick 			}
3691b24ab676SJeff Bonwick 		}
36925cabbc6bSPrashanth Sreenivasa 
36935cabbc6bSPrashanth Sreenivasa 		umem_free(zcb->zcb_vd_obsolete_counts,
36945cabbc6bSPrashanth Sreenivasa 		    rvd->vdev_children * sizeof (uint32_t *));
36955cabbc6bSPrashanth Sreenivasa 		zcb->zcb_vd_obsolete_counts = NULL;
3696b24ab676SJeff Bonwick 	}
36975cabbc6bSPrashanth Sreenivasa 	return (leaks);
3698b24ab676SJeff Bonwick }
3699b24ab676SJeff Bonwick 
3700cde58dbcSMatthew Ahrens /* ARGSUSED */
3701cde58dbcSMatthew Ahrens static int
3702cde58dbcSMatthew Ahrens count_block_cb(void *arg, const blkptr_t *bp, dmu_tx_t *tx)
3703cde58dbcSMatthew Ahrens {
3704cde58dbcSMatthew Ahrens 	zdb_cb_t *zcb = arg;
3705cde58dbcSMatthew Ahrens 
3706490d05b9SMatthew Ahrens 	if (dump_opt['b'] >= 5) {
3707cde58dbcSMatthew Ahrens 		char blkbuf[BP_SPRINTF_LEN];
370843466aaeSMax Grossman 		snprintf_blkptr(blkbuf, sizeof (blkbuf), bp);
3709cde58dbcSMatthew Ahrens 		(void) printf("[%s] %s\n",
3710cde58dbcSMatthew Ahrens 		    "deferred free", blkbuf);
3711cde58dbcSMatthew Ahrens 	}
3712cde58dbcSMatthew Ahrens 	zdb_count_block(zcb, NULL, bp, ZDB_OT_DEFERRED);
3713cde58dbcSMatthew Ahrens 	return (0);
3714cde58dbcSMatthew Ahrens }
3715cde58dbcSMatthew Ahrens 
3716fa9e4066Sahrens static int
3717fa9e4066Sahrens dump_block_stats(spa_t *spa)
3718fa9e4066Sahrens {
37193f7978d0SAlan Somers 	zdb_cb_t zcb;
3720fa9e4066Sahrens 	zdb_blkstats_t *zb, *tzb;
3721b24ab676SJeff Bonwick 	uint64_t norm_alloc, norm_space, total_alloc, total_found;
3722cd088ea4SVictor Latushkin 	int flags = TRAVERSE_PRE | TRAVERSE_PREFETCH_METADATA | TRAVERSE_HARD;
37235d7b4d43SMatthew Ahrens 	boolean_t leaks = B_FALSE;
3724*663207adSDon Brady 	int err;
3725fa9e4066Sahrens 
37263f7978d0SAlan Somers 	bzero(&zcb, sizeof (zcb));
3727490d05b9SMatthew Ahrens 	(void) printf("\nTraversing all blocks %s%s%s%s%s...\n\n",
3728b24ab676SJeff Bonwick 	    (dump_opt['c'] || !dump_opt['L']) ? "to verify " : "",
3729b24ab676SJeff Bonwick 	    (dump_opt['c'] == 1) ? "metadata " : "",
3730b24ab676SJeff Bonwick 	    dump_opt['c'] ? "checksums " : "",
3731b24ab676SJeff Bonwick 	    (dump_opt['c'] && !dump_opt['L']) ? "and verify " : "",
3732b24ab676SJeff Bonwick 	    !dump_opt['L'] ? "nothing leaked " : "");
3733fa9e4066Sahrens 
3734fa9e4066Sahrens 	/*
3735e14bb325SJeff Bonwick 	 * Load all space maps as SM_ALLOC maps, then traverse the pool
3736e14bb325SJeff Bonwick 	 * claiming each block we discover.  If the pool is perfectly
3737e14bb325SJeff Bonwick 	 * consistent, the space maps will be empty when we're done.
3738e14bb325SJeff Bonwick 	 * Anything left over is a leak; any block we can't claim (because
3739e14bb325SJeff Bonwick 	 * it's not part of any space map) is a double allocation,
3740e14bb325SJeff Bonwick 	 * reference to a freed block, or an unclaimed log block.
3741fa9e4066Sahrens 	 */
3742b24ab676SJeff Bonwick 	zdb_leak_init(spa, &zcb);
3743fa9e4066Sahrens 
3744fa9e4066Sahrens 	/*
3745fa9e4066Sahrens 	 * If there's a deferred-free bplist, process that first.
3746fa9e4066Sahrens 	 */
3747cde58dbcSMatthew Ahrens 	(void) bpobj_iterate_nofree(&spa->spa_deferred_bpobj,
3748cde58dbcSMatthew Ahrens 	    count_block_cb, &zcb, NULL);
37495cabbc6bSPrashanth Sreenivasa 
37503b2aab18SMatthew Ahrens 	if (spa_version(spa) >= SPA_VERSION_DEADLISTS) {
37513b2aab18SMatthew Ahrens 		(void) bpobj_iterate_nofree(&spa->spa_dsl_pool->dp_free_bpobj,
37523b2aab18SMatthew Ahrens 		    count_block_cb, &zcb, NULL);
37533b2aab18SMatthew Ahrens 	}
37545cabbc6bSPrashanth Sreenivasa 
37555cabbc6bSPrashanth Sreenivasa 	zdb_claim_removing(spa, &zcb);
37565cabbc6bSPrashanth Sreenivasa 
37572acef22dSMatthew Ahrens 	if (spa_feature_is_active(spa, SPA_FEATURE_ASYNC_DESTROY)) {
3758b420f3adSRichard Lowe 		VERIFY3U(0, ==, bptree_iterate(spa->spa_meta_objset,
3759ad135b5dSChristopher Siden 		    spa->spa_dsl_pool->dp_bptree_obj, B_FALSE, count_block_cb,
3760ad135b5dSChristopher Siden 		    &zcb, NULL));
3761ad135b5dSChristopher Siden 	}
3762fa9e4066Sahrens 
3763bbfd46c4SJeff Bonwick 	if (dump_opt['c'] > 1)
3764bbfd46c4SJeff Bonwick 		flags |= TRAVERSE_PREFETCH_DATA;
3765bbfd46c4SJeff Bonwick 
3766490d05b9SMatthew Ahrens 	zcb.zcb_totalasize = metaslab_class_get_alloc(spa_normal_class(spa));
3767*663207adSDon Brady 	zcb.zcb_totalasize += metaslab_class_get_alloc(spa_special_class(spa));
3768*663207adSDon Brady 	zcb.zcb_totalasize += metaslab_class_get_alloc(spa_dedup_class(spa));
3769490d05b9SMatthew Ahrens 	zcb.zcb_start = zcb.zcb_lastprint = gethrtime();
3770*663207adSDon Brady 	err = traverse_pool(spa, 0, flags, zdb_blkptr_cb, &zcb);
3771fa9e4066Sahrens 
377231d7e8faSGeorge Wilson 	/*
377331d7e8faSGeorge Wilson 	 * If we've traversed the data blocks then we need to wait for those
377431d7e8faSGeorge Wilson 	 * I/Os to complete. We leverage "The Godfather" zio to wait on
377531d7e8faSGeorge Wilson 	 * all async I/Os to complete.
377631d7e8faSGeorge Wilson 	 */
377731d7e8faSGeorge Wilson 	if (dump_opt['c']) {
37786f834bc1SMatthew Ahrens 		for (int i = 0; i < max_ncpus; i++) {
37796f834bc1SMatthew Ahrens 			(void) zio_wait(spa->spa_async_zio_root[i]);
37806f834bc1SMatthew Ahrens 			spa->spa_async_zio_root[i] = zio_root(spa, NULL, NULL,
37816f834bc1SMatthew Ahrens 			    ZIO_FLAG_CANFAIL | ZIO_FLAG_SPECULATIVE |
37826f834bc1SMatthew Ahrens 			    ZIO_FLAG_GODFATHER);
37836f834bc1SMatthew Ahrens 		}
378431d7e8faSGeorge Wilson 	}
378531d7e8faSGeorge Wilson 
3786*663207adSDon Brady 	/*
3787*663207adSDon Brady 	 * Done after zio_wait() since zcb_haderrors is modified in
3788*663207adSDon Brady 	 * zdb_blkptr_done()
3789*663207adSDon Brady 	 */
3790*663207adSDon Brady 	zcb.zcb_haderrors |= err;
3791*663207adSDon Brady 
3792b24ab676SJeff Bonwick 	if (zcb.zcb_haderrors) {
3793fa9e4066Sahrens 		(void) printf("\nError counts:\n\n");
3794fa9e4066Sahrens 		(void) printf("\t%5s  %s\n", "errno", "count");
3795b24ab676SJeff Bonwick 		for (int e = 0; e < 256; e++) {
3796fa9e4066Sahrens 			if (zcb.zcb_errors[e] != 0) {
3797fa9e4066Sahrens 				(void) printf("\t%5d  %llu\n",
3798fa9e4066Sahrens 				    e, (u_longlong_t)zcb.zcb_errors[e]);
3799fa9e4066Sahrens 			}
3800fa9e4066Sahrens 		}
3801fa9e4066Sahrens 	}
3802fa9e4066Sahrens 
3803fa9e4066Sahrens 	/*
3804fa9e4066Sahrens 	 * Report any leaked segments.
3805fa9e4066Sahrens 	 */
38065cabbc6bSPrashanth Sreenivasa 	leaks |= zdb_leak_fini(spa, &zcb);
3807fa9e4066Sahrens 
3808b24ab676SJeff Bonwick 	tzb = &zcb.zcb_type[ZB_TOTAL][ZDB_OT_TOTAL];
38098654d025Sperrin 
3810b24ab676SJeff Bonwick 	norm_alloc = metaslab_class_get_alloc(spa_normal_class(spa));
3811b24ab676SJeff Bonwick 	norm_space = metaslab_class_get_space(spa_normal_class(spa));
38128654d025Sperrin 
3813*663207adSDon Brady 	total_alloc = norm_alloc +
3814*663207adSDon Brady 	    metaslab_class_get_alloc(spa_log_class(spa)) +
3815*663207adSDon Brady 	    metaslab_class_get_alloc(spa_special_class(spa)) +
3816*663207adSDon Brady 	    metaslab_class_get_alloc(spa_dedup_class(spa));
38175cabbc6bSPrashanth Sreenivasa 	total_found = tzb->zb_asize - zcb.zcb_dedup_asize +
381886714001SSerapheim Dimitropoulos 	    zcb.zcb_removing_size + zcb.zcb_checkpoint_size;
3819fa9e4066Sahrens 
3820b24ab676SJeff Bonwick 	if (total_found == total_alloc) {
382182a0a985SVictor Latushkin 		if (!dump_opt['L'])
382282a0a985SVictor Latushkin 			(void) printf("\n\tNo leaks (block sum matches space"
382382a0a985SVictor Latushkin 			    " maps exactly)\n");
3824fa9e4066Sahrens 	} else {
3825fa9e4066Sahrens 		(void) printf("block traversal size %llu != alloc %llu "
382682a0a985SVictor Latushkin 		    "(%s %lld)\n",
3827b24ab676SJeff Bonwick 		    (u_longlong_t)total_found,
3828b24ab676SJeff Bonwick 		    (u_longlong_t)total_alloc,
382982a0a985SVictor Latushkin 		    (dump_opt['L']) ? "unreachable" : "leaked",
3830b24ab676SJeff Bonwick 		    (longlong_t)(total_alloc - total_found));
38315d7b4d43SMatthew Ahrens 		leaks = B_TRUE;
3832fa9e4066Sahrens 	}
3833fa9e4066Sahrens 
3834fa9e4066Sahrens 	if (tzb->zb_count == 0)
3835fa9e4066Sahrens 		return (2);
3836fa9e4066Sahrens 
3837fa9e4066Sahrens 	(void) printf("\n");
3838*663207adSDon Brady 	(void) printf("\t%-16s %14llu\n", "bp count:",
3839fa9e4066Sahrens 	    (u_longlong_t)tzb->zb_count);
3840*663207adSDon Brady 	(void) printf("\t%-16s %14llu\n", "ganged count:",
3841d5ee8a13SMatthew Ahrens 	    (longlong_t)tzb->zb_gangs);
3842*663207adSDon Brady 	(void) printf("\t%-16s %14llu      avg: %6llu\n", "bp logical:",
3843fa9e4066Sahrens 	    (u_longlong_t)tzb->zb_lsize,
3844fa9e4066Sahrens 	    (u_longlong_t)(tzb->zb_lsize / tzb->zb_count));
3845*663207adSDon Brady 	(void) printf("\t%-16s %14llu      avg: %6llu     compression: %6.2f\n",
3846*663207adSDon Brady 	    "bp physical:", (u_longlong_t)tzb->zb_psize,
3847fa9e4066Sahrens 	    (u_longlong_t)(tzb->zb_psize / tzb->zb_count),
3848fa9e4066Sahrens 	    (double)tzb->zb_lsize / tzb->zb_psize);
3849*663207adSDon Brady 	(void) printf("\t%-16s %14llu      avg: %6llu     compression: %6.2f\n",
3850*663207adSDon Brady 	    "bp allocated:", (u_longlong_t)tzb->zb_asize,
3851fa9e4066Sahrens 	    (u_longlong_t)(tzb->zb_asize / tzb->zb_count),
3852fa9e4066Sahrens 	    (double)tzb->zb_lsize / tzb->zb_asize);
3853*663207adSDon Brady 	(void) printf("\t%-16s %14llu    ref>1: %6llu   deduplication: %6.2f\n",
3854*663207adSDon Brady 	    "bp deduped:", (u_longlong_t)zcb.zcb_dedup_asize,
3855b24ab676SJeff Bonwick 	    (u_longlong_t)zcb.zcb_dedup_blocks,
3856b24ab676SJeff Bonwick 	    (double)zcb.zcb_dedup_asize / tzb->zb_asize + 1.0);
3857*663207adSDon Brady 	(void) printf("\t%-16s %14llu     used: %5.2f%%\n", "Normal class:",
3858b24ab676SJeff Bonwick 	    (u_longlong_t)norm_alloc, 100.0 * norm_alloc / norm_space);
3859fa9e4066Sahrens 
3860*663207adSDon Brady 	if (spa_special_class(spa)->mc_rotor != NULL) {
3861*663207adSDon Brady 		uint64_t alloc = metaslab_class_get_alloc(
3862*663207adSDon Brady 		    spa_special_class(spa));
3863*663207adSDon Brady 		uint64_t space = metaslab_class_get_space(
3864*663207adSDon Brady 		    spa_special_class(spa));
3865*663207adSDon Brady 
3866*663207adSDon Brady 		(void) printf("\t%-16s %14llu     used: %5.2f%%\n",
3867*663207adSDon Brady 		    "Special class", (u_longlong_t)alloc,
3868*663207adSDon Brady 		    100.0 * alloc / space);
3869*663207adSDon Brady 	}
3870*663207adSDon Brady 
3871*663207adSDon Brady 	if (spa_dedup_class(spa)->mc_rotor != NULL) {
3872*663207adSDon Brady 		uint64_t alloc = metaslab_class_get_alloc(
3873*663207adSDon Brady 		    spa_dedup_class(spa));
3874*663207adSDon Brady 		uint64_t space = metaslab_class_get_space(
3875*663207adSDon Brady 		    spa_dedup_class(spa));
3876*663207adSDon Brady 
3877*663207adSDon Brady 		(void) printf("\t%-16s %14llu     used: %5.2f%%\n",
3878*663207adSDon Brady 		    "Dedup class", (u_longlong_t)alloc,
3879*663207adSDon Brady 		    100.0 * alloc / space);
3880*663207adSDon Brady 	}
3881*663207adSDon Brady 
38825d7b4d43SMatthew Ahrens 	for (bp_embedded_type_t i = 0; i < NUM_BP_EMBEDDED_TYPES; i++) {
38835d7b4d43SMatthew Ahrens 		if (zcb.zcb_embedded_blocks[i] == 0)
38845d7b4d43SMatthew Ahrens 			continue;
38855d7b4d43SMatthew Ahrens 		(void) printf("\n");
38865d7b4d43SMatthew Ahrens 		(void) printf("\tadditional, non-pointer bps of type %u: "
38875d7b4d43SMatthew Ahrens 		    "%10llu\n",
38885d7b4d43SMatthew Ahrens 		    i, (u_longlong_t)zcb.zcb_embedded_blocks[i]);
38895d7b4d43SMatthew Ahrens 
38905d7b4d43SMatthew Ahrens 		if (dump_opt['b'] >= 3) {
38915d7b4d43SMatthew Ahrens 			(void) printf("\t number of (compressed) bytes:  "
38925d7b4d43SMatthew Ahrens 			    "number of bps\n");
38935d7b4d43SMatthew Ahrens 			dump_histogram(zcb.zcb_embedded_histogram[i],
38945d7b4d43SMatthew Ahrens 			    sizeof (zcb.zcb_embedded_histogram[i]) /
38955d7b4d43SMatthew Ahrens 			    sizeof (zcb.zcb_embedded_histogram[i][0]), 0);
38965d7b4d43SMatthew Ahrens 		}
38975d7b4d43SMatthew Ahrens 	}
38985d7b4d43SMatthew Ahrens 
3899d5ee8a13SMatthew Ahrens 	if (tzb->zb_ditto_samevdev != 0) {
3900d5ee8a13SMatthew Ahrens 		(void) printf("\tDittoed blocks on same vdev: %llu\n",
3901d5ee8a13SMatthew Ahrens 		    (longlong_t)tzb->zb_ditto_samevdev);
3902d5ee8a13SMatthew Ahrens 	}
3903*663207adSDon Brady 	if (tzb->zb_ditto_same_ms != 0) {
3904*663207adSDon Brady 		(void) printf("\tDittoed blocks in same metaslab: %llu\n",
3905*663207adSDon Brady 		    (longlong_t)tzb->zb_ditto_same_ms);
3906*663207adSDon Brady 	}
3907d5ee8a13SMatthew Ahrens 
39085cabbc6bSPrashanth Sreenivasa 	for (uint64_t v = 0; v < spa->spa_root_vdev->vdev_children; v++) {
39095cabbc6bSPrashanth Sreenivasa 		vdev_t *vd = spa->spa_root_vdev->vdev_child[v];
39105cabbc6bSPrashanth Sreenivasa 		vdev_indirect_mapping_t *vim = vd->vdev_indirect_mapping;
39115cabbc6bSPrashanth Sreenivasa 
39125cabbc6bSPrashanth Sreenivasa 		if (vim == NULL) {
39135cabbc6bSPrashanth Sreenivasa 			continue;
39145cabbc6bSPrashanth Sreenivasa 		}
39155cabbc6bSPrashanth Sreenivasa 
39165cabbc6bSPrashanth Sreenivasa 		char mem[32];
39175cabbc6bSPrashanth Sreenivasa 		zdb_nicenum(vdev_indirect_mapping_num_entries(vim),
39185cabbc6bSPrashanth Sreenivasa 		    mem, vdev_indirect_mapping_size(vim));
39195cabbc6bSPrashanth Sreenivasa 
39205cabbc6bSPrashanth Sreenivasa 		(void) printf("\tindirect vdev id %llu has %llu segments "
39215cabbc6bSPrashanth Sreenivasa 		    "(%s in memory)\n",
39225cabbc6bSPrashanth Sreenivasa 		    (longlong_t)vd->vdev_id,
39235cabbc6bSPrashanth Sreenivasa 		    (longlong_t)vdev_indirect_mapping_num_entries(vim), mem);
39245cabbc6bSPrashanth Sreenivasa 	}
39255cabbc6bSPrashanth Sreenivasa 
3926fa9e4066Sahrens 	if (dump_opt['b'] >= 2) {
3927fa9e4066Sahrens 		int l, t, level;
3928fa9e4066Sahrens 		(void) printf("\nBlocks\tLSIZE\tPSIZE\tASIZE"
3929fa9e4066Sahrens 		    "\t  avg\t comp\t%%Total\tType\n");
3930fa9e4066Sahrens 
3931b24ab676SJeff Bonwick 		for (t = 0; t <= ZDB_OT_TOTAL; t++) {
39323f9d6ad7SLin Ling 			char csize[32], lsize[32], psize[32], asize[32];
3933d5ee8a13SMatthew Ahrens 			char avg[32], gang[32];
39343f7978d0SAlan Somers 			const char *typename;
3935fa9e4066Sahrens 
39360a055120SJason King 			/* make sure nicenum has enough space */
39370a055120SJason King 			CTASSERT(sizeof (csize) >= NN_NUMBUF_SZ);
39380a055120SJason King 			CTASSERT(sizeof (lsize) >= NN_NUMBUF_SZ);
39390a055120SJason King 			CTASSERT(sizeof (psize) >= NN_NUMBUF_SZ);
39400a055120SJason King 			CTASSERT(sizeof (asize) >= NN_NUMBUF_SZ);
39410a055120SJason King 			CTASSERT(sizeof (avg) >= NN_NUMBUF_SZ);
39420a055120SJason King 			CTASSERT(sizeof (gang) >= NN_NUMBUF_SZ);
39430a055120SJason King 
3944b24ab676SJeff Bonwick 			if (t < DMU_OT_NUMTYPES)
3945b24ab676SJeff Bonwick 				typename = dmu_ot[t].ot_name;
3946b24ab676SJeff Bonwick 			else
3947b24ab676SJeff Bonwick 				typename = zdb_ot_extname[t - DMU_OT_NUMTYPES];
3948fa9e4066Sahrens 
3949fa9e4066Sahrens 			if (zcb.zcb_type[ZB_TOTAL][t].zb_asize == 0) {
3950fa9e4066Sahrens 				(void) printf("%6s\t%5s\t%5s\t%5s"
3951fa9e4066Sahrens 				    "\t%5s\t%5s\t%6s\t%s\n",
3952fa9e4066Sahrens 				    "-",
3953fa9e4066Sahrens 				    "-",
3954fa9e4066Sahrens 				    "-",
3955fa9e4066Sahrens 				    "-",
3956fa9e4066Sahrens 				    "-",
3957fa9e4066Sahrens 				    "-",
3958fa9e4066Sahrens 				    "-",
3959fa9e4066Sahrens 				    typename);
3960fa9e4066Sahrens 				continue;
3961fa9e4066Sahrens 			}
3962fa9e4066Sahrens 
3963fa9e4066Sahrens 			for (l = ZB_TOTAL - 1; l >= -1; l--) {
3964fa9e4066Sahrens 				level = (l == -1 ? ZB_TOTAL : l);
3965fa9e4066Sahrens 				zb = &zcb.zcb_type[level][t];
3966fa9e4066Sahrens 
3967fa9e4066Sahrens 				if (zb->zb_asize == 0)
3968fa9e4066Sahrens 					continue;
3969fa9e4066Sahrens 
3970fa9e4066Sahrens 				if (dump_opt['b'] < 3 && level != ZB_TOTAL)
3971fa9e4066Sahrens 					continue;
3972fa9e4066Sahrens 
3973fa9e4066Sahrens 				if (level == 0 && zb->zb_asize ==
3974fa9e4066Sahrens 				    zcb.zcb_type[ZB_TOTAL][t].zb_asize)
3975fa9e4066Sahrens 					continue;
3976fa9e4066Sahrens 
39770a055120SJason King 				zdb_nicenum(zb->zb_count, csize,
39780a055120SJason King 				    sizeof (csize));
39790a055120SJason King 				zdb_nicenum(zb->zb_lsize, lsize,
39800a055120SJason King 				    sizeof (lsize));
39810a055120SJason King 				zdb_nicenum(zb->zb_psize, psize,
39820a055120SJason King 				    sizeof (psize));
39830a055120SJason King 				zdb_nicenum(zb->zb_asize, asize,
39840a055120SJason King 				    sizeof (asize));
39850a055120SJason King 				zdb_nicenum(zb->zb_asize / zb->zb_count, avg,
39860a055120SJason King 				    sizeof (avg));
39870a055120SJason King 				zdb_nicenum(zb->zb_gangs, gang, sizeof (gang));
3988fa9e4066Sahrens 
3989fa9e4066Sahrens 				(void) printf("%6s\t%5s\t%5s\t%5s\t%5s"
3990fa9e4066Sahrens 				    "\t%5.2f\t%6.2f\t",
3991fa9e4066Sahrens 				    csize, lsize, psize, asize, avg,
3992fa9e4066Sahrens 				    (double)zb->zb_lsize / zb->zb_psize,
3993fa9e4066Sahrens 				    100.0 * zb->zb_asize / tzb->zb_asize);
3994fa9e4066Sahrens 
3995fa9e4066Sahrens 				if (level == ZB_TOTAL)
3996fa9e4066Sahrens 					(void) printf("%s\n", typename);
3997fa9e4066Sahrens 				else
3998fa9e4066Sahrens 					(void) printf("    L%d %s\n",
3999fa9e4066Sahrens 					    level, typename);
4000490d05b9SMatthew Ahrens 
4001d5ee8a13SMatthew Ahrens 				if (dump_opt['b'] >= 3 && zb->zb_gangs > 0) {
4002d5ee8a13SMatthew Ahrens 					(void) printf("\t number of ganged "
4003d5ee8a13SMatthew Ahrens 					    "blocks: %s\n", gang);
4004d5ee8a13SMatthew Ahrens 				}
4005d5ee8a13SMatthew Ahrens 
4006490d05b9SMatthew Ahrens 				if (dump_opt['b'] >= 4) {
4007490d05b9SMatthew Ahrens 					(void) printf("psize "
4008490d05b9SMatthew Ahrens 					    "(in 512-byte sectors): "
4009490d05b9SMatthew Ahrens 					    "number of blocks\n");
4010490d05b9SMatthew Ahrens 					dump_histogram(zb->zb_psize_histogram,
40110713e232SGeorge Wilson 					    PSIZE_HISTO_SIZE, 0);
4012490d05b9SMatthew Ahrens 				}
4013fa9e4066Sahrens 			}
4014fa9e4066Sahrens 		}
4015fa9e4066Sahrens 	}
4016fa9e4066Sahrens 
4017fa9e4066Sahrens 	(void) printf("\n");
4018fa9e4066Sahrens 
4019fa9e4066Sahrens 	if (leaks)
4020fa9e4066Sahrens 		return (2);
4021fa9e4066Sahrens 
4022fa9e4066Sahrens 	if (zcb.zcb_haderrors)
4023fa9e4066Sahrens 		return (3);
4024fa9e4066Sahrens 
4025fa9e4066Sahrens 	return (0);
4026fa9e4066Sahrens }
4027fa9e4066Sahrens 
4028b24ab676SJeff Bonwick typedef struct zdb_ddt_entry {
4029b24ab676SJeff Bonwick 	ddt_key_t	zdde_key;
4030b24ab676SJeff Bonwick 	uint64_t	zdde_ref_blocks;
4031b24ab676SJeff Bonwick 	uint64_t	zdde_ref_lsize;
4032b24ab676SJeff Bonwick 	uint64_t	zdde_ref_psize;
4033b24ab676SJeff Bonwick 	uint64_t	zdde_ref_dsize;
4034b24ab676SJeff Bonwick 	avl_node_t	zdde_node;
4035b24ab676SJeff Bonwick } zdb_ddt_entry_t;
4036b24ab676SJeff Bonwick 
4037b24ab676SJeff Bonwick /* ARGSUSED */
4038b24ab676SJeff Bonwick static int
4039b24ab676SJeff Bonwick zdb_ddt_add_cb(spa_t *spa, zilog_t *zilog, const blkptr_t *bp,
40407802d7bfSMatthew Ahrens     const zbookmark_phys_t *zb, const dnode_phys_t *dnp, void *arg)
4041b24ab676SJeff Bonwick {
4042b24ab676SJeff Bonwick 	avl_tree_t *t = arg;
4043b24ab676SJeff Bonwick 	avl_index_t where;
4044b24ab676SJeff Bonwick 	zdb_ddt_entry_t *zdde, zdde_search;
4045b24ab676SJeff Bonwick 
4046a2cdcdd2SPaul Dagnelie 	if (bp == NULL || BP_IS_HOLE(bp) || BP_IS_EMBEDDED(bp))
4047b24ab676SJeff Bonwick 		return (0);
4048b24ab676SJeff Bonwick 
4049b24ab676SJeff Bonwick 	if (dump_opt['S'] > 1 && zb->zb_level == ZB_ROOT_LEVEL) {
4050b24ab676SJeff Bonwick 		(void) printf("traversing objset %llu, %llu objects, "
4051b24ab676SJeff Bonwick 		    "%lu blocks so far\n",
4052b24ab676SJeff Bonwick 		    (u_longlong_t)zb->zb_objset,
40535d7b4d43SMatthew Ahrens 		    (u_longlong_t)BP_GET_FILL(bp),
4054b24ab676SJeff Bonwick 		    avl_numnodes(t));
4055b24ab676SJeff Bonwick 	}
4056b24ab676SJeff Bonwick 
4057bbfd46c4SJeff Bonwick 	if (BP_IS_HOLE(bp) || BP_GET_CHECKSUM(bp) == ZIO_CHECKSUM_OFF ||
4058ad135b5dSChristopher Siden 	    BP_GET_LEVEL(bp) > 0 || DMU_OT_IS_METADATA(BP_GET_TYPE(bp)))
4059b24ab676SJeff Bonwick 		return (0);
4060b24ab676SJeff Bonwick 
4061b24ab676SJeff Bonwick 	ddt_key_fill(&zdde_search.zdde_key, bp);
4062b24ab676SJeff Bonwick 
4063b24ab676SJeff Bonwick 	zdde = avl_find(t, &zdde_search, &where);
4064b24ab676SJeff Bonwick 
4065b24ab676SJeff Bonwick 	if (zdde == NULL) {
4066b24ab676SJeff Bonwick 		zdde = umem_zalloc(sizeof (*zdde), UMEM_NOFAIL);
4067b24ab676SJeff Bonwick 		zdde->zdde_key = zdde_search.zdde_key;
4068b24ab676SJeff Bonwick 		avl_insert(t, zdde, where);
4069b24ab676SJeff Bonwick 	}
4070b24ab676SJeff Bonwick 
4071b24ab676SJeff Bonwick 	zdde->zdde_ref_blocks += 1;
4072b24ab676SJeff Bonwick 	zdde->zdde_ref_lsize += BP_GET_LSIZE(bp);
4073b24ab676SJeff Bonwick 	zdde->zdde_ref_psize += BP_GET_PSIZE(bp);
4074b24ab676SJeff Bonwick 	zdde->zdde_ref_dsize += bp_get_dsize_sync(spa, bp);
4075b24ab676SJeff Bonwick 
4076b24ab676SJeff Bonwick 	return (0);
4077b24ab676SJeff Bonwick }
4078b24ab676SJeff Bonwick 
4079b24ab676SJeff Bonwick static void
4080b24ab676SJeff Bonwick dump_simulated_ddt(spa_t *spa)
4081b24ab676SJeff Bonwick {
4082b24ab676SJeff Bonwick 	avl_tree_t t;
4083b24ab676SJeff Bonwick 	void *cookie = NULL;
4084b24ab676SJeff Bonwick 	zdb_ddt_entry_t *zdde;
40853f7978d0SAlan Somers 	ddt_histogram_t ddh_total;
40863f7978d0SAlan Somers 	ddt_stat_t dds_total;
4087b24ab676SJeff Bonwick 
40883f7978d0SAlan Somers 	bzero(&ddh_total, sizeof (ddh_total));
40893f7978d0SAlan Somers 	bzero(&dds_total, sizeof (dds_total));
4090b24ab676SJeff Bonwick 	avl_create(&t, ddt_entry_compare,
4091b24ab676SJeff Bonwick 	    sizeof (zdb_ddt_entry_t), offsetof(zdb_ddt_entry_t, zdde_node));
4092b24ab676SJeff Bonwick 
4093b24ab676SJeff Bonwick 	spa_config_enter(spa, SCL_CONFIG, FTAG, RW_READER);
4094b24ab676SJeff Bonwick 
4095bbfd46c4SJeff Bonwick 	(void) traverse_pool(spa, 0, TRAVERSE_PRE | TRAVERSE_PREFETCH_METADATA,
4096bbfd46c4SJeff Bonwick 	    zdb_ddt_add_cb, &t);
4097b24ab676SJeff Bonwick 
4098b24ab676SJeff Bonwick 	spa_config_exit(spa, SCL_CONFIG, FTAG);
4099b24ab676SJeff Bonwick 
4100b24ab676SJeff Bonwick 	while ((zdde = avl_destroy_nodes(&t, &cookie)) != NULL) {
4101b24ab676SJeff Bonwick 		ddt_stat_t dds;
4102b24ab676SJeff Bonwick 		uint64_t refcnt = zdde->zdde_ref_blocks;
4103b24ab676SJeff Bonwick 		ASSERT(refcnt != 0);
4104b24ab676SJeff Bonwick 
4105b24ab676SJeff Bonwick 		dds.dds_blocks = zdde->zdde_ref_blocks / refcnt;
4106b24ab676SJeff Bonwick 		dds.dds_lsize = zdde->zdde_ref_lsize / refcnt;
4107b24ab676SJeff Bonwick 		dds.dds_psize = zdde->zdde_ref_psize / refcnt;
4108b24ab676SJeff Bonwick 		dds.dds_dsize = zdde->zdde_ref_dsize / refcnt;
4109b24ab676SJeff Bonwick 
4110b24ab676SJeff Bonwick 		dds.dds_ref_blocks = zdde->zdde_ref_blocks;
4111b24ab676SJeff Bonwick 		dds.dds_ref_lsize = zdde->zdde_ref_lsize;
4112b24ab676SJeff Bonwick 		dds.dds_ref_psize = zdde->zdde_ref_psize;
4113b24ab676SJeff Bonwick 		dds.dds_ref_dsize = zdde->zdde_ref_dsize;
4114b24ab676SJeff Bonwick 
4115bf16b11eSMatthew Ahrens 		ddt_stat_add(&ddh_total.ddh_stat[highbit64(refcnt) - 1],
4116bf16b11eSMatthew Ahrens 		    &dds, 0);
4117b24ab676SJeff Bonwick 
4118b24ab676SJeff Bonwick 		umem_free(zdde, sizeof (*zdde));
4119b24ab676SJeff Bonwick 	}
4120b24ab676SJeff Bonwick 
4121b24ab676SJeff Bonwick 	avl_destroy(&t);
4122b24ab676SJeff Bonwick 
4123b24ab676SJeff Bonwick 	ddt_histogram_stat(&dds_total, &ddh_total);
4124b24ab676SJeff Bonwick 
4125b24ab676SJeff Bonwick 	(void) printf("Simulated DDT histogram:\n");
4126b24ab676SJeff Bonwick 
41279eb19f4dSGeorge Wilson 	zpool_dump_ddt(&dds_total, &ddh_total);
4128b24ab676SJeff Bonwick 
4129b24ab676SJeff Bonwick 	dump_dedup_ratio(&dds_total);
4130b24ab676SJeff Bonwick }
4131b24ab676SJeff Bonwick 
41325cabbc6bSPrashanth Sreenivasa static int
41335cabbc6bSPrashanth Sreenivasa verify_device_removal_feature_counts(spa_t *spa)
41345cabbc6bSPrashanth Sreenivasa {
41355cabbc6bSPrashanth Sreenivasa 	uint64_t dr_feature_refcount = 0;
41365cabbc6bSPrashanth Sreenivasa 	uint64_t oc_feature_refcount = 0;
41375cabbc6bSPrashanth Sreenivasa 	uint64_t indirect_vdev_count = 0;
41385cabbc6bSPrashanth Sreenivasa 	uint64_t precise_vdev_count = 0;
41395cabbc6bSPrashanth Sreenivasa 	uint64_t obsolete_counts_object_count = 0;
41405cabbc6bSPrashanth Sreenivasa 	uint64_t obsolete_sm_count = 0;
41415cabbc6bSPrashanth Sreenivasa 	uint64_t obsolete_counts_count = 0;
41425cabbc6bSPrashanth Sreenivasa 	uint64_t scip_count = 0;
41435cabbc6bSPrashanth Sreenivasa 	uint64_t obsolete_bpobj_count = 0;
41445cabbc6bSPrashanth Sreenivasa 	int ret = 0;
41455cabbc6bSPrashanth Sreenivasa 
41465cabbc6bSPrashanth Sreenivasa 	spa_condensing_indirect_phys_t *scip =
41475cabbc6bSPrashanth Sreenivasa 	    &spa->spa_condensing_indirect_phys;
41485cabbc6bSPrashanth Sreenivasa 	if (scip->scip_next_mapping_object != 0) {
41495cabbc6bSPrashanth Sreenivasa 		vdev_t *vd = spa->spa_root_vdev->vdev_child[scip->scip_vdev];
41505cabbc6bSPrashanth Sreenivasa 		ASSERT(scip->scip_prev_obsolete_sm_object != 0);
41515cabbc6bSPrashanth Sreenivasa 		ASSERT3P(vd->vdev_ops, ==, &vdev_indirect_ops);
41525cabbc6bSPrashanth Sreenivasa 
41535cabbc6bSPrashanth Sreenivasa 		(void) printf("Condensing indirect vdev %llu: new mapping "
41545cabbc6bSPrashanth Sreenivasa 		    "object %llu, prev obsolete sm %llu\n",
41555cabbc6bSPrashanth Sreenivasa 		    (u_longlong_t)scip->scip_vdev,
41565cabbc6bSPrashanth Sreenivasa 		    (u_longlong_t)scip->scip_next_mapping_object,
41575cabbc6bSPrashanth Sreenivasa 		    (u_longlong_t)scip->scip_prev_obsolete_sm_object);
41585cabbc6bSPrashanth Sreenivasa 		if (scip->scip_prev_obsolete_sm_object != 0) {
41595cabbc6bSPrashanth Sreenivasa 			space_map_t *prev_obsolete_sm = NULL;
41605cabbc6bSPrashanth Sreenivasa 			VERIFY0(space_map_open(&prev_obsolete_sm,
41615cabbc6bSPrashanth Sreenivasa 			    spa->spa_meta_objset,
41625cabbc6bSPrashanth Sreenivasa 			    scip->scip_prev_obsolete_sm_object,
41635cabbc6bSPrashanth Sreenivasa 			    0, vd->vdev_asize, 0));
41645cabbc6bSPrashanth Sreenivasa 			space_map_update(prev_obsolete_sm);
41655cabbc6bSPrashanth Sreenivasa 			dump_spacemap(spa->spa_meta_objset, prev_obsolete_sm);
41665cabbc6bSPrashanth Sreenivasa 			(void) printf("\n");
41675cabbc6bSPrashanth Sreenivasa 			space_map_close(prev_obsolete_sm);
41685cabbc6bSPrashanth Sreenivasa 		}
41695cabbc6bSPrashanth Sreenivasa 
41705cabbc6bSPrashanth Sreenivasa 		scip_count += 2;
41715cabbc6bSPrashanth Sreenivasa 	}
41725cabbc6bSPrashanth Sreenivasa 
41735cabbc6bSPrashanth Sreenivasa 	for (uint64_t i = 0; i < spa->spa_root_vdev->vdev_children; i++) {
41745cabbc6bSPrashanth Sreenivasa 		vdev_t *vd = spa->spa_root_vdev->vdev_child[i];
41755cabbc6bSPrashanth Sreenivasa 		vdev_indirect_config_t *vic = &vd->vdev_indirect_config;
41765cabbc6bSPrashanth Sreenivasa 
41775cabbc6bSPrashanth Sreenivasa 		if (vic->vic_mapping_object != 0) {
41785cabbc6bSPrashanth Sreenivasa 			ASSERT(vd->vdev_ops == &vdev_indirect_ops ||
41795cabbc6bSPrashanth Sreenivasa 			    vd->vdev_removing);
41805cabbc6bSPrashanth Sreenivasa 			indirect_vdev_count++;
41815cabbc6bSPrashanth Sreenivasa 
41825cabbc6bSPrashanth Sreenivasa 			if (vd->vdev_indirect_mapping->vim_havecounts) {
41835cabbc6bSPrashanth Sreenivasa 				obsolete_counts_count++;
41845cabbc6bSPrashanth Sreenivasa 			}
41855cabbc6bSPrashanth Sreenivasa 		}
41865cabbc6bSPrashanth Sreenivasa 		if (vdev_obsolete_counts_are_precise(vd)) {
41875cabbc6bSPrashanth Sreenivasa 			ASSERT(vic->vic_mapping_object != 0);
41885cabbc6bSPrashanth Sreenivasa 			precise_vdev_count++;
41895cabbc6bSPrashanth Sreenivasa 		}
41905cabbc6bSPrashanth Sreenivasa 		if (vdev_obsolete_sm_object(vd) != 0) {
41915cabbc6bSPrashanth Sreenivasa 			ASSERT(vic->vic_mapping_object != 0);
41925cabbc6bSPrashanth Sreenivasa 			obsolete_sm_count++;
41935cabbc6bSPrashanth Sreenivasa 		}
41945cabbc6bSPrashanth Sreenivasa 	}
41955cabbc6bSPrashanth Sreenivasa 
41965cabbc6bSPrashanth Sreenivasa 	(void) feature_get_refcount(spa,
41975cabbc6bSPrashanth Sreenivasa 	    &spa_feature_table[SPA_FEATURE_DEVICE_REMOVAL],
41985cabbc6bSPrashanth Sreenivasa 	    &dr_feature_refcount);
41995cabbc6bSPrashanth Sreenivasa 	(void) feature_get_refcount(spa,
42005cabbc6bSPrashanth Sreenivasa 	    &spa_feature_table[SPA_FEATURE_OBSOLETE_COUNTS],
42015cabbc6bSPrashanth Sreenivasa 	    &oc_feature_refcount);
42025cabbc6bSPrashanth Sreenivasa 
42035cabbc6bSPrashanth Sreenivasa 	if (dr_feature_refcount != indirect_vdev_count) {
42045cabbc6bSPrashanth Sreenivasa 		ret = 1;
42055cabbc6bSPrashanth Sreenivasa 		(void) printf("Number of indirect vdevs (%llu) " \
42065cabbc6bSPrashanth Sreenivasa 		    "does not match feature count (%llu)\n",
42075cabbc6bSPrashanth Sreenivasa 		    (u_longlong_t)indirect_vdev_count,
42085cabbc6bSPrashanth Sreenivasa 		    (u_longlong_t)dr_feature_refcount);
42095cabbc6bSPrashanth Sreenivasa 	} else {
42105cabbc6bSPrashanth Sreenivasa 		(void) printf("Verified device_removal feature refcount " \
42115cabbc6bSPrashanth Sreenivasa 		    "of %llu is correct\n",
42125cabbc6bSPrashanth Sreenivasa 		    (u_longlong_t)dr_feature_refcount);
42135cabbc6bSPrashanth Sreenivasa 	}
42145cabbc6bSPrashanth Sreenivasa 
42155cabbc6bSPrashanth Sreenivasa 	if (zap_contains(spa_meta_objset(spa), DMU_POOL_DIRECTORY_OBJECT,
42165cabbc6bSPrashanth Sreenivasa 	    DMU_POOL_OBSOLETE_BPOBJ) == 0) {
42175cabbc6bSPrashanth Sreenivasa 		obsolete_bpobj_count++;
42185cabbc6bSPrashanth Sreenivasa 	}
42195cabbc6bSPrashanth Sreenivasa 
42205cabbc6bSPrashanth Sreenivasa 
42215cabbc6bSPrashanth Sreenivasa 	obsolete_counts_object_count = precise_vdev_count;
42225cabbc6bSPrashanth Sreenivasa 	obsolete_counts_object_count += obsolete_sm_count;
42235cabbc6bSPrashanth Sreenivasa 	obsolete_counts_object_count += obsolete_counts_count;
42245cabbc6bSPrashanth Sreenivasa 	obsolete_counts_object_count += scip_count;
42255cabbc6bSPrashanth Sreenivasa 	obsolete_counts_object_count += obsolete_bpobj_count;
42265cabbc6bSPrashanth Sreenivasa 	obsolete_counts_object_count += remap_deadlist_count;
42275cabbc6bSPrashanth Sreenivasa 
42285cabbc6bSPrashanth Sreenivasa 	if (oc_feature_refcount != obsolete_counts_object_count) {
42295cabbc6bSPrashanth Sreenivasa 		ret = 1;
42305cabbc6bSPrashanth Sreenivasa 		(void) printf("Number of obsolete counts objects (%llu) " \
42315cabbc6bSPrashanth Sreenivasa 		    "does not match feature count (%llu)\n",
42325cabbc6bSPrashanth Sreenivasa 		    (u_longlong_t)obsolete_counts_object_count,
42335cabbc6bSPrashanth Sreenivasa 		    (u_longlong_t)oc_feature_refcount);
42345cabbc6bSPrashanth Sreenivasa 		(void) printf("pv:%llu os:%llu oc:%llu sc:%llu "
42355cabbc6bSPrashanth Sreenivasa 		    "ob:%llu rd:%llu\n",
42365cabbc6bSPrashanth Sreenivasa 		    (u_longlong_t)precise_vdev_count,
42375cabbc6bSPrashanth Sreenivasa 		    (u_longlong_t)obsolete_sm_count,
42385cabbc6bSPrashanth Sreenivasa 		    (u_longlong_t)obsolete_counts_count,
42395cabbc6bSPrashanth Sreenivasa 		    (u_longlong_t)scip_count,
42405cabbc6bSPrashanth Sreenivasa 		    (u_longlong_t)obsolete_bpobj_count,
42415cabbc6bSPrashanth Sreenivasa 		    (u_longlong_t)remap_deadlist_count);
42425cabbc6bSPrashanth Sreenivasa 	} else {
42435cabbc6bSPrashanth Sreenivasa 		(void) printf("Verified indirect_refcount feature refcount " \
42445cabbc6bSPrashanth Sreenivasa 		    "of %llu is correct\n",
42455cabbc6bSPrashanth Sreenivasa 		    (u_longlong_t)oc_feature_refcount);
42465cabbc6bSPrashanth Sreenivasa 	}
42475cabbc6bSPrashanth Sreenivasa 	return (ret);
42485cabbc6bSPrashanth Sreenivasa }
42495cabbc6bSPrashanth Sreenivasa 
4250e0f1c0afSOlaf Faaland static void
4251e0f1c0afSOlaf Faaland zdb_set_skip_mmp(char *target)
4252e0f1c0afSOlaf Faaland {
4253e0f1c0afSOlaf Faaland 	spa_t *spa;
4254e0f1c0afSOlaf Faaland 
4255e0f1c0afSOlaf Faaland 	/*
4256e0f1c0afSOlaf Faaland 	 * Disable the activity check to allow examination of
4257e0f1c0afSOlaf Faaland 	 * active pools.
4258e0f1c0afSOlaf Faaland 	 */
4259e0f1c0afSOlaf Faaland 	mutex_enter(&spa_namespace_lock);
4260e0f1c0afSOlaf Faaland 	if ((spa = spa_lookup(target)) != NULL) {
4261e0f1c0afSOlaf Faaland 		spa->spa_import_flags |= ZFS_IMPORT_SKIP_MMP;
4262e0f1c0afSOlaf Faaland 	}
4263e0f1c0afSOlaf Faaland 	mutex_exit(&spa_namespace_lock);
4264e0f1c0afSOlaf Faaland }
4265e0f1c0afSOlaf Faaland 
426686714001SSerapheim Dimitropoulos #define	BOGUS_SUFFIX "_CHECKPOINTED_UNIVERSE"
426786714001SSerapheim Dimitropoulos /*
426886714001SSerapheim Dimitropoulos  * Import the checkpointed state of the pool specified by the target
426986714001SSerapheim Dimitropoulos  * parameter as readonly. The function also accepts a pool config
427086714001SSerapheim Dimitropoulos  * as an optional parameter, else it attempts to infer the config by
427186714001SSerapheim Dimitropoulos  * the name of the target pool.
427286714001SSerapheim Dimitropoulos  *
427386714001SSerapheim Dimitropoulos  * Note that the checkpointed state's pool name will be the name of
427486714001SSerapheim Dimitropoulos  * the original pool with the above suffix appened to it. In addition,
427586714001SSerapheim Dimitropoulos  * if the target is not a pool name (e.g. a path to a dataset) then
427686714001SSerapheim Dimitropoulos  * the new_path parameter is populated with the updated path to
427786714001SSerapheim Dimitropoulos  * reflect the fact that we are looking into the checkpointed state.
427886714001SSerapheim Dimitropoulos  *
427986714001SSerapheim Dimitropoulos  * The function returns a newly-allocated copy of the name of the
428086714001SSerapheim Dimitropoulos  * pool containing the checkpointed state. When this copy is no
428186714001SSerapheim Dimitropoulos  * longer needed it should be freed with free(3C). Same thing
428286714001SSerapheim Dimitropoulos  * applies to the new_path parameter if allocated.
428386714001SSerapheim Dimitropoulos  */
428486714001SSerapheim Dimitropoulos static char *
428586714001SSerapheim Dimitropoulos import_checkpointed_state(char *target, nvlist_t *cfg, char **new_path)
428686714001SSerapheim Dimitropoulos {
428786714001SSerapheim Dimitropoulos 	int error = 0;
428886714001SSerapheim Dimitropoulos 	char *poolname, *bogus_name;
428986714001SSerapheim Dimitropoulos 
429086714001SSerapheim Dimitropoulos 	/* If the target is not a pool, the extract the pool name */
429186714001SSerapheim Dimitropoulos 	char *path_start = strchr(target, '/');
429286714001SSerapheim Dimitropoulos 	if (path_start != NULL) {
429386714001SSerapheim Dimitropoulos 		size_t poolname_len = path_start - target;
429486714001SSerapheim Dimitropoulos 		poolname = strndup(target, poolname_len);
429586714001SSerapheim Dimitropoulos 	} else {
429686714001SSerapheim Dimitropoulos 		poolname = target;
429786714001SSerapheim Dimitropoulos 	}
429886714001SSerapheim Dimitropoulos 
429986714001SSerapheim Dimitropoulos 	if (cfg == NULL) {
4300e0f1c0afSOlaf Faaland 		zdb_set_skip_mmp(poolname);
430186714001SSerapheim Dimitropoulos 		error = spa_get_stats(poolname, &cfg, NULL, 0);
430286714001SSerapheim Dimitropoulos 		if (error != 0) {
430386714001SSerapheim Dimitropoulos 			fatal("Tried to read config of pool \"%s\" but "
430486714001SSerapheim Dimitropoulos 			    "spa_get_stats() failed with error %d\n",
430586714001SSerapheim Dimitropoulos 			    poolname, error);
430686714001SSerapheim Dimitropoulos 		}
430786714001SSerapheim Dimitropoulos 	}
430886714001SSerapheim Dimitropoulos 
430986714001SSerapheim Dimitropoulos 	(void) asprintf(&bogus_name, "%s%s", poolname, BOGUS_SUFFIX);
431086714001SSerapheim Dimitropoulos 	fnvlist_add_string(cfg, ZPOOL_CONFIG_POOL_NAME, bogus_name);
431186714001SSerapheim Dimitropoulos 
431286714001SSerapheim Dimitropoulos 	error = spa_import(bogus_name, cfg, NULL,
4313e0f1c0afSOlaf Faaland 	    ZFS_IMPORT_MISSING_LOG | ZFS_IMPORT_CHECKPOINT |
4314e0f1c0afSOlaf Faaland 	    ZFS_IMPORT_SKIP_MMP);
431586714001SSerapheim Dimitropoulos 	if (error != 0) {
431686714001SSerapheim Dimitropoulos 		fatal("Tried to import pool \"%s\" but spa_import() failed "
431786714001SSerapheim Dimitropoulos 		    "with error %d\n", bogus_name, error);
431886714001SSerapheim Dimitropoulos 	}
431986714001SSerapheim Dimitropoulos 
432086714001SSerapheim Dimitropoulos 	if (new_path != NULL && path_start != NULL)
432186714001SSerapheim Dimitropoulos 		(void) asprintf(new_path, "%s%s", bogus_name, path_start);
432286714001SSerapheim Dimitropoulos 
432386714001SSerapheim Dimitropoulos 	if (target != poolname)
432486714001SSerapheim Dimitropoulos 		free(poolname);
432586714001SSerapheim Dimitropoulos 
432686714001SSerapheim Dimitropoulos 	return (bogus_name);
432786714001SSerapheim Dimitropoulos }
432886714001SSerapheim Dimitropoulos 
432986714001SSerapheim Dimitropoulos typedef struct verify_checkpoint_sm_entry_cb_arg {
433086714001SSerapheim Dimitropoulos 	vdev_t *vcsec_vd;
433186714001SSerapheim Dimitropoulos 
433286714001SSerapheim Dimitropoulos 	/* the following fields are only used for printing progress */
433386714001SSerapheim Dimitropoulos 	uint64_t vcsec_entryid;
433486714001SSerapheim Dimitropoulos 	uint64_t vcsec_num_entries;
433586714001SSerapheim Dimitropoulos } verify_checkpoint_sm_entry_cb_arg_t;
433686714001SSerapheim Dimitropoulos 
433786714001SSerapheim Dimitropoulos #define	ENTRIES_PER_PROGRESS_UPDATE 10000
433886714001SSerapheim Dimitropoulos 
433986714001SSerapheim Dimitropoulos static int
434017f11284SSerapheim Dimitropoulos verify_checkpoint_sm_entry_cb(space_map_entry_t *sme, void *arg)
434186714001SSerapheim Dimitropoulos {
434286714001SSerapheim Dimitropoulos 	verify_checkpoint_sm_entry_cb_arg_t *vcsec = arg;
434386714001SSerapheim Dimitropoulos 	vdev_t *vd = vcsec->vcsec_vd;
434417f11284SSerapheim Dimitropoulos 	metaslab_t *ms = vd->vdev_ms[sme->sme_offset >> vd->vdev_ms_shift];
434517f11284SSerapheim Dimitropoulos 	uint64_t end = sme->sme_offset + sme->sme_run;
434686714001SSerapheim Dimitropoulos 
434717f11284SSerapheim Dimitropoulos 	ASSERT(sme->sme_type == SM_FREE);
434886714001SSerapheim Dimitropoulos 
434986714001SSerapheim Dimitropoulos 	if ((vcsec->vcsec_entryid % ENTRIES_PER_PROGRESS_UPDATE) == 0) {
435086714001SSerapheim Dimitropoulos 		(void) fprintf(stderr,
435186714001SSerapheim Dimitropoulos 		    "\rverifying vdev %llu, space map entry %llu of %llu ...",
435286714001SSerapheim Dimitropoulos 		    (longlong_t)vd->vdev_id,
435386714001SSerapheim Dimitropoulos 		    (longlong_t)vcsec->vcsec_entryid,
435486714001SSerapheim Dimitropoulos 		    (longlong_t)vcsec->vcsec_num_entries);
435586714001SSerapheim Dimitropoulos 	}
435686714001SSerapheim Dimitropoulos 	vcsec->vcsec_entryid++;
435786714001SSerapheim Dimitropoulos 
435886714001SSerapheim Dimitropoulos 	/*
435986714001SSerapheim Dimitropoulos 	 * See comment in checkpoint_sm_exclude_entry_cb()
436086714001SSerapheim Dimitropoulos 	 */
436117f11284SSerapheim Dimitropoulos 	VERIFY3U(sme->sme_offset, >=, ms->ms_start);
436286714001SSerapheim Dimitropoulos 	VERIFY3U(end, <=, ms->ms_start + ms->ms_size);
436386714001SSerapheim Dimitropoulos 
436486714001SSerapheim Dimitropoulos 	/*
436586714001SSerapheim Dimitropoulos 	 * The entries in the vdev_checkpoint_sm should be marked as
436686714001SSerapheim Dimitropoulos 	 * allocated in the checkpointed state of the pool, therefore
436786714001SSerapheim Dimitropoulos 	 * their respective ms_allocateable trees should not contain them.
436886714001SSerapheim Dimitropoulos 	 */
436986714001SSerapheim Dimitropoulos 	mutex_enter(&ms->ms_lock);
437017f11284SSerapheim Dimitropoulos 	range_tree_verify(ms->ms_allocatable, sme->sme_offset, sme->sme_run);
437186714001SSerapheim Dimitropoulos 	mutex_exit(&ms->ms_lock);
437286714001SSerapheim Dimitropoulos 
437386714001SSerapheim Dimitropoulos 	return (0);
437486714001SSerapheim Dimitropoulos }
437586714001SSerapheim Dimitropoulos 
437686714001SSerapheim Dimitropoulos /*
437786714001SSerapheim Dimitropoulos  * Verify that all segments in the vdev_checkpoint_sm are allocated
437886714001SSerapheim Dimitropoulos  * according to the checkpoint's ms_sm (i.e. are not in the checkpoint's
437986714001SSerapheim Dimitropoulos  * ms_allocatable).
438086714001SSerapheim Dimitropoulos  *
438186714001SSerapheim Dimitropoulos  * Do so by comparing the checkpoint space maps (vdev_checkpoint_sm) of
438286714001SSerapheim Dimitropoulos  * each vdev in the current state of the pool to the metaslab space maps
438386714001SSerapheim Dimitropoulos  * (ms_sm) of the checkpointed state of the pool.
438486714001SSerapheim Dimitropoulos  *
438586714001SSerapheim Dimitropoulos  * Note that the function changes the state of the ms_allocatable
438686714001SSerapheim Dimitropoulos  * trees of the current spa_t. The entries of these ms_allocatable
438786714001SSerapheim Dimitropoulos  * trees are cleared out and then repopulated from with the free
438886714001SSerapheim Dimitropoulos  * entries of their respective ms_sm space maps.
438986714001SSerapheim Dimitropoulos  */
439086714001SSerapheim Dimitropoulos static void
439186714001SSerapheim Dimitropoulos verify_checkpoint_vdev_spacemaps(spa_t *checkpoint, spa_t *current)
439286714001SSerapheim Dimitropoulos {
439386714001SSerapheim Dimitropoulos 	vdev_t *ckpoint_rvd = checkpoint->spa_root_vdev;
439486714001SSerapheim Dimitropoulos 	vdev_t *current_rvd = current->spa_root_vdev;
439586714001SSerapheim Dimitropoulos 
439686714001SSerapheim Dimitropoulos 	load_concrete_ms_allocatable_trees(checkpoint, SM_FREE);
439786714001SSerapheim Dimitropoulos 
439886714001SSerapheim Dimitropoulos 	for (uint64_t c = 0; c < ckpoint_rvd->vdev_children; c++) {
439986714001SSerapheim Dimitropoulos 		vdev_t *ckpoint_vd = ckpoint_rvd->vdev_child[c];
440086714001SSerapheim Dimitropoulos 		vdev_t *current_vd = current_rvd->vdev_child[c];
440186714001SSerapheim Dimitropoulos 
440286714001SSerapheim Dimitropoulos 		space_map_t *checkpoint_sm = NULL;
440386714001SSerapheim Dimitropoulos 		uint64_t checkpoint_sm_obj;
440486714001SSerapheim Dimitropoulos 
440586714001SSerapheim Dimitropoulos 		if (ckpoint_vd->vdev_ops == &vdev_indirect_ops) {
440686714001SSerapheim Dimitropoulos 			/*
440786714001SSerapheim Dimitropoulos 			 * Since we don't allow device removal in a pool
440886714001SSerapheim Dimitropoulos 			 * that has a checkpoint, we expect that all removed
440986714001SSerapheim Dimitropoulos 			 * vdevs were removed from the pool before the
441086714001SSerapheim Dimitropoulos 			 * checkpoint.
441186714001SSerapheim Dimitropoulos 			 */
441286714001SSerapheim Dimitropoulos 			ASSERT3P(current_vd->vdev_ops, ==, &vdev_indirect_ops);
441386714001SSerapheim Dimitropoulos 			continue;
441486714001SSerapheim Dimitropoulos 		}
441586714001SSerapheim Dimitropoulos 
441686714001SSerapheim Dimitropoulos 		/*
441786714001SSerapheim Dimitropoulos 		 * If the checkpoint space map doesn't exist, then nothing
441886714001SSerapheim Dimitropoulos 		 * here is checkpointed so there's nothing to verify.
441986714001SSerapheim Dimitropoulos 		 */
442086714001SSerapheim Dimitropoulos 		if (current_vd->vdev_top_zap == 0 ||
442186714001SSerapheim Dimitropoulos 		    zap_contains(spa_meta_objset(current),
442286714001SSerapheim Dimitropoulos 		    current_vd->vdev_top_zap,
442386714001SSerapheim Dimitropoulos 		    VDEV_TOP_ZAP_POOL_CHECKPOINT_SM) != 0)
442486714001SSerapheim Dimitropoulos 			continue;
442586714001SSerapheim Dimitropoulos 
442686714001SSerapheim Dimitropoulos 		VERIFY0(zap_lookup(spa_meta_objset(current),
442786714001SSerapheim Dimitropoulos 		    current_vd->vdev_top_zap, VDEV_TOP_ZAP_POOL_CHECKPOINT_SM,
442886714001SSerapheim Dimitropoulos 		    sizeof (uint64_t), 1, &checkpoint_sm_obj));
442986714001SSerapheim Dimitropoulos 
443086714001SSerapheim Dimitropoulos 		VERIFY0(space_map_open(&checkpoint_sm, spa_meta_objset(current),
443186714001SSerapheim Dimitropoulos 		    checkpoint_sm_obj, 0, current_vd->vdev_asize,
443286714001SSerapheim Dimitropoulos 		    current_vd->vdev_ashift));
443386714001SSerapheim Dimitropoulos 		space_map_update(checkpoint_sm);
443486714001SSerapheim Dimitropoulos 
443586714001SSerapheim Dimitropoulos 		verify_checkpoint_sm_entry_cb_arg_t vcsec;
443686714001SSerapheim Dimitropoulos 		vcsec.vcsec_vd = ckpoint_vd;
443786714001SSerapheim Dimitropoulos 		vcsec.vcsec_entryid = 0;
443886714001SSerapheim Dimitropoulos 		vcsec.vcsec_num_entries =
443986714001SSerapheim Dimitropoulos 		    space_map_length(checkpoint_sm) / sizeof (uint64_t);
444086714001SSerapheim Dimitropoulos 		VERIFY0(space_map_iterate(checkpoint_sm,
444186714001SSerapheim Dimitropoulos 		    verify_checkpoint_sm_entry_cb, &vcsec));
444286714001SSerapheim Dimitropoulos 		dump_spacemap(current->spa_meta_objset, checkpoint_sm);
444386714001SSerapheim Dimitropoulos 		space_map_close(checkpoint_sm);
444486714001SSerapheim Dimitropoulos 	}
444586714001SSerapheim Dimitropoulos 
444686714001SSerapheim Dimitropoulos 	/*
444786714001SSerapheim Dimitropoulos 	 * If we've added vdevs since we took the checkpoint, ensure
444886714001SSerapheim Dimitropoulos 	 * that their checkpoint space maps are empty.
444986714001SSerapheim Dimitropoulos 	 */
445086714001SSerapheim Dimitropoulos 	if (ckpoint_rvd->vdev_children < current_rvd->vdev_children) {
445186714001SSerapheim Dimitropoulos 		for (uint64_t c = ckpoint_rvd->vdev_children;
445286714001SSerapheim Dimitropoulos 		    c < current_rvd->vdev_children; c++) {
445386714001SSerapheim Dimitropoulos 			vdev_t *current_vd = current_rvd->vdev_child[c];
445486714001SSerapheim Dimitropoulos 			ASSERT3P(current_vd->vdev_checkpoint_sm, ==, NULL);
445586714001SSerapheim Dimitropoulos 		}
445686714001SSerapheim Dimitropoulos 	}
445786714001SSerapheim Dimitropoulos 
445886714001SSerapheim Dimitropoulos 	/* for cleaner progress output */
445986714001SSerapheim Dimitropoulos 	(void) fprintf(stderr, "\n");
446086714001SSerapheim Dimitropoulos }
446186714001SSerapheim Dimitropoulos 
446286714001SSerapheim Dimitropoulos /*
446386714001SSerapheim Dimitropoulos  * Verifies that all space that's allocated in the checkpoint is
446486714001SSerapheim Dimitropoulos  * still allocated in the current version, by checking that everything
446586714001SSerapheim Dimitropoulos  * in checkpoint's ms_allocatable (which is actually allocated, not
446686714001SSerapheim Dimitropoulos  * allocatable/free) is not present in current's ms_allocatable.
446786714001SSerapheim Dimitropoulos  *
446886714001SSerapheim Dimitropoulos  * Note that the function changes the state of the ms_allocatable
446986714001SSerapheim Dimitropoulos  * trees of both spas when called. The entries of all ms_allocatable
447086714001SSerapheim Dimitropoulos  * trees are cleared out and then repopulated from their respective
447186714001SSerapheim Dimitropoulos  * ms_sm space maps. In the checkpointed state we load the allocated
447286714001SSerapheim Dimitropoulos  * entries, and in the current state we load the free entries.
447386714001SSerapheim Dimitropoulos  */
447486714001SSerapheim Dimitropoulos static void
447586714001SSerapheim Dimitropoulos verify_checkpoint_ms_spacemaps(spa_t *checkpoint, spa_t *current)
447686714001SSerapheim Dimitropoulos {
447786714001SSerapheim Dimitropoulos 	vdev_t *ckpoint_rvd = checkpoint->spa_root_vdev;
447886714001SSerapheim Dimitropoulos 	vdev_t *current_rvd = current->spa_root_vdev;
447986714001SSerapheim Dimitropoulos 
448086714001SSerapheim Dimitropoulos 	load_concrete_ms_allocatable_trees(checkpoint, SM_ALLOC);
448186714001SSerapheim Dimitropoulos 	load_concrete_ms_allocatable_trees(current, SM_FREE);
448286714001SSerapheim Dimitropoulos 
448386714001SSerapheim Dimitropoulos 	for (uint64_t i = 0; i < ckpoint_rvd->vdev_children; i++) {
448486714001SSerapheim Dimitropoulos 		vdev_t *ckpoint_vd = ckpoint_rvd->vdev_child[i];
448586714001SSerapheim Dimitropoulos 		vdev_t *current_vd = current_rvd->vdev_child[i];
448686714001SSerapheim Dimitropoulos 
448786714001SSerapheim Dimitropoulos 		if (ckpoint_vd->vdev_ops == &vdev_indirect_ops) {
448886714001SSerapheim Dimitropoulos 			/*
448986714001SSerapheim Dimitropoulos 			 * See comment in verify_checkpoint_vdev_spacemaps()
449086714001SSerapheim Dimitropoulos 			 */
449186714001SSerapheim Dimitropoulos 			ASSERT3P(current_vd->vdev_ops, ==, &vdev_indirect_ops);
449286714001SSerapheim Dimitropoulos 			continue;
449386714001SSerapheim Dimitropoulos 		}
449486714001SSerapheim Dimitropoulos 
449586714001SSerapheim Dimitropoulos 		for (uint64_t m = 0; m < ckpoint_vd->vdev_ms_count; m++) {
449686714001SSerapheim Dimitropoulos 			metaslab_t *ckpoint_msp = ckpoint_vd->vdev_ms[m];
449786714001SSerapheim Dimitropoulos 			metaslab_t *current_msp = current_vd->vdev_ms[m];
449886714001SSerapheim Dimitropoulos 
449986714001SSerapheim Dimitropoulos 			(void) fprintf(stderr,
450086714001SSerapheim Dimitropoulos 			    "\rverifying vdev %llu of %llu, "
450186714001SSerapheim Dimitropoulos 			    "metaslab %llu of %llu ...",
450286714001SSerapheim Dimitropoulos 			    (longlong_t)current_vd->vdev_id,
450386714001SSerapheim Dimitropoulos 			    (longlong_t)current_rvd->vdev_children,
450486714001SSerapheim Dimitropoulos 			    (longlong_t)current_vd->vdev_ms[m]->ms_id,
450586714001SSerapheim Dimitropoulos 			    (longlong_t)current_vd->vdev_ms_count);
450686714001SSerapheim Dimitropoulos 
450786714001SSerapheim Dimitropoulos 			/*
450886714001SSerapheim Dimitropoulos 			 * We walk through the ms_allocatable trees that
450986714001SSerapheim Dimitropoulos 			 * are loaded with the allocated blocks from the
451086714001SSerapheim Dimitropoulos 			 * ms_sm spacemaps of the checkpoint. For each
451186714001SSerapheim Dimitropoulos 			 * one of these ranges we ensure that none of them
451286714001SSerapheim Dimitropoulos 			 * exists in the ms_allocatable trees of the
451386714001SSerapheim Dimitropoulos 			 * current state which are loaded with the ranges
451486714001SSerapheim Dimitropoulos 			 * that are currently free.
451586714001SSerapheim Dimitropoulos 			 *
451686714001SSerapheim Dimitropoulos 			 * This way we ensure that none of the blocks that
451786714001SSerapheim Dimitropoulos 			 * are part of the checkpoint were freed by mistake.
451886714001SSerapheim Dimitropoulos 			 */
451986714001SSerapheim Dimitropoulos 			range_tree_walk(ckpoint_msp->ms_allocatable,
452086714001SSerapheim Dimitropoulos 			    (range_tree_func_t *)range_tree_verify,
452186714001SSerapheim Dimitropoulos 			    current_msp->ms_allocatable);
452286714001SSerapheim Dimitropoulos 		}
452386714001SSerapheim Dimitropoulos 	}
452486714001SSerapheim Dimitropoulos 
452586714001SSerapheim Dimitropoulos 	/* for cleaner progress output */
452686714001SSerapheim Dimitropoulos 	(void) fprintf(stderr, "\n");
452786714001SSerapheim Dimitropoulos }
452886714001SSerapheim Dimitropoulos 
452986714001SSerapheim Dimitropoulos static void
453086714001SSerapheim Dimitropoulos verify_checkpoint_blocks(spa_t *spa)
453186714001SSerapheim Dimitropoulos {
453286714001SSerapheim Dimitropoulos 	spa_t *checkpoint_spa;
453386714001SSerapheim Dimitropoulos 	char *checkpoint_pool;
453486714001SSerapheim Dimitropoulos 	nvlist_t *config = NULL;
453586714001SSerapheim Dimitropoulos 	int error = 0;
453686714001SSerapheim Dimitropoulos 
453786714001SSerapheim Dimitropoulos 	/*
453886714001SSerapheim Dimitropoulos 	 * We import the checkpointed state of the pool (under a different
453986714001SSerapheim Dimitropoulos 	 * name) so we can do verification on it against the current state
454086714001SSerapheim Dimitropoulos 	 * of the pool.
454186714001SSerapheim Dimitropoulos 	 */
454286714001SSerapheim Dimitropoulos 	checkpoint_pool = import_checkpointed_state(spa->spa_name, config,
454386714001SSerapheim Dimitropoulos 	    NULL);
454486714001SSerapheim Dimitropoulos 	ASSERT(strcmp(spa->spa_name, checkpoint_pool) != 0);
454586714001SSerapheim Dimitropoulos 
454686714001SSerapheim Dimitropoulos 	error = spa_open(checkpoint_pool, &checkpoint_spa, FTAG);
454786714001SSerapheim Dimitropoulos 	if (error != 0) {
454886714001SSerapheim Dimitropoulos 		fatal("Tried to open pool \"%s\" but spa_open() failed with "
454986714001SSerapheim Dimitropoulos 		    "error %d\n", checkpoint_pool, error);
455086714001SSerapheim Dimitropoulos 	}
455186714001SSerapheim Dimitropoulos 
455286714001SSerapheim Dimitropoulos 	/*
455386714001SSerapheim Dimitropoulos 	 * Ensure that ranges in the checkpoint space maps of each vdev
455486714001SSerapheim Dimitropoulos 	 * are allocated according to the checkpointed state's metaslab
455586714001SSerapheim Dimitropoulos 	 * space maps.
455686714001SSerapheim Dimitropoulos 	 */
455786714001SSerapheim Dimitropoulos 	verify_checkpoint_vdev_spacemaps(checkpoint_spa, spa);
455886714001SSerapheim Dimitropoulos 
455986714001SSerapheim Dimitropoulos 	/*
456086714001SSerapheim Dimitropoulos 	 * Ensure that allocated ranges in the checkpoint's metaslab
456186714001SSerapheim Dimitropoulos 	 * space maps remain allocated in the metaslab space maps of
456286714001SSerapheim Dimitropoulos 	 * the current state.
456386714001SSerapheim Dimitropoulos 	 */
456486714001SSerapheim Dimitropoulos 	verify_checkpoint_ms_spacemaps(checkpoint_spa, spa);
456586714001SSerapheim Dimitropoulos 
456686714001SSerapheim Dimitropoulos 	/*
456786714001SSerapheim Dimitropoulos 	 * Once we are done, we get rid of the checkpointed state.
456886714001SSerapheim Dimitropoulos 	 */
456986714001SSerapheim Dimitropoulos 	spa_close(checkpoint_spa, FTAG);
457086714001SSerapheim Dimitropoulos 	free(checkpoint_pool);
457186714001SSerapheim Dimitropoulos }
457286714001SSerapheim Dimitropoulos 
457386714001SSerapheim Dimitropoulos static void
457486714001SSerapheim Dimitropoulos dump_leftover_checkpoint_blocks(spa_t *spa)
457586714001SSerapheim Dimitropoulos {
457686714001SSerapheim Dimitropoulos 	vdev_t *rvd = spa->spa_root_vdev;
457786714001SSerapheim Dimitropoulos 
457886714001SSerapheim Dimitropoulos 	for (uint64_t i = 0; i < rvd->vdev_children; i++) {
457986714001SSerapheim Dimitropoulos 		vdev_t *vd = rvd->vdev_child[i];
458086714001SSerapheim Dimitropoulos 
458186714001SSerapheim Dimitropoulos 		space_map_t *checkpoint_sm = NULL;
458286714001SSerapheim Dimitropoulos 		uint64_t checkpoint_sm_obj;
458386714001SSerapheim Dimitropoulos 
458486714001SSerapheim Dimitropoulos 		if (vd->vdev_top_zap == 0)
458586714001SSerapheim Dimitropoulos 			continue;
458686714001SSerapheim Dimitropoulos 
458786714001SSerapheim Dimitropoulos 		if (zap_contains(spa_meta_objset(spa), vd->vdev_top_zap,
458886714001SSerapheim Dimitropoulos 		    VDEV_TOP_ZAP_POOL_CHECKPOINT_SM) != 0)
458986714001SSerapheim Dimitropoulos 			continue;
459086714001SSerapheim Dimitropoulos 
459186714001SSerapheim Dimitropoulos 		VERIFY0(zap_lookup(spa_meta_objset(spa), vd->vdev_top_zap,
459286714001SSerapheim Dimitropoulos 		    VDEV_TOP_ZAP_POOL_CHECKPOINT_SM,
459386714001SSerapheim Dimitropoulos 		    sizeof (uint64_t), 1, &checkpoint_sm_obj));
459486714001SSerapheim Dimitropoulos 
459586714001SSerapheim Dimitropoulos 		VERIFY0(space_map_open(&checkpoint_sm, spa_meta_objset(spa),
459686714001SSerapheim Dimitropoulos 		    checkpoint_sm_obj, 0, vd->vdev_asize, vd->vdev_ashift));
459786714001SSerapheim Dimitropoulos 		space_map_update(checkpoint_sm);
459886714001SSerapheim Dimitropoulos 		dump_spacemap(spa->spa_meta_objset, checkpoint_sm);
459986714001SSerapheim Dimitropoulos 		space_map_close(checkpoint_sm);
460086714001SSerapheim Dimitropoulos 	}
460186714001SSerapheim Dimitropoulos }
460286714001SSerapheim Dimitropoulos 
460386714001SSerapheim Dimitropoulos static int
460486714001SSerapheim Dimitropoulos verify_checkpoint(spa_t *spa)
460586714001SSerapheim Dimitropoulos {
460686714001SSerapheim Dimitropoulos 	uberblock_t checkpoint;
460786714001SSerapheim Dimitropoulos 	int error;
460886714001SSerapheim Dimitropoulos 
460986714001SSerapheim Dimitropoulos 	if (!spa_feature_is_active(spa, SPA_FEATURE_POOL_CHECKPOINT))
461086714001SSerapheim Dimitropoulos 		return (0);
461186714001SSerapheim Dimitropoulos 
461286714001SSerapheim Dimitropoulos 	error = zap_lookup(spa->spa_meta_objset, DMU_POOL_DIRECTORY_OBJECT,
461386714001SSerapheim Dimitropoulos 	    DMU_POOL_ZPOOL_CHECKPOINT, sizeof (uint64_t),
461486714001SSerapheim Dimitropoulos 	    sizeof (uberblock_t) / sizeof (uint64_t), &checkpoint);
461586714001SSerapheim Dimitropoulos 
461617f11284SSerapheim Dimitropoulos 	if (error == ENOENT && !dump_opt['L']) {
461786714001SSerapheim Dimitropoulos 		/*
461886714001SSerapheim Dimitropoulos 		 * If the feature is active but the uberblock is missing
461986714001SSerapheim Dimitropoulos 		 * then we must be in the middle of discarding the
462086714001SSerapheim Dimitropoulos 		 * checkpoint.
462186714001SSerapheim Dimitropoulos 		 */
462286714001SSerapheim Dimitropoulos 		(void) printf("\nPartially discarded checkpoint "
462386714001SSerapheim Dimitropoulos 		    "state found:\n");
462486714001SSerapheim Dimitropoulos 		dump_leftover_checkpoint_blocks(spa);
462586714001SSerapheim Dimitropoulos 		return (0);
462686714001SSerapheim Dimitropoulos 	} else if (error != 0) {
462786714001SSerapheim Dimitropoulos 		(void) printf("lookup error %d when looking for "
462886714001SSerapheim Dimitropoulos 		    "checkpointed uberblock in MOS\n", error);
462986714001SSerapheim Dimitropoulos 		return (error);
463086714001SSerapheim Dimitropoulos 	}
463186714001SSerapheim Dimitropoulos 	dump_uberblock(&checkpoint, "\nCheckpointed uberblock found:\n", "\n");
463286714001SSerapheim Dimitropoulos 
463386714001SSerapheim Dimitropoulos 	if (checkpoint.ub_checkpoint_txg == 0) {
463486714001SSerapheim Dimitropoulos 		(void) printf("\nub_checkpoint_txg not set in checkpointed "
463586714001SSerapheim Dimitropoulos 		    "uberblock\n");
463686714001SSerapheim Dimitropoulos 		error = 3;
463786714001SSerapheim Dimitropoulos 	}
463886714001SSerapheim Dimitropoulos 
463917f11284SSerapheim Dimitropoulos 	if (error == 0 && !dump_opt['L'])
464086714001SSerapheim Dimitropoulos 		verify_checkpoint_blocks(spa);
464186714001SSerapheim Dimitropoulos 
464286714001SSerapheim Dimitropoulos 	return (error);
464386714001SSerapheim Dimitropoulos }
464486714001SSerapheim Dimitropoulos 
464517fb938fSMatthew Ahrens /* ARGSUSED */
464617fb938fSMatthew Ahrens static void
464717fb938fSMatthew Ahrens mos_leaks_cb(void *arg, uint64_t start, uint64_t size)
464817fb938fSMatthew Ahrens {
464917fb938fSMatthew Ahrens 	for (uint64_t i = start; i < size; i++) {
465017fb938fSMatthew Ahrens 		(void) printf("MOS object %llu referenced but not allocated\n",
465117fb938fSMatthew Ahrens 		    (u_longlong_t)i);
465217fb938fSMatthew Ahrens 	}
465317fb938fSMatthew Ahrens }
465417fb938fSMatthew Ahrens 
465517fb938fSMatthew Ahrens static range_tree_t *mos_refd_objs;
465617fb938fSMatthew Ahrens 
465717fb938fSMatthew Ahrens static void
465817fb938fSMatthew Ahrens mos_obj_refd(uint64_t obj)
465917fb938fSMatthew Ahrens {
466017fb938fSMatthew Ahrens 	if (obj != 0 && mos_refd_objs != NULL)
466117fb938fSMatthew Ahrens 		range_tree_add(mos_refd_objs, obj, 1);
466217fb938fSMatthew Ahrens }
466317fb938fSMatthew Ahrens 
466417fb938fSMatthew Ahrens static void
466517fb938fSMatthew Ahrens mos_leak_vdev(vdev_t *vd)
466617fb938fSMatthew Ahrens {
466717fb938fSMatthew Ahrens 	mos_obj_refd(vd->vdev_dtl_object);
466817fb938fSMatthew Ahrens 	mos_obj_refd(vd->vdev_ms_array);
466917fb938fSMatthew Ahrens 	mos_obj_refd(vd->vdev_top_zap);
467017fb938fSMatthew Ahrens 	mos_obj_refd(vd->vdev_indirect_config.vic_births_object);
467117fb938fSMatthew Ahrens 	mos_obj_refd(vd->vdev_indirect_config.vic_mapping_object);
467217fb938fSMatthew Ahrens 	mos_obj_refd(vd->vdev_leaf_zap);
467317fb938fSMatthew Ahrens 	if (vd->vdev_checkpoint_sm != NULL)
467417fb938fSMatthew Ahrens 		mos_obj_refd(vd->vdev_checkpoint_sm->sm_object);
467517fb938fSMatthew Ahrens 	if (vd->vdev_indirect_mapping != NULL) {
467617fb938fSMatthew Ahrens 		mos_obj_refd(vd->vdev_indirect_mapping->
467717fb938fSMatthew Ahrens 		    vim_phys->vimp_counts_object);
467817fb938fSMatthew Ahrens 	}
467917fb938fSMatthew Ahrens 	if (vd->vdev_obsolete_sm != NULL)
468017fb938fSMatthew Ahrens 		mos_obj_refd(vd->vdev_obsolete_sm->sm_object);
468117fb938fSMatthew Ahrens 
468217fb938fSMatthew Ahrens 	for (uint64_t m = 0; m < vd->vdev_ms_count; m++) {
468317fb938fSMatthew Ahrens 		metaslab_t *ms = vd->vdev_ms[m];
468417fb938fSMatthew Ahrens 		mos_obj_refd(space_map_object(ms->ms_sm));
468517fb938fSMatthew Ahrens 	}
468617fb938fSMatthew Ahrens 
468717fb938fSMatthew Ahrens 	for (uint64_t c = 0; c < vd->vdev_children; c++) {
468817fb938fSMatthew Ahrens 		mos_leak_vdev(vd->vdev_child[c]);
468917fb938fSMatthew Ahrens 	}
469017fb938fSMatthew Ahrens }
469117fb938fSMatthew Ahrens 
469217fb938fSMatthew Ahrens static int
469317fb938fSMatthew Ahrens dump_mos_leaks(spa_t *spa)
469417fb938fSMatthew Ahrens {
469517fb938fSMatthew Ahrens 	int rv = 0;
469617fb938fSMatthew Ahrens 	objset_t *mos = spa->spa_meta_objset;
469717fb938fSMatthew Ahrens 	dsl_pool_t *dp = spa->spa_dsl_pool;
469817fb938fSMatthew Ahrens 
469917fb938fSMatthew Ahrens 	/* Visit and mark all referenced objects in the MOS */
470017fb938fSMatthew Ahrens 
470117fb938fSMatthew Ahrens 	mos_obj_refd(DMU_POOL_DIRECTORY_OBJECT);
470217fb938fSMatthew Ahrens 	mos_obj_refd(spa->spa_pool_props_object);
470317fb938fSMatthew Ahrens 	mos_obj_refd(spa->spa_config_object);
470417fb938fSMatthew Ahrens 	mos_obj_refd(spa->spa_ddt_stat_object);
470517fb938fSMatthew Ahrens 	mos_obj_refd(spa->spa_feat_desc_obj);
470617fb938fSMatthew Ahrens 	mos_obj_refd(spa->spa_feat_enabled_txg_obj);
470717fb938fSMatthew Ahrens 	mos_obj_refd(spa->spa_feat_for_read_obj);
470817fb938fSMatthew Ahrens 	mos_obj_refd(spa->spa_feat_for_write_obj);
470917fb938fSMatthew Ahrens 	mos_obj_refd(spa->spa_history);
471017fb938fSMatthew Ahrens 	mos_obj_refd(spa->spa_errlog_last);
471117fb938fSMatthew Ahrens 	mos_obj_refd(spa->spa_errlog_scrub);
471217fb938fSMatthew Ahrens 	mos_obj_refd(spa->spa_all_vdev_zaps);
471317fb938fSMatthew Ahrens 	mos_obj_refd(spa->spa_dsl_pool->dp_bptree_obj);
471417fb938fSMatthew Ahrens 	mos_obj_refd(spa->spa_dsl_pool->dp_tmp_userrefs_obj);
471517fb938fSMatthew Ahrens 	mos_obj_refd(spa->spa_dsl_pool->dp_scan->scn_phys.scn_queue_obj);
471617fb938fSMatthew Ahrens 	bpobj_count_refd(&spa->spa_deferred_bpobj);
471717fb938fSMatthew Ahrens 	mos_obj_refd(dp->dp_empty_bpobj);
471817fb938fSMatthew Ahrens 	bpobj_count_refd(&dp->dp_obsolete_bpobj);
471917fb938fSMatthew Ahrens 	bpobj_count_refd(&dp->dp_free_bpobj);
472017fb938fSMatthew Ahrens 	mos_obj_refd(spa->spa_l2cache.sav_object);
472117fb938fSMatthew Ahrens 	mos_obj_refd(spa->spa_spares.sav_object);
472217fb938fSMatthew Ahrens 
472317fb938fSMatthew Ahrens 	mos_obj_refd(spa->spa_condensing_indirect_phys.
472417fb938fSMatthew Ahrens 	    scip_next_mapping_object);
472517fb938fSMatthew Ahrens 	mos_obj_refd(spa->spa_condensing_indirect_phys.
472617fb938fSMatthew Ahrens 	    scip_prev_obsolete_sm_object);
472717fb938fSMatthew Ahrens 	if (spa->spa_condensing_indirect_phys.scip_next_mapping_object != 0) {
472817fb938fSMatthew Ahrens 		vdev_indirect_mapping_t *vim =
472917fb938fSMatthew Ahrens 		    vdev_indirect_mapping_open(mos,
473017fb938fSMatthew Ahrens 		    spa->spa_condensing_indirect_phys.scip_next_mapping_object);
473117fb938fSMatthew Ahrens 		mos_obj_refd(vim->vim_phys->vimp_counts_object);
473217fb938fSMatthew Ahrens 		vdev_indirect_mapping_close(vim);
473317fb938fSMatthew Ahrens 	}
473417fb938fSMatthew Ahrens 
473517fb938fSMatthew Ahrens 	if (dp->dp_origin_snap != NULL) {
473617fb938fSMatthew Ahrens 		dsl_dataset_t *ds;
473717fb938fSMatthew Ahrens 
473817fb938fSMatthew Ahrens 		dsl_pool_config_enter(dp, FTAG);
473917fb938fSMatthew Ahrens 		VERIFY0(dsl_dataset_hold_obj(dp,
474017fb938fSMatthew Ahrens 		    dsl_dataset_phys(dp->dp_origin_snap)->ds_next_snap_obj,
474117fb938fSMatthew Ahrens 		    FTAG, &ds));
474217fb938fSMatthew Ahrens 		count_ds_mos_objects(ds);
474317fb938fSMatthew Ahrens 		dump_deadlist(&ds->ds_deadlist);
474417fb938fSMatthew Ahrens 		dsl_dataset_rele(ds, FTAG);
474517fb938fSMatthew Ahrens 		dsl_pool_config_exit(dp, FTAG);
474617fb938fSMatthew Ahrens 
474717fb938fSMatthew Ahrens 		count_ds_mos_objects(dp->dp_origin_snap);
474817fb938fSMatthew Ahrens 		dump_deadlist(&dp->dp_origin_snap->ds_deadlist);
474917fb938fSMatthew Ahrens 	}
475017fb938fSMatthew Ahrens 	count_dir_mos_objects(dp->dp_mos_dir);
475117fb938fSMatthew Ahrens 	if (dp->dp_free_dir != NULL)
475217fb938fSMatthew Ahrens 		count_dir_mos_objects(dp->dp_free_dir);
475317fb938fSMatthew Ahrens 	if (dp->dp_leak_dir != NULL)
475417fb938fSMatthew Ahrens 		count_dir_mos_objects(dp->dp_leak_dir);
475517fb938fSMatthew Ahrens 
475617fb938fSMatthew Ahrens 	mos_leak_vdev(spa->spa_root_vdev);
475717fb938fSMatthew Ahrens 
475817fb938fSMatthew Ahrens 	for (uint64_t class = 0; class < DDT_CLASSES; class++) {
475917fb938fSMatthew Ahrens 		for (uint64_t type = 0; type < DDT_TYPES; type++) {
476017fb938fSMatthew Ahrens 			for (uint64_t cksum = 0;
476117fb938fSMatthew Ahrens 			    cksum < ZIO_CHECKSUM_FUNCTIONS; cksum++) {
476217fb938fSMatthew Ahrens 				ddt_t *ddt = spa->spa_ddt[cksum];
476317fb938fSMatthew Ahrens 				mos_obj_refd(ddt->ddt_object[type][class]);
476417fb938fSMatthew Ahrens 			}
476517fb938fSMatthew Ahrens 		}
476617fb938fSMatthew Ahrens 	}
476717fb938fSMatthew Ahrens 
476817fb938fSMatthew Ahrens 	/*
476917fb938fSMatthew Ahrens 	 * Visit all allocated objects and make sure they are referenced.
477017fb938fSMatthew Ahrens 	 */
477117fb938fSMatthew Ahrens 	uint64_t object = 0;
477217fb938fSMatthew Ahrens 	while (dmu_object_next(mos, &object, B_FALSE, 0) == 0) {
477317fb938fSMatthew Ahrens 		if (range_tree_contains(mos_refd_objs, object, 1)) {
477417fb938fSMatthew Ahrens 			range_tree_remove(mos_refd_objs, object, 1);
477517fb938fSMatthew Ahrens 		} else {
477617fb938fSMatthew Ahrens 			dmu_object_info_t doi;
477717fb938fSMatthew Ahrens 			const char *name;
477817fb938fSMatthew Ahrens 			dmu_object_info(mos, object, &doi);
477917fb938fSMatthew Ahrens 			if (doi.doi_type & DMU_OT_NEWTYPE) {
478017fb938fSMatthew Ahrens 				dmu_object_byteswap_t bswap =
478117fb938fSMatthew Ahrens 				    DMU_OT_BYTESWAP(doi.doi_type);
478217fb938fSMatthew Ahrens 				name = dmu_ot_byteswap[bswap].ob_name;
478317fb938fSMatthew Ahrens 			} else {
478417fb938fSMatthew Ahrens 				name = dmu_ot[doi.doi_type].ot_name;
478517fb938fSMatthew Ahrens 			}
478617fb938fSMatthew Ahrens 
478717fb938fSMatthew Ahrens 			(void) printf("MOS object %llu (%s) leaked\n",
478817fb938fSMatthew Ahrens 			    (u_longlong_t)object, name);
478917fb938fSMatthew Ahrens 			rv = 2;
479017fb938fSMatthew Ahrens 		}
479117fb938fSMatthew Ahrens 	}
479217fb938fSMatthew Ahrens 	(void) range_tree_walk(mos_refd_objs, mos_leaks_cb, NULL);
479317fb938fSMatthew Ahrens 	if (!range_tree_is_empty(mos_refd_objs))
479417fb938fSMatthew Ahrens 		rv = 2;
479517fb938fSMatthew Ahrens 	range_tree_vacate(mos_refd_objs, NULL, NULL);
479617fb938fSMatthew Ahrens 	range_tree_destroy(mos_refd_objs);
479717fb938fSMatthew Ahrens 	return (rv);
479817fb938fSMatthew Ahrens }
479917fb938fSMatthew Ahrens 
4800fa9e4066Sahrens static void
4801fa9e4066Sahrens dump_zpool(spa_t *spa)
4802fa9e4066Sahrens {
4803fa9e4066Sahrens 	dsl_pool_t *dp = spa_get_dsl(spa);
4804fa9e4066Sahrens 	int rc = 0;
4805fa9e4066Sahrens 
4806b24ab676SJeff Bonwick 	if (dump_opt['S']) {
4807b24ab676SJeff Bonwick 		dump_simulated_ddt(spa);
4808b24ab676SJeff Bonwick 		return;
4809b24ab676SJeff Bonwick 	}
4810b24ab676SJeff Bonwick 
481107428bdfSVictor Latushkin 	if (!dump_opt['e'] && dump_opt['C'] > 1) {
481207428bdfSVictor Latushkin 		(void) printf("\nCached configuration:\n");
481307428bdfSVictor Latushkin 		dump_nvlist(spa->spa_config, 8);
481407428bdfSVictor Latushkin 	}
481507428bdfSVictor Latushkin 
481607428bdfSVictor Latushkin 	if (dump_opt['C'])
481707428bdfSVictor Latushkin 		dump_config(spa);
481807428bdfSVictor Latushkin 
4819fa9e4066Sahrens 	if (dump_opt['u'])
482053b9a4a9SVictor Latushkin 		dump_uberblock(&spa->spa_uberblock, "\nUberblock:\n", "\n");
4821fa9e4066Sahrens 
4822b24ab676SJeff Bonwick 	if (dump_opt['D'])
4823b24ab676SJeff Bonwick 		dump_all_ddts(spa);
4824b24ab676SJeff Bonwick 
482587219db7SVictor Latushkin 	if (dump_opt['d'] > 2 || dump_opt['m'])
482687219db7SVictor Latushkin 		dump_metaslabs(spa);
48272e4c9986SGeorge Wilson 	if (dump_opt['M'])
48282e4c9986SGeorge Wilson 		dump_metaslab_groups(spa);
482987219db7SVictor Latushkin 
483087219db7SVictor Latushkin 	if (dump_opt['d'] || dump_opt['i']) {
483117fb938fSMatthew Ahrens 		mos_refd_objs = range_tree_create(NULL, NULL);
4832fa9e4066Sahrens 		dump_dir(dp->dp_meta_objset);
483317fb938fSMatthew Ahrens 
4834fa9e4066Sahrens 		if (dump_opt['d'] >= 3) {
48355cabbc6bSPrashanth Sreenivasa 			dsl_pool_t *dp = spa->spa_dsl_pool;
4836732885fcSMatthew Ahrens 			dump_full_bpobj(&spa->spa_deferred_bpobj,
4837d0475637SMatthew Ahrens 			    "Deferred frees", 0);
4838cde58dbcSMatthew Ahrens 			if (spa_version(spa) >= SPA_VERSION_DEADLISTS) {
48395cabbc6bSPrashanth Sreenivasa 				dump_full_bpobj(&dp->dp_free_bpobj,
4840d0475637SMatthew Ahrens 				    "Pool snapshot frees", 0);
4841ad135b5dSChristopher Siden 			}
48425cabbc6bSPrashanth Sreenivasa 			if (bpobj_is_open(&dp->dp_obsolete_bpobj)) {
48435cabbc6bSPrashanth Sreenivasa 				ASSERT(spa_feature_is_enabled(spa,
48445cabbc6bSPrashanth Sreenivasa 				    SPA_FEATURE_DEVICE_REMOVAL));
48455cabbc6bSPrashanth Sreenivasa 				dump_full_bpobj(&dp->dp_obsolete_bpobj,
48465cabbc6bSPrashanth Sreenivasa 				    "Pool obsolete blocks", 0);
48475cabbc6bSPrashanth Sreenivasa 			}
4848ad135b5dSChristopher Siden 
4849ad135b5dSChristopher Siden 			if (spa_feature_is_active(spa,
48502acef22dSMatthew Ahrens 			    SPA_FEATURE_ASYNC_DESTROY)) {
4851ad135b5dSChristopher Siden 				dump_bptree(spa->spa_meta_objset,
48525cabbc6bSPrashanth Sreenivasa 				    dp->dp_bptree_obj,
4853ad135b5dSChristopher Siden 				    "Pool dataset frees");
4854cde58dbcSMatthew Ahrens 			}
4855fa9e4066Sahrens 			dump_dtl(spa->spa_root_vdev, 0);
4856fa9e4066Sahrens 		}
485707428bdfSVictor Latushkin 		(void) dmu_objset_find(spa_name(spa), dump_one_dir,
485807428bdfSVictor Latushkin 		    NULL, DS_FIND_SNAPSHOTS | DS_FIND_CHILDREN);
4859b5152584SMatthew Ahrens 
486017fb938fSMatthew Ahrens 		if (rc == 0 && !dump_opt['L'])
486117fb938fSMatthew Ahrens 			rc = dump_mos_leaks(spa);
486217fb938fSMatthew Ahrens 
4863ca0cc391SMatthew Ahrens 		for (spa_feature_t f = 0; f < SPA_FEATURES; f++) {
4864ca0cc391SMatthew Ahrens 			uint64_t refcount;
4865ca0cc391SMatthew Ahrens 
4866ca0cc391SMatthew Ahrens 			if (!(spa_feature_table[f].fi_flags &
4867c5d1600cSMatthew Ahrens 			    ZFEATURE_FLAG_PER_DATASET) ||
4868c5d1600cSMatthew Ahrens 			    !spa_feature_is_enabled(spa, f)) {
4869ca0cc391SMatthew Ahrens 				ASSERT0(dataset_feature_count[f]);
4870ca0cc391SMatthew Ahrens 				continue;
4871ca0cc391SMatthew Ahrens 			}
4872ca0cc391SMatthew Ahrens 			(void) feature_get_refcount(spa,
4873ca0cc391SMatthew Ahrens 			    &spa_feature_table[f], &refcount);
4874ca0cc391SMatthew Ahrens 			if (dataset_feature_count[f] != refcount) {
4875ca0cc391SMatthew Ahrens 				(void) printf("%s feature refcount mismatch: "
4876ca0cc391SMatthew Ahrens 				    "%lld datasets != %lld refcount\n",
4877ca0cc391SMatthew Ahrens 				    spa_feature_table[f].fi_uname,
4878ca0cc391SMatthew Ahrens 				    (longlong_t)dataset_feature_count[f],
4879ca0cc391SMatthew Ahrens 				    (longlong_t)refcount);
4880ca0cc391SMatthew Ahrens 				rc = 2;
4881ca0cc391SMatthew Ahrens 			} else {
4882ca0cc391SMatthew Ahrens 				(void) printf("Verified %s feature refcount "
4883ca0cc391SMatthew Ahrens 				    "of %llu is correct\n",
4884ca0cc391SMatthew Ahrens 				    spa_feature_table[f].fi_uname,
4885ca0cc391SMatthew Ahrens 				    (longlong_t)refcount);
4886ca0cc391SMatthew Ahrens 			}
4887b5152584SMatthew Ahrens 		}
48885cabbc6bSPrashanth Sreenivasa 
48895cabbc6bSPrashanth Sreenivasa 		if (rc == 0) {
48905cabbc6bSPrashanth Sreenivasa 			rc = verify_device_removal_feature_counts(spa);
48915cabbc6bSPrashanth Sreenivasa 		}
4892fa9e4066Sahrens 	}
489317fb938fSMatthew Ahrens 
4894b5152584SMatthew Ahrens 	if (rc == 0 && (dump_opt['b'] || dump_opt['c']))
4895fa9e4066Sahrens 		rc = dump_block_stats(spa);
4896fa9e4066Sahrens 
48970713e232SGeorge Wilson 	if (rc == 0)
48980713e232SGeorge Wilson 		rc = verify_spacemap_refcounts(spa);
48990713e232SGeorge Wilson 
4900fa9e4066Sahrens 	if (dump_opt['s'])
4901fa9e4066Sahrens 		show_pool_stats(spa);
4902fa9e4066Sahrens 
49038f18d1faSGeorge Wilson 	if (dump_opt['h'])
49048f18d1faSGeorge Wilson 		dump_history(spa);
49058f18d1faSGeorge Wilson 
490617f11284SSerapheim Dimitropoulos 	if (rc == 0)
490786714001SSerapheim Dimitropoulos 		rc = verify_checkpoint(spa);
490886714001SSerapheim Dimitropoulos 
490929bdd2f9SPavel Zakharov 	if (rc != 0) {
491029bdd2f9SPavel Zakharov 		dump_debug_buffer();
4911fa9e4066Sahrens 		exit(rc);
491229bdd2f9SPavel Zakharov 	}
4913fa9e4066Sahrens }
4914fa9e4066Sahrens 
/*
 * Option bits for the raw block reader, carried in the "flags" argument
 * of the zdb_dump_*() and zdb_print_blkptr() routines.  Each flag
 * occupies its own bit so that flags can be OR-ed together.
 */
#define	ZDB_FLAG_CHECKSUM	(1 << 0)	/* parsed as taking an argument */
#define	ZDB_FLAG_DECOMPRESS	(1 << 1)	/* try to decompress the data */
#define	ZDB_FLAG_BSWAP		(1 << 2)	/* byteswap before dumping */
#define	ZDB_FLAG_GBH		(1 << 3)	/* block is a gang block header */
#define	ZDB_FLAG_INDIRECT	(1 << 4)	/* presumably: indirect block */
#define	ZDB_FLAG_PHYS		(1 << 5)	/* presumably: physical offset */
#define	ZDB_FLAG_RAW		(1 << 6)	/* dump raw data */
#define	ZDB_FLAG_PRINT_BLKPTR	(1 << 7)	/* decode a blkptr in the block */

/*
 * Maps a flag character (used as an unsigned char index) to its
 * ZDB_FLAG_* bit; an entry of 0 means the character is not a valid flag.
 */
static int flagbits[256];
492544cd46caSbillm 
492644cd46caSbillm static void
492744cd46caSbillm zdb_print_blkptr(blkptr_t *bp, int flags)
492844cd46caSbillm {
4929b24ab676SJeff Bonwick 	char blkbuf[BP_SPRINTF_LEN];
493044cd46caSbillm 
493144cd46caSbillm 	if (flags & ZDB_FLAG_BSWAP)
493244cd46caSbillm 		byteswap_uint64_array((void *)bp, sizeof (blkptr_t));
4933b24ab676SJeff Bonwick 
493443466aaeSMax Grossman 	snprintf_blkptr(blkbuf, sizeof (blkbuf), bp);
4935b24ab676SJeff Bonwick 	(void) printf("%s\n", blkbuf);
493644cd46caSbillm }
493744cd46caSbillm 
493844cd46caSbillm static void
493944cd46caSbillm zdb_dump_indirect(blkptr_t *bp, int nbps, int flags)
494044cd46caSbillm {
494144cd46caSbillm 	int i;
494244cd46caSbillm 
494344cd46caSbillm 	for (i = 0; i < nbps; i++)
494444cd46caSbillm 		zdb_print_blkptr(&bp[i], flags);
494544cd46caSbillm }
494644cd46caSbillm 
494744cd46caSbillm static void
494844cd46caSbillm zdb_dump_gbh(void *buf, int flags)
494944cd46caSbillm {
495044cd46caSbillm 	zdb_dump_indirect((blkptr_t *)buf, SPA_GBH_NBLKPTRS, flags);
495144cd46caSbillm }
495244cd46caSbillm 
495344cd46caSbillm static void
495444cd46caSbillm zdb_dump_block_raw(void *buf, uint64_t size, int flags)
495544cd46caSbillm {
495644cd46caSbillm 	if (flags & ZDB_FLAG_BSWAP)
495744cd46caSbillm 		byteswap_uint64_array(buf, size);
4958b24ab676SJeff Bonwick 	(void) write(1, buf, size);
495944cd46caSbillm }
496044cd46caSbillm 
496144cd46caSbillm static void
496244cd46caSbillm zdb_dump_block(char *label, void *buf, uint64_t size, int flags)
496344cd46caSbillm {
496444cd46caSbillm 	uint64_t *d = (uint64_t *)buf;
49653f7978d0SAlan Somers 	unsigned nwords = size / sizeof (uint64_t);
496644cd46caSbillm 	int do_bswap = !!(flags & ZDB_FLAG_BSWAP);
49673f7978d0SAlan Somers 	unsigned i, j;
49683f7978d0SAlan Somers 	const char *hdr;
49693f7978d0SAlan Somers 	char *c;
497044cd46caSbillm 
497144cd46caSbillm 
497244cd46caSbillm 	if (do_bswap)
497344cd46caSbillm 		hdr = " 7 6 5 4 3 2 1 0   f e d c b a 9 8";
497444cd46caSbillm 	else
497544cd46caSbillm 		hdr = " 0 1 2 3 4 5 6 7   8 9 a b c d e f";
497644cd46caSbillm 
497744cd46caSbillm 	(void) printf("\n%s\n%6s   %s  0123456789abcdef\n", label, "", hdr);
497844cd46caSbillm 
497944cd46caSbillm 	for (i = 0; i < nwords; i += 2) {
498044cd46caSbillm 		(void) printf("%06llx:  %016llx  %016llx  ",
498144cd46caSbillm 		    (u_longlong_t)(i * sizeof (uint64_t)),
498244cd46caSbillm 		    (u_longlong_t)(do_bswap ? BSWAP_64(d[i]) : d[i]),
498344cd46caSbillm 		    (u_longlong_t)(do_bswap ? BSWAP_64(d[i + 1]) : d[i + 1]));
498444cd46caSbillm 
498544cd46caSbillm 		c = (char *)&d[i];
498644cd46caSbillm 		for (j = 0; j < 2 * sizeof (uint64_t); j++)
498744cd46caSbillm 			(void) printf("%c", isprint(c[j]) ? c[j] : '.');
498844cd46caSbillm 		(void) printf("\n");
498944cd46caSbillm 	}
499044cd46caSbillm }
499144cd46caSbillm 
499244cd46caSbillm /*
499344cd46caSbillm  * There are two acceptable formats:
499444cd46caSbillm  *	leaf_name	  - For example: c1t0d0 or /tmp/ztest.0a
499544cd46caSbillm  *	child[.child]*    - For example: 0.1.1
499644cd46caSbillm  *
499744cd46caSbillm  * The second form can be used to specify arbitrary vdevs anywhere
499844cd46caSbillm  * in the heirarchy.  For example, in a pool with a mirror of
499944cd46caSbillm  * RAID-Zs, you can specify either RAID-Z vdev with 0.0 or 0.1 .
500044cd46caSbillm  */
500144cd46caSbillm static vdev_t *
50023f7978d0SAlan Somers zdb_vdev_lookup(vdev_t *vdev, const char *path)
500344cd46caSbillm {
500444cd46caSbillm 	char *s, *p, *q;
50053f7978d0SAlan Somers 	unsigned i;
500644cd46caSbillm 
500744cd46caSbillm 	if (vdev == NULL)
500844cd46caSbillm 		return (NULL);
500944cd46caSbillm 
501044cd46caSbillm 	/* First, assume the x.x.x.x format */
50113f7978d0SAlan Somers 	i = strtoul(path, &s, 10);
501244cd46caSbillm 	if (s == path || (s && *s != '.' && *s != '\0'))
501344cd46caSbillm 		goto name;
50143f7978d0SAlan Somers 	if (i >= vdev->vdev_children)
501544cd46caSbillm 		return (NULL);
501644cd46caSbillm 
501744cd46caSbillm 	vdev = vdev->vdev_child[i];
501844cd46caSbillm 	if (*s == '\0')
501944cd46caSbillm 		return (vdev);
502044cd46caSbillm 	return (zdb_vdev_lookup(vdev, s+1));
502144cd46caSbillm 
502244cd46caSbillm name:
502344cd46caSbillm 	for (i = 0; i < vdev->vdev_children; i++) {
502444cd46caSbillm 		vdev_t *vc = vdev->vdev_child[i];
502544cd46caSbillm 
502644cd46caSbillm 		if (vc->vdev_path == NULL) {
502744cd46caSbillm 			vc = zdb_vdev_lookup(vc, path);
502844cd46caSbillm 			if (vc == NULL)
502944cd46caSbillm 				continue;
503044cd46caSbillm 			else
503144cd46caSbillm 				return (vc);
503244cd46caSbillm 		}
503344cd46caSbillm 
503444cd46caSbillm 		p = strrchr(vc->vdev_path, '/');
503544cd46caSbillm 		p = p ? p + 1 : vc->vdev_path;
503644cd46caSbillm 		q = &vc->vdev_path[strlen(vc->vdev_path) - 2];
503744cd46caSbillm 
503844cd46caSbillm 		if (strcmp(vc->vdev_path, path) == 0)
503944cd46caSbillm 			return (vc);
504044cd46caSbillm 		if (strcmp(p, path) == 0)
504144cd46caSbillm 			return (vc);
504244cd46caSbillm 		if (strcmp(q, "s0") == 0 && strncmp(p, path, q - p) == 0)
504344cd46caSbillm 			return (vc);
504444cd46caSbillm 	}
504544cd46caSbillm 
504644cd46caSbillm 	return (NULL);
504744cd46caSbillm }
504844cd46caSbillm 
/*
 * Adapter that gives random_get_pseudo_bytes() the three-argument
 * callback signature expected by abd_iterate_func(): fill "len" bytes at
 * "buf" with pseudo-random data and pass the result straight back.  The
 * third argument is not used.
 */
/* ARGSUSED */
static int
random_get_pseudo_bytes_cb(void *buf, size_t len, void *unused)
{
	int err = random_get_pseudo_bytes(buf, len);

	return (err);
}
5055770499e1SDan Kimmel 
505644cd46caSbillm /*
505744cd46caSbillm  * Read a block from a pool and print it out.  The syntax of the
505844cd46caSbillm  * block descriptor is:
505944cd46caSbillm  *
506044cd46caSbillm  *	pool:vdev_specifier:offset:size[:flags]
506144cd46caSbillm  *
506244cd46caSbillm  *	pool           - The name of the pool you wish to read from
506344cd46caSbillm  *	vdev_specifier - Which vdev (see comment for zdb_vdev_lookup)
506444cd46caSbillm  *	offset         - offset, in hex, in bytes
506544cd46caSbillm  *	size           - Amount of data to read, in hex, in bytes
506644cd46caSbillm  *	flags          - A string of characters specifying options
506744cd46caSbillm  *		 b: Decode a blkptr at given offset within block
506844cd46caSbillm  *		*c: Calculate and display checksums
5069b24ab676SJeff Bonwick  *		 d: Decompress data before dumping
507044cd46caSbillm  *		 e: Byteswap data before dumping
5071b24ab676SJeff Bonwick  *		 g: Display data as a gang block header
5072b24ab676SJeff Bonwick  *		 i: Display as an indirect block
507344cd46caSbillm  *		 p: Do I/O to physical offset
507444cd46caSbillm  *		 r: Dump raw data to stdout
507544cd46caSbillm  *
507644cd46caSbillm  *              * = not yet implemented
507744cd46caSbillm  */
507844cd46caSbillm static void
507907428bdfSVictor Latushkin zdb_read_block(char *thing, spa_t *spa)
508044cd46caSbillm {
5081b24ab676SJeff Bonwick 	blkptr_t blk, *bp = &blk;
5082b24ab676SJeff Bonwick 	dva_t *dva = bp->blk_dva;
508344cd46caSbillm 	int flags = 0;
5084b24ab676SJeff Bonwick 	uint64_t offset = 0, size = 0, psize = 0, lsize = 0, blkptr_offset = 0;
508544cd46caSbillm 	zio_t *zio;
508644cd46caSbillm 	vdev_t *vd;
5087770499e1SDan Kimmel 	abd_t *pabd;
5088770499e1SDan Kimmel 	void *lbuf, *buf;
50893f7978d0SAlan Somers 	const char *s, *vdev;
50903f7978d0SAlan Somers 	char *p, *dup, *flagstr;
5091b24ab676SJeff Bonwick 	int i, error;
509244cd46caSbillm 
509344cd46caSbillm 	dup = strdup(thing);
509444cd46caSbillm 	s = strtok(dup, ":");
509544cd46caSbillm 	vdev = s ? s : "";
509644cd46caSbillm 	s = strtok(NULL, ":");
509744cd46caSbillm 	offset = strtoull(s ? s : "", NULL, 16);
509844cd46caSbillm 	s = strtok(NULL, ":");
509944cd46caSbillm 	size = strtoull(s ? s : "", NULL, 16);
510044cd46caSbillm 	s = strtok(NULL, ":");
51013f7978d0SAlan Somers 	if (s)
51023f7978d0SAlan Somers 		flagstr = strdup(s);
51033f7978d0SAlan Somers 	else
51043f7978d0SAlan Somers 		flagstr = strdup("");
510544cd46caSbillm 
510644cd46caSbillm 	s = NULL;
510744cd46caSbillm 	if (size == 0)
510844cd46caSbillm 		s = "size must not be zero";
510944cd46caSbillm 	if (!IS_P2ALIGNED(size, DEV_BSIZE))
511044cd46caSbillm 		s = "size must be a multiple of sector size";
511144cd46caSbillm 	if (!IS_P2ALIGNED(offset, DEV_BSIZE))
511244cd46caSbillm 		s = "offset must be a multiple of sector size";
511344cd46caSbillm 	if (s) {
511444cd46caSbillm 		(void) printf("Invalid block specifier: %s  - %s\n", thing, s);
511544cd46caSbillm 		free(dup);
511644cd46caSbillm 		return;
511744cd46caSbillm 	}
511844cd46caSbillm 
511944cd46caSbillm 	for (s = strtok(flagstr, ":"); s; s = strtok(NULL, ":")) {
512044cd46caSbillm 		for (i = 0; flagstr[i]; i++) {
51215ad82045Snd 			int bit = flagbits[(uchar_t)flagstr[i]];
512244cd46caSbillm 
512344cd46caSbillm 			if (bit == 0) {
512444cd46caSbillm 				(void) printf("***Invalid flag: %c\n",
512544cd46caSbillm 				    flagstr[i]);
512644cd46caSbillm 				continue;
512744cd46caSbillm 			}
512844cd46caSbillm 			flags |= bit;
512944cd46caSbillm 
513044cd46caSbillm 			/* If it's not something with an argument, keep going */
5131b24ab676SJeff Bonwick 			if ((bit & (ZDB_FLAG_CHECKSUM |
513244cd46caSbillm 			    ZDB_FLAG_PRINT_BLKPTR)) == 0)
513344cd46caSbillm 				continue;
513444cd46caSbillm 
513544cd46caSbillm 			p = &flagstr[i + 1];
513644cd46caSbillm 			if (bit == ZDB_FLAG_PRINT_BLKPTR)
513744cd46caSbillm 				blkptr_offset = strtoull(p, &p, 16);
513844cd46caSbillm 			if (*p != ':' && *p != '\0') {
513944cd46caSbillm 				(void) printf("***Invalid flag arg: '%s'\n", s);
514044cd46caSbillm 				free(dup);
514144cd46caSbillm 				return;
514244cd46caSbillm 			}
514344cd46caSbillm 		}
514444cd46caSbillm 	}
51453f7978d0SAlan Somers 	free(flagstr);
514644cd46caSbillm 
514744cd46caSbillm 	vd = zdb_vdev_lookup(spa->spa_root_vdev, vdev);
514844cd46caSbillm 	if (vd == NULL) {
514944cd46caSbillm 		(void) printf("***Invalid vdev: %s\n", vdev);
515044cd46caSbillm 		free(dup);
515144cd46caSbillm 		return;
515244cd46caSbillm 	} else {
515344cd46caSbillm 		if (vd->vdev_path)
5154b24ab676SJeff Bonwick 			(void) fprintf(stderr, "Found vdev: %s\n",
5155b24ab676SJeff Bonwick 			    vd->vdev_path);
515644cd46caSbillm 		else
5157b24ab676SJeff Bonwick 			(void) fprintf(stderr, "Found vdev type: %s\n",
515844cd46caSbillm 			    vd->vdev_ops->vdev_op_type);
515944cd46caSbillm 	}
516044cd46caSbillm 
5161b24ab676SJeff Bonwick 	psize = size;
5162b24ab676SJeff Bonwick 	lsize = size;
516344cd46caSbillm 
5164770499e1SDan Kimmel 	pabd = abd_alloc_linear(SPA_MAXBLOCKSIZE, B_FALSE);
5165b24ab676SJeff Bonwick 	lbuf = umem_alloc(SPA_MAXBLOCKSIZE, UMEM_NOFAIL);
5166b24ab676SJeff Bonwick 
5167b24ab676SJeff Bonwick 	BP_ZERO(bp);
5168b24ab676SJeff Bonwick 
5169b24ab676SJeff Bonwick 	DVA_SET_VDEV(&dva[0], vd->vdev_id);
5170b24ab676SJeff Bonwick 	DVA_SET_OFFSET(&dva[0], offset);
5171b24ab676SJeff Bonwick 	DVA_SET_GANG(&dva[0], !!(flags & ZDB_FLAG_GBH));
5172b24ab676SJeff Bonwick 	DVA_SET_ASIZE(&dva[0], vdev_psize_to_asize(vd, psize));
5173b24ab676SJeff Bonwick 
5174b24ab676SJeff Bonwick 	BP_SET_BIRTH(bp, TXG_INITIAL, TXG_INITIAL);
5175b24ab676SJeff Bonwick 
5176b24ab676SJeff Bonwick 	BP_SET_LSIZE(bp, lsize);
5177b24ab676SJeff Bonwick 	BP_SET_PSIZE(bp, psize);
5178b24ab676SJeff Bonwick 	BP_SET_COMPRESS(bp, ZIO_COMPRESS_OFF);
5179b24ab676SJeff Bonwick 	BP_SET_CHECKSUM(bp, ZIO_CHECKSUM_OFF);
5180b24ab676SJeff Bonwick 	BP_SET_TYPE(bp, DMU_OT_NONE);
5181b24ab676SJeff Bonwick 	BP_SET_LEVEL(bp, 0);
5182b24ab676SJeff Bonwick 	BP_SET_DEDUP(bp, 0);
5183b24ab676SJeff Bonwick 	BP_SET_BYTEORDER(bp, ZFS_HOST_BYTEORDER);
518444cd46caSbillm 
5185e14bb325SJeff Bonwick 	spa_config_enter(spa, SCL_STATE, FTAG, RW_READER);
518644cd46caSbillm 	zio = zio_root(spa, NULL, NULL, 0);
5187b24ab676SJeff Bonwick 
5188b24ab676SJeff Bonwick 	if (vd == vd->vdev_top) {
5189b24ab676SJeff Bonwick 		/*
5190b24ab676SJeff Bonwick 		 * Treat this as a normal block read.
5191b24ab676SJeff Bonwick 		 */
5192770499e1SDan Kimmel 		zio_nowait(zio_read(zio, spa, bp, pabd, psize, NULL, NULL,
5193b24ab676SJeff Bonwick 		    ZIO_PRIORITY_SYNC_READ,
5194b24ab676SJeff Bonwick 		    ZIO_FLAG_CANFAIL | ZIO_FLAG_RAW, NULL));
5195b24ab676SJeff Bonwick 	} else {
5196b24ab676SJeff Bonwick 		/*
5197b24ab676SJeff Bonwick 		 * Treat this as a vdev child I/O.
5198b24ab676SJeff Bonwick 		 */
5199770499e1SDan Kimmel 		zio_nowait(zio_vdev_child_io(zio, bp, vd, offset, pabd,
5200770499e1SDan Kimmel 		    psize, ZIO_TYPE_READ, ZIO_PRIORITY_SYNC_READ,
5201b24ab676SJeff Bonwick 		    ZIO_FLAG_DONT_CACHE | ZIO_FLAG_DONT_QUEUE |
5202b24ab676SJeff Bonwick 		    ZIO_FLAG_DONT_PROPAGATE | ZIO_FLAG_DONT_RETRY |
52035cabbc6bSPrashanth Sreenivasa 		    ZIO_FLAG_CANFAIL | ZIO_FLAG_RAW | ZIO_FLAG_OPTIONAL,
52045cabbc6bSPrashanth Sreenivasa 		    NULL, NULL));
5205b24ab676SJeff Bonwick 	}
5206b24ab676SJeff Bonwick 
520744cd46caSbillm 	error = zio_wait(zio);
5208e14bb325SJeff Bonwick 	spa_config_exit(spa, SCL_STATE, FTAG);
520944cd46caSbillm 
521044cd46caSbillm 	if (error) {
521144cd46caSbillm 		(void) printf("Read of %s failed, error: %d\n", thing, error);
521244cd46caSbillm 		goto out;
521344cd46caSbillm 	}
521444cd46caSbillm 
5215b24ab676SJeff Bonwick 	if (flags & ZDB_FLAG_DECOMPRESS) {
5216b24ab676SJeff Bonwick 		/*
5217b24ab676SJeff Bonwick 		 * We don't know how the data was compressed, so just try
5218b24ab676SJeff Bonwick 		 * every decompress function at every inflated blocksize.
5219b24ab676SJeff Bonwick 		 */
5220b24ab676SJeff Bonwick 		enum zio_compress c;
5221b24ab676SJeff Bonwick 		void *pbuf2 = umem_alloc(SPA_MAXBLOCKSIZE, UMEM_NOFAIL);
5222b24ab676SJeff Bonwick 		void *lbuf2 = umem_alloc(SPA_MAXBLOCKSIZE, UMEM_NOFAIL);
5223b24ab676SJeff Bonwick 
5224770499e1SDan Kimmel 		abd_copy_to_buf(pbuf2, pabd, psize);
5225b24ab676SJeff Bonwick 
5226770499e1SDan Kimmel 		VERIFY0(abd_iterate_func(pabd, psize, SPA_MAXBLOCKSIZE - psize,
5227770499e1SDan Kimmel 		    random_get_pseudo_bytes_cb, NULL));
5228b24ab676SJeff Bonwick 
5229770499e1SDan Kimmel 		VERIFY0(random_get_pseudo_bytes((uint8_t *)pbuf2 + psize,
5230770499e1SDan Kimmel 		    SPA_MAXBLOCKSIZE - psize));
5231b24ab676SJeff Bonwick 
5232b24ab676SJeff Bonwick 		for (lsize = SPA_MAXBLOCKSIZE; lsize > psize;
5233b24ab676SJeff Bonwick 		    lsize -= SPA_MINBLOCKSIZE) {
5234b24ab676SJeff Bonwick 			for (c = 0; c < ZIO_COMPRESS_FUNCTIONS; c++) {
5235770499e1SDan Kimmel 				if (zio_decompress_data(c, pabd,
5236770499e1SDan Kimmel 				    lbuf, psize, lsize) == 0 &&
5237770499e1SDan Kimmel 				    zio_decompress_data_buf(c, pbuf2,
5238770499e1SDan Kimmel 				    lbuf2, psize, lsize) == 0 &&
5239b24ab676SJeff Bonwick 				    bcmp(lbuf, lbuf2, lsize) == 0)
5240b24ab676SJeff Bonwick 					break;
5241b24ab676SJeff Bonwick 			}
5242b24ab676SJeff Bonwick 			if (c != ZIO_COMPRESS_FUNCTIONS)
5243b24ab676SJeff Bonwick 				break;
5244b24ab676SJeff Bonwick 			lsize -= SPA_MINBLOCKSIZE;
5245b24ab676SJeff Bonwick 		}
5246b24ab676SJeff Bonwick 
5247b24ab676SJeff Bonwick 		umem_free(pbuf2, SPA_MAXBLOCKSIZE);
5248b24ab676SJeff Bonwick 		umem_free(lbuf2, SPA_MAXBLOCKSIZE);
5249b24ab676SJeff Bonwick 
5250b24ab676SJeff Bonwick 		if (lsize <= psize) {
5251b24ab676SJeff Bonwick 			(void) printf("Decompress of %s failed\n", thing);
5252b24ab676SJeff Bonwick 			goto out;
5253b24ab676SJeff Bonwick 		}
5254b24ab676SJeff Bonwick 		buf = lbuf;
5255b24ab676SJeff Bonwick 		size = lsize;
5256b24ab676SJeff Bonwick 	} else {
5257770499e1SDan Kimmel 		buf = abd_to_buf(pabd);
5258b24ab676SJeff Bonwick 		size = psize;
5259b24ab676SJeff Bonwick 	}
5260b24ab676SJeff Bonwick 
526144cd46caSbillm 	if (flags & ZDB_FLAG_PRINT_BLKPTR)
526244cd46caSbillm 		zdb_print_blkptr((blkptr_t *)(void *)
526344cd46caSbillm 		    ((uintptr_t)buf + (uintptr_t)blkptr_offset), flags);
526444cd46caSbillm 	else if (flags & ZDB_FLAG_RAW)
526544cd46caSbillm 		zdb_dump_block_raw(buf, size, flags);
526644cd46caSbillm 	else if (flags & ZDB_FLAG_INDIRECT)
526744cd46caSbillm 		zdb_dump_indirect((blkptr_t *)buf, size / sizeof (blkptr_t),
526844cd46caSbillm 		    flags);
526944cd46caSbillm 	else if (flags & ZDB_FLAG_GBH)
527044cd46caSbillm 		zdb_dump_gbh(buf, flags);
527144cd46caSbillm 	else
527244cd46caSbillm 		zdb_dump_block(thing, buf, size, flags);
527344cd46caSbillm 
527444cd46caSbillm out:
5275770499e1SDan Kimmel 	abd_free(pabd);
5276b24ab676SJeff Bonwick 	umem_free(lbuf, SPA_MAXBLOCKSIZE);
527744cd46caSbillm 	free(dup);
527844cd46caSbillm }
527944cd46caSbillm 
52804923c69fSMatthew Ahrens static void
52814923c69fSMatthew Ahrens zdb_embedded_block(char *thing)
52824923c69fSMatthew Ahrens {
52833f7978d0SAlan Somers 	blkptr_t bp;
52844923c69fSMatthew Ahrens 	unsigned long long *words = (void *)&bp;
528503a4c2f4SJorgen Lundman 	char *buf;
52864923c69fSMatthew Ahrens 	int err;
52874923c69fSMatthew Ahrens 
52883f7978d0SAlan Somers 	bzero(&bp, sizeof (bp));
52894923c69fSMatthew Ahrens 	err = sscanf(thing, "%llx:%llx:%llx:%llx:%llx:%llx:%llx:%llx:"
52904923c69fSMatthew Ahrens 	    "%llx:%llx:%llx:%llx:%llx:%llx:%llx:%llx",
52914923c69fSMatthew Ahrens 	    words + 0, words + 1, words + 2, words + 3,
52924923c69fSMatthew Ahrens 	    words + 4, words + 5, words + 6, words + 7,
52934923c69fSMatthew Ahrens 	    words + 8, words + 9, words + 10, words + 11,
52944923c69fSMatthew Ahrens 	    words + 12, words + 13, words + 14, words + 15);
52954923c69fSMatthew Ahrens 	if (err != 16) {
529603a4c2f4SJorgen Lundman 		(void) fprintf(stderr, "invalid input format\n");
52974923c69fSMatthew Ahrens 		exit(1);
52984923c69fSMatthew Ahrens 	}
52994923c69fSMatthew Ahrens 	ASSERT3U(BPE_GET_LSIZE(&bp), <=, SPA_MAXBLOCKSIZE);
530003a4c2f4SJorgen Lundman 	buf = malloc(SPA_MAXBLOCKSIZE);
530103a4c2f4SJorgen Lundman 	if (buf == NULL) {
530203a4c2f4SJorgen Lundman 		(void) fprintf(stderr, "out of memory\n");
530303a4c2f4SJorgen Lundman 		exit(1);
530403a4c2f4SJorgen Lundman 	}
53054923c69fSMatthew Ahrens 	err = decode_embedded_bp(&bp, buf, BPE_GET_LSIZE(&bp));
53064923c69fSMatthew Ahrens 	if (err != 0) {
530703a4c2f4SJorgen Lundman 		(void) fprintf(stderr, "decode failed: %u\n", err);
53084923c69fSMatthew Ahrens 		exit(1);
53094923c69fSMatthew Ahrens 	}
53104923c69fSMatthew Ahrens 	zdb_dump_block_raw(buf, BPE_GET_LSIZE(&bp), 0);
531103a4c2f4SJorgen Lundman 	free(buf);
53124923c69fSMatthew Ahrens }
53134923c69fSMatthew Ahrens 
5314fa9e4066Sahrens int
5315fa9e4066Sahrens main(int argc, char **argv)
5316fa9e4066Sahrens {
53173f7978d0SAlan Somers 	int c;
5318fa9e4066Sahrens 	struct rlimit rl = { 1024, 1024 };
53193ad6c7f9SVictor Latushkin 	spa_t *spa = NULL;
5320fa9e4066Sahrens 	objset_t *os = NULL;
5321fa9e4066Sahrens 	int dump_all = 1;
5322fa9e4066Sahrens 	int verbose = 0;
5323c8ee1847SVictor Latushkin 	int error = 0;
53243ad6c7f9SVictor Latushkin 	char **searchdirs = NULL;
53253ad6c7f9SVictor Latushkin 	int nsearch = 0;
5326e0f1c0afSOlaf Faaland 	char *target, *target_pool;
5327468c413aSTim Haley 	nvlist_t *policy = NULL;
5328468c413aSTim Haley 	uint64_t max_txg = UINT64_MAX;
5329dfd5965fSRichard Yao 	int flags = ZFS_IMPORT_MISSING_LOG;
5330c8ee1847SVictor Latushkin 	int rewind = ZPOOL_NEVER_REWIND;
5331ae24175bSCyril Plisko 	char *spa_config_path_env;
5332b702644aSTim Chase 	boolean_t target_is_spa = B_TRUE;
533386714001SSerapheim Dimitropoulos 	nvlist_t *cfg = NULL;
5334fa9e4066Sahrens 
5335fa9e4066Sahrens 	(void) setrlimit(RLIMIT_NOFILE, &rl);
5336004388ebScasper 	(void) enable_extended_FILE_stdio(-1, -1);
5337fa9e4066Sahrens 
5338fa9e4066Sahrens 	dprintf_setup(&argc, argv);
5339fa9e4066Sahrens 
5340ae24175bSCyril Plisko 	/*
5341ae24175bSCyril Plisko 	 * If there is an environment variable SPA_CONFIG_PATH it overrides
5342ae24175bSCyril Plisko 	 * default spa_config_path setting. If -U flag is specified it will
5343ae24175bSCyril Plisko 	 * override this environment variable settings once again.
5344ae24175bSCyril Plisko 	 */
5345ae24175bSCyril Plisko 	spa_config_path_env = getenv("SPA_CONFIG_PATH");
5346ae24175bSCyril Plisko 	if (spa_config_path_env != NULL)
5347ae24175bSCyril Plisko 		spa_config_path = spa_config_path_env;
5348ae24175bSCyril Plisko 
5349df15e419SMatthew Ahrens 	while ((c = getopt(argc, argv,
535086714001SSerapheim Dimitropoulos 	    "AbcCdDeEFGhiI:klLmMo:Op:PqRsSt:uU:vVx:X")) != -1) {
5351fa9e4066Sahrens 		switch (c) {
5352fa9e4066Sahrens 		case 'b':
5353fa9e4066Sahrens 		case 'c':
5354ed61ec1dSYuri Pankov 		case 'C':
5355b24ab676SJeff Bonwick 		case 'd':
5356ed61ec1dSYuri Pankov 		case 'D':
53574923c69fSMatthew Ahrens 		case 'E':
5358ed61ec1dSYuri Pankov 		case 'G':
5359b24ab676SJeff Bonwick 		case 'h':
5360b24ab676SJeff Bonwick 		case 'i':
5361b24ab676SJeff Bonwick 		case 'l':
5362d6e555bdSGeorge Wilson 		case 'm':
53632e4c9986SGeorge Wilson 		case 'M':
5364ed61ec1dSYuri Pankov 		case 'O':
536544cd46caSbillm 		case 'R':
5366ed61ec1dSYuri Pankov 		case 's':
5367b24ab676SJeff Bonwick 		case 'S':
5368ed61ec1dSYuri Pankov 		case 'u':
5369fa9e4066Sahrens 			dump_opt[c]++;
5370fa9e4066Sahrens 			dump_all = 0;
5371fa9e4066Sahrens 			break;
5372feef89cfSVictor Latushkin 		case 'A':
5373ed61ec1dSYuri Pankov 		case 'e':
5374c8ee1847SVictor Latushkin 		case 'F':
537586714001SSerapheim Dimitropoulos 		case 'k':
537682a0a985SVictor Latushkin 		case 'L':
53773f9d6ad7SLin Ling 		case 'P':
537864723e36SYuri Pankov 		case 'q':
5379ed61ec1dSYuri Pankov 		case 'X':
538082a0a985SVictor Latushkin 			dump_opt[c]++;
538182a0a985SVictor Latushkin 			break;
5382ed61ec1dSYuri Pankov 		/* NB: Sort single match options below. */
53832e4c9986SGeorge Wilson 		case 'I':
538431d7e8faSGeorge Wilson 			max_inflight = strtoull(optarg, NULL, 0);
538531d7e8faSGeorge Wilson 			if (max_inflight == 0) {
538631d7e8faSGeorge Wilson 				(void) fprintf(stderr, "maximum number "
538731d7e8faSGeorge Wilson 				    "of inflight I/Os must be greater "
538831d7e8faSGeorge Wilson 				    "than 0\n");
538931d7e8faSGeorge Wilson 				usage();
539031d7e8faSGeorge Wilson 			}
539131d7e8faSGeorge Wilson 			break;
5392ed61ec1dSYuri Pankov 		case 'o':
5393ed61ec1dSYuri Pankov 			error = set_global_var(optarg);
5394ed61ec1dSYuri Pankov 			if (error != 0)
5395ed61ec1dSYuri Pankov 				usage();
5396ed61ec1dSYuri Pankov 			break;
5397de6628f0Sck 		case 'p':
53983ad6c7f9SVictor Latushkin 			if (searchdirs == NULL) {
53993ad6c7f9SVictor Latushkin 				searchdirs = umem_alloc(sizeof (char *),
54003ad6c7f9SVictor Latushkin 				    UMEM_NOFAIL);
54013ad6c7f9SVictor Latushkin 			} else {
54023ad6c7f9SVictor Latushkin 				char **tmp = umem_alloc((nsearch + 1) *
54033ad6c7f9SVictor Latushkin 				    sizeof (char *), UMEM_NOFAIL);
54043ad6c7f9SVictor Latushkin 				bcopy(searchdirs, tmp, nsearch *
54053ad6c7f9SVictor Latushkin 				    sizeof (char *));
54063ad6c7f9SVictor Latushkin 				umem_free(searchdirs,
54073ad6c7f9SVictor Latushkin 				    nsearch * sizeof (char *));
54083ad6c7f9SVictor Latushkin 				searchdirs = tmp;
54093ad6c7f9SVictor Latushkin 			}
54103ad6c7f9SVictor Latushkin 			searchdirs[nsearch++] = optarg;
5411de6628f0Sck 			break;
54122e551927SVictor Latushkin 		case 't':
5413468c413aSTim Haley 			max_txg = strtoull(optarg, NULL, 0);
5414468c413aSTim Haley 			if (max_txg < TXG_INITIAL) {
54152e551927SVictor Latushkin 				(void) fprintf(stderr, "incorrect txg "
54162e551927SVictor Latushkin 				    "specified: %s\n", optarg);
54172e551927SVictor Latushkin 				usage();
54182e551927SVictor Latushkin 			}
54192e551927SVictor Latushkin 			break;
5420b24ab676SJeff Bonwick 		case 'U':
5421b24ab676SJeff Bonwick 			spa_config_path = optarg;
54224923c69fSMatthew Ahrens 			if (spa_config_path[0] != '/') {
54234923c69fSMatthew Ahrens 				(void) fprintf(stderr,
54244923c69fSMatthew Ahrens 				    "cachefile must be an absolute path "
54254923c69fSMatthew Ahrens 				    "(i.e. start with a slash)\n");
54264923c69fSMatthew Ahrens 				usage();
54274923c69fSMatthew Ahrens 			}
5428b24ab676SJeff Bonwick 			break;
54292e4c9986SGeorge Wilson 		case 'v':
54302e4c9986SGeorge Wilson 			verbose++;
54312e4c9986SGeorge Wilson 			break;
5432dfd5965fSRichard Yao 		case 'V':
5433dfd5965fSRichard Yao 			flags = ZFS_IMPORT_VERBATIM;
5434dfd5965fSRichard Yao 			break;
54352e4c9986SGeorge Wilson 		case 'x':
54362e4c9986SGeorge Wilson 			vn_dumpdir = optarg;
54372e4c9986SGeorge Wilson 			break;
5438fa9e4066Sahrens 		default:
5439fa9e4066Sahrens 			usage();
5440fa9e4066Sahrens 			break;
5441fa9e4066Sahrens 		}
5442fa9e4066Sahrens 	}
5443fa9e4066Sahrens 
54443ad6c7f9SVictor Latushkin 	if (!dump_opt['e'] && searchdirs != NULL) {
544588b7b0f2SMatthew Ahrens 		(void) fprintf(stderr, "-p option requires use of -e\n");
544688b7b0f2SMatthew Ahrens 		usage();
544788b7b0f2SMatthew Ahrens 	}
5448de6628f0Sck 
544906be9802SMatthew Ahrens 	/*
545006be9802SMatthew Ahrens 	 * ZDB does not typically re-read blocks; therefore limit the ARC
545106be9802SMatthew Ahrens 	 * to 256 MB, which can be used entirely for metadata.
545206be9802SMatthew Ahrens 	 */
545306be9802SMatthew Ahrens 	zfs_arc_max = zfs_arc_meta_limit = 256 * 1024 * 1024;
545406be9802SMatthew Ahrens 
5455f7950bf1SMatthew Ahrens 	/*
5456f7950bf1SMatthew Ahrens 	 * "zdb -c" uses checksum-verifying scrub i/os which are async reads.
5457f7950bf1SMatthew Ahrens 	 * "zdb -b" uses traversal prefetch which uses async reads.
5458f7950bf1SMatthew Ahrens 	 * For good performance, let several of them be active at once.
5459f7950bf1SMatthew Ahrens 	 */
5460f7950bf1SMatthew Ahrens 	zfs_vdev_async_read_max_active = 10;
5461f7950bf1SMatthew Ahrens 
54624dd77f9eSMatthew Ahrens 	/*
54634dd77f9eSMatthew Ahrens 	 * Disable reference tracking for better performance.
54644dd77f9eSMatthew Ahrens 	 */
54654dd77f9eSMatthew Ahrens 	reference_tracking_enable = B_FALSE;
54664dd77f9eSMatthew Ahrens 
5467e144c4e6SPavel Zakharov 	/*
5468e144c4e6SPavel Zakharov 	 * Do not fail spa_load when spa_load_verify fails. This is needed
5469e144c4e6SPavel Zakharov 	 * to load non-idle pools.
5470e144c4e6SPavel Zakharov 	 */
5471e144c4e6SPavel Zakharov 	spa_load_verify_dryrun = B_TRUE;
5472e144c4e6SPavel Zakharov 
5473fa9e4066Sahrens 	kernel_init(FREAD);
5474de6628f0Sck 	g_zfs = libzfs_init();
547591ebeef5Sahrens 	ASSERT(g_zfs != NULL);
5476fa9e4066Sahrens 
5477b24ab676SJeff Bonwick 	if (dump_all)
5478b24ab676SJeff Bonwick 		verbose = MAX(verbose, 1);
5479b24ab676SJeff Bonwick 
5480fa9e4066Sahrens 	for (c = 0; c < 256; c++) {
548186714001SSerapheim Dimitropoulos 		if (dump_all && strchr("AeEFklLOPRSX", c) == NULL)
5482fa9e4066Sahrens 			dump_opt[c] = 1;
5483fa9e4066Sahrens 		if (dump_opt[c])
5484fa9e4066Sahrens 			dump_opt[c] += verbose;
5485fa9e4066Sahrens 	}
5486fa9e4066Sahrens 
5487feef89cfSVictor Latushkin 	aok = (dump_opt['A'] == 1) || (dump_opt['A'] > 2);
5488feef89cfSVictor Latushkin 	zfs_recover = (dump_opt['A'] > 1);
5489feef89cfSVictor Latushkin 
5490fa9e4066Sahrens 	argc -= optind;
5491fa9e4066Sahrens 	argv += optind;
5492fa9e4066Sahrens 
549307428bdfSVictor Latushkin 	if (argc < 2 && dump_opt['R'])
549407428bdfSVictor Latushkin 		usage();
54954923c69fSMatthew Ahrens 
54964923c69fSMatthew Ahrens 	if (dump_opt['E']) {
54974923c69fSMatthew Ahrens 		if (argc != 1)
54984923c69fSMatthew Ahrens 			usage();
54994923c69fSMatthew Ahrens 		zdb_embedded_block(argv[0]);
55004923c69fSMatthew Ahrens 		return (0);
55014923c69fSMatthew Ahrens 	}
55024923c69fSMatthew Ahrens 
5503fa9e4066Sahrens 	if (argc < 1) {
55043ad6c7f9SVictor Latushkin 		if (!dump_opt['e'] && dump_opt['C']) {
5505e829d913Sck 			dump_cachefile(spa_config_path);
5506fa9e4066Sahrens 			return (0);
5507fa9e4066Sahrens 		}
5508fa9e4066Sahrens 		usage();
5509fa9e4066Sahrens 	}
5510fa9e4066Sahrens 
551164723e36SYuri Pankov 	if (dump_opt['l'])
551264723e36SYuri Pankov 		return (dump_label(argv[0]));
5513fa9e4066Sahrens 
5514ed61ec1dSYuri Pankov 	if (dump_opt['O']) {
5515ed61ec1dSYuri Pankov 		if (argc != 2)
5516ed61ec1dSYuri Pankov 			usage();
5517ed61ec1dSYuri Pankov 		dump_opt['v'] = verbose + 3;
5518ed61ec1dSYuri Pankov 		return (dump_path(argv[0], argv[1]));
5519ed61ec1dSYuri Pankov 	}
5520ed61ec1dSYuri Pankov 
5521c8ee1847SVictor Latushkin 	if (dump_opt['X'] || dump_opt['F'])
5522c8ee1847SVictor Latushkin 		rewind = ZPOOL_DO_REWIND |
5523c8ee1847SVictor Latushkin 		    (dump_opt['X'] ? ZPOOL_EXTREME_REWIND : 0);
5524c8ee1847SVictor Latushkin 
5525c8ee1847SVictor Latushkin 	if (nvlist_alloc(&policy, NV_UNIQUE_NAME_TYPE, 0) != 0 ||
55265dafeea3SPavel Zakharov 	    nvlist_add_uint64(policy, ZPOOL_LOAD_REQUEST_TXG, max_txg) != 0 ||
55275dafeea3SPavel Zakharov 	    nvlist_add_uint32(policy, ZPOOL_LOAD_REWIND_POLICY, rewind) != 0)
5528c8ee1847SVictor Latushkin 		fatal("internal error: %s", strerror(ENOMEM));
5529c8ee1847SVictor Latushkin 
5530c5904d13Seschrock 	error = 0;
55313ad6c7f9SVictor Latushkin 	target = argv[0];
5532990b4856Slling 
5533e0f1c0afSOlaf Faaland 	if (strpbrk(target, "/@") != NULL) {
5534e0f1c0afSOlaf Faaland 		size_t targetlen;
5535e0f1c0afSOlaf Faaland 
5536e0f1c0afSOlaf Faaland 		target_pool = strdup(target);
5537e0f1c0afSOlaf Faaland 		*strpbrk(target_pool, "/@") = '\0';
5538e0f1c0afSOlaf Faaland 
5539e0f1c0afSOlaf Faaland 		target_is_spa = B_FALSE;
5540e0f1c0afSOlaf Faaland 		targetlen = strlen(target);
5541e0f1c0afSOlaf Faaland 		if (targetlen && target[targetlen - 1] == '/')
5542e0f1c0afSOlaf Faaland 			target[targetlen - 1] = '\0';
5543e0f1c0afSOlaf Faaland 	} else {
5544e0f1c0afSOlaf Faaland 		target_pool = target;
5545e0f1c0afSOlaf Faaland 	}
5546e0f1c0afSOlaf Faaland 
55473ad6c7f9SVictor Latushkin 	if (dump_opt['e']) {
5548e0f1c0afSOlaf Faaland 		importargs_t args = { 0 };
5549990b4856Slling 
5550e0f1c0afSOlaf Faaland 		args.paths = nsearch;
5551e0f1c0afSOlaf Faaland 		args.path = searchdirs;
5552e0f1c0afSOlaf Faaland 		args.can_be_active = B_TRUE;
5553e0f1c0afSOlaf Faaland 
5554e0f1c0afSOlaf Faaland 		error = zpool_tryimport(g_zfs, target_pool, &cfg, &args);
5555e0f1c0afSOlaf Faaland 
5556e0f1c0afSOlaf Faaland 		if (error == 0) {
555786714001SSerapheim Dimitropoulos 
5558c8ee1847SVictor Latushkin 			if (nvlist_add_nvlist(cfg,
55595dafeea3SPavel Zakharov 			    ZPOOL_LOAD_POLICY, policy) != 0) {
5560468c413aSTim Haley 				fatal("can't open '%s': %s",
5561468c413aSTim Haley 				    target, strerror(ENOMEM));
5562468c413aSTim Haley 			}
5563e0f1c0afSOlaf Faaland 
5564e0f1c0afSOlaf Faaland 			if (dump_opt['C'] > 1) {
5565e0f1c0afSOlaf Faaland 				(void) printf("\nConfiguration for import:\n");
5566e0f1c0afSOlaf Faaland 				dump_nvlist(cfg, 8);
5567e0f1c0afSOlaf Faaland 			}
5568e0f1c0afSOlaf Faaland 
5569e0f1c0afSOlaf Faaland 			/*
5570e0f1c0afSOlaf Faaland 			 * Disable the activity check to allow examination of
5571e0f1c0afSOlaf Faaland 			 * active pools.
5572e0f1c0afSOlaf Faaland 			 */
5573e0f1c0afSOlaf Faaland 			error = spa_import(target_pool, cfg, NULL,
5574e0f1c0afSOlaf Faaland 			    flags | ZFS_IMPORT_SKIP_MMP);
5575de6628f0Sck 		}
5576c5904d13Seschrock 	}
5577c5904d13Seschrock 
557886714001SSerapheim Dimitropoulos 	char *checkpoint_pool = NULL;
557986714001SSerapheim Dimitropoulos 	char *checkpoint_target = NULL;
558086714001SSerapheim Dimitropoulos 	if (dump_opt['k']) {
558186714001SSerapheim Dimitropoulos 		checkpoint_pool = import_checkpointed_state(target, cfg,
558286714001SSerapheim Dimitropoulos 		    &checkpoint_target);
558386714001SSerapheim Dimitropoulos 
558486714001SSerapheim Dimitropoulos 		if (checkpoint_target != NULL)
558586714001SSerapheim Dimitropoulos 			target = checkpoint_target;
558686714001SSerapheim Dimitropoulos 
558786714001SSerapheim Dimitropoulos 	}
558886714001SSerapheim Dimitropoulos 
5589c5904d13Seschrock 	if (error == 0) {
559086714001SSerapheim Dimitropoulos 		if (dump_opt['k'] && (target_is_spa || dump_opt['R'])) {
559186714001SSerapheim Dimitropoulos 			ASSERT(checkpoint_pool != NULL);
559286714001SSerapheim Dimitropoulos 			ASSERT(checkpoint_target == NULL);
559386714001SSerapheim Dimitropoulos 
559486714001SSerapheim Dimitropoulos 			error = spa_open(checkpoint_pool, &spa, FTAG);
559586714001SSerapheim Dimitropoulos 			if (error != 0) {
559686714001SSerapheim Dimitropoulos 				fatal("Tried to open pool \"%s\" but "
559786714001SSerapheim Dimitropoulos 				    "spa_open() failed with error %d\n",
559886714001SSerapheim Dimitropoulos 				    checkpoint_pool, error);
559986714001SSerapheim Dimitropoulos 			}
560086714001SSerapheim Dimitropoulos 
560186714001SSerapheim Dimitropoulos 		} else if (target_is_spa || dump_opt['R']) {
5602e0f1c0afSOlaf Faaland 			zdb_set_skip_mmp(target);
560380eb36f2SGeorge Wilson 			error = spa_open_rewind(target, &spa, FTAG, policy,
560480eb36f2SGeorge Wilson 			    NULL);
56058f18d1faSGeorge Wilson 			if (error) {
56068f18d1faSGeorge Wilson 				/*
56078f18d1faSGeorge Wilson 				 * If we're missing the log device then
56088f18d1faSGeorge Wilson 				 * try opening the pool after clearing the
56098f18d1faSGeorge Wilson 				 * log state.
56108f18d1faSGeorge Wilson 				 */
56118f18d1faSGeorge Wilson 				mutex_enter(&spa_namespace_lock);
56123ad6c7f9SVictor Latushkin 				if ((spa = spa_lookup(target)) != NULL &&
56138f18d1faSGeorge Wilson 				    spa->spa_log_state == SPA_LOG_MISSING) {
56148f18d1faSGeorge Wilson 					spa->spa_log_state = SPA_LOG_CLEAR;
56158f18d1faSGeorge Wilson 					error = 0;
56168f18d1faSGeorge Wilson 				}
56178f18d1faSGeorge Wilson 				mutex_exit(&spa_namespace_lock);
56188f18d1faSGeorge Wilson 
561980eb36f2SGeorge Wilson 				if (!error) {
562080eb36f2SGeorge Wilson 					error = spa_open_rewind(target, &spa,
562180eb36f2SGeorge Wilson 					    FTAG, policy, NULL);
562280eb36f2SGeorge Wilson 				}
56238f18d1faSGeorge Wilson 			}
562407428bdfSVictor Latushkin 		} else {
5625e0f1c0afSOlaf Faaland 			zdb_set_skip_mmp(target);
5626ed61ec1dSYuri Pankov 			error = open_objset(target, DMU_OST_ANY, FTAG, &os);
5627c5904d13Seschrock 		}
5628fa9e4066Sahrens 	}
562980eb36f2SGeorge Wilson 	nvlist_free(policy);
563080eb36f2SGeorge Wilson 
5631fa9e4066Sahrens 	if (error)
56323ad6c7f9SVictor Latushkin 		fatal("can't open '%s': %s", target, strerror(error));
5633fa9e4066Sahrens 
5634fa9e4066Sahrens 	argv++;
563507428bdfSVictor Latushkin 	argc--;
563607428bdfSVictor Latushkin 	if (!dump_opt['R']) {
563707428bdfSVictor Latushkin 		if (argc > 0) {
563807428bdfSVictor Latushkin 			zopt_objects = argc;
563907428bdfSVictor Latushkin 			zopt_object = calloc(zopt_objects, sizeof (uint64_t));
56403f7978d0SAlan Somers 			for (unsigned i = 0; i < zopt_objects; i++) {
564107428bdfSVictor Latushkin 				errno = 0;
564207428bdfSVictor Latushkin 				zopt_object[i] = strtoull(argv[i], NULL, 0);
564307428bdfSVictor Latushkin 				if (zopt_object[i] == 0 && errno != 0)
564487219db7SVictor Latushkin 					fatal("bad number %s: %s",
564507428bdfSVictor Latushkin 					    argv[i], strerror(errno));
564607428bdfSVictor Latushkin 			}
5647fa9e4066Sahrens 		}
5648e690fb27SChristopher Siden 		if (os != NULL) {
5649e690fb27SChristopher Siden 			dump_dir(os);
5650e690fb27SChristopher Siden 		} else if (zopt_objects > 0 && !dump_opt['m']) {
5651e690fb27SChristopher Siden 			dump_dir(spa->spa_meta_objset);
5652e690fb27SChristopher Siden 		} else {
5653e690fb27SChristopher Siden 			dump_zpool(spa);
5654e690fb27SChristopher Siden 		}
5655fa9e4066Sahrens 	} else {
565607428bdfSVictor Latushkin 		flagbits['b'] = ZDB_FLAG_PRINT_BLKPTR;
565707428bdfSVictor Latushkin 		flagbits['c'] = ZDB_FLAG_CHECKSUM;
565807428bdfSVictor Latushkin 		flagbits['d'] = ZDB_FLAG_DECOMPRESS;
565907428bdfSVictor Latushkin 		flagbits['e'] = ZDB_FLAG_BSWAP;
566007428bdfSVictor Latushkin 		flagbits['g'] = ZDB_FLAG_GBH;
566107428bdfSVictor Latushkin 		flagbits['i'] = ZDB_FLAG_INDIRECT;
566207428bdfSVictor Latushkin 		flagbits['p'] = ZDB_FLAG_PHYS;
566307428bdfSVictor Latushkin 		flagbits['r'] = ZDB_FLAG_RAW;
566407428bdfSVictor Latushkin 
56653f7978d0SAlan Somers 		for (int i = 0; i < argc; i++)
566607428bdfSVictor Latushkin 			zdb_read_block(argv[i], spa);
5667fa9e4066Sahrens 	}
5668fa9e4066Sahrens 
566986714001SSerapheim Dimitropoulos 	if (dump_opt['k']) {
567086714001SSerapheim Dimitropoulos 		free(checkpoint_pool);
567186714001SSerapheim Dimitropoulos 		if (!target_is_spa)
567286714001SSerapheim Dimitropoulos 			free(checkpoint_target);
567386714001SSerapheim Dimitropoulos 	}
567486714001SSerapheim Dimitropoulos 
5675ed61ec1dSYuri Pankov 	if (os != NULL)
5676ed61ec1dSYuri Pankov 		close_objset(os, FTAG);
5677ed61ec1dSYuri Pankov 	else
5678ed61ec1dSYuri Pankov 		spa_close(spa, FTAG);
567907428bdfSVictor Latushkin 
5680e0d35c44Smarks 	fuid_table_destroy();
5681e0d35c44Smarks 
568229bdd2f9SPavel Zakharov 	dump_debug_buffer();
568329bdd2f9SPavel Zakharov 
5684de6628f0Sck 	libzfs_fini(g_zfs);
5685fa9e4066Sahrens 	kernel_fini();
5686fa9e4066Sahrens 
568720b5dafbSPaul Dagnelie 	return (error);
5688fa9e4066Sahrens }
5689