/*
 * CDDL HEADER START
 *
 * The contents of this file are subject to the terms of the
 * Common Development and Distribution License (the "License").
 * You may not use this file except in compliance with the License.
 *
 * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
 * or http://www.opensolaris.org/os/licensing.
 * See the License for the specific language governing permissions
 * and limitations under the License.
 *
 * When distributing Covered Code, include this CDDL HEADER in each
 * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
 * If applicable, add the following below this CDDL HEADER, with the
 * fields enclosed by brackets "[]" replaced with your own identifying
 * information: Portions Copyright [yyyy] [name of copyright owner]
 *
 * CDDL HEADER END
 */

/*
 * Copyright (c) 2009, 2010, Oracle and/or its affiliates. All rights reserved.
 * Copyright (c) 2012 by Delphix. All rights reserved.
25b24ab676SJeff Bonwick */ 26b24ab676SJeff Bonwick 27b24ab676SJeff Bonwick #include <sys/zfs_context.h> 28b24ab676SJeff Bonwick #include <sys/spa.h> 29b24ab676SJeff Bonwick #include <sys/spa_impl.h> 30b24ab676SJeff Bonwick #include <sys/zio.h> 31b24ab676SJeff Bonwick #include <sys/ddt.h> 32b24ab676SJeff Bonwick #include <sys/zap.h> 33b24ab676SJeff Bonwick #include <sys/dmu_tx.h> 34b24ab676SJeff Bonwick #include <sys/arc.h> 35bbfd46c4SJeff Bonwick #include <sys/dsl_pool.h> 36b24ab676SJeff Bonwick #include <sys/zio_checksum.h> 37b24ab676SJeff Bonwick #include <sys/zio_compress.h> 383f9d6ad7SLin Ling #include <sys/dsl_scan.h> 39b24ab676SJeff Bonwick 40837b568bSGeorge Wilson /* 41837b568bSGeorge Wilson * Enable/disable prefetching of dedup-ed blocks which are going to be freed. 42837b568bSGeorge Wilson */ 43837b568bSGeorge Wilson int zfs_dedup_prefetch = 1; 44837b568bSGeorge Wilson 45b24ab676SJeff Bonwick static const ddt_ops_t *ddt_ops[DDT_TYPES] = { 46b24ab676SJeff Bonwick &ddt_zap_ops, 47b24ab676SJeff Bonwick }; 48b24ab676SJeff Bonwick 49b24ab676SJeff Bonwick static const char *ddt_class_name[DDT_CLASSES] = { 50b24ab676SJeff Bonwick "ditto", 51b24ab676SJeff Bonwick "duplicate", 52b24ab676SJeff Bonwick "unique", 53b24ab676SJeff Bonwick }; 54b24ab676SJeff Bonwick 55b24ab676SJeff Bonwick static void 56b24ab676SJeff Bonwick ddt_object_create(ddt_t *ddt, enum ddt_type type, enum ddt_class class, 57b24ab676SJeff Bonwick dmu_tx_t *tx) 58b24ab676SJeff Bonwick { 59b24ab676SJeff Bonwick spa_t *spa = ddt->ddt_spa; 60b24ab676SJeff Bonwick objset_t *os = ddt->ddt_os; 61b24ab676SJeff Bonwick uint64_t *objectp = &ddt->ddt_object[type][class]; 62b24ab676SJeff Bonwick boolean_t prehash = zio_checksum_table[ddt->ddt_checksum].ci_dedup; 63b24ab676SJeff Bonwick char name[DDT_NAMELEN]; 64b24ab676SJeff Bonwick 65b24ab676SJeff Bonwick ddt_object_name(ddt, type, class, name); 66b24ab676SJeff Bonwick 67b24ab676SJeff Bonwick ASSERT(*objectp == 0); 68b24ab676SJeff Bonwick 
VERIFY(ddt_ops[type]->ddt_op_create(os, objectp, tx, prehash) == 0); 69b24ab676SJeff Bonwick ASSERT(*objectp != 0); 70b24ab676SJeff Bonwick 71b24ab676SJeff Bonwick VERIFY(zap_add(os, DMU_POOL_DIRECTORY_OBJECT, name, 72b24ab676SJeff Bonwick sizeof (uint64_t), 1, objectp, tx) == 0); 73b24ab676SJeff Bonwick 74b24ab676SJeff Bonwick VERIFY(zap_add(os, spa->spa_ddt_stat_object, name, 75b24ab676SJeff Bonwick sizeof (uint64_t), sizeof (ddt_histogram_t) / sizeof (uint64_t), 76b24ab676SJeff Bonwick &ddt->ddt_histogram[type][class], tx) == 0); 77b24ab676SJeff Bonwick } 78b24ab676SJeff Bonwick 79b24ab676SJeff Bonwick static void 80b24ab676SJeff Bonwick ddt_object_destroy(ddt_t *ddt, enum ddt_type type, enum ddt_class class, 81b24ab676SJeff Bonwick dmu_tx_t *tx) 82b24ab676SJeff Bonwick { 83b24ab676SJeff Bonwick spa_t *spa = ddt->ddt_spa; 84b24ab676SJeff Bonwick objset_t *os = ddt->ddt_os; 85b24ab676SJeff Bonwick uint64_t *objectp = &ddt->ddt_object[type][class]; 86b24ab676SJeff Bonwick char name[DDT_NAMELEN]; 87b24ab676SJeff Bonwick 88b24ab676SJeff Bonwick ddt_object_name(ddt, type, class, name); 89b24ab676SJeff Bonwick 90b24ab676SJeff Bonwick ASSERT(*objectp != 0); 91b24ab676SJeff Bonwick ASSERT(ddt_object_count(ddt, type, class) == 0); 92b24ab676SJeff Bonwick ASSERT(ddt_histogram_empty(&ddt->ddt_histogram[type][class])); 93b24ab676SJeff Bonwick VERIFY(zap_remove(os, DMU_POOL_DIRECTORY_OBJECT, name, tx) == 0); 94b24ab676SJeff Bonwick VERIFY(zap_remove(os, spa->spa_ddt_stat_object, name, tx) == 0); 95b24ab676SJeff Bonwick VERIFY(ddt_ops[type]->ddt_op_destroy(os, *objectp, tx) == 0); 9630f608a4SGeorge Wilson bzero(&ddt->ddt_object_stats[type][class], sizeof (ddt_object_t)); 97b24ab676SJeff Bonwick 98b24ab676SJeff Bonwick *objectp = 0; 99b24ab676SJeff Bonwick } 100b24ab676SJeff Bonwick 101b24ab676SJeff Bonwick static int 102b24ab676SJeff Bonwick ddt_object_load(ddt_t *ddt, enum ddt_type type, enum ddt_class class) 103b24ab676SJeff Bonwick { 10430f608a4SGeorge Wilson ddt_object_t 
*ddo = &ddt->ddt_object_stats[type][class]; 10530f608a4SGeorge Wilson dmu_object_info_t doi; 106b24ab676SJeff Bonwick char name[DDT_NAMELEN]; 107b24ab676SJeff Bonwick int error; 108b24ab676SJeff Bonwick 109b24ab676SJeff Bonwick ddt_object_name(ddt, type, class, name); 110b24ab676SJeff Bonwick 111b24ab676SJeff Bonwick error = zap_lookup(ddt->ddt_os, DMU_POOL_DIRECTORY_OBJECT, name, 112b24ab676SJeff Bonwick sizeof (uint64_t), 1, &ddt->ddt_object[type][class]); 113b24ab676SJeff Bonwick 114b24ab676SJeff Bonwick if (error) 115b24ab676SJeff Bonwick return (error); 116b24ab676SJeff Bonwick 117b24ab676SJeff Bonwick error = zap_lookup(ddt->ddt_os, ddt->ddt_spa->spa_ddt_stat_object, name, 118b24ab676SJeff Bonwick sizeof (uint64_t), sizeof (ddt_histogram_t) / sizeof (uint64_t), 119b24ab676SJeff Bonwick &ddt->ddt_histogram[type][class]); 120b24ab676SJeff Bonwick 12130f608a4SGeorge Wilson /* 12230f608a4SGeorge Wilson * Seed the cached statistics. 12330f608a4SGeorge Wilson */ 12430f608a4SGeorge Wilson VERIFY(ddt_object_info(ddt, type, class, &doi) == 0); 12530f608a4SGeorge Wilson 12630f608a4SGeorge Wilson ddo->ddo_count = ddt_object_count(ddt, type, class); 12730f608a4SGeorge Wilson ddo->ddo_dspace = doi.doi_physical_blocks_512 << 9; 12830f608a4SGeorge Wilson ddo->ddo_mspace = doi.doi_fill_count * doi.doi_data_block_size; 12930f608a4SGeorge Wilson 130b24ab676SJeff Bonwick ASSERT(error == 0); 131b24ab676SJeff Bonwick return (error); 132b24ab676SJeff Bonwick } 133b24ab676SJeff Bonwick 134b24ab676SJeff Bonwick static void 135b24ab676SJeff Bonwick ddt_object_sync(ddt_t *ddt, enum ddt_type type, enum ddt_class class, 136b24ab676SJeff Bonwick dmu_tx_t *tx) 137b24ab676SJeff Bonwick { 13830f608a4SGeorge Wilson ddt_object_t *ddo = &ddt->ddt_object_stats[type][class]; 13930f608a4SGeorge Wilson dmu_object_info_t doi; 140b24ab676SJeff Bonwick char name[DDT_NAMELEN]; 141b24ab676SJeff Bonwick 142b24ab676SJeff Bonwick ddt_object_name(ddt, type, class, name); 143b24ab676SJeff Bonwick 
144b24ab676SJeff Bonwick VERIFY(zap_update(ddt->ddt_os, ddt->ddt_spa->spa_ddt_stat_object, name, 145b24ab676SJeff Bonwick sizeof (uint64_t), sizeof (ddt_histogram_t) / sizeof (uint64_t), 146b24ab676SJeff Bonwick &ddt->ddt_histogram[type][class], tx) == 0); 14730f608a4SGeorge Wilson 14830f608a4SGeorge Wilson /* 14930f608a4SGeorge Wilson * Cache DDT statistics; this is the only time they'll change. 15030f608a4SGeorge Wilson */ 15130f608a4SGeorge Wilson VERIFY(ddt_object_info(ddt, type, class, &doi) == 0); 15230f608a4SGeorge Wilson 15330f608a4SGeorge Wilson ddo->ddo_count = ddt_object_count(ddt, type, class); 15430f608a4SGeorge Wilson ddo->ddo_dspace = doi.doi_physical_blocks_512 << 9; 15530f608a4SGeorge Wilson ddo->ddo_mspace = doi.doi_fill_count * doi.doi_data_block_size; 156b24ab676SJeff Bonwick } 157b24ab676SJeff Bonwick 158b24ab676SJeff Bonwick static int 159b24ab676SJeff Bonwick ddt_object_lookup(ddt_t *ddt, enum ddt_type type, enum ddt_class class, 160b24ab676SJeff Bonwick ddt_entry_t *dde) 161b24ab676SJeff Bonwick { 162b24ab676SJeff Bonwick if (!ddt_object_exists(ddt, type, class)) 163b24ab676SJeff Bonwick return (ENOENT); 164b24ab676SJeff Bonwick 165b24ab676SJeff Bonwick return (ddt_ops[type]->ddt_op_lookup(ddt->ddt_os, 166b24ab676SJeff Bonwick ddt->ddt_object[type][class], dde)); 167b24ab676SJeff Bonwick } 168b24ab676SJeff Bonwick 169c7cd2421SGeorge Wilson static void 170c7cd2421SGeorge Wilson ddt_object_prefetch(ddt_t *ddt, enum ddt_type type, enum ddt_class class, 171c7cd2421SGeorge Wilson ddt_entry_t *dde) 172c7cd2421SGeorge Wilson { 173c7cd2421SGeorge Wilson if (!ddt_object_exists(ddt, type, class)) 174c7cd2421SGeorge Wilson return; 175c7cd2421SGeorge Wilson 176c7cd2421SGeorge Wilson ddt_ops[type]->ddt_op_prefetch(ddt->ddt_os, 177c7cd2421SGeorge Wilson ddt->ddt_object[type][class], dde); 178c7cd2421SGeorge Wilson } 179c7cd2421SGeorge Wilson 1803f9d6ad7SLin Ling int 181b24ab676SJeff Bonwick ddt_object_update(ddt_t *ddt, enum ddt_type type, enum ddt_class 
class, 182b24ab676SJeff Bonwick ddt_entry_t *dde, dmu_tx_t *tx) 183b24ab676SJeff Bonwick { 184b24ab676SJeff Bonwick ASSERT(ddt_object_exists(ddt, type, class)); 185b24ab676SJeff Bonwick 186b24ab676SJeff Bonwick return (ddt_ops[type]->ddt_op_update(ddt->ddt_os, 187b24ab676SJeff Bonwick ddt->ddt_object[type][class], dde, tx)); 188b24ab676SJeff Bonwick } 189b24ab676SJeff Bonwick 190b24ab676SJeff Bonwick static int 191b24ab676SJeff Bonwick ddt_object_remove(ddt_t *ddt, enum ddt_type type, enum ddt_class class, 192b24ab676SJeff Bonwick ddt_entry_t *dde, dmu_tx_t *tx) 193b24ab676SJeff Bonwick { 194b24ab676SJeff Bonwick ASSERT(ddt_object_exists(ddt, type, class)); 195b24ab676SJeff Bonwick 196b24ab676SJeff Bonwick return (ddt_ops[type]->ddt_op_remove(ddt->ddt_os, 197b24ab676SJeff Bonwick ddt->ddt_object[type][class], dde, tx)); 198b24ab676SJeff Bonwick } 199b24ab676SJeff Bonwick 200b24ab676SJeff Bonwick int 201b24ab676SJeff Bonwick ddt_object_walk(ddt_t *ddt, enum ddt_type type, enum ddt_class class, 202bbfd46c4SJeff Bonwick uint64_t *walk, ddt_entry_t *dde) 203b24ab676SJeff Bonwick { 204b24ab676SJeff Bonwick ASSERT(ddt_object_exists(ddt, type, class)); 205b24ab676SJeff Bonwick 206b24ab676SJeff Bonwick return (ddt_ops[type]->ddt_op_walk(ddt->ddt_os, 207b24ab676SJeff Bonwick ddt->ddt_object[type][class], dde, walk)); 208b24ab676SJeff Bonwick } 209b24ab676SJeff Bonwick 210b24ab676SJeff Bonwick uint64_t 211b24ab676SJeff Bonwick ddt_object_count(ddt_t *ddt, enum ddt_type type, enum ddt_class class) 212b24ab676SJeff Bonwick { 213b24ab676SJeff Bonwick ASSERT(ddt_object_exists(ddt, type, class)); 214b24ab676SJeff Bonwick 215b24ab676SJeff Bonwick return (ddt_ops[type]->ddt_op_count(ddt->ddt_os, 216b24ab676SJeff Bonwick ddt->ddt_object[type][class])); 217b24ab676SJeff Bonwick } 218b24ab676SJeff Bonwick 219b24ab676SJeff Bonwick int 220b24ab676SJeff Bonwick ddt_object_info(ddt_t *ddt, enum ddt_type type, enum ddt_class class, 221b24ab676SJeff Bonwick dmu_object_info_t *doi) 
222b24ab676SJeff Bonwick { 223b24ab676SJeff Bonwick if (!ddt_object_exists(ddt, type, class)) 224b24ab676SJeff Bonwick return (ENOENT); 225b24ab676SJeff Bonwick 226b24ab676SJeff Bonwick return (dmu_object_info(ddt->ddt_os, ddt->ddt_object[type][class], 227b24ab676SJeff Bonwick doi)); 228b24ab676SJeff Bonwick } 229b24ab676SJeff Bonwick 230b24ab676SJeff Bonwick boolean_t 231b24ab676SJeff Bonwick ddt_object_exists(ddt_t *ddt, enum ddt_type type, enum ddt_class class) 232b24ab676SJeff Bonwick { 233b24ab676SJeff Bonwick return (!!ddt->ddt_object[type][class]); 234b24ab676SJeff Bonwick } 235b24ab676SJeff Bonwick 236b24ab676SJeff Bonwick void 237b24ab676SJeff Bonwick ddt_object_name(ddt_t *ddt, enum ddt_type type, enum ddt_class class, 238b24ab676SJeff Bonwick char *name) 239b24ab676SJeff Bonwick { 240b24ab676SJeff Bonwick (void) sprintf(name, DMU_POOL_DDT, 241b24ab676SJeff Bonwick zio_checksum_table[ddt->ddt_checksum].ci_name, 242b24ab676SJeff Bonwick ddt_ops[type]->ddt_op_name, ddt_class_name[class]); 243b24ab676SJeff Bonwick } 244b24ab676SJeff Bonwick 245b24ab676SJeff Bonwick void 246b24ab676SJeff Bonwick ddt_bp_fill(const ddt_phys_t *ddp, blkptr_t *bp, uint64_t txg) 247b24ab676SJeff Bonwick { 248b24ab676SJeff Bonwick ASSERT(txg != 0); 249b24ab676SJeff Bonwick 250b24ab676SJeff Bonwick for (int d = 0; d < SPA_DVAS_PER_BP; d++) 251b24ab676SJeff Bonwick bp->blk_dva[d] = ddp->ddp_dva[d]; 252b24ab676SJeff Bonwick BP_SET_BIRTH(bp, txg, ddp->ddp_phys_birth); 253b24ab676SJeff Bonwick } 254b24ab676SJeff Bonwick 255b24ab676SJeff Bonwick void 256bbfd46c4SJeff Bonwick ddt_bp_create(enum zio_checksum checksum, 257bbfd46c4SJeff Bonwick const ddt_key_t *ddk, const ddt_phys_t *ddp, blkptr_t *bp) 258b24ab676SJeff Bonwick { 259b24ab676SJeff Bonwick BP_ZERO(bp); 260b24ab676SJeff Bonwick 261b24ab676SJeff Bonwick if (ddp != NULL) 262b24ab676SJeff Bonwick ddt_bp_fill(ddp, bp, ddp->ddp_phys_birth); 263b24ab676SJeff Bonwick 264b24ab676SJeff Bonwick bp->blk_cksum = ddk->ddk_cksum; 
2653f9d6ad7SLin Ling bp->blk_fill = 1; 266b24ab676SJeff Bonwick 267b24ab676SJeff Bonwick BP_SET_LSIZE(bp, DDK_GET_LSIZE(ddk)); 268b24ab676SJeff Bonwick BP_SET_PSIZE(bp, DDK_GET_PSIZE(ddk)); 269b24ab676SJeff Bonwick BP_SET_COMPRESS(bp, DDK_GET_COMPRESS(ddk)); 270bbfd46c4SJeff Bonwick BP_SET_CHECKSUM(bp, checksum); 2713f9d6ad7SLin Ling BP_SET_TYPE(bp, DMU_OT_DEDUP); 272b24ab676SJeff Bonwick BP_SET_LEVEL(bp, 0); 273b24ab676SJeff Bonwick BP_SET_DEDUP(bp, 0); 274b24ab676SJeff Bonwick BP_SET_BYTEORDER(bp, ZFS_HOST_BYTEORDER); 275b24ab676SJeff Bonwick } 276b24ab676SJeff Bonwick 277b24ab676SJeff Bonwick void 278b24ab676SJeff Bonwick ddt_key_fill(ddt_key_t *ddk, const blkptr_t *bp) 279b24ab676SJeff Bonwick { 280b24ab676SJeff Bonwick ddk->ddk_cksum = bp->blk_cksum; 281b24ab676SJeff Bonwick ddk->ddk_prop = 0; 282b24ab676SJeff Bonwick 283b24ab676SJeff Bonwick DDK_SET_LSIZE(ddk, BP_GET_LSIZE(bp)); 284b24ab676SJeff Bonwick DDK_SET_PSIZE(ddk, BP_GET_PSIZE(bp)); 285b24ab676SJeff Bonwick DDK_SET_COMPRESS(ddk, BP_GET_COMPRESS(bp)); 286b24ab676SJeff Bonwick } 287b24ab676SJeff Bonwick 288b24ab676SJeff Bonwick void 289b24ab676SJeff Bonwick ddt_phys_fill(ddt_phys_t *ddp, const blkptr_t *bp) 290b24ab676SJeff Bonwick { 291b24ab676SJeff Bonwick ASSERT(ddp->ddp_phys_birth == 0); 292b24ab676SJeff Bonwick 293b24ab676SJeff Bonwick for (int d = 0; d < SPA_DVAS_PER_BP; d++) 294b24ab676SJeff Bonwick ddp->ddp_dva[d] = bp->blk_dva[d]; 295b24ab676SJeff Bonwick ddp->ddp_phys_birth = BP_PHYSICAL_BIRTH(bp); 296b24ab676SJeff Bonwick } 297b24ab676SJeff Bonwick 298b24ab676SJeff Bonwick void 299b24ab676SJeff Bonwick ddt_phys_clear(ddt_phys_t *ddp) 300b24ab676SJeff Bonwick { 301b24ab676SJeff Bonwick bzero(ddp, sizeof (*ddp)); 302b24ab676SJeff Bonwick } 303b24ab676SJeff Bonwick 304b24ab676SJeff Bonwick void 305b24ab676SJeff Bonwick ddt_phys_addref(ddt_phys_t *ddp) 306b24ab676SJeff Bonwick { 307b24ab676SJeff Bonwick ddp->ddp_refcnt++; 308b24ab676SJeff Bonwick } 309b24ab676SJeff Bonwick 310b24ab676SJeff 
Bonwick void 311b24ab676SJeff Bonwick ddt_phys_decref(ddt_phys_t *ddp) 312b24ab676SJeff Bonwick { 313b24ab676SJeff Bonwick ASSERT((int64_t)ddp->ddp_refcnt > 0); 314b24ab676SJeff Bonwick ddp->ddp_refcnt--; 315b24ab676SJeff Bonwick } 316b24ab676SJeff Bonwick 317b24ab676SJeff Bonwick void 318b24ab676SJeff Bonwick ddt_phys_free(ddt_t *ddt, ddt_key_t *ddk, ddt_phys_t *ddp, uint64_t txg) 319b24ab676SJeff Bonwick { 320b24ab676SJeff Bonwick blkptr_t blk; 321b24ab676SJeff Bonwick 322bbfd46c4SJeff Bonwick ddt_bp_create(ddt->ddt_checksum, ddk, ddp, &blk); 323b24ab676SJeff Bonwick ddt_phys_clear(ddp); 324b24ab676SJeff Bonwick zio_free(ddt->ddt_spa, txg, &blk); 325b24ab676SJeff Bonwick } 326b24ab676SJeff Bonwick 327b24ab676SJeff Bonwick ddt_phys_t * 328b24ab676SJeff Bonwick ddt_phys_select(const ddt_entry_t *dde, const blkptr_t *bp) 329b24ab676SJeff Bonwick { 330b24ab676SJeff Bonwick ddt_phys_t *ddp = (ddt_phys_t *)dde->dde_phys; 331b24ab676SJeff Bonwick 332b24ab676SJeff Bonwick for (int p = 0; p < DDT_PHYS_TYPES; p++, ddp++) { 333b24ab676SJeff Bonwick if (DVA_EQUAL(BP_IDENTITY(bp), &ddp->ddp_dva[0]) && 334b24ab676SJeff Bonwick BP_PHYSICAL_BIRTH(bp) == ddp->ddp_phys_birth) 335b24ab676SJeff Bonwick return (ddp); 336b24ab676SJeff Bonwick } 337b24ab676SJeff Bonwick return (NULL); 338b24ab676SJeff Bonwick } 339b24ab676SJeff Bonwick 340b24ab676SJeff Bonwick uint64_t 341b24ab676SJeff Bonwick ddt_phys_total_refcnt(const ddt_entry_t *dde) 342b24ab676SJeff Bonwick { 343b24ab676SJeff Bonwick uint64_t refcnt = 0; 344b24ab676SJeff Bonwick 345b24ab676SJeff Bonwick for (int p = DDT_PHYS_SINGLE; p <= DDT_PHYS_TRIPLE; p++) 346b24ab676SJeff Bonwick refcnt += dde->dde_phys[p].ddp_refcnt; 347b24ab676SJeff Bonwick 348b24ab676SJeff Bonwick return (refcnt); 349b24ab676SJeff Bonwick } 350b24ab676SJeff Bonwick 351b24ab676SJeff Bonwick static void 352b24ab676SJeff Bonwick ddt_stat_generate(ddt_t *ddt, ddt_entry_t *dde, ddt_stat_t *dds) 353b24ab676SJeff Bonwick { 354b24ab676SJeff Bonwick spa_t *spa = 
ddt->ddt_spa; 355b24ab676SJeff Bonwick ddt_phys_t *ddp = dde->dde_phys; 356b24ab676SJeff Bonwick ddt_key_t *ddk = &dde->dde_key; 357b24ab676SJeff Bonwick uint64_t lsize = DDK_GET_LSIZE(ddk); 358b24ab676SJeff Bonwick uint64_t psize = DDK_GET_PSIZE(ddk); 359b24ab676SJeff Bonwick 360b24ab676SJeff Bonwick bzero(dds, sizeof (*dds)); 361b24ab676SJeff Bonwick 362b24ab676SJeff Bonwick for (int p = 0; p < DDT_PHYS_TYPES; p++, ddp++) { 363b24ab676SJeff Bonwick uint64_t dsize = 0; 364b24ab676SJeff Bonwick uint64_t refcnt = ddp->ddp_refcnt; 365b24ab676SJeff Bonwick 366b24ab676SJeff Bonwick if (ddp->ddp_phys_birth == 0) 367b24ab676SJeff Bonwick continue; 368b24ab676SJeff Bonwick 369b24ab676SJeff Bonwick for (int d = 0; d < SPA_DVAS_PER_BP; d++) 370b24ab676SJeff Bonwick dsize += dva_get_dsize_sync(spa, &ddp->ddp_dva[d]); 371b24ab676SJeff Bonwick 372b24ab676SJeff Bonwick dds->dds_blocks += 1; 373b24ab676SJeff Bonwick dds->dds_lsize += lsize; 374b24ab676SJeff Bonwick dds->dds_psize += psize; 375b24ab676SJeff Bonwick dds->dds_dsize += dsize; 376b24ab676SJeff Bonwick 377b24ab676SJeff Bonwick dds->dds_ref_blocks += refcnt; 378b24ab676SJeff Bonwick dds->dds_ref_lsize += lsize * refcnt; 379b24ab676SJeff Bonwick dds->dds_ref_psize += psize * refcnt; 380b24ab676SJeff Bonwick dds->dds_ref_dsize += dsize * refcnt; 381b24ab676SJeff Bonwick } 382b24ab676SJeff Bonwick } 383b24ab676SJeff Bonwick 384b24ab676SJeff Bonwick void 385b24ab676SJeff Bonwick ddt_stat_add(ddt_stat_t *dst, const ddt_stat_t *src, uint64_t neg) 386b24ab676SJeff Bonwick { 387b24ab676SJeff Bonwick const uint64_t *s = (const uint64_t *)src; 388b24ab676SJeff Bonwick uint64_t *d = (uint64_t *)dst; 389b24ab676SJeff Bonwick uint64_t *d_end = (uint64_t *)(dst + 1); 390b24ab676SJeff Bonwick 391b24ab676SJeff Bonwick ASSERT(neg == 0 || neg == -1ULL); /* add or subtract */ 392b24ab676SJeff Bonwick 393b24ab676SJeff Bonwick while (d < d_end) 394b24ab676SJeff Bonwick *d++ += (*s++ ^ neg) - neg; 395b24ab676SJeff Bonwick } 396b24ab676SJeff 
Bonwick 397b24ab676SJeff Bonwick static void 398b24ab676SJeff Bonwick ddt_stat_update(ddt_t *ddt, ddt_entry_t *dde, uint64_t neg) 399b24ab676SJeff Bonwick { 400b24ab676SJeff Bonwick ddt_stat_t dds; 401b24ab676SJeff Bonwick ddt_histogram_t *ddh; 402b24ab676SJeff Bonwick int bucket; 403b24ab676SJeff Bonwick 404b24ab676SJeff Bonwick ddt_stat_generate(ddt, dde, &dds); 405b24ab676SJeff Bonwick 406b24ab676SJeff Bonwick bucket = highbit(dds.dds_ref_blocks) - 1; 407b24ab676SJeff Bonwick ASSERT(bucket >= 0); 408b24ab676SJeff Bonwick 409b24ab676SJeff Bonwick ddh = &ddt->ddt_histogram[dde->dde_type][dde->dde_class]; 410b24ab676SJeff Bonwick 411b24ab676SJeff Bonwick ddt_stat_add(&ddh->ddh_stat[bucket], &dds, neg); 412b24ab676SJeff Bonwick } 413b24ab676SJeff Bonwick 414b24ab676SJeff Bonwick void 415b24ab676SJeff Bonwick ddt_histogram_add(ddt_histogram_t *dst, const ddt_histogram_t *src) 416b24ab676SJeff Bonwick { 417b24ab676SJeff Bonwick for (int h = 0; h < 64; h++) 418b24ab676SJeff Bonwick ddt_stat_add(&dst->ddh_stat[h], &src->ddh_stat[h], 0); 419b24ab676SJeff Bonwick } 420b24ab676SJeff Bonwick 421b24ab676SJeff Bonwick void 422b24ab676SJeff Bonwick ddt_histogram_stat(ddt_stat_t *dds, const ddt_histogram_t *ddh) 423b24ab676SJeff Bonwick { 424b24ab676SJeff Bonwick bzero(dds, sizeof (*dds)); 425b24ab676SJeff Bonwick 426b24ab676SJeff Bonwick for (int h = 0; h < 64; h++) 427b24ab676SJeff Bonwick ddt_stat_add(dds, &ddh->ddh_stat[h], 0); 428b24ab676SJeff Bonwick } 429b24ab676SJeff Bonwick 430b24ab676SJeff Bonwick boolean_t 431b24ab676SJeff Bonwick ddt_histogram_empty(const ddt_histogram_t *ddh) 432b24ab676SJeff Bonwick { 433b24ab676SJeff Bonwick const uint64_t *s = (const uint64_t *)ddh; 434b24ab676SJeff Bonwick const uint64_t *s_end = (const uint64_t *)(ddh + 1); 435b24ab676SJeff Bonwick 436b24ab676SJeff Bonwick while (s < s_end) 437b24ab676SJeff Bonwick if (*s++ != 0) 438b24ab676SJeff Bonwick return (B_FALSE); 439b24ab676SJeff Bonwick 440b24ab676SJeff Bonwick return (B_TRUE); 
441b24ab676SJeff Bonwick } 442b24ab676SJeff Bonwick 4439eb19f4dSGeorge Wilson void 44430f608a4SGeorge Wilson ddt_get_dedup_object_stats(spa_t *spa, ddt_object_t *ddo_total) 445b24ab676SJeff Bonwick { 44630f608a4SGeorge Wilson /* Sum the statistics we cached in ddt_object_sync(). */ 447b24ab676SJeff Bonwick for (enum zio_checksum c = 0; c < ZIO_CHECKSUM_FUNCTIONS; c++) { 448b24ab676SJeff Bonwick ddt_t *ddt = spa->spa_ddt[c]; 449b24ab676SJeff Bonwick for (enum ddt_type type = 0; type < DDT_TYPES; type++) { 450b24ab676SJeff Bonwick for (enum ddt_class class = 0; class < DDT_CLASSES; 451b24ab676SJeff Bonwick class++) { 45230f608a4SGeorge Wilson ddt_object_t *ddo = 45330f608a4SGeorge Wilson &ddt->ddt_object_stats[type][class]; 45430f608a4SGeorge Wilson ddo_total->ddo_count += ddo->ddo_count; 45530f608a4SGeorge Wilson ddo_total->ddo_dspace += ddo->ddo_dspace; 45630f608a4SGeorge Wilson ddo_total->ddo_mspace += ddo->ddo_mspace; 4579eb19f4dSGeorge Wilson } 4589eb19f4dSGeorge Wilson } 4599eb19f4dSGeorge Wilson } 46030f608a4SGeorge Wilson 46130f608a4SGeorge Wilson /* ... and compute the averages. 
*/ 46230f608a4SGeorge Wilson if (ddo_total->ddo_count != 0) { 46330f608a4SGeorge Wilson ddo_total->ddo_dspace /= ddo_total->ddo_count; 46430f608a4SGeorge Wilson ddo_total->ddo_mspace /= ddo_total->ddo_count; 46530f608a4SGeorge Wilson } 4669eb19f4dSGeorge Wilson } 4679eb19f4dSGeorge Wilson 4689eb19f4dSGeorge Wilson void 4699eb19f4dSGeorge Wilson ddt_get_dedup_histogram(spa_t *spa, ddt_histogram_t *ddh) 4709eb19f4dSGeorge Wilson { 4719eb19f4dSGeorge Wilson for (enum zio_checksum c = 0; c < ZIO_CHECKSUM_FUNCTIONS; c++) { 4729eb19f4dSGeorge Wilson ddt_t *ddt = spa->spa_ddt[c]; 4739eb19f4dSGeorge Wilson for (enum ddt_type type = 0; type < DDT_TYPES; type++) { 4749eb19f4dSGeorge Wilson for (enum ddt_class class = 0; class < DDT_CLASSES; 4759eb19f4dSGeorge Wilson class++) { 4769eb19f4dSGeorge Wilson ddt_histogram_add(ddh, 47730f608a4SGeorge Wilson &ddt->ddt_histogram_cache[type][class]); 478b24ab676SJeff Bonwick } 479b24ab676SJeff Bonwick } 480b24ab676SJeff Bonwick } 4819eb19f4dSGeorge Wilson } 4829eb19f4dSGeorge Wilson 4839eb19f4dSGeorge Wilson void 4849eb19f4dSGeorge Wilson ddt_get_dedup_stats(spa_t *spa, ddt_stat_t *dds_total) 4859eb19f4dSGeorge Wilson { 4869eb19f4dSGeorge Wilson ddt_histogram_t *ddh_total; 487b24ab676SJeff Bonwick 4889eb19f4dSGeorge Wilson ddh_total = kmem_zalloc(sizeof (ddt_histogram_t), KM_SLEEP); 4899eb19f4dSGeorge Wilson ddt_get_dedup_histogram(spa, ddh_total); 4909eb19f4dSGeorge Wilson ddt_histogram_stat(dds_total, ddh_total); 4919eb19f4dSGeorge Wilson kmem_free(ddh_total, sizeof (ddt_histogram_t)); 492485bbbf5SGeorge Wilson } 493485bbbf5SGeorge Wilson 494485bbbf5SGeorge Wilson uint64_t 495485bbbf5SGeorge Wilson ddt_get_dedup_dspace(spa_t *spa) 496485bbbf5SGeorge Wilson { 497485bbbf5SGeorge Wilson ddt_stat_t dds_total = { 0 }; 498485bbbf5SGeorge Wilson 499485bbbf5SGeorge Wilson ddt_get_dedup_stats(spa, &dds_total); 500485bbbf5SGeorge Wilson return (dds_total.dds_ref_dsize - dds_total.dds_dsize); 501485bbbf5SGeorge Wilson } 502485bbbf5SGeorge 
Wilson 503485bbbf5SGeorge Wilson uint64_t 504485bbbf5SGeorge Wilson ddt_get_pool_dedup_ratio(spa_t *spa) 505485bbbf5SGeorge Wilson { 506485bbbf5SGeorge Wilson ddt_stat_t dds_total = { 0 }; 507b24ab676SJeff Bonwick 508485bbbf5SGeorge Wilson ddt_get_dedup_stats(spa, &dds_total); 509b24ab676SJeff Bonwick if (dds_total.dds_dsize == 0) 510b24ab676SJeff Bonwick return (100); 511b24ab676SJeff Bonwick 512b24ab676SJeff Bonwick return (dds_total.dds_ref_dsize * 100 / dds_total.dds_dsize); 513b24ab676SJeff Bonwick } 514b24ab676SJeff Bonwick 515b24ab676SJeff Bonwick int 516b24ab676SJeff Bonwick ddt_ditto_copies_needed(ddt_t *ddt, ddt_entry_t *dde, ddt_phys_t *ddp_willref) 517b24ab676SJeff Bonwick { 518b24ab676SJeff Bonwick spa_t *spa = ddt->ddt_spa; 519b24ab676SJeff Bonwick uint64_t total_refcnt = 0; 520b24ab676SJeff Bonwick uint64_t ditto = spa->spa_dedup_ditto; 521b24ab676SJeff Bonwick int total_copies = 0; 522b24ab676SJeff Bonwick int desired_copies = 0; 523b24ab676SJeff Bonwick 524b24ab676SJeff Bonwick for (int p = DDT_PHYS_SINGLE; p <= DDT_PHYS_TRIPLE; p++) { 525b24ab676SJeff Bonwick ddt_phys_t *ddp = &dde->dde_phys[p]; 526b24ab676SJeff Bonwick zio_t *zio = dde->dde_lead_zio[p]; 527b24ab676SJeff Bonwick uint64_t refcnt = ddp->ddp_refcnt; /* committed refs */ 528b24ab676SJeff Bonwick if (zio != NULL) 529b24ab676SJeff Bonwick refcnt += zio->io_parent_count; /* pending refs */ 530b24ab676SJeff Bonwick if (ddp == ddp_willref) 531b24ab676SJeff Bonwick refcnt++; /* caller's ref */ 532b24ab676SJeff Bonwick if (refcnt != 0) { 533b24ab676SJeff Bonwick total_refcnt += refcnt; 534b24ab676SJeff Bonwick total_copies += p; 535b24ab676SJeff Bonwick } 536b24ab676SJeff Bonwick } 537b24ab676SJeff Bonwick 538b24ab676SJeff Bonwick if (ditto == 0 || ditto > UINT32_MAX) 539b24ab676SJeff Bonwick ditto = UINT32_MAX; 540b24ab676SJeff Bonwick 541b24ab676SJeff Bonwick if (total_refcnt >= 1) 542b24ab676SJeff Bonwick desired_copies++; 543b24ab676SJeff Bonwick if (total_refcnt >= ditto) 
544b24ab676SJeff Bonwick desired_copies++; 545b24ab676SJeff Bonwick if (total_refcnt >= ditto * ditto) 546b24ab676SJeff Bonwick desired_copies++; 547b24ab676SJeff Bonwick 548b24ab676SJeff Bonwick return (MAX(desired_copies, total_copies) - total_copies); 549b24ab676SJeff Bonwick } 550b24ab676SJeff Bonwick 551b24ab676SJeff Bonwick int 552b24ab676SJeff Bonwick ddt_ditto_copies_present(ddt_entry_t *dde) 553b24ab676SJeff Bonwick { 554b24ab676SJeff Bonwick ddt_phys_t *ddp = &dde->dde_phys[DDT_PHYS_DITTO]; 555b24ab676SJeff Bonwick dva_t *dva = ddp->ddp_dva; 556b24ab676SJeff Bonwick int copies = 0 - DVA_GET_GANG(dva); 557b24ab676SJeff Bonwick 558b24ab676SJeff Bonwick for (int d = 0; d < SPA_DVAS_PER_BP; d++, dva++) 559b24ab676SJeff Bonwick if (DVA_IS_VALID(dva)) 560b24ab676SJeff Bonwick copies++; 561b24ab676SJeff Bonwick 562b24ab676SJeff Bonwick ASSERT(copies >= 0 && copies < SPA_DVAS_PER_BP); 563b24ab676SJeff Bonwick 564b24ab676SJeff Bonwick return (copies); 565b24ab676SJeff Bonwick } 566b24ab676SJeff Bonwick 567b24ab676SJeff Bonwick size_t 568b24ab676SJeff Bonwick ddt_compress(void *src, uchar_t *dst, size_t s_len, size_t d_len) 569b24ab676SJeff Bonwick { 570b24ab676SJeff Bonwick uchar_t *version = dst++; 571b24ab676SJeff Bonwick int cpfunc = ZIO_COMPRESS_ZLE; 572b24ab676SJeff Bonwick zio_compress_info_t *ci = &zio_compress_table[cpfunc]; 573b24ab676SJeff Bonwick size_t c_len; 574b24ab676SJeff Bonwick 575b24ab676SJeff Bonwick ASSERT(d_len >= s_len + 1); /* no compression plus version byte */ 576b24ab676SJeff Bonwick 577b24ab676SJeff Bonwick c_len = ci->ci_compress(src, dst, s_len, d_len - 1, ci->ci_level); 578b24ab676SJeff Bonwick 579b24ab676SJeff Bonwick if (c_len == s_len) { 580b24ab676SJeff Bonwick cpfunc = ZIO_COMPRESS_OFF; 581b24ab676SJeff Bonwick bcopy(src, dst, s_len); 582b24ab676SJeff Bonwick } 583b24ab676SJeff Bonwick 584b24ab676SJeff Bonwick *version = (ZFS_HOST_BYTEORDER & DDT_COMPRESS_BYTEORDER_MASK) | cpfunc; 585b24ab676SJeff Bonwick 586b24ab676SJeff 
Bonwick return (c_len + 1); 587b24ab676SJeff Bonwick } 588b24ab676SJeff Bonwick 589b24ab676SJeff Bonwick void 590b24ab676SJeff Bonwick ddt_decompress(uchar_t *src, void *dst, size_t s_len, size_t d_len) 591b24ab676SJeff Bonwick { 592b24ab676SJeff Bonwick uchar_t version = *src++; 593b24ab676SJeff Bonwick int cpfunc = version & DDT_COMPRESS_FUNCTION_MASK; 594b24ab676SJeff Bonwick zio_compress_info_t *ci = &zio_compress_table[cpfunc]; 595b24ab676SJeff Bonwick 596b24ab676SJeff Bonwick if (ci->ci_decompress != NULL) 597b24ab676SJeff Bonwick (void) ci->ci_decompress(src, dst, s_len, d_len, ci->ci_level); 598b24ab676SJeff Bonwick else 599b24ab676SJeff Bonwick bcopy(src, dst, d_len); 600b24ab676SJeff Bonwick 601b24ab676SJeff Bonwick if ((version ^ ZFS_HOST_BYTEORDER) & DDT_COMPRESS_BYTEORDER_MASK) 602b24ab676SJeff Bonwick byteswap_uint64_array(dst, d_len); 603b24ab676SJeff Bonwick } 604b24ab676SJeff Bonwick 605b24ab676SJeff Bonwick ddt_t * 606b24ab676SJeff Bonwick ddt_select_by_checksum(spa_t *spa, enum zio_checksum c) 607b24ab676SJeff Bonwick { 608b24ab676SJeff Bonwick return (spa->spa_ddt[c]); 609b24ab676SJeff Bonwick } 610b24ab676SJeff Bonwick 611b24ab676SJeff Bonwick ddt_t * 612b24ab676SJeff Bonwick ddt_select(spa_t *spa, const blkptr_t *bp) 613b24ab676SJeff Bonwick { 614b24ab676SJeff Bonwick return (spa->spa_ddt[BP_GET_CHECKSUM(bp)]); 615b24ab676SJeff Bonwick } 616b24ab676SJeff Bonwick 617b24ab676SJeff Bonwick void 618b24ab676SJeff Bonwick ddt_enter(ddt_t *ddt) 619b24ab676SJeff Bonwick { 620b24ab676SJeff Bonwick mutex_enter(&ddt->ddt_lock); 621b24ab676SJeff Bonwick } 622b24ab676SJeff Bonwick 623b24ab676SJeff Bonwick void 624b24ab676SJeff Bonwick ddt_exit(ddt_t *ddt) 625b24ab676SJeff Bonwick { 626b24ab676SJeff Bonwick mutex_exit(&ddt->ddt_lock); 627b24ab676SJeff Bonwick } 628b24ab676SJeff Bonwick 629b24ab676SJeff Bonwick static ddt_entry_t * 630b24ab676SJeff Bonwick ddt_alloc(const ddt_key_t *ddk) 631b24ab676SJeff Bonwick { 632b24ab676SJeff Bonwick ddt_entry_t *dde; 
633b24ab676SJeff Bonwick 634b24ab676SJeff Bonwick dde = kmem_zalloc(sizeof (ddt_entry_t), KM_SLEEP); 635b24ab676SJeff Bonwick cv_init(&dde->dde_cv, NULL, CV_DEFAULT, NULL); 636b24ab676SJeff Bonwick 637b24ab676SJeff Bonwick dde->dde_key = *ddk; 638b24ab676SJeff Bonwick 639b24ab676SJeff Bonwick return (dde); 640b24ab676SJeff Bonwick } 641b24ab676SJeff Bonwick 642b24ab676SJeff Bonwick static void 643b24ab676SJeff Bonwick ddt_free(ddt_entry_t *dde) 644b24ab676SJeff Bonwick { 645b24ab676SJeff Bonwick ASSERT(!dde->dde_loading); 646b24ab676SJeff Bonwick 647b24ab676SJeff Bonwick for (int p = 0; p < DDT_PHYS_TYPES; p++) 648b24ab676SJeff Bonwick ASSERT(dde->dde_lead_zio[p] == NULL); 649b24ab676SJeff Bonwick 650b24ab676SJeff Bonwick if (dde->dde_repair_data != NULL) 651b24ab676SJeff Bonwick zio_buf_free(dde->dde_repair_data, 652b24ab676SJeff Bonwick DDK_GET_PSIZE(&dde->dde_key)); 653b24ab676SJeff Bonwick 654b24ab676SJeff Bonwick cv_destroy(&dde->dde_cv); 655b24ab676SJeff Bonwick kmem_free(dde, sizeof (*dde)); 656b24ab676SJeff Bonwick } 657b24ab676SJeff Bonwick 658b24ab676SJeff Bonwick void 659b24ab676SJeff Bonwick ddt_remove(ddt_t *ddt, ddt_entry_t *dde) 660b24ab676SJeff Bonwick { 661b24ab676SJeff Bonwick ASSERT(MUTEX_HELD(&ddt->ddt_lock)); 662b24ab676SJeff Bonwick 663b24ab676SJeff Bonwick avl_remove(&ddt->ddt_tree, dde); 664b24ab676SJeff Bonwick ddt_free(dde); 665b24ab676SJeff Bonwick } 666b24ab676SJeff Bonwick 667b24ab676SJeff Bonwick ddt_entry_t * 668b24ab676SJeff Bonwick ddt_lookup(ddt_t *ddt, const blkptr_t *bp, boolean_t add) 669b24ab676SJeff Bonwick { 670b24ab676SJeff Bonwick ddt_entry_t *dde, dde_search; 671b24ab676SJeff Bonwick enum ddt_type type; 672b24ab676SJeff Bonwick enum ddt_class class; 673b24ab676SJeff Bonwick avl_index_t where; 674b24ab676SJeff Bonwick int error; 675b24ab676SJeff Bonwick 676b24ab676SJeff Bonwick ASSERT(MUTEX_HELD(&ddt->ddt_lock)); 677b24ab676SJeff Bonwick 678b24ab676SJeff Bonwick ddt_key_fill(&dde_search.dde_key, bp); 679b24ab676SJeff 
Bonwick 680b24ab676SJeff Bonwick dde = avl_find(&ddt->ddt_tree, &dde_search, &where); 681b24ab676SJeff Bonwick if (dde == NULL) { 682b24ab676SJeff Bonwick if (!add) 683b24ab676SJeff Bonwick return (NULL); 684b24ab676SJeff Bonwick dde = ddt_alloc(&dde_search.dde_key); 685b24ab676SJeff Bonwick avl_insert(&ddt->ddt_tree, dde, where); 686b24ab676SJeff Bonwick } 687b24ab676SJeff Bonwick 688b24ab676SJeff Bonwick while (dde->dde_loading) 689b24ab676SJeff Bonwick cv_wait(&dde->dde_cv, &ddt->ddt_lock); 690b24ab676SJeff Bonwick 691b24ab676SJeff Bonwick if (dde->dde_loaded) 692b24ab676SJeff Bonwick return (dde); 693b24ab676SJeff Bonwick 694b24ab676SJeff Bonwick dde->dde_loading = B_TRUE; 695b24ab676SJeff Bonwick 696b24ab676SJeff Bonwick ddt_exit(ddt); 697b24ab676SJeff Bonwick 698b24ab676SJeff Bonwick error = ENOENT; 699b24ab676SJeff Bonwick 700b24ab676SJeff Bonwick for (type = 0; type < DDT_TYPES; type++) { 701b24ab676SJeff Bonwick for (class = 0; class < DDT_CLASSES; class++) { 702b24ab676SJeff Bonwick error = ddt_object_lookup(ddt, type, class, dde); 703b24ab676SJeff Bonwick if (error != ENOENT) 704b24ab676SJeff Bonwick break; 705b24ab676SJeff Bonwick } 706b24ab676SJeff Bonwick if (error != ENOENT) 707b24ab676SJeff Bonwick break; 708b24ab676SJeff Bonwick } 709b24ab676SJeff Bonwick 710b24ab676SJeff Bonwick ASSERT(error == 0 || error == ENOENT); 711b24ab676SJeff Bonwick 712b24ab676SJeff Bonwick ddt_enter(ddt); 713b24ab676SJeff Bonwick 714b24ab676SJeff Bonwick ASSERT(dde->dde_loaded == B_FALSE); 715b24ab676SJeff Bonwick ASSERT(dde->dde_loading == B_TRUE); 716b24ab676SJeff Bonwick 717b24ab676SJeff Bonwick dde->dde_type = type; /* will be DDT_TYPES if no entry found */ 718b24ab676SJeff Bonwick dde->dde_class = class; /* will be DDT_CLASSES if no entry found */ 719b24ab676SJeff Bonwick dde->dde_loaded = B_TRUE; 720b24ab676SJeff Bonwick dde->dde_loading = B_FALSE; 721b24ab676SJeff Bonwick 722b24ab676SJeff Bonwick if (error == 0) 723b24ab676SJeff Bonwick ddt_stat_update(ddt, dde, 
-1ULL); 724b24ab676SJeff Bonwick 725b24ab676SJeff Bonwick cv_broadcast(&dde->dde_cv); 726b24ab676SJeff Bonwick 727b24ab676SJeff Bonwick return (dde); 728b24ab676SJeff Bonwick } 729b24ab676SJeff Bonwick 730c7cd2421SGeorge Wilson void 731c7cd2421SGeorge Wilson ddt_prefetch(spa_t *spa, const blkptr_t *bp) 732c7cd2421SGeorge Wilson { 733c7cd2421SGeorge Wilson ddt_t *ddt; 734c7cd2421SGeorge Wilson ddt_entry_t dde; 735c7cd2421SGeorge Wilson 736837b568bSGeorge Wilson if (!zfs_dedup_prefetch || bp == NULL || !BP_GET_DEDUP(bp)) 737c7cd2421SGeorge Wilson return; 738c7cd2421SGeorge Wilson 739c7cd2421SGeorge Wilson /* 740ce053c9dSGeorge Wilson * We only remove the DDT once all tables are empty and only 741ce053c9dSGeorge Wilson * prefetch dedup blocks when there are entries in the DDT. 742ce053c9dSGeorge Wilson * Thus no locking is required as the DDT can't disappear on us. 743c7cd2421SGeorge Wilson */ 744c7cd2421SGeorge Wilson ddt = ddt_select(spa, bp); 745c7cd2421SGeorge Wilson ddt_key_fill(&dde.dde_key, bp); 746c7cd2421SGeorge Wilson 747c7cd2421SGeorge Wilson for (enum ddt_type type = 0; type < DDT_TYPES; type++) { 748c7cd2421SGeorge Wilson for (enum ddt_class class = 0; class < DDT_CLASSES; class++) { 749c7cd2421SGeorge Wilson ddt_object_prefetch(ddt, type, class, &dde); 750c7cd2421SGeorge Wilson } 751c7cd2421SGeorge Wilson } 752c7cd2421SGeorge Wilson } 753c7cd2421SGeorge Wilson 754b24ab676SJeff Bonwick int 755b24ab676SJeff Bonwick ddt_entry_compare(const void *x1, const void *x2) 756b24ab676SJeff Bonwick { 757b24ab676SJeff Bonwick const ddt_entry_t *dde1 = x1; 758b24ab676SJeff Bonwick const ddt_entry_t *dde2 = x2; 759b24ab676SJeff Bonwick const uint64_t *u1 = (const uint64_t *)&dde1->dde_key; 760b24ab676SJeff Bonwick const uint64_t *u2 = (const uint64_t *)&dde2->dde_key; 761b24ab676SJeff Bonwick 762b24ab676SJeff Bonwick for (int i = 0; i < DDT_KEY_WORDS; i++) { 763b24ab676SJeff Bonwick if (u1[i] < u2[i]) 764b24ab676SJeff Bonwick return (-1); 765b24ab676SJeff Bonwick if 
(u1[i] > u2[i]) 766b24ab676SJeff Bonwick return (1); 767b24ab676SJeff Bonwick } 768b24ab676SJeff Bonwick 769b24ab676SJeff Bonwick return (0); 770b24ab676SJeff Bonwick } 771b24ab676SJeff Bonwick 772b24ab676SJeff Bonwick static ddt_t * 773b24ab676SJeff Bonwick ddt_table_alloc(spa_t *spa, enum zio_checksum c) 774b24ab676SJeff Bonwick { 775b24ab676SJeff Bonwick ddt_t *ddt; 776b24ab676SJeff Bonwick 777b24ab676SJeff Bonwick ddt = kmem_zalloc(sizeof (*ddt), KM_SLEEP); 778b24ab676SJeff Bonwick 779b24ab676SJeff Bonwick mutex_init(&ddt->ddt_lock, NULL, MUTEX_DEFAULT, NULL); 780b24ab676SJeff Bonwick avl_create(&ddt->ddt_tree, ddt_entry_compare, 781b24ab676SJeff Bonwick sizeof (ddt_entry_t), offsetof(ddt_entry_t, dde_node)); 782b24ab676SJeff Bonwick avl_create(&ddt->ddt_repair_tree, ddt_entry_compare, 783b24ab676SJeff Bonwick sizeof (ddt_entry_t), offsetof(ddt_entry_t, dde_node)); 784b24ab676SJeff Bonwick ddt->ddt_checksum = c; 785b24ab676SJeff Bonwick ddt->ddt_spa = spa; 786b24ab676SJeff Bonwick ddt->ddt_os = spa->spa_meta_objset; 787b24ab676SJeff Bonwick 788b24ab676SJeff Bonwick return (ddt); 789b24ab676SJeff Bonwick } 790b24ab676SJeff Bonwick 791b24ab676SJeff Bonwick static void 792b24ab676SJeff Bonwick ddt_table_free(ddt_t *ddt) 793b24ab676SJeff Bonwick { 794b24ab676SJeff Bonwick ASSERT(avl_numnodes(&ddt->ddt_tree) == 0); 795b24ab676SJeff Bonwick ASSERT(avl_numnodes(&ddt->ddt_repair_tree) == 0); 796b24ab676SJeff Bonwick avl_destroy(&ddt->ddt_tree); 797b24ab676SJeff Bonwick avl_destroy(&ddt->ddt_repair_tree); 798b24ab676SJeff Bonwick mutex_destroy(&ddt->ddt_lock); 799b24ab676SJeff Bonwick kmem_free(ddt, sizeof (*ddt)); 800b24ab676SJeff Bonwick } 801b24ab676SJeff Bonwick 802b24ab676SJeff Bonwick void 803b24ab676SJeff Bonwick ddt_create(spa_t *spa) 804b24ab676SJeff Bonwick { 805b24ab676SJeff Bonwick spa->spa_dedup_checksum = ZIO_DEDUPCHECKSUM; 806b24ab676SJeff Bonwick 807b24ab676SJeff Bonwick for (enum zio_checksum c = 0; c < ZIO_CHECKSUM_FUNCTIONS; c++) 808b24ab676SJeff 
Bonwick spa->spa_ddt[c] = ddt_table_alloc(spa, c); 809b24ab676SJeff Bonwick } 810b24ab676SJeff Bonwick 811b24ab676SJeff Bonwick int 812b24ab676SJeff Bonwick ddt_load(spa_t *spa) 813b24ab676SJeff Bonwick { 814b24ab676SJeff Bonwick int error; 815b24ab676SJeff Bonwick 816b24ab676SJeff Bonwick ddt_create(spa); 817b24ab676SJeff Bonwick 818b24ab676SJeff Bonwick error = zap_lookup(spa->spa_meta_objset, DMU_POOL_DIRECTORY_OBJECT, 819b24ab676SJeff Bonwick DMU_POOL_DDT_STATS, sizeof (uint64_t), 1, 820b24ab676SJeff Bonwick &spa->spa_ddt_stat_object); 821b24ab676SJeff Bonwick 822b24ab676SJeff Bonwick if (error) 823b24ab676SJeff Bonwick return (error == ENOENT ? 0 : error); 824b24ab676SJeff Bonwick 825b24ab676SJeff Bonwick for (enum zio_checksum c = 0; c < ZIO_CHECKSUM_FUNCTIONS; c++) { 82630f608a4SGeorge Wilson ddt_t *ddt = spa->spa_ddt[c]; 827b24ab676SJeff Bonwick for (enum ddt_type type = 0; type < DDT_TYPES; type++) { 828b24ab676SJeff Bonwick for (enum ddt_class class = 0; class < DDT_CLASSES; 829b24ab676SJeff Bonwick class++) { 830b24ab676SJeff Bonwick error = ddt_object_load(ddt, type, class); 831b24ab676SJeff Bonwick if (error != 0 && error != ENOENT) 832b24ab676SJeff Bonwick return (error); 833b24ab676SJeff Bonwick } 834b24ab676SJeff Bonwick } 83530f608a4SGeorge Wilson 83630f608a4SGeorge Wilson /* 83730f608a4SGeorge Wilson * Seed the cached histograms. 
83830f608a4SGeorge Wilson */ 83930f608a4SGeorge Wilson bcopy(ddt->ddt_histogram, &ddt->ddt_histogram_cache, 84030f608a4SGeorge Wilson sizeof (ddt->ddt_histogram)); 841b24ab676SJeff Bonwick } 842b24ab676SJeff Bonwick 843b24ab676SJeff Bonwick return (0); 844b24ab676SJeff Bonwick } 845b24ab676SJeff Bonwick 846b24ab676SJeff Bonwick void 847b24ab676SJeff Bonwick ddt_unload(spa_t *spa) 848b24ab676SJeff Bonwick { 849b24ab676SJeff Bonwick for (enum zio_checksum c = 0; c < ZIO_CHECKSUM_FUNCTIONS; c++) { 850b24ab676SJeff Bonwick if (spa->spa_ddt[c]) { 851b24ab676SJeff Bonwick ddt_table_free(spa->spa_ddt[c]); 852b24ab676SJeff Bonwick spa->spa_ddt[c] = NULL; 853b24ab676SJeff Bonwick } 854b24ab676SJeff Bonwick } 855b24ab676SJeff Bonwick } 856b24ab676SJeff Bonwick 857bbfd46c4SJeff Bonwick boolean_t 858bbfd46c4SJeff Bonwick ddt_class_contains(spa_t *spa, enum ddt_class max_class, const blkptr_t *bp) 859bbfd46c4SJeff Bonwick { 860bbfd46c4SJeff Bonwick ddt_t *ddt; 861bbfd46c4SJeff Bonwick ddt_entry_t dde; 862bbfd46c4SJeff Bonwick 863bbfd46c4SJeff Bonwick if (!BP_GET_DEDUP(bp)) 864bbfd46c4SJeff Bonwick return (B_FALSE); 865bbfd46c4SJeff Bonwick 866bbfd46c4SJeff Bonwick if (max_class == DDT_CLASS_UNIQUE) 867bbfd46c4SJeff Bonwick return (B_TRUE); 868bbfd46c4SJeff Bonwick 869bbfd46c4SJeff Bonwick ddt = spa->spa_ddt[BP_GET_CHECKSUM(bp)]; 870bbfd46c4SJeff Bonwick 871bbfd46c4SJeff Bonwick ddt_key_fill(&dde.dde_key, bp); 872bbfd46c4SJeff Bonwick 873bbfd46c4SJeff Bonwick for (enum ddt_type type = 0; type < DDT_TYPES; type++) 874bbfd46c4SJeff Bonwick for (enum ddt_class class = 0; class <= max_class; class++) 875bbfd46c4SJeff Bonwick if (ddt_object_lookup(ddt, type, class, &dde) == 0) 876bbfd46c4SJeff Bonwick return (B_TRUE); 877bbfd46c4SJeff Bonwick 878bbfd46c4SJeff Bonwick return (B_FALSE); 879bbfd46c4SJeff Bonwick } 880bbfd46c4SJeff Bonwick 881b24ab676SJeff Bonwick ddt_entry_t * 882b24ab676SJeff Bonwick ddt_repair_start(ddt_t *ddt, const blkptr_t *bp) 883b24ab676SJeff Bonwick { 
884b24ab676SJeff Bonwick ddt_key_t ddk; 885b24ab676SJeff Bonwick ddt_entry_t *dde; 886b24ab676SJeff Bonwick 887b24ab676SJeff Bonwick ddt_key_fill(&ddk, bp); 888b24ab676SJeff Bonwick 889b24ab676SJeff Bonwick dde = ddt_alloc(&ddk); 890b24ab676SJeff Bonwick 891b24ab676SJeff Bonwick for (enum ddt_type type = 0; type < DDT_TYPES; type++) { 892b24ab676SJeff Bonwick for (enum ddt_class class = 0; class < DDT_CLASSES; class++) { 893b24ab676SJeff Bonwick /* 894b24ab676SJeff Bonwick * We can only do repair if there are multiple copies 895b24ab676SJeff Bonwick * of the block. For anything in the UNIQUE class, 896b24ab676SJeff Bonwick * there's definitely only one copy, so don't even try. 897b24ab676SJeff Bonwick */ 898b24ab676SJeff Bonwick if (class != DDT_CLASS_UNIQUE && 899b24ab676SJeff Bonwick ddt_object_lookup(ddt, type, class, dde) == 0) 900b24ab676SJeff Bonwick return (dde); 901b24ab676SJeff Bonwick } 902b24ab676SJeff Bonwick } 903b24ab676SJeff Bonwick 904b24ab676SJeff Bonwick bzero(dde->dde_phys, sizeof (dde->dde_phys)); 905b24ab676SJeff Bonwick 906b24ab676SJeff Bonwick return (dde); 907b24ab676SJeff Bonwick } 908b24ab676SJeff Bonwick 909b24ab676SJeff Bonwick void 910b24ab676SJeff Bonwick ddt_repair_done(ddt_t *ddt, ddt_entry_t *dde) 911b24ab676SJeff Bonwick { 912b24ab676SJeff Bonwick avl_index_t where; 913b24ab676SJeff Bonwick 914b24ab676SJeff Bonwick ddt_enter(ddt); 915b24ab676SJeff Bonwick 916b24ab676SJeff Bonwick if (dde->dde_repair_data != NULL && spa_writeable(ddt->ddt_spa) && 917b24ab676SJeff Bonwick avl_find(&ddt->ddt_repair_tree, dde, &where) == NULL) 918b24ab676SJeff Bonwick avl_insert(&ddt->ddt_repair_tree, dde, where); 919b24ab676SJeff Bonwick else 920b24ab676SJeff Bonwick ddt_free(dde); 921b24ab676SJeff Bonwick 922b24ab676SJeff Bonwick ddt_exit(ddt); 923b24ab676SJeff Bonwick } 924b24ab676SJeff Bonwick 925b24ab676SJeff Bonwick static void 926b24ab676SJeff Bonwick ddt_repair_entry_done(zio_t *zio) 927b24ab676SJeff Bonwick { 928b24ab676SJeff Bonwick 
ddt_entry_t *rdde = zio->io_private; 929b24ab676SJeff Bonwick 930b24ab676SJeff Bonwick ddt_free(rdde); 931b24ab676SJeff Bonwick } 932b24ab676SJeff Bonwick 933b24ab676SJeff Bonwick static void 934b24ab676SJeff Bonwick ddt_repair_entry(ddt_t *ddt, ddt_entry_t *dde, ddt_entry_t *rdde, zio_t *rio) 935b24ab676SJeff Bonwick { 936b24ab676SJeff Bonwick ddt_phys_t *ddp = dde->dde_phys; 937b24ab676SJeff Bonwick ddt_phys_t *rddp = rdde->dde_phys; 938b24ab676SJeff Bonwick ddt_key_t *ddk = &dde->dde_key; 939b24ab676SJeff Bonwick ddt_key_t *rddk = &rdde->dde_key; 940b24ab676SJeff Bonwick zio_t *zio; 941b24ab676SJeff Bonwick blkptr_t blk; 942b24ab676SJeff Bonwick 943b24ab676SJeff Bonwick zio = zio_null(rio, rio->io_spa, NULL, 944b24ab676SJeff Bonwick ddt_repair_entry_done, rdde, rio->io_flags); 945b24ab676SJeff Bonwick 946b24ab676SJeff Bonwick for (int p = 0; p < DDT_PHYS_TYPES; p++, ddp++, rddp++) { 947b24ab676SJeff Bonwick if (ddp->ddp_phys_birth == 0 || 948b24ab676SJeff Bonwick ddp->ddp_phys_birth != rddp->ddp_phys_birth || 949b24ab676SJeff Bonwick bcmp(ddp->ddp_dva, rddp->ddp_dva, sizeof (ddp->ddp_dva))) 950b24ab676SJeff Bonwick continue; 951bbfd46c4SJeff Bonwick ddt_bp_create(ddt->ddt_checksum, ddk, ddp, &blk); 952b24ab676SJeff Bonwick zio_nowait(zio_rewrite(zio, zio->io_spa, 0, &blk, 953b24ab676SJeff Bonwick rdde->dde_repair_data, DDK_GET_PSIZE(rddk), NULL, NULL, 954b24ab676SJeff Bonwick ZIO_PRIORITY_SYNC_WRITE, ZIO_DDT_CHILD_FLAGS(zio), NULL)); 955b24ab676SJeff Bonwick } 956b24ab676SJeff Bonwick 957b24ab676SJeff Bonwick zio_nowait(zio); 958b24ab676SJeff Bonwick } 959b24ab676SJeff Bonwick 960b24ab676SJeff Bonwick static void 961b24ab676SJeff Bonwick ddt_repair_table(ddt_t *ddt, zio_t *rio) 962b24ab676SJeff Bonwick { 963b24ab676SJeff Bonwick spa_t *spa = ddt->ddt_spa; 964b24ab676SJeff Bonwick ddt_entry_t *dde, *rdde_next, *rdde; 965b24ab676SJeff Bonwick avl_tree_t *t = &ddt->ddt_repair_tree; 966b24ab676SJeff Bonwick blkptr_t blk; 967b24ab676SJeff Bonwick 968b24ab676SJeff 
Bonwick if (spa_sync_pass(spa) > 1) 969b24ab676SJeff Bonwick return; 970b24ab676SJeff Bonwick 971b24ab676SJeff Bonwick ddt_enter(ddt); 972b24ab676SJeff Bonwick for (rdde = avl_first(t); rdde != NULL; rdde = rdde_next) { 973b24ab676SJeff Bonwick rdde_next = AVL_NEXT(t, rdde); 974b24ab676SJeff Bonwick avl_remove(&ddt->ddt_repair_tree, rdde); 975b24ab676SJeff Bonwick ddt_exit(ddt); 976bbfd46c4SJeff Bonwick ddt_bp_create(ddt->ddt_checksum, &rdde->dde_key, NULL, &blk); 977b24ab676SJeff Bonwick dde = ddt_repair_start(ddt, &blk); 978b24ab676SJeff Bonwick ddt_repair_entry(ddt, dde, rdde, rio); 979b24ab676SJeff Bonwick ddt_repair_done(ddt, dde); 980b24ab676SJeff Bonwick ddt_enter(ddt); 981b24ab676SJeff Bonwick } 982b24ab676SJeff Bonwick ddt_exit(ddt); 983b24ab676SJeff Bonwick } 984b24ab676SJeff Bonwick 985b24ab676SJeff Bonwick static void 986b24ab676SJeff Bonwick ddt_sync_entry(ddt_t *ddt, ddt_entry_t *dde, dmu_tx_t *tx, uint64_t txg) 987b24ab676SJeff Bonwick { 988bbfd46c4SJeff Bonwick dsl_pool_t *dp = ddt->ddt_spa->spa_dsl_pool; 989b24ab676SJeff Bonwick ddt_phys_t *ddp = dde->dde_phys; 990b24ab676SJeff Bonwick ddt_key_t *ddk = &dde->dde_key; 991b24ab676SJeff Bonwick enum ddt_type otype = dde->dde_type; 992b24ab676SJeff Bonwick enum ddt_type ntype = DDT_TYPE_CURRENT; 993b24ab676SJeff Bonwick enum ddt_class oclass = dde->dde_class; 994b24ab676SJeff Bonwick enum ddt_class nclass; 995b24ab676SJeff Bonwick uint64_t total_refcnt = 0; 996b24ab676SJeff Bonwick 997b24ab676SJeff Bonwick ASSERT(dde->dde_loaded); 998b24ab676SJeff Bonwick ASSERT(!dde->dde_loading); 999b24ab676SJeff Bonwick 1000b24ab676SJeff Bonwick for (int p = 0; p < DDT_PHYS_TYPES; p++, ddp++) { 1001b24ab676SJeff Bonwick ASSERT(dde->dde_lead_zio[p] == NULL); 1002b24ab676SJeff Bonwick ASSERT((int64_t)ddp->ddp_refcnt >= 0); 1003b24ab676SJeff Bonwick if (ddp->ddp_phys_birth == 0) { 1004b24ab676SJeff Bonwick ASSERT(ddp->ddp_refcnt == 0); 1005b24ab676SJeff Bonwick continue; 1006b24ab676SJeff Bonwick } 1007b24ab676SJeff 
Bonwick if (p == DDT_PHYS_DITTO) { 1008b24ab676SJeff Bonwick if (ddt_ditto_copies_needed(ddt, dde, NULL) == 0) 1009b24ab676SJeff Bonwick ddt_phys_free(ddt, ddk, ddp, txg); 1010b24ab676SJeff Bonwick continue; 1011b24ab676SJeff Bonwick } 1012b24ab676SJeff Bonwick if (ddp->ddp_refcnt == 0) 1013b24ab676SJeff Bonwick ddt_phys_free(ddt, ddk, ddp, txg); 1014b24ab676SJeff Bonwick total_refcnt += ddp->ddp_refcnt; 1015b24ab676SJeff Bonwick } 1016b24ab676SJeff Bonwick 1017b24ab676SJeff Bonwick if (dde->dde_phys[DDT_PHYS_DITTO].ddp_phys_birth != 0) 1018b24ab676SJeff Bonwick nclass = DDT_CLASS_DITTO; 1019b24ab676SJeff Bonwick else if (total_refcnt > 1) 1020b24ab676SJeff Bonwick nclass = DDT_CLASS_DUPLICATE; 1021b24ab676SJeff Bonwick else 1022b24ab676SJeff Bonwick nclass = DDT_CLASS_UNIQUE; 1023b24ab676SJeff Bonwick 1024b24ab676SJeff Bonwick if (otype != DDT_TYPES && 1025b24ab676SJeff Bonwick (otype != ntype || oclass != nclass || total_refcnt == 0)) { 1026b24ab676SJeff Bonwick VERIFY(ddt_object_remove(ddt, otype, oclass, dde, tx) == 0); 1027b24ab676SJeff Bonwick ASSERT(ddt_object_lookup(ddt, otype, oclass, dde) == ENOENT); 1028b24ab676SJeff Bonwick } 1029b24ab676SJeff Bonwick 1030b24ab676SJeff Bonwick if (total_refcnt != 0) { 1031b24ab676SJeff Bonwick dde->dde_type = ntype; 1032b24ab676SJeff Bonwick dde->dde_class = nclass; 1033b24ab676SJeff Bonwick ddt_stat_update(ddt, dde, 0); 1034b24ab676SJeff Bonwick if (!ddt_object_exists(ddt, ntype, nclass)) 1035b24ab676SJeff Bonwick ddt_object_create(ddt, ntype, nclass, tx); 1036b24ab676SJeff Bonwick VERIFY(ddt_object_update(ddt, ntype, nclass, dde, tx) == 0); 1037bbfd46c4SJeff Bonwick 10383f9d6ad7SLin Ling /* 10393f9d6ad7SLin Ling * If the class changes, the order that we scan this bp 10403f9d6ad7SLin Ling * changes. If it decreases, we could miss it, so 10413f9d6ad7SLin Ling * scan it right now. (This covers both class changing 10423f9d6ad7SLin Ling * while we are doing ddt_walk(), and when we are 10433f9d6ad7SLin Ling * traversing.) 
10443f9d6ad7SLin Ling */ 10453f9d6ad7SLin Ling if (nclass < oclass) { 10463f9d6ad7SLin Ling dsl_scan_ddt_entry(dp->dp_scan, 10473f9d6ad7SLin Ling ddt->ddt_checksum, dde, tx); 10483f9d6ad7SLin Ling } 1049b24ab676SJeff Bonwick } 1050b24ab676SJeff Bonwick } 1051b24ab676SJeff Bonwick 1052b24ab676SJeff Bonwick static void 1053b24ab676SJeff Bonwick ddt_sync_table(ddt_t *ddt, dmu_tx_t *tx, uint64_t txg) 1054b24ab676SJeff Bonwick { 1055b24ab676SJeff Bonwick spa_t *spa = ddt->ddt_spa; 1056b24ab676SJeff Bonwick ddt_entry_t *dde; 1057b24ab676SJeff Bonwick void *cookie = NULL; 1058b24ab676SJeff Bonwick 1059b24ab676SJeff Bonwick if (avl_numnodes(&ddt->ddt_tree) == 0) 1060b24ab676SJeff Bonwick return; 1061b24ab676SJeff Bonwick 1062b24ab676SJeff Bonwick ASSERT(spa->spa_uberblock.ub_version >= SPA_VERSION_DEDUP); 1063b24ab676SJeff Bonwick 1064b24ab676SJeff Bonwick if (spa->spa_ddt_stat_object == 0) { 1065*ad135b5dSChristopher Siden spa->spa_ddt_stat_object = zap_create_link(ddt->ddt_os, 1066*ad135b5dSChristopher Siden DMU_OT_DDT_STATS, DMU_POOL_DIRECTORY_OBJECT, 1067*ad135b5dSChristopher Siden DMU_POOL_DDT_STATS, tx); 1068b24ab676SJeff Bonwick } 1069b24ab676SJeff Bonwick 1070b24ab676SJeff Bonwick while ((dde = avl_destroy_nodes(&ddt->ddt_tree, &cookie)) != NULL) { 1071b24ab676SJeff Bonwick ddt_sync_entry(ddt, dde, tx, txg); 1072b24ab676SJeff Bonwick ddt_free(dde); 1073b24ab676SJeff Bonwick } 1074b24ab676SJeff Bonwick 1075b24ab676SJeff Bonwick for (enum ddt_type type = 0; type < DDT_TYPES; type++) { 1076ce053c9dSGeorge Wilson uint64_t count = 0; 1077b24ab676SJeff Bonwick for (enum ddt_class class = 0; class < DDT_CLASSES; class++) { 1078ce053c9dSGeorge Wilson if (ddt_object_exists(ddt, type, class)) { 1079ce053c9dSGeorge Wilson ddt_object_sync(ddt, type, class, tx); 1080ce053c9dSGeorge Wilson count += ddt_object_count(ddt, type, class); 1081ce053c9dSGeorge Wilson } 1082ce053c9dSGeorge Wilson } 1083ce053c9dSGeorge Wilson for (enum ddt_class class = 0; class < DDT_CLASSES; class++) { 
1084ce053c9dSGeorge Wilson if (count == 0 && ddt_object_exists(ddt, type, class)) 1085b24ab676SJeff Bonwick ddt_object_destroy(ddt, type, class, tx); 1086b24ab676SJeff Bonwick } 1087b24ab676SJeff Bonwick } 108830f608a4SGeorge Wilson 108930f608a4SGeorge Wilson bcopy(ddt->ddt_histogram, &ddt->ddt_histogram_cache, 109030f608a4SGeorge Wilson sizeof (ddt->ddt_histogram)); 1091b24ab676SJeff Bonwick } 1092b24ab676SJeff Bonwick 1093b24ab676SJeff Bonwick void 1094b24ab676SJeff Bonwick ddt_sync(spa_t *spa, uint64_t txg) 1095b24ab676SJeff Bonwick { 1096b24ab676SJeff Bonwick dmu_tx_t *tx; 1097b24ab676SJeff Bonwick zio_t *rio = zio_root(spa, NULL, NULL, 1098b24ab676SJeff Bonwick ZIO_FLAG_CANFAIL | ZIO_FLAG_SPECULATIVE); 1099b24ab676SJeff Bonwick 1100b24ab676SJeff Bonwick ASSERT(spa_syncing_txg(spa) == txg); 1101b24ab676SJeff Bonwick 1102b24ab676SJeff Bonwick tx = dmu_tx_create_assigned(spa->spa_dsl_pool, txg); 1103b24ab676SJeff Bonwick 1104b24ab676SJeff Bonwick for (enum zio_checksum c = 0; c < ZIO_CHECKSUM_FUNCTIONS; c++) { 1105b24ab676SJeff Bonwick ddt_t *ddt = spa->spa_ddt[c]; 1106b24ab676SJeff Bonwick if (ddt == NULL) 1107b24ab676SJeff Bonwick continue; 1108b24ab676SJeff Bonwick ddt_sync_table(ddt, tx, txg); 1109b24ab676SJeff Bonwick ddt_repair_table(ddt, rio); 1110b24ab676SJeff Bonwick } 1111b24ab676SJeff Bonwick 1112b24ab676SJeff Bonwick (void) zio_wait(rio); 1113b24ab676SJeff Bonwick 1114b24ab676SJeff Bonwick dmu_tx_commit(tx); 1115b24ab676SJeff Bonwick } 1116bbfd46c4SJeff Bonwick 1117bbfd46c4SJeff Bonwick int 1118bbfd46c4SJeff Bonwick ddt_walk(spa_t *spa, ddt_bookmark_t *ddb, ddt_entry_t *dde) 1119bbfd46c4SJeff Bonwick { 1120bbfd46c4SJeff Bonwick do { 1121bbfd46c4SJeff Bonwick do { 1122bbfd46c4SJeff Bonwick do { 1123bbfd46c4SJeff Bonwick ddt_t *ddt = spa->spa_ddt[ddb->ddb_checksum]; 1124bbfd46c4SJeff Bonwick int error = ENOENT; 1125bbfd46c4SJeff Bonwick if (ddt_object_exists(ddt, ddb->ddb_type, 1126bbfd46c4SJeff Bonwick ddb->ddb_class)) { 1127bbfd46c4SJeff Bonwick error 
= ddt_object_walk(ddt, 1128bbfd46c4SJeff Bonwick ddb->ddb_type, ddb->ddb_class, 1129bbfd46c4SJeff Bonwick &ddb->ddb_cursor, dde); 1130bbfd46c4SJeff Bonwick } 11313f9d6ad7SLin Ling dde->dde_type = ddb->ddb_type; 11323f9d6ad7SLin Ling dde->dde_class = ddb->ddb_class; 1133bbfd46c4SJeff Bonwick if (error == 0) 1134bbfd46c4SJeff Bonwick return (0); 1135bbfd46c4SJeff Bonwick if (error != ENOENT) 1136bbfd46c4SJeff Bonwick return (error); 1137bbfd46c4SJeff Bonwick ddb->ddb_cursor = 0; 1138bbfd46c4SJeff Bonwick } while (++ddb->ddb_checksum < ZIO_CHECKSUM_FUNCTIONS); 1139bbfd46c4SJeff Bonwick ddb->ddb_checksum = 0; 1140bbfd46c4SJeff Bonwick } while (++ddb->ddb_type < DDT_TYPES); 1141bbfd46c4SJeff Bonwick ddb->ddb_type = 0; 1142bbfd46c4SJeff Bonwick } while (++ddb->ddb_class < DDT_CLASSES); 1143bbfd46c4SJeff Bonwick 1144bbfd46c4SJeff Bonwick return (ENOENT); 1145bbfd46c4SJeff Bonwick } 1146