1b24ab676SJeff Bonwick /* 2b24ab676SJeff Bonwick * CDDL HEADER START 3b24ab676SJeff Bonwick * 4b24ab676SJeff Bonwick * The contents of this file are subject to the terms of the 5b24ab676SJeff Bonwick * Common Development and Distribution License (the "License"). 6b24ab676SJeff Bonwick * You may not use this file except in compliance with the License. 7b24ab676SJeff Bonwick * 8b24ab676SJeff Bonwick * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE 9b24ab676SJeff Bonwick * or http://www.opensolaris.org/os/licensing. 10b24ab676SJeff Bonwick * See the License for the specific language governing permissions 11b24ab676SJeff Bonwick * and limitations under the License. 12b24ab676SJeff Bonwick * 13b24ab676SJeff Bonwick * When distributing Covered Code, include this CDDL HEADER in each 14b24ab676SJeff Bonwick * file and include the License file at usr/src/OPENSOLARIS.LICENSE. 15b24ab676SJeff Bonwick * If applicable, add the following below this CDDL HEADER, with the 16b24ab676SJeff Bonwick * fields enclosed by brackets "[]" replaced with your own identifying 17b24ab676SJeff Bonwick * information: Portions Copyright [yyyy] [name of copyright owner] 18b24ab676SJeff Bonwick * 19b24ab676SJeff Bonwick * CDDL HEADER END 20b24ab676SJeff Bonwick */ 21b24ab676SJeff Bonwick 22b24ab676SJeff Bonwick /* 23b24ab676SJeff Bonwick * Copyright 2009 Sun Microsystems, Inc. All rights reserved. 24b24ab676SJeff Bonwick * Use is subject to license terms. 25b24ab676SJeff Bonwick */ 26b24ab676SJeff Bonwick 27b24ab676SJeff Bonwick #include <sys/zfs_context.h> 28b24ab676SJeff Bonwick #include <sys/spa.h> 29b24ab676SJeff Bonwick #include <sys/spa_impl.h> 30b24ab676SJeff Bonwick #include <sys/zio.h> 31b24ab676SJeff Bonwick #include <sys/ddt.h> 32b24ab676SJeff Bonwick #include <sys/zap.h> 33b24ab676SJeff Bonwick #include <sys/dmu_tx.h> 34b24ab676SJeff Bonwick #include <sys/arc.h> 35*bbfd46c4SJeff Bonwick #include <sys/dsl_pool.h> 36b24ab676SJeff Bonwick #include <sys/zio_checksum.h> 37b24ab676SJeff Bonwick #include <sys/zio_compress.h> 38b24ab676SJeff Bonwick 39b24ab676SJeff Bonwick static const ddt_ops_t *ddt_ops[DDT_TYPES] = { 40b24ab676SJeff Bonwick &ddt_zap_ops, 41b24ab676SJeff Bonwick }; 42b24ab676SJeff Bonwick 43b24ab676SJeff Bonwick static const char *ddt_class_name[DDT_CLASSES] = { 44b24ab676SJeff Bonwick "ditto", 45b24ab676SJeff Bonwick "duplicate", 46b24ab676SJeff Bonwick "unique", 47b24ab676SJeff Bonwick }; 48b24ab676SJeff Bonwick 49b24ab676SJeff Bonwick static void 50b24ab676SJeff Bonwick ddt_object_create(ddt_t *ddt, enum ddt_type type, enum ddt_class class, 51b24ab676SJeff Bonwick dmu_tx_t *tx) 52b24ab676SJeff Bonwick { 53b24ab676SJeff Bonwick spa_t *spa = ddt->ddt_spa; 54b24ab676SJeff Bonwick objset_t *os = ddt->ddt_os; 55b24ab676SJeff Bonwick uint64_t *objectp = &ddt->ddt_object[type][class]; 56b24ab676SJeff Bonwick boolean_t prehash = zio_checksum_table[ddt->ddt_checksum].ci_dedup; 57b24ab676SJeff Bonwick char name[DDT_NAMELEN]; 58b24ab676SJeff Bonwick 59b24ab676SJeff Bonwick ddt_object_name(ddt, type, class, name); 60b24ab676SJeff Bonwick 61b24ab676SJeff Bonwick ASSERT(*objectp == 0); 62b24ab676SJeff Bonwick VERIFY(ddt_ops[type]->ddt_op_create(os, objectp, tx, prehash) == 0); 63b24ab676SJeff Bonwick ASSERT(*objectp != 0); 64b24ab676SJeff Bonwick 65b24ab676SJeff Bonwick VERIFY(zap_add(os, DMU_POOL_DIRECTORY_OBJECT, name, 66b24ab676SJeff Bonwick sizeof (uint64_t), 1, objectp, tx) == 0); 67b24ab676SJeff Bonwick 68b24ab676SJeff Bonwick VERIFY(zap_add(os, spa->spa_ddt_stat_object, name, 69b24ab676SJeff Bonwick sizeof (uint64_t), sizeof (ddt_histogram_t) / sizeof (uint64_t), 70b24ab676SJeff Bonwick &ddt->ddt_histogram[type][class], tx) == 0); 71b24ab676SJeff Bonwick } 72b24ab676SJeff Bonwick 73b24ab676SJeff Bonwick static void 74b24ab676SJeff Bonwick ddt_object_destroy(ddt_t *ddt, enum ddt_type type, enum ddt_class class, 75b24ab676SJeff Bonwick dmu_tx_t *tx) 76b24ab676SJeff Bonwick { 77b24ab676SJeff Bonwick spa_t *spa = ddt->ddt_spa; 78b24ab676SJeff Bonwick objset_t *os = ddt->ddt_os; 79b24ab676SJeff Bonwick uint64_t *objectp = &ddt->ddt_object[type][class]; 80b24ab676SJeff Bonwick char name[DDT_NAMELEN]; 81b24ab676SJeff Bonwick 82b24ab676SJeff Bonwick ddt_object_name(ddt, type, class, name); 83b24ab676SJeff Bonwick 84b24ab676SJeff Bonwick ASSERT(*objectp != 0); 85b24ab676SJeff Bonwick ASSERT(ddt_object_count(ddt, type, class) == 0); 86b24ab676SJeff Bonwick ASSERT(ddt_histogram_empty(&ddt->ddt_histogram[type][class])); 87b24ab676SJeff Bonwick VERIFY(zap_remove(os, DMU_POOL_DIRECTORY_OBJECT, name, tx) == 0); 88b24ab676SJeff Bonwick VERIFY(zap_remove(os, spa->spa_ddt_stat_object, name, tx) == 0); 89b24ab676SJeff Bonwick VERIFY(ddt_ops[type]->ddt_op_destroy(os, *objectp, tx) == 0); 90b24ab676SJeff Bonwick 91b24ab676SJeff Bonwick *objectp = 0; 92b24ab676SJeff Bonwick } 93b24ab676SJeff Bonwick 94b24ab676SJeff Bonwick static int 95b24ab676SJeff Bonwick ddt_object_load(ddt_t *ddt, enum ddt_type type, enum ddt_class class) 96b24ab676SJeff Bonwick { 97b24ab676SJeff Bonwick char name[DDT_NAMELEN]; 98b24ab676SJeff Bonwick int error; 99b24ab676SJeff Bonwick 100b24ab676SJeff Bonwick ddt_object_name(ddt, type, class, name); 101b24ab676SJeff Bonwick 102b24ab676SJeff Bonwick error = zap_lookup(ddt->ddt_os, DMU_POOL_DIRECTORY_OBJECT, name, 103b24ab676SJeff Bonwick sizeof (uint64_t), 1, &ddt->ddt_object[type][class]); 104b24ab676SJeff Bonwick 105b24ab676SJeff Bonwick if (error) 106b24ab676SJeff Bonwick return (error); 107b24ab676SJeff Bonwick 108b24ab676SJeff Bonwick error = zap_lookup(ddt->ddt_os, ddt->ddt_spa->spa_ddt_stat_object, name, 109b24ab676SJeff Bonwick sizeof (uint64_t), sizeof (ddt_histogram_t) / sizeof (uint64_t), 110b24ab676SJeff Bonwick &ddt->ddt_histogram[type][class]); 111b24ab676SJeff Bonwick 112b24ab676SJeff Bonwick ASSERT(error == 0); 113b24ab676SJeff Bonwick return (error); 114b24ab676SJeff Bonwick } 115b24ab676SJeff Bonwick 116b24ab676SJeff Bonwick static void 117b24ab676SJeff Bonwick ddt_object_sync(ddt_t *ddt, enum ddt_type type, enum ddt_class class, 118b24ab676SJeff Bonwick dmu_tx_t *tx) 119b24ab676SJeff Bonwick { 120b24ab676SJeff Bonwick char name[DDT_NAMELEN]; 121b24ab676SJeff Bonwick 122b24ab676SJeff Bonwick ddt_object_name(ddt, type, class, name); 123b24ab676SJeff Bonwick 124b24ab676SJeff Bonwick VERIFY(zap_update(ddt->ddt_os, ddt->ddt_spa->spa_ddt_stat_object, name, 125b24ab676SJeff Bonwick sizeof (uint64_t), sizeof (ddt_histogram_t) / sizeof (uint64_t), 126b24ab676SJeff Bonwick &ddt->ddt_histogram[type][class], tx) == 0); 127b24ab676SJeff Bonwick } 128b24ab676SJeff Bonwick 129b24ab676SJeff Bonwick static int 130b24ab676SJeff Bonwick ddt_object_lookup(ddt_t *ddt, enum ddt_type type, enum ddt_class class, 131b24ab676SJeff Bonwick ddt_entry_t *dde) 132b24ab676SJeff Bonwick { 133b24ab676SJeff Bonwick if (!ddt_object_exists(ddt, type, class)) 134b24ab676SJeff Bonwick return (ENOENT); 135b24ab676SJeff Bonwick 136b24ab676SJeff Bonwick return (ddt_ops[type]->ddt_op_lookup(ddt->ddt_os, 137b24ab676SJeff Bonwick ddt->ddt_object[type][class], dde)); 138b24ab676SJeff Bonwick } 139b24ab676SJeff Bonwick 140b24ab676SJeff Bonwick static int 141b24ab676SJeff Bonwick ddt_object_update(ddt_t *ddt, enum ddt_type type, enum ddt_class class, 142b24ab676SJeff Bonwick ddt_entry_t *dde, dmu_tx_t *tx) 143b24ab676SJeff Bonwick { 144b24ab676SJeff Bonwick ASSERT(ddt_object_exists(ddt, type, class)); 145b24ab676SJeff Bonwick 146b24ab676SJeff Bonwick return (ddt_ops[type]->ddt_op_update(ddt->ddt_os, 147b24ab676SJeff Bonwick ddt->ddt_object[type][class], dde, tx)); 148b24ab676SJeff Bonwick } 149b24ab676SJeff Bonwick 150b24ab676SJeff Bonwick static int 151b24ab676SJeff Bonwick ddt_object_remove(ddt_t *ddt, enum ddt_type type, enum ddt_class class, 152b24ab676SJeff Bonwick ddt_entry_t *dde, dmu_tx_t *tx) 153b24ab676SJeff Bonwick { 154b24ab676SJeff Bonwick ASSERT(ddt_object_exists(ddt, type, class)); 155b24ab676SJeff Bonwick 156b24ab676SJeff Bonwick return (ddt_ops[type]->ddt_op_remove(ddt->ddt_os, 157b24ab676SJeff Bonwick ddt->ddt_object[type][class], dde, tx)); 158b24ab676SJeff Bonwick } 159b24ab676SJeff Bonwick 160b24ab676SJeff Bonwick int 161b24ab676SJeff Bonwick ddt_object_walk(ddt_t *ddt, enum ddt_type type, enum ddt_class class, 162*bbfd46c4SJeff Bonwick uint64_t *walk, ddt_entry_t *dde) 163b24ab676SJeff Bonwick { 164b24ab676SJeff Bonwick ASSERT(ddt_object_exists(ddt, type, class)); 165b24ab676SJeff Bonwick 166b24ab676SJeff Bonwick return (ddt_ops[type]->ddt_op_walk(ddt->ddt_os, 167b24ab676SJeff Bonwick ddt->ddt_object[type][class], dde, walk)); 168b24ab676SJeff Bonwick } 169b24ab676SJeff Bonwick 170b24ab676SJeff Bonwick uint64_t 171b24ab676SJeff Bonwick ddt_object_count(ddt_t *ddt, enum ddt_type type, enum ddt_class class) 172b24ab676SJeff Bonwick { 173b24ab676SJeff Bonwick ASSERT(ddt_object_exists(ddt, type, class)); 174b24ab676SJeff Bonwick 175b24ab676SJeff Bonwick return (ddt_ops[type]->ddt_op_count(ddt->ddt_os, 176b24ab676SJeff Bonwick ddt->ddt_object[type][class])); 177b24ab676SJeff Bonwick } 178b24ab676SJeff Bonwick 179b24ab676SJeff Bonwick int 180b24ab676SJeff Bonwick ddt_object_info(ddt_t *ddt, enum ddt_type type, enum ddt_class class, 181b24ab676SJeff Bonwick dmu_object_info_t *doi) 182b24ab676SJeff Bonwick { 183b24ab676SJeff Bonwick if (!ddt_object_exists(ddt, type, class)) 184b24ab676SJeff Bonwick return (ENOENT); 185b24ab676SJeff Bonwick 186b24ab676SJeff Bonwick return (dmu_object_info(ddt->ddt_os, ddt->ddt_object[type][class], 187b24ab676SJeff Bonwick doi)); 188b24ab676SJeff Bonwick } 189b24ab676SJeff Bonwick 190b24ab676SJeff Bonwick boolean_t 191b24ab676SJeff Bonwick ddt_object_exists(ddt_t *ddt, enum ddt_type type, enum ddt_class class) 192b24ab676SJeff Bonwick { 193b24ab676SJeff Bonwick return (!!ddt->ddt_object[type][class]); 194b24ab676SJeff Bonwick } 195b24ab676SJeff Bonwick 196b24ab676SJeff Bonwick void 197b24ab676SJeff Bonwick ddt_object_name(ddt_t *ddt, enum ddt_type type, enum ddt_class class, 198b24ab676SJeff Bonwick char *name) 199b24ab676SJeff Bonwick { 200b24ab676SJeff Bonwick (void) sprintf(name, DMU_POOL_DDT, 201b24ab676SJeff Bonwick zio_checksum_table[ddt->ddt_checksum].ci_name, 202b24ab676SJeff Bonwick ddt_ops[type]->ddt_op_name, ddt_class_name[class]); 203b24ab676SJeff Bonwick } 204b24ab676SJeff Bonwick 205b24ab676SJeff Bonwick void 206b24ab676SJeff Bonwick ddt_bp_fill(const ddt_phys_t *ddp, blkptr_t *bp, uint64_t txg) 207b24ab676SJeff Bonwick { 208b24ab676SJeff Bonwick ASSERT(txg != 0); 209b24ab676SJeff Bonwick 210b24ab676SJeff Bonwick for (int d = 0; d < SPA_DVAS_PER_BP; d++) 211b24ab676SJeff Bonwick bp->blk_dva[d] = ddp->ddp_dva[d]; 212b24ab676SJeff Bonwick BP_SET_BIRTH(bp, txg, ddp->ddp_phys_birth); 213b24ab676SJeff Bonwick } 214b24ab676SJeff Bonwick 215b24ab676SJeff Bonwick void 216*bbfd46c4SJeff Bonwick ddt_bp_create(enum zio_checksum checksum, 217*bbfd46c4SJeff Bonwick const ddt_key_t *ddk, const ddt_phys_t *ddp, blkptr_t *bp) 218b24ab676SJeff Bonwick { 219b24ab676SJeff Bonwick BP_ZERO(bp); 220b24ab676SJeff Bonwick 221b24ab676SJeff Bonwick if (ddp != NULL) 222b24ab676SJeff Bonwick ddt_bp_fill(ddp, bp, ddp->ddp_phys_birth); 223b24ab676SJeff Bonwick 224b24ab676SJeff Bonwick bp->blk_cksum = ddk->ddk_cksum; 225b24ab676SJeff Bonwick 226b24ab676SJeff Bonwick BP_SET_LSIZE(bp, DDK_GET_LSIZE(ddk)); 227b24ab676SJeff Bonwick BP_SET_PSIZE(bp, DDK_GET_PSIZE(ddk)); 228b24ab676SJeff Bonwick BP_SET_COMPRESS(bp, DDK_GET_COMPRESS(ddk)); 229*bbfd46c4SJeff Bonwick BP_SET_CHECKSUM(bp, checksum); 230b24ab676SJeff Bonwick BP_SET_TYPE(bp, DMU_OT_NONE); 231b24ab676SJeff Bonwick BP_SET_LEVEL(bp, 0); 232b24ab676SJeff Bonwick BP_SET_DEDUP(bp, 0); 233b24ab676SJeff Bonwick BP_SET_BYTEORDER(bp, ZFS_HOST_BYTEORDER); 234b24ab676SJeff Bonwick } 235b24ab676SJeff Bonwick 236b24ab676SJeff Bonwick void 237b24ab676SJeff Bonwick ddt_key_fill(ddt_key_t *ddk, const blkptr_t *bp) 238b24ab676SJeff Bonwick { 239b24ab676SJeff Bonwick ddk->ddk_cksum = bp->blk_cksum; 240b24ab676SJeff Bonwick ddk->ddk_prop = 0; 241b24ab676SJeff Bonwick 242b24ab676SJeff Bonwick DDK_SET_LSIZE(ddk, BP_GET_LSIZE(bp)); 243b24ab676SJeff Bonwick DDK_SET_PSIZE(ddk, BP_GET_PSIZE(bp)); 244b24ab676SJeff Bonwick DDK_SET_COMPRESS(ddk, BP_GET_COMPRESS(bp)); 245b24ab676SJeff Bonwick } 246b24ab676SJeff Bonwick 247b24ab676SJeff Bonwick void 248b24ab676SJeff Bonwick ddt_phys_fill(ddt_phys_t *ddp, const blkptr_t *bp) 249b24ab676SJeff Bonwick { 250b24ab676SJeff Bonwick ASSERT(ddp->ddp_phys_birth == 0); 251b24ab676SJeff Bonwick 252b24ab676SJeff Bonwick for (int d = 0; d < SPA_DVAS_PER_BP; d++) 253b24ab676SJeff Bonwick ddp->ddp_dva[d] = bp->blk_dva[d]; 254b24ab676SJeff Bonwick ddp->ddp_phys_birth = BP_PHYSICAL_BIRTH(bp); 255b24ab676SJeff Bonwick } 256b24ab676SJeff Bonwick 257b24ab676SJeff Bonwick void 258b24ab676SJeff Bonwick ddt_phys_clear(ddt_phys_t *ddp) 259b24ab676SJeff Bonwick { 260b24ab676SJeff Bonwick bzero(ddp, sizeof (*ddp)); 261b24ab676SJeff Bonwick } 262b24ab676SJeff Bonwick 263b24ab676SJeff Bonwick void 264b24ab676SJeff Bonwick ddt_phys_addref(ddt_phys_t *ddp) 265b24ab676SJeff Bonwick { 266b24ab676SJeff Bonwick ddp->ddp_refcnt++; 267b24ab676SJeff Bonwick } 268b24ab676SJeff Bonwick 269b24ab676SJeff Bonwick void 270b24ab676SJeff Bonwick ddt_phys_decref(ddt_phys_t *ddp) 271b24ab676SJeff Bonwick { 272b24ab676SJeff Bonwick ASSERT((int64_t)ddp->ddp_refcnt > 0); 273b24ab676SJeff Bonwick ddp->ddp_refcnt--; 274b24ab676SJeff Bonwick } 275b24ab676SJeff Bonwick 276b24ab676SJeff Bonwick void 277b24ab676SJeff Bonwick ddt_phys_free(ddt_t *ddt, ddt_key_t *ddk, ddt_phys_t *ddp, uint64_t txg) 278b24ab676SJeff Bonwick { 279b24ab676SJeff Bonwick blkptr_t blk; 280b24ab676SJeff Bonwick 281*bbfd46c4SJeff Bonwick ddt_bp_create(ddt->ddt_checksum, ddk, ddp, &blk); 282b24ab676SJeff Bonwick ddt_phys_clear(ddp); 283b24ab676SJeff Bonwick zio_free(ddt->ddt_spa, txg, &blk); 284b24ab676SJeff Bonwick } 285b24ab676SJeff Bonwick 286b24ab676SJeff Bonwick ddt_phys_t * 287b24ab676SJeff Bonwick ddt_phys_select(const ddt_entry_t *dde, const blkptr_t *bp) 288b24ab676SJeff Bonwick { 289b24ab676SJeff Bonwick ddt_phys_t *ddp = (ddt_phys_t *)dde->dde_phys; 290b24ab676SJeff Bonwick 291b24ab676SJeff Bonwick for (int p = 0; p < DDT_PHYS_TYPES; p++, ddp++) { 292b24ab676SJeff Bonwick if (DVA_EQUAL(BP_IDENTITY(bp), &ddp->ddp_dva[0]) && 293b24ab676SJeff Bonwick BP_PHYSICAL_BIRTH(bp) == ddp->ddp_phys_birth) 294b24ab676SJeff Bonwick return (ddp); 295b24ab676SJeff Bonwick } 296b24ab676SJeff Bonwick return (NULL); 297b24ab676SJeff Bonwick } 298b24ab676SJeff Bonwick 299b24ab676SJeff Bonwick uint64_t 300b24ab676SJeff Bonwick ddt_phys_total_refcnt(const ddt_entry_t *dde) 301b24ab676SJeff Bonwick { 302b24ab676SJeff Bonwick uint64_t refcnt = 0; 303b24ab676SJeff Bonwick 304b24ab676SJeff Bonwick for (int p = DDT_PHYS_SINGLE; p <= DDT_PHYS_TRIPLE; p++) 305b24ab676SJeff Bonwick refcnt += dde->dde_phys[p].ddp_refcnt; 306b24ab676SJeff Bonwick 307b24ab676SJeff Bonwick return (refcnt); 308b24ab676SJeff Bonwick } 309b24ab676SJeff Bonwick 310b24ab676SJeff Bonwick static void 311b24ab676SJeff Bonwick ddt_stat_generate(ddt_t *ddt, ddt_entry_t *dde, ddt_stat_t *dds) 312b24ab676SJeff Bonwick { 313b24ab676SJeff Bonwick spa_t *spa = ddt->ddt_spa; 314b24ab676SJeff Bonwick ddt_phys_t *ddp = dde->dde_phys; 315b24ab676SJeff Bonwick ddt_key_t *ddk = &dde->dde_key; 316b24ab676SJeff Bonwick uint64_t lsize = DDK_GET_LSIZE(ddk); 317b24ab676SJeff Bonwick uint64_t psize = DDK_GET_PSIZE(ddk); 318b24ab676SJeff Bonwick 319b24ab676SJeff Bonwick bzero(dds, sizeof (*dds)); 320b24ab676SJeff Bonwick 321b24ab676SJeff Bonwick for (int p = 0; p < DDT_PHYS_TYPES; p++, ddp++) { 322b24ab676SJeff Bonwick uint64_t dsize = 0; 323b24ab676SJeff Bonwick uint64_t refcnt = ddp->ddp_refcnt; 324b24ab676SJeff Bonwick 325b24ab676SJeff Bonwick if (ddp->ddp_phys_birth == 0) 326b24ab676SJeff Bonwick continue; 327b24ab676SJeff Bonwick 328b24ab676SJeff Bonwick for (int d = 0; d < SPA_DVAS_PER_BP; d++) 329b24ab676SJeff Bonwick dsize += dva_get_dsize_sync(spa, &ddp->ddp_dva[d]); 330b24ab676SJeff Bonwick 331b24ab676SJeff Bonwick dds->dds_blocks += 1; 332b24ab676SJeff Bonwick dds->dds_lsize += lsize; 333b24ab676SJeff Bonwick dds->dds_psize += psize; 334b24ab676SJeff Bonwick dds->dds_dsize += dsize; 335b24ab676SJeff Bonwick 336b24ab676SJeff Bonwick dds->dds_ref_blocks += refcnt; 337b24ab676SJeff Bonwick dds->dds_ref_lsize += lsize * refcnt; 338b24ab676SJeff Bonwick dds->dds_ref_psize += psize * refcnt; 339b24ab676SJeff Bonwick dds->dds_ref_dsize += dsize * refcnt; 340b24ab676SJeff Bonwick } 341b24ab676SJeff Bonwick } 342b24ab676SJeff Bonwick 343b24ab676SJeff Bonwick void 344b24ab676SJeff Bonwick ddt_stat_add(ddt_stat_t *dst, const ddt_stat_t *src, uint64_t neg) 345b24ab676SJeff Bonwick { 346b24ab676SJeff Bonwick const uint64_t *s = (const uint64_t *)src; 347b24ab676SJeff Bonwick uint64_t *d = (uint64_t *)dst; 348b24ab676SJeff Bonwick uint64_t *d_end = (uint64_t *)(dst + 1); 349b24ab676SJeff Bonwick 350b24ab676SJeff Bonwick ASSERT(neg == 0 || neg == -1ULL); /* add or subtract */ 351b24ab676SJeff Bonwick 352b24ab676SJeff Bonwick while (d < d_end) 353b24ab676SJeff Bonwick *d++ += (*s++ ^ neg) - neg; 354b24ab676SJeff Bonwick } 355b24ab676SJeff Bonwick 356b24ab676SJeff Bonwick static void 357b24ab676SJeff Bonwick ddt_stat_update(ddt_t *ddt, ddt_entry_t *dde, uint64_t neg) 358b24ab676SJeff Bonwick { 359b24ab676SJeff Bonwick ddt_stat_t dds; 360b24ab676SJeff Bonwick ddt_histogram_t *ddh; 361b24ab676SJeff Bonwick int bucket; 362b24ab676SJeff Bonwick 363b24ab676SJeff Bonwick ddt_stat_generate(ddt, dde, &dds); 364b24ab676SJeff Bonwick 365b24ab676SJeff Bonwick bucket = highbit(dds.dds_ref_blocks) - 1; 366b24ab676SJeff Bonwick ASSERT(bucket >= 0); 367b24ab676SJeff Bonwick 368b24ab676SJeff Bonwick ddh = &ddt->ddt_histogram[dde->dde_type][dde->dde_class]; 369b24ab676SJeff Bonwick 370b24ab676SJeff Bonwick ddt_stat_add(&ddh->ddh_stat[bucket], &dds, neg); 371b24ab676SJeff Bonwick } 372b24ab676SJeff Bonwick 373b24ab676SJeff Bonwick void 374b24ab676SJeff Bonwick ddt_histogram_add(ddt_histogram_t *dst, const ddt_histogram_t *src) 375b24ab676SJeff Bonwick { 376b24ab676SJeff Bonwick for (int h = 0; h < 64; h++) 377b24ab676SJeff Bonwick ddt_stat_add(&dst->ddh_stat[h], &src->ddh_stat[h], 0); 378b24ab676SJeff Bonwick } 379b24ab676SJeff Bonwick 380b24ab676SJeff Bonwick void 381b24ab676SJeff Bonwick ddt_histogram_stat(ddt_stat_t *dds, const ddt_histogram_t *ddh) 382b24ab676SJeff Bonwick { 383b24ab676SJeff Bonwick bzero(dds, sizeof (*dds)); 384b24ab676SJeff Bonwick 385b24ab676SJeff Bonwick for (int h = 0; h < 64; h++) 386b24ab676SJeff Bonwick ddt_stat_add(dds, &ddh->ddh_stat[h], 0); 387b24ab676SJeff Bonwick } 388b24ab676SJeff Bonwick 389b24ab676SJeff Bonwick boolean_t 390b24ab676SJeff Bonwick ddt_histogram_empty(const ddt_histogram_t *ddh) 391b24ab676SJeff Bonwick { 392b24ab676SJeff Bonwick const uint64_t *s = (const uint64_t *)ddh; 393b24ab676SJeff Bonwick const uint64_t *s_end = (const uint64_t *)(ddh + 1); 394b24ab676SJeff Bonwick 395b24ab676SJeff Bonwick while (s < s_end) 396b24ab676SJeff Bonwick if (*s++ != 0) 397b24ab676SJeff Bonwick return (B_FALSE); 398b24ab676SJeff Bonwick 399b24ab676SJeff Bonwick return (B_TRUE); 400b24ab676SJeff Bonwick } 401b24ab676SJeff Bonwick 402485bbbf5SGeorge Wilson static void 403485bbbf5SGeorge Wilson ddt_get_dedup_stats(spa_t *spa, ddt_stat_t *dds_total) 404b24ab676SJeff Bonwick { 405b24ab676SJeff Bonwick ddt_histogram_t ddh_total = { 0 }; 406b24ab676SJeff Bonwick 407b24ab676SJeff Bonwick for (enum zio_checksum c = 0; c < ZIO_CHECKSUM_FUNCTIONS; c++) { 408b24ab676SJeff Bonwick ddt_t *ddt = spa->spa_ddt[c]; 409b24ab676SJeff Bonwick for (enum ddt_type type = 0; type < DDT_TYPES; type++) { 410b24ab676SJeff Bonwick for (enum ddt_class class = 0; class < DDT_CLASSES; 411b24ab676SJeff Bonwick class++) { 412b24ab676SJeff Bonwick ddt_histogram_add(&ddh_total, 413b24ab676SJeff Bonwick &ddt->ddt_histogram[type][class]); 414b24ab676SJeff Bonwick } 415b24ab676SJeff Bonwick } 416b24ab676SJeff Bonwick } 417b24ab676SJeff Bonwick 418485bbbf5SGeorge Wilson ddt_histogram_stat(dds_total, &ddh_total); 419485bbbf5SGeorge Wilson } 420485bbbf5SGeorge Wilson 421485bbbf5SGeorge Wilson uint64_t 422485bbbf5SGeorge Wilson ddt_get_dedup_dspace(spa_t *spa) 423485bbbf5SGeorge Wilson { 424485bbbf5SGeorge Wilson ddt_stat_t dds_total = { 0 }; 425485bbbf5SGeorge Wilson 426485bbbf5SGeorge Wilson ddt_get_dedup_stats(spa, &dds_total); 427485bbbf5SGeorge Wilson return (dds_total.dds_ref_dsize - dds_total.dds_dsize); 428485bbbf5SGeorge Wilson } 429485bbbf5SGeorge Wilson 430485bbbf5SGeorge Wilson uint64_t 431485bbbf5SGeorge Wilson ddt_get_pool_dedup_ratio(spa_t *spa) 432485bbbf5SGeorge Wilson { 433485bbbf5SGeorge Wilson ddt_stat_t dds_total = { 0 }; 434b24ab676SJeff Bonwick 435485bbbf5SGeorge Wilson ddt_get_dedup_stats(spa, &dds_total); 436b24ab676SJeff Bonwick if (dds_total.dds_dsize == 0) 437b24ab676SJeff Bonwick return (100); 438b24ab676SJeff Bonwick 439b24ab676SJeff Bonwick return (dds_total.dds_ref_dsize * 100 / dds_total.dds_dsize); 440b24ab676SJeff Bonwick } 441b24ab676SJeff Bonwick 442b24ab676SJeff Bonwick int 443b24ab676SJeff Bonwick ddt_ditto_copies_needed(ddt_t *ddt, ddt_entry_t *dde, ddt_phys_t *ddp_willref) 444b24ab676SJeff Bonwick { 445b24ab676SJeff Bonwick spa_t *spa = ddt->ddt_spa; 446b24ab676SJeff Bonwick uint64_t total_refcnt = 0; 447b24ab676SJeff Bonwick uint64_t ditto = spa->spa_dedup_ditto; 448b24ab676SJeff Bonwick int total_copies = 0; 449b24ab676SJeff Bonwick int desired_copies = 0; 450b24ab676SJeff Bonwick 451b24ab676SJeff Bonwick for (int p = DDT_PHYS_SINGLE; p <= DDT_PHYS_TRIPLE; p++) { 452b24ab676SJeff Bonwick ddt_phys_t *ddp = &dde->dde_phys[p]; 453b24ab676SJeff Bonwick zio_t *zio = dde->dde_lead_zio[p]; 454b24ab676SJeff Bonwick uint64_t refcnt = ddp->ddp_refcnt; /* committed refs */ 455b24ab676SJeff Bonwick if (zio != NULL) 456b24ab676SJeff Bonwick refcnt += zio->io_parent_count; /* pending refs */ 457b24ab676SJeff Bonwick if (ddp == ddp_willref) 458b24ab676SJeff Bonwick refcnt++; /* caller's ref */ 459b24ab676SJeff Bonwick if (refcnt != 0) { 460b24ab676SJeff Bonwick total_refcnt += refcnt; 461b24ab676SJeff Bonwick total_copies += p; 462b24ab676SJeff Bonwick } 463b24ab676SJeff Bonwick } 464b24ab676SJeff Bonwick 465b24ab676SJeff Bonwick if (ditto == 0 || ditto > UINT32_MAX) 466b24ab676SJeff Bonwick ditto = UINT32_MAX; 467b24ab676SJeff Bonwick 468b24ab676SJeff Bonwick if (total_refcnt >= 1) 469b24ab676SJeff Bonwick desired_copies++; 470b24ab676SJeff Bonwick if (total_refcnt >= ditto) 471b24ab676SJeff Bonwick desired_copies++; 472b24ab676SJeff Bonwick if (total_refcnt >= ditto * ditto) 473b24ab676SJeff Bonwick desired_copies++; 474b24ab676SJeff Bonwick 475b24ab676SJeff Bonwick return (MAX(desired_copies, total_copies) - total_copies); 476b24ab676SJeff Bonwick } 477b24ab676SJeff Bonwick 478b24ab676SJeff Bonwick int 479b24ab676SJeff Bonwick ddt_ditto_copies_present(ddt_entry_t *dde) 480b24ab676SJeff Bonwick { 481b24ab676SJeff Bonwick ddt_phys_t *ddp = &dde->dde_phys[DDT_PHYS_DITTO]; 482b24ab676SJeff Bonwick dva_t *dva = ddp->ddp_dva; 483b24ab676SJeff Bonwick int copies = 0 - DVA_GET_GANG(dva); 484b24ab676SJeff Bonwick 485b24ab676SJeff Bonwick for (int d = 0; d < SPA_DVAS_PER_BP; d++, dva++) 486b24ab676SJeff Bonwick if (DVA_IS_VALID(dva)) 487b24ab676SJeff Bonwick copies++; 488b24ab676SJeff Bonwick 489b24ab676SJeff Bonwick ASSERT(copies >= 0 && copies < SPA_DVAS_PER_BP); 490b24ab676SJeff Bonwick 491b24ab676SJeff Bonwick return (copies); 492b24ab676SJeff Bonwick } 493b24ab676SJeff Bonwick 494b24ab676SJeff Bonwick size_t 495b24ab676SJeff Bonwick ddt_compress(void *src, uchar_t *dst, size_t s_len, size_t d_len) 496b24ab676SJeff Bonwick { 497b24ab676SJeff Bonwick uchar_t *version = dst++; 498b24ab676SJeff Bonwick int cpfunc = ZIO_COMPRESS_ZLE; 499b24ab676SJeff Bonwick zio_compress_info_t *ci = &zio_compress_table[cpfunc]; 500b24ab676SJeff Bonwick size_t c_len; 501b24ab676SJeff Bonwick 502b24ab676SJeff Bonwick ASSERT(d_len >= s_len + 1); /* no compression plus version byte */ 503b24ab676SJeff Bonwick 504b24ab676SJeff Bonwick c_len = ci->ci_compress(src, dst, s_len, d_len - 1, ci->ci_level); 505b24ab676SJeff Bonwick 506b24ab676SJeff Bonwick if (c_len == s_len) { 507b24ab676SJeff Bonwick cpfunc = ZIO_COMPRESS_OFF; 508b24ab676SJeff Bonwick bcopy(src, dst, s_len); 509b24ab676SJeff Bonwick } 510b24ab676SJeff Bonwick 511b24ab676SJeff Bonwick *version = (ZFS_HOST_BYTEORDER & DDT_COMPRESS_BYTEORDER_MASK) | cpfunc; 512b24ab676SJeff Bonwick 513b24ab676SJeff Bonwick return (c_len + 1); 514b24ab676SJeff Bonwick } 515b24ab676SJeff Bonwick 516b24ab676SJeff Bonwick void 517b24ab676SJeff Bonwick ddt_decompress(uchar_t *src, void *dst, size_t s_len, size_t d_len) 518b24ab676SJeff Bonwick { 519b24ab676SJeff Bonwick uchar_t version = *src++; 520b24ab676SJeff Bonwick int cpfunc = version & DDT_COMPRESS_FUNCTION_MASK; 521b24ab676SJeff Bonwick zio_compress_info_t *ci = &zio_compress_table[cpfunc]; 522b24ab676SJeff Bonwick 523b24ab676SJeff Bonwick if (ci->ci_decompress != NULL) 524b24ab676SJeff Bonwick (void) ci->ci_decompress(src, dst, s_len, d_len, ci->ci_level); 525b24ab676SJeff Bonwick else 526b24ab676SJeff Bonwick bcopy(src, dst, d_len); 527b24ab676SJeff Bonwick 528b24ab676SJeff Bonwick if ((version ^ ZFS_HOST_BYTEORDER) & DDT_COMPRESS_BYTEORDER_MASK) 529b24ab676SJeff Bonwick byteswap_uint64_array(dst, d_len); 530b24ab676SJeff Bonwick } 531b24ab676SJeff Bonwick 532b24ab676SJeff Bonwick ddt_t * 533b24ab676SJeff Bonwick ddt_select_by_checksum(spa_t *spa, enum zio_checksum c) 534b24ab676SJeff Bonwick { 535b24ab676SJeff Bonwick return (spa->spa_ddt[c]); 536b24ab676SJeff Bonwick } 537b24ab676SJeff Bonwick 538b24ab676SJeff Bonwick ddt_t * 539b24ab676SJeff Bonwick ddt_select(spa_t *spa, const blkptr_t *bp) 540b24ab676SJeff Bonwick { 541b24ab676SJeff Bonwick return (spa->spa_ddt[BP_GET_CHECKSUM(bp)]); 542b24ab676SJeff Bonwick } 543b24ab676SJeff Bonwick 544b24ab676SJeff Bonwick void 545b24ab676SJeff Bonwick ddt_enter(ddt_t *ddt) 546b24ab676SJeff Bonwick { 547b24ab676SJeff Bonwick mutex_enter(&ddt->ddt_lock); 548b24ab676SJeff Bonwick } 549b24ab676SJeff Bonwick 550b24ab676SJeff Bonwick void 551b24ab676SJeff Bonwick ddt_exit(ddt_t *ddt) 552b24ab676SJeff Bonwick { 553b24ab676SJeff Bonwick mutex_exit(&ddt->ddt_lock); 554b24ab676SJeff Bonwick } 555b24ab676SJeff Bonwick 556b24ab676SJeff Bonwick static ddt_entry_t * 557b24ab676SJeff Bonwick ddt_alloc(const ddt_key_t *ddk) 558b24ab676SJeff Bonwick { 559b24ab676SJeff Bonwick ddt_entry_t *dde; 560b24ab676SJeff Bonwick 561b24ab676SJeff Bonwick dde = kmem_zalloc(sizeof (ddt_entry_t), KM_SLEEP); 562b24ab676SJeff Bonwick cv_init(&dde->dde_cv, NULL, CV_DEFAULT, NULL); 563b24ab676SJeff Bonwick 564b24ab676SJeff Bonwick dde->dde_key = *ddk; 565b24ab676SJeff Bonwick 566b24ab676SJeff Bonwick return (dde); 567b24ab676SJeff Bonwick } 568b24ab676SJeff Bonwick 569b24ab676SJeff Bonwick static void 570b24ab676SJeff Bonwick ddt_free(ddt_entry_t *dde) 571b24ab676SJeff Bonwick { 572b24ab676SJeff Bonwick ASSERT(!dde->dde_loading); 573b24ab676SJeff Bonwick 574b24ab676SJeff Bonwick for (int p = 0; p < DDT_PHYS_TYPES; p++) 575b24ab676SJeff Bonwick ASSERT(dde->dde_lead_zio[p] == NULL); 576b24ab676SJeff Bonwick 577b24ab676SJeff Bonwick if (dde->dde_repair_data != NULL) 578b24ab676SJeff Bonwick zio_buf_free(dde->dde_repair_data, 579b24ab676SJeff Bonwick DDK_GET_PSIZE(&dde->dde_key)); 580b24ab676SJeff Bonwick 581b24ab676SJeff Bonwick cv_destroy(&dde->dde_cv); 582b24ab676SJeff Bonwick kmem_free(dde, sizeof (*dde)); 583b24ab676SJeff Bonwick } 584b24ab676SJeff Bonwick 585b24ab676SJeff Bonwick void 586b24ab676SJeff Bonwick ddt_remove(ddt_t *ddt, ddt_entry_t *dde) 587b24ab676SJeff Bonwick { 588b24ab676SJeff Bonwick ASSERT(MUTEX_HELD(&ddt->ddt_lock)); 589b24ab676SJeff Bonwick 590b24ab676SJeff Bonwick avl_remove(&ddt->ddt_tree, dde); 591b24ab676SJeff Bonwick ddt_free(dde); 592b24ab676SJeff Bonwick } 593b24ab676SJeff Bonwick 594b24ab676SJeff Bonwick ddt_entry_t * 595b24ab676SJeff Bonwick ddt_lookup(ddt_t *ddt, const blkptr_t *bp, boolean_t add) 596b24ab676SJeff Bonwick { 597b24ab676SJeff Bonwick ddt_entry_t *dde, dde_search; 598b24ab676SJeff Bonwick enum ddt_type type; 599b24ab676SJeff Bonwick enum ddt_class class; 600b24ab676SJeff Bonwick avl_index_t where; 601b24ab676SJeff Bonwick int error; 602b24ab676SJeff Bonwick 603b24ab676SJeff Bonwick ASSERT(MUTEX_HELD(&ddt->ddt_lock)); 604b24ab676SJeff Bonwick 605b24ab676SJeff Bonwick ddt_key_fill(&dde_search.dde_key, bp); 606b24ab676SJeff Bonwick 607b24ab676SJeff Bonwick dde = avl_find(&ddt->ddt_tree, &dde_search, &where); 608b24ab676SJeff Bonwick if (dde == NULL) { 609b24ab676SJeff Bonwick if (!add) 610b24ab676SJeff Bonwick return (NULL); 611b24ab676SJeff Bonwick dde = ddt_alloc(&dde_search.dde_key); 612b24ab676SJeff Bonwick avl_insert(&ddt->ddt_tree, dde, where); 613b24ab676SJeff Bonwick } 614b24ab676SJeff Bonwick 615b24ab676SJeff Bonwick while (dde->dde_loading) 616b24ab676SJeff Bonwick cv_wait(&dde->dde_cv, &ddt->ddt_lock); 617b24ab676SJeff Bonwick 618b24ab676SJeff Bonwick if (dde->dde_loaded) 619b24ab676SJeff Bonwick return (dde); 620b24ab676SJeff Bonwick 621b24ab676SJeff Bonwick dde->dde_loading = B_TRUE; 622b24ab676SJeff Bonwick 623b24ab676SJeff Bonwick ddt_exit(ddt); 624b24ab676SJeff Bonwick 625b24ab676SJeff Bonwick error = ENOENT; 626b24ab676SJeff Bonwick 627b24ab676SJeff Bonwick for (type = 0; type < DDT_TYPES; type++) { 628b24ab676SJeff Bonwick for (class = 0; class < DDT_CLASSES; class++) { 629b24ab676SJeff Bonwick error = ddt_object_lookup(ddt, type, class, dde); 630b24ab676SJeff Bonwick if (error != ENOENT) 631b24ab676SJeff Bonwick break; 632b24ab676SJeff Bonwick } 633b24ab676SJeff Bonwick if (error != ENOENT) 634b24ab676SJeff Bonwick break; 635b24ab676SJeff Bonwick } 636b24ab676SJeff Bonwick 637b24ab676SJeff Bonwick ASSERT(error == 0 || error == ENOENT); 638b24ab676SJeff Bonwick 639b24ab676SJeff Bonwick ddt_enter(ddt); 640b24ab676SJeff Bonwick 641b24ab676SJeff Bonwick ASSERT(dde->dde_loaded == B_FALSE); 642b24ab676SJeff Bonwick ASSERT(dde->dde_loading == B_TRUE); 643b24ab676SJeff Bonwick 644b24ab676SJeff Bonwick dde->dde_type = type; /* will be DDT_TYPES if no entry found */ 645b24ab676SJeff Bonwick dde->dde_class = class; /* will be DDT_CLASSES if no entry found */ 646b24ab676SJeff Bonwick dde->dde_loaded = B_TRUE; 647b24ab676SJeff Bonwick dde->dde_loading = B_FALSE; 648b24ab676SJeff Bonwick 649b24ab676SJeff Bonwick if (error == 0) 650b24ab676SJeff Bonwick ddt_stat_update(ddt, dde, -1ULL); 651b24ab676SJeff Bonwick 652b24ab676SJeff Bonwick cv_broadcast(&dde->dde_cv); 653b24ab676SJeff Bonwick 654b24ab676SJeff Bonwick return (dde); 655b24ab676SJeff Bonwick } 656b24ab676SJeff Bonwick 657b24ab676SJeff Bonwick int 658b24ab676SJeff Bonwick ddt_entry_compare(const void *x1, const void *x2) 659b24ab676SJeff Bonwick { 660b24ab676SJeff Bonwick const ddt_entry_t *dde1 = x1; 661b24ab676SJeff Bonwick const ddt_entry_t *dde2 = x2; 662b24ab676SJeff Bonwick const uint64_t *u1 = (const uint64_t *)&dde1->dde_key; 663b24ab676SJeff Bonwick const uint64_t *u2 = (const uint64_t *)&dde2->dde_key; 664b24ab676SJeff Bonwick 665b24ab676SJeff Bonwick for (int i = 0; i < DDT_KEY_WORDS; i++) { 666b24ab676SJeff Bonwick if (u1[i] < u2[i]) 667b24ab676SJeff Bonwick return (-1); 668b24ab676SJeff Bonwick if (u1[i] > u2[i]) 669b24ab676SJeff Bonwick return (1); 670b24ab676SJeff Bonwick } 671b24ab676SJeff Bonwick 672b24ab676SJeff Bonwick return (0); 673b24ab676SJeff Bonwick } 674b24ab676SJeff Bonwick 675b24ab676SJeff Bonwick static ddt_t * 676b24ab676SJeff Bonwick ddt_table_alloc(spa_t *spa, enum zio_checksum c) 677b24ab676SJeff Bonwick { 678b24ab676SJeff Bonwick ddt_t *ddt; 679b24ab676SJeff Bonwick 680b24ab676SJeff Bonwick ddt = kmem_zalloc(sizeof (*ddt), KM_SLEEP); 681b24ab676SJeff Bonwick 682b24ab676SJeff Bonwick mutex_init(&ddt->ddt_lock, NULL, MUTEX_DEFAULT, NULL); 683b24ab676SJeff Bonwick avl_create(&ddt->ddt_tree, ddt_entry_compare, 684b24ab676SJeff Bonwick sizeof (ddt_entry_t), offsetof(ddt_entry_t, dde_node)); 685b24ab676SJeff Bonwick avl_create(&ddt->ddt_repair_tree, ddt_entry_compare, 686b24ab676SJeff Bonwick sizeof (ddt_entry_t), offsetof(ddt_entry_t, dde_node)); 687b24ab676SJeff Bonwick ddt->ddt_checksum = c; 688b24ab676SJeff Bonwick ddt->ddt_spa = spa; 689b24ab676SJeff Bonwick ddt->ddt_os = spa->spa_meta_objset; 690b24ab676SJeff Bonwick 691b24ab676SJeff Bonwick return (ddt); 692b24ab676SJeff Bonwick } 693b24ab676SJeff Bonwick 694b24ab676SJeff Bonwick static void 695b24ab676SJeff Bonwick ddt_table_free(ddt_t *ddt) 696b24ab676SJeff Bonwick { 697b24ab676SJeff Bonwick ASSERT(avl_numnodes(&ddt->ddt_tree) == 0); 698b24ab676SJeff Bonwick ASSERT(avl_numnodes(&ddt->ddt_repair_tree) == 0); 699b24ab676SJeff Bonwick avl_destroy(&ddt->ddt_tree); 700b24ab676SJeff Bonwick avl_destroy(&ddt->ddt_repair_tree); 701b24ab676SJeff Bonwick mutex_destroy(&ddt->ddt_lock); 702b24ab676SJeff Bonwick kmem_free(ddt, sizeof (*ddt)); 703b24ab676SJeff Bonwick } 704b24ab676SJeff Bonwick 705b24ab676SJeff Bonwick void 706b24ab676SJeff Bonwick ddt_create(spa_t *spa) 707b24ab676SJeff Bonwick { 708b24ab676SJeff Bonwick spa->spa_dedup_checksum = ZIO_DEDUPCHECKSUM; 709b24ab676SJeff Bonwick 710b24ab676SJeff Bonwick for (enum zio_checksum c = 0; c < ZIO_CHECKSUM_FUNCTIONS; c++) 711b24ab676SJeff Bonwick spa->spa_ddt[c] = ddt_table_alloc(spa, c); 712b24ab676SJeff Bonwick } 713b24ab676SJeff Bonwick 714b24ab676SJeff Bonwick int 715b24ab676SJeff Bonwick ddt_load(spa_t *spa) 716b24ab676SJeff Bonwick { 717b24ab676SJeff Bonwick int error; 718b24ab676SJeff Bonwick 719b24ab676SJeff Bonwick ddt_create(spa); 720b24ab676SJeff Bonwick 721b24ab676SJeff Bonwick error = zap_lookup(spa->spa_meta_objset, DMU_POOL_DIRECTORY_OBJECT, 722b24ab676SJeff Bonwick DMU_POOL_DDT_STATS, sizeof (uint64_t), 1, 723b24ab676SJeff Bonwick &spa->spa_ddt_stat_object); 724b24ab676SJeff Bonwick 725b24ab676SJeff Bonwick if (error) 726b24ab676SJeff Bonwick return (error == ENOENT ? 0 : error); 727b24ab676SJeff Bonwick 728b24ab676SJeff Bonwick for (enum zio_checksum c = 0; c < ZIO_CHECKSUM_FUNCTIONS; c++) { 729b24ab676SJeff Bonwick for (enum ddt_type type = 0; type < DDT_TYPES; type++) { 730b24ab676SJeff Bonwick for (enum ddt_class class = 0; class < DDT_CLASSES; 731b24ab676SJeff Bonwick class++) { 732b24ab676SJeff Bonwick ddt_t *ddt = spa->spa_ddt[c]; 733b24ab676SJeff Bonwick error = ddt_object_load(ddt, type, class); 734b24ab676SJeff Bonwick if (error != 0 && error != ENOENT) 735b24ab676SJeff Bonwick return (error); 736b24ab676SJeff Bonwick } 737b24ab676SJeff Bonwick } 738b24ab676SJeff Bonwick } 739b24ab676SJeff Bonwick 740b24ab676SJeff Bonwick return (0); 741b24ab676SJeff Bonwick } 742b24ab676SJeff Bonwick 743b24ab676SJeff Bonwick void 744b24ab676SJeff Bonwick ddt_unload(spa_t *spa) 745b24ab676SJeff Bonwick { 746b24ab676SJeff Bonwick for (enum zio_checksum c = 0; c < ZIO_CHECKSUM_FUNCTIONS; c++) { 747b24ab676SJeff Bonwick if (spa->spa_ddt[c]) { 748b24ab676SJeff Bonwick ddt_table_free(spa->spa_ddt[c]); 749b24ab676SJeff Bonwick spa->spa_ddt[c] = NULL; 750b24ab676SJeff Bonwick } 751b24ab676SJeff Bonwick } 752b24ab676SJeff Bonwick } 753b24ab676SJeff Bonwick 754*bbfd46c4SJeff Bonwick boolean_t 755*bbfd46c4SJeff Bonwick ddt_class_contains(spa_t *spa, enum ddt_class max_class, const blkptr_t *bp) 756*bbfd46c4SJeff Bonwick { 757*bbfd46c4SJeff Bonwick ddt_t *ddt; 758*bbfd46c4SJeff Bonwick ddt_entry_t dde; 759*bbfd46c4SJeff Bonwick 760*bbfd46c4SJeff Bonwick if (!BP_GET_DEDUP(bp)) 761*bbfd46c4SJeff Bonwick return (B_FALSE); 762*bbfd46c4SJeff Bonwick 763*bbfd46c4SJeff Bonwick if (max_class == DDT_CLASS_UNIQUE) 764*bbfd46c4SJeff Bonwick return (B_TRUE); 765*bbfd46c4SJeff Bonwick 766*bbfd46c4SJeff Bonwick ddt = spa->spa_ddt[BP_GET_CHECKSUM(bp)]; 767*bbfd46c4SJeff Bonwick 768*bbfd46c4SJeff Bonwick ddt_key_fill(&dde.dde_key, bp); 769*bbfd46c4SJeff Bonwick 770*bbfd46c4SJeff Bonwick for (enum ddt_type type = 0; type < DDT_TYPES; type++) 771*bbfd46c4SJeff Bonwick for (enum ddt_class class = 0; class <= max_class; class++) 772*bbfd46c4SJeff Bonwick if (ddt_object_lookup(ddt, type, class, &dde) == 0) 773*bbfd46c4SJeff Bonwick return (B_TRUE); 774*bbfd46c4SJeff Bonwick 775*bbfd46c4SJeff Bonwick return (B_FALSE); 776*bbfd46c4SJeff Bonwick } 777*bbfd46c4SJeff Bonwick 778b24ab676SJeff Bonwick ddt_entry_t * 779b24ab676SJeff Bonwick ddt_repair_start(ddt_t *ddt, const blkptr_t *bp) 780b24ab676SJeff Bonwick { 781b24ab676SJeff Bonwick ddt_key_t ddk; 782b24ab676SJeff Bonwick ddt_entry_t *dde; 783b24ab676SJeff Bonwick 784b24ab676SJeff Bonwick ddt_key_fill(&ddk, bp); 785b24ab676SJeff Bonwick 786b24ab676SJeff Bonwick dde = ddt_alloc(&ddk); 787b24ab676SJeff Bonwick 788b24ab676SJeff Bonwick for (enum ddt_type type = 0; type < DDT_TYPES; type++) { 789b24ab676SJeff Bonwick for (enum ddt_class class = 0; class < DDT_CLASSES; class++) { 790b24ab676SJeff Bonwick /* 791b24ab676SJeff Bonwick * We can only do repair if there are multiple copies 792b24ab676SJeff Bonwick * of the block. For anything in the UNIQUE class, 793b24ab676SJeff Bonwick * there's definitely only one copy, so don't even try. 794b24ab676SJeff Bonwick */ 795b24ab676SJeff Bonwick if (class != DDT_CLASS_UNIQUE && 796b24ab676SJeff Bonwick ddt_object_lookup(ddt, type, class, dde) == 0) 797b24ab676SJeff Bonwick return (dde); 798b24ab676SJeff Bonwick } 799b24ab676SJeff Bonwick } 800b24ab676SJeff Bonwick 801b24ab676SJeff Bonwick bzero(dde->dde_phys, sizeof (dde->dde_phys)); 802b24ab676SJeff Bonwick 803b24ab676SJeff Bonwick return (dde); 804b24ab676SJeff Bonwick } 805b24ab676SJeff Bonwick 806b24ab676SJeff Bonwick void 807b24ab676SJeff Bonwick ddt_repair_done(ddt_t *ddt, ddt_entry_t *dde) 808b24ab676SJeff Bonwick { 809b24ab676SJeff Bonwick avl_index_t where; 810b24ab676SJeff Bonwick 811b24ab676SJeff Bonwick ddt_enter(ddt); 812b24ab676SJeff Bonwick 813b24ab676SJeff Bonwick if (dde->dde_repair_data != NULL && spa_writeable(ddt->ddt_spa) && 814b24ab676SJeff Bonwick avl_find(&ddt->ddt_repair_tree, dde, &where) == NULL) 815b24ab676SJeff Bonwick avl_insert(&ddt->ddt_repair_tree, dde, where); 816b24ab676SJeff Bonwick else 817b24ab676SJeff Bonwick ddt_free(dde); 818b24ab676SJeff Bonwick 819b24ab676SJeff Bonwick ddt_exit(ddt); 820b24ab676SJeff Bonwick } 821b24ab676SJeff Bonwick 822b24ab676SJeff Bonwick static void 823b24ab676SJeff Bonwick ddt_repair_entry_done(zio_t *zio) 824b24ab676SJeff Bonwick { 825b24ab676SJeff Bonwick ddt_entry_t *rdde = zio->io_private; 826b24ab676SJeff Bonwick 827b24ab676SJeff Bonwick ddt_free(rdde); 828b24ab676SJeff Bonwick } 829b24ab676SJeff Bonwick 830b24ab676SJeff Bonwick static void 831b24ab676SJeff Bonwick ddt_repair_entry(ddt_t *ddt, ddt_entry_t *dde, ddt_entry_t *rdde, zio_t *rio) 832b24ab676SJeff Bonwick { 833b24ab676SJeff Bonwick ddt_phys_t *ddp = dde->dde_phys; 834b24ab676SJeff Bonwick ddt_phys_t *rddp = rdde->dde_phys; 835b24ab676SJeff Bonwick ddt_key_t *ddk = &dde->dde_key; 836b24ab676SJeff Bonwick ddt_key_t *rddk = &rdde->dde_key; 837b24ab676SJeff Bonwick zio_t *zio; 838b24ab676SJeff Bonwick blkptr_t blk; 839b24ab676SJeff Bonwick 840b24ab676SJeff Bonwick zio = zio_null(rio, rio->io_spa, NULL, 841b24ab676SJeff Bonwick ddt_repair_entry_done, rdde, rio->io_flags); 842b24ab676SJeff Bonwick 843b24ab676SJeff Bonwick for (int p = 0; p < DDT_PHYS_TYPES; p++, ddp++, rddp++) { 844b24ab676SJeff Bonwick if (ddp->ddp_phys_birth == 0 || 845b24ab676SJeff Bonwick ddp->ddp_phys_birth != rddp->ddp_phys_birth || 846b24ab676SJeff Bonwick bcmp(ddp->ddp_dva, rddp->ddp_dva, sizeof (ddp->ddp_dva))) 847b24ab676SJeff Bonwick continue; 848*bbfd46c4SJeff Bonwick ddt_bp_create(ddt->ddt_checksum, ddk, ddp, &blk); 849b24ab676SJeff Bonwick zio_nowait(zio_rewrite(zio, zio->io_spa, 0, &blk, 850b24ab676SJeff Bonwick rdde->dde_repair_data, DDK_GET_PSIZE(rddk), NULL, NULL, 851b24ab676SJeff Bonwick ZIO_PRIORITY_SYNC_WRITE, ZIO_DDT_CHILD_FLAGS(zio), NULL)); 852b24ab676SJeff Bonwick } 853b24ab676SJeff Bonwick 854b24ab676SJeff Bonwick zio_nowait(zio); 855b24ab676SJeff Bonwick } 856b24ab676SJeff Bonwick 857b24ab676SJeff Bonwick static void 858b24ab676SJeff Bonwick ddt_repair_table(ddt_t *ddt, zio_t *rio) 859b24ab676SJeff Bonwick { 860b24ab676SJeff Bonwick spa_t *spa = ddt->ddt_spa; 861b24ab676SJeff Bonwick ddt_entry_t *dde, *rdde_next, *rdde; 862b24ab676SJeff Bonwick avl_tree_t *t = &ddt->ddt_repair_tree; 863b24ab676SJeff Bonwick blkptr_t blk; 864b24ab676SJeff Bonwick 865b24ab676SJeff Bonwick if (spa_sync_pass(spa) > 1) 866b24ab676SJeff Bonwick return; 867b24ab676SJeff Bonwick 868b24ab676SJeff Bonwick ddt_enter(ddt); 869b24ab676SJeff Bonwick for (rdde = avl_first(t); rdde != NULL; rdde = rdde_next) { 870b24ab676SJeff Bonwick rdde_next = AVL_NEXT(t, rdde); 871b24ab676SJeff Bonwick avl_remove(&ddt->ddt_repair_tree, rdde); 872b24ab676SJeff Bonwick ddt_exit(ddt); 873*bbfd46c4SJeff Bonwick ddt_bp_create(ddt->ddt_checksum, &rdde->dde_key, NULL, &blk); 874b24ab676SJeff Bonwick dde = ddt_repair_start(ddt, &blk); 875b24ab676SJeff Bonwick ddt_repair_entry(ddt, dde, rdde, rio); 876b24ab676SJeff Bonwick ddt_repair_done(ddt, dde); 877b24ab676SJeff Bonwick ddt_enter(ddt); 878b24ab676SJeff Bonwick } 879b24ab676SJeff Bonwick ddt_exit(ddt); 880b24ab676SJeff Bonwick } 881b24ab676SJeff Bonwick 882b24ab676SJeff Bonwick static void 883b24ab676SJeff Bonwick ddt_sync_entry(ddt_t *ddt, ddt_entry_t *dde, dmu_tx_t *tx, uint64_t txg) 884b24ab676SJeff Bonwick { 885*bbfd46c4SJeff Bonwick dsl_pool_t *dp = ddt->ddt_spa->spa_dsl_pool; 886b24ab676SJeff Bonwick ddt_phys_t *ddp = dde->dde_phys; 887b24ab676SJeff Bonwick ddt_key_t *ddk = &dde->dde_key; 888b24ab676SJeff Bonwick enum ddt_type otype = dde->dde_type; 889b24ab676SJeff Bonwick enum ddt_type ntype = DDT_TYPE_CURRENT; 890b24ab676SJeff Bonwick enum ddt_class oclass = dde->dde_class; 891b24ab676SJeff Bonwick enum ddt_class nclass; 892b24ab676SJeff Bonwick uint64_t total_refcnt = 0; 893b24ab676SJeff Bonwick 894b24ab676SJeff Bonwick ASSERT(dde->dde_loaded); 895b24ab676SJeff Bonwick ASSERT(!dde->dde_loading); 896b24ab676SJeff Bonwick 897b24ab676SJeff Bonwick for (int p = 0; p < DDT_PHYS_TYPES; p++, ddp++) { 898b24ab676SJeff Bonwick ASSERT(dde->dde_lead_zio[p] == NULL); 899b24ab676SJeff Bonwick ASSERT((int64_t)ddp->ddp_refcnt >= 0); 900b24ab676SJeff Bonwick if (ddp->ddp_phys_birth == 0) { 901b24ab676SJeff Bonwick ASSERT(ddp->ddp_refcnt == 0); 902b24ab676SJeff Bonwick continue; 903b24ab676SJeff Bonwick } 904b24ab676SJeff Bonwick if (p == DDT_PHYS_DITTO) { 905b24ab676SJeff Bonwick if (ddt_ditto_copies_needed(ddt, dde, NULL) == 0) 906b24ab676SJeff Bonwick ddt_phys_free(ddt, ddk, ddp, txg); 907b24ab676SJeff Bonwick continue; 908b24ab676SJeff Bonwick } 909b24ab676SJeff Bonwick if (ddp->ddp_refcnt == 0) 910b24ab676SJeff Bonwick ddt_phys_free(ddt, ddk, ddp, txg); 911b24ab676SJeff Bonwick total_refcnt += ddp->ddp_refcnt; 912b24ab676SJeff Bonwick } 913b24ab676SJeff Bonwick 914b24ab676SJeff Bonwick if (dde->dde_phys[DDT_PHYS_DITTO].ddp_phys_birth != 0) 915b24ab676SJeff Bonwick nclass = DDT_CLASS_DITTO; 916b24ab676SJeff Bonwick else if (total_refcnt > 1) 917b24ab676SJeff Bonwick nclass = DDT_CLASS_DUPLICATE; 918b24ab676SJeff Bonwick else 919b24ab676SJeff Bonwick nclass = DDT_CLASS_UNIQUE; 920b24ab676SJeff Bonwick 921b24ab676SJeff Bonwick if (otype != DDT_TYPES && 922b24ab676SJeff Bonwick (otype != ntype || oclass != nclass || total_refcnt == 0)) { 923b24ab676SJeff Bonwick VERIFY(ddt_object_remove(ddt, otype, oclass, dde, tx) == 0); 924b24ab676SJeff Bonwick ASSERT(ddt_object_lookup(ddt, otype, oclass, dde) == ENOENT); 925b24ab676SJeff Bonwick } 926b24ab676SJeff Bonwick 927b24ab676SJeff Bonwick if (total_refcnt != 0) { 928b24ab676SJeff Bonwick dde->dde_type = ntype; 929b24ab676SJeff Bonwick dde->dde_class = nclass; 930b24ab676SJeff Bonwick ddt_stat_update(ddt, dde, 0); 931b24ab676SJeff Bonwick if (!ddt_object_exists(ddt, ntype, nclass)) 932b24ab676SJeff Bonwick ddt_object_create(ddt, ntype, nclass, tx); 933b24ab676SJeff Bonwick VERIFY(ddt_object_update(ddt, ntype, nclass, dde, tx) == 0); 934*bbfd46c4SJeff Bonwick 935*bbfd46c4SJeff Bonwick if (dp->dp_scrub_func != SCRUB_FUNC_NONE && 936*bbfd46c4SJeff Bonwick oclass > dp->dp_scrub_ddt_class_max && 937*bbfd46c4SJeff Bonwick nclass <= dp->dp_scrub_ddt_class_max) 938*bbfd46c4SJeff Bonwick dsl_pool_scrub_ddt_entry(dp, ddt->ddt_checksum, dde); 939b24ab676SJeff Bonwick } 940b24ab676SJeff Bonwick } 941b24ab676SJeff Bonwick 942b24ab676SJeff Bonwick static void 943b24ab676SJeff Bonwick ddt_sync_table(ddt_t *ddt, dmu_tx_t *tx, uint64_t txg) 944b24ab676SJeff Bonwick { 945b24ab676SJeff Bonwick spa_t *spa = ddt->ddt_spa; 946b24ab676SJeff Bonwick ddt_entry_t *dde; 947b24ab676SJeff Bonwick void *cookie = NULL; 948b24ab676SJeff Bonwick 949b24ab676SJeff Bonwick if (avl_numnodes(&ddt->ddt_tree) == 0) 950b24ab676SJeff Bonwick return; 951b24ab676SJeff Bonwick 952b24ab676SJeff Bonwick ASSERT(spa_sync_pass(spa) == 1); 953b24ab676SJeff Bonwick ASSERT(spa->spa_uberblock.ub_version >= SPA_VERSION_DEDUP); 954b24ab676SJeff Bonwick 955b24ab676SJeff Bonwick if (spa->spa_ddt_stat_object == 0) { 956b24ab676SJeff Bonwick spa->spa_ddt_stat_object = zap_create(ddt->ddt_os, 957b24ab676SJeff Bonwick DMU_OT_DDT_STATS, DMU_OT_NONE, 0, tx); 958b24ab676SJeff Bonwick VERIFY(zap_add(ddt->ddt_os, DMU_POOL_DIRECTORY_OBJECT, 959b24ab676SJeff Bonwick DMU_POOL_DDT_STATS, sizeof (uint64_t), 1, 960b24ab676SJeff Bonwick &spa->spa_ddt_stat_object, tx) == 0); 961b24ab676SJeff Bonwick } 962b24ab676SJeff Bonwick 963b24ab676SJeff Bonwick while ((dde = avl_destroy_nodes(&ddt->ddt_tree, &cookie)) != NULL) { 964b24ab676SJeff Bonwick ddt_sync_entry(ddt, dde, tx, txg); 965b24ab676SJeff Bonwick ddt_free(dde); 966b24ab676SJeff Bonwick } 967b24ab676SJeff Bonwick 968b24ab676SJeff Bonwick for (enum ddt_type type = 0; type < DDT_TYPES; type++) { 969b24ab676SJeff Bonwick for (enum ddt_class class = 0; class < DDT_CLASSES; class++) { 970b24ab676SJeff Bonwick if (!ddt_object_exists(ddt, type, class)) 971b24ab676SJeff Bonwick continue; 972b24ab676SJeff Bonwick ddt_object_sync(ddt, type, class, tx); 973b24ab676SJeff Bonwick if (ddt_object_count(ddt, type, class) == 0) 974b24ab676SJeff Bonwick ddt_object_destroy(ddt, type, class, tx); 975b24ab676SJeff Bonwick } 976b24ab676SJeff Bonwick } 977b24ab676SJeff Bonwick } 978b24ab676SJeff Bonwick 979b24ab676SJeff Bonwick void 980b24ab676SJeff Bonwick ddt_sync(spa_t *spa, uint64_t txg) 981b24ab676SJeff Bonwick { 982b24ab676SJeff Bonwick dmu_tx_t *tx; 983b24ab676SJeff Bonwick zio_t *rio = zio_root(spa, NULL, NULL, 984b24ab676SJeff Bonwick ZIO_FLAG_CANFAIL | ZIO_FLAG_SPECULATIVE); 985b24ab676SJeff Bonwick 986b24ab676SJeff Bonwick ASSERT(spa_syncing_txg(spa) == txg); 987b24ab676SJeff Bonwick 988b24ab676SJeff Bonwick tx = dmu_tx_create_assigned(spa->spa_dsl_pool, txg); 989b24ab676SJeff Bonwick 990b24ab676SJeff Bonwick for (enum zio_checksum c = 0; c < ZIO_CHECKSUM_FUNCTIONS; c++) { 991b24ab676SJeff Bonwick ddt_t *ddt = spa->spa_ddt[c]; 992b24ab676SJeff Bonwick if (ddt == NULL) 993b24ab676SJeff Bonwick continue; 994b24ab676SJeff Bonwick ddt_sync_table(ddt, tx, txg); 995b24ab676SJeff Bonwick ddt_repair_table(ddt, rio); 996b24ab676SJeff Bonwick } 997b24ab676SJeff Bonwick 998b24ab676SJeff Bonwick (void) zio_wait(rio); 999b24ab676SJeff Bonwick 1000b24ab676SJeff Bonwick dmu_tx_commit(tx); 1001b24ab676SJeff Bonwick } 1002*bbfd46c4SJeff Bonwick 1003*bbfd46c4SJeff Bonwick int 1004*bbfd46c4SJeff Bonwick ddt_walk(spa_t *spa, ddt_bookmark_t *ddb, ddt_entry_t *dde) 1005*bbfd46c4SJeff Bonwick { 1006*bbfd46c4SJeff Bonwick do { 1007*bbfd46c4SJeff Bonwick do { 1008*bbfd46c4SJeff Bonwick do { 1009*bbfd46c4SJeff Bonwick ddt_t *ddt = spa->spa_ddt[ddb->ddb_checksum]; 1010*bbfd46c4SJeff Bonwick int error = ENOENT; 1011*bbfd46c4SJeff Bonwick if (ddt_object_exists(ddt, ddb->ddb_type, 1012*bbfd46c4SJeff Bonwick ddb->ddb_class)) { 1013*bbfd46c4SJeff Bonwick error = ddt_object_walk(ddt, 1014*bbfd46c4SJeff Bonwick ddb->ddb_type, ddb->ddb_class, 1015*bbfd46c4SJeff Bonwick &ddb->ddb_cursor, dde); 1016*bbfd46c4SJeff Bonwick } 1017*bbfd46c4SJeff Bonwick if (error == 0) 1018*bbfd46c4SJeff Bonwick return (0); 1019*bbfd46c4SJeff Bonwick if (error != ENOENT) 1020*bbfd46c4SJeff Bonwick return (error); 1021*bbfd46c4SJeff Bonwick ddb->ddb_cursor = 0; 1022*bbfd46c4SJeff Bonwick } while (++ddb->ddb_checksum < ZIO_CHECKSUM_FUNCTIONS); 1023*bbfd46c4SJeff Bonwick ddb->ddb_checksum = 0; 1024*bbfd46c4SJeff Bonwick } while (++ddb->ddb_type < DDT_TYPES); 1025*bbfd46c4SJeff Bonwick ddb->ddb_type = 0; 1026*bbfd46c4SJeff Bonwick } while (++ddb->ddb_class < DDT_CLASSES); 1027*bbfd46c4SJeff Bonwick 1028*bbfd46c4SJeff Bonwick return (ENOENT); 1029*bbfd46c4SJeff Bonwick } 1030