1cde58dbcSMatthew Ahrens /* 2cde58dbcSMatthew Ahrens * CDDL HEADER START 3cde58dbcSMatthew Ahrens * 4cde58dbcSMatthew Ahrens * The contents of this file are subject to the terms of the 5cde58dbcSMatthew Ahrens * Common Development and Distribution License (the "License"). 6cde58dbcSMatthew Ahrens * You may not use this file except in compliance with the License. 7cde58dbcSMatthew Ahrens * 8cde58dbcSMatthew Ahrens * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE 9cde58dbcSMatthew Ahrens * or http://www.opensolaris.org/os/licensing. 10cde58dbcSMatthew Ahrens * See the License for the specific language governing permissions 11cde58dbcSMatthew Ahrens * and limitations under the License. 12cde58dbcSMatthew Ahrens * 13cde58dbcSMatthew Ahrens * When distributing Covered Code, include this CDDL HEADER in each 14cde58dbcSMatthew Ahrens * file and include the License file at usr/src/OPENSOLARIS.LICENSE. 15cde58dbcSMatthew Ahrens * If applicable, add the following below this CDDL HEADER, with the 16cde58dbcSMatthew Ahrens * fields enclosed by brackets "[]" replaced with your own identifying 17cde58dbcSMatthew Ahrens * information: Portions Copyright [yyyy] [name of copyright owner] 18cde58dbcSMatthew Ahrens * 19cde58dbcSMatthew Ahrens * CDDL HEADER END 20cde58dbcSMatthew Ahrens */ 21cde58dbcSMatthew Ahrens /* 22cde58dbcSMatthew Ahrens * Copyright (c) 2010, Oracle and/or its affiliates. All rights reserved. 23*5cabbc6bSPrashanth Sreenivasa * Copyright (c) 2012, 2015 by Delphix. All rights reserved. 24bc9014e6SJustin Gibbs * Copyright (c) 2014 Spectra Logic Corporation, All rights reserved. 25c3d26abcSMatthew Ahrens * Copyright (c) 2014 Integros [integros.com] 26cde58dbcSMatthew Ahrens */ 27cde58dbcSMatthew Ahrens 28cde58dbcSMatthew Ahrens #include <sys/dsl_dataset.h> 29cde58dbcSMatthew Ahrens #include <sys/dmu.h> 30cde58dbcSMatthew Ahrens #include <sys/refcount.h> 31cde58dbcSMatthew Ahrens #include <sys/zap.h> 32cde58dbcSMatthew Ahrens #include <sys/zfs_context.h> 33cde58dbcSMatthew Ahrens #include <sys/dsl_pool.h> 34cde58dbcSMatthew Ahrens 3519b94df9SMatthew Ahrens /* 3619b94df9SMatthew Ahrens * Deadlist concurrency: 3719b94df9SMatthew Ahrens * 3819b94df9SMatthew Ahrens * Deadlists can only be modified from the syncing thread. 3919b94df9SMatthew Ahrens * 4019b94df9SMatthew Ahrens * Except for dsl_deadlist_insert(), it can only be modified with the 4119b94df9SMatthew Ahrens * dp_config_rwlock held with RW_WRITER. 4219b94df9SMatthew Ahrens * 4319b94df9SMatthew Ahrens * The accessors (dsl_deadlist_space() and dsl_deadlist_space_range()) can 4419b94df9SMatthew Ahrens * be called concurrently, from open context, with the dl_config_rwlock held 4519b94df9SMatthew Ahrens * with RW_READER. 4619b94df9SMatthew Ahrens * 4719b94df9SMatthew Ahrens * Therefore, we only need to provide locking between dsl_deadlist_insert() and 4819b94df9SMatthew Ahrens * the accessors, protecting: 4919b94df9SMatthew Ahrens * dl_phys->dl_used,comp,uncomp 5019b94df9SMatthew Ahrens * and protecting the dl_tree from being loaded. 5119b94df9SMatthew Ahrens * The locking is provided by dl_lock. Note that locking on the bpobj_t 5219b94df9SMatthew Ahrens * provides its own locking, and dl_oldfmt is immutable. 5319b94df9SMatthew Ahrens */ 5419b94df9SMatthew Ahrens 55cde58dbcSMatthew Ahrens static int 56cde58dbcSMatthew Ahrens dsl_deadlist_compare(const void *arg1, const void *arg2) 57cde58dbcSMatthew Ahrens { 58cde58dbcSMatthew Ahrens const dsl_deadlist_entry_t *dle1 = arg1; 59cde58dbcSMatthew Ahrens const dsl_deadlist_entry_t *dle2 = arg2; 60cde58dbcSMatthew Ahrens 61cde58dbcSMatthew Ahrens if (dle1->dle_mintxg < dle2->dle_mintxg) 62cde58dbcSMatthew Ahrens return (-1); 63cde58dbcSMatthew Ahrens else if (dle1->dle_mintxg > dle2->dle_mintxg) 64cde58dbcSMatthew Ahrens return (+1); 65cde58dbcSMatthew Ahrens else 66cde58dbcSMatthew Ahrens return (0); 67cde58dbcSMatthew Ahrens } 68cde58dbcSMatthew Ahrens 69cde58dbcSMatthew Ahrens static void 70cde58dbcSMatthew Ahrens dsl_deadlist_load_tree(dsl_deadlist_t *dl) 71cde58dbcSMatthew Ahrens { 72cde58dbcSMatthew Ahrens zap_cursor_t zc; 73cde58dbcSMatthew Ahrens zap_attribute_t za; 74cde58dbcSMatthew Ahrens 75a3905a45SSerapheim Dimitropoulos ASSERT(MUTEX_HELD(&dl->dl_lock)); 76a3905a45SSerapheim Dimitropoulos 77cde58dbcSMatthew Ahrens ASSERT(!dl->dl_oldfmt); 78cde58dbcSMatthew Ahrens if (dl->dl_havetree) 79cde58dbcSMatthew Ahrens return; 80cde58dbcSMatthew Ahrens 81cde58dbcSMatthew Ahrens avl_create(&dl->dl_tree, dsl_deadlist_compare, 82cde58dbcSMatthew Ahrens sizeof (dsl_deadlist_entry_t), 83cde58dbcSMatthew Ahrens offsetof(dsl_deadlist_entry_t, dle_node)); 84cde58dbcSMatthew Ahrens for (zap_cursor_init(&zc, dl->dl_os, dl->dl_object); 85cde58dbcSMatthew Ahrens zap_cursor_retrieve(&zc, &za) == 0; 86cde58dbcSMatthew Ahrens zap_cursor_advance(&zc)) { 87cde58dbcSMatthew Ahrens dsl_deadlist_entry_t *dle = kmem_alloc(sizeof (*dle), KM_SLEEP); 884585130bSYuri Pankov dle->dle_mintxg = zfs_strtonum(za.za_name, NULL); 89b420f3adSRichard Lowe VERIFY3U(0, ==, bpobj_open(&dle->dle_bpobj, dl->dl_os, 90cde58dbcSMatthew Ahrens za.za_first_integer)); 91cde58dbcSMatthew Ahrens avl_add(&dl->dl_tree, dle); 92cde58dbcSMatthew Ahrens } 93cde58dbcSMatthew Ahrens zap_cursor_fini(&zc); 94cde58dbcSMatthew Ahrens dl->dl_havetree = B_TRUE; 95cde58dbcSMatthew Ahrens } 96cde58dbcSMatthew Ahrens 97cde58dbcSMatthew Ahrens void 98cde58dbcSMatthew Ahrens dsl_deadlist_open(dsl_deadlist_t *dl, objset_t *os, uint64_t object) 99cde58dbcSMatthew Ahrens { 100cde58dbcSMatthew Ahrens dmu_object_info_t doi; 101cde58dbcSMatthew Ahrens 102*5cabbc6bSPrashanth Sreenivasa ASSERT(!dsl_deadlist_is_open(dl)); 103*5cabbc6bSPrashanth Sreenivasa 104cde58dbcSMatthew Ahrens mutex_init(&dl->dl_lock, NULL, MUTEX_DEFAULT, NULL); 105cde58dbcSMatthew Ahrens dl->dl_os = os; 106cde58dbcSMatthew Ahrens dl->dl_object = object; 107b420f3adSRichard Lowe VERIFY3U(0, ==, dmu_bonus_hold(os, object, dl, &dl->dl_dbuf)); 108cde58dbcSMatthew Ahrens dmu_object_info_from_db(dl->dl_dbuf, &doi); 109cde58dbcSMatthew Ahrens if (doi.doi_type == DMU_OT_BPOBJ) { 110cde58dbcSMatthew Ahrens dmu_buf_rele(dl->dl_dbuf, dl); 111cde58dbcSMatthew Ahrens dl->dl_dbuf = NULL; 112cde58dbcSMatthew Ahrens dl->dl_oldfmt = B_TRUE; 113b420f3adSRichard Lowe VERIFY3U(0, ==, bpobj_open(&dl->dl_bpobj, os, object)); 114cde58dbcSMatthew Ahrens return; 115cde58dbcSMatthew Ahrens } 116cde58dbcSMatthew Ahrens 117cde58dbcSMatthew Ahrens dl->dl_oldfmt = B_FALSE; 118cde58dbcSMatthew Ahrens dl->dl_phys = dl->dl_dbuf->db_data; 119cde58dbcSMatthew Ahrens dl->dl_havetree = B_FALSE; 120cde58dbcSMatthew Ahrens } 121cde58dbcSMatthew Ahrens 122*5cabbc6bSPrashanth Sreenivasa boolean_t 123*5cabbc6bSPrashanth Sreenivasa dsl_deadlist_is_open(dsl_deadlist_t *dl) 124*5cabbc6bSPrashanth Sreenivasa { 125*5cabbc6bSPrashanth Sreenivasa return (dl->dl_os != NULL); 126*5cabbc6bSPrashanth Sreenivasa } 127*5cabbc6bSPrashanth Sreenivasa 128cde58dbcSMatthew Ahrens void 129cde58dbcSMatthew Ahrens dsl_deadlist_close(dsl_deadlist_t *dl) 130cde58dbcSMatthew Ahrens { 131cde58dbcSMatthew Ahrens void *cookie = NULL; 132cde58dbcSMatthew Ahrens dsl_deadlist_entry_t *dle; 133cde58dbcSMatthew Ahrens 134*5cabbc6bSPrashanth Sreenivasa ASSERT(dsl_deadlist_is_open(dl)); 135bc9014e6SJustin Gibbs 136cde58dbcSMatthew Ahrens if (dl->dl_oldfmt) { 137cde58dbcSMatthew Ahrens dl->dl_oldfmt = B_FALSE; 138cde58dbcSMatthew Ahrens bpobj_close(&dl->dl_bpobj); 139*5cabbc6bSPrashanth Sreenivasa dl->dl_os = NULL; 140*5cabbc6bSPrashanth Sreenivasa dl->dl_object = 0; 141cde58dbcSMatthew Ahrens return; 142cde58dbcSMatthew Ahrens } 143cde58dbcSMatthew Ahrens 144cde58dbcSMatthew Ahrens if (dl->dl_havetree) { 145cde58dbcSMatthew Ahrens while ((dle = avl_destroy_nodes(&dl->dl_tree, &cookie)) 146cde58dbcSMatthew Ahrens != NULL) { 147cde58dbcSMatthew Ahrens bpobj_close(&dle->dle_bpobj); 148cde58dbcSMatthew Ahrens kmem_free(dle, sizeof (*dle)); 149cde58dbcSMatthew Ahrens } 150cde58dbcSMatthew Ahrens avl_destroy(&dl->dl_tree); 151cde58dbcSMatthew Ahrens } 152cde58dbcSMatthew Ahrens dmu_buf_rele(dl->dl_dbuf, dl); 153cde58dbcSMatthew Ahrens mutex_destroy(&dl->dl_lock); 154cde58dbcSMatthew Ahrens dl->dl_dbuf = NULL; 155cde58dbcSMatthew Ahrens dl->dl_phys = NULL; 156*5cabbc6bSPrashanth Sreenivasa dl->dl_os = NULL; 157*5cabbc6bSPrashanth Sreenivasa dl->dl_object = 0; 158cde58dbcSMatthew Ahrens } 159cde58dbcSMatthew Ahrens 160cde58dbcSMatthew Ahrens uint64_t 161cde58dbcSMatthew Ahrens dsl_deadlist_alloc(objset_t *os, dmu_tx_t *tx) 162cde58dbcSMatthew Ahrens { 163cde58dbcSMatthew Ahrens if (spa_version(dmu_objset_spa(os)) < SPA_VERSION_DEADLISTS) 164b5152584SMatthew Ahrens return (bpobj_alloc(os, SPA_OLD_MAXBLOCKSIZE, tx)); 165cde58dbcSMatthew Ahrens return (zap_create(os, DMU_OT_DEADLIST, DMU_OT_DEADLIST_HDR, 166cde58dbcSMatthew Ahrens sizeof (dsl_deadlist_phys_t), tx)); 167cde58dbcSMatthew Ahrens } 168cde58dbcSMatthew Ahrens 169cde58dbcSMatthew Ahrens void 170cde58dbcSMatthew Ahrens dsl_deadlist_free(objset_t *os, uint64_t dlobj, dmu_tx_t *tx) 171cde58dbcSMatthew Ahrens { 172cde58dbcSMatthew Ahrens dmu_object_info_t doi; 173cde58dbcSMatthew Ahrens zap_cursor_t zc; 174cde58dbcSMatthew Ahrens zap_attribute_t za; 175cde58dbcSMatthew Ahrens 176b420f3adSRichard Lowe VERIFY3U(0, ==, dmu_object_info(os, dlobj, &doi)); 177cde58dbcSMatthew Ahrens if (doi.doi_type == DMU_OT_BPOBJ) { 178cde58dbcSMatthew Ahrens bpobj_free(os, dlobj, tx); 179cde58dbcSMatthew Ahrens return; 180cde58dbcSMatthew Ahrens } 181cde58dbcSMatthew Ahrens 182cde58dbcSMatthew Ahrens for (zap_cursor_init(&zc, os, dlobj); 183cde58dbcSMatthew Ahrens zap_cursor_retrieve(&zc, &za) == 0; 184f1745736SMatthew Ahrens zap_cursor_advance(&zc)) { 185f1745736SMatthew Ahrens uint64_t obj = za.za_first_integer; 186f1745736SMatthew Ahrens if (obj == dmu_objset_pool(os)->dp_empty_bpobj) 187f1745736SMatthew Ahrens bpobj_decr_empty(os, tx); 188f1745736SMatthew Ahrens else 189f1745736SMatthew Ahrens bpobj_free(os, obj, tx); 190f1745736SMatthew Ahrens } 191cde58dbcSMatthew Ahrens zap_cursor_fini(&zc); 192b420f3adSRichard Lowe VERIFY3U(0, ==, dmu_object_free(os, dlobj, tx)); 193cde58dbcSMatthew Ahrens } 194cde58dbcSMatthew Ahrens 195f1745736SMatthew Ahrens static void 196f1745736SMatthew Ahrens dle_enqueue(dsl_deadlist_t *dl, dsl_deadlist_entry_t *dle, 197f1745736SMatthew Ahrens const blkptr_t *bp, dmu_tx_t *tx) 198f1745736SMatthew Ahrens { 199a3905a45SSerapheim Dimitropoulos ASSERT(MUTEX_HELD(&dl->dl_lock)); 200f1745736SMatthew Ahrens if (dle->dle_bpobj.bpo_object == 201f1745736SMatthew Ahrens dmu_objset_pool(dl->dl_os)->dp_empty_bpobj) { 202b5152584SMatthew Ahrens uint64_t obj = bpobj_alloc(dl->dl_os, SPA_OLD_MAXBLOCKSIZE, tx); 203f1745736SMatthew Ahrens bpobj_close(&dle->dle_bpobj); 204f1745736SMatthew Ahrens bpobj_decr_empty(dl->dl_os, tx); 205f1745736SMatthew Ahrens VERIFY3U(0, ==, bpobj_open(&dle->dle_bpobj, dl->dl_os, obj)); 206f1745736SMatthew Ahrens VERIFY3U(0, ==, zap_update_int_key(dl->dl_os, dl->dl_object, 207f1745736SMatthew Ahrens dle->dle_mintxg, obj, tx)); 208f1745736SMatthew Ahrens } 209f1745736SMatthew Ahrens bpobj_enqueue(&dle->dle_bpobj, bp, tx); 210f1745736SMatthew Ahrens } 211f1745736SMatthew Ahrens 212f1745736SMatthew Ahrens static void 213f1745736SMatthew Ahrens dle_enqueue_subobj(dsl_deadlist_t *dl, dsl_deadlist_entry_t *dle, 214f1745736SMatthew Ahrens uint64_t obj, dmu_tx_t *tx) 215f1745736SMatthew Ahrens { 216a3905a45SSerapheim Dimitropoulos ASSERT(MUTEX_HELD(&dl->dl_lock)); 217f1745736SMatthew Ahrens if (dle->dle_bpobj.bpo_object != 218f1745736SMatthew Ahrens dmu_objset_pool(dl->dl_os)->dp_empty_bpobj) { 219f1745736SMatthew Ahrens bpobj_enqueue_subobj(&dle->dle_bpobj, obj, tx); 220f1745736SMatthew Ahrens } else { 221f1745736SMatthew Ahrens bpobj_close(&dle->dle_bpobj); 222f1745736SMatthew Ahrens bpobj_decr_empty(dl->dl_os, tx); 223f1745736SMatthew Ahrens VERIFY3U(0, ==, bpobj_open(&dle->dle_bpobj, dl->dl_os, obj)); 224f1745736SMatthew Ahrens VERIFY3U(0, ==, zap_update_int_key(dl->dl_os, dl->dl_object, 225f1745736SMatthew Ahrens dle->dle_mintxg, obj, tx)); 226f1745736SMatthew Ahrens } 227f1745736SMatthew Ahrens } 228f1745736SMatthew Ahrens 229cde58dbcSMatthew Ahrens void 230cde58dbcSMatthew Ahrens dsl_deadlist_insert(dsl_deadlist_t *dl, const blkptr_t *bp, dmu_tx_t *tx) 231cde58dbcSMatthew Ahrens { 232cde58dbcSMatthew Ahrens dsl_deadlist_entry_t dle_tofind; 233cde58dbcSMatthew Ahrens dsl_deadlist_entry_t *dle; 234cde58dbcSMatthew Ahrens avl_index_t where; 235cde58dbcSMatthew Ahrens 236cde58dbcSMatthew Ahrens if (dl->dl_oldfmt) { 237cde58dbcSMatthew Ahrens bpobj_enqueue(&dl->dl_bpobj, bp, tx); 238cde58dbcSMatthew Ahrens return; 239cde58dbcSMatthew Ahrens } 240cde58dbcSMatthew Ahrens 241a3905a45SSerapheim Dimitropoulos mutex_enter(&dl->dl_lock); 242cde58dbcSMatthew Ahrens dsl_deadlist_load_tree(dl); 243cde58dbcSMatthew Ahrens 244cde58dbcSMatthew Ahrens dmu_buf_will_dirty(dl->dl_dbuf, tx); 245cde58dbcSMatthew Ahrens dl->dl_phys->dl_used += 246cde58dbcSMatthew Ahrens bp_get_dsize_sync(dmu_objset_spa(dl->dl_os), bp); 247cde58dbcSMatthew Ahrens dl->dl_phys->dl_comp += BP_GET_PSIZE(bp); 248cde58dbcSMatthew Ahrens dl->dl_phys->dl_uncomp += BP_GET_UCSIZE(bp); 249cde58dbcSMatthew Ahrens 250cde58dbcSMatthew Ahrens dle_tofind.dle_mintxg = bp->blk_birth; 251cde58dbcSMatthew Ahrens dle = avl_find(&dl->dl_tree, &dle_tofind, &where); 252cde58dbcSMatthew Ahrens if (dle == NULL) 253cde58dbcSMatthew Ahrens dle = avl_nearest(&dl->dl_tree, where, AVL_BEFORE); 254cde58dbcSMatthew Ahrens else 255cde58dbcSMatthew Ahrens dle = AVL_PREV(&dl->dl_tree, dle); 256f1745736SMatthew Ahrens dle_enqueue(dl, dle, bp, tx); 257a3905a45SSerapheim Dimitropoulos mutex_exit(&dl->dl_lock); 258cde58dbcSMatthew Ahrens } 259cde58dbcSMatthew Ahrens 260cde58dbcSMatthew Ahrens /* 261cde58dbcSMatthew Ahrens * Insert new key in deadlist, which must be > all current entries. 262cde58dbcSMatthew Ahrens * mintxg is not inclusive. 263cde58dbcSMatthew Ahrens */ 264cde58dbcSMatthew Ahrens void 265cde58dbcSMatthew Ahrens dsl_deadlist_add_key(dsl_deadlist_t *dl, uint64_t mintxg, dmu_tx_t *tx) 266cde58dbcSMatthew Ahrens { 267cde58dbcSMatthew Ahrens uint64_t obj; 268cde58dbcSMatthew Ahrens dsl_deadlist_entry_t *dle; 269cde58dbcSMatthew Ahrens 270cde58dbcSMatthew Ahrens if (dl->dl_oldfmt) 271cde58dbcSMatthew Ahrens return; 272cde58dbcSMatthew Ahrens 273cde58dbcSMatthew Ahrens dle = kmem_alloc(sizeof (*dle), KM_SLEEP); 274cde58dbcSMatthew Ahrens dle->dle_mintxg = mintxg; 275a3905a45SSerapheim Dimitropoulos 276a3905a45SSerapheim Dimitropoulos mutex_enter(&dl->dl_lock); 277a3905a45SSerapheim Dimitropoulos dsl_deadlist_load_tree(dl); 278a3905a45SSerapheim Dimitropoulos 279b5152584SMatthew Ahrens obj = bpobj_alloc_empty(dl->dl_os, SPA_OLD_MAXBLOCKSIZE, tx); 280b420f3adSRichard Lowe VERIFY3U(0, ==, bpobj_open(&dle->dle_bpobj, dl->dl_os, obj)); 281cde58dbcSMatthew Ahrens avl_add(&dl->dl_tree, dle); 282cde58dbcSMatthew Ahrens 283b420f3adSRichard Lowe VERIFY3U(0, ==, zap_add_int_key(dl->dl_os, dl->dl_object, 284cde58dbcSMatthew Ahrens mintxg, obj, tx)); 285a3905a45SSerapheim Dimitropoulos mutex_exit(&dl->dl_lock); 286cde58dbcSMatthew Ahrens } 287cde58dbcSMatthew Ahrens 288cde58dbcSMatthew Ahrens /* 289cde58dbcSMatthew Ahrens * Remove this key, merging its entries into the previous key. 290cde58dbcSMatthew Ahrens */ 291cde58dbcSMatthew Ahrens void 292cde58dbcSMatthew Ahrens dsl_deadlist_remove_key(dsl_deadlist_t *dl, uint64_t mintxg, dmu_tx_t *tx) 293cde58dbcSMatthew Ahrens { 294cde58dbcSMatthew Ahrens dsl_deadlist_entry_t dle_tofind; 295cde58dbcSMatthew Ahrens dsl_deadlist_entry_t *dle, *dle_prev; 296cde58dbcSMatthew Ahrens 297cde58dbcSMatthew Ahrens if (dl->dl_oldfmt) 298cde58dbcSMatthew Ahrens return; 299cde58dbcSMatthew Ahrens 300a3905a45SSerapheim Dimitropoulos mutex_enter(&dl->dl_lock); 301cde58dbcSMatthew Ahrens dsl_deadlist_load_tree(dl); 302cde58dbcSMatthew Ahrens 303cde58dbcSMatthew Ahrens dle_tofind.dle_mintxg = mintxg; 304cde58dbcSMatthew Ahrens dle = avl_find(&dl->dl_tree, &dle_tofind, NULL); 305cde58dbcSMatthew Ahrens dle_prev = AVL_PREV(&dl->dl_tree, dle); 306cde58dbcSMatthew Ahrens 307f1745736SMatthew Ahrens dle_enqueue_subobj(dl, dle_prev, dle->dle_bpobj.bpo_object, tx); 308cde58dbcSMatthew Ahrens 309cde58dbcSMatthew Ahrens avl_remove(&dl->dl_tree, dle); 310cde58dbcSMatthew Ahrens bpobj_close(&dle->dle_bpobj); 311cde58dbcSMatthew Ahrens kmem_free(dle, sizeof (*dle)); 312cde58dbcSMatthew Ahrens 313b420f3adSRichard Lowe VERIFY3U(0, ==, zap_remove_int(dl->dl_os, dl->dl_object, mintxg, tx)); 314a3905a45SSerapheim Dimitropoulos mutex_exit(&dl->dl_lock); 315cde58dbcSMatthew Ahrens } 316cde58dbcSMatthew Ahrens 317cde58dbcSMatthew Ahrens /* 318cde58dbcSMatthew Ahrens * Walk ds's snapshots to regenerate generate ZAP & AVL. 319cde58dbcSMatthew Ahrens */ 320cde58dbcSMatthew Ahrens static void 321cde58dbcSMatthew Ahrens dsl_deadlist_regenerate(objset_t *os, uint64_t dlobj, 322cde58dbcSMatthew Ahrens uint64_t mrs_obj, dmu_tx_t *tx) 323cde58dbcSMatthew Ahrens { 324*5cabbc6bSPrashanth Sreenivasa dsl_deadlist_t dl = { 0 }; 325cde58dbcSMatthew Ahrens dsl_pool_t *dp = dmu_objset_pool(os); 326cde58dbcSMatthew Ahrens 327cde58dbcSMatthew Ahrens dsl_deadlist_open(&dl, os, dlobj); 328cde58dbcSMatthew Ahrens if (dl.dl_oldfmt) { 329cde58dbcSMatthew Ahrens dsl_deadlist_close(&dl); 330cde58dbcSMatthew Ahrens return; 331cde58dbcSMatthew Ahrens } 332cde58dbcSMatthew Ahrens 333cde58dbcSMatthew Ahrens while (mrs_obj != 0) { 334cde58dbcSMatthew Ahrens dsl_dataset_t *ds; 335b420f3adSRichard Lowe VERIFY3U(0, ==, dsl_dataset_hold_obj(dp, mrs_obj, FTAG, &ds)); 336c1379625SJustin T. Gibbs dsl_deadlist_add_key(&dl, 337c1379625SJustin T. Gibbs dsl_dataset_phys(ds)->ds_prev_snap_txg, tx); 338c1379625SJustin T. Gibbs mrs_obj = dsl_dataset_phys(ds)->ds_prev_snap_obj; 339cde58dbcSMatthew Ahrens dsl_dataset_rele(ds, FTAG); 340cde58dbcSMatthew Ahrens } 341cde58dbcSMatthew Ahrens dsl_deadlist_close(&dl); 342cde58dbcSMatthew Ahrens } 343cde58dbcSMatthew Ahrens 344cde58dbcSMatthew Ahrens uint64_t 345cde58dbcSMatthew Ahrens dsl_deadlist_clone(dsl_deadlist_t *dl, uint64_t maxtxg, 346cde58dbcSMatthew Ahrens uint64_t mrs_obj, dmu_tx_t *tx) 347cde58dbcSMatthew Ahrens { 348cde58dbcSMatthew Ahrens dsl_deadlist_entry_t *dle; 349cde58dbcSMatthew Ahrens uint64_t newobj; 350cde58dbcSMatthew Ahrens 351cde58dbcSMatthew Ahrens newobj = dsl_deadlist_alloc(dl->dl_os, tx); 352cde58dbcSMatthew Ahrens 353cde58dbcSMatthew Ahrens if (dl->dl_oldfmt) { 354cde58dbcSMatthew Ahrens dsl_deadlist_regenerate(dl->dl_os, newobj, mrs_obj, tx); 355cde58dbcSMatthew Ahrens return (newobj); 356cde58dbcSMatthew Ahrens } 357cde58dbcSMatthew Ahrens 358a3905a45SSerapheim Dimitropoulos mutex_enter(&dl->dl_lock); 359cde58dbcSMatthew Ahrens dsl_deadlist_load_tree(dl); 360cde58dbcSMatthew Ahrens 361cde58dbcSMatthew Ahrens for (dle = avl_first(&dl->dl_tree); dle; 362cde58dbcSMatthew Ahrens dle = AVL_NEXT(&dl->dl_tree, dle)) { 363cde58dbcSMatthew Ahrens uint64_t obj; 364cde58dbcSMatthew Ahrens 365cde58dbcSMatthew Ahrens if (dle->dle_mintxg >= maxtxg) 366cde58dbcSMatthew Ahrens break; 367cde58dbcSMatthew Ahrens 368b5152584SMatthew Ahrens obj = bpobj_alloc_empty(dl->dl_os, SPA_OLD_MAXBLOCKSIZE, tx); 369b420f3adSRichard Lowe VERIFY3U(0, ==, zap_add_int_key(dl->dl_os, newobj, 370cde58dbcSMatthew Ahrens dle->dle_mintxg, obj, tx)); 371cde58dbcSMatthew Ahrens } 372a3905a45SSerapheim Dimitropoulos mutex_exit(&dl->dl_lock); 373cde58dbcSMatthew Ahrens return (newobj); 374cde58dbcSMatthew Ahrens } 375cde58dbcSMatthew Ahrens 376cde58dbcSMatthew Ahrens void 377cde58dbcSMatthew Ahrens dsl_deadlist_space(dsl_deadlist_t *dl, 378cde58dbcSMatthew Ahrens uint64_t *usedp, uint64_t *compp, uint64_t *uncompp) 379cde58dbcSMatthew Ahrens { 380*5cabbc6bSPrashanth Sreenivasa ASSERT(dsl_deadlist_is_open(dl)); 381cde58dbcSMatthew Ahrens if (dl->dl_oldfmt) { 382b420f3adSRichard Lowe VERIFY3U(0, ==, bpobj_space(&dl->dl_bpobj, 383cde58dbcSMatthew Ahrens usedp, compp, uncompp)); 384cde58dbcSMatthew Ahrens return; 385cde58dbcSMatthew Ahrens } 386cde58dbcSMatthew Ahrens 387cde58dbcSMatthew Ahrens mutex_enter(&dl->dl_lock); 388cde58dbcSMatthew Ahrens *usedp = dl->dl_phys->dl_used; 389cde58dbcSMatthew Ahrens *compp = dl->dl_phys->dl_comp; 390cde58dbcSMatthew Ahrens *uncompp = dl->dl_phys->dl_uncomp; 391cde58dbcSMatthew Ahrens mutex_exit(&dl->dl_lock); 392cde58dbcSMatthew Ahrens } 393cde58dbcSMatthew Ahrens 394cde58dbcSMatthew Ahrens /* 395cde58dbcSMatthew Ahrens * return space used in the range (mintxg, maxtxg]. 396cde58dbcSMatthew Ahrens * Includes maxtxg, does not include mintxg. 397cde58dbcSMatthew Ahrens * mintxg and maxtxg must both be keys in the deadlist (unless maxtxg is 39819b94df9SMatthew Ahrens * larger than any bp in the deadlist (eg. UINT64_MAX)). 399cde58dbcSMatthew Ahrens */ 400cde58dbcSMatthew Ahrens void 401cde58dbcSMatthew Ahrens dsl_deadlist_space_range(dsl_deadlist_t *dl, uint64_t mintxg, uint64_t maxtxg, 402cde58dbcSMatthew Ahrens uint64_t *usedp, uint64_t *compp, uint64_t *uncompp) 403cde58dbcSMatthew Ahrens { 4048ac09fceSRichard Lowe dsl_deadlist_entry_t *dle; 40519b94df9SMatthew Ahrens dsl_deadlist_entry_t dle_tofind; 406cde58dbcSMatthew Ahrens avl_index_t where; 407cde58dbcSMatthew Ahrens 408cde58dbcSMatthew Ahrens if (dl->dl_oldfmt) { 409b420f3adSRichard Lowe VERIFY3U(0, ==, bpobj_space_range(&dl->dl_bpobj, 410cde58dbcSMatthew Ahrens mintxg, maxtxg, usedp, compp, uncompp)); 411cde58dbcSMatthew Ahrens return; 412cde58dbcSMatthew Ahrens } 413cde58dbcSMatthew Ahrens 414cde58dbcSMatthew Ahrens *usedp = *compp = *uncompp = 0; 415cde58dbcSMatthew Ahrens 41619b94df9SMatthew Ahrens mutex_enter(&dl->dl_lock); 41719b94df9SMatthew Ahrens dsl_deadlist_load_tree(dl); 418cde58dbcSMatthew Ahrens dle_tofind.dle_mintxg = mintxg; 419cde58dbcSMatthew Ahrens dle = avl_find(&dl->dl_tree, &dle_tofind, &where); 420cde58dbcSMatthew Ahrens /* 421cde58dbcSMatthew Ahrens * If we don't find this mintxg, there shouldn't be anything 422cde58dbcSMatthew Ahrens * after it either. 423cde58dbcSMatthew Ahrens */ 424cde58dbcSMatthew Ahrens ASSERT(dle != NULL || 425cde58dbcSMatthew Ahrens avl_nearest(&dl->dl_tree, where, AVL_AFTER) == NULL); 42619b94df9SMatthew Ahrens 427cde58dbcSMatthew Ahrens for (; dle && dle->dle_mintxg < maxtxg; 428cde58dbcSMatthew Ahrens dle = AVL_NEXT(&dl->dl_tree, dle)) { 429cde58dbcSMatthew Ahrens uint64_t used, comp, uncomp; 430cde58dbcSMatthew Ahrens 431b420f3adSRichard Lowe VERIFY3U(0, ==, bpobj_space(&dle->dle_bpobj, 432cde58dbcSMatthew Ahrens &used, &comp, &uncomp)); 433cde58dbcSMatthew Ahrens 434cde58dbcSMatthew Ahrens *usedp += used; 435cde58dbcSMatthew Ahrens *compp += comp; 436cde58dbcSMatthew Ahrens *uncompp += uncomp; 437cde58dbcSMatthew Ahrens } 43819b94df9SMatthew Ahrens mutex_exit(&dl->dl_lock); 439cde58dbcSMatthew Ahrens } 440cde58dbcSMatthew Ahrens 441cde58dbcSMatthew Ahrens static void 442cde58dbcSMatthew Ahrens dsl_deadlist_insert_bpobj(dsl_deadlist_t *dl, uint64_t obj, uint64_t birth, 443cde58dbcSMatthew Ahrens dmu_tx_t *tx) 444cde58dbcSMatthew Ahrens { 445cde58dbcSMatthew Ahrens dsl_deadlist_entry_t dle_tofind; 446cde58dbcSMatthew Ahrens dsl_deadlist_entry_t *dle; 447cde58dbcSMatthew Ahrens avl_index_t where; 448cde58dbcSMatthew Ahrens uint64_t used, comp, uncomp; 449cde58dbcSMatthew Ahrens bpobj_t bpo; 450cde58dbcSMatthew Ahrens 451a3905a45SSerapheim Dimitropoulos ASSERT(MUTEX_HELD(&dl->dl_lock)); 452a3905a45SSerapheim Dimitropoulos 453b420f3adSRichard Lowe VERIFY3U(0, ==, bpobj_open(&bpo, dl->dl_os, obj)); 454b420f3adSRichard Lowe VERIFY3U(0, ==, bpobj_space(&bpo, &used, &comp, &uncomp)); 455cde58dbcSMatthew Ahrens bpobj_close(&bpo); 456cde58dbcSMatthew Ahrens 457cde58dbcSMatthew Ahrens dsl_deadlist_load_tree(dl); 458cde58dbcSMatthew Ahrens 459cde58dbcSMatthew Ahrens dmu_buf_will_dirty(dl->dl_dbuf, tx); 460cde58dbcSMatthew Ahrens dl->dl_phys->dl_used += used; 461cde58dbcSMatthew Ahrens dl->dl_phys->dl_comp += comp; 462cde58dbcSMatthew Ahrens dl->dl_phys->dl_uncomp += uncomp; 463cde58dbcSMatthew Ahrens 464cde58dbcSMatthew Ahrens dle_tofind.dle_mintxg = birth; 465cde58dbcSMatthew Ahrens dle = avl_find(&dl->dl_tree, &dle_tofind, &where); 466cde58dbcSMatthew Ahrens if (dle == NULL) 467cde58dbcSMatthew Ahrens dle = avl_nearest(&dl->dl_tree, where, AVL_BEFORE); 468f1745736SMatthew Ahrens dle_enqueue_subobj(dl, dle, obj, tx); 469cde58dbcSMatthew Ahrens } 470cde58dbcSMatthew Ahrens 471cde58dbcSMatthew Ahrens static int 472cde58dbcSMatthew Ahrens dsl_deadlist_insert_cb(void *arg, const blkptr_t *bp, dmu_tx_t *tx) 473cde58dbcSMatthew Ahrens { 474cde58dbcSMatthew Ahrens dsl_deadlist_t *dl = arg; 475cde58dbcSMatthew Ahrens dsl_deadlist_insert(dl, bp, tx); 476cde58dbcSMatthew Ahrens return (0); 477cde58dbcSMatthew Ahrens } 478cde58dbcSMatthew Ahrens 479cde58dbcSMatthew Ahrens /* 480cde58dbcSMatthew Ahrens * Merge the deadlist pointed to by 'obj' into dl. obj will be left as 481cde58dbcSMatthew Ahrens * an empty deadlist. 482cde58dbcSMatthew Ahrens */ 483cde58dbcSMatthew Ahrens void 484cde58dbcSMatthew Ahrens dsl_deadlist_merge(dsl_deadlist_t *dl, uint64_t obj, dmu_tx_t *tx) 485cde58dbcSMatthew Ahrens { 486cde58dbcSMatthew Ahrens zap_cursor_t zc; 487cde58dbcSMatthew Ahrens zap_attribute_t za; 488cde58dbcSMatthew Ahrens dmu_buf_t *bonus; 489cde58dbcSMatthew Ahrens dsl_deadlist_phys_t *dlp; 490cde58dbcSMatthew Ahrens dmu_object_info_t doi; 491cde58dbcSMatthew Ahrens 492b420f3adSRichard Lowe VERIFY3U(0, ==, dmu_object_info(dl->dl_os, obj, &doi)); 493cde58dbcSMatthew Ahrens if (doi.doi_type == DMU_OT_BPOBJ) { 494cde58dbcSMatthew Ahrens bpobj_t bpo; 495b420f3adSRichard Lowe VERIFY3U(0, ==, bpobj_open(&bpo, dl->dl_os, obj)); 496b420f3adSRichard Lowe VERIFY3U(0, ==, bpobj_iterate(&bpo, 497cde58dbcSMatthew Ahrens dsl_deadlist_insert_cb, dl, tx)); 498cde58dbcSMatthew Ahrens bpobj_close(&bpo); 499cde58dbcSMatthew Ahrens return; 500cde58dbcSMatthew Ahrens } 501cde58dbcSMatthew Ahrens 502a3905a45SSerapheim Dimitropoulos mutex_enter(&dl->dl_lock); 503cde58dbcSMatthew Ahrens for (zap_cursor_init(&zc, dl->dl_os, obj); 504cde58dbcSMatthew Ahrens zap_cursor_retrieve(&zc, &za) == 0; 505cde58dbcSMatthew Ahrens zap_cursor_advance(&zc)) { 5064585130bSYuri Pankov uint64_t mintxg = zfs_strtonum(za.za_name, NULL); 507cde58dbcSMatthew Ahrens dsl_deadlist_insert_bpobj(dl, za.za_first_integer, mintxg, tx); 508b420f3adSRichard Lowe VERIFY3U(0, ==, zap_remove_int(dl->dl_os, obj, mintxg, tx)); 509cde58dbcSMatthew Ahrens } 510cde58dbcSMatthew Ahrens zap_cursor_fini(&zc); 511cde58dbcSMatthew Ahrens 512b420f3adSRichard Lowe VERIFY3U(0, ==, dmu_bonus_hold(dl->dl_os, obj, FTAG, &bonus)); 513cde58dbcSMatthew Ahrens dlp = bonus->db_data; 514cde58dbcSMatthew Ahrens dmu_buf_will_dirty(bonus, tx); 515cde58dbcSMatthew Ahrens bzero(dlp, sizeof (*dlp)); 516cde58dbcSMatthew Ahrens dmu_buf_rele(bonus, FTAG); 517a3905a45SSerapheim Dimitropoulos mutex_exit(&dl->dl_lock); 518cde58dbcSMatthew Ahrens } 519cde58dbcSMatthew Ahrens 520cde58dbcSMatthew Ahrens /* 521cde58dbcSMatthew Ahrens * Remove entries on dl that are >= mintxg, and put them on the bpobj. 522cde58dbcSMatthew Ahrens */ 523cde58dbcSMatthew Ahrens void 524cde58dbcSMatthew Ahrens dsl_deadlist_move_bpobj(dsl_deadlist_t *dl, bpobj_t *bpo, uint64_t mintxg, 525cde58dbcSMatthew Ahrens dmu_tx_t *tx) 526cde58dbcSMatthew Ahrens { 527cde58dbcSMatthew Ahrens dsl_deadlist_entry_t dle_tofind; 528cde58dbcSMatthew Ahrens dsl_deadlist_entry_t *dle; 529cde58dbcSMatthew Ahrens avl_index_t where; 530cde58dbcSMatthew Ahrens 531cde58dbcSMatthew Ahrens ASSERT(!dl->dl_oldfmt); 532a3905a45SSerapheim Dimitropoulos 533a3905a45SSerapheim Dimitropoulos mutex_enter(&dl->dl_lock); 534cde58dbcSMatthew Ahrens dmu_buf_will_dirty(dl->dl_dbuf, tx); 535cde58dbcSMatthew Ahrens dsl_deadlist_load_tree(dl); 536cde58dbcSMatthew Ahrens 537cde58dbcSMatthew Ahrens dle_tofind.dle_mintxg = mintxg; 538cde58dbcSMatthew Ahrens dle = avl_find(&dl->dl_tree, &dle_tofind, &where); 539cde58dbcSMatthew Ahrens if (dle == NULL) 540cde58dbcSMatthew Ahrens dle = avl_nearest(&dl->dl_tree, where, AVL_AFTER); 541cde58dbcSMatthew Ahrens while (dle) { 542cde58dbcSMatthew Ahrens uint64_t used, comp, uncomp; 543cde58dbcSMatthew Ahrens dsl_deadlist_entry_t *dle_next; 544cde58dbcSMatthew Ahrens 545cde58dbcSMatthew Ahrens bpobj_enqueue_subobj(bpo, dle->dle_bpobj.bpo_object, tx); 546cde58dbcSMatthew Ahrens 547b420f3adSRichard Lowe VERIFY3U(0, ==, bpobj_space(&dle->dle_bpobj, 548cde58dbcSMatthew Ahrens &used, &comp, &uncomp)); 549cde58dbcSMatthew Ahrens ASSERT3U(dl->dl_phys->dl_used, >=, used); 550cde58dbcSMatthew Ahrens ASSERT3U(dl->dl_phys->dl_comp, >=, comp); 551cde58dbcSMatthew Ahrens ASSERT3U(dl->dl_phys->dl_uncomp, >=, uncomp); 552cde58dbcSMatthew Ahrens dl->dl_phys->dl_used -= used; 553cde58dbcSMatthew Ahrens dl->dl_phys->dl_comp -= comp; 554cde58dbcSMatthew Ahrens dl->dl_phys->dl_uncomp -= uncomp; 555cde58dbcSMatthew Ahrens 556b420f3adSRichard Lowe VERIFY3U(0, ==, zap_remove_int(dl->dl_os, dl->dl_object, 557cde58dbcSMatthew Ahrens dle->dle_mintxg, tx)); 558cde58dbcSMatthew Ahrens 559cde58dbcSMatthew Ahrens dle_next = AVL_NEXT(&dl->dl_tree, dle); 560cde58dbcSMatthew Ahrens avl_remove(&dl->dl_tree, dle); 561cde58dbcSMatthew Ahrens bpobj_close(&dle->dle_bpobj); 562cde58dbcSMatthew Ahrens kmem_free(dle, sizeof (*dle)); 563cde58dbcSMatthew Ahrens dle = dle_next; 564cde58dbcSMatthew Ahrens } 565a3905a45SSerapheim Dimitropoulos mutex_exit(&dl->dl_lock); 566cde58dbcSMatthew Ahrens } 567