1fa9e4066Sahrens /* 2fa9e4066Sahrens * CDDL HEADER START 3fa9e4066Sahrens * 4fa9e4066Sahrens * The contents of this file are subject to the terms of the 5ea8dc4b6Seschrock * Common Development and Distribution License (the "License"). 6ea8dc4b6Seschrock * You may not use this file except in compliance with the License. 7fa9e4066Sahrens * 8fa9e4066Sahrens * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE 9fa9e4066Sahrens * or http://www.opensolaris.org/os/licensing. 10fa9e4066Sahrens * See the License for the specific language governing permissions 11fa9e4066Sahrens * and limitations under the License. 12fa9e4066Sahrens * 13fa9e4066Sahrens * When distributing Covered Code, include this CDDL HEADER in each 14fa9e4066Sahrens * file and include the License file at usr/src/OPENSOLARIS.LICENSE. 15fa9e4066Sahrens * If applicable, add the following below this CDDL HEADER, with the 16fa9e4066Sahrens * fields enclosed by brackets "[]" replaced with your own identifying 17fa9e4066Sahrens * information: Portions Copyright [yyyy] [name of copyright owner] 18fa9e4066Sahrens * 19fa9e4066Sahrens * CDDL HEADER END 20fa9e4066Sahrens */ 21fa9e4066Sahrens /* 2255434c77Sek * Copyright 2007 Sun Microsystems, Inc. All rights reserved. 23fa9e4066Sahrens * Use is subject to license terms. 24fa9e4066Sahrens */ 25fa9e4066Sahrens 26fa9e4066Sahrens #pragma ident "%Z%%M% %I% %E% SMI" 27fa9e4066Sahrens 28fa9e4066Sahrens #include <sys/dmu_objset.h> 29fa9e4066Sahrens #include <sys/dsl_dataset.h> 30fa9e4066Sahrens #include <sys/dsl_dir.h> 3199653d4eSeschrock #include <sys/dsl_prop.h> 321d452cf5Sahrens #include <sys/dsl_synctask.h> 33fa9e4066Sahrens #include <sys/dmu_traverse.h> 34fa9e4066Sahrens #include <sys/dmu_tx.h> 35fa9e4066Sahrens #include <sys/arc.h> 36fa9e4066Sahrens #include <sys/zio.h> 37fa9e4066Sahrens #include <sys/zap.h> 38fa9e4066Sahrens #include <sys/unique.h> 39fa9e4066Sahrens #include <sys/zfs_context.h> 40cdf5b4caSmmusante #include <sys/zfs_ioctl.h> 41*ecd6cf80Smarks #include <sys/spa.h> 42*ecd6cf80Smarks #include <sys/sunddi.h> 43fa9e4066Sahrens 441d452cf5Sahrens static dsl_checkfunc_t dsl_dataset_destroy_begin_check; 451d452cf5Sahrens static dsl_syncfunc_t dsl_dataset_destroy_begin_sync; 461d452cf5Sahrens static dsl_checkfunc_t dsl_dataset_rollback_check; 471d452cf5Sahrens static dsl_syncfunc_t dsl_dataset_rollback_sync; 481d452cf5Sahrens static dsl_checkfunc_t dsl_dataset_destroy_check; 491d452cf5Sahrens static dsl_syncfunc_t dsl_dataset_destroy_sync; 50e1930233Sbonwick 5155434c77Sek #define DS_REF_MAX (1ULL << 62) 52fa9e4066Sahrens 53fa9e4066Sahrens #define DSL_DEADLIST_BLOCKSIZE SPA_MAXBLOCKSIZE 54fa9e4066Sahrens 55fa9e4066Sahrens /* 56fa9e4066Sahrens * We use weighted reference counts to express the various forms of exclusion 57fa9e4066Sahrens * between different open modes. A STANDARD open is 1 point, an EXCLUSIVE open 5855434c77Sek * is DS_REF_MAX, and a PRIMARY open is little more than half of an EXCLUSIVE. 59fa9e4066Sahrens * This makes the exclusion logic simple: the total refcnt for all opens cannot 6055434c77Sek * exceed DS_REF_MAX. For example, EXCLUSIVE opens are exclusive because their 6155434c77Sek * weight (DS_REF_MAX) consumes the entire refcnt space. PRIMARY opens consume 62fa9e4066Sahrens * just over half of the refcnt space, so there can't be more than one, but it 63fa9e4066Sahrens * can peacefully coexist with any number of STANDARD opens. 64fa9e4066Sahrens */ 65fa9e4066Sahrens static uint64_t ds_refcnt_weight[DS_MODE_LEVELS] = { 6655434c77Sek 0, /* DS_MODE_NONE - invalid */ 6755434c77Sek 1, /* DS_MODE_STANDARD - unlimited number */ 6855434c77Sek (DS_REF_MAX >> 1) + 1, /* DS_MODE_PRIMARY - only one of these */ 6955434c77Sek DS_REF_MAX /* DS_MODE_EXCLUSIVE - no other opens */ 70fa9e4066Sahrens }; 71fa9e4066Sahrens 72fa9e4066Sahrens 73fa9e4066Sahrens void 74fa9e4066Sahrens dsl_dataset_block_born(dsl_dataset_t *ds, blkptr_t *bp, dmu_tx_t *tx) 75fa9e4066Sahrens { 7699653d4eSeschrock int used = bp_get_dasize(tx->tx_pool->dp_spa, bp); 77fa9e4066Sahrens int compressed = BP_GET_PSIZE(bp); 78fa9e4066Sahrens int uncompressed = BP_GET_UCSIZE(bp); 79fa9e4066Sahrens 80fa9e4066Sahrens dprintf_bp(bp, "born, ds=%p\n", ds); 81fa9e4066Sahrens 82fa9e4066Sahrens ASSERT(dmu_tx_is_syncing(tx)); 83fa9e4066Sahrens /* It could have been compressed away to nothing */ 84fa9e4066Sahrens if (BP_IS_HOLE(bp)) 85fa9e4066Sahrens return; 86fa9e4066Sahrens ASSERT(BP_GET_TYPE(bp) != DMU_OT_NONE); 87fa9e4066Sahrens ASSERT3U(BP_GET_TYPE(bp), <, DMU_OT_NUMTYPES); 88fa9e4066Sahrens if (ds == NULL) { 89fa9e4066Sahrens /* 90fa9e4066Sahrens * Account for the meta-objset space in its placeholder 91fa9e4066Sahrens * dsl_dir. 92fa9e4066Sahrens */ 93fa9e4066Sahrens ASSERT3U(compressed, ==, uncompressed); /* it's all metadata */ 94fa9e4066Sahrens dsl_dir_diduse_space(tx->tx_pool->dp_mos_dir, 95fa9e4066Sahrens used, compressed, uncompressed, tx); 96fa9e4066Sahrens dsl_dir_dirty(tx->tx_pool->dp_mos_dir, tx); 97fa9e4066Sahrens return; 98fa9e4066Sahrens } 99fa9e4066Sahrens dmu_buf_will_dirty(ds->ds_dbuf, tx); 100fa9e4066Sahrens mutex_enter(&ds->ds_lock); 101fa9e4066Sahrens ds->ds_phys->ds_used_bytes += used; 102fa9e4066Sahrens ds->ds_phys->ds_compressed_bytes += compressed; 103fa9e4066Sahrens ds->ds_phys->ds_uncompressed_bytes += uncompressed; 104fa9e4066Sahrens ds->ds_phys->ds_unique_bytes += used; 105fa9e4066Sahrens mutex_exit(&ds->ds_lock); 106fa9e4066Sahrens dsl_dir_diduse_space(ds->ds_dir, 107fa9e4066Sahrens used, compressed, uncompressed, tx); 108fa9e4066Sahrens } 109fa9e4066Sahrens 110fa9e4066Sahrens void 111c717a561Smaybee dsl_dataset_block_kill(dsl_dataset_t *ds, blkptr_t *bp, zio_t *pio, 112c717a561Smaybee dmu_tx_t *tx) 113fa9e4066Sahrens { 11499653d4eSeschrock int used = bp_get_dasize(tx->tx_pool->dp_spa, bp); 115fa9e4066Sahrens int compressed = BP_GET_PSIZE(bp); 116fa9e4066Sahrens int uncompressed = BP_GET_UCSIZE(bp); 117fa9e4066Sahrens 118fa9e4066Sahrens ASSERT(dmu_tx_is_syncing(tx)); 119c717a561Smaybee /* No block pointer => nothing to free */ 120fa9e4066Sahrens if (BP_IS_HOLE(bp)) 121fa9e4066Sahrens return; 122fa9e4066Sahrens 123fa9e4066Sahrens ASSERT(used > 0); 124fa9e4066Sahrens if (ds == NULL) { 125c717a561Smaybee int err; 126fa9e4066Sahrens /* 127fa9e4066Sahrens * Account for the meta-objset space in its placeholder 128fa9e4066Sahrens * dataset. 129fa9e4066Sahrens */ 130c717a561Smaybee err = arc_free(pio, tx->tx_pool->dp_spa, 131c717a561Smaybee tx->tx_txg, bp, NULL, NULL, pio ? ARC_NOWAIT: ARC_WAIT); 132c717a561Smaybee ASSERT(err == 0); 133fa9e4066Sahrens 134fa9e4066Sahrens dsl_dir_diduse_space(tx->tx_pool->dp_mos_dir, 135fa9e4066Sahrens -used, -compressed, -uncompressed, tx); 136fa9e4066Sahrens dsl_dir_dirty(tx->tx_pool->dp_mos_dir, tx); 137fa9e4066Sahrens return; 138fa9e4066Sahrens } 139fa9e4066Sahrens ASSERT3P(tx->tx_pool, ==, ds->ds_dir->dd_pool); 140fa9e4066Sahrens 141fa9e4066Sahrens dmu_buf_will_dirty(ds->ds_dbuf, tx); 142fa9e4066Sahrens 143fa9e4066Sahrens if (bp->blk_birth > ds->ds_phys->ds_prev_snap_txg) { 144c717a561Smaybee int err; 145c717a561Smaybee 146fa9e4066Sahrens dprintf_bp(bp, "freeing: %s", ""); 147c717a561Smaybee err = arc_free(pio, tx->tx_pool->dp_spa, 148c717a561Smaybee tx->tx_txg, bp, NULL, NULL, pio ? ARC_NOWAIT: ARC_WAIT); 149c717a561Smaybee ASSERT(err == 0); 150fa9e4066Sahrens 151fa9e4066Sahrens mutex_enter(&ds->ds_lock); 152fa9e4066Sahrens /* XXX unique_bytes is not accurate for head datasets */ 153fa9e4066Sahrens /* ASSERT3U(ds->ds_phys->ds_unique_bytes, >=, used); */ 154fa9e4066Sahrens ds->ds_phys->ds_unique_bytes -= used; 155fa9e4066Sahrens mutex_exit(&ds->ds_lock); 156fa9e4066Sahrens dsl_dir_diduse_space(ds->ds_dir, 157fa9e4066Sahrens -used, -compressed, -uncompressed, tx); 158fa9e4066Sahrens } else { 159fa9e4066Sahrens dprintf_bp(bp, "putting on dead list: %s", ""); 160ea8dc4b6Seschrock VERIFY(0 == bplist_enqueue(&ds->ds_deadlist, bp, tx)); 161fa9e4066Sahrens /* if (bp->blk_birth > prev prev snap txg) prev unique += bs */ 162fa9e4066Sahrens if (ds->ds_phys->ds_prev_snap_obj != 0) { 163fa9e4066Sahrens ASSERT3U(ds->ds_prev->ds_object, ==, 164fa9e4066Sahrens ds->ds_phys->ds_prev_snap_obj); 165fa9e4066Sahrens ASSERT(ds->ds_prev->ds_phys->ds_num_children > 0); 166fa9e4066Sahrens if (ds->ds_prev->ds_phys->ds_next_snap_obj == 16799653d4eSeschrock ds->ds_object && bp->blk_birth > 168fa9e4066Sahrens ds->ds_prev->ds_phys->ds_prev_snap_txg) { 169fa9e4066Sahrens dmu_buf_will_dirty(ds->ds_prev->ds_dbuf, tx); 170fa9e4066Sahrens mutex_enter(&ds->ds_prev->ds_lock); 171fa9e4066Sahrens ds->ds_prev->ds_phys->ds_unique_bytes += 172fa9e4066Sahrens used; 173fa9e4066Sahrens mutex_exit(&ds->ds_prev->ds_lock); 174fa9e4066Sahrens } 175fa9e4066Sahrens } 176fa9e4066Sahrens } 177fa9e4066Sahrens mutex_enter(&ds->ds_lock); 178fa9e4066Sahrens ASSERT3U(ds->ds_phys->ds_used_bytes, >=, used); 179fa9e4066Sahrens ds->ds_phys->ds_used_bytes -= used; 180fa9e4066Sahrens ASSERT3U(ds->ds_phys->ds_compressed_bytes, >=, compressed); 181fa9e4066Sahrens ds->ds_phys->ds_compressed_bytes -= compressed; 182fa9e4066Sahrens ASSERT3U(ds->ds_phys->ds_uncompressed_bytes, >=, uncompressed); 183fa9e4066Sahrens ds->ds_phys->ds_uncompressed_bytes -= uncompressed; 184fa9e4066Sahrens mutex_exit(&ds->ds_lock); 185fa9e4066Sahrens } 186fa9e4066Sahrens 187ea8dc4b6Seschrock uint64_t 188ea8dc4b6Seschrock dsl_dataset_prev_snap_txg(dsl_dataset_t *ds) 189fa9e4066Sahrens { 190a2eea2e1Sahrens uint64_t trysnap = 0; 191a2eea2e1Sahrens 192fa9e4066Sahrens if (ds == NULL) 193ea8dc4b6Seschrock return (0); 194fa9e4066Sahrens /* 195fa9e4066Sahrens * The snapshot creation could fail, but that would cause an 196fa9e4066Sahrens * incorrect FALSE return, which would only result in an 197fa9e4066Sahrens * overestimation of the amount of space that an operation would 198fa9e4066Sahrens * consume, which is OK. 199fa9e4066Sahrens * 200fa9e4066Sahrens * There's also a small window where we could miss a pending 201fa9e4066Sahrens * snapshot, because we could set the sync task in the quiescing 202fa9e4066Sahrens * phase. So this should only be used as a guess. 203fa9e4066Sahrens */ 204a2eea2e1Sahrens if (ds->ds_trysnap_txg > 205a2eea2e1Sahrens spa_last_synced_txg(ds->ds_dir->dd_pool->dp_spa)) 206a2eea2e1Sahrens trysnap = ds->ds_trysnap_txg; 207a2eea2e1Sahrens return (MAX(ds->ds_phys->ds_prev_snap_txg, trysnap)); 208ea8dc4b6Seschrock } 209ea8dc4b6Seschrock 210ea8dc4b6Seschrock int 211ea8dc4b6Seschrock dsl_dataset_block_freeable(dsl_dataset_t *ds, uint64_t blk_birth) 212ea8dc4b6Seschrock { 213ea8dc4b6Seschrock return (blk_birth > dsl_dataset_prev_snap_txg(ds)); 214fa9e4066Sahrens } 215fa9e4066Sahrens 216fa9e4066Sahrens /* ARGSUSED */ 217fa9e4066Sahrens static void 218fa9e4066Sahrens dsl_dataset_evict(dmu_buf_t *db, void *dsv) 219fa9e4066Sahrens { 220fa9e4066Sahrens dsl_dataset_t *ds = dsv; 221fa9e4066Sahrens dsl_pool_t *dp = ds->ds_dir->dd_pool; 222fa9e4066Sahrens 22355434c77Sek /* open_refcount == DS_REF_MAX when deleting */ 224fa9e4066Sahrens ASSERT(ds->ds_open_refcount == 0 || 22555434c77Sek ds->ds_open_refcount == DS_REF_MAX); 226fa9e4066Sahrens 227fa9e4066Sahrens dprintf_ds(ds, "evicting %s\n", ""); 228fa9e4066Sahrens 229fa9e4066Sahrens unique_remove(ds->ds_phys->ds_fsid_guid); 230fa9e4066Sahrens 231fa9e4066Sahrens if (ds->ds_user_ptr != NULL) 232fa9e4066Sahrens ds->ds_user_evict_func(ds, ds->ds_user_ptr); 233fa9e4066Sahrens 234fa9e4066Sahrens if (ds->ds_prev) { 235fa9e4066Sahrens dsl_dataset_close(ds->ds_prev, DS_MODE_NONE, ds); 236fa9e4066Sahrens ds->ds_prev = NULL; 237fa9e4066Sahrens } 238fa9e4066Sahrens 239fa9e4066Sahrens bplist_close(&ds->ds_deadlist); 240fa9e4066Sahrens dsl_dir_close(ds->ds_dir, ds); 241fa9e4066Sahrens 242fa9e4066Sahrens if (list_link_active(&ds->ds_synced_link)) 243fa9e4066Sahrens list_remove(&dp->dp_synced_objsets, ds); 244fa9e4066Sahrens 2455ad82045Snd mutex_destroy(&ds->ds_lock); 2465ad82045Snd mutex_destroy(&ds->ds_deadlist.bpl_lock); 2475ad82045Snd 248fa9e4066Sahrens kmem_free(ds, sizeof (dsl_dataset_t)); 249fa9e4066Sahrens } 250fa9e4066Sahrens 251ea8dc4b6Seschrock static int 252fa9e4066Sahrens dsl_dataset_get_snapname(dsl_dataset_t *ds) 253fa9e4066Sahrens { 254fa9e4066Sahrens dsl_dataset_phys_t *headphys; 255fa9e4066Sahrens int err; 256fa9e4066Sahrens dmu_buf_t *headdbuf; 257fa9e4066Sahrens dsl_pool_t *dp = ds->ds_dir->dd_pool; 258fa9e4066Sahrens objset_t *mos = dp->dp_meta_objset; 259fa9e4066Sahrens 260fa9e4066Sahrens if (ds->ds_snapname[0]) 261ea8dc4b6Seschrock return (0); 262fa9e4066Sahrens if (ds->ds_phys->ds_next_snap_obj == 0) 263ea8dc4b6Seschrock return (0); 264fa9e4066Sahrens 265ea8dc4b6Seschrock err = dmu_bonus_hold(mos, ds->ds_dir->dd_phys->dd_head_dataset_obj, 266ea8dc4b6Seschrock FTAG, &headdbuf); 267ea8dc4b6Seschrock if (err) 268ea8dc4b6Seschrock return (err); 269fa9e4066Sahrens headphys = headdbuf->db_data; 270fa9e4066Sahrens err = zap_value_search(dp->dp_meta_objset, 271fa9e4066Sahrens headphys->ds_snapnames_zapobj, ds->ds_object, ds->ds_snapname); 272ea8dc4b6Seschrock dmu_buf_rele(headdbuf, FTAG); 273ea8dc4b6Seschrock return (err); 274fa9e4066Sahrens } 275fa9e4066Sahrens 276ea8dc4b6Seschrock int 277fa9e4066Sahrens dsl_dataset_open_obj(dsl_pool_t *dp, uint64_t dsobj, const char *snapname, 278ea8dc4b6Seschrock int mode, void *tag, dsl_dataset_t **dsp) 279fa9e4066Sahrens { 280fa9e4066Sahrens uint64_t weight = ds_refcnt_weight[DS_MODE_LEVEL(mode)]; 281fa9e4066Sahrens objset_t *mos = dp->dp_meta_objset; 282fa9e4066Sahrens dmu_buf_t *dbuf; 283fa9e4066Sahrens dsl_dataset_t *ds; 284ea8dc4b6Seschrock int err; 285fa9e4066Sahrens 286fa9e4066Sahrens ASSERT(RW_LOCK_HELD(&dp->dp_config_rwlock) || 287fa9e4066Sahrens dsl_pool_sync_context(dp)); 288fa9e4066Sahrens 289ea8dc4b6Seschrock err = dmu_bonus_hold(mos, dsobj, tag, &dbuf); 290ea8dc4b6Seschrock if (err) 291ea8dc4b6Seschrock return (err); 292fa9e4066Sahrens ds = dmu_buf_get_user(dbuf); 293fa9e4066Sahrens if (ds == NULL) { 294fa9e4066Sahrens dsl_dataset_t *winner; 295fa9e4066Sahrens 296fa9e4066Sahrens ds = kmem_zalloc(sizeof (dsl_dataset_t), KM_SLEEP); 297fa9e4066Sahrens ds->ds_dbuf = dbuf; 298fa9e4066Sahrens ds->ds_object = dsobj; 299fa9e4066Sahrens ds->ds_phys = dbuf->db_data; 300fa9e4066Sahrens 3015ad82045Snd mutex_init(&ds->ds_lock, NULL, MUTEX_DEFAULT, NULL); 3025ad82045Snd mutex_init(&ds->ds_deadlist.bpl_lock, NULL, MUTEX_DEFAULT, 3035ad82045Snd NULL); 3045ad82045Snd 305ea8dc4b6Seschrock err = bplist_open(&ds->ds_deadlist, 306fa9e4066Sahrens mos, ds->ds_phys->ds_deadlist_obj); 307ea8dc4b6Seschrock if (err == 0) { 308ea8dc4b6Seschrock err = dsl_dir_open_obj(dp, 309ea8dc4b6Seschrock ds->ds_phys->ds_dir_obj, NULL, ds, &ds->ds_dir); 310ea8dc4b6Seschrock } 311ea8dc4b6Seschrock if (err) { 312ea8dc4b6Seschrock /* 313ea8dc4b6Seschrock * we don't really need to close the blist if we 314ea8dc4b6Seschrock * just opened it. 315ea8dc4b6Seschrock */ 3165ad82045Snd mutex_destroy(&ds->ds_lock); 3175ad82045Snd mutex_destroy(&ds->ds_deadlist.bpl_lock); 318ea8dc4b6Seschrock kmem_free(ds, sizeof (dsl_dataset_t)); 319ea8dc4b6Seschrock dmu_buf_rele(dbuf, tag); 320ea8dc4b6Seschrock return (err); 321ea8dc4b6Seschrock } 322fa9e4066Sahrens 323fa9e4066Sahrens if (ds->ds_dir->dd_phys->dd_head_dataset_obj == dsobj) { 324fa9e4066Sahrens ds->ds_snapname[0] = '\0'; 325fa9e4066Sahrens if (ds->ds_phys->ds_prev_snap_obj) { 326ea8dc4b6Seschrock err = dsl_dataset_open_obj(dp, 327fa9e4066Sahrens ds->ds_phys->ds_prev_snap_obj, NULL, 328ea8dc4b6Seschrock DS_MODE_NONE, ds, &ds->ds_prev); 329fa9e4066Sahrens } 330fa9e4066Sahrens } else { 331fa9e4066Sahrens if (snapname) { 332fa9e4066Sahrens #ifdef ZFS_DEBUG 333fa9e4066Sahrens dsl_dataset_phys_t *headphys; 334ea8dc4b6Seschrock dmu_buf_t *headdbuf; 335ea8dc4b6Seschrock err = dmu_bonus_hold(mos, 336ea8dc4b6Seschrock ds->ds_dir->dd_phys->dd_head_dataset_obj, 337ea8dc4b6Seschrock FTAG, &headdbuf); 338ea8dc4b6Seschrock if (err == 0) { 339ea8dc4b6Seschrock headphys = headdbuf->db_data; 340ea8dc4b6Seschrock uint64_t foundobj; 341ea8dc4b6Seschrock err = zap_lookup(dp->dp_meta_objset, 342ea8dc4b6Seschrock headphys->ds_snapnames_zapobj, 343ea8dc4b6Seschrock snapname, sizeof (foundobj), 1, 344ea8dc4b6Seschrock &foundobj); 345ea8dc4b6Seschrock ASSERT3U(foundobj, ==, dsobj); 346ea8dc4b6Seschrock dmu_buf_rele(headdbuf, FTAG); 347ea8dc4b6Seschrock } 348fa9e4066Sahrens #endif 349fa9e4066Sahrens (void) strcat(ds->ds_snapname, snapname); 350fa9e4066Sahrens } else if (zfs_flags & ZFS_DEBUG_SNAPNAMES) { 351ea8dc4b6Seschrock err = dsl_dataset_get_snapname(ds); 352fa9e4066Sahrens } 353fa9e4066Sahrens } 354fa9e4066Sahrens 355ea8dc4b6Seschrock if (err == 0) { 356ea8dc4b6Seschrock winner = dmu_buf_set_user_ie(dbuf, ds, &ds->ds_phys, 357ea8dc4b6Seschrock dsl_dataset_evict); 358ea8dc4b6Seschrock } 359ea8dc4b6Seschrock if (err || winner) { 360fa9e4066Sahrens bplist_close(&ds->ds_deadlist); 361fa9e4066Sahrens if (ds->ds_prev) { 362fa9e4066Sahrens dsl_dataset_close(ds->ds_prev, 363fa9e4066Sahrens DS_MODE_NONE, ds); 364fa9e4066Sahrens } 365fa9e4066Sahrens dsl_dir_close(ds->ds_dir, ds); 3665ad82045Snd mutex_destroy(&ds->ds_lock); 3675ad82045Snd mutex_destroy(&ds->ds_deadlist.bpl_lock); 368fa9e4066Sahrens kmem_free(ds, sizeof (dsl_dataset_t)); 369ea8dc4b6Seschrock if (err) { 370ea8dc4b6Seschrock dmu_buf_rele(dbuf, tag); 371ea8dc4b6Seschrock return (err); 372ea8dc4b6Seschrock } 373fa9e4066Sahrens ds = winner; 374fa9e4066Sahrens } else { 375fa9e4066Sahrens uint64_t new = 376fa9e4066Sahrens unique_insert(ds->ds_phys->ds_fsid_guid); 377fa9e4066Sahrens if (new != ds->ds_phys->ds_fsid_guid) { 378fa9e4066Sahrens /* XXX it won't necessarily be synced... */ 379fa9e4066Sahrens ds->ds_phys->ds_fsid_guid = new; 380fa9e4066Sahrens } 381fa9e4066Sahrens } 382fa9e4066Sahrens } 383fa9e4066Sahrens ASSERT3P(ds->ds_dbuf, ==, dbuf); 384fa9e4066Sahrens ASSERT3P(ds->ds_phys, ==, dbuf->db_data); 385fa9e4066Sahrens 386fa9e4066Sahrens mutex_enter(&ds->ds_lock); 387fa9e4066Sahrens if ((DS_MODE_LEVEL(mode) == DS_MODE_PRIMARY && 38899653d4eSeschrock (ds->ds_phys->ds_flags & DS_FLAG_INCONSISTENT) && 38999653d4eSeschrock !DS_MODE_IS_INCONSISTENT(mode)) || 39055434c77Sek (ds->ds_open_refcount + weight > DS_REF_MAX)) { 391fa9e4066Sahrens mutex_exit(&ds->ds_lock); 392fa9e4066Sahrens dsl_dataset_close(ds, DS_MODE_NONE, tag); 393ea8dc4b6Seschrock return (EBUSY); 394fa9e4066Sahrens } 395fa9e4066Sahrens ds->ds_open_refcount += weight; 396fa9e4066Sahrens mutex_exit(&ds->ds_lock); 397fa9e4066Sahrens 398ea8dc4b6Seschrock *dsp = ds; 399ea8dc4b6Seschrock return (0); 400fa9e4066Sahrens } 401fa9e4066Sahrens 402fa9e4066Sahrens int 403fa9e4066Sahrens dsl_dataset_open_spa(spa_t *spa, const char *name, int mode, 404fa9e4066Sahrens void *tag, dsl_dataset_t **dsp) 405fa9e4066Sahrens { 406fa9e4066Sahrens dsl_dir_t *dd; 407fa9e4066Sahrens dsl_pool_t *dp; 408fa9e4066Sahrens const char *tail; 409fa9e4066Sahrens uint64_t obj; 410fa9e4066Sahrens dsl_dataset_t *ds = NULL; 411fa9e4066Sahrens int err = 0; 412fa9e4066Sahrens 413ea8dc4b6Seschrock err = dsl_dir_open_spa(spa, name, FTAG, &dd, &tail); 414ea8dc4b6Seschrock if (err) 415ea8dc4b6Seschrock return (err); 416fa9e4066Sahrens 417fa9e4066Sahrens dp = dd->dd_pool; 418fa9e4066Sahrens obj = dd->dd_phys->dd_head_dataset_obj; 419fa9e4066Sahrens rw_enter(&dp->dp_config_rwlock, RW_READER); 420fa9e4066Sahrens if (obj == 0) { 421fa9e4066Sahrens /* A dataset with no associated objset */ 422fa9e4066Sahrens err = ENOENT; 423fa9e4066Sahrens goto out; 424fa9e4066Sahrens } 425fa9e4066Sahrens 426fa9e4066Sahrens if (tail != NULL) { 427fa9e4066Sahrens objset_t *mos = dp->dp_meta_objset; 428fa9e4066Sahrens 429ea8dc4b6Seschrock err = dsl_dataset_open_obj(dp, obj, NULL, 430ea8dc4b6Seschrock DS_MODE_NONE, tag, &ds); 431ea8dc4b6Seschrock if (err) 432ea8dc4b6Seschrock goto out; 433fa9e4066Sahrens obj = ds->ds_phys->ds_snapnames_zapobj; 434fa9e4066Sahrens dsl_dataset_close(ds, DS_MODE_NONE, tag); 435fa9e4066Sahrens ds = NULL; 436fa9e4066Sahrens 437fa9e4066Sahrens if (tail[0] != '@') { 438fa9e4066Sahrens err = ENOENT; 439fa9e4066Sahrens goto out; 440fa9e4066Sahrens } 441fa9e4066Sahrens tail++; 442fa9e4066Sahrens 443fa9e4066Sahrens /* Look for a snapshot */ 444fa9e4066Sahrens if (!DS_MODE_IS_READONLY(mode)) { 445fa9e4066Sahrens err = EROFS; 446fa9e4066Sahrens goto out; 447fa9e4066Sahrens } 448fa9e4066Sahrens dprintf("looking for snapshot '%s'\n", tail); 449fa9e4066Sahrens err = zap_lookup(mos, obj, tail, 8, 1, &obj); 450fa9e4066Sahrens if (err) 451fa9e4066Sahrens goto out; 452fa9e4066Sahrens } 453ea8dc4b6Seschrock err = dsl_dataset_open_obj(dp, obj, tail, mode, tag, &ds); 454fa9e4066Sahrens 455fa9e4066Sahrens out: 456fa9e4066Sahrens rw_exit(&dp->dp_config_rwlock); 457fa9e4066Sahrens dsl_dir_close(dd, FTAG); 458fa9e4066Sahrens 459fa9e4066Sahrens ASSERT3U((err == 0), ==, (ds != NULL)); 460fa9e4066Sahrens /* ASSERT(ds == NULL || strcmp(name, ds->ds_name) == 0); */ 461fa9e4066Sahrens 462fa9e4066Sahrens *dsp = ds; 463fa9e4066Sahrens return (err); 464fa9e4066Sahrens } 465fa9e4066Sahrens 466fa9e4066Sahrens int 467fa9e4066Sahrens dsl_dataset_open(const char *name, int mode, void *tag, dsl_dataset_t **dsp) 468fa9e4066Sahrens { 469fa9e4066Sahrens return (dsl_dataset_open_spa(NULL, name, mode, tag, dsp)); 470fa9e4066Sahrens } 471fa9e4066Sahrens 472fa9e4066Sahrens void 473fa9e4066Sahrens dsl_dataset_name(dsl_dataset_t *ds, char *name) 474fa9e4066Sahrens { 475fa9e4066Sahrens if (ds == NULL) { 476fa9e4066Sahrens (void) strcpy(name, "mos"); 477fa9e4066Sahrens } else { 478fa9e4066Sahrens dsl_dir_name(ds->ds_dir, name); 479ea8dc4b6Seschrock VERIFY(0 == dsl_dataset_get_snapname(ds)); 480fa9e4066Sahrens if (ds->ds_snapname[0]) { 481fa9e4066Sahrens (void) strcat(name, "@"); 482fa9e4066Sahrens if (!MUTEX_HELD(&ds->ds_lock)) { 483fa9e4066Sahrens /* 484fa9e4066Sahrens * We use a "recursive" mutex so that we 485fa9e4066Sahrens * can call dprintf_ds() with ds_lock held. 486fa9e4066Sahrens */ 487fa9e4066Sahrens mutex_enter(&ds->ds_lock); 488fa9e4066Sahrens (void) strcat(name, ds->ds_snapname); 489fa9e4066Sahrens mutex_exit(&ds->ds_lock); 490fa9e4066Sahrens } else { 491fa9e4066Sahrens (void) strcat(name, ds->ds_snapname); 492fa9e4066Sahrens } 493fa9e4066Sahrens } 494fa9e4066Sahrens } 495fa9e4066Sahrens } 496fa9e4066Sahrens 497b7661cccSmmusante static int 498b7661cccSmmusante dsl_dataset_namelen(dsl_dataset_t *ds) 499b7661cccSmmusante { 500b7661cccSmmusante int result; 501b7661cccSmmusante 502b7661cccSmmusante if (ds == NULL) { 503b7661cccSmmusante result = 3; /* "mos" */ 504b7661cccSmmusante } else { 505b7661cccSmmusante result = dsl_dir_namelen(ds->ds_dir); 506b7661cccSmmusante VERIFY(0 == dsl_dataset_get_snapname(ds)); 507b7661cccSmmusante if (ds->ds_snapname[0]) { 508b7661cccSmmusante ++result; /* adding one for the @-sign */ 509b7661cccSmmusante if (!MUTEX_HELD(&ds->ds_lock)) { 510b7661cccSmmusante /* see dsl_datset_name */ 511b7661cccSmmusante mutex_enter(&ds->ds_lock); 512b7661cccSmmusante result += strlen(ds->ds_snapname); 513b7661cccSmmusante mutex_exit(&ds->ds_lock); 514b7661cccSmmusante } else { 515b7661cccSmmusante result += strlen(ds->ds_snapname); 516b7661cccSmmusante } 517b7661cccSmmusante } 518b7661cccSmmusante } 519b7661cccSmmusante 520b7661cccSmmusante return (result); 521b7661cccSmmusante } 522b7661cccSmmusante 523fa9e4066Sahrens void 524fa9e4066Sahrens dsl_dataset_close(dsl_dataset_t *ds, int mode, void *tag) 525fa9e4066Sahrens { 526fa9e4066Sahrens uint64_t weight = ds_refcnt_weight[DS_MODE_LEVEL(mode)]; 527fa9e4066Sahrens mutex_enter(&ds->ds_lock); 528fa9e4066Sahrens ASSERT3U(ds->ds_open_refcount, >=, weight); 529fa9e4066Sahrens ds->ds_open_refcount -= weight; 530fa9e4066Sahrens dprintf_ds(ds, "closing mode %u refcount now 0x%llx\n", 531fa9e4066Sahrens mode, ds->ds_open_refcount); 532fa9e4066Sahrens mutex_exit(&ds->ds_lock); 533fa9e4066Sahrens 534ea8dc4b6Seschrock dmu_buf_rele(ds->ds_dbuf, tag); 535fa9e4066Sahrens } 536fa9e4066Sahrens 537fa9e4066Sahrens void 538fa9e4066Sahrens dsl_dataset_create_root(dsl_pool_t *dp, uint64_t *ddobjp, dmu_tx_t *tx) 539fa9e4066Sahrens { 540fa9e4066Sahrens objset_t *mos = dp->dp_meta_objset; 541fa9e4066Sahrens dmu_buf_t *dbuf; 542fa9e4066Sahrens dsl_dataset_phys_t *dsphys; 543fa9e4066Sahrens dsl_dataset_t *ds; 544fa9e4066Sahrens uint64_t dsobj; 545fa9e4066Sahrens dsl_dir_t *dd; 546fa9e4066Sahrens 547fa9e4066Sahrens dsl_dir_create_root(mos, ddobjp, tx); 548ea8dc4b6Seschrock VERIFY(0 == dsl_dir_open_obj(dp, *ddobjp, NULL, FTAG, &dd)); 549fa9e4066Sahrens 5501649cd4bStabriz dsobj = dmu_object_alloc(mos, DMU_OT_DSL_DATASET, 0, 5511649cd4bStabriz DMU_OT_DSL_DATASET, sizeof (dsl_dataset_phys_t), tx); 552ea8dc4b6Seschrock VERIFY(0 == dmu_bonus_hold(mos, dsobj, FTAG, &dbuf)); 553fa9e4066Sahrens dmu_buf_will_dirty(dbuf, tx); 554fa9e4066Sahrens dsphys = dbuf->db_data; 555fa9e4066Sahrens dsphys->ds_dir_obj = dd->dd_object; 556fa9e4066Sahrens dsphys->ds_fsid_guid = unique_create(); 557ea8dc4b6Seschrock unique_remove(dsphys->ds_fsid_guid); /* it isn't open yet */ 558fa9e4066Sahrens (void) random_get_pseudo_bytes((void*)&dsphys->ds_guid, 559fa9e4066Sahrens sizeof (dsphys->ds_guid)); 560fa9e4066Sahrens dsphys->ds_snapnames_zapobj = 56187e5029aSahrens zap_create(mos, DMU_OT_DSL_DS_SNAP_MAP, DMU_OT_NONE, 0, tx); 562fa9e4066Sahrens dsphys->ds_creation_time = gethrestime_sec(); 563fa9e4066Sahrens dsphys->ds_creation_txg = tx->tx_txg; 564fa9e4066Sahrens dsphys->ds_deadlist_obj = 565fa9e4066Sahrens bplist_create(mos, DSL_DEADLIST_BLOCKSIZE, tx); 566ea8dc4b6Seschrock dmu_buf_rele(dbuf, FTAG); 567fa9e4066Sahrens 568fa9e4066Sahrens dmu_buf_will_dirty(dd->dd_dbuf, tx); 569fa9e4066Sahrens dd->dd_phys->dd_head_dataset_obj = dsobj; 570fa9e4066Sahrens dsl_dir_close(dd, FTAG); 571fa9e4066Sahrens 572ea8dc4b6Seschrock VERIFY(0 == 573ea8dc4b6Seschrock dsl_dataset_open_obj(dp, dsobj, NULL, DS_MODE_NONE, FTAG, &ds)); 574c717a561Smaybee (void) dmu_objset_create_impl(dp->dp_spa, ds, 575c717a561Smaybee &ds->ds_phys->ds_bp, DMU_OST_ZFS, tx); 576fa9e4066Sahrens dsl_dataset_close(ds, DS_MODE_NONE, FTAG); 577fa9e4066Sahrens } 578fa9e4066Sahrens 5791d452cf5Sahrens uint64_t 5801d452cf5Sahrens dsl_dataset_create_sync(dsl_dir_t *pdd, 581fa9e4066Sahrens const char *lastname, dsl_dataset_t *clone_parent, dmu_tx_t *tx) 582fa9e4066Sahrens { 5831d452cf5Sahrens dsl_pool_t *dp = pdd->dd_pool; 584fa9e4066Sahrens dmu_buf_t *dbuf; 585fa9e4066Sahrens dsl_dataset_phys_t *dsphys; 5861d452cf5Sahrens uint64_t dsobj, ddobj; 587fa9e4066Sahrens objset_t *mos = dp->dp_meta_objset; 588fa9e4066Sahrens dsl_dir_t *dd; 589fa9e4066Sahrens 5901d452cf5Sahrens ASSERT(clone_parent == NULL || clone_parent->ds_dir->dd_pool == dp); 5911d452cf5Sahrens ASSERT(clone_parent == NULL || 5921d452cf5Sahrens clone_parent->ds_phys->ds_num_children > 0); 593fa9e4066Sahrens ASSERT(lastname[0] != '@'); 594fa9e4066Sahrens ASSERT(dmu_tx_is_syncing(tx)); 595fa9e4066Sahrens 5961d452cf5Sahrens ddobj = dsl_dir_create_sync(pdd, lastname, tx); 5971d452cf5Sahrens VERIFY(0 == dsl_dir_open_obj(dp, ddobj, lastname, FTAG, &dd)); 598fa9e4066Sahrens 5991649cd4bStabriz dsobj = dmu_object_alloc(mos, DMU_OT_DSL_DATASET, 0, 6001649cd4bStabriz DMU_OT_DSL_DATASET, sizeof (dsl_dataset_phys_t), tx); 601ea8dc4b6Seschrock VERIFY(0 == dmu_bonus_hold(mos, dsobj, FTAG, &dbuf)); 602fa9e4066Sahrens dmu_buf_will_dirty(dbuf, tx); 603fa9e4066Sahrens dsphys = dbuf->db_data; 604fa9e4066Sahrens dsphys->ds_dir_obj = dd->dd_object; 605fa9e4066Sahrens dsphys->ds_fsid_guid = unique_create(); 606fa9e4066Sahrens unique_remove(dsphys->ds_fsid_guid); /* it isn't open yet */ 607fa9e4066Sahrens (void) random_get_pseudo_bytes((void*)&dsphys->ds_guid, 608fa9e4066Sahrens sizeof (dsphys->ds_guid)); 609fa9e4066Sahrens dsphys->ds_snapnames_zapobj = 61087e5029aSahrens zap_create(mos, DMU_OT_DSL_DS_SNAP_MAP, DMU_OT_NONE, 0, tx); 611fa9e4066Sahrens dsphys->ds_creation_time = gethrestime_sec(); 612fa9e4066Sahrens dsphys->ds_creation_txg = tx->tx_txg; 613fa9e4066Sahrens dsphys->ds_deadlist_obj = 614fa9e4066Sahrens bplist_create(mos, DSL_DEADLIST_BLOCKSIZE, tx); 615fa9e4066Sahrens if (clone_parent) { 616fa9e4066Sahrens dsphys->ds_prev_snap_obj = clone_parent->ds_object; 617fa9e4066Sahrens dsphys->ds_prev_snap_txg = 618fa9e4066Sahrens clone_parent->ds_phys->ds_creation_txg; 619fa9e4066Sahrens dsphys->ds_used_bytes = 620fa9e4066Sahrens clone_parent->ds_phys->ds_used_bytes; 621fa9e4066Sahrens dsphys->ds_compressed_bytes = 622fa9e4066Sahrens clone_parent->ds_phys->ds_compressed_bytes; 623fa9e4066Sahrens dsphys->ds_uncompressed_bytes = 624fa9e4066Sahrens clone_parent->ds_phys->ds_uncompressed_bytes; 625fa9e4066Sahrens dsphys->ds_bp = clone_parent->ds_phys->ds_bp; 626fa9e4066Sahrens 627fa9e4066Sahrens dmu_buf_will_dirty(clone_parent->ds_dbuf, tx); 628fa9e4066Sahrens clone_parent->ds_phys->ds_num_children++; 629fa9e4066Sahrens 630fa9e4066Sahrens dmu_buf_will_dirty(dd->dd_dbuf, tx); 631fa9e4066Sahrens dd->dd_phys->dd_clone_parent_obj = clone_parent->ds_object; 632fa9e4066Sahrens } 633ea8dc4b6Seschrock dmu_buf_rele(dbuf, FTAG); 634fa9e4066Sahrens 635fa9e4066Sahrens dmu_buf_will_dirty(dd->dd_dbuf, tx); 636fa9e4066Sahrens dd->dd_phys->dd_head_dataset_obj = dsobj; 637fa9e4066Sahrens dsl_dir_close(dd, FTAG); 638fa9e4066Sahrens 6391d452cf5Sahrens return (dsobj); 640fa9e4066Sahrens } 641fa9e4066Sahrens 6421d452cf5Sahrens struct destroyarg { 6431d452cf5Sahrens dsl_sync_task_group_t *dstg; 6441d452cf5Sahrens char *snapname; 6451d452cf5Sahrens char *failed; 6461d452cf5Sahrens }; 6471d452cf5Sahrens 6481d452cf5Sahrens static int 6491d452cf5Sahrens dsl_snapshot_destroy_one(char *name, void *arg) 650fa9e4066Sahrens { 6511d452cf5Sahrens struct destroyarg *da = arg; 6521d452cf5Sahrens dsl_dataset_t *ds; 6531d452cf5Sahrens char *cp; 654fa9e4066Sahrens int err; 655fa9e4066Sahrens 6561d452cf5Sahrens (void) strcat(name, "@"); 6571d452cf5Sahrens (void) strcat(name, da->snapname); 6581d452cf5Sahrens err = dsl_dataset_open(name, 6591d452cf5Sahrens DS_MODE_EXCLUSIVE | DS_MODE_READONLY | DS_MODE_INCONSISTENT, 660cdf5b4caSmmusante da->dstg, &ds); 6611d452cf5Sahrens cp = strchr(name, '@'); 6621d452cf5Sahrens *cp = '\0'; 6631d452cf5Sahrens if (err == ENOENT) 6641d452cf5Sahrens return (0); 6651d452cf5Sahrens if (err) { 6661d452cf5Sahrens (void) strcpy(da->failed, name); 667ea8dc4b6Seschrock return (err); 6681d452cf5Sahrens } 669fa9e4066Sahrens 6701d452cf5Sahrens dsl_sync_task_create(da->dstg, dsl_dataset_destroy_check, 671cdf5b4caSmmusante dsl_dataset_destroy_sync, ds, da->dstg, 0); 6721d452cf5Sahrens return (0); 6731d452cf5Sahrens } 67431fd60d3Sahrens 6751d452cf5Sahrens /* 6761d452cf5Sahrens * Destroy 'snapname' in all descendants of 'fsname'. 6771d452cf5Sahrens */ 6781d452cf5Sahrens #pragma weak dmu_snapshots_destroy = dsl_snapshots_destroy 6791d452cf5Sahrens int 6801d452cf5Sahrens dsl_snapshots_destroy(char *fsname, char *snapname) 6811d452cf5Sahrens { 6821d452cf5Sahrens int err; 6831d452cf5Sahrens struct destroyarg da; 6841d452cf5Sahrens dsl_sync_task_t *dst; 6851d452cf5Sahrens spa_t *spa; 6861d452cf5Sahrens char *cp; 6871d452cf5Sahrens 6881d452cf5Sahrens cp = strchr(fsname, '/'); 6891d452cf5Sahrens if (cp) { 6901d452cf5Sahrens *cp = '\0'; 6911d452cf5Sahrens err = spa_open(fsname, &spa, FTAG); 6921d452cf5Sahrens *cp = '/'; 6931d452cf5Sahrens } else { 6941d452cf5Sahrens err = spa_open(fsname, &spa, FTAG); 6951d452cf5Sahrens } 6961d452cf5Sahrens if (err) 6971d452cf5Sahrens return (err); 6981d452cf5Sahrens da.dstg = dsl_sync_task_group_create(spa_get_dsl(spa)); 6991d452cf5Sahrens da.snapname = snapname; 7001d452cf5Sahrens da.failed = fsname; 7011d452cf5Sahrens 7021d452cf5Sahrens err = dmu_objset_find(fsname, 7030b69c2f0Sahrens dsl_snapshot_destroy_one, &da, DS_FIND_CHILDREN); 7041d452cf5Sahrens 7051d452cf5Sahrens if (err == 0) 7061d452cf5Sahrens err = dsl_sync_task_group_wait(da.dstg); 7071d452cf5Sahrens 7081d452cf5Sahrens for (dst = list_head(&da.dstg->dstg_tasks); dst; 7091d452cf5Sahrens dst = list_next(&da.dstg->dstg_tasks, dst)) { 7101d452cf5Sahrens dsl_dataset_t *ds = dst->dst_arg1; 7111d452cf5Sahrens if (dst->dst_err) { 7121d452cf5Sahrens dsl_dataset_name(ds, fsname); 7131d452cf5Sahrens cp = strchr(fsname, '@'); 7141d452cf5Sahrens *cp = '\0'; 715e1930233Sbonwick } 716fa9e4066Sahrens /* 7171d452cf5Sahrens * If it was successful, destroy_sync would have 7181d452cf5Sahrens * closed the ds 719fa9e4066Sahrens */ 720ea8dc4b6Seschrock if (err) 721cdf5b4caSmmusante dsl_dataset_close(ds, DS_MODE_EXCLUSIVE, da.dstg); 722fa9e4066Sahrens } 723fa9e4066Sahrens 7241d452cf5Sahrens dsl_sync_task_group_destroy(da.dstg); 7251d452cf5Sahrens spa_close(spa, FTAG); 726fa9e4066Sahrens return (err); 727fa9e4066Sahrens } 728fa9e4066Sahrens 729fa9e4066Sahrens int 7301d452cf5Sahrens dsl_dataset_destroy(const char *name) 731fa9e4066Sahrens { 732fa9e4066Sahrens int err; 7331d452cf5Sahrens dsl_sync_task_group_t *dstg; 7341d452cf5Sahrens objset_t *os; 7351d452cf5Sahrens dsl_dataset_t *ds; 736fa9e4066Sahrens dsl_dir_t *dd; 7371d452cf5Sahrens uint64_t obj; 7381d452cf5Sahrens 7391d452cf5Sahrens if (strchr(name, '@')) { 7401d452cf5Sahrens /* Destroying a snapshot is simpler */ 7411d452cf5Sahrens err = dsl_dataset_open(name, 7421d452cf5Sahrens DS_MODE_EXCLUSIVE | DS_MODE_READONLY | DS_MODE_INCONSISTENT, 7431d452cf5Sahrens FTAG, &ds); 7441d452cf5Sahrens if (err) 7451d452cf5Sahrens return (err); 7461d452cf5Sahrens err = dsl_sync_task_do(ds->ds_dir->dd_pool, 7471d452cf5Sahrens dsl_dataset_destroy_check, dsl_dataset_destroy_sync, 7481d452cf5Sahrens ds, FTAG, 0); 7491d452cf5Sahrens if (err) 7501d452cf5Sahrens dsl_dataset_close(ds, DS_MODE_EXCLUSIVE, FTAG); 7511d452cf5Sahrens return (err); 7521d452cf5Sahrens } 753fa9e4066Sahrens 7541d452cf5Sahrens err = dmu_objset_open(name, DMU_OST_ANY, 7551d452cf5Sahrens DS_MODE_EXCLUSIVE | DS_MODE_INCONSISTENT, &os); 756ea8dc4b6Seschrock if (err) 757ea8dc4b6Seschrock return (err); 7581d452cf5Sahrens ds = os->os->os_dsl_dataset; 7591d452cf5Sahrens dd = ds->ds_dir; 760fa9e4066Sahrens 7611d452cf5Sahrens /* 7621d452cf5Sahrens * Check for errors and mark this ds as inconsistent, in 7631d452cf5Sahrens * case we crash while freeing the objects. 7641d452cf5Sahrens */ 7651d452cf5Sahrens err = dsl_sync_task_do(dd->dd_pool, dsl_dataset_destroy_begin_check, 7661d452cf5Sahrens dsl_dataset_destroy_begin_sync, ds, NULL, 0); 7671d452cf5Sahrens if (err) { 7681d452cf5Sahrens dmu_objset_close(os); 7691d452cf5Sahrens return (err); 770fa9e4066Sahrens } 771fa9e4066Sahrens 7721d452cf5Sahrens /* 7731d452cf5Sahrens * remove the objects in open context, so that we won't 7741d452cf5Sahrens * have too much to do in syncing context. 7751d452cf5Sahrens */ 7766754306eSahrens for (obj = 0; err == 0; err = dmu_object_next(os, &obj, FALSE, 7776754306eSahrens ds->ds_phys->ds_prev_snap_txg)) { 7781d452cf5Sahrens dmu_tx_t *tx = dmu_tx_create(os); 7791d452cf5Sahrens dmu_tx_hold_free(tx, obj, 0, DMU_OBJECT_END); 7801d452cf5Sahrens dmu_tx_hold_bonus(tx, obj); 7811d452cf5Sahrens err = dmu_tx_assign(tx, TXG_WAIT); 7821d452cf5Sahrens if (err) { 7831d452cf5Sahrens /* 7841d452cf5Sahrens * Perhaps there is not enough disk 7851d452cf5Sahrens * space. Just deal with it from 7861d452cf5Sahrens * dsl_dataset_destroy_sync(). 7871d452cf5Sahrens */ 7881d452cf5Sahrens dmu_tx_abort(tx); 7891d452cf5Sahrens continue; 7901d452cf5Sahrens } 7911d452cf5Sahrens VERIFY(0 == dmu_object_free(os, obj, tx)); 7921d452cf5Sahrens dmu_tx_commit(tx); 7931d452cf5Sahrens } 7941d452cf5Sahrens /* Make sure it's not dirty before we finish destroying it. */ 7951d452cf5Sahrens txg_wait_synced(dd->dd_pool, 0); 7961d452cf5Sahrens 7971d452cf5Sahrens dmu_objset_close(os); 7981d452cf5Sahrens if (err != ESRCH) 7991d452cf5Sahrens return (err); 8001d452cf5Sahrens 8011d452cf5Sahrens err = dsl_dataset_open(name, 8021d452cf5Sahrens DS_MODE_EXCLUSIVE | DS_MODE_READONLY | DS_MODE_INCONSISTENT, 8031d452cf5Sahrens FTAG, &ds); 8041d452cf5Sahrens if (err) 8051d452cf5Sahrens return (err); 8061d452cf5Sahrens 8071d452cf5Sahrens err = dsl_dir_open(name, FTAG, &dd, NULL); 8081d452cf5Sahrens if (err) { 8091d452cf5Sahrens dsl_dataset_close(ds, DS_MODE_EXCLUSIVE, FTAG); 8101d452cf5Sahrens return (err); 8111d452cf5Sahrens } 8121d452cf5Sahrens 8131d452cf5Sahrens /* 8141d452cf5Sahrens * Blow away the dsl_dir + head dataset. 8151d452cf5Sahrens */ 8161d452cf5Sahrens dstg = dsl_sync_task_group_create(ds->ds_dir->dd_pool); 8171d452cf5Sahrens dsl_sync_task_create(dstg, dsl_dataset_destroy_check, 8181d452cf5Sahrens dsl_dataset_destroy_sync, ds, FTAG, 0); 8191d452cf5Sahrens dsl_sync_task_create(dstg, dsl_dir_destroy_check, 8201d452cf5Sahrens dsl_dir_destroy_sync, dd, FTAG, 0); 8211d452cf5Sahrens err = dsl_sync_task_group_wait(dstg); 8221d452cf5Sahrens dsl_sync_task_group_destroy(dstg); 8231d452cf5Sahrens /* if it is successful, *destroy_sync will close the ds+dd */ 8241d452cf5Sahrens if (err) { 8251d452cf5Sahrens dsl_dataset_close(ds, DS_MODE_EXCLUSIVE, FTAG); 8261d452cf5Sahrens dsl_dir_close(dd, FTAG); 8271d452cf5Sahrens } 828fa9e4066Sahrens return (err); 829fa9e4066Sahrens } 830fa9e4066Sahrens 8311d452cf5Sahrens int 8321d452cf5Sahrens dsl_dataset_rollback(dsl_dataset_t *ds) 8331d452cf5Sahrens { 83455434c77Sek ASSERT3U(ds->ds_open_refcount, ==, DS_REF_MAX); 8351d452cf5Sahrens return (dsl_sync_task_do(ds->ds_dir->dd_pool, 8361d452cf5Sahrens dsl_dataset_rollback_check, dsl_dataset_rollback_sync, 8371d452cf5Sahrens ds, NULL, 0)); 8381d452cf5Sahrens } 8391d452cf5Sahrens 840fa9e4066Sahrens void * 841fa9e4066Sahrens dsl_dataset_set_user_ptr(dsl_dataset_t *ds, 842fa9e4066Sahrens void *p, dsl_dataset_evict_func_t func) 843fa9e4066Sahrens { 844fa9e4066Sahrens void *old; 845fa9e4066Sahrens 846fa9e4066Sahrens mutex_enter(&ds->ds_lock); 847fa9e4066Sahrens old = ds->ds_user_ptr; 848fa9e4066Sahrens if (old == NULL) { 849fa9e4066Sahrens ds->ds_user_ptr = p; 850fa9e4066Sahrens ds->ds_user_evict_func = func; 851fa9e4066Sahrens } 852fa9e4066Sahrens mutex_exit(&ds->ds_lock); 853fa9e4066Sahrens return (old); 854fa9e4066Sahrens } 855fa9e4066Sahrens 856fa9e4066Sahrens void * 857fa9e4066Sahrens dsl_dataset_get_user_ptr(dsl_dataset_t *ds) 858fa9e4066Sahrens { 859fa9e4066Sahrens return (ds->ds_user_ptr); 860fa9e4066Sahrens } 861fa9e4066Sahrens 862fa9e4066Sahrens 863c717a561Smaybee blkptr_t * 864c717a561Smaybee dsl_dataset_get_blkptr(dsl_dataset_t *ds) 865fa9e4066Sahrens { 866c717a561Smaybee return (&ds->ds_phys->ds_bp); 867fa9e4066Sahrens } 868fa9e4066Sahrens 869fa9e4066Sahrens void 870fa9e4066Sahrens dsl_dataset_set_blkptr(dsl_dataset_t *ds, blkptr_t *bp, dmu_tx_t *tx) 871fa9e4066Sahrens { 872fa9e4066Sahrens ASSERT(dmu_tx_is_syncing(tx)); 873fa9e4066Sahrens /* If it's the meta-objset, set dp_meta_rootbp */ 874fa9e4066Sahrens if (ds == NULL) { 875fa9e4066Sahrens tx->tx_pool->dp_meta_rootbp = *bp; 876fa9e4066Sahrens } else { 877fa9e4066Sahrens dmu_buf_will_dirty(ds->ds_dbuf, tx); 878fa9e4066Sahrens ds->ds_phys->ds_bp = *bp; 879fa9e4066Sahrens } 880fa9e4066Sahrens } 881fa9e4066Sahrens 882fa9e4066Sahrens spa_t * 883fa9e4066Sahrens dsl_dataset_get_spa(dsl_dataset_t *ds) 884fa9e4066Sahrens { 885fa9e4066Sahrens return (ds->ds_dir->dd_pool->dp_spa); 886fa9e4066Sahrens } 887fa9e4066Sahrens 888fa9e4066Sahrens void 889fa9e4066Sahrens dsl_dataset_dirty(dsl_dataset_t *ds, dmu_tx_t *tx) 890fa9e4066Sahrens { 891fa9e4066Sahrens dsl_pool_t *dp; 892fa9e4066Sahrens 893fa9e4066Sahrens if (ds == NULL) /* this is the meta-objset */ 894fa9e4066Sahrens return; 895fa9e4066Sahrens 896fa9e4066Sahrens ASSERT(ds->ds_user_ptr != NULL); 897a2eea2e1Sahrens 898a2eea2e1Sahrens if (ds->ds_phys->ds_next_snap_obj != 0) 899a2eea2e1Sahrens panic("dirtying snapshot!"); 900fa9e4066Sahrens 901fa9e4066Sahrens dp = ds->ds_dir->dd_pool; 902fa9e4066Sahrens 903fa9e4066Sahrens if (txg_list_add(&dp->dp_dirty_datasets, ds, tx->tx_txg) == 0) { 904fa9e4066Sahrens /* up the hold count until we can be written out */ 905fa9e4066Sahrens dmu_buf_add_ref(ds->ds_dbuf, ds); 906fa9e4066Sahrens } 907fa9e4066Sahrens } 908fa9e4066Sahrens 909fa9e4066Sahrens struct killarg { 910fa9e4066Sahrens uint64_t *usedp; 911fa9e4066Sahrens uint64_t *compressedp; 912fa9e4066Sahrens uint64_t *uncompressedp; 913fa9e4066Sahrens zio_t *zio; 914fa9e4066Sahrens dmu_tx_t *tx; 915fa9e4066Sahrens }; 916fa9e4066Sahrens 917fa9e4066Sahrens static int 918fa9e4066Sahrens kill_blkptr(traverse_blk_cache_t *bc, spa_t *spa, void *arg) 919fa9e4066Sahrens { 920fa9e4066Sahrens struct killarg *ka = arg; 921fa9e4066Sahrens blkptr_t *bp = &bc->bc_blkptr; 922fa9e4066Sahrens 923fa9e4066Sahrens ASSERT3U(bc->bc_errno, ==, 0); 924fa9e4066Sahrens 925fa9e4066Sahrens /* 926fa9e4066Sahrens * Since this callback is not called concurrently, no lock is 927fa9e4066Sahrens * needed on the accounting values. 928fa9e4066Sahrens */ 92999653d4eSeschrock *ka->usedp += bp_get_dasize(spa, bp); 930fa9e4066Sahrens *ka->compressedp += BP_GET_PSIZE(bp); 931fa9e4066Sahrens *ka->uncompressedp += BP_GET_UCSIZE(bp); 932fa9e4066Sahrens /* XXX check for EIO? */ 933fa9e4066Sahrens (void) arc_free(ka->zio, spa, ka->tx->tx_txg, bp, NULL, NULL, 934fa9e4066Sahrens ARC_NOWAIT); 935fa9e4066Sahrens return (0); 936fa9e4066Sahrens } 937fa9e4066Sahrens 938fa9e4066Sahrens /* ARGSUSED */ 9391d452cf5Sahrens static int 9401d452cf5Sahrens dsl_dataset_rollback_check(void *arg1, void *arg2, dmu_tx_t *tx) 941fa9e4066Sahrens { 9421d452cf5Sahrens dsl_dataset_t *ds = arg1; 943fa9e4066Sahrens 9441d452cf5Sahrens /* 9451d452cf5Sahrens * There must be a previous snapshot. I suppose we could roll 9461d452cf5Sahrens * it back to being empty (and re-initialize the upper (ZPL) 9471d452cf5Sahrens * layer). But for now there's no way to do this via the user 9481d452cf5Sahrens * interface. 9491d452cf5Sahrens */ 9501d452cf5Sahrens if (ds->ds_phys->ds_prev_snap_txg == 0) 951fa9e4066Sahrens return (EINVAL); 952fa9e4066Sahrens 9531d452cf5Sahrens /* 9541d452cf5Sahrens * This must not be a snapshot. 9551d452cf5Sahrens */ 9561d452cf5Sahrens if (ds->ds_phys->ds_next_snap_obj != 0) 957fa9e4066Sahrens return (EINVAL); 958fa9e4066Sahrens 959fa9e4066Sahrens /* 960fa9e4066Sahrens * If we made changes this txg, traverse_dsl_dataset won't find 961fa9e4066Sahrens * them. Try again. 962fa9e4066Sahrens */ 9631d452cf5Sahrens if (ds->ds_phys->ds_bp.blk_birth >= tx->tx_txg) 964fa9e4066Sahrens return (EAGAIN); 965fa9e4066Sahrens 9661d452cf5Sahrens return (0); 9671d452cf5Sahrens } 9681d452cf5Sahrens 9691d452cf5Sahrens /* ARGSUSED */ 9701d452cf5Sahrens static void 971*ecd6cf80Smarks dsl_dataset_rollback_sync(void *arg1, void *arg2, cred_t *cr, dmu_tx_t *tx) 9721d452cf5Sahrens { 9731d452cf5Sahrens dsl_dataset_t *ds = arg1; 9741d452cf5Sahrens objset_t *mos = ds->ds_dir->dd_pool->dp_meta_objset; 975fa9e4066Sahrens 976fa9e4066Sahrens dmu_buf_will_dirty(ds->ds_dbuf, tx); 977fa9e4066Sahrens 978fa9e4066Sahrens /* Zero out the deadlist. */ 979fa9e4066Sahrens bplist_close(&ds->ds_deadlist); 980fa9e4066Sahrens bplist_destroy(mos, ds->ds_phys->ds_deadlist_obj, tx); 981fa9e4066Sahrens ds->ds_phys->ds_deadlist_obj = 982fa9e4066Sahrens bplist_create(mos, DSL_DEADLIST_BLOCKSIZE, tx); 983ea8dc4b6Seschrock VERIFY(0 == bplist_open(&ds->ds_deadlist, mos, 984ea8dc4b6Seschrock ds->ds_phys->ds_deadlist_obj)); 985fa9e4066Sahrens 986fa9e4066Sahrens { 987fa9e4066Sahrens /* Free blkptrs that we gave birth to */ 988fa9e4066Sahrens zio_t *zio; 989fa9e4066Sahrens uint64_t used = 0, compressed = 0, uncompressed = 0; 990fa9e4066Sahrens struct killarg ka; 991fa9e4066Sahrens 992fa9e4066Sahrens zio = zio_root(tx->tx_pool->dp_spa, NULL, NULL, 993fa9e4066Sahrens ZIO_FLAG_MUSTSUCCEED); 994fa9e4066Sahrens ka.usedp = &used; 995fa9e4066Sahrens ka.compressedp = &compressed; 996fa9e4066Sahrens ka.uncompressedp = &uncompressed; 997fa9e4066Sahrens ka.zio = zio; 998fa9e4066Sahrens ka.tx = tx; 999fa9e4066Sahrens (void) traverse_dsl_dataset(ds, ds->ds_phys->ds_prev_snap_txg, 1000fa9e4066Sahrens ADVANCE_POST, kill_blkptr, &ka); 1001fa9e4066Sahrens (void) zio_wait(zio); 1002fa9e4066Sahrens 10031d452cf5Sahrens dsl_dir_diduse_space(ds->ds_dir, 1004fa9e4066Sahrens -used, -compressed, -uncompressed, tx); 1005fa9e4066Sahrens } 1006fa9e4066Sahrens 10071d452cf5Sahrens /* Change our contents to that of the prev snapshot */ 1008fa9e4066Sahrens ASSERT3U(ds->ds_prev->ds_object, ==, ds->ds_phys->ds_prev_snap_obj); 1009fa9e4066Sahrens ds->ds_phys->ds_bp = ds->ds_prev->ds_phys->ds_bp; 1010fa9e4066Sahrens ds->ds_phys->ds_used_bytes = ds->ds_prev->ds_phys->ds_used_bytes; 1011fa9e4066Sahrens ds->ds_phys->ds_compressed_bytes = 1012fa9e4066Sahrens ds->ds_prev->ds_phys->ds_compressed_bytes; 1013fa9e4066Sahrens ds->ds_phys->ds_uncompressed_bytes = 1014fa9e4066Sahrens ds->ds_prev->ds_phys->ds_uncompressed_bytes; 101599653d4eSeschrock ds->ds_phys->ds_flags = ds->ds_prev->ds_phys->ds_flags; 1016fa9e4066Sahrens ds->ds_phys->ds_unique_bytes = 0; 1017fa9e4066Sahrens 101885edac42Sahrens if (ds->ds_prev->ds_phys->ds_next_snap_obj == ds->ds_object) { 101985edac42Sahrens dmu_buf_will_dirty(ds->ds_prev->ds_dbuf, tx); 102085edac42Sahrens ds->ds_prev->ds_phys->ds_unique_bytes = 0; 102185edac42Sahrens } 1022*ecd6cf80Smarks 1023*ecd6cf80Smarks spa_history_internal_log(LOG_DS_ROLLBACK, ds->ds_dir->dd_pool->dp_spa, 1024*ecd6cf80Smarks tx, cr, "dataset = %llu", ds->ds_object); 1025fa9e4066Sahrens } 1026fa9e4066Sahrens 1027e1930233Sbonwick /* ARGSUSED */ 1028e1930233Sbonwick static int 10291d452cf5Sahrens dsl_dataset_destroy_begin_check(void *arg1, void *arg2, dmu_tx_t *tx) 1030e1930233Sbonwick { 10311d452cf5Sahrens dsl_dataset_t *ds = arg1; 1032e1930233Sbonwick 1033e1930233Sbonwick /* 1034e1930233Sbonwick * Can't delete a head dataset if there are snapshots of it. 1035e1930233Sbonwick * (Except if the only snapshots are from the branch we cloned 1036e1930233Sbonwick * from.) 1037e1930233Sbonwick */ 1038e1930233Sbonwick if (ds->ds_prev != NULL && 1039e1930233Sbonwick ds->ds_prev->ds_phys->ds_next_snap_obj == ds->ds_object) 1040e1930233Sbonwick return (EINVAL); 1041e1930233Sbonwick 1042e1930233Sbonwick return (0); 1043e1930233Sbonwick } 1044e1930233Sbonwick 10451d452cf5Sahrens /* ARGSUSED */ 10461d452cf5Sahrens static void 1047*ecd6cf80Smarks dsl_dataset_destroy_begin_sync(void *arg1, void *arg2, cred_t *cr, dmu_tx_t *tx) 1048fa9e4066Sahrens { 10491d452cf5Sahrens dsl_dataset_t *ds = arg1; 1050*ecd6cf80Smarks dsl_pool_t *dp = ds->ds_dir->dd_pool; 1051fa9e4066Sahrens 10521d452cf5Sahrens /* Mark it as inconsistent on-disk, in case we crash */ 10531d452cf5Sahrens dmu_buf_will_dirty(ds->ds_dbuf, tx); 10541d452cf5Sahrens ds->ds_phys->ds_flags |= DS_FLAG_INCONSISTENT; 1055*ecd6cf80Smarks 1056*ecd6cf80Smarks spa_history_internal_log(LOG_DS_DESTROY_BEGIN, dp->dp_spa, tx, 1057*ecd6cf80Smarks cr, "dataset = %llu", ds->ds_object); 10581d452cf5Sahrens } 1059fa9e4066Sahrens 10601d452cf5Sahrens /* ARGSUSED */ 10611d452cf5Sahrens static int 10621d452cf5Sahrens dsl_dataset_destroy_check(void *arg1, void *arg2, dmu_tx_t *tx) 10631d452cf5Sahrens { 10641d452cf5Sahrens dsl_dataset_t *ds = arg1; 1065fa9e4066Sahrens 1066fa9e4066Sahrens /* Can't delete a branch point. */ 10671d452cf5Sahrens if (ds->ds_phys->ds_num_children > 1) 10681d452cf5Sahrens return (EEXIST); 1069fa9e4066Sahrens 1070fa9e4066Sahrens /* 1071fa9e4066Sahrens * Can't delete a head dataset if there are snapshots of it. 1072fa9e4066Sahrens * (Except if the only snapshots are from the branch we cloned 1073fa9e4066Sahrens * from.) 1074fa9e4066Sahrens */ 1075fa9e4066Sahrens if (ds->ds_prev != NULL && 10761d452cf5Sahrens ds->ds_prev->ds_phys->ds_next_snap_obj == ds->ds_object) 1077fa9e4066Sahrens return (EINVAL); 1078fa9e4066Sahrens 1079fa9e4066Sahrens /* 1080fa9e4066Sahrens * If we made changes this txg, traverse_dsl_dataset won't find 1081fa9e4066Sahrens * them. Try again. 1082fa9e4066Sahrens */ 10831d452cf5Sahrens if (ds->ds_phys->ds_bp.blk_birth >= tx->tx_txg) 1084fa9e4066Sahrens return (EAGAIN); 10851d452cf5Sahrens 10861d452cf5Sahrens /* XXX we should do some i/o error checking... */ 10871d452cf5Sahrens return (0); 10881d452cf5Sahrens } 10891d452cf5Sahrens 10901d452cf5Sahrens static void 1091*ecd6cf80Smarks dsl_dataset_destroy_sync(void *arg1, void *tag, cred_t *cr, dmu_tx_t *tx) 10921d452cf5Sahrens { 10931d452cf5Sahrens dsl_dataset_t *ds = arg1; 10941d452cf5Sahrens uint64_t used = 0, compressed = 0, uncompressed = 0; 10951d452cf5Sahrens zio_t *zio; 10961d452cf5Sahrens int err; 10971d452cf5Sahrens int after_branch_point = FALSE; 10981d452cf5Sahrens dsl_pool_t *dp = ds->ds_dir->dd_pool; 10991d452cf5Sahrens objset_t *mos = dp->dp_meta_objset; 11001d452cf5Sahrens dsl_dataset_t *ds_prev = NULL; 11011d452cf5Sahrens uint64_t obj; 11021d452cf5Sahrens 110355434c77Sek ASSERT3U(ds->ds_open_refcount, ==, DS_REF_MAX); 11041d452cf5Sahrens ASSERT3U(ds->ds_phys->ds_num_children, <=, 1); 11051d452cf5Sahrens ASSERT(ds->ds_prev == NULL || 11061d452cf5Sahrens ds->ds_prev->ds_phys->ds_next_snap_obj != ds->ds_object); 11071d452cf5Sahrens ASSERT3U(ds->ds_phys->ds_bp.blk_birth, <=, tx->tx_txg); 11081d452cf5Sahrens 11091d452cf5Sahrens ASSERT(RW_WRITE_HELD(&dp->dp_config_rwlock)); 11101d452cf5Sahrens 11111d452cf5Sahrens obj = ds->ds_object; 1112fa9e4066Sahrens 1113fa9e4066Sahrens if (ds->ds_phys->ds_prev_snap_obj != 0) { 1114fa9e4066Sahrens if (ds->ds_prev) { 1115fa9e4066Sahrens ds_prev = ds->ds_prev; 1116fa9e4066Sahrens } else { 11171d452cf5Sahrens VERIFY(0 == dsl_dataset_open_obj(dp, 1118fa9e4066Sahrens ds->ds_phys->ds_prev_snap_obj, NULL, 11191d452cf5Sahrens DS_MODE_NONE, FTAG, &ds_prev)); 1120fa9e4066Sahrens } 1121fa9e4066Sahrens after_branch_point = 1122fa9e4066Sahrens (ds_prev->ds_phys->ds_next_snap_obj != obj); 1123fa9e4066Sahrens 1124fa9e4066Sahrens dmu_buf_will_dirty(ds_prev->ds_dbuf, tx); 1125fa9e4066Sahrens if (after_branch_point && 1126fa9e4066Sahrens ds->ds_phys->ds_next_snap_obj == 0) { 1127fa9e4066Sahrens /* This clone is toast. */ 1128fa9e4066Sahrens ASSERT(ds_prev->ds_phys->ds_num_children > 1); 1129fa9e4066Sahrens ds_prev->ds_phys->ds_num_children--; 1130fa9e4066Sahrens } else if (!after_branch_point) { 1131fa9e4066Sahrens ds_prev->ds_phys->ds_next_snap_obj = 1132fa9e4066Sahrens ds->ds_phys->ds_next_snap_obj; 1133fa9e4066Sahrens } 1134fa9e4066Sahrens } 1135fa9e4066Sahrens 1136fa9e4066Sahrens zio = zio_root(dp->dp_spa, NULL, NULL, ZIO_FLAG_MUSTSUCCEED); 1137fa9e4066Sahrens 1138fa9e4066Sahrens if (ds->ds_phys->ds_next_snap_obj != 0) { 11391d452cf5Sahrens blkptr_t bp; 1140fa9e4066Sahrens dsl_dataset_t *ds_next; 1141fa9e4066Sahrens uint64_t itor = 0; 1142fa9e4066Sahrens 1143fa9e4066Sahrens spa_scrub_restart(dp->dp_spa, tx->tx_txg); 1144fa9e4066Sahrens 11451d452cf5Sahrens VERIFY(0 == dsl_dataset_open_obj(dp, 1146ea8dc4b6Seschrock ds->ds_phys->ds_next_snap_obj, NULL, 1147ea8dc4b6Seschrock DS_MODE_NONE, FTAG, &ds_next)); 1148fa9e4066Sahrens ASSERT3U(ds_next->ds_phys->ds_prev_snap_obj, ==, obj); 1149fa9e4066Sahrens 1150fa9e4066Sahrens dmu_buf_will_dirty(ds_next->ds_dbuf, tx); 1151fa9e4066Sahrens ds_next->ds_phys->ds_prev_snap_obj = 1152fa9e4066Sahrens ds->ds_phys->ds_prev_snap_obj; 1153fa9e4066Sahrens ds_next->ds_phys->ds_prev_snap_txg = 1154fa9e4066Sahrens ds->ds_phys->ds_prev_snap_txg; 1155fa9e4066Sahrens ASSERT3U(ds->ds_phys->ds_prev_snap_txg, ==, 1156fa9e4066Sahrens ds_prev ? ds_prev->ds_phys->ds_creation_txg : 0); 1157fa9e4066Sahrens 1158fa9e4066Sahrens /* 1159fa9e4066Sahrens * Transfer to our deadlist (which will become next's 1160fa9e4066Sahrens * new deadlist) any entries from next's current 1161fa9e4066Sahrens * deadlist which were born before prev, and free the 1162fa9e4066Sahrens * other entries. 1163fa9e4066Sahrens * 1164fa9e4066Sahrens * XXX we're doing this long task with the config lock held 1165fa9e4066Sahrens */ 1166fa9e4066Sahrens while (bplist_iterate(&ds_next->ds_deadlist, &itor, 1167fa9e4066Sahrens &bp) == 0) { 1168fa9e4066Sahrens if (bp.blk_birth <= ds->ds_phys->ds_prev_snap_txg) { 1169ea8dc4b6Seschrock VERIFY(0 == bplist_enqueue(&ds->ds_deadlist, 1170ea8dc4b6Seschrock &bp, tx)); 1171fa9e4066Sahrens if (ds_prev && !after_branch_point && 1172fa9e4066Sahrens bp.blk_birth > 1173fa9e4066Sahrens ds_prev->ds_phys->ds_prev_snap_txg) { 1174fa9e4066Sahrens ds_prev->ds_phys->ds_unique_bytes += 117599653d4eSeschrock bp_get_dasize(dp->dp_spa, &bp); 1176fa9e4066Sahrens } 1177fa9e4066Sahrens } else { 117899653d4eSeschrock used += bp_get_dasize(dp->dp_spa, &bp); 1179fa9e4066Sahrens compressed += BP_GET_PSIZE(&bp); 1180fa9e4066Sahrens uncompressed += BP_GET_UCSIZE(&bp); 1181fa9e4066Sahrens /* XXX check return value? */ 1182fa9e4066Sahrens (void) arc_free(zio, dp->dp_spa, tx->tx_txg, 1183fa9e4066Sahrens &bp, NULL, NULL, ARC_NOWAIT); 1184fa9e4066Sahrens } 1185fa9e4066Sahrens } 1186fa9e4066Sahrens 1187fa9e4066Sahrens /* free next's deadlist */ 1188fa9e4066Sahrens bplist_close(&ds_next->ds_deadlist); 1189fa9e4066Sahrens bplist_destroy(mos, ds_next->ds_phys->ds_deadlist_obj, tx); 1190fa9e4066Sahrens 1191fa9e4066Sahrens /* set next's deadlist to our deadlist */ 1192fa9e4066Sahrens ds_next->ds_phys->ds_deadlist_obj = 1193fa9e4066Sahrens ds->ds_phys->ds_deadlist_obj; 1194ea8dc4b6Seschrock VERIFY(0 == bplist_open(&ds_next->ds_deadlist, mos, 1195ea8dc4b6Seschrock ds_next->ds_phys->ds_deadlist_obj)); 1196fa9e4066Sahrens ds->ds_phys->ds_deadlist_obj = 0; 1197fa9e4066Sahrens 1198fa9e4066Sahrens if (ds_next->ds_phys->ds_next_snap_obj != 0) { 1199fa9e4066Sahrens /* 1200fa9e4066Sahrens * Update next's unique to include blocks which 1201fa9e4066Sahrens * were previously shared by only this snapshot 1202fa9e4066Sahrens * and it. Those blocks will be born after the 1203fa9e4066Sahrens * prev snap and before this snap, and will have 1204fa9e4066Sahrens * died after the next snap and before the one 1205fa9e4066Sahrens * after that (ie. be on the snap after next's 1206fa9e4066Sahrens * deadlist). 1207fa9e4066Sahrens * 1208fa9e4066Sahrens * XXX we're doing this long task with the 1209fa9e4066Sahrens * config lock held 1210fa9e4066Sahrens */ 1211fa9e4066Sahrens dsl_dataset_t *ds_after_next; 1212fa9e4066Sahrens 12131d452cf5Sahrens VERIFY(0 == dsl_dataset_open_obj(dp, 1214fa9e4066Sahrens ds_next->ds_phys->ds_next_snap_obj, NULL, 1215ea8dc4b6Seschrock DS_MODE_NONE, FTAG, &ds_after_next)); 1216fa9e4066Sahrens itor = 0; 1217fa9e4066Sahrens while (bplist_iterate(&ds_after_next->ds_deadlist, 1218fa9e4066Sahrens &itor, &bp) == 0) { 1219fa9e4066Sahrens if (bp.blk_birth > 1220fa9e4066Sahrens ds->ds_phys->ds_prev_snap_txg && 1221fa9e4066Sahrens bp.blk_birth <= 1222fa9e4066Sahrens ds->ds_phys->ds_creation_txg) { 1223fa9e4066Sahrens ds_next->ds_phys->ds_unique_bytes += 122499653d4eSeschrock bp_get_dasize(dp->dp_spa, &bp); 1225fa9e4066Sahrens } 1226fa9e4066Sahrens } 1227fa9e4066Sahrens 1228fa9e4066Sahrens dsl_dataset_close(ds_after_next, DS_MODE_NONE, FTAG); 1229fa9e4066Sahrens ASSERT3P(ds_next->ds_prev, ==, NULL); 1230fa9e4066Sahrens } else { 1231fa9e4066Sahrens /* 1232fa9e4066Sahrens * It would be nice to update the head dataset's 1233fa9e4066Sahrens * unique. To do so we would have to traverse 1234fa9e4066Sahrens * it for blocks born after ds_prev, which is 1235fa9e4066Sahrens * pretty expensive just to maintain something 1236fa9e4066Sahrens * for debugging purposes. 1237fa9e4066Sahrens */ 1238fa9e4066Sahrens ASSERT3P(ds_next->ds_prev, ==, ds); 1239fa9e4066Sahrens dsl_dataset_close(ds_next->ds_prev, DS_MODE_NONE, 1240fa9e4066Sahrens ds_next); 1241fa9e4066Sahrens if (ds_prev) { 12421d452cf5Sahrens VERIFY(0 == dsl_dataset_open_obj(dp, 1243ea8dc4b6Seschrock ds->ds_phys->ds_prev_snap_obj, NULL, 1244ea8dc4b6Seschrock DS_MODE_NONE, ds_next, &ds_next->ds_prev)); 1245fa9e4066Sahrens } else { 1246fa9e4066Sahrens ds_next->ds_prev = NULL; 1247fa9e4066Sahrens } 1248fa9e4066Sahrens } 1249fa9e4066Sahrens dsl_dataset_close(ds_next, DS_MODE_NONE, FTAG); 1250fa9e4066Sahrens 1251fa9e4066Sahrens /* 1252fa9e4066Sahrens * NB: unique_bytes is not accurate for head objsets 1253fa9e4066Sahrens * because we don't update it when we delete the most 1254fa9e4066Sahrens * recent snapshot -- see above comment. 1255fa9e4066Sahrens */ 1256fa9e4066Sahrens ASSERT3U(used, ==, ds->ds_phys->ds_unique_bytes); 1257fa9e4066Sahrens } else { 1258fa9e4066Sahrens /* 1259fa9e4066Sahrens * There's no next snapshot, so this is a head dataset. 1260fa9e4066Sahrens * Destroy the deadlist. Unless it's a clone, the 1261fa9e4066Sahrens * deadlist should be empty. (If it's a clone, it's 1262fa9e4066Sahrens * safe to ignore the deadlist contents.) 1263fa9e4066Sahrens */ 1264fa9e4066Sahrens struct killarg ka; 1265fa9e4066Sahrens 1266fa9e4066Sahrens ASSERT(after_branch_point || bplist_empty(&ds->ds_deadlist)); 1267fa9e4066Sahrens bplist_close(&ds->ds_deadlist); 1268fa9e4066Sahrens bplist_destroy(mos, ds->ds_phys->ds_deadlist_obj, tx); 1269fa9e4066Sahrens ds->ds_phys->ds_deadlist_obj = 0; 1270fa9e4066Sahrens 1271fa9e4066Sahrens /* 1272fa9e4066Sahrens * Free everything that we point to (that's born after 1273fa9e4066Sahrens * the previous snapshot, if we are a clone) 1274fa9e4066Sahrens * 1275fa9e4066Sahrens * XXX we're doing this long task with the config lock held 1276fa9e4066Sahrens */ 1277fa9e4066Sahrens ka.usedp = &used; 1278fa9e4066Sahrens ka.compressedp = &compressed; 1279fa9e4066Sahrens ka.uncompressedp = &uncompressed; 1280fa9e4066Sahrens ka.zio = zio; 1281fa9e4066Sahrens ka.tx = tx; 1282fa9e4066Sahrens err = traverse_dsl_dataset(ds, ds->ds_phys->ds_prev_snap_txg, 1283fa9e4066Sahrens ADVANCE_POST, kill_blkptr, &ka); 1284fa9e4066Sahrens ASSERT3U(err, ==, 0); 1285fa9e4066Sahrens } 1286fa9e4066Sahrens 1287fa9e4066Sahrens err = zio_wait(zio); 1288fa9e4066Sahrens ASSERT3U(err, ==, 0); 1289fa9e4066Sahrens 12901d452cf5Sahrens dsl_dir_diduse_space(ds->ds_dir, -used, -compressed, -uncompressed, tx); 1291fa9e4066Sahrens 1292fa9e4066Sahrens if (ds->ds_phys->ds_snapnames_zapobj) { 1293fa9e4066Sahrens err = zap_destroy(mos, ds->ds_phys->ds_snapnames_zapobj, tx); 1294fa9e4066Sahrens ASSERT(err == 0); 1295fa9e4066Sahrens } 1296fa9e4066Sahrens 12971d452cf5Sahrens if (ds->ds_dir->dd_phys->dd_head_dataset_obj == ds->ds_object) { 1298fa9e4066Sahrens /* Erase the link in the dataset */ 12991d452cf5Sahrens dmu_buf_will_dirty(ds->ds_dir->dd_dbuf, tx); 13001d452cf5Sahrens ds->ds_dir->dd_phys->dd_head_dataset_obj = 0; 1301fa9e4066Sahrens /* 1302fa9e4066Sahrens * dsl_dir_sync_destroy() called us, they'll destroy 1303fa9e4066Sahrens * the dataset. 1304fa9e4066Sahrens */ 1305fa9e4066Sahrens } else { 1306fa9e4066Sahrens /* remove from snapshot namespace */ 1307fa9e4066Sahrens dsl_dataset_t *ds_head; 13081d452cf5Sahrens VERIFY(0 == dsl_dataset_open_obj(dp, 13091d452cf5Sahrens ds->ds_dir->dd_phys->dd_head_dataset_obj, NULL, 1310ea8dc4b6Seschrock DS_MODE_NONE, FTAG, &ds_head)); 13118660574dSahrens VERIFY(0 == dsl_dataset_get_snapname(ds)); 1312fa9e4066Sahrens #ifdef ZFS_DEBUG 1313fa9e4066Sahrens { 1314fa9e4066Sahrens uint64_t val; 1315fa9e4066Sahrens err = zap_lookup(mos, 1316fa9e4066Sahrens ds_head->ds_phys->ds_snapnames_zapobj, 13171d452cf5Sahrens ds->ds_snapname, 8, 1, &val); 1318fa9e4066Sahrens ASSERT3U(err, ==, 0); 1319fa9e4066Sahrens ASSERT3U(val, ==, obj); 1320fa9e4066Sahrens } 1321fa9e4066Sahrens #endif 1322fa9e4066Sahrens err = zap_remove(mos, ds_head->ds_phys->ds_snapnames_zapobj, 13231d452cf5Sahrens ds->ds_snapname, tx); 1324fa9e4066Sahrens ASSERT(err == 0); 1325fa9e4066Sahrens dsl_dataset_close(ds_head, DS_MODE_NONE, FTAG); 1326fa9e4066Sahrens } 1327fa9e4066Sahrens 1328fa9e4066Sahrens if (ds_prev && ds->ds_prev != ds_prev) 1329fa9e4066Sahrens dsl_dataset_close(ds_prev, DS_MODE_NONE, FTAG); 1330fa9e4066Sahrens 1331b1b8ab34Slling spa_clear_bootfs(dp->dp_spa, ds->ds_object, tx); 1332*ecd6cf80Smarks spa_history_internal_log(LOG_DS_DESTROY, dp->dp_spa, tx, 1333*ecd6cf80Smarks cr, "dataset = %llu", ds->ds_object); 1334*ecd6cf80Smarks 13351d452cf5Sahrens dsl_dataset_close(ds, DS_MODE_EXCLUSIVE, tag); 13361d452cf5Sahrens VERIFY(0 == dmu_object_free(mos, obj, tx)); 1337b1b8ab34Slling 1338fa9e4066Sahrens } 1339fa9e4066Sahrens 13401d452cf5Sahrens /* ARGSUSED */ 1341fa9e4066Sahrens int 13421d452cf5Sahrens dsl_dataset_snapshot_check(void *arg1, void *arg2, dmu_tx_t *tx) 1343fa9e4066Sahrens { 13441d452cf5Sahrens objset_t *os = arg1; 13451d452cf5Sahrens dsl_dataset_t *ds = os->os->os_dsl_dataset; 13461d452cf5Sahrens const char *snapname = arg2; 13471d452cf5Sahrens objset_t *mos = ds->ds_dir->dd_pool->dp_meta_objset; 1348fa9e4066Sahrens int err; 13491d452cf5Sahrens uint64_t value; 1350fa9e4066Sahrens 13511d452cf5Sahrens /* 13521d452cf5Sahrens * We don't allow multiple snapshots of the same txg. If there 13531d452cf5Sahrens * is already one, try again. 13541d452cf5Sahrens */ 13551d452cf5Sahrens if (ds->ds_phys->ds_prev_snap_txg >= tx->tx_txg) 13561d452cf5Sahrens return (EAGAIN); 1357fa9e4066Sahrens 13581d452cf5Sahrens /* 13591d452cf5Sahrens * Check for conflicting name snapshot name. 13601d452cf5Sahrens */ 1361fa9e4066Sahrens err = zap_lookup(mos, ds->ds_phys->ds_snapnames_zapobj, 1362fa9e4066Sahrens snapname, 8, 1, &value); 13631d452cf5Sahrens if (err == 0) 1364fa9e4066Sahrens return (EEXIST); 13651d452cf5Sahrens if (err != ENOENT) 13661d452cf5Sahrens return (err); 1367fa9e4066Sahrens 1368b7661cccSmmusante /* 1369b7661cccSmmusante * Check that the dataset's name is not too long. Name consists 1370b7661cccSmmusante * of the dataset's length + 1 for the @-sign + snapshot name's length 1371b7661cccSmmusante */ 1372b7661cccSmmusante if (dsl_dataset_namelen(ds) + 1 + strlen(snapname) >= MAXNAMELEN) 1373b7661cccSmmusante return (ENAMETOOLONG); 1374b7661cccSmmusante 13751d452cf5Sahrens ds->ds_trysnap_txg = tx->tx_txg; 13761d452cf5Sahrens return (0); 13771d452cf5Sahrens } 1378fa9e4066Sahrens 13791d452cf5Sahrens void 1380*ecd6cf80Smarks dsl_dataset_snapshot_sync(void *arg1, void *arg2, cred_t *cr, dmu_tx_t *tx) 13811d452cf5Sahrens { 13821d452cf5Sahrens objset_t *os = arg1; 13831d452cf5Sahrens dsl_dataset_t *ds = os->os->os_dsl_dataset; 13841d452cf5Sahrens const char *snapname = arg2; 13851d452cf5Sahrens dsl_pool_t *dp = ds->ds_dir->dd_pool; 13861d452cf5Sahrens dmu_buf_t *dbuf; 13871d452cf5Sahrens dsl_dataset_phys_t *dsphys; 13881d452cf5Sahrens uint64_t dsobj; 13891d452cf5Sahrens objset_t *mos = dp->dp_meta_objset; 13901d452cf5Sahrens int err; 1391fa9e4066Sahrens 1392fa9e4066Sahrens spa_scrub_restart(dp->dp_spa, tx->tx_txg); 13931d452cf5Sahrens ASSERT(RW_WRITE_HELD(&dp->dp_config_rwlock)); 1394fa9e4066Sahrens 13951649cd4bStabriz dsobj = dmu_object_alloc(mos, DMU_OT_DSL_DATASET, 0, 13961649cd4bStabriz DMU_OT_DSL_DATASET, sizeof (dsl_dataset_phys_t), tx); 1397ea8dc4b6Seschrock VERIFY(0 == dmu_bonus_hold(mos, dsobj, FTAG, &dbuf)); 1398fa9e4066Sahrens dmu_buf_will_dirty(dbuf, tx); 1399fa9e4066Sahrens dsphys = dbuf->db_data; 14001d452cf5Sahrens dsphys->ds_dir_obj = ds->ds_dir->dd_object; 1401fa9e4066Sahrens dsphys->ds_fsid_guid = unique_create(); 1402fa9e4066Sahrens unique_remove(dsphys->ds_fsid_guid); /* it isn't open yet */ 1403fa9e4066Sahrens (void) random_get_pseudo_bytes((void*)&dsphys->ds_guid, 1404fa9e4066Sahrens sizeof (dsphys->ds_guid)); 1405fa9e4066Sahrens dsphys->ds_prev_snap_obj = ds->ds_phys->ds_prev_snap_obj; 1406fa9e4066Sahrens dsphys->ds_prev_snap_txg = ds->ds_phys->ds_prev_snap_txg; 1407fa9e4066Sahrens dsphys->ds_next_snap_obj = ds->ds_object; 1408fa9e4066Sahrens dsphys->ds_num_children = 1; 1409fa9e4066Sahrens dsphys->ds_creation_time = gethrestime_sec(); 1410fa9e4066Sahrens dsphys->ds_creation_txg = tx->tx_txg; 1411fa9e4066Sahrens dsphys->ds_deadlist_obj = ds->ds_phys->ds_deadlist_obj; 1412fa9e4066Sahrens dsphys->ds_used_bytes = ds->ds_phys->ds_used_bytes; 1413fa9e4066Sahrens dsphys->ds_compressed_bytes = ds->ds_phys->ds_compressed_bytes; 1414fa9e4066Sahrens dsphys->ds_uncompressed_bytes = ds->ds_phys->ds_uncompressed_bytes; 141599653d4eSeschrock dsphys->ds_flags = ds->ds_phys->ds_flags; 1416fa9e4066Sahrens dsphys->ds_bp = ds->ds_phys->ds_bp; 1417ea8dc4b6Seschrock dmu_buf_rele(dbuf, FTAG); 1418fa9e4066Sahrens 14191d452cf5Sahrens ASSERT3U(ds->ds_prev != 0, ==, ds->ds_phys->ds_prev_snap_obj != 0); 14201d452cf5Sahrens if (ds->ds_prev) { 14211d452cf5Sahrens ASSERT(ds->ds_prev->ds_phys->ds_next_snap_obj == 1422fa9e4066Sahrens ds->ds_object || 14231d452cf5Sahrens ds->ds_prev->ds_phys->ds_num_children > 1); 14241d452cf5Sahrens if (ds->ds_prev->ds_phys->ds_next_snap_obj == ds->ds_object) { 14251d452cf5Sahrens dmu_buf_will_dirty(ds->ds_prev->ds_dbuf, tx); 1426fa9e4066Sahrens ASSERT3U(ds->ds_phys->ds_prev_snap_txg, ==, 14271d452cf5Sahrens ds->ds_prev->ds_phys->ds_creation_txg); 14281d452cf5Sahrens ds->ds_prev->ds_phys->ds_next_snap_obj = dsobj; 1429fa9e4066Sahrens } 1430fa9e4066Sahrens } 1431fa9e4066Sahrens 1432fa9e4066Sahrens bplist_close(&ds->ds_deadlist); 1433fa9e4066Sahrens dmu_buf_will_dirty(ds->ds_dbuf, tx); 1434fa9e4066Sahrens ASSERT3U(ds->ds_phys->ds_prev_snap_txg, <, dsphys->ds_creation_txg); 1435fa9e4066Sahrens ds->ds_phys->ds_prev_snap_obj = dsobj; 1436fa9e4066Sahrens ds->ds_phys->ds_prev_snap_txg = dsphys->ds_creation_txg; 1437fa9e4066Sahrens ds->ds_phys->ds_unique_bytes = 0; 1438fa9e4066Sahrens ds->ds_phys->ds_deadlist_obj = 1439fa9e4066Sahrens bplist_create(mos, DSL_DEADLIST_BLOCKSIZE, tx); 1440ea8dc4b6Seschrock VERIFY(0 == bplist_open(&ds->ds_deadlist, mos, 1441ea8dc4b6Seschrock ds->ds_phys->ds_deadlist_obj)); 1442fa9e4066Sahrens 1443fa9e4066Sahrens dprintf("snap '%s' -> obj %llu\n", snapname, dsobj); 1444fa9e4066Sahrens err = zap_add(mos, ds->ds_phys->ds_snapnames_zapobj, 1445fa9e4066Sahrens snapname, 8, 1, &dsobj, tx); 1446fa9e4066Sahrens ASSERT(err == 0); 1447fa9e4066Sahrens 1448fa9e4066Sahrens if (ds->ds_prev) 1449fa9e4066Sahrens dsl_dataset_close(ds->ds_prev, DS_MODE_NONE, ds); 1450ea8dc4b6Seschrock VERIFY(0 == dsl_dataset_open_obj(dp, 1451ea8dc4b6Seschrock ds->ds_phys->ds_prev_snap_obj, snapname, 1452ea8dc4b6Seschrock DS_MODE_NONE, ds, &ds->ds_prev)); 1453*ecd6cf80Smarks 1454*ecd6cf80Smarks spa_history_internal_log(LOG_DS_SNAPSHOT, dp->dp_spa, tx, cr, 1455*ecd6cf80Smarks "dataset = %llu", ds->ds_object); 1456fa9e4066Sahrens } 1457fa9e4066Sahrens 1458fa9e4066Sahrens void 1459c717a561Smaybee dsl_dataset_sync(dsl_dataset_t *ds, zio_t *zio, dmu_tx_t *tx) 1460fa9e4066Sahrens { 1461fa9e4066Sahrens ASSERT(dmu_tx_is_syncing(tx)); 1462fa9e4066Sahrens ASSERT(ds->ds_user_ptr != NULL); 1463fa9e4066Sahrens ASSERT(ds->ds_phys->ds_next_snap_obj == 0); 1464fa9e4066Sahrens 1465fa9e4066Sahrens dsl_dir_dirty(ds->ds_dir, tx); 1466c717a561Smaybee dmu_objset_sync(ds->ds_user_ptr, zio, tx); 1467c717a561Smaybee /* Unneeded? bplist_close(&ds->ds_deadlist); */ 1468fa9e4066Sahrens } 1469fa9e4066Sahrens 1470fa9e4066Sahrens void 1471a2eea2e1Sahrens dsl_dataset_stats(dsl_dataset_t *ds, nvlist_t *nv) 1472fa9e4066Sahrens { 1473a2eea2e1Sahrens dsl_dir_stats(ds->ds_dir, nv); 1474fa9e4066Sahrens 1475a2eea2e1Sahrens dsl_prop_nvlist_add_uint64(nv, ZFS_PROP_CREATION, 1476a2eea2e1Sahrens ds->ds_phys->ds_creation_time); 1477a2eea2e1Sahrens dsl_prop_nvlist_add_uint64(nv, ZFS_PROP_CREATETXG, 1478a2eea2e1Sahrens ds->ds_phys->ds_creation_txg); 1479a2eea2e1Sahrens dsl_prop_nvlist_add_uint64(nv, ZFS_PROP_REFERENCED, 1480a2eea2e1Sahrens ds->ds_phys->ds_used_bytes); 1481fa9e4066Sahrens 1482fa9e4066Sahrens if (ds->ds_phys->ds_next_snap_obj) { 1483fa9e4066Sahrens /* 1484fa9e4066Sahrens * This is a snapshot; override the dd's space used with 1485a2eea2e1Sahrens * our unique space and compression ratio. 1486fa9e4066Sahrens */ 1487a2eea2e1Sahrens dsl_prop_nvlist_add_uint64(nv, ZFS_PROP_USED, 1488a2eea2e1Sahrens ds->ds_phys->ds_unique_bytes); 1489a2eea2e1Sahrens dsl_prop_nvlist_add_uint64(nv, ZFS_PROP_COMPRESSRATIO, 1490a2eea2e1Sahrens ds->ds_phys->ds_compressed_bytes == 0 ? 100 : 1491a2eea2e1Sahrens (ds->ds_phys->ds_uncompressed_bytes * 100 / 1492a2eea2e1Sahrens ds->ds_phys->ds_compressed_bytes)); 1493fa9e4066Sahrens } 1494fa9e4066Sahrens } 1495fa9e4066Sahrens 1496a2eea2e1Sahrens void 1497a2eea2e1Sahrens dsl_dataset_fast_stat(dsl_dataset_t *ds, dmu_objset_stats_t *stat) 1498a2eea2e1Sahrens { 1499a2eea2e1Sahrens stat->dds_creation_txg = ds->ds_phys->ds_creation_txg; 1500a2eea2e1Sahrens stat->dds_inconsistent = ds->ds_phys->ds_flags & DS_FLAG_INCONSISTENT; 1501a2eea2e1Sahrens if (ds->ds_phys->ds_next_snap_obj) { 1502a2eea2e1Sahrens stat->dds_is_snapshot = B_TRUE; 1503a2eea2e1Sahrens stat->dds_num_clones = ds->ds_phys->ds_num_children - 1; 1504a2eea2e1Sahrens } 1505a2eea2e1Sahrens 1506a2eea2e1Sahrens /* clone origin is really a dsl_dir thing... */ 1507a2eea2e1Sahrens if (ds->ds_dir->dd_phys->dd_clone_parent_obj) { 1508a2eea2e1Sahrens dsl_dataset_t *ods; 1509a2eea2e1Sahrens 1510a2eea2e1Sahrens rw_enter(&ds->ds_dir->dd_pool->dp_config_rwlock, RW_READER); 1511a2eea2e1Sahrens VERIFY(0 == dsl_dataset_open_obj(ds->ds_dir->dd_pool, 1512a2eea2e1Sahrens ds->ds_dir->dd_phys->dd_clone_parent_obj, 1513a2eea2e1Sahrens NULL, DS_MODE_NONE, FTAG, &ods)); 1514a2eea2e1Sahrens dsl_dataset_name(ods, stat->dds_clone_of); 1515a2eea2e1Sahrens dsl_dataset_close(ods, DS_MODE_NONE, FTAG); 1516a2eea2e1Sahrens rw_exit(&ds->ds_dir->dd_pool->dp_config_rwlock); 1517a2eea2e1Sahrens } 1518a2eea2e1Sahrens } 1519a2eea2e1Sahrens 1520a2eea2e1Sahrens uint64_t 1521a2eea2e1Sahrens dsl_dataset_fsid_guid(dsl_dataset_t *ds) 1522a2eea2e1Sahrens { 1523a2eea2e1Sahrens return (ds->ds_phys->ds_fsid_guid); 1524a2eea2e1Sahrens } 1525a2eea2e1Sahrens 1526a2eea2e1Sahrens void 1527a2eea2e1Sahrens dsl_dataset_space(dsl_dataset_t *ds, 1528a2eea2e1Sahrens uint64_t *refdbytesp, uint64_t *availbytesp, 1529a2eea2e1Sahrens uint64_t *usedobjsp, uint64_t *availobjsp) 1530fa9e4066Sahrens { 1531a2eea2e1Sahrens *refdbytesp = ds->ds_phys->ds_used_bytes; 1532a2eea2e1Sahrens *availbytesp = dsl_dir_space_available(ds->ds_dir, NULL, 0, TRUE); 1533a2eea2e1Sahrens *usedobjsp = ds->ds_phys->ds_bp.blk_fill; 1534a2eea2e1Sahrens *availobjsp = DN_MAX_OBJECT - *usedobjsp; 1535fa9e4066Sahrens } 1536fa9e4066Sahrens 15371d452cf5Sahrens /* ARGSUSED */ 1538fa9e4066Sahrens static int 15391d452cf5Sahrens dsl_dataset_snapshot_rename_check(void *arg1, void *arg2, dmu_tx_t *tx) 1540fa9e4066Sahrens { 15411d452cf5Sahrens dsl_dataset_t *ds = arg1; 15421d452cf5Sahrens char *newsnapname = arg2; 15431d452cf5Sahrens dsl_dir_t *dd = ds->ds_dir; 1544fa9e4066Sahrens objset_t *mos = dd->dd_pool->dp_meta_objset; 15451d452cf5Sahrens dsl_dataset_t *hds; 1546fa9e4066Sahrens uint64_t val; 15471d452cf5Sahrens int err; 1548fa9e4066Sahrens 15491d452cf5Sahrens err = dsl_dataset_open_obj(dd->dd_pool, 15501d452cf5Sahrens dd->dd_phys->dd_head_dataset_obj, NULL, DS_MODE_NONE, FTAG, &hds); 1551fa9e4066Sahrens if (err) 1552fa9e4066Sahrens return (err); 1553fa9e4066Sahrens 15541d452cf5Sahrens /* new name better not be in use */ 15551d452cf5Sahrens err = zap_lookup(mos, hds->ds_phys->ds_snapnames_zapobj, 15561d452cf5Sahrens newsnapname, 8, 1, &val); 15571d452cf5Sahrens dsl_dataset_close(hds, DS_MODE_NONE, FTAG); 15581d452cf5Sahrens 15591d452cf5Sahrens if (err == 0) 15601d452cf5Sahrens err = EEXIST; 15611d452cf5Sahrens else if (err == ENOENT) 15621d452cf5Sahrens err = 0; 1563cdf5b4caSmmusante 1564cdf5b4caSmmusante /* dataset name + 1 for the "@" + the new snapshot name must fit */ 1565cdf5b4caSmmusante if (dsl_dir_namelen(ds->ds_dir) + 1 + strlen(newsnapname) >= MAXNAMELEN) 1566cdf5b4caSmmusante err = ENAMETOOLONG; 1567cdf5b4caSmmusante 15681d452cf5Sahrens return (err); 15691d452cf5Sahrens } 1570fa9e4066Sahrens 15711d452cf5Sahrens static void 1572*ecd6cf80Smarks dsl_dataset_snapshot_rename_sync(void *arg1, void *arg2, 1573*ecd6cf80Smarks cred_t *cr, dmu_tx_t *tx) 15741d452cf5Sahrens { 15751d452cf5Sahrens dsl_dataset_t *ds = arg1; 1576*ecd6cf80Smarks const char *newsnapname = arg2; 15771d452cf5Sahrens dsl_dir_t *dd = ds->ds_dir; 15781d452cf5Sahrens objset_t *mos = dd->dd_pool->dp_meta_objset; 15791d452cf5Sahrens dsl_dataset_t *hds; 15801d452cf5Sahrens int err; 1581fa9e4066Sahrens 15821d452cf5Sahrens ASSERT(ds->ds_phys->ds_next_snap_obj != 0); 1583fa9e4066Sahrens 15841d452cf5Sahrens VERIFY(0 == dsl_dataset_open_obj(dd->dd_pool, 15851d452cf5Sahrens dd->dd_phys->dd_head_dataset_obj, NULL, DS_MODE_NONE, FTAG, &hds)); 1586fa9e4066Sahrens 15871d452cf5Sahrens VERIFY(0 == dsl_dataset_get_snapname(ds)); 15881d452cf5Sahrens err = zap_remove(mos, hds->ds_phys->ds_snapnames_zapobj, 15891d452cf5Sahrens ds->ds_snapname, tx); 1590fa9e4066Sahrens ASSERT3U(err, ==, 0); 15911d452cf5Sahrens mutex_enter(&ds->ds_lock); 15921d452cf5Sahrens (void) strcpy(ds->ds_snapname, newsnapname); 15931d452cf5Sahrens mutex_exit(&ds->ds_lock); 15941d452cf5Sahrens err = zap_add(mos, hds->ds_phys->ds_snapnames_zapobj, 15951d452cf5Sahrens ds->ds_snapname, 8, 1, &ds->ds_object, tx); 1596fa9e4066Sahrens ASSERT3U(err, ==, 0); 1597fa9e4066Sahrens 1598*ecd6cf80Smarks spa_history_internal_log(LOG_DS_RENAME, dd->dd_pool->dp_spa, tx, 1599*ecd6cf80Smarks cr, "dataset = %llu", ds->ds_object); 16001d452cf5Sahrens dsl_dataset_close(hds, DS_MODE_NONE, FTAG); 1601fa9e4066Sahrens } 1602fa9e4066Sahrens 1603cdf5b4caSmmusante struct renamearg { 1604cdf5b4caSmmusante dsl_sync_task_group_t *dstg; 1605cdf5b4caSmmusante char failed[MAXPATHLEN]; 1606cdf5b4caSmmusante char *oldsnap; 1607cdf5b4caSmmusante char *newsnap; 1608cdf5b4caSmmusante }; 1609cdf5b4caSmmusante 1610cdf5b4caSmmusante static int 1611cdf5b4caSmmusante dsl_snapshot_rename_one(char *name, void *arg) 1612cdf5b4caSmmusante { 1613cdf5b4caSmmusante struct renamearg *ra = arg; 1614cdf5b4caSmmusante dsl_dataset_t *ds = NULL; 1615cdf5b4caSmmusante char *cp; 1616cdf5b4caSmmusante int err; 1617cdf5b4caSmmusante 1618cdf5b4caSmmusante cp = name + strlen(name); 1619cdf5b4caSmmusante *cp = '@'; 1620cdf5b4caSmmusante (void) strcpy(cp + 1, ra->oldsnap); 1621*ecd6cf80Smarks 1622*ecd6cf80Smarks /* 1623*ecd6cf80Smarks * For recursive snapshot renames the parent won't be changing 1624*ecd6cf80Smarks * so we just pass name for both the to/from argument. 1625*ecd6cf80Smarks */ 1626*ecd6cf80Smarks if (err = zfs_secpolicy_rename_perms(name, name, CRED())) { 1627*ecd6cf80Smarks (void) strcpy(ra->failed, name); 1628*ecd6cf80Smarks return (err); 1629*ecd6cf80Smarks } 1630*ecd6cf80Smarks 1631cdf5b4caSmmusante err = dsl_dataset_open(name, DS_MODE_READONLY | DS_MODE_STANDARD, 1632cdf5b4caSmmusante ra->dstg, &ds); 1633cdf5b4caSmmusante if (err == ENOENT) { 1634cdf5b4caSmmusante *cp = '\0'; 1635cdf5b4caSmmusante return (0); 1636cdf5b4caSmmusante } 1637cdf5b4caSmmusante if (err) { 1638cdf5b4caSmmusante (void) strcpy(ra->failed, name); 1639cdf5b4caSmmusante *cp = '\0'; 1640cdf5b4caSmmusante dsl_dataset_close(ds, DS_MODE_STANDARD, ra->dstg); 1641cdf5b4caSmmusante return (err); 1642cdf5b4caSmmusante } 1643cdf5b4caSmmusante 1644cdf5b4caSmmusante #ifdef _KERNEL 1645cdf5b4caSmmusante /* for all filesystems undergoing rename, we'll need to unmount it */ 1646cdf5b4caSmmusante (void) zfs_unmount_snap(name, NULL); 1647cdf5b4caSmmusante #endif 1648cdf5b4caSmmusante 1649cdf5b4caSmmusante *cp = '\0'; 1650cdf5b4caSmmusante 1651cdf5b4caSmmusante dsl_sync_task_create(ra->dstg, dsl_dataset_snapshot_rename_check, 1652cdf5b4caSmmusante dsl_dataset_snapshot_rename_sync, ds, ra->newsnap, 0); 1653cdf5b4caSmmusante 1654cdf5b4caSmmusante return (0); 1655cdf5b4caSmmusante } 1656cdf5b4caSmmusante 1657cdf5b4caSmmusante static int 1658cdf5b4caSmmusante dsl_recursive_rename(char *oldname, const char *newname) 1659cdf5b4caSmmusante { 1660cdf5b4caSmmusante int err; 1661cdf5b4caSmmusante struct renamearg *ra; 1662cdf5b4caSmmusante dsl_sync_task_t *dst; 1663cdf5b4caSmmusante spa_t *spa; 1664cdf5b4caSmmusante char *cp, *fsname = spa_strdup(oldname); 1665cdf5b4caSmmusante int len = strlen(oldname); 1666cdf5b4caSmmusante 1667cdf5b4caSmmusante /* truncate the snapshot name to get the fsname */ 1668cdf5b4caSmmusante cp = strchr(fsname, '@'); 1669cdf5b4caSmmusante *cp = '\0'; 1670cdf5b4caSmmusante 1671cdf5b4caSmmusante cp = strchr(fsname, '/'); 1672cdf5b4caSmmusante if (cp) { 1673cdf5b4caSmmusante *cp = '\0'; 1674cdf5b4caSmmusante err = spa_open(fsname, &spa, FTAG); 1675cdf5b4caSmmusante *cp = '/'; 1676cdf5b4caSmmusante } else { 1677cdf5b4caSmmusante err = spa_open(fsname, &spa, FTAG); 1678cdf5b4caSmmusante } 1679cdf5b4caSmmusante if (err) { 1680cdf5b4caSmmusante kmem_free(fsname, len + 1); 1681cdf5b4caSmmusante return (err); 1682cdf5b4caSmmusante } 1683cdf5b4caSmmusante ra = kmem_alloc(sizeof (struct renamearg), KM_SLEEP); 1684cdf5b4caSmmusante ra->dstg = dsl_sync_task_group_create(spa_get_dsl(spa)); 1685cdf5b4caSmmusante 1686cdf5b4caSmmusante ra->oldsnap = strchr(oldname, '@') + 1; 1687cdf5b4caSmmusante ra->newsnap = strchr(newname, '@') + 1; 1688cdf5b4caSmmusante *ra->failed = '\0'; 1689cdf5b4caSmmusante 1690cdf5b4caSmmusante err = dmu_objset_find(fsname, dsl_snapshot_rename_one, ra, 1691cdf5b4caSmmusante DS_FIND_CHILDREN); 1692cdf5b4caSmmusante kmem_free(fsname, len + 1); 1693cdf5b4caSmmusante 1694cdf5b4caSmmusante if (err == 0) { 1695cdf5b4caSmmusante err = dsl_sync_task_group_wait(ra->dstg); 1696cdf5b4caSmmusante } 1697cdf5b4caSmmusante 1698cdf5b4caSmmusante for (dst = list_head(&ra->dstg->dstg_tasks); dst; 1699cdf5b4caSmmusante dst = list_next(&ra->dstg->dstg_tasks, dst)) { 1700cdf5b4caSmmusante dsl_dataset_t *ds = dst->dst_arg1; 1701cdf5b4caSmmusante if (dst->dst_err) { 1702cdf5b4caSmmusante dsl_dir_name(ds->ds_dir, ra->failed); 17032572aa4eSmmusante (void) strcat(ra->failed, "@"); 17042572aa4eSmmusante (void) strcat(ra->failed, ra->newsnap); 1705cdf5b4caSmmusante } 1706cdf5b4caSmmusante dsl_dataset_close(ds, DS_MODE_STANDARD, ra->dstg); 1707cdf5b4caSmmusante } 1708cdf5b4caSmmusante 1709*ecd6cf80Smarks if (err) 1710*ecd6cf80Smarks (void) strcpy(oldname, ra->failed); 1711cdf5b4caSmmusante 1712cdf5b4caSmmusante dsl_sync_task_group_destroy(ra->dstg); 1713cdf5b4caSmmusante kmem_free(ra, sizeof (struct renamearg)); 1714cdf5b4caSmmusante spa_close(spa, FTAG); 1715cdf5b4caSmmusante return (err); 1716cdf5b4caSmmusante } 1717cdf5b4caSmmusante 1718fa9e4066Sahrens #pragma weak dmu_objset_rename = dsl_dataset_rename 1719fa9e4066Sahrens int 1720cdf5b4caSmmusante dsl_dataset_rename(char *oldname, const char *newname, 1721cdf5b4caSmmusante boolean_t recursive) 1722fa9e4066Sahrens { 1723fa9e4066Sahrens dsl_dir_t *dd; 17241d452cf5Sahrens dsl_dataset_t *ds; 1725fa9e4066Sahrens const char *tail; 1726fa9e4066Sahrens int err; 1727fa9e4066Sahrens 17281d452cf5Sahrens err = dsl_dir_open(oldname, FTAG, &dd, &tail); 1729ea8dc4b6Seschrock if (err) 1730ea8dc4b6Seschrock return (err); 1731fa9e4066Sahrens if (tail == NULL) { 17321d452cf5Sahrens err = dsl_dir_rename(dd, newname); 1733fa9e4066Sahrens dsl_dir_close(dd, FTAG); 1734fa9e4066Sahrens return (err); 1735fa9e4066Sahrens } 1736fa9e4066Sahrens if (tail[0] != '@') { 1737fa9e4066Sahrens /* the name ended in a nonexistant component */ 1738fa9e4066Sahrens dsl_dir_close(dd, FTAG); 1739fa9e4066Sahrens return (ENOENT); 1740fa9e4066Sahrens } 1741fa9e4066Sahrens 1742fa9e4066Sahrens dsl_dir_close(dd, FTAG); 17431d452cf5Sahrens 17441d452cf5Sahrens /* new name must be snapshot in same filesystem */ 17451d452cf5Sahrens tail = strchr(newname, '@'); 17461d452cf5Sahrens if (tail == NULL) 17471d452cf5Sahrens return (EINVAL); 17481d452cf5Sahrens tail++; 17491d452cf5Sahrens if (strncmp(oldname, newname, tail - newname) != 0) 17501d452cf5Sahrens return (EXDEV); 17511d452cf5Sahrens 1752cdf5b4caSmmusante if (recursive) { 1753cdf5b4caSmmusante err = dsl_recursive_rename(oldname, newname); 1754cdf5b4caSmmusante } else { 1755cdf5b4caSmmusante err = dsl_dataset_open(oldname, 1756cdf5b4caSmmusante DS_MODE_READONLY | DS_MODE_STANDARD, FTAG, &ds); 1757cdf5b4caSmmusante if (err) 1758cdf5b4caSmmusante return (err); 17591d452cf5Sahrens 1760cdf5b4caSmmusante err = dsl_sync_task_do(ds->ds_dir->dd_pool, 1761cdf5b4caSmmusante dsl_dataset_snapshot_rename_check, 1762cdf5b4caSmmusante dsl_dataset_snapshot_rename_sync, ds, (char *)tail, 1); 17631d452cf5Sahrens 1764cdf5b4caSmmusante dsl_dataset_close(ds, DS_MODE_STANDARD, FTAG); 1765cdf5b4caSmmusante } 17661d452cf5Sahrens 1767fa9e4066Sahrens return (err); 1768fa9e4066Sahrens } 176999653d4eSeschrock 17701d452cf5Sahrens struct promotearg { 17711d452cf5Sahrens uint64_t used, comp, uncomp, unique; 17721d452cf5Sahrens uint64_t newnext_obj, snapnames_obj; 17731d452cf5Sahrens }; 17741d452cf5Sahrens 1775*ecd6cf80Smarks /* ARGSUSED */ 177699653d4eSeschrock static int 17771d452cf5Sahrens dsl_dataset_promote_check(void *arg1, void *arg2, dmu_tx_t *tx) 177899653d4eSeschrock { 17791d452cf5Sahrens dsl_dataset_t *hds = arg1; 17801d452cf5Sahrens struct promotearg *pa = arg2; 17811d452cf5Sahrens dsl_dir_t *dd = hds->ds_dir; 17821d452cf5Sahrens dsl_pool_t *dp = hds->ds_dir->dd_pool; 178399653d4eSeschrock dsl_dir_t *pdd = NULL; 178499653d4eSeschrock dsl_dataset_t *ds = NULL; 178599653d4eSeschrock dsl_dataset_t *pivot_ds = NULL; 178699653d4eSeschrock dsl_dataset_t *newnext_ds = NULL; 178799653d4eSeschrock int err; 178899653d4eSeschrock char *name = NULL; 17891d452cf5Sahrens uint64_t itor = 0; 179099653d4eSeschrock blkptr_t bp; 179199653d4eSeschrock 17921d452cf5Sahrens bzero(pa, sizeof (*pa)); 17931d452cf5Sahrens 179499653d4eSeschrock /* Check that it is a clone */ 179599653d4eSeschrock if (dd->dd_phys->dd_clone_parent_obj == 0) 179699653d4eSeschrock return (EINVAL); 179799653d4eSeschrock 17981d452cf5Sahrens /* Since this is so expensive, don't do the preliminary check */ 17991d452cf5Sahrens if (!dmu_tx_is_syncing(tx)) 18001d452cf5Sahrens return (0); 18011d452cf5Sahrens 18021d452cf5Sahrens if (err = dsl_dataset_open_obj(dp, 180399653d4eSeschrock dd->dd_phys->dd_clone_parent_obj, 180499653d4eSeschrock NULL, DS_MODE_EXCLUSIVE, FTAG, &pivot_ds)) 180599653d4eSeschrock goto out; 180699653d4eSeschrock pdd = pivot_ds->ds_dir; 18071d452cf5Sahrens 18081d452cf5Sahrens { 18091d452cf5Sahrens dsl_dataset_t *phds; 18101d452cf5Sahrens if (err = dsl_dataset_open_obj(dd->dd_pool, 18111d452cf5Sahrens pdd->dd_phys->dd_head_dataset_obj, 18121d452cf5Sahrens NULL, DS_MODE_NONE, FTAG, &phds)) 18131d452cf5Sahrens goto out; 18141d452cf5Sahrens pa->snapnames_obj = phds->ds_phys->ds_snapnames_zapobj; 18151d452cf5Sahrens dsl_dataset_close(phds, DS_MODE_NONE, FTAG); 18161d452cf5Sahrens } 181799653d4eSeschrock 181899653d4eSeschrock if (hds->ds_phys->ds_flags & DS_FLAG_NOPROMOTE) { 181999653d4eSeschrock err = EXDEV; 182099653d4eSeschrock goto out; 182199653d4eSeschrock } 182299653d4eSeschrock 182399653d4eSeschrock /* find pivot point's new next ds */ 182499653d4eSeschrock VERIFY(0 == dsl_dataset_open_obj(dd->dd_pool, hds->ds_object, 182599653d4eSeschrock NULL, DS_MODE_NONE, FTAG, &newnext_ds)); 182699653d4eSeschrock while (newnext_ds->ds_phys->ds_prev_snap_obj != pivot_ds->ds_object) { 182799653d4eSeschrock dsl_dataset_t *prev; 182899653d4eSeschrock 182999653d4eSeschrock if (err = dsl_dataset_open_obj(dd->dd_pool, 18301d452cf5Sahrens newnext_ds->ds_phys->ds_prev_snap_obj, 18311d452cf5Sahrens NULL, DS_MODE_NONE, FTAG, &prev)) 183299653d4eSeschrock goto out; 183399653d4eSeschrock dsl_dataset_close(newnext_ds, DS_MODE_NONE, FTAG); 183499653d4eSeschrock newnext_ds = prev; 183599653d4eSeschrock } 18361d452cf5Sahrens pa->newnext_obj = newnext_ds->ds_object; 183799653d4eSeschrock 183899653d4eSeschrock /* compute pivot point's new unique space */ 183999653d4eSeschrock while ((err = bplist_iterate(&newnext_ds->ds_deadlist, 184099653d4eSeschrock &itor, &bp)) == 0) { 184199653d4eSeschrock if (bp.blk_birth > pivot_ds->ds_phys->ds_prev_snap_txg) 18421d452cf5Sahrens pa->unique += bp_get_dasize(dd->dd_pool->dp_spa, &bp); 184399653d4eSeschrock } 184499653d4eSeschrock if (err != ENOENT) 184599653d4eSeschrock goto out; 184699653d4eSeschrock 184799653d4eSeschrock /* Walk the snapshots that we are moving */ 184899653d4eSeschrock name = kmem_alloc(MAXPATHLEN, KM_SLEEP); 184999653d4eSeschrock ds = pivot_ds; 185099653d4eSeschrock /* CONSTCOND */ 185199653d4eSeschrock while (TRUE) { 185299653d4eSeschrock uint64_t val, dlused, dlcomp, dluncomp; 185399653d4eSeschrock dsl_dataset_t *prev; 185499653d4eSeschrock 185599653d4eSeschrock /* Check that the snapshot name does not conflict */ 185699653d4eSeschrock dsl_dataset_name(ds, name); 185799653d4eSeschrock err = zap_lookup(dd->dd_pool->dp_meta_objset, 185899653d4eSeschrock hds->ds_phys->ds_snapnames_zapobj, ds->ds_snapname, 185999653d4eSeschrock 8, 1, &val); 186099653d4eSeschrock if (err != ENOENT) { 186199653d4eSeschrock if (err == 0) 186299653d4eSeschrock err = EEXIST; 186399653d4eSeschrock goto out; 186499653d4eSeschrock } 186599653d4eSeschrock 186699653d4eSeschrock /* 186799653d4eSeschrock * compute space to transfer. Each snapshot gave birth to: 186899653d4eSeschrock * (my used) - (prev's used) + (deadlist's used) 186999653d4eSeschrock */ 18701d452cf5Sahrens pa->used += ds->ds_phys->ds_used_bytes; 18711d452cf5Sahrens pa->comp += ds->ds_phys->ds_compressed_bytes; 18721d452cf5Sahrens pa->uncomp += ds->ds_phys->ds_uncompressed_bytes; 187399653d4eSeschrock 187499653d4eSeschrock /* If we reach the first snapshot, we're done. */ 187599653d4eSeschrock if (ds->ds_phys->ds_prev_snap_obj == 0) 187699653d4eSeschrock break; 187799653d4eSeschrock 187899653d4eSeschrock if (err = bplist_space(&ds->ds_deadlist, 187999653d4eSeschrock &dlused, &dlcomp, &dluncomp)) 188099653d4eSeschrock goto out; 188199653d4eSeschrock if (err = dsl_dataset_open_obj(dd->dd_pool, 188299653d4eSeschrock ds->ds_phys->ds_prev_snap_obj, NULL, DS_MODE_EXCLUSIVE, 188399653d4eSeschrock FTAG, &prev)) 188499653d4eSeschrock goto out; 18851d452cf5Sahrens pa->used += dlused - prev->ds_phys->ds_used_bytes; 18861d452cf5Sahrens pa->comp += dlcomp - prev->ds_phys->ds_compressed_bytes; 18871d452cf5Sahrens pa->uncomp += dluncomp - prev->ds_phys->ds_uncompressed_bytes; 188899653d4eSeschrock 188999653d4eSeschrock /* 189099653d4eSeschrock * We could be a clone of a clone. If we reach our 189199653d4eSeschrock * parent's branch point, we're done. 189299653d4eSeschrock */ 189399653d4eSeschrock if (prev->ds_phys->ds_next_snap_obj != ds->ds_object) { 189499653d4eSeschrock dsl_dataset_close(prev, DS_MODE_EXCLUSIVE, FTAG); 189599653d4eSeschrock break; 189699653d4eSeschrock } 189799653d4eSeschrock if (ds != pivot_ds) 189899653d4eSeschrock dsl_dataset_close(ds, DS_MODE_EXCLUSIVE, FTAG); 189999653d4eSeschrock ds = prev; 190099653d4eSeschrock } 190199653d4eSeschrock 190299653d4eSeschrock /* Check that there is enough space here */ 19031d452cf5Sahrens err = dsl_dir_transfer_possible(pdd, dd, pa->used); 19041d452cf5Sahrens 19051d452cf5Sahrens out: 19061d452cf5Sahrens if (ds && ds != pivot_ds) 19071d452cf5Sahrens dsl_dataset_close(ds, DS_MODE_EXCLUSIVE, FTAG); 19081d452cf5Sahrens if (pivot_ds) 19091d452cf5Sahrens dsl_dataset_close(pivot_ds, DS_MODE_EXCLUSIVE, FTAG); 19101d452cf5Sahrens if (newnext_ds) 19111d452cf5Sahrens dsl_dataset_close(newnext_ds, DS_MODE_NONE, FTAG); 19121d452cf5Sahrens if (name) 19131d452cf5Sahrens kmem_free(name, MAXPATHLEN); 19141d452cf5Sahrens return (err); 19151d452cf5Sahrens } 191699653d4eSeschrock 19171d452cf5Sahrens static void 1918*ecd6cf80Smarks dsl_dataset_promote_sync(void *arg1, void *arg2, cred_t *cr, dmu_tx_t *tx) 19191d452cf5Sahrens { 19201d452cf5Sahrens dsl_dataset_t *hds = arg1; 19211d452cf5Sahrens struct promotearg *pa = arg2; 19221d452cf5Sahrens dsl_dir_t *dd = hds->ds_dir; 19231d452cf5Sahrens dsl_pool_t *dp = hds->ds_dir->dd_pool; 19241d452cf5Sahrens dsl_dir_t *pdd = NULL; 19251d452cf5Sahrens dsl_dataset_t *ds, *pivot_ds; 19261d452cf5Sahrens char *name; 19271d452cf5Sahrens 19281d452cf5Sahrens ASSERT(dd->dd_phys->dd_clone_parent_obj != 0); 19291d452cf5Sahrens ASSERT(0 == (hds->ds_phys->ds_flags & DS_FLAG_NOPROMOTE)); 19301d452cf5Sahrens 19311d452cf5Sahrens VERIFY(0 == dsl_dataset_open_obj(dp, 19321d452cf5Sahrens dd->dd_phys->dd_clone_parent_obj, 19331d452cf5Sahrens NULL, DS_MODE_EXCLUSIVE, FTAG, &pivot_ds)); 19340b69c2f0Sahrens /* 19350b69c2f0Sahrens * We need to explicitly open pdd, since pivot_ds's pdd will be 19360b69c2f0Sahrens * changing. 19370b69c2f0Sahrens */ 19380b69c2f0Sahrens VERIFY(0 == dsl_dir_open_obj(dp, pivot_ds->ds_dir->dd_object, 19390b69c2f0Sahrens NULL, FTAG, &pdd)); 194099653d4eSeschrock 194199653d4eSeschrock /* move snapshots to this dir */ 19421d452cf5Sahrens name = kmem_alloc(MAXPATHLEN, KM_SLEEP); 194399653d4eSeschrock ds = pivot_ds; 194499653d4eSeschrock /* CONSTCOND */ 194599653d4eSeschrock while (TRUE) { 194699653d4eSeschrock dsl_dataset_t *prev; 194799653d4eSeschrock 194899653d4eSeschrock /* move snap name entry */ 194999653d4eSeschrock dsl_dataset_name(ds, name); 19501d452cf5Sahrens VERIFY(0 == zap_remove(dp->dp_meta_objset, 19511d452cf5Sahrens pa->snapnames_obj, ds->ds_snapname, tx)); 19521d452cf5Sahrens VERIFY(0 == zap_add(dp->dp_meta_objset, 195399653d4eSeschrock hds->ds_phys->ds_snapnames_zapobj, ds->ds_snapname, 195499653d4eSeschrock 8, 1, &ds->ds_object, tx)); 195599653d4eSeschrock 195699653d4eSeschrock /* change containing dsl_dir */ 195799653d4eSeschrock dmu_buf_will_dirty(ds->ds_dbuf, tx); 195899653d4eSeschrock ASSERT3U(ds->ds_phys->ds_dir_obj, ==, pdd->dd_object); 195999653d4eSeschrock ds->ds_phys->ds_dir_obj = dd->dd_object; 196099653d4eSeschrock ASSERT3P(ds->ds_dir, ==, pdd); 196199653d4eSeschrock dsl_dir_close(ds->ds_dir, ds); 19621d452cf5Sahrens VERIFY(0 == dsl_dir_open_obj(dp, dd->dd_object, 196399653d4eSeschrock NULL, ds, &ds->ds_dir)); 196499653d4eSeschrock 196599653d4eSeschrock ASSERT3U(dsl_prop_numcb(ds), ==, 0); 196699653d4eSeschrock 196799653d4eSeschrock if (ds->ds_phys->ds_prev_snap_obj == 0) 196899653d4eSeschrock break; 196999653d4eSeschrock 19701d452cf5Sahrens VERIFY(0 == dsl_dataset_open_obj(dp, 197199653d4eSeschrock ds->ds_phys->ds_prev_snap_obj, NULL, DS_MODE_EXCLUSIVE, 197299653d4eSeschrock FTAG, &prev)); 197399653d4eSeschrock 197499653d4eSeschrock if (prev->ds_phys->ds_next_snap_obj != ds->ds_object) { 197599653d4eSeschrock dsl_dataset_close(prev, DS_MODE_EXCLUSIVE, FTAG); 197699653d4eSeschrock break; 197799653d4eSeschrock } 197899653d4eSeschrock if (ds != pivot_ds) 197999653d4eSeschrock dsl_dataset_close(ds, DS_MODE_EXCLUSIVE, FTAG); 198099653d4eSeschrock ds = prev; 198199653d4eSeschrock } 19821d452cf5Sahrens if (ds != pivot_ds) 19831d452cf5Sahrens dsl_dataset_close(ds, DS_MODE_EXCLUSIVE, FTAG); 198499653d4eSeschrock 198599653d4eSeschrock /* change pivot point's next snap */ 198699653d4eSeschrock dmu_buf_will_dirty(pivot_ds->ds_dbuf, tx); 19871d452cf5Sahrens pivot_ds->ds_phys->ds_next_snap_obj = pa->newnext_obj; 198899653d4eSeschrock 198999653d4eSeschrock /* change clone_parent-age */ 199099653d4eSeschrock dmu_buf_will_dirty(dd->dd_dbuf, tx); 199199653d4eSeschrock ASSERT3U(dd->dd_phys->dd_clone_parent_obj, ==, pivot_ds->ds_object); 199299653d4eSeschrock dd->dd_phys->dd_clone_parent_obj = pdd->dd_phys->dd_clone_parent_obj; 199399653d4eSeschrock dmu_buf_will_dirty(pdd->dd_dbuf, tx); 199499653d4eSeschrock pdd->dd_phys->dd_clone_parent_obj = pivot_ds->ds_object; 199599653d4eSeschrock 199699653d4eSeschrock /* change space accounting */ 19971d452cf5Sahrens dsl_dir_diduse_space(pdd, -pa->used, -pa->comp, -pa->uncomp, tx); 19981d452cf5Sahrens dsl_dir_diduse_space(dd, pa->used, pa->comp, pa->uncomp, tx); 19991d452cf5Sahrens pivot_ds->ds_phys->ds_unique_bytes = pa->unique; 200099653d4eSeschrock 2001*ecd6cf80Smarks /* log history record */ 2002*ecd6cf80Smarks spa_history_internal_log(LOG_DS_PROMOTE, dd->dd_pool->dp_spa, tx, 2003*ecd6cf80Smarks cr, "dataset = %llu", ds->ds_object); 2004*ecd6cf80Smarks 20050b69c2f0Sahrens dsl_dir_close(pdd, FTAG); 20061d452cf5Sahrens dsl_dataset_close(pivot_ds, DS_MODE_EXCLUSIVE, FTAG); 20071d452cf5Sahrens kmem_free(name, MAXPATHLEN); 200899653d4eSeschrock } 200999653d4eSeschrock 201099653d4eSeschrock int 201199653d4eSeschrock dsl_dataset_promote(const char *name) 201299653d4eSeschrock { 201399653d4eSeschrock dsl_dataset_t *ds; 201499653d4eSeschrock int err; 201599653d4eSeschrock dmu_object_info_t doi; 20161d452cf5Sahrens struct promotearg pa; 201799653d4eSeschrock 201899653d4eSeschrock err = dsl_dataset_open(name, DS_MODE_NONE, FTAG, &ds); 201999653d4eSeschrock if (err) 202099653d4eSeschrock return (err); 202199653d4eSeschrock 202299653d4eSeschrock err = dmu_object_info(ds->ds_dir->dd_pool->dp_meta_objset, 202399653d4eSeschrock ds->ds_phys->ds_snapnames_zapobj, &doi); 202499653d4eSeschrock if (err) { 202599653d4eSeschrock dsl_dataset_close(ds, DS_MODE_NONE, FTAG); 202699653d4eSeschrock return (err); 202799653d4eSeschrock } 202899653d4eSeschrock 202999653d4eSeschrock /* 203099653d4eSeschrock * Add in 128x the snapnames zapobj size, since we will be moving 203199653d4eSeschrock * a bunch of snapnames to the promoted ds, and dirtying their 203299653d4eSeschrock * bonus buffers. 203399653d4eSeschrock */ 20341d452cf5Sahrens err = dsl_sync_task_do(ds->ds_dir->dd_pool, 20351d452cf5Sahrens dsl_dataset_promote_check, 20361d452cf5Sahrens dsl_dataset_promote_sync, ds, &pa, 2 + 2 * doi.doi_physical_blks); 203799653d4eSeschrock dsl_dataset_close(ds, DS_MODE_NONE, FTAG); 203899653d4eSeschrock return (err); 203999653d4eSeschrock } 2040b1b8ab34Slling 2041b1b8ab34Slling /* 2042b1b8ab34Slling * Given a pool name and a dataset object number in that pool, 2043b1b8ab34Slling * return the name of that dataset. 2044b1b8ab34Slling */ 2045b1b8ab34Slling int 2046b1b8ab34Slling dsl_dsobj_to_dsname(char *pname, uint64_t obj, char *buf) 2047b1b8ab34Slling { 2048b1b8ab34Slling spa_t *spa; 2049b1b8ab34Slling dsl_pool_t *dp; 2050b1b8ab34Slling dsl_dataset_t *ds = NULL; 2051b1b8ab34Slling int error; 2052b1b8ab34Slling 2053b1b8ab34Slling if ((error = spa_open(pname, &spa, FTAG)) != 0) 2054b1b8ab34Slling return (error); 2055b1b8ab34Slling dp = spa_get_dsl(spa); 2056b1b8ab34Slling rw_enter(&dp->dp_config_rwlock, RW_READER); 2057b1b8ab34Slling if ((error = dsl_dataset_open_obj(dp, obj, 2058b1b8ab34Slling NULL, DS_MODE_NONE, FTAG, &ds)) != 0) { 2059b1b8ab34Slling rw_exit(&dp->dp_config_rwlock); 2060b1b8ab34Slling spa_close(spa, FTAG); 2061b1b8ab34Slling return (error); 2062b1b8ab34Slling } 2063b1b8ab34Slling dsl_dataset_name(ds, buf); 2064b1b8ab34Slling dsl_dataset_close(ds, DS_MODE_NONE, FTAG); 2065b1b8ab34Slling rw_exit(&dp->dp_config_rwlock); 2066b1b8ab34Slling spa_close(spa, FTAG); 2067b1b8ab34Slling 2068b1b8ab34Slling return (0); 2069b1b8ab34Slling } 2070