1fa9e4066Sahrens /* 2fa9e4066Sahrens * CDDL HEADER START 3fa9e4066Sahrens * 4fa9e4066Sahrens * The contents of this file are subject to the terms of the 5ea8dc4b6Seschrock * Common Development and Distribution License (the "License"). 6ea8dc4b6Seschrock * You may not use this file except in compliance with the License. 7fa9e4066Sahrens * 8fa9e4066Sahrens * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE 9fa9e4066Sahrens * or http://www.opensolaris.org/os/licensing. 10fa9e4066Sahrens * See the License for the specific language governing permissions 11fa9e4066Sahrens * and limitations under the License. 12fa9e4066Sahrens * 13fa9e4066Sahrens * When distributing Covered Code, include this CDDL HEADER in each 14fa9e4066Sahrens * file and include the License file at usr/src/OPENSOLARIS.LICENSE. 15fa9e4066Sahrens * If applicable, add the following below this CDDL HEADER, with the 16fa9e4066Sahrens * fields enclosed by brackets "[]" replaced with your own identifying 17fa9e4066Sahrens * information: Portions Copyright [yyyy] [name of copyright owner] 18fa9e4066Sahrens * 19fa9e4066Sahrens * CDDL HEADER END 20fa9e4066Sahrens */ 21fa9e4066Sahrens /* 225afc78aaSChris Kirby * Copyright (c) 2005, 2010, Oracle and/or its affiliates. All rights reserved. 23b461c746SMatthew Ahrens * Copyright (c) 2013, 2014 by Delphix. All rights reserved. 24a2afb611SJerry Jelinek * Copyright (c) 2014, Joyent, Inc. All rights reserved. 2503d1795fSAlexander Stetsenko * Copyright (c) 2014 RackTop Systems. 
26fa9e4066Sahrens */ 27fa9e4066Sahrens 28fa9e4066Sahrens #include <sys/dmu_objset.h> 29fa9e4066Sahrens #include <sys/dsl_dataset.h> 30fa9e4066Sahrens #include <sys/dsl_dir.h> 3199653d4eSeschrock #include <sys/dsl_prop.h> 321d452cf5Sahrens #include <sys/dsl_synctask.h> 33fa9e4066Sahrens #include <sys/dmu_traverse.h> 344e3c9f44SBill Pijewski #include <sys/dmu_impl.h> 35fa9e4066Sahrens #include <sys/dmu_tx.h> 36fa9e4066Sahrens #include <sys/arc.h> 37fa9e4066Sahrens #include <sys/zio.h> 38fa9e4066Sahrens #include <sys/zap.h> 39ad135b5dSChristopher Siden #include <sys/zfeature.h> 40fa9e4066Sahrens #include <sys/unique.h> 41fa9e4066Sahrens #include <sys/zfs_context.h> 42cdf5b4caSmmusante #include <sys/zfs_ioctl.h> 43ecd6cf80Smarks #include <sys/spa.h> 44088f3894Sahrens #include <sys/zfs_znode.h> 45c99e4bdcSChris Kirby #include <sys/zfs_onexit.h> 46842727c2SChris Kirby #include <sys/zvol.h> 473f9d6ad7SLin Ling #include <sys/dsl_scan.h> 48cde58dbcSMatthew Ahrens #include <sys/dsl_deadlist.h> 493b2aab18SMatthew Ahrens #include <sys/dsl_destroy.h> 503b2aab18SMatthew Ahrens #include <sys/dsl_userhold.h> 5178f17100SMatthew Ahrens #include <sys/dsl_bookmark.h> 52e1930233Sbonwick 53cde58dbcSMatthew Ahrens #define SWITCH64(x, y) \ 54cde58dbcSMatthew Ahrens { \ 55cde58dbcSMatthew Ahrens uint64_t __tmp = (x); \ 56cde58dbcSMatthew Ahrens (x) = (y); \ 57cde58dbcSMatthew Ahrens (y) = __tmp; \ 58cde58dbcSMatthew Ahrens } 59cde58dbcSMatthew Ahrens 6055434c77Sek #define DS_REF_MAX (1ULL << 62) 61fa9e4066Sahrens 62fa9e4066Sahrens #define DSL_DEADLIST_BLOCKSIZE SPA_MAXBLOCKSIZE 63fa9e4066Sahrens 64a9799022Sck /* 65a9799022Sck * Figure out how much of this delta should be propagated to the dsl_dir 66a9799022Sck * layer. If there's a refreservation, that space has already been 67a9799022Sck * partially accounted for in our ancestors. 
68a9799022Sck */ 69a9799022Sck static int64_t 70a9799022Sck parent_delta(dsl_dataset_t *ds, int64_t delta) 71a9799022Sck { 72a9799022Sck uint64_t old_bytes, new_bytes; 73a9799022Sck 74a9799022Sck if (ds->ds_reserved == 0) 75a9799022Sck return (delta); 76a9799022Sck 77a9799022Sck old_bytes = MAX(ds->ds_phys->ds_unique_bytes, ds->ds_reserved); 78a9799022Sck new_bytes = MAX(ds->ds_phys->ds_unique_bytes + delta, ds->ds_reserved); 79a9799022Sck 80a9799022Sck ASSERT3U(ABS((int64_t)(new_bytes - old_bytes)), <=, ABS(delta)); 81a9799022Sck return (new_bytes - old_bytes); 82a9799022Sck } 83fa9e4066Sahrens 84fa9e4066Sahrens void 85b24ab676SJeff Bonwick dsl_dataset_block_born(dsl_dataset_t *ds, const blkptr_t *bp, dmu_tx_t *tx) 86fa9e4066Sahrens { 87b24ab676SJeff Bonwick int used = bp_get_dsize_sync(tx->tx_pool->dp_spa, bp); 88fa9e4066Sahrens int compressed = BP_GET_PSIZE(bp); 89fa9e4066Sahrens int uncompressed = BP_GET_UCSIZE(bp); 90a9799022Sck int64_t delta; 91fa9e4066Sahrens 923f9d6ad7SLin Ling dprintf_bp(bp, "ds=%p", ds); 93fa9e4066Sahrens 94fa9e4066Sahrens ASSERT(dmu_tx_is_syncing(tx)); 95fa9e4066Sahrens /* It could have been compressed away to nothing */ 96fa9e4066Sahrens if (BP_IS_HOLE(bp)) 97fa9e4066Sahrens return; 98fa9e4066Sahrens ASSERT(BP_GET_TYPE(bp) != DMU_OT_NONE); 99ad135b5dSChristopher Siden ASSERT(DMU_OT_IS_VALID(BP_GET_TYPE(bp))); 100fa9e4066Sahrens if (ds == NULL) { 101ce636f8bSMatthew Ahrens dsl_pool_mos_diduse_space(tx->tx_pool, 102ce636f8bSMatthew Ahrens used, compressed, uncompressed); 103fa9e4066Sahrens return; 104fa9e4066Sahrens } 1053f9d6ad7SLin Ling 106b62969f8SMatthew Ahrens dmu_buf_will_dirty(ds->ds_dbuf, tx); 107fa9e4066Sahrens mutex_enter(&ds->ds_lock); 108a9799022Sck delta = parent_delta(ds, used); 109ad135b5dSChristopher Siden ds->ds_phys->ds_referenced_bytes += used; 110fa9e4066Sahrens ds->ds_phys->ds_compressed_bytes += compressed; 111fa9e4066Sahrens ds->ds_phys->ds_uncompressed_bytes += uncompressed; 112fa9e4066Sahrens 
ds->ds_phys->ds_unique_bytes += used; 113fa9e4066Sahrens mutex_exit(&ds->ds_lock); 11474e7dc98SMatthew Ahrens dsl_dir_diduse_space(ds->ds_dir, DD_USED_HEAD, delta, 11574e7dc98SMatthew Ahrens compressed, uncompressed, tx); 11674e7dc98SMatthew Ahrens dsl_dir_transfer_space(ds->ds_dir, used - delta, 11774e7dc98SMatthew Ahrens DD_USED_REFRSRV, DD_USED_HEAD, tx); 118fa9e4066Sahrens } 119fa9e4066Sahrens 120cdb0ab79Smaybee int 121b24ab676SJeff Bonwick dsl_dataset_block_kill(dsl_dataset_t *ds, const blkptr_t *bp, dmu_tx_t *tx, 122b24ab676SJeff Bonwick boolean_t async) 123fa9e4066Sahrens { 12443466aaeSMax Grossman int used = bp_get_dsize_sync(tx->tx_pool->dp_spa, bp); 12543466aaeSMax Grossman int compressed = BP_GET_PSIZE(bp); 12643466aaeSMax Grossman int uncompressed = BP_GET_UCSIZE(bp); 12743466aaeSMax Grossman 128fa9e4066Sahrens if (BP_IS_HOLE(bp)) 129cdb0ab79Smaybee return (0); 130fa9e4066Sahrens 131b24ab676SJeff Bonwick ASSERT(dmu_tx_is_syncing(tx)); 132b24ab676SJeff Bonwick ASSERT(bp->blk_birth <= tx->tx_txg); 133b24ab676SJeff Bonwick 134fa9e4066Sahrens if (ds == NULL) { 135b24ab676SJeff Bonwick dsl_free(tx->tx_pool, tx->tx_txg, bp); 136ce636f8bSMatthew Ahrens dsl_pool_mos_diduse_space(tx->tx_pool, 137ce636f8bSMatthew Ahrens -used, -compressed, -uncompressed); 138cdb0ab79Smaybee return (used); 139fa9e4066Sahrens } 140fa9e4066Sahrens ASSERT3P(tx->tx_pool, ==, ds->ds_dir->dd_pool); 141fa9e4066Sahrens 14274e7dc98SMatthew Ahrens ASSERT(!dsl_dataset_is_snapshot(ds)); 143fa9e4066Sahrens dmu_buf_will_dirty(ds->ds_dbuf, tx); 144fa9e4066Sahrens 145fa9e4066Sahrens if (bp->blk_birth > ds->ds_phys->ds_prev_snap_txg) { 146a9799022Sck int64_t delta; 147c717a561Smaybee 1483f9d6ad7SLin Ling dprintf_bp(bp, "freeing ds=%llu", ds->ds_object); 149b24ab676SJeff Bonwick dsl_free(tx->tx_pool, tx->tx_txg, bp); 150fa9e4066Sahrens 151fa9e4066Sahrens mutex_enter(&ds->ds_lock); 152a9799022Sck ASSERT(ds->ds_phys->ds_unique_bytes >= used || 153a9799022Sck !DS_UNIQUE_IS_ACCURATE(ds)); 
154a9799022Sck delta = parent_delta(ds, -used); 155fa9e4066Sahrens ds->ds_phys->ds_unique_bytes -= used; 156fa9e4066Sahrens mutex_exit(&ds->ds_lock); 15774e7dc98SMatthew Ahrens dsl_dir_diduse_space(ds->ds_dir, DD_USED_HEAD, 158a9799022Sck delta, -compressed, -uncompressed, tx); 15974e7dc98SMatthew Ahrens dsl_dir_transfer_space(ds->ds_dir, -used - delta, 16074e7dc98SMatthew Ahrens DD_USED_REFRSRV, DD_USED_HEAD, tx); 161fa9e4066Sahrens } else { 162fa9e4066Sahrens dprintf_bp(bp, "putting on dead list: %s", ""); 163b24ab676SJeff Bonwick if (async) { 164b24ab676SJeff Bonwick /* 165b24ab676SJeff Bonwick * We are here as part of zio's write done callback, 166b24ab676SJeff Bonwick * which means we're a zio interrupt thread. We can't 167cde58dbcSMatthew Ahrens * call dsl_deadlist_insert() now because it may block 168b24ab676SJeff Bonwick * waiting for I/O. Instead, put bp on the deferred 169b24ab676SJeff Bonwick * queue and let dsl_pool_sync() finish the job. 170b24ab676SJeff Bonwick */ 171cde58dbcSMatthew Ahrens bplist_append(&ds->ds_pending_deadlist, bp); 172b24ab676SJeff Bonwick } else { 173cde58dbcSMatthew Ahrens dsl_deadlist_insert(&ds->ds_deadlist, bp, tx); 174b24ab676SJeff Bonwick } 175a4611edeSahrens ASSERT3U(ds->ds_prev->ds_object, ==, 176a4611edeSahrens ds->ds_phys->ds_prev_snap_obj); 177a4611edeSahrens ASSERT(ds->ds_prev->ds_phys->ds_num_children > 0); 178fa9e4066Sahrens /* if (bp->blk_birth > prev prev snap txg) prev unique += bs */ 179a4611edeSahrens if (ds->ds_prev->ds_phys->ds_next_snap_obj == 180a4611edeSahrens ds->ds_object && bp->blk_birth > 181a4611edeSahrens ds->ds_prev->ds_phys->ds_prev_snap_txg) { 182a4611edeSahrens dmu_buf_will_dirty(ds->ds_prev->ds_dbuf, tx); 183a4611edeSahrens mutex_enter(&ds->ds_prev->ds_lock); 184a4611edeSahrens ds->ds_prev->ds_phys->ds_unique_bytes += used; 185a4611edeSahrens mutex_exit(&ds->ds_prev->ds_lock); 186fa9e4066Sahrens } 1873f9d6ad7SLin Ling if (bp->blk_birth > ds->ds_dir->dd_origin_txg) { 18874e7dc98SMatthew Ahrens 
dsl_dir_transfer_space(ds->ds_dir, used, 18974e7dc98SMatthew Ahrens DD_USED_HEAD, DD_USED_SNAP, tx); 19074e7dc98SMatthew Ahrens } 191fa9e4066Sahrens } 192fa9e4066Sahrens mutex_enter(&ds->ds_lock); 193ad135b5dSChristopher Siden ASSERT3U(ds->ds_phys->ds_referenced_bytes, >=, used); 194ad135b5dSChristopher Siden ds->ds_phys->ds_referenced_bytes -= used; 195fa9e4066Sahrens ASSERT3U(ds->ds_phys->ds_compressed_bytes, >=, compressed); 196fa9e4066Sahrens ds->ds_phys->ds_compressed_bytes -= compressed; 197fa9e4066Sahrens ASSERT3U(ds->ds_phys->ds_uncompressed_bytes, >=, uncompressed); 198fa9e4066Sahrens ds->ds_phys->ds_uncompressed_bytes -= uncompressed; 199fa9e4066Sahrens mutex_exit(&ds->ds_lock); 200cdb0ab79Smaybee 201cdb0ab79Smaybee return (used); 202fa9e4066Sahrens } 203fa9e4066Sahrens 204ea8dc4b6Seschrock uint64_t 205ea8dc4b6Seschrock dsl_dataset_prev_snap_txg(dsl_dataset_t *ds) 206fa9e4066Sahrens { 207a2eea2e1Sahrens uint64_t trysnap = 0; 208a2eea2e1Sahrens 209fa9e4066Sahrens if (ds == NULL) 210ea8dc4b6Seschrock return (0); 211fa9e4066Sahrens /* 212fa9e4066Sahrens * The snapshot creation could fail, but that would cause an 213fa9e4066Sahrens * incorrect FALSE return, which would only result in an 214fa9e4066Sahrens * overestimation of the amount of space that an operation would 215fa9e4066Sahrens * consume, which is OK. 216fa9e4066Sahrens * 217fa9e4066Sahrens * There's also a small window where we could miss a pending 218fa9e4066Sahrens * snapshot, because we could set the sync task in the quiescing 219fa9e4066Sahrens * phase. So this should only be used as a guess. 
220fa9e4066Sahrens */ 221a2eea2e1Sahrens if (ds->ds_trysnap_txg > 222a2eea2e1Sahrens spa_last_synced_txg(ds->ds_dir->dd_pool->dp_spa)) 223a2eea2e1Sahrens trysnap = ds->ds_trysnap_txg; 224a2eea2e1Sahrens return (MAX(ds->ds_phys->ds_prev_snap_txg, trysnap)); 225ea8dc4b6Seschrock } 226ea8dc4b6Seschrock 2273d692628SSanjeev Bagewadi boolean_t 228c7cd2421SGeorge Wilson dsl_dataset_block_freeable(dsl_dataset_t *ds, const blkptr_t *bp, 229c7cd2421SGeorge Wilson uint64_t blk_birth) 230ea8dc4b6Seschrock { 23143466aaeSMax Grossman if (blk_birth <= dsl_dataset_prev_snap_txg(ds) || 23243466aaeSMax Grossman (bp != NULL && BP_IS_HOLE(bp))) 233c7cd2421SGeorge Wilson return (B_FALSE); 234c7cd2421SGeorge Wilson 235837b568bSGeorge Wilson ddt_prefetch(dsl_dataset_get_spa(ds), bp); 236c7cd2421SGeorge Wilson 237c7cd2421SGeorge Wilson return (B_TRUE); 238fa9e4066Sahrens } 239fa9e4066Sahrens 240fa9e4066Sahrens /* ARGSUSED */ 241fa9e4066Sahrens static void 242fa9e4066Sahrens dsl_dataset_evict(dmu_buf_t *db, void *dsv) 243fa9e4066Sahrens { 244fa9e4066Sahrens dsl_dataset_t *ds = dsv; 245fa9e4066Sahrens 2463b2aab18SMatthew Ahrens ASSERT(ds->ds_owner == NULL); 247fa9e4066Sahrens 24891ebeef5Sahrens unique_remove(ds->ds_fsid_guid); 249fa9e4066Sahrens 250503ad85cSMatthew Ahrens if (ds->ds_objset != NULL) 251503ad85cSMatthew Ahrens dmu_objset_evict(ds->ds_objset); 252fa9e4066Sahrens 253fa9e4066Sahrens if (ds->ds_prev) { 2543b2aab18SMatthew Ahrens dsl_dataset_rele(ds->ds_prev, ds); 255fa9e4066Sahrens ds->ds_prev = NULL; 256fa9e4066Sahrens } 257fa9e4066Sahrens 258cde58dbcSMatthew Ahrens bplist_destroy(&ds->ds_pending_deadlist); 2593b2aab18SMatthew Ahrens if (ds->ds_phys->ds_deadlist_obj != 0) 260cde58dbcSMatthew Ahrens dsl_deadlist_close(&ds->ds_deadlist); 261745cd3c5Smaybee if (ds->ds_dir) 2623b2aab18SMatthew Ahrens dsl_dir_rele(ds->ds_dir, ds); 263fa9e4066Sahrens 26491ebeef5Sahrens ASSERT(!list_link_active(&ds->ds_synced_link)); 265fa9e4066Sahrens 2665ad82045Snd mutex_destroy(&ds->ds_lock); 
26791ebeef5Sahrens mutex_destroy(&ds->ds_opening_lock); 2683b2aab18SMatthew Ahrens refcount_destroy(&ds->ds_longholds); 2695ad82045Snd 270fa9e4066Sahrens kmem_free(ds, sizeof (dsl_dataset_t)); 271fa9e4066Sahrens } 272fa9e4066Sahrens 2733b2aab18SMatthew Ahrens int 274fa9e4066Sahrens dsl_dataset_get_snapname(dsl_dataset_t *ds) 275fa9e4066Sahrens { 276fa9e4066Sahrens dsl_dataset_phys_t *headphys; 277fa9e4066Sahrens int err; 278fa9e4066Sahrens dmu_buf_t *headdbuf; 279fa9e4066Sahrens dsl_pool_t *dp = ds->ds_dir->dd_pool; 280fa9e4066Sahrens objset_t *mos = dp->dp_meta_objset; 281fa9e4066Sahrens 282fa9e4066Sahrens if (ds->ds_snapname[0]) 283ea8dc4b6Seschrock return (0); 284fa9e4066Sahrens if (ds->ds_phys->ds_next_snap_obj == 0) 285ea8dc4b6Seschrock return (0); 286fa9e4066Sahrens 287ea8dc4b6Seschrock err = dmu_bonus_hold(mos, ds->ds_dir->dd_phys->dd_head_dataset_obj, 288ea8dc4b6Seschrock FTAG, &headdbuf); 2893b2aab18SMatthew Ahrens if (err != 0) 290ea8dc4b6Seschrock return (err); 291fa9e4066Sahrens headphys = headdbuf->db_data; 292fa9e4066Sahrens err = zap_value_search(dp->dp_meta_objset, 293e7437265Sahrens headphys->ds_snapnames_zapobj, ds->ds_object, 0, ds->ds_snapname); 294ea8dc4b6Seschrock dmu_buf_rele(headdbuf, FTAG); 295ea8dc4b6Seschrock return (err); 296fa9e4066Sahrens } 297fa9e4066Sahrens 2983b2aab18SMatthew Ahrens int 299745cd3c5Smaybee dsl_dataset_snap_lookup(dsl_dataset_t *ds, const char *name, uint64_t *value) 300ab04eb8eStimh { 301745cd3c5Smaybee objset_t *mos = ds->ds_dir->dd_pool->dp_meta_objset; 302745cd3c5Smaybee uint64_t snapobj = ds->ds_phys->ds_snapnames_zapobj; 303ab04eb8eStimh matchtype_t mt; 304ab04eb8eStimh int err; 305ab04eb8eStimh 306745cd3c5Smaybee if (ds->ds_phys->ds_flags & DS_FLAG_CI_DATASET) 307ab04eb8eStimh mt = MT_FIRST; 308ab04eb8eStimh else 309ab04eb8eStimh mt = MT_EXACT; 310ab04eb8eStimh 311745cd3c5Smaybee err = zap_lookup_norm(mos, snapobj, name, 8, 1, 312ab04eb8eStimh value, mt, NULL, 0, NULL); 313ab04eb8eStimh if (err == ENOTSUP && mt 
== MT_FIRST) 314745cd3c5Smaybee err = zap_lookup(mos, snapobj, name, 8, 1, value); 315ab04eb8eStimh return (err); 316ab04eb8eStimh } 317ab04eb8eStimh 3183b2aab18SMatthew Ahrens int 319a2afb611SJerry Jelinek dsl_dataset_snap_remove(dsl_dataset_t *ds, const char *name, dmu_tx_t *tx, 320a2afb611SJerry Jelinek boolean_t adj_cnt) 321ab04eb8eStimh { 322745cd3c5Smaybee objset_t *mos = ds->ds_dir->dd_pool->dp_meta_objset; 323745cd3c5Smaybee uint64_t snapobj = ds->ds_phys->ds_snapnames_zapobj; 324ab04eb8eStimh matchtype_t mt; 325ab04eb8eStimh int err; 326ab04eb8eStimh 32771eb0538SChris Kirby dsl_dir_snap_cmtime_update(ds->ds_dir); 32871eb0538SChris Kirby 329745cd3c5Smaybee if (ds->ds_phys->ds_flags & DS_FLAG_CI_DATASET) 330ab04eb8eStimh mt = MT_FIRST; 331ab04eb8eStimh else 332ab04eb8eStimh mt = MT_EXACT; 333ab04eb8eStimh 334745cd3c5Smaybee err = zap_remove_norm(mos, snapobj, name, mt, tx); 335ab04eb8eStimh if (err == ENOTSUP && mt == MT_FIRST) 336745cd3c5Smaybee err = zap_remove(mos, snapobj, name, tx); 337a2afb611SJerry Jelinek 338a2afb611SJerry Jelinek if (err == 0 && adj_cnt) 339a2afb611SJerry Jelinek dsl_fs_ss_count_adjust(ds->ds_dir, -1, 340a2afb611SJerry Jelinek DD_FIELD_SNAPSHOT_COUNT, tx); 341a2afb611SJerry Jelinek 342ab04eb8eStimh return (err); 343ab04eb8eStimh } 344ab04eb8eStimh 3453b2aab18SMatthew Ahrens int 3463b2aab18SMatthew Ahrens dsl_dataset_hold_obj(dsl_pool_t *dp, uint64_t dsobj, void *tag, 347745cd3c5Smaybee dsl_dataset_t **dsp) 348fa9e4066Sahrens { 349fa9e4066Sahrens objset_t *mos = dp->dp_meta_objset; 350fa9e4066Sahrens dmu_buf_t *dbuf; 351fa9e4066Sahrens dsl_dataset_t *ds; 352ea8dc4b6Seschrock int err; 353a7f53a56SChris Kirby dmu_object_info_t doi; 354fa9e4066Sahrens 3553b2aab18SMatthew Ahrens ASSERT(dsl_pool_config_held(dp)); 356fa9e4066Sahrens 357ea8dc4b6Seschrock err = dmu_bonus_hold(mos, dsobj, tag, &dbuf); 3583b2aab18SMatthew Ahrens if (err != 0) 359ea8dc4b6Seschrock return (err); 360a7f53a56SChris Kirby 361a7f53a56SChris Kirby /* Make sure dsobj 
has the correct object type. */ 362a7f53a56SChris Kirby dmu_object_info_from_db(dbuf, &doi); 3632acef22dSMatthew Ahrens if (doi.doi_bonus_type != DMU_OT_DSL_DATASET) { 364b287be1bSWill Andrews dmu_buf_rele(dbuf, tag); 365be6fd75aSMatthew Ahrens return (SET_ERROR(EINVAL)); 366b287be1bSWill Andrews } 367a7f53a56SChris Kirby 368fa9e4066Sahrens ds = dmu_buf_get_user(dbuf); 369fa9e4066Sahrens if (ds == NULL) { 370d5285caeSGeorge Wilson dsl_dataset_t *winner = NULL; 371fa9e4066Sahrens 372fa9e4066Sahrens ds = kmem_zalloc(sizeof (dsl_dataset_t), KM_SLEEP); 373fa9e4066Sahrens ds->ds_dbuf = dbuf; 374fa9e4066Sahrens ds->ds_object = dsobj; 375fa9e4066Sahrens ds->ds_phys = dbuf->db_data; 376fa9e4066Sahrens 3775ad82045Snd mutex_init(&ds->ds_lock, NULL, MUTEX_DEFAULT, NULL); 37891ebeef5Sahrens mutex_init(&ds->ds_opening_lock, NULL, MUTEX_DEFAULT, NULL); 3794e3c9f44SBill Pijewski mutex_init(&ds->ds_sendstream_lock, NULL, MUTEX_DEFAULT, NULL); 3803b2aab18SMatthew Ahrens refcount_create(&ds->ds_longholds); 3815ad82045Snd 382cde58dbcSMatthew Ahrens bplist_create(&ds->ds_pending_deadlist); 383cde58dbcSMatthew Ahrens dsl_deadlist_open(&ds->ds_deadlist, 384fa9e4066Sahrens mos, ds->ds_phys->ds_deadlist_obj); 385cde58dbcSMatthew Ahrens 3864e3c9f44SBill Pijewski list_create(&ds->ds_sendstreams, sizeof (dmu_sendarg_t), 3874e3c9f44SBill Pijewski offsetof(dmu_sendarg_t, dsa_link)); 3884e3c9f44SBill Pijewski 389ea8dc4b6Seschrock if (err == 0) { 3903b2aab18SMatthew Ahrens err = dsl_dir_hold_obj(dp, 391ea8dc4b6Seschrock ds->ds_phys->ds_dir_obj, NULL, ds, &ds->ds_dir); 392ea8dc4b6Seschrock } 3933b2aab18SMatthew Ahrens if (err != 0) { 3945ad82045Snd mutex_destroy(&ds->ds_lock); 39591ebeef5Sahrens mutex_destroy(&ds->ds_opening_lock); 3963b2aab18SMatthew Ahrens refcount_destroy(&ds->ds_longholds); 397cde58dbcSMatthew Ahrens bplist_destroy(&ds->ds_pending_deadlist); 398cde58dbcSMatthew Ahrens dsl_deadlist_close(&ds->ds_deadlist); 399ea8dc4b6Seschrock kmem_free(ds, sizeof (dsl_dataset_t)); 
400ea8dc4b6Seschrock dmu_buf_rele(dbuf, tag); 401ea8dc4b6Seschrock return (err); 402ea8dc4b6Seschrock } 403fa9e4066Sahrens 40474e7dc98SMatthew Ahrens if (!dsl_dataset_is_snapshot(ds)) { 405fa9e4066Sahrens ds->ds_snapname[0] = '\0'; 4063b2aab18SMatthew Ahrens if (ds->ds_phys->ds_prev_snap_obj != 0) { 4073b2aab18SMatthew Ahrens err = dsl_dataset_hold_obj(dp, 408745cd3c5Smaybee ds->ds_phys->ds_prev_snap_obj, 409745cd3c5Smaybee ds, &ds->ds_prev); 410fa9e4066Sahrens } 41178f17100SMatthew Ahrens if (doi.doi_type == DMU_OTN_ZAP_METADATA) { 41278f17100SMatthew Ahrens int zaperr = zap_lookup(mos, ds->ds_object, 41378f17100SMatthew Ahrens DS_FIELD_BOOKMARK_NAMES, 41478f17100SMatthew Ahrens sizeof (ds->ds_bookmarks), 1, 41578f17100SMatthew Ahrens &ds->ds_bookmarks); 41678f17100SMatthew Ahrens if (zaperr != ENOENT) 41778f17100SMatthew Ahrens VERIFY0(zaperr); 41878f17100SMatthew Ahrens } 419842727c2SChris Kirby } else { 420842727c2SChris Kirby if (zfs_flags & ZFS_DEBUG_SNAPNAMES) 421842727c2SChris Kirby err = dsl_dataset_get_snapname(ds); 422842727c2SChris Kirby if (err == 0 && ds->ds_phys->ds_userrefs_obj != 0) { 423842727c2SChris Kirby err = zap_count( 424842727c2SChris Kirby ds->ds_dir->dd_pool->dp_meta_objset, 425842727c2SChris Kirby ds->ds_phys->ds_userrefs_obj, 426842727c2SChris Kirby &ds->ds_userrefs); 427842727c2SChris Kirby } 428fa9e4066Sahrens } 429fa9e4066Sahrens 43074e7dc98SMatthew Ahrens if (err == 0 && !dsl_dataset_is_snapshot(ds)) { 4313b2aab18SMatthew Ahrens err = dsl_prop_get_int_ds(ds, 4323b2aab18SMatthew Ahrens zfs_prop_to_name(ZFS_PROP_REFRESERVATION), 4333b2aab18SMatthew Ahrens &ds->ds_reserved); 434cb625fb5Sck if (err == 0) { 4353b2aab18SMatthew Ahrens err = dsl_prop_get_int_ds(ds, 4363b2aab18SMatthew Ahrens zfs_prop_to_name(ZFS_PROP_REFQUOTA), 4373b2aab18SMatthew Ahrens &ds->ds_quota); 438cb625fb5Sck } 439cb625fb5Sck } else { 440cb625fb5Sck ds->ds_reserved = ds->ds_quota = 0; 441cb625fb5Sck } 442cb625fb5Sck 443d5285caeSGeorge Wilson if (err != 0 || 
(winner = dmu_buf_set_user_ie(dbuf, ds, 444d5285caeSGeorge Wilson &ds->ds_phys, dsl_dataset_evict)) != NULL) { 445cde58dbcSMatthew Ahrens bplist_destroy(&ds->ds_pending_deadlist); 446cde58dbcSMatthew Ahrens dsl_deadlist_close(&ds->ds_deadlist); 447745cd3c5Smaybee if (ds->ds_prev) 4483b2aab18SMatthew Ahrens dsl_dataset_rele(ds->ds_prev, ds); 4493b2aab18SMatthew Ahrens dsl_dir_rele(ds->ds_dir, ds); 4505ad82045Snd mutex_destroy(&ds->ds_lock); 45191ebeef5Sahrens mutex_destroy(&ds->ds_opening_lock); 4523b2aab18SMatthew Ahrens refcount_destroy(&ds->ds_longholds); 453fa9e4066Sahrens kmem_free(ds, sizeof (dsl_dataset_t)); 4543b2aab18SMatthew Ahrens if (err != 0) { 455ea8dc4b6Seschrock dmu_buf_rele(dbuf, tag); 456ea8dc4b6Seschrock return (err); 457ea8dc4b6Seschrock } 458fa9e4066Sahrens ds = winner; 459fa9e4066Sahrens } else { 46091ebeef5Sahrens ds->ds_fsid_guid = 461fa9e4066Sahrens unique_insert(ds->ds_phys->ds_fsid_guid); 462fa9e4066Sahrens } 463fa9e4066Sahrens } 464fa9e4066Sahrens ASSERT3P(ds->ds_dbuf, ==, dbuf); 465fa9e4066Sahrens ASSERT3P(ds->ds_phys, ==, dbuf->db_data); 466088f3894Sahrens ASSERT(ds->ds_phys->ds_prev_snap_obj != 0 || 467afc6333aSahrens spa_version(dp->dp_spa) < SPA_VERSION_ORIGIN || 46884db2a68Sahrens dp->dp_origin_snap == NULL || ds == dp->dp_origin_snap); 469ea8dc4b6Seschrock *dsp = ds; 470ea8dc4b6Seschrock return (0); 471fa9e4066Sahrens } 472fa9e4066Sahrens 473745cd3c5Smaybee int 4743b2aab18SMatthew Ahrens dsl_dataset_hold(dsl_pool_t *dp, const char *name, 475503ad85cSMatthew Ahrens void *tag, dsl_dataset_t **dsp) 476fa9e4066Sahrens { 477fa9e4066Sahrens dsl_dir_t *dd; 478745cd3c5Smaybee const char *snapname; 479fa9e4066Sahrens uint64_t obj; 480fa9e4066Sahrens int err = 0; 481fa9e4066Sahrens 4823b2aab18SMatthew Ahrens err = dsl_dir_hold(dp, name, FTAG, &dd, &snapname); 4833b2aab18SMatthew Ahrens if (err != 0) 484ea8dc4b6Seschrock return (err); 485fa9e4066Sahrens 4863b2aab18SMatthew Ahrens ASSERT(dsl_pool_config_held(dp)); 487fa9e4066Sahrens obj = 
dd->dd_phys->dd_head_dataset_obj; 4883b2aab18SMatthew Ahrens if (obj != 0) 4893b2aab18SMatthew Ahrens err = dsl_dataset_hold_obj(dp, obj, tag, dsp); 490745cd3c5Smaybee else 491be6fd75aSMatthew Ahrens err = SET_ERROR(ENOENT); 492fa9e4066Sahrens 493745cd3c5Smaybee /* we may be looking for a snapshot */ 494745cd3c5Smaybee if (err == 0 && snapname != NULL) { 4953b2aab18SMatthew Ahrens dsl_dataset_t *ds; 496fa9e4066Sahrens 497745cd3c5Smaybee if (*snapname++ != '@') { 498745cd3c5Smaybee dsl_dataset_rele(*dsp, tag); 4993b2aab18SMatthew Ahrens dsl_dir_rele(dd, FTAG); 500be6fd75aSMatthew Ahrens return (SET_ERROR(ENOENT)); 501fa9e4066Sahrens } 502fa9e4066Sahrens 503745cd3c5Smaybee dprintf("looking for snapshot '%s'\n", snapname); 504745cd3c5Smaybee err = dsl_dataset_snap_lookup(*dsp, snapname, &obj); 505745cd3c5Smaybee if (err == 0) 5063b2aab18SMatthew Ahrens err = dsl_dataset_hold_obj(dp, obj, tag, &ds); 507745cd3c5Smaybee dsl_dataset_rele(*dsp, tag); 508745cd3c5Smaybee 5093b2aab18SMatthew Ahrens if (err == 0) { 510745cd3c5Smaybee mutex_enter(&ds->ds_lock); 511745cd3c5Smaybee if (ds->ds_snapname[0] == 0) 512745cd3c5Smaybee (void) strlcpy(ds->ds_snapname, snapname, 513745cd3c5Smaybee sizeof (ds->ds_snapname)); 514745cd3c5Smaybee mutex_exit(&ds->ds_lock); 5153b2aab18SMatthew Ahrens *dsp = ds; 516fa9e4066Sahrens } 517fa9e4066Sahrens } 5183b2aab18SMatthew Ahrens 5193b2aab18SMatthew Ahrens dsl_dir_rele(dd, FTAG); 520fa9e4066Sahrens return (err); 521fa9e4066Sahrens } 522fa9e4066Sahrens 523fa9e4066Sahrens int 5243b2aab18SMatthew Ahrens dsl_dataset_own_obj(dsl_pool_t *dp, uint64_t dsobj, 5253b2aab18SMatthew Ahrens void *tag, dsl_dataset_t **dsp) 5263b2aab18SMatthew Ahrens { 5273b2aab18SMatthew Ahrens int err = dsl_dataset_hold_obj(dp, dsobj, tag, dsp); 5283b2aab18SMatthew Ahrens if (err != 0) 5293b2aab18SMatthew Ahrens return (err); 5303b2aab18SMatthew Ahrens if (!dsl_dataset_tryown(*dsp, tag)) { 5313b2aab18SMatthew Ahrens dsl_dataset_rele(*dsp, tag); 5323b2aab18SMatthew Ahrens 
*dsp = NULL; 533be6fd75aSMatthew Ahrens return (SET_ERROR(EBUSY)); 5343b2aab18SMatthew Ahrens } 5353b2aab18SMatthew Ahrens return (0); 5363b2aab18SMatthew Ahrens } 5373b2aab18SMatthew Ahrens 5383b2aab18SMatthew Ahrens int 5393b2aab18SMatthew Ahrens dsl_dataset_own(dsl_pool_t *dp, const char *name, 540503ad85cSMatthew Ahrens void *tag, dsl_dataset_t **dsp) 541fa9e4066Sahrens { 5423b2aab18SMatthew Ahrens int err = dsl_dataset_hold(dp, name, tag, dsp); 5433b2aab18SMatthew Ahrens if (err != 0) 544745cd3c5Smaybee return (err); 5453b2aab18SMatthew Ahrens if (!dsl_dataset_tryown(*dsp, tag)) { 546503ad85cSMatthew Ahrens dsl_dataset_rele(*dsp, tag); 547be6fd75aSMatthew Ahrens return (SET_ERROR(EBUSY)); 548745cd3c5Smaybee } 549745cd3c5Smaybee return (0); 550fa9e4066Sahrens } 551fa9e4066Sahrens 5523b2aab18SMatthew Ahrens /* 5533b2aab18SMatthew Ahrens * See the comment above dsl_pool_hold() for details. In summary, a long 5543b2aab18SMatthew Ahrens * hold is used to prevent destruction of a dataset while the pool hold 5553b2aab18SMatthew Ahrens * is dropped, allowing other concurrent operations (e.g. spa_sync()). 5563b2aab18SMatthew Ahrens * 5573b2aab18SMatthew Ahrens * The dataset and pool must be held when this function is called. After it 5583b2aab18SMatthew Ahrens * is called, the pool hold may be released while the dataset is still held 5593b2aab18SMatthew Ahrens * and accessed. 
5603b2aab18SMatthew Ahrens */ 5613b2aab18SMatthew Ahrens void 5623b2aab18SMatthew Ahrens dsl_dataset_long_hold(dsl_dataset_t *ds, void *tag) 5633b2aab18SMatthew Ahrens { 5643b2aab18SMatthew Ahrens ASSERT(dsl_pool_config_held(ds->ds_dir->dd_pool)); 5653b2aab18SMatthew Ahrens (void) refcount_add(&ds->ds_longholds, tag); 5663b2aab18SMatthew Ahrens } 5673b2aab18SMatthew Ahrens 5683b2aab18SMatthew Ahrens void 5693b2aab18SMatthew Ahrens dsl_dataset_long_rele(dsl_dataset_t *ds, void *tag) 5703b2aab18SMatthew Ahrens { 5713b2aab18SMatthew Ahrens (void) refcount_remove(&ds->ds_longholds, tag); 5723b2aab18SMatthew Ahrens } 5733b2aab18SMatthew Ahrens 5743b2aab18SMatthew Ahrens /* Return B_TRUE if there are any long holds on this dataset. */ 5753b2aab18SMatthew Ahrens boolean_t 5763b2aab18SMatthew Ahrens dsl_dataset_long_held(dsl_dataset_t *ds) 5773b2aab18SMatthew Ahrens { 5783b2aab18SMatthew Ahrens return (!refcount_is_zero(&ds->ds_longholds)); 5793b2aab18SMatthew Ahrens } 5803b2aab18SMatthew Ahrens 581fa9e4066Sahrens void 582fa9e4066Sahrens dsl_dataset_name(dsl_dataset_t *ds, char *name) 583fa9e4066Sahrens { 584fa9e4066Sahrens if (ds == NULL) { 585fa9e4066Sahrens (void) strcpy(name, "mos"); 586fa9e4066Sahrens } else { 587fa9e4066Sahrens dsl_dir_name(ds->ds_dir, name); 5883b2aab18SMatthew Ahrens VERIFY0(dsl_dataset_get_snapname(ds)); 589fa9e4066Sahrens if (ds->ds_snapname[0]) { 590fa9e4066Sahrens (void) strcat(name, "@"); 591745cd3c5Smaybee /* 592745cd3c5Smaybee * We use a "recursive" mutex so that we 593745cd3c5Smaybee * can call dprintf_ds() with ds_lock held. 
594745cd3c5Smaybee */ 595fa9e4066Sahrens if (!MUTEX_HELD(&ds->ds_lock)) { 596fa9e4066Sahrens mutex_enter(&ds->ds_lock); 597fa9e4066Sahrens (void) strcat(name, ds->ds_snapname); 598fa9e4066Sahrens mutex_exit(&ds->ds_lock); 599fa9e4066Sahrens } else { 600fa9e4066Sahrens (void) strcat(name, ds->ds_snapname); 601fa9e4066Sahrens } 602fa9e4066Sahrens } 603fa9e4066Sahrens } 604fa9e4066Sahrens } 605fa9e4066Sahrens 6063cb34c60Sahrens void 607745cd3c5Smaybee dsl_dataset_rele(dsl_dataset_t *ds, void *tag) 6083cb34c60Sahrens { 6093b2aab18SMatthew Ahrens dmu_buf_rele(ds->ds_dbuf, tag); 610745cd3c5Smaybee } 611745cd3c5Smaybee 612745cd3c5Smaybee void 613503ad85cSMatthew Ahrens dsl_dataset_disown(dsl_dataset_t *ds, void *tag) 614745cd3c5Smaybee { 6153b2aab18SMatthew Ahrens ASSERT(ds->ds_owner == tag && ds->ds_dbuf != NULL); 616745cd3c5Smaybee 6173cb34c60Sahrens mutex_enter(&ds->ds_lock); 618745cd3c5Smaybee ds->ds_owner = NULL; 6193cb34c60Sahrens mutex_exit(&ds->ds_lock); 6203b2aab18SMatthew Ahrens dsl_dataset_long_rele(ds, tag); 6213b2aab18SMatthew Ahrens if (ds->ds_dbuf != NULL) 6223b2aab18SMatthew Ahrens dsl_dataset_rele(ds, tag); 623745cd3c5Smaybee else 624cde58dbcSMatthew Ahrens dsl_dataset_evict(NULL, ds); 6253cb34c60Sahrens } 6263cb34c60Sahrens 6273cb34c60Sahrens boolean_t 6283b2aab18SMatthew Ahrens dsl_dataset_tryown(dsl_dataset_t *ds, void *tag) 6293cb34c60Sahrens { 630745cd3c5Smaybee boolean_t gotit = FALSE; 631745cd3c5Smaybee 6323cb34c60Sahrens mutex_enter(&ds->ds_lock); 6333b2aab18SMatthew Ahrens if (ds->ds_owner == NULL && !DS_IS_INCONSISTENT(ds)) { 634503ad85cSMatthew Ahrens ds->ds_owner = tag; 6353b2aab18SMatthew Ahrens dsl_dataset_long_hold(ds, tag); 636745cd3c5Smaybee gotit = TRUE; 6373cb34c60Sahrens } 6383cb34c60Sahrens mutex_exit(&ds->ds_lock); 639745cd3c5Smaybee return (gotit); 640745cd3c5Smaybee } 641745cd3c5Smaybee 6421d452cf5Sahrens uint64_t 643088f3894Sahrens dsl_dataset_create_sync_dd(dsl_dir_t *dd, dsl_dataset_t *origin, 644ab04eb8eStimh uint64_t flags, 
dmu_tx_t *tx) 645fa9e4066Sahrens { 6463cb34c60Sahrens dsl_pool_t *dp = dd->dd_pool; 647fa9e4066Sahrens dmu_buf_t *dbuf; 648fa9e4066Sahrens dsl_dataset_phys_t *dsphys; 6493cb34c60Sahrens uint64_t dsobj; 650fa9e4066Sahrens objset_t *mos = dp->dp_meta_objset; 651fa9e4066Sahrens 652088f3894Sahrens if (origin == NULL) 653088f3894Sahrens origin = dp->dp_origin_snap; 654088f3894Sahrens 6553cb34c60Sahrens ASSERT(origin == NULL || origin->ds_dir->dd_pool == dp); 6563cb34c60Sahrens ASSERT(origin == NULL || origin->ds_phys->ds_num_children > 0); 657fa9e4066Sahrens ASSERT(dmu_tx_is_syncing(tx)); 6583cb34c60Sahrens ASSERT(dd->dd_phys->dd_head_dataset_obj == 0); 659fa9e4066Sahrens 6601649cd4bStabriz dsobj = dmu_object_alloc(mos, DMU_OT_DSL_DATASET, 0, 6611649cd4bStabriz DMU_OT_DSL_DATASET, sizeof (dsl_dataset_phys_t), tx); 6623b2aab18SMatthew Ahrens VERIFY0(dmu_bonus_hold(mos, dsobj, FTAG, &dbuf)); 663fa9e4066Sahrens dmu_buf_will_dirty(dbuf, tx); 664fa9e4066Sahrens dsphys = dbuf->db_data; 665745cd3c5Smaybee bzero(dsphys, sizeof (dsl_dataset_phys_t)); 666fa9e4066Sahrens dsphys->ds_dir_obj = dd->dd_object; 667ab04eb8eStimh dsphys->ds_flags = flags; 668fa9e4066Sahrens dsphys->ds_fsid_guid = unique_create(); 669fa9e4066Sahrens (void) random_get_pseudo_bytes((void*)&dsphys->ds_guid, 670fa9e4066Sahrens sizeof (dsphys->ds_guid)); 671fa9e4066Sahrens dsphys->ds_snapnames_zapobj = 672ab04eb8eStimh zap_create_norm(mos, U8_TEXTPREP_TOUPPER, DMU_OT_DSL_DS_SNAP_MAP, 673ab04eb8eStimh DMU_OT_NONE, 0, tx); 674fa9e4066Sahrens dsphys->ds_creation_time = gethrestime_sec(); 675088f3894Sahrens dsphys->ds_creation_txg = tx->tx_txg == TXG_INITIAL ? 
1 : tx->tx_txg; 676a9799022Sck 677cde58dbcSMatthew Ahrens if (origin == NULL) { 678cde58dbcSMatthew Ahrens dsphys->ds_deadlist_obj = dsl_deadlist_alloc(mos, tx); 679cde58dbcSMatthew Ahrens } else { 6803b2aab18SMatthew Ahrens dsl_dataset_t *ohds; /* head of the origin snapshot */ 681cde58dbcSMatthew Ahrens 6823cb34c60Sahrens dsphys->ds_prev_snap_obj = origin->ds_object; 683fa9e4066Sahrens dsphys->ds_prev_snap_txg = 6843cb34c60Sahrens origin->ds_phys->ds_creation_txg; 685ad135b5dSChristopher Siden dsphys->ds_referenced_bytes = 686ad135b5dSChristopher Siden origin->ds_phys->ds_referenced_bytes; 687fa9e4066Sahrens dsphys->ds_compressed_bytes = 6883cb34c60Sahrens origin->ds_phys->ds_compressed_bytes; 689fa9e4066Sahrens dsphys->ds_uncompressed_bytes = 6903cb34c60Sahrens origin->ds_phys->ds_uncompressed_bytes; 6913cb34c60Sahrens dsphys->ds_bp = origin->ds_phys->ds_bp; 692579ae4d5Stimh dsphys->ds_flags |= origin->ds_phys->ds_flags; 693fa9e4066Sahrens 6943cb34c60Sahrens dmu_buf_will_dirty(origin->ds_dbuf, tx); 6953cb34c60Sahrens origin->ds_phys->ds_num_children++; 696fa9e4066Sahrens 6973b2aab18SMatthew Ahrens VERIFY0(dsl_dataset_hold_obj(dp, 698cde58dbcSMatthew Ahrens origin->ds_dir->dd_phys->dd_head_dataset_obj, FTAG, &ohds)); 699cde58dbcSMatthew Ahrens dsphys->ds_deadlist_obj = dsl_deadlist_clone(&ohds->ds_deadlist, 700cde58dbcSMatthew Ahrens dsphys->ds_prev_snap_txg, dsphys->ds_prev_snap_obj, tx); 701cde58dbcSMatthew Ahrens dsl_dataset_rele(ohds, FTAG); 702cde58dbcSMatthew Ahrens 703088f3894Sahrens if (spa_version(dp->dp_spa) >= SPA_VERSION_NEXT_CLONES) { 704088f3894Sahrens if (origin->ds_phys->ds_next_clones_obj == 0) { 705088f3894Sahrens origin->ds_phys->ds_next_clones_obj = 706088f3894Sahrens zap_create(mos, 707088f3894Sahrens DMU_OT_NEXT_CLONES, DMU_OT_NONE, 0, tx); 708088f3894Sahrens } 7093b2aab18SMatthew Ahrens VERIFY0(zap_add_int(mos, 7103b2aab18SMatthew Ahrens origin->ds_phys->ds_next_clones_obj, dsobj, tx)); 711088f3894Sahrens } 712088f3894Sahrens 
713fa9e4066Sahrens dmu_buf_will_dirty(dd->dd_dbuf, tx); 7143cb34c60Sahrens dd->dd_phys->dd_origin_obj = origin->ds_object; 715cde58dbcSMatthew Ahrens if (spa_version(dp->dp_spa) >= SPA_VERSION_DIR_CLONES) { 716cde58dbcSMatthew Ahrens if (origin->ds_dir->dd_phys->dd_clones == 0) { 717cde58dbcSMatthew Ahrens dmu_buf_will_dirty(origin->ds_dir->dd_dbuf, tx); 718cde58dbcSMatthew Ahrens origin->ds_dir->dd_phys->dd_clones = 719cde58dbcSMatthew Ahrens zap_create(mos, 720cde58dbcSMatthew Ahrens DMU_OT_DSL_CLONES, DMU_OT_NONE, 0, tx); 721cde58dbcSMatthew Ahrens } 7223b2aab18SMatthew Ahrens VERIFY0(zap_add_int(mos, 723cde58dbcSMatthew Ahrens origin->ds_dir->dd_phys->dd_clones, dsobj, tx)); 724cde58dbcSMatthew Ahrens } 725fa9e4066Sahrens } 726ab04eb8eStimh 727ab04eb8eStimh if (spa_version(dp->dp_spa) >= SPA_VERSION_UNIQUE_ACCURATE) 728ab04eb8eStimh dsphys->ds_flags |= DS_FLAG_UNIQUE_ACCURATE; 729ab04eb8eStimh 730ea8dc4b6Seschrock dmu_buf_rele(dbuf, FTAG); 731fa9e4066Sahrens 732fa9e4066Sahrens dmu_buf_will_dirty(dd->dd_dbuf, tx); 733fa9e4066Sahrens dd->dd_phys->dd_head_dataset_obj = dsobj; 7343cb34c60Sahrens 7353cb34c60Sahrens return (dsobj); 7363cb34c60Sahrens } 7373cb34c60Sahrens 7383b2aab18SMatthew Ahrens static void 7393b2aab18SMatthew Ahrens dsl_dataset_zero_zil(dsl_dataset_t *ds, dmu_tx_t *tx) 7403b2aab18SMatthew Ahrens { 7413b2aab18SMatthew Ahrens objset_t *os; 7423b2aab18SMatthew Ahrens 7433b2aab18SMatthew Ahrens VERIFY0(dmu_objset_from_ds(ds, &os)); 7443b2aab18SMatthew Ahrens bzero(&os->os_zil_header, sizeof (os->os_zil_header)); 7453b2aab18SMatthew Ahrens dsl_dataset_dirty(ds, tx); 7463b2aab18SMatthew Ahrens } 7473b2aab18SMatthew Ahrens 7483cb34c60Sahrens uint64_t 749ab04eb8eStimh dsl_dataset_create_sync(dsl_dir_t *pdd, const char *lastname, 750ab04eb8eStimh dsl_dataset_t *origin, uint64_t flags, cred_t *cr, dmu_tx_t *tx) 7513cb34c60Sahrens { 7523cb34c60Sahrens dsl_pool_t *dp = pdd->dd_pool; 7533cb34c60Sahrens uint64_t dsobj, ddobj; 7543cb34c60Sahrens dsl_dir_t *dd; 
7553cb34c60Sahrens 7563b2aab18SMatthew Ahrens ASSERT(dmu_tx_is_syncing(tx)); 7573cb34c60Sahrens ASSERT(lastname[0] != '@'); 7583cb34c60Sahrens 759088f3894Sahrens ddobj = dsl_dir_create_sync(dp, pdd, lastname, tx); 7603b2aab18SMatthew Ahrens VERIFY0(dsl_dir_hold_obj(dp, ddobj, lastname, FTAG, &dd)); 7613cb34c60Sahrens 7623b2aab18SMatthew Ahrens dsobj = dsl_dataset_create_sync_dd(dd, origin, 7633b2aab18SMatthew Ahrens flags & ~DS_CREATE_FLAG_NODIRTY, tx); 7643cb34c60Sahrens 7653cb34c60Sahrens dsl_deleg_set_create_perms(dd, tx, cr); 7663cb34c60Sahrens 767a2afb611SJerry Jelinek /* 768a2afb611SJerry Jelinek * Since we're creating a new node we know it's a leaf, so we can 769a2afb611SJerry Jelinek * initialize the counts if the limit feature is active. 770a2afb611SJerry Jelinek */ 771a2afb611SJerry Jelinek if (spa_feature_is_active(dp->dp_spa, SPA_FEATURE_FS_SS_LIMIT)) { 772a2afb611SJerry Jelinek uint64_t cnt = 0; 773a2afb611SJerry Jelinek objset_t *os = dd->dd_pool->dp_meta_objset; 774a2afb611SJerry Jelinek 775a2afb611SJerry Jelinek dsl_dir_zapify(dd, tx); 776a2afb611SJerry Jelinek VERIFY0(zap_add(os, dd->dd_object, DD_FIELD_FILESYSTEM_COUNT, 777a2afb611SJerry Jelinek sizeof (cnt), 1, &cnt, tx)); 778a2afb611SJerry Jelinek VERIFY0(zap_add(os, dd->dd_object, DD_FIELD_SNAPSHOT_COUNT, 779a2afb611SJerry Jelinek sizeof (cnt), 1, &cnt, tx)); 780a2afb611SJerry Jelinek } 781a2afb611SJerry Jelinek 7823b2aab18SMatthew Ahrens dsl_dir_rele(dd, FTAG); 783fa9e4066Sahrens 784feaa74e4SMark Maybee /* 785feaa74e4SMark Maybee * If we are creating a clone, make sure we zero out any stale 786feaa74e4SMark Maybee * data from the origin snapshots zil header. 
787feaa74e4SMark Maybee */ 7883b2aab18SMatthew Ahrens if (origin != NULL && !(flags & DS_CREATE_FLAG_NODIRTY)) { 789feaa74e4SMark Maybee dsl_dataset_t *ds; 790feaa74e4SMark Maybee 7913b2aab18SMatthew Ahrens VERIFY0(dsl_dataset_hold_obj(dp, dsobj, FTAG, &ds)); 7923b2aab18SMatthew Ahrens dsl_dataset_zero_zil(ds, tx); 793feaa74e4SMark Maybee dsl_dataset_rele(ds, FTAG); 794feaa74e4SMark Maybee } 795feaa74e4SMark Maybee 7961d452cf5Sahrens return (dsobj); 797fa9e4066Sahrens } 798fa9e4066Sahrens 7991d452cf5Sahrens /* 8003b2aab18SMatthew Ahrens * The unique space in the head dataset can be calculated by subtracting 8013b2aab18SMatthew Ahrens * the space used in the most recent snapshot, that is still being used 8023b2aab18SMatthew Ahrens * in this file system, from the space currently in use. To figure out 8033b2aab18SMatthew Ahrens * the space in the most recent snapshot still in use, we need to take 8043b2aab18SMatthew Ahrens * the total space used in the snapshot and subtract out the space that 8053b2aab18SMatthew Ahrens * has been freed up since the snapshot was taken. 
8061d452cf5Sahrens */ 8073b2aab18SMatthew Ahrens void 8083b2aab18SMatthew Ahrens dsl_dataset_recalc_head_uniq(dsl_dataset_t *ds) 8091d452cf5Sahrens { 8103b2aab18SMatthew Ahrens uint64_t mrs_used; 8113b2aab18SMatthew Ahrens uint64_t dlused, dlcomp, dluncomp; 8121d452cf5Sahrens 8133b2aab18SMatthew Ahrens ASSERT(!dsl_dataset_is_snapshot(ds)); 8141d452cf5Sahrens 8153b2aab18SMatthew Ahrens if (ds->ds_phys->ds_prev_snap_obj != 0) 8163b2aab18SMatthew Ahrens mrs_used = ds->ds_prev->ds_phys->ds_referenced_bytes; 8173b2aab18SMatthew Ahrens else 8183b2aab18SMatthew Ahrens mrs_used = 0; 819842727c2SChris Kirby 8203b2aab18SMatthew Ahrens dsl_deadlist_space(&ds->ds_deadlist, &dlused, &dlcomp, &dluncomp); 821fa9e4066Sahrens 8223b2aab18SMatthew Ahrens ASSERT3U(dlused, <=, mrs_used); 8233b2aab18SMatthew Ahrens ds->ds_phys->ds_unique_bytes = 8243b2aab18SMatthew Ahrens ds->ds_phys->ds_referenced_bytes - (mrs_used - dlused); 82519b94df9SMatthew Ahrens 8263b2aab18SMatthew Ahrens if (spa_version(ds->ds_dir->dd_pool->dp_spa) >= 8273b2aab18SMatthew Ahrens SPA_VERSION_UNIQUE_ACCURATE) 8283b2aab18SMatthew Ahrens ds->ds_phys->ds_flags |= DS_FLAG_UNIQUE_ACCURATE; 829fa9e4066Sahrens } 830fa9e4066Sahrens 8313b2aab18SMatthew Ahrens void 8323b2aab18SMatthew Ahrens dsl_dataset_remove_from_next_clones(dsl_dataset_t *ds, uint64_t obj, 8333b2aab18SMatthew Ahrens dmu_tx_t *tx) 834842727c2SChris Kirby { 8353b2aab18SMatthew Ahrens objset_t *mos = ds->ds_dir->dd_pool->dp_meta_objset; 8363b2aab18SMatthew Ahrens uint64_t count; 8373b2aab18SMatthew Ahrens int err; 8383b2aab18SMatthew Ahrens 8393b2aab18SMatthew Ahrens ASSERT(ds->ds_phys->ds_num_children >= 2); 8403b2aab18SMatthew Ahrens err = zap_remove_int(mos, ds->ds_phys->ds_next_clones_obj, obj, tx); 8413b2aab18SMatthew Ahrens /* 8423b2aab18SMatthew Ahrens * The err should not be ENOENT, but a bug in a previous version 8433b2aab18SMatthew Ahrens * of the code could cause upgrade_clones_cb() to not set 8443b2aab18SMatthew Ahrens * ds_next_snap_obj when it 
should, leading to a missing entry. 8453b2aab18SMatthew Ahrens * If we knew that the pool was created after 8463b2aab18SMatthew Ahrens * SPA_VERSION_NEXT_CLONES, we could assert that it isn't 8473b2aab18SMatthew Ahrens * ENOENT. However, at least we can check that we don't have 8483b2aab18SMatthew Ahrens * too many entries in the next_clones_obj even after failing to 8493b2aab18SMatthew Ahrens * remove this one. 8503b2aab18SMatthew Ahrens */ 8513b2aab18SMatthew Ahrens if (err != ENOENT) 8523b2aab18SMatthew Ahrens VERIFY0(err); 8533b2aab18SMatthew Ahrens ASSERT0(zap_count(mos, ds->ds_phys->ds_next_clones_obj, 8543b2aab18SMatthew Ahrens &count)); 8553b2aab18SMatthew Ahrens ASSERT3U(count, <=, ds->ds_phys->ds_num_children - 2); 8563b2aab18SMatthew Ahrens } 857842727c2SChris Kirby 858842727c2SChris Kirby 8593b2aab18SMatthew Ahrens blkptr_t * 8603b2aab18SMatthew Ahrens dsl_dataset_get_blkptr(dsl_dataset_t *ds) 8613b2aab18SMatthew Ahrens { 8623b2aab18SMatthew Ahrens return (&ds->ds_phys->ds_bp); 863842727c2SChris Kirby } 864842727c2SChris Kirby 8653b2aab18SMatthew Ahrens void 8663b2aab18SMatthew Ahrens dsl_dataset_set_blkptr(dsl_dataset_t *ds, blkptr_t *bp, dmu_tx_t *tx) 867842727c2SChris Kirby { 8683b2aab18SMatthew Ahrens ASSERT(dmu_tx_is_syncing(tx)); 8693b2aab18SMatthew Ahrens /* If it's the meta-objset, set dp_meta_rootbp */ 8703b2aab18SMatthew Ahrens if (ds == NULL) { 8713b2aab18SMatthew Ahrens tx->tx_pool->dp_meta_rootbp = *bp; 8723b2aab18SMatthew Ahrens } else { 8733b2aab18SMatthew Ahrens dmu_buf_will_dirty(ds->ds_dbuf, tx); 8743b2aab18SMatthew Ahrens ds->ds_phys->ds_bp = *bp; 875842727c2SChris Kirby } 8763b2aab18SMatthew Ahrens } 877842727c2SChris Kirby 8783b2aab18SMatthew Ahrens spa_t * 8793b2aab18SMatthew Ahrens dsl_dataset_get_spa(dsl_dataset_t *ds) 8803b2aab18SMatthew Ahrens { 8813b2aab18SMatthew Ahrens return (ds->ds_dir->dd_pool->dp_spa); 882842727c2SChris Kirby } 883842727c2SChris Kirby 8843b2aab18SMatthew Ahrens void 8853b2aab18SMatthew Ahrens 
dsl_dataset_dirty(dsl_dataset_t *ds, dmu_tx_t *tx) 886fa9e4066Sahrens { 8873b2aab18SMatthew Ahrens dsl_pool_t *dp; 888842727c2SChris Kirby 8893b2aab18SMatthew Ahrens if (ds == NULL) /* this is the meta-objset */ 8903b2aab18SMatthew Ahrens return; 8911d452cf5Sahrens 8923b2aab18SMatthew Ahrens ASSERT(ds->ds_objset != NULL); 893fa9e4066Sahrens 8943b2aab18SMatthew Ahrens if (ds->ds_phys->ds_next_snap_obj != 0) 8953b2aab18SMatthew Ahrens panic("dirtying snapshot!"); 896fa9e4066Sahrens 8973b2aab18SMatthew Ahrens dp = ds->ds_dir->dd_pool; 898ce636f8bSMatthew Ahrens 8993b2aab18SMatthew Ahrens if (txg_list_add(&dp->dp_dirty_datasets, ds, tx->tx_txg)) { 9003b2aab18SMatthew Ahrens /* up the hold count until we can be written out */ 9013b2aab18SMatthew Ahrens dmu_buf_add_ref(ds->ds_dbuf, ds); 9023b2aab18SMatthew Ahrens } 9033b2aab18SMatthew Ahrens } 904fa9e4066Sahrens 9052e2c1355SMatthew Ahrens boolean_t 9062e2c1355SMatthew Ahrens dsl_dataset_is_dirty(dsl_dataset_t *ds) 9072e2c1355SMatthew Ahrens { 9082e2c1355SMatthew Ahrens for (int t = 0; t < TXG_SIZE; t++) { 9092e2c1355SMatthew Ahrens if (txg_list_member(&ds->ds_dir->dd_pool->dp_dirty_datasets, 9102e2c1355SMatthew Ahrens ds, t)) 9112e2c1355SMatthew Ahrens return (B_TRUE); 9122e2c1355SMatthew Ahrens } 9132e2c1355SMatthew Ahrens return (B_FALSE); 9142e2c1355SMatthew Ahrens } 9152e2c1355SMatthew Ahrens 916fa9e4066Sahrens static int 9173b2aab18SMatthew Ahrens dsl_dataset_snapshot_reserve_space(dsl_dataset_t *ds, dmu_tx_t *tx) 918fa9e4066Sahrens { 9193b2aab18SMatthew Ahrens uint64_t asize; 920fa9e4066Sahrens 9213b2aab18SMatthew Ahrens if (!dmu_tx_is_syncing(tx)) 92288b7b0f2SMatthew Ahrens return (0); 923fa9e4066Sahrens 924e1930233Sbonwick /* 9253b2aab18SMatthew Ahrens * If there's an fs-only reservation, any blocks that might become 9263b2aab18SMatthew Ahrens * owned by the snapshot dataset must be accommodated by space 9273b2aab18SMatthew Ahrens * outside of the reservation. 
928e1930233Sbonwick */ 9293b2aab18SMatthew Ahrens ASSERT(ds->ds_reserved == 0 || DS_UNIQUE_IS_ACCURATE(ds)); 9303b2aab18SMatthew Ahrens asize = MIN(ds->ds_phys->ds_unique_bytes, ds->ds_reserved); 9313b2aab18SMatthew Ahrens if (asize > dsl_dir_space_available(ds->ds_dir, NULL, 0, TRUE)) 932be6fd75aSMatthew Ahrens return (SET_ERROR(ENOSPC)); 933e1930233Sbonwick 9343cb34c60Sahrens /* 9353b2aab18SMatthew Ahrens * Propagate any reserved space for this snapshot to other 9363b2aab18SMatthew Ahrens * snapshot checks in this sync group. 9373cb34c60Sahrens */ 9383b2aab18SMatthew Ahrens if (asize > 0) 9393b2aab18SMatthew Ahrens dsl_dir_willuse_space(ds->ds_dir, asize, tx); 9403cb34c60Sahrens 941e1930233Sbonwick return (0); 942e1930233Sbonwick } 943e1930233Sbonwick 9443b2aab18SMatthew Ahrens typedef struct dsl_dataset_snapshot_arg { 9453b2aab18SMatthew Ahrens nvlist_t *ddsa_snaps; 9463b2aab18SMatthew Ahrens nvlist_t *ddsa_props; 9473b2aab18SMatthew Ahrens nvlist_t *ddsa_errors; 948a2afb611SJerry Jelinek cred_t *ddsa_cr; 9493b2aab18SMatthew Ahrens } dsl_dataset_snapshot_arg_t; 950842727c2SChris Kirby 9513cb34c60Sahrens int 9523b2aab18SMatthew Ahrens dsl_dataset_snapshot_check_impl(dsl_dataset_t *ds, const char *snapname, 953a2afb611SJerry Jelinek dmu_tx_t *tx, boolean_t recv, uint64_t cnt, cred_t *cr) 9541d452cf5Sahrens { 9553b2aab18SMatthew Ahrens int error; 9563b2aab18SMatthew Ahrens uint64_t value; 957fa9e4066Sahrens 9583b2aab18SMatthew Ahrens ds->ds_trysnap_txg = tx->tx_txg; 959745cd3c5Smaybee 9603b2aab18SMatthew Ahrens if (!dmu_tx_is_syncing(tx)) 961842727c2SChris Kirby return (0); 962fa9e4066Sahrens 963fa9e4066Sahrens /* 9643b2aab18SMatthew Ahrens * We don't allow multiple snapshots of the same txg. If there 9653b2aab18SMatthew Ahrens * is already one, try again. 
966fa9e4066Sahrens */ 9673b2aab18SMatthew Ahrens if (ds->ds_phys->ds_prev_snap_txg >= tx->tx_txg) 968be6fd75aSMatthew Ahrens return (SET_ERROR(EAGAIN)); 969fa9e4066Sahrens 970fa9e4066Sahrens /* 9713b2aab18SMatthew Ahrens * Check for conflicting snapshot name. 972fa9e4066Sahrens */ 9733b2aab18SMatthew Ahrens error = dsl_dataset_snap_lookup(ds, snapname, &value); 9743b2aab18SMatthew Ahrens if (error == 0) 975be6fd75aSMatthew Ahrens return (SET_ERROR(EEXIST)); 9763b2aab18SMatthew Ahrens if (error != ENOENT) 9773b2aab18SMatthew Ahrens return (error); 978842727c2SChris Kirby 979ca48f36fSKeith M Wesolowski /* 980ca48f36fSKeith M Wesolowski * We don't allow taking snapshots of inconsistent datasets, such as 981ca48f36fSKeith M Wesolowski * those into which we are currently receiving. However, if we are 982ca48f36fSKeith M Wesolowski * creating this snapshot as part of a receive, this check will be 983ca48f36fSKeith M Wesolowski * executed atomically with respect to the completion of the receive 984ca48f36fSKeith M Wesolowski * itself but prior to the clearing of DS_FLAG_INCONSISTENT; in this 985ca48f36fSKeith M Wesolowski * case we ignore this, knowing it will be fixed up for us shortly in 986ca48f36fSKeith M Wesolowski * dmu_recv_end_sync(). 987ca48f36fSKeith M Wesolowski */ 988ca48f36fSKeith M Wesolowski if (!recv && DS_IS_INCONSISTENT(ds)) 989ca48f36fSKeith M Wesolowski return (SET_ERROR(EBUSY)); 990ca48f36fSKeith M Wesolowski 991a2afb611SJerry Jelinek /* 992a2afb611SJerry Jelinek * Skip the check for temporary snapshots or if we have already checked 993a2afb611SJerry Jelinek * the counts in dsl_dataset_snapshot_check. This means we really only 994a2afb611SJerry Jelinek * check the count here when we're receiving a stream. 
995a2afb611SJerry Jelinek */ 996a2afb611SJerry Jelinek if (cnt != 0 && cr != NULL) { 997a2afb611SJerry Jelinek error = dsl_fs_ss_limit_check(ds->ds_dir, cnt, 998a2afb611SJerry Jelinek ZFS_PROP_SNAPSHOT_LIMIT, NULL, cr); 999a2afb611SJerry Jelinek if (error != 0) 1000a2afb611SJerry Jelinek return (error); 1001a2afb611SJerry Jelinek } 1002a2afb611SJerry Jelinek 10033b2aab18SMatthew Ahrens error = dsl_dataset_snapshot_reserve_space(ds, tx); 10043b2aab18SMatthew Ahrens if (error != 0) 10053b2aab18SMatthew Ahrens return (error); 1006842727c2SChris Kirby 10071d452cf5Sahrens return (0); 10081d452cf5Sahrens } 10091d452cf5Sahrens 10103b2aab18SMatthew Ahrens static int 10113b2aab18SMatthew Ahrens dsl_dataset_snapshot_check(void *arg, dmu_tx_t *tx) 1012745cd3c5Smaybee { 10133b2aab18SMatthew Ahrens dsl_dataset_snapshot_arg_t *ddsa = arg; 10143b2aab18SMatthew Ahrens dsl_pool_t *dp = dmu_tx_pool(tx); 10153b2aab18SMatthew Ahrens nvpair_t *pair; 10163b2aab18SMatthew Ahrens int rv = 0; 10173b2aab18SMatthew Ahrens 1018a2afb611SJerry Jelinek /* 1019a2afb611SJerry Jelinek * Pre-compute how many total new snapshots will be created for each 1020a2afb611SJerry Jelinek * level in the tree and below. This is needed for validating the 1021a2afb611SJerry Jelinek * snapshot limit when either taking a recursive snapshot or when 1022a2afb611SJerry Jelinek * taking multiple snapshots. 1023a2afb611SJerry Jelinek * 1024a2afb611SJerry Jelinek * The problem is that the counts are not actually adjusted when 1025a2afb611SJerry Jelinek * we are checking, only when we finally sync. For a single snapshot, 1026a2afb611SJerry Jelinek * this is easy, the count will increase by 1 at each node up the tree, 1027a2afb611SJerry Jelinek * but its more complicated for the recursive/multiple snapshot case. 
1028a2afb611SJerry Jelinek * 1029a2afb611SJerry Jelinek * The dsl_fs_ss_limit_check function does recursively check the count 1030a2afb611SJerry Jelinek * at each level up the tree but since it is validating each snapshot 1031a2afb611SJerry Jelinek * independently we need to be sure that we are validating the complete 1032a2afb611SJerry Jelinek * count for the entire set of snapshots. We do this by rolling up the 1033a2afb611SJerry Jelinek * counts for each component of the name into an nvlist and then 1034a2afb611SJerry Jelinek * checking each of those cases with the aggregated count. 1035a2afb611SJerry Jelinek * 1036a2afb611SJerry Jelinek * This approach properly handles not only the recursive snapshot 1037a2afb611SJerry Jelinek * case (where we get all of those on the ddsa_snaps list) but also 1038a2afb611SJerry Jelinek * the sibling case (e.g. snapshot a/b and a/c so that we will also 1039a2afb611SJerry Jelinek * validate the limit on 'a' using a count of 2). 1040a2afb611SJerry Jelinek * 1041a2afb611SJerry Jelinek * We validate the snapshot names in the third loop and only report 1042a2afb611SJerry Jelinek * name errors once. 
1043a2afb611SJerry Jelinek */ 1044a2afb611SJerry Jelinek if (dmu_tx_is_syncing(tx)) { 1045a2afb611SJerry Jelinek nvlist_t *cnt_track = NULL; 1046a2afb611SJerry Jelinek cnt_track = fnvlist_alloc(); 1047a2afb611SJerry Jelinek 1048a2afb611SJerry Jelinek /* Rollup aggregated counts into the cnt_track list */ 1049a2afb611SJerry Jelinek for (pair = nvlist_next_nvpair(ddsa->ddsa_snaps, NULL); 1050a2afb611SJerry Jelinek pair != NULL; 1051a2afb611SJerry Jelinek pair = nvlist_next_nvpair(ddsa->ddsa_snaps, pair)) { 1052a2afb611SJerry Jelinek char *pdelim; 1053a2afb611SJerry Jelinek uint64_t val; 1054a2afb611SJerry Jelinek char nm[MAXPATHLEN]; 1055a2afb611SJerry Jelinek 1056a2afb611SJerry Jelinek (void) strlcpy(nm, nvpair_name(pair), sizeof (nm)); 1057a2afb611SJerry Jelinek pdelim = strchr(nm, '@'); 1058a2afb611SJerry Jelinek if (pdelim == NULL) 1059a2afb611SJerry Jelinek continue; 1060a2afb611SJerry Jelinek *pdelim = '\0'; 1061a2afb611SJerry Jelinek 1062a2afb611SJerry Jelinek do { 1063a2afb611SJerry Jelinek if (nvlist_lookup_uint64(cnt_track, nm, 1064a2afb611SJerry Jelinek &val) == 0) { 1065a2afb611SJerry Jelinek /* update existing entry */ 1066a2afb611SJerry Jelinek fnvlist_add_uint64(cnt_track, nm, 1067a2afb611SJerry Jelinek val + 1); 1068a2afb611SJerry Jelinek } else { 1069a2afb611SJerry Jelinek /* add to list */ 1070a2afb611SJerry Jelinek fnvlist_add_uint64(cnt_track, nm, 1); 1071a2afb611SJerry Jelinek } 1072a2afb611SJerry Jelinek 1073a2afb611SJerry Jelinek pdelim = strrchr(nm, '/'); 1074a2afb611SJerry Jelinek if (pdelim != NULL) 1075a2afb611SJerry Jelinek *pdelim = '\0'; 1076a2afb611SJerry Jelinek } while (pdelim != NULL); 1077a2afb611SJerry Jelinek } 1078a2afb611SJerry Jelinek 1079a2afb611SJerry Jelinek /* Check aggregated counts at each level */ 1080a2afb611SJerry Jelinek for (pair = nvlist_next_nvpair(cnt_track, NULL); 1081a2afb611SJerry Jelinek pair != NULL; pair = nvlist_next_nvpair(cnt_track, pair)) { 1082a2afb611SJerry Jelinek int error = 0; 1083a2afb611SJerry 
Jelinek char *name; 1084a2afb611SJerry Jelinek uint64_t cnt = 0; 1085a2afb611SJerry Jelinek dsl_dataset_t *ds; 1086a2afb611SJerry Jelinek 1087a2afb611SJerry Jelinek name = nvpair_name(pair); 1088a2afb611SJerry Jelinek cnt = fnvpair_value_uint64(pair); 1089a2afb611SJerry Jelinek ASSERT(cnt > 0); 1090a2afb611SJerry Jelinek 1091a2afb611SJerry Jelinek error = dsl_dataset_hold(dp, name, FTAG, &ds); 1092a2afb611SJerry Jelinek if (error == 0) { 1093a2afb611SJerry Jelinek error = dsl_fs_ss_limit_check(ds->ds_dir, cnt, 1094a2afb611SJerry Jelinek ZFS_PROP_SNAPSHOT_LIMIT, NULL, 1095a2afb611SJerry Jelinek ddsa->ddsa_cr); 1096a2afb611SJerry Jelinek dsl_dataset_rele(ds, FTAG); 1097a2afb611SJerry Jelinek } 1098a2afb611SJerry Jelinek 1099a2afb611SJerry Jelinek if (error != 0) { 1100a2afb611SJerry Jelinek if (ddsa->ddsa_errors != NULL) 1101a2afb611SJerry Jelinek fnvlist_add_int32(ddsa->ddsa_errors, 1102a2afb611SJerry Jelinek name, error); 1103a2afb611SJerry Jelinek rv = error; 1104a2afb611SJerry Jelinek /* only report one error for this check */ 1105a2afb611SJerry Jelinek break; 1106a2afb611SJerry Jelinek } 1107a2afb611SJerry Jelinek } 1108a2afb611SJerry Jelinek nvlist_free(cnt_track); 1109a2afb611SJerry Jelinek } 1110a2afb611SJerry Jelinek 11113b2aab18SMatthew Ahrens for (pair = nvlist_next_nvpair(ddsa->ddsa_snaps, NULL); 11123b2aab18SMatthew Ahrens pair != NULL; pair = nvlist_next_nvpair(ddsa->ddsa_snaps, pair)) { 11133b2aab18SMatthew Ahrens int error = 0; 11143b2aab18SMatthew Ahrens dsl_dataset_t *ds; 11153b2aab18SMatthew Ahrens char *name, *atp; 11163b2aab18SMatthew Ahrens char dsname[MAXNAMELEN]; 11173b2aab18SMatthew Ahrens 11183b2aab18SMatthew Ahrens name = nvpair_name(pair); 11193b2aab18SMatthew Ahrens if (strlen(name) >= MAXNAMELEN) 1120be6fd75aSMatthew Ahrens error = SET_ERROR(ENAMETOOLONG); 11213b2aab18SMatthew Ahrens if (error == 0) { 11223b2aab18SMatthew Ahrens atp = strchr(name, '@'); 11233b2aab18SMatthew Ahrens if (atp == NULL) 1124be6fd75aSMatthew Ahrens error = 
SET_ERROR(EINVAL); 11253b2aab18SMatthew Ahrens if (error == 0) 11263b2aab18SMatthew Ahrens (void) strlcpy(dsname, name, atp - name + 1); 11273b2aab18SMatthew Ahrens } 11283b2aab18SMatthew Ahrens if (error == 0) 11293b2aab18SMatthew Ahrens error = dsl_dataset_hold(dp, dsname, FTAG, &ds); 11303b2aab18SMatthew Ahrens if (error == 0) { 1131a2afb611SJerry Jelinek /* passing 0/NULL skips dsl_fs_ss_limit_check */ 11323b2aab18SMatthew Ahrens error = dsl_dataset_snapshot_check_impl(ds, 1133a2afb611SJerry Jelinek atp + 1, tx, B_FALSE, 0, NULL); 11343b2aab18SMatthew Ahrens dsl_dataset_rele(ds, FTAG); 11353b2aab18SMatthew Ahrens } 1136745cd3c5Smaybee 11373b2aab18SMatthew Ahrens if (error != 0) { 11383b2aab18SMatthew Ahrens if (ddsa->ddsa_errors != NULL) { 11393b2aab18SMatthew Ahrens fnvlist_add_int32(ddsa->ddsa_errors, 11403b2aab18SMatthew Ahrens name, error); 11413b2aab18SMatthew Ahrens } 11423b2aab18SMatthew Ahrens rv = error; 11433b2aab18SMatthew Ahrens } 11443b2aab18SMatthew Ahrens } 1145a2afb611SJerry Jelinek 11463b2aab18SMatthew Ahrens return (rv); 1147745cd3c5Smaybee } 1148745cd3c5Smaybee 11493b2aab18SMatthew Ahrens void 11503b2aab18SMatthew Ahrens dsl_dataset_snapshot_sync_impl(dsl_dataset_t *ds, const char *snapname, 11513b2aab18SMatthew Ahrens dmu_tx_t *tx) 1152745cd3c5Smaybee { 11533b2aab18SMatthew Ahrens static zil_header_t zero_zil; 1154745cd3c5Smaybee 11553b2aab18SMatthew Ahrens dsl_pool_t *dp = ds->ds_dir->dd_pool; 11563b2aab18SMatthew Ahrens dmu_buf_t *dbuf; 11573b2aab18SMatthew Ahrens dsl_dataset_phys_t *dsphys; 11583b2aab18SMatthew Ahrens uint64_t dsobj, crtxg; 11593b2aab18SMatthew Ahrens objset_t *mos = dp->dp_meta_objset; 11603b2aab18SMatthew Ahrens objset_t *os; 1161745cd3c5Smaybee 11623b2aab18SMatthew Ahrens ASSERT(RRW_WRITE_HELD(&dp->dp_config_rwlock)); 1163c33e334fSMatthew Ahrens 1164c33e334fSMatthew Ahrens /* 11653b2aab18SMatthew Ahrens * If we are on an old pool, the zil must not be active, in which 11663b2aab18SMatthew Ahrens * case it will be 
zeroed. Usually zil_suspend() accomplishes this. 1167c33e334fSMatthew Ahrens */ 11683b2aab18SMatthew Ahrens ASSERT(spa_version(dmu_tx_pool(tx)->dp_spa) >= SPA_VERSION_FAST_SNAP || 11693b2aab18SMatthew Ahrens dmu_objset_from_ds(ds, &os) != 0 || 11703b2aab18SMatthew Ahrens bcmp(&os->os_phys->os_zil_header, &zero_zil, 11713b2aab18SMatthew Ahrens sizeof (zero_zil)) == 0); 1172c33e334fSMatthew Ahrens 1173a2afb611SJerry Jelinek dsl_fs_ss_count_adjust(ds->ds_dir, 1, DD_FIELD_SNAPSHOT_COUNT, tx); 1174cde58dbcSMatthew Ahrens 1175cde58dbcSMatthew Ahrens /* 11763b2aab18SMatthew Ahrens * The origin's ds_creation_txg has to be < TXG_INITIAL 1177088f3894Sahrens */ 1178088f3894Sahrens if (strcmp(snapname, ORIGIN_DIR_NAME) == 0) 1179088f3894Sahrens crtxg = 1; 1180088f3894Sahrens else 1181088f3894Sahrens crtxg = tx->tx_txg; 1182088f3894Sahrens 11831649cd4bStabriz dsobj = dmu_object_alloc(mos, DMU_OT_DSL_DATASET, 0, 11841649cd4bStabriz DMU_OT_DSL_DATASET, sizeof (dsl_dataset_phys_t), tx); 11853b2aab18SMatthew Ahrens VERIFY0(dmu_bonus_hold(mos, dsobj, FTAG, &dbuf)); 1186fa9e4066Sahrens dmu_buf_will_dirty(dbuf, tx); 1187fa9e4066Sahrens dsphys = dbuf->db_data; 1188745cd3c5Smaybee bzero(dsphys, sizeof (dsl_dataset_phys_t)); 11891d452cf5Sahrens dsphys->ds_dir_obj = ds->ds_dir->dd_object; 1190fa9e4066Sahrens dsphys->ds_fsid_guid = unique_create(); 1191fa9e4066Sahrens (void) random_get_pseudo_bytes((void*)&dsphys->ds_guid, 1192fa9e4066Sahrens sizeof (dsphys->ds_guid)); 1193fa9e4066Sahrens dsphys->ds_prev_snap_obj = ds->ds_phys->ds_prev_snap_obj; 1194fa9e4066Sahrens dsphys->ds_prev_snap_txg = ds->ds_phys->ds_prev_snap_txg; 1195fa9e4066Sahrens dsphys->ds_next_snap_obj = ds->ds_object; 1196fa9e4066Sahrens dsphys->ds_num_children = 1; 1197fa9e4066Sahrens dsphys->ds_creation_time = gethrestime_sec(); 1198088f3894Sahrens dsphys->ds_creation_txg = crtxg; 1199fa9e4066Sahrens dsphys->ds_deadlist_obj = ds->ds_phys->ds_deadlist_obj; 1200ad135b5dSChristopher Siden dsphys->ds_referenced_bytes = 
ds->ds_phys->ds_referenced_bytes; 1201fa9e4066Sahrens dsphys->ds_compressed_bytes = ds->ds_phys->ds_compressed_bytes; 1202fa9e4066Sahrens dsphys->ds_uncompressed_bytes = ds->ds_phys->ds_uncompressed_bytes; 120399653d4eSeschrock dsphys->ds_flags = ds->ds_phys->ds_flags; 1204fa9e4066Sahrens dsphys->ds_bp = ds->ds_phys->ds_bp; 1205ea8dc4b6Seschrock dmu_buf_rele(dbuf, FTAG); 1206fa9e4066Sahrens 12071d452cf5Sahrens ASSERT3U(ds->ds_prev != 0, ==, ds->ds_phys->ds_prev_snap_obj != 0); 12081d452cf5Sahrens if (ds->ds_prev) { 1209088f3894Sahrens uint64_t next_clones_obj = 1210088f3894Sahrens ds->ds_prev->ds_phys->ds_next_clones_obj; 12111d452cf5Sahrens ASSERT(ds->ds_prev->ds_phys->ds_next_snap_obj == 1212fa9e4066Sahrens ds->ds_object || 12131d452cf5Sahrens ds->ds_prev->ds_phys->ds_num_children > 1); 12141d452cf5Sahrens if (ds->ds_prev->ds_phys->ds_next_snap_obj == ds->ds_object) { 12151d452cf5Sahrens dmu_buf_will_dirty(ds->ds_prev->ds_dbuf, tx); 1216fa9e4066Sahrens ASSERT3U(ds->ds_phys->ds_prev_snap_txg, ==, 12171d452cf5Sahrens ds->ds_prev->ds_phys->ds_creation_txg); 12181d452cf5Sahrens ds->ds_prev->ds_phys->ds_next_snap_obj = dsobj; 1219088f3894Sahrens } else if (next_clones_obj != 0) { 12203b2aab18SMatthew Ahrens dsl_dataset_remove_from_next_clones(ds->ds_prev, 1221c33e334fSMatthew Ahrens dsphys->ds_next_snap_obj, tx); 12223b2aab18SMatthew Ahrens VERIFY0(zap_add_int(mos, 1223088f3894Sahrens next_clones_obj, dsobj, tx)); 1224fa9e4066Sahrens } 1225fa9e4066Sahrens } 1226fa9e4066Sahrens 1227a9799022Sck /* 1228a9799022Sck * If we have a reference-reservation on this dataset, we will 1229a9799022Sck * need to increase the amount of refreservation being charged 1230a9799022Sck * since our unique space is going to zero. 
1231a9799022Sck */ 1232a9799022Sck if (ds->ds_reserved) { 12333f9d6ad7SLin Ling int64_t delta; 12343f9d6ad7SLin Ling ASSERT(DS_UNIQUE_IS_ACCURATE(ds)); 12353f9d6ad7SLin Ling delta = MIN(ds->ds_phys->ds_unique_bytes, ds->ds_reserved); 123674e7dc98SMatthew Ahrens dsl_dir_diduse_space(ds->ds_dir, DD_USED_REFRSRV, 12373f9d6ad7SLin Ling delta, 0, 0, tx); 1238a9799022Sck } 1239a9799022Sck 1240fa9e4066Sahrens dmu_buf_will_dirty(ds->ds_dbuf, tx); 1241cde58dbcSMatthew Ahrens ds->ds_phys->ds_deadlist_obj = dsl_deadlist_clone(&ds->ds_deadlist, 1242cde58dbcSMatthew Ahrens UINT64_MAX, ds->ds_phys->ds_prev_snap_obj, tx); 1243cde58dbcSMatthew Ahrens dsl_deadlist_close(&ds->ds_deadlist); 1244cde58dbcSMatthew Ahrens dsl_deadlist_open(&ds->ds_deadlist, mos, ds->ds_phys->ds_deadlist_obj); 1245cde58dbcSMatthew Ahrens dsl_deadlist_add_key(&ds->ds_deadlist, 1246cde58dbcSMatthew Ahrens ds->ds_phys->ds_prev_snap_txg, tx); 1247cde58dbcSMatthew Ahrens 1248a4611edeSahrens ASSERT3U(ds->ds_phys->ds_prev_snap_txg, <, tx->tx_txg); 1249fa9e4066Sahrens ds->ds_phys->ds_prev_snap_obj = dsobj; 1250088f3894Sahrens ds->ds_phys->ds_prev_snap_txg = crtxg; 1251fa9e4066Sahrens ds->ds_phys->ds_unique_bytes = 0; 1252a9799022Sck if (spa_version(dp->dp_spa) >= SPA_VERSION_UNIQUE_ACCURATE) 1253a9799022Sck ds->ds_phys->ds_flags |= DS_FLAG_UNIQUE_ACCURATE; 1254fa9e4066Sahrens 12553b2aab18SMatthew Ahrens VERIFY0(zap_add(mos, ds->ds_phys->ds_snapnames_zapobj, 12563b2aab18SMatthew Ahrens snapname, 8, 1, &dsobj, tx)); 1257fa9e4066Sahrens 1258fa9e4066Sahrens if (ds->ds_prev) 12593b2aab18SMatthew Ahrens dsl_dataset_rele(ds->ds_prev, ds); 12603b2aab18SMatthew Ahrens VERIFY0(dsl_dataset_hold_obj(dp, 1261745cd3c5Smaybee ds->ds_phys->ds_prev_snap_obj, ds, &ds->ds_prev)); 1262ecd6cf80Smarks 12633f9d6ad7SLin Ling dsl_scan_ds_snapshotted(ds, tx); 1264088f3894Sahrens 126571eb0538SChris Kirby dsl_dir_snap_cmtime_update(ds->ds_dir); 126671eb0538SChris Kirby 12674445fffbSMatthew Ahrens spa_history_log_internal_ds(ds->ds_prev, 
"snapshot", tx, ""); 1268fa9e4066Sahrens } 1269fa9e4066Sahrens 12703b2aab18SMatthew Ahrens static void 12713b2aab18SMatthew Ahrens dsl_dataset_snapshot_sync(void *arg, dmu_tx_t *tx) 1272fa9e4066Sahrens { 12733b2aab18SMatthew Ahrens dsl_dataset_snapshot_arg_t *ddsa = arg; 12743b2aab18SMatthew Ahrens dsl_pool_t *dp = dmu_tx_pool(tx); 12753b2aab18SMatthew Ahrens nvpair_t *pair; 127691ebeef5Sahrens 12773b2aab18SMatthew Ahrens for (pair = nvlist_next_nvpair(ddsa->ddsa_snaps, NULL); 12783b2aab18SMatthew Ahrens pair != NULL; pair = nvlist_next_nvpair(ddsa->ddsa_snaps, pair)) { 12793b2aab18SMatthew Ahrens dsl_dataset_t *ds; 12803b2aab18SMatthew Ahrens char *name, *atp; 12813b2aab18SMatthew Ahrens char dsname[MAXNAMELEN]; 12823b2aab18SMatthew Ahrens 12833b2aab18SMatthew Ahrens name = nvpair_name(pair); 12843b2aab18SMatthew Ahrens atp = strchr(name, '@'); 12853b2aab18SMatthew Ahrens (void) strlcpy(dsname, name, atp - name + 1); 12863b2aab18SMatthew Ahrens VERIFY0(dsl_dataset_hold(dp, dsname, FTAG, &ds)); 12873b2aab18SMatthew Ahrens 12883b2aab18SMatthew Ahrens dsl_dataset_snapshot_sync_impl(ds, atp + 1, tx); 12893b2aab18SMatthew Ahrens if (ddsa->ddsa_props != NULL) { 12903b2aab18SMatthew Ahrens dsl_props_set_sync_impl(ds->ds_prev, 12913b2aab18SMatthew Ahrens ZPROP_SRC_LOCAL, ddsa->ddsa_props, tx); 12923b2aab18SMatthew Ahrens } 12933b2aab18SMatthew Ahrens dsl_dataset_rele(ds, FTAG); 12943b2aab18SMatthew Ahrens } 1295fa9e4066Sahrens } 1296fa9e4066Sahrens 12973b2aab18SMatthew Ahrens /* 12983b2aab18SMatthew Ahrens * The snapshots must all be in the same pool. 12993b2aab18SMatthew Ahrens * All-or-nothing: if there are any failures, nothing will be modified. 
13003b2aab18SMatthew Ahrens */ 13013b2aab18SMatthew Ahrens int 13023b2aab18SMatthew Ahrens dsl_dataset_snapshot(nvlist_t *snaps, nvlist_t *props, nvlist_t *errors) 130319b94df9SMatthew Ahrens { 13043b2aab18SMatthew Ahrens dsl_dataset_snapshot_arg_t ddsa; 13053b2aab18SMatthew Ahrens nvpair_t *pair; 13063b2aab18SMatthew Ahrens boolean_t needsuspend; 13073b2aab18SMatthew Ahrens int error; 13083b2aab18SMatthew Ahrens spa_t *spa; 13093b2aab18SMatthew Ahrens char *firstname; 13103b2aab18SMatthew Ahrens nvlist_t *suspended = NULL; 131119b94df9SMatthew Ahrens 13123b2aab18SMatthew Ahrens pair = nvlist_next_nvpair(snaps, NULL); 13133b2aab18SMatthew Ahrens if (pair == NULL) 13143b2aab18SMatthew Ahrens return (0); 13153b2aab18SMatthew Ahrens firstname = nvpair_name(pair); 13163b2aab18SMatthew Ahrens 13173b2aab18SMatthew Ahrens error = spa_open(firstname, &spa, FTAG); 13183b2aab18SMatthew Ahrens if (error != 0) 13193b2aab18SMatthew Ahrens return (error); 13203b2aab18SMatthew Ahrens needsuspend = (spa_version(spa) < SPA_VERSION_FAST_SNAP); 13213b2aab18SMatthew Ahrens spa_close(spa, FTAG); 13223b2aab18SMatthew Ahrens 13233b2aab18SMatthew Ahrens if (needsuspend) { 13243b2aab18SMatthew Ahrens suspended = fnvlist_alloc(); 13253b2aab18SMatthew Ahrens for (pair = nvlist_next_nvpair(snaps, NULL); pair != NULL; 13263b2aab18SMatthew Ahrens pair = nvlist_next_nvpair(snaps, pair)) { 13273b2aab18SMatthew Ahrens char fsname[MAXNAMELEN]; 13283b2aab18SMatthew Ahrens char *snapname = nvpair_name(pair); 13293b2aab18SMatthew Ahrens char *atp; 13303b2aab18SMatthew Ahrens void *cookie; 13313b2aab18SMatthew Ahrens 13323b2aab18SMatthew Ahrens atp = strchr(snapname, '@'); 13333b2aab18SMatthew Ahrens if (atp == NULL) { 1334be6fd75aSMatthew Ahrens error = SET_ERROR(EINVAL); 13353b2aab18SMatthew Ahrens break; 13363b2aab18SMatthew Ahrens } 13373b2aab18SMatthew Ahrens (void) strlcpy(fsname, snapname, atp - snapname + 1); 13383b2aab18SMatthew Ahrens 13393b2aab18SMatthew Ahrens error = zil_suspend(fsname, 
&cookie); 13403b2aab18SMatthew Ahrens if (error != 0) 13413b2aab18SMatthew Ahrens break; 13423b2aab18SMatthew Ahrens fnvlist_add_uint64(suspended, fsname, 13433b2aab18SMatthew Ahrens (uintptr_t)cookie); 13443b2aab18SMatthew Ahrens } 13453b2aab18SMatthew Ahrens } 13463b2aab18SMatthew Ahrens 13473b2aab18SMatthew Ahrens ddsa.ddsa_snaps = snaps; 13483b2aab18SMatthew Ahrens ddsa.ddsa_props = props; 13493b2aab18SMatthew Ahrens ddsa.ddsa_errors = errors; 1350a2afb611SJerry Jelinek ddsa.ddsa_cr = CRED(); 13513b2aab18SMatthew Ahrens 13523b2aab18SMatthew Ahrens if (error == 0) { 13533b2aab18SMatthew Ahrens error = dsl_sync_task(firstname, dsl_dataset_snapshot_check, 13543b2aab18SMatthew Ahrens dsl_dataset_snapshot_sync, &ddsa, 1355*7d46dc6cSMatthew Ahrens fnvlist_num_pairs(snaps) * 3, ZFS_SPACE_CHECK_NORMAL); 13563b2aab18SMatthew Ahrens } 13573b2aab18SMatthew Ahrens 13583b2aab18SMatthew Ahrens if (suspended != NULL) { 13593b2aab18SMatthew Ahrens for (pair = nvlist_next_nvpair(suspended, NULL); pair != NULL; 13603b2aab18SMatthew Ahrens pair = nvlist_next_nvpair(suspended, pair)) { 13613b2aab18SMatthew Ahrens zil_resume((void *)(uintptr_t) 13623b2aab18SMatthew Ahrens fnvpair_value_uint64(pair)); 13633b2aab18SMatthew Ahrens } 13643b2aab18SMatthew Ahrens fnvlist_free(suspended); 13653b2aab18SMatthew Ahrens } 13663b2aab18SMatthew Ahrens 13673b2aab18SMatthew Ahrens return (error); 13683b2aab18SMatthew Ahrens } 13693b2aab18SMatthew Ahrens 13703b2aab18SMatthew Ahrens typedef struct dsl_dataset_snapshot_tmp_arg { 13713b2aab18SMatthew Ahrens const char *ddsta_fsname; 13723b2aab18SMatthew Ahrens const char *ddsta_snapname; 13733b2aab18SMatthew Ahrens minor_t ddsta_cleanup_minor; 13743b2aab18SMatthew Ahrens const char *ddsta_htag; 13753b2aab18SMatthew Ahrens } dsl_dataset_snapshot_tmp_arg_t; 13763b2aab18SMatthew Ahrens 13773b2aab18SMatthew Ahrens static int 13783b2aab18SMatthew Ahrens dsl_dataset_snapshot_tmp_check(void *arg, dmu_tx_t *tx) 13793b2aab18SMatthew Ahrens { 
13803b2aab18SMatthew Ahrens dsl_dataset_snapshot_tmp_arg_t *ddsta = arg; 13813b2aab18SMatthew Ahrens dsl_pool_t *dp = dmu_tx_pool(tx); 13823b2aab18SMatthew Ahrens dsl_dataset_t *ds; 13833b2aab18SMatthew Ahrens int error; 13843b2aab18SMatthew Ahrens 13853b2aab18SMatthew Ahrens error = dsl_dataset_hold(dp, ddsta->ddsta_fsname, FTAG, &ds); 13863b2aab18SMatthew Ahrens if (error != 0) 13873b2aab18SMatthew Ahrens return (error); 13883b2aab18SMatthew Ahrens 1389a2afb611SJerry Jelinek /* NULL cred means no limit check for tmp snapshot */ 1390ca48f36fSKeith M Wesolowski error = dsl_dataset_snapshot_check_impl(ds, ddsta->ddsta_snapname, 1391a2afb611SJerry Jelinek tx, B_FALSE, 0, NULL); 13923b2aab18SMatthew Ahrens if (error != 0) { 13933b2aab18SMatthew Ahrens dsl_dataset_rele(ds, FTAG); 13943b2aab18SMatthew Ahrens return (error); 13953b2aab18SMatthew Ahrens } 13963b2aab18SMatthew Ahrens 13973b2aab18SMatthew Ahrens if (spa_version(dp->dp_spa) < SPA_VERSION_USERREFS) { 13983b2aab18SMatthew Ahrens dsl_dataset_rele(ds, FTAG); 1399be6fd75aSMatthew Ahrens return (SET_ERROR(ENOTSUP)); 14003b2aab18SMatthew Ahrens } 14013b2aab18SMatthew Ahrens error = dsl_dataset_user_hold_check_one(NULL, ddsta->ddsta_htag, 14023b2aab18SMatthew Ahrens B_TRUE, tx); 14033b2aab18SMatthew Ahrens if (error != 0) { 14043b2aab18SMatthew Ahrens dsl_dataset_rele(ds, FTAG); 14053b2aab18SMatthew Ahrens return (error); 14063b2aab18SMatthew Ahrens } 14073b2aab18SMatthew Ahrens 14083b2aab18SMatthew Ahrens dsl_dataset_rele(ds, FTAG); 14093b2aab18SMatthew Ahrens return (0); 14103b2aab18SMatthew Ahrens } 14113b2aab18SMatthew Ahrens 14123b2aab18SMatthew Ahrens static void 14133b2aab18SMatthew Ahrens dsl_dataset_snapshot_tmp_sync(void *arg, dmu_tx_t *tx) 14143b2aab18SMatthew Ahrens { 14153b2aab18SMatthew Ahrens dsl_dataset_snapshot_tmp_arg_t *ddsta = arg; 14163b2aab18SMatthew Ahrens dsl_pool_t *dp = dmu_tx_pool(tx); 14173b2aab18SMatthew Ahrens dsl_dataset_t *ds; 14183b2aab18SMatthew Ahrens 14193b2aab18SMatthew Ahrens 
VERIFY0(dsl_dataset_hold(dp, ddsta->ddsta_fsname, FTAG, &ds)); 14203b2aab18SMatthew Ahrens 14213b2aab18SMatthew Ahrens dsl_dataset_snapshot_sync_impl(ds, ddsta->ddsta_snapname, tx); 14223b2aab18SMatthew Ahrens dsl_dataset_user_hold_sync_one(ds->ds_prev, ddsta->ddsta_htag, 14233b2aab18SMatthew Ahrens ddsta->ddsta_cleanup_minor, gethrestime_sec(), tx); 14243b2aab18SMatthew Ahrens dsl_destroy_snapshot_sync_impl(ds->ds_prev, B_TRUE, tx); 14253b2aab18SMatthew Ahrens 14263b2aab18SMatthew Ahrens dsl_dataset_rele(ds, FTAG); 14273b2aab18SMatthew Ahrens } 14283b2aab18SMatthew Ahrens 14293b2aab18SMatthew Ahrens int 14303b2aab18SMatthew Ahrens dsl_dataset_snapshot_tmp(const char *fsname, const char *snapname, 14313b2aab18SMatthew Ahrens minor_t cleanup_minor, const char *htag) 14323b2aab18SMatthew Ahrens { 14333b2aab18SMatthew Ahrens dsl_dataset_snapshot_tmp_arg_t ddsta; 14343b2aab18SMatthew Ahrens int error; 14353b2aab18SMatthew Ahrens spa_t *spa; 14363b2aab18SMatthew Ahrens boolean_t needsuspend; 14373b2aab18SMatthew Ahrens void *cookie; 14383b2aab18SMatthew Ahrens 14393b2aab18SMatthew Ahrens ddsta.ddsta_fsname = fsname; 14403b2aab18SMatthew Ahrens ddsta.ddsta_snapname = snapname; 14413b2aab18SMatthew Ahrens ddsta.ddsta_cleanup_minor = cleanup_minor; 14423b2aab18SMatthew Ahrens ddsta.ddsta_htag = htag; 14433b2aab18SMatthew Ahrens 14443b2aab18SMatthew Ahrens error = spa_open(fsname, &spa, FTAG); 14453b2aab18SMatthew Ahrens if (error != 0) 14463b2aab18SMatthew Ahrens return (error); 14473b2aab18SMatthew Ahrens needsuspend = (spa_version(spa) < SPA_VERSION_FAST_SNAP); 14483b2aab18SMatthew Ahrens spa_close(spa, FTAG); 14493b2aab18SMatthew Ahrens 14503b2aab18SMatthew Ahrens if (needsuspend) { 14513b2aab18SMatthew Ahrens error = zil_suspend(fsname, &cookie); 14523b2aab18SMatthew Ahrens if (error != 0) 14533b2aab18SMatthew Ahrens return (error); 14543b2aab18SMatthew Ahrens } 14553b2aab18SMatthew Ahrens 14563b2aab18SMatthew Ahrens error = dsl_sync_task(fsname, 
dsl_dataset_snapshot_tmp_check, 1457*7d46dc6cSMatthew Ahrens dsl_dataset_snapshot_tmp_sync, &ddsta, 3, ZFS_SPACE_CHECK_RESERVED); 14583b2aab18SMatthew Ahrens 14593b2aab18SMatthew Ahrens if (needsuspend) 14603b2aab18SMatthew Ahrens zil_resume(cookie); 14613b2aab18SMatthew Ahrens return (error); 14623b2aab18SMatthew Ahrens } 14633b2aab18SMatthew Ahrens 14643b2aab18SMatthew Ahrens 14653b2aab18SMatthew Ahrens void 14663b2aab18SMatthew Ahrens dsl_dataset_sync(dsl_dataset_t *ds, zio_t *zio, dmu_tx_t *tx) 14673b2aab18SMatthew Ahrens { 14683b2aab18SMatthew Ahrens ASSERT(dmu_tx_is_syncing(tx)); 14693b2aab18SMatthew Ahrens ASSERT(ds->ds_objset != NULL); 14703b2aab18SMatthew Ahrens ASSERT(ds->ds_phys->ds_next_snap_obj == 0); 14713b2aab18SMatthew Ahrens 14723b2aab18SMatthew Ahrens /* 14733b2aab18SMatthew Ahrens * in case we had to change ds_fsid_guid when we opened it, 14743b2aab18SMatthew Ahrens * sync it out now. 14753b2aab18SMatthew Ahrens */ 14763b2aab18SMatthew Ahrens dmu_buf_will_dirty(ds->ds_dbuf, tx); 14773b2aab18SMatthew Ahrens ds->ds_phys->ds_fsid_guid = ds->ds_fsid_guid; 14783b2aab18SMatthew Ahrens 14793b2aab18SMatthew Ahrens dmu_objset_sync(ds->ds_objset, zio, tx); 14803b2aab18SMatthew Ahrens } 14813b2aab18SMatthew Ahrens 14823b2aab18SMatthew Ahrens static void 14833b2aab18SMatthew Ahrens get_clones_stat(dsl_dataset_t *ds, nvlist_t *nv) 14843b2aab18SMatthew Ahrens { 14853b2aab18SMatthew Ahrens uint64_t count = 0; 14863b2aab18SMatthew Ahrens objset_t *mos = ds->ds_dir->dd_pool->dp_meta_objset; 14873b2aab18SMatthew Ahrens zap_cursor_t zc; 14883b2aab18SMatthew Ahrens zap_attribute_t za; 14893b2aab18SMatthew Ahrens nvlist_t *propval = fnvlist_alloc(); 14903b2aab18SMatthew Ahrens nvlist_t *val = fnvlist_alloc(); 14913b2aab18SMatthew Ahrens 14923b2aab18SMatthew Ahrens ASSERT(dsl_pool_config_held(ds->ds_dir->dd_pool)); 149319b94df9SMatthew Ahrens 149419b94df9SMatthew Ahrens /* 14953b2aab18SMatthew Ahrens * There may be missing entries in ds_next_clones_obj 
149619b94df9SMatthew Ahrens * due to a bug in a previous version of the code. 149719b94df9SMatthew Ahrens * Only trust it if it has the right number of entries. 149819b94df9SMatthew Ahrens */ 149919b94df9SMatthew Ahrens if (ds->ds_phys->ds_next_clones_obj != 0) { 150003d1795fSAlexander Stetsenko VERIFY0(zap_count(mos, ds->ds_phys->ds_next_clones_obj, 150119b94df9SMatthew Ahrens &count)); 150219b94df9SMatthew Ahrens } 15033b2aab18SMatthew Ahrens if (count != ds->ds_phys->ds_num_children - 1) 150419b94df9SMatthew Ahrens goto fail; 150519b94df9SMatthew Ahrens for (zap_cursor_init(&zc, mos, ds->ds_phys->ds_next_clones_obj); 150619b94df9SMatthew Ahrens zap_cursor_retrieve(&zc, &za) == 0; 150719b94df9SMatthew Ahrens zap_cursor_advance(&zc)) { 150819b94df9SMatthew Ahrens dsl_dataset_t *clone; 150919b94df9SMatthew Ahrens char buf[ZFS_MAXNAMELEN]; 15103b2aab18SMatthew Ahrens VERIFY0(dsl_dataset_hold_obj(ds->ds_dir->dd_pool, 15113b2aab18SMatthew Ahrens za.za_first_integer, FTAG, &clone)); 151219b94df9SMatthew Ahrens dsl_dir_name(clone->ds_dir, buf); 15133b2aab18SMatthew Ahrens fnvlist_add_boolean(val, buf); 151419b94df9SMatthew Ahrens dsl_dataset_rele(clone, FTAG); 151519b94df9SMatthew Ahrens } 151619b94df9SMatthew Ahrens zap_cursor_fini(&zc); 15173b2aab18SMatthew Ahrens fnvlist_add_nvlist(propval, ZPROP_VALUE, val); 15183b2aab18SMatthew Ahrens fnvlist_add_nvlist(nv, zfs_prop_to_name(ZFS_PROP_CLONES), propval); 151919b94df9SMatthew Ahrens fail: 152019b94df9SMatthew Ahrens nvlist_free(val); 152119b94df9SMatthew Ahrens nvlist_free(propval); 152219b94df9SMatthew Ahrens } 152319b94df9SMatthew Ahrens 1524fa9e4066Sahrens void 1525a2eea2e1Sahrens dsl_dataset_stats(dsl_dataset_t *ds, nvlist_t *nv) 1526fa9e4066Sahrens { 15273b2aab18SMatthew Ahrens dsl_pool_t *dp = ds->ds_dir->dd_pool; 1528187d6ac0SMatt Ahrens uint64_t refd, avail, uobjs, aobjs, ratio; 1529a9799022Sck 15303b2aab18SMatthew Ahrens ASSERT(dsl_pool_config_held(dp)); 15313b2aab18SMatthew Ahrens 15324445fffbSMatthew Ahrens 
ratio = ds->ds_phys->ds_compressed_bytes == 0 ? 100 : 15334445fffbSMatthew Ahrens (ds->ds_phys->ds_uncompressed_bytes * 100 / 15344445fffbSMatthew Ahrens ds->ds_phys->ds_compressed_bytes); 15354445fffbSMatthew Ahrens 15364445fffbSMatthew Ahrens dsl_prop_nvlist_add_uint64(nv, ZFS_PROP_REFRATIO, ratio); 153777372cb0SMatthew Ahrens dsl_prop_nvlist_add_uint64(nv, ZFS_PROP_LOGICALREFERENCED, 153877372cb0SMatthew Ahrens ds->ds_phys->ds_uncompressed_bytes); 15394445fffbSMatthew Ahrens 15404445fffbSMatthew Ahrens if (dsl_dataset_is_snapshot(ds)) { 15414445fffbSMatthew Ahrens dsl_prop_nvlist_add_uint64(nv, ZFS_PROP_COMPRESSRATIO, ratio); 15424445fffbSMatthew Ahrens dsl_prop_nvlist_add_uint64(nv, ZFS_PROP_USED, 15434445fffbSMatthew Ahrens ds->ds_phys->ds_unique_bytes); 15444445fffbSMatthew Ahrens get_clones_stat(ds, nv); 15454445fffbSMatthew Ahrens } else { 1546b461c746SMatthew Ahrens if (ds->ds_prev != NULL && ds->ds_prev != dp->dp_origin_snap) { 1547b461c746SMatthew Ahrens char buf[MAXNAMELEN]; 1548b461c746SMatthew Ahrens dsl_dataset_name(ds->ds_prev, buf); 1549b461c746SMatthew Ahrens dsl_prop_nvlist_add_string(nv, ZFS_PROP_PREV_SNAP, buf); 1550b461c746SMatthew Ahrens } 1551b461c746SMatthew Ahrens 15524445fffbSMatthew Ahrens dsl_dir_stats(ds->ds_dir, nv); 15534445fffbSMatthew Ahrens } 1554fa9e4066Sahrens 1555a9799022Sck dsl_dataset_space(ds, &refd, &avail, &uobjs, &aobjs); 1556a9799022Sck dsl_prop_nvlist_add_uint64(nv, ZFS_PROP_AVAILABLE, avail); 1557a9799022Sck dsl_prop_nvlist_add_uint64(nv, ZFS_PROP_REFERENCED, refd); 1558a9799022Sck 1559a2eea2e1Sahrens dsl_prop_nvlist_add_uint64(nv, ZFS_PROP_CREATION, 1560a2eea2e1Sahrens ds->ds_phys->ds_creation_time); 1561a2eea2e1Sahrens dsl_prop_nvlist_add_uint64(nv, ZFS_PROP_CREATETXG, 1562a2eea2e1Sahrens ds->ds_phys->ds_creation_txg); 1563a9799022Sck dsl_prop_nvlist_add_uint64(nv, ZFS_PROP_REFQUOTA, 1564a9799022Sck ds->ds_quota); 1565a9799022Sck dsl_prop_nvlist_add_uint64(nv, ZFS_PROP_REFRESERVATION, 1566a9799022Sck 
ds->ds_reserved); 1567c5904d13Seschrock dsl_prop_nvlist_add_uint64(nv, ZFS_PROP_GUID, 1568c5904d13Seschrock ds->ds_phys->ds_guid); 15691d713200SEric Schrock dsl_prop_nvlist_add_uint64(nv, ZFS_PROP_UNIQUE, 15703f9d6ad7SLin Ling ds->ds_phys->ds_unique_bytes); 15711d713200SEric Schrock dsl_prop_nvlist_add_uint64(nv, ZFS_PROP_OBJSETID, 15721d713200SEric Schrock ds->ds_object); 157392241e0bSTom Erickson dsl_prop_nvlist_add_uint64(nv, ZFS_PROP_USERREFS, 157492241e0bSTom Erickson ds->ds_userrefs); 1575842727c2SChris Kirby dsl_prop_nvlist_add_uint64(nv, ZFS_PROP_DEFER_DESTROY, 1576842727c2SChris Kirby DS_IS_DEFER_DESTROY(ds) ? 1 : 0); 1577fa9e4066Sahrens 157819b94df9SMatthew Ahrens if (ds->ds_phys->ds_prev_snap_obj != 0) { 157919b94df9SMatthew Ahrens uint64_t written, comp, uncomp; 158019b94df9SMatthew Ahrens dsl_pool_t *dp = ds->ds_dir->dd_pool; 158119b94df9SMatthew Ahrens dsl_dataset_t *prev; 158219b94df9SMatthew Ahrens 158319b94df9SMatthew Ahrens int err = dsl_dataset_hold_obj(dp, 158419b94df9SMatthew Ahrens ds->ds_phys->ds_prev_snap_obj, FTAG, &prev); 158519b94df9SMatthew Ahrens if (err == 0) { 158619b94df9SMatthew Ahrens err = dsl_dataset_space_written(prev, ds, &written, 158719b94df9SMatthew Ahrens &comp, &uncomp); 158819b94df9SMatthew Ahrens dsl_dataset_rele(prev, FTAG); 158919b94df9SMatthew Ahrens if (err == 0) { 159019b94df9SMatthew Ahrens dsl_prop_nvlist_add_uint64(nv, ZFS_PROP_WRITTEN, 159119b94df9SMatthew Ahrens written); 159219b94df9SMatthew Ahrens } 159319b94df9SMatthew Ahrens } 159419b94df9SMatthew Ahrens } 1595fa9e4066Sahrens } 1596fa9e4066Sahrens 1597a2eea2e1Sahrens void 1598a2eea2e1Sahrens dsl_dataset_fast_stat(dsl_dataset_t *ds, dmu_objset_stats_t *stat) 1599a2eea2e1Sahrens { 16003b2aab18SMatthew Ahrens dsl_pool_t *dp = ds->ds_dir->dd_pool; 16013b2aab18SMatthew Ahrens ASSERT(dsl_pool_config_held(dp)); 16023b2aab18SMatthew Ahrens 1603a2eea2e1Sahrens stat->dds_creation_txg = ds->ds_phys->ds_creation_txg; 1604a2eea2e1Sahrens stat->dds_inconsistent = 
ds->ds_phys->ds_flags & DS_FLAG_INCONSISTENT; 16053cb34c60Sahrens stat->dds_guid = ds->ds_phys->ds_guid; 16064445fffbSMatthew Ahrens stat->dds_origin[0] = '\0'; 16074445fffbSMatthew Ahrens if (dsl_dataset_is_snapshot(ds)) { 1608a2eea2e1Sahrens stat->dds_is_snapshot = B_TRUE; 1609a2eea2e1Sahrens stat->dds_num_clones = ds->ds_phys->ds_num_children - 1; 1610ebedde84SEric Taylor } else { 1611ebedde84SEric Taylor stat->dds_is_snapshot = B_FALSE; 1612ebedde84SEric Taylor stat->dds_num_clones = 0; 1613a2eea2e1Sahrens 16144445fffbSMatthew Ahrens if (dsl_dir_is_clone(ds->ds_dir)) { 16154445fffbSMatthew Ahrens dsl_dataset_t *ods; 1616a2eea2e1Sahrens 16173b2aab18SMatthew Ahrens VERIFY0(dsl_dataset_hold_obj(dp, 16184445fffbSMatthew Ahrens ds->ds_dir->dd_phys->dd_origin_obj, FTAG, &ods)); 16194445fffbSMatthew Ahrens dsl_dataset_name(ods, stat->dds_origin); 16203b2aab18SMatthew Ahrens dsl_dataset_rele(ods, FTAG); 16214445fffbSMatthew Ahrens } 1622a2eea2e1Sahrens } 1623a2eea2e1Sahrens } 1624a2eea2e1Sahrens 1625a2eea2e1Sahrens uint64_t 1626a2eea2e1Sahrens dsl_dataset_fsid_guid(dsl_dataset_t *ds) 1627a2eea2e1Sahrens { 162891ebeef5Sahrens return (ds->ds_fsid_guid); 1629a2eea2e1Sahrens } 1630a2eea2e1Sahrens 1631a2eea2e1Sahrens void 1632a2eea2e1Sahrens dsl_dataset_space(dsl_dataset_t *ds, 1633a2eea2e1Sahrens uint64_t *refdbytesp, uint64_t *availbytesp, 1634a2eea2e1Sahrens uint64_t *usedobjsp, uint64_t *availobjsp) 1635fa9e4066Sahrens { 1636ad135b5dSChristopher Siden *refdbytesp = ds->ds_phys->ds_referenced_bytes; 1637a2eea2e1Sahrens *availbytesp = dsl_dir_space_available(ds->ds_dir, NULL, 0, TRUE); 1638a9799022Sck if (ds->ds_reserved > ds->ds_phys->ds_unique_bytes) 1639a9799022Sck *availbytesp += ds->ds_reserved - ds->ds_phys->ds_unique_bytes; 1640a9799022Sck if (ds->ds_quota != 0) { 1641a9799022Sck /* 1642a9799022Sck * Adjust available bytes according to refquota 1643a9799022Sck */ 1644a9799022Sck if (*refdbytesp < ds->ds_quota) 1645a9799022Sck *availbytesp = MIN(*availbytesp, 
1646a9799022Sck ds->ds_quota - *refdbytesp); 1647a9799022Sck else 1648a9799022Sck *availbytesp = 0; 1649a9799022Sck } 16505d7b4d43SMatthew Ahrens *usedobjsp = BP_GET_FILL(&ds->ds_phys->ds_bp); 1651a2eea2e1Sahrens *availobjsp = DN_MAX_OBJECT - *usedobjsp; 1652fa9e4066Sahrens } 1653fa9e4066Sahrens 1654f18faf3fSek boolean_t 165534f2f8cfSMatthew Ahrens dsl_dataset_modified_since_snap(dsl_dataset_t *ds, dsl_dataset_t *snap) 1656f18faf3fSek { 1657f18faf3fSek dsl_pool_t *dp = ds->ds_dir->dd_pool; 1658f18faf3fSek 16593b2aab18SMatthew Ahrens ASSERT(dsl_pool_config_held(dp)); 166034f2f8cfSMatthew Ahrens if (snap == NULL) 1661f18faf3fSek return (B_FALSE); 1662f18faf3fSek if (ds->ds_phys->ds_bp.blk_birth > 166334f2f8cfSMatthew Ahrens snap->ds_phys->ds_creation_txg) { 166434f2f8cfSMatthew Ahrens objset_t *os, *os_snap; 16656e0cbcaaSMatthew Ahrens /* 16666e0cbcaaSMatthew Ahrens * It may be that only the ZIL differs, because it was 16676e0cbcaaSMatthew Ahrens * reset in the head. Don't count that as being 16686e0cbcaaSMatthew Ahrens * modified. 
16696e0cbcaaSMatthew Ahrens */ 16706e0cbcaaSMatthew Ahrens if (dmu_objset_from_ds(ds, &os) != 0) 16716e0cbcaaSMatthew Ahrens return (B_TRUE); 167234f2f8cfSMatthew Ahrens if (dmu_objset_from_ds(snap, &os_snap) != 0) 16736e0cbcaaSMatthew Ahrens return (B_TRUE); 16746e0cbcaaSMatthew Ahrens return (bcmp(&os->os_phys->os_meta_dnode, 167534f2f8cfSMatthew Ahrens &os_snap->os_phys->os_meta_dnode, 16766e0cbcaaSMatthew Ahrens sizeof (os->os_phys->os_meta_dnode)) != 0); 16776e0cbcaaSMatthew Ahrens } 1678f18faf3fSek return (B_FALSE); 1679f18faf3fSek } 1680f18faf3fSek 16813b2aab18SMatthew Ahrens typedef struct dsl_dataset_rename_snapshot_arg { 16823b2aab18SMatthew Ahrens const char *ddrsa_fsname; 16833b2aab18SMatthew Ahrens const char *ddrsa_oldsnapname; 16843b2aab18SMatthew Ahrens const char *ddrsa_newsnapname; 16853b2aab18SMatthew Ahrens boolean_t ddrsa_recursive; 16863b2aab18SMatthew Ahrens dmu_tx_t *ddrsa_tx; 16873b2aab18SMatthew Ahrens } dsl_dataset_rename_snapshot_arg_t; 16883b2aab18SMatthew Ahrens 16891d452cf5Sahrens /* ARGSUSED */ 1690fa9e4066Sahrens static int 16913b2aab18SMatthew Ahrens dsl_dataset_rename_snapshot_check_impl(dsl_pool_t *dp, 16923b2aab18SMatthew Ahrens dsl_dataset_t *hds, void *arg) 1693fa9e4066Sahrens { 16943b2aab18SMatthew Ahrens dsl_dataset_rename_snapshot_arg_t *ddrsa = arg; 16953b2aab18SMatthew Ahrens int error; 1696fa9e4066Sahrens uint64_t val; 1697fa9e4066Sahrens 16983b2aab18SMatthew Ahrens error = dsl_dataset_snap_lookup(hds, ddrsa->ddrsa_oldsnapname, &val); 16993b2aab18SMatthew Ahrens if (error != 0) { 17003b2aab18SMatthew Ahrens /* ignore nonexistent snapshots */ 17013b2aab18SMatthew Ahrens return (error == ENOENT ? 
0 : error); 17023b2aab18SMatthew Ahrens } 17031d452cf5Sahrens 17043b2aab18SMatthew Ahrens /* new name should not exist */ 17053b2aab18SMatthew Ahrens error = dsl_dataset_snap_lookup(hds, ddrsa->ddrsa_newsnapname, &val); 17063b2aab18SMatthew Ahrens if (error == 0) 1707be6fd75aSMatthew Ahrens error = SET_ERROR(EEXIST); 17083b2aab18SMatthew Ahrens else if (error == ENOENT) 17093b2aab18SMatthew Ahrens error = 0; 1710cdf5b4caSmmusante 1711cdf5b4caSmmusante /* dataset name + 1 for the "@" + the new snapshot name must fit */ 17123b2aab18SMatthew Ahrens if (dsl_dir_namelen(hds->ds_dir) + 1 + 17133b2aab18SMatthew Ahrens strlen(ddrsa->ddrsa_newsnapname) >= MAXNAMELEN) 1714be6fd75aSMatthew Ahrens error = SET_ERROR(ENAMETOOLONG); 1715cdf5b4caSmmusante 17163b2aab18SMatthew Ahrens return (error); 17171d452cf5Sahrens } 1718fa9e4066Sahrens 17193b2aab18SMatthew Ahrens static int 17203b2aab18SMatthew Ahrens dsl_dataset_rename_snapshot_check(void *arg, dmu_tx_t *tx) 17211d452cf5Sahrens { 17223b2aab18SMatthew Ahrens dsl_dataset_rename_snapshot_arg_t *ddrsa = arg; 17233b2aab18SMatthew Ahrens dsl_pool_t *dp = dmu_tx_pool(tx); 17241d452cf5Sahrens dsl_dataset_t *hds; 17253b2aab18SMatthew Ahrens int error; 1726fa9e4066Sahrens 17273b2aab18SMatthew Ahrens error = dsl_dataset_hold(dp, ddrsa->ddrsa_fsname, FTAG, &hds); 17283b2aab18SMatthew Ahrens if (error != 0) 17293b2aab18SMatthew Ahrens return (error); 1730fa9e4066Sahrens 17313b2aab18SMatthew Ahrens if (ddrsa->ddrsa_recursive) { 17323b2aab18SMatthew Ahrens error = dmu_objset_find_dp(dp, hds->ds_dir->dd_object, 17333b2aab18SMatthew Ahrens dsl_dataset_rename_snapshot_check_impl, ddrsa, 17343b2aab18SMatthew Ahrens DS_FIND_CHILDREN); 17353b2aab18SMatthew Ahrens } else { 17363b2aab18SMatthew Ahrens error = dsl_dataset_rename_snapshot_check_impl(dp, hds, ddrsa); 17373b2aab18SMatthew Ahrens } 1738745cd3c5Smaybee dsl_dataset_rele(hds, FTAG); 17393b2aab18SMatthew Ahrens return (error); 1740fa9e4066Sahrens } 1741fa9e4066Sahrens 1742cdf5b4caSmmusante 
static int 17433b2aab18SMatthew Ahrens dsl_dataset_rename_snapshot_sync_impl(dsl_pool_t *dp, 17443b2aab18SMatthew Ahrens dsl_dataset_t *hds, void *arg) 1745cdf5b4caSmmusante { 17463b2aab18SMatthew Ahrens dsl_dataset_rename_snapshot_arg_t *ddrsa = arg; 17473b2aab18SMatthew Ahrens dsl_dataset_t *ds; 17483b2aab18SMatthew Ahrens uint64_t val; 17493b2aab18SMatthew Ahrens dmu_tx_t *tx = ddrsa->ddrsa_tx; 17503b2aab18SMatthew Ahrens int error; 1751ecd6cf80Smarks 17523b2aab18SMatthew Ahrens error = dsl_dataset_snap_lookup(hds, ddrsa->ddrsa_oldsnapname, &val); 17533b2aab18SMatthew Ahrens ASSERT(error == 0 || error == ENOENT); 17543b2aab18SMatthew Ahrens if (error == ENOENT) { 17553b2aab18SMatthew Ahrens /* ignore nonexistent snapshots */ 17563b2aab18SMatthew Ahrens return (0); 1757ecd6cf80Smarks } 1758ecd6cf80Smarks 17593b2aab18SMatthew Ahrens VERIFY0(dsl_dataset_hold_obj(dp, val, FTAG, &ds)); 17603b2aab18SMatthew Ahrens 17613b2aab18SMatthew Ahrens /* log before we change the name */ 17623b2aab18SMatthew Ahrens spa_history_log_internal_ds(ds, "rename", tx, 17633b2aab18SMatthew Ahrens "-> @%s", ddrsa->ddrsa_newsnapname); 1764cdf5b4caSmmusante 1765a2afb611SJerry Jelinek VERIFY0(dsl_dataset_snap_remove(hds, ddrsa->ddrsa_oldsnapname, tx, 1766a2afb611SJerry Jelinek B_FALSE)); 17673b2aab18SMatthew Ahrens mutex_enter(&ds->ds_lock); 17683b2aab18SMatthew Ahrens (void) strcpy(ds->ds_snapname, ddrsa->ddrsa_newsnapname); 17693b2aab18SMatthew Ahrens mutex_exit(&ds->ds_lock); 17703b2aab18SMatthew Ahrens VERIFY0(zap_add(dp->dp_meta_objset, hds->ds_phys->ds_snapnames_zapobj, 17713b2aab18SMatthew Ahrens ds->ds_snapname, 8, 1, &ds->ds_object, tx)); 1772cdf5b4caSmmusante 17733b2aab18SMatthew Ahrens dsl_dataset_rele(ds, FTAG); 1774cdf5b4caSmmusante return (0); 1775cdf5b4caSmmusante } 1776cdf5b4caSmmusante 17773b2aab18SMatthew Ahrens static void 17783b2aab18SMatthew Ahrens dsl_dataset_rename_snapshot_sync(void *arg, dmu_tx_t *tx) 1779cdf5b4caSmmusante { 17803b2aab18SMatthew Ahrens 
dsl_dataset_rename_snapshot_arg_t *ddrsa = arg; 17813b2aab18SMatthew Ahrens dsl_pool_t *dp = dmu_tx_pool(tx); 17823b2aab18SMatthew Ahrens dsl_dataset_t *hds; 1783cdf5b4caSmmusante 17843b2aab18SMatthew Ahrens VERIFY0(dsl_dataset_hold(dp, ddrsa->ddrsa_fsname, FTAG, &hds)); 17853b2aab18SMatthew Ahrens ddrsa->ddrsa_tx = tx; 17863b2aab18SMatthew Ahrens if (ddrsa->ddrsa_recursive) { 17873b2aab18SMatthew Ahrens VERIFY0(dmu_objset_find_dp(dp, hds->ds_dir->dd_object, 17883b2aab18SMatthew Ahrens dsl_dataset_rename_snapshot_sync_impl, ddrsa, 17893b2aab18SMatthew Ahrens DS_FIND_CHILDREN)); 17903b2aab18SMatthew Ahrens } else { 17913b2aab18SMatthew Ahrens VERIFY0(dsl_dataset_rename_snapshot_sync_impl(dp, hds, ddrsa)); 1792cdf5b4caSmmusante } 17933b2aab18SMatthew Ahrens dsl_dataset_rele(hds, FTAG); 1794cdf5b4caSmmusante } 1795cdf5b4caSmmusante 17963b2aab18SMatthew Ahrens int 17973b2aab18SMatthew Ahrens dsl_dataset_rename_snapshot(const char *fsname, 17983b2aab18SMatthew Ahrens const char *oldsnapname, const char *newsnapname, boolean_t recursive) 17993a5a36beSmmusante { 18003b2aab18SMatthew Ahrens dsl_dataset_rename_snapshot_arg_t ddrsa; 18013a5a36beSmmusante 18023b2aab18SMatthew Ahrens ddrsa.ddrsa_fsname = fsname; 18033b2aab18SMatthew Ahrens ddrsa.ddrsa_oldsnapname = oldsnapname; 18043b2aab18SMatthew Ahrens ddrsa.ddrsa_newsnapname = newsnapname; 18053b2aab18SMatthew Ahrens ddrsa.ddrsa_recursive = recursive; 18063a5a36beSmmusante 18073b2aab18SMatthew Ahrens return (dsl_sync_task(fsname, dsl_dataset_rename_snapshot_check, 1808*7d46dc6cSMatthew Ahrens dsl_dataset_rename_snapshot_sync, &ddrsa, 1809*7d46dc6cSMatthew Ahrens 1, ZFS_SPACE_CHECK_RESERVED)); 18103a5a36beSmmusante } 18113a5a36beSmmusante 181291948b51SKeith M Wesolowski /* 181391948b51SKeith M Wesolowski * If we're doing an ownership handoff, we need to make sure that there is 181491948b51SKeith M Wesolowski * only one long hold on the dataset. 
We're not allowed to change anything here 181591948b51SKeith M Wesolowski * so we don't permanently release the long hold or regular hold here. We want 181691948b51SKeith M Wesolowski * to do this only when syncing to avoid the dataset unexpectedly going away 181791948b51SKeith M Wesolowski * when we release the long hold. 181891948b51SKeith M Wesolowski */ 181991948b51SKeith M Wesolowski static int 182091948b51SKeith M Wesolowski dsl_dataset_handoff_check(dsl_dataset_t *ds, void *owner, dmu_tx_t *tx) 182191948b51SKeith M Wesolowski { 182291948b51SKeith M Wesolowski boolean_t held; 182391948b51SKeith M Wesolowski 182491948b51SKeith M Wesolowski if (!dmu_tx_is_syncing(tx)) 182591948b51SKeith M Wesolowski return (0); 182691948b51SKeith M Wesolowski 182791948b51SKeith M Wesolowski if (owner != NULL) { 182891948b51SKeith M Wesolowski VERIFY3P(ds->ds_owner, ==, owner); 182991948b51SKeith M Wesolowski dsl_dataset_long_rele(ds, owner); 183091948b51SKeith M Wesolowski } 183191948b51SKeith M Wesolowski 183291948b51SKeith M Wesolowski held = dsl_dataset_long_held(ds); 183391948b51SKeith M Wesolowski 183491948b51SKeith M Wesolowski if (owner != NULL) 183591948b51SKeith M Wesolowski dsl_dataset_long_hold(ds, owner); 183691948b51SKeith M Wesolowski 183791948b51SKeith M Wesolowski if (held) 183891948b51SKeith M Wesolowski return (SET_ERROR(EBUSY)); 183991948b51SKeith M Wesolowski 184091948b51SKeith M Wesolowski return (0); 184191948b51SKeith M Wesolowski } 184291948b51SKeith M Wesolowski 184391948b51SKeith M Wesolowski typedef struct dsl_dataset_rollback_arg { 184491948b51SKeith M Wesolowski const char *ddra_fsname; 184591948b51SKeith M Wesolowski void *ddra_owner; 1846a7027df1SMatthew Ahrens nvlist_t *ddra_result; 184791948b51SKeith M Wesolowski } dsl_dataset_rollback_arg_t; 184891948b51SKeith M Wesolowski 18493b2aab18SMatthew Ahrens static int 18503b2aab18SMatthew Ahrens dsl_dataset_rollback_check(void *arg, dmu_tx_t *tx) 1851fa9e4066Sahrens { 185291948b51SKeith M Wesolowski 
dsl_dataset_rollback_arg_t *ddra = arg; 18533b2aab18SMatthew Ahrens dsl_pool_t *dp = dmu_tx_pool(tx); 18541d452cf5Sahrens dsl_dataset_t *ds; 18553b2aab18SMatthew Ahrens int64_t unused_refres_delta; 18563b2aab18SMatthew Ahrens int error; 1857fa9e4066Sahrens 185891948b51SKeith M Wesolowski error = dsl_dataset_hold(dp, ddra->ddra_fsname, FTAG, &ds); 18593b2aab18SMatthew Ahrens if (error != 0) 18603b2aab18SMatthew Ahrens return (error); 1861370c1af0SSanjeev Bagewadi 18623b2aab18SMatthew Ahrens /* must not be a snapshot */ 18633b2aab18SMatthew Ahrens if (dsl_dataset_is_snapshot(ds)) { 18643b2aab18SMatthew Ahrens dsl_dataset_rele(ds, FTAG); 1865be6fd75aSMatthew Ahrens return (SET_ERROR(EINVAL)); 18663b2aab18SMatthew Ahrens } 18673a5a36beSmmusante 18683b2aab18SMatthew Ahrens /* must have a most recent snapshot */ 18693b2aab18SMatthew Ahrens if (ds->ds_phys->ds_prev_snap_txg < TXG_INITIAL) { 18703b2aab18SMatthew Ahrens dsl_dataset_rele(ds, FTAG); 1871be6fd75aSMatthew Ahrens return (SET_ERROR(EINVAL)); 18723b2aab18SMatthew Ahrens } 18733a5a36beSmmusante 187478f17100SMatthew Ahrens /* must not have any bookmarks after the most recent snapshot */ 187578f17100SMatthew Ahrens nvlist_t *proprequest = fnvlist_alloc(); 187678f17100SMatthew Ahrens fnvlist_add_boolean(proprequest, zfs_prop_to_name(ZFS_PROP_CREATETXG)); 187778f17100SMatthew Ahrens nvlist_t *bookmarks = fnvlist_alloc(); 187878f17100SMatthew Ahrens error = dsl_get_bookmarks_impl(ds, proprequest, bookmarks); 187978f17100SMatthew Ahrens fnvlist_free(proprequest); 188078f17100SMatthew Ahrens if (error != 0) 188178f17100SMatthew Ahrens return (error); 188278f17100SMatthew Ahrens for (nvpair_t *pair = nvlist_next_nvpair(bookmarks, NULL); 188378f17100SMatthew Ahrens pair != NULL; pair = nvlist_next_nvpair(bookmarks, pair)) { 188478f17100SMatthew Ahrens nvlist_t *valuenv = 188578f17100SMatthew Ahrens fnvlist_lookup_nvlist(fnvpair_value_nvlist(pair), 188678f17100SMatthew Ahrens zfs_prop_to_name(ZFS_PROP_CREATETXG)); 
188778f17100SMatthew Ahrens uint64_t createtxg = fnvlist_lookup_uint64(valuenv, "value"); 188878f17100SMatthew Ahrens if (createtxg > ds->ds_phys->ds_prev_snap_txg) { 188978f17100SMatthew Ahrens fnvlist_free(bookmarks); 189078f17100SMatthew Ahrens dsl_dataset_rele(ds, FTAG); 189178f17100SMatthew Ahrens return (SET_ERROR(EEXIST)); 189278f17100SMatthew Ahrens } 189378f17100SMatthew Ahrens } 189478f17100SMatthew Ahrens fnvlist_free(bookmarks); 189578f17100SMatthew Ahrens 189691948b51SKeith M Wesolowski error = dsl_dataset_handoff_check(ds, ddra->ddra_owner, tx); 189791948b51SKeith M Wesolowski if (error != 0) { 18983b2aab18SMatthew Ahrens dsl_dataset_rele(ds, FTAG); 189991948b51SKeith M Wesolowski return (error); 19003b2aab18SMatthew Ahrens } 19013b2aab18SMatthew Ahrens 19023b2aab18SMatthew Ahrens /* 19033b2aab18SMatthew Ahrens * Check if the snap we are rolling back to uses more than 19043b2aab18SMatthew Ahrens * the refquota. 19053b2aab18SMatthew Ahrens */ 19063b2aab18SMatthew Ahrens if (ds->ds_quota != 0 && 19073b2aab18SMatthew Ahrens ds->ds_prev->ds_phys->ds_referenced_bytes > ds->ds_quota) { 19083b2aab18SMatthew Ahrens dsl_dataset_rele(ds, FTAG); 1909be6fd75aSMatthew Ahrens return (SET_ERROR(EDQUOT)); 1910fa9e4066Sahrens } 1911370c1af0SSanjeev Bagewadi 19123b2aab18SMatthew Ahrens /* 19133b2aab18SMatthew Ahrens * When we do the clone swap, we will temporarily use more space 19143b2aab18SMatthew Ahrens * due to the refreservation (the head will no longer have any 19153b2aab18SMatthew Ahrens * unique space, so the entire amount of the refreservation will need 19163b2aab18SMatthew Ahrens * to be free). We will immediately destroy the clone, freeing 19173b2aab18SMatthew Ahrens * this space, but the freeing happens over many txg's. 
19183b2aab18SMatthew Ahrens */ 19193b2aab18SMatthew Ahrens unused_refres_delta = (int64_t)MIN(ds->ds_reserved, 19203b2aab18SMatthew Ahrens ds->ds_phys->ds_unique_bytes); 19213b2aab18SMatthew Ahrens 19223b2aab18SMatthew Ahrens if (unused_refres_delta > 0 && 19233b2aab18SMatthew Ahrens unused_refres_delta > 19243b2aab18SMatthew Ahrens dsl_dir_space_available(ds->ds_dir, NULL, 0, TRUE)) { 19253b2aab18SMatthew Ahrens dsl_dataset_rele(ds, FTAG); 1926be6fd75aSMatthew Ahrens return (SET_ERROR(ENOSPC)); 1927fa9e4066Sahrens } 1928fa9e4066Sahrens 19293b2aab18SMatthew Ahrens dsl_dataset_rele(ds, FTAG); 19303b2aab18SMatthew Ahrens return (0); 19313b2aab18SMatthew Ahrens } 19321d452cf5Sahrens 19333b2aab18SMatthew Ahrens static void 19343b2aab18SMatthew Ahrens dsl_dataset_rollback_sync(void *arg, dmu_tx_t *tx) 19353b2aab18SMatthew Ahrens { 193691948b51SKeith M Wesolowski dsl_dataset_rollback_arg_t *ddra = arg; 19373b2aab18SMatthew Ahrens dsl_pool_t *dp = dmu_tx_pool(tx); 19383b2aab18SMatthew Ahrens dsl_dataset_t *ds, *clone; 19393b2aab18SMatthew Ahrens uint64_t cloneobj; 1940a7027df1SMatthew Ahrens char namebuf[ZFS_MAXNAMELEN]; 19411d452cf5Sahrens 194291948b51SKeith M Wesolowski VERIFY0(dsl_dataset_hold(dp, ddra->ddra_fsname, FTAG, &ds)); 19431d452cf5Sahrens 1944a7027df1SMatthew Ahrens dsl_dataset_name(ds->ds_prev, namebuf); 1945a7027df1SMatthew Ahrens fnvlist_add_string(ddra->ddra_result, "target", namebuf); 1946a7027df1SMatthew Ahrens 19473b2aab18SMatthew Ahrens cloneobj = dsl_dataset_create_sync(ds->ds_dir, "%rollback", 19483b2aab18SMatthew Ahrens ds->ds_prev, DS_CREATE_FLAG_NODIRTY, kcred, tx); 19491d452cf5Sahrens 19503b2aab18SMatthew Ahrens VERIFY0(dsl_dataset_hold_obj(dp, cloneobj, FTAG, &clone)); 19511d452cf5Sahrens 19523b2aab18SMatthew Ahrens dsl_dataset_clone_swap_sync_impl(clone, ds, tx); 19533b2aab18SMatthew Ahrens dsl_dataset_zero_zil(ds, tx); 19543b2aab18SMatthew Ahrens 19553b2aab18SMatthew Ahrens dsl_destroy_head_sync_impl(clone, tx); 19563b2aab18SMatthew Ahrens 
19573b2aab18SMatthew Ahrens dsl_dataset_rele(clone, FTAG); 19583b2aab18SMatthew Ahrens dsl_dataset_rele(ds, FTAG); 19593b2aab18SMatthew Ahrens } 19603b2aab18SMatthew Ahrens 196191948b51SKeith M Wesolowski /* 1962a7027df1SMatthew Ahrens * Rolls back the given filesystem or volume to the most recent snapshot. 1963a7027df1SMatthew Ahrens * The name of the most recent snapshot will be returned under key "target" 1964a7027df1SMatthew Ahrens * in the result nvlist. 196591948b51SKeith M Wesolowski * 1966a7027df1SMatthew Ahrens * If owner != NULL: 196791948b51SKeith M Wesolowski * - The existing dataset MUST be owned by the specified owner at entry 196891948b51SKeith M Wesolowski * - Upon return, dataset will still be held by the same owner, whether we 196991948b51SKeith M Wesolowski * succeed or not. 197091948b51SKeith M Wesolowski * 197191948b51SKeith M Wesolowski * This mode is required any time the existing filesystem is mounted. See 197291948b51SKeith M Wesolowski * notes above zfs_suspend_fs() for further details. 
197391948b51SKeith M Wesolowski */ 19743b2aab18SMatthew Ahrens int 1975a7027df1SMatthew Ahrens dsl_dataset_rollback(const char *fsname, void *owner, nvlist_t *result) 19763b2aab18SMatthew Ahrens { 197791948b51SKeith M Wesolowski dsl_dataset_rollback_arg_t ddra; 197891948b51SKeith M Wesolowski 197991948b51SKeith M Wesolowski ddra.ddra_fsname = fsname; 198091948b51SKeith M Wesolowski ddra.ddra_owner = owner; 1981a7027df1SMatthew Ahrens ddra.ddra_result = result; 198291948b51SKeith M Wesolowski 19833b2aab18SMatthew Ahrens return (dsl_sync_task(fsname, dsl_dataset_rollback_check, 1984*7d46dc6cSMatthew Ahrens dsl_dataset_rollback_sync, &ddra, 1985*7d46dc6cSMatthew Ahrens 1, ZFS_SPACE_CHECK_RESERVED)); 1986fa9e4066Sahrens } 198799653d4eSeschrock 1988088f3894Sahrens struct promotenode { 1989745cd3c5Smaybee list_node_t link; 1990745cd3c5Smaybee dsl_dataset_t *ds; 1991745cd3c5Smaybee }; 1992745cd3c5Smaybee 19933b2aab18SMatthew Ahrens typedef struct dsl_dataset_promote_arg { 19943b2aab18SMatthew Ahrens const char *ddpa_clonename; 19953b2aab18SMatthew Ahrens dsl_dataset_t *ddpa_clone; 199674e7dc98SMatthew Ahrens list_t shared_snaps, origin_snaps, clone_snaps; 19973b2aab18SMatthew Ahrens dsl_dataset_t *origin_origin; /* origin of the origin */ 199874e7dc98SMatthew Ahrens uint64_t used, comp, uncomp, unique, cloneusedsnap, originusedsnap; 1999681d9761SEric Taylor char *err_ds; 2000a2afb611SJerry Jelinek cred_t *cr; 20013b2aab18SMatthew Ahrens } dsl_dataset_promote_arg_t; 20021d452cf5Sahrens 200374e7dc98SMatthew Ahrens static int snaplist_space(list_t *l, uint64_t mintxg, uint64_t *spacep); 20043b2aab18SMatthew Ahrens static int promote_hold(dsl_dataset_promote_arg_t *ddpa, dsl_pool_t *dp, 20053b2aab18SMatthew Ahrens void *tag); 20063b2aab18SMatthew Ahrens static void promote_rele(dsl_dataset_promote_arg_t *ddpa, void *tag); 200774e7dc98SMatthew Ahrens 200899653d4eSeschrock static int 20093b2aab18SMatthew Ahrens dsl_dataset_promote_check(void *arg, dmu_tx_t *tx) 
201099653d4eSeschrock { 20113b2aab18SMatthew Ahrens dsl_dataset_promote_arg_t *ddpa = arg; 20123b2aab18SMatthew Ahrens dsl_pool_t *dp = dmu_tx_pool(tx); 20133b2aab18SMatthew Ahrens dsl_dataset_t *hds; 20143b2aab18SMatthew Ahrens struct promotenode *snap; 20153b2aab18SMatthew Ahrens dsl_dataset_t *origin_ds; 2016745cd3c5Smaybee int err; 2017cde58dbcSMatthew Ahrens uint64_t unused; 2018a2afb611SJerry Jelinek uint64_t ss_mv_cnt; 20191d452cf5Sahrens 20203b2aab18SMatthew Ahrens err = promote_hold(ddpa, dp, FTAG); 20213b2aab18SMatthew Ahrens if (err != 0) 20223b2aab18SMatthew Ahrens return (err); 202399653d4eSeschrock 20243b2aab18SMatthew Ahrens hds = ddpa->ddpa_clone; 20251d452cf5Sahrens 20263b2aab18SMatthew Ahrens if (hds->ds_phys->ds_flags & DS_FLAG_NOPROMOTE) { 20273b2aab18SMatthew Ahrens promote_rele(ddpa, FTAG); 2028be6fd75aSMatthew Ahrens return (SET_ERROR(EXDEV)); 20293b2aab18SMatthew Ahrens } 20303b2aab18SMatthew Ahrens 20313b2aab18SMatthew Ahrens /* 20323b2aab18SMatthew Ahrens * Compute and check the amount of space to transfer. Since this is 20333b2aab18SMatthew Ahrens * so expensive, don't do the preliminary check. 
20343b2aab18SMatthew Ahrens */ 20353b2aab18SMatthew Ahrens if (!dmu_tx_is_syncing(tx)) { 20363b2aab18SMatthew Ahrens promote_rele(ddpa, FTAG); 20373b2aab18SMatthew Ahrens return (0); 20383b2aab18SMatthew Ahrens } 20393b2aab18SMatthew Ahrens 20403b2aab18SMatthew Ahrens snap = list_head(&ddpa->shared_snaps); 20413b2aab18SMatthew Ahrens origin_ds = snap->ds; 204299653d4eSeschrock 20433cb34c60Sahrens /* compute origin's new unique space */ 20443b2aab18SMatthew Ahrens snap = list_tail(&ddpa->clone_snaps); 204574e7dc98SMatthew Ahrens ASSERT3U(snap->ds->ds_phys->ds_prev_snap_obj, ==, origin_ds->ds_object); 2046cde58dbcSMatthew Ahrens dsl_deadlist_space_range(&snap->ds->ds_deadlist, 2047cde58dbcSMatthew Ahrens origin_ds->ds_phys->ds_prev_snap_txg, UINT64_MAX, 20483b2aab18SMatthew Ahrens &ddpa->unique, &unused, &unused); 204999653d4eSeschrock 2050745cd3c5Smaybee /* 2051745cd3c5Smaybee * Walk the snapshots that we are moving 2052745cd3c5Smaybee * 205374e7dc98SMatthew Ahrens * Compute space to transfer. Consider the incremental changes 20543b2aab18SMatthew Ahrens * to used by each snapshot: 205574e7dc98SMatthew Ahrens * (my used) = (prev's used) + (blocks born) - (blocks killed) 205674e7dc98SMatthew Ahrens * So each snapshot gave birth to: 205774e7dc98SMatthew Ahrens * (blocks born) = (my used) - (prev's used) + (blocks killed) 2058745cd3c5Smaybee * So a sequence would look like: 205974e7dc98SMatthew Ahrens * (uN - u(N-1) + kN) + ... + (u1 - u0 + k1) + (u0 - 0 + k0) 2060745cd3c5Smaybee * Which simplifies to: 206174e7dc98SMatthew Ahrens * uN + kN + kN-1 + ... + k1 + k0 2062745cd3c5Smaybee * Note however, if we stop before we reach the ORIGIN we get: 206374e7dc98SMatthew Ahrens * uN + kN + kN-1 + ... 
+ kM - uM-1 2064745cd3c5Smaybee */ 2065a2afb611SJerry Jelinek ss_mv_cnt = 0; 20663b2aab18SMatthew Ahrens ddpa->used = origin_ds->ds_phys->ds_referenced_bytes; 20673b2aab18SMatthew Ahrens ddpa->comp = origin_ds->ds_phys->ds_compressed_bytes; 20683b2aab18SMatthew Ahrens ddpa->uncomp = origin_ds->ds_phys->ds_uncompressed_bytes; 20693b2aab18SMatthew Ahrens for (snap = list_head(&ddpa->shared_snaps); snap; 20703b2aab18SMatthew Ahrens snap = list_next(&ddpa->shared_snaps, snap)) { 207199653d4eSeschrock uint64_t val, dlused, dlcomp, dluncomp; 2072745cd3c5Smaybee dsl_dataset_t *ds = snap->ds; 207399653d4eSeschrock 2074a2afb611SJerry Jelinek ss_mv_cnt++; 2075a2afb611SJerry Jelinek 20763b2aab18SMatthew Ahrens /* 20773b2aab18SMatthew Ahrens * If there are long holds, we won't be able to evict 20783b2aab18SMatthew Ahrens * the objset. 20793b2aab18SMatthew Ahrens */ 20803b2aab18SMatthew Ahrens if (dsl_dataset_long_held(ds)) { 2081be6fd75aSMatthew Ahrens err = SET_ERROR(EBUSY); 20823b2aab18SMatthew Ahrens goto out; 20833b2aab18SMatthew Ahrens } 20843b2aab18SMatthew Ahrens 208599653d4eSeschrock /* Check that the snapshot name does not conflict */ 20863b2aab18SMatthew Ahrens VERIFY0(dsl_dataset_get_snapname(ds)); 2087745cd3c5Smaybee err = dsl_dataset_snap_lookup(hds, ds->ds_snapname, &val); 2088681d9761SEric Taylor if (err == 0) { 20893b2aab18SMatthew Ahrens (void) strcpy(ddpa->err_ds, snap->ds->ds_snapname); 2090be6fd75aSMatthew Ahrens err = SET_ERROR(EEXIST); 2091681d9761SEric Taylor goto out; 2092681d9761SEric Taylor } 2093745cd3c5Smaybee if (err != ENOENT) 2094681d9761SEric Taylor goto out; 209599653d4eSeschrock 2096745cd3c5Smaybee /* The very first snapshot does not have a deadlist */ 209774e7dc98SMatthew Ahrens if (ds->ds_phys->ds_prev_snap_obj == 0) 209874e7dc98SMatthew Ahrens continue; 209974e7dc98SMatthew Ahrens 2100cde58dbcSMatthew Ahrens dsl_deadlist_space(&ds->ds_deadlist, 2101cde58dbcSMatthew Ahrens &dlused, &dlcomp, &dluncomp); 21023b2aab18SMatthew Ahrens ddpa->used 
+= dlused; 21033b2aab18SMatthew Ahrens ddpa->comp += dlcomp; 21043b2aab18SMatthew Ahrens ddpa->uncomp += dluncomp; 210574e7dc98SMatthew Ahrens } 2106745cd3c5Smaybee 2107745cd3c5Smaybee /* 2108745cd3c5Smaybee * If we are a clone of a clone then we never reached ORIGIN, 2109745cd3c5Smaybee * so we need to subtract out the clone origin's used space. 2110745cd3c5Smaybee */ 21113b2aab18SMatthew Ahrens if (ddpa->origin_origin) { 21123b2aab18SMatthew Ahrens ddpa->used -= ddpa->origin_origin->ds_phys->ds_referenced_bytes; 21133b2aab18SMatthew Ahrens ddpa->comp -= ddpa->origin_origin->ds_phys->ds_compressed_bytes; 21143b2aab18SMatthew Ahrens ddpa->uncomp -= 21153b2aab18SMatthew Ahrens ddpa->origin_origin->ds_phys->ds_uncompressed_bytes; 211699653d4eSeschrock } 211799653d4eSeschrock 2118a2afb611SJerry Jelinek /* Check that there is enough space and limit headroom here */ 211974e7dc98SMatthew Ahrens err = dsl_dir_transfer_possible(origin_ds->ds_dir, hds->ds_dir, 2120a2afb611SJerry Jelinek 0, ss_mv_cnt, ddpa->used, ddpa->cr); 21213b2aab18SMatthew Ahrens if (err != 0) 21223b2aab18SMatthew Ahrens goto out; 212374e7dc98SMatthew Ahrens 212474e7dc98SMatthew Ahrens /* 212574e7dc98SMatthew Ahrens * Compute the amounts of space that will be used by snapshots 212674e7dc98SMatthew Ahrens * after the promotion (for both origin and clone). For each, 212774e7dc98SMatthew Ahrens * it is the amount of space that will be on all of their 212874e7dc98SMatthew Ahrens * deadlists (that was not born before their new origin). 
212974e7dc98SMatthew Ahrens */ 213074e7dc98SMatthew Ahrens if (hds->ds_dir->dd_phys->dd_flags & DD_FLAG_USED_BREAKDOWN) { 213174e7dc98SMatthew Ahrens uint64_t space; 213274e7dc98SMatthew Ahrens 213374e7dc98SMatthew Ahrens /* 213474e7dc98SMatthew Ahrens * Note, typically this will not be a clone of a clone, 21353f9d6ad7SLin Ling * so dd_origin_txg will be < TXG_INITIAL, so 2136cde58dbcSMatthew Ahrens * these snaplist_space() -> dsl_deadlist_space_range() 213774e7dc98SMatthew Ahrens * calls will be fast because they do not have to 213874e7dc98SMatthew Ahrens * iterate over all bps. 213974e7dc98SMatthew Ahrens */ 21403b2aab18SMatthew Ahrens snap = list_head(&ddpa->origin_snaps); 21413b2aab18SMatthew Ahrens err = snaplist_space(&ddpa->shared_snaps, 21423b2aab18SMatthew Ahrens snap->ds->ds_dir->dd_origin_txg, &ddpa->cloneusedsnap); 21433b2aab18SMatthew Ahrens if (err != 0) 21443b2aab18SMatthew Ahrens goto out; 214574e7dc98SMatthew Ahrens 21463b2aab18SMatthew Ahrens err = snaplist_space(&ddpa->clone_snaps, 21473f9d6ad7SLin Ling snap->ds->ds_dir->dd_origin_txg, &space); 21483b2aab18SMatthew Ahrens if (err != 0) 21493b2aab18SMatthew Ahrens goto out; 21503b2aab18SMatthew Ahrens ddpa->cloneusedsnap += space; 215174e7dc98SMatthew Ahrens } 215274e7dc98SMatthew Ahrens if (origin_ds->ds_dir->dd_phys->dd_flags & DD_FLAG_USED_BREAKDOWN) { 21533b2aab18SMatthew Ahrens err = snaplist_space(&ddpa->origin_snaps, 21543b2aab18SMatthew Ahrens origin_ds->ds_phys->ds_creation_txg, &ddpa->originusedsnap); 21553b2aab18SMatthew Ahrens if (err != 0) 21563b2aab18SMatthew Ahrens goto out; 2157745cd3c5Smaybee } 21581d452cf5Sahrens 2159681d9761SEric Taylor out: 21603b2aab18SMatthew Ahrens promote_rele(ddpa, FTAG); 2161681d9761SEric Taylor return (err); 21621d452cf5Sahrens } 216399653d4eSeschrock 21641d452cf5Sahrens static void 21653b2aab18SMatthew Ahrens dsl_dataset_promote_sync(void *arg, dmu_tx_t *tx) 21661d452cf5Sahrens { 21673b2aab18SMatthew Ahrens dsl_dataset_promote_arg_t *ddpa = arg; 
21683b2aab18SMatthew Ahrens dsl_pool_t *dp = dmu_tx_pool(tx); 21693b2aab18SMatthew Ahrens dsl_dataset_t *hds; 21703b2aab18SMatthew Ahrens struct promotenode *snap; 21713b2aab18SMatthew Ahrens dsl_dataset_t *origin_ds; 21723b2aab18SMatthew Ahrens dsl_dataset_t *origin_head; 21733b2aab18SMatthew Ahrens dsl_dir_t *dd; 21743cb34c60Sahrens dsl_dir_t *odd = NULL; 2175088f3894Sahrens uint64_t oldnext_obj; 217674e7dc98SMatthew Ahrens int64_t delta; 21771d452cf5Sahrens 21783b2aab18SMatthew Ahrens VERIFY0(promote_hold(ddpa, dp, FTAG)); 21793b2aab18SMatthew Ahrens hds = ddpa->ddpa_clone; 21803b2aab18SMatthew Ahrens 21813b2aab18SMatthew Ahrens ASSERT0(hds->ds_phys->ds_flags & DS_FLAG_NOPROMOTE); 21821d452cf5Sahrens 21833b2aab18SMatthew Ahrens snap = list_head(&ddpa->shared_snaps); 21843b2aab18SMatthew Ahrens origin_ds = snap->ds; 21853b2aab18SMatthew Ahrens dd = hds->ds_dir; 21863b2aab18SMatthew Ahrens 21873b2aab18SMatthew Ahrens snap = list_head(&ddpa->origin_snaps); 218874e7dc98SMatthew Ahrens origin_head = snap->ds; 218974e7dc98SMatthew Ahrens 21900b69c2f0Sahrens /* 21913cb34c60Sahrens * We need to explicitly open odd, since origin_ds's dd will be 21920b69c2f0Sahrens * changing. 
21930b69c2f0Sahrens */ 21943b2aab18SMatthew Ahrens VERIFY0(dsl_dir_hold_obj(dp, origin_ds->ds_dir->dd_object, 21953cb34c60Sahrens NULL, FTAG, &odd)); 219699653d4eSeschrock 2197745cd3c5Smaybee /* change origin's next snap */ 2198745cd3c5Smaybee dmu_buf_will_dirty(origin_ds->ds_dbuf, tx); 2199088f3894Sahrens oldnext_obj = origin_ds->ds_phys->ds_next_snap_obj; 22003b2aab18SMatthew Ahrens snap = list_tail(&ddpa->clone_snaps); 220174e7dc98SMatthew Ahrens ASSERT3U(snap->ds->ds_phys->ds_prev_snap_obj, ==, origin_ds->ds_object); 220274e7dc98SMatthew Ahrens origin_ds->ds_phys->ds_next_snap_obj = snap->ds->ds_object; 2203745cd3c5Smaybee 2204088f3894Sahrens /* change the origin's next clone */ 2205088f3894Sahrens if (origin_ds->ds_phys->ds_next_clones_obj) { 22063b2aab18SMatthew Ahrens dsl_dataset_remove_from_next_clones(origin_ds, 22073b2aab18SMatthew Ahrens snap->ds->ds_object, tx); 22083b2aab18SMatthew Ahrens VERIFY0(zap_add_int(dp->dp_meta_objset, 2209088f3894Sahrens origin_ds->ds_phys->ds_next_clones_obj, 2210088f3894Sahrens oldnext_obj, tx)); 2211088f3894Sahrens } 2212088f3894Sahrens 2213745cd3c5Smaybee /* change origin */ 2214745cd3c5Smaybee dmu_buf_will_dirty(dd->dd_dbuf, tx); 2215745cd3c5Smaybee ASSERT3U(dd->dd_phys->dd_origin_obj, ==, origin_ds->ds_object); 2216745cd3c5Smaybee dd->dd_phys->dd_origin_obj = odd->dd_phys->dd_origin_obj; 22173f9d6ad7SLin Ling dd->dd_origin_txg = origin_head->ds_dir->dd_origin_txg; 2218745cd3c5Smaybee dmu_buf_will_dirty(odd->dd_dbuf, tx); 2219745cd3c5Smaybee odd->dd_phys->dd_origin_obj = origin_ds->ds_object; 22203f9d6ad7SLin Ling origin_head->ds_dir->dd_origin_txg = 22213f9d6ad7SLin Ling origin_ds->ds_phys->ds_creation_txg; 2222745cd3c5Smaybee 2223cde58dbcSMatthew Ahrens /* change dd_clone entries */ 2224cde58dbcSMatthew Ahrens if (spa_version(dp->dp_spa) >= SPA_VERSION_DIR_CLONES) { 22253b2aab18SMatthew Ahrens VERIFY0(zap_remove_int(dp->dp_meta_objset, 2226cde58dbcSMatthew Ahrens odd->dd_phys->dd_clones, hds->ds_object, tx)); 
22273b2aab18SMatthew Ahrens VERIFY0(zap_add_int(dp->dp_meta_objset, 22283b2aab18SMatthew Ahrens ddpa->origin_origin->ds_dir->dd_phys->dd_clones, 2229cde58dbcSMatthew Ahrens hds->ds_object, tx)); 2230cde58dbcSMatthew Ahrens 22313b2aab18SMatthew Ahrens VERIFY0(zap_remove_int(dp->dp_meta_objset, 22323b2aab18SMatthew Ahrens ddpa->origin_origin->ds_dir->dd_phys->dd_clones, 2233cde58dbcSMatthew Ahrens origin_head->ds_object, tx)); 2234cde58dbcSMatthew Ahrens if (dd->dd_phys->dd_clones == 0) { 2235cde58dbcSMatthew Ahrens dd->dd_phys->dd_clones = zap_create(dp->dp_meta_objset, 2236cde58dbcSMatthew Ahrens DMU_OT_DSL_CLONES, DMU_OT_NONE, 0, tx); 2237cde58dbcSMatthew Ahrens } 22383b2aab18SMatthew Ahrens VERIFY0(zap_add_int(dp->dp_meta_objset, 2239cde58dbcSMatthew Ahrens dd->dd_phys->dd_clones, origin_head->ds_object, tx)); 2240cde58dbcSMatthew Ahrens } 2241cde58dbcSMatthew Ahrens 224299653d4eSeschrock /* move snapshots to this dir */ 22433b2aab18SMatthew Ahrens for (snap = list_head(&ddpa->shared_snaps); snap; 22443b2aab18SMatthew Ahrens snap = list_next(&ddpa->shared_snaps, snap)) { 2245745cd3c5Smaybee dsl_dataset_t *ds = snap->ds; 224699653d4eSeschrock 22473b2aab18SMatthew Ahrens /* 22483b2aab18SMatthew Ahrens * Property callbacks are registered to a particular 22493b2aab18SMatthew Ahrens * dsl_dir. Since ours is changing, evict the objset 22503b2aab18SMatthew Ahrens * so that they will be unregistered from the old dsl_dir. 
22513b2aab18SMatthew Ahrens */ 2252503ad85cSMatthew Ahrens if (ds->ds_objset) { 2253503ad85cSMatthew Ahrens dmu_objset_evict(ds->ds_objset); 2254503ad85cSMatthew Ahrens ds->ds_objset = NULL; 22553baa08fcSek } 22563b2aab18SMatthew Ahrens 225799653d4eSeschrock /* move snap name entry */ 22583b2aab18SMatthew Ahrens VERIFY0(dsl_dataset_get_snapname(ds)); 22593b2aab18SMatthew Ahrens VERIFY0(dsl_dataset_snap_remove(origin_head, 2260a2afb611SJerry Jelinek ds->ds_snapname, tx, B_TRUE)); 22613b2aab18SMatthew Ahrens VERIFY0(zap_add(dp->dp_meta_objset, 226299653d4eSeschrock hds->ds_phys->ds_snapnames_zapobj, ds->ds_snapname, 226399653d4eSeschrock 8, 1, &ds->ds_object, tx)); 2264a2afb611SJerry Jelinek dsl_fs_ss_count_adjust(hds->ds_dir, 1, 2265a2afb611SJerry Jelinek DD_FIELD_SNAPSHOT_COUNT, tx); 2266cde58dbcSMatthew Ahrens 226799653d4eSeschrock /* change containing dsl_dir */ 226899653d4eSeschrock dmu_buf_will_dirty(ds->ds_dbuf, tx); 22693cb34c60Sahrens ASSERT3U(ds->ds_phys->ds_dir_obj, ==, odd->dd_object); 227099653d4eSeschrock ds->ds_phys->ds_dir_obj = dd->dd_object; 22713cb34c60Sahrens ASSERT3P(ds->ds_dir, ==, odd); 22723b2aab18SMatthew Ahrens dsl_dir_rele(ds->ds_dir, ds); 22733b2aab18SMatthew Ahrens VERIFY0(dsl_dir_hold_obj(dp, dd->dd_object, 227499653d4eSeschrock NULL, ds, &ds->ds_dir)); 227599653d4eSeschrock 2276cde58dbcSMatthew Ahrens /* move any clone references */ 2277cde58dbcSMatthew Ahrens if (ds->ds_phys->ds_next_clones_obj && 2278cde58dbcSMatthew Ahrens spa_version(dp->dp_spa) >= SPA_VERSION_DIR_CLONES) { 2279cde58dbcSMatthew Ahrens zap_cursor_t zc; 2280cde58dbcSMatthew Ahrens zap_attribute_t za; 2281cde58dbcSMatthew Ahrens 22823b2aab18SMatthew Ahrens for (zap_cursor_init(&zc, dp->dp_meta_objset, 22833b2aab18SMatthew Ahrens ds->ds_phys->ds_next_clones_obj); 22843b2aab18SMatthew Ahrens zap_cursor_retrieve(&zc, &za) == 0; 22853b2aab18SMatthew Ahrens zap_cursor_advance(&zc)) { 22863b2aab18SMatthew Ahrens dsl_dataset_t *cnds; 22873b2aab18SMatthew Ahrens uint64_t o; 
2288a9799022Sck 22893b2aab18SMatthew Ahrens if (za.za_first_integer == oldnext_obj) { 22903b2aab18SMatthew Ahrens /* 22913b2aab18SMatthew Ahrens * We've already moved the 22923b2aab18SMatthew Ahrens * origin's reference. 22933b2aab18SMatthew Ahrens */ 22943b2aab18SMatthew Ahrens continue; 22953b2aab18SMatthew Ahrens } 2296a9799022Sck 22973b2aab18SMatthew Ahrens VERIFY0(dsl_dataset_hold_obj(dp, 22983b2aab18SMatthew Ahrens za.za_first_integer, FTAG, &cnds)); 22993b2aab18SMatthew Ahrens o = cnds->ds_dir->dd_phys->dd_head_dataset_obj; 2300a9799022Sck 23013b2aab18SMatthew Ahrens VERIFY0(zap_remove_int(dp->dp_meta_objset, 23023b2aab18SMatthew Ahrens odd->dd_phys->dd_clones, o, tx)); 23033b2aab18SMatthew Ahrens VERIFY0(zap_add_int(dp->dp_meta_objset, 23043b2aab18SMatthew Ahrens dd->dd_phys->dd_clones, o, tx)); 23053b2aab18SMatthew Ahrens dsl_dataset_rele(cnds, FTAG); 23063b2aab18SMatthew Ahrens } 23073b2aab18SMatthew Ahrens zap_cursor_fini(&zc); 23083b2aab18SMatthew Ahrens } 23099082849eSck 23103b2aab18SMatthew Ahrens ASSERT(!dsl_prop_hascb(ds)); 2311a9799022Sck } 2312a9799022Sck 2313a9799022Sck /* 23143b2aab18SMatthew Ahrens * Change space accounting. 23153b2aab18SMatthew Ahrens * Note, pa->*usedsnap and dd_used_breakdown[SNAP] will either 23163b2aab18SMatthew Ahrens * both be valid, or both be 0 (resulting in delta == 0). This 23173b2aab18SMatthew Ahrens * is true for each of {clone,origin} independently. 
2318a9799022Sck */ 2319a9799022Sck 23203b2aab18SMatthew Ahrens delta = ddpa->cloneusedsnap - 23213b2aab18SMatthew Ahrens dd->dd_phys->dd_used_breakdown[DD_USED_SNAP]; 23223b2aab18SMatthew Ahrens ASSERT3S(delta, >=, 0); 23233b2aab18SMatthew Ahrens ASSERT3U(ddpa->used, >=, delta); 23243b2aab18SMatthew Ahrens dsl_dir_diduse_space(dd, DD_USED_SNAP, delta, 0, 0, tx); 23253b2aab18SMatthew Ahrens dsl_dir_diduse_space(dd, DD_USED_HEAD, 23263b2aab18SMatthew Ahrens ddpa->used - delta, ddpa->comp, ddpa->uncomp, tx); 23273b2aab18SMatthew Ahrens 23283b2aab18SMatthew Ahrens delta = ddpa->originusedsnap - 23293b2aab18SMatthew Ahrens odd->dd_phys->dd_used_breakdown[DD_USED_SNAP]; 23303b2aab18SMatthew Ahrens ASSERT3S(delta, <=, 0); 23313b2aab18SMatthew Ahrens ASSERT3U(ddpa->used, >=, -delta); 23323b2aab18SMatthew Ahrens dsl_dir_diduse_space(odd, DD_USED_SNAP, delta, 0, 0, tx); 23333b2aab18SMatthew Ahrens dsl_dir_diduse_space(odd, DD_USED_HEAD, 23343b2aab18SMatthew Ahrens -ddpa->used - delta, -ddpa->comp, -ddpa->uncomp, tx); 23353b2aab18SMatthew Ahrens 23363b2aab18SMatthew Ahrens origin_ds->ds_phys->ds_unique_bytes = ddpa->unique; 23373b2aab18SMatthew Ahrens 23383b2aab18SMatthew Ahrens /* log history record */ 23393b2aab18SMatthew Ahrens spa_history_log_internal_ds(hds, "promote", tx, ""); 23403b2aab18SMatthew Ahrens 23413b2aab18SMatthew Ahrens dsl_dir_rele(odd, FTAG); 23423b2aab18SMatthew Ahrens promote_rele(ddpa, FTAG); 2343a9799022Sck } 2344a9799022Sck 23453b2aab18SMatthew Ahrens /* 23463b2aab18SMatthew Ahrens * Make a list of dsl_dataset_t's for the snapshots between first_obj 23473b2aab18SMatthew Ahrens * (exclusive) and last_obj (inclusive). The list will be in reverse 23483b2aab18SMatthew Ahrens * order (last_obj will be the list_head()). If first_obj == 0, do all 23493b2aab18SMatthew Ahrens * snapshots back to this dataset's origin. 
23503b2aab18SMatthew Ahrens */ 2351a9799022Sck static int 23523b2aab18SMatthew Ahrens snaplist_make(dsl_pool_t *dp, 23533b2aab18SMatthew Ahrens uint64_t first_obj, uint64_t last_obj, list_t *l, void *tag) 2354a9799022Sck { 23553b2aab18SMatthew Ahrens uint64_t obj = last_obj; 2356a9799022Sck 23573b2aab18SMatthew Ahrens list_create(l, sizeof (struct promotenode), 23583b2aab18SMatthew Ahrens offsetof(struct promotenode, link)); 2359a9799022Sck 23603b2aab18SMatthew Ahrens while (obj != first_obj) { 23613b2aab18SMatthew Ahrens dsl_dataset_t *ds; 23623b2aab18SMatthew Ahrens struct promotenode *snap; 23633b2aab18SMatthew Ahrens int err; 236492241e0bSTom Erickson 23653b2aab18SMatthew Ahrens err = dsl_dataset_hold_obj(dp, obj, tag, &ds); 23663b2aab18SMatthew Ahrens ASSERT(err != ENOENT); 23673b2aab18SMatthew Ahrens if (err != 0) 23683b2aab18SMatthew Ahrens return (err); 2369a9799022Sck 23703b2aab18SMatthew Ahrens if (first_obj == 0) 23713b2aab18SMatthew Ahrens first_obj = ds->ds_dir->dd_phys->dd_origin_obj; 23723b2aab18SMatthew Ahrens 23733b2aab18SMatthew Ahrens snap = kmem_alloc(sizeof (*snap), KM_SLEEP); 23743b2aab18SMatthew Ahrens snap->ds = ds; 23753b2aab18SMatthew Ahrens list_insert_tail(l, snap); 23763b2aab18SMatthew Ahrens obj = ds->ds_phys->ds_prev_snap_obj; 23773b2aab18SMatthew Ahrens } 2378a9799022Sck 2379a9799022Sck return (0); 2380a9799022Sck } 2381a9799022Sck 23823b2aab18SMatthew Ahrens static int 23833b2aab18SMatthew Ahrens snaplist_space(list_t *l, uint64_t mintxg, uint64_t *spacep) 2384a9799022Sck { 23853b2aab18SMatthew Ahrens struct promotenode *snap; 2386a9799022Sck 23873b2aab18SMatthew Ahrens *spacep = 0; 23883b2aab18SMatthew Ahrens for (snap = list_head(l); snap; snap = list_next(l, snap)) { 23893b2aab18SMatthew Ahrens uint64_t used, comp, uncomp; 23903b2aab18SMatthew Ahrens dsl_deadlist_space_range(&snap->ds->ds_deadlist, 23913b2aab18SMatthew Ahrens mintxg, UINT64_MAX, &used, &comp, &uncomp); 23923b2aab18SMatthew Ahrens *spacep += used; 239392241e0bSTom 
Erickson } 23943b2aab18SMatthew Ahrens return (0); 2395a9799022Sck } 2396a9799022Sck 23973b2aab18SMatthew Ahrens static void 23983b2aab18SMatthew Ahrens snaplist_destroy(list_t *l, void *tag) 2399a9799022Sck { 24003b2aab18SMatthew Ahrens struct promotenode *snap; 240192241e0bSTom Erickson 24023b2aab18SMatthew Ahrens if (l == NULL || !list_link_active(&l->list_head)) 24033b2aab18SMatthew Ahrens return; 2404a9799022Sck 24053b2aab18SMatthew Ahrens while ((snap = list_tail(l)) != NULL) { 24063b2aab18SMatthew Ahrens list_remove(l, snap); 24073b2aab18SMatthew Ahrens dsl_dataset_rele(snap->ds, tag); 24083b2aab18SMatthew Ahrens kmem_free(snap, sizeof (*snap)); 24093b2aab18SMatthew Ahrens } 24103b2aab18SMatthew Ahrens list_destroy(l); 2411a9799022Sck } 2412a9799022Sck 2413a9799022Sck static int 24143b2aab18SMatthew Ahrens promote_hold(dsl_dataset_promote_arg_t *ddpa, dsl_pool_t *dp, void *tag) 2415a9799022Sck { 24163b2aab18SMatthew Ahrens int error; 24173b2aab18SMatthew Ahrens dsl_dir_t *dd; 24183b2aab18SMatthew Ahrens struct promotenode *snap; 2419a9799022Sck 24203b2aab18SMatthew Ahrens error = dsl_dataset_hold(dp, ddpa->ddpa_clonename, tag, 24213b2aab18SMatthew Ahrens &ddpa->ddpa_clone); 24223b2aab18SMatthew Ahrens if (error != 0) 24233b2aab18SMatthew Ahrens return (error); 24243b2aab18SMatthew Ahrens dd = ddpa->ddpa_clone->ds_dir; 2425a9799022Sck 24263b2aab18SMatthew Ahrens if (dsl_dataset_is_snapshot(ddpa->ddpa_clone) || 24273b2aab18SMatthew Ahrens !dsl_dir_is_clone(dd)) { 24283b2aab18SMatthew Ahrens dsl_dataset_rele(ddpa->ddpa_clone, tag); 2429be6fd75aSMatthew Ahrens return (SET_ERROR(EINVAL)); 24303b2aab18SMatthew Ahrens } 2431a9799022Sck 24323b2aab18SMatthew Ahrens error = snaplist_make(dp, 0, dd->dd_phys->dd_origin_obj, 24333b2aab18SMatthew Ahrens &ddpa->shared_snaps, tag); 24343b2aab18SMatthew Ahrens if (error != 0) 24353b2aab18SMatthew Ahrens goto out; 2436a9799022Sck 24373b2aab18SMatthew Ahrens error = snaplist_make(dp, 0, ddpa->ddpa_clone->ds_object, 
24383b2aab18SMatthew Ahrens &ddpa->clone_snaps, tag); 24393b2aab18SMatthew Ahrens if (error != 0) 24403b2aab18SMatthew Ahrens goto out; 2441a9799022Sck 24423b2aab18SMatthew Ahrens snap = list_head(&ddpa->shared_snaps); 24433b2aab18SMatthew Ahrens ASSERT3U(snap->ds->ds_object, ==, dd->dd_phys->dd_origin_obj); 24443b2aab18SMatthew Ahrens error = snaplist_make(dp, dd->dd_phys->dd_origin_obj, 24453b2aab18SMatthew Ahrens snap->ds->ds_dir->dd_phys->dd_head_dataset_obj, 24463b2aab18SMatthew Ahrens &ddpa->origin_snaps, tag); 24473b2aab18SMatthew Ahrens if (error != 0) 24483b2aab18SMatthew Ahrens goto out; 2449379c004dSEric Schrock 24503b2aab18SMatthew Ahrens if (snap->ds->ds_dir->dd_phys->dd_origin_obj != 0) { 24513b2aab18SMatthew Ahrens error = dsl_dataset_hold_obj(dp, 24523b2aab18SMatthew Ahrens snap->ds->ds_dir->dd_phys->dd_origin_obj, 24533b2aab18SMatthew Ahrens tag, &ddpa->origin_origin); 24543b2aab18SMatthew Ahrens if (error != 0) 24553b2aab18SMatthew Ahrens goto out; 2456379c004dSEric Schrock } 24573b2aab18SMatthew Ahrens out: 24583b2aab18SMatthew Ahrens if (error != 0) 24593b2aab18SMatthew Ahrens promote_rele(ddpa, tag); 24603b2aab18SMatthew Ahrens return (error); 2461a9799022Sck } 2462a9799022Sck 2463a9799022Sck static void 24643b2aab18SMatthew Ahrens promote_rele(dsl_dataset_promote_arg_t *ddpa, void *tag) 2465a9799022Sck { 24663b2aab18SMatthew Ahrens snaplist_destroy(&ddpa->shared_snaps, tag); 24673b2aab18SMatthew Ahrens snaplist_destroy(&ddpa->clone_snaps, tag); 24683b2aab18SMatthew Ahrens snaplist_destroy(&ddpa->origin_snaps, tag); 24693b2aab18SMatthew Ahrens if (ddpa->origin_origin != NULL) 24703b2aab18SMatthew Ahrens dsl_dataset_rele(ddpa->origin_origin, tag); 24713b2aab18SMatthew Ahrens dsl_dataset_rele(ddpa->ddpa_clone, tag); 24723b2aab18SMatthew Ahrens } 247302c8f3f0SMatthew Ahrens 24743b2aab18SMatthew Ahrens /* 24753b2aab18SMatthew Ahrens * Promote a clone. 
24763b2aab18SMatthew Ahrens * 24773b2aab18SMatthew Ahrens * If it fails due to a conflicting snapshot name, "conflsnap" will be filled 24783b2aab18SMatthew Ahrens * in with the name. (It must be at least MAXNAMELEN bytes long.) 24793b2aab18SMatthew Ahrens */ 24803b2aab18SMatthew Ahrens int 24813b2aab18SMatthew Ahrens dsl_dataset_promote(const char *name, char *conflsnap) 24823b2aab18SMatthew Ahrens { 24833b2aab18SMatthew Ahrens dsl_dataset_promote_arg_t ddpa = { 0 }; 24843b2aab18SMatthew Ahrens uint64_t numsnaps; 24853b2aab18SMatthew Ahrens int error; 24863b2aab18SMatthew Ahrens objset_t *os; 248792241e0bSTom Erickson 24883b2aab18SMatthew Ahrens /* 24893b2aab18SMatthew Ahrens * We will modify space proportional to the number of 24903b2aab18SMatthew Ahrens * snapshots. Compute numsnaps. 24913b2aab18SMatthew Ahrens */ 24923b2aab18SMatthew Ahrens error = dmu_objset_hold(name, FTAG, &os); 24933b2aab18SMatthew Ahrens if (error != 0) 24943b2aab18SMatthew Ahrens return (error); 24953b2aab18SMatthew Ahrens error = zap_count(dmu_objset_pool(os)->dp_meta_objset, 24963b2aab18SMatthew Ahrens dmu_objset_ds(os)->ds_phys->ds_snapnames_zapobj, &numsnaps); 24973b2aab18SMatthew Ahrens dmu_objset_rele(os, FTAG); 24983b2aab18SMatthew Ahrens if (error != 0) 24993b2aab18SMatthew Ahrens return (error); 250002c8f3f0SMatthew Ahrens 25013b2aab18SMatthew Ahrens ddpa.ddpa_clonename = name; 25023b2aab18SMatthew Ahrens ddpa.err_ds = conflsnap; 2503a2afb611SJerry Jelinek ddpa.cr = CRED(); 250402c8f3f0SMatthew Ahrens 25053b2aab18SMatthew Ahrens return (dsl_sync_task(name, dsl_dataset_promote_check, 2506*7d46dc6cSMatthew Ahrens dsl_dataset_promote_sync, &ddpa, 2507*7d46dc6cSMatthew Ahrens 2 + numsnaps, ZFS_SPACE_CHECK_RESERVED)); 2508a9799022Sck } 2509a9799022Sck 2510a9799022Sck int 25113b2aab18SMatthew Ahrens dsl_dataset_clone_swap_check_impl(dsl_dataset_t *clone, 251291948b51SKeith M Wesolowski dsl_dataset_t *origin_head, boolean_t force, void *owner, dmu_tx_t *tx) 2513a9799022Sck { 
25143b2aab18SMatthew Ahrens int64_t unused_refres_delta; 2515a9799022Sck 25163b2aab18SMatthew Ahrens /* they should both be heads */ 25173b2aab18SMatthew Ahrens if (dsl_dataset_is_snapshot(clone) || 25183b2aab18SMatthew Ahrens dsl_dataset_is_snapshot(origin_head)) 2519be6fd75aSMatthew Ahrens return (SET_ERROR(EINVAL)); 252092241e0bSTom Erickson 252134f2f8cfSMatthew Ahrens /* if we are not forcing, the branch point should be just before them */ 252234f2f8cfSMatthew Ahrens if (!force && clone->ds_prev != origin_head->ds_prev) 2523be6fd75aSMatthew Ahrens return (SET_ERROR(EINVAL)); 2524a9799022Sck 25253b2aab18SMatthew Ahrens /* clone should be the clone (unless they are unrelated) */ 25263b2aab18SMatthew Ahrens if (clone->ds_prev != NULL && 25273b2aab18SMatthew Ahrens clone->ds_prev != clone->ds_dir->dd_pool->dp_origin_snap && 252834f2f8cfSMatthew Ahrens origin_head->ds_dir != clone->ds_prev->ds_dir) 2529be6fd75aSMatthew Ahrens return (SET_ERROR(EINVAL)); 253092241e0bSTom Erickson 25313b2aab18SMatthew Ahrens /* the clone should be a child of the origin */ 25323b2aab18SMatthew Ahrens if (clone->ds_dir->dd_parent != origin_head->ds_dir) 2533be6fd75aSMatthew Ahrens return (SET_ERROR(EINVAL)); 2534842727c2SChris Kirby 25353b2aab18SMatthew Ahrens /* origin_head shouldn't be modified unless 'force' */ 253634f2f8cfSMatthew Ahrens if (!force && 253734f2f8cfSMatthew Ahrens dsl_dataset_modified_since_snap(origin_head, origin_head->ds_prev)) 2538be6fd75aSMatthew Ahrens return (SET_ERROR(ETXTBSY)); 2539c99e4bdcSChris Kirby 25403b2aab18SMatthew Ahrens /* origin_head should have no long holds (e.g. 
is not mounted) */ 254191948b51SKeith M Wesolowski if (dsl_dataset_handoff_check(origin_head, owner, tx)) 2542be6fd75aSMatthew Ahrens return (SET_ERROR(EBUSY)); 25433b2aab18SMatthew Ahrens 25443b2aab18SMatthew Ahrens /* check amount of any unconsumed refreservation */ 25453b2aab18SMatthew Ahrens unused_refres_delta = 25463b2aab18SMatthew Ahrens (int64_t)MIN(origin_head->ds_reserved, 25473b2aab18SMatthew Ahrens origin_head->ds_phys->ds_unique_bytes) - 25483b2aab18SMatthew Ahrens (int64_t)MIN(origin_head->ds_reserved, 25493b2aab18SMatthew Ahrens clone->ds_phys->ds_unique_bytes); 25503b2aab18SMatthew Ahrens 25513b2aab18SMatthew Ahrens if (unused_refres_delta > 0 && 25523b2aab18SMatthew Ahrens unused_refres_delta > 25533b2aab18SMatthew Ahrens dsl_dir_space_available(origin_head->ds_dir, NULL, 0, TRUE)) 2554be6fd75aSMatthew Ahrens return (SET_ERROR(ENOSPC)); 25553b2aab18SMatthew Ahrens 25563b2aab18SMatthew Ahrens /* clone can't be over the head's refquota */ 25573b2aab18SMatthew Ahrens if (origin_head->ds_quota != 0 && 25583b2aab18SMatthew Ahrens clone->ds_phys->ds_referenced_bytes > origin_head->ds_quota) 2559be6fd75aSMatthew Ahrens return (SET_ERROR(EDQUOT)); 2560c99e4bdcSChris Kirby 25613b2aab18SMatthew Ahrens return (0); 2562c99e4bdcSChris Kirby } 2563c99e4bdcSChris Kirby 2564a7f53a56SChris Kirby void 25653b2aab18SMatthew Ahrens dsl_dataset_clone_swap_sync_impl(dsl_dataset_t *clone, 25663b2aab18SMatthew Ahrens dsl_dataset_t *origin_head, dmu_tx_t *tx) 2567a7f53a56SChris Kirby { 25683b2aab18SMatthew Ahrens dsl_pool_t *dp = dmu_tx_pool(tx); 25693b2aab18SMatthew Ahrens int64_t unused_refres_delta; 2570a7f53a56SChris Kirby 25713b2aab18SMatthew Ahrens ASSERT(clone->ds_reserved == 0); 25723b2aab18SMatthew Ahrens ASSERT(origin_head->ds_quota == 0 || 25733b2aab18SMatthew Ahrens clone->ds_phys->ds_unique_bytes <= origin_head->ds_quota); 257434f2f8cfSMatthew Ahrens ASSERT3P(clone->ds_prev, ==, origin_head->ds_prev); 2575842727c2SChris Kirby 25763b2aab18SMatthew Ahrens 
dmu_buf_will_dirty(clone->ds_dbuf, tx); 25773b2aab18SMatthew Ahrens dmu_buf_will_dirty(origin_head->ds_dbuf, tx); 2578842727c2SChris Kirby 25793b2aab18SMatthew Ahrens if (clone->ds_objset != NULL) { 25803b2aab18SMatthew Ahrens dmu_objset_evict(clone->ds_objset); 25813b2aab18SMatthew Ahrens clone->ds_objset = NULL; 25823b2aab18SMatthew Ahrens } 2583842727c2SChris Kirby 25843b2aab18SMatthew Ahrens if (origin_head->ds_objset != NULL) { 25853b2aab18SMatthew Ahrens dmu_objset_evict(origin_head->ds_objset); 25863b2aab18SMatthew Ahrens origin_head->ds_objset = NULL; 2587842727c2SChris Kirby } 2588842727c2SChris Kirby 25893b2aab18SMatthew Ahrens unused_refres_delta = 25903b2aab18SMatthew Ahrens (int64_t)MIN(origin_head->ds_reserved, 25913b2aab18SMatthew Ahrens origin_head->ds_phys->ds_unique_bytes) - 25923b2aab18SMatthew Ahrens (int64_t)MIN(origin_head->ds_reserved, 25933b2aab18SMatthew Ahrens clone->ds_phys->ds_unique_bytes); 25943b2aab18SMatthew Ahrens 25953b2aab18SMatthew Ahrens /* 25963b2aab18SMatthew Ahrens * Reset origin's unique bytes, if it exists. 
25973b2aab18SMatthew Ahrens */ 25983b2aab18SMatthew Ahrens if (clone->ds_prev) { 25993b2aab18SMatthew Ahrens dsl_dataset_t *origin = clone->ds_prev; 26003b2aab18SMatthew Ahrens uint64_t comp, uncomp; 26013b2aab18SMatthew Ahrens 26023b2aab18SMatthew Ahrens dmu_buf_will_dirty(origin->ds_dbuf, tx); 26033b2aab18SMatthew Ahrens dsl_deadlist_space_range(&clone->ds_deadlist, 26043b2aab18SMatthew Ahrens origin->ds_phys->ds_prev_snap_txg, UINT64_MAX, 26053b2aab18SMatthew Ahrens &origin->ds_phys->ds_unique_bytes, &comp, &uncomp); 26063b2aab18SMatthew Ahrens } 26073b2aab18SMatthew Ahrens 26083b2aab18SMatthew Ahrens /* swap blkptrs */ 26093b2aab18SMatthew Ahrens { 26103b2aab18SMatthew Ahrens blkptr_t tmp; 26113b2aab18SMatthew Ahrens tmp = origin_head->ds_phys->ds_bp; 26123b2aab18SMatthew Ahrens origin_head->ds_phys->ds_bp = clone->ds_phys->ds_bp; 26133b2aab18SMatthew Ahrens clone->ds_phys->ds_bp = tmp; 26143b2aab18SMatthew Ahrens } 26153b2aab18SMatthew Ahrens 26163b2aab18SMatthew Ahrens /* set dd_*_bytes */ 26173b2aab18SMatthew Ahrens { 26183b2aab18SMatthew Ahrens int64_t dused, dcomp, duncomp; 26193b2aab18SMatthew Ahrens uint64_t cdl_used, cdl_comp, cdl_uncomp; 26203b2aab18SMatthew Ahrens uint64_t odl_used, odl_comp, odl_uncomp; 26213b2aab18SMatthew Ahrens 26223b2aab18SMatthew Ahrens ASSERT3U(clone->ds_dir->dd_phys-> 26233b2aab18SMatthew Ahrens dd_used_breakdown[DD_USED_SNAP], ==, 0); 26243b2aab18SMatthew Ahrens 26253b2aab18SMatthew Ahrens dsl_deadlist_space(&clone->ds_deadlist, 26263b2aab18SMatthew Ahrens &cdl_used, &cdl_comp, &cdl_uncomp); 26273b2aab18SMatthew Ahrens dsl_deadlist_space(&origin_head->ds_deadlist, 26283b2aab18SMatthew Ahrens &odl_used, &odl_comp, &odl_uncomp); 262915508ac0SChris Kirby 26303b2aab18SMatthew Ahrens dused = clone->ds_phys->ds_referenced_bytes + cdl_used - 26313b2aab18SMatthew Ahrens (origin_head->ds_phys->ds_referenced_bytes + odl_used); 26323b2aab18SMatthew Ahrens dcomp = clone->ds_phys->ds_compressed_bytes + cdl_comp - 26333b2aab18SMatthew 
Ahrens (origin_head->ds_phys->ds_compressed_bytes + odl_comp); 26343b2aab18SMatthew Ahrens duncomp = clone->ds_phys->ds_uncompressed_bytes + 26353b2aab18SMatthew Ahrens cdl_uncomp - 26363b2aab18SMatthew Ahrens (origin_head->ds_phys->ds_uncompressed_bytes + odl_uncomp); 2637842727c2SChris Kirby 26383b2aab18SMatthew Ahrens dsl_dir_diduse_space(origin_head->ds_dir, DD_USED_HEAD, 26393b2aab18SMatthew Ahrens dused, dcomp, duncomp, tx); 26403b2aab18SMatthew Ahrens dsl_dir_diduse_space(clone->ds_dir, DD_USED_HEAD, 26413b2aab18SMatthew Ahrens -dused, -dcomp, -duncomp, tx); 2642842727c2SChris Kirby 2643842727c2SChris Kirby /* 26443b2aab18SMatthew Ahrens * The difference in the space used by snapshots is the 26453b2aab18SMatthew Ahrens * difference in snapshot space due to the head's 26463b2aab18SMatthew Ahrens * deadlist (since that's the only thing that's 26473b2aab18SMatthew Ahrens * changing that affects the snapused). 2648842727c2SChris Kirby */ 26493b2aab18SMatthew Ahrens dsl_deadlist_space_range(&clone->ds_deadlist, 26503b2aab18SMatthew Ahrens origin_head->ds_dir->dd_origin_txg, UINT64_MAX, 26513b2aab18SMatthew Ahrens &cdl_used, &cdl_comp, &cdl_uncomp); 26523b2aab18SMatthew Ahrens dsl_deadlist_space_range(&origin_head->ds_deadlist, 26533b2aab18SMatthew Ahrens origin_head->ds_dir->dd_origin_txg, UINT64_MAX, 26543b2aab18SMatthew Ahrens &odl_used, &odl_comp, &odl_uncomp); 26553b2aab18SMatthew Ahrens dsl_dir_transfer_space(origin_head->ds_dir, cdl_used - odl_used, 26563b2aab18SMatthew Ahrens DD_USED_HEAD, DD_USED_SNAP, tx); 2657842727c2SChris Kirby } 2658842727c2SChris Kirby 26593b2aab18SMatthew Ahrens /* swap ds_*_bytes */ 26603b2aab18SMatthew Ahrens SWITCH64(origin_head->ds_phys->ds_referenced_bytes, 26613b2aab18SMatthew Ahrens clone->ds_phys->ds_referenced_bytes); 26623b2aab18SMatthew Ahrens SWITCH64(origin_head->ds_phys->ds_compressed_bytes, 26633b2aab18SMatthew Ahrens clone->ds_phys->ds_compressed_bytes); 26643b2aab18SMatthew Ahrens 
SWITCH64(origin_head->ds_phys->ds_uncompressed_bytes, 26653b2aab18SMatthew Ahrens clone->ds_phys->ds_uncompressed_bytes); 26663b2aab18SMatthew Ahrens SWITCH64(origin_head->ds_phys->ds_unique_bytes, 26673b2aab18SMatthew Ahrens clone->ds_phys->ds_unique_bytes); 2668842727c2SChris Kirby 26693b2aab18SMatthew Ahrens /* apply any parent delta for change in unconsumed refreservation */ 26703b2aab18SMatthew Ahrens dsl_dir_diduse_space(origin_head->ds_dir, DD_USED_REFRSRV, 26713b2aab18SMatthew Ahrens unused_refres_delta, 0, 0, tx); 2672ca45db41SChris Kirby 26733b2aab18SMatthew Ahrens /* 26743b2aab18SMatthew Ahrens * Swap deadlists. 26753b2aab18SMatthew Ahrens */ 26763b2aab18SMatthew Ahrens dsl_deadlist_close(&clone->ds_deadlist); 26773b2aab18SMatthew Ahrens dsl_deadlist_close(&origin_head->ds_deadlist); 26783b2aab18SMatthew Ahrens SWITCH64(origin_head->ds_phys->ds_deadlist_obj, 26793b2aab18SMatthew Ahrens clone->ds_phys->ds_deadlist_obj); 26803b2aab18SMatthew Ahrens dsl_deadlist_open(&clone->ds_deadlist, dp->dp_meta_objset, 26813b2aab18SMatthew Ahrens clone->ds_phys->ds_deadlist_obj); 26823b2aab18SMatthew Ahrens dsl_deadlist_open(&origin_head->ds_deadlist, dp->dp_meta_objset, 26833b2aab18SMatthew Ahrens origin_head->ds_phys->ds_deadlist_obj); 2684842727c2SChris Kirby 26853b2aab18SMatthew Ahrens dsl_scan_ds_clone_swapped(origin_head, clone, tx); 2686842727c2SChris Kirby 26873b2aab18SMatthew Ahrens spa_history_log_internal_ds(clone, "clone swap", tx, 26883b2aab18SMatthew Ahrens "parent=%s", origin_head->ds_dir->dd_myname); 2689842727c2SChris Kirby } 2690842727c2SChris Kirby 26913b2aab18SMatthew Ahrens /* 26923b2aab18SMatthew Ahrens * Given a pool name and a dataset object number in that pool, 26933b2aab18SMatthew Ahrens * return the name of that dataset. 
26943b2aab18SMatthew Ahrens */ 2695a7f53a56SChris Kirby int 26963b2aab18SMatthew Ahrens dsl_dsobj_to_dsname(char *pname, uint64_t obj, char *buf) 2697a7f53a56SChris Kirby { 26983b2aab18SMatthew Ahrens dsl_pool_t *dp; 26993b2aab18SMatthew Ahrens dsl_dataset_t *ds; 2700a7f53a56SChris Kirby int error; 2701a7f53a56SChris Kirby 27023b2aab18SMatthew Ahrens error = dsl_pool_hold(pname, FTAG, &dp); 27033b2aab18SMatthew Ahrens if (error != 0) 27043b2aab18SMatthew Ahrens return (error); 27053b2aab18SMatthew Ahrens 27063b2aab18SMatthew Ahrens error = dsl_dataset_hold_obj(dp, obj, FTAG, &ds); 27073b2aab18SMatthew Ahrens if (error == 0) { 27083b2aab18SMatthew Ahrens dsl_dataset_name(ds, buf); 27093b2aab18SMatthew Ahrens dsl_dataset_rele(ds, FTAG); 27103b2aab18SMatthew Ahrens } 27113b2aab18SMatthew Ahrens dsl_pool_rele(dp, FTAG); 2712a7f53a56SChris Kirby 2713a7f53a56SChris Kirby return (error); 2714a7f53a56SChris Kirby } 2715a7f53a56SChris Kirby 2716842727c2SChris Kirby int 27173b2aab18SMatthew Ahrens dsl_dataset_check_quota(dsl_dataset_t *ds, boolean_t check_quota, 27183b2aab18SMatthew Ahrens uint64_t asize, uint64_t inflight, uint64_t *used, uint64_t *ref_rsrv) 2719842727c2SChris Kirby { 27203b2aab18SMatthew Ahrens int error = 0; 2721842727c2SChris Kirby 27223b2aab18SMatthew Ahrens ASSERT3S(asize, >, 0); 2723842727c2SChris Kirby 27243b2aab18SMatthew Ahrens /* 27253b2aab18SMatthew Ahrens * *ref_rsrv is the portion of asize that will come from any 27263b2aab18SMatthew Ahrens * unconsumed refreservation space. 27273b2aab18SMatthew Ahrens */ 27283b2aab18SMatthew Ahrens *ref_rsrv = 0; 2729842727c2SChris Kirby 27303b2aab18SMatthew Ahrens mutex_enter(&ds->ds_lock); 27313b2aab18SMatthew Ahrens /* 27323b2aab18SMatthew Ahrens * Make a space adjustment for reserved bytes. 
27333b2aab18SMatthew Ahrens */ 27343b2aab18SMatthew Ahrens if (ds->ds_reserved > ds->ds_phys->ds_unique_bytes) { 27353b2aab18SMatthew Ahrens ASSERT3U(*used, >=, 27363b2aab18SMatthew Ahrens ds->ds_reserved - ds->ds_phys->ds_unique_bytes); 27373b2aab18SMatthew Ahrens *used -= (ds->ds_reserved - ds->ds_phys->ds_unique_bytes); 27383b2aab18SMatthew Ahrens *ref_rsrv = 27393b2aab18SMatthew Ahrens asize - MIN(asize, parent_delta(ds, asize + inflight)); 2740842727c2SChris Kirby } 2741842727c2SChris Kirby 27423b2aab18SMatthew Ahrens if (!check_quota || ds->ds_quota == 0) { 27433b2aab18SMatthew Ahrens mutex_exit(&ds->ds_lock); 27443b2aab18SMatthew Ahrens return (0); 2745842727c2SChris Kirby } 27463b2aab18SMatthew Ahrens /* 27473b2aab18SMatthew Ahrens * If they are requesting more space, and our current estimate 27483b2aab18SMatthew Ahrens * is over quota, they get to try again unless the actual 27493b2aab18SMatthew Ahrens * on-disk is over quota and there are no pending changes (which 27503b2aab18SMatthew Ahrens * may free up space for us). 
27513b2aab18SMatthew Ahrens */ 27523b2aab18SMatthew Ahrens if (ds->ds_phys->ds_referenced_bytes + inflight >= ds->ds_quota) { 27533b2aab18SMatthew Ahrens if (inflight > 0 || 27543b2aab18SMatthew Ahrens ds->ds_phys->ds_referenced_bytes < ds->ds_quota) 2755be6fd75aSMatthew Ahrens error = SET_ERROR(ERESTART); 27563b2aab18SMatthew Ahrens else 2757be6fd75aSMatthew Ahrens error = SET_ERROR(EDQUOT); 2758842727c2SChris Kirby } 27593b2aab18SMatthew Ahrens mutex_exit(&ds->ds_lock); 2760842727c2SChris Kirby 2761842727c2SChris Kirby return (error); 2762842727c2SChris Kirby } 2763842727c2SChris Kirby 27643b2aab18SMatthew Ahrens typedef struct dsl_dataset_set_qr_arg { 27653b2aab18SMatthew Ahrens const char *ddsqra_name; 27663b2aab18SMatthew Ahrens zprop_source_t ddsqra_source; 27673b2aab18SMatthew Ahrens uint64_t ddsqra_value; 27683b2aab18SMatthew Ahrens } dsl_dataset_set_qr_arg_t; 2769842727c2SChris Kirby 27703b2aab18SMatthew Ahrens 27713b2aab18SMatthew Ahrens /* ARGSUSED */ 2772842727c2SChris Kirby static int 27733b2aab18SMatthew Ahrens dsl_dataset_set_refquota_check(void *arg, dmu_tx_t *tx) 2774842727c2SChris Kirby { 27753b2aab18SMatthew Ahrens dsl_dataset_set_qr_arg_t *ddsqra = arg; 27763b2aab18SMatthew Ahrens dsl_pool_t *dp = dmu_tx_pool(tx); 27773b2aab18SMatthew Ahrens dsl_dataset_t *ds; 2778842727c2SChris Kirby int error; 27793b2aab18SMatthew Ahrens uint64_t newval; 2780842727c2SChris Kirby 27813b2aab18SMatthew Ahrens if (spa_version(dp->dp_spa) < SPA_VERSION_REFQUOTA) 2782be6fd75aSMatthew Ahrens return (SET_ERROR(ENOTSUP)); 2783842727c2SChris Kirby 27843b2aab18SMatthew Ahrens error = dsl_dataset_hold(dp, ddsqra->ddsqra_name, FTAG, &ds); 27853b2aab18SMatthew Ahrens if (error != 0) 27863b2aab18SMatthew Ahrens return (error); 27873b2aab18SMatthew Ahrens 27883b2aab18SMatthew Ahrens if (dsl_dataset_is_snapshot(ds)) { 27893b2aab18SMatthew Ahrens dsl_dataset_rele(ds, FTAG); 2790be6fd75aSMatthew Ahrens return (SET_ERROR(EINVAL)); 2791842727c2SChris Kirby } 2792842727c2SChris 
Kirby 27933b2aab18SMatthew Ahrens error = dsl_prop_predict(ds->ds_dir, 27943b2aab18SMatthew Ahrens zfs_prop_to_name(ZFS_PROP_REFQUOTA), 27953b2aab18SMatthew Ahrens ddsqra->ddsqra_source, ddsqra->ddsqra_value, &newval); 27963b2aab18SMatthew Ahrens if (error != 0) { 27973b2aab18SMatthew Ahrens dsl_dataset_rele(ds, FTAG); 2798842727c2SChris Kirby return (error); 2799842727c2SChris Kirby } 2800842727c2SChris Kirby 28013b2aab18SMatthew Ahrens if (newval == 0) { 28023b2aab18SMatthew Ahrens dsl_dataset_rele(ds, FTAG); 28033b2aab18SMatthew Ahrens return (0); 28043b2aab18SMatthew Ahrens } 2805842727c2SChris Kirby 28063b2aab18SMatthew Ahrens if (newval < ds->ds_phys->ds_referenced_bytes || 28073b2aab18SMatthew Ahrens newval < ds->ds_reserved) { 28083b2aab18SMatthew Ahrens dsl_dataset_rele(ds, FTAG); 2809be6fd75aSMatthew Ahrens return (SET_ERROR(ENOSPC)); 28103b2aab18SMatthew Ahrens } 28113b2aab18SMatthew Ahrens 28123b2aab18SMatthew Ahrens dsl_dataset_rele(ds, FTAG); 2813842727c2SChris Kirby return (0); 2814842727c2SChris Kirby } 2815842727c2SChris Kirby 28163b2aab18SMatthew Ahrens static void 28173b2aab18SMatthew Ahrens dsl_dataset_set_refquota_sync(void *arg, dmu_tx_t *tx) 2818842727c2SChris Kirby { 28193b2aab18SMatthew Ahrens dsl_dataset_set_qr_arg_t *ddsqra = arg; 28203b2aab18SMatthew Ahrens dsl_pool_t *dp = dmu_tx_pool(tx); 28213b2aab18SMatthew Ahrens dsl_dataset_t *ds; 28223b2aab18SMatthew Ahrens uint64_t newval; 2823842727c2SChris Kirby 28243b2aab18SMatthew Ahrens VERIFY0(dsl_dataset_hold(dp, ddsqra->ddsqra_name, FTAG, &ds)); 2825842727c2SChris Kirby 28263b2aab18SMatthew Ahrens dsl_prop_set_sync_impl(ds, 28273b2aab18SMatthew Ahrens zfs_prop_to_name(ZFS_PROP_REFQUOTA), 28283b2aab18SMatthew Ahrens ddsqra->ddsqra_source, sizeof (ddsqra->ddsqra_value), 1, 28293b2aab18SMatthew Ahrens &ddsqra->ddsqra_value, tx); 2830842727c2SChris Kirby 28313b2aab18SMatthew Ahrens VERIFY0(dsl_prop_get_int_ds(ds, 28323b2aab18SMatthew Ahrens zfs_prop_to_name(ZFS_PROP_REFQUOTA), &newval)); 
2833842727c2SChris Kirby 28343b2aab18SMatthew Ahrens if (ds->ds_quota != newval) { 28353b2aab18SMatthew Ahrens dmu_buf_will_dirty(ds->ds_dbuf, tx); 28363b2aab18SMatthew Ahrens ds->ds_quota = newval; 2837842727c2SChris Kirby } 28383b2aab18SMatthew Ahrens dsl_dataset_rele(ds, FTAG); 2839842727c2SChris Kirby } 2840842727c2SChris Kirby 28413b2aab18SMatthew Ahrens int 28423b2aab18SMatthew Ahrens dsl_dataset_set_refquota(const char *dsname, zprop_source_t source, 28433b2aab18SMatthew Ahrens uint64_t refquota) 2844842727c2SChris Kirby { 28453b2aab18SMatthew Ahrens dsl_dataset_set_qr_arg_t ddsqra; 2846842727c2SChris Kirby 28473b2aab18SMatthew Ahrens ddsqra.ddsqra_name = dsname; 28483b2aab18SMatthew Ahrens ddsqra.ddsqra_source = source; 28493b2aab18SMatthew Ahrens ddsqra.ddsqra_value = refquota; 28503b2aab18SMatthew Ahrens 28513b2aab18SMatthew Ahrens return (dsl_sync_task(dsname, dsl_dataset_set_refquota_check, 2852*7d46dc6cSMatthew Ahrens dsl_dataset_set_refquota_sync, &ddsqra, 0, ZFS_SPACE_CHECK_NONE)); 2853842727c2SChris Kirby } 2854842727c2SChris Kirby 2855842727c2SChris Kirby static int 28563b2aab18SMatthew Ahrens dsl_dataset_set_refreservation_check(void *arg, dmu_tx_t *tx) 2857842727c2SChris Kirby { 28583b2aab18SMatthew Ahrens dsl_dataset_set_qr_arg_t *ddsqra = arg; 28593b2aab18SMatthew Ahrens dsl_pool_t *dp = dmu_tx_pool(tx); 2860842727c2SChris Kirby dsl_dataset_t *ds; 2861842727c2SChris Kirby int error; 28623b2aab18SMatthew Ahrens uint64_t newval, unique; 2863d7747cbcSChris Kirby 28643b2aab18SMatthew Ahrens if (spa_version(dp->dp_spa) < SPA_VERSION_REFRESERVATION) 2865be6fd75aSMatthew Ahrens return (SET_ERROR(ENOTSUP)); 2866842727c2SChris Kirby 28673b2aab18SMatthew Ahrens error = dsl_dataset_hold(dp, ddsqra->ddsqra_name, FTAG, &ds); 28683b2aab18SMatthew Ahrens if (error != 0) 2869842727c2SChris Kirby return (error); 2870842727c2SChris Kirby 28713b2aab18SMatthew Ahrens if (dsl_dataset_is_snapshot(ds)) { 28723b2aab18SMatthew Ahrens dsl_dataset_rele(ds, FTAG); 
2873be6fd75aSMatthew Ahrens return (SET_ERROR(EINVAL)); 2874842727c2SChris Kirby } 2875842727c2SChris Kirby 28763b2aab18SMatthew Ahrens error = dsl_prop_predict(ds->ds_dir, 28773b2aab18SMatthew Ahrens zfs_prop_to_name(ZFS_PROP_REFRESERVATION), 28783b2aab18SMatthew Ahrens ddsqra->ddsqra_source, ddsqra->ddsqra_value, &newval); 28793b2aab18SMatthew Ahrens if (error != 0) { 28803b2aab18SMatthew Ahrens dsl_dataset_rele(ds, FTAG); 2881842727c2SChris Kirby return (error); 2882842727c2SChris Kirby } 2883842727c2SChris Kirby 28843b2aab18SMatthew Ahrens /* 28853b2aab18SMatthew Ahrens * If we are doing the preliminary check in open context, the 28863b2aab18SMatthew Ahrens * space estimates may be inaccurate. 28873b2aab18SMatthew Ahrens */ 28883b2aab18SMatthew Ahrens if (!dmu_tx_is_syncing(tx)) { 28893b2aab18SMatthew Ahrens dsl_dataset_rele(ds, FTAG); 28903b2aab18SMatthew Ahrens return (0); 2891842727c2SChris Kirby } 2892842727c2SChris Kirby 28933b2aab18SMatthew Ahrens mutex_enter(&ds->ds_lock); 28943b2aab18SMatthew Ahrens if (!DS_UNIQUE_IS_ACCURATE(ds)) 28953b2aab18SMatthew Ahrens dsl_dataset_recalc_head_uniq(ds); 28963b2aab18SMatthew Ahrens unique = ds->ds_phys->ds_unique_bytes; 28973b2aab18SMatthew Ahrens mutex_exit(&ds->ds_lock); 2898842727c2SChris Kirby 28993b2aab18SMatthew Ahrens if (MAX(unique, newval) > MAX(unique, ds->ds_reserved)) { 29003b2aab18SMatthew Ahrens uint64_t delta = MAX(unique, newval) - 29013b2aab18SMatthew Ahrens MAX(unique, ds->ds_reserved); 2902842727c2SChris Kirby 29033b2aab18SMatthew Ahrens if (delta > 29043b2aab18SMatthew Ahrens dsl_dir_space_available(ds->ds_dir, NULL, 0, B_TRUE) || 29053b2aab18SMatthew Ahrens (ds->ds_quota > 0 && newval > ds->ds_quota)) { 29063b2aab18SMatthew Ahrens dsl_dataset_rele(ds, FTAG); 2907be6fd75aSMatthew Ahrens return (SET_ERROR(ENOSPC)); 29083b2aab18SMatthew Ahrens } 2909842727c2SChris Kirby } 2910842727c2SChris Kirby 29113b2aab18SMatthew Ahrens dsl_dataset_rele(ds, FTAG); 29123b2aab18SMatthew Ahrens return (0); 
2913842727c2SChris Kirby } 2914842727c2SChris Kirby 29153b2aab18SMatthew Ahrens void 29163b2aab18SMatthew Ahrens dsl_dataset_set_refreservation_sync_impl(dsl_dataset_t *ds, 29173b2aab18SMatthew Ahrens zprop_source_t source, uint64_t value, dmu_tx_t *tx) 2918ca45db41SChris Kirby { 29193b2aab18SMatthew Ahrens uint64_t newval; 29203b2aab18SMatthew Ahrens uint64_t unique; 29213b2aab18SMatthew Ahrens int64_t delta; 2922ca45db41SChris Kirby 29233b2aab18SMatthew Ahrens dsl_prop_set_sync_impl(ds, zfs_prop_to_name(ZFS_PROP_REFRESERVATION), 29243b2aab18SMatthew Ahrens source, sizeof (value), 1, &value, tx); 2925ca45db41SChris Kirby 29263b2aab18SMatthew Ahrens VERIFY0(dsl_prop_get_int_ds(ds, 29273b2aab18SMatthew Ahrens zfs_prop_to_name(ZFS_PROP_REFRESERVATION), &newval)); 2928a7f53a56SChris Kirby 29293b2aab18SMatthew Ahrens dmu_buf_will_dirty(ds->ds_dbuf, tx); 29303b2aab18SMatthew Ahrens mutex_enter(&ds->ds_dir->dd_lock); 29313b2aab18SMatthew Ahrens mutex_enter(&ds->ds_lock); 29323b2aab18SMatthew Ahrens ASSERT(DS_UNIQUE_IS_ACCURATE(ds)); 29333b2aab18SMatthew Ahrens unique = ds->ds_phys->ds_unique_bytes; 29343b2aab18SMatthew Ahrens delta = MAX(0, (int64_t)(newval - unique)) - 29353b2aab18SMatthew Ahrens MAX(0, (int64_t)(ds->ds_reserved - unique)); 29363b2aab18SMatthew Ahrens ds->ds_reserved = newval; 29373b2aab18SMatthew Ahrens mutex_exit(&ds->ds_lock); 2938a7f53a56SChris Kirby 29393b2aab18SMatthew Ahrens dsl_dir_diduse_space(ds->ds_dir, DD_USED_REFRSRV, delta, 0, 0, tx); 29403b2aab18SMatthew Ahrens mutex_exit(&ds->ds_dir->dd_lock); 2941ca45db41SChris Kirby } 2942ca45db41SChris Kirby 29433b2aab18SMatthew Ahrens static void 29443b2aab18SMatthew Ahrens dsl_dataset_set_refreservation_sync(void *arg, dmu_tx_t *tx) 2945842727c2SChris Kirby { 29463b2aab18SMatthew Ahrens dsl_dataset_set_qr_arg_t *ddsqra = arg; 29473b2aab18SMatthew Ahrens dsl_pool_t *dp = dmu_tx_pool(tx); 2948842727c2SChris Kirby dsl_dataset_t *ds; 2949842727c2SChris Kirby 29503b2aab18SMatthew Ahrens 
VERIFY0(dsl_dataset_hold(dp, ddsqra->ddsqra_name, FTAG, &ds)); 29513b2aab18SMatthew Ahrens dsl_dataset_set_refreservation_sync_impl(ds, 29523b2aab18SMatthew Ahrens ddsqra->ddsqra_source, ddsqra->ddsqra_value, tx); 2953842727c2SChris Kirby dsl_dataset_rele(ds, FTAG); 2954842727c2SChris Kirby } 2955503ad85cSMatthew Ahrens 2956503ad85cSMatthew Ahrens int 29573b2aab18SMatthew Ahrens dsl_dataset_set_refreservation(const char *dsname, zprop_source_t source, 29583b2aab18SMatthew Ahrens uint64_t refreservation) 2959503ad85cSMatthew Ahrens { 29603b2aab18SMatthew Ahrens dsl_dataset_set_qr_arg_t ddsqra; 2961503ad85cSMatthew Ahrens 29623b2aab18SMatthew Ahrens ddsqra.ddsqra_name = dsname; 29633b2aab18SMatthew Ahrens ddsqra.ddsqra_source = source; 29643b2aab18SMatthew Ahrens ddsqra.ddsqra_value = refreservation; 29653b2aab18SMatthew Ahrens 29663b2aab18SMatthew Ahrens return (dsl_sync_task(dsname, dsl_dataset_set_refreservation_check, 2967*7d46dc6cSMatthew Ahrens dsl_dataset_set_refreservation_sync, &ddsqra, 2968*7d46dc6cSMatthew Ahrens 0, ZFS_SPACE_CHECK_NONE)); 2969503ad85cSMatthew Ahrens } 297019b94df9SMatthew Ahrens 297119b94df9SMatthew Ahrens /* 297219b94df9SMatthew Ahrens * Return (in *usedp) the amount of space written in new that is not 297319b94df9SMatthew Ahrens * present in oldsnap. New may be a snapshot or the head. Old must be 297419b94df9SMatthew Ahrens * a snapshot before new, in new's filesystem (or its origin). If not then 297519b94df9SMatthew Ahrens * fail and return EINVAL. 297619b94df9SMatthew Ahrens * 297719b94df9SMatthew Ahrens * The written space is calculated by considering two components: First, we 297819b94df9SMatthew Ahrens * ignore any freed space, and calculate the written as new's used space 297919b94df9SMatthew Ahrens * minus old's used space. Next, we add in the amount of space that was freed 298019b94df9SMatthew Ahrens * between the two snapshots, thus reducing new's used space relative to old's. 
298119b94df9SMatthew Ahrens * Specifically, this is the space that was born before old->ds_creation_txg, 298219b94df9SMatthew Ahrens * and freed before new (ie. on new's deadlist or a previous deadlist). 298319b94df9SMatthew Ahrens * 298419b94df9SMatthew Ahrens * space freed [---------------------] 298519b94df9SMatthew Ahrens * snapshots ---O-------O--------O-------O------ 298619b94df9SMatthew Ahrens * oldsnap new 298719b94df9SMatthew Ahrens */ 298819b94df9SMatthew Ahrens int 298919b94df9SMatthew Ahrens dsl_dataset_space_written(dsl_dataset_t *oldsnap, dsl_dataset_t *new, 299019b94df9SMatthew Ahrens uint64_t *usedp, uint64_t *compp, uint64_t *uncompp) 299119b94df9SMatthew Ahrens { 299219b94df9SMatthew Ahrens int err = 0; 299319b94df9SMatthew Ahrens uint64_t snapobj; 299419b94df9SMatthew Ahrens dsl_pool_t *dp = new->ds_dir->dd_pool; 299519b94df9SMatthew Ahrens 29963b2aab18SMatthew Ahrens ASSERT(dsl_pool_config_held(dp)); 29973b2aab18SMatthew Ahrens 299819b94df9SMatthew Ahrens *usedp = 0; 2999ad135b5dSChristopher Siden *usedp += new->ds_phys->ds_referenced_bytes; 3000ad135b5dSChristopher Siden *usedp -= oldsnap->ds_phys->ds_referenced_bytes; 300119b94df9SMatthew Ahrens 300219b94df9SMatthew Ahrens *compp = 0; 300319b94df9SMatthew Ahrens *compp += new->ds_phys->ds_compressed_bytes; 300419b94df9SMatthew Ahrens *compp -= oldsnap->ds_phys->ds_compressed_bytes; 300519b94df9SMatthew Ahrens 300619b94df9SMatthew Ahrens *uncompp = 0; 300719b94df9SMatthew Ahrens *uncompp += new->ds_phys->ds_uncompressed_bytes; 300819b94df9SMatthew Ahrens *uncompp -= oldsnap->ds_phys->ds_uncompressed_bytes; 300919b94df9SMatthew Ahrens 301019b94df9SMatthew Ahrens snapobj = new->ds_object; 301119b94df9SMatthew Ahrens while (snapobj != oldsnap->ds_object) { 301219b94df9SMatthew Ahrens dsl_dataset_t *snap; 301319b94df9SMatthew Ahrens uint64_t used, comp, uncomp; 301419b94df9SMatthew Ahrens 3015ad135b5dSChristopher Siden if (snapobj == new->ds_object) { 3016ad135b5dSChristopher Siden snap = new; 
3017ad135b5dSChristopher Siden } else { 3018ad135b5dSChristopher Siden err = dsl_dataset_hold_obj(dp, snapobj, FTAG, &snap); 3019ad135b5dSChristopher Siden if (err != 0) 3020ad135b5dSChristopher Siden break; 3021ad135b5dSChristopher Siden } 302219b94df9SMatthew Ahrens 302319b94df9SMatthew Ahrens if (snap->ds_phys->ds_prev_snap_txg == 302419b94df9SMatthew Ahrens oldsnap->ds_phys->ds_creation_txg) { 302519b94df9SMatthew Ahrens /* 302619b94df9SMatthew Ahrens * The blocks in the deadlist can not be born after 302719b94df9SMatthew Ahrens * ds_prev_snap_txg, so get the whole deadlist space, 302819b94df9SMatthew Ahrens * which is more efficient (especially for old-format 302919b94df9SMatthew Ahrens * deadlists). Unfortunately the deadlist code 303019b94df9SMatthew Ahrens * doesn't have enough information to make this 303119b94df9SMatthew Ahrens * optimization itself. 303219b94df9SMatthew Ahrens */ 303319b94df9SMatthew Ahrens dsl_deadlist_space(&snap->ds_deadlist, 303419b94df9SMatthew Ahrens &used, &comp, &uncomp); 303519b94df9SMatthew Ahrens } else { 303619b94df9SMatthew Ahrens dsl_deadlist_space_range(&snap->ds_deadlist, 303719b94df9SMatthew Ahrens 0, oldsnap->ds_phys->ds_creation_txg, 303819b94df9SMatthew Ahrens &used, &comp, &uncomp); 303919b94df9SMatthew Ahrens } 304019b94df9SMatthew Ahrens *usedp += used; 304119b94df9SMatthew Ahrens *compp += comp; 304219b94df9SMatthew Ahrens *uncompp += uncomp; 304319b94df9SMatthew Ahrens 304419b94df9SMatthew Ahrens /* 304519b94df9SMatthew Ahrens * If we get to the beginning of the chain of snapshots 304619b94df9SMatthew Ahrens * (ds_prev_snap_obj == 0) before oldsnap, then oldsnap 304719b94df9SMatthew Ahrens * was not a snapshot of/before new. 
304819b94df9SMatthew Ahrens */ 304919b94df9SMatthew Ahrens snapobj = snap->ds_phys->ds_prev_snap_obj; 3050ad135b5dSChristopher Siden if (snap != new) 3051ad135b5dSChristopher Siden dsl_dataset_rele(snap, FTAG); 305219b94df9SMatthew Ahrens if (snapobj == 0) { 3053be6fd75aSMatthew Ahrens err = SET_ERROR(EINVAL); 305419b94df9SMatthew Ahrens break; 305519b94df9SMatthew Ahrens } 305619b94df9SMatthew Ahrens 305719b94df9SMatthew Ahrens } 305819b94df9SMatthew Ahrens return (err); 305919b94df9SMatthew Ahrens } 306019b94df9SMatthew Ahrens 306119b94df9SMatthew Ahrens /* 306219b94df9SMatthew Ahrens * Return (in *usedp) the amount of space that will be reclaimed if firstsnap, 306319b94df9SMatthew Ahrens * lastsnap, and all snapshots in between are deleted. 306419b94df9SMatthew Ahrens * 306519b94df9SMatthew Ahrens * blocks that would be freed [---------------------------] 306619b94df9SMatthew Ahrens * snapshots ---O-------O--------O-------O--------O 306719b94df9SMatthew Ahrens * firstsnap lastsnap 306819b94df9SMatthew Ahrens * 306919b94df9SMatthew Ahrens * This is the set of blocks that were born after the snap before firstsnap, 307019b94df9SMatthew Ahrens * (birth > firstsnap->prev_snap_txg) and died before the snap after the 307119b94df9SMatthew Ahrens * last snap (ie, is on lastsnap->ds_next->ds_deadlist or an earlier deadlist). 307219b94df9SMatthew Ahrens * We calculate this by iterating over the relevant deadlists (from the snap 307319b94df9SMatthew Ahrens * after lastsnap, backward to the snap after firstsnap), summing up the 307419b94df9SMatthew Ahrens * space on the deadlist that was born after the snap before firstsnap. 
307519b94df9SMatthew Ahrens */ 307619b94df9SMatthew Ahrens int 307719b94df9SMatthew Ahrens dsl_dataset_space_wouldfree(dsl_dataset_t *firstsnap, 307819b94df9SMatthew Ahrens dsl_dataset_t *lastsnap, 307919b94df9SMatthew Ahrens uint64_t *usedp, uint64_t *compp, uint64_t *uncompp) 308019b94df9SMatthew Ahrens { 308119b94df9SMatthew Ahrens int err = 0; 308219b94df9SMatthew Ahrens uint64_t snapobj; 308319b94df9SMatthew Ahrens dsl_pool_t *dp = firstsnap->ds_dir->dd_pool; 308419b94df9SMatthew Ahrens 308519b94df9SMatthew Ahrens ASSERT(dsl_dataset_is_snapshot(firstsnap)); 308619b94df9SMatthew Ahrens ASSERT(dsl_dataset_is_snapshot(lastsnap)); 308719b94df9SMatthew Ahrens 308819b94df9SMatthew Ahrens /* 308919b94df9SMatthew Ahrens * Check that the snapshots are in the same dsl_dir, and firstsnap 309019b94df9SMatthew Ahrens * is before lastsnap. 309119b94df9SMatthew Ahrens */ 309219b94df9SMatthew Ahrens if (firstsnap->ds_dir != lastsnap->ds_dir || 309319b94df9SMatthew Ahrens firstsnap->ds_phys->ds_creation_txg > 309419b94df9SMatthew Ahrens lastsnap->ds_phys->ds_creation_txg) 3095be6fd75aSMatthew Ahrens return (SET_ERROR(EINVAL)); 309619b94df9SMatthew Ahrens 309719b94df9SMatthew Ahrens *usedp = *compp = *uncompp = 0; 309819b94df9SMatthew Ahrens 309919b94df9SMatthew Ahrens snapobj = lastsnap->ds_phys->ds_next_snap_obj; 310019b94df9SMatthew Ahrens while (snapobj != firstsnap->ds_object) { 310119b94df9SMatthew Ahrens dsl_dataset_t *ds; 310219b94df9SMatthew Ahrens uint64_t used, comp, uncomp; 310319b94df9SMatthew Ahrens 310419b94df9SMatthew Ahrens err = dsl_dataset_hold_obj(dp, snapobj, FTAG, &ds); 310519b94df9SMatthew Ahrens if (err != 0) 310619b94df9SMatthew Ahrens break; 310719b94df9SMatthew Ahrens 310819b94df9SMatthew Ahrens dsl_deadlist_space_range(&ds->ds_deadlist, 310919b94df9SMatthew Ahrens firstsnap->ds_phys->ds_prev_snap_txg, UINT64_MAX, 311019b94df9SMatthew Ahrens &used, &comp, &uncomp); 311119b94df9SMatthew Ahrens *usedp += used; 311219b94df9SMatthew Ahrens *compp += comp; 
311319b94df9SMatthew Ahrens *uncompp += uncomp; 311419b94df9SMatthew Ahrens 311519b94df9SMatthew Ahrens snapobj = ds->ds_phys->ds_prev_snap_obj; 311619b94df9SMatthew Ahrens ASSERT3U(snapobj, !=, 0); 311719b94df9SMatthew Ahrens dsl_dataset_rele(ds, FTAG); 311819b94df9SMatthew Ahrens } 311919b94df9SMatthew Ahrens return (err); 312019b94df9SMatthew Ahrens } 31213b2aab18SMatthew Ahrens 31223b2aab18SMatthew Ahrens /* 31233b2aab18SMatthew Ahrens * Return TRUE if 'earlier' is an earlier snapshot in 'later's timeline. 31243b2aab18SMatthew Ahrens * For example, they could both be snapshots of the same filesystem, and 31253b2aab18SMatthew Ahrens * 'earlier' is before 'later'. Or 'earlier' could be the origin of 31263b2aab18SMatthew Ahrens * 'later's filesystem. Or 'earlier' could be an older snapshot in the origin's 31273b2aab18SMatthew Ahrens * filesystem. Or 'earlier' could be the origin's origin. 312878f17100SMatthew Ahrens * 312978f17100SMatthew Ahrens * If non-zero, earlier_txg is used instead of earlier's ds_creation_txg. 
31303b2aab18SMatthew Ahrens */ 31313b2aab18SMatthew Ahrens boolean_t 313278f17100SMatthew Ahrens dsl_dataset_is_before(dsl_dataset_t *later, dsl_dataset_t *earlier, 313378f17100SMatthew Ahrens uint64_t earlier_txg) 31343b2aab18SMatthew Ahrens { 31353b2aab18SMatthew Ahrens dsl_pool_t *dp = later->ds_dir->dd_pool; 31363b2aab18SMatthew Ahrens int error; 31373b2aab18SMatthew Ahrens boolean_t ret; 31383b2aab18SMatthew Ahrens 31393b2aab18SMatthew Ahrens ASSERT(dsl_pool_config_held(dp)); 314078f17100SMatthew Ahrens ASSERT(dsl_dataset_is_snapshot(earlier) || earlier_txg != 0); 314178f17100SMatthew Ahrens 314278f17100SMatthew Ahrens if (earlier_txg == 0) 314378f17100SMatthew Ahrens earlier_txg = earlier->ds_phys->ds_creation_txg; 31443b2aab18SMatthew Ahrens 314578f17100SMatthew Ahrens if (dsl_dataset_is_snapshot(later) && 314678f17100SMatthew Ahrens earlier_txg >= later->ds_phys->ds_creation_txg) 31473b2aab18SMatthew Ahrens return (B_FALSE); 31483b2aab18SMatthew Ahrens 31493b2aab18SMatthew Ahrens if (later->ds_dir == earlier->ds_dir) 31503b2aab18SMatthew Ahrens return (B_TRUE); 31513b2aab18SMatthew Ahrens if (!dsl_dir_is_clone(later->ds_dir)) 31523b2aab18SMatthew Ahrens return (B_FALSE); 31533b2aab18SMatthew Ahrens 31543b2aab18SMatthew Ahrens if (later->ds_dir->dd_phys->dd_origin_obj == earlier->ds_object) 31553b2aab18SMatthew Ahrens return (B_TRUE); 31563b2aab18SMatthew Ahrens dsl_dataset_t *origin; 31573b2aab18SMatthew Ahrens error = dsl_dataset_hold_obj(dp, 31583b2aab18SMatthew Ahrens later->ds_dir->dd_phys->dd_origin_obj, FTAG, &origin); 31593b2aab18SMatthew Ahrens if (error != 0) 31603b2aab18SMatthew Ahrens return (B_FALSE); 316178f17100SMatthew Ahrens ret = dsl_dataset_is_before(origin, earlier, earlier_txg); 31623b2aab18SMatthew Ahrens dsl_dataset_rele(origin, FTAG); 31633b2aab18SMatthew Ahrens return (ret); 31643b2aab18SMatthew Ahrens } 31652acef22dSMatthew Ahrens 31662acef22dSMatthew Ahrens 31672acef22dSMatthew Ahrens void 31682acef22dSMatthew Ahrens 
dsl_dataset_zapify(dsl_dataset_t *ds, dmu_tx_t *tx) 31692acef22dSMatthew Ahrens { 31702acef22dSMatthew Ahrens objset_t *mos = ds->ds_dir->dd_pool->dp_meta_objset; 31712acef22dSMatthew Ahrens dmu_object_zapify(mos, ds->ds_object, DMU_OT_DSL_DATASET, tx); 31722acef22dSMatthew Ahrens } 3173