spa.c revision 98d1cbfec254295273b6a761bc1861c0374bdf02
1fa9e406ahrens/*
2fa9e406ahrens * CDDL HEADER START
3fa9e406ahrens *
4fa9e406ahrens * The contents of this file are subject to the terms of the
5ea8dc4beschrock * Common Development and Distribution License (the "License").
6ea8dc4beschrock * You may not use this file except in compliance with the License.
7fa9e406ahrens *
8fa9e406ahrens * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
9fa9e406ahrens * or http://www.opensolaris.org/os/licensing.
10fa9e406ahrens * See the License for the specific language governing permissions
11fa9e406ahrens * and limitations under the License.
12fa9e406ahrens *
13fa9e406ahrens * When distributing Covered Code, include this CDDL HEADER in each
14fa9e406ahrens * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
15fa9e406ahrens * If applicable, add the following below this CDDL HEADER, with the
16fa9e406ahrens * fields enclosed by brackets "[]" replaced with your own identifying
17fa9e406ahrens * information: Portions Copyright [yyyy] [name of copyright owner]
18fa9e406ahrens *
19fa9e406ahrens * CDDL HEADER END
20fa9e406ahrens */
2199653d4eschrock
22fa9e406ahrens/*
2398d1cbfGeorge Wilson * Copyright (c) 2005, 2010, Oracle and/or its affiliates. All rights reserved.
24fa9e406ahrens */
25fa9e406ahrens
26fa9e406ahrens/*
27fa9e406ahrens * This file contains all the routines used when modifying on-disk SPA state.
28fa9e406ahrens * This includes opening, importing, destroying, exporting a pool, and syncing a
29fa9e406ahrens * pool.
30fa9e406ahrens */
31fa9e406ahrens
32fa9e406ahrens#include <sys/zfs_context.h>
33ea8dc4beschrock#include <sys/fm/fs/zfs.h>
34fa9e406ahrens#include <sys/spa_impl.h>
35fa9e406ahrens#include <sys/zio.h>
36fa9e406ahrens#include <sys/zio_checksum.h>
37fa9e406ahrens#include <sys/dmu.h>
38fa9e406ahrens#include <sys/dmu_tx.h>
39fa9e406ahrens#include <sys/zap.h>
40fa9e406ahrens#include <sys/zil.h>
41b24ab67Jeff Bonwick#include <sys/ddt.h>
42fa9e406ahrens#include <sys/vdev_impl.h>
43fa9e406ahrens#include <sys/metaslab.h>
4488ecc94George Wilson#include <sys/metaslab_impl.h>
45fa9e406ahrens#include <sys/uberblock_impl.h>
46fa9e406ahrens#include <sys/txg.h>
47fa9e406ahrens#include <sys/avl.h>
48fa9e406ahrens#include <sys/dmu_traverse.h>
49b1b8ab3lling#include <sys/dmu_objset.h>
50fa9e406ahrens#include <sys/unique.h>
51fa9e406ahrens#include <sys/dsl_pool.h>
52b1b8ab3lling#include <sys/dsl_dataset.h>
53fa9e406ahrens#include <sys/dsl_dir.h>
54fa9e406ahrens#include <sys/dsl_prop.h>
55b1b8ab3lling#include <sys/dsl_synctask.h>
56fa9e406ahrens#include <sys/fs/zfs.h>
57fa94a07brendan#include <sys/arc.h>
58fa9e406ahrens#include <sys/callb.h>
599517395ek#include <sys/systeminfo.h>
60e7cbe64gw#include <sys/spa_boot.h>
61573ca77George Wilson#include <sys/zfs_ioctl.h>
62fa9e406ahrens
635679c89jv#ifdef	_KERNEL
64dedec47Jack Meng#include <sys/bootprops.h>
6535a5a35Jonathan Adams#include <sys/callb.h>
6635a5a35Jonathan Adams#include <sys/cpupart.h>
6735a5a35Jonathan Adams#include <sys/pool.h>
6835a5a35Jonathan Adams#include <sys/sysdc.h>
6935a5a35Jonathan Adams#include <sys/zone.h>
705679c89jv#endif	/* _KERNEL */
715679c89jv
72990b485lling#include "zfs_prop.h"
73b7b9745perrin#include "zfs_comutil.h"
74990b485lling
7535a5a35Jonathan Adamstypedef enum zti_modes {
762e0c549Jonathan Adams	zti_mode_fixed,			/* value is # of threads (min 1) */
772e0c549Jonathan Adams	zti_mode_online_percent,	/* value is % of online CPUs */
7835a5a35Jonathan Adams	zti_mode_batch,			/* cpu-intensive; value is ignored */
7980eb36fGeorge Wilson	zti_mode_null,			/* don't create a taskq */
802e0c549Jonathan Adams	zti_nmodes
8135a5a35Jonathan Adams} zti_modes_t;
82416e0cdek
8380eb36fGeorge Wilson#define	ZTI_FIX(n)	{ zti_mode_fixed, (n) }
8480eb36fGeorge Wilson#define	ZTI_PCT(n)	{ zti_mode_online_percent, (n) }
8535a5a35Jonathan Adams#define	ZTI_BATCH	{ zti_mode_batch, 0 }
8680eb36fGeorge Wilson#define	ZTI_NULL	{ zti_mode_null, 0 }
872e0c549Jonathan Adams
8880eb36fGeorge Wilson#define	ZTI_ONE		ZTI_FIX(1)
892e0c549Jonathan Adams
902e0c549Jonathan Adamstypedef struct zio_taskq_info {
9180eb36fGeorge Wilson	enum zti_modes zti_mode;
9280eb36fGeorge Wilson	uint_t zti_value;
932e0c549Jonathan Adams} zio_taskq_info_t;
942e0c549Jonathan Adams
952e0c549Jonathan Adamsstatic const char *const zio_taskq_types[ZIO_TASKQ_TYPES] = {
9635a5a35Jonathan Adams	"issue", "issue_high", "intr", "intr_high"
972e0c549Jonathan Adams};
982e0c549Jonathan Adams
9980eb36fGeorge Wilson/*
10080eb36fGeorge Wilson * Define the taskq threads for the following I/O types:
10180eb36fGeorge Wilson * 	NULL, READ, WRITE, FREE, CLAIM, and IOCTL
10280eb36fGeorge Wilson */
10380eb36fGeorge Wilsonconst zio_taskq_info_t zio_taskqs[ZIO_TYPES][ZIO_TASKQ_TYPES] = {
10480eb36fGeorge Wilson	/* ISSUE	ISSUE_HIGH	INTR		INTR_HIGH */
10580eb36fGeorge Wilson	{ ZTI_ONE,	ZTI_NULL,	ZTI_ONE,	ZTI_NULL },
10635a5a35Jonathan Adams	{ ZTI_FIX(8),	ZTI_NULL,	ZTI_BATCH,	ZTI_NULL },
10735a5a35Jonathan Adams	{ ZTI_BATCH,	ZTI_FIX(5),	ZTI_FIX(8),	ZTI_FIX(5) },
108c6065d0George Wilson	{ ZTI_FIX(10),	ZTI_NULL,	ZTI_FIX(10),	ZTI_NULL },
10980eb36fGeorge Wilson	{ ZTI_ONE,	ZTI_NULL,	ZTI_ONE,	ZTI_NULL },
11080eb36fGeorge Wilson	{ ZTI_ONE,	ZTI_NULL,	ZTI_ONE,	ZTI_NULL },
1112e0c549Jonathan Adams};
1122e0c549Jonathan Adams
113990b485llingstatic void spa_sync_props(void *arg1, void *arg2, cred_t *cr, dmu_tx_t *tx);
11489a89ebllingstatic boolean_t spa_has_active_shared_spare(spa_t *spa);
1151195e68Mark J Musantestatic int spa_load_impl(spa_t *spa, uint64_t, nvlist_t *config,
1161195e68Mark J Musante    spa_load_state_t state, spa_import_type_t type, boolean_t mosconfig,
1171195e68Mark J Musante    char **ereport);
118990b485lling
11935a5a35Jonathan Adamsuint_t		zio_taskq_batch_pct = 100;	/* 1 thread per cpu in pset */
12035a5a35Jonathan Adamsid_t		zio_taskq_psrset_bind = PS_NONE;
12135a5a35Jonathan Adamsboolean_t	zio_taskq_sysdc = B_TRUE;	/* use SDC scheduling class */
12235a5a35Jonathan Adamsuint_t		zio_taskq_basedc = 80;		/* base duty cycle */
12335a5a35Jonathan Adams
12435a5a35Jonathan Adamsboolean_t	spa_create_process = B_TRUE;	/* no process ==> no sysdc */
12535a5a35Jonathan Adams
12635a5a35Jonathan Adams/*
12735a5a35Jonathan Adams * This (illegal) pool name is used when temporarily importing a spa_t in order
12835a5a35Jonathan Adams * to get the vdev stats associated with the imported devices.
12935a5a35Jonathan Adams */
13035a5a35Jonathan Adams#define	TRYIMPORT_NAME	"$import"
13135a5a35Jonathan Adams
132990b485lling/*
133990b485lling * ==========================================================================
134990b485lling * SPA properties routines
135990b485lling * ==========================================================================
136990b485lling */
137990b485lling
138990b485lling/*
139990b485lling * Add a (source=src, propname=propval) list to an nvlist.
140990b485lling */
1419d82f4fllingstatic void
142990b485llingspa_prop_add_list(nvlist_t *nvl, zpool_prop_t prop, char *strval,
143990b485lling    uint64_t intval, zprop_source_t src)
144990b485lling{
145990b485lling	const char *propname = zpool_prop_to_name(prop);
146990b485lling	nvlist_t *propval;
147990b485lling
1489d82f4flling	VERIFY(nvlist_alloc(&propval, NV_UNIQUE_NAME, KM_SLEEP) == 0);
1499d82f4flling	VERIFY(nvlist_add_uint64(propval, ZPROP_SOURCE, src) == 0);
150990b485lling
1519d82f4flling	if (strval != NULL)
1529d82f4flling		VERIFY(nvlist_add_string(propval, ZPROP_VALUE, strval) == 0);
1539d82f4flling	else
1549d82f4flling		VERIFY(nvlist_add_uint64(propval, ZPROP_VALUE, intval) == 0);
155990b485lling
1569d82f4flling	VERIFY(nvlist_add_nvlist(nvl, propname, propval) == 0);
157990b485lling	nvlist_free(propval);
158990b485lling}
159990b485lling
160990b485lling/*
161990b485lling * Get property values from the spa configuration.
162990b485lling */
1639d82f4fllingstatic void
164990b485llingspa_prop_get_config(spa_t *spa, nvlist_t **nvp)
165990b485lling{
166379c004Eric Schrock	uint64_t size;
167485bbbfGeorge Wilson	uint64_t alloc;
168990b485lling	uint64_t cap, version;
169990b485lling	zprop_source_t src = ZPROP_SRC_NONE;
170c5904d1eschrock	spa_config_dirent_t *dp;
171990b485lling
172e14bb32Jeff Bonwick	ASSERT(MUTEX_HELD(&spa->spa_props_lock));
173e14bb32Jeff Bonwick
174379c004Eric Schrock	if (spa->spa_root_vdev != NULL) {
175485bbbfGeorge Wilson		alloc = metaslab_class_get_alloc(spa_normal_class(spa));
176b24ab67Jeff Bonwick		size = metaslab_class_get_space(spa_normal_class(spa));
177379c004Eric Schrock		spa_prop_add_list(*nvp, ZPOOL_PROP_NAME, spa_name(spa), 0, src);
178379c004Eric Schrock		spa_prop_add_list(*nvp, ZPOOL_PROP_SIZE, NULL, size, src);
179485bbbfGeorge Wilson		spa_prop_add_list(*nvp, ZPOOL_PROP_ALLOCATED, NULL, alloc, src);
180485bbbfGeorge Wilson		spa_prop_add_list(*nvp, ZPOOL_PROP_FREE, NULL,
181485bbbfGeorge Wilson		    size - alloc, src);
182379c004Eric Schrock
183485bbbfGeorge Wilson		cap = (size == 0) ? 0 : (alloc * 100 / size);
184379c004Eric Schrock		spa_prop_add_list(*nvp, ZPOOL_PROP_CAPACITY, NULL, cap, src);
185379c004Eric Schrock
186b24ab67Jeff Bonwick		spa_prop_add_list(*nvp, ZPOOL_PROP_DEDUPRATIO, NULL,
187b24ab67Jeff Bonwick		    ddt_get_pool_dedup_ratio(spa), src);
188b24ab67Jeff Bonwick
189379c004Eric Schrock		spa_prop_add_list(*nvp, ZPOOL_PROP_HEALTH, NULL,
190379c004Eric Schrock		    spa->spa_root_vdev->vdev_state, src);
191379c004Eric Schrock
192379c004Eric Schrock		version = spa_version(spa);
193379c004Eric Schrock		if (version == zpool_prop_default_numeric(ZPOOL_PROP_VERSION))
194379c004Eric Schrock			src = ZPROP_SRC_DEFAULT;
195379c004Eric Schrock		else
196379c004Eric Schrock			src = ZPROP_SRC_LOCAL;
197379c004Eric Schrock		spa_prop_add_list(*nvp, ZPOOL_PROP_VERSION, NULL, version, src);
198379c004Eric Schrock	}
199990b485lling
2009d82f4flling	spa_prop_add_list(*nvp, ZPOOL_PROP_GUID, NULL, spa_guid(spa), src);
201990b485lling
2029d82f4flling	if (spa->spa_root != NULL)
2039d82f4flling		spa_prop_add_list(*nvp, ZPOOL_PROP_ALTROOT, spa->spa_root,
2049d82f4flling		    0, ZPROP_SRC_LOCAL);
205990b485lling
206c5904d1eschrock	if ((dp = list_head(&spa->spa_config_list)) != NULL) {
207c5904d1eschrock		if (dp->scd_path == NULL) {
2089d82f4flling			spa_prop_add_list(*nvp, ZPOOL_PROP_CACHEFILE,
209c5904d1eschrock			    "none", 0, ZPROP_SRC_LOCAL);
210c5904d1eschrock		} else if (strcmp(dp->scd_path, spa_config_path) != 0) {
2119d82f4flling			spa_prop_add_list(*nvp, ZPOOL_PROP_CACHEFILE,
212c5904d1eschrock			    dp->scd_path, 0, ZPROP_SRC_LOCAL);
2132f8aaabeschrock		}
2142f8aaabeschrock	}
215990b485lling}
216990b485lling
217990b485lling/*
218990b485lling * Get zpool property values.
219990b485lling */
220990b485llingint
221990b485llingspa_prop_get(spa_t *spa, nvlist_t **nvp)
222990b485lling{
223b24ab67Jeff Bonwick	objset_t *mos = spa->spa_meta_objset;
224990b485lling	zap_cursor_t zc;
225990b485lling	zap_attribute_t za;
226990b485lling	int err;
227990b485lling
2289d82f4flling	VERIFY(nvlist_alloc(nvp, NV_UNIQUE_NAME, KM_SLEEP) == 0);
229990b485lling
230e14bb32Jeff Bonwick	mutex_enter(&spa->spa_props_lock);
231e14bb32Jeff Bonwick
232990b485lling	/*
233990b485lling	 * Get properties from the spa config.
234990b485lling	 */
2359d82f4flling	spa_prop_get_config(spa, nvp);
236990b485lling
237990b485lling	/* If no pool property object, no more prop to get. */
238afee20eGeorge Wilson	if (mos == NULL || spa->spa_pool_props_object == 0) {
239990b485lling		mutex_exit(&spa->spa_props_lock);
240990b485lling		return (0);
241990b485lling	}
242990b485lling
243990b485lling	/*
244990b485lling	 * Get properties from the MOS pool property object.
245990b485lling	 */
246990b485lling	for (zap_cursor_init(&zc, mos, spa->spa_pool_props_object);
247990b485lling	    (err = zap_cursor_retrieve(&zc, &za)) == 0;
248990b485lling	    zap_cursor_advance(&zc)) {
249990b485lling		uint64_t intval = 0;
250990b485lling		char *strval = NULL;
251990b485lling		zprop_source_t src = ZPROP_SRC_DEFAULT;
252990b485lling		zpool_prop_t prop;
253990b485lling
254990b485lling		if ((prop = zpool_name_to_prop(za.za_name)) == ZPROP_INVAL)
255990b485lling			continue;
256990b485lling
257990b485lling		switch (za.za_integer_length) {
258990b485lling		case 8:
259990b485lling			/* integer property */
260990b485lling			if (za.za_first_integer !=
261990b485lling			    zpool_prop_default_numeric(prop))
262990b485lling				src = ZPROP_SRC_LOCAL;
263990b485lling
264990b485lling			if (prop == ZPOOL_PROP_BOOTFS) {
265990b485lling				dsl_pool_t *dp;
266990b485lling				dsl_dataset_t *ds = NULL;
267990b485lling
268990b485lling				dp = spa_get_dsl(spa);
269990b485lling				rw_enter(&dp->dp_config_rwlock, RW_READER);
270745cd3cmaybee				if (err = dsl_dataset_hold_obj(dp,
271745cd3cmaybee				    za.za_first_integer, FTAG, &ds)) {
272990b485lling					rw_exit(&dp->dp_config_rwlock);
273990b485lling					break;
274990b485lling				}
275990b485lling
276990b485lling				strval = kmem_alloc(
277990b485lling				    MAXNAMELEN + strlen(MOS_DIR_NAME) + 1,
278990b485lling				    KM_SLEEP);
279990b485lling				dsl_dataset_name(ds, strval);
280745cd3cmaybee				dsl_dataset_rele(ds, FTAG);
281990b485lling				rw_exit(&dp->dp_config_rwlock);
282990b485lling			} else {
283990b485lling				strval = NULL;
284990b485lling				intval = za.za_first_integer;
285990b485lling			}
286990b485lling
2879d82f4flling			spa_prop_add_list(*nvp, prop, strval, intval, src);
288990b485lling
289990b485lling			if (strval != NULL)
290990b485lling				kmem_free(strval,
291990b485lling				    MAXNAMELEN + strlen(MOS_DIR_NAME) + 1);
292990b485lling
293990b485lling			break;
294990b485lling
295990b485lling		case 1:
296990b485lling			/* string property */
297990b485lling			strval = kmem_alloc(za.za_num_integers, KM_SLEEP);
298990b485lling			err = zap_lookup(mos, spa->spa_pool_props_object,
299990b485lling			    za.za_name, 1, za.za_num_integers, strval);
300990b485lling			if (err) {
301990b485lling				kmem_free(strval, za.za_num_integers);
302990b485lling				break;
303990b485lling			}
3049d82f4flling			spa_prop_add_list(*nvp, prop, strval, 0, src);
305990b485lling			kmem_free(strval, za.za_num_integers);
306990b485lling			break;
307990b485lling
308990b485lling		default:
309990b485lling			break;
310990b485lling		}
311990b485lling	}
312990b485lling	zap_cursor_fini(&zc);
313990b485lling	mutex_exit(&spa->spa_props_lock);
314990b485llingout:
315990b485lling	if (err && err != ENOENT) {
316990b485lling		nvlist_free(*nvp);
3179d82f4flling		*nvp = NULL;
318990b485lling		return (err);
319990b485lling	}
320990b485lling
321990b485lling	return (0);
322990b485lling}
323990b485lling
324990b485lling/*
325990b485lling * Validate the given pool properties nvlist and modify the list
326990b485lling * for the property values to be set.
327990b485lling */
328990b485llingstatic int
329990b485llingspa_prop_validate(spa_t *spa, nvlist_t *props)
330990b485lling{
331990b485lling	nvpair_t *elem;
332990b485lling	int error = 0, reset_bootfs = 0;
333990b485lling	uint64_t objnum;
334990b485lling
335990b485lling	elem = NULL;
336990b485lling	while ((elem = nvlist_next_nvpair(props, elem)) != NULL) {
337990b485lling		zpool_prop_t prop;
338990b485lling		char *propname, *strval;
339990b485lling		uint64_t intval;
340990b485lling		objset_t *os;
3412f8aaabeschrock		char *slash;
342990b485lling
343990b485lling		propname = nvpair_name(elem);
344990b485lling
345990b485lling		if ((prop = zpool_name_to_prop(propname)) == ZPROP_INVAL)
346990b485lling			return (EINVAL);
347990b485lling
348990b485lling		switch (prop) {
349990b485lling		case ZPOOL_PROP_VERSION:
350990b485lling			error = nvpair_value_uint64(elem, &intval);
351990b485lling			if (!error &&
352990b485lling			    (intval < spa_version(spa) || intval > SPA_VERSION))
353990b485lling				error = EINVAL;
354990b485lling			break;
355990b485lling
356990b485lling		case ZPOOL_PROP_DELEGATION:
357990b485lling		case ZPOOL_PROP_AUTOREPLACE:
358d5b5bb2Rich Morris		case ZPOOL_PROP_LISTSNAPS:
359573ca77George Wilson		case ZPOOL_PROP_AUTOEXPAND:
360990b485lling			error = nvpair_value_uint64(elem, &intval);
361990b485lling			if (!error && intval > 1)
362990b485lling				error = EINVAL;
363990b485lling			break;
364990b485lling
365990b485lling		case ZPOOL_PROP_BOOTFS:
36625f89eeJeff Bonwick			/*
36725f89eeJeff Bonwick			 * If the pool version is less than SPA_VERSION_BOOTFS,
36825f89eeJeff Bonwick			 * or the pool is still being created (version == 0),
36925f89eeJeff Bonwick			 * the bootfs property cannot be set.
37025f89eeJeff Bonwick			 */
371990b485lling			if (spa_version(spa) < SPA_VERSION_BOOTFS) {
372990b485lling				error = ENOTSUP;
373990b485lling				break;
374990b485lling			}
375990b485lling
376990b485lling			/*
37715e6edfgw			 * Make sure the vdev config is bootable
378990b485lling			 */
37915e6edfgw			if (!vdev_is_bootable(spa->spa_root_vdev)) {
380990b485lling				error = ENOTSUP;
381990b485lling				break;
382990b485lling			}
383990b485lling
384990b485lling			reset_bootfs = 1;
385990b485lling
386990b485lling			error = nvpair_value_string(elem, &strval);
387990b485lling
388990b485lling			if (!error) {
38915e6edfgw				uint64_t compress;
39015e6edfgw
391990b485lling				if (strval == NULL || strval[0] == '\0') {
392990b485lling					objnum = zpool_prop_default_numeric(
393990b485lling					    ZPOOL_PROP_BOOTFS);
394990b485lling					break;
395990b485lling				}
396990b485lling
397503ad85Matthew Ahrens				if (error = dmu_objset_hold(strval, FTAG, &os))
398990b485lling					break;
39915e6edfgw
400503ad85Matthew Ahrens				/* Must be ZPL and not gzip compressed. */
401503ad85Matthew Ahrens
402503ad85Matthew Ahrens				if (dmu_objset_type(os) != DMU_OST_ZFS) {
403503ad85Matthew Ahrens					error = ENOTSUP;
404503ad85Matthew Ahrens				} else if ((error = dsl_prop_get_integer(strval,
40515e6edfgw				    zfs_prop_to_name(ZFS_PROP_COMPRESSION),
40615e6edfgw				    &compress, NULL)) == 0 &&
40715e6edfgw				    !BOOTFS_COMPRESS_VALID(compress)) {
40815e6edfgw					error = ENOTSUP;
40915e6edfgw				} else {
41015e6edfgw					objnum = dmu_objset_id(os);
41115e6edfgw				}
412503ad85Matthew Ahrens				dmu_objset_rele(os, FTAG);
413990b485lling			}
414990b485lling			break;
415e14bb32Jeff Bonwick
4160a4e951gw		case ZPOOL_PROP_FAILUREMODE:
4170a4e951gw			error = nvpair_value_uint64(elem, &intval);
4180a4e951gw			if (!error && (intval < ZIO_FAILURE_MODE_WAIT ||
4190a4e951gw			    intval > ZIO_FAILURE_MODE_PANIC))
4200a4e951gw				error = EINVAL;
4210a4e951gw
4220a4e951gw			/*
4230a4e951gw			 * This is a special case which only occurs when
4240a4e951gw			 * the pool has completely failed. This allows
4250a4e951gw			 * the user to change the in-core failmode property
4260a4e951gw			 * without syncing it out to disk (I/Os might
4270a4e951gw			 * currently be blocked). We do this by returning
4280a4e951gw			 * EIO to the caller (spa_prop_set) to trick it
4290a4e951gw			 * into thinking we encountered a property validation
4300a4e951gw			 * error.
4310a4e951gw			 */
432e14bb32Jeff Bonwick			if (!error && spa_suspended(spa)) {
4330a4e951gw				spa->spa_failmode = intval;
4340a4e951gw				error = EIO;
4350a4e951gw			}
4360a4e951gw			break;
4372f8aaabeschrock
4382f8aaabeschrock		case ZPOOL_PROP_CACHEFILE:
4392f8aaabeschrock			if ((error = nvpair_value_string(elem, &strval)) != 0)
4402f8aaabeschrock				break;
4412f8aaabeschrock
4422f8aaabeschrock			if (strval[0] == '\0')
4432f8aaabeschrock				break;
4442f8aaabeschrock
4452f8aaabeschrock			if (strcmp(strval, "none") == 0)
4462f8aaabeschrock				break;
4472f8aaabeschrock
4482f8aaabeschrock			if (strval[0] != '/') {
4492f8aaabeschrock				error = EINVAL;
4502f8aaabeschrock				break;
4512f8aaabeschrock			}
4522f8aaabeschrock
4532f8aaabeschrock			slash = strrchr(strval, '/');
4542f8aaabeschrock			ASSERT(slash != NULL);
4552f8aaabeschrock
4562f8aaabeschrock			if (slash[1] == '\0' || strcmp(slash, "/.") == 0 ||
4572f8aaabeschrock			    strcmp(slash, "/..") == 0)
4582f8aaabeschrock				error = EINVAL;
4592f8aaabeschrock			break;
460b24ab67Jeff Bonwick
461b24ab67Jeff Bonwick		case ZPOOL_PROP_DEDUPDITTO:
462b24ab67Jeff Bonwick			if (spa_version(spa) < SPA_VERSION_DEDUP)
463b24ab67Jeff Bonwick				error = ENOTSUP;
464b24ab67Jeff Bonwick			else
465b24ab67Jeff Bonwick				error = nvpair_value_uint64(elem, &intval);
466b24ab67Jeff Bonwick			if (error == 0 &&
467b24ab67Jeff Bonwick			    intval != 0 && intval < ZIO_DEDUPDITTO_MIN)
468b24ab67Jeff Bonwick				error = EINVAL;
469b24ab67Jeff Bonwick			break;
470990b485lling		}
471990b485lling
472990b485lling		if (error)
473990b485lling			break;
474990b485lling	}
475990b485lling
476990b485lling	if (!error && reset_bootfs) {
477990b485lling		error = nvlist_remove(props,
478990b485lling		    zpool_prop_to_name(ZPOOL_PROP_BOOTFS), DATA_TYPE_STRING);
479990b485lling
480990b485lling		if (!error) {
481990b485lling			error = nvlist_add_uint64(props,
482990b485lling			    zpool_prop_to_name(ZPOOL_PROP_BOOTFS), objnum);
483990b485lling		}
484990b485lling	}
485990b485lling
486990b485lling	return (error);
487990b485lling}
488990b485lling
489379c004Eric Schrockvoid
490379c004Eric Schrockspa_configfile_set(spa_t *spa, nvlist_t *nvp, boolean_t need_sync)
491379c004Eric Schrock{
492379c004Eric Schrock	char *cachefile;
493379c004Eric Schrock	spa_config_dirent_t *dp;
494379c004Eric Schrock
495379c004Eric Schrock	if (nvlist_lookup_string(nvp, zpool_prop_to_name(ZPOOL_PROP_CACHEFILE),
496379c004Eric Schrock	    &cachefile) != 0)
497379c004Eric Schrock		return;
498379c004Eric Schrock
499379c004Eric Schrock	dp = kmem_alloc(sizeof (spa_config_dirent_t),
500379c004Eric Schrock	    KM_SLEEP);
501379c004Eric Schrock
502379c004Eric Schrock	if (cachefile[0] == '\0')
503379c004Eric Schrock		dp->scd_path = spa_strdup(spa_config_path);
504379c004Eric Schrock	else if (strcmp(cachefile, "none") == 0)
505379c004Eric Schrock		dp->scd_path = NULL;
506379c004Eric Schrock	else
507379c004Eric Schrock		dp->scd_path = spa_strdup(cachefile);
508379c004Eric Schrock
509379c004Eric Schrock	list_insert_head(&spa->spa_config_list, dp);
510379c004Eric Schrock	if (need_sync)
511379c004Eric Schrock		spa_async_request(spa, SPA_ASYNC_CONFIG_UPDATE);
512379c004Eric Schrock}
513379c004Eric Schrock
514990b485llingint
515990b485llingspa_prop_set(spa_t *spa, nvlist_t *nvp)
516990b485lling{
517990b485lling	int error;
518379c004Eric Schrock	nvpair_t *elem;
519379c004Eric Schrock	boolean_t need_sync = B_FALSE;
520379c004Eric Schrock	zpool_prop_t prop;
521990b485lling
522990b485lling	if ((error = spa_prop_validate(spa, nvp)) != 0)
523990b485lling		return (error);
524990b485lling
525379c004Eric Schrock	elem = NULL;
526379c004Eric Schrock	while ((elem = nvlist_next_nvpair(nvp, elem)) != NULL) {
527379c004Eric Schrock		if ((prop = zpool_name_to_prop(
528379c004Eric Schrock		    nvpair_name(elem))) == ZPROP_INVAL)
529379c004Eric Schrock			return (EINVAL);
530379c004Eric Schrock
531379c004Eric Schrock		if (prop == ZPOOL_PROP_CACHEFILE || prop == ZPOOL_PROP_ALTROOT)
532379c004Eric Schrock			continue;
533379c004Eric Schrock
534379c004Eric Schrock		need_sync = B_TRUE;
535379c004Eric Schrock		break;
536379c004Eric Schrock	}
537379c004Eric Schrock
538379c004Eric Schrock	if (need_sync)
539379c004Eric Schrock		return (dsl_sync_task_do(spa_get_dsl(spa), NULL, spa_sync_props,
540379c004Eric Schrock		    spa, nvp, 3));
541379c004Eric Schrock	else
542379c004Eric Schrock		return (0);
543990b485lling}
544990b485lling
545990b485lling/*
546990b485lling * If the bootfs property value is dsobj, clear it.
547990b485lling */
548990b485llingvoid
549990b485llingspa_prop_clear_bootfs(spa_t *spa, uint64_t dsobj, dmu_tx_t *tx)
550990b485lling{
551990b485lling	if (spa->spa_bootfs == dsobj && spa->spa_pool_props_object != 0) {
552990b485lling		VERIFY(zap_remove(spa->spa_meta_objset,
553990b485lling		    spa->spa_pool_props_object,
554990b485lling		    zpool_prop_to_name(ZPOOL_PROP_BOOTFS), tx) == 0);
555990b485lling		spa->spa_bootfs = 0;
556990b485lling	}
557990b485lling}
558990b485lling
559fa9e406ahrens/*
560fa9e406ahrens * ==========================================================================
561fa9e406ahrens * SPA state manipulation (open/create/destroy/import/export)
562fa9e406ahrens * ==========================================================================
563fa9e406ahrens */
564fa9e406ahrens
565ea8dc4beschrockstatic int
566ea8dc4beschrockspa_error_entry_compare(const void *a, const void *b)
567ea8dc4beschrock{
568ea8dc4beschrock	spa_error_entry_t *sa = (spa_error_entry_t *)a;
569ea8dc4beschrock	spa_error_entry_t *sb = (spa_error_entry_t *)b;
570ea8dc4beschrock	int ret;
571ea8dc4beschrock
572ea8dc4beschrock	ret = bcmp(&sa->se_bookmark, &sb->se_bookmark,
573ea8dc4beschrock	    sizeof (zbookmark_t));
574ea8dc4beschrock
575ea8dc4beschrock	if (ret < 0)
576ea8dc4beschrock		return (-1);
577ea8dc4beschrock	else if (ret > 0)
578ea8dc4beschrock		return (1);
579ea8dc4beschrock	else
580ea8dc4beschrock		return (0);
581ea8dc4beschrock}
582ea8dc4beschrock
583ea8dc4beschrock/*
584ea8dc4beschrock * Utility function which retrieves copies of the current logs and
585ea8dc4beschrock * re-initializes them in the process.
586ea8dc4beschrock */
587ea8dc4beschrockvoid
588ea8dc4beschrockspa_get_errlists(spa_t *spa, avl_tree_t *last, avl_tree_t *scrub)
589ea8dc4beschrock{
590ea8dc4beschrock	ASSERT(MUTEX_HELD(&spa->spa_errlist_lock));
591ea8dc4beschrock
592ea8dc4beschrock	bcopy(&spa->spa_errlist_last, last, sizeof (avl_tree_t));
593ea8dc4beschrock	bcopy(&spa->spa_errlist_scrub, scrub, sizeof (avl_tree_t));
594ea8dc4beschrock
595ea8dc4beschrock	avl_create(&spa->spa_errlist_scrub,
596ea8dc4beschrock	    spa_error_entry_compare, sizeof (spa_error_entry_t),
597ea8dc4beschrock	    offsetof(spa_error_entry_t, se_avl));
598ea8dc4beschrock	avl_create(&spa->spa_errlist_last,
599ea8dc4beschrock	    spa_error_entry_compare, sizeof (spa_error_entry_t),
600ea8dc4beschrock	    offsetof(spa_error_entry_t, se_avl));
601ea8dc4beschrock}
602ea8dc4beschrock
60335a5a35Jonathan Adamsstatic taskq_t *
60435a5a35Jonathan Adamsspa_taskq_create(spa_t *spa, const char *name, enum zti_modes mode,
60535a5a35Jonathan Adams    uint_t value)
606fa9e406ahrens{
60735a5a35Jonathan Adams	uint_t flags = TASKQ_PREPOPULATE;
60835a5a35Jonathan Adams	boolean_t batch = B_FALSE;
609fa9e406ahrens
61035a5a35Jonathan Adams	switch (mode) {
61135a5a35Jonathan Adams	case zti_mode_null:
61235a5a35Jonathan Adams		return (NULL);		/* no taskq needed */
613fa9e406ahrens
61435a5a35Jonathan Adams	case zti_mode_fixed:
61535a5a35Jonathan Adams		ASSERT3U(value, >=, 1);
61635a5a35Jonathan Adams		value = MAX(value, 1);
61735a5a35Jonathan Adams		break;
618fa9e406ahrens
61935a5a35Jonathan Adams	case zti_mode_batch:
62035a5a35Jonathan Adams		batch = B_TRUE;
62135a5a35Jonathan Adams		flags |= TASKQ_THREADS_CPU_PCT;
62235a5a35Jonathan Adams		value = zio_taskq_batch_pct;
62335a5a35Jonathan Adams		break;
62435a5a35Jonathan Adams
62535a5a35Jonathan Adams	case zti_mode_online_percent:
62635a5a35Jonathan Adams		flags |= TASKQ_THREADS_CPU_PCT;
62735a5a35Jonathan Adams		break;
62835a5a35Jonathan Adams
62935a5a35Jonathan Adams	default:
63035a5a35Jonathan Adams		panic("unrecognized mode for %s taskq (%u:%u) in "
63135a5a35Jonathan Adams		    "spa_activate()",
63235a5a35Jonathan Adams		    name, mode, value);
63335a5a35Jonathan Adams		break;
63435a5a35Jonathan Adams	}
63535a5a35Jonathan Adams
63635a5a35Jonathan Adams	if (zio_taskq_sysdc && spa->spa_proc != &p0) {
63735a5a35Jonathan Adams		if (batch)
63835a5a35Jonathan Adams			flags |= TASKQ_DC_BATCH;
63935a5a35Jonathan Adams
64035a5a35Jonathan Adams		return (taskq_create_sysdc(name, value, 50, INT_MAX,
64135a5a35Jonathan Adams		    spa->spa_proc, zio_taskq_basedc, flags));
64235a5a35Jonathan Adams	}
64335a5a35Jonathan Adams	return (taskq_create_proc(name, value, maxclsyspri, 50, INT_MAX,
64435a5a35Jonathan Adams	    spa->spa_proc, flags));
64535a5a35Jonathan Adams}
64635a5a35Jonathan Adams
64735a5a35Jonathan Adamsstatic void
64835a5a35Jonathan Adamsspa_create_zio_taskqs(spa_t *spa)
64935a5a35Jonathan Adams{
650e14bb32Jeff Bonwick	for (int t = 0; t < ZIO_TYPES; t++) {
651e14bb32Jeff Bonwick		for (int q = 0; q < ZIO_TASKQ_TYPES; q++) {
65280eb36fGeorge Wilson			const zio_taskq_info_t *ztip = &zio_taskqs[t][q];
65380eb36fGeorge Wilson			enum zti_modes mode = ztip->zti_mode;
65480eb36fGeorge Wilson			uint_t value = ztip->zti_value;
6552e0c549Jonathan Adams			char name[32];
6562e0c549Jonathan Adams
6572e0c549Jonathan Adams			(void) snprintf(name, sizeof (name),
65880eb36fGeorge Wilson			    "%s_%s", zio_type_name[t], zio_taskq_types[q]);
6592e0c549Jonathan Adams
66035a5a35Jonathan Adams			spa->spa_zio_taskq[t][q] =
66135a5a35Jonathan Adams			    spa_taskq_create(spa, name, mode, value);
66235a5a35Jonathan Adams		}
66335a5a35Jonathan Adams	}
66435a5a35Jonathan Adams}
66535a5a35Jonathan Adams
66635a5a35Jonathan Adams#ifdef _KERNEL
66735a5a35Jonathan Adamsstatic void
66835a5a35Jonathan Adamsspa_thread(void *arg)
66935a5a35Jonathan Adams{
67035a5a35Jonathan Adams	callb_cpr_t cprinfo;
6712e0c549Jonathan Adams
67235a5a35Jonathan Adams	spa_t *spa = arg;
67335a5a35Jonathan Adams	user_t *pu = PTOU(curproc);
6742e0c549Jonathan Adams
67535a5a35Jonathan Adams	CALLB_CPR_INIT(&cprinfo, &spa->spa_proc_lock, callb_generic_cpr,
67635a5a35Jonathan Adams	    spa->spa_name);
6772e0c549Jonathan Adams
67835a5a35Jonathan Adams	ASSERT(curproc != &p0);
67935a5a35Jonathan Adams	(void) snprintf(pu->u_psargs, sizeof (pu->u_psargs),
68035a5a35Jonathan Adams	    "zpool-%s", spa->spa_name);
68135a5a35Jonathan Adams	(void) strlcpy(pu->u_comm, pu->u_psargs, sizeof (pu->u_comm));
6822e0c549Jonathan Adams
68335a5a35Jonathan Adams	/* bind this thread to the requested psrset */
68435a5a35Jonathan Adams	if (zio_taskq_psrset_bind != PS_NONE) {
68535a5a35Jonathan Adams		pool_lock();
68635a5a35Jonathan Adams		mutex_enter(&cpu_lock);
68735a5a35Jonathan Adams		mutex_enter(&pidlock);
68835a5a35Jonathan Adams		mutex_enter(&curproc->p_lock);
68980eb36fGeorge Wilson
69035a5a35Jonathan Adams		if (cpupart_bind_thread(curthread, zio_taskq_psrset_bind,
69135a5a35Jonathan Adams		    0, NULL, NULL) == 0)  {
69235a5a35Jonathan Adams			curthread->t_bind_pset = zio_taskq_psrset_bind;
69335a5a35Jonathan Adams		} else {
69435a5a35Jonathan Adams			cmn_err(CE_WARN,
69535a5a35Jonathan Adams			    "Couldn't bind process for zfs pool \"%s\" to "
69635a5a35Jonathan Adams			    "pset %d\n", spa->spa_name, zio_taskq_psrset_bind);
69735a5a35Jonathan Adams		}
69835a5a35Jonathan Adams
69935a5a35Jonathan Adams		mutex_exit(&curproc->p_lock);
70035a5a35Jonathan Adams		mutex_exit(&pidlock);
70135a5a35Jonathan Adams		mutex_exit(&cpu_lock);
70235a5a35Jonathan Adams		pool_unlock();
70335a5a35Jonathan Adams	}
70435a5a35Jonathan Adams
70535a5a35Jonathan Adams	if (zio_taskq_sysdc) {
706