mirror of
https://git.proxmox.com/git/mirror_zfs.git
synced 2026-05-25 11:47:43 +03:00
2619 asynchronous destruction of ZFS file systems 2747 SPA versioning with zfs feature flags Reviewed by: Matt Ahrens <mahrens@delphix.com> Reviewed by: George Wilson <gwilson@delphix.com> Reviewed by: Richard Lowe <richlowe@richlowe.net> Reviewed by: Dan Kruchinin <dan.kruchinin@gmail.com> Approved by: Eric Schrock <Eric.Schrock@delphix.com> References: illumos/illumos-gate@53089ab7c8 illumos/illumos-gate@ad135b5d64 illumos changeset: 13700:2889e2596bd6 https://www.illumos.org/issues/2619 https://www.illumos.org/issues/2747 NOTE: The grub specific changes were not ported. This change must be made to the Linux grub packages. Ported-by: Brian Behlendorf <behlendorf1@llnl.gov>
This commit is contained in:
committed by
Brian Behlendorf
parent
15313c5e18
commit
9ae529ec5d
+407
-62
@@ -63,6 +63,7 @@
|
||||
#include <sys/spa_boot.h>
|
||||
#include <sys/zfs_ioctl.h>
|
||||
#include <sys/dsl_scan.h>
|
||||
#include <sys/zfeature.h>
|
||||
|
||||
#ifdef _KERNEL
|
||||
#include <sys/bootprops.h>
|
||||
@@ -114,6 +115,7 @@ const zio_taskq_info_t zio_taskqs[ZIO_TYPES][ZIO_TASKQ_TYPES] = {
|
||||
{ ZTI_ONE, ZTI_NULL, ZTI_ONE, ZTI_NULL },
|
||||
};
|
||||
|
||||
static dsl_syncfunc_t spa_sync_version;
|
||||
static dsl_syncfunc_t spa_sync_props;
|
||||
static boolean_t spa_has_active_shared_spare(spa_t *spa);
|
||||
static inline int spa_load_impl(spa_t *spa, uint64_t, nvlist_t *config,
|
||||
@@ -169,6 +171,7 @@ static void
|
||||
spa_prop_get_config(spa_t *spa, nvlist_t **nvp)
|
||||
{
|
||||
vdev_t *rvd = spa->spa_root_vdev;
|
||||
dsl_pool_t *pool = spa->spa_dsl_pool;
|
||||
uint64_t size;
|
||||
uint64_t alloc;
|
||||
uint64_t space;
|
||||
@@ -216,6 +219,22 @@ spa_prop_get_config(spa_t *spa, nvlist_t **nvp)
|
||||
spa_prop_add_list(*nvp, ZPOOL_PROP_VERSION, NULL, version, src);
|
||||
}
|
||||
|
||||
if (pool != NULL) {
|
||||
dsl_dir_t *freedir = pool->dp_free_dir;
|
||||
|
||||
/*
|
||||
* The $FREE directory was introduced in SPA_VERSION_DEADLISTS,
|
||||
* when opening pools before this version freedir will be NULL.
|
||||
*/
|
||||
if (freedir != NULL) {
|
||||
spa_prop_add_list(*nvp, ZPOOL_PROP_FREEING, NULL,
|
||||
freedir->dd_phys->dd_used_bytes, src);
|
||||
} else {
|
||||
spa_prop_add_list(*nvp, ZPOOL_PROP_FREEING,
|
||||
NULL, 0, src);
|
||||
}
|
||||
}
|
||||
|
||||
spa_prop_add_list(*nvp, ZPOOL_PROP_GUID, NULL, spa_guid(spa), src);
|
||||
|
||||
if (spa->spa_comment != NULL) {
|
||||
@@ -357,25 +376,55 @@ spa_prop_validate(spa_t *spa, nvlist_t *props)
|
||||
nvpair_t *elem;
|
||||
int error = 0, reset_bootfs = 0;
|
||||
uint64_t objnum = 0;
|
||||
boolean_t has_feature = B_FALSE;
|
||||
|
||||
elem = NULL;
|
||||
while ((elem = nvlist_next_nvpair(props, elem)) != NULL) {
|
||||
zpool_prop_t prop;
|
||||
char *propname, *strval;
|
||||
uint64_t intval;
|
||||
objset_t *os;
|
||||
char *slash, *check;
|
||||
char *strval, *slash, *check, *fname;
|
||||
const char *propname = nvpair_name(elem);
|
||||
zpool_prop_t prop = zpool_name_to_prop(propname);
|
||||
|
||||
propname = nvpair_name(elem);
|
||||
switch ((int)prop) {
|
||||
case ZPROP_INVAL:
|
||||
if (!zpool_prop_feature(propname)) {
|
||||
error = EINVAL;
|
||||
break;
|
||||
}
|
||||
|
||||
if ((prop = zpool_name_to_prop(propname)) == ZPROP_INVAL)
|
||||
return (EINVAL);
|
||||
/*
|
||||
* Sanitize the input.
|
||||
*/
|
||||
if (nvpair_type(elem) != DATA_TYPE_UINT64) {
|
||||
error = EINVAL;
|
||||
break;
|
||||
}
|
||||
|
||||
if (nvpair_value_uint64(elem, &intval) != 0) {
|
||||
error = EINVAL;
|
||||
break;
|
||||
}
|
||||
|
||||
if (intval != 0) {
|
||||
error = EINVAL;
|
||||
break;
|
||||
}
|
||||
|
||||
fname = strchr(propname, '@') + 1;
|
||||
if (zfeature_lookup_name(fname, NULL) != 0) {
|
||||
error = EINVAL;
|
||||
break;
|
||||
}
|
||||
|
||||
has_feature = B_TRUE;
|
||||
break;
|
||||
|
||||
switch (prop) {
|
||||
case ZPOOL_PROP_VERSION:
|
||||
error = nvpair_value_uint64(elem, &intval);
|
||||
if (!error &&
|
||||
(intval < spa_version(spa) || intval > SPA_VERSION))
|
||||
(intval < spa_version(spa) ||
|
||||
intval > SPA_VERSION_BEFORE_FEATURES ||
|
||||
has_feature))
|
||||
error = EINVAL;
|
||||
break;
|
||||
|
||||
@@ -412,6 +461,7 @@ spa_prop_validate(spa_t *spa, nvlist_t *props)
|
||||
error = nvpair_value_string(elem, &strval);
|
||||
|
||||
if (!error) {
|
||||
objset_t *os;
|
||||
uint64_t compress;
|
||||
|
||||
if (strval == NULL || strval[0] == '\0') {
|
||||
@@ -558,33 +608,58 @@ int
|
||||
spa_prop_set(spa_t *spa, nvlist_t *nvp)
|
||||
{
|
||||
int error;
|
||||
nvpair_t *elem;
|
||||
nvpair_t *elem = NULL;
|
||||
boolean_t need_sync = B_FALSE;
|
||||
zpool_prop_t prop;
|
||||
|
||||
if ((error = spa_prop_validate(spa, nvp)) != 0)
|
||||
return (error);
|
||||
|
||||
elem = NULL;
|
||||
while ((elem = nvlist_next_nvpair(nvp, elem)) != NULL) {
|
||||
if ((prop = zpool_name_to_prop(
|
||||
nvpair_name(elem))) == ZPROP_INVAL)
|
||||
return (EINVAL);
|
||||
zpool_prop_t prop = zpool_name_to_prop(nvpair_name(elem));
|
||||
|
||||
if (prop == ZPOOL_PROP_CACHEFILE ||
|
||||
prop == ZPOOL_PROP_ALTROOT ||
|
||||
prop == ZPOOL_PROP_READONLY)
|
||||
continue;
|
||||
|
||||
if (prop == ZPOOL_PROP_VERSION || prop == ZPROP_INVAL) {
|
||||
uint64_t ver;
|
||||
|
||||
if (prop == ZPOOL_PROP_VERSION) {
|
||||
VERIFY(nvpair_value_uint64(elem, &ver) == 0);
|
||||
} else {
|
||||
ASSERT(zpool_prop_feature(nvpair_name(elem)));
|
||||
ver = SPA_VERSION_FEATURES;
|
||||
need_sync = B_TRUE;
|
||||
}
|
||||
|
||||
/* Save time if the version is already set. */
|
||||
if (ver == spa_version(spa))
|
||||
continue;
|
||||
|
||||
/*
|
||||
* In addition to the pool directory object, we might
|
||||
* create the pool properties object, the features for
|
||||
* read object, the features for write object, or the
|
||||
* feature descriptions object.
|
||||
*/
|
||||
error = dsl_sync_task_do(spa_get_dsl(spa), NULL,
|
||||
spa_sync_version, spa, &ver, 6);
|
||||
if (error)
|
||||
return (error);
|
||||
continue;
|
||||
}
|
||||
|
||||
need_sync = B_TRUE;
|
||||
break;
|
||||
}
|
||||
|
||||
if (need_sync)
|
||||
if (need_sync) {
|
||||
return (dsl_sync_task_do(spa_get_dsl(spa), NULL, spa_sync_props,
|
||||
spa, nvp, 3));
|
||||
else
|
||||
return (0);
|
||||
spa, nvp, 6));
|
||||
}
|
||||
|
||||
return (0);
|
||||
}
|
||||
|
||||
/*
|
||||
@@ -1628,7 +1703,7 @@ spa_load_verify_done(zio_t *zio)
|
||||
int error = zio->io_error;
|
||||
|
||||
if (error) {
|
||||
if ((BP_GET_LEVEL(bp) != 0 || dmu_ot[type].ot_metadata) &&
|
||||
if ((BP_GET_LEVEL(bp) != 0 || DMU_OT_IS_METADATA(type)) &&
|
||||
type != DMU_OT_INTENT_LOG)
|
||||
atomic_add_64(&sle->sle_meta_count, 1);
|
||||
else
|
||||
@@ -1858,6 +1933,9 @@ spa_load(spa_t *spa, spa_load_state_t state, spa_import_type_t type,
|
||||
KM_PUSHPAGE) == 0);
|
||||
}
|
||||
|
||||
nvlist_free(spa->spa_load_info);
|
||||
spa->spa_load_info = fnvlist_alloc();
|
||||
|
||||
gethrestime(&spa->spa_loaded_ts);
|
||||
error = spa_load_impl(spa, pool_guid, config, state, type,
|
||||
mosconfig, &ereport);
|
||||
@@ -1891,12 +1969,14 @@ spa_load_impl(spa_t *spa, uint64_t pool_guid, nvlist_t *config,
|
||||
{
|
||||
int error = 0;
|
||||
nvlist_t *nvroot = NULL;
|
||||
nvlist_t *label;
|
||||
vdev_t *rvd;
|
||||
uberblock_t *ub = &spa->spa_uberblock;
|
||||
uint64_t children, config_cache_txg = spa->spa_config_txg;
|
||||
int orig_mode = spa->spa_mode;
|
||||
int parse;
|
||||
uint64_t obj;
|
||||
boolean_t missing_feat_write = B_FALSE;
|
||||
|
||||
/*
|
||||
* If this is an untrusted config, access the pool in read-only mode.
|
||||
@@ -1976,19 +2056,79 @@ spa_load_impl(spa_t *spa, uint64_t pool_guid, nvlist_t *config,
|
||||
/*
|
||||
* Find the best uberblock.
|
||||
*/
|
||||
vdev_uberblock_load(NULL, rvd, ub);
|
||||
vdev_uberblock_load(rvd, ub, &label);
|
||||
|
||||
/*
|
||||
* If we weren't able to find a single valid uberblock, return failure.
|
||||
*/
|
||||
if (ub->ub_txg == 0)
|
||||
if (ub->ub_txg == 0) {
|
||||
nvlist_free(label);
|
||||
return (spa_vdev_err(rvd, VDEV_AUX_CORRUPT_DATA, ENXIO));
|
||||
}
|
||||
|
||||
/*
|
||||
* If the pool is newer than the code, we can't open it.
|
||||
* If the pool has an unsupported version we can't open it.
|
||||
*/
|
||||
if (ub->ub_version > SPA_VERSION)
|
||||
if (!SPA_VERSION_IS_SUPPORTED(ub->ub_version)) {
|
||||
nvlist_free(label);
|
||||
return (spa_vdev_err(rvd, VDEV_AUX_VERSION_NEWER, ENOTSUP));
|
||||
}
|
||||
|
||||
if (ub->ub_version >= SPA_VERSION_FEATURES) {
|
||||
nvlist_t *features;
|
||||
|
||||
/*
|
||||
* If we weren't able to find what's necessary for reading the
|
||||
* MOS in the label, return failure.
|
||||
*/
|
||||
if (label == NULL || nvlist_lookup_nvlist(label,
|
||||
ZPOOL_CONFIG_FEATURES_FOR_READ, &features) != 0) {
|
||||
nvlist_free(label);
|
||||
return (spa_vdev_err(rvd, VDEV_AUX_CORRUPT_DATA,
|
||||
ENXIO));
|
||||
}
|
||||
|
||||
/*
|
||||
* Update our in-core representation with the definitive values
|
||||
* from the label.
|
||||
*/
|
||||
nvlist_free(spa->spa_label_features);
|
||||
VERIFY(nvlist_dup(features, &spa->spa_label_features, 0) == 0);
|
||||
}
|
||||
|
||||
nvlist_free(label);
|
||||
|
||||
/*
|
||||
* Look through entries in the label nvlist's features_for_read. If
|
||||
* there is a feature listed there which we don't understand then we
|
||||
* cannot open a pool.
|
||||
*/
|
||||
if (ub->ub_version >= SPA_VERSION_FEATURES) {
|
||||
nvlist_t *unsup_feat;
|
||||
nvpair_t *nvp;
|
||||
|
||||
VERIFY(nvlist_alloc(&unsup_feat, NV_UNIQUE_NAME, KM_SLEEP) ==
|
||||
0);
|
||||
|
||||
for (nvp = nvlist_next_nvpair(spa->spa_label_features, NULL);
|
||||
nvp != NULL;
|
||||
nvp = nvlist_next_nvpair(spa->spa_label_features, nvp)) {
|
||||
if (!zfeature_is_supported(nvpair_name(nvp))) {
|
||||
VERIFY(nvlist_add_string(unsup_feat,
|
||||
nvpair_name(nvp), "") == 0);
|
||||
}
|
||||
}
|
||||
|
||||
if (!nvlist_empty(unsup_feat)) {
|
||||
VERIFY(nvlist_add_nvlist(spa->spa_load_info,
|
||||
ZPOOL_CONFIG_UNSUP_FEAT, unsup_feat) == 0);
|
||||
nvlist_free(unsup_feat);
|
||||
return (spa_vdev_err(rvd, VDEV_AUX_UNSUP_FEAT,
|
||||
ENOTSUP));
|
||||
}
|
||||
|
||||
nvlist_free(unsup_feat);
|
||||
}
|
||||
|
||||
/*
|
||||
* If the vdev guid sum doesn't match the uberblock, we have an
|
||||
@@ -2022,7 +2162,7 @@ spa_load_impl(spa_t *spa, uint64_t pool_guid, nvlist_t *config,
|
||||
spa->spa_claim_max_txg = spa->spa_first_txg;
|
||||
spa->spa_prev_software_version = ub->ub_software_version;
|
||||
|
||||
error = dsl_pool_open(spa, spa->spa_first_txg, &spa->spa_dsl_pool);
|
||||
error = dsl_pool_init(spa, spa->spa_first_txg, &spa->spa_dsl_pool);
|
||||
if (error)
|
||||
return (spa_vdev_err(rvd, VDEV_AUX_CORRUPT_DATA, EIO));
|
||||
spa->spa_meta_objset = spa->spa_dsl_pool->dp_meta_objset;
|
||||
@@ -2030,6 +2170,84 @@ spa_load_impl(spa_t *spa, uint64_t pool_guid, nvlist_t *config,
|
||||
if (spa_dir_prop(spa, DMU_POOL_CONFIG, &spa->spa_config_object) != 0)
|
||||
return (spa_vdev_err(rvd, VDEV_AUX_CORRUPT_DATA, EIO));
|
||||
|
||||
if (spa_version(spa) >= SPA_VERSION_FEATURES) {
|
||||
boolean_t missing_feat_read = B_FALSE;
|
||||
nvlist_t *unsup_feat;
|
||||
|
||||
if (spa_dir_prop(spa, DMU_POOL_FEATURES_FOR_READ,
|
||||
&spa->spa_feat_for_read_obj) != 0) {
|
||||
return (spa_vdev_err(rvd, VDEV_AUX_CORRUPT_DATA, EIO));
|
||||
}
|
||||
|
||||
if (spa_dir_prop(spa, DMU_POOL_FEATURES_FOR_WRITE,
|
||||
&spa->spa_feat_for_write_obj) != 0) {
|
||||
return (spa_vdev_err(rvd, VDEV_AUX_CORRUPT_DATA, EIO));
|
||||
}
|
||||
|
||||
if (spa_dir_prop(spa, DMU_POOL_FEATURE_DESCRIPTIONS,
|
||||
&spa->spa_feat_desc_obj) != 0) {
|
||||
return (spa_vdev_err(rvd, VDEV_AUX_CORRUPT_DATA, EIO));
|
||||
}
|
||||
|
||||
VERIFY(nvlist_alloc(&unsup_feat, NV_UNIQUE_NAME, KM_SLEEP) ==
|
||||
0);
|
||||
|
||||
if (!feature_is_supported(spa->spa_meta_objset,
|
||||
spa->spa_feat_for_read_obj, spa->spa_feat_desc_obj,
|
||||
unsup_feat))
|
||||
missing_feat_read = B_TRUE;
|
||||
|
||||
if (spa_writeable(spa) || state == SPA_LOAD_TRYIMPORT) {
|
||||
if (!feature_is_supported(spa->spa_meta_objset,
|
||||
spa->spa_feat_for_write_obj, spa->spa_feat_desc_obj,
|
||||
unsup_feat))
|
||||
missing_feat_write = B_TRUE;
|
||||
}
|
||||
|
||||
if (!nvlist_empty(unsup_feat)) {
|
||||
VERIFY(nvlist_add_nvlist(spa->spa_load_info,
|
||||
ZPOOL_CONFIG_UNSUP_FEAT, unsup_feat) == 0);
|
||||
}
|
||||
|
||||
nvlist_free(unsup_feat);
|
||||
|
||||
if (!missing_feat_read) {
|
||||
fnvlist_add_boolean(spa->spa_load_info,
|
||||
ZPOOL_CONFIG_CAN_RDONLY);
|
||||
}
|
||||
|
||||
/*
|
||||
* If the state is SPA_LOAD_TRYIMPORT, our objective is
|
||||
* twofold: to determine whether the pool is available for
|
||||
* import in read-write mode and (if it is not) whether the
|
||||
* pool is available for import in read-only mode. If the pool
|
||||
* is available for import in read-write mode, it is displayed
|
||||
* as available in userland; if it is not available for import
|
||||
* in read-only mode, it is displayed as unavailable in
|
||||
* userland. If the pool is available for import in read-only
|
||||
* mode but not read-write mode, it is displayed as unavailable
|
||||
* in userland with a special note that the pool is actually
|
||||
* available for open in read-only mode.
|
||||
*
|
||||
* As a result, if the state is SPA_LOAD_TRYIMPORT and we are
|
||||
* missing a feature for write, we must first determine whether
|
||||
* the pool can be opened read-only before returning to
|
||||
* userland in order to know whether to display the
|
||||
* abovementioned note.
|
||||
*/
|
||||
if (missing_feat_read || (missing_feat_write &&
|
||||
spa_writeable(spa))) {
|
||||
return (spa_vdev_err(rvd, VDEV_AUX_UNSUP_FEAT,
|
||||
ENOTSUP));
|
||||
}
|
||||
}
|
||||
|
||||
spa->spa_is_initializing = B_TRUE;
|
||||
error = dsl_pool_open(spa->spa_dsl_pool);
|
||||
spa->spa_is_initializing = B_FALSE;
|
||||
if (error != 0)
|
||||
return (spa_vdev_err(rvd, VDEV_AUX_CORRUPT_DATA, EIO));
|
||||
|
||||
if (!mosconfig) {
|
||||
uint64_t hostid;
|
||||
nvlist_t *policy = NULL, *nvconfig;
|
||||
@@ -2247,7 +2465,7 @@ spa_load_impl(spa_t *spa, uint64_t pool_guid, nvlist_t *config,
|
||||
nvlist_free(nvconfig);
|
||||
|
||||
/*
|
||||
* Now that we've validate the config, check the state of the
|
||||
* Now that we've validated the config, check the state of the
|
||||
* root vdev. If it can't be opened, it indicates one or
|
||||
* more toplevel vdevs are faulted.
|
||||
*/
|
||||
@@ -2260,6 +2478,17 @@ spa_load_impl(spa_t *spa, uint64_t pool_guid, nvlist_t *config,
|
||||
}
|
||||
}
|
||||
|
||||
if (missing_feat_write) {
|
||||
ASSERT(state == SPA_LOAD_TRYIMPORT);
|
||||
|
||||
/*
|
||||
* At this point, we know that we can open the pool in
|
||||
* read-only mode but not read-write mode. We now have enough
|
||||
* information and can return to userland.
|
||||
*/
|
||||
return (spa_vdev_err(rvd, VDEV_AUX_UNSUP_FEAT, ENOTSUP));
|
||||
}
|
||||
|
||||
/*
|
||||
* We've successfully opened the pool, verify that we're ready
|
||||
* to start pushing transactions.
|
||||
@@ -2370,10 +2599,18 @@ spa_load_retry(spa_t *spa, spa_load_state_t state, int mosconfig)
|
||||
return (spa_load(spa, state, SPA_IMPORT_EXISTING, mosconfig));
|
||||
}
|
||||
|
||||
/*
|
||||
* If spa_load() fails this function will try loading prior txg's. If
|
||||
* 'state' is SPA_LOAD_RECOVER and one of these loads succeeds the pool
|
||||
* will be rewound to that txg. If 'state' is not SPA_LOAD_RECOVER this
|
||||
* function will not rewind the pool and will return the same error as
|
||||
* spa_load().
|
||||
*/
|
||||
static int
|
||||
spa_load_best(spa_t *spa, spa_load_state_t state, int mosconfig,
|
||||
uint64_t max_request, int rewind_flags)
|
||||
{
|
||||
nvlist_t *loadinfo = NULL;
|
||||
nvlist_t *config = NULL;
|
||||
int load_error, rewind_error;
|
||||
uint64_t safe_rewind_txg;
|
||||
@@ -2402,9 +2639,18 @@ spa_load_best(spa_t *spa, spa_load_state_t state, int mosconfig,
|
||||
return (load_error);
|
||||
}
|
||||
|
||||
/* Price of rolling back is discarding txgs, including log */
|
||||
if (state == SPA_LOAD_RECOVER)
|
||||
if (state == SPA_LOAD_RECOVER) {
|
||||
/* Price of rolling back is discarding txgs, including log */
|
||||
spa_set_log_state(spa, SPA_LOG_CLEAR);
|
||||
} else {
|
||||
/*
|
||||
* If we aren't rolling back save the load info from our first
|
||||
* import attempt so that we can restore it after attempting
|
||||
* to rewind.
|
||||
*/
|
||||
loadinfo = spa->spa_load_info;
|
||||
spa->spa_load_info = fnvlist_alloc();
|
||||
}
|
||||
|
||||
spa->spa_load_max_txg = spa->spa_last_ubsync_txg;
|
||||
safe_rewind_txg = spa->spa_last_ubsync_txg - TXG_DEFER_SIZE;
|
||||
@@ -2428,7 +2674,20 @@ spa_load_best(spa_t *spa, spa_load_state_t state, int mosconfig,
|
||||
if (config && (rewind_error || state != SPA_LOAD_RECOVER))
|
||||
spa_config_set(spa, config);
|
||||
|
||||
return (state == SPA_LOAD_RECOVER ? rewind_error : load_error);
|
||||
if (state == SPA_LOAD_RECOVER) {
|
||||
ASSERT3P(loadinfo, ==, NULL);
|
||||
return (rewind_error);
|
||||
} else {
|
||||
/* Store the rewind info as part of the initial load info */
|
||||
fnvlist_add_nvlist(loadinfo, ZPOOL_CONFIG_REWIND_INFO,
|
||||
spa->spa_load_info);
|
||||
|
||||
/* Restore the initial load info */
|
||||
fnvlist_free(spa->spa_load_info);
|
||||
spa->spa_load_info = loadinfo;
|
||||
|
||||
return (load_error);
|
||||
}
|
||||
}
|
||||
|
||||
/*
|
||||
@@ -2698,8 +2957,50 @@ spa_add_l2cache(spa_t *spa, nvlist_t *config)
|
||||
}
|
||||
}
|
||||
|
||||
static void
|
||||
spa_add_feature_stats(spa_t *spa, nvlist_t *config)
|
||||
{
|
||||
nvlist_t *features;
|
||||
zap_cursor_t zc;
|
||||
zap_attribute_t za;
|
||||
|
||||
ASSERT(spa_config_held(spa, SCL_CONFIG, RW_READER));
|
||||
VERIFY(nvlist_alloc(&features, NV_UNIQUE_NAME, KM_SLEEP) == 0);
|
||||
|
||||
if (spa->spa_feat_for_read_obj != 0) {
|
||||
for (zap_cursor_init(&zc, spa->spa_meta_objset,
|
||||
spa->spa_feat_for_read_obj);
|
||||
zap_cursor_retrieve(&zc, &za) == 0;
|
||||
zap_cursor_advance(&zc)) {
|
||||
ASSERT(za.za_integer_length == sizeof (uint64_t) &&
|
||||
za.za_num_integers == 1);
|
||||
VERIFY3U(0, ==, nvlist_add_uint64(features, za.za_name,
|
||||
za.za_first_integer));
|
||||
}
|
||||
zap_cursor_fini(&zc);
|
||||
}
|
||||
|
||||
if (spa->spa_feat_for_write_obj != 0) {
|
||||
for (zap_cursor_init(&zc, spa->spa_meta_objset,
|
||||
spa->spa_feat_for_write_obj);
|
||||
zap_cursor_retrieve(&zc, &za) == 0;
|
||||
zap_cursor_advance(&zc)) {
|
||||
ASSERT(za.za_integer_length == sizeof (uint64_t) &&
|
||||
za.za_num_integers == 1);
|
||||
VERIFY3U(0, ==, nvlist_add_uint64(features, za.za_name,
|
||||
za.za_first_integer));
|
||||
}
|
||||
zap_cursor_fini(&zc);
|
||||
}
|
||||
|
||||
VERIFY(nvlist_add_nvlist(config, ZPOOL_CONFIG_FEATURE_STATS,
|
||||
features) == 0);
|
||||
nvlist_free(features);
|
||||
}
|
||||
|
||||
int
|
||||
spa_get_stats(const char *name, nvlist_t **config, char *altroot, size_t buflen)
|
||||
spa_get_stats(const char *name, nvlist_t **config,
|
||||
char *altroot, size_t buflen)
|
||||
{
|
||||
int error;
|
||||
spa_t *spa;
|
||||
@@ -2734,6 +3035,7 @@ spa_get_stats(const char *name, nvlist_t **config, char *altroot, size_t buflen)
|
||||
|
||||
spa_add_spares(spa, *config);
|
||||
spa_add_l2cache(spa, *config);
|
||||
spa_add_feature_stats(spa, *config);
|
||||
}
|
||||
}
|
||||
|
||||
@@ -2954,6 +3256,8 @@ spa_create(const char *pool, nvlist_t *nvroot, nvlist_t *props,
|
||||
nvlist_t **spares, **l2cache;
|
||||
uint_t nspares, nl2cache;
|
||||
uint64_t version, obj;
|
||||
boolean_t has_features;
|
||||
nvpair_t *elem;
|
||||
int c;
|
||||
|
||||
/*
|
||||
@@ -2980,10 +3284,18 @@ spa_create(const char *pool, nvlist_t *nvroot, nvlist_t *props,
|
||||
return (error);
|
||||
}
|
||||
|
||||
if (nvlist_lookup_uint64(props, zpool_prop_to_name(ZPOOL_PROP_VERSION),
|
||||
&version) != 0)
|
||||
has_features = B_FALSE;
|
||||
for (elem = nvlist_next_nvpair(props, NULL);
|
||||
elem != NULL; elem = nvlist_next_nvpair(props, elem)) {
|
||||
if (zpool_prop_feature(nvpair_name(elem)))
|
||||
has_features = B_TRUE;
|
||||
}
|
||||
|
||||
if (has_features || nvlist_lookup_uint64(props,
|
||||
zpool_prop_to_name(ZPOOL_PROP_VERSION), &version) != 0) {
|
||||
version = SPA_VERSION;
|
||||
ASSERT(version <= SPA_VERSION);
|
||||
}
|
||||
ASSERT(SPA_VERSION_IS_SUPPORTED(version));
|
||||
|
||||
spa->spa_first_txg = txg;
|
||||
spa->spa_uberblock.ub_txg = txg - 1;
|
||||
@@ -3059,8 +3371,10 @@ spa_create(const char *pool, nvlist_t *nvroot, nvlist_t *props,
|
||||
spa->spa_l2cache.sav_sync = B_TRUE;
|
||||
}
|
||||
|
||||
spa->spa_is_initializing = B_TRUE;
|
||||
spa->spa_dsl_pool = dp = dsl_pool_create(spa, zplprops, txg);
|
||||
spa->spa_meta_objset = dp->dp_meta_objset;
|
||||
spa->spa_is_initializing = B_FALSE;
|
||||
|
||||
/*
|
||||
* Create DDTs (dedup tables).
|
||||
@@ -3084,6 +3398,9 @@ spa_create(const char *pool, nvlist_t *nvroot, nvlist_t *props,
|
||||
cmn_err(CE_PANIC, "failed to add pool config");
|
||||
}
|
||||
|
||||
if (spa_version(spa) >= SPA_VERSION_FEATURES)
|
||||
spa_feature_create_zap_objects(spa, tx);
|
||||
|
||||
if (zap_add(spa->spa_meta_objset,
|
||||
DMU_POOL_DIRECTORY_OBJECT, DMU_POOL_CREATION_VERSION,
|
||||
sizeof (uint64_t), 1, &version, tx) != 0) {
|
||||
@@ -3276,7 +3593,7 @@ spa_import_rootpool(char *devpath, char *devid)
|
||||
}
|
||||
#endif
|
||||
if (config == NULL) {
|
||||
cmn_err(CE_NOTE, "Can not read the pool label from '%s'",
|
||||
cmn_err(CE_NOTE, "Cannot read the pool label from '%s'",
|
||||
devpath);
|
||||
return (EIO);
|
||||
}
|
||||
@@ -3590,6 +3907,8 @@ spa_tryimport(nvlist_t *tryconfig)
|
||||
state) == 0);
|
||||
VERIFY(nvlist_add_uint64(config, ZPOOL_CONFIG_TIMESTAMP,
|
||||
spa->spa_uberblock.ub_timestamp) == 0);
|
||||
VERIFY(nvlist_add_nvlist(config, ZPOOL_CONFIG_LOAD_INFO,
|
||||
spa->spa_load_info) == 0);
|
||||
|
||||
/*
|
||||
* If the bootfs property exists on this pool then we
|
||||
@@ -5305,7 +5624,7 @@ spa_sync_nvlist(spa_t *spa, uint64_t obj, nvlist_t *nv, dmu_tx_t *tx)
|
||||
* information. This avoids the dbuf_will_dirty() path and
|
||||
* saves us a pre-read to get data we don't actually care about.
|
||||
*/
|
||||
bufsize = P2ROUNDUP(nvsize, SPA_CONFIG_BLOCKSIZE);
|
||||
bufsize = P2ROUNDUP((uint64_t)nvsize, SPA_CONFIG_BLOCKSIZE);
|
||||
packed = vmem_alloc(bufsize, KM_PUSHPAGE);
|
||||
|
||||
VERIFY(nvlist_pack(nv, &packed, &nvsize, NV_ENCODE_XDR,
|
||||
@@ -5390,6 +5709,24 @@ spa_sync_config_object(spa_t *spa, dmu_tx_t *tx)
|
||||
spa_sync_nvlist(spa, spa->spa_config_object, config, tx);
|
||||
}
|
||||
|
||||
static void
|
||||
spa_sync_version(void *arg1, void *arg2, dmu_tx_t *tx)
|
||||
{
|
||||
spa_t *spa = arg1;
|
||||
uint64_t version = *(uint64_t *)arg2;
|
||||
|
||||
/*
|
||||
* Setting the version is special cased when first creating the pool.
|
||||
*/
|
||||
ASSERT(tx->tx_txg != TXG_INITIAL);
|
||||
|
||||
ASSERT(version <= SPA_VERSION);
|
||||
ASSERT(version >= spa_version(spa));
|
||||
|
||||
spa->spa_uberblock.ub_version = version;
|
||||
vdev_config_dirty(spa->spa_root_vdev);
|
||||
}
|
||||
|
||||
/*
|
||||
* Set zpool properties.
|
||||
*/
|
||||
@@ -5399,32 +5736,39 @@ spa_sync_props(void *arg1, void *arg2, dmu_tx_t *tx)
|
||||
spa_t *spa = arg1;
|
||||
objset_t *mos = spa->spa_meta_objset;
|
||||
nvlist_t *nvp = arg2;
|
||||
nvpair_t *elem;
|
||||
uint64_t intval;
|
||||
char *strval;
|
||||
zpool_prop_t prop;
|
||||
const char *propname;
|
||||
zprop_type_t proptype;
|
||||
nvpair_t *elem = NULL;
|
||||
|
||||
mutex_enter(&spa->spa_props_lock);
|
||||
|
||||
elem = NULL;
|
||||
while ((elem = nvlist_next_nvpair(nvp, elem))) {
|
||||
switch (prop = zpool_name_to_prop(nvpair_name(elem))) {
|
||||
case ZPOOL_PROP_VERSION:
|
||||
uint64_t intval;
|
||||
char *strval, *fname;
|
||||
zpool_prop_t prop;
|
||||
const char *propname;
|
||||
zprop_type_t proptype;
|
||||
zfeature_info_t *feature;
|
||||
|
||||
prop = zpool_name_to_prop(nvpair_name(elem));
|
||||
switch ((int)prop) {
|
||||
case ZPROP_INVAL:
|
||||
/*
|
||||
* Only set version for non-zpool-creation cases
|
||||
* (set/import). spa_create() needs special care
|
||||
* for version setting.
|
||||
* We checked this earlier in spa_prop_validate().
|
||||
*/
|
||||
if (tx->tx_txg != TXG_INITIAL) {
|
||||
VERIFY(nvpair_value_uint64(elem,
|
||||
&intval) == 0);
|
||||
ASSERT(intval <= SPA_VERSION);
|
||||
ASSERT(intval >= spa_version(spa));
|
||||
spa->spa_uberblock.ub_version = intval;
|
||||
vdev_config_dirty(spa->spa_root_vdev);
|
||||
}
|
||||
ASSERT(zpool_prop_feature(nvpair_name(elem)));
|
||||
|
||||
fname = strchr(nvpair_name(elem), '@') + 1;
|
||||
VERIFY3U(0, ==, zfeature_lookup_name(fname, &feature));
|
||||
|
||||
spa_feature_enable(spa, feature, tx);
|
||||
break;
|
||||
|
||||
case ZPOOL_PROP_VERSION:
|
||||
VERIFY(nvpair_value_uint64(elem, &intval) == 0);
|
||||
/*
|
||||
* The version is synced seperatly before other
|
||||
* properties and should be correct by now.
|
||||
*/
|
||||
ASSERT3U(spa_version(spa), >=, intval);
|
||||
break;
|
||||
|
||||
case ZPOOL_PROP_ALTROOT:
|
||||
@@ -5461,14 +5805,10 @@ spa_sync_props(void *arg1, void *arg2, dmu_tx_t *tx)
|
||||
* Set pool property values in the poolprops mos object.
|
||||
*/
|
||||
if (spa->spa_pool_props_object == 0) {
|
||||
VERIFY((spa->spa_pool_props_object =
|
||||
zap_create(mos, DMU_OT_POOL_PROPS,
|
||||
DMU_OT_NONE, 0, tx)) > 0);
|
||||
|
||||
VERIFY(zap_update(mos,
|
||||
spa->spa_pool_props_object =
|
||||
zap_create_link(mos, DMU_OT_POOL_PROPS,
|
||||
DMU_POOL_DIRECTORY_OBJECT, DMU_POOL_PROPS,
|
||||
8, 1, &spa->spa_pool_props_object, tx)
|
||||
== 0);
|
||||
tx);
|
||||
}
|
||||
|
||||
/* normalize the property name */
|
||||
@@ -5567,6 +5907,11 @@ spa_sync_upgrades(spa_t *spa, dmu_tx_t *tx)
|
||||
/* Keeping the freedir open increases spa_minref */
|
||||
spa->spa_minref += 3;
|
||||
}
|
||||
|
||||
if (spa->spa_ubsync.ub_version < SPA_VERSION_FEATURES &&
|
||||
spa->spa_uberblock.ub_version >= SPA_VERSION_FEATURES) {
|
||||
spa_feature_create_zap_objects(spa, tx);
|
||||
}
|
||||
}
|
||||
|
||||
/*
|
||||
|
||||
Reference in New Issue
Block a user