PSARC 2006/077 zpool clear
PSARC 2006/139 FMA for ZFS
6284889 arc should replace the znode cache
6333006 DMU & DSL should not panic upon I/O error
6333092 concurrent reads to a file not scaling with number of readers
6338081 ZFS/FMA phase 1
6338386 need persistent error log
6341326 i/o error causes arc buf hash table corruption
6341639 zfs backup/restore should compute/verify checksum of backup stream
6348002 out of space due to changing properties
6354724 inaccurate error message from zfs restore
6354872 dmu_sync() blows predictive accounting
6355416 zpool scrubbing consumes all memory, system hung
6363995 df should only load libzfs when it encounters a ZFS filesystem
6366320 zfs backup/restore doesn't like signals
6368892 mount -m support needed for legacy mounts
6368902 boot archive fstat support needed for ZFS Mountroot
6369424 BFU complains when bfu'ing a ZFS root filesystem
6374062 mountroot support needed for ZFS
6376356 dirtying dbuf obj=43 lvl=0 blkid=0 but not tx_held
6378391 unused members of dmu_objset_stats_t
6378392 clean up zfs_cmd_t structure
6378685 buf_init should allocate its hash table more carefully
6378976 ziltest should be a first class citizen
6381086 zdb segfaults if there is a spa deferred-free bplist
6381203 deadlock due to i/o while assigning (tc_lock held)
6381209 freed space is not immediately available
6381344 'zpool clear'
6381345 FAULTED devices should really be UNAVAIL
6381346 import should mark devices as persistently unavailable
6383272 recursive mutex_enter() during log replay with zfs root
6386326 origin property is not displayed
6386354 libzfs does too much in its _init section, calls exit(1)
6386624 zpool should not complain about non-existent devices from libdiskmgt
6386910 spa needs to be i/o error hardened
6387735 need a mechanism to inject faults into ZFS
6387736 internal ZFS utilities should be placed in an ON-private package
6389928 libzfs should ship a lint library
6390609 malformed vdev config panics on zpool_create()
6390677 version number checking makes upgrades challenging
6390713 ztest hangs in zil_suspend()
6391873 metadata compression should be turned back on
6392113 ztest sometimes reports leaked blocks because ZIL isn't resilvered
6393004 minor memory leak in unique_insert()
/*
* CDDL HEADER START
*
* The contents of this file are subject to the terms of the
* Common Development and Distribution License (the "License").
* You may not use this file except in compliance with the License.
*
* You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
* or http://www.opensolaris.org/os/licensing.
* See the License for the specific language governing permissions
* and limitations under the License.
*
* When distributing Covered Code, include this CDDL HEADER in each
* file and include the License file at usr/src/OPENSOLARIS.LICENSE.
* If applicable, add the following below this CDDL HEADER, with the
* fields enclosed by brackets "[]" replaced with your own identifying
* information: Portions Copyright [yyyy] [name of copyright owner]
*
* CDDL HEADER END
*/
/*
* Copyright 2006 Sun Microsystems, Inc. All rights reserved.
* Use is subject to license terms.
*/
#pragma ident "%Z%%M% %I% %E% SMI"
#include <sys/dmu.h>
#include <sys/dmu_objset.h>
#include <sys/dmu_tx.h>
#include <sys/dsl_dataset.h>
#include <sys/dsl_dir.h>
#include <sys/dsl_prop.h>
#include <sys/spa.h>
#include <sys/zio_checksum.h> /* for the default checksum value */
#include <sys/zap.h>
#include <sys/fs/zfs.h>
#include "zfs_prop.h"
static int
dodefault(const char *propname, int intsz, int numint, void *buf)
{
zfs_prop_t prop;
if ((prop = zfs_name_to_prop(propname)) == ZFS_PROP_INVAL ||
zfs_prop_readonly(prop))
return (ENOENT);
if (zfs_prop_get_type(prop) == prop_type_string) {
if (intsz != 1)
return (EOVERFLOW);
(void) strncpy(buf, zfs_prop_default_string(prop), numint);
} else {
if (intsz != 8 || numint < 1)
return (EOVERFLOW);
*(uint64_t *)buf = zfs_prop_default_numeric(prop);
}
return (0);
}
static int
dsl_prop_get_impl(dsl_pool_t *dp, uint64_t ddobj, const char *propname,
int intsz, int numint, void *buf, char *setpoint)
{
int err = 0;
objset_t *mos = dp->dp_meta_objset;
if (setpoint)
setpoint[0] = '\0';
ASSERT(RW_LOCK_HELD(&dp->dp_config_rwlock));
while (ddobj != 0) {
dsl_dir_t *dd;
err = dsl_dir_open_obj(dp, ddobj, NULL, FTAG, &dd);
if (err)
break;
err = zap_lookup(mos, dd->dd_phys->dd_props_zapobj,
propname, intsz, numint, buf);
if (err != ENOENT) {
if (setpoint)
dsl_dir_name(dd, setpoint);
dsl_dir_close(dd, FTAG);
break;
}
ASSERT3U(err, ==, ENOENT);
ddobj = dd->dd_phys->dd_parent_obj;
dsl_dir_close(dd, FTAG);
}
if (err == ENOENT)
err = dodefault(propname, intsz, numint, buf);
return (err);
}
/*
* Register interest in the named property. We'll call the callback
* once to notify it of the current property value, and again each time
* the property changes, until this callback is unregistered.
*
* Return 0 on success, errno if the prop is not an integer value.
*/
int
dsl_prop_register(dsl_dataset_t *ds, const char *propname,
dsl_prop_changed_cb_t *callback, void *cbarg)
{
dsl_dir_t *dd;
uint64_t value;
dsl_prop_cb_record_t *cbr;
int err;
dd = ds->ds_dir;
rw_enter(&dd->dd_pool->dp_config_rwlock, RW_READER);
err = dsl_prop_get_impl(dd->dd_pool, dd->dd_object, propname,
8, 1, &value, NULL);
if (err == ENOENT) {
err = 0;
value = DSL_PROP_VALUE_UNDEFINED;
}
if (err != 0) {
rw_exit(&dd->dd_pool->dp_config_rwlock);
return (err);
}
cbr = kmem_alloc(sizeof (dsl_prop_cb_record_t), KM_SLEEP);
cbr->cbr_propname = kmem_alloc(strlen(propname)+1, KM_SLEEP);
(void) strcpy((char *)cbr->cbr_propname, propname);
cbr->cbr_func = callback;
cbr->cbr_arg = cbarg;
mutex_enter(&dd->dd_lock);
list_insert_head(&dd->dd_prop_cbs, cbr);
mutex_exit(&dd->dd_lock);
cbr->cbr_func(cbr->cbr_arg, value);
VERIFY(0 == dsl_dir_open_obj(dd->dd_pool, dd->dd_object,
NULL, cbr, &dd));
rw_exit(&dd->dd_pool->dp_config_rwlock);
/* Leave dataset open until this callback is unregistered */
return (0);
}
int
dsl_prop_get_ds(dsl_dir_t *dd, const char *propname,
int intsz, int numints, void *buf, char *setpoint)
{
int err;
rw_enter(&dd->dd_pool->dp_config_rwlock, RW_READER);
err = dsl_prop_get_impl(dd->dd_pool, dd->dd_object,
propname, intsz, numints, buf, setpoint);
rw_exit(&dd->dd_pool->dp_config_rwlock);
return (err);
}
int
dsl_prop_get(const char *ddname, const char *propname,
int intsz, int numints, void *buf, char *setpoint)
{
dsl_dir_t *dd;
const char *tail;
int err;
err = dsl_dir_open(ddname, FTAG, &dd, &tail);
if (err)
return (err);
if (tail && tail[0] != '@') {
dsl_dir_close(dd, FTAG);
return (ENOENT);
}
err = dsl_prop_get_ds(dd, propname, intsz, numints, buf, setpoint);
dsl_dir_close(dd, FTAG);
return (err);
}
/*
* Return 0 on success, ENOENT if ddname is invalid, EOVERFLOW if
* valuelen not big enough.
*/
int
dsl_prop_get_string(const char *ddname, const char *propname,
char *value, int valuelen, char *setpoint)
{
return (dsl_prop_get(ddname, propname, 1, valuelen, value, setpoint));
}
/*
* Get the current property value. It may have changed by the time this
* function returns, so it is NOT safe to follow up with
* dsl_prop_register() and assume that the value has not changed in
* between.
*
* Return 0 on success, ENOENT if ddname is invalid.
*/
int
dsl_prop_get_integer(const char *ddname, const char *propname,
uint64_t *valuep, char *setpoint)
{
return (dsl_prop_get(ddname, propname, 8, 1, valuep, setpoint));
}
int
dsl_prop_get_ds_integer(dsl_dir_t *dd, const char *propname,
uint64_t *valuep, char *setpoint)
{
return (dsl_prop_get_ds(dd, propname, 8, 1, valuep, setpoint));
}
/*
* Unregister this callback. Return 0 on success, ENOENT if ddname is
* invalid, ENOMSG if no matching callback registered.
*/
int
dsl_prop_unregister(dsl_dataset_t *ds, const char *propname,
dsl_prop_changed_cb_t *callback, void *cbarg)
{
dsl_dir_t *dd;
dsl_prop_cb_record_t *cbr;
dd = ds->ds_dir;
mutex_enter(&dd->dd_lock);
for (cbr = list_head(&dd->dd_prop_cbs);
cbr; cbr = list_next(&dd->dd_prop_cbs, cbr)) {
if (strcmp(cbr->cbr_propname, propname) == 0 &&
cbr->cbr_func == callback &&
cbr->cbr_arg == cbarg)
break;
}
if (cbr == NULL) {
mutex_exit(&dd->dd_lock);
return (ENOMSG);
}
list_remove(&dd->dd_prop_cbs, cbr);
mutex_exit(&dd->dd_lock);
kmem_free((void*)cbr->cbr_propname, strlen(cbr->cbr_propname)+1);
kmem_free(cbr, sizeof (dsl_prop_cb_record_t));
/* Clean up from dsl_prop_register */
dsl_dir_close(dd, cbr);
return (0);
}
static void
dsl_prop_changed_notify(dsl_pool_t *dp, uint64_t ddobj,
const char *propname, uint64_t value, int first)
{
dsl_dir_t *dd;
dsl_prop_cb_record_t *cbr;
objset_t *mos = dp->dp_meta_objset;
int err;
ASSERT(RW_WRITE_HELD(&dp->dp_config_rwlock));
err = dsl_dir_open_obj(dp, ddobj, NULL, FTAG, &dd);
if (err)
return;
if (!first) {
/*
* If the prop is set here, then this change is not
* being inherited here or below; stop the recursion.
*/
err = zap_lookup(mos, dd->dd_phys->dd_props_zapobj, propname,
8, 1, &value);
if (err == 0) {
dsl_dir_close(dd, FTAG);
return;
}
ASSERT3U(err, ==, ENOENT);
}
mutex_enter(&dd->dd_lock);
for (cbr = list_head(&dd->dd_prop_cbs);
cbr; cbr = list_next(&dd->dd_prop_cbs, cbr)) {
if (strcmp(cbr->cbr_propname, propname) == 0) {
cbr->cbr_func(cbr->cbr_arg, value);
}
}
mutex_exit(&dd->dd_lock);
if (dd->dd_phys->dd_child_dir_zapobj) {
zap_cursor_t zc;
zap_attribute_t za;
for (zap_cursor_init(&zc, mos,
dd->dd_phys->dd_child_dir_zapobj);
zap_cursor_retrieve(&zc, &za) == 0;
zap_cursor_advance(&zc)) {
/* XXX recursion could blow stack; esp. za! */
dsl_prop_changed_notify(dp, za.za_first_integer,
propname, value, FALSE);
}
zap_cursor_fini(&zc);
}
dsl_dir_close(dd, FTAG);
}
struct prop_set_arg {
const char *name;
int intsz;
int numints;
const void *buf;
};
static int
dsl_prop_set_sync(dsl_dir_t *dd, void *arg, dmu_tx_t *tx)
{
struct prop_set_arg *psa = arg;
objset_t *mos = dd->dd_pool->dp_meta_objset;
uint64_t zapobj = dd->dd_phys->dd_props_zapobj;
uint64_t intval;
int err, isint;
rw_enter(&dd->dd_pool->dp_config_rwlock, RW_WRITER);
isint = (dodefault(psa->name, 8, 1, &intval) == 0);
if (psa->numints == 0) {
err = zap_remove(mos, zapobj, psa->name, tx);
if (err == ENOENT) /* that's fine. */
err = 0;
if (err == 0 && isint) {
err = dsl_prop_get_impl(dd->dd_pool,
dd->dd_phys->dd_parent_obj, psa->name,
8, 1, &intval, NULL);
}
} else {
err = zap_update(mos, zapobj, psa->name,
psa->intsz, psa->numints, psa->buf, tx);
if (isint)
intval = *(uint64_t *)psa->buf;
}
if (err == 0 && isint) {
dsl_prop_changed_notify(dd->dd_pool,
dd->dd_object, psa->name, intval, TRUE);
}
rw_exit(&dd->dd_pool->dp_config_rwlock);
return (err);
}
int
dsl_prop_set(const char *ddname, const char *propname,
int intsz, int numints, const void *buf)
{
dsl_dir_t *dd;
int err;
struct prop_set_arg psa;
err = dsl_dir_open(ddname, FTAG, &dd, NULL);
if (err)
return (err);
psa.name = propname;
psa.intsz = intsz;
psa.numints = numints;
psa.buf = buf;
err = dsl_dir_sync_task(dd, dsl_prop_set_sync, &psa, 1<<20);
dsl_dir_close(dd, FTAG);
return (err);
}
/*
* Iterate over all properties for this dataset and return them in an nvlist.
*/
int
dsl_prop_get_all(objset_t *os, nvlist_t **nvp)
{
dsl_dataset_t *ds = os->os->os_dsl_dataset;
dsl_dir_t *dd, *parent;
int err = 0;
dsl_pool_t *dp;
objset_t *mos;
zap_cursor_t zc;
zap_attribute_t za;
char setpoint[MAXNAMELEN];
char *tmp;
nvlist_t *prop;
if (dsl_dataset_is_snapshot(ds)) {
VERIFY(nvlist_alloc(nvp, NV_UNIQUE_NAME, KM_SLEEP) == 0);
return (0);
}
dd = ds->ds_dir;
VERIFY(nvlist_alloc(nvp, NV_UNIQUE_NAME, KM_SLEEP) == 0);
dp = dd->dd_pool;
mos = dp->dp_meta_objset;
rw_enter(&dp->dp_config_rwlock, RW_READER);
while (dd != NULL) {
dsl_dir_name(dd, setpoint);
for (zap_cursor_init(&zc, mos, dd->dd_phys->dd_props_zapobj);
(err = zap_cursor_retrieve(&zc, &za)) == 0;
zap_cursor_advance(&zc)) {
if (nvlist_lookup_nvlist(*nvp, za.za_name, &prop) == 0)
continue;
VERIFY(nvlist_alloc(&prop, NV_UNIQUE_NAME,
KM_SLEEP) == 0);
if (za.za_integer_length == 1) {
/*
* String property
*/
tmp = kmem_alloc(za.za_num_integers, KM_SLEEP);
err = zap_lookup(mos,
dd->dd_phys->dd_props_zapobj,
za.za_name, 1, za.za_num_integers,
tmp);
if (err != 0) {
kmem_free(tmp, za.za_num_integers);
break;
}
VERIFY(nvlist_add_string(prop,
ZFS_PROP_VALUE, tmp) == 0);
kmem_free(tmp, za.za_num_integers);
} else {
/*
* Integer property
*/
ASSERT(za.za_integer_length == 8);
(void) nvlist_add_uint64(prop, ZFS_PROP_VALUE,
za.za_first_integer);
}
VERIFY(nvlist_add_string(prop,
ZFS_PROP_SOURCE, setpoint) == 0);
VERIFY(nvlist_add_nvlist(*nvp, za.za_name,
prop) == 0);
nvlist_free(prop);
}
zap_cursor_fini(&zc);
if (err != ENOENT) {
if (dd != ds->ds_dir)
dsl_dir_close(dd, FTAG);
break;
} else {
err = 0;
}
/*
* Continue to parent.
*/
if (dd->dd_phys->dd_parent_obj == 0)
parent = NULL;
else
err = dsl_dir_open_obj(dp,
dd->dd_phys->dd_parent_obj, NULL, FTAG, &parent);
if (dd != ds->ds_dir)
dsl_dir_close(dd, FTAG);
if (err)
break;
dd = parent;
}
rw_exit(&dp->dp_config_rwlock);
return (err);
}