dmu_objset.c revision a2afb611b30628fb74ad9eade4ae465f9031e262
fa9e4066f08beec538e775443c5be79dd423fcabahrens * CDDL HEADER START
fa9e4066f08beec538e775443c5be79dd423fcabahrens * The contents of this file are subject to the terms of the
ea8dc4b6d2251b437950c0056bc626b311c73c27eschrock * Common Development and Distribution License (the "License").
ea8dc4b6d2251b437950c0056bc626b311c73c27eschrock * You may not use this file except in compliance with the License.
fa9e4066f08beec538e775443c5be79dd423fcabahrens * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
fa9e4066f08beec538e775443c5be79dd423fcabahrens * See the License for the specific language governing permissions
fa9e4066f08beec538e775443c5be79dd423fcabahrens * and limitations under the License.
fa9e4066f08beec538e775443c5be79dd423fcabahrens * When distributing Covered Code, include this CDDL HEADER in each
fa9e4066f08beec538e775443c5be79dd423fcabahrens * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
fa9e4066f08beec538e775443c5be79dd423fcabahrens * If applicable, add the following below this CDDL HEADER, with the
fa9e4066f08beec538e775443c5be79dd423fcabahrens * fields enclosed by brackets "[]" replaced with your own identifying
fa9e4066f08beec538e775443c5be79dd423fcabahrens * information: Portions Copyright [yyyy] [name of copyright owner]
fa9e4066f08beec538e775443c5be79dd423fcabahrens * CDDL HEADER END
8d18220deb04ec7b12410cd90deb4d45e66d49bfMark J Musante * Copyright (c) 2005, 2010, Oracle and/or its affiliates. All rights reserved.
840345f69c01af33ad169d6b4a6ae7ea78b4218aGeorge Wilson * Copyright (c) 2013 by Delphix. All rights reserved.
9dc3941c735ef88de46e850f745aa556d3a071a5Sašo Kiselkov * Copyright (c) 2013 by Saso Kiselkov. All rights reserved.
fa9e4066f08beec538e775443c5be79dd423fcabahrens * Copyright (c) 2013, Joyent, Inc. All rights reserved.
fa9e4066f08beec538e775443c5be79dd423fcabahrens/* Portions Copyright 2010 Robert Milkowski */
16a4a8074274d2d7cc408589cf6359f4a378c861George Wilson * Needed to close a window in dnode_move() that allows the objset to be freed
16a4a8074274d2d7cc408589cf6359f4a378c861George Wilson * before it can be safely accessed.
80eb36f241abf8c076119fb4c49a55fd61ebc710George Wilson if ((ds = os->os_dsl_dataset) != NULL && ds->ds_dir)
fa9e4066f08beec538e775443c5be79dd423fcabahrens * Inheritance should have been done by now.
88ecc943b4eb72f7c4fbbd8435997b85ef171fc3George Wilson os->os_checksum = zio_checksum_select(newval, ZIO_CHECKSUM_ON_VALUE);
88ecc943b4eb72f7c4fbbd8435997b85ef171fc3George Wilsoncompression_changed_cb(void *arg, uint64_t newval)
88ecc943b4eb72f7c4fbbd8435997b85ef171fc3George Wilson * Inheritance and range checking should have been done by now.
88ecc943b4eb72f7c4fbbd8435997b85ef171fc3George Wilson os->os_compress = zio_compress_select(newval, ZIO_COMPRESS_ON_VALUE);
88ecc943b4eb72f7c4fbbd8435997b85ef171fc3George Wilson * Inheritance and range checking should have been done by now.
b24ab6762772a3f6a89393947930c7fa61306783Jeff Bonwick ASSERT(newval <= spa_max_replication(os->os_spa));
b24ab6762772a3f6a89393947930c7fa61306783Jeff Bonwick * Inheritance should have been done by now.
b24ab6762772a3f6a89393947930c7fa61306783Jeff Bonwick checksum = zio_checksum_dedup_select(spa, newval, ZIO_CHECKSUM_OFF);
b24ab6762772a3f6a89393947930c7fa61306783Jeff Bonwick os->os_dedup_checksum = checksum & ZIO_CHECKSUM_MASK;
b24ab6762772a3f6a89393947930c7fa61306783Jeff Bonwick os->os_dedup_verify = !!(checksum & ZIO_CHECKSUM_VERIFY);
b24ab6762772a3f6a89393947930c7fa61306783Jeff Bonwickprimary_cache_changed_cb(void *arg, uint64_t newval)
b24ab6762772a3f6a89393947930c7fa61306783Jeff Bonwick * Inheritance and range checking should have been done by now.
b24ab6762772a3f6a89393947930c7fa61306783Jeff Bonwick ASSERT(newval == ZFS_CACHE_ALL || newval == ZFS_CACHE_NONE ||
fa9e4066f08beec538e775443c5be79dd423fcabahrenssecondary_cache_changed_cb(void *arg, uint64_t newval)
fa9e4066f08beec538e775443c5be79dd423fcabahrens * Inheritance and range checking should have been done by now.
fa9e4066f08beec538e775443c5be79dd423fcabahrens ASSERT(newval == ZFS_CACHE_ALL || newval == ZFS_CACHE_NONE ||
fa9e4066f08beec538e775443c5be79dd423fcabahrens * Inheritance and range checking should have been done by now.
fa9e4066f08beec538e775443c5be79dd423fcabahrens ASSERT(newval == ZFS_SYNC_STANDARD || newval == ZFS_SYNC_ALWAYS ||
a33cae9802e94744efee12a7a77c89360645eae8Tim Haley ASSERT(size == OBJSET_OLD_PHYS_SIZE || size == sizeof (objset_phys_t));
a33cae9802e94744efee12a7a77c89360645eae8Tim Haley byteswap_uint64_array(&osp->os_zil_header, sizeof (zil_header_t));
a15215608b8bd90f714f6db21ee623b584607cb6Jeff Bonwickdmu_objset_open_impl(spa_t *spa, dsl_dataset_t *ds, blkptr_t *bp,
a15215608b8bd90f714f6db21ee623b584607cb6Jeff Bonwick ASSERT(ds == NULL || MUTEX_HELD(&ds->ds_opening_lock));
a15215608b8bd90f714f6db21ee623b584607cb6Jeff Bonwick SET_BOOKMARK(&zb, ds ? ds->ds_object : DMU_META_OBJSET,
a15215608b8bd90f714f6db21ee623b584607cb6Jeff Bonwick ZIO_PRIORITY_SYNC_READ, ZIO_FLAG_CANFAIL, &aflags, &zb);
a15215608b8bd90f714f6db21ee623b584607cb6Jeff Bonwick /* convert checksum errors into IO errors */
a15215608b8bd90f714f6db21ee623b584607cb6Jeff Bonwick /* Increase the blocksize if we are permitted. */
a15215608b8bd90f714f6db21ee623b584607cb6Jeff Bonwick if (spa_version(spa) >= SPA_VERSION_USERSPACE &&
a15215608b8bd90f714f6db21ee623b584607cb6Jeff Bonwick arc_buf_size(os->os_phys_buf) < sizeof (objset_phys_t)) {
a15215608b8bd90f714f6db21ee623b584607cb6Jeff Bonwick int size = spa_version(spa) >= SPA_VERSION_USERSPACE ?
ecc2d604e885a75cc75e647b5641af99d5a6f4a6bonwick * Note: the changed_cb will be called once before the register
ecc2d604e885a75cc75e647b5641af99d5a6f4a6bonwick * func returns, thus changing the checksum/compression from the
fa9e4066f08beec538e775443c5be79dd423fcabahrens * default (fletcher2/off). Snapshots don't need to know about
fa9e4066f08beec538e775443c5be79dd423fcabahrens if (err == 0) {
fa9e4066f08beec538e775443c5be79dd423fcabahrens if (err == 0) {
fa9e4066f08beec538e775443c5be79dd423fcabahrens if (err == 0) {
5f5f7a6f9c8e9c1587a54e690556d756ec67558cahrens if (err == 0) {
ecc2d604e885a75cc75e647b5641af99d5a6f4a6bonwick if (err == 0) {
fa9e4066f08beec538e775443c5be79dd423fcabahrens if (err == 0) {
80eb36f241abf8c076119fb4c49a55fd61ebc710George Wilson /* It's the meta-objset. */
d6e555bdd793b8bc8fe57d5f12c3d69c813d0661George Wilson os->os_zil_header = os->os_phys->os_zil_header;
d6e555bdd793b8bc8fe57d5f12c3d69c813d0661George Wilson os->os_zil = zil_alloc(os, &os->os_zil_header);
ecc2d604e885a75cc75e647b5641af99d5a6f4a6bonwick for (i = 0; i < TXG_SIZE; i++) {
ecc2d604e885a75cc75e647b5641af99d5a6f4a6bonwick list_create(&os->os_dirty_dnodes[i], sizeof (dnode_t),
d6e555bdd793b8bc8fe57d5f12c3d69c813d0661George Wilson list_create(&os->os_free_dnodes[i], sizeof (dnode_t),
ecc2d604e885a75cc75e647b5641af99d5a6f4a6bonwick list_create(&os->os_downgraded_dbufs, sizeof (dmu_buf_impl_t),
ecc2d604e885a75cc75e647b5641af99d5a6f4a6bonwick mutex_init(&os->os_lock, NULL, MUTEX_DEFAULT, NULL);
ecc2d604e885a75cc75e647b5641af99d5a6f4a6bonwick mutex_init(&os->os_obj_lock, NULL, MUTEX_DEFAULT, NULL);
ecc2d604e885a75cc75e647b5641af99d5a6f4a6bonwick mutex_init(&os->os_user_ptr_lock, NULL, MUTEX_DEFAULT, NULL);
ecc2d604e885a75cc75e647b5641af99d5a6f4a6bonwick if (arc_buf_size(os->os_phys_buf) >= sizeof (objset_phys_t)) {
ecc2d604e885a75cc75e647b5641af99d5a6f4a6bonwick &os->os_phys->os_userused_dnode, DMU_USERUSED_OBJECT,
ecc2d604e885a75cc75e647b5641af99d5a6f4a6bonwick &os->os_phys->os_groupused_dnode, DMU_GROUPUSED_OBJECT,
ecc2d604e885a75cc75e647b5641af99d5a6f4a6bonwick * We should be the only thread trying to do this because we
ecc2d604e885a75cc75e647b5641af99d5a6f4a6bonwick * have ds_opening_lock
80eb36f241abf8c076119fb4c49a55fd61ebc710George Wilsondmu_objset_from_ds(dsl_dataset_t *ds, objset_t **osp)
d6e555bdd793b8bc8fe57d5f12c3d69c813d0661George Wilson err = dmu_objset_open_impl(dsl_dataset_get_spa(ds),
d6e555bdd793b8bc8fe57d5f12c3d69c813d0661George Wilson * Holds the pool while the objset is held. Therefore only one objset
d6e555bdd793b8bc8fe57d5f12c3d69c813d0661George Wilson * can be held at a time.
80eb36f241abf8c076119fb4c49a55fd61ebc710George Wilsondmu_objset_hold(const char *name, void *tag, objset_t **osp)
ecc2d604e885a75cc75e647b5641af99d5a6f4a6bonwick if (err != 0) {
80eb36f241abf8c076119fb4c49a55fd61ebc710George Wilson * dsl_pool must not be held when this is called.
d6e555bdd793b8bc8fe57d5f12c3d69c813d0661George Wilson * Upon successful return, there will be a longhold on the dataset,
d6e555bdd793b8bc8fe57d5f12c3d69c813d0661George Wilson * and the dsl_pool will not be held.
d6e555bdd793b8bc8fe57d5f12c3d69c813d0661George Wilsondmu_objset_own(const char *name, dmu_objset_type_t type,
d6e555bdd793b8bc8fe57d5f12c3d69c813d0661George Wilson boolean_t readonly, void *tag, objset_t **osp)
d6e555bdd793b8bc8fe57d5f12c3d69c813d0661George Wilson } else if (type != DMU_OST_ANY && type != (*osp)->os_phys->os_type) {
80eb36f241abf8c076119fb4c49a55fd61ebc710George Wilson } else if (!readonly && dsl_dataset_is_snapshot(ds)) {
80eb36f241abf8c076119fb4c49a55fd61ebc710George Wilson * When we are called, os MUST refer to an objset associated with a dataset
80eb36f241abf8c076119fb4c49a55fd61ebc710George Wilson * that is owned by 'tag'; that is, is held and long held by 'tag' and ds_owner
80eb36f241abf8c076119fb4c49a55fd61ebc710George Wilson * == tag. We will then release and reacquire ownership of the dataset while
80eb36f241abf8c076119fb4c49a55fd61ebc710George Wilson * holding the pool config_rwlock so that no intervening namespace or ownership
80eb36f241abf8c076119fb4c49a55fd61ebc710George Wilson * changes can occur.
80eb36f241abf8c076119fb4c49a55fd61ebc710George Wilson * This exists solely to accommodate zfs_ioc_userspace_upgrade()'s desire to
d6e555bdd793b8bc8fe57d5f12c3d69c813d0661George Wilson * release the hold on its dataset and acquire a new one on the dataset of the
d6e555bdd793b8bc8fe57d5f12c3d69c813d0661George Wilson * same name so that it can be partially torn down and reconstructed.
d6e555bdd793b8bc8fe57d5f12c3d69c813d0661George Wilsondmu_objset_refresh_ownership(objset_t *os, void *tag)
d6e555bdd793b8bc8fe57d5f12c3d69c813d0661George Wilson VERIFY0(dsl_dataset_own(dp, name, tag, &newds));
80eb36f241abf8c076119fb4c49a55fd61ebc710George Wilson /* process the mdn last, since the other dnodes have holds on it */
80eb36f241abf8c076119fb4c49a55fd61ebc710George Wilson list_remove(&os->os_dnodes, DMU_META_DNODE(os));
d6e555bdd793b8bc8fe57d5f12c3d69c813d0661George Wilson list_insert_tail(&os->os_dnodes, DMU_META_DNODE(os));
80eb36f241abf8c076119fb4c49a55fd61ebc710George Wilson * Find the first dnode with holds. We have to do this dance
80eb36f241abf8c076119fb4c49a55fd61ebc710George Wilson * because dnode_add_ref() only works if you already have a
d6e555bdd793b8bc8fe57d5f12c3d69c813d0661George Wilson * hold. If there are no holds then it has no dbufs so OK to
80eb36f241abf8c076119fb4c49a55fd61ebc710George Wilson } while (next_dn && !dnode_add_ref(next_dn, FTAG));
80eb36f241abf8c076119fb4c49a55fd61ebc710George Wilson for (int t = 0; t < TXG_SIZE; t++)
80eb36f241abf8c076119fb4c49a55fd61ebc710George Wilson ASSERT3P(list_head(&os->os_dnodes), ==, NULL);
80eb36f241abf8c076119fb4c49a55fd61ebc710George Wilson VERIFY(arc_buf_remove_ref(os->os_phys_buf, &os->os_phys_buf));
80eb36f241abf8c076119fb4c49a55fd61ebc710George Wilson * This is a barrier to prevent the objset from going away in
8d18220deb04ec7b12410cd90deb4d45e66d49bfMark J Musante * dnode_move() until we can safely ensure that the objset is still in
8d18220deb04ec7b12410cd90deb4d45e66d49bfMark J Musante * use. We consider the objset valid before the barrier and invalid
80eb36f241abf8c076119fb4c49a55fd61ebc710George Wilson * after the barrier.
80eb36f241abf8c076119fb4c49a55fd61ebc710George Wilson return (dsl_dir_snap_cmtime(os->os_dsl_dataset->ds_dir));
8d18220deb04ec7b12410cd90deb4d45e66d49bfMark J Musante/* called from dsl for meta-objset */
80eb36f241abf8c076119fb4c49a55fd61ebc710George Wilsondmu_objset_create_impl(spa_t *spa, dsl_dataset_t *ds, blkptr_t *bp,
80eb36f241abf8c076119fb4c49a55fd61ebc710George Wilson VERIFY0(dmu_objset_open_impl(spa, NULL, bp, &os));
80eb36f241abf8c076119fb4c49a55fd61ebc710George Wilson dnode_allocate(mdn, DMU_OT_DNODE, 1 << DNODE_BLOCK_SHIFT,
8d18220deb04ec7b12410cd90deb4d45e66d49bfMark J Musante * We don't want to have to increase the meta-dnode's nlevels
80eb36f241abf8c076119fb4c49a55fd61ebc710George Wilson * later, because then we could do it in quiescing context while
80eb36f241abf8c076119fb4c49a55fd61ebc710George Wilson * we are also accessing it in open context.
80eb36f241abf8c076119fb4c49a55fd61ebc710George Wilson * This precaution is not necessary for the MOS (ds == NULL),
80eb36f241abf8c076119fb4c49a55fd61ebc710George Wilson * because the MOS is only updated in syncing context.
80eb36f241abf8c076119fb4c49a55fd61ebc710George Wilson * This is most fortunate: the MOS is the only objset that
80eb36f241abf8c076119fb4c49a55fd61ebc710George Wilson * needs to be synced multiple times as spa_sync() iterates
80eb36f241abf8c076119fb4c49a55fd61ebc710George Wilson * to convergence, so minimizing its dn_nlevels matters.
ecc2d604e885a75cc75e647b5641af99d5a6f4a6bonwick * Determine the number of levels necessary for the meta-dnode
ecc2d604e885a75cc75e647b5641af99d5a6f4a6bonwick * to contain DN_MAX_OBJECT dnodes.
d6e555bdd793b8bc8fe57d5f12c3d69c813d0661George Wilson while ((uint64_t)mdn->dn_nblkptr << (mdn->dn_datablkshift +
fa9e4066f08beec538e775443c5be79dd423fcabahrens (levels - 1) * (mdn->dn_indblkshift - SPA_BLKPTRSHIFT)) <
5ad820458efd0fdb914baff9c1447c22b819fa23nd os->os_phys->os_flags |= OBJSET_FLAG_USERACCOUNTING_COMPLETE;
ecc2d604e885a75cc75e647b5641af99d5a6f4a6bonwicktypedef struct dmu_objset_create_arg {
ecc2d604e885a75cc75e647b5641af99d5a6f4a6bonwick const char *doca_name;
16a4a8074274d2d7cc408589cf6359f4a378c861George Wilson void (*doca_userfunc)(objset_t *os, void *arg,
b24ab6762772a3f6a89393947930c7fa61306783Jeff Bonwickdmu_objset_create_check(void *arg, dmu_tx_t *tx)
fa9e4066f08beec538e775443c5be79dd423fcabahrens const char *tail;
ecc2d604e885a75cc75e647b5641af99d5a6f4a6bonwick error = dsl_dir_hold(dp, doca->doca_name, FTAG, &pdd, &tail);
fa9e4066f08beec538e775443c5be79dd423fcabahrens error = dsl_fs_ss_limit_check(pdd, 1, ZFS_PROP_FILESYSTEM_LIMIT, NULL,
16a4a8074274d2d7cc408589cf6359f4a378c861George Wilsondmu_objset_create_sync(void *arg, dmu_tx_t *tx)
fa9e4066f08beec538e775443c5be79dd423fcabahrens const char *tail;
16a4a8074274d2d7cc408589cf6359f4a378c861George Wilson VERIFY0(dsl_dir_hold(dp, doca->doca_name, FTAG, &pdd, &tail));
16a4a8074274d2d7cc408589cf6359f4a378c861George Wilson obj = dsl_dataset_create_sync(pdd, tail, NULL, doca->doca_flags,
fa9e4066f08beec538e775443c5be79dd423fcabahrens VERIFY0(dsl_dataset_hold_obj(pdd->dd_pool, obj, FTAG, &ds));
16a4a8074274d2d7cc408589cf6359f4a378c861George Wilson os = dmu_objset_create_impl(pdd->dd_pool->dp_spa,
44cd46cadd9aab751dae6a4023c1cb5bf316d274billmdmu_objset_create(const char *name, dmu_objset_type_t type, uint64_t flags,
44cd46cadd9aab751dae6a4023c1cb5bf316d274billm void (*func)(objset_t *os, void *arg, cred_t *cr, dmu_tx_t *tx), void *arg)
ecc2d604e885a75cc75e647b5641af99d5a6f4a6bonwick dmu_objset_create_check, dmu_objset_create_sync, &doca, 5));
ecc2d604e885a75cc75e647b5641af99d5a6f4a6bonwick const char *tail;
ecc2d604e885a75cc75e647b5641af99d5a6f4a6bonwick error = dsl_dir_hold(dp, doca->doca_clone, FTAG, &pdd, &tail);
ecc2d604e885a75cc75e647b5641af99d5a6f4a6bonwick /* You can't clone across pools. */
80eb36f241abf8c076119fb4c49a55fd61ebc710George Wilson error = dsl_fs_ss_limit_check(pdd, 1, ZFS_PROP_FILESYSTEM_LIMIT, NULL,
80eb36f241abf8c076119fb4c49a55fd61ebc710George Wilson error = dsl_dataset_hold(dp, doca->doca_origin, FTAG, &origin);
80eb36f241abf8c076119fb4c49a55fd61ebc710George Wilson /* You can't clone across pools. */
80eb36f241abf8c076119fb4c49a55fd61ebc710George Wilson /* You can only clone snapshots, not the head datasets. */
ecc2d604e885a75cc75e647b5641af99d5a6f4a6bonwick return (0);
80eb36f241abf8c076119fb4c49a55fd61ebc710George Wilson VERIFY0(dsl_dir_hold(dp, doca->doca_clone, FTAG, &pdd, &tail));
80eb36f241abf8c076119fb4c49a55fd61ebc710George Wilson VERIFY0(dsl_dataset_hold(dp, doca->doca_origin, FTAG, &origin));
80eb36f241abf8c076119fb4c49a55fd61ebc710George Wilson obj = dsl_dataset_create_sync(pdd, tail, origin, 0,
ecc2d604e885a75cc75e647b5641af99d5a6f4a6bonwick VERIFY0(dsl_dataset_hold_obj(pdd->dd_pool, obj, FTAG, &ds));
44cd46cadd9aab751dae6a4023c1cb5bf316d274billmdmu_objset_clone(const char *clone, const char *origin)
468c413a79615e77179e8d98f22a7e513a8135bdTim Haley dmu_objset_clone_check, dmu_objset_clone_sync, &doca, 5));
468c413a79615e77179e8d98f22a7e513a8135bdTim Haleydmu_objset_snapshot_one(const char *fsname, const char *snapname)
80eb36f241abf8c076119fb4c49a55fd61ebc710George Wilson char *longsnap = kmem_asprintf("%s@%s", fsname, snapname);
80eb36f241abf8c076119fb4c49a55fd61ebc710George Wilson err = dsl_dataset_snapshot(snaps, NULL, NULL);
44cd46cadd9aab751dae6a4023c1cb5bf316d274billmdmu_objset_sync_dnodes(list_t *list, list_t *newlist, dmu_tx_t *tx)
ecc2d604e885a75cc75e647b5641af99d5a6f4a6bonwick * Initialize dn_zio outside dnode_sync() because the
ecc2d604e885a75cc75e647b5641af99d5a6f4a6bonwick * meta-dnode needs to set it outside dnode_sync().
16a4a8074274d2d7cc408589cf6359f4a378c861George Wilson/* ARGSUSED */
16a4a8074274d2d7cc408589cf6359f4a378c861George Wilsondmu_objset_write_ready(zio_t *zio, arc_buf_t *abuf, void *arg)
16a4a8074274d2d7cc408589cf6359f4a378c861George Wilson dnode_phys_t *dnp = &os->os_phys->os_meta_dnode;
16a4a8074274d2d7cc408589cf6359f4a378c861George Wilson * Update rootbp fill count: it should be the number of objects
16a4a8074274d2d7cc408589cf6359f4a378c861George Wilson * allocated in the object set (not counting the "special"
16a4a8074274d2d7cc408589cf6359f4a378c861George Wilson * objects that are stored in the objset_phys_t -- the meta
16a4a8074274d2d7cc408589cf6359f4a378c861George Wilson * dnode and user/group accounting objects).
16a4a8074274d2d7cc408589cf6359f4a378c861George Wilson/* ARGSUSED */
16a4a8074274d2d7cc408589cf6359f4a378c861George Wilsondmu_objset_write_done(zio_t *zio, arc_buf_t *abuf, void *arg)
16a4a8074274d2d7cc408589cf6359f4a378c861George Wilson (void) dsl_dataset_block_kill(ds, bp_orig, tx, B_TRUE);
16a4a8074274d2d7cc408589cf6359f4a378c861George Wilson/* called from dsl */
16a4a8074274d2d7cc408589cf6359f4a378c861George Wilsondmu_objset_sync(objset_t *os, zio_t *pio, dmu_tx_t *tx)
16a4a8074274d2d7cc408589cf6359f4a378c861George Wilson dprintf_ds(os->os_dsl_dataset, "txg=%llu\n", tx->tx_txg);
16a4a8074274d2d7cc408589cf6359f4a378c861George Wilson /* XXX the write_done callback should really give us the tx... */
16a4a8074274d2d7cc408589cf6359f4a378c861George Wilson * This is the MOS. If we have upgraded,
16a4a8074274d2d7cc408589cf6359f4a378c861George Wilson * spa_max_replication() could change, so reset
16a4a8074274d2d7cc408589cf6359f4a378c861George Wilson * os_copies here.
16a4a8074274d2d7cc408589cf6359f4a378c861George Wilson os->os_copies = spa_max_replication(os->os_spa);
16a4a8074274d2d7cc408589cf6359f4a378c861George Wilson * Create the root block IO
16a4a8074274d2d7cc408589cf6359f4a378c861George Wilson os->os_dsl_dataset->ds_object : DMU_META_OBJSET,
16a4a8074274d2d7cc408589cf6359f4a378c861George Wilson ZB_ROOT_OBJECT, ZB_ROOT_LEVEL, ZB_ROOT_BLKID);
16a4a8074274d2d7cc408589cf6359f4a378c861George Wilson arc_release(os->os_phys_buf, &os->os_phys_buf);
16a4a8074274d2d7cc408589cf6359f4a378c861George Wilson os->os_rootbp, os->os_phys_buf, DMU_OS_IS_L2CACHEABLE(os),
16a4a8074274d2d7cc408589cf6359f4a378c861George Wilson DMU_OS_IS_L2COMPRESSIBLE(os), &zp, dmu_objset_write_ready,
16a4a8074274d2d7cc408589cf6359f4a378c861George Wilson NULL, dmu_objset_write_done, os, ZIO_PRIORITY_ASYNC_WRITE,
16a4a8074274d2d7cc408589cf6359f4a378c861George Wilson * Sync special dnodes - the parent IO for the sync is the root block
16a4a8074274d2d7cc408589cf6359f4a378c861George Wilson DMU_USERUSED_DNODE(os)->dn_type != DMU_OT_NONE) {
16a4a8074274d2d7cc408589cf6359f4a378c861George Wilson * We must create the list here because it uses the
16a4a8074274d2d7cc408589cf6359f4a378c861George Wilson * dn_dirty_link[] of this txg.
16a4a8074274d2d7cc408589cf6359f4a378c861George Wilson dmu_objset_sync_dnodes(&os->os_free_dnodes[txgoff], newlist, tx);
16a4a8074274d2d7cc408589cf6359f4a378c861George Wilson dmu_objset_sync_dnodes(&os->os_dirty_dnodes[txgoff], newlist, tx);
16a4a8074274d2d7cc408589cf6359f4a378c861George Wilson list = &DMU_META_DNODE(os)->dn_dirty_records[txgoff];
16a4a8074274d2d7cc408589cf6359f4a378c861George Wilson * Free intent log blocks up to this tx.
16a4a8074274d2d7cc408589cf6359f4a378c861George Wilson os->os_phys->os_zil_header = os->os_zil_header;
16a4a8074274d2d7cc408589cf6359f4a378c861George Wilsondmu_objset_is_dirty(objset_t *os, uint64_t txg)
16a4a8074274d2d7cc408589cf6359f4a378c861George Wilson return (!list_is_empty(&os->os_dirty_dnodes[txg & TXG_MASK]) ||
16a4a8074274d2d7cc408589cf6359f4a378c861George Wilson !list_is_empty(&os->os_free_dnodes[txg & TXG_MASK]));
16a4a8074274d2d7cc408589cf6359f4a378c861George Wilsonstatic objset_used_cb_t *used_cbs[DMU_OST_NUMTYPES];
fa9e4066f08beec538e775443c5be79dd423fcabahrensdmu_objset_register_type(dmu_objset_type_t ost, objset_used_cb_t *cb)
b24ab6762772a3f6a89393947930c7fa61306783Jeff Bonwick return (spa_version(os->os_spa) >= SPA_VERSION_USERSPACE &&
fa9e4066f08beec538e775443c5be79dd423fcabahrensdo_userquota_update(objset_t *os, uint64_t used, uint64_t flags,
fa9e4066f08beec538e775443c5be79dd423fcabahrens uint64_t user, uint64_t group, boolean_t subtract, dmu_tx_t *tx)
88ecc943b4eb72f7c4fbbd8435997b85ef171fc3George Wilson if ((flags & DNODE_FLAG_USERUSED_ACCOUNTED)) {
16a4a8074274d2d7cc408589cf6359f4a378c861George Wilson VERIFY3U(0, ==, zap_increment_int(os, DMU_USERUSED_OBJECT,
16a4a8074274d2d7cc408589cf6359f4a378c861George Wilson VERIFY3U(0, ==, zap_increment_int(os, DMU_GROUPUSED_OBJECT,
16a4a8074274d2d7cc408589cf6359f4a378c861George Wilsondmu_objset_do_userquota_updates(objset_t *os, dmu_tx_t *tx)
ecc2d604e885a75cc75e647b5641af99d5a6f4a6bonwick ASSERT(list_head(list) == NULL || dmu_objset_userused_enabled(os));
468c413a79615e77179e8d98f22a7e513a8135bdTim Haley /* Allocate the user/groupused objects if necessary. */
fa9e4066f08beec538e775443c5be79dd423fcabahrens if (DMU_USERUSED_DNODE(os)->dn_type == DMU_OT_NONE) {
ecc2d604e885a75cc75e647b5641af99d5a6f4a6bonwick * We intentionally modify the zap object even if the
ecc2d604e885a75cc75e647b5641af99d5a6f4a6bonwick * net delta is zero. Otherwise
fa9e4066f08beec538e775443c5be79dd423fcabahrens * the block of the zap obj could be shared between
468c413a79615e77179e8d98f22a7e513a8135bdTim Haley * datasets but need to be different between them after
468c413a79615e77179e8d98f22a7e513a8135bdTim Haley * a bprewrite.
16a4a8074274d2d7cc408589cf6359f4a378c861George Wilson do_userquota_update(os, dn->dn_oldused, dn->dn_oldflags,
ecc2d604e885a75cc75e647b5641af99d5a6f4a6bonwick * Returns a pointer to data to find uid/gid from
fa9e4066f08beec538e775443c5be79dd423fcabahrens * If a dirty record for transaction group that is syncing can't
fa9e4066f08beec538e775443c5be79dd423fcabahrens * be found then NULL is returned. In the NULL case it is assumed
fa9e4066f08beec538e775443c5be79dd423fcabahrens * the uid/gid aren't changing.
fa9e4066f08beec538e775443c5be79dd423fcabahrensstatic void *
fa9e4066f08beec538e775443c5be79dd423fcabahrensdmu_objset_userquota_find_data(dmu_buf_impl_t *db, dmu_tx_t *tx)
9eb57f7f3fbb970d4b9b89dcd5ecf543fe2414d5George Wilson return (db->db.db_data); /* Nothing is changing */
ecc2d604e885a75cc75e647b5641af99d5a6f4a6bonwick for (drp = &db->db_last_dirty; (dr = *drp) != NULL; drp = &dr->dr_next)
16a4a8074274d2d7cc408589cf6359f4a378c861George Wilsondmu_objset_userquota_get_ids(dnode_t *dn, boolean_t before, dmu_tx_t *tx)
9eb57f7f3fbb970d4b9b89dcd5ecf543fe2414d5George Wilson if (before && (flags & (DN_ID_CHKED_BONUS|DN_ID_OLD_EXIST|
9eb57f7f3fbb970d4b9b89dcd5ecf543fe2414d5George Wilson } else if (dn->dn_bonuslen == 0 && dn->dn_bonustype == DMU_OT_SA) {
ecc2d604e885a75cc75e647b5641af99d5a6f4a6bonwick } else if (data) {
468c413a79615e77179e8d98f22a7e513a8135bdTim Haley * Must always call the callback in case the object
16a4a8074274d2d7cc408589cf6359f4a378c861George Wilson * type has changed and that type isn't an object type to track
fa9e4066f08beec538e775443c5be79dd423fcabahrens error = used_cbs[os->os_phys->os_type](dn->dn_bonustype, data,
fa9e4066f08beec538e775443c5be79dd423fcabahrens * Preserve existing uid/gid when the callback can't determine
ecc2d604e885a75cc75e647b5641af99d5a6f4a6bonwick * what the new uid/gid are and the callback returned EEXIST.
fa9e4066f08beec538e775443c5be79dd423fcabahrens * The EEXIST error tells us to just use the existing uid/gid.
ecc2d604e885a75cc75e647b5641af99d5a6f4a6bonwick * If we don't know what the old values are then just assign
fa9e4066f08beec538e775443c5be79dd423fcabahrens * them to 0, since that is a new file being created.
80eb36f241abf8c076119fb4c49a55fd61ebc710George Wilson if (!before && data == NULL && error == EEXIST) {
44cd46cadd9aab751dae6a4023c1cb5bf316d274billm return (0);
ecc2d604e885a75cc75e647b5641af99d5a6f4a6bonwick * We simply need to mark every object dirty, so that it will be
ecc2d604e885a75cc75e647b5641af99d5a6f4a6bonwick * synced out and now accounted. If this is called
44cd46cadd9aab751dae6a4023c1cb5bf316d274billm * concurrently, or if we already did some work before crashing,
44cd46cadd9aab751dae6a4023c1cb5bf316d274billm * that's fine, since we track each object's accounted state
44cd46cadd9aab751dae6a4023c1cb5bf316d274billm * independently.
44cd46cadd9aab751dae6a4023c1cb5bf316d274billm for (obj = 0; err == 0; err = dmu_object_next(os, &obj, FALSE, 0)) {
03f8c366886542ed249a15d755ae78ea4e775d9dGeorge Wilsondmu_objset_space(objset_t *os, uint64_t *refdbytesp, uint64_t *availbytesp,
44cd46cadd9aab751dae6a4023c1cb5bf316d274billm dsl_dataset_space(os->os_dsl_dataset, refdbytesp, availbytesp,
44cd46cadd9aab751dae6a4023c1cb5bf316d274billmdmu_objset_fast_stat(objset_t *os, dmu_objset_stats_t *stat)
09c9d376e8ccb8fbba74f33cc268964464092b62George Wilson dsl_prop_nvlist_add_uint64(nv, ZFS_PROP_USERACCOUNTING,
ecc2d604e885a75cc75e647b5641af99d5a6f4a6bonwick return (dsl_dataset_is_snapshot(os->os_dsl_dataset));
aeb1c1b609b02f03e8e7448beb88384ebc713525gwdmu_snapshot_realname(objset_t *os, char *name, char *real, int maxlen,
44cd46cadd9aab751dae6a4023c1cb5bf316d274billm return (zap_lookup_norm(ds->ds_dir->dd_pool->dp_meta_objset,
44cd46cadd9aab751dae6a4023c1cb5bf316d274billm ds->ds_phys->ds_snapnames_zapobj, name, 8, 1, &ignored, MT_FIRST,
44cd46cadd9aab751dae6a4023c1cb5bf316d274billmdmu_snapshot_list_next(objset_t *os, int namelen, char *name,
09c9d376e8ccb8fbba74f33cc268964464092b62George Wilson uint64_t *idp, uint64_t *offp, boolean_t *case_conflict)
03f8c366886542ed249a15d755ae78ea4e775d9dGeorge Wilson ASSERT(dsl_pool_config_held(dmu_objset_pool(os)));
16a4a8074274d2d7cc408589cf6359f4a378c861George Wilson if (zap_cursor_retrieve(&cursor, &attr) != 0) {
fa9e4066f08beec538e775443c5be79dd423fcabahrens return (0);
44cd46cadd9aab751dae6a4023c1cb5bf316d274billmdmu_dir_list_next(objset_t *os, int namelen, char *name,
44cd46cadd9aab751dae6a4023c1cb5bf316d274billm /* there is no next dir on a snapshot! */
44cd46cadd9aab751dae6a4023c1cb5bf316d274billm return (0);
44cd46cadd9aab751dae6a4023c1cb5bf316d274billm * Find objsets under and including ddobj, call func(ds) on each.
44cd46cadd9aab751dae6a4023c1cb5bf316d274billm int func(dsl_pool_t *, dsl_dataset_t *, void *), void *arg, int flags)
a15215608b8bd90f714f6db21ee623b584607cb6Jeff Bonwick err = dsl_dir_hold_obj(dp, ddobj, NULL, FTAG, &dd);
88ecc943b4eb72f7c4fbbd8435997b85ef171fc3George Wilson /* Don't visit hidden ($MOS & $ORIGIN) objsets. */
44cd46cadd9aab751dae6a4023c1cb5bf316d274billm attr = kmem_alloc(sizeof (zap_attribute_t), KM_SLEEP);
44cd46cadd9aab751dae6a4023c1cb5bf316d274billm * Iterate over all children.
8ad4d6dd86f5bc65fb3afa566c8133f3bac21648Jeff Bonwick * Iterate over all snapshots.
9dc3941c735ef88de46e850f745aa556d3a071a5Sašo Kiselkov for (zap_cursor_init(&zc, dp->dp_meta_objset, snapobj);
b24ab6762772a3f6a89393947930c7fa61306783Jeff Bonwick * Apply to self.
b24ab6762772a3f6a89393947930c7fa61306783Jeff Bonwick err = dsl_dataset_hold_obj(dp, thisobj, FTAG, &ds);
09c9d376e8ccb8fbba74f33cc268964464092b62George Wilson * Find all objsets under name, and for each, call 'func(child_name, arg)'.
09c9d376e8ccb8fbba74f33cc268964464092b62George Wilson * The dp_config_rwlock must not be held when this is called, and it
09c9d376e8ccb8fbba74f33cc268964464092b62George Wilson * will not be held when the callback is called.
09c9d376e8ccb8fbba74f33cc268964464092b62George Wilson * Therefore this function should only be used when the pool is not changing
09c9d376e8ccb8fbba74f33cc268964464092b62George Wilson * (e.g. in syncing context), or the callback can deal with the possible races.
09c9d376e8ccb8fbba74f33cc268964464092b62George Wilsondmu_objset_find_impl(spa_t *spa, const char *name,
fa9e4066f08beec538e775443c5be79dd423fcabahrens int func(const char *, void *), void *arg, int flags)
44cd46cadd9aab751dae6a4023c1cb5bf316d274billm if (err != 0) {
fa9e4066f08beec538e775443c5be79dd423fcabahrens /* Don't visit hidden ($MOS & $ORIGIN) objsets. */
44cd46cadd9aab751dae6a4023c1cb5bf316d274billm return (0);
44cd46cadd9aab751dae6a4023c1cb5bf316d274billm attr = kmem_alloc(sizeof (zap_attribute_t), KM_SLEEP);
8ad4d6dd86f5bc65fb3afa566c8133f3bac21648Jeff Bonwick * Iterate over all children.
fa9e4066f08beec538e775443c5be79dd423fcabahrens if (err != 0) {
d80c45e0f58fa434ba37259ea2e2b12e0380c19abonwick * Iterate over all snapshots.
fa9e4066f08beec538e775443c5be79dd423fcabahrens if (err == 0) {
fa9e4066f08beec538e775443c5be79dd423fcabahrens for (zap_cursor_init(&zc, dp->dp_meta_objset, snapobj);
d80c45e0f58fa434ba37259ea2e2b12e0380c19abonwick /* Apply to self. */
d80c45e0f58fa434ba37259ea2e2b12e0380c19abonwick * See comment above dmu_objset_find_impl().
d80c45e0f58fa434ba37259ea2e2b12e0380c19abonwickdmu_objset_find(char *name, int func(const char *, void *), void *arg,
d80c45e0f58fa434ba37259ea2e2b12e0380c19abonwick error = dmu_objset_find_impl(spa, name, func, arg, flags);
b24ab6762772a3f6a89393947930c7fa61306783Jeff Bonwickdmu_objset_set_user(objset_t *os, void *user_ptr)
d80c45e0f58fa434ba37259ea2e2b12e0380c19abonwick * Determine name of filesystem, given name of snapshot.
d80c45e0f58fa434ba37259ea2e2b12e0380c19abonwick * buf must be at least MAXNAMELEN bytes
d80c45e0f58fa434ba37259ea2e2b12e0380c19abonwick return (0);