2011-11-11 11:15:53 +04:00
|
|
|
/*
|
|
|
|
* CDDL HEADER START
|
|
|
|
*
|
|
|
|
* The contents of this file are subject to the terms of the
|
|
|
|
* Common Development and Distribution License (the "License").
|
|
|
|
* You may not use this file except in compliance with the License.
|
|
|
|
*
|
|
|
|
* You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
|
2022-07-12 00:16:13 +03:00
|
|
|
* or https://opensource.org/licenses/CDDL-1.0.
|
2011-11-11 11:15:53 +04:00
|
|
|
* See the License for the specific language governing permissions
|
|
|
|
* and limitations under the License.
|
|
|
|
*
|
|
|
|
* When distributing Covered Code, include this CDDL HEADER in each
|
|
|
|
* file and include the License file at usr/src/OPENSOLARIS.LICENSE.
|
|
|
|
* If applicable, add the following below this CDDL HEADER, with the
|
|
|
|
* fields enclosed by brackets "[]" replaced with your own identifying
|
|
|
|
* information: Portions Copyright [yyyy] [name of copyright owner]
|
|
|
|
*
|
|
|
|
* CDDL HEADER END
|
|
|
|
*/
|
|
|
|
/*
|
|
|
|
*
|
|
|
|
* Copyright (c) 2005, 2010, Oracle and/or its affiliates. All rights reserved.
|
|
|
|
* Copyright (C) 2011 Lawrence Livermore National Security, LLC.
|
|
|
|
* Produced at Lawrence Livermore National Laboratory (cf, DISCLAIMER).
|
|
|
|
* LLNL-CODE-403049.
|
|
|
|
* Rewritten for Linux by:
|
|
|
|
* Rohan Puri <rohan.puri15@gmail.com>
|
|
|
|
* Brian Behlendorf <behlendorf1@llnl.gov>
|
2013-03-08 22:41:28 +04:00
|
|
|
* Copyright (c) 2013 by Delphix. All rights reserved.
|
2016-05-11 22:03:51 +03:00
|
|
|
* Copyright 2015, OmniTI Computer Consulting, Inc. All rights reserved.
|
2018-11-09 03:17:12 +03:00
|
|
|
* Copyright (c) 2018 George Melikov. All Rights Reserved.
|
2019-07-03 23:05:02 +03:00
|
|
|
* Copyright (c) 2019 Datto, Inc. All rights reserved.
|
2020-08-25 03:33:02 +03:00
|
|
|
* Copyright (c) 2020 The MathWorks, Inc. All rights reserved.
|
2011-11-11 11:15:53 +04:00
|
|
|
*/
|
|
|
|
|
|
|
|
/*
|
|
|
|
* ZFS control directory (a.k.a. ".zfs")
|
|
|
|
*
|
|
|
|
* This directory provides a common location for all ZFS meta-objects.
|
|
|
|
* Currently, this is only the 'snapshot' and 'shares' directory, but this may
|
|
|
|
* expand in the future. The elements are built dynamically, as the hierarchy
|
|
|
|
* does not actually exist on disk.
|
|
|
|
*
|
|
|
|
* For 'snapshot', we don't want to have all snapshots always mounted, because
|
|
|
|
* this would take up a huge amount of space in /etc/mnttab. We have three
|
|
|
|
* types of objects:
|
|
|
|
*
|
|
|
|
* ctldir ------> snapshotdir -------> snapshot
|
|
|
|
* |
|
|
|
|
* |
|
|
|
|
* V
|
|
|
|
* mounted fs
|
|
|
|
*
|
|
|
|
* The 'snapshot' node contains just enough information to lookup '..' and act
|
|
|
|
* as a mountpoint for the snapshot. Whenever we lookup a specific snapshot, we
|
|
|
|
* perform an automount of the underlying filesystem and return the
|
|
|
|
* corresponding inode.
|
|
|
|
*
|
|
|
|
* All mounts are handled automatically by an user mode helper which invokes
|
2019-05-06 01:57:23 +03:00
|
|
|
* the mount procedure. Unmounts are handled by allowing the mount
|
2011-11-11 11:15:53 +04:00
|
|
|
* point to expire so the kernel may automatically unmount it.
|
|
|
|
*
|
|
|
|
* The '.zfs', '.zfs/snapshot', and all directories created under
|
|
|
|
* '.zfs/snapshot' (ie: '.zfs/snapshot/<snapname>') all share the same
|
2019-05-06 01:57:23 +03:00
|
|
|
* zfsvfs_t as the head filesystem (what '.zfs' lives under).
|
2011-11-11 11:15:53 +04:00
|
|
|
*
|
|
|
|
* File systems mounted on top of the '.zfs/snapshot/<snapname>' paths
|
|
|
|
* (ie: snapshots) are complete ZFS filesystems and have their own unique
|
2017-03-08 03:21:37 +03:00
|
|
|
* zfsvfs_t. However, the fsid reported by these mounts will be the same
|
|
|
|
* as that used by the parent zfsvfs_t to make NFS happy.
|
2011-11-11 11:15:53 +04:00
|
|
|
*/
|
|
|
|
|
|
|
|
#include <sys/types.h>
|
|
|
|
#include <sys/param.h>
|
|
|
|
#include <sys/time.h>
|
|
|
|
#include <sys/sysmacros.h>
|
|
|
|
#include <sys/pathname.h>
|
|
|
|
#include <sys/vfs.h>
|
|
|
|
#include <sys/zfs_ctldir.h>
|
|
|
|
#include <sys/zfs_ioctl.h>
|
|
|
|
#include <sys/zfs_vfsops.h>
|
|
|
|
#include <sys/zfs_vnops.h>
|
|
|
|
#include <sys/stat.h>
|
|
|
|
#include <sys/dmu.h>
|
2015-12-08 02:43:53 +03:00
|
|
|
#include <sys/dmu_objset.h>
|
2013-09-04 16:00:57 +04:00
|
|
|
#include <sys/dsl_destroy.h>
|
2011-11-11 11:15:53 +04:00
|
|
|
#include <sys/dsl_deleg.h>
|
|
|
|
#include <sys/zpl.h>
|
2019-05-25 02:43:23 +03:00
|
|
|
#include <sys/mntent.h>
|
2011-11-11 11:15:53 +04:00
|
|
|
#include "zfs_namecheck.h"
|
|
|
|
|
2015-04-25 02:21:13 +03:00
|
|
|
/*
|
|
|
|
* Two AVL trees are maintained which contain all currently automounted
|
|
|
|
* snapshots. Every automounted snapshots maps to a single zfs_snapentry_t
|
|
|
|
* entry which MUST:
|
|
|
|
*
|
|
|
|
* - be attached to both trees, and
|
|
|
|
* - be unique, no duplicate entries are allowed.
|
|
|
|
*
|
|
|
|
* The zfs_snapshots_by_name tree is indexed by the full dataset name
|
|
|
|
* while the zfs_snapshots_by_objsetid tree is indexed by the unique
|
|
|
|
* objsetid. This allows for fast lookups either by name or objsetid.
|
|
|
|
*/
|
|
|
|
static avl_tree_t zfs_snapshots_by_name;
|
|
|
|
static avl_tree_t zfs_snapshots_by_objsetid;
|
2015-12-11 02:53:37 +03:00
|
|
|
static krwlock_t zfs_snapshot_lock;
|
2015-04-25 02:21:13 +03:00
|
|
|
|
2011-11-11 11:15:53 +04:00
|
|
|
/*
|
|
|
|
* Control Directory Tunables (.zfs)
|
|
|
|
*/
|
|
|
|
int zfs_expire_snapshot = ZFSCTL_EXPIRE_SNAPSHOT;
|
2022-01-15 02:37:55 +03:00
|
|
|
static int zfs_admin_snapshot = 0;
|
2024-10-02 19:12:02 +03:00
|
|
|
static int zfs_snapshot_no_setuid = 0;
|
2011-11-11 11:15:53 +04:00
|
|
|
|
2015-04-25 02:21:13 +03:00
|
|
|
typedef struct {
|
|
|
|
char *se_name; /* full snapshot name */
|
|
|
|
char *se_path; /* full mount path */
|
2015-12-08 02:43:53 +03:00
|
|
|
spa_t *se_spa; /* pool spa */
|
2015-04-25 02:21:13 +03:00
|
|
|
uint64_t se_objsetid; /* snapshot objset id */
|
|
|
|
struct dentry *se_root_dentry; /* snapshot root dentry */
|
2021-11-03 18:00:08 +03:00
|
|
|
krwlock_t se_taskqid_lock; /* scheduled unmount taskqid lock */
|
2015-04-25 02:21:13 +03:00
|
|
|
taskqid_t se_taskqid; /* scheduled unmount taskqid */
|
|
|
|
avl_node_t se_node_name; /* zfs_snapshots_by_name link */
|
|
|
|
avl_node_t se_node_objsetid; /* zfs_snapshots_by_objsetid link */
|
2018-09-26 20:29:26 +03:00
|
|
|
zfs_refcount_t se_refcount; /* reference count */
|
2015-04-25 02:21:13 +03:00
|
|
|
} zfs_snapentry_t;
|
|
|
|
|
|
|
|
static void zfsctl_snapshot_unmount_delay_impl(zfs_snapentry_t *se, int delay);
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Allocate a new zfs_snapentry_t being careful to make a copy of the
|
|
|
|
* the snapshot name and provided mount point. No reference is taken.
|
|
|
|
*/
|
2011-11-11 11:15:53 +04:00
|
|
|
static zfs_snapentry_t *
|
2020-10-03 03:44:10 +03:00
|
|
|
zfsctl_snapshot_alloc(const char *full_name, const char *full_path, spa_t *spa,
|
2015-12-08 02:43:53 +03:00
|
|
|
uint64_t objsetid, struct dentry *root_dentry)
|
2011-11-11 11:15:53 +04:00
|
|
|
{
|
2015-04-25 02:21:13 +03:00
|
|
|
zfs_snapentry_t *se;
|
|
|
|
|
|
|
|
se = kmem_zalloc(sizeof (zfs_snapentry_t), KM_SLEEP);
|
|
|
|
|
2019-10-10 19:47:06 +03:00
|
|
|
se->se_name = kmem_strdup(full_name);
|
|
|
|
se->se_path = kmem_strdup(full_path);
|
2015-12-08 02:43:53 +03:00
|
|
|
se->se_spa = spa;
|
2015-04-25 02:21:13 +03:00
|
|
|
se->se_objsetid = objsetid;
|
|
|
|
se->se_root_dentry = root_dentry;
|
2016-10-29 01:40:14 +03:00
|
|
|
se->se_taskqid = TASKQID_INVALID;
|
2021-11-03 18:00:08 +03:00
|
|
|
rw_init(&se->se_taskqid_lock, NULL, RW_DEFAULT, NULL);
|
2015-04-25 02:21:13 +03:00
|
|
|
|
2018-10-01 20:42:05 +03:00
|
|
|
zfs_refcount_create(&se->se_refcount);
|
2015-04-25 02:21:13 +03:00
|
|
|
|
|
|
|
return (se);
|
2011-11-11 11:15:53 +04:00
|
|
|
}
|
|
|
|
|
2015-04-25 02:21:13 +03:00
|
|
|
/*
|
2019-05-06 01:57:23 +03:00
|
|
|
* Free a zfs_snapentry_t the caller must ensure there are no active
|
2015-04-25 02:21:13 +03:00
|
|
|
* references.
|
|
|
|
*/
|
|
|
|
static void
|
|
|
|
zfsctl_snapshot_free(zfs_snapentry_t *se)
|
2011-11-11 11:15:53 +04:00
|
|
|
{
|
2018-10-01 20:42:05 +03:00
|
|
|
zfs_refcount_destroy(&se->se_refcount);
|
2019-10-10 19:47:06 +03:00
|
|
|
kmem_strfree(se->se_name);
|
|
|
|
kmem_strfree(se->se_path);
|
2022-03-31 01:40:31 +03:00
|
|
|
rw_destroy(&se->se_taskqid_lock);
|
2015-04-25 02:21:13 +03:00
|
|
|
|
|
|
|
kmem_free(se, sizeof (zfs_snapentry_t));
|
2011-11-11 11:15:53 +04:00
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
2015-04-25 02:21:13 +03:00
|
|
|
* Hold a reference on the zfs_snapentry_t.
|
2011-11-11 11:15:53 +04:00
|
|
|
*/
|
|
|
|
static void
|
2015-04-25 02:21:13 +03:00
|
|
|
zfsctl_snapshot_hold(zfs_snapentry_t *se)
|
2011-11-11 11:15:53 +04:00
|
|
|
{
|
2018-09-26 20:29:26 +03:00
|
|
|
zfs_refcount_add(&se->se_refcount, NULL);
|
2015-04-25 02:21:13 +03:00
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Release a reference on the zfs_snapentry_t. When the number of
|
|
|
|
* references drops to zero the structure will be freed.
|
|
|
|
*/
|
|
|
|
static void
|
|
|
|
zfsctl_snapshot_rele(zfs_snapentry_t *se)
|
|
|
|
{
|
2018-10-01 20:42:05 +03:00
|
|
|
if (zfs_refcount_remove(&se->se_refcount, NULL) == 0)
|
2015-04-25 02:21:13 +03:00
|
|
|
zfsctl_snapshot_free(se);
|
|
|
|
}
|
2011-11-11 11:15:53 +04:00
|
|
|
|
2015-04-25 02:21:13 +03:00
|
|
|
/*
|
|
|
|
* Add a zfs_snapentry_t to both the zfs_snapshots_by_name and
|
|
|
|
* zfs_snapshots_by_objsetid trees. While the zfs_snapentry_t is part
|
|
|
|
* of the trees a reference is held.
|
|
|
|
*/
|
|
|
|
static void
|
|
|
|
zfsctl_snapshot_add(zfs_snapentry_t *se)
|
|
|
|
{
|
2015-12-11 02:53:37 +03:00
|
|
|
ASSERT(RW_WRITE_HELD(&zfs_snapshot_lock));
|
2019-07-17 19:07:53 +03:00
|
|
|
zfsctl_snapshot_hold(se);
|
2015-04-25 02:21:13 +03:00
|
|
|
avl_add(&zfs_snapshots_by_name, se);
|
|
|
|
avl_add(&zfs_snapshots_by_objsetid, se);
|
2011-11-11 11:15:53 +04:00
|
|
|
}
|
|
|
|
|
2015-04-25 02:21:13 +03:00
|
|
|
/*
|
|
|
|
* Remove a zfs_snapentry_t from both the zfs_snapshots_by_name and
|
|
|
|
* zfs_snapshots_by_objsetid trees. Upon removal a reference is dropped,
|
|
|
|
* this can result in the structure being freed if that was the last
|
|
|
|
* remaining reference.
|
|
|
|
*/
|
|
|
|
static void
|
|
|
|
zfsctl_snapshot_remove(zfs_snapentry_t *se)
|
|
|
|
{
|
2015-12-11 02:53:37 +03:00
|
|
|
ASSERT(RW_WRITE_HELD(&zfs_snapshot_lock));
|
2015-04-25 02:21:13 +03:00
|
|
|
avl_remove(&zfs_snapshots_by_name, se);
|
|
|
|
avl_remove(&zfs_snapshots_by_objsetid, se);
|
|
|
|
zfsctl_snapshot_rele(se);
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Snapshot name comparison function for the zfs_snapshots_by_name.
|
|
|
|
*/
|
|
|
|
static int
|
|
|
|
snapentry_compare_by_name(const void *a, const void *b)
|
2011-11-11 11:15:53 +04:00
|
|
|
{
|
2015-04-25 02:21:13 +03:00
|
|
|
const zfs_snapentry_t *se_a = a;
|
|
|
|
const zfs_snapentry_t *se_b = b;
|
|
|
|
int ret;
|
|
|
|
|
|
|
|
ret = strcmp(se_a->se_name, se_b->se_name);
|
2011-11-11 11:15:53 +04:00
|
|
|
|
|
|
|
if (ret < 0)
|
|
|
|
return (-1);
|
|
|
|
else if (ret > 0)
|
|
|
|
return (1);
|
|
|
|
else
|
|
|
|
return (0);
|
|
|
|
}
|
|
|
|
|
2015-04-25 02:21:13 +03:00
|
|
|
/*
|
|
|
|
* Snapshot name comparison function for the zfs_snapshots_by_objsetid.
|
|
|
|
*/
|
|
|
|
static int
|
|
|
|
snapentry_compare_by_objsetid(const void *a, const void *b)
|
|
|
|
{
|
|
|
|
const zfs_snapentry_t *se_a = a;
|
|
|
|
const zfs_snapentry_t *se_b = b;
|
|
|
|
|
2015-12-08 02:43:53 +03:00
|
|
|
if (se_a->se_spa != se_b->se_spa)
|
|
|
|
return ((ulong_t)se_a->se_spa < (ulong_t)se_b->se_spa ? -1 : 1);
|
|
|
|
|
2015-04-25 02:21:13 +03:00
|
|
|
if (se_a->se_objsetid < se_b->se_objsetid)
|
|
|
|
return (-1);
|
|
|
|
else if (se_a->se_objsetid > se_b->se_objsetid)
|
|
|
|
return (1);
|
|
|
|
else
|
|
|
|
return (0);
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Find a zfs_snapentry_t in zfs_snapshots_by_name. If the snapname
|
|
|
|
* is found a pointer to the zfs_snapentry_t is returned and a reference
|
|
|
|
* taken on the structure. The caller is responsible for dropping the
|
|
|
|
* reference with zfsctl_snapshot_rele(). If the snapname is not found
|
|
|
|
* NULL will be returned.
|
|
|
|
*/
|
|
|
|
static zfs_snapentry_t *
|
2020-10-03 03:44:10 +03:00
|
|
|
zfsctl_snapshot_find_by_name(const char *snapname)
|
2015-04-25 02:21:13 +03:00
|
|
|
{
|
|
|
|
zfs_snapentry_t *se, search;
|
|
|
|
|
2015-12-11 02:53:37 +03:00
|
|
|
ASSERT(RW_LOCK_HELD(&zfs_snapshot_lock));
|
2015-04-25 02:21:13 +03:00
|
|
|
|
2020-10-03 03:44:10 +03:00
|
|
|
search.se_name = (char *)snapname;
|
2015-04-25 02:21:13 +03:00
|
|
|
se = avl_find(&zfs_snapshots_by_name, &search, NULL);
|
|
|
|
if (se)
|
2019-07-17 19:07:53 +03:00
|
|
|
zfsctl_snapshot_hold(se);
|
2015-04-25 02:21:13 +03:00
|
|
|
|
|
|
|
return (se);
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Find a zfs_snapentry_t in zfs_snapshots_by_objsetid given the objset id
|
|
|
|
* rather than the snapname. In all other respects it behaves the same
|
|
|
|
* as zfsctl_snapshot_find_by_name().
|
|
|
|
*/
|
|
|
|
static zfs_snapentry_t *
|
2015-12-08 02:43:53 +03:00
|
|
|
zfsctl_snapshot_find_by_objsetid(spa_t *spa, uint64_t objsetid)
|
2015-04-25 02:21:13 +03:00
|
|
|
{
|
|
|
|
zfs_snapentry_t *se, search;
|
|
|
|
|
2015-12-11 02:53:37 +03:00
|
|
|
ASSERT(RW_LOCK_HELD(&zfs_snapshot_lock));
|
2015-04-25 02:21:13 +03:00
|
|
|
|
2015-12-08 02:43:53 +03:00
|
|
|
search.se_spa = spa;
|
2015-04-25 02:21:13 +03:00
|
|
|
search.se_objsetid = objsetid;
|
|
|
|
se = avl_find(&zfs_snapshots_by_objsetid, &search, NULL);
|
|
|
|
if (se)
|
2019-07-17 19:07:53 +03:00
|
|
|
zfsctl_snapshot_hold(se);
|
2015-04-25 02:21:13 +03:00
|
|
|
|
|
|
|
return (se);
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Rename a zfs_snapentry_t in the zfs_snapshots_by_name. The structure is
|
|
|
|
* removed, renamed, and added back to the new correct location in the tree.
|
|
|
|
*/
|
|
|
|
static int
|
2020-10-03 03:44:10 +03:00
|
|
|
zfsctl_snapshot_rename(const char *old_snapname, const char *new_snapname)
|
2015-04-25 02:21:13 +03:00
|
|
|
{
|
|
|
|
zfs_snapentry_t *se;
|
|
|
|
|
2015-12-11 02:53:37 +03:00
|
|
|
ASSERT(RW_WRITE_HELD(&zfs_snapshot_lock));
|
2015-04-25 02:21:13 +03:00
|
|
|
|
|
|
|
se = zfsctl_snapshot_find_by_name(old_snapname);
|
|
|
|
if (se == NULL)
|
2017-08-03 07:16:12 +03:00
|
|
|
return (SET_ERROR(ENOENT));
|
2015-04-25 02:21:13 +03:00
|
|
|
|
|
|
|
zfsctl_snapshot_remove(se);
|
2019-10-10 19:47:06 +03:00
|
|
|
kmem_strfree(se->se_name);
|
|
|
|
se->se_name = kmem_strdup(new_snapname);
|
2015-04-25 02:21:13 +03:00
|
|
|
zfsctl_snapshot_add(se);
|
|
|
|
zfsctl_snapshot_rele(se);
|
|
|
|
|
|
|
|
return (0);
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Delayed task responsible for unmounting an expired automounted snapshot.
|
|
|
|
*/
|
|
|
|
static void
|
|
|
|
snapentry_expire(void *data)
|
|
|
|
{
|
|
|
|
zfs_snapentry_t *se = (zfs_snapentry_t *)data;
|
2015-12-08 02:43:53 +03:00
|
|
|
spa_t *spa = se->se_spa;
|
2015-04-25 02:21:13 +03:00
|
|
|
uint64_t objsetid = se->se_objsetid;
|
|
|
|
|
2015-12-11 02:23:26 +03:00
|
|
|
if (zfs_expire_snapshot <= 0) {
|
|
|
|
zfsctl_snapshot_rele(se);
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
2021-11-03 18:00:08 +03:00
|
|
|
rw_enter(&se->se_taskqid_lock, RW_WRITER);
|
2016-10-29 01:40:14 +03:00
|
|
|
se->se_taskqid = TASKQID_INVALID;
|
2021-11-03 18:00:08 +03:00
|
|
|
rw_exit(&se->se_taskqid_lock);
|
2015-04-25 02:21:13 +03:00
|
|
|
(void) zfsctl_snapshot_unmount(se->se_name, MNT_EXPIRE);
|
|
|
|
zfsctl_snapshot_rele(se);
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Reschedule the unmount if the zfs_snapentry_t wasn't removed.
|
|
|
|
* This can occur when the snapshot is busy.
|
|
|
|
*/
|
2015-12-11 02:53:37 +03:00
|
|
|
rw_enter(&zfs_snapshot_lock, RW_READER);
|
2015-12-08 02:43:53 +03:00
|
|
|
if ((se = zfsctl_snapshot_find_by_objsetid(spa, objsetid)) != NULL) {
|
2015-04-25 02:21:13 +03:00
|
|
|
zfsctl_snapshot_unmount_delay_impl(se, zfs_expire_snapshot);
|
|
|
|
zfsctl_snapshot_rele(se);
|
|
|
|
}
|
2015-12-11 02:53:37 +03:00
|
|
|
rw_exit(&zfs_snapshot_lock);
|
2015-04-25 02:21:13 +03:00
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Cancel an automatic unmount of a snapname. This callback is responsible
|
|
|
|
* for dropping the reference on the zfs_snapentry_t which was taken when
|
|
|
|
* during dispatch.
|
|
|
|
*/
|
|
|
|
static void
|
|
|
|
zfsctl_snapshot_unmount_cancel(zfs_snapentry_t *se)
|
|
|
|
{
|
2021-11-03 18:00:08 +03:00
|
|
|
int err = 0;
|
|
|
|
rw_enter(&se->se_taskqid_lock, RW_WRITER);
|
|
|
|
err = taskq_cancel_id(system_delay_taskq, se->se_taskqid);
|
|
|
|
/*
|
|
|
|
* if we get ENOENT, the taskq couldn't be found to be
|
|
|
|
* canceled, so we can just mark it as invalid because
|
|
|
|
* it's already gone. If we got EBUSY, then we already
|
|
|
|
* blocked until it was gone _anyway_, so we don't care.
|
|
|
|
*/
|
|
|
|
se->se_taskqid = TASKQID_INVALID;
|
|
|
|
rw_exit(&se->se_taskqid_lock);
|
|
|
|
if (err == 0) {
|
2015-04-25 02:21:13 +03:00
|
|
|
zfsctl_snapshot_rele(se);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Dispatch the unmount task for delayed handling with a hold protecting it.
|
|
|
|
*/
|
|
|
|
static void
|
|
|
|
zfsctl_snapshot_unmount_delay_impl(zfs_snapentry_t *se, int delay)
|
|
|
|
{
|
|
|
|
|
2015-12-11 02:23:26 +03:00
|
|
|
if (delay <= 0)
|
|
|
|
return;
|
|
|
|
|
2015-12-14 21:59:25 +03:00
|
|
|
zfsctl_snapshot_hold(se);
|
2021-11-03 18:00:08 +03:00
|
|
|
rw_enter(&se->se_taskqid_lock, RW_WRITER);
|
2023-02-14 03:40:13 +03:00
|
|
|
/*
|
|
|
|
* If this condition happens, we managed to:
|
|
|
|
* - dispatch once
|
|
|
|
* - want to dispatch _again_ before it returned
|
|
|
|
*
|
|
|
|
* So let's just return - if that task fails at unmounting,
|
|
|
|
* we'll eventually dispatch again, and if it succeeds,
|
|
|
|
* no problem.
|
|
|
|
*/
|
|
|
|
if (se->se_taskqid != TASKQID_INVALID) {
|
|
|
|
rw_exit(&se->se_taskqid_lock);
|
|
|
|
zfsctl_snapshot_rele(se);
|
|
|
|
return;
|
|
|
|
}
|
2016-12-01 00:56:50 +03:00
|
|
|
se->se_taskqid = taskq_dispatch_delay(system_delay_taskq,
|
2015-04-25 02:21:13 +03:00
|
|
|
snapentry_expire, se, TQ_SLEEP, ddi_get_lbolt() + delay * HZ);
|
2021-11-03 18:00:08 +03:00
|
|
|
rw_exit(&se->se_taskqid_lock);
|
2015-04-25 02:21:13 +03:00
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Schedule an automatic unmount of objset id to occur in delay seconds from
|
|
|
|
* now. Any previous delayed unmount will be cancelled in favor of the
|
|
|
|
* updated deadline. A reference is taken by zfsctl_snapshot_find_by_name()
|
|
|
|
* and held until the outstanding task is handled or cancelled.
|
|
|
|
*/
|
|
|
|
int
|
2015-12-08 02:43:53 +03:00
|
|
|
zfsctl_snapshot_unmount_delay(spa_t *spa, uint64_t objsetid, int delay)
|
2015-04-25 02:21:13 +03:00
|
|
|
{
|
|
|
|
zfs_snapentry_t *se;
|
|
|
|
int error = ENOENT;
|
|
|
|
|
2015-12-11 02:53:37 +03:00
|
|
|
rw_enter(&zfs_snapshot_lock, RW_READER);
|
2015-12-08 02:43:53 +03:00
|
|
|
if ((se = zfsctl_snapshot_find_by_objsetid(spa, objsetid)) != NULL) {
|
2015-04-25 02:21:13 +03:00
|
|
|
zfsctl_snapshot_unmount_cancel(se);
|
|
|
|
zfsctl_snapshot_unmount_delay_impl(se, delay);
|
|
|
|
zfsctl_snapshot_rele(se);
|
|
|
|
error = 0;
|
|
|
|
}
|
2015-12-11 02:53:37 +03:00
|
|
|
rw_exit(&zfs_snapshot_lock);
|
2015-04-25 02:21:13 +03:00
|
|
|
|
|
|
|
return (error);
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Check if snapname is currently mounted. Returned non-zero when mounted
|
|
|
|
* and zero when unmounted.
|
|
|
|
*/
|
|
|
|
static boolean_t
|
2020-10-03 03:44:10 +03:00
|
|
|
zfsctl_snapshot_ismounted(const char *snapname)
|
2015-04-25 02:21:13 +03:00
|
|
|
{
|
|
|
|
zfs_snapentry_t *se;
|
|
|
|
boolean_t ismounted = B_FALSE;
|
|
|
|
|
2015-12-11 02:53:37 +03:00
|
|
|
rw_enter(&zfs_snapshot_lock, RW_READER);
|
2015-04-25 02:21:13 +03:00
|
|
|
if ((se = zfsctl_snapshot_find_by_name(snapname)) != NULL) {
|
|
|
|
zfsctl_snapshot_rele(se);
|
|
|
|
ismounted = B_TRUE;
|
|
|
|
}
|
2015-12-11 02:53:37 +03:00
|
|
|
rw_exit(&zfs_snapshot_lock);
|
2015-04-25 02:21:13 +03:00
|
|
|
|
|
|
|
return (ismounted);
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Check if the given inode is a part of the virtual .zfs directory.
|
|
|
|
*/
|
2011-11-11 11:15:53 +04:00
|
|
|
boolean_t
|
|
|
|
zfsctl_is_node(struct inode *ip)
|
|
|
|
{
|
|
|
|
return (ITOZ(ip)->z_is_ctldir);
|
|
|
|
}
|
|
|
|
|
2015-04-25 02:21:13 +03:00
|
|
|
/*
|
|
|
|
* Check if the given inode is a .zfs/snapshots/snapname directory.
|
|
|
|
*/
|
2011-11-11 11:15:53 +04:00
|
|
|
boolean_t
|
|
|
|
zfsctl_is_snapdir(struct inode *ip)
|
|
|
|
{
|
|
|
|
return (zfsctl_is_node(ip) && (ip->i_ino <= ZFSCTL_INO_SNAPDIRS));
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Allocate a new inode with the passed id and ops.
|
|
|
|
*/
|
|
|
|
static struct inode *
|
2017-03-08 03:21:37 +03:00
|
|
|
zfsctl_inode_alloc(zfsvfs_t *zfsvfs, uint64_t id,
|
2023-08-01 18:50:17 +03:00
|
|
|
const struct file_operations *fops, const struct inode_operations *ops,
|
|
|
|
uint64_t creation)
|
2011-11-11 11:15:53 +04:00
|
|
|
{
|
|
|
|
struct inode *ip;
|
|
|
|
znode_t *zp;
|
2023-08-01 18:50:17 +03:00
|
|
|
inode_timespec_t now = {.tv_sec = creation};
|
2011-11-11 11:15:53 +04:00
|
|
|
|
2017-03-08 03:21:37 +03:00
|
|
|
ip = new_inode(zfsvfs->z_sb);
|
2011-11-11 11:15:53 +04:00
|
|
|
if (ip == NULL)
|
|
|
|
return (NULL);
|
|
|
|
|
2023-08-01 18:50:17 +03:00
|
|
|
if (!creation)
|
|
|
|
now = current_time(ip);
|
2011-11-11 11:15:53 +04:00
|
|
|
zp = ITOZ(ip);
|
|
|
|
ASSERT3P(zp->z_dirlocks, ==, NULL);
|
|
|
|
ASSERT3P(zp->z_acl_cached, ==, NULL);
|
|
|
|
ASSERT3P(zp->z_xattr_cached, ==, NULL);
|
|
|
|
zp->z_id = id;
|
2019-08-13 16:58:02 +03:00
|
|
|
zp->z_unlinked = B_FALSE;
|
|
|
|
zp->z_atime_dirty = B_FALSE;
|
|
|
|
zp->z_zn_prefetch = B_FALSE;
|
|
|
|
zp->z_is_sa = B_FALSE;
|
|
|
|
zp->z_is_ctldir = B_TRUE;
|
2011-11-11 11:15:53 +04:00
|
|
|
zp->z_sa_hdl = NULL;
|
|
|
|
zp->z_blksz = 0;
|
|
|
|
zp->z_seq = 0;
|
|
|
|
zp->z_mapcnt = 0;
|
|
|
|
zp->z_size = 0;
|
|
|
|
zp->z_pflags = 0;
|
|
|
|
zp->z_mode = 0;
|
|
|
|
zp->z_sync_cnt = 0;
|
2022-05-03 23:23:26 +03:00
|
|
|
zp->z_sync_writes_cnt = 0;
|
|
|
|
zp->z_async_writes_cnt = 0;
|
2016-04-18 22:08:53 +03:00
|
|
|
ip->i_generation = 0;
|
2011-11-11 11:15:53 +04:00
|
|
|
ip->i_ino = id;
|
2016-06-07 19:16:52 +03:00
|
|
|
ip->i_mode = (S_IFDIR | S_IRWXUGO);
|
2013-07-14 20:59:24 +04:00
|
|
|
ip->i_uid = SUID_TO_KUID(0);
|
|
|
|
ip->i_gid = SGID_TO_KGID(0);
|
2011-11-11 11:15:53 +04:00
|
|
|
ip->i_blkbits = SPA_MINBLOCKSHIFT;
|
2023-12-16 14:31:32 +03:00
|
|
|
zpl_inode_set_atime_to_ts(ip, now);
|
|
|
|
zpl_inode_set_mtime_to_ts(ip, now);
|
2023-09-12 06:21:29 +03:00
|
|
|
zpl_inode_set_ctime_to_ts(ip, now);
|
2011-11-11 11:15:53 +04:00
|
|
|
ip->i_fop = fops;
|
|
|
|
ip->i_op = ops;
|
2017-06-05 21:26:25 +03:00
|
|
|
#if defined(IOP_XATTR)
|
|
|
|
ip->i_opflags &= ~IOP_XATTR;
|
|
|
|
#endif
|
2011-11-11 11:15:53 +04:00
|
|
|
|
|
|
|
if (insert_inode_locked(ip)) {
|
|
|
|
unlock_new_inode(ip);
|
|
|
|
iput(ip);
|
|
|
|
return (NULL);
|
|
|
|
}
|
|
|
|
|
2017-03-08 03:21:37 +03:00
|
|
|
mutex_enter(&zfsvfs->z_znodes_lock);
|
|
|
|
list_insert_tail(&zfsvfs->z_all_znodes, zp);
|
2011-11-11 11:15:53 +04:00
|
|
|
membar_producer();
|
2017-03-08 03:21:37 +03:00
|
|
|
mutex_exit(&zfsvfs->z_znodes_lock);
|
2011-11-11 11:15:53 +04:00
|
|
|
|
|
|
|
unlock_new_inode(ip);
|
|
|
|
|
|
|
|
return (ip);
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Lookup the inode with given id, it will be allocated if needed.
|
|
|
|
*/
|
|
|
|
static struct inode *
|
2017-03-08 03:21:37 +03:00
|
|
|
zfsctl_inode_lookup(zfsvfs_t *zfsvfs, uint64_t id,
|
2011-11-11 11:15:53 +04:00
|
|
|
const struct file_operations *fops, const struct inode_operations *ops)
|
|
|
|
{
|
|
|
|
struct inode *ip = NULL;
|
2023-08-01 18:50:17 +03:00
|
|
|
uint64_t creation = 0;
|
|
|
|
dsl_dataset_t *snap_ds;
|
|
|
|
dsl_pool_t *pool;
|
2011-11-11 11:15:53 +04:00
|
|
|
|
|
|
|
while (ip == NULL) {
|
2017-03-08 03:21:37 +03:00
|
|
|
ip = ilookup(zfsvfs->z_sb, (unsigned long)id);
|
2011-11-11 11:15:53 +04:00
|
|
|
if (ip)
|
|
|
|
break;
|
|
|
|
|
2023-08-01 18:50:17 +03:00
|
|
|
if (id <= ZFSCTL_INO_SNAPDIRS && !creation) {
|
|
|
|
pool = dmu_objset_pool(zfsvfs->z_os);
|
|
|
|
dsl_pool_config_enter(pool, FTAG);
|
|
|
|
if (!dsl_dataset_hold_obj(pool,
|
|
|
|
ZFSCTL_INO_SNAPDIRS - id, FTAG, &snap_ds)) {
|
|
|
|
creation = dsl_get_creation(snap_ds);
|
|
|
|
dsl_dataset_rele(snap_ds, FTAG);
|
|
|
|
}
|
|
|
|
dsl_pool_config_exit(pool, FTAG);
|
|
|
|
}
|
|
|
|
|
2011-11-11 11:15:53 +04:00
|
|
|
/* May fail due to concurrent zfsctl_inode_alloc() */
|
2023-08-01 18:50:17 +03:00
|
|
|
ip = zfsctl_inode_alloc(zfsvfs, id, fops, ops, creation);
|
2011-11-11 11:15:53 +04:00
|
|
|
}
|
|
|
|
|
|
|
|
return (ip);
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Create the '.zfs' directory. This directory is cached as part of the VFS
|
2017-03-08 03:21:37 +03:00
|
|
|
* structure. This results in a hold on the zfsvfs_t. The code in zfs_umount()
|
2011-11-11 11:15:53 +04:00
|
|
|
* therefore checks against a vfs_count of 2 instead of 1. This reference
|
|
|
|
* is removed when the ctldir is destroyed in the unmount. All other entities
|
|
|
|
* under the '.zfs' directory are created dynamically as needed.
|
2012-07-20 01:50:25 +04:00
|
|
|
*
|
|
|
|
* Because the dynamically created '.zfs' directory entries assume the use
|
|
|
|
* of 64-bit inode numbers this support must be disabled on 32-bit systems.
|
2011-11-11 11:15:53 +04:00
|
|
|
*/
|
|
|
|
int
|
2017-03-08 03:21:37 +03:00
|
|
|
zfsctl_create(zfsvfs_t *zfsvfs)
|
2011-11-11 11:15:53 +04:00
|
|
|
{
|
2017-03-08 03:21:37 +03:00
|
|
|
ASSERT(zfsvfs->z_ctldir == NULL);
|
2011-11-11 11:15:53 +04:00
|
|
|
|
2017-03-08 03:21:37 +03:00
|
|
|
zfsvfs->z_ctldir = zfsctl_inode_alloc(zfsvfs, ZFSCTL_INO_ROOT,
|
2023-08-01 18:50:17 +03:00
|
|
|
&zpl_fops_root, &zpl_ops_root, 0);
|
2017-03-08 03:21:37 +03:00
|
|
|
if (zfsvfs->z_ctldir == NULL)
|
2013-03-08 22:41:28 +04:00
|
|
|
return (SET_ERROR(ENOENT));
|
2011-11-11 11:15:53 +04:00
|
|
|
|
|
|
|
return (0);
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
2015-04-25 02:21:13 +03:00
|
|
|
* Destroy the '.zfs' directory or remove a snapshot from zfs_snapshots_by_name.
|
|
|
|
* Only called when the filesystem is unmounted.
|
2011-11-11 11:15:53 +04:00
|
|
|
*/
|
|
|
|
void
|
2017-03-08 03:21:37 +03:00
|
|
|
zfsctl_destroy(zfsvfs_t *zfsvfs)
|
2011-11-11 11:15:53 +04:00
|
|
|
{
|
2017-03-08 03:21:37 +03:00
|
|
|
if (zfsvfs->z_issnap) {
|
2015-04-25 02:21:13 +03:00
|
|
|
zfs_snapentry_t *se;
|
2017-03-08 03:21:37 +03:00
|
|
|
spa_t *spa = zfsvfs->z_os->os_spa;
|
|
|
|
uint64_t objsetid = dmu_objset_id(zfsvfs->z_os);
|
2015-04-25 02:21:13 +03:00
|
|
|
|
2015-12-11 02:53:37 +03:00
|
|
|
rw_enter(&zfs_snapshot_lock, RW_WRITER);
|
2018-07-28 16:02:12 +03:00
|
|
|
se = zfsctl_snapshot_find_by_objsetid(spa, objsetid);
|
|
|
|
if (se != NULL)
|
2015-04-25 02:21:13 +03:00
|
|
|
zfsctl_snapshot_remove(se);
|
2018-07-28 16:02:12 +03:00
|
|
|
rw_exit(&zfs_snapshot_lock);
|
|
|
|
if (se != NULL) {
|
|
|
|
zfsctl_snapshot_unmount_cancel(se);
|
2015-04-25 02:21:13 +03:00
|
|
|
zfsctl_snapshot_rele(se);
|
|
|
|
}
|
2017-03-08 03:21:37 +03:00
|
|
|
} else if (zfsvfs->z_ctldir) {
|
|
|
|
iput(zfsvfs->z_ctldir);
|
|
|
|
zfsvfs->z_ctldir = NULL;
|
2015-04-25 02:21:13 +03:00
|
|
|
}
|
2011-11-11 11:15:53 +04:00
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Given a root znode, retrieve the associated .zfs directory.
|
|
|
|
* Add a hold to the vnode and return it.
|
|
|
|
*/
|
|
|
|
struct inode *
|
|
|
|
zfsctl_root(znode_t *zp)
|
|
|
|
{
|
|
|
|
ASSERT(zfs_has_ctldir(zp));
|
2021-03-17 02:33:34 +03:00
|
|
|
/* Must have an existing ref, so igrab() cannot return NULL */
|
|
|
|
VERIFY3P(igrab(ZTOZSB(zp)->z_ctldir), !=, NULL);
|
2011-11-11 11:15:53 +04:00
|
|
|
return (ZTOZSB(zp)->z_ctldir);
|
|
|
|
}
|
2017-03-08 20:26:33 +03:00
|
|
|
|
2015-08-29 00:54:32 +03:00
|
|
|
/*
|
2017-03-08 20:26:33 +03:00
|
|
|
* Generate a long fid to indicate a snapdir. We encode whether snapdir is
|
2019-09-03 03:56:41 +03:00
|
|
|
* already mounted in gen field. We do this because nfsd lookup will not
|
2017-03-08 20:26:33 +03:00
|
|
|
* trigger automount. Next time the nfsd does fh_to_dentry, we will notice
|
|
|
|
* this and do automount and return ESTALE to force nfsd revalidate and follow
|
|
|
|
* mount.
|
2015-08-29 00:54:32 +03:00
|
|
|
*/
|
|
|
|
static int
|
|
|
|
zfsctl_snapdir_fid(struct inode *ip, fid_t *fidp)
|
|
|
|
{
|
|
|
|
zfid_short_t *zfid = (zfid_short_t *)fidp;
|
|
|
|
zfid_long_t *zlfid = (zfid_long_t *)fidp;
|
|
|
|
uint32_t gen = 0;
|
|
|
|
uint64_t object;
|
|
|
|
uint64_t objsetid;
|
|
|
|
int i;
|
2017-03-08 20:26:33 +03:00
|
|
|
struct dentry *dentry;
|
|
|
|
|
|
|
|
if (fidp->fid_len < LONG_FID_LEN) {
|
|
|
|
fidp->fid_len = LONG_FID_LEN;
|
|
|
|
return (SET_ERROR(ENOSPC));
|
|
|
|
}
|
2015-08-29 00:54:32 +03:00
|
|
|
|
2017-03-08 20:26:33 +03:00
|
|
|
object = ip->i_ino;
|
2015-08-29 00:54:32 +03:00
|
|
|
objsetid = ZFSCTL_INO_SNAPDIRS - ip->i_ino;
|
|
|
|
zfid->zf_len = LONG_FID_LEN;
|
|
|
|
|
2017-03-08 20:26:33 +03:00
|
|
|
dentry = d_obtain_alias(igrab(ip));
|
|
|
|
if (!IS_ERR(dentry)) {
|
|
|
|
gen = !!d_mountpoint(dentry);
|
|
|
|
dput(dentry);
|
|
|
|
}
|
|
|
|
|
2015-08-29 00:54:32 +03:00
|
|
|
for (i = 0; i < sizeof (zfid->zf_object); i++)
|
|
|
|
zfid->zf_object[i] = (uint8_t)(object >> (8 * i));
|
|
|
|
|
|
|
|
for (i = 0; i < sizeof (zfid->zf_gen); i++)
|
|
|
|
zfid->zf_gen[i] = (uint8_t)(gen >> (8 * i));
|
|
|
|
|
|
|
|
for (i = 0; i < sizeof (zlfid->zf_setid); i++)
|
|
|
|
zlfid->zf_setid[i] = (uint8_t)(objsetid >> (8 * i));
|
|
|
|
|
|
|
|
for (i = 0; i < sizeof (zlfid->zf_setgen); i++)
|
|
|
|
zlfid->zf_setgen[i] = 0;
|
|
|
|
|
|
|
|
return (0);
|
|
|
|
}
|
2011-11-11 11:15:53 +04:00
|
|
|
|
2015-08-29 00:54:32 +03:00
|
|
|
/*
|
|
|
|
* Generate an appropriate fid for an entry in the .zfs directory.
|
|
|
|
*/
|
2011-11-11 11:15:53 +04:00
|
|
|
int
|
|
|
|
zfsctl_fid(struct inode *ip, fid_t *fidp)
|
|
|
|
{
|
|
|
|
znode_t *zp = ITOZ(ip);
|
2017-03-08 03:21:37 +03:00
|
|
|
zfsvfs_t *zfsvfs = ITOZSB(ip);
|
2011-11-11 11:15:53 +04:00
|
|
|
uint64_t object = zp->z_id;
|
|
|
|
zfid_short_t *zfid;
|
|
|
|
int i;
|
2022-09-16 23:36:47 +03:00
|
|
|
int error;
|
2011-11-11 11:15:53 +04:00
|
|
|
|
2022-09-16 23:36:47 +03:00
|
|
|
if ((error = zfs_enter(zfsvfs, FTAG)) != 0)
|
|
|
|
return (error);
|
2011-11-11 11:15:53 +04:00
|
|
|
|
2017-03-08 20:26:33 +03:00
|
|
|
if (zfsctl_is_snapdir(ip)) {
|
2022-09-16 23:36:47 +03:00
|
|
|
zfs_exit(zfsvfs, FTAG);
|
2017-03-08 20:26:33 +03:00
|
|
|
return (zfsctl_snapdir_fid(ip, fidp));
|
2011-11-11 11:15:53 +04:00
|
|
|
}
|
|
|
|
|
2017-03-08 20:26:33 +03:00
|
|
|
if (fidp->fid_len < SHORT_FID_LEN) {
|
|
|
|
fidp->fid_len = SHORT_FID_LEN;
|
2022-09-16 23:36:47 +03:00
|
|
|
zfs_exit(zfsvfs, FTAG);
|
2017-03-08 20:26:33 +03:00
|
|
|
return (SET_ERROR(ENOSPC));
|
2015-08-29 00:54:32 +03:00
|
|
|
}
|
|
|
|
|
2011-11-11 11:15:53 +04:00
|
|
|
zfid = (zfid_short_t *)fidp;
|
|
|
|
|
|
|
|
zfid->zf_len = SHORT_FID_LEN;
|
|
|
|
|
|
|
|
for (i = 0; i < sizeof (zfid->zf_object); i++)
|
|
|
|
zfid->zf_object[i] = (uint8_t)(object >> (8 * i));
|
|
|
|
|
|
|
|
/* .zfs znodes always have a generation number of 0 */
|
|
|
|
for (i = 0; i < sizeof (zfid->zf_gen); i++)
|
|
|
|
zfid->zf_gen[i] = 0;
|
|
|
|
|
2022-09-16 23:36:47 +03:00
|
|
|
zfs_exit(zfsvfs, FTAG);
|
2011-11-11 11:15:53 +04:00
|
|
|
return (0);
|
|
|
|
}
|
|
|
|
|
2015-04-25 02:21:13 +03:00
|
|
|
/*
|
|
|
|
* Construct a full dataset name in full_name: "pool/dataset@snap_name"
|
|
|
|
*/
|
2011-11-11 11:15:53 +04:00
|
|
|
static int
|
2017-03-08 03:21:37 +03:00
|
|
|
zfsctl_snapshot_name(zfsvfs_t *zfsvfs, const char *snap_name, int len,
|
2015-04-25 02:21:13 +03:00
|
|
|
char *full_name)
|
2011-11-11 11:15:53 +04:00
|
|
|
{
|
2017-03-08 03:21:37 +03:00
|
|
|
objset_t *os = zfsvfs->z_os;
|
2011-11-11 11:15:53 +04:00
|
|
|
|
2015-04-25 02:21:13 +03:00
|
|
|
if (zfs_component_namecheck(snap_name, NULL, NULL) != 0)
|
2013-03-08 22:41:28 +04:00
|
|
|
return (SET_ERROR(EILSEQ));
|
2011-11-11 11:15:53 +04:00
|
|
|
|
2015-04-25 02:21:13 +03:00
|
|
|
dmu_objset_name(os, full_name);
|
|
|
|
if ((strlen(full_name) + 1 + strlen(snap_name)) >= len)
|
2013-03-08 22:41:28 +04:00
|
|
|
return (SET_ERROR(ENAMETOOLONG));
|
2011-11-11 11:15:53 +04:00
|
|
|
|
2015-04-25 02:21:13 +03:00
|
|
|
(void) strcat(full_name, "@");
|
|
|
|
(void) strcat(full_name, snap_name);
|
2011-11-11 11:15:53 +04:00
|
|
|
|
|
|
|
return (0);
|
|
|
|
}
|
|
|
|
|
2015-08-29 00:54:32 +03:00
|
|
|
/*
|
|
|
|
* Returns full path in full_path: "/pool/dataset/.zfs/snapshot/snap_name/"
|
|
|
|
*/
|
|
|
|
static int
|
2017-03-08 03:21:37 +03:00
|
|
|
zfsctl_snapshot_path_objset(zfsvfs_t *zfsvfs, uint64_t objsetid,
|
2015-08-29 00:54:32 +03:00
|
|
|
int path_len, char *full_path)
|
|
|
|
{
|
2017-03-08 03:21:37 +03:00
|
|
|
objset_t *os = zfsvfs->z_os;
|
2015-08-29 00:54:32 +03:00
|
|
|
fstrans_cookie_t cookie;
|
|
|
|
char *snapname;
|
|
|
|
boolean_t case_conflict;
|
|
|
|
uint64_t id, pos = 0;
|
|
|
|
int error = 0;
|
|
|
|
|
|
|
|
cookie = spl_fstrans_mark();
|
2016-06-16 00:28:36 +03:00
|
|
|
snapname = kmem_alloc(ZFS_MAX_DATASET_NAME_LEN, KM_SLEEP);
|
2015-08-29 00:54:32 +03:00
|
|
|
|
|
|
|
while (error == 0) {
|
|
|
|
dsl_pool_config_enter(dmu_objset_pool(os), FTAG);
|
2017-03-08 03:21:37 +03:00
|
|
|
error = dmu_snapshot_list_next(zfsvfs->z_os,
|
2016-06-16 00:28:36 +03:00
|
|
|
ZFS_MAX_DATASET_NAME_LEN, snapname, &id, &pos,
|
|
|
|
&case_conflict);
|
2015-08-29 00:54:32 +03:00
|
|
|
dsl_pool_config_exit(dmu_objset_pool(os), FTAG);
|
|
|
|
if (error)
|
|
|
|
goto out;
|
|
|
|
|
|
|
|
if (id == objsetid)
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
Fix inconsistent mount options for ZFS root
While mounting ZFS root during boot on Linux distributions from initrd,
mount from busybox is effectively used which executes mount system call
directly. This skips the ZFS helper mount.zfs, which checks and enables
the mount options as specified in dataset properties. As a result,
datasets mounted during boot from initrd do not have correct mount
options as specified in ZFS dataset properties.
There has been an attempt to use mount.zfs in zfs initrd script,
responsible for mounting the ZFS root filesystem (PR#13305). This was
later reverted (PR#14908) after discovering that using mount.zfs breaks
mounting of snapshots on root (/) and other child datasets of root have
the same issue (Issue#9461).
This happens because switching from busybox mount to mount.zfs correctly
parses the mount options but also adds 'mntpoint=/root' to the mount
options, which is then prepended to the snapshot mountpoint in
'.zfs/snapshot'. '/root' is the directory on Debian with initramfs-tools
where root filesystem is mounted before pivot_root. When Linux runtime
is reached, trying to access the snapshots on root results in
automounting the snapshot on '/root/.zfs/*', which fails.
This commit attempts to fix the automounting of snapshots on root, while
using mount.zfs in initrd script. Since the mountpoint of dataset is
stored in vfs_mntpoint field, we can check if current mountpoint of
dataset and vfs_mntpoint are same or not. If they are not same, reset
the vfs_mntpoint field with current mountpoint. This fixes the
mountpoints of root dataset and children in respective vfs_mntpoint
fields when we try to access the snapshots of root dataset or its
children. With correct mountpoint for root dataset and children stored
in vfs_mntpoint, all snapshots of root dataset are mounted correctly
and become accessible.
This fix will come into play only if current process, that is trying to
access the snapshots is not in chroot context. The Linux kernel API
that is used to convert struct path into char format (d_path), returns
the complete path for given struct path. It works in chroot environment
as well and returns the correct path from original filesystem root.
However d_path fails to return the complete path if any directory from
original root filesystem is mounted using --bind flag or --rbind flag
in chroot environment. In this case, if we try to access the snapshot
from outside the chroot environment, d_path returns the path correctly,
i.e. it returns the correct path to the directory that is mounted with
--bind flag. However inside the chroot environment, it only returns the
path inside chroot.
For now, there is not a better way in my understanding that gives the
complete path in char format and handles the case where directories from
root filesystem are mounted with --bind or --rbind on another path which
user will later chroot into. So this fix gets enabled if current
process trying to access the snapshot is not in chroot context.
With the snapshots issue fixed for root filesystem, using mount.zfs in
ZFS initrd script, mounts the datasets with correct mount options.
Reviewed-by: Brian Behlendorf <behlendorf1@llnl.gov>
Reviewed-by: Alexander Motin <mav@FreeBSD.org>
Reviewed-by: Ameer Hamza <ahamza@ixsystems.com>
Signed-off-by: Umer Saleem <usaleem@ixsystems.com>
Closes #16646
2024-10-17 16:09:39 +03:00
|
|
|
mutex_enter(&zfsvfs->z_vfs->vfs_mntpt_lock);
|
|
|
|
if (zfsvfs->z_vfs->vfs_mntpoint != NULL) {
|
|
|
|
snprintf(full_path, path_len, "%s/.zfs/snapshot/%s",
|
|
|
|
zfsvfs->z_vfs->vfs_mntpoint, snapname);
|
|
|
|
} else
|
|
|
|
error = SET_ERROR(ENOENT);
|
|
|
|
mutex_exit(&zfsvfs->z_vfs->vfs_mntpt_lock);
|
|
|
|
|
2015-08-29 00:54:32 +03:00
|
|
|
out:
|
2016-06-16 00:28:36 +03:00
|
|
|
kmem_free(snapname, ZFS_MAX_DATASET_NAME_LEN);
|
2015-08-29 00:54:32 +03:00
|
|
|
spl_fstrans_unmark(cookie);
|
|
|
|
|
|
|
|
return (error);
|
|
|
|
}
|
|
|
|
|
2011-11-11 11:15:53 +04:00
|
|
|
/*
|
|
|
|
* Special case the handling of "..".
|
|
|
|
*/
|
|
|
|
int
|
2020-10-03 03:44:10 +03:00
|
|
|
zfsctl_root_lookup(struct inode *dip, const char *name, struct inode **ipp,
|
2011-11-11 11:15:53 +04:00
|
|
|
int flags, cred_t *cr, int *direntflags, pathname_t *realpnp)
|
|
|
|
{
|
2017-03-08 03:21:37 +03:00
|
|
|
zfsvfs_t *zfsvfs = ITOZSB(dip);
|
2011-11-11 11:15:53 +04:00
|
|
|
int error = 0;
|
|
|
|
|
2022-09-16 23:36:47 +03:00
|
|
|
if ((error = zfs_enter(zfsvfs, FTAG)) != 0)
|
|
|
|
return (error);
|
2011-11-11 11:15:53 +04:00
|
|
|
|
2024-10-02 19:12:02 +03:00
|
|
|
if (zfsvfs->z_show_ctldir == ZFS_SNAPDIR_DISABLED) {
|
|
|
|
*ipp = NULL;
|
|
|
|
} else if (strcmp(name, "..") == 0) {
|
2011-11-11 11:15:53 +04:00
|
|
|
*ipp = dip->i_sb->s_root->d_inode;
|
|
|
|
} else if (strcmp(name, ZFS_SNAPDIR_NAME) == 0) {
|
2017-03-08 03:21:37 +03:00
|
|
|
*ipp = zfsctl_inode_lookup(zfsvfs, ZFSCTL_INO_SNAPDIR,
|
2011-11-11 11:15:53 +04:00
|
|
|
&zpl_fops_snapdir, &zpl_ops_snapdir);
|
|
|
|
} else if (strcmp(name, ZFS_SHAREDIR_NAME) == 0) {
|
2017-03-08 03:21:37 +03:00
|
|
|
*ipp = zfsctl_inode_lookup(zfsvfs, ZFSCTL_INO_SHARES,
|
2011-11-11 11:15:53 +04:00
|
|
|
&zpl_fops_shares, &zpl_ops_shares);
|
|
|
|
} else {
|
|
|
|
*ipp = NULL;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (*ipp == NULL)
|
2013-03-08 22:41:28 +04:00
|
|
|
error = SET_ERROR(ENOENT);
|
2011-11-11 11:15:53 +04:00
|
|
|
|
2022-09-16 23:36:47 +03:00
|
|
|
zfs_exit(zfsvfs, FTAG);
|
2011-11-11 11:15:53 +04:00
|
|
|
|
|
|
|
return (error);
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Lookup entry point for the 'snapshot' directory. Try to open the
|
|
|
|
* snapshot if it exist, creating the pseudo filesystem inode as necessary.
|
|
|
|
*/
|
|
|
|
int
|
2020-10-03 03:44:10 +03:00
|
|
|
zfsctl_snapdir_lookup(struct inode *dip, const char *name, struct inode **ipp,
|
2011-11-11 11:15:53 +04:00
|
|
|
int flags, cred_t *cr, int *direntflags, pathname_t *realpnp)
|
|
|
|
{
|
2017-03-08 03:21:37 +03:00
|
|
|
zfsvfs_t *zfsvfs = ITOZSB(dip);
|
2011-11-11 11:15:53 +04:00
|
|
|
uint64_t id;
|
|
|
|
int error;
|
|
|
|
|
2022-09-16 23:36:47 +03:00
|
|
|
if ((error = zfs_enter(zfsvfs, FTAG)) != 0)
|
|
|
|
return (error);
|
2011-11-11 11:15:53 +04:00
|
|
|
|
2017-03-08 03:21:37 +03:00
|
|
|
error = dmu_snapshot_lookup(zfsvfs->z_os, name, &id);
|
2011-11-11 11:15:53 +04:00
|
|
|
if (error) {
|
2022-09-16 23:36:47 +03:00
|
|
|
zfs_exit(zfsvfs, FTAG);
|
2011-11-11 11:15:53 +04:00
|
|
|
return (error);
|
|
|
|
}
|
|
|
|
|
2017-03-08 03:21:37 +03:00
|
|
|
*ipp = zfsctl_inode_lookup(zfsvfs, ZFSCTL_INO_SNAPDIRS - id,
|
2011-11-11 11:15:53 +04:00
|
|
|
&simple_dir_operations, &simple_dir_inode_operations);
|
2015-04-25 02:21:13 +03:00
|
|
|
if (*ipp == NULL)
|
2013-03-08 22:41:28 +04:00
|
|
|
error = SET_ERROR(ENOENT);
|
2011-11-11 11:15:53 +04:00
|
|
|
|
2022-09-16 23:36:47 +03:00
|
|
|
zfs_exit(zfsvfs, FTAG);
|
2011-11-11 11:15:53 +04:00
|
|
|
|
|
|
|
return (error);
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Renaming a directory under '.zfs/snapshot' will automatically trigger
|
|
|
|
* a rename of the snapshot to the new given name. The rename is confined
|
|
|
|
* to the '.zfs/snapshot' directory snapshots cannot be moved elsewhere.
|
|
|
|
*/
|
|
|
|
int
|
2020-10-03 03:44:10 +03:00
|
|
|
zfsctl_snapdir_rename(struct inode *sdip, const char *snm,
|
|
|
|
struct inode *tdip, const char *tnm, cred_t *cr, int flags)
|
2011-11-11 11:15:53 +04:00
|
|
|
{
|
2017-03-08 03:21:37 +03:00
|
|
|
zfsvfs_t *zfsvfs = ITOZSB(sdip);
|
2013-09-04 16:00:57 +04:00
|
|
|
char *to, *from, *real, *fsname;
|
2011-11-11 11:15:53 +04:00
|
|
|
int error;
|
|
|
|
|
2015-08-29 00:54:32 +03:00
|
|
|
if (!zfs_admin_snapshot)
|
2017-08-03 07:16:12 +03:00
|
|
|
return (SET_ERROR(EACCES));
|
2015-08-29 00:54:32 +03:00
|
|
|
|
2022-09-16 23:36:47 +03:00
|
|
|
if ((error = zfs_enter(zfsvfs, FTAG)) != 0)
|
|
|
|
return (error);
|
2011-11-11 11:15:53 +04:00
|
|
|
|
2016-06-16 00:28:36 +03:00
|
|
|
to = kmem_alloc(ZFS_MAX_DATASET_NAME_LEN, KM_SLEEP);
|
|
|
|
from = kmem_alloc(ZFS_MAX_DATASET_NAME_LEN, KM_SLEEP);
|
|
|
|
real = kmem_alloc(ZFS_MAX_DATASET_NAME_LEN, KM_SLEEP);
|
|
|
|
fsname = kmem_alloc(ZFS_MAX_DATASET_NAME_LEN, KM_SLEEP);
|
2011-11-11 11:15:53 +04:00
|
|
|
|
2017-03-08 03:21:37 +03:00
|
|
|
if (zfsvfs->z_case == ZFS_CASE_INSENSITIVE) {
|
|
|
|
error = dmu_snapshot_realname(zfsvfs->z_os, snm, real,
|
2016-06-16 00:28:36 +03:00
|
|
|
ZFS_MAX_DATASET_NAME_LEN, NULL);
|
2011-11-11 11:15:53 +04:00
|
|
|
if (error == 0) {
|
2013-09-04 16:00:57 +04:00
|
|
|
snm = real;
|
2011-11-11 11:15:53 +04:00
|
|
|
} else if (error != ENOTSUP) {
|
|
|
|
goto out;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2017-03-08 03:21:37 +03:00
|
|
|
dmu_objset_name(zfsvfs->z_os, fsname);
|
2013-09-04 16:00:57 +04:00
|
|
|
|
2016-06-16 00:28:36 +03:00
|
|
|
error = zfsctl_snapshot_name(ITOZSB(sdip), snm,
|
|
|
|
ZFS_MAX_DATASET_NAME_LEN, from);
|
2013-09-04 16:00:57 +04:00
|
|
|
if (error == 0)
|
2016-06-16 00:28:36 +03:00
|
|
|
error = zfsctl_snapshot_name(ITOZSB(tdip), tnm,
|
2016-12-12 21:46:26 +03:00
|
|
|
ZFS_MAX_DATASET_NAME_LEN, to);
|
2013-09-04 16:00:57 +04:00
|
|
|
if (error == 0)
|
2011-11-11 11:15:53 +04:00
|
|
|
error = zfs_secpolicy_rename_perms(from, to, cr);
|
2013-09-04 16:00:57 +04:00
|
|
|
if (error != 0)
|
2011-11-11 11:15:53 +04:00
|
|
|
goto out;
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Cannot move snapshots out of the snapdir.
|
|
|
|
*/
|
|
|
|
if (sdip != tdip) {
|
2013-03-08 22:41:28 +04:00
|
|
|
error = SET_ERROR(EINVAL);
|
2011-11-11 11:15:53 +04:00
|
|
|
goto out;
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* No-op when names are identical.
|
|
|
|
*/
|
2013-09-04 16:00:57 +04:00
|
|
|
if (strcmp(snm, tnm) == 0) {
|
2011-11-11 11:15:53 +04:00
|
|
|
error = 0;
|
|
|
|
goto out;
|
|
|
|
}
|
|
|
|
|
2015-12-11 02:53:37 +03:00
|
|
|
rw_enter(&zfs_snapshot_lock, RW_WRITER);
|
2011-11-11 11:15:53 +04:00
|
|
|
|
2013-09-04 16:00:57 +04:00
|
|
|
error = dsl_dataset_rename_snapshot(fsname, snm, tnm, B_FALSE);
|
2015-04-25 02:21:13 +03:00
|
|
|
if (error == 0)
|
|
|
|
(void) zfsctl_snapshot_rename(snm, tnm);
|
2011-11-11 11:15:53 +04:00
|
|
|
|
2015-12-11 02:53:37 +03:00
|
|
|
rw_exit(&zfs_snapshot_lock);
|
2011-11-11 11:15:53 +04:00
|
|
|
out:
|
2016-06-16 00:28:36 +03:00
|
|
|
kmem_free(from, ZFS_MAX_DATASET_NAME_LEN);
|
|
|
|
kmem_free(to, ZFS_MAX_DATASET_NAME_LEN);
|
|
|
|
kmem_free(real, ZFS_MAX_DATASET_NAME_LEN);
|
|
|
|
kmem_free(fsname, ZFS_MAX_DATASET_NAME_LEN);
|
2011-11-11 11:15:53 +04:00
|
|
|
|
2022-09-16 23:36:47 +03:00
|
|
|
zfs_exit(zfsvfs, FTAG);
|
2011-11-11 11:15:53 +04:00
|
|
|
|
|
|
|
return (error);
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Removing a directory under '.zfs/snapshot' will automatically trigger
|
|
|
|
* the removal of the snapshot with the given name.
|
|
|
|
*/
|
|
|
|
int
|
2020-10-03 03:44:10 +03:00
|
|
|
zfsctl_snapdir_remove(struct inode *dip, const char *name, cred_t *cr,
|
|
|
|
int flags)
|
2011-11-11 11:15:53 +04:00
|
|
|
{
|
2017-03-08 03:21:37 +03:00
|
|
|
zfsvfs_t *zfsvfs = ITOZSB(dip);
|
2011-11-11 11:15:53 +04:00
|
|
|
char *snapname, *real;
|
|
|
|
int error;
|
|
|
|
|
2015-08-29 00:54:32 +03:00
|
|
|
if (!zfs_admin_snapshot)
|
2017-08-03 07:16:12 +03:00
|
|
|
return (SET_ERROR(EACCES));
|
2015-08-29 00:54:32 +03:00
|
|
|
|
2022-09-16 23:36:47 +03:00
|
|
|
if ((error = zfs_enter(zfsvfs, FTAG)) != 0)
|
|
|
|
return (error);
|
2011-11-11 11:15:53 +04:00
|
|
|
|
2016-06-16 00:28:36 +03:00
|
|
|
snapname = kmem_alloc(ZFS_MAX_DATASET_NAME_LEN, KM_SLEEP);
|
|
|
|
real = kmem_alloc(ZFS_MAX_DATASET_NAME_LEN, KM_SLEEP);
|
2011-11-11 11:15:53 +04:00
|
|
|
|
2017-03-08 03:21:37 +03:00
|
|
|
if (zfsvfs->z_case == ZFS_CASE_INSENSITIVE) {
|
|
|
|
error = dmu_snapshot_realname(zfsvfs->z_os, name, real,
|
2016-06-16 00:28:36 +03:00
|
|
|
ZFS_MAX_DATASET_NAME_LEN, NULL);
|
2011-11-11 11:15:53 +04:00
|
|
|
if (error == 0) {
|
|
|
|
name = real;
|
|
|
|
} else if (error != ENOTSUP) {
|
|
|
|
goto out;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2016-06-16 00:28:36 +03:00
|
|
|
error = zfsctl_snapshot_name(ITOZSB(dip), name,
|
|
|
|
ZFS_MAX_DATASET_NAME_LEN, snapname);
|
2013-09-04 16:00:57 +04:00
|
|
|
if (error == 0)
|
2011-11-11 11:15:53 +04:00
|
|
|
error = zfs_secpolicy_destroy_perms(snapname, cr);
|
2013-09-04 16:00:57 +04:00
|
|
|
if (error != 0)
|
2011-11-11 11:15:53 +04:00
|
|
|
goto out;
|
|
|
|
|
2015-04-25 02:21:13 +03:00
|
|
|
error = zfsctl_snapshot_unmount(snapname, MNT_FORCE);
|
2011-11-11 11:15:53 +04:00
|
|
|
if ((error == 0) || (error == ENOENT))
|
2013-09-04 16:00:57 +04:00
|
|
|
error = dsl_destroy_snapshot(snapname, B_FALSE);
|
2011-11-11 11:15:53 +04:00
|
|
|
out:
|
2016-06-16 00:28:36 +03:00
|
|
|
kmem_free(snapname, ZFS_MAX_DATASET_NAME_LEN);
|
|
|
|
kmem_free(real, ZFS_MAX_DATASET_NAME_LEN);
|
2011-11-11 11:15:53 +04:00
|
|
|
|
2022-09-16 23:36:47 +03:00
|
|
|
zfs_exit(zfsvfs, FTAG);
|
2011-11-11 11:15:53 +04:00
|
|
|
|
|
|
|
return (error);
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Creating a directory under '.zfs/snapshot' will automatically trigger
|
|
|
|
* the creation of a new snapshot with the given name.
|
|
|
|
*/
|
|
|
|
int
|
2020-10-03 03:44:10 +03:00
|
|
|
zfsctl_snapdir_mkdir(struct inode *dip, const char *dirname, vattr_t *vap,
|
2017-01-21 00:17:55 +03:00
|
|
|
struct inode **ipp, cred_t *cr, int flags)
|
2011-11-11 11:15:53 +04:00
|
|
|
{
|
2017-03-08 03:21:37 +03:00
|
|
|
zfsvfs_t *zfsvfs = ITOZSB(dip);
|
2011-11-11 11:15:53 +04:00
|
|
|
char *dsname;
|
|
|
|
int error;
|
|
|
|
|
2015-08-29 00:54:32 +03:00
|
|
|
if (!zfs_admin_snapshot)
|
2017-08-03 07:16:12 +03:00
|
|
|
return (SET_ERROR(EACCES));
|
2015-08-29 00:54:32 +03:00
|
|
|
|
2016-06-16 00:28:36 +03:00
|
|
|
dsname = kmem_alloc(ZFS_MAX_DATASET_NAME_LEN, KM_SLEEP);
|
2011-11-11 11:15:53 +04:00
|
|
|
|
2013-12-12 02:33:41 +04:00
|
|
|
if (zfs_component_namecheck(dirname, NULL, NULL) != 0) {
|
2013-03-08 22:41:28 +04:00
|
|
|
error = SET_ERROR(EILSEQ);
|
2011-11-11 11:15:53 +04:00
|
|
|
goto out;
|
|
|
|
}
|
|
|
|
|
2017-03-08 03:21:37 +03:00
|
|
|
dmu_objset_name(zfsvfs->z_os, dsname);
|
2011-11-11 11:15:53 +04:00
|
|
|
|
|
|
|
error = zfs_secpolicy_snapshot_perms(dsname, cr);
|
2013-09-04 16:00:57 +04:00
|
|
|
if (error != 0)
|
2011-11-11 11:15:53 +04:00
|
|
|
goto out;
|
|
|
|
|
|
|
|
if (error == 0) {
|
2013-08-28 15:45:09 +04:00
|
|
|
error = dmu_objset_snapshot_one(dsname, dirname);
|
2013-09-04 16:00:57 +04:00
|
|
|
if (error != 0)
|
2011-11-11 11:15:53 +04:00
|
|
|
goto out;
|
|
|
|
|
|
|
|
error = zfsctl_snapdir_lookup(dip, dirname, ipp,
|
|
|
|
0, cr, NULL, NULL);
|
|
|
|
}
|
|
|
|
out:
|
2016-06-16 00:28:36 +03:00
|
|
|
kmem_free(dsname, ZFS_MAX_DATASET_NAME_LEN);
|
2011-11-11 11:15:53 +04:00
|
|
|
|
|
|
|
return (error);
|
|
|
|
}
|
|
|
|
|
2020-08-25 03:33:02 +03:00
|
|
|
/*
|
|
|
|
* Flush everything out of the kernel's export table and such.
|
|
|
|
* This is needed as once the snapshot is used over NFS, its
|
|
|
|
* entries in svc_export and svc_expkey caches hold reference
|
|
|
|
* to the snapshot mount point. There is no known way of flushing
|
|
|
|
* only the entries related to the snapshot.
|
|
|
|
*/
|
|
|
|
static void
|
|
|
|
exportfs_flush(void)
|
|
|
|
{
|
|
|
|
char *argv[] = { "/usr/sbin/exportfs", "-f", NULL };
|
|
|
|
char *envp[] = { NULL };
|
|
|
|
|
|
|
|
(void) call_usermodehelper(argv[0], argv, envp, UMH_WAIT_PROC);
|
|
|
|
}
|
|
|
|
|
Fix inconsistent mount options for ZFS root
While mounting ZFS root during boot on Linux distributions from initrd,
mount from busybox is effectively used which executes mount system call
directly. This skips the ZFS helper mount.zfs, which checks and enables
the mount options as specified in dataset properties. As a result,
datasets mounted during boot from initrd do not have correct mount
options as specified in ZFS dataset properties.
There has been an attempt to use mount.zfs in zfs initrd script,
responsible for mounting the ZFS root filesystem (PR#13305). This was
later reverted (PR#14908) after discovering that using mount.zfs breaks
mounting of snapshots on root (/) and other child datasets of root have
the same issue (Issue#9461).
This happens because switching from busybox mount to mount.zfs correctly
parses the mount options but also adds 'mntpoint=/root' to the mount
options, which is then prepended to the snapshot mountpoint in
'.zfs/snapshot'. '/root' is the directory on Debian with initramfs-tools
where root filesystem is mounted before pivot_root. When Linux runtime
is reached, trying to access the snapshots on root results in
automounting the snapshot on '/root/.zfs/*', which fails.
This commit attempts to fix the automounting of snapshots on root, while
using mount.zfs in initrd script. Since the mountpoint of dataset is
stored in vfs_mntpoint field, we can check if current mountpoint of
dataset and vfs_mntpoint are same or not. If they are not same, reset
the vfs_mntpoint field with current mountpoint. This fixes the
mountpoints of root dataset and children in respective vfs_mntpoint
fields when we try to access the snapshots of root dataset or its
children. With correct mountpoint for root dataset and children stored
in vfs_mntpoint, all snapshots of root dataset are mounted correctly
and become accessible.
This fix will come into play only if current process, that is trying to
access the snapshots is not in chroot context. The Linux kernel API
that is used to convert struct path into char format (d_path), returns
the complete path for given struct path. It works in chroot environment
as well and returns the correct path from original filesystem root.
However d_path fails to return the complete path if any directory from
original root filesystem is mounted using --bind flag or --rbind flag
in chroot environment. In this case, if we try to access the snapshot
from outside the chroot environment, d_path returns the path correctly,
i.e. it returns the correct path to the directory that is mounted with
--bind flag. However inside the chroot environment, it only returns the
path inside chroot.
For now, there is not a better way in my understanding that gives the
complete path in char format and handles the case where directories from
root filesystem are mounted with --bind or --rbind on another path which
user will later chroot into. So this fix gets enabled if current
process trying to access the snapshot is not in chroot context.
With the snapshots issue fixed for root filesystem, using mount.zfs in
ZFS initrd script, mounts the datasets with correct mount options.
Reviewed-by: Brian Behlendorf <behlendorf1@llnl.gov>
Reviewed-by: Alexander Motin <mav@FreeBSD.org>
Reviewed-by: Ameer Hamza <ahamza@ixsystems.com>
Signed-off-by: Umer Saleem <usaleem@ixsystems.com>
Closes #16646
2024-10-17 16:09:39 +03:00
|
|
|
/*
|
|
|
|
* Returns the path in char format for given struct path. Uses
|
|
|
|
* d_path exported by kernel to convert struct path to char
|
|
|
|
* format. Returns the correct path for mountpoints and chroot
|
|
|
|
* environments.
|
|
|
|
*
|
|
|
|
* If chroot environment has directories that are mounted with
|
|
|
|
* --bind or --rbind flag, d_path returns the complete path inside
|
|
|
|
* chroot environment but does not return the absolute path, i.e.
|
|
|
|
* the path to chroot environment is missing.
|
|
|
|
*/
|
|
|
|
static int
|
|
|
|
get_root_path(struct path *path, char *buff, int len)
|
|
|
|
{
|
|
|
|
char *path_buffer, *path_ptr;
|
|
|
|
int error = 0;
|
|
|
|
|
|
|
|
path_get(path);
|
|
|
|
path_buffer = kmem_zalloc(len, KM_SLEEP);
|
|
|
|
path_ptr = d_path(path, path_buffer, len);
|
|
|
|
if (IS_ERR(path_ptr))
|
|
|
|
error = SET_ERROR(-PTR_ERR(path_ptr));
|
|
|
|
else
|
|
|
|
strcpy(buff, path_ptr);
|
|
|
|
|
|
|
|
kmem_free(path_buffer, len);
|
|
|
|
path_put(path);
|
|
|
|
return (error);
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Returns if the current process root is chrooted or not. Linux
|
|
|
|
* kernel exposes the task_struct for current process and init.
|
|
|
|
* Since init process root points to actual root filesystem when
|
|
|
|
* Linux runtime is reached, we can compare the current process
|
|
|
|
* root with init process root to determine if root of the current
|
|
|
|
* process is different from init, which can reliably determine if
|
|
|
|
* current process is in chroot context or not.
|
|
|
|
*/
|
|
|
|
static int
|
|
|
|
is_current_chrooted(void)
|
|
|
|
{
|
|
|
|
struct task_struct *curr = current, *global = &init_task;
|
|
|
|
struct path cr_root, gl_root;
|
|
|
|
|
|
|
|
task_lock(curr);
|
|
|
|
get_fs_root(curr->fs, &cr_root);
|
|
|
|
task_unlock(curr);
|
|
|
|
|
|
|
|
task_lock(global);
|
|
|
|
get_fs_root(global->fs, &gl_root);
|
|
|
|
task_unlock(global);
|
|
|
|
|
|
|
|
int chrooted = !path_equal(&cr_root, &gl_root);
|
|
|
|
path_put(&gl_root);
|
|
|
|
path_put(&cr_root);
|
|
|
|
|
|
|
|
return (chrooted);
|
|
|
|
}
|
|
|
|
|
2011-11-11 11:15:53 +04:00
|
|
|
/*
|
|
|
|
* Attempt to unmount a snapshot by making a call to user space.
|
|
|
|
* There is no assurance that this can or will succeed, is just a
|
|
|
|
* best effort. In the case where it does fail, perhaps because
|
|
|
|
* it's in use, the unmount will fail harmlessly.
|
|
|
|
*/
|
2015-04-25 02:21:13 +03:00
|
|
|
int
|
2020-10-03 03:44:10 +03:00
|
|
|
zfsctl_snapshot_unmount(const char *snapname, int flags)
|
2011-11-11 11:15:53 +04:00
|
|
|
{
|
2016-10-06 21:03:41 +03:00
|
|
|
char *argv[] = { "/usr/bin/env", "umount", "-t", "zfs", "-n", NULL,
|
|
|
|
NULL };
|
2011-11-11 11:15:53 +04:00
|
|
|
char *envp[] = { NULL };
|
2015-04-25 02:21:13 +03:00
|
|
|
zfs_snapentry_t *se;
|
2011-11-11 11:15:53 +04:00
|
|
|
int error;
|
|
|
|
|
2015-12-11 02:53:37 +03:00
|
|
|
rw_enter(&zfs_snapshot_lock, RW_READER);
|
2015-04-25 02:21:13 +03:00
|
|
|
if ((se = zfsctl_snapshot_find_by_name(snapname)) == NULL) {
|
2015-12-11 02:53:37 +03:00
|
|
|
rw_exit(&zfs_snapshot_lock);
|
2017-08-03 07:16:12 +03:00
|
|
|
return (SET_ERROR(ENOENT));
|
2015-04-25 02:21:13 +03:00
|
|
|
}
|
2015-12-11 02:53:37 +03:00
|
|
|
rw_exit(&zfs_snapshot_lock);
|
2015-04-25 02:21:13 +03:00
|
|
|
|
2020-08-25 03:33:02 +03:00
|
|
|
exportfs_flush();
|
|
|
|
|
2016-10-06 21:03:41 +03:00
|
|
|
if (flags & MNT_FORCE)
|
|
|
|
argv[4] = "-fn";
|
|
|
|
argv[5] = se->se_path;
|
2015-04-25 02:21:13 +03:00
|
|
|
dprintf("unmount; path=%s\n", se->se_path);
|
2013-01-10 03:46:31 +04:00
|
|
|
error = call_usermodehelper(argv[0], argv, envp, UMH_WAIT_PROC);
|
2016-10-06 20:53:27 +03:00
|
|
|
zfsctl_snapshot_rele(se);
|
2011-11-11 11:15:53 +04:00
|
|
|
|
2015-04-25 02:21:13 +03:00
|
|
|
|
2011-11-11 11:15:53 +04:00
|
|
|
/*
|
|
|
|
* The umount system utility will return 256 on error. We must
|
|
|
|
* assume this error is because the file system is busy so it is
|
|
|
|
* converted to the more sensible EBUSY.
|
|
|
|
*/
|
|
|
|
if (error)
|
2013-03-08 22:41:28 +04:00
|
|
|
error = SET_ERROR(EBUSY);
|
2011-11-11 11:15:53 +04:00
|
|
|
|
|
|
|
return (error);
|
|
|
|
}
|
|
|
|
|
|
|
|
int
|
2015-04-25 02:21:13 +03:00
|
|
|
zfsctl_snapshot_mount(struct path *path, int flags)
|
2011-11-11 11:15:53 +04:00
|
|
|
{
|
|
|
|
struct dentry *dentry = path->dentry;
|
|
|
|
struct inode *ip = dentry->d_inode;
|
2017-03-08 03:21:37 +03:00
|
|
|
zfsvfs_t *zfsvfs;
|
|
|
|
zfsvfs_t *snap_zfsvfs;
|
2015-04-25 02:21:13 +03:00
|
|
|
zfs_snapentry_t *se;
|
2024-10-02 19:12:02 +03:00
|
|
|
char *full_name, *full_path, *options;
|
2024-08-23 20:39:09 +03:00
|
|
|
char *argv[] = { "/usr/bin/env", "mount", "-i", "-t", "zfs", "-n",
|
2024-10-02 19:12:02 +03:00
|
|
|
"-o", NULL, NULL, NULL, NULL };
|
2011-11-11 11:15:53 +04:00
|
|
|
char *envp[] = { NULL };
|
|
|
|
int error;
|
2015-11-17 03:39:52 +03:00
|
|
|
struct path spath;
|
2011-11-11 11:15:53 +04:00
|
|
|
|
2015-04-25 02:21:13 +03:00
|
|
|
if (ip == NULL)
|
2017-08-03 07:16:12 +03:00
|
|
|
return (SET_ERROR(EISDIR));
|
2015-04-25 02:21:13 +03:00
|
|
|
|
2017-03-08 03:21:37 +03:00
|
|
|
zfsvfs = ITOZSB(ip);
|
2022-09-16 23:36:47 +03:00
|
|
|
if ((error = zfs_enter(zfsvfs, FTAG)) != 0)
|
|
|
|
return (error);
|
2011-11-11 11:15:53 +04:00
|
|
|
|
2016-06-16 00:28:36 +03:00
|
|
|
full_name = kmem_zalloc(ZFS_MAX_DATASET_NAME_LEN, KM_SLEEP);
|
2015-04-25 02:21:13 +03:00
|
|
|
full_path = kmem_zalloc(MAXPATHLEN, KM_SLEEP);
|
2024-10-02 19:12:02 +03:00
|
|
|
options = kmem_zalloc(7, KM_SLEEP);
|
2011-11-11 11:15:53 +04:00
|
|
|
|
2017-03-08 03:21:37 +03:00
|
|
|
error = zfsctl_snapshot_name(zfsvfs, dname(dentry),
|
2016-06-16 00:28:36 +03:00
|
|
|
ZFS_MAX_DATASET_NAME_LEN, full_name);
|
2011-11-11 11:15:53 +04:00
|
|
|
if (error)
|
|
|
|
goto error;
|
|
|
|
|
Fix inconsistent mount options for ZFS root
While mounting ZFS root during boot on Linux distributions from initrd,
mount from busybox is effectively used which executes mount system call
directly. This skips the ZFS helper mount.zfs, which checks and enables
the mount options as specified in dataset properties. As a result,
datasets mounted during boot from initrd do not have correct mount
options as specified in ZFS dataset properties.
There has been an attempt to use mount.zfs in zfs initrd script,
responsible for mounting the ZFS root filesystem (PR#13305). This was
later reverted (PR#14908) after discovering that using mount.zfs breaks
mounting of snapshots on root (/) and other child datasets of root have
the same issue (Issue#9461).
This happens because switching from busybox mount to mount.zfs correctly
parses the mount options but also adds 'mntpoint=/root' to the mount
options, which is then prepended to the snapshot mountpoint in
'.zfs/snapshot'. '/root' is the directory on Debian with initramfs-tools
where root filesystem is mounted before pivot_root. When Linux runtime
is reached, trying to access the snapshots on root results in
automounting the snapshot on '/root/.zfs/*', which fails.
This commit attempts to fix the automounting of snapshots on root, while
using mount.zfs in initrd script. Since the mountpoint of dataset is
stored in vfs_mntpoint field, we can check if current mountpoint of
dataset and vfs_mntpoint are same or not. If they are not same, reset
the vfs_mntpoint field with current mountpoint. This fixes the
mountpoints of root dataset and children in respective vfs_mntpoint
fields when we try to access the snapshots of root dataset or its
children. With correct mountpoint for root dataset and children stored
in vfs_mntpoint, all snapshots of root dataset are mounted correctly
and become accessible.
This fix will come into play only if current process, that is trying to
access the snapshots is not in chroot context. The Linux kernel API
that is used to convert struct path into char format (d_path), returns
the complete path for given struct path. It works in chroot environment
as well and returns the correct path from original filesystem root.
However d_path fails to return the complete path if any directory from
original root filesystem is mounted using --bind flag or --rbind flag
in chroot environment. In this case, if we try to access the snapshot
from outside the chroot environment, d_path returns the path correctly,
i.e. it returns the correct path to the directory that is mounted with
--bind flag. However inside the chroot environment, it only returns the
path inside chroot.
For now, there is not a better way in my understanding that gives the
complete path in char format and handles the case where directories from
root filesystem are mounted with --bind or --rbind on another path which
user will later chroot into. So this fix gets enabled if current
process trying to access the snapshot is not in chroot context.
With the snapshots issue fixed for root filesystem, using mount.zfs in
ZFS initrd script, mounts the datasets with correct mount options.
Reviewed-by: Brian Behlendorf <behlendorf1@llnl.gov>
Reviewed-by: Alexander Motin <mav@FreeBSD.org>
Reviewed-by: Ameer Hamza <ahamza@ixsystems.com>
Signed-off-by: Umer Saleem <usaleem@ixsystems.com>
Closes #16646
2024-10-17 16:09:39 +03:00
|
|
|
if (is_current_chrooted() == 0) {
|
|
|
|
/*
|
|
|
|
* Current process is not in chroot context
|
|
|
|
*/
|
|
|
|
|
|
|
|
char *m = kmem_zalloc(MAXPATHLEN, KM_SLEEP);
|
|
|
|
struct path mnt_path;
|
|
|
|
mnt_path.mnt = path->mnt;
|
|
|
|
mnt_path.dentry = path->mnt->mnt_root;
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Get path to current mountpoint
|
|
|
|
*/
|
|
|
|
error = get_root_path(&mnt_path, m, MAXPATHLEN);
|
|
|
|
if (error != 0) {
|
|
|
|
kmem_free(m, MAXPATHLEN);
|
|
|
|
goto error;
|
|
|
|
}
|
|
|
|
mutex_enter(&zfsvfs->z_vfs->vfs_mntpt_lock);
|
|
|
|
if (zfsvfs->z_vfs->vfs_mntpoint != NULL) {
|
|
|
|
/*
|
|
|
|
* If current mnountpoint and vfs_mntpoint are not same,
|
|
|
|
* store current mountpoint in vfs_mntpoint.
|
|
|
|
*/
|
|
|
|
if (strcmp(zfsvfs->z_vfs->vfs_mntpoint, m) != 0) {
|
|
|
|
kmem_strfree(zfsvfs->z_vfs->vfs_mntpoint);
|
|
|
|
zfsvfs->z_vfs->vfs_mntpoint = kmem_strdup(m);
|
|
|
|
}
|
|
|
|
} else
|
|
|
|
zfsvfs->z_vfs->vfs_mntpoint = kmem_strdup(m);
|
|
|
|
mutex_exit(&zfsvfs->z_vfs->vfs_mntpt_lock);
|
|
|
|
kmem_free(m, MAXPATHLEN);
|
|
|
|
}
|
|
|
|
|
2019-07-02 18:25:23 +03:00
|
|
|
/*
|
|
|
|
* Construct a mount point path from sb of the ctldir inode and dirent
|
|
|
|
* name, instead of from d_path(), so that chroot'd process doesn't fail
|
|
|
|
* on mount.zfs(8).
|
|
|
|
*/
|
Fix inconsistent mount options for ZFS root
While mounting ZFS root during boot on Linux distributions from initrd,
mount from busybox is effectively used which executes mount system call
directly. This skips the ZFS helper mount.zfs, which checks and enables
the mount options as specified in dataset properties. As a result,
datasets mounted during boot from initrd do not have correct mount
options as specified in ZFS dataset properties.
There has been an attempt to use mount.zfs in zfs initrd script,
responsible for mounting the ZFS root filesystem (PR#13305). This was
later reverted (PR#14908) after discovering that using mount.zfs breaks
mounting of snapshots on root (/) and other child datasets of root have
the same issue (Issue#9461).
This happens because switching from busybox mount to mount.zfs correctly
parses the mount options but also adds 'mntpoint=/root' to the mount
options, which is then prepended to the snapshot mountpoint in
'.zfs/snapshot'. '/root' is the directory on Debian with initramfs-tools
where root filesystem is mounted before pivot_root. When Linux runtime
is reached, trying to access the snapshots on root results in
automounting the snapshot on '/root/.zfs/*', which fails.
This commit attempts to fix the automounting of snapshots on root, while
using mount.zfs in initrd script. Since the mountpoint of dataset is
stored in vfs_mntpoint field, we can check if current mountpoint of
dataset and vfs_mntpoint are same or not. If they are not same, reset
the vfs_mntpoint field with current mountpoint. This fixes the
mountpoints of root dataset and children in respective vfs_mntpoint
fields when we try to access the snapshots of root dataset or its
children. With correct mountpoint for root dataset and children stored
in vfs_mntpoint, all snapshots of root dataset are mounted correctly
and become accessible.
This fix will come into play only if current process, that is trying to
access the snapshots is not in chroot context. The Linux kernel API
that is used to convert struct path into char format (d_path), returns
the complete path for given struct path. It works in chroot environment
as well and returns the correct path from original filesystem root.
However d_path fails to return the complete path if any directory from
original root filesystem is mounted using --bind flag or --rbind flag
in chroot environment. In this case, if we try to access the snapshot
from outside the chroot environment, d_path returns the path correctly,
i.e. it returns the correct path to the directory that is mounted with
--bind flag. However inside the chroot environment, it only returns the
path inside chroot.
For now, there is not a better way in my understanding that gives the
complete path in char format and handles the case where directories from
root filesystem are mounted with --bind or --rbind on another path which
user will later chroot into. So this fix gets enabled if current
process trying to access the snapshot is not in chroot context.
With the snapshots issue fixed for root filesystem, using mount.zfs in
ZFS initrd script, mounts the datasets with correct mount options.
Reviewed-by: Brian Behlendorf <behlendorf1@llnl.gov>
Reviewed-by: Alexander Motin <mav@FreeBSD.org>
Reviewed-by: Ameer Hamza <ahamza@ixsystems.com>
Signed-off-by: Umer Saleem <usaleem@ixsystems.com>
Closes #16646
2024-10-17 16:09:39 +03:00
|
|
|
mutex_enter(&zfsvfs->z_vfs->vfs_mntpt_lock);
|
2019-07-02 18:25:23 +03:00
|
|
|
snprintf(full_path, MAXPATHLEN, "%s/.zfs/snapshot/%s",
|
2019-10-04 22:30:51 +03:00
|
|
|
zfsvfs->z_vfs->vfs_mntpoint ? zfsvfs->z_vfs->vfs_mntpoint : "",
|
|
|
|
dname(dentry));
|
Fix inconsistent mount options for ZFS root
While mounting ZFS root during boot on Linux distributions from initrd,
mount from busybox is effectively used which executes mount system call
directly. This skips the ZFS helper mount.zfs, which checks and enables
the mount options as specified in dataset properties. As a result,
datasets mounted during boot from initrd do not have correct mount
options as specified in ZFS dataset properties.
There has been an attempt to use mount.zfs in zfs initrd script,
responsible for mounting the ZFS root filesystem (PR#13305). This was
later reverted (PR#14908) after discovering that using mount.zfs breaks
mounting of snapshots on root (/) and other child datasets of root have
the same issue (Issue#9461).
This happens because switching from busybox mount to mount.zfs correctly
parses the mount options but also adds 'mntpoint=/root' to the mount
options, which is then prepended to the snapshot mountpoint in
'.zfs/snapshot'. '/root' is the directory on Debian with initramfs-tools
where root filesystem is mounted before pivot_root. When Linux runtime
is reached, trying to access the snapshots on root results in
automounting the snapshot on '/root/.zfs/*', which fails.
This commit attempts to fix the automounting of snapshots on root, while
using mount.zfs in initrd script. Since the mountpoint of dataset is
stored in vfs_mntpoint field, we can check if current mountpoint of
dataset and vfs_mntpoint are same or not. If they are not same, reset
the vfs_mntpoint field with current mountpoint. This fixes the
mountpoints of root dataset and children in respective vfs_mntpoint
fields when we try to access the snapshots of root dataset or its
children. With correct mountpoint for root dataset and children stored
in vfs_mntpoint, all snapshots of root dataset are mounted correctly
and become accessible.
This fix will come into play only if current process, that is trying to
access the snapshots is not in chroot context. The Linux kernel API
that is used to convert struct path into char format (d_path), returns
the complete path for given struct path. It works in chroot environment
as well and returns the correct path from original filesystem root.
However d_path fails to return the complete path if any directory from
original root filesystem is mounted using --bind flag or --rbind flag
in chroot environment. In this case, if we try to access the snapshot
from outside the chroot environment, d_path returns the path correctly,
i.e. it returns the correct path to the directory that is mounted with
--bind flag. However inside the chroot environment, it only returns the
path inside chroot.
For now, there is not a better way in my understanding that gives the
complete path in char format and handles the case where directories from
root filesystem are mounted with --bind or --rbind on another path which
user will later chroot into. So this fix gets enabled if current
process trying to access the snapshot is not in chroot context.
With the snapshots issue fixed for root filesystem, using mount.zfs in
ZFS initrd script, mounts the datasets with correct mount options.
Reviewed-by: Brian Behlendorf <behlendorf1@llnl.gov>
Reviewed-by: Alexander Motin <mav@FreeBSD.org>
Reviewed-by: Ameer Hamza <ahamza@ixsystems.com>
Signed-off-by: Umer Saleem <usaleem@ixsystems.com>
Closes #16646
2024-10-17 16:09:39 +03:00
|
|
|
mutex_exit(&zfsvfs->z_vfs->vfs_mntpt_lock);
|
2011-11-11 11:15:53 +04:00
|
|
|
|
2024-10-02 19:12:02 +03:00
|
|
|
snprintf(options, 7, "%s",
|
|
|
|
zfs_snapshot_no_setuid ? "nosuid" : "suid");
|
|
|
|
|
2015-04-25 02:21:13 +03:00
|
|
|
/*
|
|
|
|
* Multiple concurrent automounts of a snapshot are never allowed.
|
|
|
|
* The snapshot may be manually mounted as many times as desired.
|
|
|
|
*/
|
|
|
|
if (zfsctl_snapshot_ismounted(full_name)) {
|
2015-12-12 02:24:34 +03:00
|
|
|
error = 0;
|
2015-04-25 02:21:13 +03:00
|
|
|
goto error;
|
|
|
|
}
|
|
|
|
|
2011-11-11 11:15:53 +04:00
|
|
|
/*
|
|
|
|
* Attempt to mount the snapshot from user space. Normally this
|
|
|
|
* would be done using the vfs_kern_mount() function, however that
|
|
|
|
* function is marked GPL-only and cannot be used. On error we
|
|
|
|
* careful to log the real error to the console and return EISDIR
|
|
|
|
* to safely abort the automount. This should be very rare.
|
2013-11-07 09:55:18 +04:00
|
|
|
*
|
|
|
|
* If the user mode helper happens to return EBUSY, a concurrent
|
|
|
|
* mount is already in progress in which case the error is ignored.
|
|
|
|
* Take note that if the program was executed successfully the return
|
|
|
|
* value from call_usermodehelper() will be (exitcode << 8 + signal).
|
2011-11-11 11:15:53 +04:00
|
|
|
*/
|
2015-04-25 02:21:13 +03:00
|
|
|
dprintf("mount; name=%s path=%s\n", full_name, full_path);
|
2024-10-02 19:12:02 +03:00
|
|
|
argv[7] = options;
|
|
|
|
argv[8] = full_name;
|
|
|
|
argv[9] = full_path;
|
2013-01-10 03:46:31 +04:00
|
|
|
error = call_usermodehelper(argv[0], argv, envp, UMH_WAIT_PROC);
|
2015-11-17 03:39:52 +03:00
|
|
|
if (error) {
|
|
|
|
if (!(error & MOUNT_BUSY << 8)) {
|
2019-07-03 23:05:02 +03:00
|
|
|
zfs_dbgmsg("Unable to automount %s error=%d",
|
|
|
|
full_path, error);
|
2015-11-17 03:39:52 +03:00
|
|
|
error = SET_ERROR(EISDIR);
|
|
|
|
} else {
|
|
|
|
/*
|
|
|
|
* EBUSY, this could mean a concurrent mount, or the
|
|
|
|
* snapshot has already been mounted at completely
|
|
|
|
* different place. We return 0 so VFS will retry. For
|
|
|
|
* the latter case the VFS will retry several times
|
|
|
|
* and return ELOOP, which is probably not a very good
|
|
|
|
* behavior.
|
|
|
|
*/
|
|
|
|
error = 0;
|
|
|
|
}
|
2011-11-11 11:15:53 +04:00
|
|
|
goto error;
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
2015-04-25 02:21:13 +03:00
|
|
|
* Follow down in to the mounted snapshot and set MNT_SHRINKABLE
|
|
|
|
* to identify this as an automounted filesystem.
|
2011-11-11 11:15:53 +04:00
|
|
|
*/
|
2015-11-17 03:39:52 +03:00
|
|
|
spath = *path;
|
|
|
|
path_get(&spath);
|
2019-11-12 19:59:06 +03:00
|
|
|
if (follow_down_one(&spath)) {
|
2017-03-08 03:21:37 +03:00
|
|
|
snap_zfsvfs = ITOZSB(spath.dentry->d_inode);
|
|
|
|
snap_zfsvfs->z_parent = zfsvfs;
|
2015-11-17 03:39:52 +03:00
|
|
|
dentry = spath.dentry;
|
|
|
|
spath.mnt->mnt_flags |= MNT_SHRINKABLE;
|
2011-11-11 11:15:53 +04:00
|
|
|
|
2015-12-11 02:53:37 +03:00
|
|
|
rw_enter(&zfs_snapshot_lock, RW_WRITER);
|
2015-11-17 03:39:52 +03:00
|
|
|
se = zfsctl_snapshot_alloc(full_name, full_path,
|
2017-03-08 03:21:37 +03:00
|
|
|
snap_zfsvfs->z_os->os_spa, dmu_objset_id(snap_zfsvfs->z_os),
|
2015-12-08 02:43:53 +03:00
|
|
|
dentry);
|
2015-11-17 03:39:52 +03:00
|
|
|
zfsctl_snapshot_add(se);
|
|
|
|
zfsctl_snapshot_unmount_delay_impl(se, zfs_expire_snapshot);
|
2015-12-11 02:53:37 +03:00
|
|
|
rw_exit(&zfs_snapshot_lock);
|
2015-11-17 03:39:52 +03:00
|
|
|
}
|
|
|
|
path_put(&spath);
|
2011-11-11 11:15:53 +04:00
|
|
|
error:
|
2016-06-16 00:28:36 +03:00
|
|
|
kmem_free(full_name, ZFS_MAX_DATASET_NAME_LEN);
|
2015-04-25 02:21:13 +03:00
|
|
|
kmem_free(full_path, MAXPATHLEN);
|
2011-11-11 11:15:53 +04:00
|
|
|
|
2022-09-16 23:36:47 +03:00
|
|
|
zfs_exit(zfsvfs, FTAG);
|
2011-11-11 11:15:53 +04:00
|
|
|
|
|
|
|
return (error);
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
2017-03-08 20:26:33 +03:00
|
|
|
* Get the snapdir inode from fid
|
2011-11-11 11:15:53 +04:00
|
|
|
*/
|
|
|
|
int
|
2017-03-08 20:26:33 +03:00
|
|
|
zfsctl_snapdir_vget(struct super_block *sb, uint64_t objsetid, int gen,
|
|
|
|
struct inode **ipp)
|
2011-11-11 11:15:53 +04:00
|
|
|
{
|
|
|
|
int error;
|
2017-03-08 20:26:33 +03:00
|
|
|
struct path path;
|
|
|
|
char *mnt;
|
|
|
|
struct dentry *dentry;
|
2015-09-23 23:00:28 +03:00
|
|
|
|
2017-03-08 20:26:33 +03:00
|
|
|
mnt = kmem_alloc(MAXPATHLEN, KM_SLEEP);
|
2015-09-23 23:00:28 +03:00
|
|
|
|
2017-03-08 20:26:33 +03:00
|
|
|
error = zfsctl_snapshot_path_objset(sb->s_fs_info, objsetid,
|
|
|
|
MAXPATHLEN, mnt);
|
|
|
|
if (error)
|
|
|
|
goto out;
|
2015-09-23 23:00:28 +03:00
|
|
|
|
2017-03-08 20:26:33 +03:00
|
|
|
/* Trigger automount */
|
2018-09-05 08:26:56 +03:00
|
|
|
error = -kern_path(mnt, LOOKUP_FOLLOW|LOOKUP_DIRECTORY, &path);
|
2017-03-08 20:26:33 +03:00
|
|
|
if (error)
|
|
|
|
goto out;
|
2011-11-11 11:15:53 +04:00
|
|
|
|
2017-03-08 20:26:33 +03:00
|
|
|
path_put(&path);
|
2015-08-29 00:54:32 +03:00
|
|
|
/*
|
2017-03-08 20:26:33 +03:00
|
|
|
* Get the snapdir inode. Note, we don't want to use the above
|
|
|
|
* path because it contains the root of the snapshot rather
|
|
|
|
* than the snapdir.
|
2015-08-29 00:54:32 +03:00
|
|
|
*/
|
2017-03-08 20:26:33 +03:00
|
|
|
*ipp = ilookup(sb, ZFSCTL_INO_SNAPDIRS - objsetid);
|
|
|
|
if (*ipp == NULL) {
|
|
|
|
error = SET_ERROR(ENOENT);
|
|
|
|
goto out;
|
2015-08-29 00:54:32 +03:00
|
|
|
}
|
|
|
|
|
2017-03-08 20:26:33 +03:00
|
|
|
/* check gen, see zfsctl_snapdir_fid */
|
|
|
|
dentry = d_obtain_alias(igrab(*ipp));
|
|
|
|
if (gen != (!IS_ERR(dentry) && d_mountpoint(dentry))) {
|
|
|
|
iput(*ipp);
|
|
|
|
*ipp = NULL;
|
|
|
|
error = SET_ERROR(ENOENT);
|
|
|
|
}
|
|
|
|
if (!IS_ERR(dentry))
|
|
|
|
dput(dentry);
|
|
|
|
out:
|
|
|
|
kmem_free(mnt, MAXPATHLEN);
|
2011-11-11 11:15:53 +04:00
|
|
|
return (error);
|
|
|
|
}
|
|
|
|
|
|
|
|
int
|
|
|
|
zfsctl_shares_lookup(struct inode *dip, char *name, struct inode **ipp,
|
|
|
|
int flags, cred_t *cr, int *direntflags, pathname_t *realpnp)
|
|
|
|
{
|
2017-03-08 03:21:37 +03:00
|
|
|
zfsvfs_t *zfsvfs = ITOZSB(dip);
|
2019-12-11 22:53:57 +03:00
|
|
|
znode_t *zp;
|
2011-11-11 11:15:53 +04:00
|
|
|
znode_t *dzp;
|
|
|
|
int error;
|
|
|
|
|
2022-09-16 23:36:47 +03:00
|
|
|
if ((error = zfs_enter(zfsvfs, FTAG)) != 0)
|
|
|
|
return (error);
|
2011-11-11 11:15:53 +04:00
|
|
|
|
2017-03-08 03:21:37 +03:00
|
|
|
if (zfsvfs->z_shares_dir == 0) {
|
2022-09-16 23:36:47 +03:00
|
|
|
zfs_exit(zfsvfs, FTAG);
|
2013-03-08 22:41:28 +04:00
|
|
|
return (SET_ERROR(ENOTSUP));
|
2011-11-11 11:15:53 +04:00
|
|
|
}
|
|
|
|
|
2017-03-08 03:21:37 +03:00
|
|
|
if ((error = zfs_zget(zfsvfs, zfsvfs->z_shares_dir, &dzp)) == 0) {
|
2019-12-11 22:53:57 +03:00
|
|
|
error = zfs_lookup(dzp, name, &zp, 0, cr, NULL, NULL);
|
|
|
|
zrele(dzp);
|
2011-11-11 11:15:53 +04:00
|
|
|
}
|
|
|
|
|
2022-09-16 23:36:47 +03:00
|
|
|
zfs_exit(zfsvfs, FTAG);
|
2011-11-11 11:15:53 +04:00
|
|
|
|
|
|
|
return (error);
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Initialize the various pieces we'll need to create and manipulate .zfs
|
|
|
|
* directories. Currently this is unused but available.
|
|
|
|
*/
|
|
|
|
void
|
|
|
|
zfsctl_init(void)
|
|
|
|
{
|
2015-04-25 02:21:13 +03:00
|
|
|
avl_create(&zfs_snapshots_by_name, snapentry_compare_by_name,
|
|
|
|
sizeof (zfs_snapentry_t), offsetof(zfs_snapentry_t,
|
|
|
|
se_node_name));
|
|
|
|
avl_create(&zfs_snapshots_by_objsetid, snapentry_compare_by_objsetid,
|
|
|
|
sizeof (zfs_snapentry_t), offsetof(zfs_snapentry_t,
|
|
|
|
se_node_objsetid));
|
2015-12-11 02:53:37 +03:00
|
|
|
rw_init(&zfs_snapshot_lock, NULL, RW_DEFAULT, NULL);
|
2011-11-11 11:15:53 +04:00
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Cleanup the various pieces we needed for .zfs directories. In particular
|
|
|
|
* ensure the expiry timer is canceled safely.
|
|
|
|
*/
|
|
|
|
void
|
|
|
|
zfsctl_fini(void)
|
|
|
|
{
|
2015-04-25 02:21:13 +03:00
|
|
|
avl_destroy(&zfs_snapshots_by_name);
|
|
|
|
avl_destroy(&zfs_snapshots_by_objsetid);
|
2015-12-11 02:53:37 +03:00
|
|
|
rw_destroy(&zfs_snapshot_lock);
|
2011-11-11 11:15:53 +04:00
|
|
|
}
|
|
|
|
|
2015-08-29 00:54:32 +03:00
|
|
|
module_param(zfs_admin_snapshot, int, 0644);
|
|
|
|
MODULE_PARM_DESC(zfs_admin_snapshot, "Enable mkdir/rmdir/mv in .zfs/snapshot");
|
|
|
|
|
2011-11-11 11:15:53 +04:00
|
|
|
module_param(zfs_expire_snapshot, int, 0644);
|
|
|
|
MODULE_PARM_DESC(zfs_expire_snapshot, "Seconds to expire .zfs/snapshot");
|
2024-10-02 19:12:02 +03:00
|
|
|
|
|
|
|
module_param(zfs_snapshot_no_setuid, int, 0644);
|
|
|
|
MODULE_PARM_DESC(zfs_snapshot_no_setuid,
|
|
|
|
"Disable setuid/setgid for automounts in .zfs/snapshot");
|