mirror of
https://git.proxmox.com/git/mirror_zfs.git
synced 2025-01-10 10:10:26 +03:00
1b939560be
UNMAP/TRIM support is a frequently-requested feature to help prevent performance from degrading on SSDs and on various other SAN-like storage back-ends. By issuing UNMAP/TRIM commands for sectors which are no longer allocated the underlying device can often more efficiently manage itself. This TRIM implementation is modeled on the `zpool initialize` feature which writes a pattern to all unallocated space in the pool. The new `zpool trim` command uses the same vdev_xlate() code to calculate what sectors are unallocated, the same per-vdev TRIM thread model and locking, and the same basic CLI for a consistent user experience. The core difference is that instead of writing a pattern it will issue UNMAP/TRIM commands for those extents. The zio pipeline was updated to accommodate this by adding a new ZIO_TYPE_TRIM type and associated spa taskq. This new type makes it straightforward to add the platform-specific TRIM/UNMAP calls to vdev_disk.c and vdev_file.c. These new ZIO_TYPE_TRIM zios are handled largely the same way as ZIO_TYPE_READs or ZIO_TYPE_WRITEs. This makes it possible to largely avoid changing the pipeline; one exception is that TRIM zios may exceed the 16M block size limit since they contain no data. In addition to the manual `zpool trim` command, a background automatic TRIM was added and is controlled by the 'autotrim' property. It relies on the exact same infrastructure as the manual TRIM. However, instead of relying on the extents in a metaslab's ms_allocatable range tree, a ms_trim tree is kept per metaslab. When 'autotrim=on', ranges added back to the ms_allocatable tree are also added to the ms_trim tree. The ms_trim tree is then periodically consumed by an autotrim thread which systematically walks a top-level vdev's metaslabs. Since the automatic TRIM will skip ranges it considers too small, there is value in occasionally running a full `zpool trim`. Such skipping may occur when the freed blocks are small and not enough time was allowed to aggregate them.
An automatic TRIM and a manual `zpool trim` may be run concurrently, in which case the automatic TRIM will yield to the manual TRIM. Reviewed-by: Jorgen Lundman <lundman@lundman.net> Reviewed-by: Tim Chase <tim@chase2k.com> Reviewed-by: Matt Ahrens <mahrens@delphix.com> Reviewed-by: George Wilson <george.wilson@delphix.com> Reviewed-by: Serapheim Dimitropoulos <serapheim@delphix.com> Contributions-by: Saso Kiselkov <saso.kiselkov@nexenta.com> Contributions-by: Tim Chase <tim@chase2k.com> Contributions-by: Chunwei Chen <tuxoko@gmail.com> Signed-off-by: Brian Behlendorf <behlendorf1@llnl.gov> Closes #8419 Closes #598
137 lines
4.7 KiB
C
137 lines
4.7 KiB
C
/*
|
|
* CDDL HEADER START
|
|
*
|
|
* The contents of this file are subject to the terms of the
|
|
* Common Development and Distribution License (the "License").
|
|
* You may not use this file except in compliance with the License.
|
|
*
|
|
* You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
|
|
* or http://www.opensolaris.org/os/licensing.
|
|
* See the License for the specific language governing permissions
|
|
* and limitations under the License.
|
|
*
|
|
* When distributing Covered Code, include this CDDL HEADER in each
|
|
* file and include the License file at usr/src/OPENSOLARIS.LICENSE.
|
|
* If applicable, add the following below this CDDL HEADER, with the
|
|
* fields enclosed by brackets "[]" replaced with your own identifying
|
|
* information: Portions Copyright [yyyy] [name of copyright owner]
|
|
*
|
|
* CDDL HEADER END
|
|
*/
|
|
/*
|
|
* Copyright (c) 2005, 2010, Oracle and/or its affiliates. All rights reserved.
|
|
* Copyright 2015 Nexenta Systems, Inc. All rights reserved.
|
|
* Copyright 2017 Joyent, Inc.
|
|
*/
|
|
|
|
#ifndef _SYS_SYSEVENT_EVENTDEFS_H
|
|
#define _SYS_SYSEVENT_EVENTDEFS_H
|
|
|
|
#ifdef __cplusplus
|
|
extern "C" {
|
|
#endif
|
|
|
|
/*
|
|
* eventdefs.h contains public definitions for sysevent types (classes
|
|
* and subclasses). All additions/removal/changes are subject
|
|
* to PSARC approval.
|
|
*/
|
|
|
|
/* Sysevent Class definitions */
|
|
#define EC_NONE "EC_none"
|
|
#define EC_PRIV "EC_priv"
|
|
#define EC_PLATFORM "EC_platform" /* events private to platform */
|
|
#define EC_DR "EC_dr" /* Dynamic reconfiguration event class */
|
|
#define EC_ENV "EC_env" /* Environmental monitor event class */
|
|
#define EC_DOMAIN "EC_domain" /* Domain event class */
|
|
#define EC_AP_DRIVER "EC_ap_driver" /* Alternate Pathing event class */
|
|
#define EC_IPMP "EC_ipmp" /* IP Multipathing event class */
|
|
#define EC_DEV_ADD "EC_dev_add" /* device add event class */
|
|
#define EC_DEV_REMOVE "EC_dev_remove" /* device remove event class */
|
|
#define EC_DEV_BRANCH "EC_dev_branch" /* device tree branch event class */
|
|
#define EC_DEV_STATUS "EC_dev_status" /* device status event class */
|
|
#define EC_FM "EC_fm" /* FMA error report event */
|
|
#define EC_ZFS "EC_zfs" /* ZFS event */
|
|
#define EC_DATALINK "EC_datalink" /* datalink event */
|
|
#define EC_VRRP "EC_vrrp" /* VRRP event */
|
|
|
|
/*
|
|
* EC_DEV_ADD and EC_DEV_REMOVE subclass definitions - supporting attributes
|
|
* (name/value pairs) are found in sys/sysevent/dev.h
|
|
*/
|
|
#define ESC_DISK "disk" /* disk device */
|
|
#define ESC_NETWORK "network" /* network interface */
|
|
#define ESC_PRINTER "printer" /* printer device */
|
|
#define ESC_LOFI "lofi" /* lofi device */
|
|
|
|
/*
|
|
* EC_DEV_BRANCH subclass definitions - supporting attributes (name/value pairs)
|
|
* are found in sys/sysevent/dev.h
|
|
*/
|
|
|
|
/* device tree branch added */
|
|
#define ESC_DEV_BRANCH_ADD "dev_branch_add"
|
|
|
|
/* device tree branch removed */
|
|
#define ESC_DEV_BRANCH_REMOVE "dev_branch_remove"
|
|
|
|
/*
|
|
* EC_DEV_STATUS subclass definitions
|
|
*
|
|
* device capacity dynamically changed
|
|
*/
|
|
#define ESC_DEV_DLE "dev_dle"
|
|
|
|
/* LUN has received an eject request from the user */
|
|
#define ESC_DEV_EJECT_REQUEST "dev_eject_request"
|
|
|
|
/* FMA Fault and Error event protocol subclass */
|
|
#define ESC_FM_ERROR "error"
|
|
#define ESC_FM_ERROR_REPLAY "error_replay"
|
|
|
|
/*
|
|
* ZFS subclass definitions. Supporting attributes (name/value pairs) are found
|
|
* in sys/fs/zfs.h
|
|
*/
|
|
/*
 * Each ESC_ZFS_* macro below expands to a string literal naming one ZFS
 * event subclass. The strings are the runtime identifiers, so the macro
 * names may be reorganized but the quoted values must not change.
 */
/* Resilver subclasses. */
#define ESC_ZFS_RESILVER_START "resilver_start"
|
|
#define ESC_ZFS_RESILVER_FINISH "resilver_finish"
|
|
/* Vdev removal subclasses (plain, "_aux" and "_dev" variants). */
#define ESC_ZFS_VDEV_REMOVE "vdev_remove"
|
|
#define ESC_ZFS_VDEV_REMOVE_AUX "vdev_remove_aux"
|
|
#define ESC_ZFS_VDEV_REMOVE_DEV "vdev_remove_dev"
|
|
/* Pool create/destroy/import/export subclasses. */
#define ESC_ZFS_POOL_CREATE "pool_create"
|
|
#define ESC_ZFS_POOL_DESTROY "pool_destroy"
|
|
#define ESC_ZFS_POOL_IMPORT "pool_import"
|
|
#define ESC_ZFS_POOL_EXPORT "pool_export"
|
|
/* Vdev add/attach/clear/check/online subclasses. */
#define ESC_ZFS_VDEV_ADD "vdev_add"
|
|
#define ESC_ZFS_VDEV_ATTACH "vdev_attach"
|
|
#define ESC_ZFS_VDEV_CLEAR "vdev_clear"
|
|
#define ESC_ZFS_VDEV_CHECK "vdev_check"
|
|
#define ESC_ZFS_VDEV_ONLINE "vdev_online"
|
|
#define ESC_ZFS_CONFIG_SYNC "config_sync"
|
|
/* Scrub subclasses (start, finish, abort, resume, paused). */
#define ESC_ZFS_SCRUB_START "scrub_start"
|
|
#define ESC_ZFS_SCRUB_FINISH "scrub_finish"
|
|
#define ESC_ZFS_SCRUB_ABORT "scrub_abort"
|
|
#define ESC_ZFS_SCRUB_RESUME "scrub_resume"
|
|
#define ESC_ZFS_SCRUB_PAUSED "scrub_paused"
|
|
/* Miscellaneous vdev and pool subclasses. */
#define ESC_ZFS_VDEV_SPARE "vdev_spare"
|
|
#define ESC_ZFS_VDEV_AUTOEXPAND "vdev_autoexpand"
|
|
#define ESC_ZFS_BOOTFS_VDEV_ATTACH "bootfs_vdev_attach"
|
|
#define ESC_ZFS_POOL_REGUID "pool_reguid"
|
|
#define ESC_ZFS_HISTORY_EVENT "history_event"
|
|
/*
 * TRIM subclasses (start, finish, cancel, resume, suspend).
 * NOTE(review): presumably posted on TRIM state changes of a vdev; this
 * header does not show the callers -- confirm where they are raised.
 */
#define ESC_ZFS_TRIM_START "trim_start"
|
|
#define ESC_ZFS_TRIM_FINISH "trim_finish"
|
|
#define ESC_ZFS_TRIM_CANCEL "trim_cancel"
|
|
#define ESC_ZFS_TRIM_RESUME "trim_resume"
|
|
#define ESC_ZFS_TRIM_SUSPEND "trim_suspend"
|
|
|
|
/*
|
|
* datalink subclass definitions.
|
|
*/
|
|
#define ESC_DATALINK_PHYS_ADD "datalink_phys_add" /* new physical link */
|
|
|
|
#ifdef __cplusplus
|
|
}
|
|
#endif
|
|
|
|
#endif /* _SYS_SYSEVENT_EVENTDEFS_H */
|