1eda14cbcSMatt Macy /* 2eda14cbcSMatt Macy * CDDL HEADER START 3eda14cbcSMatt Macy * 4eda14cbcSMatt Macy * The contents of this file are subject to the terms of the 5eda14cbcSMatt Macy * Common Development and Distribution License (the "License"). 6eda14cbcSMatt Macy * You may not use this file except in compliance with the License. 7eda14cbcSMatt Macy * 8eda14cbcSMatt Macy * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE 9271171e0SMartin Matuska * or https://opensource.org/licenses/CDDL-1.0. 10eda14cbcSMatt Macy * See the License for the specific language governing permissions 11eda14cbcSMatt Macy * and limitations under the License. 12eda14cbcSMatt Macy * 13eda14cbcSMatt Macy * When distributing Covered Code, include this CDDL HEADER in each 14eda14cbcSMatt Macy * file and include the License file at usr/src/OPENSOLARIS.LICENSE. 15eda14cbcSMatt Macy * If applicable, add the following below this CDDL HEADER, with the 16eda14cbcSMatt Macy * fields enclosed by brackets "[]" replaced with your own identifying 17eda14cbcSMatt Macy * information: Portions Copyright [yyyy] [name of copyright owner] 18eda14cbcSMatt Macy * 19eda14cbcSMatt Macy * CDDL HEADER END 20eda14cbcSMatt Macy */ 21eda14cbcSMatt Macy /* 22eda14cbcSMatt Macy * Copyright (c) 2010, Oracle and/or its affiliates. All rights reserved. 23eda14cbcSMatt Macy * Copyright (c) 2012, 2017 by Delphix. All rights reserved. 24eda14cbcSMatt Macy * Copyright (c) 2017, 2019, Datto Inc. All rights reserved. 25eda14cbcSMatt Macy */ 26eda14cbcSMatt Macy 27eda14cbcSMatt Macy #ifndef _SYS_DSL_SCAN_H 28eda14cbcSMatt Macy #define _SYS_DSL_SCAN_H 29eda14cbcSMatt Macy 30eda14cbcSMatt Macy #include <sys/zfs_context.h> 31eda14cbcSMatt Macy #include <sys/zio.h> 32c0a83fe0SMartin Matuska #include <sys/zap.h> 33eda14cbcSMatt Macy #include <sys/ddt.h> 34eda14cbcSMatt Macy #include <sys/bplist.h> 35eda14cbcSMatt Macy 36eda14cbcSMatt Macy #ifdef __cplusplus 37eda14cbcSMatt Macy extern "C" { 38eda14cbcSMatt Macy #endif 39eda14cbcSMatt Macy 40eda14cbcSMatt Macy struct objset; 41eda14cbcSMatt Macy struct dsl_dir; 42eda14cbcSMatt Macy struct dsl_dataset; 43eda14cbcSMatt Macy struct dsl_pool; 44eda14cbcSMatt Macy struct dmu_tx; 45eda14cbcSMatt Macy 46eda14cbcSMatt Macy extern int zfs_scan_suspend_progress; 47eda14cbcSMatt Macy 48eda14cbcSMatt Macy /* 49eda14cbcSMatt Macy * All members of this structure must be uint64_t, for byteswap 50eda14cbcSMatt Macy * purposes. 51eda14cbcSMatt Macy */ 52eda14cbcSMatt Macy typedef struct dsl_scan_phys { 53eda14cbcSMatt Macy uint64_t scn_func; /* pool_scan_func_t */ 54eda14cbcSMatt Macy uint64_t scn_state; /* dsl_scan_state_t */ 55eda14cbcSMatt Macy uint64_t scn_queue_obj; 56eda14cbcSMatt Macy uint64_t scn_min_txg; 57eda14cbcSMatt Macy uint64_t scn_max_txg; 58eda14cbcSMatt Macy uint64_t scn_cur_min_txg; 59eda14cbcSMatt Macy uint64_t scn_cur_max_txg; 60eda14cbcSMatt Macy uint64_t scn_start_time; 61eda14cbcSMatt Macy uint64_t scn_end_time; 62eda14cbcSMatt Macy uint64_t scn_to_examine; /* total bytes to be scanned */ 63eda14cbcSMatt Macy uint64_t scn_examined; /* bytes scanned so far */ 640a97523dSMartin Matuska uint64_t scn_skipped; /* bytes skipped by scanner */ 65eda14cbcSMatt Macy uint64_t scn_processed; 66eda14cbcSMatt Macy uint64_t scn_errors; /* scan I/O error count */ 67eda14cbcSMatt Macy uint64_t scn_ddt_class_max; 68eda14cbcSMatt Macy ddt_bookmark_t scn_ddt_bookmark; 69eda14cbcSMatt Macy zbookmark_phys_t scn_bookmark; 70eda14cbcSMatt Macy uint64_t scn_flags; /* dsl_scan_flags_t */ 71eda14cbcSMatt Macy } dsl_scan_phys_t; 72eda14cbcSMatt Macy 73eda14cbcSMatt Macy #define SCAN_PHYS_NUMINTS (sizeof (dsl_scan_phys_t) / sizeof (uint64_t)) 74eda14cbcSMatt Macy 75eda14cbcSMatt Macy typedef enum dsl_scan_flags { 76eda14cbcSMatt Macy DSF_VISIT_DS_AGAIN = 1<<0, 77eda14cbcSMatt Macy DSF_SCRUB_PAUSED = 1<<1, 78eda14cbcSMatt Macy } dsl_scan_flags_t; 79eda14cbcSMatt Macy 80eda14cbcSMatt Macy #define DSL_SCAN_FLAGS_MASK (DSF_VISIT_DS_AGAIN) 81eda14cbcSMatt Macy 82c0a83fe0SMartin Matuska typedef struct dsl_errorscrub_phys { 83c0a83fe0SMartin Matuska uint64_t dep_func; /* pool_scan_func_t */ 84c0a83fe0SMartin Matuska uint64_t dep_state; /* dsl_scan_state_t */ 85c0a83fe0SMartin Matuska uint64_t dep_cursor; /* serialized zap cursor for tracing progress */ 86c0a83fe0SMartin Matuska uint64_t dep_start_time; /* error scrub start time, unix timestamp */ 87c0a83fe0SMartin Matuska uint64_t dep_end_time; /* error scrub end time, unix timestamp */ 88c0a83fe0SMartin Matuska uint64_t dep_to_examine; /* total error blocks to be scrubbed */ 89c0a83fe0SMartin Matuska uint64_t dep_examined; /* blocks scrubbed so far */ 90c0a83fe0SMartin Matuska uint64_t dep_errors; /* error scrub I/O error count */ 91c0a83fe0SMartin Matuska uint64_t dep_paused_flags; /* flag for paused */ 92c0a83fe0SMartin Matuska } dsl_errorscrub_phys_t; 93c0a83fe0SMartin Matuska 94c0a83fe0SMartin Matuska #define ERRORSCRUB_PHYS_NUMINTS (sizeof (dsl_errorscrub_phys_t) \ 95c0a83fe0SMartin Matuska / sizeof (uint64_t)) 96c0a83fe0SMartin Matuska 97eda14cbcSMatt Macy /* 98eda14cbcSMatt Macy * Every pool will have one dsl_scan_t and this structure will contain 99eda14cbcSMatt Macy * in-memory information about the scan and a pointer to the on-disk 100eda14cbcSMatt Macy * representation (i.e. dsl_scan_phys_t). Most of the state of the scan 101eda14cbcSMatt Macy * is contained on-disk to allow the scan to resume in the event of a reboot 102eda14cbcSMatt Macy * or panic. This structure maintains information about the behavior of a 103eda14cbcSMatt Macy * running scan, some caching information, and how it should traverse the pool. 104eda14cbcSMatt Macy * 105eda14cbcSMatt Macy * The following members of this structure direct the behavior of the scan: 106eda14cbcSMatt Macy * 107eda14cbcSMatt Macy * scn_suspending - a scan that cannot be completed in a single txg or 108eda14cbcSMatt Macy * has exceeded its allotted time will need to suspend. 109eda14cbcSMatt Macy * When this flag is set the scanner will stop traversing 110eda14cbcSMatt Macy * the pool and write out the current state to disk. 111eda14cbcSMatt Macy * 112eda14cbcSMatt Macy * scn_restart_txg - directs the scanner to either restart or start a 113eda14cbcSMatt Macy * a scan at the specified txg value. 114eda14cbcSMatt Macy * 115eda14cbcSMatt Macy * scn_done_txg - when a scan completes its traversal it will set 116eda14cbcSMatt Macy * the completion txg to the next txg. This is necessary 117eda14cbcSMatt Macy * to ensure that any blocks that were freed during 118eda14cbcSMatt Macy * the scan but have not yet been processed (i.e deferred 119eda14cbcSMatt Macy * frees) are accounted for. 120eda14cbcSMatt Macy * 121eda14cbcSMatt Macy * This structure also maintains information about deferred frees which are 122eda14cbcSMatt Macy * a special kind of traversal. Deferred free can exist in either a bptree or 123eda14cbcSMatt Macy * a bpobj structure. The scn_is_bptree flag will indicate the type of 124eda14cbcSMatt Macy * deferred free that is in progress. If the deferred free is part of an 125eda14cbcSMatt Macy * asynchronous destroy then the scn_async_destroying flag will be set. 126eda14cbcSMatt Macy */ 127eda14cbcSMatt Macy typedef struct dsl_scan { 128eda14cbcSMatt Macy struct dsl_pool *scn_dp; 129eda14cbcSMatt Macy uint64_t scn_restart_txg; 130eda14cbcSMatt Macy uint64_t scn_done_txg; 131eda14cbcSMatt Macy uint64_t scn_sync_start_time; 132eda14cbcSMatt Macy uint64_t scn_issued_before_pass; 133eda14cbcSMatt Macy 134eda14cbcSMatt Macy /* for freeing blocks */ 135eda14cbcSMatt Macy boolean_t scn_is_bptree; 136eda14cbcSMatt Macy boolean_t scn_async_destroying; 137eda14cbcSMatt Macy boolean_t scn_async_stalled; 138eda14cbcSMatt Macy uint64_t scn_async_block_min_time_ms; 139eda14cbcSMatt Macy 140eda14cbcSMatt Macy /* flags and stats for controlling scan state */ 141eda14cbcSMatt Macy boolean_t scn_is_sorted; /* doing sequential scan */ 142eda14cbcSMatt Macy boolean_t scn_clearing; /* scan is issuing sequential extents */ 143eda14cbcSMatt Macy boolean_t scn_checkpointing; /* scan is issuing all queued extents */ 144eda14cbcSMatt Macy boolean_t scn_suspending; /* scan is suspending until next txg */ 145eda14cbcSMatt Macy uint64_t scn_last_checkpoint; /* time of last checkpoint */ 146eda14cbcSMatt Macy 147eda14cbcSMatt Macy /* members for thread synchronization */ 148eda14cbcSMatt Macy zio_t *scn_zio_root; /* root zio for waiting on IO */ 149eda14cbcSMatt Macy taskq_t *scn_taskq; /* task queue for issuing extents */ 150eda14cbcSMatt Macy 151eda14cbcSMatt Macy /* for controlling scan prefetch, protected by spa_scrub_lock */ 152eda14cbcSMatt Macy boolean_t scn_prefetch_stop; /* prefetch should stop */ 153eda14cbcSMatt Macy zbookmark_phys_t scn_prefetch_bookmark; /* prefetch start bookmark */ 154eda14cbcSMatt Macy avl_tree_t scn_prefetch_queue; /* priority queue of prefetch IOs */ 155eda14cbcSMatt Macy uint64_t scn_maxinflight_bytes; /* max bytes in flight for pool */ 156eda14cbcSMatt Macy 157eda14cbcSMatt Macy /* per txg statistics */ 158eda14cbcSMatt Macy uint64_t scn_visited_this_txg; /* total bps visited this txg */ 159eda14cbcSMatt Macy uint64_t scn_dedup_frees_this_txg; /* dedup bps freed this txg */ 160eda14cbcSMatt Macy uint64_t scn_holes_this_txg; 161eda14cbcSMatt Macy uint64_t scn_lt_min_this_txg; 162eda14cbcSMatt Macy uint64_t scn_gt_max_this_txg; 163eda14cbcSMatt Macy uint64_t scn_ddt_contained_this_txg; 164eda14cbcSMatt Macy uint64_t scn_objsets_visited_this_txg; 165eda14cbcSMatt Macy uint64_t scn_avg_seg_size_this_txg; 166eda14cbcSMatt Macy uint64_t scn_segs_this_txg; 167eda14cbcSMatt Macy uint64_t scn_avg_zio_size_this_txg; 168eda14cbcSMatt Macy uint64_t scn_zios_this_txg; 169eda14cbcSMatt Macy 170c0a83fe0SMartin Matuska /* zap cursor for tracing error scrub progress */ 171c0a83fe0SMartin Matuska zap_cursor_t errorscrub_cursor; 172eda14cbcSMatt Macy /* members needed for syncing scan status to disk */ 173eda14cbcSMatt Macy dsl_scan_phys_t scn_phys; /* on disk representation of scan */ 174eda14cbcSMatt Macy dsl_scan_phys_t scn_phys_cached; 175eda14cbcSMatt Macy avl_tree_t scn_queue; /* queue of datasets to scan */ 17649086aa3SAlexander Motin kmutex_t scn_queue_lock; /* serializes scn_queue inserts */ 177a0b956f5SMartin Matuska uint64_t scn_queues_pending; /* outstanding data to issue */ 178c0a83fe0SMartin Matuska /* members needed for syncing error scrub status to disk */ 179c0a83fe0SMartin Matuska dsl_errorscrub_phys_t errorscrub_phys; 180eda14cbcSMatt Macy } dsl_scan_t; 181eda14cbcSMatt Macy 182eda14cbcSMatt Macy typedef struct dsl_scan_io_queue dsl_scan_io_queue_t; 183eda14cbcSMatt Macy 184eda14cbcSMatt Macy void scan_init(void); 185eda14cbcSMatt Macy void scan_fini(void); 186eda14cbcSMatt Macy int dsl_scan_init(struct dsl_pool *dp, uint64_t txg); 18716038816SMartin Matuska int dsl_scan_setup_check(void *, dmu_tx_t *); 1887877fdebSMatt Macy void dsl_scan_setup_sync(void *, dmu_tx_t *); 189eda14cbcSMatt Macy void dsl_scan_fini(struct dsl_pool *dp); 190eda14cbcSMatt Macy void dsl_scan_sync(struct dsl_pool *, dmu_tx_t *); 191eda14cbcSMatt Macy int dsl_scan_cancel(struct dsl_pool *); 192eda14cbcSMatt Macy int dsl_scan(struct dsl_pool *, pool_scan_func_t); 193eda14cbcSMatt Macy void dsl_scan_assess_vdev(struct dsl_pool *dp, vdev_t *vd); 194eda14cbcSMatt Macy boolean_t dsl_scan_scrubbing(const struct dsl_pool *dp); 195c0a83fe0SMartin Matuska boolean_t dsl_errorscrubbing(const struct dsl_pool *dp); 196c0a83fe0SMartin Matuska boolean_t dsl_errorscrub_active(dsl_scan_t *scn); 197eda14cbcSMatt Macy void dsl_scan_restart_resilver(struct dsl_pool *, uint64_t txg); 198c0a83fe0SMartin Matuska int dsl_scrub_set_pause_resume(const struct dsl_pool *dp, 199c0a83fe0SMartin Matuska pool_scrub_cmd_t cmd); 200c0a83fe0SMartin Matuska void dsl_errorscrub_sync(struct dsl_pool *, dmu_tx_t *); 201eda14cbcSMatt Macy boolean_t dsl_scan_resilvering(struct dsl_pool *dp); 202eda14cbcSMatt Macy boolean_t dsl_scan_resilver_scheduled(struct dsl_pool *dp); 203eda14cbcSMatt Macy boolean_t dsl_dataset_unstable(struct dsl_dataset *ds); 204eda14cbcSMatt Macy void dsl_scan_ddt_entry(dsl_scan_t *scn, enum zio_checksum checksum, 205*e2df9bb4SMartin Matuska ddt_t *ddt, ddt_lightweight_entry_t *ddlwe, dmu_tx_t *tx); 206eda14cbcSMatt Macy void dsl_scan_ds_destroyed(struct dsl_dataset *ds, struct dmu_tx *tx); 207eda14cbcSMatt Macy void dsl_scan_ds_snapshotted(struct dsl_dataset *ds, struct dmu_tx *tx); 208eda14cbcSMatt Macy void dsl_scan_ds_clone_swapped(struct dsl_dataset *ds1, struct dsl_dataset *ds2, 209eda14cbcSMatt Macy struct dmu_tx *tx); 210eda14cbcSMatt Macy boolean_t dsl_scan_active(dsl_scan_t *scn); 211eda14cbcSMatt Macy boolean_t dsl_scan_is_paused_scrub(const dsl_scan_t *scn); 212c0a83fe0SMartin Matuska boolean_t dsl_errorscrub_is_paused(const dsl_scan_t *scn); 213eda14cbcSMatt Macy void dsl_scan_freed(spa_t *spa, const blkptr_t *bp); 214eda14cbcSMatt Macy void dsl_scan_io_queue_destroy(dsl_scan_io_queue_t *queue); 215eda14cbcSMatt Macy void dsl_scan_io_queue_vdev_xfer(vdev_t *svd, vdev_t *tvd); 216eda14cbcSMatt Macy 217eda14cbcSMatt Macy #ifdef __cplusplus 218eda14cbcSMatt Macy } 219eda14cbcSMatt Macy #endif 220eda14cbcSMatt Macy 221eda14cbcSMatt Macy #endif /* _SYS_DSL_SCAN_H */ 222