/* xref: /freebsd/sys/contrib/openzfs/include/sys/dsl_scan.h (revision 0a97523d467443fa54171ef7a399b1c9043eac75) */
/*
 * CDDL HEADER START
 *
 * The contents of this file are subject to the terms of the
 * Common Development and Distribution License (the "License").
 * You may not use this file except in compliance with the License.
 *
 * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
 * or https://opensource.org/licenses/CDDL-1.0.
 * See the License for the specific language governing permissions
 * and limitations under the License.
 *
 * When distributing Covered Code, include this CDDL HEADER in each
 * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
 * If applicable, add the following below this CDDL HEADER, with the
 * fields enclosed by brackets "[]" replaced with your own identifying
 * information: Portions Copyright [yyyy] [name of copyright owner]
 *
 * CDDL HEADER END
 */
/*
 * Copyright (c) 2010, Oracle and/or its affiliates. All rights reserved.
 * Copyright (c) 2012, 2017 by Delphix. All rights reserved.
 * Copyright (c) 2017, 2019, Datto Inc. All rights reserved.
 */

#ifndef	_SYS_DSL_SCAN_H
#define	_SYS_DSL_SCAN_H

#include <sys/zfs_context.h>
#include <sys/zio.h>
#include <sys/zap.h>
#include <sys/ddt.h>
#include <sys/bplist.h>

#ifdef	__cplusplus
extern "C" {
#endif

/*
 * Opaque forward declarations. Where these structures are used in this
 * header they appear only behind pointers, so their layout is not needed.
 */
struct objset;
struct dsl_dir;
struct dsl_dataset;
struct dsl_pool;
struct dmu_tx;

/* Declared here only; the definition lives outside this header. */
extern int zfs_scan_suspend_progress;

48eda14cbcSMatt Macy /*
49eda14cbcSMatt Macy  * All members of this structure must be uint64_t, for byteswap
50eda14cbcSMatt Macy  * purposes.
51eda14cbcSMatt Macy  */
52eda14cbcSMatt Macy typedef struct dsl_scan_phys {
53eda14cbcSMatt Macy 	uint64_t scn_func; /* pool_scan_func_t */
54eda14cbcSMatt Macy 	uint64_t scn_state; /* dsl_scan_state_t */
55eda14cbcSMatt Macy 	uint64_t scn_queue_obj;
56eda14cbcSMatt Macy 	uint64_t scn_min_txg;
57eda14cbcSMatt Macy 	uint64_t scn_max_txg;
58eda14cbcSMatt Macy 	uint64_t scn_cur_min_txg;
59eda14cbcSMatt Macy 	uint64_t scn_cur_max_txg;
60eda14cbcSMatt Macy 	uint64_t scn_start_time;
61eda14cbcSMatt Macy 	uint64_t scn_end_time;
62eda14cbcSMatt Macy 	uint64_t scn_to_examine; /* total bytes to be scanned */
63eda14cbcSMatt Macy 	uint64_t scn_examined; /* bytes scanned so far */
64*0a97523dSMartin Matuska 	uint64_t scn_skipped;	/* bytes skipped by scanner */
65eda14cbcSMatt Macy 	uint64_t scn_processed;
66eda14cbcSMatt Macy 	uint64_t scn_errors;	/* scan I/O error count */
67eda14cbcSMatt Macy 	uint64_t scn_ddt_class_max;
68eda14cbcSMatt Macy 	ddt_bookmark_t scn_ddt_bookmark;
69eda14cbcSMatt Macy 	zbookmark_phys_t scn_bookmark;
70eda14cbcSMatt Macy 	uint64_t scn_flags; /* dsl_scan_flags_t */
71eda14cbcSMatt Macy } dsl_scan_phys_t;
72eda14cbcSMatt Macy 
73eda14cbcSMatt Macy #define	SCAN_PHYS_NUMINTS (sizeof (dsl_scan_phys_t) / sizeof (uint64_t))
74eda14cbcSMatt Macy 
/* Bit flags; dsl_scan_phys_t.scn_flags is annotated as holding these. */
typedef enum dsl_scan_flags {
	DSF_VISIT_DS_AGAIN = 1<<0,
	DSF_SCRUB_PAUSED = 1<<1,
} dsl_scan_flags_t;

/*
 * Note that this mask covers DSF_VISIT_DS_AGAIN only; DSF_SCRUB_PAUSED
 * is not part of it.
 */
#define	DSL_SCAN_FLAGS_MASK (DSF_VISIT_DS_AGAIN)

/*
 * Error scrub state (embedded in dsl_scan_t as errorscrub_phys, which is
 * described there as being synced to disk).
 *
 * Every member is a uint64_t, so the structure can be treated as an
 * array of ERRORSCRUB_PHYS_NUMINTS 64-bit words.
 */
typedef struct dsl_errorscrub_phys {
	uint64_t dep_func;	/* pool_scan_func_t */
	uint64_t dep_state;	/* dsl_scan_state_t */
	uint64_t dep_cursor;	/* serialized zap cursor for tracing progress */
	uint64_t dep_start_time; /* error scrub start time, unix timestamp */
	uint64_t dep_end_time;	/* error scrub end time, unix timestamp */
	uint64_t dep_to_examine; /* total error blocks to be scrubbed */
	uint64_t dep_examined;	/* blocks scrubbed so far */
	uint64_t dep_errors;	/* error scrub I/O error count */
	uint64_t dep_paused_flags; /* flag for paused */
} dsl_errorscrub_phys_t;

/* Size of dsl_errorscrub_phys_t expressed as a number of uint64_t words. */
#define	ERRORSCRUB_PHYS_NUMINTS (sizeof (dsl_errorscrub_phys_t) \
	/ sizeof (uint64_t))

97eda14cbcSMatt Macy /*
98eda14cbcSMatt Macy  * Every pool will have one dsl_scan_t and this structure will contain
99eda14cbcSMatt Macy  * in-memory information about the scan and a pointer to the on-disk
100eda14cbcSMatt Macy  * representation (i.e. dsl_scan_phys_t). Most of the state of the scan
101eda14cbcSMatt Macy  * is contained on-disk to allow the scan to resume in the event of a reboot
102eda14cbcSMatt Macy  * or panic. This structure maintains information about the behavior of a
103eda14cbcSMatt Macy  * running scan, some caching information, and how it should traverse the pool.
104eda14cbcSMatt Macy  *
105eda14cbcSMatt Macy  * The following members of this structure direct the behavior of the scan:
106eda14cbcSMatt Macy  *
107eda14cbcSMatt Macy  * scn_suspending -	a scan that cannot be completed in a single txg or
108eda14cbcSMatt Macy  *			has exceeded its allotted time will need to suspend.
109eda14cbcSMatt Macy  *			When this flag is set the scanner will stop traversing
110eda14cbcSMatt Macy  *			the pool and write out the current state to disk.
111eda14cbcSMatt Macy  *
112eda14cbcSMatt Macy  * scn_restart_txg -	directs the scanner to either restart or start a
113eda14cbcSMatt Macy  *			a scan at the specified txg value.
114eda14cbcSMatt Macy  *
115eda14cbcSMatt Macy  * scn_done_txg -	when a scan completes its traversal it will set
116eda14cbcSMatt Macy  *			the completion txg to the next txg. This is necessary
117eda14cbcSMatt Macy  *			to ensure that any blocks that were freed during
118eda14cbcSMatt Macy  *			the scan but have not yet been processed (i.e deferred
119eda14cbcSMatt Macy  *			frees) are accounted for.
120eda14cbcSMatt Macy  *
121eda14cbcSMatt Macy  * This structure also maintains information about deferred frees which are
122eda14cbcSMatt Macy  * a special kind of traversal. Deferred free can exist in either a bptree or
123eda14cbcSMatt Macy  * a bpobj structure. The scn_is_bptree flag will indicate the type of
124eda14cbcSMatt Macy  * deferred free that is in progress. If the deferred free is part of an
125eda14cbcSMatt Macy  * asynchronous destroy then the scn_async_destroying flag will be set.
126eda14cbcSMatt Macy  */
127eda14cbcSMatt Macy typedef struct dsl_scan {
128eda14cbcSMatt Macy 	struct dsl_pool *scn_dp;
129eda14cbcSMatt Macy 	uint64_t scn_restart_txg;
130eda14cbcSMatt Macy 	uint64_t scn_done_txg;
131eda14cbcSMatt Macy 	uint64_t scn_sync_start_time;
132eda14cbcSMatt Macy 	uint64_t scn_issued_before_pass;
133eda14cbcSMatt Macy 
134eda14cbcSMatt Macy 	/* for freeing blocks */
135eda14cbcSMatt Macy 	boolean_t scn_is_bptree;
136eda14cbcSMatt Macy 	boolean_t scn_async_destroying;
137eda14cbcSMatt Macy 	boolean_t scn_async_stalled;
138eda14cbcSMatt Macy 	uint64_t  scn_async_block_min_time_ms;
139eda14cbcSMatt Macy 
140eda14cbcSMatt Macy 	/* flags and stats for controlling scan state */
141eda14cbcSMatt Macy 	boolean_t scn_is_sorted;	/* doing sequential scan */
142eda14cbcSMatt Macy 	boolean_t scn_clearing;		/* scan is issuing sequential extents */
143eda14cbcSMatt Macy 	boolean_t scn_checkpointing;	/* scan is issuing all queued extents */
144eda14cbcSMatt Macy 	boolean_t scn_suspending;	/* scan is suspending until next txg */
145eda14cbcSMatt Macy 	uint64_t scn_last_checkpoint;	/* time of last checkpoint */
146eda14cbcSMatt Macy 
147eda14cbcSMatt Macy 	/* members for thread synchronization */
148eda14cbcSMatt Macy 	zio_t *scn_zio_root;		/* root zio for waiting on IO */
149eda14cbcSMatt Macy 	taskq_t *scn_taskq;		/* task queue for issuing extents */
150eda14cbcSMatt Macy 
151eda14cbcSMatt Macy 	/* for controlling scan prefetch, protected by spa_scrub_lock */
152eda14cbcSMatt Macy 	boolean_t scn_prefetch_stop;	/* prefetch should stop */
153eda14cbcSMatt Macy 	zbookmark_phys_t scn_prefetch_bookmark;	/* prefetch start bookmark */
154eda14cbcSMatt Macy 	avl_tree_t scn_prefetch_queue;	/* priority queue of prefetch IOs */
155eda14cbcSMatt Macy 	uint64_t scn_maxinflight_bytes; /* max bytes in flight for pool */
156eda14cbcSMatt Macy 
157eda14cbcSMatt Macy 	/* per txg statistics */
158eda14cbcSMatt Macy 	uint64_t scn_visited_this_txg;	/* total bps visited this txg */
159eda14cbcSMatt Macy 	uint64_t scn_dedup_frees_this_txg;	/* dedup bps freed this txg */
160eda14cbcSMatt Macy 	uint64_t scn_holes_this_txg;
161eda14cbcSMatt Macy 	uint64_t scn_lt_min_this_txg;
162eda14cbcSMatt Macy 	uint64_t scn_gt_max_this_txg;
163eda14cbcSMatt Macy 	uint64_t scn_ddt_contained_this_txg;
164eda14cbcSMatt Macy 	uint64_t scn_objsets_visited_this_txg;
165eda14cbcSMatt Macy 	uint64_t scn_avg_seg_size_this_txg;
166eda14cbcSMatt Macy 	uint64_t scn_segs_this_txg;
167eda14cbcSMatt Macy 	uint64_t scn_avg_zio_size_this_txg;
168eda14cbcSMatt Macy 	uint64_t scn_zios_this_txg;
169eda14cbcSMatt Macy 
170c0a83fe0SMartin Matuska 	/* zap cursor for tracing error scrub progress */
171c0a83fe0SMartin Matuska 	zap_cursor_t errorscrub_cursor;
172eda14cbcSMatt Macy 	/* members needed for syncing scan status to disk */
173eda14cbcSMatt Macy 	dsl_scan_phys_t scn_phys;	/* on disk representation of scan */
174eda14cbcSMatt Macy 	dsl_scan_phys_t scn_phys_cached;
175eda14cbcSMatt Macy 	avl_tree_t scn_queue;		/* queue of datasets to scan */
176a0b956f5SMartin Matuska 	uint64_t scn_queues_pending;	/* outstanding data to issue */
177c0a83fe0SMartin Matuska 	/* members needed for syncing error scrub status to disk */
178c0a83fe0SMartin Matuska 	dsl_errorscrub_phys_t errorscrub_phys;
179eda14cbcSMatt Macy } dsl_scan_t;
180eda14cbcSMatt Macy 
181eda14cbcSMatt Macy typedef struct dsl_scan_io_queue dsl_scan_io_queue_t;
182eda14cbcSMatt Macy 
183eda14cbcSMatt Macy void scan_init(void);
184eda14cbcSMatt Macy void scan_fini(void);
185eda14cbcSMatt Macy int dsl_scan_init(struct dsl_pool *dp, uint64_t txg);
18616038816SMartin Matuska int dsl_scan_setup_check(void *, dmu_tx_t *);
1877877fdebSMatt Macy void dsl_scan_setup_sync(void *, dmu_tx_t *);
188eda14cbcSMatt Macy void dsl_scan_fini(struct dsl_pool *dp);
189eda14cbcSMatt Macy void dsl_scan_sync(struct dsl_pool *, dmu_tx_t *);
190eda14cbcSMatt Macy int dsl_scan_cancel(struct dsl_pool *);
191eda14cbcSMatt Macy int dsl_scan(struct dsl_pool *, pool_scan_func_t);
192eda14cbcSMatt Macy void dsl_scan_assess_vdev(struct dsl_pool *dp, vdev_t *vd);
193eda14cbcSMatt Macy boolean_t dsl_scan_scrubbing(const struct dsl_pool *dp);
194c0a83fe0SMartin Matuska boolean_t dsl_errorscrubbing(const struct dsl_pool *dp);
195c0a83fe0SMartin Matuska boolean_t dsl_errorscrub_active(dsl_scan_t *scn);
196eda14cbcSMatt Macy void dsl_scan_restart_resilver(struct dsl_pool *, uint64_t txg);
197c0a83fe0SMartin Matuska int dsl_scrub_set_pause_resume(const struct dsl_pool *dp,
198c0a83fe0SMartin Matuska     pool_scrub_cmd_t cmd);
199c0a83fe0SMartin Matuska void dsl_errorscrub_sync(struct dsl_pool *, dmu_tx_t *);
200eda14cbcSMatt Macy boolean_t dsl_scan_resilvering(struct dsl_pool *dp);
201eda14cbcSMatt Macy boolean_t dsl_scan_resilver_scheduled(struct dsl_pool *dp);
202eda14cbcSMatt Macy boolean_t dsl_dataset_unstable(struct dsl_dataset *ds);
203eda14cbcSMatt Macy void dsl_scan_ddt_entry(dsl_scan_t *scn, enum zio_checksum checksum,
204eda14cbcSMatt Macy     ddt_entry_t *dde, dmu_tx_t *tx);
205eda14cbcSMatt Macy void dsl_scan_ds_destroyed(struct dsl_dataset *ds, struct dmu_tx *tx);
206eda14cbcSMatt Macy void dsl_scan_ds_snapshotted(struct dsl_dataset *ds, struct dmu_tx *tx);
207eda14cbcSMatt Macy void dsl_scan_ds_clone_swapped(struct dsl_dataset *ds1, struct dsl_dataset *ds2,
208eda14cbcSMatt Macy     struct dmu_tx *tx);
209eda14cbcSMatt Macy boolean_t dsl_scan_active(dsl_scan_t *scn);
210eda14cbcSMatt Macy boolean_t dsl_scan_is_paused_scrub(const dsl_scan_t *scn);
211c0a83fe0SMartin Matuska boolean_t dsl_errorscrub_is_paused(const dsl_scan_t *scn);
212eda14cbcSMatt Macy void dsl_scan_freed(spa_t *spa, const blkptr_t *bp);
213eda14cbcSMatt Macy void dsl_scan_io_queue_destroy(dsl_scan_io_queue_t *queue);
214eda14cbcSMatt Macy void dsl_scan_io_queue_vdev_xfer(vdev_t *svd, vdev_t *tvd);
215eda14cbcSMatt Macy 
#ifdef	__cplusplus
}
#endif

#endif /* _SYS_DSL_SCAN_H */