1*eda14cbcSMatt Macy /* 2*eda14cbcSMatt Macy * CDDL HEADER START 3*eda14cbcSMatt Macy * 4*eda14cbcSMatt Macy * The contents of this file are subject to the terms of the 5*eda14cbcSMatt Macy * Common Development and Distribution License (the "License"). 6*eda14cbcSMatt Macy * You may not use this file except in compliance with the License. 7*eda14cbcSMatt Macy * 8*eda14cbcSMatt Macy * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE 9*eda14cbcSMatt Macy * or http://www.opensolaris.org/os/licensing. 10*eda14cbcSMatt Macy * See the License for the specific language governing permissions 11*eda14cbcSMatt Macy * and limitations under the License. 12*eda14cbcSMatt Macy * 13*eda14cbcSMatt Macy * When distributing Covered Code, include this CDDL HEADER in each 14*eda14cbcSMatt Macy * file and include the License file at usr/src/OPENSOLARIS.LICENSE. 15*eda14cbcSMatt Macy * If applicable, add the following below this CDDL HEADER, with the 16*eda14cbcSMatt Macy * fields enclosed by brackets "[]" replaced with your own identifying 17*eda14cbcSMatt Macy * information: Portions Copyright [yyyy] [name of copyright owner] 18*eda14cbcSMatt Macy * 19*eda14cbcSMatt Macy * CDDL HEADER END 20*eda14cbcSMatt Macy */ 21*eda14cbcSMatt Macy /* 22*eda14cbcSMatt Macy * Copyright (c) 2010, Oracle and/or its affiliates. All rights reserved. 23*eda14cbcSMatt Macy * Copyright (c) 2012, 2017 by Delphix. All rights reserved. 24*eda14cbcSMatt Macy * Copyright (c) 2017, 2019, Datto Inc. All rights reserved. 25*eda14cbcSMatt Macy */ 26*eda14cbcSMatt Macy 27*eda14cbcSMatt Macy #ifndef _SYS_DSL_SCAN_H 28*eda14cbcSMatt Macy #define _SYS_DSL_SCAN_H 29*eda14cbcSMatt Macy 30*eda14cbcSMatt Macy #include <sys/zfs_context.h> 31*eda14cbcSMatt Macy #include <sys/zio.h> 32*eda14cbcSMatt Macy #include <sys/ddt.h> 33*eda14cbcSMatt Macy #include <sys/bplist.h> 34*eda14cbcSMatt Macy 35*eda14cbcSMatt Macy #ifdef __cplusplus 36*eda14cbcSMatt Macy extern "C" { 37*eda14cbcSMatt Macy #endif 38*eda14cbcSMatt Macy 39*eda14cbcSMatt Macy struct objset; 40*eda14cbcSMatt Macy struct dsl_dir; 41*eda14cbcSMatt Macy struct dsl_dataset; 42*eda14cbcSMatt Macy struct dsl_pool; 43*eda14cbcSMatt Macy struct dmu_tx; 44*eda14cbcSMatt Macy 45*eda14cbcSMatt Macy extern int zfs_scan_suspend_progress; 46*eda14cbcSMatt Macy 47*eda14cbcSMatt Macy /* 48*eda14cbcSMatt Macy * All members of this structure must be uint64_t, for byteswap 49*eda14cbcSMatt Macy * purposes. 50*eda14cbcSMatt Macy */ 51*eda14cbcSMatt Macy typedef struct dsl_scan_phys { 52*eda14cbcSMatt Macy uint64_t scn_func; /* pool_scan_func_t */ 53*eda14cbcSMatt Macy uint64_t scn_state; /* dsl_scan_state_t */ 54*eda14cbcSMatt Macy uint64_t scn_queue_obj; 55*eda14cbcSMatt Macy uint64_t scn_min_txg; 56*eda14cbcSMatt Macy uint64_t scn_max_txg; 57*eda14cbcSMatt Macy uint64_t scn_cur_min_txg; 58*eda14cbcSMatt Macy uint64_t scn_cur_max_txg; 59*eda14cbcSMatt Macy uint64_t scn_start_time; 60*eda14cbcSMatt Macy uint64_t scn_end_time; 61*eda14cbcSMatt Macy uint64_t scn_to_examine; /* total bytes to be scanned */ 62*eda14cbcSMatt Macy uint64_t scn_examined; /* bytes scanned so far */ 63*eda14cbcSMatt Macy uint64_t scn_to_process; 64*eda14cbcSMatt Macy uint64_t scn_processed; 65*eda14cbcSMatt Macy uint64_t scn_errors; /* scan I/O error count */ 66*eda14cbcSMatt Macy uint64_t scn_ddt_class_max; 67*eda14cbcSMatt Macy ddt_bookmark_t scn_ddt_bookmark; 68*eda14cbcSMatt Macy zbookmark_phys_t scn_bookmark; 69*eda14cbcSMatt Macy uint64_t scn_flags; /* dsl_scan_flags_t */ 70*eda14cbcSMatt Macy } dsl_scan_phys_t; 71*eda14cbcSMatt Macy 72*eda14cbcSMatt Macy #define SCAN_PHYS_NUMINTS (sizeof (dsl_scan_phys_t) / sizeof (uint64_t)) 73*eda14cbcSMatt Macy 74*eda14cbcSMatt Macy typedef enum dsl_scan_flags { 75*eda14cbcSMatt Macy DSF_VISIT_DS_AGAIN = 1<<0, 76*eda14cbcSMatt Macy DSF_SCRUB_PAUSED = 1<<1, 77*eda14cbcSMatt Macy } dsl_scan_flags_t; 78*eda14cbcSMatt Macy 79*eda14cbcSMatt Macy #define DSL_SCAN_FLAGS_MASK (DSF_VISIT_DS_AGAIN) 80*eda14cbcSMatt Macy 81*eda14cbcSMatt Macy /* 82*eda14cbcSMatt Macy * Every pool will have one dsl_scan_t and this structure will contain 83*eda14cbcSMatt Macy * in-memory information about the scan and a pointer to the on-disk 84*eda14cbcSMatt Macy * representation (i.e. dsl_scan_phys_t). Most of the state of the scan 85*eda14cbcSMatt Macy * is contained on-disk to allow the scan to resume in the event of a reboot 86*eda14cbcSMatt Macy * or panic. This structure maintains information about the behavior of a 87*eda14cbcSMatt Macy * running scan, some caching information, and how it should traverse the pool. 88*eda14cbcSMatt Macy * 89*eda14cbcSMatt Macy * The following members of this structure direct the behavior of the scan: 90*eda14cbcSMatt Macy * 91*eda14cbcSMatt Macy * scn_suspending - a scan that cannot be completed in a single txg or 92*eda14cbcSMatt Macy * has exceeded its allotted time will need to suspend. 93*eda14cbcSMatt Macy * When this flag is set the scanner will stop traversing 94*eda14cbcSMatt Macy * the pool and write out the current state to disk. 95*eda14cbcSMatt Macy * 96*eda14cbcSMatt Macy * scn_restart_txg - directs the scanner to either restart or start a 97*eda14cbcSMatt Macy * a scan at the specified txg value. 98*eda14cbcSMatt Macy * 99*eda14cbcSMatt Macy * scn_done_txg - when a scan completes its traversal it will set 100*eda14cbcSMatt Macy * the completion txg to the next txg. This is necessary 101*eda14cbcSMatt Macy * to ensure that any blocks that were freed during 102*eda14cbcSMatt Macy * the scan but have not yet been processed (i.e deferred 103*eda14cbcSMatt Macy * frees) are accounted for. 104*eda14cbcSMatt Macy * 105*eda14cbcSMatt Macy * This structure also maintains information about deferred frees which are 106*eda14cbcSMatt Macy * a special kind of traversal. Deferred free can exist in either a bptree or 107*eda14cbcSMatt Macy * a bpobj structure. The scn_is_bptree flag will indicate the type of 108*eda14cbcSMatt Macy * deferred free that is in progress. If the deferred free is part of an 109*eda14cbcSMatt Macy * asynchronous destroy then the scn_async_destroying flag will be set. 110*eda14cbcSMatt Macy */ 111*eda14cbcSMatt Macy typedef struct dsl_scan { 112*eda14cbcSMatt Macy struct dsl_pool *scn_dp; 113*eda14cbcSMatt Macy uint64_t scn_restart_txg; 114*eda14cbcSMatt Macy uint64_t scn_done_txg; 115*eda14cbcSMatt Macy uint64_t scn_sync_start_time; 116*eda14cbcSMatt Macy uint64_t scn_issued_before_pass; 117*eda14cbcSMatt Macy 118*eda14cbcSMatt Macy /* for freeing blocks */ 119*eda14cbcSMatt Macy boolean_t scn_is_bptree; 120*eda14cbcSMatt Macy boolean_t scn_async_destroying; 121*eda14cbcSMatt Macy boolean_t scn_async_stalled; 122*eda14cbcSMatt Macy uint64_t scn_async_block_min_time_ms; 123*eda14cbcSMatt Macy 124*eda14cbcSMatt Macy /* flags and stats for controlling scan state */ 125*eda14cbcSMatt Macy boolean_t scn_is_sorted; /* doing sequential scan */ 126*eda14cbcSMatt Macy boolean_t scn_clearing; /* scan is issuing sequential extents */ 127*eda14cbcSMatt Macy boolean_t scn_checkpointing; /* scan is issuing all queued extents */ 128*eda14cbcSMatt Macy boolean_t scn_suspending; /* scan is suspending until next txg */ 129*eda14cbcSMatt Macy uint64_t scn_last_checkpoint; /* time of last checkpoint */ 130*eda14cbcSMatt Macy 131*eda14cbcSMatt Macy /* members for thread synchronization */ 132*eda14cbcSMatt Macy zio_t *scn_zio_root; /* root zio for waiting on IO */ 133*eda14cbcSMatt Macy taskq_t *scn_taskq; /* task queue for issuing extents */ 134*eda14cbcSMatt Macy 135*eda14cbcSMatt Macy /* for controlling scan prefetch, protected by spa_scrub_lock */ 136*eda14cbcSMatt Macy boolean_t scn_prefetch_stop; /* prefetch should stop */ 137*eda14cbcSMatt Macy zbookmark_phys_t scn_prefetch_bookmark; /* prefetch start bookmark */ 138*eda14cbcSMatt Macy avl_tree_t scn_prefetch_queue; /* priority queue of prefetch IOs */ 139*eda14cbcSMatt Macy uint64_t scn_maxinflight_bytes; /* max bytes in flight for pool */ 140*eda14cbcSMatt Macy 141*eda14cbcSMatt Macy /* per txg statistics */ 142*eda14cbcSMatt Macy uint64_t scn_visited_this_txg; /* total bps visited this txg */ 143*eda14cbcSMatt Macy uint64_t scn_dedup_frees_this_txg; /* dedup bps freed this txg */ 144*eda14cbcSMatt Macy uint64_t scn_holes_this_txg; 145*eda14cbcSMatt Macy uint64_t scn_lt_min_this_txg; 146*eda14cbcSMatt Macy uint64_t scn_gt_max_this_txg; 147*eda14cbcSMatt Macy uint64_t scn_ddt_contained_this_txg; 148*eda14cbcSMatt Macy uint64_t scn_objsets_visited_this_txg; 149*eda14cbcSMatt Macy uint64_t scn_avg_seg_size_this_txg; 150*eda14cbcSMatt Macy uint64_t scn_segs_this_txg; 151*eda14cbcSMatt Macy uint64_t scn_avg_zio_size_this_txg; 152*eda14cbcSMatt Macy uint64_t scn_zios_this_txg; 153*eda14cbcSMatt Macy 154*eda14cbcSMatt Macy /* members needed for syncing scan status to disk */ 155*eda14cbcSMatt Macy dsl_scan_phys_t scn_phys; /* on disk representation of scan */ 156*eda14cbcSMatt Macy dsl_scan_phys_t scn_phys_cached; 157*eda14cbcSMatt Macy avl_tree_t scn_queue; /* queue of datasets to scan */ 158*eda14cbcSMatt Macy uint64_t scn_bytes_pending; /* outstanding data to issue */ 159*eda14cbcSMatt Macy } dsl_scan_t; 160*eda14cbcSMatt Macy 161*eda14cbcSMatt Macy typedef struct dsl_scan_io_queue dsl_scan_io_queue_t; 162*eda14cbcSMatt Macy 163*eda14cbcSMatt Macy void scan_init(void); 164*eda14cbcSMatt Macy void scan_fini(void); 165*eda14cbcSMatt Macy int dsl_scan_init(struct dsl_pool *dp, uint64_t txg); 166*eda14cbcSMatt Macy void dsl_scan_fini(struct dsl_pool *dp); 167*eda14cbcSMatt Macy void dsl_scan_sync(struct dsl_pool *, dmu_tx_t *); 168*eda14cbcSMatt Macy int dsl_scan_cancel(struct dsl_pool *); 169*eda14cbcSMatt Macy int dsl_scan(struct dsl_pool *, pool_scan_func_t); 170*eda14cbcSMatt Macy void dsl_scan_assess_vdev(struct dsl_pool *dp, vdev_t *vd); 171*eda14cbcSMatt Macy boolean_t dsl_scan_scrubbing(const struct dsl_pool *dp); 172*eda14cbcSMatt Macy int dsl_scrub_set_pause_resume(const struct dsl_pool *dp, pool_scrub_cmd_t cmd); 173*eda14cbcSMatt Macy void dsl_scan_restart_resilver(struct dsl_pool *, uint64_t txg); 174*eda14cbcSMatt Macy boolean_t dsl_scan_resilvering(struct dsl_pool *dp); 175*eda14cbcSMatt Macy boolean_t dsl_scan_resilver_scheduled(struct dsl_pool *dp); 176*eda14cbcSMatt Macy boolean_t dsl_dataset_unstable(struct dsl_dataset *ds); 177*eda14cbcSMatt Macy void dsl_scan_ddt_entry(dsl_scan_t *scn, enum zio_checksum checksum, 178*eda14cbcSMatt Macy ddt_entry_t *dde, dmu_tx_t *tx); 179*eda14cbcSMatt Macy void dsl_scan_ds_destroyed(struct dsl_dataset *ds, struct dmu_tx *tx); 180*eda14cbcSMatt Macy void dsl_scan_ds_snapshotted(struct dsl_dataset *ds, struct dmu_tx *tx); 181*eda14cbcSMatt Macy void dsl_scan_ds_clone_swapped(struct dsl_dataset *ds1, struct dsl_dataset *ds2, 182*eda14cbcSMatt Macy struct dmu_tx *tx); 183*eda14cbcSMatt Macy boolean_t dsl_scan_active(dsl_scan_t *scn); 184*eda14cbcSMatt Macy boolean_t dsl_scan_is_paused_scrub(const dsl_scan_t *scn); 185*eda14cbcSMatt Macy void dsl_scan_freed(spa_t *spa, const blkptr_t *bp); 186*eda14cbcSMatt Macy void dsl_scan_io_queue_destroy(dsl_scan_io_queue_t *queue); 187*eda14cbcSMatt Macy void dsl_scan_io_queue_vdev_xfer(vdev_t *svd, vdev_t *tvd); 188*eda14cbcSMatt Macy 189*eda14cbcSMatt Macy #ifdef __cplusplus 190*eda14cbcSMatt Macy } 191*eda14cbcSMatt Macy #endif 192*eda14cbcSMatt Macy 193*eda14cbcSMatt Macy #endif /* _SYS_DSL_SCAN_H */ 194