1b24ab676SJeff Bonwick /* 2b24ab676SJeff Bonwick * CDDL HEADER START 3b24ab676SJeff Bonwick * 4b24ab676SJeff Bonwick * The contents of this file are subject to the terms of the 5b24ab676SJeff Bonwick * Common Development and Distribution License (the "License"). 6b24ab676SJeff Bonwick * You may not use this file except in compliance with the License. 7b24ab676SJeff Bonwick * 8b24ab676SJeff Bonwick * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE 9b24ab676SJeff Bonwick * or http://www.opensolaris.org/os/licensing. 10b24ab676SJeff Bonwick * See the License for the specific language governing permissions 11b24ab676SJeff Bonwick * and limitations under the License. 12b24ab676SJeff Bonwick * 13b24ab676SJeff Bonwick * When distributing Covered Code, include this CDDL HEADER in each 14b24ab676SJeff Bonwick * file and include the License file at usr/src/OPENSOLARIS.LICENSE. 15b24ab676SJeff Bonwick * If applicable, add the following below this CDDL HEADER, with the 16b24ab676SJeff Bonwick * fields enclosed by brackets "[]" replaced with your own identifying 17b24ab676SJeff Bonwick * information: Portions Copyright [yyyy] [name of copyright owner] 18b24ab676SJeff Bonwick * 19b24ab676SJeff Bonwick * CDDL HEADER END 20b24ab676SJeff Bonwick */ 21b24ab676SJeff Bonwick 22b24ab676SJeff Bonwick /* 233f9d6ad7SLin Ling * Copyright (c) 2009, 2010, Oracle and/or its affiliates. All rights reserved. 24*45818ee1SMatthew Ahrens * Copyright (c) 2012, 2015 by Delphix. All rights reserved. 25b24ab676SJeff Bonwick */ 26b24ab676SJeff Bonwick 27b24ab676SJeff Bonwick #include <sys/zfs_context.h> 28b24ab676SJeff Bonwick #include <sys/spa.h> 29b24ab676SJeff Bonwick #include <sys/spa_impl.h> 30b24ab676SJeff Bonwick #include <sys/zio.h> 31b24ab676SJeff Bonwick #include <sys/ddt.h> 32b24ab676SJeff Bonwick #include <sys/zap.h> 33b24ab676SJeff Bonwick #include <sys/dmu_tx.h> 34b24ab676SJeff Bonwick #include <sys/arc.h> 35bbfd46c4SJeff Bonwick #include <sys/dsl_pool.h> 36b24ab676SJeff Bonwick #include <sys/zio_checksum.h> 37b24ab676SJeff Bonwick #include <sys/zio_compress.h> 383f9d6ad7SLin Ling #include <sys/dsl_scan.h> 39b24ab676SJeff Bonwick 40837b568bSGeorge Wilson /* 41837b568bSGeorge Wilson * Enable/disable prefetching of dedup-ed blocks which are going to be freed. 42837b568bSGeorge Wilson */ 43837b568bSGeorge Wilson int zfs_dedup_prefetch = 1; 44837b568bSGeorge Wilson 45b24ab676SJeff Bonwick static const ddt_ops_t *ddt_ops[DDT_TYPES] = { 46b24ab676SJeff Bonwick &ddt_zap_ops, 47b24ab676SJeff Bonwick }; 48b24ab676SJeff Bonwick 49b24ab676SJeff Bonwick static const char *ddt_class_name[DDT_CLASSES] = { 50b24ab676SJeff Bonwick "ditto", 51b24ab676SJeff Bonwick "duplicate", 52b24ab676SJeff Bonwick "unique", 53b24ab676SJeff Bonwick }; 54b24ab676SJeff Bonwick 55b24ab676SJeff Bonwick static void 56b24ab676SJeff Bonwick ddt_object_create(ddt_t *ddt, enum ddt_type type, enum ddt_class class, 57b24ab676SJeff Bonwick dmu_tx_t *tx) 58b24ab676SJeff Bonwick { 59b24ab676SJeff Bonwick spa_t *spa = ddt->ddt_spa; 60b24ab676SJeff Bonwick objset_t *os = ddt->ddt_os; 61b24ab676SJeff Bonwick uint64_t *objectp = &ddt->ddt_object[type][class]; 62*45818ee1SMatthew Ahrens boolean_t prehash = zio_checksum_table[ddt->ddt_checksum].ci_flags & 63*45818ee1SMatthew Ahrens ZCHECKSUM_FLAG_DEDUP; 64b24ab676SJeff Bonwick char name[DDT_NAMELEN]; 65b24ab676SJeff Bonwick 66b24ab676SJeff Bonwick ddt_object_name(ddt, type, class, name); 67b24ab676SJeff Bonwick 68b24ab676SJeff Bonwick ASSERT(*objectp == 0); 69b24ab676SJeff Bonwick VERIFY(ddt_ops[type]->ddt_op_create(os, objectp, tx, prehash) == 0); 70b24ab676SJeff Bonwick ASSERT(*objectp != 0); 71b24ab676SJeff Bonwick 72b24ab676SJeff Bonwick VERIFY(zap_add(os, DMU_POOL_DIRECTORY_OBJECT, name, 73b24ab676SJeff Bonwick sizeof (uint64_t), 1, objectp, tx) == 0); 74b24ab676SJeff Bonwick 75b24ab676SJeff Bonwick VERIFY(zap_add(os, spa->spa_ddt_stat_object, name, 76b24ab676SJeff Bonwick sizeof (uint64_t), sizeof (ddt_histogram_t) / sizeof (uint64_t), 77b24ab676SJeff Bonwick &ddt->ddt_histogram[type][class], tx) == 0); 78b24ab676SJeff Bonwick } 79b24ab676SJeff Bonwick 80b24ab676SJeff Bonwick static void 81b24ab676SJeff Bonwick ddt_object_destroy(ddt_t *ddt, enum ddt_type type, enum ddt_class class, 82b24ab676SJeff Bonwick dmu_tx_t *tx) 83b24ab676SJeff Bonwick { 84b24ab676SJeff Bonwick spa_t *spa = ddt->ddt_spa; 85b24ab676SJeff Bonwick objset_t *os = ddt->ddt_os; 86b24ab676SJeff Bonwick uint64_t *objectp = &ddt->ddt_object[type][class]; 87b24ab676SJeff Bonwick char name[DDT_NAMELEN]; 88b24ab676SJeff Bonwick 89b24ab676SJeff Bonwick ddt_object_name(ddt, type, class, name); 90b24ab676SJeff Bonwick 91b24ab676SJeff Bonwick ASSERT(*objectp != 0); 92b24ab676SJeff Bonwick ASSERT(ddt_object_count(ddt, type, class) == 0); 93b24ab676SJeff Bonwick ASSERT(ddt_histogram_empty(&ddt->ddt_histogram[type][class])); 94b24ab676SJeff Bonwick VERIFY(zap_remove(os, DMU_POOL_DIRECTORY_OBJECT, name, tx) == 0); 95b24ab676SJeff Bonwick VERIFY(zap_remove(os, spa->spa_ddt_stat_object, name, tx) == 0); 96b24ab676SJeff Bonwick VERIFY(ddt_ops[type]->ddt_op_destroy(os, *objectp, tx) == 0); 9730f608a4SGeorge Wilson bzero(&ddt->ddt_object_stats[type][class], sizeof (ddt_object_t)); 98b24ab676SJeff Bonwick 99b24ab676SJeff Bonwick *objectp = 0; 100b24ab676SJeff Bonwick } 101b24ab676SJeff Bonwick 102b24ab676SJeff Bonwick static int 103b24ab676SJeff Bonwick ddt_object_load(ddt_t *ddt, enum ddt_type type, enum ddt_class class) 104b24ab676SJeff Bonwick { 10530f608a4SGeorge Wilson ddt_object_t *ddo = &ddt->ddt_object_stats[type][class]; 10630f608a4SGeorge Wilson dmu_object_info_t doi; 107b24ab676SJeff Bonwick char name[DDT_NAMELEN]; 108b24ab676SJeff Bonwick int error; 109b24ab676SJeff Bonwick 110b24ab676SJeff Bonwick ddt_object_name(ddt, type, class, name); 111b24ab676SJeff Bonwick 112b24ab676SJeff Bonwick error = zap_lookup(ddt->ddt_os, DMU_POOL_DIRECTORY_OBJECT, name, 113b24ab676SJeff Bonwick sizeof (uint64_t), 1, &ddt->ddt_object[type][class]); 114b24ab676SJeff Bonwick 11543466aaeSMax Grossman if (error != 0) 116b24ab676SJeff Bonwick return (error); 117b24ab676SJeff Bonwick 11843466aaeSMax Grossman VERIFY0(zap_lookup(ddt->ddt_os, ddt->ddt_spa->spa_ddt_stat_object, name, 119b24ab676SJeff Bonwick sizeof (uint64_t), sizeof (ddt_histogram_t) / sizeof (uint64_t), 12043466aaeSMax Grossman &ddt->ddt_histogram[type][class])); 121b24ab676SJeff Bonwick 12230f608a4SGeorge Wilson /* 12330f608a4SGeorge Wilson * Seed the cached statistics. 12430f608a4SGeorge Wilson */ 12530f608a4SGeorge Wilson VERIFY(ddt_object_info(ddt, type, class, &doi) == 0); 12630f608a4SGeorge Wilson 12730f608a4SGeorge Wilson ddo->ddo_count = ddt_object_count(ddt, type, class); 12830f608a4SGeorge Wilson ddo->ddo_dspace = doi.doi_physical_blocks_512 << 9; 12930f608a4SGeorge Wilson ddo->ddo_mspace = doi.doi_fill_count * doi.doi_data_block_size; 13030f608a4SGeorge Wilson 13143466aaeSMax Grossman return (0); 132b24ab676SJeff Bonwick } 133b24ab676SJeff Bonwick 134b24ab676SJeff Bonwick static void 135b24ab676SJeff Bonwick ddt_object_sync(ddt_t *ddt, enum ddt_type type, enum ddt_class class, 136b24ab676SJeff Bonwick dmu_tx_t *tx) 137b24ab676SJeff Bonwick { 13830f608a4SGeorge Wilson ddt_object_t *ddo = &ddt->ddt_object_stats[type][class]; 13930f608a4SGeorge Wilson dmu_object_info_t doi; 140b24ab676SJeff Bonwick char name[DDT_NAMELEN]; 141b24ab676SJeff Bonwick 142b24ab676SJeff Bonwick ddt_object_name(ddt, type, class, name); 143b24ab676SJeff Bonwick 144b24ab676SJeff Bonwick VERIFY(zap_update(ddt->ddt_os, ddt->ddt_spa->spa_ddt_stat_object, name, 145b24ab676SJeff Bonwick sizeof (uint64_t), sizeof (ddt_histogram_t) / sizeof (uint64_t), 146b24ab676SJeff Bonwick &ddt->ddt_histogram[type][class], tx) == 0); 14730f608a4SGeorge Wilson 14830f608a4SGeorge Wilson /* 14930f608a4SGeorge Wilson * Cache DDT statistics; this is the only time they'll change. 15030f608a4SGeorge Wilson */ 15130f608a4SGeorge Wilson VERIFY(ddt_object_info(ddt, type, class, &doi) == 0); 15230f608a4SGeorge Wilson 15330f608a4SGeorge Wilson ddo->ddo_count = ddt_object_count(ddt, type, class); 15430f608a4SGeorge Wilson ddo->ddo_dspace = doi.doi_physical_blocks_512 << 9; 15530f608a4SGeorge Wilson ddo->ddo_mspace = doi.doi_fill_count * doi.doi_data_block_size; 156b24ab676SJeff Bonwick } 157b24ab676SJeff Bonwick 158b24ab676SJeff Bonwick static int 159b24ab676SJeff Bonwick ddt_object_lookup(ddt_t *ddt, enum ddt_type type, enum ddt_class class, 160b24ab676SJeff Bonwick ddt_entry_t *dde) 161b24ab676SJeff Bonwick { 162b24ab676SJeff Bonwick if (!ddt_object_exists(ddt, type, class)) 163be6fd75aSMatthew Ahrens return (SET_ERROR(ENOENT)); 164b24ab676SJeff Bonwick 165b24ab676SJeff Bonwick return (ddt_ops[type]->ddt_op_lookup(ddt->ddt_os, 166b24ab676SJeff Bonwick ddt->ddt_object[type][class], dde)); 167b24ab676SJeff Bonwick } 168b24ab676SJeff Bonwick 169c7cd2421SGeorge Wilson static void 170c7cd2421SGeorge Wilson ddt_object_prefetch(ddt_t *ddt, enum ddt_type type, enum ddt_class class, 171c7cd2421SGeorge Wilson ddt_entry_t *dde) 172c7cd2421SGeorge Wilson { 173c7cd2421SGeorge Wilson if (!ddt_object_exists(ddt, type, class)) 174c7cd2421SGeorge Wilson return; 175c7cd2421SGeorge Wilson 176c7cd2421SGeorge Wilson ddt_ops[type]->ddt_op_prefetch(ddt->ddt_os, 177c7cd2421SGeorge Wilson ddt->ddt_object[type][class], dde); 178c7cd2421SGeorge Wilson } 179c7cd2421SGeorge Wilson 1803f9d6ad7SLin Ling int 181b24ab676SJeff Bonwick ddt_object_update(ddt_t *ddt, enum ddt_type type, enum ddt_class class, 182b24ab676SJeff Bonwick ddt_entry_t *dde, dmu_tx_t *tx) 183b24ab676SJeff Bonwick { 184b24ab676SJeff Bonwick ASSERT(ddt_object_exists(ddt, type, class)); 185b24ab676SJeff Bonwick 186b24ab676SJeff Bonwick return (ddt_ops[type]->ddt_op_update(ddt->ddt_os, 187b24ab676SJeff Bonwick ddt->ddt_object[type][class], dde, tx)); 188b24ab676SJeff Bonwick } 189b24ab676SJeff Bonwick 190b24ab676SJeff Bonwick static int 191b24ab676SJeff Bonwick ddt_object_remove(ddt_t *ddt, enum ddt_type type, enum ddt_class class, 192b24ab676SJeff Bonwick ddt_entry_t *dde, dmu_tx_t *tx) 193b24ab676SJeff Bonwick { 194b24ab676SJeff Bonwick ASSERT(ddt_object_exists(ddt, type, class)); 195b24ab676SJeff Bonwick 196b24ab676SJeff Bonwick return (ddt_ops[type]->ddt_op_remove(ddt->ddt_os, 197b24ab676SJeff Bonwick ddt->ddt_object[type][class], dde, tx)); 198b24ab676SJeff Bonwick } 199b24ab676SJeff Bonwick 200b24ab676SJeff Bonwick int 201b24ab676SJeff Bonwick ddt_object_walk(ddt_t *ddt, enum ddt_type type, enum ddt_class class, 202bbfd46c4SJeff Bonwick uint64_t *walk, ddt_entry_t *dde) 203b24ab676SJeff Bonwick { 204b24ab676SJeff Bonwick ASSERT(ddt_object_exists(ddt, type, class)); 205b24ab676SJeff Bonwick 206b24ab676SJeff Bonwick return (ddt_ops[type]->ddt_op_walk(ddt->ddt_os, 207b24ab676SJeff Bonwick ddt->ddt_object[type][class], dde, walk)); 208b24ab676SJeff Bonwick } 209b24ab676SJeff Bonwick 210b24ab676SJeff Bonwick uint64_t 211b24ab676SJeff Bonwick ddt_object_count(ddt_t *ddt, enum ddt_type type, enum ddt_class class) 212b24ab676SJeff Bonwick { 213b24ab676SJeff Bonwick ASSERT(ddt_object_exists(ddt, type, class)); 214b24ab676SJeff Bonwick 215b24ab676SJeff Bonwick return (ddt_ops[type]->ddt_op_count(ddt->ddt_os, 216b24ab676SJeff Bonwick ddt->ddt_object[type][class])); 217b24ab676SJeff Bonwick } 218b24ab676SJeff Bonwick 219b24ab676SJeff Bonwick int 220b24ab676SJeff Bonwick ddt_object_info(ddt_t *ddt, enum ddt_type type, enum ddt_class class, 221b24ab676SJeff Bonwick dmu_object_info_t *doi) 222b24ab676SJeff Bonwick { 223b24ab676SJeff Bonwick if (!ddt_object_exists(ddt, type, class)) 224be6fd75aSMatthew Ahrens return (SET_ERROR(ENOENT)); 225b24ab676SJeff Bonwick 226b24ab676SJeff Bonwick return (dmu_object_info(ddt->ddt_os, ddt->ddt_object[type][class], 227b24ab676SJeff Bonwick doi)); 228b24ab676SJeff Bonwick } 229b24ab676SJeff Bonwick 230b24ab676SJeff Bonwick boolean_t 231b24ab676SJeff Bonwick ddt_object_exists(ddt_t *ddt, enum ddt_type type, enum ddt_class class) 232b24ab676SJeff Bonwick { 233b24ab676SJeff Bonwick return (!!ddt->ddt_object[type][class]); 234b24ab676SJeff Bonwick } 235b24ab676SJeff Bonwick 236b24ab676SJeff Bonwick void 237b24ab676SJeff Bonwick ddt_object_name(ddt_t *ddt, enum ddt_type type, enum ddt_class class, 238b24ab676SJeff Bonwick char *name) 239b24ab676SJeff Bonwick { 240b24ab676SJeff Bonwick (void) sprintf(name, DMU_POOL_DDT, 241b24ab676SJeff Bonwick zio_checksum_table[ddt->ddt_checksum].ci_name, 242b24ab676SJeff Bonwick ddt_ops[type]->ddt_op_name, ddt_class_name[class]); 243b24ab676SJeff Bonwick } 244b24ab676SJeff Bonwick 245b24ab676SJeff Bonwick void 246b24ab676SJeff Bonwick ddt_bp_fill(const ddt_phys_t *ddp, blkptr_t *bp, uint64_t txg) 247b24ab676SJeff Bonwick { 248b24ab676SJeff Bonwick ASSERT(txg != 0); 249b24ab676SJeff Bonwick 250b24ab676SJeff Bonwick for (int d = 0; d < SPA_DVAS_PER_BP; d++) 251b24ab676SJeff Bonwick bp->blk_dva[d] = ddp->ddp_dva[d]; 252b24ab676SJeff Bonwick BP_SET_BIRTH(bp, txg, ddp->ddp_phys_birth); 253b24ab676SJeff Bonwick } 254b24ab676SJeff Bonwick 255b24ab676SJeff Bonwick void 256bbfd46c4SJeff Bonwick ddt_bp_create(enum zio_checksum checksum, 257bbfd46c4SJeff Bonwick const ddt_key_t *ddk, const ddt_phys_t *ddp, blkptr_t *bp) 258b24ab676SJeff Bonwick { 259b24ab676SJeff Bonwick BP_ZERO(bp); 260b24ab676SJeff Bonwick 261b24ab676SJeff Bonwick if (ddp != NULL) 262b24ab676SJeff Bonwick ddt_bp_fill(ddp, bp, ddp->ddp_phys_birth); 263b24ab676SJeff Bonwick 264b24ab676SJeff Bonwick bp->blk_cksum = ddk->ddk_cksum; 2653f9d6ad7SLin Ling bp->blk_fill = 1; 266b24ab676SJeff Bonwick 267b24ab676SJeff Bonwick BP_SET_LSIZE(bp, DDK_GET_LSIZE(ddk)); 268b24ab676SJeff Bonwick BP_SET_PSIZE(bp, DDK_GET_PSIZE(ddk)); 269b24ab676SJeff Bonwick BP_SET_COMPRESS(bp, DDK_GET_COMPRESS(ddk)); 270bbfd46c4SJeff Bonwick BP_SET_CHECKSUM(bp, checksum); 2713f9d6ad7SLin Ling BP_SET_TYPE(bp, DMU_OT_DEDUP); 272b24ab676SJeff Bonwick BP_SET_LEVEL(bp, 0); 273b24ab676SJeff Bonwick BP_SET_DEDUP(bp, 0); 274b24ab676SJeff Bonwick BP_SET_BYTEORDER(bp, ZFS_HOST_BYTEORDER); 275b24ab676SJeff Bonwick } 276b24ab676SJeff Bonwick 277b24ab676SJeff Bonwick void 278b24ab676SJeff Bonwick ddt_key_fill(ddt_key_t *ddk, const blkptr_t *bp) 279b24ab676SJeff Bonwick { 280b24ab676SJeff Bonwick ddk->ddk_cksum = bp->blk_cksum; 281b24ab676SJeff Bonwick ddk->ddk_prop = 0; 282b24ab676SJeff Bonwick 283b24ab676SJeff Bonwick DDK_SET_LSIZE(ddk, BP_GET_LSIZE(bp)); 284b24ab676SJeff Bonwick DDK_SET_PSIZE(ddk, BP_GET_PSIZE(bp)); 285b24ab676SJeff Bonwick DDK_SET_COMPRESS(ddk, BP_GET_COMPRESS(bp)); 286b24ab676SJeff Bonwick } 287b24ab676SJeff Bonwick 288b24ab676SJeff Bonwick void 289b24ab676SJeff Bonwick ddt_phys_fill(ddt_phys_t *ddp, const blkptr_t *bp) 290b24ab676SJeff Bonwick { 291b24ab676SJeff Bonwick ASSERT(ddp->ddp_phys_birth == 0); 292b24ab676SJeff Bonwick 293b24ab676SJeff Bonwick for (int d = 0; d < SPA_DVAS_PER_BP; d++) 294b24ab676SJeff Bonwick ddp->ddp_dva[d] = bp->blk_dva[d]; 295b24ab676SJeff Bonwick ddp->ddp_phys_birth = BP_PHYSICAL_BIRTH(bp); 296b24ab676SJeff Bonwick } 297b24ab676SJeff Bonwick 298b24ab676SJeff Bonwick void 299b24ab676SJeff Bonwick ddt_phys_clear(ddt_phys_t *ddp) 300b24ab676SJeff Bonwick { 301b24ab676SJeff Bonwick bzero(ddp, sizeof (*ddp)); 302b24ab676SJeff Bonwick } 303b24ab676SJeff Bonwick 304b24ab676SJeff Bonwick void 305b24ab676SJeff Bonwick ddt_phys_addref(ddt_phys_t *ddp) 306b24ab676SJeff Bonwick { 307b24ab676SJeff Bonwick ddp->ddp_refcnt++; 308b24ab676SJeff Bonwick } 309b24ab676SJeff Bonwick 310b24ab676SJeff Bonwick void 311b24ab676SJeff Bonwick ddt_phys_decref(ddt_phys_t *ddp) 312b24ab676SJeff Bonwick { 313b24ab676SJeff Bonwick ASSERT((int64_t)ddp->ddp_refcnt > 0); 314b24ab676SJeff Bonwick ddp->ddp_refcnt--; 315b24ab676SJeff Bonwick } 316b24ab676SJeff Bonwick 317b24ab676SJeff Bonwick void 318b24ab676SJeff Bonwick ddt_phys_free(ddt_t *ddt, ddt_key_t *ddk, ddt_phys_t *ddp, uint64_t txg) 319b24ab676SJeff Bonwick { 320b24ab676SJeff Bonwick blkptr_t blk; 321b24ab676SJeff Bonwick 322bbfd46c4SJeff Bonwick ddt_bp_create(ddt->ddt_checksum, ddk, ddp, &blk); 323b24ab676SJeff Bonwick ddt_phys_clear(ddp); 324b24ab676SJeff Bonwick zio_free(ddt->ddt_spa, txg, &blk); 325b24ab676SJeff Bonwick } 326b24ab676SJeff Bonwick 327b24ab676SJeff Bonwick ddt_phys_t * 328b24ab676SJeff Bonwick ddt_phys_select(const ddt_entry_t *dde, const blkptr_t *bp) 329b24ab676SJeff Bonwick { 330b24ab676SJeff Bonwick ddt_phys_t *ddp = (ddt_phys_t *)dde->dde_phys; 331b24ab676SJeff Bonwick 332b24ab676SJeff Bonwick for (int p = 0; p < DDT_PHYS_TYPES; p++, ddp++) { 333b24ab676SJeff Bonwick if (DVA_EQUAL(BP_IDENTITY(bp), &ddp->ddp_dva[0]) && 334b24ab676SJeff Bonwick BP_PHYSICAL_BIRTH(bp) == ddp->ddp_phys_birth) 335b24ab676SJeff Bonwick return (ddp); 336b24ab676SJeff Bonwick } 337b24ab676SJeff Bonwick return (NULL); 338b24ab676SJeff Bonwick } 339b24ab676SJeff Bonwick 340b24ab676SJeff Bonwick uint64_t 341b24ab676SJeff Bonwick ddt_phys_total_refcnt(const ddt_entry_t *dde) 342b24ab676SJeff Bonwick { 343b24ab676SJeff Bonwick uint64_t refcnt = 0; 344b24ab676SJeff Bonwick 345b24ab676SJeff Bonwick for (int p = DDT_PHYS_SINGLE; p <= DDT_PHYS_TRIPLE; p++) 346b24ab676SJeff Bonwick refcnt += dde->dde_phys[p].ddp_refcnt; 347b24ab676SJeff Bonwick 348b24ab676SJeff Bonwick return (refcnt); 349b24ab676SJeff Bonwick } 350b24ab676SJeff Bonwick 351b24ab676SJeff Bonwick static void 352b24ab676SJeff Bonwick ddt_stat_generate(ddt_t *ddt, ddt_entry_t *dde, ddt_stat_t *dds) 353b24ab676SJeff Bonwick { 354b24ab676SJeff Bonwick spa_t *spa = ddt->ddt_spa; 355b24ab676SJeff Bonwick ddt_phys_t *ddp = dde->dde_phys; 356b24ab676SJeff Bonwick ddt_key_t *ddk = &dde->dde_key; 357b24ab676SJeff Bonwick uint64_t lsize = DDK_GET_LSIZE(ddk); 358b24ab676SJeff Bonwick uint64_t psize = DDK_GET_PSIZE(ddk); 359b24ab676SJeff Bonwick 360b24ab676SJeff Bonwick bzero(dds, sizeof (*dds)); 361b24ab676SJeff Bonwick 362b24ab676SJeff Bonwick for (int p = 0; p < DDT_PHYS_TYPES; p++, ddp++) { 363b24ab676SJeff Bonwick uint64_t dsize = 0; 364b24ab676SJeff Bonwick uint64_t refcnt = ddp->ddp_refcnt; 365b24ab676SJeff Bonwick 366b24ab676SJeff Bonwick if (ddp->ddp_phys_birth == 0) 367b24ab676SJeff Bonwick continue; 368b24ab676SJeff Bonwick 369b24ab676SJeff Bonwick for (int d = 0; d < SPA_DVAS_PER_BP; d++) 370b24ab676SJeff Bonwick dsize += dva_get_dsize_sync(spa, &ddp->ddp_dva[d]); 371b24ab676SJeff Bonwick 372b24ab676SJeff Bonwick dds->dds_blocks += 1; 373b24ab676SJeff Bonwick dds->dds_lsize += lsize; 374b24ab676SJeff Bonwick dds->dds_psize += psize; 375b24ab676SJeff Bonwick dds->dds_dsize += dsize; 376b24ab676SJeff Bonwick 377b24ab676SJeff Bonwick dds->dds_ref_blocks += refcnt; 378b24ab676SJeff Bonwick dds->dds_ref_lsize += lsize * refcnt; 379b24ab676SJeff Bonwick dds->dds_ref_psize += psize * refcnt; 380b24ab676SJeff Bonwick dds->dds_ref_dsize += dsize * refcnt; 381b24ab676SJeff Bonwick } 382b24ab676SJeff Bonwick } 383b24ab676SJeff Bonwick 384b24ab676SJeff Bonwick void 385b24ab676SJeff Bonwick ddt_stat_add(ddt_stat_t *dst, const ddt_stat_t *src, uint64_t neg) 386b24ab676SJeff Bonwick { 387b24ab676SJeff Bonwick const uint64_t *s = (const uint64_t *)src; 388b24ab676SJeff Bonwick uint64_t *d = (uint64_t *)dst; 389b24ab676SJeff Bonwick uint64_t *d_end = (uint64_t *)(dst + 1); 390b24ab676SJeff Bonwick 391b24ab676SJeff Bonwick ASSERT(neg == 0 || neg == -1ULL); /* add or subtract */ 392b24ab676SJeff Bonwick 393b24ab676SJeff Bonwick while (d < d_end) 394b24ab676SJeff Bonwick *d++ += (*s++ ^ neg) - neg; 395b24ab676SJeff Bonwick } 396b24ab676SJeff Bonwick 397b24ab676SJeff Bonwick static void 398b24ab676SJeff Bonwick ddt_stat_update(ddt_t *ddt, ddt_entry_t *dde, uint64_t neg) 399b24ab676SJeff Bonwick { 400b24ab676SJeff Bonwick ddt_stat_t dds; 401b24ab676SJeff Bonwick ddt_histogram_t *ddh; 402b24ab676SJeff Bonwick int bucket; 403b24ab676SJeff Bonwick 404b24ab676SJeff Bonwick ddt_stat_generate(ddt, dde, &dds); 405b24ab676SJeff Bonwick 406bf16b11eSMatthew Ahrens bucket = highbit64(dds.dds_ref_blocks) - 1; 407b24ab676SJeff Bonwick ASSERT(bucket >= 0); 408b24ab676SJeff Bonwick 409b24ab676SJeff Bonwick ddh = &ddt->ddt_histogram[dde->dde_type][dde->dde_class]; 410b24ab676SJeff Bonwick 411b24ab676SJeff Bonwick ddt_stat_add(&ddh->ddh_stat[bucket], &dds, neg); 412b24ab676SJeff Bonwick } 413b24ab676SJeff Bonwick 414b24ab676SJeff Bonwick void 415b24ab676SJeff Bonwick ddt_histogram_add(ddt_histogram_t *dst, const ddt_histogram_t *src) 416b24ab676SJeff Bonwick { 417b24ab676SJeff Bonwick for (int h = 0; h < 64; h++) 418b24ab676SJeff Bonwick ddt_stat_add(&dst->ddh_stat[h], &src->ddh_stat[h], 0); 419b24ab676SJeff Bonwick } 420b24ab676SJeff Bonwick 421b24ab676SJeff Bonwick void 422b24ab676SJeff Bonwick ddt_histogram_stat(ddt_stat_t *dds, const ddt_histogram_t *ddh) 423b24ab676SJeff Bonwick { 424b24ab676SJeff Bonwick bzero(dds, sizeof (*dds)); 425b24ab676SJeff Bonwick 426b24ab676SJeff Bonwick for (int h = 0; h < 64; h++) 427b24ab676SJeff Bonwick ddt_stat_add(dds, &ddh->ddh_stat[h], 0); 428b24ab676SJeff Bonwick } 429b24ab676SJeff Bonwick 430b24ab676SJeff Bonwick boolean_t 431b24ab676SJeff Bonwick ddt_histogram_empty(const ddt_histogram_t *ddh) 432b24ab676SJeff Bonwick { 433b24ab676SJeff Bonwick const uint64_t *s = (const uint64_t *)ddh; 434b24ab676SJeff Bonwick const uint64_t *s_end = (const uint64_t *)(ddh + 1); 435b24ab676SJeff Bonwick 436b24ab676SJeff Bonwick while (s < s_end) 437b24ab676SJeff Bonwick if (*s++ != 0) 438b24ab676SJeff Bonwick return (B_FALSE); 439b24ab676SJeff Bonwick 440b24ab676SJeff Bonwick return (B_TRUE); 441b24ab676SJeff Bonwick } 442b24ab676SJeff Bonwick 4439eb19f4dSGeorge Wilson void 44430f608a4SGeorge Wilson ddt_get_dedup_object_stats(spa_t *spa, ddt_object_t *ddo_total) 445b24ab676SJeff Bonwick { 44630f608a4SGeorge Wilson /* Sum the statistics we cached in ddt_object_sync(). */ 447b24ab676SJeff Bonwick for (enum zio_checksum c = 0; c < ZIO_CHECKSUM_FUNCTIONS; c++) { 448b24ab676SJeff Bonwick ddt_t *ddt = spa->spa_ddt[c]; 449b24ab676SJeff Bonwick for (enum ddt_type type = 0; type < DDT_TYPES; type++) { 450b24ab676SJeff Bonwick for (enum ddt_class class = 0; class < DDT_CLASSES; 451b24ab676SJeff Bonwick class++) { 45230f608a4SGeorge Wilson ddt_object_t *ddo = 45330f608a4SGeorge Wilson &ddt->ddt_object_stats[type][class]; 45430f608a4SGeorge Wilson ddo_total->ddo_count += ddo->ddo_count; 45530f608a4SGeorge Wilson ddo_total->ddo_dspace += ddo->ddo_dspace; 45630f608a4SGeorge Wilson ddo_total->ddo_mspace += ddo->ddo_mspace; 45730f608a4SGeorge Wilson } 45830f608a4SGeorge Wilson } 45930f608a4SGeorge Wilson } 4609eb19f4dSGeorge Wilson 46130f608a4SGeorge Wilson /* ... and compute the averages. */ 46230f608a4SGeorge Wilson if (ddo_total->ddo_count != 0) { 46330f608a4SGeorge Wilson ddo_total->ddo_dspace /= ddo_total->ddo_count; 46430f608a4SGeorge Wilson ddo_total->ddo_mspace /= ddo_total->ddo_count; 465b24ab676SJeff Bonwick } 466b24ab676SJeff Bonwick } 467b24ab676SJeff Bonwick 4689eb19f4dSGeorge Wilson void 4699eb19f4dSGeorge Wilson ddt_get_dedup_histogram(spa_t *spa, ddt_histogram_t *ddh) 4709eb19f4dSGeorge Wilson { 4719eb19f4dSGeorge Wilson for (enum zio_checksum c = 0; c < ZIO_CHECKSUM_FUNCTIONS; c++) { 4729eb19f4dSGeorge Wilson ddt_t *ddt = spa->spa_ddt[c]; 4739eb19f4dSGeorge Wilson for (enum ddt_type type = 0; type < DDT_TYPES; type++) { 4749eb19f4dSGeorge Wilson for (enum ddt_class class = 0; class < DDT_CLASSES; 4759eb19f4dSGeorge Wilson class++) { 4769eb19f4dSGeorge Wilson ddt_histogram_add(ddh, 47730f608a4SGeorge Wilson &ddt->ddt_histogram_cache[type][class]); 4789eb19f4dSGeorge Wilson } 4799eb19f4dSGeorge Wilson } 4809eb19f4dSGeorge Wilson } 4819eb19f4dSGeorge Wilson } 4829eb19f4dSGeorge Wilson 4839eb19f4dSGeorge Wilson void 4849eb19f4dSGeorge Wilson ddt_get_dedup_stats(spa_t *spa, ddt_stat_t *dds_total) 4859eb19f4dSGeorge Wilson { 4869eb19f4dSGeorge Wilson ddt_histogram_t *ddh_total; 4879eb19f4dSGeorge Wilson 4889eb19f4dSGeorge Wilson ddh_total = kmem_zalloc(sizeof (ddt_histogram_t), KM_SLEEP); 4899eb19f4dSGeorge Wilson ddt_get_dedup_histogram(spa, ddh_total); 4909eb19f4dSGeorge Wilson ddt_histogram_stat(dds_total, ddh_total); 4919eb19f4dSGeorge Wilson kmem_free(ddh_total, sizeof (ddt_histogram_t)); 492485bbbf5SGeorge Wilson } 493b24ab676SJeff Bonwick 494485bbbf5SGeorge Wilson uint64_t 495485bbbf5SGeorge Wilson ddt_get_dedup_dspace(spa_t *spa) 496485bbbf5SGeorge Wilson { 497485bbbf5SGeorge Wilson ddt_stat_t dds_total = { 0 }; 498485bbbf5SGeorge Wilson 499485bbbf5SGeorge Wilson ddt_get_dedup_stats(spa, &dds_total); 500485bbbf5SGeorge Wilson return (dds_total.dds_ref_dsize - dds_total.dds_dsize); 501485bbbf5SGeorge Wilson } 502485bbbf5SGeorge Wilson 503485bbbf5SGeorge Wilson uint64_t 504485bbbf5SGeorge Wilson ddt_get_pool_dedup_ratio(spa_t *spa) 505485bbbf5SGeorge Wilson { 506485bbbf5SGeorge Wilson ddt_stat_t dds_total = { 0 }; 507485bbbf5SGeorge Wilson 508485bbbf5SGeorge Wilson ddt_get_dedup_stats(spa, &dds_total); 509b24ab676SJeff Bonwick if (dds_total.dds_dsize == 0) 510b24ab676SJeff Bonwick return (100); 511b24ab676SJeff Bonwick 512b24ab676SJeff Bonwick return (dds_total.dds_ref_dsize * 100 / dds_total.dds_dsize); 513b24ab676SJeff Bonwick } 514b24ab676SJeff Bonwick 515b24ab676SJeff Bonwick int 516b24ab676SJeff Bonwick ddt_ditto_copies_needed(ddt_t *ddt, ddt_entry_t *dde, ddt_phys_t *ddp_willref) 517b24ab676SJeff Bonwick { 518b24ab676SJeff Bonwick spa_t *spa = ddt->ddt_spa; 519b24ab676SJeff Bonwick uint64_t total_refcnt = 0; 520b24ab676SJeff Bonwick uint64_t ditto = spa->spa_dedup_ditto; 521b24ab676SJeff Bonwick int total_copies = 0; 522b24ab676SJeff Bonwick int desired_copies = 0; 523b24ab676SJeff Bonwick 524b24ab676SJeff Bonwick for (int p = DDT_PHYS_SINGLE; p <= DDT_PHYS_TRIPLE; p++) { 525b24ab676SJeff Bonwick ddt_phys_t *ddp = &dde->dde_phys[p]; 526b24ab676SJeff Bonwick zio_t *zio = dde->dde_lead_zio[p]; 527b24ab676SJeff Bonwick uint64_t refcnt = ddp->ddp_refcnt; /* committed refs */ 528b24ab676SJeff Bonwick if (zio != NULL) 529b24ab676SJeff Bonwick refcnt += zio->io_parent_count; /* pending refs */ 530b24ab676SJeff Bonwick if (ddp == ddp_willref) 531b24ab676SJeff Bonwick refcnt++; /* caller's ref */ 532b24ab676SJeff Bonwick if (refcnt != 0) { 533b24ab676SJeff Bonwick total_refcnt += refcnt; 534b24ab676SJeff Bonwick total_copies += p; 535b24ab676SJeff Bonwick } 536b24ab676SJeff Bonwick } 537b24ab676SJeff Bonwick 538b24ab676SJeff Bonwick if (ditto == 0 || ditto > UINT32_MAX) 539b24ab676SJeff Bonwick ditto = UINT32_MAX; 540b24ab676SJeff Bonwick 541b24ab676SJeff Bonwick if (total_refcnt >= 1) 542b24ab676SJeff Bonwick desired_copies++; 543b24ab676SJeff Bonwick if (total_refcnt >= ditto) 544b24ab676SJeff Bonwick desired_copies++; 545b24ab676SJeff Bonwick if (total_refcnt >= ditto * ditto) 546b24ab676SJeff Bonwick desired_copies++; 547b24ab676SJeff Bonwick 548b24ab676SJeff Bonwick return (MAX(desired_copies, total_copies) - total_copies); 549b24ab676SJeff Bonwick } 550b24ab676SJeff Bonwick 551b24ab676SJeff Bonwick int 552b24ab676SJeff Bonwick ddt_ditto_copies_present(ddt_entry_t *dde) 553b24ab676SJeff Bonwick { 554b24ab676SJeff Bonwick ddt_phys_t *ddp = &dde->dde_phys[DDT_PHYS_DITTO]; 555b24ab676SJeff Bonwick dva_t *dva = ddp->ddp_dva; 556b24ab676SJeff Bonwick int copies = 0 - DVA_GET_GANG(dva); 557b24ab676SJeff Bonwick 558b24ab676SJeff Bonwick for (int d = 0; d < SPA_DVAS_PER_BP; d++, dva++) 559b24ab676SJeff Bonwick if (DVA_IS_VALID(dva)) 560b24ab676SJeff Bonwick copies++; 561b24ab676SJeff Bonwick 562b24ab676SJeff Bonwick ASSERT(copies >= 0 && copies < SPA_DVAS_PER_BP); 563b24ab676SJeff Bonwick 564b24ab676SJeff Bonwick return (copies); 565b24ab676SJeff Bonwick } 566b24ab676SJeff Bonwick 567b24ab676SJeff Bonwick size_t 568b24ab676SJeff Bonwick ddt_compress(void *src, uchar_t *dst, size_t s_len, size_t d_len) 569b24ab676SJeff Bonwick { 570b24ab676SJeff Bonwick uchar_t *version = dst++; 571b24ab676SJeff Bonwick int cpfunc = ZIO_COMPRESS_ZLE; 572b24ab676SJeff Bonwick zio_compress_info_t *ci = &zio_compress_table[cpfunc]; 573b24ab676SJeff Bonwick size_t c_len; 574b24ab676SJeff Bonwick 575b24ab676SJeff Bonwick ASSERT(d_len >= s_len + 1); /* no compression plus version byte */ 576b24ab676SJeff Bonwick 577b24ab676SJeff Bonwick c_len = ci->ci_compress(src, dst, s_len, d_len - 1, ci->ci_level); 578b24ab676SJeff Bonwick 579b24ab676SJeff Bonwick if (c_len == s_len) { 580b24ab676SJeff Bonwick cpfunc = ZIO_COMPRESS_OFF; 581b24ab676SJeff Bonwick bcopy(src, dst, s_len); 582b24ab676SJeff Bonwick } 583b24ab676SJeff Bonwick 58443466aaeSMax Grossman *version = cpfunc; 58543466aaeSMax Grossman /* CONSTCOND */ 58643466aaeSMax Grossman if (ZFS_HOST_BYTEORDER) 58743466aaeSMax Grossman *version |= DDT_COMPRESS_BYTEORDER_MASK; 588b24ab676SJeff Bonwick 589b24ab676SJeff Bonwick return (c_len + 1); 590b24ab676SJeff Bonwick } 591b24ab676SJeff Bonwick 592b24ab676SJeff Bonwick void 593b24ab676SJeff Bonwick ddt_decompress(uchar_t *src, void *dst, size_t s_len, size_t d_len) 594b24ab676SJeff Bonwick { 595b24ab676SJeff Bonwick uchar_t version = *src++; 596b24ab676SJeff Bonwick int cpfunc = version & DDT_COMPRESS_FUNCTION_MASK; 597b24ab676SJeff Bonwick zio_compress_info_t *ci = &zio_compress_table[cpfunc]; 598b24ab676SJeff Bonwick 599b24ab676SJeff Bonwick if (ci->ci_decompress != NULL) 600b24ab676SJeff Bonwick (void) ci->ci_decompress(src, dst, s_len, d_len, ci->ci_level); 601b24ab676SJeff Bonwick else 602b24ab676SJeff Bonwick bcopy(src, dst, d_len); 603b24ab676SJeff Bonwick 60443466aaeSMax Grossman if (((version & DDT_COMPRESS_BYTEORDER_MASK) != 0) != 60543466aaeSMax Grossman (ZFS_HOST_BYTEORDER != 0)) 606b24ab676SJeff Bonwick byteswap_uint64_array(dst, d_len); 607b24ab676SJeff Bonwick } 608b24ab676SJeff Bonwick 609b24ab676SJeff Bonwick ddt_t * 610b24ab676SJeff Bonwick ddt_select_by_checksum(spa_t *spa, enum zio_checksum c) 611b24ab676SJeff Bonwick { 612b24ab676SJeff Bonwick return (spa->spa_ddt[c]); 613b24ab676SJeff Bonwick } 614b24ab676SJeff Bonwick 615b24ab676SJeff Bonwick ddt_t * 616b24ab676SJeff Bonwick ddt_select(spa_t *spa, const blkptr_t *bp) 617b24ab676SJeff Bonwick { 618b24ab676SJeff Bonwick return (spa->spa_ddt[BP_GET_CHECKSUM(bp)]); 619b24ab676SJeff Bonwick } 620b24ab676SJeff Bonwick 621b24ab676SJeff Bonwick void 622b24ab676SJeff Bonwick ddt_enter(ddt_t *ddt) 623b24ab676SJeff Bonwick { 624b24ab676SJeff Bonwick mutex_enter(&ddt->ddt_lock); 625b24ab676SJeff Bonwick } 626b24ab676SJeff Bonwick 627b24ab676SJeff Bonwick void 628b24ab676SJeff Bonwick ddt_exit(ddt_t *ddt) 629b24ab676SJeff Bonwick { 630b24ab676SJeff Bonwick mutex_exit(&ddt->ddt_lock); 631b24ab676SJeff Bonwick } 632b24ab676SJeff Bonwick 633b24ab676SJeff Bonwick static ddt_entry_t * 634b24ab676SJeff Bonwick ddt_alloc(const ddt_key_t *ddk) 635b24ab676SJeff Bonwick { 636b24ab676SJeff Bonwick ddt_entry_t *dde; 637b24ab676SJeff Bonwick 638b24ab676SJeff Bonwick dde = kmem_zalloc(sizeof (ddt_entry_t), KM_SLEEP); 639b24ab676SJeff Bonwick cv_init(&dde->dde_cv, NULL, CV_DEFAULT, NULL); 640b24ab676SJeff Bonwick 641b24ab676SJeff Bonwick dde->dde_key = *ddk; 642b24ab676SJeff Bonwick 643b24ab676SJeff Bonwick return (dde); 644b24ab676SJeff Bonwick } 645b24ab676SJeff Bonwick 646b24ab676SJeff Bonwick static void 647b24ab676SJeff Bonwick ddt_free(ddt_entry_t *dde) 648b24ab676SJeff Bonwick { 649b24ab676SJeff Bonwick ASSERT(!dde->dde_loading); 650b24ab676SJeff Bonwick 651b24ab676SJeff Bonwick for (int p = 0; p < DDT_PHYS_TYPES; p++) 652b24ab676SJeff Bonwick ASSERT(dde->dde_lead_zio[p] == NULL); 653b24ab676SJeff Bonwick 654b24ab676SJeff Bonwick if (dde->dde_repair_data != NULL) 655b24ab676SJeff Bonwick zio_buf_free(dde->dde_repair_data, 656b24ab676SJeff Bonwick DDK_GET_PSIZE(&dde->dde_key)); 657b24ab676SJeff Bonwick 658b24ab676SJeff Bonwick cv_destroy(&dde->dde_cv); 659b24ab676SJeff Bonwick kmem_free(dde, sizeof (*dde)); 660b24ab676SJeff Bonwick } 661b24ab676SJeff Bonwick 662b24ab676SJeff Bonwick void 663b24ab676SJeff Bonwick ddt_remove(ddt_t *ddt, ddt_entry_t *dde) 664b24ab676SJeff Bonwick { 665b24ab676SJeff Bonwick ASSERT(MUTEX_HELD(&ddt->ddt_lock)); 666b24ab676SJeff Bonwick 667b24ab676SJeff Bonwick avl_remove(&ddt->ddt_tree, dde); 668b24ab676SJeff Bonwick ddt_free(dde); 669b24ab676SJeff Bonwick } 670b24ab676SJeff Bonwick 671b24ab676SJeff Bonwick ddt_entry_t * 672b24ab676SJeff Bonwick ddt_lookup(ddt_t *ddt, const blkptr_t *bp, boolean_t add) 673b24ab676SJeff Bonwick { 674b24ab676SJeff Bonwick ddt_entry_t *dde, dde_search; 675b24ab676SJeff Bonwick enum ddt_type type; 676b24ab676SJeff Bonwick enum ddt_class class; 677b24ab676SJeff Bonwick avl_index_t where; 678b24ab676SJeff Bonwick int error; 679b24ab676SJeff Bonwick 680b24ab676SJeff Bonwick ASSERT(MUTEX_HELD(&ddt->ddt_lock)); 681b24ab676SJeff Bonwick 682b24ab676SJeff Bonwick ddt_key_fill(&dde_search.dde_key, bp); 683b24ab676SJeff Bonwick 684b24ab676SJeff Bonwick dde = avl_find(&ddt->ddt_tree, &dde_search, &where); 685b24ab676SJeff Bonwick if (dde == NULL) { 686b24ab676SJeff Bonwick if (!add) 687b24ab676SJeff Bonwick return (NULL); 688b24ab676SJeff Bonwick dde = ddt_alloc(&dde_search.dde_key); 689b24ab676SJeff Bonwick avl_insert(&ddt->ddt_tree, dde, where); 690b24ab676SJeff Bonwick } 691b24ab676SJeff Bonwick 692b24ab676SJeff Bonwick while (dde->dde_loading) 693b24ab676SJeff Bonwick cv_wait(&dde->dde_cv, &ddt->ddt_lock); 694b24ab676SJeff Bonwick 695b24ab676SJeff Bonwick if (dde->dde_loaded) 696b24ab676SJeff Bonwick return (dde); 697b24ab676SJeff Bonwick 698b24ab676SJeff Bonwick dde->dde_loading = B_TRUE; 699b24ab676SJeff Bonwick 700b24ab676SJeff Bonwick ddt_exit(ddt); 701b24ab676SJeff Bonwick 702b24ab676SJeff Bonwick error = ENOENT; 703b24ab676SJeff Bonwick 704b24ab676SJeff Bonwick for (type = 0; type < DDT_TYPES; type++) { 705b24ab676SJeff Bonwick for (class = 0; class < DDT_CLASSES; class++) { 706b24ab676SJeff Bonwick error = ddt_object_lookup(ddt, type, class, dde); 707b24ab676SJeff Bonwick if (error != ENOENT) 708b24ab676SJeff Bonwick break; 709b24ab676SJeff Bonwick } 710b24ab676SJeff Bonwick if (error != ENOENT) 711b24ab676SJeff Bonwick break; 712b24ab676SJeff Bonwick } 713b24ab676SJeff Bonwick 714b24ab676SJeff Bonwick ASSERT(error == 0 || error == ENOENT); 715b24ab676SJeff Bonwick 716b24ab676SJeff Bonwick ddt_enter(ddt); 717b24ab676SJeff Bonwick 718b24ab676SJeff Bonwick ASSERT(dde->dde_loaded == B_FALSE); 719b24ab676SJeff Bonwick ASSERT(dde->dde_loading == B_TRUE); 720b24ab676SJeff Bonwick 721b24ab676SJeff Bonwick dde->dde_type = type; /* will be DDT_TYPES if no entry found */ 722b24ab676SJeff Bonwick dde->dde_class = class; /* will be DDT_CLASSES if no entry found */ 723b24ab676SJeff Bonwick dde->dde_loaded = B_TRUE; 724b24ab676SJeff Bonwick dde->dde_loading = B_FALSE; 725b24ab676SJeff Bonwick 726b24ab676SJeff Bonwick if (error == 0) 727b24ab676SJeff Bonwick ddt_stat_update(ddt, dde, -1ULL); 728b24ab676SJeff Bonwick 729b24ab676SJeff Bonwick cv_broadcast(&dde->dde_cv); 730b24ab676SJeff Bonwick 731b24ab676SJeff Bonwick return (dde); 732b24ab676SJeff Bonwick } 733b24ab676SJeff Bonwick 734c7cd2421SGeorge Wilson void 735c7cd2421SGeorge Wilson ddt_prefetch(spa_t *spa, const blkptr_t *bp) 736c7cd2421SGeorge Wilson { 737c7cd2421SGeorge Wilson ddt_t *ddt; 738c7cd2421SGeorge Wilson ddt_entry_t dde; 739c7cd2421SGeorge Wilson 740837b568bSGeorge Wilson if (!zfs_dedup_prefetch || bp == NULL || !BP_GET_DEDUP(bp)) 741c7cd2421SGeorge Wilson return; 742c7cd2421SGeorge Wilson 743c7cd2421SGeorge Wilson /* 744ce053c9dSGeorge Wilson * We only remove the DDT once all tables are empty and only 745ce053c9dSGeorge Wilson * prefetch dedup blocks when there are entries in the DDT. 746ce053c9dSGeorge Wilson * Thus no locking is required as the DDT can't disappear on us. 747c7cd2421SGeorge Wilson */ 748c7cd2421SGeorge Wilson ddt = ddt_select(spa, bp); 749c7cd2421SGeorge Wilson ddt_key_fill(&dde.dde_key, bp); 750c7cd2421SGeorge Wilson 751c7cd2421SGeorge Wilson for (enum ddt_type type = 0; type < DDT_TYPES; type++) { 752c7cd2421SGeorge Wilson for (enum ddt_class class = 0; class < DDT_CLASSES; class++) { 753c7cd2421SGeorge Wilson ddt_object_prefetch(ddt, type, class, &dde); 754c7cd2421SGeorge Wilson } 755c7cd2421SGeorge Wilson } 756c7cd2421SGeorge Wilson } 757c7cd2421SGeorge Wilson 758b24ab676SJeff Bonwick int 759b24ab676SJeff Bonwick ddt_entry_compare(const void *x1, const void *x2) 760b24ab676SJeff Bonwick { 761b24ab676SJeff Bonwick const ddt_entry_t *dde1 = x1; 762b24ab676SJeff Bonwick const ddt_entry_t *dde2 = x2; 763b24ab676SJeff Bonwick const uint64_t *u1 = (const uint64_t *)&dde1->dde_key; 764b24ab676SJeff Bonwick const uint64_t *u2 = (const uint64_t *)&dde2->dde_key; 765b24ab676SJeff Bonwick 766b24ab676SJeff Bonwick for (int i = 0; i < DDT_KEY_WORDS; i++) { 767b24ab676SJeff Bonwick if (u1[i] < u2[i]) 768b24ab676SJeff Bonwick return (-1); 769b24ab676SJeff Bonwick if (u1[i] > u2[i]) 770b24ab676SJeff Bonwick return (1); 771b24ab676SJeff Bonwick } 772b24ab676SJeff Bonwick 773b24ab676SJeff Bonwick return (0); 774b24ab676SJeff Bonwick } 775b24ab676SJeff Bonwick 776b24ab676SJeff Bonwick static ddt_t * 777b24ab676SJeff Bonwick ddt_table_alloc(spa_t *spa, enum zio_checksum c) 778b24ab676SJeff Bonwick { 779b24ab676SJeff Bonwick ddt_t *ddt; 780b24ab676SJeff Bonwick 781b24ab676SJeff Bonwick ddt = kmem_zalloc(sizeof (*ddt), KM_SLEEP); 782b24ab676SJeff Bonwick 783b24ab676SJeff Bonwick mutex_init(&ddt->ddt_lock, NULL, MUTEX_DEFAULT, NULL); 784b24ab676SJeff Bonwick avl_create(&ddt->ddt_tree, ddt_entry_compare, 785b24ab676SJeff Bonwick sizeof (ddt_entry_t), offsetof(ddt_entry_t, dde_node)); 786b24ab676SJeff Bonwick avl_create(&ddt->ddt_repair_tree, ddt_entry_compare, 787b24ab676SJeff Bonwick sizeof (ddt_entry_t), offsetof(ddt_entry_t, dde_node)); 788b24ab676SJeff Bonwick ddt->ddt_checksum = c; 789b24ab676SJeff Bonwick ddt->ddt_spa = spa; 790b24ab676SJeff Bonwick ddt->ddt_os = spa->spa_meta_objset; 791b24ab676SJeff Bonwick 792b24ab676SJeff Bonwick return (ddt); 793b24ab676SJeff Bonwick } 794b24ab676SJeff Bonwick 795b24ab676SJeff Bonwick static void 796b24ab676SJeff Bonwick ddt_table_free(ddt_t *ddt) 797b24ab676SJeff Bonwick { 798b24ab676SJeff Bonwick ASSERT(avl_numnodes(&ddt->ddt_tree) == 0); 799b24ab676SJeff Bonwick ASSERT(avl_numnodes(&ddt->ddt_repair_tree) == 0); 800b24ab676SJeff Bonwick avl_destroy(&ddt->ddt_tree); 801b24ab676SJeff Bonwick avl_destroy(&ddt->ddt_repair_tree); 802b24ab676SJeff Bonwick mutex_destroy(&ddt->ddt_lock); 803b24ab676SJeff Bonwick kmem_free(ddt, sizeof (*ddt)); 804b24ab676SJeff Bonwick } 805b24ab676SJeff Bonwick 806b24ab676SJeff Bonwick void 807b24ab676SJeff Bonwick ddt_create(spa_t *spa) 808b24ab676SJeff Bonwick { 809b24ab676SJeff Bonwick spa->spa_dedup_checksum = ZIO_DEDUPCHECKSUM; 810b24ab676SJeff Bonwick 811b24ab676SJeff Bonwick for (enum zio_checksum c = 0; c < ZIO_CHECKSUM_FUNCTIONS; c++) 812b24ab676SJeff Bonwick spa->spa_ddt[c] = ddt_table_alloc(spa, c); 813b24ab676SJeff Bonwick } 814b24ab676SJeff Bonwick 815b24ab676SJeff Bonwick int 816b24ab676SJeff Bonwick ddt_load(spa_t *spa) 817b24ab676SJeff Bonwick { 818b24ab676SJeff Bonwick int error; 819b24ab676SJeff Bonwick 820b24ab676SJeff Bonwick ddt_create(spa); 821b24ab676SJeff Bonwick 822b24ab676SJeff Bonwick error = zap_lookup(spa->spa_meta_objset, DMU_POOL_DIRECTORY_OBJECT, 823b24ab676SJeff Bonwick DMU_POOL_DDT_STATS, sizeof (uint64_t), 1, 824b24ab676SJeff Bonwick &spa->spa_ddt_stat_object); 825b24ab676SJeff Bonwick 826b24ab676SJeff Bonwick if (error) 827b24ab676SJeff Bonwick return (error == ENOENT ? 0 : error); 828b24ab676SJeff Bonwick 829b24ab676SJeff Bonwick for (enum zio_checksum c = 0; c < ZIO_CHECKSUM_FUNCTIONS; c++) { 83030f608a4SGeorge Wilson ddt_t *ddt = spa->spa_ddt[c]; 831b24ab676SJeff Bonwick for (enum ddt_type type = 0; type < DDT_TYPES; type++) { 832b24ab676SJeff Bonwick for (enum ddt_class class = 0; class < DDT_CLASSES; 833b24ab676SJeff Bonwick class++) { 834b24ab676SJeff Bonwick error = ddt_object_load(ddt, type, class); 835b24ab676SJeff Bonwick if (error != 0 && error != ENOENT) 836b24ab676SJeff Bonwick return (error); 837b24ab676SJeff Bonwick } 838b24ab676SJeff Bonwick } 83930f608a4SGeorge Wilson 84030f608a4SGeorge Wilson /* 84130f608a4SGeorge Wilson * Seed the cached histograms. 84230f608a4SGeorge Wilson */ 84330f608a4SGeorge Wilson bcopy(ddt->ddt_histogram, &ddt->ddt_histogram_cache, 84430f608a4SGeorge Wilson sizeof (ddt->ddt_histogram)); 845b24ab676SJeff Bonwick } 846b24ab676SJeff Bonwick 847b24ab676SJeff Bonwick return (0); 848b24ab676SJeff Bonwick } 849b24ab676SJeff Bonwick 850b24ab676SJeff Bonwick void 851b24ab676SJeff Bonwick ddt_unload(spa_t *spa) 852b24ab676SJeff Bonwick { 853b24ab676SJeff Bonwick for (enum zio_checksum c = 0; c < ZIO_CHECKSUM_FUNCTIONS; c++) { 854b24ab676SJeff Bonwick if (spa->spa_ddt[c]) { 855b24ab676SJeff Bonwick ddt_table_free(spa->spa_ddt[c]); 856b24ab676SJeff Bonwick spa->spa_ddt[c] = NULL; 857b24ab676SJeff Bonwick } 858b24ab676SJeff Bonwick } 859b24ab676SJeff Bonwick } 860b24ab676SJeff Bonwick 861bbfd46c4SJeff Bonwick boolean_t 862bbfd46c4SJeff Bonwick ddt_class_contains(spa_t *spa, enum ddt_class max_class, const blkptr_t *bp) 863bbfd46c4SJeff Bonwick { 864bbfd46c4SJeff Bonwick ddt_t *ddt; 865bbfd46c4SJeff Bonwick ddt_entry_t dde; 866bbfd46c4SJeff Bonwick 867bbfd46c4SJeff Bonwick if (!BP_GET_DEDUP(bp)) 868bbfd46c4SJeff Bonwick return (B_FALSE); 869bbfd46c4SJeff Bonwick 870bbfd46c4SJeff Bonwick if (max_class == DDT_CLASS_UNIQUE) 871bbfd46c4SJeff Bonwick return (B_TRUE); 872bbfd46c4SJeff Bonwick 873bbfd46c4SJeff Bonwick ddt = spa->spa_ddt[BP_GET_CHECKSUM(bp)]; 874bbfd46c4SJeff Bonwick 875bbfd46c4SJeff Bonwick ddt_key_fill(&dde.dde_key, bp); 876bbfd46c4SJeff Bonwick 877bbfd46c4SJeff Bonwick for (enum ddt_type type = 0; type < DDT_TYPES; type++) 878bbfd46c4SJeff Bonwick for (enum ddt_class class = 0; class <= max_class; class++) 879bbfd46c4SJeff Bonwick if (ddt_object_lookup(ddt, type, class, &dde) == 0) 880bbfd46c4SJeff Bonwick return (B_TRUE); 881bbfd46c4SJeff Bonwick 882bbfd46c4SJeff Bonwick return (B_FALSE); 883bbfd46c4SJeff Bonwick } 884bbfd46c4SJeff Bonwick 885b24ab676SJeff Bonwick ddt_entry_t * 886b24ab676SJeff Bonwick ddt_repair_start(ddt_t *ddt, const blkptr_t *bp) 887b24ab676SJeff Bonwick { 888b24ab676SJeff Bonwick ddt_key_t ddk; 889b24ab676SJeff Bonwick ddt_entry_t *dde; 890b24ab676SJeff Bonwick 891b24ab676SJeff Bonwick ddt_key_fill(&ddk, bp); 892b24ab676SJeff Bonwick 893b24ab676SJeff Bonwick dde = ddt_alloc(&ddk); 894b24ab676SJeff Bonwick 895b24ab676SJeff Bonwick for (enum ddt_type type = 0; type < DDT_TYPES; type++) { 896b24ab676SJeff Bonwick for (enum ddt_class class = 0; class < DDT_CLASSES; class++) { 897b24ab676SJeff Bonwick /* 898b24ab676SJeff Bonwick * We can only do repair if there are multiple copies 899b24ab676SJeff Bonwick * of the block. For anything in the UNIQUE class, 900b24ab676SJeff Bonwick * there's definitely only one copy, so don't even try. 901b24ab676SJeff Bonwick */ 902b24ab676SJeff Bonwick if (class != DDT_CLASS_UNIQUE && 903b24ab676SJeff Bonwick ddt_object_lookup(ddt, type, class, dde) == 0) 904b24ab676SJeff Bonwick return (dde); 905b24ab676SJeff Bonwick } 906b24ab676SJeff Bonwick } 907b24ab676SJeff Bonwick 908b24ab676SJeff Bonwick bzero(dde->dde_phys, sizeof (dde->dde_phys)); 909b24ab676SJeff Bonwick 910b24ab676SJeff Bonwick return (dde); 911b24ab676SJeff Bonwick } 912b24ab676SJeff Bonwick 913b24ab676SJeff Bonwick void 914b24ab676SJeff Bonwick ddt_repair_done(ddt_t *ddt, ddt_entry_t *dde) 915b24ab676SJeff Bonwick { 916b24ab676SJeff Bonwick avl_index_t where; 917b24ab676SJeff Bonwick 918b24ab676SJeff Bonwick ddt_enter(ddt); 919b24ab676SJeff Bonwick 920b24ab676SJeff Bonwick if (dde->dde_repair_data != NULL && spa_writeable(ddt->ddt_spa) && 921b24ab676SJeff Bonwick avl_find(&ddt->ddt_repair_tree, dde, &where) == NULL) 922b24ab676SJeff Bonwick avl_insert(&ddt->ddt_repair_tree, dde, where); 923b24ab676SJeff Bonwick else 924b24ab676SJeff Bonwick ddt_free(dde); 925b24ab676SJeff Bonwick 926b24ab676SJeff Bonwick ddt_exit(ddt); 927b24ab676SJeff Bonwick } 928b24ab676SJeff Bonwick 929b24ab676SJeff Bonwick static void 930b24ab676SJeff Bonwick ddt_repair_entry_done(zio_t *zio) 931b24ab676SJeff Bonwick { 932b24ab676SJeff Bonwick ddt_entry_t *rdde = zio->io_private; 933b24ab676SJeff Bonwick 934b24ab676SJeff Bonwick ddt_free(rdde); 935b24ab676SJeff Bonwick } 936b24ab676SJeff Bonwick 937b24ab676SJeff Bonwick static void 938b24ab676SJeff Bonwick ddt_repair_entry(ddt_t *ddt, ddt_entry_t *dde, ddt_entry_t *rdde, zio_t *rio) 939b24ab676SJeff Bonwick { 940b24ab676SJeff Bonwick ddt_phys_t *ddp = dde->dde_phys; 941b24ab676SJeff Bonwick ddt_phys_t *rddp = rdde->dde_phys; 942b24ab676SJeff Bonwick ddt_key_t *ddk = &dde->dde_key; 943b24ab676SJeff Bonwick ddt_key_t *rddk = &rdde->dde_key; 944b24ab676SJeff Bonwick zio_t *zio; 945b24ab676SJeff Bonwick blkptr_t blk; 946b24ab676SJeff Bonwick 947b24ab676SJeff Bonwick zio = zio_null(rio, rio->io_spa, NULL, 948b24ab676SJeff Bonwick ddt_repair_entry_done, rdde, rio->io_flags); 949b24ab676SJeff Bonwick 950b24ab676SJeff Bonwick for (int p = 0; p < DDT_PHYS_TYPES; p++, ddp++, rddp++) { 951b24ab676SJeff Bonwick if (ddp->ddp_phys_birth == 0 || 952b24ab676SJeff Bonwick ddp->ddp_phys_birth != rddp->ddp_phys_birth || 953b24ab676SJeff Bonwick bcmp(ddp->ddp_dva, rddp->ddp_dva, sizeof (ddp->ddp_dva))) 954b24ab676SJeff Bonwick continue; 955bbfd46c4SJeff Bonwick ddt_bp_create(ddt->ddt_checksum, ddk, ddp, &blk); 956b24ab676SJeff Bonwick zio_nowait(zio_rewrite(zio, zio->io_spa, 0, &blk, 957b24ab676SJeff Bonwick rdde->dde_repair_data, DDK_GET_PSIZE(rddk), NULL, NULL, 958b24ab676SJeff Bonwick ZIO_PRIORITY_SYNC_WRITE, ZIO_DDT_CHILD_FLAGS(zio), NULL)); 959b24ab676SJeff Bonwick } 960b24ab676SJeff Bonwick 961b24ab676SJeff Bonwick zio_nowait(zio); 962b24ab676SJeff Bonwick } 963b24ab676SJeff Bonwick 964b24ab676SJeff Bonwick static void 965b24ab676SJeff Bonwick ddt_repair_table(ddt_t *ddt, zio_t *rio) 966b24ab676SJeff Bonwick { 967b24ab676SJeff Bonwick spa_t *spa = ddt->ddt_spa; 968b24ab676SJeff Bonwick ddt_entry_t *dde, *rdde_next, *rdde; 969b24ab676SJeff Bonwick avl_tree_t *t = &ddt->ddt_repair_tree; 970b24ab676SJeff Bonwick blkptr_t blk; 971b24ab676SJeff Bonwick 972b24ab676SJeff Bonwick if (spa_sync_pass(spa) > 1) 973b24ab676SJeff Bonwick return; 974b24ab676SJeff Bonwick 975b24ab676SJeff Bonwick ddt_enter(ddt); 976b24ab676SJeff Bonwick for (rdde = avl_first(t); rdde != NULL; rdde = rdde_next) { 977b24ab676SJeff Bonwick rdde_next = AVL_NEXT(t, rdde); 978b24ab676SJeff Bonwick avl_remove(&ddt->ddt_repair_tree, rdde); 979b24ab676SJeff Bonwick ddt_exit(ddt); 980bbfd46c4SJeff Bonwick ddt_bp_create(ddt->ddt_checksum, &rdde->dde_key, NULL, &blk); 981b24ab676SJeff Bonwick dde = ddt_repair_start(ddt, &blk); 982b24ab676SJeff Bonwick ddt_repair_entry(ddt, dde, rdde, rio); 983b24ab676SJeff Bonwick ddt_repair_done(ddt, dde); 984b24ab676SJeff Bonwick ddt_enter(ddt); 985b24ab676SJeff Bonwick } 986b24ab676SJeff Bonwick ddt_exit(ddt); 987b24ab676SJeff Bonwick } 988b24ab676SJeff Bonwick 989b24ab676SJeff Bonwick static void 990b24ab676SJeff Bonwick ddt_sync_entry(ddt_t *ddt, ddt_entry_t *dde, dmu_tx_t *tx, uint64_t txg) 991b24ab676SJeff Bonwick { 992bbfd46c4SJeff Bonwick dsl_pool_t *dp = ddt->ddt_spa->spa_dsl_pool; 993b24ab676SJeff Bonwick ddt_phys_t *ddp = dde->dde_phys; 994b24ab676SJeff Bonwick ddt_key_t *ddk = &dde->dde_key; 995b24ab676SJeff Bonwick enum ddt_type otype = dde->dde_type; 996b24ab676SJeff Bonwick enum ddt_type ntype = DDT_TYPE_CURRENT; 997b24ab676SJeff Bonwick enum ddt_class oclass = dde->dde_class; 998b24ab676SJeff Bonwick enum ddt_class nclass; 999b24ab676SJeff Bonwick uint64_t total_refcnt = 0; 1000b24ab676SJeff Bonwick 1001b24ab676SJeff Bonwick ASSERT(dde->dde_loaded); 1002b24ab676SJeff Bonwick ASSERT(!dde->dde_loading); 1003b24ab676SJeff Bonwick 1004b24ab676SJeff Bonwick for (int p = 0; p < DDT_PHYS_TYPES; p++, ddp++) { 1005b24ab676SJeff Bonwick ASSERT(dde->dde_lead_zio[p] == NULL); 1006b24ab676SJeff Bonwick ASSERT((int64_t)ddp->ddp_refcnt >= 0); 1007b24ab676SJeff Bonwick if (ddp->ddp_phys_birth == 0) { 1008b24ab676SJeff Bonwick ASSERT(ddp->ddp_refcnt == 0); 1009b24ab676SJeff Bonwick continue; 1010b24ab676SJeff Bonwick } 1011b24ab676SJeff Bonwick if (p == DDT_PHYS_DITTO) { 1012b24ab676SJeff Bonwick if (ddt_ditto_copies_needed(ddt, dde, NULL) == 0) 1013b24ab676SJeff Bonwick ddt_phys_free(ddt, ddk, ddp, txg); 1014b24ab676SJeff Bonwick continue; 1015b24ab676SJeff Bonwick } 1016b24ab676SJeff Bonwick if (ddp->ddp_refcnt == 0) 1017b24ab676SJeff Bonwick ddt_phys_free(ddt, ddk, ddp, txg); 1018b24ab676SJeff Bonwick total_refcnt += ddp->ddp_refcnt; 1019b24ab676SJeff Bonwick } 1020b24ab676SJeff Bonwick 1021b24ab676SJeff Bonwick if (dde->dde_phys[DDT_PHYS_DITTO].ddp_phys_birth != 0) 1022b24ab676SJeff Bonwick nclass = DDT_CLASS_DITTO; 1023b24ab676SJeff Bonwick else if (total_refcnt > 1) 1024b24ab676SJeff Bonwick nclass = DDT_CLASS_DUPLICATE; 1025b24ab676SJeff Bonwick else 1026b24ab676SJeff Bonwick nclass = DDT_CLASS_UNIQUE; 1027b24ab676SJeff Bonwick 1028b24ab676SJeff Bonwick if (otype != DDT_TYPES && 1029b24ab676SJeff Bonwick (otype != ntype || oclass != nclass || total_refcnt == 0)) { 1030b24ab676SJeff Bonwick VERIFY(ddt_object_remove(ddt, otype, oclass, dde, tx) == 0); 1031b24ab676SJeff Bonwick ASSERT(ddt_object_lookup(ddt, otype, oclass, dde) == ENOENT); 1032b24ab676SJeff Bonwick } 1033b24ab676SJeff Bonwick 1034b24ab676SJeff Bonwick if (total_refcnt != 0) { 1035b24ab676SJeff Bonwick dde->dde_type = ntype; 1036b24ab676SJeff Bonwick dde->dde_class = nclass; 1037b24ab676SJeff Bonwick ddt_stat_update(ddt, dde, 0); 1038b24ab676SJeff Bonwick if (!ddt_object_exists(ddt, ntype, nclass)) 1039b24ab676SJeff Bonwick ddt_object_create(ddt, ntype, nclass, tx); 1040b24ab676SJeff Bonwick VERIFY(ddt_object_update(ddt, ntype, nclass, dde, tx) == 0); 1041bbfd46c4SJeff Bonwick 10423f9d6ad7SLin Ling /* 10433f9d6ad7SLin Ling * If the class changes, the order that we scan this bp 10443f9d6ad7SLin Ling * changes. If it decreases, we could miss it, so 10453f9d6ad7SLin Ling * scan it right now. (This covers both class changing 10463f9d6ad7SLin Ling * while we are doing ddt_walk(), and when we are 10473f9d6ad7SLin Ling * traversing.) 10483f9d6ad7SLin Ling */ 10493f9d6ad7SLin Ling if (nclass < oclass) { 10503f9d6ad7SLin Ling dsl_scan_ddt_entry(dp->dp_scan, 10513f9d6ad7SLin Ling ddt->ddt_checksum, dde, tx); 10523f9d6ad7SLin Ling } 1053b24ab676SJeff Bonwick } 1054b24ab676SJeff Bonwick } 1055b24ab676SJeff Bonwick 1056b24ab676SJeff Bonwick static void 1057b24ab676SJeff Bonwick ddt_sync_table(ddt_t *ddt, dmu_tx_t *tx, uint64_t txg) 1058b24ab676SJeff Bonwick { 1059b24ab676SJeff Bonwick spa_t *spa = ddt->ddt_spa; 1060b24ab676SJeff Bonwick ddt_entry_t *dde; 1061b24ab676SJeff Bonwick void *cookie = NULL; 1062b24ab676SJeff Bonwick 1063b24ab676SJeff Bonwick if (avl_numnodes(&ddt->ddt_tree) == 0) 1064b24ab676SJeff Bonwick return; 1065b24ab676SJeff Bonwick 1066b24ab676SJeff Bonwick ASSERT(spa->spa_uberblock.ub_version >= SPA_VERSION_DEDUP); 1067b24ab676SJeff Bonwick 1068b24ab676SJeff Bonwick if (spa->spa_ddt_stat_object == 0) { 1069ad135b5dSChristopher Siden spa->spa_ddt_stat_object = zap_create_link(ddt->ddt_os, 1070ad135b5dSChristopher Siden DMU_OT_DDT_STATS, DMU_POOL_DIRECTORY_OBJECT, 1071ad135b5dSChristopher Siden DMU_POOL_DDT_STATS, tx); 1072b24ab676SJeff Bonwick } 1073b24ab676SJeff Bonwick 1074b24ab676SJeff Bonwick while ((dde = avl_destroy_nodes(&ddt->ddt_tree, &cookie)) != NULL) { 1075b24ab676SJeff Bonwick ddt_sync_entry(ddt, dde, tx, txg); 1076b24ab676SJeff Bonwick ddt_free(dde); 1077b24ab676SJeff Bonwick } 1078b24ab676SJeff Bonwick 1079b24ab676SJeff Bonwick for (enum ddt_type type = 0; type < DDT_TYPES; type++) { 1080ce053c9dSGeorge Wilson uint64_t count = 0; 1081b24ab676SJeff Bonwick for (enum ddt_class class = 0; class < DDT_CLASSES; class++) { 1082ce053c9dSGeorge Wilson if (ddt_object_exists(ddt, type, class)) { 1083b24ab676SJeff Bonwick ddt_object_sync(ddt, type, class, tx); 1084ce053c9dSGeorge Wilson count += ddt_object_count(ddt, type, class); 1085ce053c9dSGeorge Wilson } 1086ce053c9dSGeorge Wilson } 1087ce053c9dSGeorge Wilson for (enum ddt_class class = 0; class < DDT_CLASSES; class++) { 1088ce053c9dSGeorge Wilson if (count == 0 && ddt_object_exists(ddt, type, class)) 1089b24ab676SJeff Bonwick ddt_object_destroy(ddt, type, class, tx); 1090b24ab676SJeff Bonwick } 1091b24ab676SJeff Bonwick } 109230f608a4SGeorge Wilson 109330f608a4SGeorge Wilson bcopy(ddt->ddt_histogram, &ddt->ddt_histogram_cache, 109430f608a4SGeorge Wilson sizeof (ddt->ddt_histogram)); 1095b24ab676SJeff Bonwick } 1096b24ab676SJeff Bonwick 1097b24ab676SJeff Bonwick void 1098b24ab676SJeff Bonwick ddt_sync(spa_t *spa, uint64_t txg) 1099b24ab676SJeff Bonwick { 1100b24ab676SJeff Bonwick dmu_tx_t *tx; 1101b24ab676SJeff Bonwick zio_t *rio = zio_root(spa, NULL, NULL, 1102b24ab676SJeff Bonwick ZIO_FLAG_CANFAIL | ZIO_FLAG_SPECULATIVE); 1103b24ab676SJeff Bonwick 1104b24ab676SJeff Bonwick ASSERT(spa_syncing_txg(spa) == txg); 1105b24ab676SJeff Bonwick 1106b24ab676SJeff Bonwick tx = dmu_tx_create_assigned(spa->spa_dsl_pool, txg); 1107b24ab676SJeff Bonwick 1108b24ab676SJeff Bonwick for (enum zio_checksum c = 0; c < ZIO_CHECKSUM_FUNCTIONS; c++) { 1109b24ab676SJeff Bonwick ddt_t *ddt = spa->spa_ddt[c]; 1110b24ab676SJeff Bonwick if (ddt == NULL) 1111b24ab676SJeff Bonwick continue; 1112b24ab676SJeff Bonwick ddt_sync_table(ddt, tx, txg); 1113b24ab676SJeff Bonwick ddt_repair_table(ddt, rio); 1114b24ab676SJeff Bonwick } 1115b24ab676SJeff Bonwick 1116b24ab676SJeff Bonwick (void) zio_wait(rio); 1117b24ab676SJeff Bonwick 1118b24ab676SJeff Bonwick dmu_tx_commit(tx); 1119b24ab676SJeff Bonwick } 1120bbfd46c4SJeff Bonwick 1121bbfd46c4SJeff Bonwick int 1122bbfd46c4SJeff Bonwick ddt_walk(spa_t *spa, ddt_bookmark_t *ddb, ddt_entry_t *dde) 1123bbfd46c4SJeff Bonwick { 1124bbfd46c4SJeff Bonwick do { 1125bbfd46c4SJeff Bonwick do { 1126bbfd46c4SJeff Bonwick do { 1127bbfd46c4SJeff Bonwick ddt_t *ddt = spa->spa_ddt[ddb->ddb_checksum]; 1128bbfd46c4SJeff Bonwick int error = ENOENT; 1129bbfd46c4SJeff Bonwick if (ddt_object_exists(ddt, ddb->ddb_type, 1130bbfd46c4SJeff Bonwick ddb->ddb_class)) { 1131bbfd46c4SJeff Bonwick error = ddt_object_walk(ddt, 1132bbfd46c4SJeff Bonwick ddb->ddb_type, ddb->ddb_class, 1133bbfd46c4SJeff Bonwick &ddb->ddb_cursor, dde); 1134bbfd46c4SJeff Bonwick } 11353f9d6ad7SLin Ling dde->dde_type = ddb->ddb_type; 11363f9d6ad7SLin Ling dde->dde_class = ddb->ddb_class; 1137bbfd46c4SJeff Bonwick if (error == 0) 1138bbfd46c4SJeff Bonwick return (0); 1139bbfd46c4SJeff Bonwick if (error != ENOENT) 1140bbfd46c4SJeff Bonwick return (error); 1141bbfd46c4SJeff Bonwick ddb->ddb_cursor = 0; 1142bbfd46c4SJeff Bonwick } while (++ddb->ddb_checksum < ZIO_CHECKSUM_FUNCTIONS); 1143bbfd46c4SJeff Bonwick ddb->ddb_checksum = 0; 1144bbfd46c4SJeff Bonwick } while (++ddb->ddb_type < DDT_TYPES); 1145bbfd46c4SJeff Bonwick ddb->ddb_type = 0; 1146bbfd46c4SJeff Bonwick } while (++ddb->ddb_class < DDT_CLASSES); 1147bbfd46c4SJeff Bonwick 1148be6fd75aSMatthew Ahrens return (SET_ERROR(ENOENT)); 1149bbfd46c4SJeff Bonwick } 1150