Home | History | Annotate | Line # | Download | only in sys
      1 /*
      2  * CDDL HEADER START
      3  *
      4  * The contents of this file are subject to the terms of the
      5  * Common Development and Distribution License (the "License").
      6  * You may not use this file except in compliance with the License.
      7  *
      8  * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
      9  * or http://www.opensolaris.org/os/licensing.
     10  * See the License for the specific language governing permissions
     11  * and limitations under the License.
     12  *
     13  * When distributing Covered Code, include this CDDL HEADER in each
     14  * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
     15  * If applicable, add the following below this CDDL HEADER, with the
     16  * fields enclosed by brackets "[]" replaced with your own identifying
     17  * information: Portions Copyright [yyyy] [name of copyright owner]
     18  *
     19  * CDDL HEADER END
     20  */
     21 /*
     22  * Copyright (c) 2009, 2010, Oracle and/or its affiliates. All rights reserved.
     23  */
     24 
     25 #ifndef _SYS_DDT_H
     26 #define	_SYS_DDT_H
     27 
     28 #include <sys/sysmacros.h>
     29 #include <sys/types.h>
     30 #include <sys/fs/zfs.h>
     31 #include <sys/zio.h>
     32 #include <sys/dmu.h>
     33 
     34 #ifdef	__cplusplus
     35 extern "C" {
     36 #endif
     37 
     38 /*
     39  * On-disk DDT formats, in the desired search order (newest version first).
     40  */
     41 enum ddt_type {		/* values are used as the first index of the [DDT_TYPES][DDT_CLASSES] arrays in struct ddt */
     42 	DDT_TYPE_ZAP = 0,	/* only format listed here; same numeric value as DDT_TYPE_CURRENT */
     43 	DDT_TYPES		/* sentinel, not a format: evaluates to the number of formats (1) */
     44 };
     45 
     46 /*
     47  * DDT classes, in the desired search order (highest replication level first).
     48  */
     49 enum ddt_class {		/* values are used as the second index of the [DDT_TYPES][DDT_CLASSES] arrays in struct ddt */
     50 	DDT_CLASS_DITTO = 0,	/* first in the search order */
     51 	DDT_CLASS_DUPLICATE,	/* implicitly 1 */
     52 	DDT_CLASS_UNIQUE,	/* implicitly 2; last in the search order */
     53 	DDT_CLASSES		/* sentinel, not a class: evaluates to the number of classes (3) */
     54 };
     55 
     56 #define	DDT_TYPE_CURRENT		0	/* numerically equal to DDT_TYPE_ZAP; NOTE(review): presumably the type used for new entries -- confirm in ddt.c */
     57 
     58 #define	DDT_COMPRESS_BYTEORDER_MASK	0x80	/* top bit of one byte; NOTE(review): presumably a header byte handled by ddt_compress() and ddt_decompress() -- confirm */
     59 #define	DDT_COMPRESS_FUNCTION_MASK	0x7f	/* remaining low 7 bits of the same byte (bitwise complement of 0x80 within 8 bits) */
     60 
     61 /*
     62  * On-disk ddt entry:  key (name) and physical storage (value).
     63  */
     64 typedef struct ddt_key {
     65 	zio_cksum_t	ddk_cksum;	/* 256-bit block checksum */
     66 	/*
     67 	 * Encoded with logical & physical size, and compression, as follows
     68 	 * (eight cells for a 64-bit word, so one cell per byte; low-order bytes on the right):
     69 	 *   +-------+-------+-------+-------+-------+-------+-------+-------+
     70 	 *   |   0   |   0   |   0   | comp  |     PSIZE     |     LSIZE     |
     71 	 *   +-------+-------+-------+-------+-------+-------+-------+-------+
     72 	 * The DDK_GET_xxx and DDK_SET_xxx macros use offsets 0, 16 and 32 for LSIZE, PSIZE and comp.
     73 	 */
     72 	uint64_t	ddk_prop;	/* packed properties; read and written through the DDK_GET_xxx and DDK_SET_xxx macros */
     73 } ddt_key_t;
     74 
     75 #define	DDK_GET_LSIZE(ddk)	\
     76 	BF64_GET_SB((ddk)->ddk_prop, 0, 16, SPA_MINBLOCKSHIFT, 1)	/* ddk is a pointer to ddt_key_t; reads the LSIZE field. NOTE(review): BF64_GET_SB is defined elsewhere; arguments are presumably (word, low bit, width, shift, bias) -- confirm */
     77 #define	DDK_SET_LSIZE(ddk, x)	\
     78 	BF64_SET_SB((ddk)->ddk_prop, 0, 16, SPA_MINBLOCKSHIFT, 1, x)	/* stores x into the LSIZE field using the same offset, width, shift and bias arguments as the getter */
     79 
     80 #define	DDK_GET_PSIZE(ddk)	\
     81 	BF64_GET_SB((ddk)->ddk_prop, 16, 16, SPA_MINBLOCKSHIFT, 1)	/* ddk is a pointer to ddt_key_t; reads the PSIZE field, which sits 16 bits above LSIZE with the same width, shift and bias arguments */
     82 #define	DDK_SET_PSIZE(ddk, x)	\
     83 	BF64_SET_SB((ddk)->ddk_prop, 16, 16, SPA_MINBLOCKSHIFT, 1, x)	/* stores x into the PSIZE field using the same arguments as the getter */
     84 
     85 #define	DDK_GET_COMPRESS(ddk)		BF64_GET((ddk)->ddk_prop, 32, 8)	/* reads the 8-bit comp field at offset 32; plain BF64_GET, so no shift or bias arguments */
     86 #define	DDK_SET_COMPRESS(ddk, x)	BF64_SET((ddk)->ddk_prop, 32, 8, x)	/* stores x into the comp field at the same offset and width */
     87 
     88 #define	DDT_KEY_WORDS	(sizeof (ddt_key_t) / sizeof (uint64_t))	/* size of ddt_key_t expressed in 64-bit words */
     89 
     90 typedef struct ddt_phys {	/* one element of dde_phys[] in struct ddt_entry */
     91 	dva_t		ddp_dva[SPA_DVAS_PER_BP];	/* SPA_DVAS_PER_BP DVA slots; NOTE(review): presumably copied to and from a blkptr_t by ddt_phys_fill() and ddt_bp_fill() -- confirm */
     92 	uint64_t	ddp_refcnt;	/* 64-bit reference count; NOTE(review): presumably adjusted by ddt_phys_addref() and ddt_phys_decref() -- confirm */
     93 	uint64_t	ddp_phys_birth;	/* NOTE(review): by its name a physical birth txg -- confirm against ddt.c */
     94 } ddt_phys_t;
     95 
     96 enum ddt_phys_type {	/* values fall in the index range of dde_phys[] and dde_lead_zio[] in struct ddt_entry */
     97 	DDT_PHYS_DITTO = 0,
     98 	DDT_PHYS_SINGLE = 1,	/* NOTE(review): SINGLE, DOUBLE and TRIPLE are numbered 1 to 3, presumably the copy count -- confirm */
     99 	DDT_PHYS_DOUBLE = 2,
    100 	DDT_PHYS_TRIPLE = 3,
    101 	DDT_PHYS_TYPES	/* sentinel (4): array dimension of dde_phys[] and dde_lead_zio[] */
    102 };
    103 
    104 /*
    105  * In-core ddt entry
    106  */
    107 struct ddt_entry {	/* the prototypes in this header refer to this struct as ddt_entry_t; that typedef is not in this header */
    108 	ddt_key_t	dde_key;	/* key part of the entry (checksum plus packed size and compression properties) */
    109 	ddt_phys_t	dde_phys[DDT_PHYS_TYPES];	/* one ddt_phys_t for each enum ddt_phys_type value */
    110 	zio_t		*dde_lead_zio[DDT_PHYS_TYPES];	/* one zio pointer for each enum ddt_phys_type value; NOTE(review): role of the "lead" zio is not visible here */
    111 	void		*dde_repair_data;	/* untyped pointer; NOTE(review): presumably a buffer used between ddt_repair_start() and ddt_repair_done() -- confirm */
    112 	enum ddt_type	dde_type;	/* on-disk format of this entry */
    113 	enum ddt_class	dde_class;	/* class of this entry */
    114 	uint8_t		dde_loading;	/* 8-bit field; NOTE(review): presumably a flag set while a load is in progress -- confirm */
    115 	uint8_t		dde_loaded;	/* 8-bit field; NOTE(review): presumably a flag set once loading finished -- confirm */
    116 	kcondvar_t	dde_cv;	/* condition variable; NOTE(review): presumably paired with ddt_lock in struct ddt -- confirm */
    117 	avl_node_t	dde_node;	/* AVL linkage; NOTE(review): presumably for ddt_tree or ddt_repair_tree in struct ddt -- confirm */
    118 };
    119 
    120 /*
    121  * In-core ddt
    122  */
    123 struct ddt {	/* the prototypes in this header refer to this struct as ddt_t; that typedef is not in this header */
    124 	kmutex_t	ddt_lock;	/* mutex; NOTE(review): presumably acquired by ddt_enter() and released by ddt_exit() -- confirm */
    125 	avl_tree_t	ddt_tree;	/* AVL tree; NOTE(review): presumably holds ddt_entry structures ordered by ddt_entry_compare() -- confirm */
    126 	avl_tree_t	ddt_repair_tree;	/* second AVL tree; NOTE(review): presumably for entries handled by ddt_repair_start() and ddt_repair_done() -- confirm */
    127 	enum zio_checksum ddt_checksum;	/* a zio checksum enumerator; NOTE(review): presumably the checksum function this table serves -- confirm */
    128 	spa_t		*ddt_spa;	/* pointer to the spa_t this table is attached to */
    129 	objset_t	*ddt_os;	/* object set pointer; the ddt_ops_t callbacks all take an objset_t pointer first */
    130 	uint64_t	ddt_stat_object;	/* 64-bit value; NOTE(review): by its name an object number for stored statistics -- confirm */
    131 	uint64_t	ddt_object[DDT_TYPES][DDT_CLASSES];	/* one 64-bit value per (type, class) pair; the ddt_ops_t callbacks take a uint64_t object */
    132 	ddt_histogram_t	ddt_histogram[DDT_TYPES][DDT_CLASSES];	/* one histogram per (type, class) pair */
    133 	ddt_histogram_t	ddt_histogram_cache[DDT_TYPES][DDT_CLASSES];	/* same shape as ddt_histogram; NOTE(review): caching policy is not visible here */
    134 	ddt_object_t	ddt_object_stats[DDT_TYPES][DDT_CLASSES];	/* one ddt_object_t per (type, class) pair */
    135 	avl_node_t	ddt_node;	/* AVL linkage for the table itself; the owning tree is not visible in this header */
    136 };
    137 
    138 /*
    139  * In-core and on-disk bookmark for DDT walks
    140  */
    141 typedef struct ddt_bookmark {	/* four 64-bit words; passed by pointer to ddt_walk() */
    142 	uint64_t	ddb_class;	/* NOTE(review): presumably an enum ddt_class value stored as 64 bits -- confirm */
    143 	uint64_t	ddb_type;	/* NOTE(review): presumably an enum ddt_type value stored as 64 bits -- confirm */
    144 	uint64_t	ddb_checksum;	/* NOTE(review): presumably an enum zio_checksum value stored as 64 bits -- confirm */
    145 	uint64_t	ddb_cursor;	/* NOTE(review): presumably the walk position handed to ddt_object_walk() -- confirm */
    146 } ddt_bookmark_t;
    147 
    148 /*
    149  * Ops vector to access a specific DDT object type.
    150  */
    151 typedef struct ddt_ops {	/* every callback takes the object set first, then a 64-bit object (by pointer for create) */
    152 	char ddt_op_name[32];	/* fixed 32-byte name buffer */
    153 	int (*ddt_op_create)(objset_t *os, uint64_t *object, dmu_tx_t *tx,
    154 	    boolean_t prehash);	/* object is a non-const pointer; NOTE(review): presumably receives the new object number -- confirm */
    155 	int (*ddt_op_destroy)(objset_t *os, uint64_t object, dmu_tx_t *tx);	/* takes the object by value plus a transaction */
    156 	int (*ddt_op_lookup)(objset_t *os, uint64_t object, ddt_entry_t *dde);	/* dde is non-const; NOTE(review): presumably filled in on success -- confirm */
    157 	void (*ddt_op_prefetch)(objset_t *os, uint64_t object,
    158 	    ddt_entry_t *dde);	/* returns nothing, so no status is reported to the caller */
    159 	int (*ddt_op_update)(objset_t *os, uint64_t object, ddt_entry_t *dde,
    160 	    dmu_tx_t *tx);	/* takes a transaction, like create, destroy and remove */
    161 	int (*ddt_op_remove)(objset_t *os, uint64_t object, ddt_entry_t *dde,
    162 	    dmu_tx_t *tx);	/* same parameter list as ddt_op_update */
    163 	int (*ddt_op_walk)(objset_t *os, uint64_t object, ddt_entry_t *dde,
    164 	    uint64_t *walk);	/* walk is a non-const pointer; NOTE(review): presumably an in/out cursor -- confirm */
    165 	int (*ddt_op_count)(objset_t *os, uint64_t object, uint64_t *count);	/* int return plus a count pointer; NOTE(review): presumably status and result respectively -- confirm */
    166 } ddt_ops_t;
    167 
    168 #define	DDT_NAMELEN	80	/* NOTE(review): presumably the buffer size callers pass as name to ddt_object_name() -- confirm */
    169 
    170 extern void ddt_object_name(ddt_t *ddt, enum ddt_type type,
    171     enum ddt_class cls, char *name);	/* name is a non-const buffer with no length parameter; NOTE(review): presumably DDT_NAMELEN bytes -- confirm */
    172 extern int ddt_object_walk(ddt_t *ddt, enum ddt_type type,
    173     enum ddt_class cls, uint64_t *walk, ddt_entry_t *dde);	/* same walk and dde parameters as ddt_op_walk in ddt_ops_t, in the opposite order */
    174 extern int ddt_object_count(ddt_t *ddt, enum ddt_type type,
    175     enum ddt_class cls, uint64_t *count);	/* int return plus a count pointer, mirroring ddt_op_count in ddt_ops_t */
    176 extern int ddt_object_info(ddt_t *ddt, enum ddt_type type,
    177     enum ddt_class cls, dmu_object_info_t *);	/* the last parameter is unnamed in this prototype */
    178 extern boolean_t ddt_object_exists(ddt_t *ddt, enum ddt_type type,
    179     enum ddt_class cls);	/* boolean query for one (type, class) pair */
    180 
    181 extern void ddt_bp_fill(const ddt_phys_t *ddp, blkptr_t *bp,
    182     uint64_t txg);	/* ddp is read-only and bp is writable, so bp is the output */
    183 extern void ddt_bp_create(enum zio_checksum checksum, const ddt_key_t *ddk,
    184     const ddt_phys_t *ddp, blkptr_t *bp);	/* ddk and ddp are read-only inputs; bp is the only writable argument */
    185 
    186 extern void ddt_key_fill(ddt_key_t *ddk, const blkptr_t *bp);	/* bp is read-only; ddk is the writable output */
    187 
    188 extern void ddt_phys_fill(ddt_phys_t *ddp, const blkptr_t *bp);	/* bp is read-only; ddp is the writable output */
    189 extern void ddt_phys_clear(ddt_phys_t *ddp);	/* takes a writable ddp only */
    190 extern void ddt_phys_addref(ddt_phys_t *ddp);	/* NOTE(review): presumably increments ddp_refcnt -- confirm */
    191 extern void ddt_phys_decref(ddt_phys_t *ddp);	/* NOTE(review): presumably decrements ddp_refcnt -- confirm */
    192 extern void ddt_phys_free(ddt_t *ddt, ddt_key_t *ddk, ddt_phys_t *ddp,
    193     uint64_t txg);	/* all three pointers are non-const; what is released is not visible in this header */
    194 extern ddt_phys_t *ddt_phys_select(const ddt_entry_t *dde, const blkptr_t *bp);	/* returns a non-const ddt_phys_t pointer from const inputs; NOTE(review): NULL behaviour is not visible here */
    195 extern uint64_t ddt_phys_total_refcnt(const ddt_entry_t *dde);	/* read-only on dde; NOTE(review): presumably sums ddp_refcnt over dde_phys[] -- confirm */
    196 
    197 extern void ddt_stat_add(ddt_stat_t *dst, const ddt_stat_t *src, uint64_t neg);	/* src is read-only and dst is updated; NOTE(review): neg presumably selects subtraction -- confirm */
    198 
    199 extern void ddt_histogram_add(ddt_histogram_t *dst, const ddt_histogram_t *src);	/* src is read-only; dst is updated */
    200 extern void ddt_histogram_stat(ddt_stat_t *dds, const ddt_histogram_t *ddh);	/* ddh is read-only; dds is the output */
    201 extern boolean_t ddt_histogram_empty(const ddt_histogram_t *ddh);	/* read-only boolean query */
    202 extern void ddt_get_dedup_object_stats(spa_t *spa, ddt_object_t *ddo);	/* void return, so the result goes out through ddo */
    203 extern void ddt_get_dedup_histogram(spa_t *spa, ddt_histogram_t *ddh);	/* void return, so the result goes out through ddh */
    204 extern void ddt_get_dedup_stats(spa_t *spa, ddt_stat_t *dds_total);	/* void return, so the result goes out through dds_total */
    205 
    206 extern uint64_t ddt_get_dedup_dspace(spa_t *spa);	/* returns a 64-bit value for the pool; units are not visible in this header */
    207 extern uint64_t ddt_get_pool_dedup_ratio(spa_t *spa);	/* returns the ratio as a 64-bit integer; NOTE(review): scaling factor is not visible here -- confirm */
    208 
    209 extern int ddt_ditto_copies_needed(ddt_t *ddt, ddt_entry_t *dde,
    210     ddt_phys_t *ddp_willref);	/* returns an int copy count by its name; NOTE(review): whether ddp_willref may be NULL is not visible here */
    211 extern int ddt_ditto_copies_present(ddt_entry_t *dde);	/* returns an int copy count by its name */
    212 
    213 extern size_t ddt_compress(void *src, uchar_t *dst, size_t s_len, size_t d_len);	/* returns a size_t; NOTE(review): presumably the number of bytes written to dst -- confirm */
    214 extern void ddt_decompress(uchar_t *src, void *dst, size_t s_len, size_t d_len);	/* pointer types are swapped relative to ddt_compress; returns nothing */
    215 
    216 extern ddt_t *ddt_select(spa_t *spa, const blkptr_t *bp);	/* returns the ddt_t to use for bp; bp is read-only */
    217 extern void ddt_enter(ddt_t *ddt);	/* NOTE(review): presumably acquires ddt_lock -- confirm */
    218 extern void ddt_exit(ddt_t *ddt);	/* NOTE(review): presumably releases ddt_lock -- confirm */
    219 extern ddt_entry_t *ddt_lookup(ddt_t *ddt, const blkptr_t *bp, boolean_t add);	/* NOTE(review): add presumably asks for a missing entry to be created -- confirm */
    220 extern void ddt_prefetch(spa_t *spa, const blkptr_t *bp);	/* takes the pool rather than a ddt_t; returns nothing */
    221 extern void ddt_remove(ddt_t *ddt, ddt_entry_t *dde);	/* NOTE(review): who frees dde is not visible in this header */
    222 
    223 extern boolean_t ddt_class_contains(spa_t *spa, enum ddt_class max_class,
    224     const blkptr_t *bp);	/* NOTE(review): presumably checks classes up to and including max_class -- confirm */
    225 
    226 extern ddt_entry_t *ddt_repair_start(ddt_t *ddt, const blkptr_t *bp);	/* returns an entry that is later passed to ddt_repair_done() */
    227 extern void ddt_repair_done(ddt_t *ddt, ddt_entry_t *dde);	/* counterpart of ddt_repair_start() */
    228 
    229 extern int ddt_entry_compare(const void *x1, const void *x2);	/* untyped two-argument comparator signature, the shape an AVL tree comparison callback takes */
    230 
    231 extern void ddt_create(spa_t *spa);	/* per-pool entry point; returns nothing */
    232 extern int ddt_load(spa_t *spa);	/* the only one of create, load and unload that returns an int status */
    233 extern void ddt_unload(spa_t *spa);	/* per-pool entry point; returns nothing */
    234 extern void ddt_sync(spa_t *spa, uint64_t txg);	/* takes the pool and a transaction group number */
    235 extern int ddt_walk(spa_t *spa, ddt_bookmark_t *ddb, ddt_entry_t *dde);	/* ddb is non-const; NOTE(review): presumably advanced as the walk proceeds -- confirm */
    236 extern int ddt_object_update(ddt_t *ddt, enum ddt_type type,
    237     enum ddt_class cls, ddt_entry_t *dde, dmu_tx_t *tx);	/* same (ddt, type, cls) leading parameters as the other ddt_object_xxx functions */
    238 
    239 extern const ddt_ops_t ddt_zap_ops;	/* read-only ops vector defined in another file; NOTE(review): presumably the implementation behind DDT_TYPE_ZAP -- confirm */
    240 
    241 #ifdef	__cplusplus
    242 }
    243 #endif
    244 
    245 #endif	/* _SYS_DDT_H */
    246