1 /*
2  * CDDL HEADER START
3  *
4  * The contents of this file are subject to the terms of the
5  * Common Development and Distribution License (the "License").
6  * You may not use this file except in compliance with the License.
7  *
8  * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
9  * or http://www.opensolaris.org/os/licensing.
10  * See the License for the specific language governing permissions
11  * and limitations under the License.
12  *
13  * When distributing Covered Code, include this CDDL HEADER in each
14  * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
15  * If applicable, add the following below this CDDL HEADER, with the
16  * fields enclosed by brackets "[]" replaced with your own identifying
17  * information: Portions Copyright [yyyy] [name of copyright owner]
18  *
19  * CDDL HEADER END
20  */
21 /*
22  * Copyright (c) 2009, 2010, Oracle and/or its affiliates. All rights reserved.
23  */
24 
25 #ifndef _SYS_DDT_H
26 #define   _SYS_DDT_H
27 
28 #include <sys/sysmacros.h>
29 #include <sys/types.h>
30 #include <sys/fs/zfs.h>
31 #include <sys/zio.h>
32 #include <sys/dmu.h>
33 
34 #ifdef    __cplusplus
35 extern "C" {
36 #endif
37 
/*
 * On-disk DDT formats, in the desired search order (newest version first).
 *
 * DDT_TYPES is not a format.  It is the enumerator that follows the last
 * format, so its value is the number of formats; struct ddt uses it as the
 * first dimension of its per-type arrays.
 */
enum ddt_type {
	DDT_TYPE_ZAP = 0,
	DDT_TYPES
};
45 
/*
 * DDT classes, in the desired search order (highest replication level first).
 *
 * DDT_CLASSES is not a class.  It is the enumerator that follows the last
 * class, so its value is the number of classes; struct ddt uses it as the
 * second dimension of its per-class arrays.
 */
enum ddt_class {
	DDT_CLASS_DITTO = 0,
	DDT_CLASS_DUPLICATE,
	DDT_CLASS_UNIQUE,
	DDT_CLASSES
};
55 
/*
 * Numerically equal to DDT_TYPE_ZAP, the only format in enum ddt_type.
 * NOTE(review): presumably the format used when a new DDT object is
 * created; confirm against the callers.
 */
#define	DDT_TYPE_CURRENT		0

/*
 * Complementary masks that split a single byte: bit 7 carries a byte-order
 * flag and bits 0-6 carry a compression function.
 * NOTE(review): presumably applied to a header byte written by
 * ddt_compress() and read back by ddt_decompress(); confirm in the
 * implementation.
 */
#define	DDT_COMPRESS_BYTEORDER_MASK	0x80
#define	DDT_COMPRESS_FUNCTION_MASK	0x7f
60 
61 /*
62  * On-disk ddt entry:  key (name) and physical storage (value).
63  */
64 typedef struct ddt_key {
65           zio_cksum_t         ddk_cksum;          /* 256-bit block checksum */
66           /*
67            * Encoded with logical & physical size, and compression, as follows:
68            *   +-------+-------+-------+-------+-------+-------+-------+-------+
69            *   |   0   |   0   |   0   | comp  |     PSIZE     |     LSIZE     |
70            *   +-------+-------+-------+-------+-------+-------+-------+-------+
71            */
72           uint64_t  ddk_prop;
73 } ddt_key_t;
74 
/*
 * Accessors for the fields packed into ddk_prop.  `ddk' is a pointer to a
 * ddt_key_t; `x' is the new field value.
 *
 *	LSIZE		16 bits starting at bit 0
 *	PSIZE		16 bits starting at bit 16
 *	COMPRESS	 8 bits starting at bit 32
 *
 * The two size fields go through BF64_GET_SB()/BF64_SET_SB() with
 * SPA_MINBLOCKSHIFT and 1 as extra arguments.
 * NOTE(review): presumably those are a shift and a bias, i.e. sizes are
 * stored in units of (1 << SPA_MINBLOCKSHIFT) bytes, less one; confirm
 * against the BF64_* definitions, which live outside this header.
 */
#define	DDK_GET_LSIZE(ddk)	\
	BF64_GET_SB((ddk)->ddk_prop, 0, 16, SPA_MINBLOCKSHIFT, 1)
#define	DDK_SET_LSIZE(ddk, x)	\
	BF64_SET_SB((ddk)->ddk_prop, 0, 16, SPA_MINBLOCKSHIFT, 1, x)

#define	DDK_GET_PSIZE(ddk)	\
	BF64_GET_SB((ddk)->ddk_prop, 16, 16, SPA_MINBLOCKSHIFT, 1)
#define	DDK_SET_PSIZE(ddk, x)	\
	BF64_SET_SB((ddk)->ddk_prop, 16, 16, SPA_MINBLOCKSHIFT, 1, x)

#define	DDK_GET_COMPRESS(ddk)		BF64_GET((ddk)->ddk_prop, 32, 8)
#define	DDK_SET_COMPRESS(ddk, x)	BF64_SET((ddk)->ddk_prop, 32, 8, x)

/* Size of a ddt_key_t, counted in 64-bit words. */
#define	DDT_KEY_WORDS	(sizeof (ddt_key_t) / sizeof (uint64_t))
89 
90 typedef struct ddt_phys {
91           dva_t               ddp_dva[SPA_DVAS_PER_BP];
92           uint64_t  ddp_refcnt;
93           uint64_t  ddp_phys_birth;
94 } ddt_phys_t;
95 
/*
 * Index into the dde_phys[] and dde_lead_zio[] arrays of struct ddt_entry.
 *
 * DDT_PHYS_TYPES follows the last real value, so it equals the number of
 * slots and is used as the dimension of those arrays.
 * NOTE(review): SINGLE/DOUBLE/TRIPLE are numerically 1, 2 and 3, which
 * presumably matches the number of copies each slot describes; confirm
 * against the implementation before relying on that.
 */
enum ddt_phys_type {
	DDT_PHYS_DITTO = 0,
	DDT_PHYS_SINGLE = 1,
	DDT_PHYS_DOUBLE = 2,
	DDT_PHYS_TRIPLE = 3,
	DDT_PHYS_TYPES
};
103 
104 /*
105  * In-core ddt entry
106  */
107 struct ddt_entry {
108           ddt_key_t dde_key;
109           ddt_phys_t          dde_phys[DDT_PHYS_TYPES];
110           zio_t               *dde_lead_zio[DDT_PHYS_TYPES];
111           void                *dde_repair_data;
112           enum ddt_type       dde_type;
113           enum ddt_class      dde_class;
114           uint8_t             dde_loading;
115           uint8_t             dde_loaded;
116           kcondvar_t          dde_cv;
117           avl_node_t          dde_node;
118 };
119 
120 /*
121  * In-core ddt
122  */
123 struct ddt {
124           kmutex_t  ddt_lock;
125           avl_tree_t          ddt_tree;
126           avl_tree_t          ddt_repair_tree;
127           enum zio_checksum ddt_checksum;
128           spa_t               *ddt_spa;
129           objset_t  *ddt_os;
130           uint64_t  ddt_stat_object;
131           uint64_t  ddt_object[DDT_TYPES][DDT_CLASSES];
132           ddt_histogram_t     ddt_histogram[DDT_TYPES][DDT_CLASSES];
133           ddt_histogram_t     ddt_histogram_cache[DDT_TYPES][DDT_CLASSES];
134           ddt_object_t        ddt_object_stats[DDT_TYPES][DDT_CLASSES];
135           avl_node_t          ddt_node;
136 };
137 
/*
 * In-core and on-disk bookmark for DDT walks
 *
 * Four 64-bit words, passed by pointer to ddt_walk().  Every member,
 * including the class and type, is a plain uint64_t rather than an enum.
 * NOTE(review): presumably that keeps the layout fixed for the on-disk
 * copy; confirm.
 */
typedef struct ddt_bookmark {
	uint64_t	ddb_class;
	uint64_t	ddb_type;
	uint64_t	ddb_checksum;
	uint64_t	ddb_cursor;
} ddt_bookmark_t;
147 
148 /*
149  * Ops vector to access a specific DDT object type.
150  */
151 typedef struct ddt_ops {
152           char ddt_op_name[32];
153           int (*ddt_op_create)(objset_t *os, uint64_t *object, dmu_tx_t *tx,
154               boolean_t prehash);
155           int (*ddt_op_destroy)(objset_t *os, uint64_t object, dmu_tx_t *tx);
156           int (*ddt_op_lookup)(objset_t *os, uint64_t object, ddt_entry_t *dde);
157           void (*ddt_op_prefetch)(objset_t *os, uint64_t object,
158               ddt_entry_t *dde);
159           int (*ddt_op_update)(objset_t *os, uint64_t object, ddt_entry_t *dde,
160               dmu_tx_t *tx);
161           int (*ddt_op_remove)(objset_t *os, uint64_t object, ddt_entry_t *dde,
162               dmu_tx_t *tx);
163           int (*ddt_op_walk)(objset_t *os, uint64_t object, ddt_entry_t *dde,
164               uint64_t *walk);
165           int (*ddt_op_count)(objset_t *os, uint64_t object, uint64_t *count);
166 } ddt_ops_t;
167 
/*
 * NOTE(review): presumably the size, in bytes, of the buffer a caller must
 * pass as `name' to ddt_object_name(); confirm against the implementation.
 */
#define	DDT_NAMELEN	80
169 
170 extern void ddt_object_name(ddt_t *ddt, enum ddt_type type,
171     enum ddt_class cls, char *name);
172 extern int ddt_object_walk(ddt_t *ddt, enum ddt_type type,
173     enum ddt_class cls, uint64_t *walk, ddt_entry_t *dde);
174 extern int ddt_object_count(ddt_t *ddt, enum ddt_type type,
175     enum ddt_class cls, uint64_t *count);
176 extern int ddt_object_info(ddt_t *ddt, enum ddt_type type,
177     enum ddt_class cls, dmu_object_info_t *);
178 extern boolean_t ddt_object_exists(ddt_t *ddt, enum ddt_type type,
179     enum ddt_class cls);
180 
181 extern void ddt_bp_fill(const ddt_phys_t *ddp, blkptr_t *bp,
182     uint64_t txg);
183 extern void ddt_bp_create(enum zio_checksum checksum, const ddt_key_t *ddk,
184     const ddt_phys_t *ddp, blkptr_t *bp);
185 
186 extern void ddt_key_fill(ddt_key_t *ddk, const blkptr_t *bp);
187 
188 extern void ddt_phys_fill(ddt_phys_t *ddp, const blkptr_t *bp);
189 extern void ddt_phys_clear(ddt_phys_t *ddp);
190 extern void ddt_phys_addref(ddt_phys_t *ddp);
191 extern void ddt_phys_decref(ddt_phys_t *ddp);
192 extern void ddt_phys_free(ddt_t *ddt, ddt_key_t *ddk, ddt_phys_t *ddp,
193     uint64_t txg);
194 extern ddt_phys_t *ddt_phys_select(const ddt_entry_t *dde, const blkptr_t *bp);
195 extern uint64_t ddt_phys_total_refcnt(const ddt_entry_t *dde);
196 
197 extern void ddt_stat_add(ddt_stat_t *dst, const ddt_stat_t *src, uint64_t neg);
198 
199 extern void ddt_histogram_add(ddt_histogram_t *dst, const ddt_histogram_t *src);
200 extern void ddt_histogram_stat(ddt_stat_t *dds, const ddt_histogram_t *ddh);
201 extern boolean_t ddt_histogram_empty(const ddt_histogram_t *ddh);
202 extern void ddt_get_dedup_object_stats(spa_t *spa, ddt_object_t *ddo);
203 extern void ddt_get_dedup_histogram(spa_t *spa, ddt_histogram_t *ddh);
204 extern void ddt_get_dedup_stats(spa_t *spa, ddt_stat_t *dds_total);
205 
206 extern uint64_t ddt_get_dedup_dspace(spa_t *spa);
207 extern uint64_t ddt_get_pool_dedup_ratio(spa_t *spa);
208 
209 extern int ddt_ditto_copies_needed(ddt_t *ddt, ddt_entry_t *dde,
210     ddt_phys_t *ddp_willref);
211 extern int ddt_ditto_copies_present(ddt_entry_t *dde);
212 
213 extern size_t ddt_compress(void *src, uchar_t *dst, size_t s_len, size_t d_len);
214 extern void ddt_decompress(uchar_t *src, void *dst, size_t s_len, size_t d_len);
215 
216 extern ddt_t *ddt_select(spa_t *spa, const blkptr_t *bp);
217 extern void ddt_enter(ddt_t *ddt);
218 extern void ddt_exit(ddt_t *ddt);
219 extern ddt_entry_t *ddt_lookup(ddt_t *ddt, const blkptr_t *bp, boolean_t add);
220 extern void ddt_prefetch(spa_t *spa, const blkptr_t *bp);
221 extern void ddt_remove(ddt_t *ddt, ddt_entry_t *dde);
222 
223 extern boolean_t ddt_class_contains(spa_t *spa, enum ddt_class max_class,
224     const blkptr_t *bp);
225 
226 extern ddt_entry_t *ddt_repair_start(ddt_t *ddt, const blkptr_t *bp);
227 extern void ddt_repair_done(ddt_t *ddt, ddt_entry_t *dde);
228 
229 extern int ddt_entry_compare(const void *x1, const void *x2);
230 
231 extern void ddt_create(spa_t *spa);
232 extern int ddt_load(spa_t *spa);
233 extern void ddt_unload(spa_t *spa);
234 extern void ddt_sync(spa_t *spa, uint64_t txg);
235 extern int ddt_walk(spa_t *spa, ddt_bookmark_t *ddb, ddt_entry_t *dde);
236 extern int ddt_object_update(ddt_t *ddt, enum ddt_type type,
237     enum ddt_class cls, ddt_entry_t *dde, dmu_tx_t *tx);
238 
239 extern const ddt_ops_t ddt_zap_ops;
240 
241 #ifdef    __cplusplus
242 }
243 #endif
244 
245 #endif    /* _SYS_DDT_H */
246