/*
 * CDDL HEADER START
 *
 * The contents of this file are subject to the terms of the
 * Common Development and Distribution License (the "License").
 * You may not use this file except in compliance with the License.
 *
 * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
 * or http://www.opensolaris.org/os/licensing.
 * See the License for the specific language governing permissions
 * and limitations under the License.
 *
 * When distributing Covered Code, include this CDDL HEADER in each
 * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
 * If applicable, add the following below this CDDL HEADER, with the
 * fields enclosed by brackets "[]" replaced with your own identifying
 * information: Portions Copyright [yyyy] [name of copyright owner]
 *
 * CDDL HEADER END
 */
/*
 * Copyright (c) 2009, 2010, Oracle and/or its affiliates. All rights reserved.
 */
24 | |
25 | #ifndef _SYS_DDT_H |
26 | #define _SYS_DDT_H |
27 | |
28 | #include <sys/sysmacros.h> |
29 | #include <sys/types.h> |
30 | #include <sys/fs/zfs.h> |
31 | #include <sys/zio.h> |
32 | #include <sys/dmu.h> |
33 | |
34 | #ifdef __cplusplus |
35 | extern "C" { |
36 | #endif |
37 | |
/*
 * On-disk DDT formats, in the desired search order (newest version first).
 *
 * DDT_TYPES is not a format: it is the number of formats, and is used as
 * the first dimension of the per-type arrays in struct ddt.
 */
enum ddt_type {
	DDT_TYPE_ZAP = 0,
	DDT_TYPES
};
45 | |
/*
 * DDT classes, in the desired search order (highest replication level first).
 *
 * DDT_CLASSES is not a class: it is the number of classes, and is used as
 * the second dimension of the per-type/per-class arrays in struct ddt.
 */
enum ddt_class {
	DDT_CLASS_DITTO = 0,
	DDT_CLASS_DUPLICATE = 1,
	DDT_CLASS_UNIQUE = 2,
	DDT_CLASSES
};
55 | |
/*
 * Numerically equal to DDT_TYPE_ZAP, the only on-disk format defined.
 * NOTE(review): presumably the format used for new entries -- confirm
 * against the callers.
 */
#define	DDT_TYPE_CURRENT		0

/*
 * Two complementary masks over a single byte: the top bit (0x80) and the
 * low seven bits (0x7f).
 * NOTE(review): presumably applied to the header byte produced by
 * ddt_compress() (byte-order flag plus compression function) -- confirm.
 */
#define	DDT_COMPRESS_BYTEORDER_MASK	0x80
#define	DDT_COMPRESS_FUNCTION_MASK	0x7f
60 | |
61 | /* |
62 | * On-disk ddt entry: key (name) and physical storage (value). |
63 | */ |
64 | typedef struct ddt_key { |
65 | zio_cksum_t ddk_cksum; /* 256-bit block checksum */ |
66 | /* |
67 | * Encoded with logical & physical size, and compression, as follows: |
68 | * +-------+-------+-------+-------+-------+-------+-------+-------+ |
69 | * | 0 | 0 | 0 | comp | PSIZE | LSIZE | |
70 | * +-------+-------+-------+-------+-------+-------+-------+-------+ |
71 | */ |
72 | uint64_t ddk_prop; |
73 | } ddt_key_t; |
74 | |
/*
 * Accessors for the fields packed into ddt_key_t's ddk_prop word.
 * `ddk` is a pointer to a ddt_key_t.
 *
 *	LSIZE		bits  0..15
 *	PSIZE		bits 16..31
 *	compression	bits 32..39
 *
 * BF64_GET_SB()/BF64_SET_SB() are defined elsewhere.
 * NOTE(review): their trailing arguments (SPA_MINBLOCKSHIFT, 1) are
 * presumably the shift and bias used to store sizes in units of the
 * minimum block size -- confirm against their definition.
 */
#define	DDK_GET_LSIZE(ddk)	\
	BF64_GET_SB((ddk)->ddk_prop, 0, 16, SPA_MINBLOCKSHIFT, 1)
#define	DDK_SET_LSIZE(ddk, x)	\
	BF64_SET_SB((ddk)->ddk_prop, 0, 16, SPA_MINBLOCKSHIFT, 1, x)

#define	DDK_GET_PSIZE(ddk)	\
	BF64_GET_SB((ddk)->ddk_prop, 16, 16, SPA_MINBLOCKSHIFT, 1)
#define	DDK_SET_PSIZE(ddk, x)	\
	BF64_SET_SB((ddk)->ddk_prop, 16, 16, SPA_MINBLOCKSHIFT, 1, x)

#define	DDK_GET_COMPRESS(ddk)		BF64_GET((ddk)->ddk_prop, 32, 8)
#define	DDK_SET_COMPRESS(ddk, x)	BF64_SET((ddk)->ddk_prop, 32, 8, x)

/* Size of a ddt_key_t expressed in 64-bit words. */
#define	DDT_KEY_WORDS	(sizeof (ddt_key_t) / sizeof (uint64_t))
89 | |
90 | typedef struct ddt_phys { |
91 | dva_t ddp_dva[SPA_DVAS_PER_BP]; |
92 | uint64_t ddp_refcnt; |
93 | uint64_t ddp_phys_birth; |
94 | } ddt_phys_t; |
95 | |
/*
 * Kinds of ddt_phys_t kept per entry.
 *
 * DDT_PHYS_TYPES is not a kind: it is the number of kinds, and sizes the
 * dde_phys[] and dde_lead_zio[] arrays in struct ddt_entry.
 */
enum ddt_phys_type {
	DDT_PHYS_DITTO = 0,
	DDT_PHYS_SINGLE = 1,
	DDT_PHYS_DOUBLE = 2,
	DDT_PHYS_TRIPLE = 3,
	DDT_PHYS_TYPES
};
103 | |
104 | /* |
105 | * In-core ddt entry |
106 | */ |
107 | struct ddt_entry { |
108 | ddt_key_t dde_key; |
109 | ddt_phys_t dde_phys[DDT_PHYS_TYPES]; |
110 | zio_t *dde_lead_zio[DDT_PHYS_TYPES]; |
111 | void *dde_repair_data; |
112 | enum ddt_type dde_type; |
113 | enum ddt_class dde_class; |
114 | uint8_t dde_loading; |
115 | uint8_t dde_loaded; |
116 | kcondvar_t dde_cv; |
117 | avl_node_t dde_node; |
118 | }; |
119 | |
120 | /* |
121 | * In-core ddt |
122 | */ |
123 | struct ddt { |
124 | kmutex_t ddt_lock; |
125 | avl_tree_t ddt_tree; |
126 | avl_tree_t ddt_repair_tree; |
127 | enum zio_checksum ddt_checksum; |
128 | spa_t *ddt_spa; |
129 | objset_t *ddt_os; |
130 | uint64_t ddt_stat_object; |
131 | uint64_t ddt_object[DDT_TYPES][DDT_CLASSES]; |
132 | ddt_histogram_t ddt_histogram[DDT_TYPES][DDT_CLASSES]; |
133 | ddt_histogram_t ddt_histogram_cache[DDT_TYPES][DDT_CLASSES]; |
134 | ddt_object_t ddt_object_stats[DDT_TYPES][DDT_CLASSES]; |
135 | avl_node_t ddt_node; |
136 | }; |
137 | |
/*
 * In-core and on-disk bookmark for DDT walks
 *
 * Four 64-bit words: class, type, checksum and cursor.  See ddt_walk(),
 * which takes a pointer to one of these.
 */
typedef struct ddt_bookmark {
	uint64_t	ddb_class;
	uint64_t	ddb_type;
	uint64_t	ddb_checksum;
	uint64_t	ddb_cursor;
} ddt_bookmark_t;
147 | |
148 | /* |
149 | * Ops vector to access a specific DDT object type. |
150 | */ |
151 | typedef struct ddt_ops { |
152 | char ddt_op_name[32]; |
153 | int (*ddt_op_create)(objset_t *os, uint64_t *object, dmu_tx_t *tx, |
154 | boolean_t prehash); |
155 | int (*ddt_op_destroy)(objset_t *os, uint64_t object, dmu_tx_t *tx); |
156 | int (*ddt_op_lookup)(objset_t *os, uint64_t object, ddt_entry_t *dde); |
157 | void (*ddt_op_prefetch)(objset_t *os, uint64_t object, |
158 | ddt_entry_t *dde); |
159 | int (*ddt_op_update)(objset_t *os, uint64_t object, ddt_entry_t *dde, |
160 | dmu_tx_t *tx); |
161 | int (*ddt_op_remove)(objset_t *os, uint64_t object, ddt_entry_t *dde, |
162 | dmu_tx_t *tx); |
163 | int (*ddt_op_walk)(objset_t *os, uint64_t object, ddt_entry_t *dde, |
164 | uint64_t *walk); |
165 | int (*ddt_op_count)(objset_t *os, uint64_t object, uint64_t *count); |
166 | } ddt_ops_t; |
167 | |
/*
 * NOTE(review): presumably the size of the buffer callers pass as `name`
 * to ddt_object_name() -- confirm against the callers.
 */
#define	DDT_NAMELEN	80
169 | |
170 | extern void ddt_object_name(ddt_t *ddt, enum ddt_type type, |
171 | enum ddt_class cls, char *name); |
172 | extern int ddt_object_walk(ddt_t *ddt, enum ddt_type type, |
173 | enum ddt_class cls, uint64_t *walk, ddt_entry_t *dde); |
174 | extern int ddt_object_count(ddt_t *ddt, enum ddt_type type, |
175 | enum ddt_class cls, uint64_t *count); |
176 | extern int ddt_object_info(ddt_t *ddt, enum ddt_type type, |
177 | enum ddt_class cls, dmu_object_info_t *); |
178 | extern boolean_t ddt_object_exists(ddt_t *ddt, enum ddt_type type, |
179 | enum ddt_class cls); |
180 | |
181 | extern void ddt_bp_fill(const ddt_phys_t *ddp, blkptr_t *bp, |
182 | uint64_t txg); |
183 | extern void ddt_bp_create(enum zio_checksum checksum, const ddt_key_t *ddk, |
184 | const ddt_phys_t *ddp, blkptr_t *bp); |
185 | |
186 | extern void ddt_key_fill(ddt_key_t *ddk, const blkptr_t *bp); |
187 | |
188 | extern void ddt_phys_fill(ddt_phys_t *ddp, const blkptr_t *bp); |
189 | extern void ddt_phys_clear(ddt_phys_t *ddp); |
190 | extern void ddt_phys_addref(ddt_phys_t *ddp); |
191 | extern void ddt_phys_decref(ddt_phys_t *ddp); |
192 | extern void ddt_phys_free(ddt_t *ddt, ddt_key_t *ddk, ddt_phys_t *ddp, |
193 | uint64_t txg); |
194 | extern ddt_phys_t *ddt_phys_select(const ddt_entry_t *dde, const blkptr_t *bp); |
195 | extern uint64_t ddt_phys_total_refcnt(const ddt_entry_t *dde); |
196 | |
197 | extern void ddt_stat_add(ddt_stat_t *dst, const ddt_stat_t *src, uint64_t neg); |
198 | |
199 | extern void ddt_histogram_add(ddt_histogram_t *dst, const ddt_histogram_t *src); |
200 | extern void ddt_histogram_stat(ddt_stat_t *dds, const ddt_histogram_t *ddh); |
201 | extern boolean_t ddt_histogram_empty(const ddt_histogram_t *ddh); |
202 | extern void ddt_get_dedup_object_stats(spa_t *spa, ddt_object_t *ddo); |
203 | extern void ddt_get_dedup_histogram(spa_t *spa, ddt_histogram_t *ddh); |
204 | extern void ddt_get_dedup_stats(spa_t *spa, ddt_stat_t *dds_total); |
205 | |
206 | extern uint64_t ddt_get_dedup_dspace(spa_t *spa); |
207 | extern uint64_t ddt_get_pool_dedup_ratio(spa_t *spa); |
208 | |
209 | extern int ddt_ditto_copies_needed(ddt_t *ddt, ddt_entry_t *dde, |
210 | ddt_phys_t *ddp_willref); |
211 | extern int ddt_ditto_copies_present(ddt_entry_t *dde); |
212 | |
213 | extern size_t ddt_compress(void *src, uchar_t *dst, size_t s_len, size_t d_len); |
214 | extern void ddt_decompress(uchar_t *src, void *dst, size_t s_len, size_t d_len); |
215 | |
216 | extern ddt_t *ddt_select(spa_t *spa, const blkptr_t *bp); |
217 | extern void ddt_enter(ddt_t *ddt); |
218 | extern void ddt_exit(ddt_t *ddt); |
219 | extern ddt_entry_t *ddt_lookup(ddt_t *ddt, const blkptr_t *bp, boolean_t add); |
220 | extern void ddt_prefetch(spa_t *spa, const blkptr_t *bp); |
221 | extern void ddt_remove(ddt_t *ddt, ddt_entry_t *dde); |
222 | |
223 | extern boolean_t ddt_class_contains(spa_t *spa, enum ddt_class max_class, |
224 | const blkptr_t *bp); |
225 | |
226 | extern ddt_entry_t *ddt_repair_start(ddt_t *ddt, const blkptr_t *bp); |
227 | extern void ddt_repair_done(ddt_t *ddt, ddt_entry_t *dde); |
228 | |
229 | extern int ddt_entry_compare(const void *x1, const void *x2); |
230 | |
231 | extern void ddt_create(spa_t *spa); |
232 | extern int ddt_load(spa_t *spa); |
233 | extern void ddt_unload(spa_t *spa); |
234 | extern void ddt_sync(spa_t *spa, uint64_t txg); |
235 | extern int ddt_walk(spa_t *spa, ddt_bookmark_t *ddb, ddt_entry_t *dde); |
236 | extern int ddt_object_update(ddt_t *ddt, enum ddt_type type, |
237 | enum ddt_class cls, ddt_entry_t *dde, dmu_tx_t *tx); |
238 | |
239 | extern const ddt_ops_t ddt_zap_ops; |
240 | |
241 | #ifdef __cplusplus |
242 | } |
243 | #endif |
244 | |
245 | #endif /* _SYS_DDT_H */ |
246 | |