/*
 * CDDL HEADER START
 *
 * The contents of this file are subject to the terms of the
 * Common Development and Distribution License (the "License").
 * You may not use this file except in compliance with the License.
 *
 * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
 * or http://www.opensolaris.org/os/licensing.
 * See the License for the specific language governing permissions
 * and limitations under the License.
 *
 * When distributing Covered Code, include this CDDL HEADER in each
 * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
 * If applicable, add the following below this CDDL HEADER, with the
 * fields enclosed by brackets "[]" replaced with your own identifying
 * information: Portions Copyright [yyyy] [name of copyright owner]
 *
 * CDDL HEADER END
 */
/*
 * Copyright (c) 2009, 2010, Oracle and/or its affiliates. All rights reserved.
 */

25#ifndef _SYS_DDT_H
26#define	_SYS_DDT_H
27
28#include <sys/sysmacros.h>
29#include <sys/types.h>
30#include <sys/fs/zfs.h>
31#include <sys/zio.h>
32#include <sys/dmu.h>
33
34#ifdef	__cplusplus
35extern "C" {
36#endif
37
/*
 * On-disk DDT formats, in the desired search order (newest version first).
 *
 * DDT_TYPES is the number of formats and is used as the first dimension of
 * the per-object arrays in struct ddt.
 */
enum ddt_type {
	DDT_TYPE_ZAP = 0,	/* currently the only format defined */
	DDT_TYPES		/* count of formats; must stay last */
};

/*
 * DDT classes, in the desired search order (highest replication level first).
 *
 * DDT_CLASSES is the number of classes and is used as the second dimension
 * of the per-object arrays in struct ddt.
 */
enum ddt_class {
	DDT_CLASS_DITTO = 0,
	DDT_CLASS_DUPLICATE,
	DDT_CLASS_UNIQUE,
	DDT_CLASSES		/* count of classes; must stay last */
};

/*
 * Numerically equal to DDT_TYPE_ZAP.
 * NOTE(review): presumably the format chosen for newly created tables --
 * confirm at the use sites.
 */
#define	DDT_TYPE_CURRENT		0

/*
 * The two masks split a single byte into bit 7 and bits 0-6.
 * NOTE(review): the names suggest a byte-order flag and a compression
 * function id carried in one byte -- confirm against ddt_compress() and
 * ddt_decompress().
 */
#define	DDT_COMPRESS_BYTEORDER_MASK	0x80
#define	DDT_COMPRESS_FUNCTION_MASK	0x7f

61/*
62 * On-disk ddt entry:  key (name) and physical storage (value).
63 */
64typedef struct ddt_key {
65	zio_cksum_t	ddk_cksum;	/* 256-bit block checksum */
66	/*
67	 * Encoded with logical & physical size, and compression, as follows:
68	 *   +-------+-------+-------+-------+-------+-------+-------+-------+
69	 *   |   0   |   0   |   0   | comp  |     PSIZE     |     LSIZE     |
70	 *   +-------+-------+-------+-------+-------+-------+-------+-------+
71	 */
72	uint64_t	ddk_prop;
73} ddt_key_t;
74
/*
 * Accessors for the fields packed into ddt_key_t.ddk_prop.  'ddk' must be
 * a pointer to a ddt_key_t.
 *
 * LSIZE and PSIZE go through the _SB variants, passing SPA_MINBLOCKSHIFT
 * and 1 as the trailing two arguments; COMPRESS uses plain BF64_GET/SET.
 * NOTE(review): the _SB arguments are presumably (shift, bias), i.e. sizes
 * are stored in 1 << SPA_MINBLOCKSHIFT units minus one -- confirm against
 * the BF64_GET_SB definition.
 */
#define	DDK_GET_LSIZE(ddk)	\
	BF64_GET_SB((ddk)->ddk_prop, 0, 16, SPA_MINBLOCKSHIFT, 1)
#define	DDK_SET_LSIZE(ddk, x)	\
	BF64_SET_SB((ddk)->ddk_prop, 0, 16, SPA_MINBLOCKSHIFT, 1, x)

#define	DDK_GET_PSIZE(ddk)	\
	BF64_GET_SB((ddk)->ddk_prop, 16, 16, SPA_MINBLOCKSHIFT, 1)
#define	DDK_SET_PSIZE(ddk, x)	\
	BF64_SET_SB((ddk)->ddk_prop, 16, 16, SPA_MINBLOCKSHIFT, 1, x)

#define	DDK_GET_COMPRESS(ddk)		BF64_GET((ddk)->ddk_prop, 32, 8)
#define	DDK_SET_COMPRESS(ddk, x)	BF64_SET((ddk)->ddk_prop, 32, 8, x)

/* Size of a ddt_key_t expressed in 64-bit words. */
#define	DDT_KEY_WORDS	(sizeof (ddt_key_t) / sizeof (uint64_t))

90typedef struct ddt_phys {
91	dva_t		ddp_dva[SPA_DVAS_PER_BP];
92	uint64_t	ddp_refcnt;
93	uint64_t	ddp_phys_birth;
94} ddt_phys_t;
95
/*
 * Index into the per-entry arrays of struct ddt_entry (dde_phys[] and
 * dde_lead_zio[]).  The values are spelled out explicitly; DDT_PHYS_TYPES
 * is the number of slots.
 */
enum ddt_phys_type {
	DDT_PHYS_DITTO = 0,
	DDT_PHYS_SINGLE = 1,
	DDT_PHYS_DOUBLE = 2,
	DDT_PHYS_TRIPLE = 3,
	DDT_PHYS_TYPES		/* count of slots; must stay last */
};

104/*
105 * In-core ddt entry
106 */
107struct ddt_entry {
108	ddt_key_t	dde_key;
109	ddt_phys_t	dde_phys[DDT_PHYS_TYPES];
110	zio_t		*dde_lead_zio[DDT_PHYS_TYPES];
111	void		*dde_repair_data;
112	enum ddt_type	dde_type;
113	enum ddt_class	dde_class;
114	uint8_t		dde_loading;
115	uint8_t		dde_loaded;
116	kcondvar_t	dde_cv;
117	avl_node_t	dde_node;
118};
119
120/*
121 * In-core ddt
122 */
123struct ddt {
124	kmutex_t	ddt_lock;
125	avl_tree_t	ddt_tree;
126	avl_tree_t	ddt_repair_tree;
127	enum zio_checksum ddt_checksum;
128	spa_t		*ddt_spa;
129	objset_t	*ddt_os;
130	uint64_t	ddt_stat_object;
131	uint64_t	ddt_object[DDT_TYPES][DDT_CLASSES];
132	ddt_histogram_t	ddt_histogram[DDT_TYPES][DDT_CLASSES];
133	ddt_histogram_t	ddt_histogram_cache[DDT_TYPES][DDT_CLASSES];
134	ddt_object_t	ddt_object_stats[DDT_TYPES][DDT_CLASSES];
135	avl_node_t	ddt_node;
136};
137
/*
 * In-core and on-disk bookmark for DDT walks
 *
 * Four 64-bit words; ddt_walk() takes a pointer to one of these.
 * NOTE(review): ddb_class and ddb_type presumably hold enum ddt_class and
 * enum ddt_type values widened to 64 bits -- confirm in ddt_walk().
 */
typedef struct ddt_bookmark {
	uint64_t	ddb_class;
	uint64_t	ddb_type;
	uint64_t	ddb_checksum;
	uint64_t	ddb_cursor;
} ddt_bookmark_t;

148/*
149 * Ops vector to access a specific DDT object type.
150 */
151typedef struct ddt_ops {
152	char ddt_op_name[32];
153	int (*ddt_op_create)(objset_t *os, uint64_t *object, dmu_tx_t *tx,
154	    boolean_t prehash);
155	int (*ddt_op_destroy)(objset_t *os, uint64_t object, dmu_tx_t *tx);
156	int (*ddt_op_lookup)(objset_t *os, uint64_t object, ddt_entry_t *dde);
157	void (*ddt_op_prefetch)(objset_t *os, uint64_t object,
158	    ddt_entry_t *dde);
159	int (*ddt_op_update)(objset_t *os, uint64_t object, ddt_entry_t *dde,
160	    dmu_tx_t *tx);
161	int (*ddt_op_remove)(objset_t *os, uint64_t object, ddt_entry_t *dde,
162	    dmu_tx_t *tx);
163	int (*ddt_op_walk)(objset_t *os, uint64_t object, ddt_entry_t *dde,
164	    uint64_t *walk);
165	int (*ddt_op_count)(objset_t *os, uint64_t object, uint64_t *count);
166} ddt_ops_t;
167
168#define	DDT_NAMELEN	80
169
170extern void ddt_object_name(ddt_t *ddt, enum ddt_type type,
171    enum ddt_class cls, char *name);
172extern int ddt_object_walk(ddt_t *ddt, enum ddt_type type,
173    enum ddt_class cls, uint64_t *walk, ddt_entry_t *dde);
174extern int ddt_object_count(ddt_t *ddt, enum ddt_type type,
175    enum ddt_class cls, uint64_t *count);
176extern int ddt_object_info(ddt_t *ddt, enum ddt_type type,
177    enum ddt_class cls, dmu_object_info_t *);
178extern boolean_t ddt_object_exists(ddt_t *ddt, enum ddt_type type,
179    enum ddt_class cls);
180
181extern void ddt_bp_fill(const ddt_phys_t *ddp, blkptr_t *bp,
182    uint64_t txg);
183extern void ddt_bp_create(enum zio_checksum checksum, const ddt_key_t *ddk,
184    const ddt_phys_t *ddp, blkptr_t *bp);
185
186extern void ddt_key_fill(ddt_key_t *ddk, const blkptr_t *bp);
187
188extern void ddt_phys_fill(ddt_phys_t *ddp, const blkptr_t *bp);
189extern void ddt_phys_clear(ddt_phys_t *ddp);
190extern void ddt_phys_addref(ddt_phys_t *ddp);
191extern void ddt_phys_decref(ddt_phys_t *ddp);
192extern void ddt_phys_free(ddt_t *ddt, ddt_key_t *ddk, ddt_phys_t *ddp,
193    uint64_t txg);
194extern ddt_phys_t *ddt_phys_select(const ddt_entry_t *dde, const blkptr_t *bp);
195extern uint64_t ddt_phys_total_refcnt(const ddt_entry_t *dde);
196
197extern void ddt_stat_add(ddt_stat_t *dst, const ddt_stat_t *src, uint64_t neg);
198
199extern void ddt_histogram_add(ddt_histogram_t *dst, const ddt_histogram_t *src);
200extern void ddt_histogram_stat(ddt_stat_t *dds, const ddt_histogram_t *ddh);
201extern boolean_t ddt_histogram_empty(const ddt_histogram_t *ddh);
202extern void ddt_get_dedup_object_stats(spa_t *spa, ddt_object_t *ddo);
203extern void ddt_get_dedup_histogram(spa_t *spa, ddt_histogram_t *ddh);
204extern void ddt_get_dedup_stats(spa_t *spa, ddt_stat_t *dds_total);
205
206extern uint64_t ddt_get_dedup_dspace(spa_t *spa);
207extern uint64_t ddt_get_pool_dedup_ratio(spa_t *spa);
208
209extern int ddt_ditto_copies_needed(ddt_t *ddt, ddt_entry_t *dde,
210    ddt_phys_t *ddp_willref);
211extern int ddt_ditto_copies_present(ddt_entry_t *dde);
212
213extern size_t ddt_compress(void *src, uchar_t *dst, size_t s_len, size_t d_len);
214extern void ddt_decompress(uchar_t *src, void *dst, size_t s_len, size_t d_len);
215
216extern ddt_t *ddt_select(spa_t *spa, const blkptr_t *bp);
217extern void ddt_enter(ddt_t *ddt);
218extern void ddt_exit(ddt_t *ddt);
219extern ddt_entry_t *ddt_lookup(ddt_t *ddt, const blkptr_t *bp, boolean_t add);
220extern void ddt_prefetch(spa_t *spa, const blkptr_t *bp);
221extern void ddt_remove(ddt_t *ddt, ddt_entry_t *dde);
222
223extern boolean_t ddt_class_contains(spa_t *spa, enum ddt_class max_class,
224    const blkptr_t *bp);
225
226extern ddt_entry_t *ddt_repair_start(ddt_t *ddt, const blkptr_t *bp);
227extern void ddt_repair_done(ddt_t *ddt, ddt_entry_t *dde);
228
229extern int ddt_entry_compare(const void *x1, const void *x2);
230
231extern void ddt_create(spa_t *spa);
232extern int ddt_load(spa_t *spa);
233extern void ddt_unload(spa_t *spa);
234extern void ddt_sync(spa_t *spa, uint64_t txg);
235extern int ddt_walk(spa_t *spa, ddt_bookmark_t *ddb, ddt_entry_t *dde);
236extern int ddt_object_update(ddt_t *ddt, enum ddt_type type,
237    enum ddt_class cls, ddt_entry_t *dde, dmu_tx_t *tx);
238
239extern const ddt_ops_t ddt_zap_ops;
240
241#ifdef	__cplusplus
242}
243#endif
244
245#endif	/* _SYS_DDT_H */
246