g_eli_integrity.c revision 220922
1159307Spjd/*-
2220922Spjd * Copyright (c) 2005-2011 Pawel Jakub Dawidek <pawel@dawidek.net>
3159307Spjd * All rights reserved.
4159307Spjd *
5159307Spjd * Redistribution and use in source and binary forms, with or without
6159307Spjd * modification, are permitted provided that the following conditions
7159307Spjd * are met:
8159307Spjd * 1. Redistributions of source code must retain the above copyright
9159307Spjd *    notice, this list of conditions and the following disclaimer.
10159307Spjd * 2. Redistributions in binary form must reproduce the above copyright
11159307Spjd *    notice, this list of conditions and the following disclaimer in the
12159307Spjd *    documentation and/or other materials provided with the distribution.
13159307Spjd *
14159307Spjd * THIS SOFTWARE IS PROVIDED BY THE AUTHORS AND CONTRIBUTORS ``AS IS'' AND
15159307Spjd * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
16159307Spjd * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
17159307Spjd * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHORS OR CONTRIBUTORS BE LIABLE
18159307Spjd * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
19159307Spjd * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
20159307Spjd * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
21159307Spjd * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
22159307Spjd * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
23159307Spjd * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
24159307Spjd * SUCH DAMAGE.
25159307Spjd */
26159307Spjd
27159307Spjd#include <sys/cdefs.h>
28159307Spjd__FBSDID("$FreeBSD: head/sys/geom/eli/g_eli_integrity.c 220922 2011-04-21 13:31:43Z pjd $");
29159307Spjd
30159307Spjd#include <sys/param.h>
31159307Spjd#include <sys/systm.h>
32159307Spjd#include <sys/kernel.h>
33159307Spjd#include <sys/linker.h>
34159307Spjd#include <sys/module.h>
35159307Spjd#include <sys/lock.h>
36159307Spjd#include <sys/mutex.h>
37159307Spjd#include <sys/bio.h>
38159307Spjd#include <sys/sysctl.h>
39159307Spjd#include <sys/malloc.h>
40159307Spjd#include <sys/kthread.h>
41159307Spjd#include <sys/proc.h>
42159307Spjd#include <sys/sched.h>
43159307Spjd#include <sys/smp.h>
44159307Spjd#include <sys/uio.h>
45159307Spjd#include <sys/vnode.h>
46159307Spjd
47159307Spjd#include <vm/uma.h>
48159307Spjd
49159307Spjd#include <geom/geom.h>
50159307Spjd#include <geom/eli/g_eli.h>
51159307Spjd#include <geom/eli/pkcs5v2.h>
52159307Spjd
53159307Spjd/*
54159307Spjd * The data layout description when integrity verification is configured.
55159307Spjd *
56159307Spjd * One of the most important assumption here is that authenticated data and its
57159307Spjd * HMAC has to be stored in the same place (namely in the same sector) to make
58159307Spjd * it work reliable.
59159307Spjd * The problem is that file systems work only with sectors that are multiple of
60159307Spjd * 512 bytes and a power of two number.
61159307Spjd * My idea to implement it is as follows.
62159307Spjd * Let's store HMAC in sector. This is a must. This leaves us 480 bytes for
63159307Spjd * data. We can't use that directly (ie. we can't create provider with 480 bytes
64159307Spjd * sector size). We need another sector from where we take only 32 bytes of data
65159307Spjd * and we store HMAC of this data as well. This takes two sectors from the
66159307Spjd * original provider at the input and leaves us one sector of authenticated data
67159307Spjd * at the output. Not very efficient, but you got the idea.
68159307Spjd * Now, let's assume, we want to create provider with 4096 bytes sector.
69159307Spjd * To output 4096 bytes of authenticated data we need 8x480 plus 1x256, so we
70159307Spjd * need nine 512-bytes sectors at the input to get one 4096-bytes sector at the
71159307Spjd * output. That's better. With 4096 bytes sector we can use 89% of size of the
72159307Spjd * original provider. I find it as an acceptable cost.
73159307Spjd * The reliability comes from the fact, that every HMAC stored inside the sector
74159307Spjd * is calculated only for the data in the same sector, so its impossible to
75159307Spjd * write new data and leave old HMAC or vice versa.
76159307Spjd *
77159307Spjd * And here is the picture:
78159307Spjd *
79159307Spjd * da0: +----+----+ +----+----+ +----+----+ +----+----+ +----+----+ +----+----+ +----+----+ +----+----+ +----+-----+
80159307Spjd *      |32b |480b| |32b |480b| |32b |480b| |32b |480b| |32b |480b| |32b |480b| |32b |480b| |32b |480b| |32b |256b |
81159307Spjd *      |HMAC|Data| |HMAC|Data| |HMAC|Data| |HMAC|Data| |HMAC|Data| |HMAC|Data| |HMAC|Data| |HMAC|Data| |HMAC|Data |
82159307Spjd *      +----+----+ +----+----+ +----+----+ +----+----+ +----+----+ +----+----+ +----+----+ +----+----+ +----+-----+
83159307Spjd *      |512 bytes| |512 bytes| |512 bytes| |512 bytes| |512 bytes| |512 bytes| |512 bytes| |512 bytes| |288 bytes |
84159307Spjd *      +---------+ +---------+ +---------+ +---------+ +---------+ +---------+ +---------+ +---------+ |224 unused|
85159307Spjd *                                                                                                      +----------+
86159307Spjd * da0.eli: +----+----+----+----+----+----+----+----+----+
87159307Spjd *          |480b|480b|480b|480b|480b|480b|480b|480b|256b|
88159307Spjd *          +----+----+----+----+----+----+----+----+----+
89159307Spjd *          |                 4096 bytes                 |
90159307Spjd *          +--------------------------------------------+
91159307Spjd *
92159307Spjd * PS. You can use any sector size with geli(8). My example is using 4kB,
93159307Spjd *     because it's most efficient. For 8kB sectors you need 2 extra sectors,
94159307Spjd *     so the cost is the same as for 4kB sectors.
95159307Spjd */
96159307Spjd
97159307Spjd/*
98159307Spjd * Code paths:
99159307Spjd * BIO_READ:
100159307Spjd *	g_eli_start -> g_eli_auth_read -> g_io_request -> g_eli_read_done -> g_eli_auth_run -> g_eli_auth_read_done -> g_io_deliver
101159307Spjd * BIO_WRITE:
102159307Spjd *	g_eli_start -> g_eli_auth_run -> g_eli_auth_write_done -> g_io_request -> g_eli_write_done -> g_io_deliver
103159307Spjd */
104159307Spjd
105159307SpjdMALLOC_DECLARE(M_ELI);
106159307Spjd
107159307Spjd/*
108159307Spjd * Here we generate key for HMAC. Every sector has its own HMAC key, so it is
109159307Spjd * not possible to copy sectors.
110159307Spjd * We cannot depend on fact, that every sector has its own IV, because different
111159307Spjd * IV doesn't change HMAC, when we use encrypt-then-authenticate method.
112159307Spjd */
113159307Spjdstatic void
114159307Spjdg_eli_auth_keygen(struct g_eli_softc *sc, off_t offset, u_char *key)
115159307Spjd{
116159307Spjd	SHA256_CTX ctx;
117159307Spjd
118159307Spjd	/* Copy precalculated SHA256 context. */
119159307Spjd	bcopy(&sc->sc_akeyctx, &ctx, sizeof(ctx));
120159307Spjd	SHA256_Update(&ctx, (uint8_t *)&offset, sizeof(offset));
121159307Spjd	SHA256_Final(key, &ctx);
122159307Spjd}
123159307Spjd
124159307Spjd/*
125159307Spjd * The function is called after we read and decrypt data.
126159307Spjd *
127159307Spjd * g_eli_start -> g_eli_auth_read -> g_io_request -> g_eli_read_done -> g_eli_auth_run -> G_ELI_AUTH_READ_DONE -> g_io_deliver
128159307Spjd */
129159307Spjdstatic int
130159307Spjdg_eli_auth_read_done(struct cryptop *crp)
131159307Spjd{
132214118Spjd	struct g_eli_softc *sc;
133159307Spjd	struct bio *bp;
134159307Spjd
135159307Spjd	if (crp->crp_etype == EAGAIN) {
136159307Spjd		if (g_eli_crypto_rerun(crp) == 0)
137159307Spjd			return (0);
138159307Spjd	}
139159307Spjd	bp = (struct bio *)crp->crp_opaque;
140159307Spjd	bp->bio_inbed++;
141159307Spjd	if (crp->crp_etype == 0) {
142159307Spjd		bp->bio_completed += crp->crp_olen;
143159307Spjd		G_ELI_DEBUG(3, "Crypto READ request done (%d/%d) (add=%jd completed=%jd).",
144159307Spjd		    bp->bio_inbed, bp->bio_children, (intmax_t)crp->crp_olen, (intmax_t)bp->bio_completed);
145159307Spjd	} else {
146159307Spjd		G_ELI_DEBUG(1, "Crypto READ request failed (%d/%d) error=%d.",
147159307Spjd		    bp->bio_inbed, bp->bio_children, crp->crp_etype);
148159307Spjd		if (bp->bio_error == 0)
149159307Spjd			bp->bio_error = crp->crp_etype;
150159307Spjd	}
151220922Spjd	sc = bp->bio_to->geom->softc;
152220922Spjd	g_eli_key_drop(sc, crp->crp_desc->crd_key);
153159307Spjd	/*
154159307Spjd	 * Do we have all sectors already?
155159307Spjd	 */
156159307Spjd	if (bp->bio_inbed < bp->bio_children)
157159307Spjd		return (0);
158159307Spjd	if (bp->bio_error == 0) {
159159307Spjd		u_int i, lsec, nsec, data_secsize, decr_secsize, encr_secsize;
160159307Spjd		u_char *srcdata, *dstdata, *auth;
161159307Spjd		off_t coroff, corsize;
162159307Spjd
163159307Spjd		/*
164159307Spjd		 * Verify data integrity based on calculated and read HMACs.
165159307Spjd		 */
166159307Spjd		/* Sectorsize of decrypted provider eg. 4096. */
167159307Spjd		decr_secsize = bp->bio_to->sectorsize;
168159307Spjd		/* The real sectorsize of encrypted provider, eg. 512. */
169159307Spjd		encr_secsize = LIST_FIRST(&sc->sc_geom->consumer)->provider->sectorsize;
170159307Spjd		/* Number of data bytes in one encrypted sector, eg. 480. */
171159307Spjd		data_secsize = sc->sc_data_per_sector;
172159307Spjd		/* Number of sectors from decrypted provider, eg. 2. */
173159307Spjd		nsec = bp->bio_length / decr_secsize;
174159307Spjd		/* Number of sectors from encrypted provider, eg. 18. */
175159307Spjd		nsec = (nsec * sc->sc_bytes_per_sector) / encr_secsize;
176159307Spjd		/* Last sector number in every big sector, eg. 9. */
177159307Spjd		lsec = sc->sc_bytes_per_sector / encr_secsize;
178159307Spjd
179159307Spjd		srcdata = bp->bio_driver2;
180159307Spjd		dstdata = bp->bio_data;
181159307Spjd		auth = srcdata + encr_secsize * nsec;
182159307Spjd		coroff = -1;
183159307Spjd		corsize = 0;
184159307Spjd
185159307Spjd		for (i = 1; i <= nsec; i++) {
186159307Spjd			data_secsize = sc->sc_data_per_sector;
187159307Spjd			if ((i % lsec) == 0)
188159307Spjd				data_secsize = decr_secsize % data_secsize;
189159307Spjd			if (bcmp(srcdata, auth, sc->sc_alen) != 0) {
190159307Spjd				/*
191159307Spjd				 * Curruption detected, remember the offset if
192159307Spjd				 * this is the first corrupted sector and
193159307Spjd				 * increase size.
194159307Spjd				 */
195159307Spjd				if (bp->bio_error == 0)
196159307Spjd					bp->bio_error = -1;
197159307Spjd				if (coroff == -1) {
198159307Spjd					coroff = bp->bio_offset +
199159307Spjd					    (dstdata - (u_char *)bp->bio_data);
200159307Spjd				}
201159307Spjd				corsize += data_secsize;
202159307Spjd			} else {
203159307Spjd				/*
204159307Spjd				 * No curruption, good.
205159307Spjd				 * Report previous corruption if there was one.
206159307Spjd				 */
207159307Spjd				if (coroff != -1) {
208159307Spjd					G_ELI_DEBUG(0, "%s: %jd bytes "
209159307Spjd					    "corrupted at offset %jd.",
210159307Spjd					    sc->sc_name, (intmax_t)corsize,
211159307Spjd					    (intmax_t)coroff);
212159307Spjd					coroff = -1;
213159307Spjd					corsize = 0;
214159307Spjd				}
215159307Spjd				bcopy(srcdata + sc->sc_alen, dstdata,
216159307Spjd				    data_secsize);
217159307Spjd			}
218159307Spjd			srcdata += encr_secsize;
219159307Spjd			dstdata += data_secsize;
220159307Spjd			auth += sc->sc_alen;
221159307Spjd		}
222159307Spjd		/* Report previous corruption if there was one. */
223159307Spjd		if (coroff != -1) {
224159307Spjd			G_ELI_DEBUG(0, "%s: %jd bytes corrupted at offset %jd.",
225159307Spjd			    sc->sc_name, (intmax_t)corsize, (intmax_t)coroff);
226159307Spjd		}
227159307Spjd	}
228159307Spjd	free(bp->bio_driver2, M_ELI);
229159307Spjd	bp->bio_driver2 = NULL;
230159307Spjd	if (bp->bio_error != 0) {
231159307Spjd		if (bp->bio_error == -1)
232159307Spjd			bp->bio_error = EINVAL;
233159307Spjd		else {
234159307Spjd			G_ELI_LOGREQ(0, bp,
235159307Spjd			    "Crypto READ request failed (error=%d).",
236159307Spjd			    bp->bio_error);
237159307Spjd		}
238159307Spjd		bp->bio_completed = 0;
239159307Spjd	}
240159307Spjd	/*
241159307Spjd	 * Read is finished, send it up.
242159307Spjd	 */
243159307Spjd	g_io_deliver(bp, bp->bio_error);
244214118Spjd	atomic_subtract_int(&sc->sc_inflight, 1);
245159307Spjd	return (0);
246159307Spjd}
247159307Spjd
248159307Spjd/*
249159307Spjd * The function is called after data encryption.
250159307Spjd *
251159307Spjd * g_eli_start -> g_eli_auth_run -> G_ELI_AUTH_WRITE_DONE -> g_io_request -> g_eli_write_done -> g_io_deliver
252159307Spjd */
253159307Spjdstatic int
254159307Spjdg_eli_auth_write_done(struct cryptop *crp)
255159307Spjd{
256159307Spjd	struct g_eli_softc *sc;
257159307Spjd	struct g_consumer *cp;
258159307Spjd	struct bio *bp, *cbp, *cbp2;
259159307Spjd	u_int nsec;
260159307Spjd
261159307Spjd	if (crp->crp_etype == EAGAIN) {
262159307Spjd		if (g_eli_crypto_rerun(crp) == 0)
263159307Spjd			return (0);
264159307Spjd	}
265159307Spjd	bp = (struct bio *)crp->crp_opaque;
266159307Spjd	bp->bio_inbed++;
267159307Spjd	if (crp->crp_etype == 0) {
268159307Spjd		G_ELI_DEBUG(3, "Crypto WRITE request done (%d/%d).",
269159307Spjd		    bp->bio_inbed, bp->bio_children);
270159307Spjd	} else {
271159307Spjd		G_ELI_DEBUG(1, "Crypto WRITE request failed (%d/%d) error=%d.",
272159307Spjd		    bp->bio_inbed, bp->bio_children, crp->crp_etype);
273159307Spjd		if (bp->bio_error == 0)
274159307Spjd			bp->bio_error = crp->crp_etype;
275159307Spjd	}
276220922Spjd	sc = bp->bio_to->geom->softc;
277220922Spjd	g_eli_key_drop(sc, crp->crp_desc->crd_key);
278159307Spjd	/*
279159307Spjd	 * All sectors are already encrypted?
280159307Spjd	 */
281159307Spjd	if (bp->bio_inbed < bp->bio_children)
282159307Spjd		return (0);
283159307Spjd	if (bp->bio_error != 0) {
284159307Spjd		G_ELI_LOGREQ(0, bp, "Crypto WRITE request failed (error=%d).",
285159307Spjd		    bp->bio_error);
286159307Spjd		free(bp->bio_driver2, M_ELI);
287159307Spjd		bp->bio_driver2 = NULL;
288159307Spjd		cbp = bp->bio_driver1;
289159307Spjd		bp->bio_driver1 = NULL;
290159307Spjd		g_destroy_bio(cbp);
291159307Spjd		g_io_deliver(bp, bp->bio_error);
292214118Spjd		atomic_subtract_int(&sc->sc_inflight, 1);
293159307Spjd		return (0);
294159307Spjd	}
295159307Spjd	cp = LIST_FIRST(&sc->sc_geom->consumer);
296159307Spjd	cbp = bp->bio_driver1;
297159307Spjd	bp->bio_driver1 = NULL;
298159307Spjd	cbp->bio_to = cp->provider;
299159307Spjd	cbp->bio_done = g_eli_write_done;
300159307Spjd
301159307Spjd	/* Number of sectors from decrypted provider, eg. 1. */
302159307Spjd	nsec = bp->bio_length / bp->bio_to->sectorsize;
303159307Spjd	/* Number of sectors from encrypted provider, eg. 9. */
304159307Spjd	nsec = (nsec * sc->sc_bytes_per_sector) / cp->provider->sectorsize;
305159307Spjd
306159307Spjd	cbp->bio_length = cp->provider->sectorsize * nsec;
307159307Spjd	cbp->bio_offset = (bp->bio_offset / bp->bio_to->sectorsize) * sc->sc_bytes_per_sector;
308159307Spjd	cbp->bio_data = bp->bio_driver2;
309159307Spjd
310159307Spjd	/*
311159307Spjd	 * We write more than what is requested, so we have to be ready to write
312159307Spjd	 * more than MAXPHYS.
313159307Spjd	 */
314159307Spjd	cbp2 = NULL;
315159307Spjd	if (cbp->bio_length > MAXPHYS) {
316159307Spjd		cbp2 = g_duplicate_bio(bp);
317159307Spjd		cbp2->bio_length = cbp->bio_length - MAXPHYS;
318159307Spjd		cbp2->bio_data = cbp->bio_data + MAXPHYS;
319159307Spjd		cbp2->bio_offset = cbp->bio_offset + MAXPHYS;
320159307Spjd		cbp2->bio_to = cp->provider;
321159307Spjd		cbp2->bio_done = g_eli_write_done;
322159307Spjd		cbp->bio_length = MAXPHYS;
323159307Spjd	}
324159307Spjd	/*
325159307Spjd	 * Send encrypted data to the provider.
326159307Spjd	 */
327159307Spjd	G_ELI_LOGREQ(2, cbp, "Sending request.");
328159307Spjd	bp->bio_inbed = 0;
329159307Spjd	bp->bio_children = (cbp2 != NULL ? 2 : 1);
330159307Spjd	g_io_request(cbp, cp);
331159307Spjd	if (cbp2 != NULL) {
332159307Spjd		G_ELI_LOGREQ(2, cbp2, "Sending request.");
333159307Spjd		g_io_request(cbp2, cp);
334159307Spjd	}
335159307Spjd	return (0);
336159307Spjd}
337159307Spjd
338159307Spjdvoid
339159307Spjdg_eli_auth_read(struct g_eli_softc *sc, struct bio *bp)
340159307Spjd{
341159307Spjd	struct g_consumer *cp;
342159307Spjd	struct bio *cbp, *cbp2;
343159307Spjd	size_t size;
344159307Spjd	off_t nsec;
345159307Spjd
346159307Spjd	bp->bio_pflags = 0;
347159307Spjd
348159307Spjd	cp = LIST_FIRST(&sc->sc_geom->consumer);
349159307Spjd	cbp = bp->bio_driver1;
350159307Spjd	bp->bio_driver1 = NULL;
351159307Spjd	cbp->bio_to = cp->provider;
352159307Spjd	cbp->bio_done = g_eli_read_done;
353159307Spjd
354159307Spjd	/* Number of sectors from decrypted provider, eg. 1. */
355159307Spjd	nsec = bp->bio_length / bp->bio_to->sectorsize;
356159307Spjd	/* Number of sectors from encrypted provider, eg. 9. */
357159307Spjd	nsec = (nsec * sc->sc_bytes_per_sector) / cp->provider->sectorsize;
358159307Spjd
359159307Spjd	cbp->bio_length = cp->provider->sectorsize * nsec;
360159307Spjd	size = cbp->bio_length;
361159307Spjd	size += sc->sc_alen * nsec;
362159307Spjd	size += sizeof(struct cryptop) * nsec;
363159307Spjd	size += sizeof(struct cryptodesc) * nsec * 2;
364159307Spjd	size += G_ELI_AUTH_SECKEYLEN * nsec;
365159307Spjd	size += sizeof(struct uio) * nsec;
366159307Spjd	size += sizeof(struct iovec) * nsec;
367159307Spjd	cbp->bio_offset = (bp->bio_offset / bp->bio_to->sectorsize) * sc->sc_bytes_per_sector;
368159307Spjd	bp->bio_driver2 = malloc(size, M_ELI, M_WAITOK);
369159307Spjd	cbp->bio_data = bp->bio_driver2;
370159307Spjd
371159307Spjd	/*
372159307Spjd	 * We read more than what is requested, so we have to be ready to read
373159307Spjd	 * more than MAXPHYS.
374159307Spjd	 */
375159307Spjd	cbp2 = NULL;
376159307Spjd	if (cbp->bio_length > MAXPHYS) {
377159307Spjd		cbp2 = g_duplicate_bio(bp);
378159307Spjd		cbp2->bio_length = cbp->bio_length - MAXPHYS;
379159307Spjd		cbp2->bio_data = cbp->bio_data + MAXPHYS;
380159307Spjd		cbp2->bio_offset = cbp->bio_offset + MAXPHYS;
381159307Spjd		cbp2->bio_to = cp->provider;
382159307Spjd		cbp2->bio_done = g_eli_read_done;
383159307Spjd		cbp->bio_length = MAXPHYS;
384159307Spjd	}
385159307Spjd	/*
386159307Spjd	 * Read encrypted data from provider.
387159307Spjd	 */
388159307Spjd	G_ELI_LOGREQ(2, cbp, "Sending request.");
389159307Spjd	g_io_request(cbp, cp);
390159307Spjd	if (cbp2 != NULL) {
391159307Spjd		G_ELI_LOGREQ(2, cbp2, "Sending request.");
392159307Spjd		g_io_request(cbp2, cp);
393159307Spjd	}
394159307Spjd}
395159307Spjd
396159307Spjd/*
397159307Spjd * This is the main function responsible for cryptography (ie. communication
398159307Spjd * with crypto(9) subsystem).
399214116Spjd *
400214116Spjd * BIO_READ:
401214116Spjd *	g_eli_start -> g_eli_auth_read -> g_io_request -> g_eli_read_done -> G_ELI_AUTH_RUN -> g_eli_auth_read_done -> g_io_deliver
402214116Spjd * BIO_WRITE:
403214116Spjd *	g_eli_start -> G_ELI_AUTH_RUN -> g_eli_auth_write_done -> g_io_request -> g_eli_write_done -> g_io_deliver
404159307Spjd */
405159307Spjdvoid
406159307Spjdg_eli_auth_run(struct g_eli_worker *wr, struct bio *bp)
407159307Spjd{
408159307Spjd	struct g_eli_softc *sc;
409159307Spjd	struct cryptop *crp;
410159307Spjd	struct cryptodesc *crde, *crda;
411159307Spjd	struct uio *uio;
412159307Spjd	struct iovec *iov;
413159307Spjd	u_int i, lsec, nsec, data_secsize, decr_secsize, encr_secsize;
414159307Spjd	off_t dstoff;
415159307Spjd	int err, error;
416159307Spjd	u_char *p, *data, *auth, *authkey, *plaindata;
417159307Spjd
418159307Spjd	G_ELI_LOGREQ(3, bp, "%s", __func__);
419159307Spjd
420159307Spjd	bp->bio_pflags = wr->w_number;
421159307Spjd	sc = wr->w_softc;
422159307Spjd	/* Sectorsize of decrypted provider eg. 4096. */
423159307Spjd	decr_secsize = bp->bio_to->sectorsize;
424159307Spjd	/* The real sectorsize of encrypted provider, eg. 512. */
425159307Spjd	encr_secsize = LIST_FIRST(&sc->sc_geom->consumer)->provider->sectorsize;
426159307Spjd	/* Number of data bytes in one encrypted sector, eg. 480. */
427159307Spjd	data_secsize = sc->sc_data_per_sector;
428159307Spjd	/* Number of sectors from decrypted provider, eg. 2. */
429159307Spjd	nsec = bp->bio_length / decr_secsize;
430159307Spjd	/* Number of sectors from encrypted provider, eg. 18. */
431159307Spjd	nsec = (nsec * sc->sc_bytes_per_sector) / encr_secsize;
432159307Spjd	/* Last sector number in every big sector, eg. 9. */
433159307Spjd	lsec = sc->sc_bytes_per_sector / encr_secsize;
434159307Spjd	/* Destination offset, used for IV generation. */
435159307Spjd	dstoff = (bp->bio_offset / bp->bio_to->sectorsize) * sc->sc_bytes_per_sector;
436159307Spjd
437159343Spjd	auth = NULL;	/* Silence compiler warning. */
438159307Spjd	plaindata = bp->bio_data;
439159307Spjd	if (bp->bio_cmd == BIO_READ) {
440159307Spjd		data = bp->bio_driver2;
441159307Spjd		auth = data + encr_secsize * nsec;
442159307Spjd		p = auth + sc->sc_alen * nsec;
443159307Spjd	} else {
444159307Spjd		size_t size;
445159307Spjd
446159307Spjd		size = encr_secsize * nsec;
447159307Spjd		size += sizeof(*crp) * nsec;
448159307Spjd		size += sizeof(*crde) * nsec;
449159307Spjd		size += sizeof(*crda) * nsec;
450159307Spjd		size += G_ELI_AUTH_SECKEYLEN * nsec;
451159307Spjd		size += sizeof(*uio) * nsec;
452159307Spjd		size += sizeof(*iov) * nsec;
453159307Spjd		data = malloc(size, M_ELI, M_WAITOK);
454159307Spjd		bp->bio_driver2 = data;
455159307Spjd		p = data + encr_secsize * nsec;
456159307Spjd	}
457159307Spjd	bp->bio_inbed = 0;
458159307Spjd	bp->bio_children = nsec;
459159307Spjd
460159307Spjd	error = 0;
461159307Spjd	for (i = 1; i <= nsec; i++, dstoff += encr_secsize) {
462159307Spjd		crp = (struct cryptop *)p;	p += sizeof(*crp);
463159307Spjd		crde = (struct cryptodesc *)p;	p += sizeof(*crde);
464159307Spjd		crda = (struct cryptodesc *)p;	p += sizeof(*crda);
465159307Spjd		authkey = (u_char *)p;		p += G_ELI_AUTH_SECKEYLEN;
466159307Spjd		uio = (struct uio *)p;		p += sizeof(*uio);
467159307Spjd		iov = (struct iovec *)p;	p += sizeof(*iov);
468159307Spjd
469159307Spjd		data_secsize = sc->sc_data_per_sector;
470159307Spjd		if ((i % lsec) == 0)
471159307Spjd			data_secsize = decr_secsize % data_secsize;
472159307Spjd
473159307Spjd		if (bp->bio_cmd == BIO_READ) {
474159307Spjd			/* Remember read HMAC. */
475159307Spjd			bcopy(data, auth, sc->sc_alen);
476159307Spjd			auth += sc->sc_alen;
477159307Spjd			/* TODO: bzero(9) can be commented out later. */
478159307Spjd			bzero(data, sc->sc_alen);
479159307Spjd		} else {
480159307Spjd			bcopy(plaindata, data + sc->sc_alen, data_secsize);
481159307Spjd			plaindata += data_secsize;
482159307Spjd		}
483159307Spjd
484159307Spjd		iov->iov_len = sc->sc_alen + data_secsize;
485159307Spjd		iov->iov_base = data;
486159307Spjd		data += encr_secsize;
487159307Spjd
488159307Spjd		uio->uio_iov = iov;
489159307Spjd		uio->uio_iovcnt = 1;
490159307Spjd		uio->uio_segflg = UIO_SYSSPACE;
491159307Spjd		uio->uio_resid = iov->iov_len;
492159307Spjd
493159307Spjd		crp->crp_sid = wr->w_sid;
494159343Spjd		crp->crp_ilen = uio->uio_resid;
495160569Spjd		crp->crp_olen = data_secsize;
496159307Spjd		crp->crp_opaque = (void *)bp;
497159307Spjd		crp->crp_buf = (void *)uio;
498159307Spjd		crp->crp_flags = CRYPTO_F_IOV | CRYPTO_F_CBIFSYNC | CRYPTO_F_REL;
499159307Spjd		if (g_eli_batch)
500159307Spjd			crp->crp_flags |= CRYPTO_F_BATCH;
501159307Spjd		if (bp->bio_cmd == BIO_WRITE) {
502159307Spjd			crp->crp_callback = g_eli_auth_write_done;
503159307Spjd			crp->crp_desc = crde;
504159307Spjd			crde->crd_next = crda;
505159307Spjd			crda->crd_next = NULL;
506159307Spjd		} else {
507159307Spjd			crp->crp_callback = g_eli_auth_read_done;
508159307Spjd			crp->crp_desc = crda;
509159307Spjd			crda->crd_next = crde;
510159307Spjd			crde->crd_next = NULL;
511159307Spjd		}
512159307Spjd
513159307Spjd		crde->crd_skip = sc->sc_alen;
514159307Spjd		crde->crd_len = data_secsize;
515159307Spjd		crde->crd_flags = CRD_F_IV_EXPLICIT | CRD_F_IV_PRESENT;
516159307Spjd		if (bp->bio_cmd == BIO_WRITE)
517159307Spjd			crde->crd_flags |= CRD_F_ENCRYPT;
518159307Spjd		crde->crd_alg = sc->sc_ealgo;
519220922Spjd		crde->crd_key = g_eli_key_hold(sc, dstoff, encr_secsize);
520159307Spjd		crde->crd_klen = sc->sc_ekeylen;
521213070Spjd		if (sc->sc_ealgo == CRYPTO_AES_XTS)
522213070Spjd			crde->crd_klen <<= 1;
523159307Spjd		g_eli_crypto_ivgen(sc, dstoff, crde->crd_iv,
524159307Spjd		    sizeof(crde->crd_iv));
525159307Spjd
526159307Spjd		crda->crd_skip = sc->sc_alen;
527159307Spjd		crda->crd_len = data_secsize;
528159307Spjd		crda->crd_inject = 0;
529159307Spjd		crda->crd_flags = CRD_F_KEY_EXPLICIT;
530159307Spjd		crda->crd_alg = sc->sc_aalgo;
531159307Spjd		g_eli_auth_keygen(sc, dstoff, authkey);
532159307Spjd		crda->crd_key = authkey;
533159307Spjd		crda->crd_klen = G_ELI_AUTH_SECKEYLEN * 8;
534159307Spjd
535159307Spjd		crp->crp_etype = 0;
536159307Spjd		err = crypto_dispatch(crp);
537159307Spjd		if (err != 0 && error == 0)
538159307Spjd			error = err;
539159307Spjd	}
540159307Spjd	if (bp->bio_error == 0)
541159307Spjd		bp->bio_error = error;
542159307Spjd}
543