1159307Spjd/*-
2220922Spjd * Copyright (c) 2005-2011 Pawel Jakub Dawidek <pawel@dawidek.net>
3159307Spjd * All rights reserved.
4159307Spjd *
5159307Spjd * Redistribution and use in source and binary forms, with or without
6159307Spjd * modification, are permitted provided that the following conditions
7159307Spjd * are met:
8159307Spjd * 1. Redistributions of source code must retain the above copyright
9159307Spjd *    notice, this list of conditions and the following disclaimer.
10159307Spjd * 2. Redistributions in binary form must reproduce the above copyright
11159307Spjd *    notice, this list of conditions and the following disclaimer in the
12159307Spjd *    documentation and/or other materials provided with the distribution.
13159307Spjd *
14159307Spjd * THIS SOFTWARE IS PROVIDED BY THE AUTHORS AND CONTRIBUTORS ``AS IS'' AND
15159307Spjd * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
16159307Spjd * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
17159307Spjd * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHORS OR CONTRIBUTORS BE LIABLE
18159307Spjd * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
19159307Spjd * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
20159307Spjd * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
21159307Spjd * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
22159307Spjd * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
23159307Spjd * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
24159307Spjd * SUCH DAMAGE.
25159307Spjd */
26159307Spjd
27159307Spjd#include <sys/cdefs.h>
28159307Spjd__FBSDID("$FreeBSD: stable/10/sys/geom/eli/g_eli_integrity.c 330737 2018-03-10 04:17:01Z asomers $");
29159307Spjd
30159307Spjd#include <sys/param.h>
31159307Spjd#include <sys/systm.h>
32159307Spjd#include <sys/kernel.h>
33159307Spjd#include <sys/linker.h>
34159307Spjd#include <sys/module.h>
35159307Spjd#include <sys/lock.h>
36159307Spjd#include <sys/mutex.h>
37159307Spjd#include <sys/bio.h>
38159307Spjd#include <sys/sysctl.h>
39159307Spjd#include <sys/malloc.h>
40159307Spjd#include <sys/kthread.h>
41159307Spjd#include <sys/proc.h>
42159307Spjd#include <sys/sched.h>
43159307Spjd#include <sys/smp.h>
44159307Spjd#include <sys/uio.h>
45159307Spjd#include <sys/vnode.h>
46159307Spjd
47159307Spjd#include <vm/uma.h>
48159307Spjd
49159307Spjd#include <geom/geom.h>
50159307Spjd#include <geom/eli/g_eli.h>
51159307Spjd#include <geom/eli/pkcs5v2.h>
52159307Spjd
53159307Spjd/*
54159307Spjd * The data layout description when integrity verification is configured.
55159307Spjd *
56159307Spjd * One of the most important assumption here is that authenticated data and its
57159307Spjd * HMAC has to be stored in the same place (namely in the same sector) to make
58159307Spjd * it work reliable.
59159307Spjd * The problem is that file systems work only with sectors that are multiple of
60159307Spjd * 512 bytes and a power of two number.
61159307Spjd * My idea to implement it is as follows.
62159307Spjd * Let's store HMAC in sector. This is a must. This leaves us 480 bytes for
63159307Spjd * data. We can't use that directly (ie. we can't create provider with 480 bytes
64159307Spjd * sector size). We need another sector from where we take only 32 bytes of data
65159307Spjd * and we store HMAC of this data as well. This takes two sectors from the
66159307Spjd * original provider at the input and leaves us one sector of authenticated data
67159307Spjd * at the output. Not very efficient, but you got the idea.
68159307Spjd * Now, let's assume, we want to create provider with 4096 bytes sector.
69159307Spjd * To output 4096 bytes of authenticated data we need 8x480 plus 1x256, so we
70159307Spjd * need nine 512-bytes sectors at the input to get one 4096-bytes sector at the
71159307Spjd * output. That's better. With 4096 bytes sector we can use 89% of size of the
72159307Spjd * original provider. I find it as an acceptable cost.
73159307Spjd * The reliability comes from the fact, that every HMAC stored inside the sector
74159307Spjd * is calculated only for the data in the same sector, so its impossible to
75159307Spjd * write new data and leave old HMAC or vice versa.
76159307Spjd *
77159307Spjd * And here is the picture:
78159307Spjd *
79159307Spjd * da0: +----+----+ +----+----+ +----+----+ +----+----+ +----+----+ +----+----+ +----+----+ +----+----+ +----+-----+
80159307Spjd *      |32b |480b| |32b |480b| |32b |480b| |32b |480b| |32b |480b| |32b |480b| |32b |480b| |32b |480b| |32b |256b |
81159307Spjd *      |HMAC|Data| |HMAC|Data| |HMAC|Data| |HMAC|Data| |HMAC|Data| |HMAC|Data| |HMAC|Data| |HMAC|Data| |HMAC|Data |
82159307Spjd *      +----+----+ +----+----+ +----+----+ +----+----+ +----+----+ +----+----+ +----+----+ +----+----+ +----+-----+
83159307Spjd *      |512 bytes| |512 bytes| |512 bytes| |512 bytes| |512 bytes| |512 bytes| |512 bytes| |512 bytes| |288 bytes |
84159307Spjd *      +---------+ +---------+ +---------+ +---------+ +---------+ +---------+ +---------+ +---------+ |224 unused|
85159307Spjd *                                                                                                      +----------+
86159307Spjd * da0.eli: +----+----+----+----+----+----+----+----+----+
87159307Spjd *          |480b|480b|480b|480b|480b|480b|480b|480b|256b|
88159307Spjd *          +----+----+----+----+----+----+----+----+----+
89159307Spjd *          |                 4096 bytes                 |
90159307Spjd *          +--------------------------------------------+
91159307Spjd *
92159307Spjd * PS. You can use any sector size with geli(8). My example is using 4kB,
93159307Spjd *     because it's most efficient. For 8kB sectors you need 2 extra sectors,
94159307Spjd *     so the cost is the same as for 4kB sectors.
95159307Spjd */
96159307Spjd
97159307Spjd/*
98159307Spjd * Code paths:
99159307Spjd * BIO_READ:
100159307Spjd *	g_eli_start -> g_eli_auth_read -> g_io_request -> g_eli_read_done -> g_eli_auth_run -> g_eli_auth_read_done -> g_io_deliver
101159307Spjd * BIO_WRITE:
102159307Spjd *	g_eli_start -> g_eli_auth_run -> g_eli_auth_write_done -> g_io_request -> g_eli_write_done -> g_io_deliver
103159307Spjd */
104159307Spjd
105159307SpjdMALLOC_DECLARE(M_ELI);
106159307Spjd
107159307Spjd/*
108159307Spjd * Here we generate key for HMAC. Every sector has its own HMAC key, so it is
109159307Spjd * not possible to copy sectors.
110159307Spjd * We cannot depend on fact, that every sector has its own IV, because different
111159307Spjd * IV doesn't change HMAC, when we use encrypt-then-authenticate method.
112159307Spjd */
113159307Spjdstatic void
114159307Spjdg_eli_auth_keygen(struct g_eli_softc *sc, off_t offset, u_char *key)
115159307Spjd{
116159307Spjd	SHA256_CTX ctx;
117159307Spjd
118159307Spjd	/* Copy precalculated SHA256 context. */
119159307Spjd	bcopy(&sc->sc_akeyctx, &ctx, sizeof(ctx));
120159307Spjd	SHA256_Update(&ctx, (uint8_t *)&offset, sizeof(offset));
121159307Spjd	SHA256_Final(key, &ctx);
122159307Spjd}
123159307Spjd
124159307Spjd/*
125159307Spjd * The function is called after we read and decrypt data.
126159307Spjd *
127159307Spjd * g_eli_start -> g_eli_auth_read -> g_io_request -> g_eli_read_done -> g_eli_auth_run -> G_ELI_AUTH_READ_DONE -> g_io_deliver
128159307Spjd */
129159307Spjdstatic int
130159307Spjdg_eli_auth_read_done(struct cryptop *crp)
131159307Spjd{
132214118Spjd	struct g_eli_softc *sc;
133159307Spjd	struct bio *bp;
134159307Spjd
135159307Spjd	if (crp->crp_etype == EAGAIN) {
136159307Spjd		if (g_eli_crypto_rerun(crp) == 0)
137159307Spjd			return (0);
138159307Spjd	}
139159307Spjd	bp = (struct bio *)crp->crp_opaque;
140159307Spjd	bp->bio_inbed++;
141159307Spjd	if (crp->crp_etype == 0) {
142159307Spjd		bp->bio_completed += crp->crp_olen;
143159307Spjd		G_ELI_DEBUG(3, "Crypto READ request done (%d/%d) (add=%jd completed=%jd).",
144159307Spjd		    bp->bio_inbed, bp->bio_children, (intmax_t)crp->crp_olen, (intmax_t)bp->bio_completed);
145159307Spjd	} else {
146159307Spjd		G_ELI_DEBUG(1, "Crypto READ request failed (%d/%d) error=%d.",
147159307Spjd		    bp->bio_inbed, bp->bio_children, crp->crp_etype);
148159307Spjd		if (bp->bio_error == 0)
149159307Spjd			bp->bio_error = crp->crp_etype;
150159307Spjd	}
151220922Spjd	sc = bp->bio_to->geom->softc;
152221625Spjd	g_eli_key_drop(sc, crp->crp_desc->crd_next->crd_key);
153159307Spjd	/*
154159307Spjd	 * Do we have all sectors already?
155159307Spjd	 */
156159307Spjd	if (bp->bio_inbed < bp->bio_children)
157159307Spjd		return (0);
158159307Spjd	if (bp->bio_error == 0) {
159159307Spjd		u_int i, lsec, nsec, data_secsize, decr_secsize, encr_secsize;
160159307Spjd		u_char *srcdata, *dstdata, *auth;
161159307Spjd		off_t coroff, corsize;
162159307Spjd
163159307Spjd		/*
164159307Spjd		 * Verify data integrity based on calculated and read HMACs.
165159307Spjd		 */
166159307Spjd		/* Sectorsize of decrypted provider eg. 4096. */
167159307Spjd		decr_secsize = bp->bio_to->sectorsize;
168159307Spjd		/* The real sectorsize of encrypted provider, eg. 512. */
169159307Spjd		encr_secsize = LIST_FIRST(&sc->sc_geom->consumer)->provider->sectorsize;
170159307Spjd		/* Number of data bytes in one encrypted sector, eg. 480. */
171159307Spjd		data_secsize = sc->sc_data_per_sector;
172159307Spjd		/* Number of sectors from decrypted provider, eg. 2. */
173159307Spjd		nsec = bp->bio_length / decr_secsize;
174159307Spjd		/* Number of sectors from encrypted provider, eg. 18. */
175159307Spjd		nsec = (nsec * sc->sc_bytes_per_sector) / encr_secsize;
176159307Spjd		/* Last sector number in every big sector, eg. 9. */
177159307Spjd		lsec = sc->sc_bytes_per_sector / encr_secsize;
178159307Spjd
179159307Spjd		srcdata = bp->bio_driver2;
180159307Spjd		dstdata = bp->bio_data;
181159307Spjd		auth = srcdata + encr_secsize * nsec;
182159307Spjd		coroff = -1;
183159307Spjd		corsize = 0;
184159307Spjd
185159307Spjd		for (i = 1; i <= nsec; i++) {
186159307Spjd			data_secsize = sc->sc_data_per_sector;
187159307Spjd			if ((i % lsec) == 0)
188159307Spjd				data_secsize = decr_secsize % data_secsize;
189159307Spjd			if (bcmp(srcdata, auth, sc->sc_alen) != 0) {
190159307Spjd				/*
191159307Spjd				 * Curruption detected, remember the offset if
192159307Spjd				 * this is the first corrupted sector and
193159307Spjd				 * increase size.
194159307Spjd				 */
195159307Spjd				if (bp->bio_error == 0)
196159307Spjd					bp->bio_error = -1;
197159307Spjd				if (coroff == -1) {
198159307Spjd					coroff = bp->bio_offset +
199159307Spjd					    (dstdata - (u_char *)bp->bio_data);
200159307Spjd				}
201159307Spjd				corsize += data_secsize;
202159307Spjd			} else {
203159307Spjd				/*
204159307Spjd				 * No curruption, good.
205159307Spjd				 * Report previous corruption if there was one.
206159307Spjd				 */
207159307Spjd				if (coroff != -1) {
208235201Seadler					G_ELI_DEBUG(0, "%s: Failed to authenticate %jd "
209235419Seadler					    "bytes of data at offset %jd.",
210159307Spjd					    sc->sc_name, (intmax_t)corsize,
211159307Spjd					    (intmax_t)coroff);
212159307Spjd					coroff = -1;
213159307Spjd					corsize = 0;
214159307Spjd				}
215159307Spjd				bcopy(srcdata + sc->sc_alen, dstdata,
216159307Spjd				    data_secsize);
217159307Spjd			}
218159307Spjd			srcdata += encr_secsize;
219159307Spjd			dstdata += data_secsize;
220159307Spjd			auth += sc->sc_alen;
221159307Spjd		}
222159307Spjd		/* Report previous corruption if there was one. */
223159307Spjd		if (coroff != -1) {
224235201Seadler			G_ELI_DEBUG(0, "%s: Failed to authenticate %jd "
225235419Seadler			    "bytes of data at offset %jd.",
226159307Spjd			    sc->sc_name, (intmax_t)corsize, (intmax_t)coroff);
227159307Spjd		}
228159307Spjd	}
229159307Spjd	free(bp->bio_driver2, M_ELI);
230159307Spjd	bp->bio_driver2 = NULL;
231159307Spjd	if (bp->bio_error != 0) {
232159307Spjd		if (bp->bio_error == -1)
233159307Spjd			bp->bio_error = EINVAL;
234159307Spjd		else {
235159307Spjd			G_ELI_LOGREQ(0, bp,
236159307Spjd			    "Crypto READ request failed (error=%d).",
237159307Spjd			    bp->bio_error);
238159307Spjd		}
239159307Spjd		bp->bio_completed = 0;
240159307Spjd	}
241159307Spjd	/*
242159307Spjd	 * Read is finished, send it up.
243159307Spjd	 */
244159307Spjd	g_io_deliver(bp, bp->bio_error);
245214118Spjd	atomic_subtract_int(&sc->sc_inflight, 1);
246159307Spjd	return (0);
247159307Spjd}
248159307Spjd
249159307Spjd/*
250159307Spjd * The function is called after data encryption.
251159307Spjd *
252159307Spjd * g_eli_start -> g_eli_auth_run -> G_ELI_AUTH_WRITE_DONE -> g_io_request -> g_eli_write_done -> g_io_deliver
253159307Spjd */
254159307Spjdstatic int
255159307Spjdg_eli_auth_write_done(struct cryptop *crp)
256159307Spjd{
257159307Spjd	struct g_eli_softc *sc;
258159307Spjd	struct g_consumer *cp;
259159307Spjd	struct bio *bp, *cbp, *cbp2;
260159307Spjd	u_int nsec;
261159307Spjd
262159307Spjd	if (crp->crp_etype == EAGAIN) {
263159307Spjd		if (g_eli_crypto_rerun(crp) == 0)
264159307Spjd			return (0);
265159307Spjd	}
266159307Spjd	bp = (struct bio *)crp->crp_opaque;
267159307Spjd	bp->bio_inbed++;
268159307Spjd	if (crp->crp_etype == 0) {
269159307Spjd		G_ELI_DEBUG(3, "Crypto WRITE request done (%d/%d).",
270159307Spjd		    bp->bio_inbed, bp->bio_children);
271159307Spjd	} else {
272159307Spjd		G_ELI_DEBUG(1, "Crypto WRITE request failed (%d/%d) error=%d.",
273159307Spjd		    bp->bio_inbed, bp->bio_children, crp->crp_etype);
274159307Spjd		if (bp->bio_error == 0)
275159307Spjd			bp->bio_error = crp->crp_etype;
276159307Spjd	}
277220922Spjd	sc = bp->bio_to->geom->softc;
278220922Spjd	g_eli_key_drop(sc, crp->crp_desc->crd_key);
279159307Spjd	/*
280159307Spjd	 * All sectors are already encrypted?
281159307Spjd	 */
282159307Spjd	if (bp->bio_inbed < bp->bio_children)
283159307Spjd		return (0);
284159307Spjd	if (bp->bio_error != 0) {
285159307Spjd		G_ELI_LOGREQ(0, bp, "Crypto WRITE request failed (error=%d).",
286159307Spjd		    bp->bio_error);
287159307Spjd		free(bp->bio_driver2, M_ELI);
288159307Spjd		bp->bio_driver2 = NULL;
289159307Spjd		cbp = bp->bio_driver1;
290159307Spjd		bp->bio_driver1 = NULL;
291159307Spjd		g_destroy_bio(cbp);
292159307Spjd		g_io_deliver(bp, bp->bio_error);
293214118Spjd		atomic_subtract_int(&sc->sc_inflight, 1);
294159307Spjd		return (0);
295159307Spjd	}
296159307Spjd	cp = LIST_FIRST(&sc->sc_geom->consumer);
297159307Spjd	cbp = bp->bio_driver1;
298159307Spjd	bp->bio_driver1 = NULL;
299159307Spjd	cbp->bio_to = cp->provider;
300159307Spjd	cbp->bio_done = g_eli_write_done;
301159307Spjd
302159307Spjd	/* Number of sectors from decrypted provider, eg. 1. */
303159307Spjd	nsec = bp->bio_length / bp->bio_to->sectorsize;
304159307Spjd	/* Number of sectors from encrypted provider, eg. 9. */
305159307Spjd	nsec = (nsec * sc->sc_bytes_per_sector) / cp->provider->sectorsize;
306159307Spjd
307159307Spjd	cbp->bio_length = cp->provider->sectorsize * nsec;
308159307Spjd	cbp->bio_offset = (bp->bio_offset / bp->bio_to->sectorsize) * sc->sc_bytes_per_sector;
309159307Spjd	cbp->bio_data = bp->bio_driver2;
310159307Spjd
311159307Spjd	/*
312159307Spjd	 * We write more than what is requested, so we have to be ready to write
313159307Spjd	 * more than MAXPHYS.
314159307Spjd	 */
315159307Spjd	cbp2 = NULL;
316159307Spjd	if (cbp->bio_length > MAXPHYS) {
317159307Spjd		cbp2 = g_duplicate_bio(bp);
318159307Spjd		cbp2->bio_length = cbp->bio_length - MAXPHYS;
319159307Spjd		cbp2->bio_data = cbp->bio_data + MAXPHYS;
320159307Spjd		cbp2->bio_offset = cbp->bio_offset + MAXPHYS;
321159307Spjd		cbp2->bio_to = cp->provider;
322159307Spjd		cbp2->bio_done = g_eli_write_done;
323159307Spjd		cbp->bio_length = MAXPHYS;
324159307Spjd	}
325159307Spjd	/*
326159307Spjd	 * Send encrypted data to the provider.
327159307Spjd	 */
328159307Spjd	G_ELI_LOGREQ(2, cbp, "Sending request.");
329159307Spjd	bp->bio_inbed = 0;
330159307Spjd	bp->bio_children = (cbp2 != NULL ? 2 : 1);
331159307Spjd	g_io_request(cbp, cp);
332159307Spjd	if (cbp2 != NULL) {
333159307Spjd		G_ELI_LOGREQ(2, cbp2, "Sending request.");
334159307Spjd		g_io_request(cbp2, cp);
335159307Spjd	}
336159307Spjd	return (0);
337159307Spjd}
338159307Spjd
339159307Spjdvoid
340159307Spjdg_eli_auth_read(struct g_eli_softc *sc, struct bio *bp)
341159307Spjd{
342159307Spjd	struct g_consumer *cp;
343159307Spjd	struct bio *cbp, *cbp2;
344159307Spjd	size_t size;
345159307Spjd	off_t nsec;
346159307Spjd
347159307Spjd	bp->bio_pflags = 0;
348159307Spjd
349159307Spjd	cp = LIST_FIRST(&sc->sc_geom->consumer);
350159307Spjd	cbp = bp->bio_driver1;
351159307Spjd	bp->bio_driver1 = NULL;
352159307Spjd	cbp->bio_to = cp->provider;
353159307Spjd	cbp->bio_done = g_eli_read_done;
354159307Spjd
355159307Spjd	/* Number of sectors from decrypted provider, eg. 1. */
356159307Spjd	nsec = bp->bio_length / bp->bio_to->sectorsize;
357159307Spjd	/* Number of sectors from encrypted provider, eg. 9. */
358159307Spjd	nsec = (nsec * sc->sc_bytes_per_sector) / cp->provider->sectorsize;
359159307Spjd
360159307Spjd	cbp->bio_length = cp->provider->sectorsize * nsec;
361159307Spjd	size = cbp->bio_length;
362159307Spjd	size += sc->sc_alen * nsec;
363159307Spjd	size += sizeof(struct cryptop) * nsec;
364159307Spjd	size += sizeof(struct cryptodesc) * nsec * 2;
365159307Spjd	size += G_ELI_AUTH_SECKEYLEN * nsec;
366159307Spjd	size += sizeof(struct uio) * nsec;
367159307Spjd	size += sizeof(struct iovec) * nsec;
368159307Spjd	cbp->bio_offset = (bp->bio_offset / bp->bio_to->sectorsize) * sc->sc_bytes_per_sector;
369159307Spjd	bp->bio_driver2 = malloc(size, M_ELI, M_WAITOK);
370159307Spjd	cbp->bio_data = bp->bio_driver2;
371159307Spjd
372159307Spjd	/*
373159307Spjd	 * We read more than what is requested, so we have to be ready to read
374159307Spjd	 * more than MAXPHYS.
375159307Spjd	 */
376159307Spjd	cbp2 = NULL;
377159307Spjd	if (cbp->bio_length > MAXPHYS) {
378159307Spjd		cbp2 = g_duplicate_bio(bp);
379159307Spjd		cbp2->bio_length = cbp->bio_length - MAXPHYS;
380159307Spjd		cbp2->bio_data = cbp->bio_data + MAXPHYS;
381159307Spjd		cbp2->bio_offset = cbp->bio_offset + MAXPHYS;
382159307Spjd		cbp2->bio_to = cp->provider;
383159307Spjd		cbp2->bio_done = g_eli_read_done;
384159307Spjd		cbp->bio_length = MAXPHYS;
385159307Spjd	}
386159307Spjd	/*
387159307Spjd	 * Read encrypted data from provider.
388159307Spjd	 */
389159307Spjd	G_ELI_LOGREQ(2, cbp, "Sending request.");
390159307Spjd	g_io_request(cbp, cp);
391159307Spjd	if (cbp2 != NULL) {
392159307Spjd		G_ELI_LOGREQ(2, cbp2, "Sending request.");
393159307Spjd		g_io_request(cbp2, cp);
394159307Spjd	}
395159307Spjd}
396159307Spjd
397159307Spjd/*
398159307Spjd * This is the main function responsible for cryptography (ie. communication
399159307Spjd * with crypto(9) subsystem).
400214116Spjd *
401214116Spjd * BIO_READ:
402214116Spjd *	g_eli_start -> g_eli_auth_read -> g_io_request -> g_eli_read_done -> G_ELI_AUTH_RUN -> g_eli_auth_read_done -> g_io_deliver
403214116Spjd * BIO_WRITE:
404214116Spjd *	g_eli_start -> G_ELI_AUTH_RUN -> g_eli_auth_write_done -> g_io_request -> g_eli_write_done -> g_io_deliver
405159307Spjd */
406159307Spjdvoid
407159307Spjdg_eli_auth_run(struct g_eli_worker *wr, struct bio *bp)
408159307Spjd{
409159307Spjd	struct g_eli_softc *sc;
410159307Spjd	struct cryptop *crp;
411159307Spjd	struct cryptodesc *crde, *crda;
412159307Spjd	struct uio *uio;
413159307Spjd	struct iovec *iov;
414159307Spjd	u_int i, lsec, nsec, data_secsize, decr_secsize, encr_secsize;
415159307Spjd	off_t dstoff;
416159307Spjd	int err, error;
417159307Spjd	u_char *p, *data, *auth, *authkey, *plaindata;
418159307Spjd
419159307Spjd	G_ELI_LOGREQ(3, bp, "%s", __func__);
420159307Spjd
421159307Spjd	bp->bio_pflags = wr->w_number;
422159307Spjd	sc = wr->w_softc;
423159307Spjd	/* Sectorsize of decrypted provider eg. 4096. */
424159307Spjd	decr_secsize = bp->bio_to->sectorsize;
425159307Spjd	/* The real sectorsize of encrypted provider, eg. 512. */
426159307Spjd	encr_secsize = LIST_FIRST(&sc->sc_geom->consumer)->provider->sectorsize;
427159307Spjd	/* Number of data bytes in one encrypted sector, eg. 480. */
428159307Spjd	data_secsize = sc->sc_data_per_sector;
429159307Spjd	/* Number of sectors from decrypted provider, eg. 2. */
430159307Spjd	nsec = bp->bio_length / decr_secsize;
431159307Spjd	/* Number of sectors from encrypted provider, eg. 18. */
432159307Spjd	nsec = (nsec * sc->sc_bytes_per_sector) / encr_secsize;
433159307Spjd	/* Last sector number in every big sector, eg. 9. */
434159307Spjd	lsec = sc->sc_bytes_per_sector / encr_secsize;
435159307Spjd	/* Destination offset, used for IV generation. */
436159307Spjd	dstoff = (bp->bio_offset / bp->bio_to->sectorsize) * sc->sc_bytes_per_sector;
437159307Spjd
438159343Spjd	auth = NULL;	/* Silence compiler warning. */
439159307Spjd	plaindata = bp->bio_data;
440159307Spjd	if (bp->bio_cmd == BIO_READ) {
441159307Spjd		data = bp->bio_driver2;
442159307Spjd		auth = data + encr_secsize * nsec;
443159307Spjd		p = auth + sc->sc_alen * nsec;
444159307Spjd	} else {
445159307Spjd		size_t size;
446159307Spjd
447159307Spjd		size = encr_secsize * nsec;
448159307Spjd		size += sizeof(*crp) * nsec;
449159307Spjd		size += sizeof(*crde) * nsec;
450159307Spjd		size += sizeof(*crda) * nsec;
451159307Spjd		size += G_ELI_AUTH_SECKEYLEN * nsec;
452159307Spjd		size += sizeof(*uio) * nsec;
453159307Spjd		size += sizeof(*iov) * nsec;
454159307Spjd		data = malloc(size, M_ELI, M_WAITOK);
455159307Spjd		bp->bio_driver2 = data;
456159307Spjd		p = data + encr_secsize * nsec;
457159307Spjd	}
458159307Spjd	bp->bio_inbed = 0;
459159307Spjd	bp->bio_children = nsec;
460159307Spjd
461159307Spjd	error = 0;
462159307Spjd	for (i = 1; i <= nsec; i++, dstoff += encr_secsize) {
463159307Spjd		crp = (struct cryptop *)p;	p += sizeof(*crp);
464159307Spjd		crde = (struct cryptodesc *)p;	p += sizeof(*crde);
465159307Spjd		crda = (struct cryptodesc *)p;	p += sizeof(*crda);
466159307Spjd		authkey = (u_char *)p;		p += G_ELI_AUTH_SECKEYLEN;
467159307Spjd		uio = (struct uio *)p;		p += sizeof(*uio);
468159307Spjd		iov = (struct iovec *)p;	p += sizeof(*iov);
469159307Spjd
470159307Spjd		data_secsize = sc->sc_data_per_sector;
471330737Sasomers		if ((i % lsec) == 0) {
472159307Spjd			data_secsize = decr_secsize % data_secsize;
473330737Sasomers			/*
474330737Sasomers			 * Last encrypted sector of each decrypted sector is
475330737Sasomers			 * only partially filled.
476330737Sasomers			 */
477330737Sasomers			if (bp->bio_cmd == BIO_WRITE)
478330737Sasomers				memset(data + sc->sc_alen + data_secsize, 0,
479330737Sasomers				    encr_secsize - sc->sc_alen - data_secsize);
480330737Sasomers		}
481159307Spjd
482159307Spjd		if (bp->bio_cmd == BIO_READ) {
483159307Spjd			/* Remember read HMAC. */
484159307Spjd			bcopy(data, auth, sc->sc_alen);
485159307Spjd			auth += sc->sc_alen;
486159307Spjd			/* TODO: bzero(9) can be commented out later. */
487159307Spjd			bzero(data, sc->sc_alen);
488159307Spjd		} else {
489159307Spjd			bcopy(plaindata, data + sc->sc_alen, data_secsize);
490159307Spjd			plaindata += data_secsize;
491159307Spjd		}
492159307Spjd
493159307Spjd		iov->iov_len = sc->sc_alen + data_secsize;
494159307Spjd		iov->iov_base = data;
495159307Spjd		data += encr_secsize;
496159307Spjd
497159307Spjd		uio->uio_iov = iov;
498159307Spjd		uio->uio_iovcnt = 1;
499159307Spjd		uio->uio_segflg = UIO_SYSSPACE;
500159307Spjd		uio->uio_resid = iov->iov_len;
501159307Spjd
502159307Spjd		crp->crp_sid = wr->w_sid;
503159343Spjd		crp->crp_ilen = uio->uio_resid;
504160569Spjd		crp->crp_olen = data_secsize;
505159307Spjd		crp->crp_opaque = (void *)bp;
506159307Spjd		crp->crp_buf = (void *)uio;
507159307Spjd		crp->crp_flags = CRYPTO_F_IOV | CRYPTO_F_CBIFSYNC | CRYPTO_F_REL;
508159307Spjd		if (g_eli_batch)
509159307Spjd			crp->crp_flags |= CRYPTO_F_BATCH;
510159307Spjd		if (bp->bio_cmd == BIO_WRITE) {
511159307Spjd			crp->crp_callback = g_eli_auth_write_done;
512159307Spjd			crp->crp_desc = crde;
513159307Spjd			crde->crd_next = crda;
514159307Spjd			crda->crd_next = NULL;
515159307Spjd		} else {
516159307Spjd			crp->crp_callback = g_eli_auth_read_done;
517159307Spjd			crp->crp_desc = crda;
518159307Spjd			crda->crd_next = crde;
519159307Spjd			crde->crd_next = NULL;
520159307Spjd		}
521159307Spjd
522159307Spjd		crde->crd_skip = sc->sc_alen;
523159307Spjd		crde->crd_len = data_secsize;
524159307Spjd		crde->crd_flags = CRD_F_IV_EXPLICIT | CRD_F_IV_PRESENT;
525221628Spjd		if ((sc->sc_flags & G_ELI_FLAG_FIRST_KEY) == 0)
526221628Spjd			crde->crd_flags |= CRD_F_KEY_EXPLICIT;
527159307Spjd		if (bp->bio_cmd == BIO_WRITE)
528159307Spjd			crde->crd_flags |= CRD_F_ENCRYPT;
529159307Spjd		crde->crd_alg = sc->sc_ealgo;
530220922Spjd		crde->crd_key = g_eli_key_hold(sc, dstoff, encr_secsize);
531159307Spjd		crde->crd_klen = sc->sc_ekeylen;
532213070Spjd		if (sc->sc_ealgo == CRYPTO_AES_XTS)
533213070Spjd			crde->crd_klen <<= 1;
534159307Spjd		g_eli_crypto_ivgen(sc, dstoff, crde->crd_iv,
535159307Spjd		    sizeof(crde->crd_iv));
536159307Spjd
537159307Spjd		crda->crd_skip = sc->sc_alen;
538159307Spjd		crda->crd_len = data_secsize;
539159307Spjd		crda->crd_inject = 0;
540159307Spjd		crda->crd_flags = CRD_F_KEY_EXPLICIT;
541159307Spjd		crda->crd_alg = sc->sc_aalgo;
542159307Spjd		g_eli_auth_keygen(sc, dstoff, authkey);
543159307Spjd		crda->crd_key = authkey;
544159307Spjd		crda->crd_klen = G_ELI_AUTH_SECKEYLEN * 8;
545159307Spjd
546159307Spjd		crp->crp_etype = 0;
547159307Spjd		err = crypto_dispatch(crp);
548159307Spjd		if (err != 0 && error == 0)
549159307Spjd			error = err;
550159307Spjd	}
551159307Spjd	if (bp->bio_error == 0)
552159307Spjd		bp->bio_error = error;
553159307Spjd}
554