ctl_frontend_iscsi.c revision 264525
1/*-
2 * Copyright (c) 2012 The FreeBSD Foundation
3 * All rights reserved.
4 *
5 * This software was developed by Edward Tomasz Napierala under sponsorship
6 * from the FreeBSD Foundation.
7 *
8 * Redistribution and use in source and binary forms, with or without
9 * modification, are permitted provided that the following conditions
10 * are met:
11 * 1. Redistributions of source code must retain the above copyright
12 *    notice, this list of conditions and the following disclaimer.
13 * 2. Redistributions in binary form must reproduce the above copyright
14 *    notice, this list of conditions and the following disclaimer in the
15 *    documentation and/or other materials provided with the distribution.
16 *
17 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
18 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
19 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
20 * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
21 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
22 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
23 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
24 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
25 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
26 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
27 * SUCH DAMAGE.
28 *
29 * $FreeBSD: head/sys/cam/ctl/ctl_frontend_iscsi.c 264525 2014-04-16 10:18:44Z trasz $
30 */
31
32/*
33 * CTL frontend for the iSCSI protocol.
34 */
35
36#include <sys/cdefs.h>
37__FBSDID("$FreeBSD: head/sys/cam/ctl/ctl_frontend_iscsi.c 264525 2014-04-16 10:18:44Z trasz $");
38
39#include <sys/param.h>
40#include <sys/capsicum.h>
41#include <sys/condvar.h>
42#include <sys/file.h>
43#include <sys/kernel.h>
44#include <sys/kthread.h>
45#include <sys/lock.h>
46#include <sys/malloc.h>
47#include <sys/module.h>
48#include <sys/mutex.h>
49#include <sys/queue.h>
50#include <sys/sbuf.h>
51#include <sys/sysctl.h>
52#include <sys/systm.h>
53#include <sys/uio.h>
54#include <sys/unistd.h>
55#include <vm/uma.h>
56
57#include <cam/scsi/scsi_all.h>
58#include <cam/scsi/scsi_da.h>
59#include <cam/ctl/ctl_io.h>
60#include <cam/ctl/ctl.h>
61#include <cam/ctl/ctl_backend.h>
62#include <cam/ctl/ctl_error.h>
63#include <cam/ctl/ctl_frontend.h>
64#include <cam/ctl/ctl_frontend_internal.h>
65#include <cam/ctl/ctl_debug.h>
66#include <cam/ctl/ctl_ha.h>
67#include <cam/ctl/ctl_ioctl.h>
68#include <cam/ctl/ctl_private.h>
69
70#include "../../dev/iscsi/icl.h"
71#include "../../dev/iscsi/iscsi_proto.h"
72#include "ctl_frontend_iscsi.h"
73
74#ifdef ICL_KERNEL_PROXY
75#include <sys/socketvar.h>
76#endif
77
#ifdef ICL_KERNEL_PROXY
/* Registers the "cfiscsi_kernel_proxy" feature when built with ICL_KERNEL_PROXY. */
FEATURE(cfiscsi_kernel_proxy, "iSCSI target built with ICL_KERNEL_PROXY");
#endif

/* malloc(9) type used for this frontend's allocations (e.g. NOP-Out payload copies). */
static MALLOC_DEFINE(M_CFISCSI, "cfiscsi", "Memory used for CTL iSCSI frontend");
/* UMA zone that struct cfiscsi_data_wait entries are returned to with uma_zfree(). */
static uma_zone_t cfiscsi_data_wait_zone;

/*
 * Tunables and sysctls, all under kern.cam.ctl.iscsi.
 */
SYSCTL_NODE(_kern_cam_ctl, OID_AUTO, iscsi, CTLFLAG_RD, 0,
    "CAM Target Layer iSCSI Frontend");
/*
 * Verbosity: the CFISCSI_*WARN macros print when debug > 0, the
 * CFISCSI_*DEBUG macros print when debug > 1.
 */
static int debug = 3;
TUNABLE_INT("kern.cam.ctl.iscsi.debug", &debug);
SYSCTL_INT(_kern_cam_ctl_iscsi, OID_AUTO, debug, CTLFLAG_RWTUN,
    &debug, 1, "Enable debug messages");
/*
 * cfiscsi_callout() drops the connection once the per-session timeout
 * counter reaches this many ticks of its one-second callout.
 */
static int ping_timeout = 5;
TUNABLE_INT("kern.cam.ctl.iscsi.ping_timeout", &ping_timeout);
SYSCTL_INT(_kern_cam_ctl_iscsi, OID_AUTO, ping_timeout, CTLFLAG_RWTUN,
    &ping_timeout, 5, "Interval between ping (NOP-Out) requests, in seconds");
/*
 * Only consulted under ICL_KERNEL_PROXY: limit for the same counter while
 * the session is still in the login phase or waiting for ctld(8).
 */
static int login_timeout = 60;
TUNABLE_INT("kern.cam.ctl.iscsi.login_timeout", &login_timeout);
SYSCTL_INT(_kern_cam_ctl_iscsi, OID_AUTO, login_timeout, CTLFLAG_RWTUN,
    &login_timeout, 60, "Time to wait for ctld(8) to finish Login Phase, in seconds");
/*
 * Width of the CmdSN window: incoming CmdSN is accepted within
 * [cs_cmdsn, cs_cmdsn + maxcmdsn_delta], and MaxCmdSN in outgoing PDUs is
 * advertised as cs_cmdsn + maxcmdsn_delta.
 */
static int maxcmdsn_delta = 256;
TUNABLE_INT("kern.cam.ctl.iscsi.maxcmdsn_delta", &maxcmdsn_delta);
SYSCTL_INT(_kern_cam_ctl_iscsi, OID_AUTO, maxcmdsn_delta, CTLFLAG_RWTUN,
    &maxcmdsn_delta, 256, "Number of commands the initiator can send "
    "without confirmation");
104
/*
 * Logging helpers, gated by the "debug" sysctl: the *_WARN variants print
 * when debug > 0, the *_DEBUG variants when debug > 1.
 *
 * X must be a string literal (it is pasted between other literals) and is
 * followed by printf-style arguments.  The SESSION variants additionally
 * prefix the message with the initiator address and name of session S.
 * S is parenthesized in the expansion so that any pointer expression,
 * not just a plain identifier, can be passed.  Note that S is evaluated
 * twice, so it must not have side effects.
 */
#define	CFISCSI_DEBUG(X, ...)						\
	do {								\
		if (debug > 1) {					\
			printf("%s: " X "\n",				\
			    __func__, ## __VA_ARGS__);			\
		}							\
	} while (0)

#define	CFISCSI_WARN(X, ...)						\
	do {								\
		if (debug > 0) {					\
			printf("WARNING: %s: " X "\n",			\
			    __func__, ## __VA_ARGS__);			\
		}							\
	} while (0)

#define	CFISCSI_SESSION_DEBUG(S, X, ...)				\
	do {								\
		if (debug > 1) {					\
			printf("%s: %s (%s): " X "\n",			\
			    __func__, (S)->cs_initiator_addr,		\
			    (S)->cs_initiator_name, ## __VA_ARGS__);	\
		}							\
	} while (0)

#define	CFISCSI_SESSION_WARN(S, X, ...)					\
	do  {								\
		if (debug > 0) {					\
			printf("WARNING: %s (%s): " X "\n",		\
			    (S)->cs_initiator_addr,			\
			    (S)->cs_initiator_name, ## __VA_ARGS__);	\
		}							\
	} while (0)
138
/*
 * Session mutex helpers.  X is a pointer to the session; it is parenthesized
 * so that arbitrary pointer expressions expand correctly.
 */
#define CFISCSI_SESSION_LOCK(X)		mtx_lock(&(X)->cs_lock)
#define CFISCSI_SESSION_UNLOCK(X)	mtx_unlock(&(X)->cs_lock)
#define CFISCSI_SESSION_LOCK_ASSERT(X)	mtx_assert(&(X)->cs_lock, MA_OWNED)

/*
 * Accessors for the private fields ICL leaves to its consumer: the session
 * is stored in the connection's ic_prv0, and three per-PDU scratch values
 * live in ip_prv0..ip_prv2.
 */
#define	CONN_SESSION(X)			((struct cfiscsi_session *)(X)->ic_prv0)
#define	PDU_SESSION(X)			CONN_SESSION((X)->ip_conn)
#define	PDU_EXPDATASN(X)		(X)->ip_prv0
#define	PDU_TOTAL_TRANSFER_LEN(X)	(X)->ip_prv1
#define	PDU_R2TSN(X)			(X)->ip_prv2
148
/*
 * Forward declarations.  cfiscsi_init() is the only non-static entry point
 * declared here.
 */
int		cfiscsi_init(void);
static void	cfiscsi_online(void *arg);
static void	cfiscsi_offline(void *arg);
static int	cfiscsi_targ_enable(void *arg, struct ctl_id targ_id);
static int	cfiscsi_targ_disable(void *arg, struct ctl_id targ_id);
static int	cfiscsi_lun_enable(void *arg,
		    struct ctl_id target_id, int lun_id);
static int	cfiscsi_lun_disable(void *arg,
		    struct ctl_id target_id, int lun_id);
static int	cfiscsi_ioctl(struct cdev *dev,
		    u_long cmd, caddr_t addr, int flag, struct thread *td);
static int	cfiscsi_devid(struct ctl_scsiio *ctsio, int alloc_len);
static void	cfiscsi_datamove(union ctl_io *io);
static void	cfiscsi_done(union ctl_io *io);
static uint32_t	cfiscsi_map_lun(void *arg, uint32_t lun);
/* Handlers for incoming PDUs, dispatched from cfiscsi_pdu_handle(). */
static bool	cfiscsi_pdu_update_cmdsn(const struct icl_pdu *request);
static void	cfiscsi_pdu_handle_nop_out(struct icl_pdu *request);
static void	cfiscsi_pdu_handle_scsi_command(struct icl_pdu *request);
static void	cfiscsi_pdu_handle_task_request(struct icl_pdu *request);
static void	cfiscsi_pdu_handle_data_out(struct icl_pdu *request);
static void	cfiscsi_pdu_handle_logout_request(struct icl_pdu *request);
static void	cfiscsi_session_terminate(struct cfiscsi_session *cs);
static struct cfiscsi_target	*cfiscsi_target_find(struct cfiscsi_softc
		    *softc, const char *name);
static void	cfiscsi_target_release(struct cfiscsi_target *ct);
static void	cfiscsi_session_delete(struct cfiscsi_session *cs);

/* Single, file-wide frontend state; control_softc is defined elsewhere. */
static struct cfiscsi_softc cfiscsi_softc;
extern struct ctl_softc *control_softc;

static int cfiscsi_module_event_handler(module_t, int /*modeventtype_t*/, void *);

/*
 * Kernel module glue: the module is named "ctlcfiscsi", is driven by
 * cfiscsi_module_event_handler(), and declares dependencies on the "ctl"
 * and "icl" modules.
 */
static moduledata_t cfiscsi_moduledata = {
	"ctlcfiscsi",
	cfiscsi_module_event_handler,
	NULL
};

DECLARE_MODULE(ctlcfiscsi, cfiscsi_moduledata, SI_SUB_CONFIGURE, SI_ORDER_FOURTH);
MODULE_VERSION(ctlcfiscsi, 1);
MODULE_DEPEND(ctlcfiscsi, ctl, 1, 1, 1);
MODULE_DEPEND(ctlcfiscsi, icl, 1, 1, 1);
191
192static struct icl_pdu *
193cfiscsi_pdu_new_response(struct icl_pdu *request, int flags)
194{
195
196	return (icl_pdu_new_bhs(request->ip_conn, flags));
197}
198
199static bool
200cfiscsi_pdu_update_cmdsn(const struct icl_pdu *request)
201{
202	const struct iscsi_bhs_scsi_command *bhssc;
203	struct cfiscsi_session *cs;
204	uint32_t cmdsn, expstatsn;
205
206	cs = PDU_SESSION(request);
207
208	/*
209	 * Every incoming PDU - not just NOP-Out - resets the ping timer.
210	 * The purpose of the timeout is to reset the connection when it stalls;
211	 * we don't want this to happen when NOP-In or NOP-Out ends up delayed
212	 * in some queue.
213	 *
214	 * XXX: Locking?
215	 */
216	cs->cs_timeout = 0;
217
218	/*
219	 * Data-Out PDUs don't contain CmdSN.
220	 */
221	if ((request->ip_bhs->bhs_opcode & ~ISCSI_BHS_OPCODE_IMMEDIATE) ==
222	    ISCSI_BHS_OPCODE_SCSI_DATA_OUT)
223		return (false);
224
225	/*
226	 * We're only using fields common for all the request
227	 * (initiator -> target) PDUs.
228	 */
229	bhssc = (const struct iscsi_bhs_scsi_command *)request->ip_bhs;
230	cmdsn = ntohl(bhssc->bhssc_cmdsn);
231	expstatsn = ntohl(bhssc->bhssc_expstatsn);
232
233	CFISCSI_SESSION_LOCK(cs);
234#if 0
235	if (expstatsn != cs->cs_statsn) {
236		CFISCSI_SESSION_DEBUG(cs, "received PDU with ExpStatSN %d, "
237		    "while current StatSN is %d", expstatsn,
238		    cs->cs_statsn);
239	}
240#endif
241
242	/*
243	 * The target MUST silently ignore any non-immediate command outside
244	 * of this range.
245	 */
246	if (cmdsn < cs->cs_cmdsn || cmdsn > cs->cs_cmdsn + maxcmdsn_delta) {
247		CFISCSI_SESSION_UNLOCK(cs);
248		CFISCSI_SESSION_WARN(cs, "received PDU with CmdSN %d, "
249		    "while expected CmdSN was %d", cmdsn, cs->cs_cmdsn);
250		return (true);
251	}
252
253	if ((request->ip_bhs->bhs_opcode & ISCSI_BHS_OPCODE_IMMEDIATE) == 0)
254		cs->cs_cmdsn++;
255
256	CFISCSI_SESSION_UNLOCK(cs);
257
258	return (false);
259}
260
261static void
262cfiscsi_pdu_handle(struct icl_pdu *request)
263{
264	struct cfiscsi_session *cs;
265	bool ignore;
266
267	cs = PDU_SESSION(request);
268
269	ignore = cfiscsi_pdu_update_cmdsn(request);
270	if (ignore) {
271		icl_pdu_free(request);
272		return;
273	}
274
275	/*
276	 * Handle the PDU; this includes e.g. receiving the remaining
277	 * part of PDU and submitting the SCSI command to CTL
278	 * or queueing a reply.  The handling routine is responsible
279	 * for freeing the PDU when it's no longer needed.
280	 */
281	switch (request->ip_bhs->bhs_opcode &
282	    ~ISCSI_BHS_OPCODE_IMMEDIATE) {
283	case ISCSI_BHS_OPCODE_NOP_OUT:
284		cfiscsi_pdu_handle_nop_out(request);
285		break;
286	case ISCSI_BHS_OPCODE_SCSI_COMMAND:
287		cfiscsi_pdu_handle_scsi_command(request);
288		break;
289	case ISCSI_BHS_OPCODE_TASK_REQUEST:
290		cfiscsi_pdu_handle_task_request(request);
291		break;
292	case ISCSI_BHS_OPCODE_SCSI_DATA_OUT:
293		cfiscsi_pdu_handle_data_out(request);
294		break;
295	case ISCSI_BHS_OPCODE_LOGOUT_REQUEST:
296		cfiscsi_pdu_handle_logout_request(request);
297		break;
298	default:
299		CFISCSI_SESSION_WARN(cs, "received PDU with unsupported "
300		    "opcode 0x%x; dropping connection",
301		    request->ip_bhs->bhs_opcode);
302		icl_pdu_free(request);
303		cfiscsi_session_terminate(cs);
304	}
305
306}
307
/*
 * Receive callback: invoked with each PDU that arrives on a connection.
 *
 * With ICL_KERNEL_PROXY, while the session is waiting for ctld(8) or is
 * still in the login phase, the PDU is not processed here.  Instead it is
 * parked in cs_login_pdu (or freed, if one is already parked) and whoever
 * sleeps on cs_login_cv is woken up.  Otherwise the PDU goes through the
 * regular dispatcher.
 */
static void
cfiscsi_receive_callback(struct icl_pdu *request)
{
	struct cfiscsi_session *session;

	session = PDU_SESSION(request);

#ifdef ICL_KERNEL_PROXY
	if (session->cs_waiting_for_ctld || session->cs_login_phase) {
		if (session->cs_login_pdu != NULL)
			icl_pdu_free(request);
		else
			session->cs_login_pdu = request;
		cv_signal(&session->cs_login_cv);
		return;
	}
#endif

	cfiscsi_pdu_handle(request);
}
328
/*
 * Error callback for a connection: log the failure and terminate the
 * session that owns the connection.
 */
static void
cfiscsi_error_callback(struct icl_conn *ic)
{
	struct cfiscsi_session *session = CONN_SESSION(ic);

	CFISCSI_SESSION_WARN(session, "connection error; dropping connection");
	cfiscsi_session_terminate(session);
}
339
340static int
341cfiscsi_pdu_prepare(struct icl_pdu *response)
342{
343	struct cfiscsi_session *cs;
344	struct iscsi_bhs_scsi_response *bhssr;
345	bool advance_statsn = true;
346
347	cs = PDU_SESSION(response);
348
349	CFISCSI_SESSION_LOCK_ASSERT(cs);
350
351	/*
352	 * We're only using fields common for all the response
353	 * (target -> initiator) PDUs.
354	 */
355	bhssr = (struct iscsi_bhs_scsi_response *)response->ip_bhs;
356
357	/*
358	 * 10.8.3: "The StatSN for this connection is not advanced
359	 * after this PDU is sent."
360	 */
361	if (bhssr->bhssr_opcode == ISCSI_BHS_OPCODE_R2T)
362		advance_statsn = false;
363
364	/*
365	 * 10.19.2: "However, when the Initiator Task Tag is set to 0xffffffff,
366	 * StatSN for the connection is not advanced after this PDU is sent."
367	 */
368	if (bhssr->bhssr_opcode == ISCSI_BHS_OPCODE_NOP_IN &&
369	    bhssr->bhssr_initiator_task_tag == 0xffffffff)
370		advance_statsn = false;
371
372	/*
373	 * See the comment below - StatSN is not meaningful and must
374	 * not be advanced.
375	 */
376	if (bhssr->bhssr_opcode == ISCSI_BHS_OPCODE_SCSI_DATA_IN)
377		advance_statsn = false;
378
379	/*
380	 * 10.7.3: "The fields StatSN, Status, and Residual Count
381	 * only have meaningful content if the S bit is set to 1."
382	 */
383	if (bhssr->bhssr_opcode != ISCSI_BHS_OPCODE_SCSI_DATA_IN)
384		bhssr->bhssr_statsn = htonl(cs->cs_statsn);
385	bhssr->bhssr_expcmdsn = htonl(cs->cs_cmdsn);
386	bhssr->bhssr_maxcmdsn = htonl(cs->cs_cmdsn + maxcmdsn_delta);
387
388	if (advance_statsn)
389		cs->cs_statsn++;
390
391	return (0);
392}
393
/*
 * Stamp the sequence numbers into an outgoing PDU and queue it for
 * transmission.  Both steps happen under the session lock, so the order
 * in which PDUs are numbered matches the order in which they are queued.
 */
static void
cfiscsi_pdu_queue(struct icl_pdu *response)
{
	struct cfiscsi_session *session = PDU_SESSION(response);

	CFISCSI_SESSION_LOCK(session);
	(void)cfiscsi_pdu_prepare(response);
	icl_pdu_queue(response);
	CFISCSI_SESSION_UNLOCK(session);
}
406
/*
 * Convert the 8-byte LUN field of an iSCSI PDU into a flat LUN number.
 *
 * "encoded" is the field exactly as found in the PDU header; it is examined
 * byte by byte, in memory order.  The top two bits of the first byte select
 * the addressing method:
 *
 *   0x00  peripheral device addressing: LUN is byte 1;
 *   0x40  flat space addressing: LUN is the low 6 bits of byte 0 and byte 1;
 *   0xC0  extended flat space addressing (byte 0 must be 0xD2): LUN is
 *         bytes 1-3.
 *
 * All the bytes not used by the selected method must be zero.  Returns
 * the decoded LUN, or 0xffffffff when the field is malformed or uses
 * an addressing method we don't support.
 */
static uint32_t
cfiscsi_decode_lun(uint64_t encoded)
{
	uint8_t lun[8];
	uint32_t result;

	/*
	 * The LUN field in iSCSI PDUs may look like an ordinary 64 bit number,
	 * but is in fact an evil, multidimensional structure defined
	 * in SCSI Architecture Model 5 (SAM-5), section 4.6.
	 */
	memcpy(lun, &encoded, sizeof(lun));
	switch (lun[0] & 0xC0) {
	case 0x00:
		if ((lun[0] & 0x3f) != 0 || lun[2] != 0 || lun[3] != 0 ||
		    lun[4] != 0 || lun[5] != 0 || lun[6] != 0 || lun[7] != 0) {
			CFISCSI_WARN("malformed LUN "
			    "(peripheral device addressing method): 0x%jx",
			    (uintmax_t)encoded);
			result = 0xffffffff;
			break;
		}
		result = lun[1];
		break;
	case 0x40:
		if (lun[2] != 0 || lun[3] != 0 || lun[4] != 0 || lun[5] != 0 ||
		    lun[6] != 0 || lun[7] != 0) {
			CFISCSI_WARN("malformed LUN "
			    "(flat address space addressing method): 0x%jx",
			    (uintmax_t)encoded);
			result = 0xffffffff;
			break;
		}
		result = ((lun[0] & 0x3f) << 8) + lun[1];
		break;
	case 0xC0:
		if (lun[0] != 0xD2 || lun[4] != 0 || lun[5] != 0 ||
		    lun[6] != 0 || lun[7] != 0) {
			CFISCSI_WARN("malformed LUN (extended flat "
			    "address space addressing method): 0x%jx",
			    (uintmax_t)encoded);
			result = 0xffffffff;
			break;
		}
		result = (lun[1] << 16) + (lun[2] << 8) + lun[3];
		/*
		 * Without this break a valid LUN would fall through into
		 * the default case and be reported as unsupported.
		 */
		break;
	default:
		CFISCSI_WARN("unsupported LUN format 0x%jx",
		    (uintmax_t)encoded);
		result = 0xffffffff;
		break;
	}

	return (result);
}
461
462static void
463cfiscsi_pdu_handle_nop_out(struct icl_pdu *request)
464{
465	struct cfiscsi_session *cs;
466	struct iscsi_bhs_nop_out *bhsno;
467	struct iscsi_bhs_nop_in *bhsni;
468	struct icl_pdu *response;
469	void *data = NULL;
470	size_t datasize;
471	int error;
472
473	cs = PDU_SESSION(request);
474	bhsno = (struct iscsi_bhs_nop_out *)request->ip_bhs;
475
476	if (bhsno->bhsno_initiator_task_tag == 0xffffffff) {
477		/*
478		 * Nothing to do, iscsi_pdu_update_statsn() already
479		 * zeroed the timeout.
480		 */
481		icl_pdu_free(request);
482		return;
483	}
484
485	datasize = icl_pdu_data_segment_length(request);
486	if (datasize > 0) {
487		data = malloc(datasize, M_CFISCSI, M_NOWAIT | M_ZERO);
488		if (data == NULL) {
489			CFISCSI_SESSION_WARN(cs, "failed to allocate memory; "
490			    "dropping connection");
491			icl_pdu_free(request);
492			cfiscsi_session_terminate(cs);
493			return;
494		}
495		icl_pdu_get_data(request, 0, data, datasize);
496	}
497
498	response = cfiscsi_pdu_new_response(request, M_NOWAIT);
499	if (response == NULL) {
500		CFISCSI_SESSION_WARN(cs, "failed to allocate memory; "
501		    "droppping connection");
502		free(data, M_CFISCSI);
503		icl_pdu_free(request);
504		cfiscsi_session_terminate(cs);
505		return;
506	}
507	bhsni = (struct iscsi_bhs_nop_in *)response->ip_bhs;
508	bhsni->bhsni_opcode = ISCSI_BHS_OPCODE_NOP_IN;
509	bhsni->bhsni_flags = 0x80;
510	bhsni->bhsni_initiator_task_tag = bhsno->bhsno_initiator_task_tag;
511	bhsni->bhsni_target_transfer_tag = 0xffffffff;
512	if (datasize > 0) {
513		error = icl_pdu_append_data(response, data, datasize, M_NOWAIT);
514		if (error != 0) {
515			CFISCSI_SESSION_WARN(cs, "failed to allocate memory; "
516			    "dropping connection");
517			free(data, M_CFISCSI);
518			icl_pdu_free(request);
519			icl_pdu_free(response);
520			cfiscsi_session_terminate(cs);
521			return;
522		}
523		free(data, M_CFISCSI);
524	}
525
526	icl_pdu_free(request);
527	cfiscsi_pdu_queue(response);
528}
529
530static void
531cfiscsi_pdu_handle_scsi_command(struct icl_pdu *request)
532{
533	struct iscsi_bhs_scsi_command *bhssc;
534	struct cfiscsi_session *cs;
535	union ctl_io *io;
536	int error;
537
538	cs = PDU_SESSION(request);
539	bhssc = (struct iscsi_bhs_scsi_command *)request->ip_bhs;
540	//CFISCSI_SESSION_DEBUG(cs, "initiator task tag 0x%x",
541	//    bhssc->bhssc_initiator_task_tag);
542
543	if (request->ip_data_len > 0 && cs->cs_immediate_data == false) {
544		CFISCSI_SESSION_WARN(cs, "unsolicited data with "
545		    "ImmediateData=No; dropping connection");
546		icl_pdu_free(request);
547		cfiscsi_session_terminate(cs);
548		return;
549	}
550	io = ctl_alloc_io(cs->cs_target->ct_softc->fe.ctl_pool_ref);
551	if (io == NULL) {
552		CFISCSI_SESSION_WARN(cs, "can't allocate ctl_io; "
553		    "dropping connection");
554		icl_pdu_free(request);
555		cfiscsi_session_terminate(cs);
556		return;
557	}
558	ctl_zero_io(io);
559	io->io_hdr.ctl_private[CTL_PRIV_FRONTEND].ptr = request;
560	io->io_hdr.io_type = CTL_IO_SCSI;
561	io->io_hdr.nexus.initid.id = cs->cs_ctl_initid;
562	io->io_hdr.nexus.targ_port = cs->cs_target->ct_softc->fe.targ_port;
563	io->io_hdr.nexus.targ_target.id = 0;
564	io->io_hdr.nexus.targ_lun = cfiscsi_decode_lun(bhssc->bhssc_lun);
565	io->io_hdr.nexus.lun_map_fn = cfiscsi_map_lun;
566	io->io_hdr.nexus.lun_map_arg = cs;
567	io->scsiio.tag_num = bhssc->bhssc_initiator_task_tag;
568	switch ((bhssc->bhssc_flags & BHSSC_FLAGS_ATTR)) {
569	case BHSSC_FLAGS_ATTR_UNTAGGED:
570		io->scsiio.tag_type = CTL_TAG_UNTAGGED;
571		break;
572	case BHSSC_FLAGS_ATTR_SIMPLE:
573		io->scsiio.tag_type = CTL_TAG_SIMPLE;
574		break;
575	case BHSSC_FLAGS_ATTR_ORDERED:
576        	io->scsiio.tag_type = CTL_TAG_ORDERED;
577		break;
578	case BHSSC_FLAGS_ATTR_HOQ:
579        	io->scsiio.tag_type = CTL_TAG_HEAD_OF_QUEUE;
580		break;
581	case BHSSC_FLAGS_ATTR_ACA:
582		io->scsiio.tag_type = CTL_TAG_ACA;
583		break;
584	default:
585		io->scsiio.tag_type = CTL_TAG_UNTAGGED;
586		CFISCSI_SESSION_WARN(cs, "unhandled tag type %d",
587		    bhssc->bhssc_flags & BHSSC_FLAGS_ATTR);
588		break;
589	}
590	io->scsiio.cdb_len = sizeof(bhssc->bhssc_cdb); /* Which is 16. */
591	memcpy(io->scsiio.cdb, bhssc->bhssc_cdb, sizeof(bhssc->bhssc_cdb));
592	refcount_acquire(&cs->cs_outstanding_ctl_pdus);
593	error = ctl_queue(io);
594	if (error != CTL_RETVAL_COMPLETE) {
595		CFISCSI_SESSION_WARN(cs, "ctl_queue() failed; error %d; "
596		    "dropping connection", error);
597		ctl_free_io(io);
598		refcount_release(&cs->cs_outstanding_ctl_pdus);
599		icl_pdu_free(request);
600		cfiscsi_session_terminate(cs);
601	}
602}
603
604static void
605cfiscsi_pdu_handle_task_request(struct icl_pdu *request)
606{
607	struct iscsi_bhs_task_management_request *bhstmr;
608	struct iscsi_bhs_task_management_response *bhstmr2;
609	struct icl_pdu *response;
610	struct cfiscsi_session *cs;
611	union ctl_io *io;
612	int error;
613
614	cs = PDU_SESSION(request);
615	bhstmr = (struct iscsi_bhs_task_management_request *)request->ip_bhs;
616	io = ctl_alloc_io(cs->cs_target->ct_softc->fe.ctl_pool_ref);
617	if (io == NULL) {
618		CFISCSI_SESSION_WARN(cs, "can't allocate ctl_io;"
619		    "dropping connection");
620		icl_pdu_free(request);
621		cfiscsi_session_terminate(cs);
622		return;
623	}
624	ctl_zero_io(io);
625	io->io_hdr.ctl_private[CTL_PRIV_FRONTEND].ptr = request;
626	io->io_hdr.io_type = CTL_IO_TASK;
627	io->io_hdr.nexus.initid.id = cs->cs_ctl_initid;
628	io->io_hdr.nexus.targ_port = cs->cs_target->ct_softc->fe.targ_port;
629	io->io_hdr.nexus.targ_target.id = 0;
630	io->io_hdr.nexus.targ_lun = cfiscsi_decode_lun(bhstmr->bhstmr_lun);
631	io->io_hdr.nexus.lun_map_fn = cfiscsi_map_lun;
632	io->io_hdr.nexus.lun_map_arg = cs;
633	io->taskio.tag_type = CTL_TAG_SIMPLE; /* XXX */
634
635	switch (bhstmr->bhstmr_function & ~0x80) {
636	case BHSTMR_FUNCTION_ABORT_TASK:
637#if 0
638		CFISCSI_SESSION_DEBUG(cs, "BHSTMR_FUNCTION_ABORT_TASK");
639#endif
640		io->taskio.task_action = CTL_TASK_ABORT_TASK;
641		io->taskio.tag_num = bhstmr->bhstmr_referenced_task_tag;
642		break;
643	case BHSTMR_FUNCTION_LOGICAL_UNIT_RESET:
644#if 0
645		CFISCSI_SESSION_DEBUG(cs, "BHSTMR_FUNCTION_LOGICAL_UNIT_RESET");
646#endif
647		io->taskio.task_action = CTL_TASK_LUN_RESET;
648		break;
649	case BHSTMR_FUNCTION_TARGET_WARM_RESET:
650#if 0
651		CFISCSI_SESSION_DEBUG(cs, "BHSTMR_FUNCTION_TARGET_WARM_RESET");
652#endif
653		io->taskio.task_action = CTL_TASK_TARGET_RESET;
654		break;
655	default:
656		CFISCSI_SESSION_DEBUG(cs, "unsupported function 0x%x",
657		    bhstmr->bhstmr_function & ~0x80);
658		ctl_free_io(io);
659
660		response = cfiscsi_pdu_new_response(request, M_NOWAIT);
661		if (response == NULL) {
662			CFISCSI_SESSION_WARN(cs, "failed to allocate memory; "
663			    "dropping connection");
664			icl_pdu_free(request);
665			cfiscsi_session_terminate(cs);
666			return;
667		}
668		bhstmr2 = (struct iscsi_bhs_task_management_response *)
669		    response->ip_bhs;
670		bhstmr2->bhstmr_opcode = ISCSI_BHS_OPCODE_TASK_RESPONSE;
671		bhstmr2->bhstmr_flags = 0x80;
672		bhstmr2->bhstmr_response =
673		    BHSTMR_RESPONSE_FUNCTION_NOT_SUPPORTED;
674		bhstmr2->bhstmr_initiator_task_tag =
675		    bhstmr->bhstmr_initiator_task_tag;
676		icl_pdu_free(request);
677		cfiscsi_pdu_queue(response);
678		return;
679	}
680
681	refcount_acquire(&cs->cs_outstanding_ctl_pdus);
682	error = ctl_queue(io);
683	if (error != CTL_RETVAL_COMPLETE) {
684		CFISCSI_SESSION_WARN(cs, "ctl_queue() failed; error %d; "
685		    "dropping connection", error);
686		ctl_free_io(io);
687		refcount_release(&cs->cs_outstanding_ctl_pdus);
688		icl_pdu_free(request);
689		cfiscsi_session_terminate(cs);
690	}
691}
692
693static bool
694cfiscsi_handle_data_segment(struct icl_pdu *request, struct cfiscsi_data_wait *cdw)
695{
696	struct iscsi_bhs_data_out *bhsdo;
697	struct cfiscsi_session *cs;
698	struct ctl_sg_entry ctl_sg_entry, *ctl_sglist;
699	size_t copy_len, len, off, buffer_offset;
700	int ctl_sg_count;
701	union ctl_io *io;
702
703	cs = PDU_SESSION(request);
704
705	KASSERT((request->ip_bhs->bhs_opcode & ~ISCSI_BHS_OPCODE_IMMEDIATE) ==
706	    ISCSI_BHS_OPCODE_SCSI_DATA_OUT ||
707	    (request->ip_bhs->bhs_opcode & ~ISCSI_BHS_OPCODE_IMMEDIATE) ==
708	    ISCSI_BHS_OPCODE_SCSI_COMMAND,
709	    ("bad opcode 0x%x", request->ip_bhs->bhs_opcode));
710
711	/*
712	 * We're only using fields common for Data Out and SCSI Command PDUs.
713	 */
714	bhsdo = (struct iscsi_bhs_data_out *)request->ip_bhs;
715
716	io = cdw->cdw_ctl_io;
717	KASSERT((io->io_hdr.flags & CTL_FLAG_DATA_MASK) != CTL_FLAG_DATA_IN,
718	    ("CTL_FLAG_DATA_IN"));
719
720#if 0
721	CFISCSI_SESSION_DEBUG(cs, "received %zd bytes out of %d",
722	    request->ip_data_len, io->scsiio.kern_total_len);
723#endif
724
725	if (io->scsiio.kern_sg_entries > 0) {
726		ctl_sglist = (struct ctl_sg_entry *)io->scsiio.kern_data_ptr;
727		ctl_sg_count = io->scsiio.kern_sg_entries;
728	} else {
729		ctl_sglist = &ctl_sg_entry;
730		ctl_sglist->addr = io->scsiio.kern_data_ptr;
731		ctl_sglist->len = io->scsiio.kern_data_len;
732		ctl_sg_count = 1;
733	}
734
735	if ((request->ip_bhs->bhs_opcode & ~ISCSI_BHS_OPCODE_IMMEDIATE) ==
736	    ISCSI_BHS_OPCODE_SCSI_DATA_OUT)
737		buffer_offset = ntohl(bhsdo->bhsdo_buffer_offset);
738	else
739		buffer_offset = 0;
740
741	/*
742	 * Make sure the offset, as sent by the initiator, matches the offset
743	 * we're supposed to be at in the scatter-gather list.
744	 */
745	if (buffer_offset != io->scsiio.ext_data_filled) {
746		CFISCSI_SESSION_WARN(cs, "received bad buffer offset %zd, "
747		    "expected %zd", buffer_offset,
748		    (size_t)io->scsiio.ext_data_filled);
749		cfiscsi_session_terminate(cs);
750		return (true);
751	}
752
753	/*
754	 * This is the offset within the PDU data segment, as opposed
755	 * to buffer_offset, which is the offset within the task (SCSI
756	 * command).
757	 */
758	off = 0;
759	len = icl_pdu_data_segment_length(request);
760
761	/*
762	 * Iterate over the scatter/gather segments, filling them with data
763	 * from the PDU data segment.  Note that this can get called multiple
764	 * times for one SCSI command; the cdw structure holds state for the
765	 * scatter/gather list.
766	 */
767	for (;;) {
768		KASSERT(cdw->cdw_sg_index < ctl_sg_count,
769		    ("cdw->cdw_sg_index >= ctl_sg_count"));
770		if (cdw->cdw_sg_len == 0) {
771			cdw->cdw_sg_addr = ctl_sglist[cdw->cdw_sg_index].addr;
772			cdw->cdw_sg_len = ctl_sglist[cdw->cdw_sg_index].len;
773		}
774		KASSERT(off <= len, ("len > off"));
775		copy_len = len - off;
776		if (copy_len > cdw->cdw_sg_len)
777			copy_len = cdw->cdw_sg_len;
778
779		icl_pdu_get_data(request, off, cdw->cdw_sg_addr, copy_len);
780		cdw->cdw_sg_addr += copy_len;
781		cdw->cdw_sg_len -= copy_len;
782		off += copy_len;
783		io->scsiio.ext_data_filled += copy_len;
784
785		if (cdw->cdw_sg_len == 0) {
786			/*
787			 * End of current segment.
788			 */
789			if (cdw->cdw_sg_index == ctl_sg_count - 1) {
790				/*
791				 * Last segment in scatter/gather list.
792				 */
793				break;
794			}
795			cdw->cdw_sg_index++;
796		}
797
798		if (off == len) {
799			/*
800			 * End of PDU payload.
801			 */
802			break;
803		}
804	}
805
806	if (len > off) {
807		CFISCSI_SESSION_WARN(cs, "received too much data: got %zd bytes, "
808		    "expected %zd", icl_pdu_data_segment_length(request), off);
809		cfiscsi_session_terminate(cs);
810		return (true);
811	}
812
813	if (bhsdo->bhsdo_flags & BHSDO_FLAGS_F ||
814	    io->scsiio.ext_data_filled == io->scsiio.kern_total_len) {
815		if ((bhsdo->bhsdo_flags & BHSDO_FLAGS_F) == 0) {
816			CFISCSI_SESSION_WARN(cs, "got the final packet without "
817			    "the F flag; flags = 0x%x; dropping connection",
818			    bhsdo->bhsdo_flags);
819			cfiscsi_session_terminate(cs);
820			return (true);
821		}
822
823		if (io->scsiio.ext_data_filled != io->scsiio.kern_total_len) {
824			if ((request->ip_bhs->bhs_opcode & ~ISCSI_BHS_OPCODE_IMMEDIATE) ==
825			    ISCSI_BHS_OPCODE_SCSI_DATA_OUT) {
826				CFISCSI_SESSION_WARN(cs, "got the final packet, but the "
827				    "transmitted size was %zd bytes instead of %d; "
828				    "dropping connection",
829				    (size_t)io->scsiio.ext_data_filled,
830				    io->scsiio.kern_total_len);
831				cfiscsi_session_terminate(cs);
832				return (true);
833			} else {
834				/*
835				 * For SCSI Command PDU, this just means we need to
836				 * solicit more data by sending R2T.
837				 */
838				return (false);
839			}
840		}
841#if 0
842		CFISCSI_SESSION_DEBUG(cs, "no longer expecting Data-Out with target "
843		    "transfer tag 0x%x", cdw->cdw_target_transfer_tag);
844#endif
845
846		return (true);
847	}
848
849	return (false);
850}
851
852static void
853cfiscsi_pdu_handle_data_out(struct icl_pdu *request)
854{
855	struct iscsi_bhs_data_out *bhsdo;
856	struct cfiscsi_session *cs;
857	struct cfiscsi_data_wait *cdw = NULL;
858	union ctl_io *io;
859	bool done;
860
861	cs = PDU_SESSION(request);
862	bhsdo = (struct iscsi_bhs_data_out *)request->ip_bhs;
863
864	CFISCSI_SESSION_LOCK(cs);
865	TAILQ_FOREACH(cdw, &cs->cs_waiting_for_data_out, cdw_next) {
866#if 0
867		CFISCSI_SESSION_DEBUG(cs, "have ttt 0x%x, itt 0x%x; looking for "
868		    "ttt 0x%x, itt 0x%x",
869		    bhsdo->bhsdo_target_transfer_tag,
870		    bhsdo->bhsdo_initiator_task_tag,
871		    cdw->cdw_target_transfer_tag, cdw->cdw_initiator_task_tag));
872#endif
873		if (bhsdo->bhsdo_target_transfer_tag ==
874		    cdw->cdw_target_transfer_tag)
875			break;
876	}
877	CFISCSI_SESSION_UNLOCK(cs);
878	if (cdw == NULL) {
879		CFISCSI_SESSION_WARN(cs, "data transfer tag 0x%x, initiator task tag "
880		    "0x%x, not found; dropping connection",
881		    bhsdo->bhsdo_target_transfer_tag, bhsdo->bhsdo_initiator_task_tag);
882		icl_pdu_free(request);
883		cfiscsi_session_terminate(cs);
884		return;
885	}
886
887	io = cdw->cdw_ctl_io;
888	KASSERT((io->io_hdr.flags & CTL_FLAG_DATA_MASK) != CTL_FLAG_DATA_IN,
889	    ("CTL_FLAG_DATA_IN"));
890
891	done = cfiscsi_handle_data_segment(request, cdw);
892	if (done) {
893		CFISCSI_SESSION_LOCK(cs);
894		TAILQ_REMOVE(&cs->cs_waiting_for_data_out, cdw, cdw_next);
895		CFISCSI_SESSION_UNLOCK(cs);
896		uma_zfree(cfiscsi_data_wait_zone, cdw);
897		io->scsiio.be_move_done(io);
898	}
899
900	icl_pdu_free(request);
901}
902
903static void
904cfiscsi_pdu_handle_logout_request(struct icl_pdu *request)
905{
906	struct iscsi_bhs_logout_request *bhslr;
907	struct iscsi_bhs_logout_response *bhslr2;
908	struct icl_pdu *response;
909	struct cfiscsi_session *cs;
910
911	cs = PDU_SESSION(request);
912	bhslr = (struct iscsi_bhs_logout_request *)request->ip_bhs;
913	switch (bhslr->bhslr_reason & 0x7f) {
914	case BHSLR_REASON_CLOSE_SESSION:
915	case BHSLR_REASON_CLOSE_CONNECTION:
916		response = cfiscsi_pdu_new_response(request, M_NOWAIT);
917		if (response == NULL) {
918			CFISCSI_SESSION_DEBUG(cs, "failed to allocate memory");
919			icl_pdu_free(request);
920			cfiscsi_session_terminate(cs);
921			return;
922		}
923		bhslr2 = (struct iscsi_bhs_logout_response *)response->ip_bhs;
924		bhslr2->bhslr_opcode = ISCSI_BHS_OPCODE_LOGOUT_RESPONSE;
925		bhslr2->bhslr_flags = 0x80;
926		bhslr2->bhslr_response = BHSLR_RESPONSE_CLOSED_SUCCESSFULLY;
927		bhslr2->bhslr_initiator_task_tag =
928		    bhslr->bhslr_initiator_task_tag;
929		icl_pdu_free(request);
930		cfiscsi_pdu_queue(response);
931		cfiscsi_session_terminate(cs);
932		break;
933	case BHSLR_REASON_REMOVE_FOR_RECOVERY:
934		response = cfiscsi_pdu_new_response(request, M_NOWAIT);
935		if (response == NULL) {
936			CFISCSI_SESSION_WARN(cs,
937			    "failed to allocate memory; dropping connection");
938			icl_pdu_free(request);
939			cfiscsi_session_terminate(cs);
940			return;
941		}
942		bhslr2 = (struct iscsi_bhs_logout_response *)response->ip_bhs;
943		bhslr2->bhslr_opcode = ISCSI_BHS_OPCODE_LOGOUT_RESPONSE;
944		bhslr2->bhslr_flags = 0x80;
945		bhslr2->bhslr_response = BHSLR_RESPONSE_RECOVERY_NOT_SUPPORTED;
946		bhslr2->bhslr_initiator_task_tag =
947		    bhslr->bhslr_initiator_task_tag;
948		icl_pdu_free(request);
949		cfiscsi_pdu_queue(response);
950		break;
951	default:
952		CFISCSI_SESSION_WARN(cs, "invalid reason 0%x; dropping connection",
953		    bhslr->bhslr_reason);
954		icl_pdu_free(request);
955		cfiscsi_session_terminate(cs);
956		break;
957	}
958}
959
960static void
961cfiscsi_callout(void *context)
962{
963	struct icl_pdu *cp;
964	struct iscsi_bhs_nop_in *bhsni;
965	struct cfiscsi_session *cs;
966
967	cs = context;
968
969	if (cs->cs_terminating)
970		return;
971
972	callout_schedule(&cs->cs_callout, 1 * hz);
973
974	atomic_add_int(&cs->cs_timeout, 1);
975
976#ifdef ICL_KERNEL_PROXY
977	if (cs->cs_waiting_for_ctld || cs->cs_login_phase) {
978		if (cs->cs_timeout > login_timeout) {
979			CFISCSI_SESSION_WARN(cs, "login timed out after "
980			    "%d seconds; dropping connection", cs->cs_timeout);
981			cfiscsi_session_terminate(cs);
982		}
983		return;
984	}
985#endif
986
987	if (cs->cs_timeout >= ping_timeout) {
988		CFISCSI_SESSION_WARN(cs, "no ping reply (NOP-Out) after %d seconds; "
989		    "dropping connection",  ping_timeout);
990		cfiscsi_session_terminate(cs);
991		return;
992	}
993
994	/*
995	 * If the ping was reset less than one second ago - which means
996	 * that we've received some PDU during the last second - assume
997	 * the traffic flows correctly and don't bother sending a NOP-Out.
998	 *
999	 * (It's 2 - one for one second, and one for incrementing is_timeout
1000	 * earlier in this routine.)
1001	 */
1002	if (cs->cs_timeout < 2)
1003		return;
1004
1005	cp = icl_pdu_new_bhs(cs->cs_conn, M_NOWAIT);
1006	if (cp == NULL) {
1007		CFISCSI_SESSION_WARN(cs, "failed to allocate memory");
1008		return;
1009	}
1010	bhsni = (struct iscsi_bhs_nop_in *)cp->ip_bhs;
1011	bhsni->bhsni_opcode = ISCSI_BHS_OPCODE_NOP_IN;
1012	bhsni->bhsni_flags = 0x80;
1013	bhsni->bhsni_initiator_task_tag = 0xffffffff;
1014
1015	cfiscsi_pdu_queue(cp);
1016}
1017
1018static void
1019cfiscsi_session_terminate_tasks(struct cfiscsi_session *cs)
1020{
1021	struct cfiscsi_data_wait *cdw, *tmpcdw;
1022	union ctl_io *io;
1023	int error;
1024
1025#ifdef notyet
1026	io = ctl_alloc_io(cs->cs_target->ct_softc->fe.ctl_pool_ref);
1027	if (io == NULL) {
1028		CFISCSI_SESSION_WARN(cs, "can't allocate ctl_io");
1029		return;
1030	}
1031	ctl_zero_io(io);
1032	io->io_hdr.ctl_private[CTL_PRIV_FRONTEND].ptr = NULL;
1033	io->io_hdr.io_type = CTL_IO_TASK;
1034	io->io_hdr.nexus.initid.id = cs->cs_ctl_initid;
1035	io->io_hdr.nexus.targ_port = cs->cs_target->ct_softc->fe.targ_port;
1036	io->io_hdr.nexus.targ_target.id = 0;
1037	io->io_hdr.nexus.targ_lun = lun;
1038	io->taskio.tag_type = CTL_TAG_SIMPLE; /* XXX */
1039	io->taskio.task_action = CTL_TASK_ABORT_TASK_SET;
1040	error = ctl_queue(io);
1041	if (error != CTL_RETVAL_COMPLETE) {
1042		CFISCSI_SESSION_WARN(cs, "ctl_queue() failed; error %d", error);
1043		ctl_free_io(io);
1044	}
1045#else
1046	/*
1047	 * CTL doesn't currently support CTL_TASK_ABORT_TASK_SET, so instead
1048	 * just iterate over tasks that are waiting for something - data - and
1049	 * terminate those.
1050	 */
1051	CFISCSI_SESSION_LOCK(cs);
1052	TAILQ_FOREACH_SAFE(cdw,
1053	    &cs->cs_waiting_for_data_out, cdw_next, tmpcdw) {
1054		io = ctl_alloc_io(cs->cs_target->ct_softc->fe.ctl_pool_ref);
1055		if (io == NULL) {
1056			CFISCSI_SESSION_WARN(cs, "can't allocate ctl_io");
1057			return;
1058		}
1059		ctl_zero_io(io);
1060		io->io_hdr.ctl_private[CTL_PRIV_FRONTEND].ptr = NULL;
1061		io->io_hdr.io_type = CTL_IO_TASK;
1062		io->io_hdr.nexus.initid.id = cs->cs_ctl_initid;
1063		io->io_hdr.nexus.targ_port =
1064		    cs->cs_target->ct_softc->fe.targ_port;
1065		io->io_hdr.nexus.targ_target.id = 0;
1066		//io->io_hdr.nexus.targ_lun = lun; /* Not needed? */
1067		io->taskio.tag_type = CTL_TAG_SIMPLE; /* XXX */
1068		io->taskio.task_action = CTL_TASK_ABORT_TASK;
1069		io->taskio.tag_num = cdw->cdw_initiator_task_tag;
1070		error = ctl_queue(io);
1071		if (error != CTL_RETVAL_COMPLETE) {
1072			CFISCSI_SESSION_WARN(cs, "ctl_queue() failed; error %d", error);
1073			ctl_free_io(io);
1074			return;
1075		}
1076#if 0
1077		CFISCSI_SESSION_DEBUG(cs, "removing csw for initiator task tag "
1078		    "0x%x", cdw->cdw_initiator_task_tag);
1079#endif
1080		cdw->cdw_ctl_io->scsiio.be_move_done(cdw->cdw_ctl_io);
1081		TAILQ_REMOVE(&cs->cs_waiting_for_data_out, cdw, cdw_next);
1082		uma_zfree(cfiscsi_data_wait_zone, cdw);
1083	}
1084	CFISCSI_SESSION_UNLOCK(cs);
1085#endif
1086}
1087
1088static void
1089cfiscsi_maintenance_thread(void *arg)
1090{
1091	struct cfiscsi_session *cs;
1092
1093	cs = arg;
1094
1095	for (;;) {
1096		CFISCSI_SESSION_LOCK(cs);
1097		if (cs->cs_terminating == false)
1098			cv_wait(&cs->cs_maintenance_cv, &cs->cs_lock);
1099		CFISCSI_SESSION_UNLOCK(cs);
1100
1101		if (cs->cs_terminating) {
1102			cfiscsi_session_terminate_tasks(cs);
1103			callout_drain(&cs->cs_callout);
1104
1105			icl_conn_shutdown(cs->cs_conn);
1106			icl_conn_close(cs->cs_conn);
1107
1108			cs->cs_terminating++;
1109
1110			/*
1111			 * XXX: We used to wait up to 30 seconds to deliver queued PDUs
1112			 * 	to the initiator.  We also tried hard to deliver SCSI Responses
1113			 * 	for the aborted PDUs.  We don't do that anymore.  We might need
1114			 * 	to revisit that.
1115			 */
1116
1117			cfiscsi_session_delete(cs);
1118			kthread_exit();
1119			return;
1120		}
1121		CFISCSI_SESSION_DEBUG(cs, "nothing to do");
1122	}
1123}
1124
1125static void
1126cfiscsi_session_terminate(struct cfiscsi_session *cs)
1127{
1128
1129	if (cs->cs_terminating != 0)
1130		return;
1131	cs->cs_terminating = 1;
1132	cv_signal(&cs->cs_maintenance_cv);
1133}
1134
1135static int
1136cfiscsi_session_register_initiator(struct cfiscsi_session *cs)
1137{
1138	int error, i;
1139	struct cfiscsi_softc *softc;
1140
1141	KASSERT(cs->cs_ctl_initid == -1, ("already registered"));
1142
1143	softc = &cfiscsi_softc;
1144
1145	mtx_lock(&softc->lock);
1146	for (i = 0; i < softc->max_initiators; i++) {
1147		if (softc->ctl_initids[i] == 0)
1148			break;
1149	}
1150	if (i == softc->max_initiators) {
1151		CFISCSI_SESSION_WARN(cs, "too many concurrent sessions (%d)",
1152		    softc->max_initiators);
1153		mtx_unlock(&softc->lock);
1154		return (1);
1155	}
1156	softc->ctl_initids[i] = 1;
1157	mtx_unlock(&softc->lock);
1158
1159#if 0
1160	CFISCSI_SESSION_DEBUG(cs, "adding initiator id %d, max %d",
1161	    i, softc->max_initiators);
1162#endif
1163	cs->cs_ctl_initid = i;
1164	error = ctl_add_initiator(0x0, softc->fe.targ_port, cs->cs_ctl_initid);
1165	if (error != 0) {
1166		CFISCSI_SESSION_WARN(cs, "ctl_add_initiator failed with error %d", error);
1167		mtx_lock(&softc->lock);
1168		softc->ctl_initids[cs->cs_ctl_initid] = 0;
1169		mtx_unlock(&softc->lock);
1170		cs->cs_ctl_initid = -1;
1171		return (1);
1172	}
1173
1174	return (0);
1175}
1176
1177static void
1178cfiscsi_session_unregister_initiator(struct cfiscsi_session *cs)
1179{
1180	int error;
1181	struct cfiscsi_softc *softc;
1182
1183	if (cs->cs_ctl_initid == -1)
1184		return;
1185
1186	softc = &cfiscsi_softc;
1187
1188	error = ctl_remove_initiator(softc->fe.targ_port, cs->cs_ctl_initid);
1189	if (error != 0) {
1190		CFISCSI_SESSION_WARN(cs, "ctl_remove_initiator failed with error %d",
1191		    error);
1192	}
1193	mtx_lock(&softc->lock);
1194	softc->ctl_initids[cs->cs_ctl_initid] = 0;
1195	mtx_unlock(&softc->lock);
1196	cs->cs_ctl_initid = -1;
1197}
1198
1199static struct cfiscsi_session *
1200cfiscsi_session_new(struct cfiscsi_softc *softc)
1201{
1202	struct cfiscsi_session *cs;
1203	int error;
1204
1205	cs = malloc(sizeof(*cs), M_CFISCSI, M_NOWAIT | M_ZERO);
1206	if (cs == NULL) {
1207		CFISCSI_WARN("malloc failed");
1208		return (NULL);
1209	}
1210	cs->cs_ctl_initid = -1;
1211
1212	refcount_init(&cs->cs_outstanding_ctl_pdus, 0);
1213	TAILQ_INIT(&cs->cs_waiting_for_data_out);
1214	mtx_init(&cs->cs_lock, "cfiscsi_lock", NULL, MTX_DEF);
1215	cv_init(&cs->cs_maintenance_cv, "cfiscsi_mt");
1216#ifdef ICL_KERNEL_PROXY
1217	cv_init(&cs->cs_login_cv, "cfiscsi_login");
1218#endif
1219
1220	cs->cs_conn = icl_conn_new("cfiscsi", &cs->cs_lock);
1221	cs->cs_conn->ic_receive = cfiscsi_receive_callback;
1222	cs->cs_conn->ic_error = cfiscsi_error_callback;
1223	cs->cs_conn->ic_prv0 = cs;
1224
1225	error = kthread_add(cfiscsi_maintenance_thread, cs, NULL, NULL, 0, 0, "cfiscsimt");
1226	if (error != 0) {
1227		CFISCSI_SESSION_WARN(cs, "kthread_add(9) failed with error %d", error);
1228		free(cs, M_CFISCSI);
1229		return (NULL);
1230	}
1231
1232	mtx_lock(&softc->lock);
1233	cs->cs_id = softc->last_session_id + 1;
1234	softc->last_session_id++;
1235	mtx_unlock(&softc->lock);
1236
1237	mtx_lock(&softc->lock);
1238	TAILQ_INSERT_TAIL(&softc->sessions, cs, cs_next);
1239	mtx_unlock(&softc->lock);
1240
1241	/*
1242	 * Start pinging the initiator.
1243	 */
1244	callout_init(&cs->cs_callout, 1);
1245	callout_reset(&cs->cs_callout, 1 * hz, cfiscsi_callout, cs);
1246
1247	return (cs);
1248}
1249
1250static void
1251cfiscsi_session_delete(struct cfiscsi_session *cs)
1252{
1253	struct cfiscsi_softc *softc;
1254
1255	softc = &cfiscsi_softc;
1256
1257	KASSERT(cs->cs_outstanding_ctl_pdus == 0,
1258	    ("destroying session with outstanding CTL pdus"));
1259	KASSERT(TAILQ_EMPTY(&cs->cs_waiting_for_data_out),
1260	    ("destroying session with non-empty queue"));
1261
1262	cfiscsi_session_unregister_initiator(cs);
1263	if (cs->cs_target != NULL)
1264		cfiscsi_target_release(cs->cs_target);
1265	icl_conn_close(cs->cs_conn);
1266	icl_conn_free(cs->cs_conn);
1267
1268	mtx_lock(&softc->lock);
1269	TAILQ_REMOVE(&softc->sessions, cs, cs_next);
1270	mtx_unlock(&softc->lock);
1271
1272	free(cs, M_CFISCSI);
1273}
1274
1275int
1276cfiscsi_init(void)
1277{
1278	struct cfiscsi_softc *softc;
1279	struct ctl_frontend *fe;
1280	int retval;
1281
1282	softc = &cfiscsi_softc;
1283	retval = 0;
1284	bzero(softc, sizeof(*softc));
1285	mtx_init(&softc->lock, "cfiscsi", NULL, MTX_DEF);
1286
1287#ifdef ICL_KERNEL_PROXY
1288	cv_init(&softc->accept_cv, "cfiscsi_accept");
1289#endif
1290	TAILQ_INIT(&softc->sessions);
1291	TAILQ_INIT(&softc->targets);
1292
1293	fe = &softc->fe;
1294	fe->port_type = CTL_PORT_ISCSI;
1295	/* XXX KDM what should the real number be here? */
1296	fe->num_requested_ctl_io = 4096;
1297	snprintf(softc->port_name, sizeof(softc->port_name), "iscsi");
1298	fe->port_name = softc->port_name;
1299	fe->port_online = cfiscsi_online;
1300	fe->port_offline = cfiscsi_offline;
1301	fe->onoff_arg = softc;
1302	fe->targ_enable = cfiscsi_targ_enable;
1303	fe->targ_disable = cfiscsi_targ_disable;
1304	fe->lun_enable = cfiscsi_lun_enable;
1305	fe->lun_disable = cfiscsi_lun_disable;
1306	fe->targ_lun_arg = softc;
1307	fe->ioctl = cfiscsi_ioctl;
1308	fe->devid = cfiscsi_devid;
1309	fe->fe_datamove = cfiscsi_datamove;
1310	fe->fe_done = cfiscsi_done;
1311
1312	/* XXX KDM what should we report here? */
1313	/* XXX These should probably be fetched from CTL. */
1314	fe->max_targets = 1;
1315	fe->max_target_id = 15;
1316
1317	retval = ctl_frontend_register(fe, /*master_SC*/ 1);
1318	if (retval != 0) {
1319		CFISCSI_WARN("ctl_frontend_register() failed with error %d",
1320		    retval);
1321		retval = 1;
1322		goto bailout;
1323	}
1324
1325	softc->max_initiators = fe->max_initiators;
1326
1327	cfiscsi_data_wait_zone = uma_zcreate("cfiscsi_data_wait",
1328	    sizeof(struct cfiscsi_data_wait), NULL, NULL, NULL, NULL,
1329	    UMA_ALIGN_PTR, 0);
1330
1331	return (0);
1332
1333bailout:
1334	return (retval);
1335}
1336
1337static int
1338cfiscsi_module_event_handler(module_t mod, int what, void *arg)
1339{
1340
1341	switch (what) {
1342	case MOD_LOAD:
1343		return (cfiscsi_init());
1344	case MOD_UNLOAD:
1345		return (EBUSY);
1346	default:
1347		return (EOPNOTSUPP);
1348	}
1349}
1350
1351#ifdef ICL_KERNEL_PROXY
1352static void
1353cfiscsi_accept(struct socket *so)
1354{
1355	struct cfiscsi_session *cs;
1356
1357	cs = cfiscsi_session_new(&cfiscsi_softc);
1358	if (cs == NULL) {
1359		CFISCSI_WARN("failed to create session");
1360		return;
1361	}
1362
1363	icl_conn_handoff_sock(cs->cs_conn, so);
1364	cs->cs_waiting_for_ctld = true;
1365	cv_signal(&cfiscsi_softc.accept_cv);
1366}
1367#endif
1368
1369static void
1370cfiscsi_online(void *arg)
1371{
1372	struct cfiscsi_softc *softc;
1373
1374	softc = (struct cfiscsi_softc *)arg;
1375
1376	softc->online = 1;
1377#ifdef ICL_KERNEL_PROXY
1378	if (softc->listener != NULL)
1379		icl_listen_free(softc->listener);
1380	softc->listener = icl_listen_new(cfiscsi_accept);
1381#endif
1382}
1383
1384static void
1385cfiscsi_offline(void *arg)
1386{
1387	struct cfiscsi_softc *softc;
1388	struct cfiscsi_session *cs;
1389
1390	softc = (struct cfiscsi_softc *)arg;
1391
1392	softc->online = 0;
1393
1394	mtx_lock(&softc->lock);
1395	TAILQ_FOREACH(cs, &softc->sessions, cs_next)
1396		cfiscsi_session_terminate(cs);
1397	mtx_unlock(&softc->lock);
1398
1399#ifdef ICL_KERNEL_PROXY
1400	icl_listen_free(softc->listener);
1401	softc->listener = NULL;
1402#endif
1403}
1404
1405static int
1406cfiscsi_targ_enable(void *arg, struct ctl_id targ_id)
1407{
1408
1409	return (0);
1410}
1411
1412static int
1413cfiscsi_targ_disable(void *arg, struct ctl_id targ_id)
1414{
1415
1416	return (0);
1417}
1418
1419static void
1420cfiscsi_ioctl_handoff(struct ctl_iscsi *ci)
1421{
1422	struct cfiscsi_softc *softc;
1423	struct cfiscsi_session *cs;
1424	struct cfiscsi_target *ct;
1425	struct ctl_iscsi_handoff_params *cihp;
1426	int error;
1427
1428	cihp = (struct ctl_iscsi_handoff_params *)&(ci->data);
1429	softc = &cfiscsi_softc;
1430
1431	CFISCSI_DEBUG("new connection from %s (%s) to %s",
1432	    cihp->initiator_name, cihp->initiator_addr,
1433	    cihp->target_name);
1434
1435	if (softc->online == 0) {
1436		ci->status = CTL_ISCSI_ERROR;
1437		snprintf(ci->error_str, sizeof(ci->error_str),
1438		    "%s: port offline", __func__);
1439		return;
1440	}
1441
1442	ct = cfiscsi_target_find(softc, cihp->target_name);
1443	if (ct == NULL) {
1444		ci->status = CTL_ISCSI_ERROR;
1445		snprintf(ci->error_str, sizeof(ci->error_str),
1446		    "%s: target not found", __func__);
1447		return;
1448	}
1449
1450#ifdef ICL_KERNEL_PROXY
1451	if (cihp->socket > 0 && cihp->connection_id > 0) {
1452		snprintf(ci->error_str, sizeof(ci->error_str),
1453		    "both socket and connection_id set");
1454		ci->status = CTL_ISCSI_ERROR;
1455		cfiscsi_target_release(ct);
1456		return;
1457	}
1458	if (cihp->socket == 0) {
1459		mtx_lock(&cfiscsi_softc.lock);
1460		TAILQ_FOREACH(cs, &cfiscsi_softc.sessions, cs_next) {
1461			if (cs->cs_id == cihp->socket)
1462				break;
1463		}
1464		if (cs == NULL) {
1465			mtx_unlock(&cfiscsi_softc.lock);
1466			snprintf(ci->error_str, sizeof(ci->error_str),
1467			    "connection not found");
1468			ci->status = CTL_ISCSI_ERROR;
1469			cfiscsi_target_release(ct);
1470			return;
1471		}
1472		mtx_unlock(&cfiscsi_softc.lock);
1473	} else {
1474#endif
1475		cs = cfiscsi_session_new(softc);
1476		if (cs == NULL) {
1477			ci->status = CTL_ISCSI_ERROR;
1478			snprintf(ci->error_str, sizeof(ci->error_str),
1479			    "%s: cfiscsi_session_new failed", __func__);
1480			cfiscsi_target_release(ct);
1481			return;
1482		}
1483#ifdef ICL_KERNEL_PROXY
1484	}
1485#endif
1486	cs->cs_target = ct;
1487
1488	/*
1489	 * First PDU of Full Feature phase has the same CmdSN as the last
1490	 * PDU from the Login Phase received from the initiator.  Thus,
1491	 * the -1 below.
1492	 */
1493	cs->cs_portal_group_tag = cihp->portal_group_tag;
1494	cs->cs_cmdsn = cihp->cmdsn;
1495	cs->cs_statsn = cihp->statsn;
1496	cs->cs_max_data_segment_length = cihp->max_recv_data_segment_length;
1497	cs->cs_max_burst_length = cihp->max_burst_length;
1498	cs->cs_immediate_data = !!cihp->immediate_data;
1499	if (cihp->header_digest == CTL_ISCSI_DIGEST_CRC32C)
1500		cs->cs_conn->ic_header_crc32c = true;
1501	if (cihp->data_digest == CTL_ISCSI_DIGEST_CRC32C)
1502		cs->cs_conn->ic_data_crc32c = true;
1503
1504	strlcpy(cs->cs_initiator_name,
1505	    cihp->initiator_name, sizeof(cs->cs_initiator_name));
1506	strlcpy(cs->cs_initiator_addr,
1507	    cihp->initiator_addr, sizeof(cs->cs_initiator_addr));
1508	strlcpy(cs->cs_initiator_alias,
1509	    cihp->initiator_alias, sizeof(cs->cs_initiator_alias));
1510
1511#ifdef ICL_KERNEL_PROXY
1512	if (cihp->socket > 0) {
1513#endif
1514		error = icl_conn_handoff(cs->cs_conn, cihp->socket);
1515		if (error != 0) {
1516			cfiscsi_session_delete(cs);
1517			ci->status = CTL_ISCSI_ERROR;
1518			snprintf(ci->error_str, sizeof(ci->error_str),
1519			    "%s: icl_conn_handoff failed with error %d",
1520			    __func__, error);
1521			return;
1522		}
1523#ifdef ICL_KERNEL_PROXY
1524	}
1525#endif
1526
1527	/*
1528	 * Register initiator with CTL.
1529	 */
1530	cfiscsi_session_register_initiator(cs);
1531
1532#ifdef ICL_KERNEL_PROXY
1533	cs->cs_login_phase = false;
1534
1535	/*
1536	 * First PDU of the Full Feature phase has likely already arrived.
1537	 * We have to pick it up and execute properly.
1538	 */
1539	if (cs->cs_login_pdu != NULL) {
1540		CFISCSI_SESSION_DEBUG(cs, "picking up first PDU");
1541		cfiscsi_pdu_handle(cs->cs_login_pdu);
1542		cs->cs_login_pdu = NULL;
1543	}
1544#endif
1545
1546	ci->status = CTL_ISCSI_OK;
1547}
1548
1549static void
1550cfiscsi_ioctl_list(struct ctl_iscsi *ci)
1551{
1552	struct ctl_iscsi_list_params *cilp;
1553	struct cfiscsi_session *cs;
1554	struct cfiscsi_softc *softc;
1555	struct sbuf *sb;
1556	int error;
1557
1558	cilp = (struct ctl_iscsi_list_params *)&(ci->data);
1559	softc = &cfiscsi_softc;
1560
1561	sb = sbuf_new(NULL, NULL, cilp->alloc_len, SBUF_FIXEDLEN);
1562	if (sb == NULL) {
1563		ci->status = CTL_ISCSI_ERROR;
1564		snprintf(ci->error_str, sizeof(ci->error_str),
1565		    "Unable to allocate %d bytes for iSCSI session list",
1566		    cilp->alloc_len);
1567		return;
1568	}
1569
1570	sbuf_printf(sb, "<ctlislist>\n");
1571	mtx_lock(&softc->lock);
1572	TAILQ_FOREACH(cs, &softc->sessions, cs_next) {
1573#ifdef ICL_KERNEL_PROXY
1574		if (cs->cs_target == NULL)
1575			continue;
1576#endif
1577		error = sbuf_printf(sb, "<connection id=\"%d\">"
1578		    "<initiator>%s</initiator>"
1579		    "<initiator_addr>%s</initiator_addr>"
1580		    "<initiator_alias>%s</initiator_alias>"
1581		    "<target>%s</target>"
1582		    "<target_alias>%s</target_alias>"
1583		    "<header_digest>%s</header_digest>"
1584		    "<data_digest>%s</data_digest>"
1585		    "<max_data_segment_length>%zd</max_data_segment_length>"
1586		    "<immediate_data>%d</immediate_data>"
1587		    "<iser>%d</iser>"
1588		    "</connection>\n",
1589		    cs->cs_id,
1590		    cs->cs_initiator_name, cs->cs_initiator_addr, cs->cs_initiator_alias,
1591		    cs->cs_target->ct_name, cs->cs_target->ct_alias,
1592		    cs->cs_conn->ic_header_crc32c ? "CRC32C" : "None",
1593		    cs->cs_conn->ic_data_crc32c ? "CRC32C" : "None",
1594		    cs->cs_max_data_segment_length,
1595		    cs->cs_immediate_data,
1596		    cs->cs_conn->ic_iser);
1597		if (error != 0)
1598			break;
1599	}
1600	mtx_unlock(&softc->lock);
1601	error = sbuf_printf(sb, "</ctlislist>\n");
1602	if (error != 0) {
1603		sbuf_delete(sb);
1604		ci->status = CTL_ISCSI_LIST_NEED_MORE_SPACE;
1605		snprintf(ci->error_str, sizeof(ci->error_str),
1606		    "Out of space, %d bytes is too small", cilp->alloc_len);
1607		return;
1608	}
1609	sbuf_finish(sb);
1610
1611	error = copyout(sbuf_data(sb), cilp->conn_xml, sbuf_len(sb) + 1);
1612	cilp->fill_len = sbuf_len(sb) + 1;
1613	ci->status = CTL_ISCSI_OK;
1614	sbuf_delete(sb);
1615}
1616
1617static void
1618cfiscsi_ioctl_terminate(struct ctl_iscsi *ci)
1619{
1620	struct icl_pdu *response;
1621	struct iscsi_bhs_asynchronous_message *bhsam;
1622	struct ctl_iscsi_terminate_params *citp;
1623	struct cfiscsi_session *cs;
1624	struct cfiscsi_softc *softc;
1625	int found = 0;
1626
1627	citp = (struct ctl_iscsi_terminate_params *)&(ci->data);
1628	softc = &cfiscsi_softc;
1629
1630	mtx_lock(&softc->lock);
1631	TAILQ_FOREACH(cs, &softc->sessions, cs_next) {
1632		if (citp->all == 0 && cs->cs_id != citp->connection_id &&
1633		    strcmp(cs->cs_initiator_name, citp->initiator_name) != 0 &&
1634		    strcmp(cs->cs_initiator_addr, citp->initiator_addr) != 0)
1635			continue;
1636
1637		response = icl_pdu_new_bhs(cs->cs_conn, M_NOWAIT);
1638		if (response == NULL) {
1639			/*
1640			 * Oh well.  Just terminate the connection.
1641			 */
1642		} else {
1643			bhsam = (struct iscsi_bhs_asynchronous_message *)
1644			    response->ip_bhs;
1645			bhsam->bhsam_opcode = ISCSI_BHS_OPCODE_ASYNC_MESSAGE;
1646			bhsam->bhsam_flags = 0x80;
1647			bhsam->bhsam_0xffffffff = 0xffffffff;
1648			bhsam->bhsam_async_event =
1649			    BHSAM_EVENT_TARGET_TERMINATES_SESSION;
1650			cfiscsi_pdu_queue(response);
1651		}
1652		cfiscsi_session_terminate(cs);
1653		found++;
1654	}
1655	mtx_unlock(&softc->lock);
1656
1657	if (found == 0) {
1658		ci->status = CTL_ISCSI_SESSION_NOT_FOUND;
1659		snprintf(ci->error_str, sizeof(ci->error_str),
1660		    "No matching connections found");
1661		return;
1662	}
1663
1664	ci->status = CTL_ISCSI_OK;
1665}
1666
1667static void
1668cfiscsi_ioctl_logout(struct ctl_iscsi *ci)
1669{
1670	struct icl_pdu *response;
1671	struct iscsi_bhs_asynchronous_message *bhsam;
1672	struct ctl_iscsi_logout_params *cilp;
1673	struct cfiscsi_session *cs;
1674	struct cfiscsi_softc *softc;
1675	int found = 0;
1676
1677	cilp = (struct ctl_iscsi_logout_params *)&(ci->data);
1678	softc = &cfiscsi_softc;
1679
1680	mtx_lock(&softc->lock);
1681	TAILQ_FOREACH(cs, &softc->sessions, cs_next) {
1682		if (cilp->all == 0 && cs->cs_id != cilp->connection_id &&
1683		    strcmp(cs->cs_initiator_name, cilp->initiator_name) != 0 &&
1684		    strcmp(cs->cs_initiator_addr, cilp->initiator_addr) != 0)
1685			continue;
1686
1687		response = icl_pdu_new_bhs(cs->cs_conn, M_NOWAIT);
1688		if (response == NULL) {
1689			ci->status = CTL_ISCSI_ERROR;
1690			snprintf(ci->error_str, sizeof(ci->error_str),
1691			    "Unable to allocate memory");
1692			mtx_unlock(&softc->lock);
1693			return;
1694		}
1695		bhsam =
1696		    (struct iscsi_bhs_asynchronous_message *)response->ip_bhs;
1697		bhsam->bhsam_opcode = ISCSI_BHS_OPCODE_ASYNC_MESSAGE;
1698		bhsam->bhsam_flags = 0x80;
1699		bhsam->bhsam_async_event = BHSAM_EVENT_TARGET_REQUESTS_LOGOUT;
1700		bhsam->bhsam_parameter3 = htons(10);
1701		cfiscsi_pdu_queue(response);
1702		found++;
1703	}
1704	mtx_unlock(&softc->lock);
1705
1706	if (found == 0) {
1707		ci->status = CTL_ISCSI_SESSION_NOT_FOUND;
1708		snprintf(ci->error_str, sizeof(ci->error_str),
1709		    "No matching connections found");
1710		return;
1711	}
1712
1713	ci->status = CTL_ISCSI_OK;
1714}
1715
1716#ifdef ICL_KERNEL_PROXY
1717static void
1718cfiscsi_ioctl_listen(struct ctl_iscsi *ci)
1719{
1720	struct ctl_iscsi_listen_params *cilp;
1721	struct sockaddr *sa;
1722	int error;
1723
1724	cilp = (struct ctl_iscsi_listen_params *)&(ci->data);
1725
1726	if (cfiscsi_softc.listener == NULL) {
1727		CFISCSI_DEBUG("no listener");
1728		snprintf(ci->error_str, sizeof(ci->error_str), "no listener");
1729		ci->status = CTL_ISCSI_ERROR;
1730		return;
1731	}
1732
1733	error = getsockaddr(&sa, (void *)cilp->addr, cilp->addrlen);
1734	if (error != 0) {
1735		CFISCSI_DEBUG("getsockaddr, error %d", error);
1736		snprintf(ci->error_str, sizeof(ci->error_str), "getsockaddr failed");
1737		ci->status = CTL_ISCSI_ERROR;
1738		return;
1739	}
1740
1741	error = icl_listen_add(cfiscsi_softc.listener, cilp->iser, cilp->domain,
1742	    cilp->socktype, cilp->protocol, sa);
1743	if (error != 0) {
1744		free(sa, M_SONAME);
1745		CFISCSI_DEBUG("icl_listen_add, error %d", error);
1746		snprintf(ci->error_str, sizeof(ci->error_str),
1747		    "icl_listen_add failed, error %d", error);
1748		ci->status = CTL_ISCSI_ERROR;
1749		return;
1750	}
1751
1752	ci->status = CTL_ISCSI_OK;
1753}
1754
1755static void
1756cfiscsi_ioctl_accept(struct ctl_iscsi *ci)
1757{
1758	struct ctl_iscsi_accept_params *ciap;
1759	struct cfiscsi_session *cs;
1760	int error;
1761
1762	ciap = (struct ctl_iscsi_accept_params *)&(ci->data);
1763
1764	mtx_lock(&cfiscsi_softc.lock);
1765	for (;;) {
1766		TAILQ_FOREACH(cs, &cfiscsi_softc.sessions, cs_next) {
1767			if (cs->cs_waiting_for_ctld)
1768				break;
1769		}
1770		if (cs != NULL)
1771			break;
1772		error = cv_wait_sig(&cfiscsi_softc.accept_cv, &cfiscsi_softc.lock);
1773		if (error != 0) {
1774			mtx_unlock(&cfiscsi_softc.lock);
1775			snprintf(ci->error_str, sizeof(ci->error_str), "interrupted");
1776			ci->status = CTL_ISCSI_ERROR;
1777			return;
1778		}
1779	}
1780	mtx_unlock(&cfiscsi_softc.lock);
1781
1782	cs->cs_waiting_for_ctld = false;
1783	cs->cs_login_phase = true;
1784
1785	ciap->connection_id = cs->cs_id;
1786	ci->status = CTL_ISCSI_OK;
1787}
1788
1789static void
1790cfiscsi_ioctl_send(struct ctl_iscsi *ci)
1791{
1792	struct ctl_iscsi_send_params *cisp;
1793	struct cfiscsi_session *cs;
1794	struct icl_pdu *ip;
1795	size_t datalen;
1796	void *data;
1797	int error;
1798
1799	cisp = (struct ctl_iscsi_send_params *)&(ci->data);
1800
1801	mtx_lock(&cfiscsi_softc.lock);
1802	TAILQ_FOREACH(cs, &cfiscsi_softc.sessions, cs_next) {
1803		if (cs->cs_id == cisp->connection_id)
1804			break;
1805	}
1806	if (cs == NULL) {
1807		mtx_unlock(&cfiscsi_softc.lock);
1808		snprintf(ci->error_str, sizeof(ci->error_str), "connection not found");
1809		ci->status = CTL_ISCSI_ERROR;
1810		return;
1811	}
1812	mtx_unlock(&cfiscsi_softc.lock);
1813
1814#if 0
1815	if (cs->cs_login_phase == false)
1816		return (EBUSY);
1817#endif
1818
1819	if (cs->cs_terminating) {
1820		snprintf(ci->error_str, sizeof(ci->error_str), "connection is terminating");
1821		ci->status = CTL_ISCSI_ERROR;
1822		return;
1823	}
1824
1825	datalen = cisp->data_segment_len;
1826	/*
1827	 * XXX
1828	 */
1829	//if (datalen > CFISCSI_MAX_DATA_SEGMENT_LENGTH) {
1830	if (datalen > 65535) {
1831		snprintf(ci->error_str, sizeof(ci->error_str), "data segment too big");
1832		ci->status = CTL_ISCSI_ERROR;
1833		return;
1834	}
1835	if (datalen > 0) {
1836		data = malloc(datalen, M_CFISCSI, M_WAITOK);
1837		error = copyin(cisp->data_segment, data, datalen);
1838		if (error != 0) {
1839			free(data, M_CFISCSI);
1840			snprintf(ci->error_str, sizeof(ci->error_str), "copyin error %d", error);
1841			ci->status = CTL_ISCSI_ERROR;
1842			return;
1843		}
1844	}
1845
1846	ip = icl_pdu_new_bhs(cs->cs_conn, M_WAITOK);
1847	memcpy(ip->ip_bhs, cisp->bhs, sizeof(*ip->ip_bhs));
1848	if (datalen > 0) {
1849		icl_pdu_append_data(ip, data, datalen, M_WAITOK);
1850		free(data, M_CFISCSI);
1851	}
1852	CFISCSI_SESSION_LOCK(cs);
1853	icl_pdu_queue(ip);
1854	CFISCSI_SESSION_UNLOCK(cs);
1855	ci->status = CTL_ISCSI_OK;
1856}
1857
1858static void
1859cfiscsi_ioctl_receive(struct ctl_iscsi *ci)
1860{
1861	struct ctl_iscsi_receive_params *cirp;
1862	struct cfiscsi_session *cs;
1863	struct icl_pdu *ip;
1864	void *data;
1865
1866	cirp = (struct ctl_iscsi_receive_params *)&(ci->data);
1867
1868	mtx_lock(&cfiscsi_softc.lock);
1869	TAILQ_FOREACH(cs, &cfiscsi_softc.sessions, cs_next) {
1870		if (cs->cs_id == cirp->connection_id)
1871			break;
1872	}
1873	if (cs == NULL) {
1874		mtx_unlock(&cfiscsi_softc.lock);
1875		snprintf(ci->error_str, sizeof(ci->error_str), "connection not found");
1876		ci->status = CTL_ISCSI_ERROR;
1877		return;
1878	}
1879	mtx_unlock(&cfiscsi_softc.lock);
1880
1881#if 0
1882	if (is->is_login_phase == false)
1883		return (EBUSY);
1884#endif
1885
1886	CFISCSI_SESSION_LOCK(cs);
1887	while (cs->cs_login_pdu == NULL &&
1888	    cs->cs_terminating == false)
1889		cv_wait(&cs->cs_login_cv, &cs->cs_lock);
1890	if (cs->cs_terminating) {
1891		CFISCSI_SESSION_UNLOCK(cs);
1892		snprintf(ci->error_str, sizeof(ci->error_str), "connection terminating");
1893		ci->status = CTL_ISCSI_ERROR;
1894		return;
1895	}
1896	ip = cs->cs_login_pdu;
1897	cs->cs_login_pdu = NULL;
1898	CFISCSI_SESSION_UNLOCK(cs);
1899
1900	if (ip->ip_data_len > cirp->data_segment_len) {
1901		icl_pdu_free(ip);
1902		snprintf(ci->error_str, sizeof(ci->error_str), "data segment too big");
1903		ci->status = CTL_ISCSI_ERROR;
1904		return;
1905	}
1906
1907	copyout(ip->ip_bhs, cirp->bhs, sizeof(*ip->ip_bhs));
1908	if (ip->ip_data_len > 0) {
1909		data = malloc(ip->ip_data_len, M_CFISCSI, M_WAITOK);
1910		icl_pdu_get_data(ip, 0, data, ip->ip_data_len);
1911		copyout(data, cirp->data_segment, ip->ip_data_len);
1912		free(data, M_CFISCSI);
1913	}
1914
1915	icl_pdu_free(ip);
1916	ci->status = CTL_ISCSI_OK;
1917}
1918
/*
 * CTL_ISCSI_CLOSE: not implemented.  The request is left untouched;
 * in particular ci->status is not set.
 */
static void
cfiscsi_ioctl_close(struct ctl_iscsi *ci)
{
	/* XXX */
}
#endif /* ICL_KERNEL_PROXY */
1927
1928static int
1929cfiscsi_ioctl(struct cdev *dev,
1930    u_long cmd, caddr_t addr, int flag, struct thread *td)
1931{
1932	struct ctl_iscsi *ci;
1933
1934	if (cmd != CTL_ISCSI)
1935		return (ENOTTY);
1936
1937	ci = (struct ctl_iscsi *)addr;
1938	switch (ci->type) {
1939	case CTL_ISCSI_HANDOFF:
1940		cfiscsi_ioctl_handoff(ci);
1941		break;
1942	case CTL_ISCSI_LIST:
1943		cfiscsi_ioctl_list(ci);
1944		break;
1945	case CTL_ISCSI_TERMINATE:
1946		cfiscsi_ioctl_terminate(ci);
1947		break;
1948	case CTL_ISCSI_LOGOUT:
1949		cfiscsi_ioctl_logout(ci);
1950		break;
1951#ifdef ICL_KERNEL_PROXY
1952	case CTL_ISCSI_LISTEN:
1953		cfiscsi_ioctl_listen(ci);
1954		break;
1955	case CTL_ISCSI_ACCEPT:
1956		cfiscsi_ioctl_accept(ci);
1957		break;
1958	case CTL_ISCSI_SEND:
1959		cfiscsi_ioctl_send(ci);
1960		break;
1961	case CTL_ISCSI_RECEIVE:
1962		cfiscsi_ioctl_receive(ci);
1963		break;
1964	case CTL_ISCSI_CLOSE:
1965		cfiscsi_ioctl_close(ci);
1966		break;
1967#else
1968	case CTL_ISCSI_LISTEN:
1969	case CTL_ISCSI_ACCEPT:
1970	case CTL_ISCSI_SEND:
1971	case CTL_ISCSI_RECEIVE:
1972	case CTL_ISCSI_CLOSE:
1973		ci->status = CTL_ISCSI_ERROR;
1974		snprintf(ci->error_str, sizeof(ci->error_str),
1975		    "%s: CTL compiled without ICL_KERNEL_PROXY",
1976		    __func__);
1977		break;
1978#endif /* !ICL_KERNEL_PROXY */
1979	default:
1980		ci->status = CTL_ISCSI_ERROR;
1981		snprintf(ci->error_str, sizeof(ci->error_str),
1982		    "%s: invalid iSCSI request type %d", __func__, ci->type);
1983		break;
1984	}
1985
1986	return (0);
1987}
1988
1989static int
1990cfiscsi_devid(struct ctl_scsiio *ctsio, int alloc_len)
1991{
1992	struct cfiscsi_session *cs;
1993	struct scsi_vpd_device_id *devid_ptr;
1994	struct scsi_vpd_id_descriptor *desc, *desc1;
1995	struct scsi_vpd_id_descriptor *desc2, *desc3; /* for types 4h and 5h */
1996	struct scsi_vpd_id_t10 *t10id;
1997	struct ctl_lun *lun;
1998	const struct icl_pdu *request;
1999	size_t devid_len, wwpn_len;
2000
2001	lun = (struct ctl_lun *)ctsio->io_hdr.ctl_private[CTL_PRIV_LUN].ptr;
2002	request = ctsio->io_hdr.ctl_private[CTL_PRIV_FRONTEND].ptr;
2003	cs = PDU_SESSION(request);
2004
2005	wwpn_len = strlen(cs->cs_target->ct_name);
2006	wwpn_len += strlen(",t,0x01");
2007	wwpn_len += 1; /* '\0' */
2008	if ((wwpn_len % 4) != 0)
2009		wwpn_len += (4 - (wwpn_len % 4));
2010
2011	devid_len = sizeof(struct scsi_vpd_device_id) +
2012		sizeof(struct scsi_vpd_id_descriptor) +
2013		sizeof(struct scsi_vpd_id_t10) + CTL_DEVID_LEN +
2014		sizeof(struct scsi_vpd_id_descriptor) + wwpn_len +
2015		sizeof(struct scsi_vpd_id_descriptor) +
2016		sizeof(struct scsi_vpd_id_rel_trgt_port_id) +
2017		sizeof(struct scsi_vpd_id_descriptor) +
2018		sizeof(struct scsi_vpd_id_trgt_port_grp_id);
2019
2020	ctsio->kern_data_ptr = malloc(devid_len, M_CTL, M_WAITOK | M_ZERO);
2021	devid_ptr = (struct scsi_vpd_device_id *)ctsio->kern_data_ptr;
2022	ctsio->kern_sg_entries = 0;
2023
2024	if (devid_len < alloc_len) {
2025		ctsio->residual = alloc_len - devid_len;
2026		ctsio->kern_data_len = devid_len;
2027		ctsio->kern_total_len = devid_len;
2028	} else {
2029		ctsio->residual = 0;
2030		ctsio->kern_data_len = alloc_len;
2031		ctsio->kern_total_len = alloc_len;
2032	}
2033	ctsio->kern_data_resid = 0;
2034	ctsio->kern_rel_offset = 0;
2035	ctsio->kern_sg_entries = 0;
2036
2037	desc = (struct scsi_vpd_id_descriptor *)devid_ptr->desc_list;
2038	t10id = (struct scsi_vpd_id_t10 *)&desc->identifier[0];
2039	desc1 = (struct scsi_vpd_id_descriptor *)(&desc->identifier[0] +
2040	    sizeof(struct scsi_vpd_id_t10) + CTL_DEVID_LEN);
2041	desc2 = (struct scsi_vpd_id_descriptor *)(&desc1->identifier[0] +
2042	    wwpn_len);
2043	desc3 = (struct scsi_vpd_id_descriptor *)(&desc2->identifier[0] +
2044	    sizeof(struct scsi_vpd_id_rel_trgt_port_id));
2045
2046	if (lun != NULL)
2047		devid_ptr->device = (SID_QUAL_LU_CONNECTED << 5) |
2048		    lun->be_lun->lun_type;
2049	else
2050		devid_ptr->device = (SID_QUAL_LU_OFFLINE << 5) | T_DIRECT;
2051
2052	devid_ptr->page_code = SVPD_DEVICE_ID;
2053
2054	scsi_ulto2b(devid_len - 4, devid_ptr->length);
2055
2056	/*
2057	 * We're using a LUN association here.  i.e., this device ID is a
2058	 * per-LUN identifier.
2059	 */
2060	desc->proto_codeset = (SCSI_PROTO_ISCSI << 4) | SVPD_ID_CODESET_ASCII;
2061	desc->id_type = SVPD_ID_PIV | SVPD_ID_ASSOC_LUN | SVPD_ID_TYPE_T10;
2062	desc->length = sizeof(*t10id) + CTL_DEVID_LEN;
2063	strncpy((char *)t10id->vendor, CTL_VENDOR, sizeof(t10id->vendor));
2064
2065	/*
2066	 * If we've actually got a backend, copy the device id from the
2067	 * per-LUN data.  Otherwise, set it to all spaces.
2068	 */
2069	if (lun != NULL) {
2070		/*
2071		 * Copy the backend's LUN ID.
2072		 */
2073		strncpy((char *)t10id->vendor_spec_id,
2074		    (char *)lun->be_lun->device_id, CTL_DEVID_LEN);
2075	} else {
2076		/*
2077		 * No backend, set this to spaces.
2078		 */
2079		memset(t10id->vendor_spec_id, 0x20, CTL_DEVID_LEN);
2080	}
2081
2082	/*
2083	 * desc1 is for the WWPN which is a port association.
2084	 */
2085       	desc1->proto_codeset = (SCSI_PROTO_ISCSI << 4) | SVPD_ID_CODESET_UTF8;
2086	desc1->id_type = SVPD_ID_PIV | SVPD_ID_ASSOC_PORT |
2087	    SVPD_ID_TYPE_SCSI_NAME;
2088	desc1->length = wwpn_len;
2089	snprintf(desc1->identifier, wwpn_len, "%s,t,0x%x",
2090	    cs->cs_target->ct_name, cs->cs_portal_group_tag);
2091
2092	/*
2093	 * desc2 is for the Relative Target Port(type 4h) identifier
2094	 */
2095       	desc2->proto_codeset = (SCSI_PROTO_ISCSI << 4) | SVPD_ID_CODESET_BINARY;
2096	desc2->id_type = SVPD_ID_PIV | SVPD_ID_ASSOC_PORT |
2097	    SVPD_ID_TYPE_RELTARG;
2098	desc2->length = 4;
2099	desc2->identifier[3] = 1;
2100
2101	/*
2102	 * desc3 is for the Target Port Group(type 5h) identifier
2103	 */
2104       	desc3->proto_codeset = (SCSI_PROTO_ISCSI << 4) | SVPD_ID_CODESET_BINARY;
2105	desc3->id_type = SVPD_ID_PIV | SVPD_ID_ASSOC_PORT |
2106	    SVPD_ID_TYPE_TPORTGRP;
2107	desc3->length = 4;
2108	desc3->identifier[3] = 1;
2109
2110	ctsio->scsi_status = SCSI_STATUS_OK;
2111
2112	ctsio->be_move_done = ctl_config_move_done;
2113	ctl_datamove((union ctl_io *)ctsio);
2114
2115	return (CTL_RETVAL_COMPLETE);
2116}
2117
2118static void
2119cfiscsi_target_hold(struct cfiscsi_target *ct)
2120{
2121
2122	refcount_acquire(&ct->ct_refcount);
2123}
2124
2125static void
2126cfiscsi_target_release(struct cfiscsi_target *ct)
2127{
2128	struct cfiscsi_softc *softc;
2129
2130	softc = ct->ct_softc;
2131	mtx_lock(&softc->lock);
2132	if (refcount_release(&ct->ct_refcount)) {
2133		TAILQ_REMOVE(&softc->targets, ct, ct_next);
2134		mtx_unlock(&softc->lock);
2135		free(ct, M_CFISCSI);
2136
2137		return;
2138	}
2139	mtx_unlock(&softc->lock);
2140}
2141
2142static struct cfiscsi_target *
2143cfiscsi_target_find(struct cfiscsi_softc *softc, const char *name)
2144{
2145	struct cfiscsi_target *ct;
2146
2147	mtx_lock(&softc->lock);
2148	TAILQ_FOREACH(ct, &softc->targets, ct_next) {
2149		if (strcmp(name, ct->ct_name) != 0)
2150			continue;
2151		cfiscsi_target_hold(ct);
2152		mtx_unlock(&softc->lock);
2153		return (ct);
2154	}
2155	mtx_unlock(&softc->lock);
2156
2157	return (NULL);
2158}
2159
2160static struct cfiscsi_target *
2161cfiscsi_target_find_or_create(struct cfiscsi_softc *softc, const char *name,
2162    const char *alias)
2163{
2164	struct cfiscsi_target *ct, *newct;
2165	int i;
2166
2167	if (name[0] == '\0' || strlen(name) >= CTL_ISCSI_NAME_LEN)
2168		return (NULL);
2169
2170	newct = malloc(sizeof(*newct), M_CFISCSI, M_WAITOK | M_ZERO);
2171
2172	mtx_lock(&softc->lock);
2173	TAILQ_FOREACH(ct, &softc->targets, ct_next) {
2174		if (strcmp(name, ct->ct_name) != 0)
2175			continue;
2176		cfiscsi_target_hold(ct);
2177		mtx_unlock(&softc->lock);
2178		free(newct, M_CFISCSI);
2179		return (ct);
2180	}
2181
2182	for (i = 0; i < CTL_MAX_LUNS; i++)
2183		newct->ct_luns[i] = -1;
2184
2185	strlcpy(newct->ct_name, name, sizeof(newct->ct_name));
2186	if (alias != NULL)
2187		strlcpy(newct->ct_alias, alias, sizeof(newct->ct_alias));
2188	refcount_init(&newct->ct_refcount, 1);
2189	newct->ct_softc = softc;
2190	TAILQ_INSERT_TAIL(&softc->targets, newct, ct_next);
2191	mtx_unlock(&softc->lock);
2192
2193	return (newct);
2194}
2195
2196/*
2197 * Takes LUN from the target space and returns LUN from the CTL space.
2198 */
2199static uint32_t
2200cfiscsi_map_lun(void *arg, uint32_t lun)
2201{
2202	struct cfiscsi_session *cs;
2203
2204	cs = arg;
2205
2206	if (lun >= CTL_MAX_LUNS) {
2207		CFISCSI_DEBUG("requested lun number %d is higher "
2208		    "than maximum %d", lun, CTL_MAX_LUNS - 1);
2209		return (0xffffffff);
2210	}
2211
2212	if (cs->cs_target->ct_luns[lun] < 0)
2213		return (0xffffffff);
2214
2215	return (cs->cs_target->ct_luns[lun]);
2216}
2217
2218static int
2219cfiscsi_target_set_lun(struct cfiscsi_target *ct,
2220    unsigned long lun_id, unsigned long ctl_lun_id)
2221{
2222
2223	if (lun_id >= CTL_MAX_LUNS) {
2224		CFISCSI_WARN("requested lun number %ld is higher "
2225		    "than maximum %d", lun_id, CTL_MAX_LUNS - 1);
2226		return (-1);
2227	}
2228
2229	if (ct->ct_luns[lun_id] >= 0) {
2230		/*
2231		 * CTL calls cfiscsi_lun_enable() twice for each LUN - once
2232		 * when the LUN is created, and a second time just before
2233		 * the port is brought online; don't emit warnings
2234		 * for that case.
2235		 */
2236		if (ct->ct_luns[lun_id] == ctl_lun_id)
2237			return (0);
2238		CFISCSI_WARN("lun %ld already allocated", lun_id);
2239		return (-1);
2240	}
2241
2242#if 0
2243	CFISCSI_DEBUG("adding mapping for lun %ld, target %s "
2244	    "to ctl lun %ld", lun_id, ct->ct_name, ctl_lun_id);
2245#endif
2246
2247	ct->ct_luns[lun_id] = ctl_lun_id;
2248	cfiscsi_target_hold(ct);
2249
2250	return (0);
2251}
2252
2253static int
2254cfiscsi_target_unset_lun(struct cfiscsi_target *ct, unsigned long lun_id)
2255{
2256
2257	if (ct->ct_luns[lun_id] < 0) {
2258		CFISCSI_WARN("lun %ld not allocated", lun_id);
2259		return (-1);
2260	}
2261
2262	ct->ct_luns[lun_id] = -1;
2263	cfiscsi_target_release(ct);
2264
2265	return (0);
2266}
2267
2268static int
2269cfiscsi_lun_enable(void *arg, struct ctl_id target_id, int lun_id)
2270{
2271	struct cfiscsi_softc *softc;
2272	struct cfiscsi_target *ct;
2273	struct ctl_be_lun_option *opt;
2274	const char *target = NULL, *target_alias = NULL;
2275	const char *lun = NULL;
2276	unsigned long tmp;
2277
2278	softc = (struct cfiscsi_softc *)arg;
2279
2280	STAILQ_FOREACH(opt,
2281	    &control_softc->ctl_luns[lun_id]->be_lun->options, links) {
2282		if (strcmp(opt->name, "cfiscsi_target") == 0)
2283			target = opt->value;
2284		else if (strcmp(opt->name, "cfiscsi_target_alias") == 0)
2285			target_alias = opt->value;
2286		else if (strcmp(opt->name, "cfiscsi_lun") == 0)
2287			lun = opt->value;
2288	}
2289
2290	if (target == NULL && lun == NULL)
2291		return (0);
2292
2293	if (target == NULL || lun == NULL) {
2294		CFISCSI_WARN("lun added with cfiscsi_target, but without "
2295		    "cfiscsi_lun, or the other way around; ignoring");
2296		return (0);
2297	}
2298
2299	ct = cfiscsi_target_find_or_create(softc, target, target_alias);
2300	if (ct == NULL) {
2301		CFISCSI_WARN("failed to create target \"%s\"", target);
2302		return (0);
2303	}
2304
2305	tmp = strtoul(lun, NULL, 10);
2306	cfiscsi_target_set_lun(ct, tmp, lun_id);
2307	cfiscsi_target_release(ct);
2308	return (0);
2309}
2310
2311static int
2312cfiscsi_lun_disable(void *arg, struct ctl_id target_id, int lun_id)
2313{
2314	struct cfiscsi_softc *softc;
2315	struct cfiscsi_target *ct;
2316	int i;
2317
2318	softc = (struct cfiscsi_softc *)arg;
2319
2320	mtx_lock(&softc->lock);
2321	TAILQ_FOREACH(ct, &softc->targets, ct_next) {
2322		for (i = 0; i < CTL_MAX_LUNS; i++) {
2323			if (ct->ct_luns[i] < 0)
2324				continue;
2325			if (ct->ct_luns[i] != lun_id)
2326				continue;
2327			mtx_unlock(&softc->lock);
2328			cfiscsi_target_unset_lun(ct, i);
2329			return (0);
2330		}
2331	}
2332	mtx_unlock(&softc->lock);
2333	return (0);
2334}
2335
2336static void
2337cfiscsi_datamove_in(union ctl_io *io)
2338{
2339	struct cfiscsi_session *cs;
2340	struct icl_pdu *request, *response;
2341	const struct iscsi_bhs_scsi_command *bhssc;
2342	struct iscsi_bhs_data_in *bhsdi;
2343	struct ctl_sg_entry ctl_sg_entry, *ctl_sglist;
2344	size_t len, expected_len, sg_len, buffer_offset;
2345	const char *sg_addr;
2346	int ctl_sg_count, error, i;
2347
2348	request = io->io_hdr.ctl_private[CTL_PRIV_FRONTEND].ptr;
2349	cs = PDU_SESSION(request);
2350
2351	bhssc = (const struct iscsi_bhs_scsi_command *)request->ip_bhs;
2352	KASSERT((bhssc->bhssc_opcode & ~ISCSI_BHS_OPCODE_IMMEDIATE) ==
2353	    ISCSI_BHS_OPCODE_SCSI_COMMAND,
2354	    ("bhssc->bhssc_opcode != ISCSI_BHS_OPCODE_SCSI_COMMAND"));
2355
2356	if (io->scsiio.kern_sg_entries > 0) {
2357		ctl_sglist = (struct ctl_sg_entry *)io->scsiio.kern_data_ptr;
2358		ctl_sg_count = io->scsiio.kern_sg_entries;
2359	} else {
2360		ctl_sglist = &ctl_sg_entry;
2361		ctl_sglist->addr = io->scsiio.kern_data_ptr;
2362		ctl_sglist->len = io->scsiio.kern_data_len;
2363		ctl_sg_count = 1;
2364	}
2365
2366	/*
2367	 * This is the total amount of data to be transferred within the current
2368	 * SCSI command.  We need to record it so that we can properly report
2369	 * underflow/underflow.
2370	 */
2371	PDU_TOTAL_TRANSFER_LEN(request) = io->scsiio.kern_total_len;
2372
2373	/*
2374	 * This is the offset within the current SCSI command; for the first
2375	 * call to cfiscsi_datamove() it will be 0, and for subsequent ones
2376	 * it will be the sum of lengths of previous ones.  It's being
2377	 * incremented as we append data to the data segment.
2378	 */
2379	buffer_offset = io->scsiio.kern_rel_offset;
2380
2381	/*
2382	 * This is the transfer length expected by the initiator.  In theory,
2383	 * it could be different from the correct amount of data from the SCSI
2384	 * point of view, even if that doesn't make any sense.
2385	 */
2386	expected_len = ntohl(bhssc->bhssc_expected_data_transfer_length);
2387#if 0
2388	if (expected_len != io->scsiio.kern_total_len)
2389		CFISCSI_SESSION_DEBUG(cs, "expected transfer length = %zd, "
2390		    "actual length = %zd", expected_len,
2391		    io->scsiio.kern_total_len);
2392#endif
2393
2394	if (buffer_offset >= expected_len) {
2395#if 0
2396		CFISCSI_SESSION_DEBUG(cs, "buffer_offset = %zd, "
2397		    "already sent the expected len", buffer_offset);
2398#endif
2399		io->scsiio.ext_data_filled = io->scsiio.kern_total_len;
2400		io->scsiio.be_move_done(io);
2401		return;
2402	}
2403
2404	i = 0;
2405	sg_addr = NULL;
2406	sg_len = 0;
2407	response = NULL;
2408	bhsdi = NULL;
2409	for (;;) {
2410		if (response == NULL) {
2411			response = cfiscsi_pdu_new_response(request, M_NOWAIT);
2412			if (response == NULL) {
2413				CFISCSI_SESSION_WARN(cs, "failed to "
2414				    "allocate memory; dropping connection");
2415				ctl_set_busy(&io->scsiio);
2416				io->scsiio.be_move_done(io);
2417				cfiscsi_session_terminate(cs);
2418				return;
2419			}
2420			bhsdi = (struct iscsi_bhs_data_in *)response->ip_bhs;
2421			bhsdi->bhsdi_opcode = ISCSI_BHS_OPCODE_SCSI_DATA_IN;
2422			bhsdi->bhsdi_initiator_task_tag =
2423			    bhssc->bhssc_initiator_task_tag;
2424			bhsdi->bhsdi_datasn = htonl(PDU_EXPDATASN(request));
2425			PDU_EXPDATASN(request)++;
2426			bhsdi->bhsdi_buffer_offset = htonl(buffer_offset);
2427		}
2428
2429		KASSERT(i < ctl_sg_count, ("i >= ctl_sg_count"));
2430		if (sg_len == 0) {
2431			sg_addr = ctl_sglist[i].addr;
2432			sg_len = ctl_sglist[i].len;
2433			KASSERT(sg_len > 0, ("sg_len <= 0"));
2434		}
2435
2436		len = sg_len;
2437
2438		/*
2439		 * Truncate to maximum data segment length.
2440		 */
2441		KASSERT(response->ip_data_len < cs->cs_max_data_segment_length,
2442		    ("max_data_segment_length %zd >= ip_data_len %zd",
2443		    response->ip_data_len, cs->cs_max_data_segment_length));
2444		if (response->ip_data_len + len >
2445		    cs->cs_max_data_segment_length)
2446			len = cs->cs_max_data_segment_length -
2447			    response->ip_data_len;
2448
2449		/*
2450		 * Truncate to expected data transfer length.
2451		 */
2452		KASSERT(buffer_offset + response->ip_data_len < expected_len,
2453		    ("%zd >= %zd", buffer_offset + response->ip_data_len, expected_len));
2454		if (buffer_offset + response->ip_data_len + len > expected_len) {
2455			CFISCSI_SESSION_DEBUG(cs, "truncating from %zd "
2456			    "to expected data transfer length %zd",
2457			    buffer_offset + response->ip_data_len + len, expected_len);
2458			len = expected_len - (buffer_offset + response->ip_data_len);
2459		}
2460
2461		KASSERT(len <= sg_len, ("len > sg_len"));
2462		error = icl_pdu_append_data(response, sg_addr, len, M_NOWAIT);
2463		if (error != 0) {
2464			CFISCSI_SESSION_WARN(cs, "failed to "
2465			    "allocate memory; dropping connection");
2466			icl_pdu_free(response);
2467			ctl_set_busy(&io->scsiio);
2468			io->scsiio.be_move_done(io);
2469			cfiscsi_session_terminate(cs);
2470			return;
2471		}
2472		sg_addr += len;
2473		sg_len -= len;
2474		buffer_offset += len;
2475		io->scsiio.ext_data_filled += len;
2476
2477		if (buffer_offset == expected_len) {
2478			/*
2479			 * Already have the amount of data the initiator wanted.
2480			 */
2481			break;
2482		}
2483
2484		if (sg_len == 0) {
2485			/*
2486			 * End of scatter-gather segment;
2487			 * proceed to the next one...
2488			 */
2489			if (i == ctl_sg_count - 1) {
2490				/*
2491				 * ... unless this was the last one.
2492				 */
2493				break;
2494			}
2495			i++;
2496		}
2497
2498		if (response->ip_data_len == cs->cs_max_data_segment_length) {
2499			/*
2500			 * Can't stuff more data into the current PDU;
2501			 * queue it.  Note that's not enough to check
2502			 * for kern_data_resid == 0 instead; there
2503			 * may be several Data-In PDUs for the final
2504			 * call to cfiscsi_datamove(), and we want
2505			 * to set the F flag only on the last of them.
2506			 */
2507			if (buffer_offset == io->scsiio.kern_total_len ||
2508			    buffer_offset == expected_len)
2509				bhsdi->bhsdi_flags |= BHSDI_FLAGS_F;
2510			cfiscsi_pdu_queue(response);
2511			response = NULL;
2512			bhsdi = NULL;
2513		}
2514	}
2515	if (response != NULL) {
2516		if (buffer_offset == io->scsiio.kern_total_len ||
2517		    buffer_offset == expected_len)
2518			bhsdi->bhsdi_flags |= BHSDI_FLAGS_F;
2519		KASSERT(response->ip_data_len > 0, ("sending empty Data-In"));
2520		cfiscsi_pdu_queue(response);
2521	}
2522
2523	io->scsiio.be_move_done(io);
2524}
2525
2526static void
2527cfiscsi_datamove_out(union ctl_io *io)
2528{
2529	struct cfiscsi_session *cs;
2530	struct icl_pdu *request, *response;
2531	const struct iscsi_bhs_scsi_command *bhssc;
2532	struct iscsi_bhs_r2t *bhsr2t;
2533	struct cfiscsi_data_wait *cdw;
2534	uint32_t target_transfer_tag;
2535	bool done;
2536
2537	request = io->io_hdr.ctl_private[CTL_PRIV_FRONTEND].ptr;
2538	cs = PDU_SESSION(request);
2539
2540	bhssc = (const struct iscsi_bhs_scsi_command *)request->ip_bhs;
2541	KASSERT((bhssc->bhssc_opcode & ~ISCSI_BHS_OPCODE_IMMEDIATE) ==
2542	    ISCSI_BHS_OPCODE_SCSI_COMMAND,
2543	    ("bhssc->bhssc_opcode != ISCSI_BHS_OPCODE_SCSI_COMMAND"));
2544
2545	/*
2546	 * We need to record it so that we can properly report
2547	 * underflow/underflow.
2548	 */
2549	PDU_TOTAL_TRANSFER_LEN(request) = io->scsiio.kern_total_len;
2550
2551	target_transfer_tag =
2552	    atomic_fetchadd_32(&cs->cs_target_transfer_tag, 1);
2553
2554#if 0
2555	CFISCSI_SESSION_DEBUG(cs, "expecting Data-Out with initiator "
2556	    "task tag 0x%x, target transfer tag 0x%x",
2557	    bhssc->bhssc_initiator_task_tag, target_transfer_tag);
2558#endif
2559	cdw = uma_zalloc(cfiscsi_data_wait_zone, M_NOWAIT | M_ZERO);
2560	if (cdw == NULL) {
2561		CFISCSI_SESSION_WARN(cs, "failed to "
2562		    "allocate memory; dropping connection");
2563		ctl_set_busy(&io->scsiio);
2564		io->scsiio.be_move_done(io);
2565		cfiscsi_session_terminate(cs);
2566		return;
2567	}
2568	cdw->cdw_ctl_io = io;
2569	cdw->cdw_target_transfer_tag = target_transfer_tag;
2570	cdw->cdw_initiator_task_tag = bhssc->bhssc_initiator_task_tag;
2571
2572	if (cs->cs_immediate_data && icl_pdu_data_segment_length(request) > 0) {
2573		done = cfiscsi_handle_data_segment(request, cdw);
2574		if (done) {
2575			uma_zfree(cfiscsi_data_wait_zone, cdw);
2576			io->scsiio.be_move_done(io);
2577			return;
2578		}
2579
2580#if 0
2581		if (io->scsiio.ext_data_filled != 0)
2582			CFISCSI_SESSION_DEBUG(cs, "got %zd bytes of immediate data, need %zd",
2583			    io->scsiio.ext_data_filled, io->scsiio.kern_data_len);
2584#endif
2585	}
2586
2587	CFISCSI_SESSION_LOCK(cs);
2588	TAILQ_INSERT_TAIL(&cs->cs_waiting_for_data_out, cdw, cdw_next);
2589	CFISCSI_SESSION_UNLOCK(cs);
2590
2591	/*
2592	 * XXX: We should limit the number of outstanding R2T PDUs
2593	 * 	per task to MaxOutstandingR2T.
2594	 */
2595	response = cfiscsi_pdu_new_response(request, M_NOWAIT);
2596	if (response == NULL) {
2597		CFISCSI_SESSION_WARN(cs, "failed to "
2598		    "allocate memory; dropping connection");
2599		ctl_set_busy(&io->scsiio);
2600		io->scsiio.be_move_done(io);
2601		cfiscsi_session_terminate(cs);
2602		return;
2603	}
2604	bhsr2t = (struct iscsi_bhs_r2t *)response->ip_bhs;
2605	bhsr2t->bhsr2t_opcode = ISCSI_BHS_OPCODE_R2T;
2606	bhsr2t->bhsr2t_flags = 0x80;
2607	bhsr2t->bhsr2t_lun = bhssc->bhssc_lun;
2608	bhsr2t->bhsr2t_initiator_task_tag = bhssc->bhssc_initiator_task_tag;
2609	bhsr2t->bhsr2t_target_transfer_tag = target_transfer_tag;
2610	/*
2611	 * XXX: Here we assume that cfiscsi_datamove() won't ever
2612	 *	be running concurrently on several CPUs for a given
2613	 *	command.
2614	 */
2615	bhsr2t->bhsr2t_r2tsn = htonl(PDU_R2TSN(request));
2616	PDU_R2TSN(request)++;
2617	/*
2618	 * This is the offset within the current SCSI command;
2619	 * i.e. for the first call of datamove(), it will be 0,
2620	 * and for subsequent ones it will be the sum of lengths
2621	 * of previous ones.
2622	 *
2623	 * The ext_data_filled is to account for unsolicited
2624	 * (immediate) data that might have already arrived.
2625	 */
2626	bhsr2t->bhsr2t_buffer_offset =
2627	    htonl(io->scsiio.kern_rel_offset + io->scsiio.ext_data_filled);
2628	/*
2629	 * This is the total length (sum of S/G lengths) this call
2630	 * to cfiscsi_datamove() is supposed to handle.
2631	 *
2632	 * XXX: Limit it to MaxBurstLength.
2633	 */
2634	bhsr2t->bhsr2t_desired_data_transfer_length =
2635	    htonl(io->scsiio.kern_data_len - io->scsiio.ext_data_filled);
2636	cfiscsi_pdu_queue(response);
2637}
2638
2639static void
2640cfiscsi_datamove(union ctl_io *io)
2641{
2642
2643	if ((io->io_hdr.flags & CTL_FLAG_DATA_MASK) == CTL_FLAG_DATA_IN)
2644		cfiscsi_datamove_in(io);
2645	else
2646		cfiscsi_datamove_out(io);
2647}
2648
2649static void
2650cfiscsi_scsi_command_done(union ctl_io *io)
2651{
2652	struct icl_pdu *request, *response;
2653	struct iscsi_bhs_scsi_command *bhssc;
2654	struct iscsi_bhs_scsi_response *bhssr;
2655#ifdef DIAGNOSTIC
2656	struct cfiscsi_data_wait *cdw;
2657#endif
2658	struct cfiscsi_session *cs;
2659	uint16_t sense_length;
2660
2661	request = io->io_hdr.ctl_private[CTL_PRIV_FRONTEND].ptr;
2662	cs = PDU_SESSION(request);
2663	bhssc = (struct iscsi_bhs_scsi_command *)request->ip_bhs;
2664	KASSERT((bhssc->bhssc_opcode & ~ISCSI_BHS_OPCODE_IMMEDIATE) ==
2665	    ISCSI_BHS_OPCODE_SCSI_COMMAND,
2666	    ("replying to wrong opcode 0x%x", bhssc->bhssc_opcode));
2667
2668	//CFISCSI_SESSION_DEBUG(cs, "initiator task tag 0x%x",
2669	//    bhssc->bhssc_initiator_task_tag);
2670
2671#ifdef DIAGNOSTIC
2672	CFISCSI_SESSION_LOCK(cs);
2673	TAILQ_FOREACH(cdw, &cs->cs_waiting_for_data_out, cdw_next)
2674		KASSERT(bhssc->bhssc_initiator_task_tag !=
2675		    cdw->cdw_initiator_task_tag, ("dangling cdw"));
2676	CFISCSI_SESSION_UNLOCK(cs);
2677#endif
2678
2679	response = cfiscsi_pdu_new_response(request, M_WAITOK);
2680	bhssr = (struct iscsi_bhs_scsi_response *)response->ip_bhs;
2681	bhssr->bhssr_opcode = ISCSI_BHS_OPCODE_SCSI_RESPONSE;
2682	bhssr->bhssr_flags = 0x80;
2683	/*
2684	 * XXX: We don't deal with bidirectional under/overflows;
2685	 *	does anything actually support those?
2686	 */
2687	if (PDU_TOTAL_TRANSFER_LEN(request) <
2688	    ntohl(bhssc->bhssc_expected_data_transfer_length)) {
2689		bhssr->bhssr_flags |= BHSSR_FLAGS_RESIDUAL_UNDERFLOW;
2690		bhssr->bhssr_residual_count =
2691		    htonl(ntohl(bhssc->bhssc_expected_data_transfer_length) -
2692		    PDU_TOTAL_TRANSFER_LEN(request));
2693		//CFISCSI_SESSION_DEBUG(cs, "underflow; residual count %d",
2694		//    ntohl(bhssr->bhssr_residual_count));
2695	} else if (PDU_TOTAL_TRANSFER_LEN(request) >
2696	    ntohl(bhssc->bhssc_expected_data_transfer_length)) {
2697		bhssr->bhssr_flags |= BHSSR_FLAGS_RESIDUAL_OVERFLOW;
2698		bhssr->bhssr_residual_count =
2699		    htonl(PDU_TOTAL_TRANSFER_LEN(request) -
2700		    ntohl(bhssc->bhssc_expected_data_transfer_length));
2701		//CFISCSI_SESSION_DEBUG(cs, "overflow; residual count %d",
2702		//    ntohl(bhssr->bhssr_residual_count));
2703	}
2704	bhssr->bhssr_response = BHSSR_RESPONSE_COMMAND_COMPLETED;
2705	bhssr->bhssr_status = io->scsiio.scsi_status;
2706	bhssr->bhssr_initiator_task_tag = bhssc->bhssc_initiator_task_tag;
2707	bhssr->bhssr_expdatasn = htonl(PDU_EXPDATASN(request));
2708
2709	if (io->scsiio.sense_len > 0) {
2710#if 0
2711		CFISCSI_SESSION_DEBUG(cs, "returning %d bytes of sense data",
2712		    io->scsiio.sense_len);
2713#endif
2714		sense_length = htons(io->scsiio.sense_len);
2715		icl_pdu_append_data(response,
2716		    &sense_length, sizeof(sense_length), M_WAITOK);
2717		icl_pdu_append_data(response,
2718		    &io->scsiio.sense_data, io->scsiio.sense_len, M_WAITOK);
2719	}
2720
2721	ctl_free_io(io);
2722	icl_pdu_free(request);
2723	cfiscsi_pdu_queue(response);
2724}
2725
2726static void
2727cfiscsi_task_management_done(union ctl_io *io)
2728{
2729	struct icl_pdu *request, *response;
2730	struct iscsi_bhs_task_management_request *bhstmr;
2731	struct iscsi_bhs_task_management_response *bhstmr2;
2732	struct cfiscsi_data_wait *cdw, *tmpcdw;
2733	struct cfiscsi_session *cs;
2734
2735	request = io->io_hdr.ctl_private[CTL_PRIV_FRONTEND].ptr;
2736	cs = PDU_SESSION(request);
2737	bhstmr = (struct iscsi_bhs_task_management_request *)request->ip_bhs;
2738	KASSERT((bhstmr->bhstmr_opcode & ~ISCSI_BHS_OPCODE_IMMEDIATE) ==
2739	    ISCSI_BHS_OPCODE_TASK_REQUEST,
2740	    ("replying to wrong opcode 0x%x", bhstmr->bhstmr_opcode));
2741
2742#if 0
2743	CFISCSI_SESSION_DEBUG(cs, "initiator task tag 0x%x; referenced task tag 0x%x",
2744	    bhstmr->bhstmr_initiator_task_tag,
2745	    bhstmr->bhstmr_referenced_task_tag);
2746#endif
2747
2748	if ((bhstmr->bhstmr_function & ~0x80) ==
2749	    BHSTMR_FUNCTION_ABORT_TASK) {
2750		/*
2751		 * Make sure we no longer wait for Data-Out for this command.
2752		 */
2753		CFISCSI_SESSION_LOCK(cs);
2754		TAILQ_FOREACH_SAFE(cdw,
2755		    &cs->cs_waiting_for_data_out, cdw_next, tmpcdw) {
2756			if (bhstmr->bhstmr_referenced_task_tag !=
2757			    cdw->cdw_initiator_task_tag)
2758				continue;
2759
2760#if 0
2761			CFISCSI_SESSION_DEBUG(cs, "removing csw for initiator task "
2762			    "tag 0x%x", bhstmr->bhstmr_initiator_task_tag);
2763#endif
2764			TAILQ_REMOVE(&cs->cs_waiting_for_data_out,
2765			    cdw, cdw_next);
2766			cdw->cdw_ctl_io->scsiio.be_move_done(cdw->cdw_ctl_io);
2767			uma_zfree(cfiscsi_data_wait_zone, cdw);
2768		}
2769		CFISCSI_SESSION_UNLOCK(cs);
2770	}
2771
2772	response = cfiscsi_pdu_new_response(request, M_WAITOK);
2773	bhstmr2 = (struct iscsi_bhs_task_management_response *)
2774	    response->ip_bhs;
2775	bhstmr2->bhstmr_opcode = ISCSI_BHS_OPCODE_TASK_RESPONSE;
2776	bhstmr2->bhstmr_flags = 0x80;
2777	if (io->io_hdr.status == CTL_SUCCESS) {
2778		bhstmr2->bhstmr_response = BHSTMR_RESPONSE_FUNCTION_COMPLETE;
2779	} else {
2780		/*
2781		 * XXX: How to figure out what exactly went wrong?  iSCSI spec
2782		 * 	expects us to provide detailed error, e.g. "Task does
2783		 * 	not exist" or "LUN does not exist".
2784		 */
2785		CFISCSI_SESSION_DEBUG(cs, "BHSTMR_RESPONSE_FUNCTION_NOT_SUPPORTED");
2786		bhstmr2->bhstmr_response =
2787		    BHSTMR_RESPONSE_FUNCTION_NOT_SUPPORTED;
2788	}
2789	bhstmr2->bhstmr_initiator_task_tag = bhstmr->bhstmr_initiator_task_tag;
2790
2791	ctl_free_io(io);
2792	icl_pdu_free(request);
2793	cfiscsi_pdu_queue(response);
2794}
2795
2796static void
2797cfiscsi_done(union ctl_io *io)
2798{
2799	struct icl_pdu *request;
2800	struct cfiscsi_session *cs;
2801
2802	KASSERT(((io->io_hdr.status & CTL_STATUS_MASK) != CTL_STATUS_NONE),
2803		("invalid CTL status %#x", io->io_hdr.status));
2804
2805	request = io->io_hdr.ctl_private[CTL_PRIV_FRONTEND].ptr;
2806	if (request == NULL) {
2807		/*
2808		 * Implicit task termination has just completed; nothing to do.
2809		 */
2810		return;
2811	}
2812
2813	cs = PDU_SESSION(request);
2814	refcount_release(&cs->cs_outstanding_ctl_pdus);
2815
2816	switch (request->ip_bhs->bhs_opcode & ~ISCSI_BHS_OPCODE_IMMEDIATE) {
2817	case ISCSI_BHS_OPCODE_SCSI_COMMAND:
2818		cfiscsi_scsi_command_done(io);
2819		break;
2820	case ISCSI_BHS_OPCODE_TASK_REQUEST:
2821		cfiscsi_task_management_done(io);
2822		break;
2823	default:
2824		panic("cfiscsi_done called with wrong opcode 0x%x",
2825		    request->ip_bhs->bhs_opcode);
2826	}
2827}
2828