iscsi.c revision 265508
1/*-
2 * Copyright (c) 2012 The FreeBSD Foundation
3 * All rights reserved.
4 *
5 * This software was developed by Edward Tomasz Napierala under sponsorship
6 * from the FreeBSD Foundation.
7 *
8 * Redistribution and use in source and binary forms, with or without
9 * modification, are permitted provided that the following conditions
10 * are met:
11 * 1. Redistributions of source code must retain the above copyright
12 *    notice, this list of conditions and the following disclaimer.
13 * 2. Redistributions in binary form must reproduce the above copyright
14 *    notice, this list of conditions and the following disclaimer in the
15 *    documentation and/or other materials provided with the distribution.
16 *
17 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
18 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
19 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
20 * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
21 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
22 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
23 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
24 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
25 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
26 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
27 * SUCH DAMAGE.
28 *
29 * $FreeBSD: stable/10/sys/dev/iscsi/iscsi.c 265508 2014-05-07 07:31:25Z trasz $
30 */
31
32#include <sys/param.h>
33#include <sys/condvar.h>
34#include <sys/conf.h>
35#include <sys/eventhandler.h>
36#include <sys/file.h>
37#include <sys/kernel.h>
38#include <sys/kthread.h>
39#include <sys/lock.h>
40#include <sys/malloc.h>
41#include <sys/mutex.h>
42#include <sys/module.h>
43#include <sys/sysctl.h>
44#include <sys/systm.h>
45#include <sys/sx.h>
46#include <vm/uma.h>
47
48#include <cam/cam.h>
49#include <cam/cam_ccb.h>
50#include <cam/cam_xpt.h>
51#include <cam/cam_debug.h>
52#include <cam/cam_sim.h>
53#include <cam/cam_xpt_sim.h>
54#include <cam/cam_xpt_periph.h>
55#include <cam/cam_periph.h>
56#include <cam/scsi/scsi_all.h>
57#include <cam/scsi/scsi_message.h>
58
59#include "iscsi_ioctl.h"
60#include "iscsi.h"
61#include "icl.h"
62#include "iscsi_proto.h"
63
64#ifdef ICL_KERNEL_PROXY
65#include <sys/socketvar.h>
66#endif
67
68#ifdef ICL_KERNEL_PROXY
69FEATURE(iscsi_kernel_proxy, "iSCSI initiator built with ICL_KERNEL_PROXY");
70#endif
71
72/*
73 * XXX: This is global so the iscsi_unload() can access it.
74 * 	Think about how to do this properly.
75 */
76static struct iscsi_softc	*sc;
77
78SYSCTL_NODE(_kern, OID_AUTO, iscsi, CTLFLAG_RD, 0, "iSCSI initiator");
79static int debug = 1;
80TUNABLE_INT("kern.iscsi.debug", &debug);
81SYSCTL_INT(_kern_iscsi, OID_AUTO, debug, CTLFLAG_RWTUN,
82    &debug, 2, "Enable debug messages");
83static int ping_timeout = 5;
84TUNABLE_INT("kern.iscsi.ping_timeout", &ping_timeout);
85SYSCTL_INT(_kern_iscsi, OID_AUTO, ping_timeout, CTLFLAG_RWTUN, &ping_timeout,
86    5, "Timeout for ping (NOP-Out) requests, in seconds");
87static int iscsid_timeout = 60;
88TUNABLE_INT("kern.iscsi.iscsid_timeout", &iscsid_timeout);
89SYSCTL_INT(_kern_iscsi, OID_AUTO, iscsid_timeout, CTLFLAG_RWTUN, &iscsid_timeout,
90    60, "Time to wait for iscsid(8) to handle reconnection, in seconds");
91static int login_timeout = 60;
92TUNABLE_INT("kern.iscsi.login_timeout", &login_timeout);
93SYSCTL_INT(_kern_iscsi, OID_AUTO, login_timeout, CTLFLAG_RWTUN, &login_timeout,
94    60, "Time to wait for iscsid(8) to finish Login Phase, in seconds");
95static int maxtags = 255;
96TUNABLE_INT("kern.iscsi.maxtags", &maxtags);
97SYSCTL_INT(_kern_iscsi, OID_AUTO, maxtags, CTLFLAG_RWTUN, &maxtags,
98    255, "Max number of IO requests queued");
99
100static MALLOC_DEFINE(M_ISCSI, "iSCSI", "iSCSI initiator");
101static uma_zone_t iscsi_outstanding_zone;
102
/*
 * Map an ICL connection - or a PDU that belongs to one - back to the
 * session pointer stored in the connection's ic_prv0 field.  Arguments
 * are parenthesized so that any pointer expression may be passed.
 */
#define	CONN_SESSION(X)	((struct iscsi_session *)(X)->ic_prv0)
#define	PDU_SESSION(X)	(CONN_SESSION((X)->ip_conn))

/*
 * Logging helpers.  X must be a string literal (it is pasted into the
 * format string); the remaining arguments are passed to printf().
 * The *_DEBUG variants print when debug > 1 and are prefixed with the
 * calling function's name; the *_WARN variants print when debug > 0.
 * The SESSION variants additionally print the target address and name
 * taken from the session's configuration.
 */
#define	ISCSI_DEBUG(X, ...)						\
	do {								\
		if (debug > 1) 						\
			printf("%s: " X "\n", __func__, ## __VA_ARGS__);\
	} while (0)

#define	ISCSI_WARN(X, ...)						\
	do {								\
		if (debug > 0) {					\
			printf("WARNING: %s: " X "\n",			\
			    __func__, ## __VA_ARGS__);			\
		}							\
	} while (0)

#define	ISCSI_SESSION_DEBUG(S, X, ...)					\
	do {								\
		if (debug > 1) {					\
			printf("%s: %s (%s): " X "\n",			\
			    __func__, (S)->is_conf.isc_target_addr,	\
			    (S)->is_conf.isc_target, ## __VA_ARGS__);	\
		}							\
	} while (0)

#define	ISCSI_SESSION_WARN(S, X, ...)					\
	do {								\
		if (debug > 0) {					\
			printf("WARNING: %s (%s): " X "\n",		\
			    (S)->is_conf.isc_target_addr,		\
			    (S)->is_conf.isc_target, ## __VA_ARGS__);	\
		}							\
	} while (0)

/* Per-session mutex helpers; X is a pointer to the session. */
#define ISCSI_SESSION_LOCK(X)		mtx_lock(&(X)->is_lock)
#define ISCSI_SESSION_UNLOCK(X)		mtx_unlock(&(X)->is_lock)
#define ISCSI_SESSION_LOCK_ASSERT(X)	mtx_assert(&(X)->is_lock, MA_OWNED)
141
142static int	iscsi_ioctl(struct cdev *dev, u_long cmd, caddr_t arg,
143		    int mode, struct thread *td);
144
145static struct cdevsw iscsi_cdevsw = {
146     .d_version = D_VERSION,
147     .d_ioctl   = iscsi_ioctl,
148     .d_name    = "iscsi",
149};
150
151static void	iscsi_pdu_queue_locked(struct icl_pdu *request);
152static void	iscsi_pdu_queue(struct icl_pdu *request);
153static void	iscsi_pdu_update_statsn(const struct icl_pdu *response);
154static void	iscsi_pdu_handle_nop_in(struct icl_pdu *response);
155static void	iscsi_pdu_handle_scsi_response(struct icl_pdu *response);
156static void	iscsi_pdu_handle_data_in(struct icl_pdu *response);
157static void	iscsi_pdu_handle_logout_response(struct icl_pdu *response);
158static void	iscsi_pdu_handle_r2t(struct icl_pdu *response);
159static void	iscsi_pdu_handle_async_message(struct icl_pdu *response);
160static void	iscsi_pdu_handle_reject(struct icl_pdu *response);
161static void	iscsi_session_reconnect(struct iscsi_session *is);
162static void	iscsi_session_terminate(struct iscsi_session *is);
163static void	iscsi_action(struct cam_sim *sim, union ccb *ccb);
164static void	iscsi_poll(struct cam_sim *sim);
165static struct iscsi_outstanding	*iscsi_outstanding_find(struct iscsi_session *is,
166		    uint32_t initiator_task_tag);
167static int	iscsi_outstanding_add(struct iscsi_session *is,
168		    uint32_t initiator_task_tag, union ccb *ccb);
169static void	iscsi_outstanding_remove(struct iscsi_session *is,
170		    struct iscsi_outstanding *io);
171
172static bool
173iscsi_pdu_prepare(struct icl_pdu *request)
174{
175	struct iscsi_session *is;
176	struct iscsi_bhs_scsi_command *bhssc;
177
178	is = PDU_SESSION(request);
179
180	ISCSI_SESSION_LOCK_ASSERT(is);
181
182	/*
183	 * We're only using fields common for all the request
184	 * (initiator -> target) PDUs.
185	 */
186	bhssc = (struct iscsi_bhs_scsi_command *)request->ip_bhs;
187
188	/*
189	 * Data-Out PDU does not contain CmdSN.
190	 */
191	if (bhssc->bhssc_opcode != ISCSI_BHS_OPCODE_SCSI_DATA_OUT) {
192		if (is->is_cmdsn > is->is_maxcmdsn &&
193		    (bhssc->bhssc_opcode & ISCSI_BHS_OPCODE_IMMEDIATE) == 0) {
194			/*
195			 * Current MaxCmdSN prevents us from sending any more
196			 * SCSI Command PDUs to the target; postpone the PDU.
197			 * It will get resent by either iscsi_pdu_queue(),
198			 * or by maintenance thread.
199			 */
200#if 0
201			ISCSI_SESSION_DEBUG(is, "postponing send, CmdSN %d, ExpCmdSN %d, MaxCmdSN %d, opcode 0x%x",
202			    is->is_cmdsn, is->is_expcmdsn, is->is_maxcmdsn, bhssc->bhssc_opcode);
203#endif
204			return (true);
205		}
206		bhssc->bhssc_cmdsn = htonl(is->is_cmdsn);
207		if ((bhssc->bhssc_opcode & ISCSI_BHS_OPCODE_IMMEDIATE) == 0)
208			is->is_cmdsn++;
209	}
210	bhssc->bhssc_expstatsn = htonl(is->is_statsn + 1);
211
212	return (false);
213}
214
215static void
216iscsi_session_send_postponed(struct iscsi_session *is)
217{
218	struct icl_pdu *request;
219	bool postpone;
220
221	ISCSI_SESSION_LOCK_ASSERT(is);
222
223	while (!STAILQ_EMPTY(&is->is_postponed)) {
224		request = STAILQ_FIRST(&is->is_postponed);
225		postpone = iscsi_pdu_prepare(request);
226		if (postpone)
227			break;
228		STAILQ_REMOVE_HEAD(&is->is_postponed, ip_next);
229		icl_pdu_queue(request);
230	}
231}
232
233static void
234iscsi_pdu_queue_locked(struct icl_pdu *request)
235{
236	struct iscsi_session *is;
237	bool postpone;
238
239	is = PDU_SESSION(request);
240	ISCSI_SESSION_LOCK_ASSERT(is);
241	iscsi_session_send_postponed(is);
242	postpone = iscsi_pdu_prepare(request);
243	if (postpone) {
244		STAILQ_INSERT_TAIL(&is->is_postponed, request, ip_next);
245		return;
246	}
247	icl_pdu_queue(request);
248}
249
/*
 * Convenience wrapper around iscsi_pdu_queue_locked() for callers that
 * do not hold the session lock: takes it, queues the PDU, drops it.
 */
static void
iscsi_pdu_queue(struct icl_pdu *request)
{
	struct iscsi_session *session = PDU_SESSION(request);

	ISCSI_SESSION_LOCK(session);
	iscsi_pdu_queue_locked(request);
	ISCSI_SESSION_UNLOCK(session);
}
260
261static void
262iscsi_session_logout(struct iscsi_session *is)
263{
264	struct icl_pdu *request;
265	struct iscsi_bhs_logout_request *bhslr;
266
267	request = icl_pdu_new_bhs(is->is_conn, M_NOWAIT);
268	if (request == NULL)
269		return;
270
271	bhslr = (struct iscsi_bhs_logout_request *)request->ip_bhs;
272	bhslr->bhslr_opcode = ISCSI_BHS_OPCODE_LOGOUT_REQUEST;
273	bhslr->bhslr_reason = BHSLR_REASON_CLOSE_SESSION;
274	iscsi_pdu_queue_locked(request);
275}
276
277static void
278iscsi_session_terminate_tasks(struct iscsi_session *is, bool requeue)
279{
280	struct iscsi_outstanding *io, *tmp;
281
282	ISCSI_SESSION_LOCK_ASSERT(is);
283
284	TAILQ_FOREACH_SAFE(io, &is->is_outstanding, io_next, tmp) {
285		if (requeue) {
286			io->io_ccb->ccb_h.status &= ~CAM_SIM_QUEUED;
287			io->io_ccb->ccb_h.status |= CAM_REQUEUE_REQ;
288		} else {
289			io->io_ccb->ccb_h.status = CAM_REQ_ABORTED;
290		}
291
292		if ((io->io_ccb->ccb_h.status & CAM_DEV_QFRZN) == 0) {
293			xpt_freeze_devq(io->io_ccb->ccb_h.path, 1);
294			ISCSI_SESSION_DEBUG(is, "freezing devq");
295		}
296		io->io_ccb->ccb_h.status |= CAM_DEV_QFRZN;
297		xpt_done(io->io_ccb);
298		iscsi_outstanding_remove(is, io);
299	}
300}
301
302static void
303iscsi_maintenance_thread_reconnect(struct iscsi_session *is)
304{
305	struct icl_pdu *pdu;
306
307	icl_conn_shutdown(is->is_conn);
308	icl_conn_close(is->is_conn);
309
310	ISCSI_SESSION_LOCK(is);
311
312#ifdef ICL_KERNEL_PROXY
313	if (is->is_login_pdu != NULL) {
314		icl_pdu_free(is->is_login_pdu);
315		is->is_login_pdu = NULL;
316	}
317	cv_signal(&is->is_login_cv);
318#endif
319
320	/*
321	 * Don't queue any new PDUs.
322	 */
323	if (is->is_sim != NULL && is->is_simq_frozen == false) {
324		ISCSI_SESSION_DEBUG(is, "freezing");
325		xpt_freeze_simq(is->is_sim, 1);
326		is->is_simq_frozen = true;
327	}
328
329	/*
330	 * Remove postponed PDUs.
331	 */
332	while (!STAILQ_EMPTY(&is->is_postponed)) {
333		pdu = STAILQ_FIRST(&is->is_postponed);
334		STAILQ_REMOVE_HEAD(&is->is_postponed, ip_next);
335		icl_pdu_free(pdu);
336	}
337
338	/*
339	 * Terminate SCSI tasks, asking CAM to requeue them.
340	 */
341	//ISCSI_SESSION_DEBUG(is, "terminating tasks");
342	iscsi_session_terminate_tasks(is, true);
343
344	KASSERT(TAILQ_EMPTY(&is->is_outstanding),
345	    ("destroying session with active tasks"));
346	KASSERT(STAILQ_EMPTY(&is->is_postponed),
347	    ("destroying session with postponed PDUs"));
348
349	/*
350	 * Request immediate reconnection from iscsid(8).
351	 */
352	//ISCSI_SESSION_DEBUG(is, "waking up iscsid(8)");
353	is->is_connected = false;
354	is->is_reconnecting = false;
355	is->is_login_phase = false;
356	is->is_waiting_for_iscsid = true;
357	strlcpy(is->is_reason, "Waiting for iscsid(8)", sizeof(is->is_reason));
358	is->is_timeout = 0;
359	ISCSI_SESSION_UNLOCK(is);
360	cv_signal(&is->is_softc->sc_cv);
361}
362
363static void
364iscsi_maintenance_thread_terminate(struct iscsi_session *is)
365{
366	struct iscsi_softc *sc;
367	struct icl_pdu *pdu;
368
369	sc = is->is_softc;
370	sx_xlock(&sc->sc_lock);
371	TAILQ_REMOVE(&sc->sc_sessions, is, is_next);
372	sx_xunlock(&sc->sc_lock);
373
374	icl_conn_close(is->is_conn);
375
376	ISCSI_SESSION_LOCK(is);
377
378	KASSERT(is->is_terminating, ("is_terminating == false"));
379
380#ifdef ICL_KERNEL_PROXY
381	if (is->is_login_pdu != NULL) {
382		icl_pdu_free(is->is_login_pdu);
383		is->is_login_pdu = NULL;
384	}
385	cv_signal(&is->is_login_cv);
386#endif
387
388	/*
389	 * Don't queue any new PDUs.
390	 */
391	callout_drain(&is->is_callout);
392	if (is->is_sim != NULL && is->is_simq_frozen == false) {
393		ISCSI_SESSION_DEBUG(is, "freezing");
394		xpt_freeze_simq(is->is_sim, 1);
395		is->is_simq_frozen = true;
396	}
397
398	/*
399	 * Remove postponed PDUs.
400	 */
401	while (!STAILQ_EMPTY(&is->is_postponed)) {
402		pdu = STAILQ_FIRST(&is->is_postponed);
403		STAILQ_REMOVE_HEAD(&is->is_postponed, ip_next);
404		icl_pdu_free(pdu);
405	}
406
407	/*
408	 * Forcibly terminate SCSI tasks.
409	 */
410	ISCSI_SESSION_DEBUG(is, "terminating tasks");
411	iscsi_session_terminate_tasks(is, false);
412
413	/*
414	 * Deregister CAM.
415	 */
416	if (is->is_sim != NULL) {
417		ISCSI_SESSION_DEBUG(is, "deregistering SIM");
418		xpt_async(AC_LOST_DEVICE, is->is_path, NULL);
419
420		if (is->is_simq_frozen) {
421			xpt_release_simq(is->is_sim, 1);
422			is->is_simq_frozen = false;
423		}
424
425		xpt_free_path(is->is_path);
426		xpt_bus_deregister(cam_sim_path(is->is_sim));
427		cam_sim_free(is->is_sim, TRUE /*free_devq*/);
428		is->is_sim = NULL;
429	}
430
431	KASSERT(TAILQ_EMPTY(&is->is_outstanding),
432	    ("destroying session with active tasks"));
433	KASSERT(STAILQ_EMPTY(&is->is_postponed),
434	    ("destroying session with postponed PDUs"));
435
436	ISCSI_SESSION_UNLOCK(is);
437
438	icl_conn_free(is->is_conn);
439	mtx_destroy(&is->is_lock);
440	cv_destroy(&is->is_maintenance_cv);
441#ifdef ICL_KERNEL_PROXY
442	cv_destroy(&is->is_login_cv);
443#endif
444	ISCSI_SESSION_DEBUG(is, "terminated");
445	free(is, M_ISCSI);
446
447	/*
448	 * The iscsi_unload() routine might be waiting.
449	 */
450	cv_signal(&sc->sc_cv);
451}
452
453static void
454iscsi_maintenance_thread(void *arg)
455{
456	struct iscsi_session *is;
457
458	is = arg;
459
460	for (;;) {
461		ISCSI_SESSION_LOCK(is);
462		if (is->is_reconnecting == false &&
463		    is->is_terminating == false &&
464		    STAILQ_EMPTY(&is->is_postponed))
465			cv_wait(&is->is_maintenance_cv, &is->is_lock);
466
467		if (is->is_reconnecting) {
468			ISCSI_SESSION_UNLOCK(is);
469			iscsi_maintenance_thread_reconnect(is);
470			continue;
471		}
472
473		if (is->is_terminating) {
474			ISCSI_SESSION_UNLOCK(is);
475			iscsi_maintenance_thread_terminate(is);
476			kthread_exit();
477			return;
478		}
479
480		iscsi_session_send_postponed(is);
481		ISCSI_SESSION_UNLOCK(is);
482	}
483}
484
485static void
486iscsi_session_reconnect(struct iscsi_session *is)
487{
488
489	/*
490	 * XXX: We can't use locking here, because
491	 * 	it's being called from various contexts.
492	 * 	Hope it doesn't break anything.
493	 */
494	if (is->is_reconnecting)
495		return;
496
497	is->is_reconnecting = true;
498	cv_signal(&is->is_maintenance_cv);
499}
500
501static void
502iscsi_session_terminate(struct iscsi_session *is)
503{
504	if (is->is_terminating)
505		return;
506
507	is->is_terminating = true;
508
509#if 0
510	iscsi_session_logout(is);
511#endif
512	cv_signal(&is->is_maintenance_cv);
513}
514
515static void
516iscsi_callout(void *context)
517{
518	struct icl_pdu *request;
519	struct iscsi_bhs_nop_out *bhsno;
520	struct iscsi_session *is;
521	bool reconnect_needed = false;
522
523	is = context;
524
525	if (is->is_terminating)
526		return;
527
528	callout_schedule(&is->is_callout, 1 * hz);
529
530	ISCSI_SESSION_LOCK(is);
531	is->is_timeout++;
532
533	if (is->is_waiting_for_iscsid) {
534		if (is->is_timeout > iscsid_timeout) {
535			ISCSI_SESSION_WARN(is, "timed out waiting for iscsid(8) "
536			    "for %d seconds; reconnecting",
537			    is->is_timeout);
538			reconnect_needed = true;
539		}
540		goto out;
541	}
542
543	if (is->is_login_phase) {
544		if (is->is_timeout > login_timeout) {
545			ISCSI_SESSION_WARN(is, "login timed out after %d seconds; "
546			    "reconnecting", is->is_timeout);
547			reconnect_needed = true;
548		}
549		goto out;
550	}
551
552	if (is->is_timeout >= ping_timeout) {
553		ISCSI_SESSION_WARN(is, "no ping reply (NOP-In) after %d seconds; "
554		    "reconnecting", ping_timeout);
555		reconnect_needed = true;
556		goto out;
557	}
558
559	ISCSI_SESSION_UNLOCK(is);
560
561	/*
562	 * If the ping was reset less than one second ago - which means
563	 * that we've received some PDU during the last second - assume
564	 * the traffic flows correctly and don't bother sending a NOP-Out.
565	 *
566	 * (It's 2 - one for one second, and one for incrementing is_timeout
567	 * earlier in this routine.)
568	 */
569	if (is->is_timeout < 2)
570		return;
571
572	request = icl_pdu_new_bhs(is->is_conn, M_NOWAIT);
573	if (request == NULL) {
574		ISCSI_SESSION_WARN(is, "failed to allocate PDU");
575		return;
576	}
577	bhsno = (struct iscsi_bhs_nop_out *)request->ip_bhs;
578	bhsno->bhsno_opcode = ISCSI_BHS_OPCODE_NOP_OUT |
579	    ISCSI_BHS_OPCODE_IMMEDIATE;
580	bhsno->bhsno_flags = 0x80;
581	bhsno->bhsno_target_transfer_tag = 0xffffffff;
582	iscsi_pdu_queue(request);
583	return;
584
585out:
586	ISCSI_SESSION_UNLOCK(is);
587
588	if (reconnect_needed)
589		iscsi_session_reconnect(is);
590}
591
592static void
593iscsi_pdu_update_statsn(const struct icl_pdu *response)
594{
595	const struct iscsi_bhs_data_in *bhsdi;
596	struct iscsi_session *is;
597	uint32_t expcmdsn, maxcmdsn;
598
599	is = PDU_SESSION(response);
600
601	ISCSI_SESSION_LOCK_ASSERT(is);
602
603	/*
604	 * We're only using fields common for all the response
605	 * (target -> initiator) PDUs.
606	 */
607	bhsdi = (const struct iscsi_bhs_data_in *)response->ip_bhs;
608	/*
609	 * Ok, I lied.  In case of Data-In, "The fields StatSN, Status,
610	 * and Residual Count only have meaningful content if the S bit
611	 * is set to 1", so we also need to check the bit specific for
612	 * Data-In PDU.
613	 */
614	if (bhsdi->bhsdi_opcode != ISCSI_BHS_OPCODE_SCSI_DATA_IN ||
615	    (bhsdi->bhsdi_flags & BHSDI_FLAGS_S) != 0) {
616		if (ntohl(bhsdi->bhsdi_statsn) < is->is_statsn) {
617			ISCSI_SESSION_WARN(is,
618			    "PDU StatSN %d >= session StatSN %d, opcode 0x%x",
619			    is->is_statsn, ntohl(bhsdi->bhsdi_statsn),
620			    bhsdi->bhsdi_opcode);
621		}
622		is->is_statsn = ntohl(bhsdi->bhsdi_statsn);
623	}
624
625	expcmdsn = ntohl(bhsdi->bhsdi_expcmdsn);
626	maxcmdsn = ntohl(bhsdi->bhsdi_maxcmdsn);
627
628	/*
629	 * XXX: Compare using Serial Arithmetic Sense.
630	 */
631	if (maxcmdsn + 1 < expcmdsn) {
632		ISCSI_SESSION_DEBUG(is, "PDU MaxCmdSN %d + 1 < PDU ExpCmdSN %d; ignoring",
633		    maxcmdsn, expcmdsn);
634	} else {
635		if (maxcmdsn > is->is_maxcmdsn) {
636			is->is_maxcmdsn = maxcmdsn;
637
638			/*
639			 * Command window increased; kick the maintanance thread
640			 * to send out postponed commands.
641			 */
642			if (!STAILQ_EMPTY(&is->is_postponed))
643				cv_signal(&is->is_maintenance_cv);
644		} else if (maxcmdsn < is->is_maxcmdsn) {
645			ISCSI_SESSION_DEBUG(is, "PDU MaxCmdSN %d < session MaxCmdSN %d; ignoring",
646			    maxcmdsn, is->is_maxcmdsn);
647		}
648
649		if (expcmdsn > is->is_expcmdsn) {
650			is->is_expcmdsn = expcmdsn;
651		} else if (expcmdsn < is->is_expcmdsn) {
652			ISCSI_SESSION_DEBUG(is, "PDU ExpCmdSN %d < session ExpCmdSN %d; ignoring",
653			    expcmdsn, is->is_expcmdsn);
654		}
655	}
656
657	/*
658	 * Every incoming PDU - not just NOP-In - resets the ping timer.
659	 * The purpose of the timeout is to reset the connection when it stalls;
660	 * we don't want this to happen when NOP-In or NOP-Out ends up delayed
661	 * in some queue.
662	 */
663	is->is_timeout = 0;
664}
665
666static void
667iscsi_receive_callback(struct icl_pdu *response)
668{
669	struct iscsi_session *is;
670
671	is = PDU_SESSION(response);
672
673	ISCSI_SESSION_LOCK(is);
674
675#ifdef ICL_KERNEL_PROXY
676	if (is->is_login_phase) {
677		if (is->is_login_pdu == NULL)
678			is->is_login_pdu = response;
679		else
680			icl_pdu_free(response);
681		ISCSI_SESSION_UNLOCK(is);
682		cv_signal(&is->is_login_cv);
683		return;
684	}
685#endif
686
687	iscsi_pdu_update_statsn(response);
688
689	/*
690	 * The handling routine is responsible for freeing the PDU
691	 * when it's no longer needed.
692	 */
693	switch (response->ip_bhs->bhs_opcode) {
694	case ISCSI_BHS_OPCODE_NOP_IN:
695		iscsi_pdu_handle_nop_in(response);
696		break;
697	case ISCSI_BHS_OPCODE_SCSI_RESPONSE:
698		iscsi_pdu_handle_scsi_response(response);
699		break;
700	case ISCSI_BHS_OPCODE_SCSI_DATA_IN:
701		iscsi_pdu_handle_data_in(response);
702		break;
703	case ISCSI_BHS_OPCODE_LOGOUT_RESPONSE:
704		iscsi_pdu_handle_logout_response(response);
705		break;
706	case ISCSI_BHS_OPCODE_R2T:
707		iscsi_pdu_handle_r2t(response);
708		break;
709	case ISCSI_BHS_OPCODE_ASYNC_MESSAGE:
710		iscsi_pdu_handle_async_message(response);
711		break;
712	case ISCSI_BHS_OPCODE_REJECT:
713		iscsi_pdu_handle_reject(response);
714		break;
715	default:
716		ISCSI_SESSION_WARN(is, "received PDU with unsupported "
717		    "opcode 0x%x; reconnecting",
718		    response->ip_bhs->bhs_opcode);
719		iscsi_session_reconnect(is);
720		icl_pdu_free(response);
721	}
722
723	ISCSI_SESSION_UNLOCK(is);
724}
725
/*
 * Connection error notification: log a warning and request a reconnect
 * of the session that owns the connection.
 */
static void
iscsi_error_callback(struct icl_conn *ic)
{
	struct iscsi_session *session = CONN_SESSION(ic);

	ISCSI_SESSION_WARN(session, "connection error; reconnecting");
	iscsi_session_reconnect(session);
}
736
737static void
738iscsi_pdu_handle_nop_in(struct icl_pdu *response)
739{
740	struct iscsi_session *is;
741	struct iscsi_bhs_nop_out *bhsno;
742	struct iscsi_bhs_nop_in *bhsni;
743	struct icl_pdu *request;
744	void *data = NULL;
745	size_t datasize;
746	int error;
747
748	is = PDU_SESSION(response);
749	bhsni = (struct iscsi_bhs_nop_in *)response->ip_bhs;
750
751	if (bhsni->bhsni_target_transfer_tag == 0xffffffff) {
752		/*
753		 * Nothing to do; iscsi_pdu_update_statsn() already
754		 * zeroed the timeout.
755		 */
756		icl_pdu_free(response);
757		return;
758	}
759
760	datasize = icl_pdu_data_segment_length(response);
761	if (datasize > 0) {
762		data = malloc(datasize, M_ISCSI, M_NOWAIT | M_ZERO);
763		if (data == NULL) {
764			ISCSI_SESSION_WARN(is, "failed to allocate memory; "
765			    "reconnecting");
766			icl_pdu_free(response);
767			iscsi_session_reconnect(is);
768			return;
769		}
770		icl_pdu_get_data(response, 0, data, datasize);
771	}
772
773	request = icl_pdu_new_bhs(response->ip_conn, M_NOWAIT);
774	if (request == NULL) {
775		ISCSI_SESSION_WARN(is, "failed to allocate memory; "
776		    "reconnecting");
777		free(data, M_ISCSI);
778		icl_pdu_free(response);
779		iscsi_session_reconnect(is);
780		return;
781	}
782	bhsno = (struct iscsi_bhs_nop_out *)request->ip_bhs;
783	bhsno->bhsno_opcode = ISCSI_BHS_OPCODE_NOP_OUT |
784	    ISCSI_BHS_OPCODE_IMMEDIATE;
785	bhsno->bhsno_flags = 0x80;
786	bhsno->bhsno_initiator_task_tag = 0xffffffff;
787	bhsno->bhsno_target_transfer_tag = bhsni->bhsni_target_transfer_tag;
788	if (datasize > 0) {
789		error = icl_pdu_append_data(request, data, datasize, M_NOWAIT);
790		if (error != 0) {
791			ISCSI_SESSION_WARN(is, "failed to allocate memory; "
792			    "reconnecting");
793			free(data, M_ISCSI);
794			icl_pdu_free(request);
795			icl_pdu_free(response);
796			iscsi_session_reconnect(is);
797			return;
798		}
799		free(data, M_ISCSI);
800	}
801
802	icl_pdu_free(response);
803	iscsi_pdu_queue_locked(request);
804}
805
806static void
807iscsi_pdu_handle_scsi_response(struct icl_pdu *response)
808{
809	struct iscsi_bhs_scsi_response *bhssr;
810	struct iscsi_outstanding *io;
811	struct iscsi_session *is;
812	struct ccb_scsiio *csio;
813	size_t data_segment_len;
814	uint16_t sense_len;
815
816	is = PDU_SESSION(response);
817
818	bhssr = (struct iscsi_bhs_scsi_response *)response->ip_bhs;
819	io = iscsi_outstanding_find(is, bhssr->bhssr_initiator_task_tag);
820	if (io == NULL) {
821		ISCSI_SESSION_WARN(is, "bad itt 0x%x", bhssr->bhssr_initiator_task_tag);
822		icl_pdu_free(response);
823		iscsi_session_reconnect(is);
824		return;
825	}
826
827	if (bhssr->bhssr_response != BHSSR_RESPONSE_COMMAND_COMPLETED) {
828		ISCSI_SESSION_WARN(is, "service response 0x%x", bhssr->bhssr_response);
829 		if ((io->io_ccb->ccb_h.status & CAM_DEV_QFRZN) == 0) {
830 			xpt_freeze_devq(io->io_ccb->ccb_h.path, 1);
831			ISCSI_SESSION_DEBUG(is, "freezing devq");
832		}
833 		io->io_ccb->ccb_h.status = CAM_REQ_CMP_ERR | CAM_DEV_QFRZN;
834	} else if (bhssr->bhssr_status == 0) {
835		io->io_ccb->ccb_h.status = CAM_REQ_CMP;
836	} else {
837 		if ((io->io_ccb->ccb_h.status & CAM_DEV_QFRZN) == 0) {
838 			xpt_freeze_devq(io->io_ccb->ccb_h.path, 1);
839			ISCSI_SESSION_DEBUG(is, "freezing devq");
840		}
841 		io->io_ccb->ccb_h.status = CAM_SCSI_STATUS_ERROR | CAM_DEV_QFRZN;
842		io->io_ccb->csio.scsi_status = bhssr->bhssr_status;
843	}
844
845	if (bhssr->bhssr_flags & BHSSR_FLAGS_RESIDUAL_OVERFLOW) {
846		ISCSI_SESSION_WARN(is, "target indicated residual overflow");
847		icl_pdu_free(response);
848		iscsi_session_reconnect(is);
849		return;
850	}
851
852	csio = &io->io_ccb->csio;
853
854	data_segment_len = icl_pdu_data_segment_length(response);
855	if (data_segment_len > 0) {
856		if (data_segment_len < sizeof(sense_len)) {
857			ISCSI_SESSION_WARN(is, "truncated data segment (%zd bytes)",
858			    data_segment_len);
859			if ((io->io_ccb->ccb_h.status & CAM_DEV_QFRZN) == 0) {
860				xpt_freeze_devq(io->io_ccb->ccb_h.path, 1);
861				ISCSI_SESSION_DEBUG(is, "freezing devq");
862			}
863			io->io_ccb->ccb_h.status = CAM_REQ_CMP_ERR | CAM_DEV_QFRZN;
864			goto out;
865		}
866		icl_pdu_get_data(response, 0, &sense_len, sizeof(sense_len));
867		sense_len = ntohs(sense_len);
868#if 0
869		ISCSI_SESSION_DEBUG(is, "sense_len %d, data len %zd",
870		    sense_len, data_segment_len);
871#endif
872		if (sizeof(sense_len) + sense_len > data_segment_len) {
873			ISCSI_SESSION_WARN(is, "truncated data segment "
874			    "(%zd bytes, should be %zd)",
875			    data_segment_len, sizeof(sense_len) + sense_len);
876			if ((io->io_ccb->ccb_h.status & CAM_DEV_QFRZN) == 0) {
877				xpt_freeze_devq(io->io_ccb->ccb_h.path, 1);
878				ISCSI_SESSION_DEBUG(is, "freezing devq");
879			}
880			io->io_ccb->ccb_h.status = CAM_REQ_CMP_ERR | CAM_DEV_QFRZN;
881			goto out;
882		} else if (sizeof(sense_len) + sense_len < data_segment_len)
883			ISCSI_SESSION_WARN(is, "oversize data segment "
884			    "(%zd bytes, should be %zd)",
885			    data_segment_len, sizeof(sense_len) + sense_len);
886		if (sense_len > csio->sense_len) {
887			ISCSI_SESSION_DEBUG(is, "truncating sense from %d to %d",
888			    sense_len, csio->sense_len);
889			sense_len = csio->sense_len;
890		}
891		icl_pdu_get_data(response, sizeof(sense_len), &csio->sense_data, sense_len);
892		csio->sense_resid = csio->sense_len - sense_len;
893		io->io_ccb->ccb_h.status |= CAM_AUTOSNS_VALID;
894	}
895
896out:
897	if (bhssr->bhssr_flags & BHSSR_FLAGS_RESIDUAL_UNDERFLOW)
898		csio->resid = ntohl(bhssr->bhssr_residual_count);
899
900	if ((csio->ccb_h.flags & CAM_DIR_MASK) == CAM_DIR_IN) {
901		KASSERT(io->io_received <= csio->dxfer_len,
902		    ("io->io_received > csio->dxfer_len"));
903		if (io->io_received < csio->dxfer_len) {
904			if (csio->resid != csio->dxfer_len - io->io_received) {
905				ISCSI_SESSION_WARN(is, "underflow mismatch: "
906				    "target indicates %d, we calculated %zd",
907				    csio->resid,
908				    csio->dxfer_len - io->io_received);
909			}
910			csio->resid = csio->dxfer_len - io->io_received;
911		}
912	}
913
914	xpt_done(io->io_ccb);
915	iscsi_outstanding_remove(is, io);
916	icl_pdu_free(response);
917}
918
919static void
920iscsi_pdu_handle_data_in(struct icl_pdu *response)
921{
922	struct iscsi_bhs_data_in *bhsdi;
923	struct iscsi_outstanding *io;
924	struct iscsi_session *is;
925	struct ccb_scsiio *csio;
926	size_t data_segment_len;
927
928	is = PDU_SESSION(response);
929	bhsdi = (struct iscsi_bhs_data_in *)response->ip_bhs;
930	io = iscsi_outstanding_find(is, bhsdi->bhsdi_initiator_task_tag);
931	if (io == NULL) {
932		ISCSI_SESSION_WARN(is, "bad itt 0x%x", bhsdi->bhsdi_initiator_task_tag);
933		icl_pdu_free(response);
934		iscsi_session_reconnect(is);
935		return;
936	}
937
938	data_segment_len = icl_pdu_data_segment_length(response);
939	if (data_segment_len == 0) {
940		/*
941		 * "The sending of 0 length data segments should be avoided,
942		 * but initiators and targets MUST be able to properly receive
943		 * 0 length data segments."
944		 */
945		icl_pdu_free(response);
946		return;
947	}
948
949	/*
950	 * We need to track this for security reasons - without it, malicious target
951	 * could respond to SCSI READ without sending Data-In PDUs, which would result
952	 * in read operation on the initiator side returning random kernel data.
953	 */
954	if (ntohl(bhsdi->bhsdi_buffer_offset) != io->io_received) {
955		ISCSI_SESSION_WARN(is, "data out of order; expected offset %zd, got %zd",
956		    io->io_received, (size_t)ntohl(bhsdi->bhsdi_buffer_offset));
957		icl_pdu_free(response);
958		iscsi_session_reconnect(is);
959		return;
960	}
961
962	csio = &io->io_ccb->csio;
963
964	if (io->io_received + data_segment_len > csio->dxfer_len) {
965		ISCSI_SESSION_WARN(is, "oversize data segment (%zd bytes "
966		    "at offset %zd, buffer is %d)",
967		    data_segment_len, io->io_received, csio->dxfer_len);
968		icl_pdu_free(response);
969		iscsi_session_reconnect(is);
970		return;
971	}
972
973	icl_pdu_get_data(response, 0, csio->data_ptr + io->io_received, data_segment_len);
974	io->io_received += data_segment_len;
975
976	/*
977	 * XXX: Check DataSN.
978	 * XXX: Check F.
979	 */
980	if ((bhsdi->bhsdi_flags & BHSDI_FLAGS_S) == 0) {
981		/*
982		 * Nothing more to do.
983		 */
984		icl_pdu_free(response);
985		return;
986	}
987
988	//ISCSI_SESSION_DEBUG(is, "got S flag; status 0x%x", bhsdi->bhsdi_status);
989	if (bhsdi->bhsdi_status == 0) {
990		io->io_ccb->ccb_h.status = CAM_REQ_CMP;
991	} else {
992		if ((io->io_ccb->ccb_h.status & CAM_DEV_QFRZN) == 0) {
993			xpt_freeze_devq(io->io_ccb->ccb_h.path, 1);
994			ISCSI_SESSION_DEBUG(is, "freezing devq");
995		}
996		io->io_ccb->ccb_h.status = CAM_SCSI_STATUS_ERROR | CAM_DEV_QFRZN;
997		csio->scsi_status = bhsdi->bhsdi_status;
998	}
999
1000	if ((csio->ccb_h.flags & CAM_DIR_MASK) == CAM_DIR_IN) {
1001		KASSERT(io->io_received <= csio->dxfer_len,
1002		    ("io->io_received > csio->dxfer_len"));
1003		if (io->io_received < csio->dxfer_len) {
1004			csio->resid = ntohl(bhsdi->bhsdi_residual_count);
1005			if (csio->resid != csio->dxfer_len - io->io_received) {
1006				ISCSI_SESSION_WARN(is, "underflow mismatch: "
1007				    "target indicates %d, we calculated %zd",
1008				    csio->resid,
1009				    csio->dxfer_len - io->io_received);
1010			}
1011			csio->resid = csio->dxfer_len - io->io_received;
1012		}
1013	}
1014
1015	xpt_done(io->io_ccb);
1016	iscsi_outstanding_remove(is, io);
1017	icl_pdu_free(response);
1018}
1019
/*
 * Handle a Logout Response PDU: nothing is done beyond logging it at
 * debug level and freeing the PDU.
 */
static void
iscsi_pdu_handle_logout_response(struct icl_pdu *response)
{
	struct iscsi_session *is = PDU_SESSION(response);

	ISCSI_SESSION_DEBUG(is, "logout response");
	icl_pdu_free(response);
}
1027
1028static void
1029iscsi_pdu_handle_r2t(struct icl_pdu *response)
1030{
1031	struct icl_pdu *request;
1032	struct iscsi_session *is;
1033	struct iscsi_bhs_r2t *bhsr2t;
1034	struct iscsi_bhs_data_out *bhsdo;
1035	struct iscsi_outstanding *io;
1036	struct ccb_scsiio *csio;
1037	size_t off, len, total_len;
1038	int error;
1039
1040	is = PDU_SESSION(response);
1041
1042	bhsr2t = (struct iscsi_bhs_r2t *)response->ip_bhs;
1043	io = iscsi_outstanding_find(is, bhsr2t->bhsr2t_initiator_task_tag);
1044	if (io == NULL) {
1045		ISCSI_SESSION_WARN(is, "bad itt 0x%x; reconnecting",
1046		    bhsr2t->bhsr2t_initiator_task_tag);
1047		icl_pdu_free(response);
1048		iscsi_session_reconnect(is);
1049		return;
1050	}
1051
1052	csio = &io->io_ccb->csio;
1053
1054	if ((csio->ccb_h.flags & CAM_DIR_MASK) != CAM_DIR_OUT) {
1055		ISCSI_SESSION_WARN(is, "received R2T for read command; reconnecting");
1056		icl_pdu_free(response);
1057		iscsi_session_reconnect(is);
1058		return;
1059	}
1060
1061	/*
1062	 * XXX: Verify R2TSN.
1063	 */
1064
1065	io->io_datasn = 0;
1066
1067	off = ntohl(bhsr2t->bhsr2t_buffer_offset);
1068	if (off > csio->dxfer_len) {
1069		ISCSI_SESSION_WARN(is, "target requested invalid offset "
1070		    "%zd, buffer is is %d; reconnecting", off, csio->dxfer_len);
1071		icl_pdu_free(response);
1072		iscsi_session_reconnect(is);
1073		return;
1074	}
1075
1076	total_len = ntohl(bhsr2t->bhsr2t_desired_data_transfer_length);
1077	if (total_len == 0 || total_len > csio->dxfer_len) {
1078		ISCSI_SESSION_WARN(is, "target requested invalid length "
1079		    "%zd, buffer is %d; reconnecting", total_len, csio->dxfer_len);
1080		icl_pdu_free(response);
1081		iscsi_session_reconnect(is);
1082		return;
1083	}
1084
1085	//ISCSI_SESSION_DEBUG(is, "r2t; off %zd, len %zd", off, total_len);
1086
1087	for (;;) {
1088		len = total_len;
1089
1090		if (len > is->is_max_data_segment_length)
1091			len = is->is_max_data_segment_length;
1092
1093		if (off + len > csio->dxfer_len) {
1094			ISCSI_SESSION_WARN(is, "target requested invalid "
1095			    "length/offset %zd, buffer is %d; reconnecting",
1096			    off + len, csio->dxfer_len);
1097			icl_pdu_free(response);
1098			iscsi_session_reconnect(is);
1099			return;
1100		}
1101
1102		request = icl_pdu_new_bhs(response->ip_conn, M_NOWAIT);
1103		if (request == NULL) {
1104			icl_pdu_free(response);
1105			iscsi_session_reconnect(is);
1106			return;
1107		}
1108
1109		bhsdo = (struct iscsi_bhs_data_out *)request->ip_bhs;
1110		bhsdo->bhsdo_opcode = ISCSI_BHS_OPCODE_SCSI_DATA_OUT;
1111		bhsdo->bhsdo_lun = bhsr2t->bhsr2t_lun;
1112		bhsdo->bhsdo_initiator_task_tag =
1113		    bhsr2t->bhsr2t_initiator_task_tag;
1114		bhsdo->bhsdo_target_transfer_tag =
1115		    bhsr2t->bhsr2t_target_transfer_tag;
1116		bhsdo->bhsdo_datasn = htonl(io->io_datasn++);
1117		bhsdo->bhsdo_buffer_offset = htonl(off);
1118		error = icl_pdu_append_data(request, csio->data_ptr + off, len,
1119		    M_NOWAIT);
1120		if (error != 0) {
1121			ISCSI_SESSION_WARN(is, "failed to allocate memory; "
1122			    "reconnecting");
1123			icl_pdu_free(request);
1124			icl_pdu_free(response);
1125			iscsi_session_reconnect(is);
1126			return;
1127		}
1128
1129		off += len;
1130		total_len -= len;
1131
1132		if (total_len == 0) {
1133			bhsdo->bhsdo_flags |= BHSDO_FLAGS_F;
1134			//ISCSI_SESSION_DEBUG(is, "setting F, off %zd", off);
1135		} else {
1136			//ISCSI_SESSION_DEBUG(is, "not finished, off %zd", off);
1137		}
1138
1139		iscsi_pdu_queue_locked(request);
1140
1141		if (total_len == 0)
1142			break;
1143	}
1144
1145	icl_pdu_free(response);
1146}
1147
1148static void
1149iscsi_pdu_handle_async_message(struct icl_pdu *response)
1150{
1151	struct iscsi_bhs_asynchronous_message *bhsam;
1152	struct iscsi_session *is;
1153
1154	is = PDU_SESSION(response);
1155	bhsam = (struct iscsi_bhs_asynchronous_message *)response->ip_bhs;
1156	switch (bhsam->bhsam_async_event) {
1157	case BHSAM_EVENT_TARGET_REQUESTS_LOGOUT:
1158		ISCSI_SESSION_WARN(is, "target requests logout; removing session");
1159		iscsi_session_logout(is);
1160		iscsi_session_terminate(is);
1161		break;
1162	case BHSAM_EVENT_TARGET_TERMINATES_CONNECTION:
1163		ISCSI_SESSION_WARN(is, "target indicates it will drop drop the connection");
1164		break;
1165	case BHSAM_EVENT_TARGET_TERMINATES_SESSION:
1166		ISCSI_SESSION_WARN(is, "target indicates it will drop drop the session");
1167		break;
1168	default:
1169		/*
1170		 * XXX: Technically, we're obligated to also handle
1171		 * 	parameter renegotiation.
1172		 */
1173		ISCSI_SESSION_WARN(is, "ignoring AsyncEvent %d", bhsam->bhsam_async_event);
1174		break;
1175	}
1176
1177	icl_pdu_free(response);
1178}
1179
1180static void
1181iscsi_pdu_handle_reject(struct icl_pdu *response)
1182{
1183	struct iscsi_bhs_reject *bhsr;
1184	struct iscsi_session *is;
1185
1186	is = PDU_SESSION(response);
1187	bhsr = (struct iscsi_bhs_reject *)response->ip_bhs;
1188	ISCSI_SESSION_WARN(is, "received Reject PDU, reason 0x%x; protocol error?",
1189	    bhsr->bhsr_reason);
1190
1191	icl_pdu_free(response);
1192}
1193
1194static int
1195iscsi_ioctl_daemon_wait(struct iscsi_softc *sc,
1196    struct iscsi_daemon_request *request)
1197{
1198	struct iscsi_session *is;
1199	int error;
1200
1201	sx_slock(&sc->sc_lock);
1202	for (;;) {
1203		TAILQ_FOREACH(is, &sc->sc_sessions, is_next) {
1204			if (is->is_waiting_for_iscsid)
1205				break;
1206		}
1207
1208		if (is == NULL) {
1209			/*
1210			 * No session requires attention from iscsid(8); wait.
1211			 */
1212			error = cv_wait_sig(&sc->sc_cv, &sc->sc_lock);
1213			if (error != 0) {
1214				sx_sunlock(&sc->sc_lock);
1215				return (error);
1216			}
1217			continue;
1218		}
1219
1220		ISCSI_SESSION_LOCK(is);
1221		is->is_waiting_for_iscsid = false;
1222		is->is_login_phase = true;
1223		is->is_reason[0] = '\0';
1224		ISCSI_SESSION_UNLOCK(is);
1225
1226		request->idr_session_id = is->is_id;
1227		memcpy(&request->idr_conf, &is->is_conf,
1228		    sizeof(request->idr_conf));
1229
1230		sx_sunlock(&sc->sc_lock);
1231		return (0);
1232	}
1233}
1234
1235static int
1236iscsi_ioctl_daemon_handoff(struct iscsi_softc *sc,
1237    struct iscsi_daemon_handoff *handoff)
1238{
1239	struct iscsi_session *is;
1240	int error;
1241
1242	sx_slock(&sc->sc_lock);
1243
1244	/*
1245	 * Find the session to hand off socket to.
1246	 */
1247	TAILQ_FOREACH(is, &sc->sc_sessions, is_next) {
1248		if (is->is_id == handoff->idh_session_id)
1249			break;
1250	}
1251	if (is == NULL) {
1252		sx_sunlock(&sc->sc_lock);
1253		return (ESRCH);
1254	}
1255	ISCSI_SESSION_LOCK(is);
1256	if (is->is_conf.isc_discovery || is->is_terminating) {
1257		ISCSI_SESSION_UNLOCK(is);
1258		sx_sunlock(&sc->sc_lock);
1259		return (EINVAL);
1260	}
1261	if (is->is_connected) {
1262		/*
1263		 * This might have happened because another iscsid(8)
1264		 * instance handed off the connection in the meantime.
1265		 * Just return.
1266		 */
1267		ISCSI_SESSION_WARN(is, "handoff on already connected "
1268		    "session");
1269		ISCSI_SESSION_UNLOCK(is);
1270		sx_sunlock(&sc->sc_lock);
1271		return (EBUSY);
1272	}
1273
1274	strlcpy(is->is_target_alias, handoff->idh_target_alias,
1275	    sizeof(is->is_target_alias));
1276	memcpy(is->is_isid, handoff->idh_isid, sizeof(is->is_isid));
1277	is->is_statsn = handoff->idh_statsn;
1278	is->is_initial_r2t = handoff->idh_initial_r2t;
1279	is->is_immediate_data = handoff->idh_immediate_data;
1280	is->is_max_data_segment_length = handoff->idh_max_data_segment_length;
1281	is->is_max_burst_length = handoff->idh_max_burst_length;
1282	is->is_first_burst_length = handoff->idh_first_burst_length;
1283
1284	if (handoff->idh_header_digest == ISCSI_DIGEST_CRC32C)
1285		is->is_conn->ic_header_crc32c = true;
1286	else
1287		is->is_conn->ic_header_crc32c = false;
1288	if (handoff->idh_data_digest == ISCSI_DIGEST_CRC32C)
1289		is->is_conn->ic_data_crc32c = true;
1290	else
1291		is->is_conn->ic_data_crc32c = false;
1292
1293	is->is_cmdsn = 0;
1294	is->is_expcmdsn = 0;
1295	is->is_maxcmdsn = 0;
1296	is->is_waiting_for_iscsid = false;
1297	is->is_login_phase = false;
1298	is->is_timeout = 0;
1299	is->is_connected = true;
1300	is->is_reason[0] = '\0';
1301
1302	ISCSI_SESSION_UNLOCK(is);
1303
1304#ifndef ICL_KERNEL_PROXY
1305	error = icl_conn_handoff(is->is_conn, handoff->idh_socket);
1306	if (error != 0) {
1307		sx_sunlock(&sc->sc_lock);
1308		iscsi_session_terminate(is);
1309		return (error);
1310	}
1311#endif
1312
1313	sx_sunlock(&sc->sc_lock);
1314
1315	if (is->is_sim != NULL) {
1316		/*
1317		 * When reconnecting, there already is SIM allocated for the session.
1318		 */
1319		KASSERT(is->is_simq_frozen, ("reconnect without frozen simq"));
1320		ISCSI_SESSION_LOCK(is);
1321		ISCSI_SESSION_DEBUG(is, "releasing");
1322		xpt_release_simq(is->is_sim, 1);
1323		is->is_simq_frozen = false;
1324		ISCSI_SESSION_UNLOCK(is);
1325
1326	} else {
1327		ISCSI_SESSION_LOCK(is);
1328		is->is_devq = cam_simq_alloc(maxtags);
1329		if (is->is_devq == NULL) {
1330			ISCSI_SESSION_WARN(is, "failed to allocate simq");
1331			iscsi_session_terminate(is);
1332			return (ENOMEM);
1333		}
1334
1335		is->is_sim = cam_sim_alloc(iscsi_action, iscsi_poll, "iscsi",
1336		    is, is->is_id /* unit */, &is->is_lock,
1337		    maxtags, maxtags, is->is_devq);
1338		if (is->is_sim == NULL) {
1339			ISCSI_SESSION_UNLOCK(is);
1340			ISCSI_SESSION_WARN(is, "failed to allocate SIM");
1341			cam_simq_free(is->is_devq);
1342			iscsi_session_terminate(is);
1343			return (ENOMEM);
1344		}
1345
1346		error = xpt_bus_register(is->is_sim, NULL, 0);
1347		if (error != 0) {
1348			ISCSI_SESSION_UNLOCK(is);
1349			ISCSI_SESSION_WARN(is, "failed to register bus");
1350			iscsi_session_terminate(is);
1351			return (ENOMEM);
1352		}
1353
1354		error = xpt_create_path(&is->is_path, /*periph*/NULL,
1355		    cam_sim_path(is->is_sim), CAM_TARGET_WILDCARD,
1356		    CAM_LUN_WILDCARD);
1357		if (error != CAM_REQ_CMP) {
1358			ISCSI_SESSION_UNLOCK(is);
1359			ISCSI_SESSION_WARN(is, "failed to create path");
1360			iscsi_session_terminate(is);
1361			return (ENOMEM);
1362		}
1363		ISCSI_SESSION_UNLOCK(is);
1364	}
1365
1366	return (0);
1367}
1368
1369static int
1370iscsi_ioctl_daemon_fail(struct iscsi_softc *sc,
1371    struct iscsi_daemon_fail *fail)
1372{
1373	struct iscsi_session *is;
1374
1375	sx_slock(&sc->sc_lock);
1376
1377	TAILQ_FOREACH(is, &sc->sc_sessions, is_next) {
1378		if (is->is_id == fail->idf_session_id)
1379			break;
1380	}
1381	if (is == NULL) {
1382		sx_sunlock(&sc->sc_lock);
1383		return (ESRCH);
1384	}
1385	ISCSI_SESSION_LOCK(is);
1386	ISCSI_SESSION_DEBUG(is, "iscsid(8) failed: %s",
1387	    fail->idf_reason);
1388	strlcpy(is->is_reason, fail->idf_reason, sizeof(is->is_reason));
1389	//is->is_waiting_for_iscsid = false;
1390	//is->is_login_phase = true;
1391	//iscsi_session_reconnect(is);
1392	ISCSI_SESSION_UNLOCK(is);
1393	sx_sunlock(&sc->sc_lock);
1394
1395	return (0);
1396}
1397
1398#ifdef ICL_KERNEL_PROXY
1399static int
1400iscsi_ioctl_daemon_connect(struct iscsi_softc *sc,
1401    struct iscsi_daemon_connect *idc)
1402{
1403	struct iscsi_session *is;
1404	struct sockaddr *from_sa, *to_sa;
1405	int error;
1406
1407	sx_slock(&sc->sc_lock);
1408	TAILQ_FOREACH(is, &sc->sc_sessions, is_next) {
1409		if (is->is_id == idc->idc_session_id)
1410			break;
1411	}
1412	if (is == NULL) {
1413		sx_sunlock(&sc->sc_lock);
1414		return (ESRCH);
1415	}
1416	sx_sunlock(&sc->sc_lock);
1417
1418	if (idc->idc_from_addrlen > 0) {
1419		error = getsockaddr(&from_sa, (void *)idc->idc_from_addr, idc->idc_from_addrlen);
1420		if (error != 0)
1421			return (error);
1422	} else {
1423		from_sa = NULL;
1424	}
1425	error = getsockaddr(&to_sa, (void *)idc->idc_to_addr, idc->idc_to_addrlen);
1426	if (error != 0) {
1427		free(from_sa, M_SONAME);
1428		return (error);
1429	}
1430
1431	ISCSI_SESSION_LOCK(is);
1432	is->is_waiting_for_iscsid = false;
1433	is->is_login_phase = true;
1434	is->is_timeout = 0;
1435	ISCSI_SESSION_UNLOCK(is);
1436
1437	error = icl_conn_connect(is->is_conn, idc->idc_iser, idc->idc_domain,
1438	    idc->idc_socktype, idc->idc_protocol, from_sa, to_sa);
1439	free(from_sa, M_SONAME);
1440	free(to_sa, M_SONAME);
1441
1442	/*
1443	 * Digests are always disabled during login phase.
1444	 */
1445	is->is_conn->ic_header_crc32c = false;
1446	is->is_conn->ic_data_crc32c = false;
1447
1448	return (error);
1449}
1450
1451static int
1452iscsi_ioctl_daemon_send(struct iscsi_softc *sc,
1453    struct iscsi_daemon_send *ids)
1454{
1455	struct iscsi_session *is;
1456	struct icl_pdu *ip;
1457	size_t datalen;
1458	void *data;
1459	int error;
1460
1461	sx_slock(&sc->sc_lock);
1462	TAILQ_FOREACH(is, &sc->sc_sessions, is_next) {
1463		if (is->is_id == ids->ids_session_id)
1464			break;
1465	}
1466	if (is == NULL) {
1467		sx_sunlock(&sc->sc_lock);
1468		return (ESRCH);
1469	}
1470	sx_sunlock(&sc->sc_lock);
1471
1472	if (is->is_login_phase == false)
1473		return (EBUSY);
1474
1475	if (is->is_terminating || is->is_reconnecting)
1476		return (EIO);
1477
1478	datalen = ids->ids_data_segment_len;
1479	if (datalen > ISCSI_MAX_DATA_SEGMENT_LENGTH)
1480		return (EINVAL);
1481	if (datalen > 0) {
1482		data = malloc(datalen, M_ISCSI, M_WAITOK);
1483		error = copyin(ids->ids_data_segment, data, datalen);
1484		if (error != 0) {
1485			free(data, M_ISCSI);
1486			return (error);
1487		}
1488	}
1489
1490	ip = icl_pdu_new_bhs(is->is_conn, M_WAITOK);
1491	memcpy(ip->ip_bhs, ids->ids_bhs, sizeof(*ip->ip_bhs));
1492	if (datalen > 0) {
1493		error = icl_pdu_append_data(ip, data, datalen, M_WAITOK);
1494		KASSERT(error == 0, ("icl_pdu_append_data(..., M_WAITOK) failed"));
1495		free(data, M_ISCSI);
1496	}
1497	icl_pdu_queue(ip);
1498
1499	return (0);
1500}
1501
1502static int
1503iscsi_ioctl_daemon_receive(struct iscsi_softc *sc,
1504    struct iscsi_daemon_receive *idr)
1505{
1506	struct iscsi_session *is;
1507	struct icl_pdu *ip;
1508	void *data;
1509
1510	sx_slock(&sc->sc_lock);
1511	TAILQ_FOREACH(is, &sc->sc_sessions, is_next) {
1512		if (is->is_id == idr->idr_session_id)
1513			break;
1514	}
1515	if (is == NULL) {
1516		sx_sunlock(&sc->sc_lock);
1517		return (ESRCH);
1518	}
1519	sx_sunlock(&sc->sc_lock);
1520
1521	if (is->is_login_phase == false)
1522		return (EBUSY);
1523
1524	ISCSI_SESSION_LOCK(is);
1525	while (is->is_login_pdu == NULL &&
1526	    is->is_terminating == false &&
1527	    is->is_reconnecting == false)
1528		cv_wait(&is->is_login_cv, &is->is_lock);
1529	if (is->is_terminating || is->is_reconnecting) {
1530		ISCSI_SESSION_UNLOCK(is);
1531		return (EIO);
1532	}
1533	ip = is->is_login_pdu;
1534	is->is_login_pdu = NULL;
1535	ISCSI_SESSION_UNLOCK(is);
1536
1537	if (ip->ip_data_len > idr->idr_data_segment_len) {
1538		icl_pdu_free(ip);
1539		return (EMSGSIZE);
1540	}
1541
1542	copyout(ip->ip_bhs, idr->idr_bhs, sizeof(*ip->ip_bhs));
1543	if (ip->ip_data_len > 0) {
1544		data = malloc(ip->ip_data_len, M_ISCSI, M_WAITOK);
1545		icl_pdu_get_data(ip, 0, data, ip->ip_data_len);
1546		copyout(data, idr->idr_data_segment, ip->ip_data_len);
1547		free(data, M_ISCSI);
1548	}
1549
1550	icl_pdu_free(ip);
1551
1552	return (0);
1553}
1554
1555static int
1556iscsi_ioctl_daemon_close(struct iscsi_softc *sc,
1557    struct iscsi_daemon_close *idc)
1558{
1559	struct iscsi_session *is;
1560
1561	sx_slock(&sc->sc_lock);
1562	TAILQ_FOREACH(is, &sc->sc_sessions, is_next) {
1563		if (is->is_id == idc->idc_session_id)
1564			break;
1565	}
1566	if (is == NULL) {
1567		sx_sunlock(&sc->sc_lock);
1568		return (ESRCH);
1569	}
1570	sx_sunlock(&sc->sc_lock);
1571
1572	iscsi_session_reconnect(is);
1573
1574	return (0);
1575}
1576#endif /* ICL_KERNEL_PROXY */
1577
1578static void
1579iscsi_sanitize_session_conf(struct iscsi_session_conf *isc)
1580{
1581	/*
1582	 * Just make sure all the fields are null-terminated.
1583	 *
1584	 * XXX: This is not particularly secure.  We should
1585	 * 	create our own conf and then copy in relevant
1586	 * 	fields.
1587	 */
1588	isc->isc_initiator[ISCSI_NAME_LEN - 1] = '\0';
1589	isc->isc_initiator_addr[ISCSI_ADDR_LEN - 1] = '\0';
1590	isc->isc_initiator_alias[ISCSI_ALIAS_LEN - 1] = '\0';
1591	isc->isc_target[ISCSI_NAME_LEN - 1] = '\0';
1592	isc->isc_target_addr[ISCSI_ADDR_LEN - 1] = '\0';
1593	isc->isc_user[ISCSI_NAME_LEN - 1] = '\0';
1594	isc->isc_secret[ISCSI_SECRET_LEN - 1] = '\0';
1595	isc->isc_mutual_user[ISCSI_NAME_LEN - 1] = '\0';
1596	isc->isc_mutual_secret[ISCSI_SECRET_LEN - 1] = '\0';
1597}
1598
1599static int
1600iscsi_ioctl_session_add(struct iscsi_softc *sc, struct iscsi_session_add *isa)
1601{
1602	struct iscsi_session *is;
1603	const struct iscsi_session *is2;
1604	int error;
1605
1606	iscsi_sanitize_session_conf(&isa->isa_conf);
1607
1608	is = malloc(sizeof(*is), M_ISCSI, M_ZERO | M_WAITOK);
1609	memcpy(&is->is_conf, &isa->isa_conf, sizeof(is->is_conf));
1610
1611	if (is->is_conf.isc_initiator[0] == '\0' ||
1612	    is->is_conf.isc_target_addr[0] == '\0') {
1613		free(is, M_ISCSI);
1614		return (EINVAL);
1615	}
1616
1617	if ((is->is_conf.isc_discovery != 0 && is->is_conf.isc_target[0] != 0) ||
1618	    (is->is_conf.isc_discovery == 0 && is->is_conf.isc_target[0] == 0)) {
1619		free(is, M_ISCSI);
1620		return (EINVAL);
1621	}
1622
1623	sx_xlock(&sc->sc_lock);
1624
1625	/*
1626	 * Prevent duplicates.
1627	 */
1628	TAILQ_FOREACH(is2, &sc->sc_sessions, is_next) {
1629		if (!!is->is_conf.isc_discovery !=
1630		    !!is2->is_conf.isc_discovery)
1631			continue;
1632
1633		if (strcmp(is->is_conf.isc_target_addr,
1634		    is2->is_conf.isc_target_addr) != 0)
1635			continue;
1636
1637		if (is->is_conf.isc_discovery == 0 &&
1638		    strcmp(is->is_conf.isc_target,
1639		    is2->is_conf.isc_target) != 0)
1640			continue;
1641
1642		sx_xunlock(&sc->sc_lock);
1643		free(is, M_ISCSI);
1644		return (EBUSY);
1645	}
1646
1647	is->is_conn = icl_conn_new("iscsi", &is->is_lock);
1648	is->is_conn->ic_receive = iscsi_receive_callback;
1649	is->is_conn->ic_error = iscsi_error_callback;
1650	is->is_conn->ic_prv0 = is;
1651	TAILQ_INIT(&is->is_outstanding);
1652	STAILQ_INIT(&is->is_postponed);
1653	mtx_init(&is->is_lock, "iscsi_lock", NULL, MTX_DEF);
1654	cv_init(&is->is_maintenance_cv, "iscsi_mt");
1655#ifdef ICL_KERNEL_PROXY
1656	cv_init(&is->is_login_cv, "iscsi_login");
1657#endif
1658
1659	is->is_softc = sc;
1660	sc->sc_last_session_id++;
1661	is->is_id = sc->sc_last_session_id;
1662	callout_init(&is->is_callout, 1);
1663	callout_reset(&is->is_callout, 1 * hz, iscsi_callout, is);
1664	TAILQ_INSERT_TAIL(&sc->sc_sessions, is, is_next);
1665
1666	error = kthread_add(iscsi_maintenance_thread, is, NULL, NULL, 0, 0, "iscsimt");
1667	if (error != 0) {
1668		ISCSI_SESSION_WARN(is, "kthread_add(9) failed with error %d", error);
1669		return (error);
1670	}
1671
1672	/*
1673	 * Trigger immediate reconnection.
1674	 */
1675	is->is_waiting_for_iscsid = true;
1676	strlcpy(is->is_reason, "Waiting for iscsid(8)", sizeof(is->is_reason));
1677	cv_signal(&sc->sc_cv);
1678
1679	sx_xunlock(&sc->sc_lock);
1680
1681	return (0);
1682}
1683
1684static bool
1685iscsi_session_conf_matches(unsigned int id1, const struct iscsi_session_conf *c1,
1686    unsigned int id2, const struct iscsi_session_conf *c2)
1687{
1688	if (id2 == 0 && c2->isc_target[0] == '\0' &&
1689	    c2->isc_target_addr[0] == '\0')
1690		return (true);
1691	if (id2 != 0 && id2 == id1)
1692		return (true);
1693	if (c2->isc_target[0] != '\0' &&
1694	    strcmp(c1->isc_target, c2->isc_target) == 0)
1695		return (true);
1696	if (c2->isc_target_addr[0] != '\0' &&
1697	    strcmp(c1->isc_target_addr, c2->isc_target_addr) == 0)
1698		return (true);
1699	return (false);
1700}
1701
1702static int
1703iscsi_ioctl_session_remove(struct iscsi_softc *sc,
1704    struct iscsi_session_remove *isr)
1705{
1706	struct iscsi_session *is, *tmp;
1707	bool found = false;
1708
1709	iscsi_sanitize_session_conf(&isr->isr_conf);
1710
1711	sx_xlock(&sc->sc_lock);
1712	TAILQ_FOREACH_SAFE(is, &sc->sc_sessions, is_next, tmp) {
1713		ISCSI_SESSION_LOCK(is);
1714		if (iscsi_session_conf_matches(is->is_id, &is->is_conf,
1715		    isr->isr_session_id, &isr->isr_conf)) {
1716			found = true;
1717			iscsi_session_logout(is);
1718			iscsi_session_terminate(is);
1719		}
1720		ISCSI_SESSION_UNLOCK(is);
1721	}
1722	sx_xunlock(&sc->sc_lock);
1723
1724	if (!found)
1725		return (ESRCH);
1726
1727	return (0);
1728}
1729
1730static int
1731iscsi_ioctl_session_list(struct iscsi_softc *sc, struct iscsi_session_list *isl)
1732{
1733	int error;
1734	unsigned int i = 0;
1735	struct iscsi_session *is;
1736	struct iscsi_session_state iss;
1737
1738	sx_slock(&sc->sc_lock);
1739	TAILQ_FOREACH(is, &sc->sc_sessions, is_next) {
1740		if (i >= isl->isl_nentries) {
1741			sx_sunlock(&sc->sc_lock);
1742			return (EMSGSIZE);
1743		}
1744		memset(&iss, 0, sizeof(iss));
1745		memcpy(&iss.iss_conf, &is->is_conf, sizeof(iss.iss_conf));
1746		iss.iss_id = is->is_id;
1747		strlcpy(iss.iss_target_alias, is->is_target_alias, sizeof(iss.iss_target_alias));
1748		strlcpy(iss.iss_reason, is->is_reason, sizeof(iss.iss_reason));
1749
1750		if (is->is_conn->ic_header_crc32c)
1751			iss.iss_header_digest = ISCSI_DIGEST_CRC32C;
1752		else
1753			iss.iss_header_digest = ISCSI_DIGEST_NONE;
1754
1755		if (is->is_conn->ic_data_crc32c)
1756			iss.iss_data_digest = ISCSI_DIGEST_CRC32C;
1757		else
1758			iss.iss_data_digest = ISCSI_DIGEST_NONE;
1759
1760		iss.iss_max_data_segment_length = is->is_max_data_segment_length;
1761		iss.iss_immediate_data = is->is_immediate_data;
1762		iss.iss_connected = is->is_connected;
1763
1764		error = copyout(&iss, isl->isl_pstates + i, sizeof(iss));
1765		if (error != 0) {
1766			sx_sunlock(&sc->sc_lock);
1767			return (error);
1768		}
1769		i++;
1770	}
1771	sx_sunlock(&sc->sc_lock);
1772
1773	isl->isl_nentries = i;
1774
1775	return (0);
1776}
1777
1778static int
1779iscsi_ioctl(struct cdev *dev, u_long cmd, caddr_t arg, int mode,
1780    struct thread *td)
1781{
1782	struct iscsi_softc *sc;
1783
1784	sc = dev->si_drv1;
1785
1786	switch (cmd) {
1787	case ISCSIDWAIT:
1788		return (iscsi_ioctl_daemon_wait(sc,
1789		    (struct iscsi_daemon_request *)arg));
1790	case ISCSIDHANDOFF:
1791		return (iscsi_ioctl_daemon_handoff(sc,
1792		    (struct iscsi_daemon_handoff *)arg));
1793	case ISCSIDFAIL:
1794		return (iscsi_ioctl_daemon_fail(sc,
1795		    (struct iscsi_daemon_fail *)arg));
1796#ifdef ICL_KERNEL_PROXY
1797	case ISCSIDCONNECT:
1798		return (iscsi_ioctl_daemon_connect(sc,
1799		    (struct iscsi_daemon_connect *)arg));
1800	case ISCSIDSEND:
1801		return (iscsi_ioctl_daemon_send(sc,
1802		    (struct iscsi_daemon_send *)arg));
1803	case ISCSIDRECEIVE:
1804		return (iscsi_ioctl_daemon_receive(sc,
1805		    (struct iscsi_daemon_receive *)arg));
1806	case ISCSIDCLOSE:
1807		return (iscsi_ioctl_daemon_close(sc,
1808		    (struct iscsi_daemon_close *)arg));
1809#endif /* ICL_KERNEL_PROXY */
1810	case ISCSISADD:
1811		return (iscsi_ioctl_session_add(sc,
1812		    (struct iscsi_session_add *)arg));
1813	case ISCSISREMOVE:
1814		return (iscsi_ioctl_session_remove(sc,
1815		    (struct iscsi_session_remove *)arg));
1816	case ISCSISLIST:
1817		return (iscsi_ioctl_session_list(sc,
1818		    (struct iscsi_session_list *)arg));
1819	default:
1820		return (EINVAL);
1821	}
1822}
1823
/*
 * Encode a LUN number into the 8-byte LUN field layout and return those
 * eight bytes packed, in memory order, into a uint64_t.
 *
 *	lun < 256	peripheral device addressing: byte 1 = lun
 *	lun < 16384	flat space addressing: byte 0 = 0x40 | high 6 bits,
 *			byte 1 = low 8 bits
 *	otherwise	extended flat space addressing: byte 0 = 0xd2,
 *			bytes 1..3 = low 24 bits of lun, most significant
 *			byte first
 *
 * All remaining bytes are zero.
 */
static uint64_t
iscsi_encode_lun(uint32_t lun)
{
	uint8_t bytes[8] = { 0 };
	uint64_t packed;

	if (lun >= 16384) {
		/* Extended flat space addressing. */
		bytes[0] = 0xd2;
		bytes[1] = (lun >> 16) & 0xff;
		bytes[2] = (lun >> 8) & 0xff;
		bytes[3] = lun & 0xff;
	} else if (lun >= 256) {
		/* Flat space addressing. */
		bytes[0] = 0x40 | ((lun >> 8) & 0x3f);
		bytes[1] = lun & 0xff;
	} else {
		/* Peripheral device addressing. */
		bytes[1] = lun;
	}

	memcpy(&packed, bytes, sizeof(packed));
	return (packed);
}
1857
1858static struct iscsi_outstanding *
1859iscsi_outstanding_find(struct iscsi_session *is, uint32_t initiator_task_tag)
1860{
1861	struct iscsi_outstanding *io;
1862
1863	ISCSI_SESSION_LOCK_ASSERT(is);
1864
1865	TAILQ_FOREACH(io, &is->is_outstanding, io_next) {
1866		if (io->io_initiator_task_tag == initiator_task_tag)
1867			return (io);
1868	}
1869	return (NULL);
1870}
1871
1872static int
1873iscsi_outstanding_add(struct iscsi_session *is,
1874    uint32_t initiator_task_tag, union ccb *ccb)
1875{
1876	struct iscsi_outstanding *io;
1877
1878	ISCSI_SESSION_LOCK_ASSERT(is);
1879
1880	KASSERT(iscsi_outstanding_find(is, initiator_task_tag) == NULL,
1881	    ("initiator_task_tag 0x%x already added", initiator_task_tag));
1882
1883	io = uma_zalloc(iscsi_outstanding_zone, M_NOWAIT | M_ZERO);
1884	if (io == NULL) {
1885		ISCSI_SESSION_WARN(is, "failed to allocate %zd bytes", sizeof(*io));
1886		return (ENOMEM);
1887	}
1888	io->io_initiator_task_tag = initiator_task_tag;
1889	io->io_ccb = ccb;
1890	TAILQ_INSERT_TAIL(&is->is_outstanding, io, io_next);
1891	return (0);
1892}
1893
1894static void
1895iscsi_outstanding_remove(struct iscsi_session *is, struct iscsi_outstanding *io)
1896{
1897
1898	ISCSI_SESSION_LOCK_ASSERT(is);
1899
1900	TAILQ_REMOVE(&is->is_outstanding, io, io_next);
1901	uma_zfree(iscsi_outstanding_zone, io);
1902}
1903
1904static void
1905iscsi_action_scsiio(struct iscsi_session *is, union ccb *ccb)
1906{
1907	struct icl_pdu *request;
1908	struct iscsi_bhs_scsi_command *bhssc;
1909	struct ccb_scsiio *csio;
1910	size_t len;
1911	int error;
1912
1913	ISCSI_SESSION_LOCK_ASSERT(is);
1914
1915#if 0
1916	KASSERT(is->is_login_phase == false, ("%s called during Login Phase", __func__));
1917#else
1918	if (is->is_login_phase) {
1919		ISCSI_SESSION_DEBUG(is, "called during login phase");
1920		if ((ccb->ccb_h.status & CAM_DEV_QFRZN) == 0) {
1921			xpt_freeze_devq(ccb->ccb_h.path, 1);
1922			ISCSI_SESSION_DEBUG(is, "freezing devq");
1923		}
1924		ccb->ccb_h.status = CAM_REQ_ABORTED | CAM_DEV_QFRZN;
1925		xpt_done(ccb);
1926		return;
1927	}
1928#endif
1929
1930	request = icl_pdu_new_bhs(is->is_conn, M_NOWAIT);
1931	if (request == NULL) {
1932		if ((ccb->ccb_h.status & CAM_DEV_QFRZN) == 0) {
1933			xpt_freeze_devq(ccb->ccb_h.path, 1);
1934			ISCSI_SESSION_DEBUG(is, "freezing devq");
1935		}
1936		ccb->ccb_h.status = CAM_RESRC_UNAVAIL | CAM_DEV_QFRZN;
1937		xpt_done(ccb);
1938		return;
1939	}
1940
1941	csio = &ccb->csio;
1942	bhssc = (struct iscsi_bhs_scsi_command *)request->ip_bhs;
1943	bhssc->bhssc_opcode = ISCSI_BHS_OPCODE_SCSI_COMMAND;
1944	bhssc->bhssc_flags |= BHSSC_FLAGS_F;
1945	switch (csio->ccb_h.flags & CAM_DIR_MASK) {
1946	case CAM_DIR_IN:
1947		bhssc->bhssc_flags |= BHSSC_FLAGS_R;
1948		break;
1949	case CAM_DIR_OUT:
1950		bhssc->bhssc_flags |= BHSSC_FLAGS_W;
1951		break;
1952	}
1953
1954        switch (csio->tag_action) {
1955        case MSG_HEAD_OF_Q_TAG:
1956		bhssc->bhssc_flags |= BHSSC_FLAGS_ATTR_HOQ;
1957		break;
1958                break;
1959        case MSG_ORDERED_Q_TAG:
1960		bhssc->bhssc_flags |= BHSSC_FLAGS_ATTR_ORDERED;
1961                break;
1962        case MSG_ACA_TASK:
1963		bhssc->bhssc_flags |= BHSSC_FLAGS_ATTR_ACA;
1964                break;
1965        case CAM_TAG_ACTION_NONE:
1966        case MSG_SIMPLE_Q_TAG:
1967        default:
1968		bhssc->bhssc_flags |= BHSSC_FLAGS_ATTR_SIMPLE;
1969                break;
1970        }
1971
1972	bhssc->bhssc_lun = iscsi_encode_lun(csio->ccb_h.target_lun);
1973	bhssc->bhssc_initiator_task_tag = is->is_initiator_task_tag;
1974	is->is_initiator_task_tag++;
1975	bhssc->bhssc_expected_data_transfer_length = htonl(csio->dxfer_len);
1976	KASSERT(csio->cdb_len <= sizeof(bhssc->bhssc_cdb),
1977	    ("unsupported CDB size %zd", (size_t)csio->cdb_len));
1978
1979	if (csio->ccb_h.flags & CAM_CDB_POINTER)
1980		memcpy(&bhssc->bhssc_cdb, csio->cdb_io.cdb_ptr, csio->cdb_len);
1981	else
1982		memcpy(&bhssc->bhssc_cdb, csio->cdb_io.cdb_bytes, csio->cdb_len);
1983
1984	error = iscsi_outstanding_add(is, bhssc->bhssc_initiator_task_tag, ccb);
1985	if (error != 0) {
1986		icl_pdu_free(request);
1987		if ((ccb->ccb_h.status & CAM_DEV_QFRZN) == 0) {
1988			xpt_freeze_devq(ccb->ccb_h.path, 1);
1989			ISCSI_SESSION_DEBUG(is, "freezing devq");
1990		}
1991		ccb->ccb_h.status = CAM_RESRC_UNAVAIL | CAM_DEV_QFRZN;
1992		xpt_done(ccb);
1993		return;
1994	}
1995
1996	if (is->is_immediate_data &&
1997	    (csio->ccb_h.flags & CAM_DIR_MASK) == CAM_DIR_OUT) {
1998		len = csio->dxfer_len;
1999		//ISCSI_SESSION_DEBUG(is, "adding %zd of immediate data", len);
2000		if (len > is->is_first_burst_length) {
2001			ISCSI_SESSION_DEBUG(is, "len %zd -> %zd", len, is->is_first_burst_length);
2002			len = is->is_first_burst_length;
2003		}
2004
2005		error = icl_pdu_append_data(request, csio->data_ptr, len, M_NOWAIT);
2006		if (error != 0) {
2007			icl_pdu_free(request);
2008			if ((ccb->ccb_h.status & CAM_DEV_QFRZN) == 0) {
2009				xpt_freeze_devq(ccb->ccb_h.path, 1);
2010				ISCSI_SESSION_DEBUG(is, "freezing devq");
2011			}
2012			ccb->ccb_h.status = CAM_RESRC_UNAVAIL | CAM_DEV_QFRZN;
2013			xpt_done(ccb);
2014			return;
2015		}
2016	}
2017	iscsi_pdu_queue_locked(request);
2018}
2019
2020static void
2021iscsi_action(struct cam_sim *sim, union ccb *ccb)
2022{
2023	struct iscsi_session *is;
2024
2025	is = cam_sim_softc(sim);
2026
2027	ISCSI_SESSION_LOCK_ASSERT(is);
2028
2029	if (is->is_terminating) {
2030		ISCSI_SESSION_DEBUG(is, "called during termination");
2031		ccb->ccb_h.status = CAM_DEV_NOT_THERE;
2032		xpt_done(ccb);
2033		return;
2034	}
2035
2036	switch (ccb->ccb_h.func_code) {
2037	case XPT_PATH_INQ:
2038	{
2039		struct ccb_pathinq *cpi = &ccb->cpi;
2040
2041		cpi->version_num = 1;
2042		cpi->hba_inquiry = PI_TAG_ABLE;
2043		cpi->target_sprt = 0;
2044		//cpi->hba_misc = PIM_NOBUSRESET;
2045		cpi->hba_misc = 0;
2046		cpi->hba_eng_cnt = 0;
2047		cpi->max_target = 0;
2048		cpi->max_lun = 255;
2049		//cpi->initiator_id = 0; /* XXX */
2050		cpi->initiator_id = 64; /* XXX */
2051		strlcpy(cpi->sim_vid, "FreeBSD", SIM_IDLEN);
2052		strlcpy(cpi->hba_vid, "iSCSI", HBA_IDLEN);
2053		strlcpy(cpi->dev_name, cam_sim_name(sim), DEV_IDLEN);
2054		cpi->unit_number = cam_sim_unit(sim);
2055		cpi->bus_id = cam_sim_bus(sim);
2056		cpi->base_transfer_speed = 150000; /* XXX */
2057		cpi->transport = XPORT_ISCSI;
2058		cpi->transport_version = 0;
2059		cpi->protocol = PROTO_SCSI;
2060		cpi->protocol_version = SCSI_REV_SPC3;
2061		cpi->maxio = MAXPHYS;
2062		cpi->ccb_h.status = CAM_REQ_CMP;
2063		break;
2064	}
2065	case XPT_CALC_GEOMETRY:
2066		cam_calc_geometry(&ccb->ccg, /*extended*/1);
2067		ccb->ccb_h.status = CAM_REQ_CMP;
2068		break;
2069#if 0
2070	/*
2071	 * XXX: What's the point?
2072	 */
2073	case XPT_RESET_BUS:
2074	case XPT_ABORT:
2075	case XPT_TERM_IO:
2076		ISCSI_SESSION_DEBUG(is, "faking success for reset, abort, or term_io");
2077		ccb->ccb_h.status = CAM_REQ_CMP;
2078		break;
2079#endif
2080	case XPT_SCSI_IO:
2081		iscsi_action_scsiio(is, ccb);
2082		return;
2083	default:
2084#if 0
2085		ISCSI_SESSION_DEBUG(is, "got unsupported code 0x%x", ccb->ccb_h.func_code);
2086#endif
2087		ccb->ccb_h.status = CAM_FUNC_NOTAVAIL;
2088		break;
2089	}
2090	xpt_done(ccb);
2091}
2092
/*
 * CAM poll entry point for the session's SIM.  Polling is not
 * implemented; reaching this function trips an assertion.
 */
static void
iscsi_poll(struct cam_sim *sim)
{
	KASSERT(0, ("%s: you're not supposed to be here", __func__));
}
2099
2100static void
2101iscsi_shutdown(struct iscsi_softc *sc)
2102{
2103	struct iscsi_session *is;
2104
2105	ISCSI_DEBUG("removing all sessions due to shutdown");
2106
2107	sx_slock(&sc->sc_lock);
2108	TAILQ_FOREACH(is, &sc->sc_sessions, is_next)
2109		iscsi_session_terminate(is);
2110	sx_sunlock(&sc->sc_lock);
2111}
2112
2113static int
2114iscsi_load(void)
2115{
2116	int error;
2117
2118	sc = malloc(sizeof(*sc), M_ISCSI, M_ZERO | M_WAITOK);
2119	sx_init(&sc->sc_lock, "iscsi");
2120	TAILQ_INIT(&sc->sc_sessions);
2121	cv_init(&sc->sc_cv, "iscsi_cv");
2122
2123	iscsi_outstanding_zone = uma_zcreate("iscsi_outstanding",
2124	    sizeof(struct iscsi_outstanding), NULL, NULL, NULL, NULL,
2125	    UMA_ALIGN_PTR, 0);
2126
2127	error = make_dev_p(MAKEDEV_CHECKNAME, &sc->sc_cdev, &iscsi_cdevsw,
2128	    NULL, UID_ROOT, GID_WHEEL, 0600, "iscsi");
2129	if (error != 0) {
2130		ISCSI_WARN("failed to create device node, error %d", error);
2131		return (error);
2132	}
2133	sc->sc_cdev->si_drv1 = sc;
2134
2135	/*
2136	 * Note that this needs to get run before dashutdown().  Otherwise,
2137	 * when rebooting with iSCSI session with outstanding requests,
2138	 * but disconnected, dashutdown() will hang on cam_periph_runccb().
2139	 */
2140	sc->sc_shutdown_eh = EVENTHANDLER_REGISTER(shutdown_post_sync,
2141	    iscsi_shutdown, sc, SHUTDOWN_PRI_FIRST);
2142
2143	return (0);
2144}
2145
2146static int
2147iscsi_unload(void)
2148{
2149	struct iscsi_session *is, *tmp;
2150
2151	if (sc->sc_cdev != NULL) {
2152		ISCSI_DEBUG("removing device node");
2153		destroy_dev(sc->sc_cdev);
2154		ISCSI_DEBUG("device node removed");
2155	}
2156
2157	if (sc->sc_shutdown_eh != NULL)
2158		EVENTHANDLER_DEREGISTER(shutdown_post_sync, sc->sc_shutdown_eh);
2159
2160	sx_slock(&sc->sc_lock);
2161	TAILQ_FOREACH_SAFE(is, &sc->sc_sessions, is_next, tmp)
2162		iscsi_session_terminate(is);
2163	while(!TAILQ_EMPTY(&sc->sc_sessions)) {
2164		ISCSI_DEBUG("waiting for sessions to terminate");
2165		cv_wait(&sc->sc_cv, &sc->sc_lock);
2166	}
2167	ISCSI_DEBUG("all sessions terminated");
2168	sx_sunlock(&sc->sc_lock);
2169
2170	uma_zdestroy(iscsi_outstanding_zone);
2171	sx_destroy(&sc->sc_lock);
2172	cv_destroy(&sc->sc_cv);
2173	free(sc, M_ISCSI);
2174	return (0);
2175}
2176
2177static int
2178iscsi_quiesce(void)
2179{
2180	sx_slock(&sc->sc_lock);
2181	if (!TAILQ_EMPTY(&sc->sc_sessions)) {
2182		sx_sunlock(&sc->sc_lock);
2183		return (EBUSY);
2184	}
2185	sx_sunlock(&sc->sc_lock);
2186	return (0);
2187}
2188
2189static int
2190iscsi_modevent(module_t mod, int what, void *arg)
2191{
2192	int error;
2193
2194	switch (what) {
2195	case MOD_LOAD:
2196		error = iscsi_load();
2197		break;
2198	case MOD_UNLOAD:
2199		error = iscsi_unload();
2200		break;
2201	case MOD_QUIESCE:
2202		error = iscsi_quiesce();
2203		break;
2204	default:
2205		error = EINVAL;
2206		break;
2207	}
2208	return (error);
2209}
2210
/*
 * Module descriptor: module name, event handler, and an extra argument
 * (unused, 0) that is passed to the handler.
 */
moduledata_t iscsi_data = {
	"iscsi",
	iscsi_modevent,
	0
};

/*
 * Register the module at the SI_SUB_DRIVERS / SI_ORDER_MIDDLE
 * initialisation stage and declare its dependencies on the cam and icl
 * modules (version 1 for minimum, preferred and maximum).
 */
DECLARE_MODULE(iscsi, iscsi_data, SI_SUB_DRIVERS, SI_ORDER_MIDDLE);
MODULE_DEPEND(iscsi, cam, 1, 1, 1);
MODULE_DEPEND(iscsi, icl, 1, 1, 1);

2220