aboutsummaryrefslogtreecommitdiff
path: root/sys/dev
diff options
context:
space:
mode:
author Edward Tomasz Napierala <trasz@FreeBSD.org> 2013-09-14 15:29:06 +0000
committer Edward Tomasz Napierala <trasz@FreeBSD.org> 2013-09-14 15:29:06 +0000
commit 009ea47eb2d21856af4529aaaca32cd67748daea (patch)
tree d04af1389a0e20c7613b9dccaf4f3176084e40cc /sys/dev
parent 196beb53597c7f328bf31034397007e494ce7421 (diff)
Bring in the new iSCSI target and initiator.
Reviewed by: ken (parts) Approved by: re (delphij) Sponsored by: FreeBSD Foundation
Notes
Notes: svn path=/head/; revision=255570
Diffstat (limited to 'sys/dev')
-rw-r--r-- sys/dev/iscsi/icl.c 1292
-rw-r--r-- sys/dev/iscsi/icl.h 151
-rw-r--r-- sys/dev/iscsi/icl_proxy.c 397
-rw-r--r-- sys/dev/iscsi/iscsi.c 2109
-rw-r--r-- sys/dev/iscsi/iscsi.h 135
-rw-r--r-- sys/dev/iscsi/iscsi_ioctl.h 201
-rw-r--r-- sys/dev/iscsi/iscsi_proto.h 439
-rw-r--r-- sys/dev/iscsi_initiator/iscsi.c 6
8 files changed, 4727 insertions, 3 deletions
diff --git a/sys/dev/iscsi/icl.c b/sys/dev/iscsi/icl.c
new file mode 100644
index 000000000000..eb9cf4efcd3a
--- /dev/null
+++ b/sys/dev/iscsi/icl.c
@@ -0,0 +1,1292 @@
+/*-
+ * Copyright (c) 2012 The FreeBSD Foundation
+ * All rights reserved.
+ *
+ * This software was developed by Edward Tomasz Napierala under sponsorship
+ * from the FreeBSD Foundation.
+ *
+ * Redistribution and use in source and binary forms, with or without
+ * modification, are permitted provided that the following conditions
+ * are met:
+ * 1. Redistributions of source code must retain the above copyright
+ * notice, this list of conditions and the following disclaimer.
+ * 2. Redistributions in binary form must reproduce the above copyright
+ * notice, this list of conditions and the following disclaimer in the
+ * documentation and/or other materials provided with the distribution.
+ *
+ * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
+ * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
+ * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
+ * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
+ * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
+ * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
+ * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
+ * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
+ * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
+ * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
+ * SUCH DAMAGE.
+ *
+ * $FreeBSD$
+ */
+
+/*
+ * iSCSI Common Layer. It's used by both the initiator and target to send
+ * and receive iSCSI PDUs.
+ */
+
+#include <sys/param.h>
+#include <sys/capability.h>
+#include <sys/condvar.h>
+#include <sys/conf.h>
+#include <sys/file.h>
+#include <sys/kernel.h>
+#include <sys/kthread.h>
+#include <sys/lock.h>
+#include <sys/mbuf.h>
+#include <sys/mutex.h>
+#include <sys/module.h>
+#include <sys/socket.h>
+#include <sys/socketvar.h>
+#include <sys/sysctl.h>
+#include <sys/systm.h>
+#include <sys/sx.h>
+#include <sys/uio.h>
+#include <vm/uma.h>
+#include <netinet/in.h>
+#include <netinet/tcp.h>
+
+#include "icl.h"
+#include "iscsi_proto.h"
+
+/*
+ * Sysctl node and loader tunables for the iSCSI Common Layer; everything
+ * below is published under kern.icl.
+ */
+SYSCTL_NODE(_kern, OID_AUTO, icl, CTLFLAG_RD, 0, "iSCSI Common Layer");
+/* Message verbosity: ICL_WARN() prints when > 0, ICL_DEBUG() when > 1. */
+static int debug = 1;
+TUNABLE_INT("kern.icl.debug", &debug);
+SYSCTL_INT(_kern_icl, OID_AUTO, debug, CTLFLAG_RW,
+ &debug, 1, "Enable debug messages");
+/*
+ * Upper bound on the number of data segment bytes the receive path waits
+ * for in one go; see icl_pdu_data_segment_receive_len().
+ */
+static int partial_receive_len = 1 * 1024; /* XXX: More? */
+TUNABLE_INT("kern.icl.partial_receive_len", &partial_receive_len);
+SYSCTL_INT(_kern_icl, OID_AUTO, partial_receive_len, CTLFLAG_RW,
+ &partial_receive_len, 1 * 1024, "Minimum read size for partially received "
+ "data segment");
+
+/* UMA zones that struct icl_conn and struct icl_pdu are allocated from. */
+static uma_zone_t icl_conn_zone;
+static uma_zone_t icl_pdu_zone;
+
+/* Count of live connections; icl_unload() returns EBUSY while it is nonzero. */
+static volatile u_int icl_ncons;
+
+/*
+ * Logging helpers.  Both prefix the message with the calling function's
+ * name and append a newline; ICL_DEBUG() prints when debug > 1, ICL_WARN()
+ * when debug > 0.
+ *
+ * The bodies are wrapped in do { ... } while (0) so that an invocation is
+ * exactly one statement and cannot capture the "else" of an enclosing
+ * if/else.
+ */
+#define	ICL_DEBUG(X, ...)						\
+	do {								\
+		if (debug > 1) {					\
+			printf("%s: " X "\n", __func__, ## __VA_ARGS__);\
+		}							\
+	} while (0)
+
+#define	ICL_WARN(X, ...)						\
+	do {								\
+		if (debug > 0) {					\
+			printf("WARNING: %s: " X "\n",			\
+			    __func__, ## __VA_ARGS__);			\
+		}							\
+	} while (0)
+
+/*
+ * Wrappers around the per-connection mutex, ic_lock.  The argument is
+ * parenthesized so that any pointer expression can be passed safely.
+ */
+#define	ICL_CONN_LOCK(X)		mtx_lock(&(X)->ic_lock)
+#define	ICL_CONN_UNLOCK(X)		mtx_unlock(&(X)->ic_lock)
+#define	ICL_CONN_LOCK_ASSERT(X)		mtx_assert(&(X)->ic_lock, MA_OWNED)
+
+/*
+ * Flag the connection's socket as broken and invoke the owner's ic_error
+ * callback.  A connection without a socket is left untouched.
+ */
+static void
+icl_conn_fail(struct icl_conn *ic)
+{
+	struct socket *so;
+
+	so = ic->ic_socket;
+	if (so != NULL) {
+		/*
+		 * XXX
+		 */
+		so->so_error = EDOOFUS;
+		(ic->ic_error)(ic);
+	}
+}
+
+/*
+ * Pull exactly "len" bytes off the connection's socket without blocking
+ * and return them as an mbuf chain.  Returns NULL when soreceive() fails
+ * or delivers fewer bytes than requested; a short chain is freed.
+ */
+static struct mbuf *
+icl_conn_receive(struct icl_conn *ic, size_t len)
+{
+	struct mbuf *chain;
+	struct uio io;
+	int rcvflags, rv;
+
+	memset(&io, 0, sizeof(io));
+	io.uio_resid = len;
+	rcvflags = MSG_DONTWAIT;
+
+	rv = soreceive(ic->ic_socket, NULL, &io, &chain, NULL, &rcvflags);
+	if (rv != 0) {
+		ICL_DEBUG("soreceive error %d", rv);
+		return (NULL);
+	}
+	if (io.uio_resid == 0) {
+		return (chain);
+	}
+
+	m_freem(chain);
+	ICL_DEBUG("short read");
+	return (NULL);
+}
+
+/*
+ * Allocate a zeroed PDU bound to "ic" and account for it in
+ * ic_outstanding_pdus.  "flags" is handed to uma_zalloc(); returns NULL,
+ * with the accounting undone, when the allocation fails.
+ */
+static struct icl_pdu *
+icl_pdu_new(struct icl_conn *ic, int flags)
+{
+	struct icl_pdu *pdu;
+
+	refcount_acquire(&ic->ic_outstanding_pdus);
+
+	pdu = uma_zalloc(icl_pdu_zone, flags | M_ZERO);
+	if (pdu != NULL) {
+		pdu->ip_conn = ic;
+		return (pdu);
+	}
+
+	ICL_WARN("failed to allocate %zd bytes", sizeof(*pdu));
+	refcount_release(&ic->ic_outstanding_pdus);
+	return (NULL);
+}
+
+/*
+ * Release a PDU: free its BHS, AHS and data mbuf chains, return the
+ * structure to its zone and drop the owning connection's outstanding-PDU
+ * count.
+ */
+void
+icl_pdu_free(struct icl_pdu *ip)
+{
+	struct icl_conn *owner = ip->ip_conn;
+
+	m_freem(ip->ip_bhs_mbuf);
+	m_freem(ip->ip_ahs_mbuf);
+	m_freem(ip->ip_data_mbuf);
+	uma_zfree(icl_pdu_zone, ip);
+
+	/* "ip" is gone by now; only the saved connection pointer is used. */
+	refcount_release(&owner->ic_outstanding_pdus);
+}
+
+/*
+ * Allocate icl_pdu with empty BHS to fill up by the caller.
+ *
+ * "flags" is passed to both the PDU and the mbuf allocation.  Returns
+ * NULL if either allocation fails; a PDU that was already allocated is
+ * freed again in that case.  On success ip_bhs points at a zeroed
+ * struct iscsi_bhs stored in ip_bhs_mbuf.
+ */
+struct icl_pdu *
+icl_pdu_new_bhs(struct icl_conn *ic, int flags)
+{
+	struct icl_pdu *ip;
+
+	ip = icl_pdu_new(ic, flags);
+	if (ip == NULL)
+		return (NULL);
+
+	ip->ip_bhs_mbuf = m_getm2(NULL, sizeof(struct iscsi_bhs),
+	    flags, MT_DATA, M_PKTHDR);
+	if (ip->ip_bhs_mbuf == NULL) {
+		/* Report the size of the mbuf request, not of the PDU. */
+		ICL_WARN("failed to allocate %zd bytes",
+		    sizeof(struct iscsi_bhs));
+		icl_pdu_free(ip);
+		return (NULL);
+	}
+	ip->ip_bhs = mtod(ip->ip_bhs_mbuf, struct iscsi_bhs *);
+	memset(ip->ip_bhs, 0, sizeof(struct iscsi_bhs));
+	ip->ip_bhs_mbuf->m_len = sizeof(struct iscsi_bhs);
+
+	return (ip);
+}
+
+/*
+ * Return the AHS length in bytes, i.e. the BHS bhs_total_ahs_len field
+ * multiplied by four.
+ */
+static int
+icl_pdu_ahs_length(const struct icl_pdu *request)
+{
+	const struct iscsi_bhs *bhs = request->ip_bhs;
+
+	return (bhs->bhs_total_ahs_len * 4);
+}
+
+/*
+ * Decode the three-byte, most-significant-byte-first data segment length
+ * stored in the PDU's BHS.
+ */
+size_t
+icl_pdu_data_segment_length(const struct icl_pdu *request)
+{
+	uint32_t len;
+
+	len = request->ip_bhs->bhs_data_segment_len[0];
+	len = (len << 8) + request->ip_bhs->bhs_data_segment_len[1];
+	len = (len << 8) + request->ip_bhs->bhs_data_segment_len[2];
+
+	return (len);
+}
+
+/*
+ * Store "len" into the BHS data segment length field as three bytes,
+ * most significant byte first.
+ */
+static void
+icl_pdu_set_data_segment_length(struct icl_pdu *response, uint32_t len)
+{
+	struct iscsi_bhs *bhs = response->ip_bhs;
+
+	bhs->bhs_data_segment_len[0] = len >> 16;
+	bhs->bhs_data_segment_len[1] = len >> 8;
+	bhs->bhs_data_segment_len[2] = len;
+}
+
+/*
+ * Number of pad bytes (0-3) needed to round the PDU's ip_data_len up to
+ * a multiple of four.
+ */
+static size_t
+icl_pdu_padding(const struct icl_pdu *ip)
+{
+	size_t rem = ip->ip_data_len % 4;
+
+	return (rem == 0 ? 0 : 4 - rem);
+}
+
+/*
+ * Compute how many bytes the PDU occupies when sent: BHS, data segment
+ * with padding, and whichever digests the connection has enabled.  The
+ * PDU must not carry an AHS.
+ */
+static size_t
+icl_pdu_size(const struct icl_pdu *response)
+{
+	const struct icl_conn *ic = response->ip_conn;
+	size_t total;
+
+	KASSERT(response->ip_ahs_len == 0, ("responding with AHS"));
+
+	total = sizeof(struct iscsi_bhs);
+	if (ic->ic_header_crc32c)
+		total += ISCSI_HEADER_DIGEST_SIZE;
+	total += response->ip_data_len + icl_pdu_padding(response);
+	if (ic->ic_data_crc32c)
+		total += ISCSI_DATA_DIGEST_SIZE;
+
+	return (total);
+}
+
+/*
+ * Read the Basic Header Segment from the socket into the PDU and point
+ * ip_bhs at it.  On success *availablep is reduced by the BHS size and 0
+ * is returned; -1 is returned when the read or m_pullup() fails.
+ */
+static int
+icl_pdu_receive_bhs(struct icl_pdu *request, size_t *availablep)
+{
+	struct mbuf *hdr;
+
+	hdr = icl_conn_receive(request->ip_conn, sizeof(struct iscsi_bhs));
+	if (hdr == NULL) {
+		ICL_DEBUG("failed to receive BHS");
+		return (-1);
+	}
+
+	/* Make the whole BHS contiguous so it can be accessed via mtod(). */
+	hdr = m_pullup(hdr, sizeof(struct iscsi_bhs));
+	request->ip_bhs_mbuf = hdr;
+	if (hdr == NULL) {
+		ICL_WARN("m_pullup failed");
+		return (-1);
+	}
+
+	/*
+	 * XXX: For architectures with strict alignment requirements
+	 * 	we may need to allocate ip_bhs and copy the data into it.
+	 * 	For some reason, though, not doing this doesn't seem
+	 * 	to cause problems; tested on sparc64.
+	 */
+	request->ip_bhs = mtod(hdr, struct iscsi_bhs *);
+
+	*availablep -= sizeof(struct iscsi_bhs);
+	return (0);
+}
+
+/*
+ * Read the Additional Header Segment, if the BHS announces one, into
+ * ip_ahs_mbuf.  Returns 0 on success (including "no AHS") and -1 when
+ * the read fails; *availablep is reduced by the number of bytes consumed.
+ */
+static int
+icl_pdu_receive_ahs(struct icl_pdu *request, size_t *availablep)
+{
+	struct mbuf *ahs;
+
+	request->ip_ahs_len = icl_pdu_ahs_length(request);
+	if (request->ip_ahs_len != 0) {
+		ahs = icl_conn_receive(request->ip_conn, request->ip_ahs_len);
+		request->ip_ahs_mbuf = ahs;
+		if (ahs == NULL) {
+			ICL_DEBUG("failed to receive AHS");
+			return (-1);
+		}
+		*availablep -= request->ip_ahs_len;
+	}
+
+	return (0);
+}
+
+/*
+ * Compute the digest of an mbuf chain: calculate_crc32c() is run over
+ * every mbuf in turn, starting from 0xffffffff, and the result is
+ * inverted.
+ */
+static uint32_t
+icl_mbuf_to_crc32c(const struct mbuf *m0)
+{
+	const struct mbuf *cur = m0;
+	uint32_t crc = 0xffffffff;
+
+	while (cur != NULL) {
+		crc = calculate_crc32c(crc, mtod(cur, const void *),
+		    cur->m_len);
+		cur = cur->m_next;
+	}
+
+	return (crc ^ 0xffffffff);
+}
+
+/*
+ * Receive the header digest, when the connection has header digests
+ * enabled, and compare it against the CRC32C of the received BHS.
+ *
+ * Returns 0 when digests are disabled or the digest matches, and -1 when
+ * the digest cannot be read or does not match.  *availablep is reduced by
+ * the digest size once the digest has been read.
+ */
+static int
+icl_pdu_check_header_digest(struct icl_pdu *request, size_t *availablep)
+{
+	struct mbuf *m;
+	uint32_t received_digest, valid_digest;
+
+	if (request->ip_conn->ic_header_crc32c == false)
+		return (0);
+
+	m = icl_conn_receive(request->ip_conn, ISCSI_HEADER_DIGEST_SIZE);
+	if (m == NULL) {
+		ICL_DEBUG("failed to receive header digest");
+		return (-1);
+	}
+
+	CTASSERT(sizeof(received_digest) == ISCSI_HEADER_DIGEST_SIZE);
+	/*
+	 * The digest bytes may be spread over more than one mbuf, so copy
+	 * them out of the chain instead of reading through mtod().
+	 */
+	m_copydata(m, 0, ISCSI_HEADER_DIGEST_SIZE, (void *)&received_digest);
+	m_freem(m);
+
+	*availablep -= ISCSI_HEADER_DIGEST_SIZE;
+
+	/*
+	 * XXX: Handle AHS.
+	 */
+	valid_digest = icl_mbuf_to_crc32c(request->ip_bhs_mbuf);
+	if (received_digest != valid_digest) {
+		ICL_WARN("header digest check failed; got 0x%x, "
+		    "should be 0x%x", received_digest, valid_digest);
+		return (-1);
+	}
+
+	return (0);
+}
+
+/*
+ * Return the number of bytes that should be waiting in the receive socket
+ * before icl_pdu_receive_data_segment() gets called.
+ *
+ * The result is 0 for a PDU without a data segment.  Otherwise it is the
+ * part of the data segment not yet received, either capped at
+ * partial_receive_len (no padding added) or, when it is below that cap,
+ * rounded up to a multiple of four to cover the padding.
+ */
+static size_t
+icl_pdu_data_segment_receive_len(const struct icl_pdu *request)
+{
+ size_t len;
+
+ len = icl_pdu_data_segment_length(request);
+ if (len == 0)
+ return (0);
+
+ /*
+ * Account for the parts of data segment already read from
+ * the socket buffer.
+ */
+ KASSERT(len > request->ip_data_len, ("len <= request->ip_data_len"));
+ len -= request->ip_data_len;
+
+ /*
+ * Don't always wait for the full data segment to be delivered
+ * to the socket; this might badly affect performance due to
+ * TCP window scaling.
+ */
+ if (len > partial_receive_len) {
+#if 0
+ ICL_DEBUG("need %zd bytes of data, limiting to %zd",
+ len, partial_receive_len));
+#endif
+ len = partial_receive_len;
+
+ /* Capped request: more data follows, so no padding is added. */
+ return (len);
+ }
+
+ /*
+ * Account for padding. Note that due to the way code is written,
+ * the icl_pdu_receive_data_segment() must always receive padding
+ * along with the last part of data segment, because it would be
+ * impossible to tell whether we've already received the full data
+ * segment including padding, or without it.
+ */
+ if ((len % 4) != 0)
+ len += 4 - (len % 4);
+
+#if 0
+ ICL_DEBUG("need %zd bytes of data", len));
+#endif
+
+ return (len);
+}
+
+/*
+ * Receive the data segment of "request", or as much of it as the socket
+ * buffer currently holds, and append it to ip_data_mbuf.
+ *
+ * *availablep is the number of bytes known to be in the socket buffer and
+ * is reduced by what gets consumed.  *more_neededp is set to true when
+ * only part of the segment could be read; in that case ic_receive_len is
+ * set to the amount to wait for before the next call.  Returns 0 on
+ * success and -1 when the socket read fails.
+ */
+static int
+icl_pdu_receive_data_segment(struct icl_pdu *request,
+ size_t *availablep, bool *more_neededp)
+{
+ struct icl_conn *ic;
+ size_t len, padding = 0;
+ struct mbuf *m;
+
+ ic = request->ip_conn;
+
+ *more_neededp = false;
+ ic->ic_receive_len = 0;
+
+ len = icl_pdu_data_segment_length(request);
+ if (len == 0)
+ return (0);
+
+ /* Padding is derived from the full segment length in the BHS. */
+ if ((len % 4) != 0)
+ padding = 4 - (len % 4);
+
+ /*
+ * Account for already received parts of data segment.
+ */
+ KASSERT(len > request->ip_data_len, ("len <= request->ip_data_len"));
+ len -= request->ip_data_len;
+
+ if (len + padding > *availablep) {
+ /*
+ * Not enough data in the socket buffer. Receive as much
+ * as we can. Don't receive padding, since, obviously, it's
+ * not the end of data segment yet.
+ */
+#if 0
+ ICL_DEBUG("limited from %zd to %zd",
+ len + padding, *availablep - padding));
+#endif
+ /*
+ * NOTE(review): this subtraction is unsigned; it presumably relies
+ * on *availablep >= padding here -- confirm against the callers.
+ */
+ len = *availablep - padding;
+ *more_neededp = true;
+ padding = 0;
+ }
+
+ /*
+ * Must not try to receive padding without at least one byte
+ * of actual data segment.
+ */
+ if (len > 0) {
+ m = icl_conn_receive(request->ip_conn, len + padding);
+ if (m == NULL) {
+ ICL_DEBUG("failed to receive data segment");
+ return (-1);
+ }
+
+ if (request->ip_data_mbuf == NULL)
+ request->ip_data_mbuf = m;
+ else
+ m_cat(request->ip_data_mbuf, m);
+
+ /* ip_data_len counts payload only; padding is not included. */
+ request->ip_data_len += len;
+ *availablep -= len + padding;
+ } else
+ ICL_DEBUG("len 0");
+
+ if (*more_neededp)
+ ic->ic_receive_len =
+ icl_pdu_data_segment_receive_len(request);
+
+ return (0);
+}
+
+/*
+ * Receive the data digest, when the connection has data digests enabled
+ * and the PDU carries data, and compare it against the CRC32C of the
+ * received data segment.
+ *
+ * Returns 0 when there is nothing to check or the digest matches, and -1
+ * when the digest cannot be read or does not match.  *availablep is
+ * reduced by the digest size once the digest has been read.
+ */
+static int
+icl_pdu_check_data_digest(struct icl_pdu *request, size_t *availablep)
+{
+	struct mbuf *m;
+	uint32_t received_digest, valid_digest;
+
+	if (request->ip_conn->ic_data_crc32c == false)
+		return (0);
+
+	if (request->ip_data_len == 0)
+		return (0);
+
+	m = icl_conn_receive(request->ip_conn, ISCSI_DATA_DIGEST_SIZE);
+	if (m == NULL) {
+		ICL_DEBUG("failed to receive data digest");
+		return (-1);
+	}
+
+	CTASSERT(sizeof(received_digest) == ISCSI_DATA_DIGEST_SIZE);
+	/*
+	 * The digest bytes may be spread over more than one mbuf, so copy
+	 * them out of the chain instead of reading through mtod().
+	 */
+	m_copydata(m, 0, ISCSI_DATA_DIGEST_SIZE, (void *)&received_digest);
+	m_freem(m);
+
+	*availablep -= ISCSI_DATA_DIGEST_SIZE;
+
+	/*
+	 * Note that ip_data_mbuf also contains padding; since digest
+	 * calculation is supposed to include that, we iterate over
+	 * the entire ip_data_mbuf chain, not just ip_data_len bytes of it.
+	 */
+	valid_digest = icl_mbuf_to_crc32c(request->ip_data_mbuf);
+	if (received_digest != valid_digest) {
+		ICL_WARN("data digest check failed; got 0x%x, "
+		    "should be 0x%x", received_digest, valid_digest);
+		return (-1);
+	}
+
+	return (0);
+}
+
+/*
+ * Somewhat contrary to the name, this attempts to receive only one
+ * "part" of PDU at a time; call it repeatedly until it returns non-NULL.
+ *
+ * The connection's receive state machine walks through BHS, AHS, header
+ * digest, data segment and data digest.  Each call handles the current
+ * state, provided *availablep covers ic_receive_len, and sets up
+ * ic_receive_state/ic_receive_len for the next one.  *availablep is
+ * reduced by the number of bytes consumed.
+ *
+ * Returns the completed PDU after the data digest step, and NULL when the
+ * PDU is not complete yet or the connection has been failed through
+ * icl_conn_fail().
+ */
+static struct icl_pdu *
+icl_conn_receive_pdu(struct icl_conn *ic, size_t *availablep)
+{
+	struct icl_pdu *request;
+	size_t len;
+	int error = 0;
+	bool more_needed;
+
+	/*
+	 * Check for sufficient data before touching any state, so that
+	 * bailing out here never leaves a freshly allocated PDU behind
+	 * in ic_receive_pdu while the state is still ICL_CONN_STATE_BHS.
+	 */
+	if (*availablep < ic->ic_receive_len)
+		return (NULL);
+
+	if (ic->ic_receive_state == ICL_CONN_STATE_BHS) {
+		KASSERT(ic->ic_receive_pdu == NULL,
+		    ("ic->ic_receive_pdu != NULL"));
+		request = icl_pdu_new(ic, M_NOWAIT);
+		if (request == NULL) {
+			ICL_DEBUG("failed to allocate PDU; "
+			    "dropping connection");
+			icl_conn_fail(ic);
+			return (NULL);
+		}
+		ic->ic_receive_pdu = request;
+	} else {
+		KASSERT(ic->ic_receive_pdu != NULL,
+		    ("ic->ic_receive_pdu == NULL"));
+		request = ic->ic_receive_pdu;
+	}
+
+	switch (ic->ic_receive_state) {
+	case ICL_CONN_STATE_BHS:
+		error = icl_pdu_receive_bhs(request, availablep);
+		if (error != 0) {
+			ICL_DEBUG("failed to receive BHS; "
+			    "dropping connection");
+			break;
+		}
+
+		/*
+		 * We don't enforce any limit for AHS length;
+		 * its length is stored in 8 bit field.
+		 */
+
+		len = icl_pdu_data_segment_length(request);
+		if (len > ic->ic_max_data_segment_length) {
+			ICL_WARN("received data segment "
+			    "length %zd is larger than negotiated "
+			    "MaxDataSegmentLength %zd; "
+			    "dropping connection",
+			    len, ic->ic_max_data_segment_length);
+			/* Without an error the connection is never dropped. */
+			error = EINVAL;
+			break;
+		}
+
+		ic->ic_receive_state = ICL_CONN_STATE_AHS;
+		ic->ic_receive_len = icl_pdu_ahs_length(request);
+		break;
+
+	case ICL_CONN_STATE_AHS:
+		error = icl_pdu_receive_ahs(request, availablep);
+		if (error != 0) {
+			ICL_DEBUG("failed to receive AHS; "
+			    "dropping connection");
+			break;
+		}
+		ic->ic_receive_state = ICL_CONN_STATE_HEADER_DIGEST;
+		if (ic->ic_header_crc32c == false)
+			ic->ic_receive_len = 0;
+		else
+			ic->ic_receive_len = ISCSI_HEADER_DIGEST_SIZE;
+		break;
+
+	case ICL_CONN_STATE_HEADER_DIGEST:
+		error = icl_pdu_check_header_digest(request, availablep);
+		if (error != 0) {
+			ICL_DEBUG("header digest failed; "
+			    "dropping connection");
+			break;
+		}
+
+		ic->ic_receive_state = ICL_CONN_STATE_DATA;
+		ic->ic_receive_len =
+		    icl_pdu_data_segment_receive_len(request);
+		break;
+
+	case ICL_CONN_STATE_DATA:
+		error = icl_pdu_receive_data_segment(request, availablep,
+		    &more_needed);
+		if (error != 0) {
+			ICL_DEBUG("failed to receive data segment;"
+			    "dropping connection");
+			break;
+		}
+
+		/* Stay in this state until the whole segment has arrived. */
+		if (more_needed)
+			break;
+
+		ic->ic_receive_state = ICL_CONN_STATE_DATA_DIGEST;
+		if (ic->ic_data_crc32c == false)
+			ic->ic_receive_len = 0;
+		else
+			ic->ic_receive_len = ISCSI_DATA_DIGEST_SIZE;
+		break;
+
+	case ICL_CONN_STATE_DATA_DIGEST:
+		error = icl_pdu_check_data_digest(request, availablep);
+		if (error != 0) {
+			ICL_DEBUG("data digest failed; "
+			    "dropping connection");
+			break;
+		}
+
+		/*
+		 * We've received complete PDU; reset the receive state machine
+		 * and return the PDU.
+		 */
+		ic->ic_receive_state = ICL_CONN_STATE_BHS;
+		ic->ic_receive_len = sizeof(struct iscsi_bhs);
+		ic->ic_receive_pdu = NULL;
+		return (request);
+
+	default:
+		panic("invalid ic_receive_state %d\n", ic->ic_receive_state);
+	}
+
+	if (error != 0) {
+		/*
+		 * Don't free the PDU here: ic->ic_receive_pdu still points
+		 * to it and icl_conn_close() frees it from there.  Freeing
+		 * it in both places would be a double free.
+		 */
+		icl_conn_fail(ic);
+	}
+
+	return (NULL);
+}
+
+/*
+ * Consume up to "available" bytes from the socket, turning them into PDUs
+ * and handing every complete PDU to the connection's ic_receive callback.
+ *
+ * Returns when the connection is disconnecting, when the socket reports
+ * an error (the connection is failed first), when there is less data left
+ * than the receive state machine needs, or after dropping the connection
+ * because of a PDU carrying an AHS.
+ */
+static void
+icl_conn_receive_pdus(struct icl_conn *ic, size_t available)
+{
+ struct icl_pdu *response;
+ struct socket *so;
+
+ so = ic->ic_socket;
+
+ /*
+ * This can never happen; we're careful to only mess with ic->ic_socket
+ * pointer when the send/receive threads are not running.
+ */
+ KASSERT(so != NULL, ("NULL socket"));
+
+ for (;;) {
+ if (ic->ic_disconnecting)
+ return;
+
+ if (so->so_error != 0) {
+ ICL_DEBUG("connection error %d; "
+ "dropping connection", so->so_error);
+ icl_conn_fail(ic);
+ return;
+ }
+
+ /*
+ * Loop until we have a complete PDU or there is not enough
+ * data in the socket buffer.
+ */
+ if (available < ic->ic_receive_len) {
+#if 0
+ ICL_DEBUG("not enough data; have %zd, "
+ "need %zd", available,
+ ic->ic_receive_len);
+#endif
+ return;
+ }
+
+ /* NULL means "PDU not complete yet" or "connection failed". */
+ response = icl_conn_receive_pdu(ic, &available);
+ if (response == NULL)
+ continue;
+
+ if (response->ip_ahs_len > 0) {
+ ICL_WARN("received PDU with unsupported "
+ "AHS; opcode 0x%x; dropping connection",
+ response->ip_bhs->bhs_opcode);
+ icl_pdu_free(response);
+ icl_conn_fail(ic);
+ return;
+ }
+
+ /* Hand the complete PDU to the connection's receive callback. */
+ (ic->ic_receive)(response);
+ }
+}
+
+/*
+ * Body of the per-connection receive kthread; "arg" is the struct
+ * icl_conn.  Sets ic_receive_running for its lifetime and exits once
+ * ic_disconnecting is set.  Each iteration samples the amount of data in
+ * the receive socket buffer, sleeps on ic_receive_cv if that is less
+ * than ic_receive_len, and then lets icl_conn_receive_pdus() process it.
+ */
+static void
+icl_receive_thread(void *arg)
+{
+ struct icl_conn *ic;
+ size_t available;
+ struct socket *so;
+
+ ic = arg;
+ so = ic->ic_socket;
+
+ ICL_CONN_LOCK(ic);
+ ic->ic_receive_running = true;
+ ICL_CONN_UNLOCK(ic);
+
+ for (;;) {
+ if (ic->ic_disconnecting) {
+ //ICL_DEBUG("terminating");
+ ICL_CONN_LOCK(ic);
+ ic->ic_receive_running = false;
+ ICL_CONN_UNLOCK(ic);
+ kthread_exit();
+ return;
+ }
+
+ SOCKBUF_LOCK(&so->so_rcv);
+ available = so->so_rcv.sb_cc;
+ if (available < ic->ic_receive_len) {
+ /* Raise the low watermark to the amount being waited for. */
+ so->so_rcv.sb_lowat = ic->ic_receive_len;
+ cv_wait(&ic->ic_receive_cv, &so->so_rcv.sb_mtx);
+ }
+ SOCKBUF_UNLOCK(&so->so_rcv);
+
+ /*
+ * "available" is not re-read after the wait; a stale, too small
+ * value makes icl_conn_receive_pdus() return right away and the
+ * next iteration samples the buffer again.
+ */
+ icl_conn_receive_pdus(ic, available);
+ }
+}
+
+/*
+ * Receive-side socket upcall; "arg" is the struct icl_conn.  Wakes up the
+ * receive thread sleeping on ic_receive_cv.
+ */
+static int
+icl_soupcall_receive(struct socket *so, void *arg, int waitflag)
+{
+	struct icl_conn *conn = arg;
+
+	cv_signal(&conn->ic_receive_cv);
+
+	return (SU_OK);
+}
+
+/*
+ * Finalize a PDU and hand it to the socket.
+ *
+ * Stores the data segment length in the BHS, appends the header digest,
+ * padding and data digest as required by the connection settings, joins
+ * everything into a single mbuf chain and passes it to sosend().  Must be
+ * called with the connection lock held.
+ *
+ * Returns 0 on success, ENOMEM when a digest or the padding cannot be
+ * appended, or the error reported by sosend().  The PDU structure itself
+ * is not freed; mbuf chains already handed over are cleared from it.
+ */
+static int
+icl_pdu_send(struct icl_pdu *request)
+{
+	size_t padding, pdu_len;
+	uint32_t digest, zero = 0;
+	int error, ok;
+	struct socket *so;
+	struct icl_conn *ic;
+
+	ic = request->ip_conn;
+	so = request->ip_conn->ic_socket;
+
+	ICL_CONN_LOCK_ASSERT(ic);
+
+	icl_pdu_set_data_segment_length(request, request->ip_data_len);
+
+	/* Must be computed before ip_data_mbuf gets merged into the BHS. */
+	pdu_len = icl_pdu_size(request);
+
+	if (ic->ic_header_crc32c) {
+		digest = icl_mbuf_to_crc32c(request->ip_bhs_mbuf);
+		ok = m_append(request->ip_bhs_mbuf, sizeof(digest),
+		    (void *)&digest);
+		if (ok != 1) {
+			ICL_WARN("failed to append header digest");
+			return (ENOMEM);
+		}
+	}
+
+	if (request->ip_data_len != 0) {
+		padding = icl_pdu_padding(request);
+		if (padding > 0) {
+			ok = m_append(request->ip_data_mbuf, padding,
+			    (void *)&zero);
+			if (ok != 1) {
+				ICL_WARN("failed to append padding");
+				return (ENOMEM);
+			}
+		}
+
+		if (ic->ic_data_crc32c) {
+			/* The data digest covers the padding as well. */
+			digest = icl_mbuf_to_crc32c(request->ip_data_mbuf);
+
+			ok = m_append(request->ip_data_mbuf, sizeof(digest),
+			    (void *)&digest);
+			if (ok != 1) {
+				ICL_WARN("failed to append data digest");
+				return (ENOMEM);
+			}
+		}
+
+		m_cat(request->ip_bhs_mbuf, request->ip_data_mbuf);
+		request->ip_data_mbuf = NULL;
+	}
+
+	request->ip_bhs_mbuf->m_pkthdr.len = pdu_len;
+
+	error = sosend(so, NULL, NULL, request->ip_bhs_mbuf,
+	    NULL, MSG_DONTWAIT, curthread);
+	request->ip_bhs_mbuf = NULL; /* Sosend consumes the mbuf. */
+	if (error != 0) {
+		ICL_DEBUG("sosend error %d", error);
+		return (error);
+	}
+
+	return (0);
+}
+
+/*
+ * Send as many queued PDUs as fit into the socket's send buffer.
+ *
+ * Must be called with the connection lock held.  Stops when the queue is
+ * empty, when the connection is disconnecting, when the next PDU does not
+ * fit (the send low watermark is then set to that PDU's size), or when
+ * sending fails, in which case the connection is failed.  Every PDU taken
+ * off the queue is freed here, whether or not it could be sent.
+ */
+static void
+icl_conn_send_pdus(struct icl_conn *ic)
+{
+	struct icl_pdu *request;
+	struct socket *so;
+	size_t available, size;
+	int error;
+
+	ICL_CONN_LOCK_ASSERT(ic);
+
+	so = ic->ic_socket;
+
+	SOCKBUF_LOCK(&so->so_snd);
+	available = sbspace(&so->so_snd);
+	SOCKBUF_UNLOCK(&so->so_snd);
+
+	while (!TAILQ_EMPTY(&ic->ic_to_send)) {
+		if (ic->ic_disconnecting)
+			return;
+
+		request = TAILQ_FIRST(&ic->ic_to_send);
+		size = icl_pdu_size(request);
+		if (available < size) {
+			/*
+			 * Set the low watermark on the socket,
+			 * to avoid waking up until there is enough
+			 * space.
+			 */
+			SOCKBUF_LOCK(&so->so_snd);
+			so->so_snd.sb_lowat = size;
+			SOCKBUF_UNLOCK(&so->so_snd);
+			ICL_DEBUG("no space to send; "
+			    "have %zd, need %zd",
+			    available, size);
+			return;
+		}
+		available -= size;
+		TAILQ_REMOVE(&ic->ic_to_send, request, ip_next);
+		error = icl_pdu_send(request);
+		if (error != 0) {
+			ICL_DEBUG("failed to send PDU; "
+			    "dropping connection");
+			/*
+			 * The PDU is off the queue already, so nobody else
+			 * will free it; release it here to avoid a leak.
+			 */
+			icl_pdu_free(request);
+			icl_conn_fail(ic);
+			return;
+		}
+		icl_pdu_free(request);
+	}
+}
+
+/*
+ * Body of the per-connection send kthread; "arg" is the struct icl_conn.
+ * Sets ic_send_running for its lifetime and exits once ic_disconnecting
+ * is set.  Each iteration sleeps on ic_send_cv while the send queue is
+ * empty and then calls icl_conn_send_pdus() with the connection lock
+ * held.
+ */
+static void
+icl_send_thread(void *arg)
+{
+ struct icl_conn *ic;
+
+ ic = arg;
+
+ ICL_CONN_LOCK(ic);
+ ic->ic_send_running = true;
+ ICL_CONN_UNLOCK(ic);
+
+ for (;;) {
+ ICL_CONN_LOCK(ic);
+ if (ic->ic_disconnecting) {
+ //ICL_DEBUG("terminating");
+ ic->ic_send_running = false;
+ ICL_CONN_UNLOCK(ic);
+ kthread_exit();
+ return;
+ }
+ /* Nothing queued: wait for icl_pdu_queue() or a socket upcall. */
+ if (TAILQ_EMPTY(&ic->ic_to_send))
+ cv_wait(&ic->ic_send_cv, &ic->ic_lock);
+ icl_conn_send_pdus(ic);
+ ICL_CONN_UNLOCK(ic);
+ }
+}
+
+/*
+ * Send-side socket upcall; "arg" is the struct icl_conn.  Wakes up the
+ * send thread sleeping on ic_send_cv.
+ */
+static int
+icl_soupcall_send(struct socket *so, void *arg, int waitflag)
+{
+	struct icl_conn *conn = arg;
+
+	cv_signal(&conn->ic_send_cv);
+
+	return (SU_OK);
+}
+
+/*
+ * Copy "len" bytes starting at "addr" into freshly allocated mbufs and
+ * append them to the PDU's data segment, growing ip_data_len to match.
+ * "flags" is passed to the mbuf allocator; "len" must be nonzero.
+ * Returns 0 on success or ENOMEM when the mbufs cannot be allocated.
+ */
+int
+icl_pdu_append_data(struct icl_pdu *request, const void *addr, size_t len, int flags)
+{
+	struct mbuf *chain, *cur;
+	size_t chunk, done;
+
+	KASSERT(len > 0, ("len == 0"));
+
+	chain = m_getm2(NULL, len, flags, MT_DATA, M_PKTHDR);
+	if (chain == NULL) {
+		ICL_WARN("failed to allocate mbuf for %zd bytes", len);
+		return (ENOMEM);
+	}
+
+	/* Fill each mbuf of the new chain up to its trailing space. */
+	done = 0;
+	cur = chain;
+	while (cur != NULL) {
+		chunk = min(M_TRAILINGSPACE(cur), len - done);
+		memcpy(mtod(cur, char *), (const char *)addr + done, chunk);
+		cur->m_len = chunk;
+		done += chunk;
+		cur = cur->m_next;
+	}
+	KASSERT(done == len, ("%s: off != len", __func__));
+
+	if (request->ip_data_mbuf != NULL) {
+		m_cat(request->ip_data_mbuf, chain);
+		request->ip_data_len += len;
+	} else {
+		request->ip_data_mbuf = chain;
+		request->ip_data_len = len;
+	}
+
+	return (0);
+}
+
+/*
+ * Copy "len" bytes of the PDU's data segment, starting at offset "off",
+ * into the buffer at "addr".
+ */
+void
+icl_pdu_get_data(struct icl_pdu *ip, size_t off, void *addr, size_t len)
+{
+	struct mbuf *data = ip->ip_data_mbuf;
+
+	m_copydata(data, off, len, addr);
+}
+
+/*
+ * Queue a PDU for transmission and wake up the send thread.
+ *
+ * Ownership of "ip" passes to the connection in every case: the send path
+ * frees it after sending, and it is freed right here when the connection
+ * is disconnecting or has no socket, since the function gives the caller
+ * no way to learn that the PDU was not queued.
+ */
+void
+icl_pdu_queue(struct icl_pdu *ip)
+{
+	struct icl_conn *ic;
+
+	ic = ip->ip_conn;
+
+	ICL_CONN_LOCK(ic);
+	if (ic->ic_disconnecting || ic->ic_socket == NULL) {
+		ICL_DEBUG("icl_pdu_queue on closed connection");
+		ICL_CONN_UNLOCK(ic);
+		/* Nobody will ever send this PDU; don't leak it. */
+		icl_pdu_free(ip);
+		return;
+	}
+	TAILQ_INSERT_TAIL(&ic->ic_to_send, ip, ip_next);
+	ICL_CONN_UNLOCK(ic);
+	cv_signal(&ic->ic_send_cv);
+}
+
+/*
+ * Allocate and initialize a connection object: empty send queue, lock,
+ * condition variables, zero outstanding PDUs and the default maximum
+ * data segment length.  The allocation uses M_WAITOK.  The connection is
+ * counted in icl_ncons.
+ */
+struct icl_conn *
+icl_conn_new(void)
+{
+	struct icl_conn *conn;
+
+	refcount_acquire(&icl_ncons);
+
+	conn = uma_zalloc(icl_conn_zone, M_WAITOK | M_ZERO);
+
+	mtx_init(&conn->ic_lock, "icl_lock", NULL, MTX_DEF);
+	cv_init(&conn->ic_send_cv, "icl_tx");
+	cv_init(&conn->ic_receive_cv, "icl_rx");
+	TAILQ_INIT(&conn->ic_to_send);
+	refcount_init(&conn->ic_outstanding_pdus, 0);
+	conn->ic_max_data_segment_length = ICL_MAX_DATA_SEGMENT_LENGTH;
+
+	return (conn);
+}
+
+/*
+ * Destroy a connection object: tear down its lock and condition
+ * variables, return it to its zone and drop it from icl_ncons.
+ */
+void
+icl_conn_free(struct icl_conn *ic)
+{
+
+	mtx_destroy(&ic->ic_lock);
+	cv_destroy(&ic->ic_send_cv);
+	cv_destroy(&ic->ic_receive_cv);
+
+	uma_zfree(icl_conn_zone, ic);
+
+	refcount_release(&icl_ncons);
+}
+
+/*
+ * Start PDU processing on a connection whose ic_socket has been set:
+ * reset the receive state machine, size the socket buffers, set
+ * TCP_NODELAY, start the send and receive threads and register the
+ * socket upcalls.
+ *
+ * Returns 0 on success, EINVAL when the connection has no socket, or the
+ * error from the failing step; after a failing step the connection is
+ * closed with icl_conn_close().
+ */
+static int
+icl_conn_start(struct icl_conn *ic)
+{
+ size_t bufsize;
+ struct sockopt opt;
+ int error, one = 1;
+
+ ICL_CONN_LOCK(ic);
+
+ /*
+ * XXX: Ugly hack.
+ */
+ if (ic->ic_socket == NULL) {
+ ICL_CONN_UNLOCK(ic);
+ return (EINVAL);
+ }
+
+ /* The receiver starts out expecting a Basic Header Segment. */
+ ic->ic_receive_state = ICL_CONN_STATE_BHS;
+ ic->ic_receive_len = sizeof(struct iscsi_bhs);
+ ic->ic_disconnecting = false;
+
+ ICL_CONN_UNLOCK(ic);
+
+ /*
+ * Use max available sockbuf size for sending. Do it manually
+ * instead of sbreserve(9) to work around resource limits.
+ *
+ * XXX: This kind of sucks. On one hand, we don't currently support
+ * sending a part of data segment; we always do it in one piece,
+ * so we have to make sure it can fit in the socket buffer.
+ * Once I've implemented partial send, we'll get rid of this
+ * and use autoscaling.
+ */
+ bufsize = (sizeof(struct iscsi_bhs) +
+ ic->ic_max_data_segment_length) * 8;
+ error = soreserve(ic->ic_socket, bufsize, bufsize);
+ if (error != 0) {
+ ICL_WARN("soreserve failed with error %d", error);
+ icl_conn_close(ic);
+ return (error);
+ }
+
+ /*
+ * Disable Nagle.
+ */
+ bzero(&opt, sizeof(opt));
+ opt.sopt_dir = SOPT_SET;
+ opt.sopt_level = IPPROTO_TCP;
+ opt.sopt_name = TCP_NODELAY;
+ opt.sopt_val = &one;
+ opt.sopt_valsize = sizeof(one);
+ error = sosetopt(ic->ic_socket, &opt);
+ if (error != 0) {
+ /*
+ * NOTE(review): the option is being set to 1 here, so the
+ * "disabling" wording of this message looks inverted -- confirm.
+ */
+ ICL_WARN("disabling TCP_NODELAY failed with error %d", error);
+ icl_conn_close(ic);
+ return (error);
+ }
+
+ /*
+ * Start threads.
+ */
+ error = kthread_add(icl_send_thread, ic, NULL, NULL, 0, 0, "icltx");
+ if (error != 0) {
+ ICL_WARN("kthread_add(9) failed with error %d", error);
+ icl_conn_close(ic);
+ return (error);
+ }
+
+ error = kthread_add(icl_receive_thread, ic, NULL, NULL, 0, 0, "iclrx");
+ if (error != 0) {
+ ICL_WARN("kthread_add(9) failed with error %d", error);
+ icl_conn_close(ic);
+ return (error);
+ }
+
+ /*
+ * Register socket upcall, to get notified about incoming PDUs
+ * and free space to send outgoing ones.
+ */
+ SOCKBUF_LOCK(&ic->ic_socket->so_snd);
+ soupcall_set(ic->ic_socket, SO_SND, icl_soupcall_send, ic);
+ SOCKBUF_UNLOCK(&ic->ic_socket->so_snd);
+ SOCKBUF_LOCK(&ic->ic_socket->so_rcv);
+ soupcall_set(ic->ic_socket, SO_RCV, icl_soupcall_receive, ic);
+ SOCKBUF_UNLOCK(&ic->ic_socket->so_rcv);
+
+ return (0);
+}
+
+/*
+ * Take over the socket behind file descriptor "fd" of the current thread
+ * and start running the connection on it.
+ *
+ * Returns the fget() error when the descriptor cannot be looked up,
+ * EINVAL when it is not a SOCK_STREAM socket, EBUSY when the connection
+ * already has a socket, and otherwise the result of icl_conn_start().
+ */
+int
+icl_conn_handoff(struct icl_conn *ic, int fd)
+{
+ struct file *fp;
+ struct socket *so;
+ cap_rights_t rights;
+ int error;
+
+ /*
+ * Steal the socket from userland.
+ */
+ error = fget(curthread, fd,
+ cap_rights_init(&rights, CAP_SOCK_CLIENT), &fp);
+ if (error != 0)
+ return (error);
+ if (fp->f_type != DTYPE_SOCKET) {
+ fdrop(fp, curthread);
+ return (EINVAL);
+ }
+ so = fp->f_data;
+ if (so->so_type != SOCK_STREAM) {
+ fdrop(fp, curthread);
+ return (EINVAL);
+ }
+
+ ICL_CONN_LOCK(ic);
+
+ if (ic->ic_socket != NULL) {
+ ICL_CONN_UNLOCK(ic);
+ fdrop(fp, curthread);
+ return (EBUSY);
+ }
+
+ /*
+ * Move the socket into the connection and detach it from the file:
+ * the file keeps existing, but with badfileops and no data.
+ */
+ ic->ic_socket = fp->f_data;
+ fp->f_ops = &badfileops;
+ fp->f_data = NULL;
+ fdrop(fp, curthread);
+ ICL_CONN_UNLOCK(ic);
+
+ error = icl_conn_start(ic);
+
+ return (error);
+}
+
+/*
+ * Shut down both directions of the connection's socket.  Does nothing
+ * when the connection has no socket.
+ */
+void
+icl_conn_shutdown(struct icl_conn *ic)
+{
+	bool attached;
+
+	ICL_CONN_LOCK(ic);
+	attached = (ic->ic_socket != NULL);
+	ICL_CONN_UNLOCK(ic);
+
+	if (attached)
+		soshutdown(ic->ic_socket, SHUT_RDWR);
+}
+
+/*
+ * Close the connection: ask the send and receive threads to terminate
+ * and wait for them, close the socket, and free the partially received
+ * PDU and everything still on the send queue.  Does nothing when the
+ * connection has no socket.
+ */
+void
+icl_conn_close(struct icl_conn *ic)
+{
+ struct icl_pdu *pdu;
+
+ ICL_CONN_LOCK(ic);
+ if (ic->ic_socket == NULL) {
+ ICL_CONN_UNLOCK(ic);
+ return;
+ }
+
+ ic->ic_disconnecting = true;
+
+ /*
+ * Wake up the threads, so they can properly terminate.
+ */
+ cv_signal(&ic->ic_receive_cv);
+ cv_signal(&ic->ic_send_cv);
+ /*
+ * Poll until both threads have cleared their "running" flags,
+ * dropping the lock and signalling again on every round.
+ */
+ while (ic->ic_receive_running || ic->ic_send_running) {
+ //ICL_DEBUG("waiting for send/receive threads to terminate");
+ ICL_CONN_UNLOCK(ic);
+ cv_signal(&ic->ic_receive_cv);
+ cv_signal(&ic->ic_send_cv);
+ pause("icl_close", 1 * hz);
+ ICL_CONN_LOCK(ic);
+ }
+ //ICL_DEBUG("send/receive threads terminated");
+
+ soclose(ic->ic_socket);
+ ic->ic_socket = NULL;
+
+ /* A PDU the receiver was still assembling is owned by the connection. */
+ if (ic->ic_receive_pdu != NULL) {
+ //ICL_DEBUG("freeing partially received PDU");
+ icl_pdu_free(ic->ic_receive_pdu);
+ ic->ic_receive_pdu = NULL;
+ }
+
+ /*
+ * Remove any outstanding PDUs from the send queue.
+ */
+ while (!TAILQ_EMPTY(&ic->ic_to_send)) {
+ pdu = TAILQ_FIRST(&ic->ic_to_send);
+ TAILQ_REMOVE(&ic->ic_to_send, pdu, ip_next);
+ icl_pdu_free(pdu);
+ }
+
+ KASSERT(TAILQ_EMPTY(&ic->ic_to_send),
+ ("destroying session with non-empty send queue"));
+ /*
+ * XXX
+ */
+#if 0
+ KASSERT(ic->ic_outstanding_pdus == 0,
+ ("destroying session with %d outstanding PDUs",
+ ic->ic_outstanding_pdus));
+#endif
+ ICL_CONN_UNLOCK(ic);
+}
+
+/*
+ * Report whether the connection is usable: true only when it has a
+ * socket and that socket has no pending error.
+ */
+bool
+icl_conn_connected(struct icl_conn *ic)
+{
+	bool up;
+
+	ICL_CONN_LOCK(ic);
+	up = (ic->ic_socket != NULL && ic->ic_socket->so_error == 0);
+	ICL_CONN_UNLOCK(ic);
+
+	return (up);
+}
+
+#ifdef ICL_KERNEL_PROXY
+/*
+ * Attach an in-kernel socket to the connection and start running it.
+ * Returns EINVAL for anything but a SOCK_STREAM socket, EBUSY when the
+ * connection already has a socket, and otherwise the result of
+ * icl_conn_start().
+ */
+int
+icl_conn_handoff_sock(struct icl_conn *ic, struct socket *so)
+{
+	bool busy;
+
+	if (so->so_type != SOCK_STREAM)
+		return (EINVAL);
+
+	ICL_CONN_LOCK(ic);
+	busy = (ic->ic_socket != NULL);
+	if (!busy)
+		ic->ic_socket = so;
+	ICL_CONN_UNLOCK(ic);
+
+	if (busy)
+		return (EBUSY);
+
+	return (icl_conn_start(ic));
+}
+#endif /* ICL_KERNEL_PROXY */
+
+/*
+ * Module unload handler: destroy the UMA zones, unless connections still
+ * exist, in which case EBUSY is returned and nothing is torn down.
+ */
+static int
+icl_unload(void)
+{
+
+	if (icl_ncons == 0) {
+		uma_zdestroy(icl_conn_zone);
+		uma_zdestroy(icl_pdu_zone);
+		return (0);
+	}
+
+	return (EBUSY);
+}
+
+/*
+ * Module load handler: reset the connection counter and create the UMA
+ * zones used for connections and PDUs.
+ */
+static void
+icl_load(void)
+{
+
+	refcount_init(&icl_ncons, 0);
+
+	icl_conn_zone = uma_zcreate("icl_conn",
+	    sizeof(struct icl_conn), NULL, NULL, NULL, NULL,
+	    UMA_ALIGN_PTR, UMA_ZONE_NOFREE);
+	icl_pdu_zone = uma_zcreate("icl_pdu",
+	    sizeof(struct icl_pdu), NULL, NULL, NULL, NULL,
+	    UMA_ALIGN_PTR, UMA_ZONE_NOFREE);
+}
+
+/*
+ * Module event handler: dispatches MOD_LOAD and MOD_UNLOAD to icl_load()
+ * and icl_unload(); every other event is rejected with EINVAL.
+ */
+static int
+icl_modevent(module_t mod, int what, void *arg)
+{
+
+	if (what == MOD_LOAD) {
+		icl_load();
+		return (0);
+	}
+	if (what == MOD_UNLOAD)
+		return (icl_unload());
+
+	return (EINVAL);
+}
+
+/*
+ * Module registration: the "icl" module, with icl_modevent() as its event
+ * handler and no private data, declared at version 1.
+ */
+moduledata_t icl_data = {
+ "icl",
+ icl_modevent,
+ 0
+};
+
+DECLARE_MODULE(icl, icl_data, SI_SUB_DRIVERS, SI_ORDER_FIRST);
+MODULE_VERSION(icl, 1);
diff --git a/sys/dev/iscsi/icl.h b/sys/dev/iscsi/icl.h
new file mode 100644
index 000000000000..87a565269562
--- /dev/null
+++ b/sys/dev/iscsi/icl.h
@@ -0,0 +1,151 @@
+/*-
+ * Copyright (c) 2012 The FreeBSD Foundation
+ * All rights reserved.
+ *
+ * This software was developed by Edward Tomasz Napierala under sponsorship
+ * from the FreeBSD Foundation.
+ *
+ * Redistribution and use in source and binary forms, with or without
+ * modification, are permitted provided that the following conditions
+ * are met:
+ * 1. Redistributions of source code must retain the above copyright
+ * notice, this list of conditions and the following disclaimer.
+ * 2. Redistributions in binary form must reproduce the above copyright
+ * notice, this list of conditions and the following disclaimer in the
+ * documentation and/or other materials provided with the distribution.
+ *
+ * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
+ * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
+ * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
+ * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
+ * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
+ * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
+ * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
+ * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
+ * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
+ * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
+ * SUCH DAMAGE.
+ *
+ * $FreeBSD$
+ */
+
+#ifndef ICL_H
+#define ICL_H
+
+/*
+ * iSCSI Common Layer. It's used by both the initiator and target to send
+ * and receive iSCSI PDUs.
+ */
+
+struct icl_conn;
+
+/*
+ * A single iSCSI PDU.  PDUs are linked into queues (for example a
+ * connection's ic_to_send) through ip_next.
+ *
+ * NOTE(review): the *_mbuf / *_len pairs presumably describe the BHS, AHS
+ * and data segments of the PDU - confirm against icl.c.
+ */
+struct icl_pdu {
+ TAILQ_ENTRY(icl_pdu) ip_next;
+ struct icl_conn *ip_conn;
+ struct iscsi_bhs *ip_bhs;
+ struct mbuf *ip_bhs_mbuf;
+ size_t ip_ahs_len;
+ struct mbuf *ip_ahs_mbuf;
+ size_t ip_data_len;
+ struct mbuf *ip_data_mbuf;
+
+ /*
+ * User (initiator or provider) private fields.
+ */
+ uint32_t ip_prv0;
+ uint32_t ip_prv1;
+ uint32_t ip_prv2;
+};
+
+struct icl_pdu *icl_pdu_new_bhs(struct icl_conn *ic, int flags);
+size_t icl_pdu_data_segment_length(const struct icl_pdu *ip);
+int icl_pdu_append_data(struct icl_pdu *ip, const void *addr, size_t len, int flags);
+void icl_pdu_get_data(struct icl_pdu *ip, size_t off, void *addr, size_t len);
+void icl_pdu_queue(struct icl_pdu *ip);
+void icl_pdu_free(struct icl_pdu *ip);
+
+/*
+ * NOTE(review): these look like the values stored in icl_conn's
+ * ic_receive_state, one per PDU segment being received - confirm
+ * against icl.c.
+ */
+#define ICL_CONN_STATE_INVALID 0
+#define ICL_CONN_STATE_BHS 1
+#define ICL_CONN_STATE_AHS 2
+#define ICL_CONN_STATE_HEADER_DIGEST 3
+#define ICL_CONN_STATE_DATA 4
+#define ICL_CONN_STATE_DATA_DIGEST 5
+
+/* 128 KiB. */
+#define ICL_MAX_DATA_SEGMENT_LENGTH (128 * 1024)
+
+/*
+ * Per-connection state shared by the initiator and the target.
+ *
+ * ic_socket is NULL while no socket is attached; ic_to_send is the queue
+ * of PDUs waiting to be sent.  ic_receive and ic_error are callbacks
+ * supplied by the user of the connection.
+ *
+ * NOTE(review): ic_lock is presumably what ICL_CONN_LOCK() takes, and the
+ * *_running / *_cv pairs presumably belong to the send and receive
+ * threads - confirm against icl.c.
+ */
+struct icl_conn {
+ struct mtx ic_lock;
+ struct socket *ic_socket;
+ volatile u_int ic_outstanding_pdus;
+ TAILQ_HEAD(, icl_pdu) ic_to_send;
+ size_t ic_receive_len;
+ int ic_receive_state;
+ struct icl_pdu *ic_receive_pdu;
+ struct cv ic_send_cv;
+ struct cv ic_receive_cv;
+ bool ic_header_crc32c;
+ bool ic_data_crc32c;
+ bool ic_send_running;
+ bool ic_receive_running;
+ size_t ic_max_data_segment_length;
+ bool ic_disconnecting;
+ bool ic_iser;
+
+ void (*ic_receive)(struct icl_pdu *);
+ void (*ic_error)(struct icl_conn *);
+
+ /*
+ * User (initiator or provider) private fields.
+ */
+ void *ic_prv0;
+};
+
+struct icl_conn *icl_conn_new(void);
+void icl_conn_free(struct icl_conn *ic);
+int icl_conn_handoff(struct icl_conn *ic, int fd);
+void icl_conn_shutdown(struct icl_conn *ic);
+void icl_conn_close(struct icl_conn *ic);
+bool icl_conn_connected(struct icl_conn *ic);
+
+#ifdef ICL_KERNEL_PROXY
+
+struct sockaddr;
+struct icl_listen;
+
+/*
+ * One listening socket owned by an icl_listen.  ils_running is set by the
+ * accept thread serving the socket; ils_disconnecting is set by
+ * icl_listen_free() to ask that thread to exit.
+ */
+struct icl_listen_sock {
+ TAILQ_ENTRY(icl_listen_sock) ils_next;
+ struct icl_listen *ils_listen;
+ struct socket *ils_socket;
+ bool ils_running;
+ bool ils_disconnecting;
+};
+
+/*
+ * A set of listening sockets.  il_lock is held around changes to
+ * il_sockets; il_accept is called with every accepted socket.
+ */
+struct icl_listen {
+ TAILQ_HEAD(, icl_listen_sock) il_sockets;
+ struct sx il_lock;
+ void (*il_accept)(struct socket *);
+};
+
+/*
+ * Initiator part.
+ */
+int icl_conn_connect(struct icl_conn *ic, bool rdma,
+ int domain, int socktype, int protocol,
+ struct sockaddr *from_sa, struct sockaddr *to_sa);
+/*
+ * Target part.
+ */
+struct icl_listen *icl_listen_new(void (*accept_cb)(struct socket *));
+void icl_listen_free(struct icl_listen *il);
+int icl_listen_add(struct icl_listen *il, bool rdma, int domain,
+ int socktype, int protocol, struct sockaddr *sa);
+int icl_listen_remove(struct icl_listen *il, struct sockaddr *sa);
+
+/*
+ * This one is not a public API; only to be used by icl_proxy.c.
+ */
+int icl_conn_handoff_sock(struct icl_conn *ic, struct socket *so);
+
+#endif /* ICL_KERNEL_PROXY */
+
+#endif /* !ICL_H */
diff --git a/sys/dev/iscsi/icl_proxy.c b/sys/dev/iscsi/icl_proxy.c
new file mode 100644
index 000000000000..41e64c352a9e
--- /dev/null
+++ b/sys/dev/iscsi/icl_proxy.c
@@ -0,0 +1,397 @@
+/*-
+ * Copyright (c) 2012 The FreeBSD Foundation
+ * All rights reserved.
+ *
+ * This software was developed by Edward Tomasz Napierala under sponsorship
+ * from the FreeBSD Foundation.
+ *
+ * Redistribution and use in source and binary forms, with or without
+ * modification, are permitted provided that the following conditions
+ * are met:
+ * 1. Redistributions of source code must retain the above copyright
+ * notice, this list of conditions and the following disclaimer.
+ * 2. Redistributions in binary form must reproduce the above copyright
+ * notice, this list of conditions and the following disclaimer in the
+ * documentation and/or other materials provided with the distribution.
+ *
+ * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
+ * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
+ * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
+ * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
+ * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
+ * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
+ * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
+ * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
+ * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
+ * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
+ * SUCH DAMAGE.
+ *
+ * $FreeBSD$
+ */
+/*-
+ * Copyright (c) 1982, 1986, 1989, 1990, 1993
+ * The Regents of the University of California. All rights reserved.
+ *
+ * sendfile(2) and related extensions:
+ * Copyright (c) 1998, David Greenman. All rights reserved.
+ *
+ * Redistribution and use in source and binary forms, with or without
+ * modification, are permitted provided that the following conditions
+ * are met:
+ * 1. Redistributions of source code must retain the above copyright
+ * notice, this list of conditions and the following disclaimer.
+ * 2. Redistributions in binary form must reproduce the above copyright
+ * notice, this list of conditions and the following disclaimer in the
+ * documentation and/or other materials provided with the distribution.
+ * 4. Neither the name of the University nor the names of its contributors
+ * may be used to endorse or promote products derived from this software
+ * without specific prior written permission.
+ *
+ * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
+ * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
+ * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
+ * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
+ * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
+ * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
+ * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
+ * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
+ * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
+ * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
+ * SUCH DAMAGE.
+ *
+ * @(#)uipc_syscalls.c 8.4 (Berkeley) 2/21/94
+ */
+
+/*
+ * iSCSI Common Layer, kernel proxy part.
+ */
+
+#ifdef ICL_KERNEL_PROXY
+
+#include <sys/param.h>
+#include <sys/capability.h>
+#include <sys/condvar.h>
+#include <sys/conf.h>
+#include <sys/kernel.h>
+#include <sys/kthread.h>
+#include <sys/malloc.h>
+#include <sys/proc.h>
+#include <sys/socket.h>
+#include <sys/socketvar.h>
+#include <sys/sx.h>
+#include <sys/systm.h>
+#include <netinet/in.h>
+#include <netinet/tcp.h>
+#include <linux/types.h>
+#include <rdma/rdma_cm.h>
+
+#include "icl.h"
+
+static int debug = 1;
+
+/*
+ * Debug message, printed only when the file-local "debug" level is above 1.
+ * The do { } while (0) wrapper makes the macro expand to exactly one
+ * statement, so it is safe in unbraced if/else bodies.
+ */
+#define	ICL_DEBUG(X, ...) \
+	do { \
+		if (debug > 1) { \
+			printf("%s: " X "\n", __func__, ## __VA_ARGS__); \
+		} \
+	} while (0)
+
+/*
+ * Warning message, printed when the file-local "debug" level is above 0.
+ */
+#define	ICL_WARN(X, ...) \
+	do { \
+		if (debug > 0) { \
+			printf("WARNING: %s: " X "\n", \
+			    __func__, ## __VA_ARGS__); \
+		} \
+	} while (0)
+
+static MALLOC_DEFINE(M_ICL_PROXY, "ICL_PROXY", "iSCSI common layer proxy");
+
+#ifdef ICL_RDMA
+static int icl_conn_connect_rdma(struct icl_conn *ic, int domain, int socktype,
+ int protocol, struct sockaddr *from_sa, struct sockaddr *to_sa);
+static int icl_listen_add_rdma(struct icl_listen *il, int domain, int socktype, int protocol,
+ struct sockaddr *sa);
+#endif /* ICL_RDMA */
+
+/*
+ * Create a socket, optionally bind it to from_sa, connect it to to_sa,
+ * wait for the connection attempt to finish and hand the socket over to
+ * the connection.  Returns 0 on success or an errno value; the socket is
+ * closed on every failure path.
+ */
+static int
+icl_conn_connect_tcp(struct icl_conn *ic, int domain, int socktype,
+    int protocol, struct sockaddr *from_sa, struct sockaddr *to_sa)
+{
+	struct socket *so;
+	int error;
+
+	error = socreate(domain, &so, socktype, protocol,
+	    curthread->td_ucred, curthread);
+	if (error != 0)
+		return (error);
+
+	if (from_sa != NULL) {
+		error = sobind(so, from_sa, curthread);
+		if (error != 0) {
+			soclose(so);
+			return (error);
+		}
+	}
+
+	error = soconnect(so, to_sa, curthread);
+	if (error != 0) {
+		soclose(so);
+		return (error);
+	}
+
+	/*
+	 * Sleep until the socket leaves the connecting state, an error is
+	 * posted on it, or the sleep itself fails (e.g. is interrupted).
+	 */
+	SOCK_LOCK(so);
+	while ((so->so_state & SS_ISCONNECTING) && so->so_error == 0) {
+		error = msleep(&so->so_timeo, SOCK_MTX(so), PSOCK | PCATCH,
+		    "icl_connect", 0);
+		if (error != 0)
+			break;
+	}
+	if (error == 0) {
+		/* Pick up and clear the result of the connection attempt. */
+		error = so->so_error;
+		so->so_error = 0;
+	}
+	SOCK_UNLOCK(so);
+
+	if (error != 0) {
+		soclose(so);
+		return (error);
+	}
+
+	error = icl_conn_handoff_sock(ic, so);
+	if (error != 0)
+		soclose(so);
+
+	return (error);
+}
+
+/*
+ * Connect "ic" to to_sa, optionally from from_sa.  TCP is used unless
+ * "rdma" is set; RDMA requests fail with EOPNOTSUPP when the kernel was
+ * built without ICL_RDMA.
+ */
+int
+icl_conn_connect(struct icl_conn *ic, bool rdma, int domain, int socktype,
+    int protocol, struct sockaddr *from_sa, struct sockaddr *to_sa)
+{
+
+	if (!rdma)
+		return (icl_conn_connect_tcp(ic, domain, socktype, protocol,
+		    from_sa, to_sa));
+
+#ifdef ICL_RDMA
+	return (icl_conn_connect_rdma(ic, domain, socktype, protocol,
+	    from_sa, to_sa));
+#else
+	ICL_DEBUG("RDMA not supported");
+	return (EOPNOTSUPP);
+#endif
+}
+
+/*
+ * Allocate an empty listener.  accept_cb is remembered and later called
+ * with every socket accepted on any of the listener's sockets.
+ */
+struct icl_listen *
+icl_listen_new(void (*accept_cb)(struct socket *))
+{
+	struct icl_listen *listener;
+
+	listener = malloc(sizeof(*listener), M_ICL_PROXY, M_WAITOK | M_ZERO);
+	listener->il_accept = accept_cb;
+	sx_init(&listener->il_lock, "icl_listen");
+	TAILQ_INIT(&listener->il_sockets);
+
+	return (listener);
+}
+
+/*
+ * Tear down a listener: for each listening socket wait for its accept
+ * thread to stop, close the socket and free its bookkeeping; then destroy
+ * the listener's lock and free the listener itself.
+ */
+void
+icl_listen_free(struct icl_listen *il)
+{
+	struct icl_listen_sock *ils;
+
+	sx_xlock(&il->il_lock);
+	while (!TAILQ_EMPTY(&il->il_sockets)) {
+		ils = TAILQ_FIRST(&il->il_sockets);
+		while (ils->ils_running) {
+			ICL_DEBUG("waiting for accept thread to terminate");
+			sx_xunlock(&il->il_lock);
+			/* Ask the accept thread to exit and wake it up. */
+			ils->ils_disconnecting = true;
+			wakeup(&ils->ils_socket->so_timeo);
+			pause("icl_unlisten", 1 * hz);
+			sx_xlock(&il->il_lock);
+		}
+
+		TAILQ_REMOVE(&il->il_sockets, ils, ils_next);
+		soclose(ils->ils_socket);
+		free(ils, M_ICL_PROXY);
+	}
+	sx_xunlock(&il->il_lock);
+
+	/* The lock lives inside "il"; destroy it before freeing its memory. */
+	sx_destroy(&il->il_lock);
+	free(il, M_ICL_PROXY);
+}
+
+/*
+ * XXX: Doing accept in a separate thread in each socket might not be the best way
+ * to do stuff, but it's pretty clean and debuggable - and you probably won't
+ * have hundreds of listening sockets anyway.
+ */
+/*
+ * Kernel thread body serving one listening socket ("arg" is its
+ * struct icl_listen_sock).  Loops accepting connections and passes each
+ * accepted socket to the listener's il_accept callback; exits once
+ * ils_disconnecting has been set.
+ */
+static void
+icl_accept_thread(void *arg)
+{
+	struct icl_listen_sock *ils;
+	struct socket *head, *so;
+	struct sockaddr *sa;
+	int error;
+
+	ils = arg;
+	head = ils->ils_socket;
+
+	ils->ils_running = true;
+
+	for (;;) {
+		ACCEPT_LOCK();
+		error = 0;
+		while (TAILQ_EMPTY(&head->so_comp) && head->so_error == 0 &&
+		    ils->ils_disconnecting == false) {
+			if (head->so_rcv.sb_state & SBS_CANTRCVMORE) {
+				head->so_error = ECONNABORTED;
+				break;
+			}
+			error = msleep(&head->so_timeo, &accept_mtx,
+			    PSOCK | PCATCH, "accept", 0);
+			/*
+			 * Leave the wait loop with the accept lock still
+			 * held; the failure is handled below, so the loop
+			 * condition is never re-evaluated unlocked.
+			 */
+			if (error != 0)
+				break;
+		}
+		/*
+		 * Checked after the loop so that a shutdown request made
+		 * before we ever slept is honoured too, instead of falling
+		 * through to an empty completion queue.
+		 */
+		if (ils->ils_disconnecting) {
+			ACCEPT_UNLOCK();
+			ICL_DEBUG("terminating");
+			ils->ils_running = false;
+			kthread_exit();
+			return;
+		}
+		if (error != 0) {
+			ACCEPT_UNLOCK();
+			ICL_WARN("msleep failed with error %d", error);
+			continue;
+		}
+		if (head->so_error) {
+			error = head->so_error;
+			head->so_error = 0;
+			ACCEPT_UNLOCK();
+			ICL_WARN("socket error %d", error);
+			continue;
+		}
+		so = TAILQ_FIRST(&head->so_comp);
+		KASSERT(so != NULL, ("NULL so"));
+		KASSERT(!(so->so_qstate & SQ_INCOMP), ("accept1: so SQ_INCOMP"));
+		KASSERT(so->so_qstate & SQ_COMP, ("accept1: so not SQ_COMP"));
+
+		/*
+		 * Before changing the flags on the socket, we have to bump the
+		 * reference count.  Otherwise, if the protocol calls sofree(),
+		 * the socket will be released due to a zero refcount.
+		 */
+		SOCK_LOCK(so);			/* soref() and so_state update */
+		soref(so);			/* file descriptor reference */
+
+		TAILQ_REMOVE(&head->so_comp, so, so_list);
+		head->so_qlen--;
+		so->so_state |= (head->so_state & SS_NBIO);
+		so->so_qstate &= ~SQ_COMP;
+		so->so_head = NULL;
+
+		SOCK_UNLOCK(so);
+		ACCEPT_UNLOCK();
+
+		sa = NULL;
+		error = soaccept(so, &sa);
+		/* The peer address is not used here; never leak it. */
+		if (sa != NULL)
+			free(sa, M_SONAME);
+		if (error != 0) {
+			ICL_WARN("soaccept error %d", error);
+			soclose(so);
+			/* The socket is gone; do not hand it to the callback. */
+			continue;
+		}
+
+		(ils->ils_listen->il_accept)(so);
+	}
+}
+
+/*
+ * Create a TCP listening socket bound to "sa" (with SO_REUSEADDR set),
+ * start an accept thread for it and add it to the listener.  Returns 0 on
+ * success or an errno value; the socket is closed on every failure path.
+ */
+static int
+icl_listen_add_tcp(struct icl_listen *il, int domain, int socktype, int protocol,
+    struct sockaddr *sa)
+{
+	struct icl_listen_sock *ils;
+	struct socket *so;
+	struct sockopt sopt;
+	int error, one = 1;
+
+	error = socreate(domain, &so, socktype, protocol,
+	    curthread->td_ucred, curthread);
+	if (error != 0) {
+		ICL_WARN("socreate failed with error %d", error);
+		return (error);
+	}
+
+	sopt.sopt_dir = SOPT_SET;
+	sopt.sopt_level = SOL_SOCKET;
+	sopt.sopt_name = SO_REUSEADDR;
+	sopt.sopt_val = &one;
+	sopt.sopt_valsize = sizeof(one);
+	sopt.sopt_td = NULL;
+	error = sosetopt(so, &sopt);
+	if (error != 0) {
+		ICL_WARN("failed to set SO_REUSEADDR with error %d", error);
+		soclose(so);
+		return (error);
+	}
+
+	error = sobind(so, sa, curthread);
+	if (error != 0) {
+		ICL_WARN("sobind failed with error %d", error);
+		soclose(so);
+		return (error);
+	}
+
+	error = solisten(so, -1, curthread);
+	if (error != 0) {
+		ICL_WARN("solisten failed with error %d", error);
+		soclose(so);
+		return (error);
+	}
+
+	ils = malloc(sizeof(*ils), M_ICL_PROXY, M_ZERO | M_WAITOK);
+	ils->ils_listen = il;
+	ils->ils_socket = so;
+	/*
+	 * Mark the accept thread as running before it is created, so that
+	 * icl_listen_free() cannot see ils_running == false and free "ils"
+	 * in the window before the new thread gets to run.
+	 */
+	ils->ils_running = true;
+
+	error = kthread_add(icl_accept_thread, ils, NULL, NULL, 0, 0, "iclacc");
+	if (error != 0) {
+		ICL_WARN("kthread_add failed with error %d", error);
+		soclose(so);
+		free(ils, M_ICL_PROXY);
+
+		return (error);
+	}
+
+	sx_xlock(&il->il_lock);
+	TAILQ_INSERT_TAIL(&il->il_sockets, ils, ils_next);
+	sx_xunlock(&il->il_lock);
+
+	return (0);
+}
+
+/*
+ * Start listening on "sa".  TCP is used unless "rdma" is set; RDMA
+ * requests fail with EOPNOTSUPP when the kernel was built without
+ * ICL_RDMA.
+ */
+int
+icl_listen_add(struct icl_listen *il, bool rdma, int domain, int socktype, int protocol,
+    struct sockaddr *sa)
+{
+
+	if (!rdma)
+		return (icl_listen_add_tcp(il, domain, socktype, protocol, sa));
+
+#ifdef ICL_RDMA
+	return (icl_listen_add_rdma(il, domain, socktype, protocol, sa));
+#else
+	ICL_DEBUG("RDMA not supported");
+	return (EOPNOTSUPP);
+#endif
+}
+
+/*
+ * Not implemented yet: always returns EOPNOTSUPP and touches neither
+ * argument.
+ */
+int
+icl_listen_remove(struct icl_listen *il, struct sockaddr *sa)
+{
+
+ /*
+ * XXX
+ */
+
+ return (EOPNOTSUPP);
+}
+
+#endif /* ICL_KERNEL_PROXY */
diff --git a/sys/dev/iscsi/iscsi.c b/sys/dev/iscsi/iscsi.c
new file mode 100644
index 000000000000..0a956e832a94
--- /dev/null
+++ b/sys/dev/iscsi/iscsi.c
@@ -0,0 +1,2109 @@
+/*-
+ * Copyright (c) 2012 The FreeBSD Foundation
+ * All rights reserved.
+ *
+ * This software was developed by Edward Tomasz Napierala under sponsorship
+ * from the FreeBSD Foundation.
+ *
+ * Redistribution and use in source and binary forms, with or without
+ * modification, are permitted provided that the following conditions
+ * are met:
+ * 1. Redistributions of source code must retain the above copyright
+ * notice, this list of conditions and the following disclaimer.
+ * 2. Redistributions in binary form must reproduce the above copyright
+ * notice, this list of conditions and the following disclaimer in the
+ * documentation and/or other materials provided with the distribution.
+ *
+ * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
+ * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
+ * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
+ * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
+ * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
+ * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
+ * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
+ * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
+ * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
+ * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
+ * SUCH DAMAGE.
+ *
+ * $FreeBSD$
+ */
+
+#include <sys/param.h>
+#include <sys/condvar.h>
+#include <sys/conf.h>
+#include <sys/eventhandler.h>
+#include <sys/file.h>
+#include <sys/kernel.h>
+#include <sys/kthread.h>
+#include <sys/lock.h>
+#include <sys/malloc.h>
+#include <sys/mutex.h>
+#include <sys/module.h>
+#include <sys/sysctl.h>
+#include <sys/systm.h>
+#include <sys/sx.h>
+#include <vm/uma.h>
+
+#include <cam/cam.h>
+#include <cam/cam_ccb.h>
+#include <cam/cam_xpt.h>
+#include <cam/cam_debug.h>
+#include <cam/cam_sim.h>
+#include <cam/cam_xpt_sim.h>
+#include <cam/cam_xpt_periph.h>
+#include <cam/cam_periph.h>
+#include <cam/scsi/scsi_all.h>
+#include <cam/scsi/scsi_message.h>
+
+#include "iscsi_ioctl.h"
+#include "iscsi.h"
+#include "icl.h"
+#include "iscsi_proto.h"
+
+#ifdef ICL_KERNEL_PROXY
+#include <sys/socketvar.h>
+#endif
+
+/*
+ * XXX: This is global so the iscsi_unload() can access it.
+ * Think about how to do this properly.
+ */
+static struct iscsi_softc *sc;
+
+/*
+ * Knobs under kern.iscsi.  Each one is declared both as a loader tunable
+ * and as a read-write sysctl backed by the same static variable.
+ */
+SYSCTL_NODE(_kern, OID_AUTO, iscsi, CTLFLAG_RD, 0, "iSCSI initiator");
+/* Verbosity: above 0 enables warnings, above 1 also enables debug output. */
+static int debug = 1;
+TUNABLE_INT("kern.iscsi.debug", &debug);
+SYSCTL_INT(_kern_iscsi, OID_AUTO, debug, CTLFLAG_RW,
+ &debug, 2, "Enable debug messages");
+static int ping_timeout = 5;
+TUNABLE_INT("kern.iscsi.ping_timeout", &ping_timeout);
+SYSCTL_INT(_kern_iscsi, OID_AUTO, ping_timeout, CTLFLAG_RW, &ping_timeout,
+ 5, "Timeout for ping (NOP-Out) requests, in seconds");
+static int iscsid_timeout = 60;
+TUNABLE_INT("kern.iscsi.iscsid_timeout", &iscsid_timeout);
+SYSCTL_INT(_kern_iscsi, OID_AUTO, iscsid_timeout, CTLFLAG_RW, &iscsid_timeout,
+ 60, "Time to wait for iscsid(8) to handle reconnection, in seconds");
+static int login_timeout = 60;
+TUNABLE_INT("kern.iscsi.login_timeout", &login_timeout);
+SYSCTL_INT(_kern_iscsi, OID_AUTO, login_timeout, CTLFLAG_RW, &login_timeout,
+ 60, "Time to wait for iscsid(8) to finish Login Phase, in seconds");
+static int maxtags = 255;
+TUNABLE_INT("kern.iscsi.maxtags", &maxtags);
+SYSCTL_INT(_kern_iscsi, OID_AUTO, maxtags, CTLFLAG_RW, &maxtags,
+ 255, "Max number of IO requests queued");
+
+static MALLOC_DEFINE(M_ISCSI, "iSCSI", "iSCSI initiator");
+static uma_zone_t iscsi_outstanding_zone;
+
+/*
+ * Map a connection, or a PDU, to the iSCSI session stored in the
+ * connection's private pointer.  The argument is parenthesized so that
+ * any pointer expression can be passed.
+ */
+#define	CONN_SESSION(X)	((struct iscsi_session *)(X)->ic_prv0)
+#define	PDU_SESSION(X)	(CONN_SESSION((X)->ip_conn))
+
+/*
+ * Logging helpers.  Warnings are printed when "debug" is above 0, debug
+ * messages when it is above 1; the SESSION variants prefix the message
+ * with the session's target address and name.  Each macro is wrapped in
+ * do { } while (0) so that it expands to exactly one statement and is
+ * safe in unbraced if/else bodies.
+ */
+#define	ISCSI_DEBUG(X, ...) \
+	do { \
+		if (debug > 1) { \
+			printf("%s: " X "\n", __func__, ## __VA_ARGS__); \
+		} \
+	} while (0)
+
+#define	ISCSI_WARN(X, ...) \
+	do { \
+		if (debug > 0) { \
+			printf("WARNING: %s: " X "\n", \
+			    __func__, ## __VA_ARGS__); \
+		} \
+	} while (0)
+
+#define	ISCSI_SESSION_DEBUG(S, X, ...) \
+	do { \
+		if (debug > 1) { \
+			printf("%s: %s (%s): " X "\n", \
+			    __func__, (S)->is_conf.isc_target_addr, \
+			    (S)->is_conf.isc_target, ## __VA_ARGS__); \
+		} \
+	} while (0)
+
+#define	ISCSI_SESSION_WARN(S, X, ...) \
+	do { \
+		if (debug > 0) { \
+			printf("WARNING: %s (%s): " X "\n", \
+			    (S)->is_conf.isc_target_addr, \
+			    (S)->is_conf.isc_target, ## __VA_ARGS__); \
+		} \
+	} while (0)
+
+/*
+ * Session mutex helpers; the argument is parenthesized so that any
+ * pointer expression can be passed.
+ */
+#define	ISCSI_SESSION_LOCK(X)		mtx_lock(&(X)->is_lock)
+#define	ISCSI_SESSION_UNLOCK(X)		mtx_unlock(&(X)->is_lock)
+#define	ISCSI_SESSION_LOCK_ASSERT(X)	mtx_assert(&(X)->is_lock, MA_OWNED)
+
+static int iscsi_ioctl(struct cdev *dev, u_long cmd, caddr_t arg,
+ int mode, struct thread *td);
+
+/* Character device switch for "iscsi"; only the ioctl entry point is set. */
+static struct cdevsw iscsi_cdevsw = {
+ .d_version = D_VERSION,
+ .d_ioctl = iscsi_ioctl,
+ .d_name = "iscsi",
+};
+
+static void iscsi_pdu_queue_locked(struct icl_pdu *request);
+static void iscsi_pdu_queue(struct icl_pdu *request);
+static void iscsi_pdu_update_statsn(const struct icl_pdu *response);
+static void iscsi_pdu_handle_nop_in(struct icl_pdu *response);
+static void iscsi_pdu_handle_scsi_response(struct icl_pdu *response);
+static void iscsi_pdu_handle_data_in(struct icl_pdu *response);
+static void iscsi_pdu_handle_logout_response(struct icl_pdu *response);
+static void iscsi_pdu_handle_r2t(struct icl_pdu *response);
+static void iscsi_pdu_handle_async_message(struct icl_pdu *response);
+static void iscsi_pdu_handle_reject(struct icl_pdu *response);
+static void iscsi_session_reconnect(struct iscsi_session *is);
+static void iscsi_session_terminate(struct iscsi_session *is);
+static void iscsi_action(struct cam_sim *sim, union ccb *ccb);
+static void iscsi_poll(struct cam_sim *sim);
+static struct iscsi_outstanding *iscsi_outstanding_find(struct iscsi_session *is,
+ uint32_t initiator_task_tag);
+static int iscsi_outstanding_add(struct iscsi_session *is,
+ uint32_t initiator_task_tag, union ccb *ccb);
+static void iscsi_outstanding_remove(struct iscsi_session *is,
+ struct iscsi_outstanding *io);
+
+/*
+ * Fill in the sequence numbers of an outgoing PDU.  Must be called with
+ * the session lock held.
+ *
+ * Returns true when the PDU must be postponed because the session's CmdSN
+ * is past MaxCmdSN and the PDU is not marked immediate; in that case the
+ * PDU is left untouched.  Returns false when the PDU is ready to be sent.
+ */
+static bool
+iscsi_pdu_prepare(struct icl_pdu *request)
+{
+ struct iscsi_session *is;
+ struct iscsi_bhs_scsi_command *bhssc;
+
+ is = PDU_SESSION(request);
+
+ ISCSI_SESSION_LOCK_ASSERT(is);
+
+ /*
+ * We're only using fields common for all the request
+ * (initiator -> target) PDUs.
+ */
+ bhssc = (struct iscsi_bhs_scsi_command *)request->ip_bhs;
+
+ /*
+ * Data-Out PDU does not contain CmdSN.
+ */
+ if (bhssc->bhssc_opcode != ISCSI_BHS_OPCODE_SCSI_DATA_OUT) {
+ /*
+ * NOTE(review): plain integer comparison, so it does not
+ * account for CmdSN wrapping around.
+ */
+ if (is->is_cmdsn > is->is_maxcmdsn &&
+ (bhssc->bhssc_opcode & ISCSI_BHS_OPCODE_IMMEDIATE) == 0) {
+ /*
+ * Current MaxCmdSN prevents us from sending any more
+ * SCSI Command PDUs to the target; postpone the PDU.
+ * It will get resent by either iscsi_pdu_queue(),
+ * or by maintenance thread.
+ */
+#if 0
+ ISCSI_SESSION_DEBUG(is, "postponing send, CmdSN %d, ExpCmdSN %d, MaxCmdSN %d, opcode 0x%x",
+ is->is_cmdsn, is->is_expcmdsn, is->is_maxcmdsn, bhssc->bhssc_opcode);
+#endif
+ return (true);
+ }
+ bhssc->bhssc_cmdsn = htonl(is->is_cmdsn);
+ /* Immediate PDUs carry the current CmdSN without consuming it. */
+ if ((bhssc->bhssc_opcode & ISCSI_BHS_OPCODE_IMMEDIATE) == 0)
+ is->is_cmdsn++;
+ }
+ bhssc->bhssc_expstatsn = htonl(is->is_statsn + 1);
+
+ return (false);
+}
+
+/*
+ * Send as many postponed PDUs as possible, in queue order, stopping at
+ * the first one that still has to wait.  Must be called with the session
+ * lock held.
+ */
+static void
+iscsi_session_send_postponed(struct iscsi_session *is)
+{
+	struct icl_pdu *pending;
+
+	ISCSI_SESSION_LOCK_ASSERT(is);
+
+	for (;;) {
+		pending = TAILQ_FIRST(&is->is_postponed);
+		if (pending == NULL)
+			return;
+		/* Still blocked; everything behind it stays queued as well. */
+		if (iscsi_pdu_prepare(pending))
+			return;
+		TAILQ_REMOVE(&is->is_postponed, pending, ip_next);
+		icl_pdu_queue(pending);
+	}
+}
+
+/*
+ * Queue a PDU for sending, after first flushing whatever postponed PDUs
+ * can go out.  If the PDU itself has to wait it is appended to the
+ * postponed queue instead.  Must be called with the session lock held.
+ */
+static void
+iscsi_pdu_queue_locked(struct icl_pdu *request)
+{
+	struct iscsi_session *is = PDU_SESSION(request);
+
+	ISCSI_SESSION_LOCK_ASSERT(is);
+
+	iscsi_session_send_postponed(is);
+
+	if (iscsi_pdu_prepare(request))
+		TAILQ_INSERT_TAIL(&is->is_postponed, request, ip_next);
+	else
+		icl_pdu_queue(request);
+}
+
+/*
+ * Variant of iscsi_pdu_queue_locked() for callers that do not hold the
+ * session lock: takes it around the call.
+ */
+static void
+iscsi_pdu_queue(struct icl_pdu *request)
+{
+	struct iscsi_session *session = PDU_SESSION(request);
+
+	ISCSI_SESSION_LOCK(session);
+	iscsi_pdu_queue_locked(request);
+	ISCSI_SESSION_UNLOCK(session);
+}
+
+/*
+ * Queue a Logout Request asking to close the session.  Silently does
+ * nothing if the PDU cannot be allocated.  The session lock must be held,
+ * as iscsi_pdu_queue_locked() asserts it.
+ */
+static void
+iscsi_session_logout(struct iscsi_session *is)
+{
+ struct icl_pdu *request;
+ struct iscsi_bhs_logout_request *bhslr;
+
+ request = icl_pdu_new_bhs(is->is_conn, M_NOWAIT);
+ if (request == NULL)
+ return;
+
+ bhslr = (struct iscsi_bhs_logout_request *)request->ip_bhs;
+ bhslr->bhslr_opcode = ISCSI_BHS_OPCODE_LOGOUT_REQUEST;
+ bhslr->bhslr_reason = BHSLR_REASON_CLOSE_SESSION;
+ iscsi_pdu_queue_locked(request);
+}
+
+/*
+ * Complete every outstanding task of the session back to CAM and drop it
+ * from the outstanding list.  With "requeue" set the CCBs are marked
+ * CAM_REQUEUE_REQ, otherwise CAM_REQ_ABORTED.  Must be called with the
+ * session lock held.
+ */
+static void
+iscsi_session_terminate_tasks(struct iscsi_session *is, bool requeue)
+{
+ struct iscsi_outstanding *io, *tmp;
+
+ ISCSI_SESSION_LOCK_ASSERT(is);
+
+ TAILQ_FOREACH_SAFE(io, &is->is_outstanding, io_next, tmp) {
+ if (requeue) {
+ io->io_ccb->ccb_h.status &= ~CAM_SIM_QUEUED;
+ io->io_ccb->ccb_h.status |= CAM_REQUEUE_REQ;
+ } else {
+ io->io_ccb->ccb_h.status = CAM_REQ_ABORTED;
+ }
+
+ /*
+ * Freeze the device queue unless this CCB is already marked as
+ * having frozen it.  In the abort case the status was just
+ * overwritten, so the flag is always clear here.
+ */
+ if ((io->io_ccb->ccb_h.status & CAM_DEV_QFRZN) == 0) {
+ xpt_freeze_devq(io->io_ccb->ccb_h.path, 1);
+ ISCSI_SESSION_DEBUG(is, "freezing devq");
+ }
+ io->io_ccb->ccb_h.status |= CAM_DEV_QFRZN;
+ xpt_done(io->io_ccb);
+ iscsi_outstanding_remove(is, io);
+ }
+}
+
+/*
+ * Reconnect handling, run from the maintenance thread: shut down and
+ * close the connection, freeze the SIM queue, drop postponed PDUs, hand
+ * all outstanding tasks back to CAM for requeueing, reset the session
+ * state flags and signal sc_cv so that iscsid(8) can reconnect.
+ */
+static void
+iscsi_maintenance_thread_reconnect(struct iscsi_session *is)
+{
+ struct icl_pdu *pdu;
+
+ icl_conn_shutdown(is->is_conn);
+ icl_conn_close(is->is_conn);
+
+ ISCSI_SESSION_LOCK(is);
+
+#ifdef ICL_KERNEL_PROXY
+ if (is->is_login_pdu != NULL) {
+ icl_pdu_free(is->is_login_pdu);
+ is->is_login_pdu = NULL;
+ }
+ cv_signal(&is->is_login_cv);
+#endif
+
+ /*
+ * Don't queue any new PDUs.
+ */
+ if (is->is_sim != NULL && is->is_simq_frozen == false) {
+ ISCSI_SESSION_DEBUG(is, "freezing");
+ xpt_freeze_simq(is->is_sim, 1);
+ is->is_simq_frozen = true;
+ }
+
+ /*
+ * Remove postponed PDUs.
+ */
+ while (!TAILQ_EMPTY(&is->is_postponed)) {
+ pdu = TAILQ_FIRST(&is->is_postponed);
+ TAILQ_REMOVE(&is->is_postponed, pdu, ip_next);
+ icl_pdu_free(pdu);
+ }
+
+ /*
+ * Terminate SCSI tasks, asking CAM to requeue them.
+ */
+ //ISCSI_SESSION_DEBUG(is, "terminating tasks");
+ iscsi_session_terminate_tasks(is, true);
+
+ KASSERT(TAILQ_EMPTY(&is->is_outstanding),
+ ("destroying session with active tasks"));
+ KASSERT(TAILQ_EMPTY(&is->is_postponed),
+ ("destroying session with postponed PDUs"));
+
+ /*
+ * Request immediate reconnection from iscsid(8).
+ */
+ //ISCSI_SESSION_DEBUG(is, "waking up iscsid(8)");
+ is->is_connected = false;
+ is->is_reconnecting = false;
+ is->is_login_phase = false;
+ is->is_waiting_for_iscsid = true;
+ strlcpy(is->is_reason, "Waiting for iscsid(8)", sizeof(is->is_reason));
+ is->is_timeout = 0;
+ ISCSI_SESSION_UNLOCK(is);
+ cv_signal(&is->is_softc->sc_cv);
+}
+
+/*
+ * Final teardown of a session, run from the maintenance thread once
+ * is_terminating has been set: unlink the session from the softc, close
+ * the connection, stop the timer, drop postponed PDUs, abort outstanding
+ * tasks, deregister from CAM, free all session resources and signal
+ * sc_cv.
+ */
+static void
+iscsi_maintenance_thread_terminate(struct iscsi_session *is)
+{
+	struct iscsi_softc *sc;
+	struct icl_pdu *pdu;
+
+	sc = is->is_softc;
+	sx_xlock(&sc->sc_lock);
+	TAILQ_REMOVE(&sc->sc_sessions, is, is_next);
+	sx_xunlock(&sc->sc_lock);
+
+	icl_conn_close(is->is_conn);
+
+	/*
+	 * Stop the timer before taking the session lock.  The callout
+	 * handler acquires that lock itself, so draining with the lock
+	 * held could wait forever for a handler blocked on it, and
+	 * callout_drain() may sleep, which is not allowed with a mutex
+	 * held.
+	 */
+	callout_drain(&is->is_callout);
+
+	ISCSI_SESSION_LOCK(is);
+
+	KASSERT(is->is_terminating, ("is_terminating == false"));
+
+#ifdef ICL_KERNEL_PROXY
+	if (is->is_login_pdu != NULL) {
+		icl_pdu_free(is->is_login_pdu);
+		is->is_login_pdu = NULL;
+	}
+	cv_signal(&is->is_login_cv);
+#endif
+
+	/*
+	 * Don't queue any new PDUs.
+	 */
+	if (is->is_sim != NULL && is->is_simq_frozen == false) {
+		ISCSI_SESSION_DEBUG(is, "freezing");
+		xpt_freeze_simq(is->is_sim, 1);
+		is->is_simq_frozen = true;
+	}
+
+	/*
+	 * Remove postponed PDUs.
+	 */
+	while (!TAILQ_EMPTY(&is->is_postponed)) {
+		pdu = TAILQ_FIRST(&is->is_postponed);
+		TAILQ_REMOVE(&is->is_postponed, pdu, ip_next);
+		icl_pdu_free(pdu);
+	}
+
+	/*
+	 * Forcibly terminate SCSI tasks.
+	 */
+	ISCSI_SESSION_DEBUG(is, "terminating tasks");
+	iscsi_session_terminate_tasks(is, false);
+
+	/*
+	 * Deregister CAM.
+	 */
+	if (is->is_sim != NULL) {
+		ISCSI_SESSION_DEBUG(is, "deregistering SIM");
+		xpt_async(AC_LOST_DEVICE, is->is_path, NULL);
+
+		if (is->is_simq_frozen) {
+			xpt_release_simq(is->is_sim, 1);
+			is->is_simq_frozen = false;
+		}
+
+		xpt_free_path(is->is_path);
+		xpt_bus_deregister(cam_sim_path(is->is_sim));
+		cam_sim_free(is->is_sim, TRUE /*free_devq*/);
+		is->is_sim = NULL;
+	}
+
+	KASSERT(TAILQ_EMPTY(&is->is_outstanding),
+	    ("destroying session with active tasks"));
+	KASSERT(TAILQ_EMPTY(&is->is_postponed),
+	    ("destroying session with postponed PDUs"));
+
+	ISCSI_SESSION_UNLOCK(is);
+
+	icl_conn_free(is->is_conn);
+	mtx_destroy(&is->is_lock);
+	cv_destroy(&is->is_maintenance_cv);
+#ifdef ICL_KERNEL_PROXY
+	cv_destroy(&is->is_login_cv);
+#endif
+	ISCSI_SESSION_DEBUG(is, "terminated");
+	free(is, M_ISCSI);
+
+	/*
+	 * The iscsi_unload() routine might be waiting.
+	 */
+	cv_signal(&sc->sc_cv);
+}
+
+/*
+ * Per-session kernel thread ("arg" is the session).  Sleeps on
+ * is_maintenance_cv until there is work, then either performs a
+ * reconnect, performs the final teardown and exits, or tries to send
+ * postponed PDUs.
+ */
+static void
+iscsi_maintenance_thread(void *arg)
+{
+ struct iscsi_session *is;
+
+ is = arg;
+
+ for (;;) {
+ ISCSI_SESSION_LOCK(is);
+ /*
+ * A single wait is enough: every condition is re-checked
+ * below and the outer loop comes back here if none holds.
+ */
+ if (is->is_reconnecting == false &&
+ is->is_terminating == false &&
+ TAILQ_EMPTY(&is->is_postponed))
+ cv_wait(&is->is_maintenance_cv, &is->is_lock);
+
+ if (is->is_reconnecting) {
+ ISCSI_SESSION_UNLOCK(is);
+ iscsi_maintenance_thread_reconnect(is);
+ continue;
+ }
+
+ if (is->is_terminating) {
+ ISCSI_SESSION_UNLOCK(is);
+ /* Frees the session; "is" must not be used afterwards. */
+ iscsi_maintenance_thread_terminate(is);
+ kthread_exit();
+ return;
+ }
+
+ iscsi_session_send_postponed(is);
+ ISCSI_SESSION_UNLOCK(is);
+ }
+}
+
+/*
+ * Ask the maintenance thread to reconnect the session.  Does nothing if
+ * a reconnect has already been requested.
+ */
+static void
+iscsi_session_reconnect(struct iscsi_session *is)
+{
+
+ /*
+ * XXX: We can't use locking here, because
+ * it's being called from various contexts.
+ * Hope it doesn't break anything.
+ */
+ if (is->is_reconnecting)
+ return;
+
+ is->is_reconnecting = true;
+ cv_signal(&is->is_maintenance_cv);
+}
+
+/*
+ * Ask the maintenance thread to tear the session down.  Does nothing if
+ * termination has already been requested.  Sending a Logout Request
+ * first is currently compiled out.
+ */
+static void
+iscsi_session_terminate(struct iscsi_session *is)
+{
+ if (is->is_terminating)
+ return;
+
+ is->is_terminating = true;
+
+#if 0
+ iscsi_session_logout(is);
+#endif
+ cv_signal(&is->is_maintenance_cv);
+}
+
+/*
+ * Per-session timer ("context" is the session).  Re-arms itself to run
+ * again in one second unless the session is terminating, advances
+ * is_timeout, requests a reconnect when the wait for iscsid(8), the login
+ * or the ping has timed out, and otherwise sends a NOP-Out ping when no
+ * PDU has been received recently.
+ */
+static void
+iscsi_callout(void *context)
+{
+	struct icl_pdu *request;
+	struct iscsi_bhs_nop_out *bhsno;
+	struct iscsi_session *is;
+	bool reconnect_needed = false;
+
+	is = context;
+
+	if (is->is_terminating)
+		return;
+
+	callout_schedule(&is->is_callout, 1 * hz);
+
+	ISCSI_SESSION_LOCK(is);
+	is->is_timeout++;
+
+	if (is->is_waiting_for_iscsid) {
+		if (is->is_timeout > iscsid_timeout) {
+			ISCSI_SESSION_WARN(is, "timed out waiting for iscsid(8) "
+			    "for %d seconds; reconnecting",
+			    is->is_timeout);
+			reconnect_needed = true;
+		}
+		goto out;
+	}
+
+	if (is->is_login_phase) {
+		if (is->is_timeout > login_timeout) {
+			ISCSI_SESSION_WARN(is, "login timed out after %d seconds; "
+			    "reconnecting", is->is_timeout);
+			reconnect_needed = true;
+		}
+		goto out;
+	}
+
+	if (is->is_timeout >= ping_timeout) {
+		ISCSI_SESSION_WARN(is, "no ping reply (NOP-In) after %d seconds; "
+		    "reconnecting", ping_timeout);
+		reconnect_needed = true;
+		goto out;
+	}
+
+	/*
+	 * If the ping was reset less than one second ago - which means
+	 * that we've received some PDU during the last second - assume
+	 * the traffic flows correctly and don't bother sending a NOP-Out.
+	 *
+	 * (It's 2 - one for one second, and one for incrementing is_timeout
+	 * earlier in this routine.)
+	 *
+	 * The counter is examined while the session lock is still held.
+	 */
+	if (is->is_timeout < 2)
+		goto out;
+
+	ISCSI_SESSION_UNLOCK(is);
+
+	/*
+	 * Callout handlers must not sleep, so the allocation cannot wait
+	 * for memory.  If it fails, skip this ping; the timer fires again
+	 * in a second.
+	 */
+	request = icl_pdu_new_bhs(is->is_conn, M_NOWAIT);
+	if (request == NULL) {
+		ISCSI_SESSION_WARN(is, "failed to allocate PDU");
+		return;
+	}
+	bhsno = (struct iscsi_bhs_nop_out *)request->ip_bhs;
+	bhsno->bhsno_opcode = ISCSI_BHS_OPCODE_NOP_OUT |
+	    ISCSI_BHS_OPCODE_IMMEDIATE;
+	bhsno->bhsno_flags = 0x80;
+	bhsno->bhsno_target_transfer_tag = 0xffffffff;
+	iscsi_pdu_queue(request);
+	return;
+
+out:
+	ISCSI_SESSION_UNLOCK(is);
+
+	if (reconnect_needed)
+		iscsi_session_reconnect(is);
+}
+
+/*
+ * Update the session's StatSN, ExpCmdSN and MaxCmdSN from a received PDU
+ * and reset the ping timer.  When the command window grows and PDUs are
+ * postponed, the maintenance thread is woken up to send them.  Must be
+ * called with the session lock held.
+ */
+static void
+iscsi_pdu_update_statsn(const struct icl_pdu *response)
+{
+	const struct iscsi_bhs_data_in *bhsdi;
+	struct iscsi_session *is;
+	uint32_t expcmdsn, maxcmdsn, statsn;
+
+	is = PDU_SESSION(response);
+
+	ISCSI_SESSION_LOCK_ASSERT(is);
+
+	/*
+	 * We're only using fields common for all the response
+	 * (target -> initiator) PDUs.
+	 */
+	bhsdi = (const struct iscsi_bhs_data_in *)response->ip_bhs;
+	/*
+	 * Ok, I lied.  In case of Data-In, "The fields StatSN, Status,
+	 * and Residual Count only have meaningful content if the S bit
+	 * is set to 1", so we also need to check the bit specific for
+	 * Data-In PDU.
+	 */
+	if (bhsdi->bhsdi_opcode != ISCSI_BHS_OPCODE_SCSI_DATA_IN ||
+	    (bhsdi->bhsdi_flags & BHSDI_FLAGS_S) != 0) {
+		statsn = ntohl(bhsdi->bhsdi_statsn);
+		if (statsn < is->is_statsn) {
+			/* Report the values in the order the text names them. */
+			ISCSI_SESSION_WARN(is,
+			    "PDU StatSN %d < session StatSN %d, opcode 0x%x",
+			    statsn, is->is_statsn,
+			    bhsdi->bhsdi_opcode);
+		}
+		is->is_statsn = statsn;
+	}
+
+	expcmdsn = ntohl(bhsdi->bhsdi_expcmdsn);
+	maxcmdsn = ntohl(bhsdi->bhsdi_maxcmdsn);
+
+	/*
+	 * XXX: Compare using Serial Arithmetic Sense.
+	 */
+	if (maxcmdsn + 1 < expcmdsn) {
+		ISCSI_SESSION_DEBUG(is, "PDU MaxCmdSN %d + 1 < PDU ExpCmdSN %d; ignoring",
+		    maxcmdsn, expcmdsn);
+	} else {
+		if (maxcmdsn > is->is_maxcmdsn) {
+			is->is_maxcmdsn = maxcmdsn;
+
+			/*
+			 * Command window increased; kick the maintenance thread
+			 * to send out postponed commands.
+			 */
+			if (!TAILQ_EMPTY(&is->is_postponed))
+				cv_signal(&is->is_maintenance_cv);
+		} else if (maxcmdsn < is->is_maxcmdsn) {
+			ISCSI_SESSION_DEBUG(is, "PDU MaxCmdSN %d < session MaxCmdSN %d; ignoring",
+			    maxcmdsn, is->is_maxcmdsn);
+		}
+
+		if (expcmdsn > is->is_expcmdsn) {
+			is->is_expcmdsn = expcmdsn;
+		} else if (expcmdsn < is->is_expcmdsn) {
+			ISCSI_SESSION_DEBUG(is, "PDU ExpCmdSN %d < session ExpCmdSN %d; ignoring",
+			    expcmdsn, is->is_expcmdsn);
+		}
+	}
+
+	/*
+	 * Every incoming PDU - not just NOP-In - resets the ping timer.
+	 * The purpose of the timeout is to reset the connection when it stalls;
+	 * we don't want this to happen when NOP-In or NOP-Out ends up delayed
+	 * in some queue.
+	 */
+	is->is_timeout = 0;
+}
+
+/*
+ * Entry point for PDUs arriving on the session's connection.
+ *
+ * Runs with the session lock taken here.  Sequence-number state is updated
+ * first; the PDU is then handed to the opcode-specific handler, which takes
+ * over the responsibility for freeing it.
+ */
+static void
+iscsi_receive_callback(struct icl_pdu *response)
+{
+	struct iscsi_session *is = PDU_SESSION(response);
+
+	ISCSI_SESSION_LOCK(is);
+
+#ifdef ICL_KERNEL_PROXY
+	if (is->is_login_phase) {
+		/*
+		 * While logging in, the PDU is parked in is_login_pdu and
+		 * the waiter on is_login_cv is woken up.  Only one PDU can
+		 * be parked; anything arriving on top of it is dropped.
+		 */
+		if (is->is_login_pdu != NULL)
+			icl_pdu_free(response);
+		else
+			is->is_login_pdu = response;
+		ISCSI_SESSION_UNLOCK(is);
+		cv_signal(&is->is_login_cv);
+		return;
+	}
+#endif
+
+	iscsi_pdu_update_statsn(response);
+
+	/*
+	 * Past this point the PDU belongs to whichever handler gets it;
+	 * each of them frees it once done.
+	 */
+	switch (response->ip_bhs->bhs_opcode) {
+	case ISCSI_BHS_OPCODE_NOP_IN:
+		iscsi_pdu_handle_nop_in(response);
+		break;
+	case ISCSI_BHS_OPCODE_SCSI_RESPONSE:
+		iscsi_pdu_handle_scsi_response(response);
+		break;
+	case ISCSI_BHS_OPCODE_SCSI_DATA_IN:
+		iscsi_pdu_handle_data_in(response);
+		break;
+	case ISCSI_BHS_OPCODE_LOGOUT_RESPONSE:
+		iscsi_pdu_handle_logout_response(response);
+		break;
+	case ISCSI_BHS_OPCODE_R2T:
+		iscsi_pdu_handle_r2t(response);
+		break;
+	case ISCSI_BHS_OPCODE_ASYNC_MESSAGE:
+		iscsi_pdu_handle_async_message(response);
+		break;
+	case ISCSI_BHS_OPCODE_REJECT:
+		iscsi_pdu_handle_reject(response);
+		break;
+	default:
+		/* Unknown opcode: no handler owns the PDU, so free it here. */
+		ISCSI_SESSION_WARN(is, "received PDU with unsupported "
+		    "opcode 0x%x; reconnecting",
+		    response->ip_bhs->bhs_opcode);
+		iscsi_session_reconnect(is);
+		icl_pdu_free(response);
+		break;
+	}
+
+	ISCSI_SESSION_UNLOCK(is);
+}
+
+/*
+ * Connection error hook: log the failure and request a reconnect of the
+ * session that owns the connection.
+ */
+static void
+iscsi_error_callback(struct icl_conn *ic)
+{
+	struct iscsi_session *is = CONN_SESSION(ic);
+
+	ISCSI_SESSION_WARN(is, "connection error; reconnecting");
+	iscsi_session_reconnect(is);
+}
+
+/*
+ * Handle a NOP-In PDU and free it.
+ *
+ * A NOP-In whose Target Transfer Tag is 0xffffffff needs no answer.  Any
+ * other NOP-In is answered with a NOP-Out that echoes the tag and carries
+ * the data segment taken over from the NOP-In.
+ */
+static void
+iscsi_pdu_handle_nop_in(struct icl_pdu *response)
+{
+	struct iscsi_bhs_nop_out *bhsno;
+	struct iscsi_bhs_nop_in *bhsni;
+	struct icl_pdu *request;
+
+	bhsni = (struct iscsi_bhs_nop_in *)response->ip_bhs;
+
+	if (bhsni->bhsni_target_transfer_tag == 0xffffffff) {
+		/*
+		 * Nothing to do; iscsi_pdu_update_statsn() already
+		 * zeroed the timeout.
+		 */
+		icl_pdu_free(response);
+		return;
+	}
+
+	request = icl_pdu_new_bhs(response->ip_conn, M_NOWAIT);
+	if (request == NULL) {
+		/*
+		 * Don't drop the ping silently; leave a trace so that an
+		 * unanswered NOP-In can be explained afterwards.
+		 */
+		ISCSI_SESSION_WARN(PDU_SESSION(response),
+		    "failed to allocate memory for NOP-Out; "
+		    "NOP-In left unanswered");
+		icl_pdu_free(response);
+		return;
+	}
+	bhsno = (struct iscsi_bhs_nop_out *)request->ip_bhs;
+	bhsno->bhsno_opcode = ISCSI_BHS_OPCODE_NOP_OUT |
+	    ISCSI_BHS_OPCODE_IMMEDIATE;
+	bhsno->bhsno_flags = 0x80;
+	bhsno->bhsno_initiator_task_tag = 0xffffffff; /* XXX */
+	bhsno->bhsno_target_transfer_tag = bhsni->bhsni_target_transfer_tag;
+
+	/*
+	 * Move the data segment from the NOP-In to the NOP-Out instead of
+	 * copying it; the NOP-In is emptied so that freeing it below does
+	 * not release the data that is now owned by the reply.
+	 */
+	request->ip_data_len = response->ip_data_len;
+	request->ip_data_mbuf = response->ip_data_mbuf;
+	response->ip_data_len = 0;
+	response->ip_data_mbuf = NULL;
+
+	icl_pdu_free(response);
+	iscsi_pdu_queue_locked(request);
+}
+
+/*
+ * Handle a SCSI Response PDU: translate the iSCSI response and SCSI status
+ * into a CAM status, copy out sense data if any was sent, work out the
+ * residual, complete the CCB and drop the outstanding entry.
+ *
+ * An unknown Initiator Task Tag or a residual overflow indication results
+ * in a reconnect without completing anything here.  The PDU is freed on
+ * every path.
+ */
+static void
+iscsi_pdu_handle_scsi_response(struct icl_pdu *response)
+{
+	struct iscsi_bhs_scsi_response *bhssr;
+	struct iscsi_outstanding *io;
+	struct iscsi_session *is;
+	struct ccb_scsiio *csio;
+	union ccb *ccb;
+	size_t data_segment_len, expected_len;
+	uint16_t sense_len;
+
+	is = PDU_SESSION(response);
+	bhssr = (struct iscsi_bhs_scsi_response *)response->ip_bhs;
+
+	io = iscsi_outstanding_find(is, bhssr->bhssr_initiator_task_tag);
+	if (io == NULL) {
+		ISCSI_SESSION_WARN(is, "bad itt 0x%x", bhssr->bhssr_initiator_task_tag);
+		icl_pdu_free(response);
+		iscsi_session_reconnect(is);
+		return;
+	}
+	ccb = io->io_ccb;
+	csio = &ccb->csio;
+
+	/*
+	 * Map the outcome to a CAM status.  Every failure status freezes
+	 * the device queue, unless the CCB is already marked as frozen.
+	 */
+	if (bhssr->bhssr_response != BHSSR_RESPONSE_COMMAND_COMPLETED) {
+		ISCSI_SESSION_WARN(is, "service response 0x%x", bhssr->bhssr_response);
+		if ((ccb->ccb_h.status & CAM_DEV_QFRZN) == 0) {
+			xpt_freeze_devq(ccb->ccb_h.path, 1);
+			ISCSI_SESSION_DEBUG(is, "freezing devq");
+		}
+		ccb->ccb_h.status = CAM_REQ_CMP_ERR | CAM_DEV_QFRZN;
+	} else if (bhssr->bhssr_status != 0) {
+		if ((ccb->ccb_h.status & CAM_DEV_QFRZN) == 0) {
+			xpt_freeze_devq(ccb->ccb_h.path, 1);
+			ISCSI_SESSION_DEBUG(is, "freezing devq");
+		}
+		ccb->ccb_h.status = CAM_SCSI_STATUS_ERROR | CAM_DEV_QFRZN;
+		csio->scsi_status = bhssr->bhssr_status;
+	} else {
+		ccb->ccb_h.status = CAM_REQ_CMP;
+	}
+
+	if (bhssr->bhssr_flags & BHSSR_FLAGS_RESIDUAL_OVERFLOW) {
+		ISCSI_SESSION_WARN(is, "target indicated residual overflow");
+		icl_pdu_free(response);
+		iscsi_session_reconnect(is);
+		return;
+	}
+
+	/*
+	 * A non-empty data segment starts with a two-byte, network-order
+	 * sense length, followed by the sense data itself.
+	 */
+	data_segment_len = icl_pdu_data_segment_length(response);
+	if (data_segment_len > 0) {
+		if (data_segment_len < sizeof(sense_len)) {
+			ISCSI_SESSION_WARN(is, "truncated data segment (%zd bytes)",
+			    data_segment_len);
+			if ((ccb->ccb_h.status & CAM_DEV_QFRZN) == 0) {
+				xpt_freeze_devq(ccb->ccb_h.path, 1);
+				ISCSI_SESSION_DEBUG(is, "freezing devq");
+			}
+			ccb->ccb_h.status = CAM_REQ_CMP_ERR | CAM_DEV_QFRZN;
+			goto out;
+		}
+
+		icl_pdu_get_data(response, 0, &sense_len, sizeof(sense_len));
+		sense_len = ntohs(sense_len);
+		expected_len = sizeof(sense_len) + sense_len;
+
+		if (expected_len > data_segment_len) {
+			ISCSI_SESSION_WARN(is, "truncated data segment "
+			    "(%zd bytes, should be %zd)",
+			    data_segment_len, expected_len);
+			if ((ccb->ccb_h.status & CAM_DEV_QFRZN) == 0) {
+				xpt_freeze_devq(ccb->ccb_h.path, 1);
+				ISCSI_SESSION_DEBUG(is, "freezing devq");
+			}
+			ccb->ccb_h.status = CAM_REQ_CMP_ERR | CAM_DEV_QFRZN;
+			goto out;
+		}
+		if (expected_len < data_segment_len) {
+			/* Trailing bytes are only reported, not treated as fatal. */
+			ISCSI_SESSION_WARN(is, "oversize data segment "
+			    "(%zd bytes, should be %zd)",
+			    data_segment_len, expected_len);
+		}
+
+		/* Never copy more sense than the CCB has room for. */
+		if (sense_len > csio->sense_len) {
+			ISCSI_SESSION_DEBUG(is, "truncating sense from %d to %d",
+			    sense_len, csio->sense_len);
+			sense_len = csio->sense_len;
+		}
+		icl_pdu_get_data(response, sizeof(sense_len), &csio->sense_data, sense_len);
+		csio->sense_resid = csio->sense_len - sense_len;
+		ccb->ccb_h.status |= CAM_AUTOSNS_VALID;
+	}
+
+out:
+	if (bhssr->bhssr_flags & BHSSR_FLAGS_RESIDUAL_UNDERFLOW)
+		csio->resid = ntohl(bhssr->bhssr_residual_count);
+
+	/*
+	 * For reads, the residual is derived from what was actually
+	 * received; the value reported by the target is only cross-checked.
+	 */
+	if ((csio->ccb_h.flags & CAM_DIR_MASK) == CAM_DIR_IN) {
+		KASSERT(io->io_received <= csio->dxfer_len,
+		    ("io->io_received > csio->dxfer_len"));
+		if (io->io_received < csio->dxfer_len) {
+			if (csio->resid != csio->dxfer_len - io->io_received) {
+				ISCSI_SESSION_WARN(is, "underflow mismatch: "
+				    "target indicates %d, we calculated %zd",
+				    csio->resid,
+				    csio->dxfer_len - io->io_received);
+			}
+			csio->resid = csio->dxfer_len - io->io_received;
+		}
+	}
+
+	xpt_done(ccb);
+	iscsi_outstanding_remove(is, io);
+	icl_pdu_free(response);
+}
+
+/*
+ * Handle a SCSI Data-In PDU: copy its data segment into the buffer of the
+ * matching outstanding command and, when the S flag is set, complete the
+ * command with the status carried by the PDU.
+ *
+ * An unknown Initiator Task Tag, an unexpected buffer offset or a segment
+ * running past the end of the buffer triggers a reconnect.  The PDU is
+ * freed on every path.
+ */
+static void
+iscsi_pdu_handle_data_in(struct icl_pdu *response)
+{
+	struct iscsi_bhs_data_in *bhsdi;
+	struct iscsi_outstanding *io;
+	struct iscsi_session *is;
+	struct ccb_scsiio *csio;
+	size_t data_segment_len;
+	uint32_t offset;
+
+	is = PDU_SESSION(response);
+	bhsdi = (struct iscsi_bhs_data_in *)response->ip_bhs;
+
+	io = iscsi_outstanding_find(is, bhsdi->bhsdi_initiator_task_tag);
+	if (io == NULL) {
+		ISCSI_SESSION_WARN(is, "bad itt 0x%x", bhsdi->bhsdi_initiator_task_tag);
+		icl_pdu_free(response);
+		iscsi_session_reconnect(is);
+		return;
+	}
+
+	data_segment_len = icl_pdu_data_segment_length(response);
+	if (data_segment_len == 0) {
+		/*
+		 * "The sending of 0 length data segments should be avoided,
+		 * but initiators and targets MUST be able to properly receive
+		 * 0 length data segments."
+		 */
+		icl_pdu_free(response);
+		return;
+	}
+
+	offset = ntohl(bhsdi->bhsdi_buffer_offset);
+
+	/*
+	 * Data must arrive strictly in order.  This is tracked for security
+	 * reasons: otherwise a malicious target could answer a SCSI READ
+	 * without sending Data-In PDUs, and the read on the initiator side
+	 * would return random kernel data.
+	 */
+	if (offset != io->io_received) {
+		ISCSI_SESSION_WARN(is, "data out of order; expected offset %zd, got %zd",
+		    io->io_received, (size_t)offset);
+		icl_pdu_free(response);
+		iscsi_session_reconnect(is);
+		return;
+	}
+
+	csio = &io->io_ccb->csio;
+
+	/* Refuse anything that would not fit into the data buffer. */
+	if (offset + data_segment_len > csio->dxfer_len) {
+		ISCSI_SESSION_WARN(is, "oversize data segment (%zd bytes "
+		    "at offset %d, buffer is %d)",
+		    data_segment_len, offset, csio->dxfer_len);
+		icl_pdu_free(response);
+		iscsi_session_reconnect(is);
+		return;
+	}
+
+	icl_pdu_get_data(response, 0, csio->data_ptr + offset, data_segment_len);
+	io->io_received += data_segment_len;
+
+	/*
+	 * XXX: Check DataSN.
+	 * XXX: Check F.
+	 */
+	if (bhsdi->bhsdi_flags & BHSDI_FLAGS_S) {
+		/* Status is piggybacked on the data; finish the command. */
+		if (bhsdi->bhsdi_status != 0) {
+			if ((io->io_ccb->ccb_h.status & CAM_DEV_QFRZN) == 0) {
+				xpt_freeze_devq(io->io_ccb->ccb_h.path, 1);
+				ISCSI_SESSION_DEBUG(is, "freezing devq");
+			}
+			io->io_ccb->ccb_h.status = CAM_SCSI_STATUS_ERROR | CAM_DEV_QFRZN;
+			csio->scsi_status = bhsdi->bhsdi_status;
+		} else {
+			io->io_ccb->ccb_h.status = CAM_REQ_CMP;
+		}
+		xpt_done(io->io_ccb);
+		iscsi_outstanding_remove(is, io);
+	}
+
+	icl_pdu_free(response);
+}
+
+/*
+ * Handle a Logout Response PDU: it is only logged and then freed.
+ */
+static void
+iscsi_pdu_handle_logout_response(struct icl_pdu *response)
+{
+	struct iscsi_session *is;
+
+	is = PDU_SESSION(response);
+	ISCSI_SESSION_DEBUG(is, "logout response");
+	icl_pdu_free(response);
+}
+
+/*
+ * Handle a Ready To Transfer (R2T) PDU by queueing the Data-Out PDUs that
+ * carry the range of the write buffer requested by the target.
+ *
+ * The requested range is cut into pieces no larger than the session's
+ * maximum data segment length; the last piece has the F flag set.  An
+ * unknown Initiator Task Tag, an R2T for a command that is not a write, a
+ * range outside of the buffer, or an allocation failure triggers a
+ * reconnect.  The R2T PDU is freed on every path.
+ */
+static void
+iscsi_pdu_handle_r2t(struct icl_pdu *response)
+{
+	struct icl_pdu *request;
+	struct iscsi_session *is;
+	struct iscsi_bhs_r2t *bhsr2t;
+	struct iscsi_bhs_data_out *bhsdo;
+	struct iscsi_outstanding *io;
+	struct ccb_scsiio *csio;
+	size_t off, len, total_len;
+	int error;
+
+	is = PDU_SESSION(response);
+
+	bhsr2t = (struct iscsi_bhs_r2t *)response->ip_bhs;
+	io = iscsi_outstanding_find(is, bhsr2t->bhsr2t_initiator_task_tag);
+	if (io == NULL) {
+		ISCSI_SESSION_WARN(is, "bad itt 0x%x; reconnecting",
+		    bhsr2t->bhsr2t_initiator_task_tag);
+		icl_pdu_free(response);
+		iscsi_session_reconnect(is);
+		return;
+	}
+
+	csio = &io->io_ccb->csio;
+
+	if ((csio->ccb_h.flags & CAM_DIR_MASK) != CAM_DIR_OUT) {
+		ISCSI_SESSION_WARN(is, "received R2T for read command; reconnecting");
+		icl_pdu_free(response);
+		iscsi_session_reconnect(is);
+		return;
+	}
+
+	/*
+	 * XXX: Verify R2TSN.
+	 */
+
+	/* DataSN numbering starts over for the PDUs answering this R2T. */
+	io->io_datasn = 0;
+	off = ntohl(bhsr2t->bhsr2t_buffer_offset);
+	total_len = ntohl(bhsr2t->bhsr2t_desired_data_transfer_length);
+
+	for (;;) {
+		len = total_len;
+
+		if (len > is->is_max_data_segment_length)
+			len = is->is_max_data_segment_length;
+
+		if (off + len > csio->dxfer_len) {
+			/*
+			 * The value printed is the end of the requested
+			 * range (offset + length), next to the size of the
+			 * buffer it does not fit into.
+			 */
+			ISCSI_SESSION_WARN(is, "target requested invalid "
+			    "length/offset %zd, buffer is %d; reconnecting",
+			    off + len, csio->dxfer_len);
+			icl_pdu_free(response);
+			iscsi_session_reconnect(is);
+			return;
+		}
+
+		request = icl_pdu_new_bhs(response->ip_conn, M_NOWAIT);
+		if (request == NULL) {
+			icl_pdu_free(response);
+			iscsi_session_reconnect(is);
+			return;
+		}
+
+		bhsdo = (struct iscsi_bhs_data_out *)request->ip_bhs;
+		bhsdo->bhsdo_opcode = ISCSI_BHS_OPCODE_SCSI_DATA_OUT;
+		bhsdo->bhsdo_lun = bhsr2t->bhsr2t_lun;
+		bhsdo->bhsdo_initiator_task_tag =
+		    bhsr2t->bhsr2t_initiator_task_tag;
+		bhsdo->bhsdo_target_transfer_tag =
+		    bhsr2t->bhsr2t_target_transfer_tag;
+		bhsdo->bhsdo_datasn = htonl(io->io_datasn++);
+		bhsdo->bhsdo_buffer_offset = htonl(off);
+		error = icl_pdu_append_data(request, csio->data_ptr + off, len, M_NOWAIT);
+		if (error != 0) {
+			icl_pdu_free(request);
+			icl_pdu_free(response);
+			iscsi_session_reconnect(is);
+			return;
+		}
+
+		off += len;
+		total_len -= len;
+
+		/* The piece that exhausts the request is the final one. */
+		if (total_len == 0)
+			bhsdo->bhsdo_flags |= BHSDO_FLAGS_F;
+
+		iscsi_pdu_queue_locked(request);
+
+		if (total_len == 0)
+			break;
+	}
+
+	icl_pdu_free(response);
+}
+
+/*
+ * Handle an Asynchronous Message PDU and free it.
+ *
+ * A logout request from the target makes the session log out and
+ * terminate.  Announcements of the target dropping the connection or the
+ * session, as well as any other event, are only logged.
+ */
+static void
+iscsi_pdu_handle_async_message(struct icl_pdu *response)
+{
+	struct iscsi_bhs_asynchronous_message *bhsam;
+	struct iscsi_session *is;
+
+	is = PDU_SESSION(response);
+	bhsam = (struct iscsi_bhs_asynchronous_message *)response->ip_bhs;
+	switch (bhsam->bhsam_async_event) {
+	case BHSAM_EVENT_TARGET_REQUESTS_LOGOUT:
+		ISCSI_SESSION_WARN(is, "target requests logout; removing session");
+		iscsi_session_logout(is);
+		iscsi_session_terminate(is);
+		break;
+	case BHSAM_EVENT_TARGET_TERMINATES_CONNECTION:
+		ISCSI_SESSION_WARN(is, "target indicates it will drop the connection");
+		break;
+	case BHSAM_EVENT_TARGET_TERMINATES_SESSION:
+		ISCSI_SESSION_WARN(is, "target indicates it will drop the session");
+		break;
+	default:
+		/*
+		 * XXX: Technically, we're obligated to also handle
+		 * parameter renegotiation.
+		 */
+		ISCSI_SESSION_WARN(is, "ignoring AsyncEvent %d", bhsam->bhsam_async_event);
+		break;
+	}
+
+	icl_pdu_free(response);
+}
+
+/*
+ * Handle a Reject PDU: log the reason code reported by the target and
+ * free the PDU.  No other action is taken.
+ */
+static void
+iscsi_pdu_handle_reject(struct icl_pdu *response)
+{
+	struct iscsi_session *is = PDU_SESSION(response);
+	struct iscsi_bhs_reject *bhsr =
+	    (struct iscsi_bhs_reject *)response->ip_bhs;
+
+	ISCSI_SESSION_WARN(is, "received Reject PDU, reason 0x%x; protocol error?",
+	    bhsr->bhsr_reason);
+
+	icl_pdu_free(response);
+}
+
+/*
+ * ISCSIDWAIT: block until some session is waiting for iscsid(8), then move
+ * that session into the login phase and hand its id and configuration back
+ * in *request.
+ *
+ * Returns 0 on success, or the error from cv_wait_sig() when the sleep
+ * ends with one.
+ */
+static int
+iscsi_ioctl_daemon_wait(struct iscsi_softc *sc,
+    struct iscsi_daemon_request *request)
+{
+	struct iscsi_session *is;
+	int error;
+
+	sx_slock(&sc->sc_lock);
+
+	/*
+	 * Rescan the session list after every wakeup until a session that
+	 * requires attention from iscsid(8) shows up.
+	 */
+	for (;;) {
+		TAILQ_FOREACH(is, &sc->sc_sessions, is_next) {
+			if (is->is_waiting_for_iscsid)
+				break;
+		}
+		if (is != NULL)
+			break;
+
+		error = cv_wait_sig(&sc->sc_cv, &sc->sc_lock);
+		if (error != 0) {
+			sx_sunlock(&sc->sc_lock);
+			return (error);
+		}
+	}
+
+	ISCSI_SESSION_LOCK(is);
+	is->is_waiting_for_iscsid = false;
+	is->is_login_phase = true;
+	is->is_reason[0] = '\0';
+	ISCSI_SESSION_UNLOCK(is);
+
+	request->idr_session_id = is->is_id;
+	memcpy(&request->idr_conf, &is->is_conf,
+	    sizeof(request->idr_conf));
+
+	sx_sunlock(&sc->sc_lock);
+
+	return (0);
+}
+
+/*
+ * ISCSIDHANDOFF: take over a session that finished logging in.
+ *
+ * Copies the negotiated parameters from *handoff into the session, resets
+ * the command sequence numbers, marks the session as connected and - unless
+ * ICL_KERNEL_PROXY is defined - hands the socket over to the connection.
+ * If the session already has a SIM (reconnect), its frozen queue is
+ * released; otherwise the SIM is allocated and registered with CAM.
+ *
+ * Returns 0 on success, ESRCH when no session has the given id, EINVAL for
+ * a discovery or terminating session, the error from icl_conn_handoff(),
+ * or ENOMEM when setting up the SIM fails.  On any failure after the
+ * session was found and validated, the session is terminated.
+ */
+static int
+iscsi_ioctl_daemon_handoff(struct iscsi_softc *sc,
+    struct iscsi_daemon_handoff *handoff)
+{
+	struct iscsi_session *is;
+	int error;
+
+	sx_slock(&sc->sc_lock);
+
+	/*
+	 * Find the session to hand off socket to.
+	 */
+	TAILQ_FOREACH(is, &sc->sc_sessions, is_next) {
+		if (is->is_id == handoff->idh_session_id)
+			break;
+	}
+	if (is == NULL) {
+		sx_sunlock(&sc->sc_lock);
+		return (ESRCH);
+	}
+	ISCSI_SESSION_LOCK(is);
+	if (is->is_conf.isc_discovery || is->is_terminating) {
+		ISCSI_SESSION_UNLOCK(is);
+		sx_sunlock(&sc->sc_lock);
+		return (EINVAL);
+	}
+
+	strlcpy(is->is_target_alias, handoff->idh_target_alias,
+	    sizeof(is->is_target_alias));
+	memcpy(is->is_isid, handoff->idh_isid, sizeof(is->is_isid));
+	is->is_statsn = handoff->idh_statsn;
+	is->is_initial_r2t = handoff->idh_initial_r2t;
+	is->is_immediate_data = handoff->idh_immediate_data;
+	is->is_max_data_segment_length = handoff->idh_max_data_segment_length;
+	is->is_max_burst_length = handoff->idh_max_burst_length;
+	is->is_first_burst_length = handoff->idh_first_burst_length;
+
+	if (handoff->idh_header_digest == ISCSI_DIGEST_CRC32C)
+		is->is_conn->ic_header_crc32c = true;
+	else
+		is->is_conn->ic_header_crc32c = false;
+	if (handoff->idh_data_digest == ISCSI_DIGEST_CRC32C)
+		is->is_conn->ic_data_crc32c = true;
+	else
+		is->is_conn->ic_data_crc32c = false;
+
+	is->is_cmdsn = 0;
+	is->is_expcmdsn = 1;
+	is->is_maxcmdsn = 1;
+	is->is_waiting_for_iscsid = false;
+	is->is_login_phase = false;
+	is->is_timeout = 0;
+	is->is_connected = true;
+	is->is_reason[0] = '\0';
+
+	ISCSI_SESSION_UNLOCK(is);
+
+#ifndef ICL_KERNEL_PROXY
+	error = icl_conn_handoff(is->is_conn, handoff->idh_socket);
+	if (error != 0) {
+		sx_sunlock(&sc->sc_lock);
+		iscsi_session_terminate(is);
+		return (error);
+	}
+#endif
+
+	sx_sunlock(&sc->sc_lock);
+
+	if (is->is_sim != NULL) {
+		/*
+		 * When reconnecting, there already is SIM allocated for the session.
+		 */
+		KASSERT(is->is_simq_frozen, ("reconnect without frozen simq"));
+		ISCSI_SESSION_LOCK(is);
+		ISCSI_SESSION_DEBUG(is, "releasing");
+		xpt_release_simq(is->is_sim, 1);
+		is->is_simq_frozen = false;
+		ISCSI_SESSION_UNLOCK(is);
+
+	} else {
+		ISCSI_SESSION_LOCK(is);
+		is->is_devq = cam_simq_alloc(maxtags);
+		if (is->is_devq == NULL) {
+			/*
+			 * Drop the session lock before bailing out, like
+			 * every other failure path below does; returning
+			 * with it held would leave the session locked
+			 * for good.
+			 */
+			ISCSI_SESSION_UNLOCK(is);
+			ISCSI_SESSION_WARN(is, "failed to allocate simq");
+			iscsi_session_terminate(is);
+			return (ENOMEM);
+		}
+
+		is->is_sim = cam_sim_alloc(iscsi_action, iscsi_poll, "iscsi",
+		    is, is->is_id /* unit */, &is->is_lock,
+		    maxtags, maxtags, is->is_devq);
+		if (is->is_sim == NULL) {
+			ISCSI_SESSION_UNLOCK(is);
+			ISCSI_SESSION_WARN(is, "failed to allocate SIM");
+			cam_simq_free(is->is_devq);
+			iscsi_session_terminate(is);
+			return (ENOMEM);
+		}
+
+		error = xpt_bus_register(is->is_sim, NULL, 0);
+		if (error != 0) {
+			ISCSI_SESSION_UNLOCK(is);
+			ISCSI_SESSION_WARN(is, "failed to register bus");
+			iscsi_session_terminate(is);
+			return (ENOMEM);
+		}
+
+		error = xpt_create_path(&is->is_path, /*periph*/NULL,
+		    cam_sim_path(is->is_sim), CAM_TARGET_WILDCARD,
+		    CAM_LUN_WILDCARD);
+		if (error != CAM_REQ_CMP) {
+			ISCSI_SESSION_UNLOCK(is);
+			ISCSI_SESSION_WARN(is, "failed to create path");
+			iscsi_session_terminate(is);
+			return (ENOMEM);
+		}
+		ISCSI_SESSION_UNLOCK(is);
+	}
+
+	return (0);
+}
+
+/*
+ * ISCSIDFAIL: record the failure reason reported by iscsid(8) in the
+ * session with the given id.
+ *
+ * Returns 0 on success, or ESRCH when there is no such session.
+ */
+static int
+iscsi_ioctl_daemon_fail(struct iscsi_softc *sc,
+    struct iscsi_daemon_fail *fail)
+{
+	struct iscsi_session *is;
+	int error = ESRCH;
+
+	sx_slock(&sc->sc_lock);
+
+	TAILQ_FOREACH(is, &sc->sc_sessions, is_next) {
+		if (is->is_id == fail->idf_session_id)
+			break;
+	}
+	if (is != NULL) {
+		ISCSI_SESSION_LOCK(is);
+		ISCSI_SESSION_DEBUG(is, "iscsid(8) failed: %s",
+		    fail->idf_reason);
+		strlcpy(is->is_reason, fail->idf_reason, sizeof(is->is_reason));
+		/* Only the reason is stored; the state changes stay disabled. */
+		//is->is_waiting_for_iscsid = false;
+		//is->is_login_phase = true;
+		//iscsi_session_reconnect(is);
+		ISCSI_SESSION_UNLOCK(is);
+		error = 0;
+	}
+
+	sx_sunlock(&sc->sc_lock);
+
+	return (error);
+}
+
+#ifdef ICL_KERNEL_PROXY
+/*
+ * ISCSIDCONNECT: connect the session with the given id to the address
+ * supplied by the daemon, optionally binding to a source address first.
+ *
+ * The session is put into the login phase with its timeout counter reset
+ * before the connection attempt, and both digests are switched off after
+ * it.  Returns ESRCH when there is no such session, the getsockaddr()
+ * error when an address cannot be fetched, or else whatever
+ * icl_conn_connect() returned.
+ */
+static int
+iscsi_ioctl_daemon_connect(struct iscsi_softc *sc,
+    struct iscsi_daemon_connect *idc)
+{
+	struct iscsi_session *is;
+	struct sockaddr *from_sa, *to_sa;
+	int error;
+
+	sx_slock(&sc->sc_lock);
+	TAILQ_FOREACH(is, &sc->sc_sessions, is_next) {
+		if (is->is_id == idc->idc_session_id)
+			break;
+	}
+	sx_sunlock(&sc->sc_lock);
+	if (is == NULL)
+		return (ESRCH);
+
+	/* The source address is optional; the destination is not. */
+	from_sa = NULL;
+	if (idc->idc_from_addrlen > 0) {
+		error = getsockaddr(&from_sa, (void *)idc->idc_from_addr, idc->idc_from_addrlen);
+		if (error != 0)
+			return (error);
+	}
+	error = getsockaddr(&to_sa, (void *)idc->idc_to_addr, idc->idc_to_addrlen);
+	if (error != 0) {
+		free(from_sa, M_SONAME);
+		return (error);
+	}
+
+	ISCSI_SESSION_LOCK(is);
+	is->is_waiting_for_iscsid = false;
+	is->is_login_phase = true;
+	is->is_timeout = 0;
+	ISCSI_SESSION_UNLOCK(is);
+
+	error = icl_conn_connect(is->is_conn, idc->idc_iser, idc->idc_domain,
+	    idc->idc_socktype, idc->idc_protocol, from_sa, to_sa);
+	free(from_sa, M_SONAME);
+	free(to_sa, M_SONAME);
+
+	/*
+	 * Digests are always disabled during login phase.
+	 */
+	is->is_conn->ic_header_crc32c = false;
+	is->is_conn->ic_data_crc32c = false;
+
+	return (error);
+}
+
+/*
+ * ISCSIDSEND: build a PDU from the header and data segment supplied by the
+ * daemon and queue it on the connection of the session with the given id.
+ *
+ * Returns 0 on success, ESRCH when there is no such session, EBUSY when
+ * the session is not in the login phase, EIO when it is terminating or
+ * reconnecting, EINVAL when the data segment is larger than
+ * ISCSI_MAX_DATA_SEGMENT_LENGTH, or the copyin() error.
+ */
+static int
+iscsi_ioctl_daemon_send(struct iscsi_softc *sc,
+    struct iscsi_daemon_send *ids)
+{
+	struct iscsi_session *is;
+	struct icl_pdu *ip;
+	size_t datalen;
+	void *data;
+	int error;
+
+	sx_slock(&sc->sc_lock);
+	TAILQ_FOREACH(is, &sc->sc_sessions, is_next) {
+		if (is->is_id == ids->ids_session_id)
+			break;
+	}
+	sx_sunlock(&sc->sc_lock);
+	if (is == NULL)
+		return (ESRCH);
+
+	if (!is->is_login_phase)
+		return (EBUSY);
+
+	if (is->is_terminating || is->is_reconnecting)
+		return (EIO);
+
+	datalen = ids->ids_data_segment_len;
+	if (datalen > ISCSI_MAX_DATA_SEGMENT_LENGTH)
+		return (EINVAL);
+
+	/* Stage the data segment in a kernel buffer, if there is one. */
+	if (datalen > 0) {
+		data = malloc(datalen, M_ISCSI, M_WAITOK);
+		error = copyin(ids->ids_data_segment, data, datalen);
+		if (error != 0) {
+			free(data, M_ISCSI);
+			return (error);
+		}
+	}
+
+	ip = icl_pdu_new_bhs(is->is_conn, M_WAITOK);
+	/*
+	 * NOTE(review): the header is fetched with memcpy() while the
+	 * receive path hands its header back with copyout(); confirm
+	 * whether ids_bhs is a userland pointer that needs copyin().
+	 */
+	memcpy(ip->ip_bhs, ids->ids_bhs, sizeof(*ip->ip_bhs));
+	if (datalen > 0) {
+		error = icl_pdu_append_data(ip, data, datalen, M_WAITOK);
+		KASSERT(error == 0, ("icl_pdu_append_data(..., M_WAITOK) failed"));
+		free(data, M_ISCSI);
+	}
+	icl_pdu_queue(ip);
+
+	return (0);
+}
+
+/*
+ * ISCSIDRECEIVE: wait for a login-phase PDU on the session with the given
+ * id and copy its header and data segment out to the buffers supplied by
+ * the daemon.
+ *
+ * Returns 0 on success, ESRCH when there is no such session, EBUSY when
+ * the session is not in the login phase, EIO when it is terminating or
+ * reconnecting, EMSGSIZE when the data segment does not fit into the
+ * supplied buffer, or the copyout() error.  The PDU is consumed in all
+ * cases where one was dequeued.
+ */
+static int
+iscsi_ioctl_daemon_receive(struct iscsi_softc *sc,
+    struct iscsi_daemon_receive *idr)
+{
+	struct iscsi_session *is;
+	struct icl_pdu *ip;
+	void *data;
+	int error;
+
+	sx_slock(&sc->sc_lock);
+	TAILQ_FOREACH(is, &sc->sc_sessions, is_next) {
+		if (is->is_id == idr->idr_session_id)
+			break;
+	}
+	if (is == NULL) {
+		sx_sunlock(&sc->sc_lock);
+		return (ESRCH);
+	}
+	sx_sunlock(&sc->sc_lock);
+
+	if (is->is_login_phase == false)
+		return (EBUSY);
+
+	/* Sleep until a PDU gets parked or the session goes away. */
+	ISCSI_SESSION_LOCK(is);
+	while (is->is_login_pdu == NULL &&
+	    is->is_terminating == false &&
+	    is->is_reconnecting == false)
+		cv_wait(&is->is_login_cv, &is->is_lock);
+	if (is->is_terminating || is->is_reconnecting) {
+		ISCSI_SESSION_UNLOCK(is);
+		return (EIO);
+	}
+	ip = is->is_login_pdu;
+	is->is_login_pdu = NULL;
+	ISCSI_SESSION_UNLOCK(is);
+
+	if (ip->ip_data_len > idr->idr_data_segment_len) {
+		icl_pdu_free(ip);
+		return (EMSGSIZE);
+	}
+
+	/*
+	 * Report copyout() failures to the caller instead of claiming
+	 * success for a PDU that never made it out.
+	 */
+	error = copyout(ip->ip_bhs, idr->idr_bhs, sizeof(*ip->ip_bhs));
+	if (error == 0 && ip->ip_data_len > 0) {
+		data = malloc(ip->ip_data_len, M_ISCSI, M_WAITOK);
+		icl_pdu_get_data(ip, 0, data, ip->ip_data_len);
+		error = copyout(data, idr->idr_data_segment, ip->ip_data_len);
+		free(data, M_ISCSI);
+	}
+
+	icl_pdu_free(ip);
+
+	return (error);
+}
+
+/*
+ * ISCSIDCLOSE: request a reconnect of the session with the given id.
+ *
+ * Returns 0 on success, or ESRCH when there is no such session.
+ */
+static int
+iscsi_ioctl_daemon_close(struct iscsi_softc *sc,
+    struct iscsi_daemon_close *idc)
+{
+	struct iscsi_session *is;
+
+	sx_slock(&sc->sc_lock);
+	TAILQ_FOREACH(is, &sc->sc_sessions, is_next) {
+		if (is->is_id == idc->idc_session_id)
+			break;
+	}
+	sx_sunlock(&sc->sc_lock);
+
+	if (is == NULL)
+		return (ESRCH);
+
+	iscsi_session_reconnect(is);
+
+	return (0);
+}
+#endif /* ICL_KERNEL_PROXY */
+
+/*
+ * Force NUL termination of every string field of a session configuration
+ * by overwriting the last byte of each.
+ *
+ * XXX: This is not particularly secure.  We should create our own conf
+ *      and then copy in relevant fields.
+ */
+static void
+iscsi_sanitize_session_conf(struct iscsi_session_conf *isc)
+{
+
+	/* Names. */
+	isc->isc_initiator[ISCSI_NAME_LEN - 1] = '\0';
+	isc->isc_target[ISCSI_NAME_LEN - 1] = '\0';
+	isc->isc_user[ISCSI_NAME_LEN - 1] = '\0';
+	isc->isc_mutual_user[ISCSI_NAME_LEN - 1] = '\0';
+
+	/* Addresses. */
+	isc->isc_initiator_addr[ISCSI_ADDR_LEN - 1] = '\0';
+	isc->isc_target_addr[ISCSI_ADDR_LEN - 1] = '\0';
+
+	/* Alias. */
+	isc->isc_initiator_alias[ISCSI_ALIAS_LEN - 1] = '\0';
+
+	/* Secrets. */
+	isc->isc_secret[ISCSI_SECRET_LEN - 1] = '\0';
+	isc->isc_mutual_secret[ISCSI_SECRET_LEN - 1] = '\0';
+}
+
+/*
+ * ISCSISADD: create a new session from the configuration in *isa, start
+ * its callout and maintenance thread, and wake up iscsid(8) to connect it.
+ *
+ * Returns 0 on success, EINVAL when the initiator name or the target
+ * address is empty, EBUSY when a session for the same target name already
+ * exists, or the kthread_add() error.
+ */
+static int
+iscsi_ioctl_session_add(struct iscsi_softc *sc, struct iscsi_session_add *isa)
+{
+	struct iscsi_session *is;
+	const struct iscsi_session *is2;
+	int error;
+
+	iscsi_sanitize_session_conf(&isa->isa_conf);
+
+	is = malloc(sizeof(*is), M_ISCSI, M_ZERO | M_WAITOK);
+	memcpy(&is->is_conf, &isa->isa_conf, sizeof(is->is_conf));
+
+	/*
+	 * Check the first character of the strings, not the arrays
+	 * themselves; comparing an array against '\0' compares its address
+	 * and is never true.
+	 *
+	 * The target name used to be "checked" the same broken way.  That
+	 * no-op comparison is dropped rather than turned into a real one:
+	 * NOTE(review): an empty target name may be legitimate, e.g. for
+	 * isc_discovery sessions - confirm before requiring it.
+	 */
+	if (is->is_conf.isc_initiator[0] == '\0' ||
+	    is->is_conf.isc_target_addr[0] == '\0') {
+		free(is, M_ISCSI);
+		return (EINVAL);
+	}
+
+	sx_xlock(&sc->sc_lock);
+
+	/*
+	 * Prevent duplicates.
+	 */
+	TAILQ_FOREACH(is2, &sc->sc_sessions, is_next) {
+		if (strcmp(is2->is_conf.isc_target,
+		    is->is_conf.isc_target) == 0) {
+			sx_xunlock(&sc->sc_lock);
+			/* Nothing else was set up yet; don't leak it. */
+			free(is, M_ISCSI);
+			return (EBUSY);
+		}
+	}
+
+	is->is_conn = icl_conn_new();
+	is->is_conn->ic_receive = iscsi_receive_callback;
+	is->is_conn->ic_error = iscsi_error_callback;
+	is->is_conn->ic_prv0 = is;
+	TAILQ_INIT(&is->is_outstanding);
+	TAILQ_INIT(&is->is_postponed);
+	mtx_init(&is->is_lock, "iscsi_lock", NULL, MTX_DEF);
+	cv_init(&is->is_maintenance_cv, "iscsi_mt");
+#ifdef ICL_KERNEL_PROXY
+	cv_init(&is->is_login_cv, "iscsi_login");
+#endif
+
+	is->is_softc = sc;
+	sc->sc_last_session_id++;
+	is->is_id = sc->sc_last_session_id;
+	callout_init(&is->is_callout, 1);
+	callout_reset(&is->is_callout, 1 * hz, iscsi_callout, is);
+	TAILQ_INSERT_TAIL(&sc->sc_sessions, is, is_next);
+
+	error = kthread_add(iscsi_maintenance_thread, is, NULL, NULL, 0, 0, "iscsimt");
+	if (error != 0) {
+		ISCSI_SESSION_WARN(is, "kthread_add(9) failed with error %d", error);
+		/*
+		 * Never return with sc_lock held.
+		 *
+		 * NOTE(review): the session stays on sc_sessions with its
+		 * callout armed but without a maintenance thread; tearing
+		 * it down is not attempted here.
+		 */
+		sx_xunlock(&sc->sc_lock);
+		return (error);
+	}
+
+	/*
+	 * Trigger immediate reconnection.
+	 */
+	is->is_waiting_for_iscsid = true;
+	strlcpy(is->is_reason, "Waiting for iscsid(8)", sizeof(is->is_reason));
+	cv_signal(&sc->sc_cv);
+
+	sx_xunlock(&sc->sc_lock);
+
+	return (0);
+}
+
+/*
+ * Decide whether a session (id1, c1) is selected by the criteria
+ * (id2, c2).
+ *
+ * Criteria that specify nothing at all - zero id, empty target name and
+ * empty target address - select every session.  Otherwise it is enough
+ * for any one of the specified criteria to match.
+ */
+static bool
+iscsi_session_conf_matches(unsigned int id1, const struct iscsi_session_conf *c1,
+    unsigned int id2, const struct iscsi_session_conf *c2)
+{
+	bool by_target, by_addr;
+
+	by_target = (c2->isc_target[0] != '\0');
+	by_addr = (c2->isc_target_addr[0] != '\0');
+
+	/* Wildcard. */
+	if (id2 == 0 && !by_target && !by_addr)
+		return (true);
+
+	if (id2 != 0 && id1 == id2)
+		return (true);
+	if (by_target && strcmp(c1->isc_target, c2->isc_target) == 0)
+		return (true);
+	if (by_addr && strcmp(c1->isc_target_addr, c2->isc_target_addr) == 0)
+		return (true);
+
+	return (false);
+}
+
+/*
+ * ISCSISREMOVE: log out and terminate every session selected by the id
+ * and configuration in *isr.
+ *
+ * Returns 0 when at least one session matched, ESRCH otherwise.
+ */
+static int
+iscsi_ioctl_session_remove(struct iscsi_softc *sc,
+    struct iscsi_session_remove *isr)
+{
+	struct iscsi_session *is, *tmp;
+	bool found;
+
+	iscsi_sanitize_session_conf(&isr->isr_conf);
+
+	found = false;
+
+	sx_xlock(&sc->sc_lock);
+	TAILQ_FOREACH_SAFE(is, &sc->sc_sessions, is_next, tmp) {
+		ISCSI_SESSION_LOCK(is);
+		if (!iscsi_session_conf_matches(is->is_id, &is->is_conf,
+		    isr->isr_session_id, &isr->isr_conf)) {
+			ISCSI_SESSION_UNLOCK(is);
+			continue;
+		}
+		found = true;
+		iscsi_session_logout(is);
+		iscsi_session_terminate(is);
+		ISCSI_SESSION_UNLOCK(is);
+	}
+	sx_xunlock(&sc->sc_lock);
+
+	return (found ? 0 : ESRCH);
+}
+
+/*
+ * ISCSISLIST: copy the state of every session out to the array supplied
+ * in *isl and store the number of entries written in isl_nentries.
+ *
+ * Returns 0 on success, EMSGSIZE when there are more sessions than
+ * isl_nentries, or the copyout() error.  isl_nentries is left untouched
+ * on failure.
+ */
+static int
+iscsi_ioctl_session_list(struct iscsi_softc *sc, struct iscsi_session_list *isl)
+{
+	struct iscsi_session_state iss;
+	struct iscsi_session *is;
+	unsigned int count;
+	int error;
+
+	count = 0;
+
+	sx_slock(&sc->sc_lock);
+	TAILQ_FOREACH(is, &sc->sc_sessions, is_next) {
+		if (count >= isl->isl_nentries) {
+			sx_sunlock(&sc->sc_lock);
+			return (EMSGSIZE);
+		}
+
+		/* Start from zeroes so that no stale stack data is copied out. */
+		memset(&iss, 0, sizeof(iss));
+		iss.iss_id = is->is_id;
+		memcpy(&iss.iss_conf, &is->is_conf, sizeof(iss.iss_conf));
+		strlcpy(iss.iss_target_alias, is->is_target_alias, sizeof(iss.iss_target_alias));
+		strlcpy(iss.iss_reason, is->is_reason, sizeof(iss.iss_reason));
+
+		iss.iss_header_digest = is->is_conn->ic_header_crc32c ?
+		    ISCSI_DIGEST_CRC32C : ISCSI_DIGEST_NONE;
+		iss.iss_data_digest = is->is_conn->ic_data_crc32c ?
+		    ISCSI_DIGEST_CRC32C : ISCSI_DIGEST_NONE;
+
+		iss.iss_max_data_segment_length = is->is_max_data_segment_length;
+		iss.iss_immediate_data = is->is_immediate_data;
+		iss.iss_connected = is->is_connected;
+
+		error = copyout(&iss, isl->isl_pstates + count, sizeof(iss));
+		if (error != 0) {
+			sx_sunlock(&sc->sc_lock);
+			return (error);
+		}
+		count++;
+	}
+	sx_sunlock(&sc->sc_lock);
+
+	isl->isl_nentries = count;
+
+	return (0);
+}
+
+/*
+ * ioctl entry point of the iscsi control device: dispatch the command to
+ * its handler, passing the softc stored in si_drv1 and the argument cast
+ * to the structure the command expects.
+ *
+ * Returns the handler's result, or EINVAL for an unknown command.
+ */
+static int
+iscsi_ioctl(struct cdev *dev, u_long cmd, caddr_t arg, int mode,
+    struct thread *td)
+{
+	struct iscsi_softc *sc = dev->si_drv1;
+	int error;
+
+	switch (cmd) {
+	case ISCSIDWAIT:
+		error = iscsi_ioctl_daemon_wait(sc,
+		    (struct iscsi_daemon_request *)arg);
+		break;
+	case ISCSIDHANDOFF:
+		error = iscsi_ioctl_daemon_handoff(sc,
+		    (struct iscsi_daemon_handoff *)arg);
+		break;
+	case ISCSIDFAIL:
+		error = iscsi_ioctl_daemon_fail(sc,
+		    (struct iscsi_daemon_fail *)arg);
+		break;
+#ifdef ICL_KERNEL_PROXY
+	case ISCSIDCONNECT:
+		error = iscsi_ioctl_daemon_connect(sc,
+		    (struct iscsi_daemon_connect *)arg);
+		break;
+	case ISCSIDSEND:
+		error = iscsi_ioctl_daemon_send(sc,
+		    (struct iscsi_daemon_send *)arg);
+		break;
+	case ISCSIDRECEIVE:
+		error = iscsi_ioctl_daemon_receive(sc,
+		    (struct iscsi_daemon_receive *)arg);
+		break;
+	case ISCSIDCLOSE:
+		error = iscsi_ioctl_daemon_close(sc,
+		    (struct iscsi_daemon_close *)arg);
+		break;
+#endif /* ICL_KERNEL_PROXY */
+	case ISCSISADD:
+		error = iscsi_ioctl_session_add(sc,
+		    (struct iscsi_session_add *)arg);
+		break;
+	case ISCSISREMOVE:
+		error = iscsi_ioctl_session_remove(sc,
+		    (struct iscsi_session_remove *)arg);
+		break;
+	case ISCSISLIST:
+		error = iscsi_ioctl_session_list(sc,
+		    (struct iscsi_session_list *)arg);
+		break;
+	default:
+		error = EINVAL;
+		break;
+	}
+
+	return (error);
+}
+
+/*
+ * Encode a LUN number into the eight-byte form put into PDU headers.
+ *
+ * The bytes are laid out in memory order and returned packed into a
+ * uint64_t, so the result is meant to be stored as is, without any byte
+ * swapping.  LUNs below 256 use peripheral device addressing, LUNs below
+ * 16384 use flat space addressing, anything else uses extended flat space
+ * addressing with the three low-order bytes of the LUN.
+ */
+static uint64_t
+iscsi_encode_lun(uint32_t lun)
+{
+	uint8_t bytes[8] = { 0 };
+	uint64_t packed;
+
+	if (lun >= 16384) {
+		/* Extended flat space addressing. */
+		bytes[0] = 0xd2;
+		bytes[1] = lun >> 16;
+		bytes[2] = lun >> 8;
+		bytes[3] = lun;
+	} else if (lun >= 256) {
+		/* Flat space addressing. */
+		bytes[0] = 0x40 | ((lun >> 8) & 0x3f);
+		bytes[1] = lun & 0xff;
+	} else {
+		/* Peripheral device addressing. */
+		bytes[1] = lun;
+	}
+
+	memcpy(&packed, bytes, sizeof(packed));
+	return (packed);
+}
+
+/*
+ * Look up the outstanding command with the given Initiator Task Tag.
+ *
+ * Returns the entry, or NULL when the session has none with that tag.
+ * The session lock must be held.
+ */
+static struct iscsi_outstanding *
+iscsi_outstanding_find(struct iscsi_session *is, uint32_t initiator_task_tag)
+{
+	struct iscsi_outstanding *io;
+
+	ISCSI_SESSION_LOCK_ASSERT(is);
+
+	TAILQ_FOREACH(io, &is->is_outstanding, io_next) {
+		if (initiator_task_tag == io->io_initiator_task_tag)
+			break;
+	}
+
+	/* The iterator is NULL when the list ran out without a match. */
+	return (io);
+}
+
+/*
+ * Start tracking a command: allocate an outstanding entry tying the
+ * Initiator Task Tag to its CCB and append it to the session's list.
+ *
+ * Returns 0 on success, or ENOMEM when the entry cannot be allocated.
+ * The tag must not be in use already.  The session lock must be held.
+ */
+static int
+iscsi_outstanding_add(struct iscsi_session *is,
+    uint32_t initiator_task_tag, union ccb *ccb)
+{
+	struct iscsi_outstanding *io;
+
+	ISCSI_SESSION_LOCK_ASSERT(is);
+
+	KASSERT(iscsi_outstanding_find(is, initiator_task_tag) == NULL,
+	    ("initiator_task_tag 0x%x already added", initiator_task_tag));
+
+	io = uma_zalloc(iscsi_outstanding_zone, M_NOWAIT | M_ZERO);
+	if (io != NULL) {
+		io->io_ccb = ccb;
+		io->io_initiator_task_tag = initiator_task_tag;
+		TAILQ_INSERT_TAIL(&is->is_outstanding, io, io_next);
+		return (0);
+	}
+
+	ISCSI_SESSION_WARN(is, "failed to allocate %zd bytes", sizeof(*io));
+	return (ENOMEM);
+}
+
+/*
+ * Stop tracking a command: unlink its outstanding entry from the session
+ * and give the entry back to its zone.  The CCB it points to is left
+ * alone.  The session lock must be held.
+ */
+static void
+iscsi_outstanding_remove(struct iscsi_session *is, struct iscsi_outstanding *io)
+{
+
+	ISCSI_SESSION_LOCK_ASSERT(is);
+
+	/* Unlink first; the entry must not be reachable once it is freed. */
+	TAILQ_REMOVE(&is->is_outstanding, io, io_next);
+	uma_zfree(iscsi_outstanding_zone, io);
+}
+
+/*
+ * Handle an XPT_SCSI_IO CCB: build a SCSI Command PDU for it, register the
+ * CCB as outstanding under a fresh Initiator Task Tag, optionally attach
+ * immediate data, and queue the PDU on the session.
+ *
+ * All allocations are M_NOWAIT and the session lock must be held.  When
+ * the command cannot be sent, the device queue is frozen (unless the CCB
+ * is already flagged CAM_DEV_QFRZN) and the CCB is completed with
+ * CAM_DEV_QFRZN plus:
+ *   - CAM_REQ_ABORTED   if the session is still in the login phase;
+ *   - CAM_RESRC_UNAVAIL if the PDU, the outstanding entry, or the
+ *     immediate-data buffer could not be allocated.
+ * On every failure path the PDU and the outstanding entry are released,
+ * so no reference to the completed CCB is left behind.
+ */
+static void
+iscsi_action_scsiio(struct iscsi_session *is, union ccb *ccb)
+{
+	struct icl_pdu *request;
+	struct iscsi_bhs_scsi_command *bhssc;
+	struct iscsi_outstanding *io;
+	struct ccb_scsiio *csio;
+	uint32_t initiator_task_tag, status;
+	size_t len;
+	int error;
+
+	ISCSI_SESSION_LOCK_ASSERT(is);
+
+	/* Nothing to free yet; the "fail" path checks this. */
+	request = NULL;
+
+#if 0
+	KASSERT(is->is_login_phase == false, ("%s called during Login Phase", __func__));
+#else
+	if (is->is_login_phase) {
+		ISCSI_SESSION_DEBUG(is, "called during login phase");
+		status = CAM_REQ_ABORTED;
+		goto fail;
+	}
+#endif
+
+	request = icl_pdu_new_bhs(is->is_conn, M_NOWAIT);
+	if (request == NULL) {
+		status = CAM_RESRC_UNAVAIL;
+		goto fail;
+	}
+
+	csio = &ccb->csio;
+	bhssc = (struct iscsi_bhs_scsi_command *)request->ip_bhs;
+	bhssc->bhssc_opcode = ISCSI_BHS_OPCODE_SCSI_COMMAND;
+
+	/*
+	 * The flags are only ever OR-ed in.
+	 * NOTE(review): this assumes icl_pdu_new_bhs() hands back a zeroed
+	 * header - confirm.
+	 */
+	bhssc->bhssc_flags |= BHSSC_FLAGS_F;
+	switch (csio->ccb_h.flags & CAM_DIR_MASK) {
+	case CAM_DIR_IN:
+		bhssc->bhssc_flags |= BHSSC_FLAGS_R;
+		break;
+	case CAM_DIR_OUT:
+		bhssc->bhssc_flags |= BHSSC_FLAGS_W;
+		break;
+	default:
+		/* Any other direction sets neither R nor W. */
+		break;
+	}
+
+	/*
+	 * The task attribute is a small integer in the low bits of the
+	 * flags byte (BHSSC_FLAGS_ATTR), not a bit mask; exactly one value
+	 * is applied.  Unknown tag actions fall back to SIMPLE.
+	 */
+	switch (csio->tag_action) {
+	case MSG_HEAD_OF_Q_TAG:
+		bhssc->bhssc_flags |= BHSSC_FLAGS_ATTR_HOQ;
+		break;
+	case MSG_ORDERED_Q_TAG:
+		bhssc->bhssc_flags |= BHSSC_FLAGS_ATTR_ORDERED;
+		break;
+	case MSG_ACA_TASK:
+		bhssc->bhssc_flags |= BHSSC_FLAGS_ATTR_ACA;
+		break;
+	case CAM_TAG_ACTION_NONE:
+	case MSG_SIMPLE_Q_TAG:
+	default:
+		bhssc->bhssc_flags |= BHSSC_FLAGS_ATTR_SIMPLE;
+		break;
+	}
+
+	bhssc->bhssc_lun = iscsi_encode_lun(csio->ccb_h.target_lun);
+
+	/*
+	 * Allocate the next Initiator Task Tag.  0xffffffff is reserved by
+	 * the iSCSI specification, so skip it when the counter wraps.  The
+	 * tag is kept in a local because "bhssc" points into the PDU and
+	 * becomes invalid once the PDU is freed.
+	 */
+	initiator_task_tag = is->is_initiator_task_tag++;
+	if (initiator_task_tag == 0xffffffff)
+		initiator_task_tag = is->is_initiator_task_tag++;
+	bhssc->bhssc_initiator_task_tag = initiator_task_tag;
+
+	bhssc->bhssc_expected_data_transfer_length = htonl(csio->dxfer_len);
+	KASSERT(csio->cdb_len <= sizeof(bhssc->bhssc_cdb),
+	    ("unsupported CDB size %zd", (size_t)csio->cdb_len));
+
+	if (csio->ccb_h.flags & CAM_CDB_POINTER)
+		memcpy(&bhssc->bhssc_cdb, csio->cdb_io.cdb_ptr, csio->cdb_len);
+	else
+		memcpy(&bhssc->bhssc_cdb, csio->cdb_io.cdb_bytes, csio->cdb_len);
+
+	error = iscsi_outstanding_add(is, initiator_task_tag, ccb);
+	if (error != 0) {
+		status = CAM_RESRC_UNAVAIL;
+		goto fail;
+	}
+
+	if (is->is_immediate_data &&
+	    (csio->ccb_h.flags & CAM_DIR_MASK) == CAM_DIR_OUT) {
+		/* Immediate data is capped at the first burst length. */
+		len = csio->dxfer_len;
+		if (len > is->is_first_burst_length) {
+			ISCSI_SESSION_DEBUG(is, "len %zd -> %zd", len, is->is_first_burst_length);
+			len = is->is_first_burst_length;
+		}
+
+		error = icl_pdu_append_data(request, csio->data_ptr, len, M_NOWAIT);
+		if (error != 0) {
+			/*
+			 * The CCB is about to be completed, so the entry
+			 * registered above must go; otherwise it would leak
+			 * and keep pointing at a CCB we no longer own.
+			 */
+			io = iscsi_outstanding_find(is, initiator_task_tag);
+			KASSERT(io != NULL,
+			    ("%s: outstanding entry 0x%x not found",
+			    __func__, initiator_task_tag));
+			iscsi_outstanding_remove(is, io);
+			status = CAM_RESRC_UNAVAIL;
+			goto fail;
+		}
+	}
+	iscsi_pdu_queue_locked(request);
+	return;
+
+fail:
+	/* Common failure epilogue: drop the PDU, freeze, complete the CCB. */
+	if (request != NULL)
+		icl_pdu_free(request);
+	if ((ccb->ccb_h.status & CAM_DEV_QFRZN) == 0) {
+		xpt_freeze_devq(ccb->ccb_h.path, 1);
+		ISCSI_SESSION_DEBUG(is, "freezing devq");
+	}
+	ccb->ccb_h.status = status | CAM_DEV_QFRZN;
+	xpt_done(ccb);
+}
+
+/*
+ * CAM SIM action routine: dispatch a CCB by function code.
+ *
+ * XPT_SCSI_IO is handed to iscsi_action_scsiio(), which completes or
+ * queues the CCB itself.  XPT_PATH_INQ and XPT_CALC_GEOMETRY are answered
+ * inline.  Everything else is completed with CAM_FUNC_NOTAVAIL.  While
+ * the session is terminating, every CCB is completed with
+ * CAM_DEV_NOT_THERE.  The session lock must be held.
+ */
+static void
+iscsi_action(struct cam_sim *sim, union ccb *ccb)
+{
+	struct iscsi_session *is;
+	struct ccb_pathinq *inq;
+
+	is = cam_sim_softc(sim);
+
+	ISCSI_SESSION_LOCK_ASSERT(is);
+
+	if (is->is_terminating) {
+		ISCSI_SESSION_DEBUG(is, "called during termination");
+		ccb->ccb_h.status = CAM_DEV_NOT_THERE;
+		xpt_done(ccb);
+		return;
+	}
+
+	/* SCSI I/O never reaches the common xpt_done() below. */
+	if (ccb->ccb_h.func_code == XPT_SCSI_IO) {
+		iscsi_action_scsiio(is, ccb);
+		return;
+	}
+
+	switch (ccb->ccb_h.func_code) {
+	case XPT_PATH_INQ:
+		inq = &ccb->cpi;
+
+		/* Identification strings and bus coordinates. */
+		strncpy(inq->sim_vid, "FreeBSD", SIM_IDLEN);
+		strncpy(inq->hba_vid, "iSCSI", HBA_IDLEN);
+		strncpy(inq->dev_name, cam_sim_name(sim), DEV_IDLEN);
+		inq->unit_number = cam_sim_unit(sim);
+		inq->bus_id = cam_sim_bus(sim);
+
+		/* Capabilities and addressing limits. */
+		inq->version_num = 1;
+		inq->hba_inquiry = PI_TAG_ABLE;
+		inq->target_sprt = 0;
+		inq->hba_misc = 0;
+		inq->hba_eng_cnt = 0;
+		inq->max_target = 0;
+		inq->max_lun = 255;
+		inq->initiator_id = 64; /* XXX */
+		inq->maxio = MAXPHYS;
+
+		/* Transport and protocol description. */
+		inq->base_transfer_speed = 150000; /* XXX */
+		inq->transport = XPORT_ISCSI;
+		inq->transport_version = 0;
+		inq->protocol = PROTO_SCSI;
+		inq->protocol_version = SCSI_REV_SPC3;
+
+		inq->ccb_h.status = CAM_REQ_CMP;
+		break;
+	case XPT_CALC_GEOMETRY:
+		cam_calc_geometry(&ccb->ccg, /*extended*/1);
+		ccb->ccb_h.status = CAM_REQ_CMP;
+		break;
+#if 0
+	/*
+	 * XXX: What's the point?
+	 */
+	case XPT_RESET_BUS:
+	case XPT_ABORT:
+	case XPT_TERM_IO:
+		ISCSI_SESSION_DEBUG(is, "faking success for reset, abort, or term_io");
+		ccb->ccb_h.status = CAM_REQ_CMP;
+		break;
+#endif
+	default:
+#if 0
+		ISCSI_SESSION_DEBUG(is, "got unsupported code 0x%x", ccb->ccb_h.func_code);
+#endif
+		ccb->ccb_h.status = CAM_FUNC_NOTAVAIL;
+		break;
+	}
+	xpt_done(ccb);
+}
+
+/*
+ * CAM SIM poll routine.  Polling is not implemented for this SIM; the
+ * body consists solely of an assertion that always fails.
+ */
+static void
+iscsi_poll(struct cam_sim *sim)
+{
+
+	KASSERT(0, ("%s: you're not supposed to be here", __func__));
+}
+
+/*
+ * Shutdown event handler (registered for shutdown_post_sync by
+ * iscsi_load()): ask every session on the softc's list to terminate.
+ * The list is walked with sc_lock held shared.
+ */
+static void
+iscsi_shutdown(struct iscsi_softc *sc)
+{
+	struct iscsi_session *session;
+
+	ISCSI_DEBUG("removing all sessions due to shutdown");
+
+	sx_slock(&sc->sc_lock);
+	TAILQ_FOREACH(session, &sc->sc_sessions, is_next) {
+		iscsi_session_terminate(session);
+	}
+	sx_sunlock(&sc->sc_lock);
+}
+
+/*
+ * MOD_LOAD handler: allocate and initialize the global softc, create the
+ * UMA zone for outstanding-command entries, create the "iscsi" device
+ * node and register the shutdown handler.
+ *
+ * Returns 0 on success.  If the device node cannot be created, everything
+ * set up so far is torn down again and the make_dev_p() error is returned.
+ */
+static int
+iscsi_load(void)
+{
+	int error;
+
+	sc = malloc(sizeof(*sc), M_ISCSI, M_ZERO | M_WAITOK);
+	TAILQ_INIT(&sc->sc_sessions);
+	sx_init(&sc->sc_lock, "iscsi");
+	cv_init(&sc->sc_cv, "iscsi_cv");
+
+	iscsi_outstanding_zone = uma_zcreate("iscsi_outstanding",
+	    sizeof(struct iscsi_outstanding), NULL, NULL, NULL, NULL,
+	    UMA_ALIGN_PTR, UMA_ZONE_NOFREE);
+
+	error = make_dev_p(MAKEDEV_CHECKNAME, &sc->sc_cdev, &iscsi_cdevsw,
+	    NULL, UID_ROOT, GID_WHEEL, 0600, "iscsi");
+	if (error == 0) {
+		sc->sc_cdev->si_drv1 = sc;
+
+		/*
+		 * XXX: For some reason this doesn't do its job; active
+		 *	sessions still hang out there after final sync,
+		 *	making the reboot effectively hang.
+		 */
+		sc->sc_shutdown_eh = EVENTHANDLER_REGISTER(shutdown_post_sync,
+		    iscsi_shutdown, sc, SHUTDOWN_PRI_DEFAULT);
+
+		return (0);
+	}
+
+	/* No device node: undo the initialization above. */
+	ISCSI_WARN("failed to create device node, error %d", error);
+	sx_destroy(&sc->sc_lock);
+	cv_destroy(&sc->sc_cv);
+	uma_zdestroy(iscsi_outstanding_zone);
+	free(sc, M_ISCSI);
+	return (error);
+}
+
+/*
+ * MOD_UNLOAD handler: remove the device node, deregister the shutdown
+ * handler, terminate all sessions and wait on sc_cv until the session
+ * list has drained, then release the zone, the locks and the softc.
+ * Always returns 0.
+ *
+ * XXX: kldunload hangs on "devdrn".
+ */
+static int
+iscsi_unload(void)
+{
+	struct iscsi_session *session, *next;
+
+	ISCSI_DEBUG("removing device node");
+	destroy_dev(sc->sc_cdev);
+	ISCSI_DEBUG("device node removed");
+
+	EVENTHANDLER_DEREGISTER(shutdown_post_sync, sc->sc_shutdown_eh);
+
+	sx_slock(&sc->sc_lock);
+	TAILQ_FOREACH_SAFE(session, &sc->sc_sessions, is_next, next) {
+		iscsi_session_terminate(session);
+	}
+	/* cv_wait() drops sc_lock while sleeping and retakes it after. */
+	while (!TAILQ_EMPTY(&sc->sc_sessions)) {
+		ISCSI_DEBUG("waiting for sessions to terminate");
+		cv_wait(&sc->sc_cv, &sc->sc_lock);
+	}
+	ISCSI_DEBUG("all sessions terminated");
+	sx_sunlock(&sc->sc_lock);
+
+	uma_zdestroy(iscsi_outstanding_zone);
+	sx_destroy(&sc->sc_lock);
+	cv_destroy(&sc->sc_cv);
+	free(sc, M_ISCSI);
+	return (0);
+}
+
+/*
+ * MOD_QUIESCE handler: report whether the module is idle.  Returns EBUSY
+ * while at least one session exists, 0 otherwise.  The session list is
+ * inspected with sc_lock held shared.
+ */
+static int
+iscsi_quiesce(void)
+{
+	int error;
+
+	sx_slock(&sc->sc_lock);
+	error = TAILQ_EMPTY(&sc->sc_sessions) ? 0 : EBUSY;
+	sx_sunlock(&sc->sc_lock);
+
+	return (error);
+}
+
+/*
+ * Module event handler: route load, unload and quiesce events to their
+ * handlers and return the handler's result.  Any other event yields
+ * EINVAL.  "mod" and "arg" are unused.
+ */
+static int
+iscsi_modevent(module_t mod, int what, void *arg)
+{
+
+	switch (what) {
+	case MOD_LOAD:
+		return (iscsi_load());
+	case MOD_UNLOAD:
+		return (iscsi_unload());
+	case MOD_QUIESCE:
+		return (iscsi_quiesce());
+	default:
+		return (EINVAL);
+	}
+}
+
+/*
+ * Module glue: register the "iscsi" module with iscsi_modevent() as its
+ * event handler, and declare its dependencies on the cam and icl modules.
+ */
+moduledata_t iscsi_data = {
+	"iscsi",		/* module name */
+	iscsi_modevent,		/* event handler */
+	NULL			/* no private data */
+};
+
+DECLARE_MODULE(iscsi, iscsi_data, SI_SUB_DRIVERS, SI_ORDER_MIDDLE);
+MODULE_DEPEND(iscsi, cam, 1, 1, 1);
+MODULE_DEPEND(iscsi, icl, 1, 1, 1);
diff --git a/sys/dev/iscsi/iscsi.h b/sys/dev/iscsi/iscsi.h
new file mode 100644
index 000000000000..dd78852b4716
--- /dev/null
+++ b/sys/dev/iscsi/iscsi.h
@@ -0,0 +1,135 @@
+/*-
+ * Copyright (c) 2012 The FreeBSD Foundation
+ * All rights reserved.
+ *
+ * This software was developed by Edward Tomasz Napierala under sponsorship
+ * from the FreeBSD Foundation.
+ *
+ * Redistribution and use in source and binary forms, with or without
+ * modification, are permitted provided that the following conditions
+ * are met:
+ * 1. Redistributions of source code must retain the above copyright
+ * notice, this list of conditions and the following disclaimer.
+ * 2. Redistributions in binary form must reproduce the above copyright
+ * notice, this list of conditions and the following disclaimer in the
+ * documentation and/or other materials provided with the distribution.
+ *
+ * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
+ * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
+ * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
+ * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
+ * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
+ * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
+ * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
+ * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
+ * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
+ * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
+ * SUCH DAMAGE.
+ *
+ * $FreeBSD$
+ */
+
+#ifndef ISCSI_H
+#define ISCSI_H
+
+struct iscsi_softc;
+struct icl_conn;
+
+#define ISCSI_NAME_LEN 224 /* 223 bytes, by RFC 3720, + '\0' */
+#define ISCSI_ADDR_LEN 47 /* INET6_ADDRSTRLEN + '\0' */
+#define ISCSI_SECRET_LEN 17 /* 16 + '\0' */
+
+/*
+ * One entry on a session's is_outstanding list.  It ties an Initiator
+ * Task Tag to the CAM CCB the command was issued for, so that the CCB can
+ * be found again from the tag.
+ */
+struct iscsi_outstanding {
+ /* Linkage on iscsi_session::is_outstanding. */
+ TAILQ_ENTRY(iscsi_outstanding) io_next;
+ /* CCB this command belongs to. */
+ union ccb *io_ccb;
+ /* NOTE(review): presumably the number of data bytes received so far - confirm. */
+ size_t io_received;
+ /* Tag the command was sent with; the lookup key. */
+ uint32_t io_initiator_task_tag;
+ /* NOTE(review): presumably the next expected DataSN for this command - confirm. */
+ uint32_t io_datasn;
+};
+
+/*
+ * Per-session state of the initiator.
+ *
+ * This structure embeds struct iscsi_session_conf by value and sizes two
+ * arrays with ISCSI_ALIAS_LEN and ISCSI_REASON_LEN, none of which are
+ * defined in this header; iscsi_ioctl.h must be included before it.
+ */
+struct iscsi_session {
+	/* Linkage on iscsi_softc::sc_sessions. */
+	TAILQ_ENTRY(iscsi_session)	is_next;
+
+	struct icl_conn			*is_conn;
+	struct mtx			is_lock;
+
+	uint32_t			is_statsn;
+	uint32_t			is_cmdsn;
+	uint32_t			is_expcmdsn;
+	uint32_t			is_maxcmdsn;
+	/* Next Initiator Task Tag to hand out for a new command. */
+	uint32_t			is_initiator_task_tag;
+	int				is_header_digest;
+	int				is_data_digest;
+	int				is_initial_r2t;
+	size_t				is_max_burst_length;
+	/* Upper bound on the immediate data attached to a command. */
+	size_t				is_first_burst_length;
+	uint8_t				is_isid[6];
+	/* Whether write commands may carry immediate data. */
+	bool				is_immediate_data;
+	size_t				is_max_data_segment_length;
+	char				is_target_alias[ISCSI_ALIAS_LEN];
+
+	/* Commands sent and not yet completed, keyed by task tag. */
+	TAILQ_HEAD(, iscsi_outstanding)	is_outstanding;
+	TAILQ_HEAD(, icl_pdu)		is_postponed;
+
+	struct callout			is_callout;
+	unsigned int			is_timeout;
+
+	/*
+	 * XXX: This could be rewritten using a single variable,
+	 *	but somehow it results in uglier code.
+	 */
+	/*
+	 * We're waiting for iscsid(8); after iscsid_timeout
+	 * expires, kernel will wake up an iscsid(8) to handle
+	 * the session.
+	 */
+	bool				is_waiting_for_iscsid;
+
+	/*
+	 * Some iscsid(8) instance is handling the session;
+	 * after login_timeout expires, kernel will wake up
+	 * another iscsid(8) to handle the session.
+	 */
+	bool				is_login_phase;
+
+	/*
+	 * We're in the process of removing the iSCSI session.
+	 */
+	bool				is_terminating;
+
+	/*
+	 * We're waiting for the maintenance thread to do some
+	 * reconnection tasks.
+	 */
+	bool				is_reconnecting;
+
+	bool				is_connected;
+
+	struct cam_devq			*is_devq;
+	struct cam_sim			*is_sim;
+	struct cam_path			*is_path;
+	struct cv			is_maintenance_cv;
+	struct iscsi_softc		*is_softc;
+	unsigned int			is_id;
+	struct iscsi_session_conf	is_conf;
+	bool				is_simq_frozen;
+
+	char				is_reason[ISCSI_REASON_LEN];
+
+#ifdef ICL_KERNEL_PROXY
+	struct cv			is_login_cv;
+	struct icl_pdu			*is_login_pdu;
+#endif
+};
+
+/*
+ * Driver-wide state.
+ */
+struct iscsi_softc {
+ device_t sc_dev;
+ /* Held while the session list is walked or inspected. */
+ struct sx sc_lock;
+ /* The "iscsi" control device node. */
+ struct cdev *sc_cdev;
+ /* All sessions, linked through iscsi_session::is_next. */
+ TAILQ_HEAD(, iscsi_session) sc_sessions;
+ /* Waited on, with sc_lock, until the session list becomes empty. */
+ struct cv sc_cv;
+ /* NOTE(review): presumably the last id assigned to a session - confirm. */
+ unsigned int sc_last_session_id;
+ /* Tag of the registered shutdown_post_sync event handler. */
+ eventhandler_tag sc_shutdown_eh;
+};
+
+#endif /* !ISCSI_H */
diff --git a/sys/dev/iscsi/iscsi_ioctl.h b/sys/dev/iscsi/iscsi_ioctl.h
new file mode 100644
index 000000000000..9e278445d815
--- /dev/null
+++ b/sys/dev/iscsi/iscsi_ioctl.h
@@ -0,0 +1,201 @@
+/*-
+ * Copyright (c) 2012 The FreeBSD Foundation
+ * All rights reserved.
+ *
+ * This software was developed by Edward Tomasz Napierala under sponsorship
+ * from the FreeBSD Foundation.
+ *
+ * Redistribution and use in source and binary forms, with or without
+ * modification, are permitted provided that the following conditions
+ * are met:
+ * 1. Redistributions of source code must retain the above copyright
+ * notice, this list of conditions and the following disclaimer.
+ * 2. Redistributions in binary form must reproduce the above copyright
+ * notice, this list of conditions and the following disclaimer in the
+ * documentation and/or other materials provided with the distribution.
+ *
+ * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
+ * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
+ * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
+ * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
+ * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
+ * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
+ * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
+ * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
+ * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
+ * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
+ * SUCH DAMAGE.
+ *
+ * $FreeBSD$
+ */
+
+#ifndef ISCSI_IOCTL_H
+#define ISCSI_IOCTL_H
+
+#ifdef ICL_KERNEL_PROXY
+#include <sys/socket.h>
+#endif
+
+#define ISCSI_PATH "/dev/iscsi"
+#define ISCSI_MAX_DATA_SEGMENT_LENGTH (128 * 1024)
+
+#define ISCSI_NAME_LEN 224 /* 223 bytes, by RFC 3720, + '\0' */
+#define ISCSI_ADDR_LEN 47 /* INET6_ADDRSTRLEN + '\0' */
+#define ISCSI_ALIAS_LEN 256 /* XXX: Where did it come from? */
+#define ISCSI_SECRET_LEN 17 /* 16 + '\0' */
+#define ISCSI_REASON_LEN 32
+
+#define ISCSI_DIGEST_NONE 0
+#define ISCSI_DIGEST_CRC32C 1
+
+/*
+ * Session configuration, set when adding the session.
+ *
+ * This structure is embedded by value in the ioctl argument structures
+ * below, so its layout is part of the ioctl interface.  All strings
+ * are fixed-size buffers whose sizes include room for the terminating
+ * '\0' (see the ISCSI_*_LEN definitions above).
+ */
+struct iscsi_session_conf {
+ char isc_initiator[ISCSI_NAME_LEN];
+ char isc_initiator_addr[ISCSI_ADDR_LEN];
+ char isc_initiator_alias[ISCSI_ALIAS_LEN];
+ char isc_target[ISCSI_NAME_LEN];
+ char isc_target_addr[ISCSI_ADDR_LEN];
+ char isc_user[ISCSI_NAME_LEN];
+ char isc_secret[ISCSI_SECRET_LEN];
+ char isc_mutual_user[ISCSI_NAME_LEN];
+ char isc_mutual_secret[ISCSI_SECRET_LEN];
+ int isc_discovery;
+ /* NOTE(review): presumably one of the ISCSI_DIGEST_* values - confirm. */
+ int isc_header_digest;
+ int isc_data_digest;
+ int isc_iser;
+ /* Unused; reserves room for future fields. */
+ int isc_spare[4];
+};
+
+/*
+ * Session state, negotiated by iscsid(8) and queried by iscsictl(8).
+ *
+ * An array of these is what struct iscsi_session_list::isl_pstates
+ * points at.
+ */
+struct iscsi_session_state {
+ /* Configuration the session was added with. */
+ struct iscsi_session_conf iss_conf;
+ unsigned int iss_id;
+ char iss_target_alias[ISCSI_ALIAS_LEN];
+ int iss_header_digest;
+ int iss_data_digest;
+ int iss_max_data_segment_length;
+ int iss_immediate_data;
+ int iss_connected;
+ char iss_reason[ISCSI_REASON_LEN];
+ /* Unused; reserves room for future fields. */
+ int iss_spare[4];
+};
+
+/*
+ * For use with iscsid(8).
+ */
+
+/*
+ * Argument of the ISCSIDWAIT ioctl.  The ioctl is declared _IOR, i.e.
+ * the structure is filled in by the kernel and copied out to iscsid(8).
+ */
+struct iscsi_daemon_request {
+ unsigned int idr_session_id;
+ struct iscsi_session_conf idr_conf;
+ /* Unused; reserves room for future fields. */
+ int idr_spare[4];
+};
+
+/*
+ * Argument of the ISCSIDHANDOFF ioctl (declared _IOW): the parameters
+ * iscsid(8) passes to the kernel after it has performed the Login Phase.
+ */
+struct iscsi_daemon_handoff {
+ unsigned int idh_session_id;
+ /*
+ * Socket file descriptor being handed to the kernel; set to 0 when
+ * ICL_KERNEL_PROXY is in use.
+ */
+ int idh_socket;
+ char idh_target_alias[ISCSI_ALIAS_LEN];
+ uint8_t idh_isid[6];
+ uint32_t idh_statsn;
+ int idh_header_digest;
+ int idh_data_digest;
+ int idh_initial_r2t;
+ int idh_immediate_data;
+ size_t idh_max_data_segment_length;
+ size_t idh_max_burst_length;
+ size_t idh_first_burst_length;
+};
+
+/*
+ * Argument of the ISCSIDFAIL ioctl (declared _IOW): identifies a session
+ * and carries a reason string of at most ISCSI_REASON_LEN bytes.
+ */
+struct iscsi_daemon_fail {
+ unsigned int idf_session_id;
+ char idf_reason[ISCSI_REASON_LEN];
+};
+
+#define ISCSIDWAIT _IOR('I', 0x01, struct iscsi_daemon_request)
+#define ISCSIDHANDOFF _IOW('I', 0x02, struct iscsi_daemon_handoff)
+#define ISCSIDFAIL _IOW('I', 0x03, struct iscsi_daemon_fail)
+
+#ifdef ICL_KERNEL_PROXY
+
+/*
+ * When ICL_KERNEL_PROXY is not defined, iscsid(8) is responsible
+ * for creating the socket, connecting, performing the Login Phase using
+ * the socket in the usual userspace way, and then passing the socket file
+ * descriptor to the kernel part using ISCSIDHANDOFF.
+ *
+ * When ICL_KERNEL_PROXY is defined, iscsid(8) creates the session
+ * using ISCSIDCONNECT, performs the Login Phase using ISCSIDSEND/ISCSIDRECEIVE
+ * instead of read(2)/write(2), and then calls ISCSIDHANDOFF with
+ * idh_socket set to 0.
+ *
+ * The purpose of ICL_KERNEL_PROXY is to work around the fact that,
+ * at this time, it's not possible to do iWARP (RDMA) in userspace.
+ */
+
+/*
+ * Argument of the ISCSIDCONNECT ioctl (only with ICL_KERNEL_PROXY).
+ * The two address members are pointers, each paired with a length.
+ */
+struct iscsi_daemon_connect {
+ int idc_session_id;
+ int idc_iser;
+ /* NOTE(review): presumably the socket(2) domain/type/protocol triple - confirm. */
+ int idc_domain;
+ int idc_socktype;
+ int idc_protocol;
+ struct sockaddr *idc_from_addr;
+ socklen_t idc_from_addrlen;
+ struct sockaddr *idc_to_addr;
+ socklen_t idc_to_addrlen;
+};
+
+/*
+ * Argument of the ISCSIDSEND ioctl (only with ICL_KERNEL_PROXY): a PDU
+ * described as a BHS pointer plus a data segment pointer and length.
+ */
+struct iscsi_daemon_send {
+ int ids_session_id;
+ void *ids_bhs;
+ /* Unused spare members. */
+ size_t ids_spare;
+ void *ids_spare2;
+ size_t ids_data_segment_len;
+ void *ids_data_segment;
+};
+
+/*
+ * Argument of the ISCSIDRECEIVE ioctl (only with ICL_KERNEL_PROXY); same
+ * shape as struct iscsi_daemon_send.  Note that the members use the
+ * "idr_" prefix, which struct iscsi_daemon_request uses as well.
+ */
+struct iscsi_daemon_receive {
+ int idr_session_id;
+ void *idr_bhs;
+ /* Unused spare members. */
+ size_t idr_spare;
+ void *idr_spare2;
+ size_t idr_data_segment_len;
+ void *idr_data_segment;
+};
+
+/*
+ * Argument of the ISCSIDCLOSE ioctl (only with ICL_KERNEL_PROXY).  The
+ * member uses the "idc_" prefix, shared with struct iscsi_daemon_connect.
+ */
+struct iscsi_daemon_close {
+ int idc_session_id;
+};
+
+#define ISCSIDCONNECT _IOWR('I', 0x04, struct iscsi_daemon_connect)
+#define ISCSIDSEND _IOWR('I', 0x05, struct iscsi_daemon_send)
+#define ISCSIDRECEIVE _IOWR('I', 0x06, struct iscsi_daemon_receive)
+#define ISCSIDCLOSE _IOWR('I', 0x07, struct iscsi_daemon_close)
+
+#endif /* ICL_KERNEL_PROXY */
+
+/*
+ * For use with iscsictl(8).
+ */
+
+/*
+ * Argument of the ISCSISADD ioctl (declared _IOW): the configuration of
+ * the session to add.
+ */
+struct iscsi_session_add {
+ struct iscsi_session_conf isa_conf;
+};
+
+/*
+ * Argument of the ISCSISREMOVE ioctl (declared _IOW).
+ * NOTE(review): how the id and the configuration are combined to select
+ * the session(s) to remove is not visible here - see the ioctl handler.
+ */
+struct iscsi_session_remove {
+ unsigned int isr_session_id;
+ struct iscsi_session_conf isr_conf;
+};
+
+/*
+ * Argument of the ISCSISLIST ioctl (declared _IOWR): an entry count and
+ * a pointer to an array of struct iscsi_session_state.
+ * NOTE(review): presumably isl_nentries is the array capacity on input
+ * and the number of sessions on output - confirm against the handler.
+ */
+struct iscsi_session_list {
+ unsigned int isl_nentries;
+ struct iscsi_session_state *isl_pstates;
+};
+
+#define ISCSISADD _IOW('I', 0x11, struct iscsi_session_add)
+#define ISCSISREMOVE _IOW('I', 0x12, struct iscsi_session_remove)
+#define ISCSISLIST _IOWR('I', 0x13, struct iscsi_session_list)
+
+#endif /* !ISCSI_IOCTL_H */
diff --git a/sys/dev/iscsi/iscsi_proto.h b/sys/dev/iscsi/iscsi_proto.h
new file mode 100644
index 000000000000..97d73a7a074e
--- /dev/null
+++ b/sys/dev/iscsi/iscsi_proto.h
@@ -0,0 +1,439 @@
+/*-
+ * Copyright (c) 2012 The FreeBSD Foundation
+ * All rights reserved.
+ *
+ * This software was developed by Edward Tomasz Napierala under sponsorship
+ * from the FreeBSD Foundation.
+ *
+ * Redistribution and use in source and binary forms, with or without
+ * modification, are permitted provided that the following conditions
+ * are met:
+ * 1. Redistributions of source code must retain the above copyright
+ * notice, this list of conditions and the following disclaimer.
+ * 2. Redistributions in binary form must reproduce the above copyright
+ * notice, this list of conditions and the following disclaimer in the
+ * documentation and/or other materials provided with the distribution.
+ *
+ * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
+ * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
+ * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
+ * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
+ * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
+ * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
+ * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
+ * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
+ * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
+ * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
+ * SUCH DAMAGE.
+ *
+ * $FreeBSD$
+ */
+
+#ifndef ISCSI_PROTO_H
+#define ISCSI_PROTO_H
+
+#ifndef CTASSERT
+#define CTASSERT(x) _CTASSERT(x, __LINE__)
+#define _CTASSERT(x, y) __CTASSERT(x, y)
+#define __CTASSERT(x, y) typedef char __assert_ ## y [(x) ? 1 : -1]
+#endif
+
+#define ISCSI_BHS_SIZE 48
+#define ISCSI_HEADER_DIGEST_SIZE 4
+#define ISCSI_DATA_DIGEST_SIZE 4
+
+#define ISCSI_BHS_OPCODE_IMMEDIATE 0x40
+
+#define ISCSI_BHS_OPCODE_NOP_OUT 0x00
+#define ISCSI_BHS_OPCODE_SCSI_COMMAND 0x01
+#define ISCSI_BHS_OPCODE_TASK_REQUEST 0x02
+#define ISCSI_BHS_OPCODE_LOGIN_REQUEST 0x03
+#define ISCSI_BHS_OPCODE_TEXT_REQUEST 0x04
+#define ISCSI_BHS_OPCODE_SCSI_DATA_OUT 0x05
+#define ISCSI_BHS_OPCODE_LOGOUT_REQUEST 0x06
+
+#define ISCSI_BHS_OPCODE_NOP_IN 0x20
+#define ISCSI_BHS_OPCODE_SCSI_RESPONSE 0x21
+#define ISCSI_BHS_OPCODE_TASK_RESPONSE 0x22
+#define ISCSI_BHS_OPCODE_LOGIN_RESPONSE 0x23
+#define ISCSI_BHS_OPCODE_TEXT_RESPONSE 0x24
+#define ISCSI_BHS_OPCODE_SCSI_DATA_IN 0x25
+#define ISCSI_BHS_OPCODE_LOGOUT_RESPONSE 0x26
+#define ISCSI_BHS_OPCODE_R2T 0x31
+#define ISCSI_BHS_OPCODE_ASYNC_MESSAGE 0x32
+#define ISCSI_BHS_OPCODE_REJECT 0x3f
+
+/*
+ * Generic view of the Basic Header Segment (BHS) that starts every PDU.
+ * Its size is asserted to be ISCSI_BHS_SIZE (48 bytes), as is the size
+ * of every PDU-specific structure in this file.
+ */
+struct iscsi_bhs {
+ uint8_t bhs_opcode;
+ uint8_t bhs_opcode_specific1[3];
+ uint8_t bhs_total_ahs_len;
+ /* 24-bit length, kept as three separate bytes. */
+ uint8_t bhs_data_segment_len[3];
+ uint64_t bhs_lun;
+ /*
+ * NOTE(review): "inititator" is a misspelling of "initiator"; left
+ * as is because the name may be referenced elsewhere.
+ */
+ uint8_t bhs_inititator_task_tag[4];
+ uint8_t bhs_opcode_specific4[28];
+};
+CTASSERT(sizeof(struct iscsi_bhs) == ISCSI_BHS_SIZE);
+
+#define BHSSC_FLAGS_F 0x80
+#define BHSSC_FLAGS_R 0x40
+#define BHSSC_FLAGS_W 0x20
+#define BHSSC_FLAGS_ATTR 0x07
+
+#define BHSSC_FLAGS_ATTR_UNTAGGED 0
+#define BHSSC_FLAGS_ATTR_SIMPLE 1
+#define BHSSC_FLAGS_ATTR_ORDERED 2
+#define BHSSC_FLAGS_ATTR_HOQ 3
+#define BHSSC_FLAGS_ATTR_ACA 4
+
+/*
+ * BHS layout of a SCSI Command PDU (ISCSI_BHS_OPCODE_SCSI_COMMAND).
+ * bhssc_flags combines the BHSSC_FLAGS_F/R/W bits with one of the
+ * BHSSC_FLAGS_ATTR_* values in the bits covered by BHSSC_FLAGS_ATTR.
+ */
+struct iscsi_bhs_scsi_command {
+ uint8_t bhssc_opcode;
+ uint8_t bhssc_flags;
+ uint8_t bhssc_reserved[2];
+ uint8_t bhssc_total_ahs_len;
+ uint8_t bhssc_data_segment_len[3];
+ uint64_t bhssc_lun;
+ uint32_t bhssc_initiator_task_tag;
+ /* The initiator stores this with htonl(), i.e. in network byte order. */
+ uint32_t bhssc_expected_data_transfer_length;
+ uint32_t bhssc_cmdsn;
+ uint32_t bhssc_expstatsn;
+ /* CDBs longer than 16 bytes do not fit in the BHS. */
+ uint8_t bhssc_cdb[16];
+};
+CTASSERT(sizeof(struct iscsi_bhs_scsi_command) == ISCSI_BHS_SIZE);
+
+#define BHSSR_FLAGS_RESIDUAL_UNDERFLOW 0x02
+#define BHSSR_FLAGS_RESIDUAL_OVERFLOW 0x04
+
+#define BHSSR_RESPONSE_COMMAND_COMPLETED 0x00
+
+/*
+ * BHS layout of a SCSI Response PDU (ISCSI_BHS_OPCODE_SCSI_RESPONSE).
+ * The BHSSR_FLAGS_* and BHSSR_RESPONSE_* values defined above apply to
+ * bhssr_flags and bhssr_response.
+ */
+struct iscsi_bhs_scsi_response {
+ uint8_t bhssr_opcode;
+ uint8_t bhssr_flags;
+ uint8_t bhssr_response;
+ uint8_t bhssr_status;
+ uint8_t bhssr_total_ahs_len;
+ uint8_t bhssr_data_segment_len[3];
+ uint64_t bhssr_reserved;
+ uint32_t bhssr_initiator_task_tag;
+ uint32_t bhssr_snack_tag;
+ uint32_t bhssr_statsn;
+ uint32_t bhssr_expcmdsn;
+ uint32_t bhssr_maxcmdsn;
+ uint32_t bhssr_expdatasn;
+ uint32_t bhssr_bidirectional_read_residual_count;
+ uint32_t bhssr_residual_count;
+};
+CTASSERT(sizeof(struct iscsi_bhs_scsi_response) == ISCSI_BHS_SIZE);
+
+#define BHSTMR_FUNCTION_ABORT_TASK 1
+#define BHSTMR_FUNCTION_ABORT_TASK_SET 2
+#define BHSTMR_FUNCTION_CLEAR_ACA 3
+#define BHSTMR_FUNCTION_CLEAR_TASK_SET 4
+#define BHSTMR_FUNCTION_LOGICAL_UNIT_RESET 5
+#define BHSTMR_FUNCTION_TARGET_WARM_RESET 6
+#define BHSTMR_FUNCTION_TARGET_COLD_RESET 7
+#define BHSTMR_FUNCTION_TASK_REASSIGN 8
+
+/*
+ * BHS layout of a Task Management Function Request PDU
+ * (ISCSI_BHS_OPCODE_TASK_REQUEST).  The BHSTMR_FUNCTION_* values defined
+ * above are the function codes.  The "bhstmr_" member prefix is shared
+ * with the response structure.
+ */
+struct iscsi_bhs_task_management_request {
+ uint8_t bhstmr_opcode;
+ uint8_t bhstmr_function;
+ uint8_t bhstmr_reserved[2];
+ uint8_t bhstmr_total_ahs_len;
+ uint8_t bhstmr_data_segment_len[3];
+ uint64_t bhstmr_lun;
+ uint32_t bhstmr_initiator_task_tag;
+ uint32_t bhstmr_referenced_task_tag;
+ uint32_t bhstmr_cmdsn;
+ uint32_t bhstmr_expstatsn;
+ uint32_t bhstmr_refcmdsn;
+ uint32_t bhstmr_expdatasn;
+ uint64_t bhstmr_reserved2;
+};
+CTASSERT(sizeof(struct iscsi_bhs_task_management_request) == ISCSI_BHS_SIZE);
+
+#define BHSTMR_RESPONSE_FUNCTION_COMPLETE 0
+#define BHSTMR_RESPONSE_FUNCTION_NOT_SUPPORTED 5
+
+/*
+ * BHS layout of a Task Management Function Response PDU
+ * (ISCSI_BHS_OPCODE_TASK_RESPONSE).  The BHSTMR_RESPONSE_* values defined
+ * above apply to bhstmr_response.  The "bhstmr_" member prefix is shared
+ * with the request structure.
+ */
+struct iscsi_bhs_task_management_response {
+ uint8_t bhstmr_opcode;
+ uint8_t bhstmr_flags;
+ uint8_t bhstmr_response;
+ uint8_t bhstmr_reserved;
+ uint8_t bhstmr_total_ahs_len;
+ uint8_t bhstmr_data_segment_len[3];
+ uint64_t bhstmr_reserved2;
+ uint32_t bhstmr_initiator_task_tag;
+ uint32_t bhstmr_reserved3;
+ uint32_t bhstmr_statsn;
+ uint32_t bhstmr_expcmdsn;
+ uint32_t bhstmr_maxcmdsn;
+ uint8_t bhstmr_reserved4[12];
+};
+CTASSERT(sizeof(struct iscsi_bhs_task_management_response) == ISCSI_BHS_SIZE);
+
+#define BHSLR_FLAGS_TRANSIT 0x80
+#define BHSLR_FLAGS_CONTINUE 0x40
+
+#define BHSLR_STAGE_SECURITY_NEGOTIATION 0
+#define BHSLR_STAGE_OPERATIONAL_NEGOTIATION 1
+#define BHSLR_STAGE_FULL_FEATURE_PHASE 3 /* Yes, 3. */
+
+/*
+ * BHS layout of a Login Request PDU (ISCSI_BHS_OPCODE_LOGIN_REQUEST).
+ * The "bhslr_" member prefix is also used by the login response and by
+ * both logout structures.
+ */
+struct iscsi_bhs_login_request {
+ uint8_t bhslr_opcode;
+ /*
+ * NOTE(review): presumably BHSLR_FLAGS_* combined with the
+ * BHSLR_STAGE_* values - confirm how the stages are packed.
+ */
+ uint8_t bhslr_flags;
+ uint8_t bhslr_version_max;
+ uint8_t bhslr_version_min;
+ uint8_t bhslr_total_ahs_len;
+ uint8_t bhslr_data_segment_len[3];
+ uint8_t bhslr_isid[6];
+ uint16_t bhslr_tsih;
+ uint32_t bhslr_initiator_task_tag;
+ uint16_t bhslr_cid;
+ uint16_t bhslr_reserved;
+ uint32_t bhslr_cmdsn;
+ uint32_t bhslr_expstatsn;
+ uint8_t bhslr_reserved2[16];
+};
+CTASSERT(sizeof(struct iscsi_bhs_login_request) == ISCSI_BHS_SIZE);
+
+/*
+ * BHS layout of a Login Response PDU (ISCSI_BHS_OPCODE_LOGIN_RESPONSE).
+ * Compared with the request, it carries the active version and a status
+ * class/detail pair.
+ */
+struct iscsi_bhs_login_response {
+ uint8_t bhslr_opcode;
+ uint8_t bhslr_flags;
+ uint8_t bhslr_version_max;
+ uint8_t bhslr_version_active;
+ uint8_t bhslr_total_ahs_len;
+ uint8_t bhslr_data_segment_len[3];
+ uint8_t bhslr_isid[6];
+ uint16_t bhslr_tsih;
+ uint32_t bhslr_initiator_task_tag;
+ uint32_t bhslr_reserved;
+ uint32_t bhslr_statsn;
+ uint32_t bhslr_expcmdsn;
+ uint32_t bhslr_maxcmdsn;
+ uint8_t bhslr_status_class;
+ uint8_t bhslr_status_detail;
+ uint16_t bhslr_reserved2;
+ uint8_t bhslr_reserved3[8];
+};
+CTASSERT(sizeof(struct iscsi_bhs_login_response) == ISCSI_BHS_SIZE);
+
+#define BHSTR_FLAGS_FINAL 0x80
+#define BHSTR_FLAGS_CONTINUE 0x40
+
+/*
+ * BHS layout of a Text Request PDU (ISCSI_BHS_OPCODE_TEXT_REQUEST).
+ * The BHSTR_FLAGS_* bits defined above apply to bhstr_flags.  The
+ * "bhstr_" member prefix is shared with the response structure.
+ */
+struct iscsi_bhs_text_request {
+ uint8_t bhstr_opcode;
+ uint8_t bhstr_flags;
+ uint16_t bhstr_reserved;
+ uint8_t bhstr_total_ahs_len;
+ uint8_t bhstr_data_segment_len[3];
+ uint64_t bhstr_lun;
+ uint32_t bhstr_initiator_task_tag;
+ uint32_t bhstr_target_transfer_tag;
+ uint32_t bhstr_cmdsn;
+ uint32_t bhstr_expstatsn;
+ uint8_t bhstr_reserved2[16];
+};
+CTASSERT(sizeof(struct iscsi_bhs_text_request) == ISCSI_BHS_SIZE);
+
+/*
+ * BHS layout of a Text Response PDU (ISCSI_BHS_OPCODE_TEXT_RESPONSE).
+ * The "bhstr_" member prefix is shared with the request structure.
+ */
+struct iscsi_bhs_text_response {
+ uint8_t bhstr_opcode;
+ uint8_t bhstr_flags;
+ uint16_t bhstr_reserved;
+ uint8_t bhstr_total_ahs_len;
+ uint8_t bhstr_data_segment_len[3];
+ uint64_t bhstr_lun;
+ uint32_t bhstr_initiator_task_tag;
+ uint32_t bhstr_target_transfer_tag;
+ uint32_t bhstr_statsn;
+ uint32_t bhstr_expcmdsn;
+ uint32_t bhstr_maxcmdsn;
+ uint8_t bhstr_reserved2[12];
+};
+CTASSERT(sizeof(struct iscsi_bhs_text_response) == ISCSI_BHS_SIZE);
+
+#define BHSDO_FLAGS_F 0x80
+
+/*
+ * BHS layout of a SCSI Data-Out PDU (ISCSI_BHS_OPCODE_SCSI_DATA_OUT).
+ * BHSDO_FLAGS_F, defined above, applies to bhsdo_flags.
+ */
+struct iscsi_bhs_data_out {
+ uint8_t bhsdo_opcode;
+ uint8_t bhsdo_flags;
+ uint8_t bhsdo_reserved[2];
+ uint8_t bhsdo_total_ahs_len;
+ uint8_t bhsdo_data_segment_len[3];
+ uint64_t bhsdo_lun;
+ uint32_t bhsdo_initiator_task_tag;
+ uint32_t bhsdo_target_transfer_tag;
+ uint32_t bhsdo_reserved2;
+ uint32_t bhsdo_expstatsn;
+ uint32_t bhsdo_reserved3;
+ uint32_t bhsdo_datasn;
+ uint32_t bhsdo_buffer_offset;
+ uint32_t bhsdo_reserved4;
+};
+CTASSERT(sizeof(struct iscsi_bhs_data_out) == ISCSI_BHS_SIZE);
+
+#define BHSDI_FLAGS_F 0x80
+#define BHSDI_FLAGS_A 0x40
+#define BHSDI_FLAGS_O 0x04
+#define BHSDI_FLAGS_U 0x02
+#define BHSDI_FLAGS_S 0x01
+
+/*
+ * BHS layout of a SCSI Data-In PDU (ISCSI_BHS_OPCODE_SCSI_DATA_IN).
+ * The BHSDI_FLAGS_* bits defined above apply to bhsdi_flags.
+ */
+struct iscsi_bhs_data_in {
+ uint8_t bhsdi_opcode;
+ uint8_t bhsdi_flags;
+ uint8_t bhsdi_reserved;
+ uint8_t bhsdi_status;
+ uint8_t bhsdi_total_ahs_len;
+ uint8_t bhsdi_data_segment_len[3];
+ uint64_t bhsdi_lun;
+ uint32_t bhsdi_initiator_task_tag;
+ uint32_t bhsdi_target_transfer_tag;
+ uint32_t bhsdi_statsn;
+ uint32_t bhsdi_expcmdsn;
+ uint32_t bhsdi_maxcmdsn;
+ uint32_t bhsdi_datasn;
+ uint32_t bhsdi_buffer_offset;
+ uint32_t bhsdi_residual_count;
+};
+CTASSERT(sizeof(struct iscsi_bhs_data_in) == ISCSI_BHS_SIZE);
+
+/*
+ * BHS layout of a Ready To Transfer (R2T) PDU (ISCSI_BHS_OPCODE_R2T).
+ */
+struct iscsi_bhs_r2t {
+ uint8_t bhsr2t_opcode;
+ uint8_t bhsr2t_flags;
+ uint16_t bhsr2t_reserved;
+ uint8_t bhsr2t_total_ahs_len;
+ uint8_t bhsr2t_data_segment_len[3];
+ uint64_t bhsr2t_lun;
+ uint32_t bhsr2t_initiator_task_tag;
+ uint32_t bhsr2t_target_transfer_tag;
+ uint32_t bhsr2t_statsn;
+ uint32_t bhsr2t_expcmdsn;
+ uint32_t bhsr2t_maxcmdsn;
+ uint32_t bhsr2t_r2tsn;
+ uint32_t bhsr2t_buffer_offset;
+ uint32_t bhsr2t_desired_data_transfer_length;
+};
+CTASSERT(sizeof(struct iscsi_bhs_r2t) == ISCSI_BHS_SIZE);
+
+/*
+ * BHS layout of a NOP-Out PDU (ISCSI_BHS_OPCODE_NOP_OUT).
+ */
+struct iscsi_bhs_nop_out {
+ uint8_t bhsno_opcode;
+ uint8_t bhsno_flags;
+ uint16_t bhsno_reserved;
+ uint8_t bhsno_total_ahs_len;
+ uint8_t bhsno_data_segment_len[3];
+ uint64_t bhsno_lun;
+ uint32_t bhsno_initiator_task_tag;
+ uint32_t bhsno_target_transfer_tag;
+ uint32_t bhsno_cmdsn;
+ uint32_t bhsno_expstatsn;
+ uint8_t bhsno_reserved2[16];
+};
+CTASSERT(sizeof(struct iscsi_bhs_nop_out) == ISCSI_BHS_SIZE);
+
+/*
+ * BHS layout of a NOP-In PDU (ISCSI_BHS_OPCODE_NOP_IN).
+ */
+struct iscsi_bhs_nop_in {
+ uint8_t bhsni_opcode;
+ uint8_t bhsni_flags;
+ uint16_t bhsni_reserved;
+ uint8_t bhsni_total_ahs_len;
+ uint8_t bhsni_data_segment_len[3];
+ uint64_t bhsni_lun;
+ uint32_t bhsni_initiator_task_tag;
+ uint32_t bhsni_target_transfer_tag;
+ uint32_t bhsni_statsn;
+ uint32_t bhsni_expcmdsn;
+ uint32_t bhsni_maxcmdsn;
+ /*
+ * NOTE(review): this member carries the NOP-Out prefix ("bhsno_")
+ * although every other member here uses "bhsni_"; left as is
+ * because the name may be referenced elsewhere.
+ */
+ uint8_t bhsno_reserved2[12];
+};
+CTASSERT(sizeof(struct iscsi_bhs_nop_in) == ISCSI_BHS_SIZE);
+
+#define BHSLR_REASON_CLOSE_SESSION 0
+#define BHSLR_REASON_CLOSE_CONNECTION 1
+#define BHSLR_REASON_REMOVE_FOR_RECOVERY 2
+
+/*
+ * BHS layout of a Logout Request PDU (ISCSI_BHS_OPCODE_LOGOUT_REQUEST).
+ * The BHSLR_REASON_* values defined above apply to bhslr_reason.  The
+ * "bhslr_" member prefix is also used by the login structures.
+ */
+struct iscsi_bhs_logout_request {
+ uint8_t bhslr_opcode;
+ uint8_t bhslr_reason;
+ uint16_t bhslr_reserved;
+ uint8_t bhslr_total_ahs_len;
+ uint8_t bhslr_data_segment_len[3];
+ uint64_t bhslr_reserved2;
+ uint32_t bhslr_initiator_task_tag;
+ uint16_t bhslr_cid;
+ uint16_t bhslr_reserved3;
+ uint32_t bhslr_cmdsn;
+ uint32_t bhslr_expstatsn;
+ uint8_t bhslr_reserved4[16];
+};
+CTASSERT(sizeof(struct iscsi_bhs_logout_request) == ISCSI_BHS_SIZE);
+
+#define BHSLR_RESPONSE_CLOSED_SUCCESSFULLY 0
+#define BHSLR_RESPONSE_RECOVERY_NOT_SUPPORTED 2
+
+/*
+ * BHS layout of a Logout Response PDU (ISCSI_BHS_OPCODE_LOGOUT_RESPONSE).
+ * The BHSLR_RESPONSE_* values defined above apply to bhslr_response.
+ */
+struct iscsi_bhs_logout_response {
+ uint8_t bhslr_opcode;
+ uint8_t bhslr_flags;
+ uint8_t bhslr_response;
+ uint8_t bhslr_reserved;
+ uint8_t bhslr_total_ahs_len;
+ uint8_t bhslr_data_segment_len[3];
+ uint64_t bhslr_reserved2;
+ uint32_t bhslr_initiator_task_tag;
+ uint32_t bhslr_reserved3;
+ uint32_t bhslr_statsn;
+ uint32_t bhslr_expcmdsn;
+ uint32_t bhslr_maxcmdsn;
+ uint32_t bhslr_reserved4;
+ uint16_t bhslr_time2wait;
+ uint16_t bhslr_time2retain;
+ uint32_t bhslr_reserved5;
+};
+CTASSERT(sizeof(struct iscsi_bhs_logout_response) == ISCSI_BHS_SIZE);
+
+#define BHSAM_EVENT_TARGET_REQUESTS_LOGOUT 1
+#define BHSAM_EVENT_TARGET_TERMINATES_CONNECTION 2
+#define BHSAM_EVENT_TARGET_TERMINATES_SESSION 3
+
+/*
+ * BHS layout of an Asynchronous Message PDU
+ * (ISCSI_BHS_OPCODE_ASYNC_MESSAGE).  The BHSAM_EVENT_* values defined
+ * above apply to bhsam_async_event.
+ */
+struct iscsi_bhs_asynchronous_message {
+ uint8_t bhsam_opcode;
+ uint8_t bhsam_flags;
+ uint16_t bhsam_reserved;
+ uint8_t bhsam_total_ahs_len;
+ uint8_t bhsam_data_segment_len[3];
+ uint64_t bhsam_lun;
+ /* Named after the constant value this field is expected to hold. */
+ uint32_t bhsam_0xffffffff;
+ uint32_t bhsam_reserved2;
+ uint32_t bhsam_statsn;
+ uint32_t bhsam_expcmdsn;
+ uint32_t bhsam_maxcmdsn;
+ uint8_t bhsam_async_event;
+ uint8_t bhsam_async_vcode;
+ uint16_t bhsam_parameter1;
+ uint16_t bhsam_parameter2;
+ uint16_t bhsam_parameter3;
+ uint32_t bhsam_reserved3;
+};
+CTASSERT(sizeof(struct iscsi_bhs_asynchronous_message) == ISCSI_BHS_SIZE);
+
+#define BHSSR_REASON_DATA_DIGEST_ERROR 0x02
+#define BHSSR_PROTOCOL_ERROR 0x04
+#define BHSSR_COMMAND_NOT_SUPPORTED 0x05
+#define BHSSR_INVALID_PDU_FIELD 0x09
+
+/*
+ * BHS layout of a Reject PDU (ISCSI_BHS_OPCODE_REJECT).
+ * NOTE(review): the reason codes defined just above use the "BHSSR_"
+ * prefix, which the SCSI Response definitions use as well, although
+ * they appear to be meant for bhsr_reason - confirm.
+ */
+struct iscsi_bhs_reject {
+ uint8_t bhsr_opcode;
+ uint8_t bhsr_flags;
+ uint8_t bhsr_reason;
+ uint8_t bhsr_reserved;
+ uint8_t bhsr_total_ahs_len;
+ uint8_t bhsr_data_segment_len[3];
+ uint64_t bhsr_reserved2;
+ /* Named after the constant value this field is expected to hold. */
+ uint32_t bhsr_0xffffffff;
+ uint32_t bhsr_reserved3;
+ uint32_t bhsr_statsn;
+ uint32_t bhsr_expcmdsn;
+ uint32_t bhsr_maxcmdsn;
+ uint32_t bhsr_datasn_r2tsn;
+ uint32_t bhsr_reserved4;
+ uint32_t bhsr_reserved5;
+};
+CTASSERT(sizeof(struct iscsi_bhs_reject) == ISCSI_BHS_SIZE);
+
+#endif /* !ISCSI_PROTO_H */
diff --git a/sys/dev/iscsi_initiator/iscsi.c b/sys/dev/iscsi_initiator/iscsi.c
index 4a1cb967ffa0..6e06718aabfc 100644
--- a/sys/dev/iscsi_initiator/iscsi.c
+++ b/sys/dev/iscsi_initiator/iscsi.c
@@ -858,7 +858,7 @@ iscsi_modevent(module_t mod, int what, void *arg)
}
moduledata_t iscsi_mod = {
- "iscsi",
+ "iscsi_initiator",
(modeventhand_t) iscsi_modevent,
0
};
@@ -878,5 +878,5 @@ iscsi_rootconf(void)
SYSINIT(cpu_rootconf1, SI_SUB_ROOT_CONF, SI_ORDER_FIRST, iscsi_rootconf, NULL)
#endif
-DECLARE_MODULE(iscsi, iscsi_mod, SI_SUB_DRIVERS, SI_ORDER_MIDDLE);
-MODULE_DEPEND(iscsi, cam, 1, 1, 1);
+DECLARE_MODULE(iscsi_initiator, iscsi_mod, SI_SUB_DRIVERS, SI_ORDER_MIDDLE);
+MODULE_DEPEND(iscsi_initiator, cam, 1, 1, 1);