xref: /illumos-gate/usr/src/uts/common/io/idm/idm_so.c (revision 2727bb05)
/*
 * CDDL HEADER START
 *
 * The contents of this file are subject to the terms of the
 * Common Development and Distribution License (the "License").
 * You may not use this file except in compliance with the License.
 *
 * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
 * or http://www.opensolaris.org/os/licensing.
 * See the License for the specific language governing permissions
 * and limitations under the License.
 *
 * When distributing Covered Code, include this CDDL HEADER in each
 * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
 * If applicable, add the following below this CDDL HEADER, with the
 * fields enclosed by brackets "[]" replaced with your own identifying
 * information: Portions Copyright [yyyy] [name of copyright owner]
 *
 * CDDL HEADER END
 */
/*
 * Copyright 2010 Sun Microsystems, Inc.  All rights reserved.
 * Use is subject to license terms.
 */
/*
 * Copyright (c) 2013 by Delphix. All rights reserved.
 * Copyright (c) 2017, Joyent, Inc.  All rights reserved.
 */
29a6d42e7dSPeter Dunlap 
30a6d42e7dSPeter Dunlap #include <sys/conf.h>
31a6d42e7dSPeter Dunlap #include <sys/stat.h>
32a6d42e7dSPeter Dunlap #include <sys/file.h>
33a6d42e7dSPeter Dunlap #include <sys/ddi.h>
34a6d42e7dSPeter Dunlap #include <sys/sunddi.h>
35a6d42e7dSPeter Dunlap #include <sys/modctl.h>
36a6d42e7dSPeter Dunlap #include <sys/priv.h>
37a6d42e7dSPeter Dunlap #include <sys/cpuvar.h>
38a6d42e7dSPeter Dunlap #include <sys/socket.h>
39a6d42e7dSPeter Dunlap #include <sys/strsubr.h>
40a6d42e7dSPeter Dunlap #include <sys/sysmacros.h>
41a6d42e7dSPeter Dunlap #include <sys/sdt.h>
42a6d42e7dSPeter Dunlap #include <netinet/tcp.h>
43a6d42e7dSPeter Dunlap #include <inet/tcp.h>
44a6d42e7dSPeter Dunlap #include <sys/socketvar.h>
45a6d42e7dSPeter Dunlap #include <sys/pathname.h>
46a6d42e7dSPeter Dunlap #include <sys/fs/snode.h>
47a6d42e7dSPeter Dunlap #include <sys/fs/dv_node.h>
48a6d42e7dSPeter Dunlap #include <sys/vnode.h>
49a6d42e7dSPeter Dunlap #include <netinet/in.h>
50a6d42e7dSPeter Dunlap #include <net/if.h>
51a6d42e7dSPeter Dunlap #include <sys/sockio.h>
520f1702c5SYu Xiangning #include <sys/ksocket.h>
53bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States #include <sys/filio.h>		/* FIONBIO */
5456261083SCharles Ting #include <sys/iscsi_protocol.h>
55a6d42e7dSPeter Dunlap #include <sys/idm/idm.h>
56a6d42e7dSPeter Dunlap #include <sys/idm/idm_so.h>
57a6d42e7dSPeter Dunlap #include <sys/idm/idm_text.h>
58a6d42e7dSPeter Dunlap 
59aff4bce5Syi zhang - Sun Microsystems - Beijing China #define	IN_PROGRESS_DELAY	1
60aff4bce5Syi zhang - Sun Microsystems - Beijing China 
61a6d42e7dSPeter Dunlap /*
62a6d42e7dSPeter Dunlap  * in6addr_any is currently all zeroes, but use the macro in case this
63a6d42e7dSPeter Dunlap  * ever changes.
64a6d42e7dSPeter Dunlap  */
65e42a0851Speter dunlap static const struct in6_addr in6addr_any = IN6ADDR_ANY_INIT;
66a6d42e7dSPeter Dunlap 
67a6d42e7dSPeter Dunlap static void idm_sorx_cache_pdu_cb(idm_pdu_t *pdu, idm_status_t status);
68a6d42e7dSPeter Dunlap static void idm_sorx_addl_pdu_cb(idm_pdu_t *pdu, idm_status_t status);
69a6d42e7dSPeter Dunlap static void idm_sotx_cache_pdu_cb(idm_pdu_t *pdu, idm_status_t status);
70a6d42e7dSPeter Dunlap 
710f1702c5SYu Xiangning static idm_status_t idm_so_conn_create_common(idm_conn_t *ic, ksocket_t new_so);
72a6d42e7dSPeter Dunlap static void idm_so_conn_destroy_common(idm_conn_t *ic);
73a6d42e7dSPeter Dunlap static void idm_so_conn_connect_common(idm_conn_t *ic);
74a6d42e7dSPeter Dunlap 
75dedec472SJack Meng static void idm_set_ini_preconnect_options(idm_so_conn_t *sc,
76dedec472SJack Meng     boolean_t boot_conn);
770f94976eSJeff Biseda static void idm_set_postconnect_options(ksocket_t so);
78a6d42e7dSPeter Dunlap static idm_status_t idm_i_so_tx(idm_pdu_t *pdu);
79a6d42e7dSPeter Dunlap 
80a6d42e7dSPeter Dunlap static idm_status_t idm_sorecvdata(idm_conn_t *ic, idm_pdu_t *pdu);
8130e7468fSPeter Dunlap static void idm_so_send_rtt_data(idm_conn_t *ic, idm_task_t *idt,
8230e7468fSPeter Dunlap     idm_buf_t *idb, uint32_t offset, uint32_t length);
8330e7468fSPeter Dunlap static void idm_so_send_rtt_data_done(idm_task_t *idt, idm_buf_t *idb);
8430e7468fSPeter Dunlap static idm_status_t idm_so_send_buf_region(idm_task_t *idt,
85a6d42e7dSPeter Dunlap     idm_buf_t *idb, uint32_t buf_region_offset, uint32_t buf_region_length);
86a6d42e7dSPeter Dunlap 
87a6d42e7dSPeter Dunlap static uint32_t idm_fill_iov(idm_pdu_t *pdu, idm_buf_t *idb,
88a6d42e7dSPeter Dunlap     uint32_t ro, uint32_t dlength);
89a6d42e7dSPeter Dunlap 
90a6d42e7dSPeter Dunlap static idm_status_t idm_so_handle_digest(idm_conn_t *it,
91a6d42e7dSPeter Dunlap     nvpair_t *digest_choice, const idm_kv_xlate_t *ikvx);
92a6d42e7dSPeter Dunlap 
93aff4bce5Syi zhang - Sun Microsystems - Beijing China static void idm_so_socket_set_nonblock(struct sonode *node);
94aff4bce5Syi zhang - Sun Microsystems - Beijing China static void idm_so_socket_set_block(struct sonode *node);
95aff4bce5Syi zhang - Sun Microsystems - Beijing China 
96a6d42e7dSPeter Dunlap /*
97a6d42e7dSPeter Dunlap  * Transport ops prototypes
98a6d42e7dSPeter Dunlap  */
99a6d42e7dSPeter Dunlap static void idm_so_tx(idm_conn_t *ic, idm_pdu_t *pdu);
100a6d42e7dSPeter Dunlap static idm_status_t idm_so_buf_tx_to_ini(idm_task_t *idt, idm_buf_t *idb);
101a6d42e7dSPeter Dunlap static idm_status_t idm_so_buf_rx_from_ini(idm_task_t *idt, idm_buf_t *idb);
102a6d42e7dSPeter Dunlap static void idm_so_rx_datain(idm_conn_t *ic, idm_pdu_t *pdu);
103a6d42e7dSPeter Dunlap static void idm_so_rx_rtt(idm_conn_t *ic, idm_pdu_t *pdu);
104a6d42e7dSPeter Dunlap static void idm_so_rx_dataout(idm_conn_t *ic, idm_pdu_t *pdu);
105a6d42e7dSPeter Dunlap static idm_status_t idm_so_free_task_rsrc(idm_task_t *idt);
106a6d42e7dSPeter Dunlap static kv_status_t idm_so_negotiate_key_values(idm_conn_t *it,
107a6d42e7dSPeter Dunlap     nvlist_t *request_nvl, nvlist_t *response_nvl, nvlist_t *negotiated_nvl);
10830e7468fSPeter Dunlap static void idm_so_notice_key_values(idm_conn_t *it,
109a6d42e7dSPeter Dunlap     nvlist_t *negotiated_nvl);
11056261083SCharles Ting static kv_status_t idm_so_declare_key_values(idm_conn_t *it,
11156261083SCharles Ting     nvlist_t *config_nvl, nvlist_t *outgoing_nvl);
112a6d42e7dSPeter Dunlap static boolean_t idm_so_conn_is_capable(idm_conn_req_t *ic,
113a6d42e7dSPeter Dunlap     idm_transport_caps_t *caps);
114a6d42e7dSPeter Dunlap static idm_status_t idm_so_buf_alloc(idm_buf_t *idb, uint64_t buflen);
115a6d42e7dSPeter Dunlap static void idm_so_buf_free(idm_buf_t *idb);
116a6d42e7dSPeter Dunlap static idm_status_t idm_so_buf_setup(idm_buf_t *idb);
117a6d42e7dSPeter Dunlap static void idm_so_buf_teardown(idm_buf_t *idb);
118a6d42e7dSPeter Dunlap static idm_status_t idm_so_tgt_svc_create(idm_svc_req_t *sr, idm_svc_t *is);
119a6d42e7dSPeter Dunlap static void idm_so_tgt_svc_destroy(idm_svc_t *is);
120a6d42e7dSPeter Dunlap static idm_status_t idm_so_tgt_svc_online(idm_svc_t *is);
121a6d42e7dSPeter Dunlap static void idm_so_tgt_svc_offline(idm_svc_t *is);
122a6d42e7dSPeter Dunlap static void idm_so_tgt_conn_destroy(idm_conn_t *ic);
123a6d42e7dSPeter Dunlap static idm_status_t idm_so_tgt_conn_connect(idm_conn_t *ic);
124a6d42e7dSPeter Dunlap static void idm_so_conn_disconnect(idm_conn_t *ic);
125a6d42e7dSPeter Dunlap static idm_status_t idm_so_ini_conn_create(idm_conn_req_t *cr, idm_conn_t *ic);
126a6d42e7dSPeter Dunlap static void idm_so_ini_conn_destroy(idm_conn_t *ic);
127a6d42e7dSPeter Dunlap static idm_status_t idm_so_ini_conn_connect(idm_conn_t *ic);
128a6d42e7dSPeter Dunlap 
129a6d42e7dSPeter Dunlap /*
130a6d42e7dSPeter Dunlap  * IDM Native Sockets transport operations
131a6d42e7dSPeter Dunlap  */
132a6d42e7dSPeter Dunlap static
133a6d42e7dSPeter Dunlap idm_transport_ops_t idm_so_transport_ops = {
134a6d42e7dSPeter Dunlap 	idm_so_tx,			/* it_tx_pdu */
135a6d42e7dSPeter Dunlap 	idm_so_buf_tx_to_ini,		/* it_buf_tx_to_ini */
136a6d42e7dSPeter Dunlap 	idm_so_buf_rx_from_ini,		/* it_buf_rx_from_ini */
137a6d42e7dSPeter Dunlap 	idm_so_rx_datain,		/* it_rx_datain */
138a6d42e7dSPeter Dunlap 	idm_so_rx_rtt,			/* it_rx_rtt */
139a6d42e7dSPeter Dunlap 	idm_so_rx_dataout,		/* it_rx_dataout */
140a6d42e7dSPeter Dunlap 	NULL,				/* it_alloc_conn_rsrc */
141a6d42e7dSPeter Dunlap 	NULL,				/* it_free_conn_rsrc */
142a6d42e7dSPeter Dunlap 	NULL,				/* it_tgt_enable_datamover */
143a6d42e7dSPeter Dunlap 	NULL,				/* it_ini_enable_datamover */
144a6d42e7dSPeter Dunlap 	NULL,				/* it_conn_terminate */
145a6d42e7dSPeter Dunlap 	idm_so_free_task_rsrc,		/* it_free_task_rsrc */
146a6d42e7dSPeter Dunlap 	idm_so_negotiate_key_values,	/* it_negotiate_key_values */
147a6d42e7dSPeter Dunlap 	idm_so_notice_key_values,	/* it_notice_key_values */
148a6d42e7dSPeter Dunlap 	idm_so_conn_is_capable,		/* it_conn_is_capable */
149a6d42e7dSPeter Dunlap 	idm_so_buf_alloc,		/* it_buf_alloc */
150a6d42e7dSPeter Dunlap 	idm_so_buf_free,		/* it_buf_free */
151a6d42e7dSPeter Dunlap 	idm_so_buf_setup,		/* it_buf_setup */
152a6d42e7dSPeter Dunlap 	idm_so_buf_teardown,		/* it_buf_teardown */
153a6d42e7dSPeter Dunlap 	idm_so_tgt_svc_create,		/* it_tgt_svc_create */
154a6d42e7dSPeter Dunlap 	idm_so_tgt_svc_destroy,		/* it_tgt_svc_destroy */
155a6d42e7dSPeter Dunlap 	idm_so_tgt_svc_online,		/* it_tgt_svc_online */
156a6d42e7dSPeter Dunlap 	idm_so_tgt_svc_offline,		/* it_tgt_svc_offline */
157a6d42e7dSPeter Dunlap 	idm_so_tgt_conn_destroy,	/* it_tgt_conn_destroy */
158a6d42e7dSPeter Dunlap 	idm_so_tgt_conn_connect,	/* it_tgt_conn_connect */
159a6d42e7dSPeter Dunlap 	idm_so_conn_disconnect,		/* it_tgt_conn_disconnect */
160a6d42e7dSPeter Dunlap 	idm_so_ini_conn_create,		/* it_ini_conn_create */
161a6d42e7dSPeter Dunlap 	idm_so_ini_conn_destroy,	/* it_ini_conn_destroy */
162a6d42e7dSPeter Dunlap 	idm_so_ini_conn_connect,	/* it_ini_conn_connect */
16356261083SCharles Ting 	idm_so_conn_disconnect,		/* it_ini_conn_disconnect */
16456261083SCharles Ting 	idm_so_declare_key_values	/* it_declare_key_values */
165a6d42e7dSPeter Dunlap };
166a6d42e7dSPeter Dunlap 
167bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States kmutex_t	idm_so_timed_socket_mutex;
1680f94976eSJeff Biseda 
1690f94976eSJeff Biseda int32_t idm_so_sndbuf = IDM_SNDBUF_SIZE;
1700f94976eSJeff Biseda int32_t idm_so_rcvbuf = IDM_RCVBUF_SIZE;
1710f94976eSJeff Biseda 
172a6d42e7dSPeter Dunlap /*
173a6d42e7dSPeter Dunlap  * idm_so_init()
174a6d42e7dSPeter Dunlap  * Sockets transport initialization
175a6d42e7dSPeter Dunlap  */
176a6d42e7dSPeter Dunlap void
177a6d42e7dSPeter Dunlap idm_so_init(idm_transport_t *it)
178a6d42e7dSPeter Dunlap {
179a6d42e7dSPeter Dunlap 	/* Cache for IDM Data and R2T Transmit PDU's */
180a6d42e7dSPeter Dunlap 	idm.idm_sotx_pdu_cache = kmem_cache_create("idm_tx_pdu_cache",
181a6d42e7dSPeter Dunlap 	    sizeof (idm_pdu_t) + sizeof (iscsi_hdr_t), 8,
182a6d42e7dSPeter Dunlap 	    &idm_sotx_pdu_constructor, NULL, NULL, NULL, NULL, KM_SLEEP);
183a6d42e7dSPeter Dunlap 
184a6d42e7dSPeter Dunlap 	/* Cache for IDM Receive PDU's */
185a6d42e7dSPeter Dunlap 	idm.idm_sorx_pdu_cache = kmem_cache_create("idm_rx_pdu_cache",
186a6d42e7dSPeter Dunlap 	    sizeof (idm_pdu_t) + IDM_SORX_CACHE_HDRLEN, 8,
187a6d42e7dSPeter Dunlap 	    &idm_sorx_pdu_constructor, NULL, NULL, NULL, NULL, KM_SLEEP);
188a6d42e7dSPeter Dunlap 
189cf8c0ebaSPeter Dunlap 	/* 128k buffer cache */
190cf8c0ebaSPeter Dunlap 	idm.idm_so_128k_buf_cache = kmem_cache_create("idm_128k_buf_cache",
191cf8c0ebaSPeter Dunlap 	    IDM_SO_BUF_CACHE_UB, 8, NULL, NULL, NULL, NULL, NULL, KM_SLEEP);
192cf8c0ebaSPeter Dunlap 
193a6d42e7dSPeter Dunlap 	/* Set the sockets transport ops */
194a6d42e7dSPeter Dunlap 	it->it_ops = &idm_so_transport_ops;
195bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 
196bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 	mutex_init(&idm_so_timed_socket_mutex, NULL, MUTEX_DEFAULT, NULL);
197bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 
198a6d42e7dSPeter Dunlap }
199a6d42e7dSPeter Dunlap 
200a6d42e7dSPeter Dunlap /*
201a6d42e7dSPeter Dunlap  * idm_so_fini()
202a6d42e7dSPeter Dunlap  * Sockets transport teardown
203a6d42e7dSPeter Dunlap  */
204a6d42e7dSPeter Dunlap void
205a6d42e7dSPeter Dunlap idm_so_fini(void)
206a6d42e7dSPeter Dunlap {
207cf8c0ebaSPeter Dunlap 	kmem_cache_destroy(idm.idm_so_128k_buf_cache);
208a6d42e7dSPeter Dunlap 	kmem_cache_destroy(idm.idm_sotx_pdu_cache);
209a6d42e7dSPeter Dunlap 	kmem_cache_destroy(idm.idm_sorx_pdu_cache);
210bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 	mutex_destroy(&idm_so_timed_socket_mutex);
211a6d42e7dSPeter Dunlap }
212a6d42e7dSPeter Dunlap 
2130f1702c5SYu Xiangning ksocket_t
214a6d42e7dSPeter Dunlap idm_socreate(int domain, int type, int protocol)
215a6d42e7dSPeter Dunlap {
2160f1702c5SYu Xiangning 	ksocket_t ks;
217a6d42e7dSPeter Dunlap 
2180f1702c5SYu Xiangning 	if (!ksocket_socket(&ks, domain, type, protocol, KSOCKET_NOSLEEP,
2190f1702c5SYu Xiangning 	    CRED())) {
2200f1702c5SYu Xiangning 		return (ks);
2210f1702c5SYu Xiangning 	} else {
2220f1702c5SYu Xiangning 		return (NULL);
223a6d42e7dSPeter Dunlap 	}
224a6d42e7dSPeter Dunlap }
225a6d42e7dSPeter Dunlap 
226a6d42e7dSPeter Dunlap /*
227a6d42e7dSPeter Dunlap  * idm_soshutdown will disconnect the socket and prevent subsequent PDU
228a6d42e7dSPeter Dunlap  * reception and transmission.  The sonode still exists but its state
229a6d42e7dSPeter Dunlap  * gets modified to indicate it is no longer connected.  Calls to
230a6d42e7dSPeter Dunlap  * idm_sorecv/idm_iov_sorecv will return so idm_soshutdown can be used
231a6d42e7dSPeter Dunlap  * regain control of a thread stuck in idm_sorecv.
232a6d42e7dSPeter Dunlap  */
233a6d42e7dSPeter Dunlap void
2340f1702c5SYu Xiangning idm_soshutdown(ksocket_t so)
235a6d42e7dSPeter Dunlap {
2360f1702c5SYu Xiangning 	(void) ksocket_shutdown(so, SHUT_RDWR, CRED());
237a6d42e7dSPeter Dunlap }
238a6d42e7dSPeter Dunlap 
239a6d42e7dSPeter Dunlap /*
240a6d42e7dSPeter Dunlap  * idm_sodestroy releases all resources associated with a socket previously
241a6d42e7dSPeter Dunlap  * created with idm_socreate.  The socket must be shutdown using
242a6d42e7dSPeter Dunlap  * idm_soshutdown before the socket is destroyed with idm_sodestroy,
243a6d42e7dSPeter Dunlap  * otherwise undefined behavior will result.
244a6d42e7dSPeter Dunlap  */
245a6d42e7dSPeter Dunlap void
2460f1702c5SYu Xiangning idm_sodestroy(ksocket_t ks)
247a6d42e7dSPeter Dunlap {
2480f1702c5SYu Xiangning 	(void) ksocket_close(ks, CRED());
249a6d42e7dSPeter Dunlap }
250a6d42e7dSPeter Dunlap 
251e42a0851Speter dunlap /*
252e42a0851Speter dunlap  * Function to compare two addresses in sockaddr_storage format
253e42a0851Speter dunlap  */
254e42a0851Speter dunlap 
255e42a0851Speter dunlap int
256e42a0851Speter dunlap idm_ss_compare(const struct sockaddr_storage *cmp_ss1,
257e42a0851Speter dunlap     const struct sockaddr_storage *cmp_ss2,
258bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States     boolean_t v4_mapped_as_v4,
259bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States     boolean_t compare_ports)
260e42a0851Speter dunlap {
261e42a0851Speter dunlap 	struct sockaddr_storage			mapped_v4_ss1, mapped_v4_ss2;
262e42a0851Speter dunlap 	const struct sockaddr_storage		*ss1, *ss2;
263e42a0851Speter dunlap 	struct in_addr				*in1, *in2;
264e42a0851Speter dunlap 	struct in6_addr				*in61, *in62;
265e42a0851Speter dunlap 	int i;
266e42a0851Speter dunlap 
267e42a0851Speter dunlap 	/*
268e42a0851Speter dunlap 	 * Normalize V4-mapped IPv6 addresses into V4 format if
269e42a0851Speter dunlap 	 * v4_mapped_as_v4 is B_TRUE.
270e42a0851Speter dunlap 	 */
271e42a0851Speter dunlap 	ss1 = cmp_ss1;
272e42a0851Speter dunlap 	ss2 = cmp_ss2;
273e42a0851Speter dunlap 	if (v4_mapped_as_v4 && (ss1->ss_family == AF_INET6)) {
274e42a0851Speter dunlap 		in61 = &((struct sockaddr_in6 *)ss1)->sin6_addr;
275e42a0851Speter dunlap 		if (IN6_IS_ADDR_V4MAPPED(in61)) {
276e42a0851Speter dunlap 			bzero(&mapped_v4_ss1, sizeof (mapped_v4_ss1));
277e42a0851Speter dunlap 			mapped_v4_ss1.ss_family = AF_INET;
278e42a0851Speter dunlap 			((struct sockaddr_in *)&mapped_v4_ss1)->sin_port =
279e42a0851Speter dunlap 			    ((struct sockaddr_in *)ss1)->sin_port;
280e42a0851Speter dunlap 			IN6_V4MAPPED_TO_INADDR(in61,
281e42a0851Speter dunlap 			    &((struct sockaddr_in *)&mapped_v4_ss1)->sin_addr);
282e42a0851Speter dunlap 			ss1 = &mapped_v4_ss1;
283e42a0851Speter dunlap 		}
284e42a0851Speter dunlap 	}
285e42a0851Speter dunlap 	ss2 = cmp_ss2;
286e42a0851Speter dunlap 	if (v4_mapped_as_v4 && (ss2->ss_family == AF_INET6)) {
287e42a0851Speter dunlap 		in62 = &((struct sockaddr_in6 *)ss2)->sin6_addr;
288e42a0851Speter dunlap 		if (IN6_IS_ADDR_V4MAPPED(in62)) {
289e42a0851Speter dunlap 			bzero(&mapped_v4_ss2, sizeof (mapped_v4_ss2));
290e42a0851Speter dunlap 			mapped_v4_ss2.ss_family = AF_INET;
291e42a0851Speter dunlap 			((struct sockaddr_in *)&mapped_v4_ss2)->sin_port =
292e42a0851Speter dunlap 			    ((struct sockaddr_in *)ss2)->sin_port;
293e42a0851Speter dunlap 			IN6_V4MAPPED_TO_INADDR(in62,
294e42a0851Speter dunlap 			    &((struct sockaddr_in *)&mapped_v4_ss2)->sin_addr);
295e42a0851Speter dunlap 			ss2 = &mapped_v4_ss2;
296e42a0851Speter dunlap 		}
297e42a0851Speter dunlap 	}
298e42a0851Speter dunlap 
299e42a0851Speter dunlap 	/*
300e42a0851Speter dunlap 	 * Compare ports, then address family, then ip address
301e42a0851Speter dunlap 	 */
302bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 	if (compare_ports &&
303bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 	    (((struct sockaddr_in *)ss1)->sin_port !=
304bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 	    ((struct sockaddr_in *)ss2)->sin_port)) {
305e42a0851Speter dunlap 		if (((struct sockaddr_in *)ss1)->sin_port >
306e42a0851Speter dunlap 		    ((struct sockaddr_in *)ss2)->sin_port)
307e42a0851Speter dunlap 			return (1);
308e42a0851Speter dunlap 		else
309e42a0851Speter dunlap 			return (-1);
310e42a0851Speter dunlap 	}
311e42a0851Speter dunlap 
312e42a0851Speter dunlap 	/*
313e42a0851Speter dunlap 	 * ports are the same
314e42a0851Speter dunlap 	 */
315e42a0851Speter dunlap 	if (ss1->ss_family != ss2->ss_family) {
316e42a0851Speter dunlap 		if (ss1->ss_family == AF_INET)
317e42a0851Speter dunlap 			return (1);
318e42a0851Speter dunlap 		else
319e42a0851Speter dunlap 			return (-1);
320e42a0851Speter dunlap 	}
321e42a0851Speter dunlap 
322e42a0851Speter dunlap 	/*
323e42a0851Speter dunlap 	 * address families are the same
324e42a0851Speter dunlap 	 */
325e42a0851Speter dunlap 	if (ss1->ss_family == AF_INET) {
326e42a0851Speter dunlap 		in1 = &((struct sockaddr_in *)ss1)->sin_addr;
327e42a0851Speter dunlap 		in2 = &((struct sockaddr_in *)ss2)->sin_addr;
328e42a0851Speter dunlap 
329e42a0851Speter dunlap 		if (in1->s_addr > in2->s_addr)
330e42a0851Speter dunlap 			return (1);
331e42a0851Speter dunlap 		else if (in1->s_addr < in2->s_addr)
332e42a0851Speter dunlap 			return (-1);
333e42a0851Speter dunlap 		else
334e42a0851Speter dunlap 			return (0);
335e42a0851Speter dunlap 	} else if (ss1->ss_family == AF_INET6) {
336e42a0851Speter dunlap 		in61 = &((struct sockaddr_in6 *)ss1)->sin6_addr;
337e42a0851Speter dunlap 		in62 = &((struct sockaddr_in6 *)ss2)->sin6_addr;
338e42a0851Speter dunlap 
339e42a0851Speter dunlap 		for (i = 0; i < 4; i++) {
340e42a0851Speter dunlap 			if (in61->s6_addr32[i] > in62->s6_addr32[i])
341e42a0851Speter dunlap 				return (1);
342e42a0851Speter dunlap 			else if (in61->s6_addr32[i] < in62->s6_addr32[i])
343e42a0851Speter dunlap 				return (-1);
344e42a0851Speter dunlap 		}
345e42a0851Speter dunlap 		return (0);
346e42a0851Speter dunlap 	}
347e42a0851Speter dunlap 
348e42a0851Speter dunlap 	return (1);
349e42a0851Speter dunlap }
350e42a0851Speter dunlap 
351a6d42e7dSPeter Dunlap /*
352a6d42e7dSPeter Dunlap  * IP address filter functions to flag addresses that should not
353a6d42e7dSPeter Dunlap  * go out to initiators through discovery.
354a6d42e7dSPeter Dunlap  */
355a6d42e7dSPeter Dunlap static boolean_t
356a6d42e7dSPeter Dunlap idm_v4_addr_okay(struct in_addr *in_addr)
357a6d42e7dSPeter Dunlap {
358a6d42e7dSPeter Dunlap 	in_addr_t addr = ntohl(in_addr->s_addr);
359a6d42e7dSPeter Dunlap 
360a6d42e7dSPeter Dunlap 	if ((INADDR_NONE == addr) ||
361a6d42e7dSPeter Dunlap 	    (IN_MULTICAST(addr)) ||
362a6d42e7dSPeter Dunlap 	    ((addr >> IN_CLASSA_NSHIFT) == 0) ||
363a6d42e7dSPeter Dunlap 	    ((addr >> IN_CLASSA_NSHIFT) == IN_LOOPBACKNET)) {
364a6d42e7dSPeter Dunlap 		return (B_FALSE);
365a6d42e7dSPeter Dunlap 	}
366a6d42e7dSPeter Dunlap 	return (B_TRUE);
367a6d42e7dSPeter Dunlap }
368a6d42e7dSPeter Dunlap 
369a6d42e7dSPeter Dunlap static boolean_t
370a6d42e7dSPeter Dunlap idm_v6_addr_okay(struct in6_addr *addr6)
371a6d42e7dSPeter Dunlap {
372a6d42e7dSPeter Dunlap 
373a6d42e7dSPeter Dunlap 	if ((IN6_IS_ADDR_UNSPECIFIED(addr6)) ||
374a6d42e7dSPeter Dunlap 	    (IN6_IS_ADDR_LOOPBACK(addr6)) ||
375a6d42e7dSPeter Dunlap 	    (IN6_IS_ADDR_MULTICAST(addr6)) ||
376a6d42e7dSPeter Dunlap 	    (IN6_IS_ADDR_V4MAPPED(addr6)) ||
377a6d42e7dSPeter Dunlap 	    (IN6_IS_ADDR_V4COMPAT(addr6)) ||
378a6d42e7dSPeter Dunlap 	    (IN6_IS_ADDR_LINKLOCAL(addr6))) {
379a6d42e7dSPeter Dunlap 		return (B_FALSE);
380a6d42e7dSPeter Dunlap 	}
381a6d42e7dSPeter Dunlap 	return (B_TRUE);
382a6d42e7dSPeter Dunlap }
383a6d42e7dSPeter Dunlap 
384a6d42e7dSPeter Dunlap /*
385a6d42e7dSPeter Dunlap  * idm_get_ipaddr will retrieve a list of IP Addresses which the host is
386a6d42e7dSPeter Dunlap  * configured with by sending down a sequence of kernel ioctl to IP STREAMS.
387a6d42e7dSPeter Dunlap  */
388a6d42e7dSPeter Dunlap int
389a6d42e7dSPeter Dunlap idm_get_ipaddr(idm_addr_list_t **ipaddr_p)
390a6d42e7dSPeter Dunlap {
3910f1702c5SYu Xiangning 	ksocket_t 		so4, so6;
392a6d42e7dSPeter Dunlap 	struct lifnum		lifn;
393a6d42e7dSPeter Dunlap 	struct lifconf		lifc;
394a6d42e7dSPeter Dunlap 	struct lifreq		*lp;
395a6d42e7dSPeter Dunlap 	int			rval;
396a6d42e7dSPeter Dunlap 	int			numifs;
397a6d42e7dSPeter Dunlap 	int			bufsize;
398a6d42e7dSPeter Dunlap 	void			*buf;
399a6d42e7dSPeter Dunlap 	int			i, j, n, rc;
400a6d42e7dSPeter Dunlap 	struct sockaddr_storage	ss;
401a6d42e7dSPeter Dunlap 	struct sockaddr_in	*sin;
402a6d42e7dSPeter Dunlap 	struct sockaddr_in6	*sin6;
403a6d42e7dSPeter Dunlap 	idm_addr_t		*ip;
404fcc214c3SCharles Ting 	idm_addr_list_t		*ipaddr = NULL;
405a6d42e7dSPeter Dunlap 	int			size_ipaddr;
406a6d42e7dSPeter Dunlap 
407a6d42e7dSPeter Dunlap 	*ipaddr_p = NULL;
408a6d42e7dSPeter Dunlap 	size_ipaddr = 0;
409a6d42e7dSPeter Dunlap 	buf = NULL;
410a6d42e7dSPeter Dunlap 
411a6d42e7dSPeter Dunlap 	/* create an ipv4 and ipv6 UDP socket */
412a6d42e7dSPeter Dunlap 	if ((so6 = idm_socreate(PF_INET6, SOCK_DGRAM, 0)) == NULL)
413a6d42e7dSPeter Dunlap 		return (0);
414a6d42e7dSPeter Dunlap 	if ((so4 = idm_socreate(PF_INET, SOCK_DGRAM, 0)) == NULL) {
415a6d42e7dSPeter Dunlap 		idm_sodestroy(so6);
416a6d42e7dSPeter Dunlap 		return (0);
417a6d42e7dSPeter Dunlap 	}
418a6d42e7dSPeter Dunlap 
419a6d42e7dSPeter Dunlap 
420a6d42e7dSPeter Dunlap retry_count:
421a6d42e7dSPeter Dunlap 	/* snapshot the current number of interfaces */
422a6d42e7dSPeter Dunlap 	lifn.lifn_family = PF_UNSPEC;
423a6d42e7dSPeter Dunlap 	lifn.lifn_flags = LIFC_NOXMIT | LIFC_TEMPORARY | LIFC_ALLZONES;
424a6d42e7dSPeter Dunlap 	lifn.lifn_count = 0;
4250f1702c5SYu Xiangning 	/* use vp6 for ioctls with unspecified families by default */
4260f1702c5SYu Xiangning 	if (ksocket_ioctl(so6, SIOCGLIFNUM, (intptr_t)&lifn, &rval, CRED())
4270f1702c5SYu Xiangning 	    != 0) {
428a6d42e7dSPeter Dunlap 		goto cleanup;
429a6d42e7dSPeter Dunlap 	}
430a6d42e7dSPeter Dunlap 
431a6d42e7dSPeter Dunlap 	numifs = lifn.lifn_count;
432a6d42e7dSPeter Dunlap 	if (numifs <= 0) {
433a6d42e7dSPeter Dunlap 		goto cleanup;
434a6d42e7dSPeter Dunlap 	}
435a6d42e7dSPeter Dunlap 
436a6d42e7dSPeter Dunlap 	/* allocate extra room in case more interfaces appear */
437a6d42e7dSPeter Dunlap 	numifs += 10;
438a6d42e7dSPeter Dunlap 
439a6d42e7dSPeter Dunlap 	/* get the interface names and ip addresses */
440a6d42e7dSPeter Dunlap 	bufsize = numifs * sizeof (struct lifreq);
441a6d42e7dSPeter Dunlap 	buf = kmem_alloc(bufsize, KM_SLEEP);
442a6d42e7dSPeter Dunlap 
443a6d42e7dSPeter Dunlap 	lifc.lifc_family = AF_UNSPEC;
444a6d42e7dSPeter Dunlap 	lifc.lifc_flags = LIFC_NOXMIT | LIFC_TEMPORARY | LIFC_ALLZONES;
445a6d42e7dSPeter Dunlap 	lifc.lifc_len = bufsize;
446a6d42e7dSPeter Dunlap 	lifc.lifc_buf = buf;
4470f1702c5SYu Xiangning 	rc = ksocket_ioctl(so6, SIOCGLIFCONF, (intptr_t)&lifc, &rval, CRED());
448a6d42e7dSPeter Dunlap 	if (rc != 0) {
449a6d42e7dSPeter Dunlap 		goto cleanup;
450a6d42e7dSPeter Dunlap 	}
451a6d42e7dSPeter Dunlap 	/* if our extra room is used up, try again */
452a6d42e7dSPeter Dunlap 	if (bufsize <= lifc.lifc_len) {
453a6d42e7dSPeter Dunlap 		kmem_free(buf, bufsize);
454a6d42e7dSPeter Dunlap 		buf = NULL;
455a6d42e7dSPeter Dunlap 		goto retry_count;
456a6d42e7dSPeter Dunlap 	}
457a6d42e7dSPeter Dunlap 	/* calc actual number of ifconfs */
458a6d42e7dSPeter Dunlap 	n = lifc.lifc_len / sizeof (struct lifreq);
459a6d42e7dSPeter Dunlap 
460a6d42e7dSPeter Dunlap 	/* get ip address */
461a6d42e7dSPeter Dunlap 	if (n > 0) {
462a6d42e7dSPeter Dunlap 		size_ipaddr = sizeof (idm_addr_list_t) +
463a6d42e7dSPeter Dunlap 		    (n - 1) * sizeof (idm_addr_t);
464a6d42e7dSPeter Dunlap 		ipaddr = kmem_zalloc(size_ipaddr, KM_SLEEP);
465a6d42e7dSPeter Dunlap 	} else {
466a6d42e7dSPeter Dunlap 		goto cleanup;
467a6d42e7dSPeter Dunlap 	}
468a6d42e7dSPeter Dunlap 
469a6d42e7dSPeter Dunlap 	/*
470a6d42e7dSPeter Dunlap 	 * Examine the array of interfaces and filter uninteresting ones
471a6d42e7dSPeter Dunlap 	 */
472a6d42e7dSPeter Dunlap 	for (i = 0, j = 0, lp = lifc.lifc_req; i < n; i++, lp++) {
473a6d42e7dSPeter Dunlap 
474a6d42e7dSPeter Dunlap 		/*
475a6d42e7dSPeter Dunlap 		 * Copy the address as the SIOCGLIFFLAGS ioctl is destructive
476a6d42e7dSPeter Dunlap 		 */
477a6d42e7dSPeter Dunlap 		ss = lp->lifr_addr;
478a6d42e7dSPeter Dunlap 		/*
479a6d42e7dSPeter Dunlap 		 * fetch the flags using the socket of the correct family
480a6d42e7dSPeter Dunlap 		 */
481a6d42e7dSPeter Dunlap 		switch (ss.ss_family) {
482a6d42e7dSPeter Dunlap 		case AF_INET:
4830f1702c5SYu Xiangning 			rc = ksocket_ioctl(so4, SIOCGLIFFLAGS, (intptr_t)lp,
4840f1702c5SYu Xiangning 			    &rval, CRED());
485a6d42e7dSPeter Dunlap 			break;
486a6d42e7dSPeter Dunlap 		case AF_INET6:
4870f1702c5SYu Xiangning 			rc = ksocket_ioctl(so6, SIOCGLIFFLAGS, (intptr_t)lp,
4880f1702c5SYu Xiangning 			    &rval, CRED());
489a6d42e7dSPeter Dunlap 			break;
490a6d42e7dSPeter Dunlap 		default:
491a6d42e7dSPeter Dunlap 			continue;
492a6d42e7dSPeter Dunlap 		}
493a6d42e7dSPeter Dunlap 		if (rc == 0) {
494a6d42e7dSPeter Dunlap 			/*
495a6d42e7dSPeter Dunlap 			 * If we got the flags, skip uninteresting
496a6d42e7dSPeter Dunlap 			 * interfaces based on flags
497a6d42e7dSPeter Dunlap 			 */
498a6d42e7dSPeter Dunlap 			if ((lp->lifr_flags & IFF_UP) != IFF_UP)
499a6d42e7dSPeter Dunlap 				continue;
500a6d42e7dSPeter Dunlap 			if (lp->lifr_flags &
501a6d42e7dSPeter Dunlap 			    (IFF_ANYCAST|IFF_NOLOCAL|IFF_DEPRECATED))
502a6d42e7dSPeter Dunlap 				continue;
503a6d42e7dSPeter Dunlap 		}
504a6d42e7dSPeter Dunlap 
505a6d42e7dSPeter Dunlap 		/* save ip address */
506a6d42e7dSPeter Dunlap 		ip = &ipaddr->al_addrs[j];
507a6d42e7dSPeter Dunlap 		switch (ss.ss_family) {
508a6d42e7dSPeter Dunlap 		case AF_INET:
509a6d42e7dSPeter Dunlap 			sin = (struct sockaddr_in *)&ss;
510a6d42e7dSPeter Dunlap 			if (!idm_v4_addr_okay(&sin->sin_addr))
511a6d42e7dSPeter Dunlap 				continue;
512a6d42e7dSPeter Dunlap 			ip->a_addr.i_addr.in4 = sin->sin_addr;
513a6d42e7dSPeter Dunlap 			ip->a_addr.i_insize = sizeof (struct in_addr);
514a6d42e7dSPeter Dunlap 			break;
515a6d42e7dSPeter Dunlap 		case AF_INET6:
516a6d42e7dSPeter Dunlap 			sin6 = (struct sockaddr_in6 *)&ss;
517a6d42e7dSPeter Dunlap 			if (!idm_v6_addr_okay(&sin6->sin6_addr))
518a6d42e7dSPeter Dunlap 				continue;
519a6d42e7dSPeter Dunlap 			ip->a_addr.i_addr.in6 = sin6->sin6_addr;
520a6d42e7dSPeter Dunlap 			ip->a_addr.i_insize = sizeof (struct in6_addr);
521a6d42e7dSPeter Dunlap 			break;
522a6d42e7dSPeter Dunlap 		default:
523a6d42e7dSPeter Dunlap 			continue;
524a6d42e7dSPeter Dunlap 		}
525a6d42e7dSPeter Dunlap 		j++;
526a6d42e7dSPeter Dunlap 	}
527a6d42e7dSPeter Dunlap 
528a6d42e7dSPeter Dunlap 	if (j == 0) {
529a6d42e7dSPeter Dunlap 		/* no valid ifaddr */
530a6d42e7dSPeter Dunlap 		kmem_free(ipaddr, size_ipaddr);
531a6d42e7dSPeter Dunlap 		size_ipaddr = 0;
532a6d42e7dSPeter Dunlap 		ipaddr = NULL;
533a6d42e7dSPeter Dunlap 	} else {
534a6d42e7dSPeter Dunlap 		ipaddr->al_out_cnt = j;
535a6d42e7dSPeter Dunlap 	}
536a6d42e7dSPeter Dunlap 
537a6d42e7dSPeter Dunlap 
538a6d42e7dSPeter Dunlap cleanup:
539a6d42e7dSPeter Dunlap 	idm_sodestroy(so6);
540a6d42e7dSPeter Dunlap 	idm_sodestroy(so4);
541a6d42e7dSPeter Dunlap 
542a6d42e7dSPeter Dunlap 	if (buf != NULL)
543a6d42e7dSPeter Dunlap 		kmem_free(buf, bufsize);
544a6d42e7dSPeter Dunlap 
545a6d42e7dSPeter Dunlap 	*ipaddr_p = ipaddr;
546a6d42e7dSPeter Dunlap 	return (size_ipaddr);
547a6d42e7dSPeter Dunlap }
548a6d42e7dSPeter Dunlap 
549a6d42e7dSPeter Dunlap int
5500f1702c5SYu Xiangning idm_sorecv(ksocket_t so, void *msg, size_t len)
551a6d42e7dSPeter Dunlap {
552a6d42e7dSPeter Dunlap 	iovec_t iov;
553a6d42e7dSPeter Dunlap 
554a6d42e7dSPeter Dunlap 	ASSERT(so != NULL);
555a6d42e7dSPeter Dunlap 	ASSERT(len != 0);
556a6d42e7dSPeter Dunlap 
557a6d42e7dSPeter Dunlap 	/*
558a6d42e7dSPeter Dunlap 	 * Fill in iovec and receive data
559a6d42e7dSPeter Dunlap 	 */
560a6d42e7dSPeter Dunlap 	iov.iov_base = msg;
561a6d42e7dSPeter Dunlap 	iov.iov_len = len;
562a6d42e7dSPeter Dunlap 
563a6d42e7dSPeter Dunlap 	return (idm_iov_sorecv(so, &iov, 1, len));
564a6d42e7dSPeter Dunlap }
565a6d42e7dSPeter Dunlap 
566a6d42e7dSPeter Dunlap /*
567a6d42e7dSPeter Dunlap  * idm_sosendto - Sends a buffered data on a non-connected socket.
568a6d42e7dSPeter Dunlap  *
569a6d42e7dSPeter Dunlap  * This function puts the data provided on the wire by calling sosendmsg.
570a6d42e7dSPeter Dunlap  * It will return only when all the data has been sent or if an error
571a6d42e7dSPeter Dunlap  * occurs.
572a6d42e7dSPeter Dunlap  *
573a6d42e7dSPeter Dunlap  * Returns 0 for success, the socket errno value if sosendmsg fails, and
574a6d42e7dSPeter Dunlap  * -1 if sosendmsg returns success but uio_resid != 0
575a6d42e7dSPeter Dunlap  */
576a6d42e7dSPeter Dunlap int
5770f1702c5SYu Xiangning idm_sosendto(ksocket_t so, void *buff, size_t len,
578a6d42e7dSPeter Dunlap     struct sockaddr *name, socklen_t namelen)
579a6d42e7dSPeter Dunlap {
580a6d42e7dSPeter Dunlap 	struct msghdr		msg;
581a6d42e7dSPeter Dunlap 	struct iovec		iov[1];
582a6d42e7dSPeter Dunlap 	int			error;
5830f1702c5SYu Xiangning 	size_t			sent = 0;
584a6d42e7dSPeter Dunlap 
585a6d42e7dSPeter Dunlap 	iov[0].iov_base	= buff;
586a6d42e7dSPeter Dunlap 	iov[0].iov_len	= len;
587a6d42e7dSPeter Dunlap 
588a6d42e7dSPeter Dunlap 	/* Initialization of the message header. */
589a6d42e7dSPeter Dunlap 	bzero(&msg, sizeof (msg));
590a6d42e7dSPeter Dunlap 	msg.msg_iov	= iov;
591a6d42e7dSPeter Dunlap 	msg.msg_iovlen	= 1;
592a6d42e7dSPeter Dunlap 	msg.msg_name	= name;
593a6d42e7dSPeter Dunlap 	msg.msg_namelen	= namelen;
594a6d42e7dSPeter Dunlap 
5950f1702c5SYu Xiangning 	if ((error = ksocket_sendmsg(so, &msg, 0, &sent, CRED())) == 0) {
596a6d42e7dSPeter Dunlap 		/* Data sent */
5970f1702c5SYu Xiangning 		if (sent == len) {
598a6d42e7dSPeter Dunlap 			/* All data sent.  Success. */
599a6d42e7dSPeter Dunlap 			return (0);
600a6d42e7dSPeter Dunlap 		} else {
601a6d42e7dSPeter Dunlap 			/* Not all data was sent.  Failure */
602a6d42e7dSPeter Dunlap 			return (-1);
603a6d42e7dSPeter Dunlap 		}
604a6d42e7dSPeter Dunlap 	}
605a6d42e7dSPeter Dunlap 
606a6d42e7dSPeter Dunlap 	/* Send failed */
607a6d42e7dSPeter Dunlap 	return (error);
608a6d42e7dSPeter Dunlap }
609a6d42e7dSPeter Dunlap 
610a6d42e7dSPeter Dunlap /*
611a6d42e7dSPeter Dunlap  * idm_iov_sosend - Sends an iovec on a connection.
612a6d42e7dSPeter Dunlap  *
613a6d42e7dSPeter Dunlap  * This function puts the data provided on the wire by calling sosendmsg.
614a6d42e7dSPeter Dunlap  * It will return only when all the data has been sent or if an error
615a6d42e7dSPeter Dunlap  * occurs.
616a6d42e7dSPeter Dunlap  *
617a6d42e7dSPeter Dunlap  * Returns 0 for success, the socket errno value if sosendmsg fails, and
618a6d42e7dSPeter Dunlap  * -1 if sosendmsg returns success but uio_resid != 0
619a6d42e7dSPeter Dunlap  */
620a6d42e7dSPeter Dunlap int
6210f1702c5SYu Xiangning idm_iov_sosend(ksocket_t so, iovec_t *iop, int iovlen, size_t total_len)
622a6d42e7dSPeter Dunlap {
623a6d42e7dSPeter Dunlap 	struct msghdr		msg;
624a6d42e7dSPeter Dunlap 	int			error;
6250f1702c5SYu Xiangning 	size_t 			sent = 0;
626a6d42e7dSPeter Dunlap 
627a6d42e7dSPeter Dunlap 	ASSERT(iop != NULL);
628a6d42e7dSPeter Dunlap 
629a6d42e7dSPeter Dunlap 	/* Initialization of the message header. */
630a6d42e7dSPeter Dunlap 	bzero(&msg, sizeof (msg));
631a6d42e7dSPeter Dunlap 	msg.msg_iov	= iop;
632a6d42e7dSPeter Dunlap 	msg.msg_iovlen	= iovlen;
633a6d42e7dSPeter Dunlap 
6340f1702c5SYu Xiangning 	if ((error = ksocket_sendmsg(so, &msg, 0, &sent, CRED()))
6350f1702c5SYu Xiangning 	    == 0) {
636a6d42e7dSPeter Dunlap 		/* Data sent */
6370f1702c5SYu Xiangning 		if (sent == total_len) {
638a6d42e7dSPeter Dunlap 			/* All data sent.  Success. */
639a6d42e7dSPeter Dunlap 			return (0);
640a6d42e7dSPeter Dunlap 		} else {
641a6d42e7dSPeter Dunlap 			/* Not all data was sent.  Failure */
642a6d42e7dSPeter Dunlap 			return (-1);
643a6d42e7dSPeter Dunlap 		}
644a6d42e7dSPeter Dunlap 	}
645a6d42e7dSPeter Dunlap 
646a6d42e7dSPeter Dunlap 	/* Send failed */
647a6d42e7dSPeter Dunlap 	return (error);
648a6d42e7dSPeter Dunlap }
649a6d42e7dSPeter Dunlap 
650a6d42e7dSPeter Dunlap /*
651a6d42e7dSPeter Dunlap  * idm_iov_sorecv - Receives an iovec from a connection
652a6d42e7dSPeter Dunlap  *
653a6d42e7dSPeter Dunlap  * This function gets the data asked for from the socket.  It will return
654a6d42e7dSPeter Dunlap  * only when all the requested data has been retrieved or if an error
655a6d42e7dSPeter Dunlap  * occurs.
656a6d42e7dSPeter Dunlap  *
657a6d42e7dSPeter Dunlap  * Returns 0 for success, the socket errno value if sorecvmsg fails, and
658a6d42e7dSPeter Dunlap  * -1 if sorecvmsg returns success but uio_resid != 0
659a6d42e7dSPeter Dunlap  */
660a6d42e7dSPeter Dunlap int
6610f1702c5SYu Xiangning idm_iov_sorecv(ksocket_t so, iovec_t *iop, int iovlen, size_t total_len)
662a6d42e7dSPeter Dunlap {
663a6d42e7dSPeter Dunlap 	struct msghdr		msg;
664a6d42e7dSPeter Dunlap 	int			error;
6650f1702c5SYu Xiangning 	size_t			recv;
6660f1702c5SYu Xiangning 	int 			flags;
667a6d42e7dSPeter Dunlap 
668a6d42e7dSPeter Dunlap 	ASSERT(iop != NULL);
669a6d42e7dSPeter Dunlap 
670a6d42e7dSPeter Dunlap 	/* Initialization of the message header. */
671a6d42e7dSPeter Dunlap 	bzero(&msg, sizeof (msg));
672a6d42e7dSPeter Dunlap 	msg.msg_iov	= iop;
673a6d42e7dSPeter Dunlap 	msg.msg_iovlen	= iovlen;
6740f1702c5SYu Xiangning 	flags		= MSG_WAITALL;
675a6d42e7dSPeter Dunlap 
6760f1702c5SYu Xiangning 	if ((error = ksocket_recvmsg(so, &msg, flags, &recv, CRED()))
6770f1702c5SYu Xiangning 	    == 0) {
678a6d42e7dSPeter Dunlap 		/* Received data */
6790f1702c5SYu Xiangning 		if (recv == total_len) {
680a6d42e7dSPeter Dunlap 			/* All requested data received.  Success */
681a6d42e7dSPeter Dunlap 			return (0);
682a6d42e7dSPeter Dunlap 		} else {
683a6d42e7dSPeter Dunlap 			/*
684a6d42e7dSPeter Dunlap 			 * Not all data was received.  The connection has
685a6d42e7dSPeter Dunlap 			 * probably failed.
686a6d42e7dSPeter Dunlap 			 */
687a6d42e7dSPeter Dunlap 			return (-1);
688a6d42e7dSPeter Dunlap 		}
689a6d42e7dSPeter Dunlap 	}
690a6d42e7dSPeter Dunlap 
691a6d42e7dSPeter Dunlap 	/* Receive failed */
692a6d42e7dSPeter Dunlap 	return (error);
693a6d42e7dSPeter Dunlap }
694a6d42e7dSPeter Dunlap 
695a6d42e7dSPeter Dunlap static void
696dedec472SJack Meng idm_set_ini_preconnect_options(idm_so_conn_t *sc, boolean_t boot_conn)
697a6d42e7dSPeter Dunlap {
698a6d42e7dSPeter Dunlap 	int	conn_abort = 10000;
699a6d42e7dSPeter Dunlap 	int	conn_notify = 2000;
700a6d42e7dSPeter Dunlap 	int	abort = 30000;
701a6d42e7dSPeter Dunlap 
702a6d42e7dSPeter Dunlap 	/* Pre-connect socket options */
7030f1702c5SYu Xiangning 	(void) ksocket_setsockopt(sc->ic_so, IPPROTO_TCP,
7040f1702c5SYu Xiangning 	    TCP_CONN_NOTIFY_THRESHOLD, (char *)&conn_notify, sizeof (int),
7050f1702c5SYu Xiangning 	    CRED());
706dedec472SJack Meng 	if (boot_conn == B_FALSE) {
707dedec472SJack Meng 		(void) ksocket_setsockopt(sc->ic_so, IPPROTO_TCP,
708dedec472SJack Meng 		    TCP_CONN_ABORT_THRESHOLD, (char *)&conn_abort, sizeof (int),
709dedec472SJack Meng 		    CRED());
710dedec472SJack Meng 		(void) ksocket_setsockopt(sc->ic_so, IPPROTO_TCP,
711dedec472SJack Meng 		    TCP_ABORT_THRESHOLD,
712dedec472SJack Meng 		    (char *)&abort, sizeof (int), CRED());
713dedec472SJack Meng 	}
714a6d42e7dSPeter Dunlap }
715a6d42e7dSPeter Dunlap 
716a6d42e7dSPeter Dunlap static void
7170f94976eSJeff Biseda idm_set_postconnect_options(ksocket_t ks)
718a6d42e7dSPeter Dunlap {
719a6d42e7dSPeter Dunlap 	const int	on = 1;
720a6d42e7dSPeter Dunlap 
721a6d42e7dSPeter Dunlap 	/* Set connect options */
7220f1702c5SYu Xiangning 	(void) ksocket_setsockopt(ks, SOL_SOCKET, SO_RCVBUF,
723f99db78fSChristopher Siden 	    (char *)&idm_so_rcvbuf, sizeof (idm_so_rcvbuf), CRED());
7240f1702c5SYu Xiangning 	(void) ksocket_setsockopt(ks, SOL_SOCKET, SO_SNDBUF,
725f99db78fSChristopher Siden 	    (char *)&idm_so_sndbuf, sizeof (idm_so_sndbuf), CRED());
7260f1702c5SYu Xiangning 	(void) ksocket_setsockopt(ks, IPPROTO_TCP, TCP_NODELAY,
7270f1702c5SYu Xiangning 	    (char *)&on, sizeof (on), CRED());
728a6d42e7dSPeter Dunlap }
729a6d42e7dSPeter Dunlap 
730a6d42e7dSPeter Dunlap static uint32_t
731a6d42e7dSPeter Dunlap n2h24(const uchar_t *ptr)
732a6d42e7dSPeter Dunlap {
733a6d42e7dSPeter Dunlap 	return ((ptr[0] << 16) | (ptr[1] << 8) | ptr[2]);
734a6d42e7dSPeter Dunlap }
735a6d42e7dSPeter Dunlap 
736*2727bb05STim Kordas static boolean_t
737*2727bb05STim Kordas idm_dataseglenokay(idm_conn_t *ic, idm_pdu_t *pdu)
738*2727bb05STim Kordas {
739*2727bb05STim Kordas 	iscsi_hdr_t	*bhs;
740*2727bb05STim Kordas 
741*2727bb05STim Kordas 	if (ic->ic_conn_type == CONN_TYPE_TGT &&
742*2727bb05STim Kordas 	    pdu->isp_datalen > ic->ic_conn_params.max_recv_dataseglen) {
743*2727bb05STim Kordas 		IDM_CONN_LOG(CE_WARN,
744*2727bb05STim Kordas 		    "idm_dataseglenokay: exceeded the max data segment length");
745*2727bb05STim Kordas 		return (B_FALSE);
746*2727bb05STim Kordas 	}
747*2727bb05STim Kordas 
748*2727bb05STim Kordas 	bhs = pdu->isp_hdr;
749*2727bb05STim Kordas 	/*
750*2727bb05STim Kordas 	 * Filter out any RFC3720 data-size violations.
751*2727bb05STim Kordas 	 */
752*2727bb05STim Kordas 	switch (IDM_PDU_OPCODE(pdu)) {
753*2727bb05STim Kordas 	case ISCSI_OP_SCSI_TASK_MGT_MSG:
754*2727bb05STim Kordas 	case ISCSI_OP_SCSI_TASK_MGT_RSP:
755*2727bb05STim Kordas 	case ISCSI_OP_RTT_RSP:
756*2727bb05STim Kordas 	case ISCSI_OP_LOGOUT_CMD:
757*2727bb05STim Kordas 		/*
758*2727bb05STim Kordas 		 * Data-segment not allowed and additional headers not allowed.
759*2727bb05STim Kordas 		 * (both must be zero according to the RFC3720.)
760*2727bb05STim Kordas 		 */
761*2727bb05STim Kordas 		if (bhs->hlength != 0 || pdu->isp_datalen != 0)
762*2727bb05STim Kordas 			return (B_FALSE);
763*2727bb05STim Kordas 		break;
764*2727bb05STim Kordas 	case ISCSI_OP_NOOP_OUT:
765*2727bb05STim Kordas 	case ISCSI_OP_LOGIN_CMD:
766*2727bb05STim Kordas 	case ISCSI_OP_TEXT_CMD:
767*2727bb05STim Kordas 	case ISCSI_OP_SNACK_CMD:
768*2727bb05STim Kordas 	case ISCSI_OP_NOOP_IN:
769*2727bb05STim Kordas 	case ISCSI_OP_SCSI_RSP:
770*2727bb05STim Kordas 	case ISCSI_OP_LOGIN_RSP:
771*2727bb05STim Kordas 	case ISCSI_OP_TEXT_RSP:
772*2727bb05STim Kordas 	case ISCSI_OP_SCSI_DATA_RSP:
773*2727bb05STim Kordas 	case ISCSI_OP_LOGOUT_RSP:
774*2727bb05STim Kordas 	case ISCSI_OP_ASYNC_EVENT:
775*2727bb05STim Kordas 	case ISCSI_OP_REJECT_MSG:
776*2727bb05STim Kordas 		/*
777*2727bb05STim Kordas 		 * Additional headers not allowed.
778*2727bb05STim Kordas 		 * (must be zero according to RFC3720.)
779*2727bb05STim Kordas 		 */
780*2727bb05STim Kordas 		if (bhs->hlength)
781*2727bb05STim Kordas 			return (B_FALSE);
782*2727bb05STim Kordas 		break;
783*2727bb05STim Kordas 	case ISCSI_OP_SCSI_CMD:
784*2727bb05STim Kordas 		/*
785*2727bb05STim Kordas 		 * See RFC3720, section 10.3
786*2727bb05STim Kordas 		 *
787*2727bb05STim Kordas 		 * For pure read cmds, data-segment-length must be zero.
788*2727bb05STim Kordas 		 * For non-final transfers, data-size must be even number of
789*2727bb05STim Kordas 		 * 4-byte words.
790*2727bb05STim Kordas 		 * For any transfer, an expected byte count must be provided.
791*2727bb05STim Kordas 		 * For bidirectional transfers, an additional-header must be
792*2727bb05STim Kordas 		 * provided (for the read byte-count.)
793*2727bb05STim Kordas 		 */
794*2727bb05STim Kordas 		if (pdu->isp_datalen) {
795*2727bb05STim Kordas 			if ((bhs->flags & (ISCSI_FLAG_CMD_READ |
796*2727bb05STim Kordas 			    ISCSI_FLAG_CMD_WRITE)) == ISCSI_FLAG_CMD_READ)
797*2727bb05STim Kordas 				return (B_FALSE);
798*2727bb05STim Kordas 			if ((bhs->flags & ISCSI_FLAG_FINAL) == 0 &&
799*2727bb05STim Kordas 			    ((pdu->isp_datalen & 0x3) != 0))
800*2727bb05STim Kordas 				return (B_FALSE);
801*2727bb05STim Kordas 		}
802*2727bb05STim Kordas 		if (bhs->flags & (ISCSI_FLAG_CMD_READ |
803*2727bb05STim Kordas 		    ISCSI_FLAG_CMD_WRITE)) {
804*2727bb05STim Kordas 			iscsi_scsi_cmd_hdr_t *cmdhdr =
805*2727bb05STim Kordas 			    (iscsi_scsi_cmd_hdr_t *)bhs;
806*2727bb05STim Kordas 			/*
807*2727bb05STim Kordas 			 * we're transfering some data, we must have a
808*2727bb05STim Kordas 			 * byte count
809*2727bb05STim Kordas 			 */
810*2727bb05STim Kordas 			if (cmdhdr->data_length == 0)
811*2727bb05STim Kordas 				return (B_FALSE);
812*2727bb05STim Kordas 		}
813*2727bb05STim Kordas 		break;
814*2727bb05STim Kordas 	case ISCSI_OP_SCSI_DATA:
815*2727bb05STim Kordas 		/*
816*2727bb05STim Kordas 		 * See RFC3720, section 10.7
817*2727bb05STim Kordas 		 *
818*2727bb05STim Kordas 		 * Additional headers aren't allowed, and the data-size must
819*2727bb05STim Kordas 		 * be an even number of 4-byte words (unless the final bit
820*2727bb05STim Kordas 		 * is set.)
821*2727bb05STim Kordas 		 */
822*2727bb05STim Kordas 		if (bhs->hlength)
823*2727bb05STim Kordas 			return (B_FALSE);
824*2727bb05STim Kordas 		if ((bhs->flags & ISCSI_FLAG_FINAL) == 0 &&
825*2727bb05STim Kordas 		    ((pdu->isp_datalen & 0x3) != 0))
826*2727bb05STim Kordas 			return (B_FALSE);
827*2727bb05STim Kordas 		break;
828*2727bb05STim Kordas 	default:
829*2727bb05STim Kordas 		break;
830*2727bb05STim Kordas 	}
831*2727bb05STim Kordas 	return (B_TRUE);
832*2727bb05STim Kordas }
833a6d42e7dSPeter Dunlap 
834a6d42e7dSPeter Dunlap static idm_status_t
835a6d42e7dSPeter Dunlap idm_sorecvhdr(idm_conn_t *ic, idm_pdu_t *pdu)
836a6d42e7dSPeter Dunlap {
837a6d42e7dSPeter Dunlap 	iscsi_hdr_t	*bhs;
838a6d42e7dSPeter Dunlap 	uint32_t	hdr_digest_crc;
839a6d42e7dSPeter Dunlap 	uint32_t	crc_calculated;
840a6d42e7dSPeter Dunlap 	void		*new_hdr;
841a6d42e7dSPeter Dunlap 	int		ahslen = 0;
842a6d42e7dSPeter Dunlap 	int		total_len = 0;
843a6d42e7dSPeter Dunlap 	int		iovlen = 0;
844a6d42e7dSPeter Dunlap 	struct iovec	iov[2];
845a6d42e7dSPeter Dunlap 	idm_so_conn_t	*so_conn;
846a6d42e7dSPeter Dunlap 	int		rc;
847a6d42e7dSPeter Dunlap 
848a6d42e7dSPeter Dunlap 	so_conn = ic->ic_transport_private;
849a6d42e7dSPeter Dunlap 
850a6d42e7dSPeter Dunlap 	/*
851a6d42e7dSPeter Dunlap 	 * Read BHS
852a6d42e7dSPeter Dunlap 	 */
853a6d42e7dSPeter Dunlap 	bhs = pdu->isp_hdr;
854a6d42e7dSPeter Dunlap 	rc = idm_sorecv(so_conn->ic_so, pdu->isp_hdr, sizeof (iscsi_hdr_t));
855a6d42e7dSPeter Dunlap 	if (rc != IDM_STATUS_SUCCESS) {
856a6d42e7dSPeter Dunlap 		return (IDM_STATUS_FAIL);
857a6d42e7dSPeter Dunlap 	}
858a6d42e7dSPeter Dunlap 
859a6d42e7dSPeter Dunlap 	/*
860a6d42e7dSPeter Dunlap 	 * Check actual AHS length against the amount available in the buffer
861a6d42e7dSPeter Dunlap 	 */
862a6d42e7dSPeter Dunlap 	pdu->isp_hdrlen = sizeof (iscsi_hdr_t) +
863a6d42e7dSPeter Dunlap 	    (bhs->hlength * sizeof (uint32_t));
864a6d42e7dSPeter Dunlap 	pdu->isp_datalen = n2h24(bhs->dlength);
865*2727bb05STim Kordas 
866*2727bb05STim Kordas 	if (!idm_dataseglenokay(ic, pdu)) {
86756261083SCharles Ting 		IDM_CONN_LOG(CE_WARN,
868*2727bb05STim Kordas 		    "idm_sorecvhdr: invalid data segment length");
86956261083SCharles Ting 		return (IDM_STATUS_FAIL);
87056261083SCharles Ting 	}
871a6d42e7dSPeter Dunlap 	if (bhs->hlength > IDM_SORX_CACHE_AHSLEN) {
872a6d42e7dSPeter Dunlap 		/* Allocate a new header segment and change the callback */
873a6d42e7dSPeter Dunlap 		new_hdr = kmem_alloc(pdu->isp_hdrlen, KM_SLEEP);
874a6d42e7dSPeter Dunlap 		bcopy(pdu->isp_hdr, new_hdr, sizeof (iscsi_hdr_t));
875a6d42e7dSPeter Dunlap 		pdu->isp_hdr = new_hdr;
876a6d42e7dSPeter Dunlap 		pdu->isp_flags |= IDM_PDU_ADDL_HDR;
877a6d42e7dSPeter Dunlap 
878a6d42e7dSPeter Dunlap 		/*
879a6d42e7dSPeter Dunlap 		 * This callback will restore the expected values after
880a6d42e7dSPeter Dunlap 		 * the RX PDU has been processed.
881a6d42e7dSPeter Dunlap 		 */
882a6d42e7dSPeter Dunlap 		pdu->isp_callback = idm_sorx_addl_pdu_cb;
883a6d42e7dSPeter Dunlap 	}
884a6d42e7dSPeter Dunlap 
885a6d42e7dSPeter Dunlap 	/*
886a6d42e7dSPeter Dunlap 	 * Setup receipt of additional header and header digest (if enabled).
887a6d42e7dSPeter Dunlap 	 */
888a6d42e7dSPeter Dunlap 	if (bhs->hlength > 0) {
889a6d42e7dSPeter Dunlap 		iov[iovlen].iov_base = (caddr_t)(pdu->isp_hdr + 1);
890a6d42e7dSPeter Dunlap 		ahslen = pdu->isp_hdrlen - sizeof (iscsi_hdr_t);
891a6d42e7dSPeter Dunlap 		iov[iovlen].iov_len = ahslen;
892a6d42e7dSPeter Dunlap 		total_len += iov[iovlen].iov_len;
893a6d42e7dSPeter Dunlap 		iovlen++;
894a6d42e7dSPeter Dunlap 	}
895a6d42e7dSPeter Dunlap 
896a6d42e7dSPeter Dunlap 	if (ic->ic_conn_flags & IDM_CONN_HEADER_DIGEST) {
897a6d42e7dSPeter Dunlap 		iov[iovlen].iov_base = (caddr_t)&hdr_digest_crc;
898a6d42e7dSPeter Dunlap 		iov[iovlen].iov_len = sizeof (hdr_digest_crc);
899a6d42e7dSPeter Dunlap 		total_len += iov[iovlen].iov_len;
900a6d42e7dSPeter Dunlap 		iovlen++;
901a6d42e7dSPeter Dunlap 	}
902a6d42e7dSPeter Dunlap 
903a6d42e7dSPeter Dunlap 	if ((iovlen != 0) &&
904a6d42e7dSPeter Dunlap 	    (idm_iov_sorecv(so_conn->ic_so, &iov[0], iovlen,
905a6d42e7dSPeter Dunlap 	    total_len) != 0)) {
906a6d42e7dSPeter Dunlap 		return (IDM_STATUS_FAIL);
907a6d42e7dSPeter Dunlap 	}
908a6d42e7dSPeter Dunlap 
909a6d42e7dSPeter Dunlap 	/*
910a6d42e7dSPeter Dunlap 	 * Validate header digest if enabled
911a6d42e7dSPeter Dunlap 	 */
912a6d42e7dSPeter Dunlap 	if (ic->ic_conn_flags & IDM_CONN_HEADER_DIGEST) {
913a6d42e7dSPeter Dunlap 		crc_calculated = idm_crc32c(pdu->isp_hdr,
914a6d42e7dSPeter Dunlap 		    sizeof (iscsi_hdr_t) + ahslen);
915a6d42e7dSPeter Dunlap 		if (crc_calculated != hdr_digest_crc) {
916a6d42e7dSPeter Dunlap 			/* Invalid Header Digest */
917a6d42e7dSPeter Dunlap 			return (IDM_STATUS_HEADER_DIGEST);
918a6d42e7dSPeter Dunlap 		}
919a6d42e7dSPeter Dunlap 	}
920a6d42e7dSPeter Dunlap 
921a6d42e7dSPeter Dunlap 	return (0);
922a6d42e7dSPeter Dunlap }
923a6d42e7dSPeter Dunlap 
924a6d42e7dSPeter Dunlap /*
925a6d42e7dSPeter Dunlap  * idm_so_ini_conn_create()
926a6d42e7dSPeter Dunlap  * Allocate the sockets transport connection resources.
927a6d42e7dSPeter Dunlap  */
928a6d42e7dSPeter Dunlap static idm_status_t
929a6d42e7dSPeter Dunlap idm_so_ini_conn_create(idm_conn_req_t *cr, idm_conn_t *ic)
930a6d42e7dSPeter Dunlap {
9310f1702c5SYu Xiangning 	ksocket_t	so;
932a6d42e7dSPeter Dunlap 	idm_so_conn_t	*so_conn;
933a6d42e7dSPeter Dunlap 	idm_status_t	idmrc;
934a6d42e7dSPeter Dunlap 
935a6d42e7dSPeter Dunlap 	so = idm_socreate(cr->cr_domain, cr->cr_type,
936a6d42e7dSPeter Dunlap 	    cr->cr_protocol);
937a6d42e7dSPeter Dunlap 	if (so == NULL) {
938a6d42e7dSPeter Dunlap 		return (IDM_STATUS_FAIL);
939a6d42e7dSPeter Dunlap 	}
940a6d42e7dSPeter Dunlap 
941a6d42e7dSPeter Dunlap 	/* Bind the socket if configured to do so */
942a6d42e7dSPeter Dunlap 	if (cr->cr_bound) {
9430f1702c5SYu Xiangning 		if (ksocket_bind(so, &cr->cr_bound_addr.sin,
9440f1702c5SYu Xiangning 		    SIZEOF_SOCKADDR(&cr->cr_bound_addr.sin), CRED()) != 0) {
945a6d42e7dSPeter Dunlap 			idm_sodestroy(so);
946a6d42e7dSPeter Dunlap 			return (IDM_STATUS_FAIL);
947a6d42e7dSPeter Dunlap 		}
948a6d42e7dSPeter Dunlap 	}
949a6d42e7dSPeter Dunlap 
950a6d42e7dSPeter Dunlap 	idmrc = idm_so_conn_create_common(ic, so);
951a6d42e7dSPeter Dunlap 	if (idmrc != IDM_STATUS_SUCCESS) {
952a6d42e7dSPeter Dunlap 		idm_soshutdown(so);
953a6d42e7dSPeter Dunlap 		idm_sodestroy(so);
954a6d42e7dSPeter Dunlap 		return (IDM_STATUS_FAIL);
955a6d42e7dSPeter Dunlap 	}
956a6d42e7dSPeter Dunlap 
957a6d42e7dSPeter Dunlap 	so_conn = ic->ic_transport_private;
958a6d42e7dSPeter Dunlap 	/* Set up socket options */
959dedec472SJack Meng 	idm_set_ini_preconnect_options(so_conn, cr->cr_boot_conn);
960a6d42e7dSPeter Dunlap 
961a6d42e7dSPeter Dunlap 	return (IDM_STATUS_SUCCESS);
962a6d42e7dSPeter Dunlap }
963a6d42e7dSPeter Dunlap 
964a6d42e7dSPeter Dunlap /*
965a6d42e7dSPeter Dunlap  * idm_so_ini_conn_destroy()
966a6d42e7dSPeter Dunlap  * Tear down the sockets transport connection resources.
967a6d42e7dSPeter Dunlap  */
968a6d42e7dSPeter Dunlap static void
969a6d42e7dSPeter Dunlap idm_so_ini_conn_destroy(idm_conn_t *ic)
970a6d42e7dSPeter Dunlap {
971a6d42e7dSPeter Dunlap 	idm_so_conn_destroy_common(ic);
972a6d42e7dSPeter Dunlap }
973a6d42e7dSPeter Dunlap 
974a6d42e7dSPeter Dunlap /*
975a6d42e7dSPeter Dunlap  * idm_so_ini_conn_connect()
976a6d42e7dSPeter Dunlap  * Establish the connection referred to by the handle previously allocated via
977a6d42e7dSPeter Dunlap  * idm_so_ini_conn_create().
978a6d42e7dSPeter Dunlap  */
979a6d42e7dSPeter Dunlap static idm_status_t
980a6d42e7dSPeter Dunlap idm_so_ini_conn_connect(idm_conn_t *ic)
981a6d42e7dSPeter Dunlap {
982a6d42e7dSPeter Dunlap 	idm_so_conn_t	*so_conn;
983aff4bce5Syi zhang - Sun Microsystems - Beijing China 	struct sonode	*node = NULL;
984aff4bce5Syi zhang - Sun Microsystems - Beijing China 	int 		rc;
985aff4bce5Syi zhang - Sun Microsystems - Beijing China 	clock_t		lbolt, conn_login_max, conn_login_interval;
986aff4bce5Syi zhang - Sun Microsystems - Beijing China 	boolean_t	nonblock;
987a6d42e7dSPeter Dunlap 
988a6d42e7dSPeter Dunlap 	so_conn = ic->ic_transport_private;
989aff4bce5Syi zhang - Sun Microsystems - Beijing China 	nonblock = ic->ic_conn_params.nonblock_socket;
990aff4bce5Syi zhang - Sun Microsystems - Beijing China 	conn_login_max = ic->ic_conn_params.conn_login_max;
991aff4bce5Syi zhang - Sun Microsystems - Beijing China 	conn_login_interval = ddi_get_lbolt() +
992aff4bce5Syi zhang - Sun Microsystems - Beijing China 	    SEC_TO_TICK(ic->ic_conn_params.conn_login_interval);
993aff4bce5Syi zhang - Sun Microsystems - Beijing China 
994aff4bce5Syi zhang - Sun Microsystems - Beijing China 	if (nonblock == B_TRUE) {
995aff4bce5Syi zhang - Sun Microsystems - Beijing China 		node = ((struct sonode *)(so_conn->ic_so));
996aff4bce5Syi zhang - Sun Microsystems - Beijing China 		/* Set to none block socket mode */
997aff4bce5Syi zhang - Sun Microsystems - Beijing China 		idm_so_socket_set_nonblock(node);
998aff4bce5Syi zhang - Sun Microsystems - Beijing China 		do {
999aff4bce5Syi zhang - Sun Microsystems - Beijing China 			rc = ksocket_connect(so_conn->ic_so,
1000aff4bce5Syi zhang - Sun Microsystems - Beijing China 			    &ic->ic_ini_dst_addr.sin,
1001aff4bce5Syi zhang - Sun Microsystems - Beijing China 			    (SIZEOF_SOCKADDR(&ic->ic_ini_dst_addr.sin)),
1002aff4bce5Syi zhang - Sun Microsystems - Beijing China 			    CRED());
1003aff4bce5Syi zhang - Sun Microsystems - Beijing China 			if (rc == 0 || rc == EISCONN) {
1004aff4bce5Syi zhang - Sun Microsystems - Beijing China 				/* socket success or already success */
1005aff4bce5Syi zhang - Sun Microsystems - Beijing China 				rc = IDM_STATUS_SUCCESS;
1006aff4bce5Syi zhang - Sun Microsystems - Beijing China 				break;
1007aff4bce5Syi zhang - Sun Microsystems - Beijing China 			}
1008aff4bce5Syi zhang - Sun Microsystems - Beijing China 			if ((rc == ETIMEDOUT) || (rc == ECONNREFUSED) ||
1009aff4bce5Syi zhang - Sun Microsystems - Beijing China 			    (rc == ECONNRESET)) {
1010aff4bce5Syi zhang - Sun Microsystems - Beijing China 				/* socket connection timeout or refuse */
1011aff4bce5Syi zhang - Sun Microsystems - Beijing China 				break;
1012aff4bce5Syi zhang - Sun Microsystems - Beijing China 			}
1013aff4bce5Syi zhang - Sun Microsystems - Beijing China 			lbolt = ddi_get_lbolt();
1014aff4bce5Syi zhang - Sun Microsystems - Beijing China 			if (lbolt > conn_login_max) {
1015aff4bce5Syi zhang - Sun Microsystems - Beijing China 				/*
1016aff4bce5Syi zhang - Sun Microsystems - Beijing China 				 * Connection retry timeout,
1017aff4bce5Syi zhang - Sun Microsystems - Beijing China 				 * failed connect to target.
1018aff4bce5Syi zhang - Sun Microsystems - Beijing China 				 */
1019aff4bce5Syi zhang - Sun Microsystems - Beijing China 				break;
1020aff4bce5Syi zhang - Sun Microsystems - Beijing China 			}
1021aff4bce5Syi zhang - Sun Microsystems - Beijing China 			if (lbolt < conn_login_interval) {
1022aff4bce5Syi zhang - Sun Microsystems - Beijing China 				if ((rc == EINPROGRESS) || (rc == EALREADY)) {
1023aff4bce5Syi zhang - Sun Microsystems - Beijing China 					/* TCP connect still in progress */
1024aff4bce5Syi zhang - Sun Microsystems - Beijing China 					delay(SEC_TO_TICK(IN_PROGRESS_DELAY));
1025aff4bce5Syi zhang - Sun Microsystems - Beijing China 					continue;
1026aff4bce5Syi zhang - Sun Microsystems - Beijing China 				} else {
1027aff4bce5Syi zhang - Sun Microsystems - Beijing China 					delay(conn_login_interval - lbolt);
1028aff4bce5Syi zhang - Sun Microsystems - Beijing China 				}
1029aff4bce5Syi zhang - Sun Microsystems - Beijing China 			}
1030aff4bce5Syi zhang - Sun Microsystems - Beijing China 			conn_login_interval = ddi_get_lbolt() +
1031aff4bce5Syi zhang - Sun Microsystems - Beijing China 			    SEC_TO_TICK(ic->ic_conn_params.conn_login_interval);
1032aff4bce5Syi zhang - Sun Microsystems - Beijing China 		} while (rc != 0);
1033aff4bce5Syi zhang - Sun Microsystems - Beijing China 		/* resume to nonblock mode */
1034aff4bce5Syi zhang - Sun Microsystems - Beijing China 		if (rc == IDM_STATUS_SUCCESS) {
1035aff4bce5Syi zhang - Sun Microsystems - Beijing China 			idm_so_socket_set_block(node);
1036aff4bce5Syi zhang - Sun Microsystems - Beijing China 		}
1037aff4bce5Syi zhang - Sun Microsystems - Beijing China 	} else {
1038aff4bce5Syi zhang - Sun Microsystems - Beijing China 		rc = ksocket_connect(so_conn->ic_so, &ic->ic_ini_dst_addr.sin,
1039aff4bce5Syi zhang - Sun Microsystems - Beijing China 		    (SIZEOF_SOCKADDR(&ic->ic_ini_dst_addr.sin)), CRED());
1040aff4bce5Syi zhang - Sun Microsystems - Beijing China 	}
1041a6d42e7dSPeter Dunlap 
1042aff4bce5Syi zhang - Sun Microsystems - Beijing China 	if (rc != 0) {
1043a6d42e7dSPeter Dunlap 		idm_soshutdown(so_conn->ic_so);
1044a6d42e7dSPeter Dunlap 		return (IDM_STATUS_FAIL);
1045a6d42e7dSPeter Dunlap 	}
1046a6d42e7dSPeter Dunlap 
1047a6d42e7dSPeter Dunlap 	idm_so_conn_connect_common(ic);
1048a6d42e7dSPeter Dunlap 
10490f94976eSJeff Biseda 	idm_set_postconnect_options(so_conn->ic_so);
1050a6d42e7dSPeter Dunlap 
1051a6d42e7dSPeter Dunlap 	return (IDM_STATUS_SUCCESS);
1052a6d42e7dSPeter Dunlap }
1053a6d42e7dSPeter Dunlap 
1054a6d42e7dSPeter Dunlap idm_status_t
10550f1702c5SYu Xiangning idm_so_tgt_conn_create(idm_conn_t *ic, ksocket_t new_so)
1056a6d42e7dSPeter Dunlap {
1057a6d42e7dSPeter Dunlap 	idm_status_t	idmrc;
1058a6d42e7dSPeter Dunlap 
10590f94976eSJeff Biseda 	idm_set_postconnect_options(new_so);
1060a6d42e7dSPeter Dunlap 	idmrc = idm_so_conn_create_common(ic, new_so);
1061a6d42e7dSPeter Dunlap 
1062a6d42e7dSPeter Dunlap 	return (idmrc);
1063a6d42e7dSPeter Dunlap }
1064a6d42e7dSPeter Dunlap 
1065a6d42e7dSPeter Dunlap static void
1066a6d42e7dSPeter Dunlap idm_so_tgt_conn_destroy(idm_conn_t *ic)
1067a6d42e7dSPeter Dunlap {
1068a6d42e7dSPeter Dunlap 	idm_so_conn_destroy_common(ic);
1069a6d42e7dSPeter Dunlap }
1070a6d42e7dSPeter Dunlap 
1071a6d42e7dSPeter Dunlap /*
1072a6d42e7dSPeter Dunlap  * idm_so_tgt_conn_connect()
1073a6d42e7dSPeter Dunlap  * Establish the connection in ic, passed from idm_tgt_conn_finish(), which
1074a6d42e7dSPeter Dunlap  * is invoked from the SM as a result of an inbound connection request.
1075a6d42e7dSPeter Dunlap  */
1076a6d42e7dSPeter Dunlap static idm_status_t
1077a6d42e7dSPeter Dunlap idm_so_tgt_conn_connect(idm_conn_t *ic)
1078a6d42e7dSPeter Dunlap {
1079a6d42e7dSPeter Dunlap 	idm_so_conn_connect_common(ic);
1080a6d42e7dSPeter Dunlap 
1081a6d42e7dSPeter Dunlap 	return (IDM_STATUS_SUCCESS);
1082a6d42e7dSPeter Dunlap }
1083a6d42e7dSPeter Dunlap 
1084a6d42e7dSPeter Dunlap static idm_status_t
10850f1702c5SYu Xiangning idm_so_conn_create_common(idm_conn_t *ic, ksocket_t new_so)
1086a6d42e7dSPeter Dunlap {
1087a6d42e7dSPeter Dunlap 	idm_so_conn_t	*so_conn;
1088a6d42e7dSPeter Dunlap 
1089a6d42e7dSPeter Dunlap 	so_conn = kmem_zalloc(sizeof (idm_so_conn_t), KM_SLEEP);
1090a6d42e7dSPeter Dunlap 	so_conn->ic_so = new_so;
1091a6d42e7dSPeter Dunlap 
1092a6d42e7dSPeter Dunlap 	ic->ic_transport_private = so_conn;
1093a6d42e7dSPeter Dunlap 	ic->ic_transport_hdrlen = 0;
1094a6d42e7dSPeter Dunlap 
1095a6d42e7dSPeter Dunlap 	/* Set the scoreboarding flag on this connection */
1096a6d42e7dSPeter Dunlap 	ic->ic_conn_flags |= IDM_CONN_USE_SCOREBOARD;
109756261083SCharles Ting 	ic->ic_conn_params.max_recv_dataseglen =
109856261083SCharles Ting 	    ISCSI_DEFAULT_MAX_RECV_SEG_LEN;
109956261083SCharles Ting 	ic->ic_conn_params.max_xmit_dataseglen =
110056261083SCharles Ting 	    ISCSI_DEFAULT_MAX_XMIT_SEG_LEN;
1101a6d42e7dSPeter Dunlap 
1102a6d42e7dSPeter Dunlap 	/*
1103a6d42e7dSPeter Dunlap 	 * Initialize tx thread mutex and list
1104a6d42e7dSPeter Dunlap 	 */
1105a6d42e7dSPeter Dunlap 	mutex_init(&so_conn->ic_tx_mutex, NULL, MUTEX_DEFAULT, NULL);
1106a6d42e7dSPeter Dunlap 	cv_init(&so_conn->ic_tx_cv, NULL, CV_DEFAULT, NULL);
1107a6d42e7dSPeter Dunlap 	list_create(&so_conn->ic_tx_list, sizeof (idm_pdu_t),
1108a6d42e7dSPeter Dunlap 	    offsetof(idm_pdu_t, idm_tx_link));
1109a6d42e7dSPeter Dunlap 
1110a6d42e7dSPeter Dunlap 	return (IDM_STATUS_SUCCESS);
1111a6d42e7dSPeter Dunlap }
1112a6d42e7dSPeter Dunlap 
1113a6d42e7dSPeter Dunlap static void
1114a6d42e7dSPeter Dunlap idm_so_conn_destroy_common(idm_conn_t *ic)
1115a6d42e7dSPeter Dunlap {
1116a6d42e7dSPeter Dunlap 	idm_so_conn_t	*so_conn = ic->ic_transport_private;
1117a6d42e7dSPeter Dunlap 
1118a6d42e7dSPeter Dunlap 	ic->ic_transport_private = NULL;
1119a6d42e7dSPeter Dunlap 	idm_sodestroy(so_conn->ic_so);
1120a6d42e7dSPeter Dunlap 	list_destroy(&so_conn->ic_tx_list);
1121a6d42e7dSPeter Dunlap 	mutex_destroy(&so_conn->ic_tx_mutex);
1122a6d42e7dSPeter Dunlap 	cv_destroy(&so_conn->ic_tx_cv);
1123a6d42e7dSPeter Dunlap 
1124a6d42e7dSPeter Dunlap 	kmem_free(so_conn, sizeof (idm_so_conn_t));
1125a6d42e7dSPeter Dunlap }
1126a6d42e7dSPeter Dunlap 
1127a6d42e7dSPeter Dunlap static void
1128a6d42e7dSPeter Dunlap idm_so_conn_connect_common(idm_conn_t *ic)
1129a6d42e7dSPeter Dunlap {
1130a6d42e7dSPeter Dunlap 	idm_so_conn_t	*so_conn;
11310f1702c5SYu Xiangning 	struct sockaddr_in6	t_addr;
11320f1702c5SYu Xiangning 	socklen_t	t_addrlen = 0;
1133a6d42e7dSPeter Dunlap 
1134a6d42e7dSPeter Dunlap 	so_conn = ic->ic_transport_private;
11350f1702c5SYu Xiangning 	bzero(&t_addr, sizeof (struct sockaddr_in6));
11360f1702c5SYu Xiangning 	t_addrlen = sizeof (struct sockaddr_in6);
1137a6d42e7dSPeter Dunlap 
1138a6d42e7dSPeter Dunlap 	/* Set the local and remote addresses in the idm conn handle */
1139aedf2b3bSsrivijitha dugganapalli 	(void) ksocket_getsockname(so_conn->ic_so, (struct sockaddr *)&t_addr,
11400f1702c5SYu Xiangning 	    &t_addrlen, CRED());
11410f1702c5SYu Xiangning 	bcopy(&t_addr, &ic->ic_laddr, t_addrlen);
1142aedf2b3bSsrivijitha dugganapalli 	(void) ksocket_getpeername(so_conn->ic_so, (struct sockaddr *)&t_addr,
11430f1702c5SYu Xiangning 	    &t_addrlen, CRED());
11440f1702c5SYu Xiangning 	bcopy(&t_addr, &ic->ic_raddr, t_addrlen);
1145a6d42e7dSPeter Dunlap 
1146a6d42e7dSPeter Dunlap 	mutex_enter(&ic->ic_mutex);
1147a6d42e7dSPeter Dunlap 	so_conn->ic_tx_thread = thread_create(NULL, 0, idm_sotx_thread, ic, 0,
1148a6d42e7dSPeter Dunlap 	    &p0, TS_RUN, minclsyspri);
1149a6d42e7dSPeter Dunlap 	so_conn->ic_rx_thread = thread_create(NULL, 0, idm_sorx_thread, ic, 0,
1150a6d42e7dSPeter Dunlap 	    &p0, TS_RUN, minclsyspri);
1151a6d42e7dSPeter Dunlap 
1152e97fb153SPeter Cudhea - Sun Microsystems - Burlington, MA United States 	while (so_conn->ic_rx_thread_did == 0 ||
1153e97fb153SPeter Cudhea - Sun Microsystems - Burlington, MA United States 	    so_conn->ic_tx_thread_did == 0)
1154a6d42e7dSPeter Dunlap 		cv_wait(&ic->ic_cv, &ic->ic_mutex);
1155a6d42e7dSPeter Dunlap 	mutex_exit(&ic->ic_mutex);
1156a6d42e7dSPeter Dunlap }
1157a6d42e7dSPeter Dunlap 
1158a6d42e7dSPeter Dunlap /*
1159a6d42e7dSPeter Dunlap  * idm_so_conn_disconnect()
1160a6d42e7dSPeter Dunlap  * Shutdown the socket connection and stop the thread
1161a6d42e7dSPeter Dunlap  */
1162a6d42e7dSPeter Dunlap static void
1163a6d42e7dSPeter Dunlap idm_so_conn_disconnect(idm_conn_t *ic)
1164a6d42e7dSPeter Dunlap {
1165a6d42e7dSPeter Dunlap 	idm_so_conn_t	*so_conn;
1166a6d42e7dSPeter Dunlap 
1167a6d42e7dSPeter Dunlap 	so_conn = ic->ic_transport_private;
1168a6d42e7dSPeter Dunlap 
1169a6d42e7dSPeter Dunlap 	mutex_enter(&ic->ic_mutex);
1170a6d42e7dSPeter Dunlap 	so_conn->ic_rx_thread_running = B_FALSE;
1171a6d42e7dSPeter Dunlap 	so_conn->ic_tx_thread_running = B_FALSE;
1172a6d42e7dSPeter Dunlap 	/* We need to wakeup the TX thread */
1173a6d42e7dSPeter Dunlap 	mutex_enter(&so_conn->ic_tx_mutex);
1174a6d42e7dSPeter Dunlap 	cv_signal(&so_conn->ic_tx_cv);
1175a6d42e7dSPeter Dunlap 	mutex_exit(&so_conn->ic_tx_mutex);
1176a6d42e7dSPeter Dunlap 	mutex_exit(&ic->ic_mutex);
1177a6d42e7dSPeter Dunlap 
1178a6d42e7dSPeter Dunlap 	/* This should wakeup the RX thread if it is sleeping */
1179a6d42e7dSPeter Dunlap 	idm_soshutdown(so_conn->ic_so);
1180a6d42e7dSPeter Dunlap 
1181a6d42e7dSPeter Dunlap 	thread_join(so_conn->ic_tx_thread_did);
1182a6d42e7dSPeter Dunlap 	thread_join(so_conn->ic_rx_thread_did);
1183a6d42e7dSPeter Dunlap }
1184a6d42e7dSPeter Dunlap 
1185a6d42e7dSPeter Dunlap /*
1186a6d42e7dSPeter Dunlap  * idm_so_tgt_svc_create()
1187a6d42e7dSPeter Dunlap  * Establish a service on an IP address and port.  idm_svc_req_t contains
1188a6d42e7dSPeter Dunlap  * the service parameters.
1189a6d42e7dSPeter Dunlap  */
1190a6d42e7dSPeter Dunlap /*ARGSUSED*/
1191a6d42e7dSPeter Dunlap static idm_status_t
1192a6d42e7dSPeter Dunlap idm_so_tgt_svc_create(idm_svc_req_t *sr, idm_svc_t *is)
1193a6d42e7dSPeter Dunlap {
1194a6d42e7dSPeter Dunlap 	idm_so_svc_t		*so_svc;
1195a6d42e7dSPeter Dunlap 
1196a6d42e7dSPeter Dunlap 	so_svc = kmem_zalloc(sizeof (idm_so_svc_t), KM_SLEEP);
1197a6d42e7dSPeter Dunlap 
1198a6d42e7dSPeter Dunlap 	/* Set the new sockets service in svc handle */
1199a6d42e7dSPeter Dunlap 	is->is_so_svc = (void *)so_svc;
1200a6d42e7dSPeter Dunlap 
1201a6d42e7dSPeter Dunlap 	return (IDM_STATUS_SUCCESS);
1202a6d42e7dSPeter Dunlap }
1203a6d42e7dSPeter Dunlap 
1204a6d42e7dSPeter Dunlap /*
1205a6d42e7dSPeter Dunlap  * idm_so_tgt_svc_destroy()
1206a6d42e7dSPeter Dunlap  * Teardown sockets resources allocated in idm_so_tgt_svc_create()
1207a6d42e7dSPeter Dunlap  */
1208a6d42e7dSPeter Dunlap static void
1209a6d42e7dSPeter Dunlap idm_so_tgt_svc_destroy(idm_svc_t *is)
1210a6d42e7dSPeter Dunlap {
1211a6d42e7dSPeter Dunlap 	/* the socket will have been torn down; free the service */
1212a6d42e7dSPeter Dunlap 	kmem_free(is->is_so_svc, sizeof (idm_so_svc_t));
1213a6d42e7dSPeter Dunlap }
1214a6d42e7dSPeter Dunlap 
1215a6d42e7dSPeter Dunlap /*
1216a6d42e7dSPeter Dunlap  * idm_so_tgt_svc_online()
1217a6d42e7dSPeter Dunlap  * Launch a watch thread on the svc allocated in idm_so_tgt_svc_create()
1218a6d42e7dSPeter Dunlap  */
1219a6d42e7dSPeter Dunlap 
1220a6d42e7dSPeter Dunlap static idm_status_t
1221a6d42e7dSPeter Dunlap idm_so_tgt_svc_online(idm_svc_t *is)
1222a6d42e7dSPeter Dunlap {
1223a6d42e7dSPeter Dunlap 	idm_so_svc_t		*so_svc;
1224a6d42e7dSPeter Dunlap 	idm_svc_req_t		*sr = &is->is_svc_req;
1225a6d42e7dSPeter Dunlap 	struct sockaddr_in6	sin6_ip;
1226a6d42e7dSPeter Dunlap 	const uint32_t		on = 1;
1227a6d42e7dSPeter Dunlap 	const uint32_t		off = 0;
1228a6d42e7dSPeter Dunlap 
1229a6d42e7dSPeter Dunlap 	mutex_enter(&is->is_mutex);
1230a6d42e7dSPeter Dunlap 	so_svc = (idm_so_svc_t *)is->is_so_svc;
1231a6d42e7dSPeter Dunlap 
1232a6d42e7dSPeter Dunlap 	/*
1233a6d42e7dSPeter Dunlap 	 * Try creating an IPv6 socket first
1234a6d42e7dSPeter Dunlap 	 */
1235a6d42e7dSPeter Dunlap 	if ((so_svc->is_so = idm_socreate(PF_INET6, SOCK_STREAM, 0)) == NULL) {
1236a6d42e7dSPeter Dunlap 		mutex_exit(&is->is_mutex);
1237a6d42e7dSPeter Dunlap 		return (IDM_STATUS_FAIL);
1238a6d42e7dSPeter Dunlap 	} else {
1239a6d42e7dSPeter Dunlap 		bzero(&sin6_ip, sizeof (sin6_ip));
1240a6d42e7dSPeter Dunlap 		sin6_ip.sin6_family = AF_INET6;
1241a6d42e7dSPeter Dunlap 		sin6_ip.sin6_port = htons(sr->sr_port);
1242a6d42e7dSPeter Dunlap 		sin6_ip.sin6_addr = in6addr_any;
1243a6d42e7dSPeter Dunlap 
12440f1702c5SYu Xiangning 		(void) ksocket_setsockopt(so_svc->is_so, SOL_SOCKET,
12450f1702c5SYu Xiangning 		    SO_REUSEADDR, (char *)&on, sizeof (on), CRED());
1246a6d42e7dSPeter Dunlap 		/*
1247a6d42e7dSPeter Dunlap 		 * Turn off SO_MAC_EXEMPT so future sobinds succeed
1248a6d42e7dSPeter Dunlap 		 */
12490f1702c5SYu Xiangning 		(void) ksocket_setsockopt(so_svc->is_so, SOL_SOCKET,
12500f1702c5SYu Xiangning 		    SO_MAC_EXEMPT, (char *)&off, sizeof (off), CRED());
1251a6d42e7dSPeter Dunlap 
12520f1702c5SYu Xiangning 		if (ksocket_bind(so_svc->is_so, (struct sockaddr *)&sin6_ip,
12530f1702c5SYu Xiangning 		    sizeof (sin6_ip), CRED()) != 0) {
1254a6d42e7dSPeter Dunlap 			mutex_exit(&is->is_mutex);
1255a6d42e7dSPeter Dunlap 			idm_sodestroy(so_svc->is_so);
1256a6d42e7dSPeter Dunlap 			return (IDM_STATUS_FAIL);
1257a6d42e7dSPeter Dunlap 		}
1258a6d42e7dSPeter Dunlap 	}
1259a6d42e7dSPeter Dunlap 
12600f94976eSJeff Biseda 	idm_set_postconnect_options(so_svc->is_so);
1261a6d42e7dSPeter Dunlap 
12620f1702c5SYu Xiangning 	if (ksocket_listen(so_svc->is_so, 5, CRED()) != 0) {
1263a6d42e7dSPeter Dunlap 		mutex_exit(&is->is_mutex);
1264a6d42e7dSPeter Dunlap 		idm_soshutdown(so_svc->is_so);
1265a6d42e7dSPeter Dunlap 		idm_sodestroy(so_svc->is_so);
1266a6d42e7dSPeter Dunlap 		return (IDM_STATUS_FAIL);
1267a6d42e7dSPeter Dunlap 	}
1268a6d42e7dSPeter Dunlap 
1269a6d42e7dSPeter Dunlap 	/* Launch a watch thread */
1270a6d42e7dSPeter Dunlap 	so_svc->is_thread = thread_create(NULL, 0, idm_so_svc_port_watcher,
1271a6d42e7dSPeter Dunlap 	    is, 0, &p0, TS_RUN, minclsyspri);
1272a6d42e7dSPeter Dunlap 
1273a6d42e7dSPeter Dunlap 	if (so_svc->is_thread == NULL) {
1274a6d42e7dSPeter Dunlap 		/* Failure to launch; teardown the socket */
1275a6d42e7dSPeter Dunlap 		mutex_exit(&is->is_mutex);
1276a6d42e7dSPeter Dunlap 		idm_soshutdown(so_svc->is_so);
1277a6d42e7dSPeter Dunlap 		idm_sodestroy(so_svc->is_so);
1278a6d42e7dSPeter Dunlap 		return (IDM_STATUS_FAIL);
1279a6d42e7dSPeter Dunlap 	}
12800f1702c5SYu Xiangning 	ksocket_hold(so_svc->is_so);
1281a6d42e7dSPeter Dunlap 	/* Wait for the port watcher thread to start */
1282a6d42e7dSPeter Dunlap 	while (!so_svc->is_thread_running)
1283a6d42e7dSPeter Dunlap 		cv_wait(&is->is_cv, &is->is_mutex);
1284a6d42e7dSPeter Dunlap 	mutex_exit(&is->is_mutex);
1285a6d42e7dSPeter Dunlap 
1286a6d42e7dSPeter Dunlap 	return (IDM_STATUS_SUCCESS);
1287a6d42e7dSPeter Dunlap }
1288a6d42e7dSPeter Dunlap 
1289a6d42e7dSPeter Dunlap /*
1290a6d42e7dSPeter Dunlap  * idm_so_tgt_svc_offline
1291a6d42e7dSPeter Dunlap  *
1292a6d42e7dSPeter Dunlap  * Stop listening on the IP address and port identified by idm_svc_t.
1293a6d42e7dSPeter Dunlap  */
1294a6d42e7dSPeter Dunlap static void
1295a6d42e7dSPeter Dunlap idm_so_tgt_svc_offline(idm_svc_t *is)
1296a6d42e7dSPeter Dunlap {
1297a6d42e7dSPeter Dunlap 	idm_so_svc_t		*so_svc;
1298a6d42e7dSPeter Dunlap 	mutex_enter(&is->is_mutex);
1299a6d42e7dSPeter Dunlap 	so_svc = (idm_so_svc_t *)is->is_so_svc;
1300a6d42e7dSPeter Dunlap 	so_svc->is_thread_running = B_FALSE;
1301a6d42e7dSPeter Dunlap 	mutex_exit(&is->is_mutex);
1302a6d42e7dSPeter Dunlap 
1303a6d42e7dSPeter Dunlap 	/*
13040f1702c5SYu Xiangning 	 * Teardown socket
1305a6d42e7dSPeter Dunlap 	 */
13060f1702c5SYu Xiangning 	idm_sodestroy(so_svc->is_so);
1307a6d42e7dSPeter Dunlap 
1308a6d42e7dSPeter Dunlap 	/*
1309a6d42e7dSPeter Dunlap 	 * Now we expect the port watcher thread to terminate
1310a6d42e7dSPeter Dunlap 	 */
1311a6d42e7dSPeter Dunlap 	thread_join(so_svc->is_thread_did);
1312a6d42e7dSPeter Dunlap }
1313a6d42e7dSPeter Dunlap 
1314a6d42e7dSPeter Dunlap /*
1315a6d42e7dSPeter Dunlap  * Watch thread for target service connection establishment.
1316a6d42e7dSPeter Dunlap  */
1317a6d42e7dSPeter Dunlap void
1318a6d42e7dSPeter Dunlap idm_so_svc_port_watcher(void *arg)
1319a6d42e7dSPeter Dunlap {
1320a6d42e7dSPeter Dunlap 	idm_svc_t		*svc = arg;
13210f1702c5SYu Xiangning 	ksocket_t		new_so;
1322a6d42e7dSPeter Dunlap 	idm_conn_t		*ic;
1323a6d42e7dSPeter Dunlap 	idm_status_t		idmrc;
1324a6d42e7dSPeter Dunlap 	idm_so_svc_t		*so_svc;
1325a6d42e7dSPeter Dunlap 	int			rc;
1326a6d42e7dSPeter Dunlap 	const uint32_t		off = 0;
13270f1702c5SYu Xiangning 	struct sockaddr_in6 	t_addr;
13280f1702c5SYu Xiangning 	socklen_t		t_addrlen;
1329a6d42e7dSPeter Dunlap 
13300f1702c5SYu Xiangning 	bzero(&t_addr, sizeof (struct sockaddr_in6));
13310f1702c5SYu Xiangning 	t_addrlen = sizeof (struct sockaddr_in6);
1332a6d42e7dSPeter Dunlap 	mutex_enter(&svc->is_mutex);
1333a6d42e7dSPeter Dunlap 
1334a6d42e7dSPeter Dunlap 	so_svc = svc->is_so_svc;
1335a6d42e7dSPeter Dunlap 	so_svc->is_thread_running = B_TRUE;
1336a6d42e7dSPeter Dunlap 	so_svc->is_thread_did = so_svc->is_thread->t_did;
1337a6d42e7dSPeter Dunlap 
1338a6d42e7dSPeter Dunlap 	cv_signal(&svc->is_cv);
1339a6d42e7dSPeter Dunlap 
1340a6d42e7dSPeter Dunlap 	IDM_SVC_LOG(CE_NOTE, "iSCSI service (%p/%d) online", (void *)svc,
1341a6d42e7dSPeter Dunlap 	    svc->is_svc_req.sr_port);
1342a6d42e7dSPeter Dunlap 
1343a6d42e7dSPeter Dunlap 	while (so_svc->is_thread_running) {
1344a6d42e7dSPeter Dunlap 		mutex_exit(&svc->is_mutex);
1345a6d42e7dSPeter Dunlap 
13460f1702c5SYu Xiangning 		if ((rc = ksocket_accept(so_svc->is_so,
13470f1702c5SYu Xiangning 		    (struct sockaddr *)&t_addr, &t_addrlen,
13480f1702c5SYu Xiangning 		    &new_so, CRED())) != 0) {
1349a6d42e7dSPeter Dunlap 			mutex_enter(&svc->is_mutex);
135057ff5e7eSJeff Biseda 			if (rc != ECONNABORTED && rc != EINTR) {
135157ff5e7eSJeff Biseda 				IDM_SVC_LOG(CE_NOTE, "idm_so_svc_port_watcher:"
135257ff5e7eSJeff Biseda 				    " ksocket_accept failed %d", rc);
135357ff5e7eSJeff Biseda 			}
135457ff5e7eSJeff Biseda 			/*
135557ff5e7eSJeff Biseda 			 * Unclean shutdown of this thread is not handled
135657ff5e7eSJeff Biseda 			 * wait for !is_thread_running.
135757ff5e7eSJeff Biseda 			 */
135857ff5e7eSJeff Biseda 			continue;
1359a6d42e7dSPeter Dunlap 		}
1360a6d42e7dSPeter Dunlap 		/*
1361a6d42e7dSPeter Dunlap 		 * Turn off SO_MAC_EXEMPT so future sobinds succeed
1362a6d42e7dSPeter Dunlap 		 */
13630f1702c5SYu Xiangning 		(void) ksocket_setsockopt(new_so, SOL_SOCKET, SO_MAC_EXEMPT,
13640f1702c5SYu Xiangning 		    (char *)&off, sizeof (off), CRED());
1365a6d42e7dSPeter Dunlap 
1366a6d42e7dSPeter Dunlap 		idmrc = idm_svc_conn_create(svc, IDM_TRANSPORT_TYPE_SOCKETS,
1367a6d42e7dSPeter Dunlap 		    &ic);
1368a6d42e7dSPeter Dunlap 		if (idmrc != IDM_STATUS_SUCCESS) {
1369a6d42e7dSPeter Dunlap 			/* Drop connection */
1370a6d42e7dSPeter Dunlap 			idm_soshutdown(new_so);
1371a6d42e7dSPeter Dunlap 			idm_sodestroy(new_so);
1372a6d42e7dSPeter Dunlap 			mutex_enter(&svc->is_mutex);
1373a6d42e7dSPeter Dunlap 			continue;
1374a6d42e7dSPeter Dunlap 		}
1375a6d42e7dSPeter Dunlap 
1376a6d42e7dSPeter Dunlap 		idmrc = idm_so_tgt_conn_create(ic, new_so);
1377a6d42e7dSPeter Dunlap 		if (idmrc != IDM_STATUS_SUCCESS) {
1378a6d42e7dSPeter Dunlap 			idm_svc_conn_destroy(ic);
1379a6d42e7dSPeter Dunlap 			idm_soshutdown(new_so);
1380a6d42e7dSPeter Dunlap 			idm_sodestroy(new_so);
1381a6d42e7dSPeter Dunlap 			mutex_enter(&svc->is_mutex);
1382a6d42e7dSPeter Dunlap 			continue;
1383a6d42e7dSPeter Dunlap 		}
1384a6d42e7dSPeter Dunlap 
1385a6d42e7dSPeter Dunlap 		/*
1386a6d42e7dSPeter Dunlap 		 * Kick the state machine.  At CS_S3_XPT_UP the state machine
1387a6d42e7dSPeter Dunlap 		 * will notify the client (target) about the new connection.
1388a6d42e7dSPeter Dunlap 		 */
1389a6d42e7dSPeter Dunlap 		idm_conn_event(ic, CE_CONNECT_ACCEPT, NULL);
1390a6d42e7dSPeter Dunlap 
1391a6d42e7dSPeter Dunlap 		mutex_enter(&svc->is_mutex);
1392a6d42e7dSPeter Dunlap 	}
13930f1702c5SYu Xiangning 	ksocket_rele(so_svc->is_so);
1394a6d42e7dSPeter Dunlap 	so_svc->is_thread_running = B_FALSE;
1395a6d42e7dSPeter Dunlap 	mutex_exit(&svc->is_mutex);
1396a6d42e7dSPeter Dunlap 
1397a6d42e7dSPeter Dunlap 	IDM_SVC_LOG(CE_NOTE, "iSCSI service (%p/%d) offline", (void *)svc,
1398a6d42e7dSPeter Dunlap 	    svc->is_svc_req.sr_port);
1399a6d42e7dSPeter Dunlap 
1400a6d42e7dSPeter Dunlap 	thread_exit();
1401a6d42e7dSPeter Dunlap }
1402a6d42e7dSPeter Dunlap 
1403a6d42e7dSPeter Dunlap /*
1404a6d42e7dSPeter Dunlap  * idm_so_free_task_rsrc() stops any ongoing processing of the task and
1405a6d42e7dSPeter Dunlap  * frees resources associated with the task.
1406a6d42e7dSPeter Dunlap  *
1407a6d42e7dSPeter Dunlap  * It's not clear that this should return idm_status_t.  What do we do
1408a6d42e7dSPeter Dunlap  * if it fails?
1409a6d42e7dSPeter Dunlap  */
1410a6d42e7dSPeter Dunlap static idm_status_t
1411a6d42e7dSPeter Dunlap idm_so_free_task_rsrc(idm_task_t *idt)
1412a6d42e7dSPeter Dunlap {
141392adbba7SPeter Cudhea - Sun Microsystems - Burlington, MA United States 	idm_buf_t	*idb, *next_idb;
1414a6d42e7dSPeter Dunlap 
141530e7468fSPeter Dunlap 	/*
141630e7468fSPeter Dunlap 	 * There is nothing to cleanup on initiator connections
141730e7468fSPeter Dunlap 	 */
141830e7468fSPeter Dunlap 	if (IDM_CONN_ISINI(idt->idt_ic))
141930e7468fSPeter Dunlap 		return (IDM_STATUS_SUCCESS);
142030e7468fSPeter Dunlap 
1421a6d42e7dSPeter Dunlap 	/*
1422a6d42e7dSPeter Dunlap 	 * If this is a target connection, call idm_buf_rx_from_ini_done for
1423a6d42e7dSPeter Dunlap 	 * any buffer on the "outbufv" list with idb->idb_in_transport==B_TRUE.
1424a6d42e7dSPeter Dunlap 	 *
1425a6d42e7dSPeter Dunlap 	 * In addition, remove any buffers associated with this task from
1426a6d42e7dSPeter Dunlap 	 * the ic_tx_list.  We'll do this by walking the idt_inbufv list, but
1427a6d42e7dSPeter Dunlap 	 * items don't actually get removed from that list (and completion
1428a6d42e7dSPeter Dunlap 	 * routines called) until idm_task_cleanup.
1429a6d42e7dSPeter Dunlap 	 */
1430a6d42e7dSPeter Dunlap 	mutex_enter(&idt->idt_mutex);
1431a6d42e7dSPeter Dunlap 
143292adbba7SPeter Cudhea - Sun Microsystems - Burlington, MA United States 	for (idb = list_head(&idt->idt_outbufv); idb != NULL; idb = next_idb) {
143392adbba7SPeter Cudhea - Sun Microsystems - Burlington, MA United States 		next_idb = list_next(&idt->idt_outbufv, idb);
1434a6d42e7dSPeter Dunlap 		if (idb->idb_in_transport) {
1435a6d42e7dSPeter Dunlap 			/*
1436a6d42e7dSPeter Dunlap 			 * idm_buf_rx_from_ini_done releases idt->idt_mutex
1437a6d42e7dSPeter Dunlap 			 */
1438a668b114SPriya Krishnan 			DTRACE_ISCSI_8(xfer__done, idm_conn_t *, idt->idt_ic,
1439a668b114SPriya Krishnan 			    uintptr_t, idb->idb_buf,
1440a668b114SPriya Krishnan 			    uint32_t, idb->idb_bufoffset,
1441a668b114SPriya Krishnan 			    uint64_t, 0, uint32_t, 0, uint32_t, 0,
1442a668b114SPriya Krishnan 			    uint32_t, idb->idb_xfer_len,
1443a668b114SPriya Krishnan 			    int, XFER_BUF_RX_FROM_INI);
1444a6d42e7dSPeter Dunlap 			idm_buf_rx_from_ini_done(idt, idb, IDM_STATUS_ABORTED);
1445a6d42e7dSPeter Dunlap 			mutex_enter(&idt->idt_mutex);
1446a6d42e7dSPeter Dunlap 		}
1447a6d42e7dSPeter Dunlap 	}
1448a6d42e7dSPeter Dunlap 
144992adbba7SPeter Cudhea - Sun Microsystems - Burlington, MA United States 	for (idb = list_head(&idt->idt_inbufv); idb != NULL; idb = next_idb) {
145092adbba7SPeter Cudhea - Sun Microsystems - Burlington, MA United States 		next_idb = list_next(&idt->idt_inbufv, idb);
1451a6d42e7dSPeter Dunlap 		/*
1452a6d42e7dSPeter Dunlap 		 * We want to remove these items from the tx_list as well,
1453a6d42e7dSPeter Dunlap 		 * but knowing it's in the idt_inbufv list is not a guarantee
1454a6d42e7dSPeter Dunlap 		 * that it's in the tx_list.  If it's on the tx list then
1455a6d42e7dSPeter Dunlap 		 * let idm_sotx_thread() clean it up.
1456a6d42e7dSPeter Dunlap 		 */
1457a6d42e7dSPeter Dunlap 		if (idb->idb_in_transport && !idb->idb_tx_thread) {
1458a6d42e7dSPeter Dunlap 			/*
1459a6d42e7dSPeter Dunlap 			 * idm_buf_tx_to_ini_done releases idt->idt_mutex
1460a6d42e7dSPeter Dunlap 			 */
1461a668b114SPriya Krishnan 			DTRACE_ISCSI_8(xfer__done, idm_conn_t *, idt->idt_ic,
1462a668b114SPriya Krishnan 			    uintptr_t, idb->idb_buf,
1463a668b114SPriya Krishnan 			    uint32_t, idb->idb_bufoffset,
1464a668b114SPriya Krishnan 			    uint64_t, 0, uint32_t, 0, uint32_t, 0,
1465a668b114SPriya Krishnan 			    uint32_t, idb->idb_xfer_len,
1466a668b114SPriya Krishnan 			    int, XFER_BUF_TX_TO_INI);
1467a6d42e7dSPeter Dunlap 			idm_buf_tx_to_ini_done(idt, idb, IDM_STATUS_ABORTED);
1468a6d42e7dSPeter Dunlap 			mutex_enter(&idt->idt_mutex);
1469a6d42e7dSPeter Dunlap 		}
1470a6d42e7dSPeter Dunlap 	}
1471a6d42e7dSPeter Dunlap 
1472a6d42e7dSPeter Dunlap 	mutex_exit(&idt->idt_mutex);
1473a6d42e7dSPeter Dunlap 
1474a6d42e7dSPeter Dunlap 	return (IDM_STATUS_SUCCESS);
1475a6d42e7dSPeter Dunlap }
1476a6d42e7dSPeter Dunlap 
1477a6d42e7dSPeter Dunlap /*
1478a6d42e7dSPeter Dunlap  * idm_so_negotiate_key_values() validates the key values for this connection
1479a6d42e7dSPeter Dunlap  */
1480a6d42e7dSPeter Dunlap /* ARGSUSED */
1481a6d42e7dSPeter Dunlap static kv_status_t
1482a6d42e7dSPeter Dunlap idm_so_negotiate_key_values(idm_conn_t *it, nvlist_t *request_nvl,
1483a6d42e7dSPeter Dunlap     nvlist_t *response_nvl, nvlist_t *negotiated_nvl)
1484a6d42e7dSPeter Dunlap {
1485a6d42e7dSPeter Dunlap 	/* All parameters are negotiated at the iscsit level */
1486a6d42e7dSPeter Dunlap 	return (KV_HANDLED);
1487a6d42e7dSPeter Dunlap }
1488a6d42e7dSPeter Dunlap 
1489a6d42e7dSPeter Dunlap /*
1490a6d42e7dSPeter Dunlap  * idm_so_notice_key_values() activates the negotiated key values for
1491a6d42e7dSPeter Dunlap  * this connection.
1492a6d42e7dSPeter Dunlap  */
149330e7468fSPeter Dunlap static void
1494a6d42e7dSPeter Dunlap idm_so_notice_key_values(idm_conn_t *it, nvlist_t *negotiated_nvl)
1495a6d42e7dSPeter Dunlap {
1496a6d42e7dSPeter Dunlap 	char			*nvp_name;
1497a6d42e7dSPeter Dunlap 	nvpair_t		*nvp;
1498a6d42e7dSPeter Dunlap 	nvpair_t		*next_nvp;
1499a6d42e7dSPeter Dunlap 	int			nvrc;
1500a6d42e7dSPeter Dunlap 	idm_status_t		idm_status;
1501a6d42e7dSPeter Dunlap 	const idm_kv_xlate_t	*ikvx;
150256261083SCharles Ting 	uint64_t		num_val;
1503a6d42e7dSPeter Dunlap 
1504a6d42e7dSPeter Dunlap 	for (nvp = nvlist_next_nvpair(negotiated_nvl, NULL);
1505a6d42e7dSPeter Dunlap 	    nvp != NULL; nvp = next_nvp) {
1506a6d42e7dSPeter Dunlap 		next_nvp = nvlist_next_nvpair(negotiated_nvl, nvp);
1507a6d42e7dSPeter Dunlap 		nvp_name = nvpair_name(nvp);
1508a6d42e7dSPeter Dunlap 
1509a6d42e7dSPeter Dunlap 		ikvx = idm_lookup_kv_xlate(nvp_name, strlen(nvp_name));
1510a6d42e7dSPeter Dunlap 		switch (ikvx->ik_key_id) {
1511a6d42e7dSPeter Dunlap 		case KI_HEADER_DIGEST:
1512a6d42e7dSPeter Dunlap 		case KI_DATA_DIGEST:
1513a6d42e7dSPeter Dunlap 			idm_status = idm_so_handle_digest(it, nvp, ikvx);
1514a6d42e7dSPeter Dunlap 			ASSERT(idm_status == 0);
1515a6d42e7dSPeter Dunlap 
1516a6d42e7dSPeter Dunlap 			/* Remove processed item from negotiated_nvl list */
1517a6d42e7dSPeter Dunlap 			nvrc = nvlist_remove_all(
1518a6d42e7dSPeter Dunlap 			    negotiated_nvl, ikvx->ik_key_name);
1519a6d42e7dSPeter Dunlap 			ASSERT(nvrc == 0);
1520a6d42e7dSPeter Dunlap 			break;
152156261083SCharles Ting 		case KI_MAX_RECV_DATA_SEGMENT_LENGTH:
152256261083SCharles Ting 			/*
152356261083SCharles Ting 			 * Just pass the value down to idm layer.
152456261083SCharles Ting 			 * No need to remove it from negotiated_nvl list here.
152556261083SCharles Ting 			 */
152656261083SCharles Ting 			nvrc = nvpair_value_uint64(nvp, &num_val);
152756261083SCharles Ting 			ASSERT(nvrc == 0);
152856261083SCharles Ting 			it->ic_conn_params.max_xmit_dataseglen =
152956261083SCharles Ting 			    (uint32_t)num_val;
153056261083SCharles Ting 			break;
1531a6d42e7dSPeter Dunlap 		default:
1532a6d42e7dSPeter Dunlap 			break;
1533a6d42e7dSPeter Dunlap 		}
1534a6d42e7dSPeter Dunlap 	}
1535a6d42e7dSPeter Dunlap }
1536a6d42e7dSPeter Dunlap 
153756261083SCharles Ting /*
153856261083SCharles Ting  * idm_so_declare_key_values() declares the key values for this connection
153956261083SCharles Ting  */
154056261083SCharles Ting /* ARGSUSED */
154156261083SCharles Ting static kv_status_t
154256261083SCharles Ting idm_so_declare_key_values(idm_conn_t *it, nvlist_t *config_nvl,
154356261083SCharles Ting     nvlist_t *outgoing_nvl)
154456261083SCharles Ting {
154556261083SCharles Ting 	char			*nvp_name;
154656261083SCharles Ting 	nvpair_t		*nvp;
154756261083SCharles Ting 	nvpair_t		*next_nvp;
154856261083SCharles Ting 	kv_status_t		kvrc;
154956261083SCharles Ting 	int			nvrc = 0;
155056261083SCharles Ting 	const idm_kv_xlate_t	*ikvx;
155156261083SCharles Ting 	uint64_t		num_val;
155256261083SCharles Ting 
155356261083SCharles Ting 	for (nvp = nvlist_next_nvpair(config_nvl, NULL);
155456261083SCharles Ting 	    nvp != NULL && nvrc == 0; nvp = next_nvp) {
155556261083SCharles Ting 		next_nvp = nvlist_next_nvpair(config_nvl, nvp);
155656261083SCharles Ting 		nvp_name = nvpair_name(nvp);
155756261083SCharles Ting 
155856261083SCharles Ting 		ikvx = idm_lookup_kv_xlate(nvp_name, strlen(nvp_name));
155956261083SCharles Ting 		switch (ikvx->ik_key_id) {
156056261083SCharles Ting 		case KI_MAX_RECV_DATA_SEGMENT_LENGTH:
156156261083SCharles Ting 			if ((nvrc = nvpair_value_uint64(nvp, &num_val)) != 0) {
156256261083SCharles Ting 				break;
156356261083SCharles Ting 			}
156456261083SCharles Ting 			if (outgoing_nvl &&
156556261083SCharles Ting 			    (nvrc = nvlist_add_uint64(outgoing_nvl,
156656261083SCharles Ting 			    nvp_name, num_val)) != 0) {
156756261083SCharles Ting 				break;
156856261083SCharles Ting 			}
156956261083SCharles Ting 			it->ic_conn_params.max_recv_dataseglen =
157056261083SCharles Ting 			    (uint32_t)num_val;
157156261083SCharles Ting 			break;
157256261083SCharles Ting 		default:
157356261083SCharles Ting 			break;
157456261083SCharles Ting 		}
157556261083SCharles Ting 	}
157656261083SCharles Ting 	kvrc = idm_nvstat_to_kvstat(nvrc);
157756261083SCharles Ting 	return (kvrc);
157856261083SCharles Ting }
1579a6d42e7dSPeter Dunlap 
1580a6d42e7dSPeter Dunlap static idm_status_t
1581a6d42e7dSPeter Dunlap idm_so_handle_digest(idm_conn_t *it, nvpair_t *digest_choice,
1582a6d42e7dSPeter Dunlap     const idm_kv_xlate_t *ikvx)
1583a6d42e7dSPeter Dunlap {
1584a6d42e7dSPeter Dunlap 	int			nvrc;
1585a6d42e7dSPeter Dunlap 	char			*digest_choice_string;
1586a6d42e7dSPeter Dunlap 
1587a6d42e7dSPeter Dunlap 	nvrc = nvpair_value_string(digest_choice,
1588a6d42e7dSPeter Dunlap 	    &digest_choice_string);
1589a6d42e7dSPeter Dunlap 	ASSERT(nvrc == 0);
1590a6d42e7dSPeter Dunlap 	if (strcasecmp(digest_choice_string, "crc32c") == 0) {
1591a6d42e7dSPeter Dunlap 		switch (ikvx->ik_key_id) {
1592a6d42e7dSPeter Dunlap 		case KI_HEADER_DIGEST:
1593a6d42e7dSPeter Dunlap 			it->ic_conn_flags |= IDM_CONN_HEADER_DIGEST;
1594a6d42e7dSPeter Dunlap 			break;
1595a6d42e7dSPeter Dunlap 		case KI_DATA_DIGEST:
1596a6d42e7dSPeter Dunlap 			it->ic_conn_flags |= IDM_CONN_DATA_DIGEST;
1597a6d42e7dSPeter Dunlap 			break;
1598a6d42e7dSPeter Dunlap 		default:
1599a6d42e7dSPeter Dunlap 			ASSERT(0);
1600a6d42e7dSPeter Dunlap 			break;
1601a6d42e7dSPeter Dunlap 		}
1602a6d42e7dSPeter Dunlap 	} else if (strcasecmp(digest_choice_string, "none") == 0) {
1603a6d42e7dSPeter Dunlap 		switch (ikvx->ik_key_id) {
1604a6d42e7dSPeter Dunlap 		case KI_HEADER_DIGEST:
1605a6d42e7dSPeter Dunlap 			it->ic_conn_flags &= ~IDM_CONN_HEADER_DIGEST;
1606a6d42e7dSPeter Dunlap 			break;
1607a6d42e7dSPeter Dunlap 		case KI_DATA_DIGEST:
1608a6d42e7dSPeter Dunlap 			it->ic_conn_flags &= ~IDM_CONN_DATA_DIGEST;
1609a6d42e7dSPeter Dunlap 			break;
1610a6d42e7dSPeter Dunlap 		default:
1611a6d42e7dSPeter Dunlap 			ASSERT(0);
1612a6d42e7dSPeter Dunlap 			break;
1613a6d42e7dSPeter Dunlap 		}
1614a6d42e7dSPeter Dunlap 	} else {
1615a6d42e7dSPeter Dunlap 		ASSERT(0);
1616a6d42e7dSPeter Dunlap 	}
1617a6d42e7dSPeter Dunlap 
1618a6d42e7dSPeter Dunlap 	return (IDM_STATUS_SUCCESS);
1619a6d42e7dSPeter Dunlap }
1620a6d42e7dSPeter Dunlap 
1621a6d42e7dSPeter Dunlap 
1622a6d42e7dSPeter Dunlap /*
1623a6d42e7dSPeter Dunlap  * idm_so_conn_is_capable() verifies that the passed connection is provided
1624a6d42e7dSPeter Dunlap  * for by the sockets interface.
1625a6d42e7dSPeter Dunlap  */
1626a6d42e7dSPeter Dunlap /* ARGSUSED */
1627a6d42e7dSPeter Dunlap static boolean_t
1628a6d42e7dSPeter Dunlap idm_so_conn_is_capable(idm_conn_req_t *ic, idm_transport_caps_t *caps)
1629a6d42e7dSPeter Dunlap {
1630a6d42e7dSPeter Dunlap 	return (B_TRUE);
1631a6d42e7dSPeter Dunlap }
1632a6d42e7dSPeter Dunlap 
1633a6d42e7dSPeter Dunlap /*
1634a6d42e7dSPeter Dunlap  * idm_so_rx_datain() validates the Data Sequence number of the PDU. The
1635a6d42e7dSPeter Dunlap  * idm_sorecv_scsidata() function invoked earlier actually reads the data
1636a6d42e7dSPeter Dunlap  * off the socket into the appropriate buffers.
1637a6d42e7dSPeter Dunlap  */
1638a6d42e7dSPeter Dunlap static void
1639a6d42e7dSPeter Dunlap idm_so_rx_datain(idm_conn_t *ic, idm_pdu_t *pdu)
1640a6d42e7dSPeter Dunlap {
1641a6d42e7dSPeter Dunlap 	iscsi_data_hdr_t	*bhs;
1642a6d42e7dSPeter Dunlap 	idm_task_t		*idt;
1643a6d42e7dSPeter Dunlap 	idm_buf_t		*idb;
1644a6d42e7dSPeter Dunlap 	uint32_t		datasn;
1645a6d42e7dSPeter Dunlap 	size_t			offset;
1646a6d42e7dSPeter Dunlap 	iscsi_hdr_t		*ihp = (iscsi_hdr_t *)pdu->isp_hdr;
1647a6d42e7dSPeter Dunlap 	iscsi_data_rsp_hdr_t    *idrhp = (iscsi_data_rsp_hdr_t *)ihp;
1648a6d42e7dSPeter Dunlap 
1649a6d42e7dSPeter Dunlap 	ASSERT(ic != NULL);
1650a6d42e7dSPeter Dunlap 	ASSERT(pdu != NULL);
1651*2727bb05STim Kordas 	ASSERT(IDM_PDU_OPCODE(pdu) == ISCSI_OP_SCSI_DATA_RSP);
1652a6d42e7dSPeter Dunlap 
1653a6d42e7dSPeter Dunlap 	bhs	= (iscsi_data_hdr_t *)pdu->isp_hdr;
1654a6d42e7dSPeter Dunlap 	datasn	= ntohl(bhs->datasn);
1655a6d42e7dSPeter Dunlap 	offset	= ntohl(bhs->offset);
1656a6d42e7dSPeter Dunlap 
1657a6d42e7dSPeter Dunlap 	/*
1658a6d42e7dSPeter Dunlap 	 * Look up the task corresponding to the initiator task tag
1659a6d42e7dSPeter Dunlap 	 * to get the buffers affiliated with the task.
1660a6d42e7dSPeter Dunlap 	 */
1661a6d42e7dSPeter Dunlap 	idt = idm_task_find(ic, bhs->itt, bhs->ttt);
1662a6d42e7dSPeter Dunlap 	if (idt == NULL) {
1663a6d42e7dSPeter Dunlap 		IDM_CONN_LOG(CE_WARN, "idm_so_rx_datain: failed to find task");
1664a6d42e7dSPeter Dunlap 		idm_pdu_rx_protocol_error(ic, pdu);
1665a6d42e7dSPeter Dunlap 		return;
1666a6d42e7dSPeter Dunlap 	}
1667a6d42e7dSPeter Dunlap 
1668a6d42e7dSPeter Dunlap 	idb = pdu->isp_sorx_buf;
1669a6d42e7dSPeter Dunlap 	if (idb == NULL) {
1670a6d42e7dSPeter Dunlap 		IDM_CONN_LOG(CE_WARN,
1671a6d42e7dSPeter Dunlap 		    "idm_so_rx_datain: failed to find buffer");
1672a6d42e7dSPeter Dunlap 		idm_task_rele(idt);
1673a6d42e7dSPeter Dunlap 		idm_pdu_rx_protocol_error(ic, pdu);
1674a6d42e7dSPeter Dunlap 		return;
1675a6d42e7dSPeter Dunlap 	}
1676a6d42e7dSPeter Dunlap 
1677a6d42e7dSPeter Dunlap 	/*
1678a6d42e7dSPeter Dunlap 	 * DataSN values should be sequential and should not have any gaps or
1679a6d42e7dSPeter Dunlap 	 * repetitions. Check the DataSN with the one stored in the task.
1680a6d42e7dSPeter Dunlap 	 */
1681a6d42e7dSPeter Dunlap 	if (datasn == idt->idt_exp_datasn) {
1682a6d42e7dSPeter Dunlap 		idt->idt_exp_datasn++; /* keep track of DataSN received */
1683a6d42e7dSPeter Dunlap 	} else {
1684a6d42e7dSPeter Dunlap 		IDM_CONN_LOG(CE_WARN, "idm_so_rx_datain: datasn out of order");
1685a6d42e7dSPeter Dunlap 		idm_task_rele(idt);
1686a6d42e7dSPeter Dunlap 		idm_pdu_rx_protocol_error(ic, pdu);
1687a6d42e7dSPeter Dunlap 		return;
1688a6d42e7dSPeter Dunlap 	}
1689a6d42e7dSPeter Dunlap 
1690a6d42e7dSPeter Dunlap 	/*
1691a6d42e7dSPeter Dunlap 	 * PDUs in a sequence should be in continuously increasing
1692a6d42e7dSPeter Dunlap 	 * address offset
1693a6d42e7dSPeter Dunlap 	 */
1694a6d42e7dSPeter Dunlap 	if (offset != idb->idb_exp_offset) {
1695a6d42e7dSPeter Dunlap 		IDM_CONN_LOG(CE_WARN, "idm_so_rx_datain: unexpected offset");
169630e7468fSPeter Dunlap 		idm_task_rele(idt);
1697a6d42e7dSPeter Dunlap 		idm_pdu_rx_protocol_error(ic, pdu);
1698a6d42e7dSPeter Dunlap 		return;
1699a6d42e7dSPeter Dunlap 	}
1700a6d42e7dSPeter Dunlap 	/* Expected next relative buffer offset */
1701a6d42e7dSPeter Dunlap 	idb->idb_exp_offset += n2h24(bhs->dlength);
170230e7468fSPeter Dunlap 	idt->idt_rx_bytes += n2h24(bhs->dlength);
170330e7468fSPeter Dunlap 
170430e7468fSPeter Dunlap 	idm_task_rele(idt);
1705a6d42e7dSPeter Dunlap 
1706a6d42e7dSPeter Dunlap 	/*
1707a6d42e7dSPeter Dunlap 	 * For now call scsi_rsp which will process the data rsp
1708a6d42e7dSPeter Dunlap 	 * Revisit, need to provide an explicit client entry point for
1709a6d42e7dSPeter Dunlap 	 * phase collapse completions.
1710a6d42e7dSPeter Dunlap 	 */
1711*2727bb05STim Kordas 	if ((IDM_PDU_OPCODE(pdu) == ISCSI_OP_SCSI_DATA_RSP) &&
1712a6d42e7dSPeter Dunlap 	    (idrhp->flags & ISCSI_FLAG_DATA_STATUS)) {
1713a6d42e7dSPeter Dunlap 		(*ic->ic_conn_ops.icb_rx_scsi_rsp)(ic, pdu);
1714a6d42e7dSPeter Dunlap 	}
1715a6d42e7dSPeter Dunlap 
1716a6d42e7dSPeter Dunlap 	idm_pdu_complete(pdu, IDM_STATUS_SUCCESS);
1717a6d42e7dSPeter Dunlap }
1718a6d42e7dSPeter Dunlap 
1719a6d42e7dSPeter Dunlap /*
1720a6d42e7dSPeter Dunlap  * The idm_so_rx_dataout() function is used by the iSCSI target to read
1721a6d42e7dSPeter Dunlap  * data from the Data-Out PDU sent by the iSCSI initiator.
1722a6d42e7dSPeter Dunlap  *
1723a6d42e7dSPeter Dunlap  * This function gets the Initiator Task Tag from the PDU BHS and looks up the
1724a6d42e7dSPeter Dunlap  * task to get the buffers associated with the PDU. A PDU might span buffers.
1725a6d42e7dSPeter Dunlap  * The data is then read into the respective buffer.
1726a6d42e7dSPeter Dunlap  */
1727a6d42e7dSPeter Dunlap static void
1728a6d42e7dSPeter Dunlap idm_so_rx_dataout(idm_conn_t *ic, idm_pdu_t *pdu)
1729a6d42e7dSPeter Dunlap {
1730a6d42e7dSPeter Dunlap 
1731a6d42e7dSPeter Dunlap 	iscsi_data_hdr_t	*bhs;
1732a6d42e7dSPeter Dunlap 	idm_task_t		*idt;
1733a6d42e7dSPeter Dunlap 	idm_buf_t		*idb;
1734a6d42e7dSPeter Dunlap 	size_t			offset;
1735a6d42e7dSPeter Dunlap 
1736a6d42e7dSPeter Dunlap 	ASSERT(ic != NULL);
1737a6d42e7dSPeter Dunlap 	ASSERT(pdu != NULL);
1738*2727bb05STim Kordas 	ASSERT(IDM_PDU_OPCODE(pdu) == ISCSI_OP_SCSI_DATA);
1739a6d42e7dSPeter Dunlap 
1740a6d42e7dSPeter Dunlap 	bhs = (iscsi_data_hdr_t *)pdu->isp_hdr;
1741a6d42e7dSPeter Dunlap 	offset = ntohl(bhs->offset);
1742a6d42e7dSPeter Dunlap 
1743a6d42e7dSPeter Dunlap 	/*
1744a6d42e7dSPeter Dunlap 	 * Look up the task corresponding to the initiator task tag
1745a6d42e7dSPeter Dunlap 	 * to get the buffers affiliated with the task.
1746a6d42e7dSPeter Dunlap 	 */
1747a6d42e7dSPeter Dunlap 	idt = idm_task_find(ic, bhs->itt, bhs->ttt);
1748a6d42e7dSPeter Dunlap 	if (idt == NULL) {
1749a6d42e7dSPeter Dunlap 		IDM_CONN_LOG(CE_WARN,
1750a6d42e7dSPeter Dunlap 		    "idm_so_rx_dataout: failed to find task");
1751a6d42e7dSPeter Dunlap 		idm_pdu_rx_protocol_error(ic, pdu);
1752a6d42e7dSPeter Dunlap 		return;
1753a6d42e7dSPeter Dunlap 	}
1754a6d42e7dSPeter Dunlap 
1755a6d42e7dSPeter Dunlap 	idb = pdu->isp_sorx_buf;
1756a6d42e7dSPeter Dunlap 	if (idb == NULL) {
1757a6d42e7dSPeter Dunlap 		IDM_CONN_LOG(CE_WARN,
1758a6d42e7dSPeter Dunlap 		    "idm_so_rx_dataout: failed to find buffer");
1759a6d42e7dSPeter Dunlap 		idm_task_rele(idt);
1760a6d42e7dSPeter Dunlap 		idm_pdu_rx_protocol_error(ic, pdu);
1761a6d42e7dSPeter Dunlap 		return;
1762a6d42e7dSPeter Dunlap 	}
1763a6d42e7dSPeter Dunlap 
1764a6d42e7dSPeter Dunlap 	/* Keep track of data transferred - check data offsets */
1765a6d42e7dSPeter Dunlap 	if (offset != idb->idb_exp_offset) {
1766a6d42e7dSPeter Dunlap 		IDM_CONN_LOG(CE_NOTE, "idm_so_rx_dataout: offset out of seq: "
1767a6d42e7dSPeter Dunlap 		    "%ld, %d", offset, idb->idb_exp_offset);
1768a6d42e7dSPeter Dunlap 		idm_task_rele(idt);
1769a6d42e7dSPeter Dunlap 		idm_pdu_rx_protocol_error(ic, pdu);
1770a6d42e7dSPeter Dunlap 		return;
1771a6d42e7dSPeter Dunlap 	}
1772a6d42e7dSPeter Dunlap 	/* Expected next relative offset */
1773a6d42e7dSPeter Dunlap 	idb->idb_exp_offset += ntoh24(bhs->dlength);
177430e7468fSPeter Dunlap 	idt->idt_rx_bytes += n2h24(bhs->dlength);
1775a6d42e7dSPeter Dunlap 
1776a6d42e7dSPeter Dunlap 	/*
1777a6d42e7dSPeter Dunlap 	 * Call the buffer callback when the transfer is complete
1778a6d42e7dSPeter Dunlap 	 *
1779a6d42e7dSPeter Dunlap 	 * The connection state machine should only abort tasks after
1780a6d42e7dSPeter Dunlap 	 * shutting down the connection so we are assured that there
1781a6d42e7dSPeter Dunlap 	 * won't be a simultaneous attempt to abort this task at the
1782a6d42e7dSPeter Dunlap 	 * same time as we are processing this PDU (due to a connection
1783a6d42e7dSPeter Dunlap 	 * state change).
1784a6d42e7dSPeter Dunlap 	 */
1785a6d42e7dSPeter Dunlap 	if (bhs->flags & ISCSI_FLAG_FINAL) {
1786*2727bb05STim Kordas 		/*
1787*2727bb05STim Kordas 		 * We have gotten the last data-message for the current
1788*2727bb05STim Kordas 		 * transfer.  idb_xfer_len represents the data that the
1789*2727bb05STim Kordas 		 * command intended to transfer, it does not represent the
1790*2727bb05STim Kordas 		 * actual number of bytes transferred. If we have not
1791*2727bb05STim Kordas 		 * transferred the expected number of bytes something is
1792*2727bb05STim Kordas 		 * wrong.
1793*2727bb05STim Kordas 		 *
1794*2727bb05STim Kordas 		 * We have two options, when there is a mismatch, we can
1795*2727bb05STim Kordas 		 * regard the transfer as invalid -- or we can modify our
1796*2727bb05STim Kordas 		 * notion of "xfer_len." In order to be as stringent as
1797*2727bb05STim Kordas 		 * possible, here we regard this transfer as in error; and
1798*2727bb05STim Kordas 		 * bail out.
1799*2727bb05STim Kordas 		 */
1800*2727bb05STim Kordas 		if (idb->idb_buflen == idb->idb_xfer_len &&
1801*2727bb05STim Kordas 		    idb->idb_buflen !=
1802*2727bb05STim Kordas 		    (idb->idb_exp_offset - idb->idb_bufoffset)) {
1803*2727bb05STim Kordas 			printf("idm_so_rx_dataout: incomplete transfer, "
1804*2727bb05STim Kordas 			    "protocol err");
1805*2727bb05STim Kordas 			IDM_CONN_LOG(CE_NOTE,
1806*2727bb05STim Kordas 			    "idm_so_rx_dataout: incomplete transfer: %ld, %d",
1807*2727bb05STim Kordas 			    offset, (int)(idb->idb_exp_offset - offset));
1808*2727bb05STim Kordas 			idm_task_rele(idt);
1809*2727bb05STim Kordas 			idm_pdu_rx_protocol_error(ic, pdu);
1810*2727bb05STim Kordas 			return;
1811*2727bb05STim Kordas 		}
1812a6d42e7dSPeter Dunlap 		/*
1813a6d42e7dSPeter Dunlap 		 * We only want to call idm_buf_rx_from_ini_done once
1814a6d42e7dSPeter Dunlap 		 * per transfer.  It's possible that this task has
1815a6d42e7dSPeter Dunlap 		 * already been aborted in which case
1816a6d42e7dSPeter Dunlap 		 * idm_so_free_task_rsrc will call idm_buf_rx_from_ini_done
1817a6d42e7dSPeter Dunlap 		 * for each buffer with idb_in_transport==B_TRUE.  To
1818a6d42e7dSPeter Dunlap 		 * close this window and ensure that this doesn't happen,
1819a6d42e7dSPeter Dunlap 		 * we'll clear idb->idb_in_transport now while holding
1820a6d42e7dSPeter Dunlap 		 * the task mutex.   This is only really an issue for
1821a6d42e7dSPeter Dunlap 		 * SCSI task abort -- if tasks were being aborted because
1822a6d42e7dSPeter Dunlap 		 * of a connection state change the state machine would
1823a6d42e7dSPeter Dunlap 		 * have already stopped the receive thread.
1824a6d42e7dSPeter Dunlap 		 */
1825a6d42e7dSPeter Dunlap 		mutex_enter(&idt->idt_mutex);
1826a6d42e7dSPeter Dunlap 
1827a6d42e7dSPeter Dunlap 		/*
1828a6d42e7dSPeter Dunlap 		 * Release the task hold here (obtained in idm_task_find)
1829a6d42e7dSPeter Dunlap 		 * because the task may complete synchronously during
1830a6d42e7dSPeter Dunlap 		 * idm_buf_rx_from_ini_done.  Since we still have an active
1831a6d42e7dSPeter Dunlap 		 * buffer we know there is at least one additional hold on idt.
1832a6d42e7dSPeter Dunlap 		 */
1833a6d42e7dSPeter Dunlap 		idm_task_rele(idt);
1834a6d42e7dSPeter Dunlap 
1835a6d42e7dSPeter Dunlap 		/*
1836a6d42e7dSPeter Dunlap 		 * idm_buf_rx_from_ini_done releases idt->idt_mutex
1837a6d42e7dSPeter Dunlap 		 */
1838a668b114SPriya Krishnan 		DTRACE_ISCSI_8(xfer__done, idm_conn_t *, idt->idt_ic,
1839a668b114SPriya Krishnan 		    uintptr_t, idb->idb_buf, uint32_t, idb->idb_bufoffset,
1840a668b114SPriya Krishnan 		    uint64_t, 0, uint32_t, 0, uint32_t, 0,
1841a668b114SPriya Krishnan 		    uint32_t, idb->idb_xfer_len,
1842a668b114SPriya Krishnan 		    int, XFER_BUF_RX_FROM_INI);
1843a6d42e7dSPeter Dunlap 		idm_buf_rx_from_ini_done(idt, idb, IDM_STATUS_SUCCESS);
1844a6d42e7dSPeter Dunlap 		idm_pdu_complete(pdu, IDM_STATUS_SUCCESS);
1845a6d42e7dSPeter Dunlap 		return;
1846a6d42e7dSPeter Dunlap 	}
1847a6d42e7dSPeter Dunlap 
1848a6d42e7dSPeter Dunlap 	idm_task_rele(idt);
1849a6d42e7dSPeter Dunlap 	idm_pdu_complete(pdu, IDM_STATUS_SUCCESS);
1850a6d42e7dSPeter Dunlap }
1851a6d42e7dSPeter Dunlap 
1852a6d42e7dSPeter Dunlap /*
1853a6d42e7dSPeter Dunlap  * The idm_so_rx_rtt() function is used by the iSCSI initiator to handle
1854a6d42e7dSPeter Dunlap  * the R2T PDU sent by the iSCSI target indicating that it is ready to
1855a6d42e7dSPeter Dunlap  * accept data. This gets the Initiator Task Tag (itt) from the PDU BHS
1856a6d42e7dSPeter Dunlap  * and looks up the task in the task tree using the itt to get the output
1857a6d42e7dSPeter Dunlap  * buffers associated the task. The R2T PDU contains the offset of the
1858a6d42e7dSPeter Dunlap  * requested data and the data length. This function then constructs a
1859a6d42e7dSPeter Dunlap  * sequence of iSCSI PDUs and outputs the requested data. Each Data-Out
1860a6d42e7dSPeter Dunlap  * PDU is associated with the R2T by the Target Transfer Tag  (ttt).
1861a6d42e7dSPeter Dunlap  */
186230e7468fSPeter Dunlap 
1863a6d42e7dSPeter Dunlap static void
1864a6d42e7dSPeter Dunlap idm_so_rx_rtt(idm_conn_t *ic, idm_pdu_t *pdu)
1865a6d42e7dSPeter Dunlap {
1866a6d42e7dSPeter Dunlap 	idm_task_t		*idt;
1867a6d42e7dSPeter Dunlap 	idm_buf_t		*idb;
1868a6d42e7dSPeter Dunlap 	iscsi_rtt_hdr_t		*rtt_hdr;
1869a6d42e7dSPeter Dunlap 	uint32_t		data_offset;
187030e7468fSPeter Dunlap 	uint32_t		data_length;
1871a6d42e7dSPeter Dunlap 
1872a6d42e7dSPeter Dunlap 	ASSERT(ic != NULL);
1873a6d42e7dSPeter Dunlap 	ASSERT(pdu != NULL);
1874a6d42e7dSPeter Dunlap 
1875a6d42e7dSPeter Dunlap 	rtt_hdr	= (iscsi_rtt_hdr_t *)pdu->isp_hdr;
1876a6d42e7dSPeter Dunlap 	data_offset = ntohl(rtt_hdr->data_offset);
187730e7468fSPeter Dunlap 	data_length = ntohl(rtt_hdr->data_length);
1878a6d42e7dSPeter Dunlap 	idt	= idm_task_find(ic, rtt_hdr->itt, rtt_hdr->ttt);
1879a6d42e7dSPeter Dunlap 
1880a6d42e7dSPeter Dunlap 	if (idt == NULL) {
1881a6d42e7dSPeter Dunlap 		IDM_CONN_LOG(CE_WARN, "idm_so_rx_rtt: could not find task");
1882a6d42e7dSPeter Dunlap 		idm_pdu_rx_protocol_error(ic, pdu);
1883a6d42e7dSPeter Dunlap 		return;
1884a6d42e7dSPeter Dunlap 	}
1885a6d42e7dSPeter Dunlap 
1886a6d42e7dSPeter Dunlap 	/* Find the buffer bound to the task by the iSCSI initiator */
1887a6d42e7dSPeter Dunlap 	mutex_enter(&idt->idt_mutex);
1888a6d42e7dSPeter Dunlap 	idb = idm_buf_find(&idt->idt_outbufv, data_offset);
1889a6d42e7dSPeter Dunlap 	if (idb == NULL) {
1890a6d42e7dSPeter Dunlap 		mutex_exit(&idt->idt_mutex);
1891a6d42e7dSPeter Dunlap 		idm_task_rele(idt);
1892a6d42e7dSPeter Dunlap 		IDM_CONN_LOG(CE_WARN, "idm_so_rx_rtt: could not find buffer");
1893a6d42e7dSPeter Dunlap 		idm_pdu_rx_protocol_error(ic, pdu);
1894a6d42e7dSPeter Dunlap 		return;
1895a6d42e7dSPeter Dunlap 	}
1896a6d42e7dSPeter Dunlap 
189730e7468fSPeter Dunlap 	/* return buffer contains this data */
189830e7468fSPeter Dunlap 	if (data_offset + data_length > idb->idb_buflen) {
189930e7468fSPeter Dunlap 		/* Overflow */
190030e7468fSPeter Dunlap 		mutex_exit(&idt->idt_mutex);
190130e7468fSPeter Dunlap 		idm_task_rele(idt);
190230e7468fSPeter Dunlap 		IDM_CONN_LOG(CE_WARN, "idm_so_rx_rtt: read from outside "
190330e7468fSPeter Dunlap 		    "buffer");
190430e7468fSPeter Dunlap 		idm_pdu_rx_protocol_error(ic, pdu);
190530e7468fSPeter Dunlap 		return;
190630e7468fSPeter Dunlap 	}
190730e7468fSPeter Dunlap 
190830e7468fSPeter Dunlap 	idt->idt_r2t_ttt = rtt_hdr->ttt;
190930e7468fSPeter Dunlap 	idt->idt_exp_datasn = 0;
191030e7468fSPeter Dunlap 
191130e7468fSPeter Dunlap 	idm_so_send_rtt_data(ic, idt, idb, data_offset,
191230e7468fSPeter Dunlap 	    ntohl(rtt_hdr->data_length));
1913c158b55cSJack Meng 	/*
1914c158b55cSJack Meng 	 * the idt_mutex is released in idm_so_send_rtt_data
1915c158b55cSJack Meng 	 */
1916a6d42e7dSPeter Dunlap 
1917a6d42e7dSPeter Dunlap 	idm_pdu_complete(pdu, IDM_STATUS_SUCCESS);
1918a6d42e7dSPeter Dunlap 	idm_task_rele(idt);
1919a6d42e7dSPeter Dunlap 
1920a6d42e7dSPeter Dunlap }
1921a6d42e7dSPeter Dunlap 
1922a6d42e7dSPeter Dunlap idm_status_t
1923a6d42e7dSPeter Dunlap idm_sorecvdata(idm_conn_t *ic, idm_pdu_t *pdu)
1924a6d42e7dSPeter Dunlap {
1925a6d42e7dSPeter Dunlap 	uint8_t		pad[ISCSI_PAD_WORD_LEN];
1926a6d42e7dSPeter Dunlap 	int		pad_len;
1927a6d42e7dSPeter Dunlap 	uint32_t	data_digest_crc;
1928a6d42e7dSPeter Dunlap 	uint32_t	crc_calculated;
1929a6d42e7dSPeter Dunlap 	int		total_len;
1930a6d42e7dSPeter Dunlap 	idm_so_conn_t	*so_conn;
1931a6d42e7dSPeter Dunlap 
1932a6d42e7dSPeter Dunlap 	so_conn = ic->ic_transport_private;
1933a6d42e7dSPeter Dunlap 
1934a6d42e7dSPeter Dunlap 	pad_len = ((ISCSI_PAD_WORD_LEN -
1935a6d42e7dSPeter Dunlap 	    (pdu->isp_datalen & (ISCSI_PAD_WORD_LEN - 1))) &
1936a6d42e7dSPeter Dunlap 	    (ISCSI_PAD_WORD_LEN - 1));
1937a6d42e7dSPeter Dunlap 
1938a6d42e7dSPeter Dunlap 	ASSERT(pdu->isp_iovlen < (PDU_MAX_IOVLEN - 2)); /* pad + data digest */
1939a6d42e7dSPeter Dunlap 
1940a6d42e7dSPeter Dunlap 	total_len = pdu->isp_datalen;
1941a6d42e7dSPeter Dunlap 
1942a6d42e7dSPeter Dunlap 	if (pad_len) {
1943a6d42e7dSPeter Dunlap 		pdu->isp_iov[pdu->isp_iovlen].iov_base	= (char *)&pad;
1944a6d42e7dSPeter Dunlap 		pdu->isp_iov[pdu->isp_iovlen].iov_len	= pad_len;
1945a6d42e7dSPeter Dunlap 		total_len		+= pad_len;
1946a6d42e7dSPeter Dunlap 		pdu->isp_iovlen++;
1947a6d42e7dSPeter Dunlap 	}
1948a6d42e7dSPeter Dunlap 
1949a6d42e7dSPeter Dunlap 	/* setup data digest */
1950a6d42e7dSPeter Dunlap 	if ((ic->ic_conn_flags & IDM_CONN_DATA_DIGEST) != 0) {
1951a6d42e7dSPeter Dunlap 		pdu->isp_iov[pdu->isp_iovlen].iov_base =
1952a6d42e7dSPeter Dunlap 		    (char *)&data_digest_crc;
1953a6d42e7dSPeter Dunlap 		pdu->isp_iov[pdu->isp_iovlen].iov_len =
1954a6d42e7dSPeter Dunlap 		    sizeof (data_digest_crc);
1955a6d42e7dSPeter Dunlap 		total_len		+= sizeof (data_digest_crc);
1956a6d42e7dSPeter Dunlap 		pdu->isp_iovlen++;
1957a6d42e7dSPeter Dunlap 	}
1958a6d42e7dSPeter Dunlap 
195930e7468fSPeter Dunlap 	pdu->isp_data = (uint8_t *)(uintptr_t)pdu->isp_iov[0].iov_base;
196030e7468fSPeter Dunlap 
1961a6d42e7dSPeter Dunlap 	if (idm_iov_sorecv(so_conn->ic_so, &pdu->isp_iov[0],
1962a6d42e7dSPeter Dunlap 	    pdu->isp_iovlen, total_len) != 0) {
1963a6d42e7dSPeter Dunlap 		return (IDM_STATUS_IO);
1964a6d42e7dSPeter Dunlap 	}
1965a6d42e7dSPeter Dunlap 
1966a6d42e7dSPeter Dunlap 	if ((ic->ic_conn_flags & IDM_CONN_DATA_DIGEST) != 0) {
1967a6d42e7dSPeter Dunlap 		crc_calculated = idm_crc32c(pdu->isp_data,
1968a6d42e7dSPeter Dunlap 		    pdu->isp_datalen);
1969a6d42e7dSPeter Dunlap 		if (pad_len) {
1970a6d42e7dSPeter Dunlap 			crc_calculated = idm_crc32c_continued((char *)&pad,
1971a6d42e7dSPeter Dunlap 			    pad_len, crc_calculated);
1972a6d42e7dSPeter Dunlap 		}
1973a6d42e7dSPeter Dunlap 		if (crc_calculated != data_digest_crc) {
1974a6d42e7dSPeter Dunlap 			IDM_CONN_LOG(CE_WARN,
1975a6d42e7dSPeter Dunlap 			    "idm_sorecvdata: "
1976a6d42e7dSPeter Dunlap 			    "CRC error: actual 0x%x, calc 0x%x",
1977a6d42e7dSPeter Dunlap 			    data_digest_crc, crc_calculated);
1978a6d42e7dSPeter Dunlap 
1979a6d42e7dSPeter Dunlap 			/* Invalid Data Digest */
1980a6d42e7dSPeter Dunlap 			return (IDM_STATUS_DATA_DIGEST);
1981a6d42e7dSPeter Dunlap 		}
1982a6d42e7dSPeter Dunlap 	}
1983a6d42e7dSPeter Dunlap 
1984a6d42e7dSPeter Dunlap 	return (IDM_STATUS_SUCCESS);
1985a6d42e7dSPeter Dunlap }
1986a6d42e7dSPeter Dunlap 
1987a6d42e7dSPeter Dunlap /*
1988a6d42e7dSPeter Dunlap  * idm_sorecv_scsidata() is used to receive scsi data from the socket. The
1989a6d42e7dSPeter Dunlap  * Data-type PDU header must be read into the idm_pdu_t structure prior to
1990a6d42e7dSPeter Dunlap  * calling this function.
1991a6d42e7dSPeter Dunlap  */
1992a6d42e7dSPeter Dunlap idm_status_t
1993a6d42e7dSPeter Dunlap idm_sorecv_scsidata(idm_conn_t *ic, idm_pdu_t *pdu)
1994a6d42e7dSPeter Dunlap {
1995a6d42e7dSPeter Dunlap 	iscsi_data_hdr_t	*bhs;
1996a6d42e7dSPeter Dunlap 	idm_task_t		*task;
1997a6d42e7dSPeter Dunlap 	uint32_t		offset;
1998a6d42e7dSPeter Dunlap 	uint8_t			opcode;
1999a6d42e7dSPeter Dunlap 	uint32_t		dlength;
2000a6d42e7dSPeter Dunlap 	list_t			*buflst;
2001a6d42e7dSPeter Dunlap 	uint32_t		xfer_bytes;
2002a6d42e7dSPeter Dunlap 	idm_status_t		status;
2003a6d42e7dSPeter Dunlap 
2004a6d42e7dSPeter Dunlap 	ASSERT(ic != NULL);
2005a6d42e7dSPeter Dunlap 	ASSERT(pdu != NULL);
2006a6d42e7dSPeter Dunlap 
2007a6d42e7dSPeter Dunlap 	bhs	= (iscsi_data_hdr_t *)pdu->isp_hdr;
2008a6d42e7dSPeter Dunlap 
2009a6d42e7dSPeter Dunlap 	offset	= ntohl(bhs->offset);
2010*2727bb05STim Kordas 	opcode	= IDM_PDU_OPCODE(pdu);
2011a6d42e7dSPeter Dunlap 	dlength = n2h24(bhs->dlength);
2012a6d42e7dSPeter Dunlap 
2013a6d42e7dSPeter Dunlap 	ASSERT((opcode == ISCSI_OP_SCSI_DATA_RSP) ||
2014a6d42e7dSPeter Dunlap 	    (opcode == ISCSI_OP_SCSI_DATA));
2015a6d42e7dSPeter Dunlap 
2016a6d42e7dSPeter Dunlap 	/*
2017a6d42e7dSPeter Dunlap 	 * Successful lookup implicitly gets a "hold" on the task.  This
2018a6d42e7dSPeter Dunlap 	 * hold must be released before leaving this function.  At one
2019a6d42e7dSPeter Dunlap 	 * point we were caching this task context and retaining the hold
2020a6d42e7dSPeter Dunlap 	 * but it turned out to be very difficult to release the hold properly.
2021a6d42e7dSPeter Dunlap 	 * The task can be aborted and the connection shutdown between this
2022a6d42e7dSPeter Dunlap 	 * call and the subsequent expected call to idm_so_rx_datain/
2023a6d42e7dSPeter Dunlap 	 * idm_so_rx_dataout (in which case those functions are not called).
2024a6d42e7dSPeter Dunlap 	 * Releasing the hold in the PDU callback doesn't work well either
2025a6d42e7dSPeter Dunlap 	 * because the whole task may be completed by then at which point
2026a6d42e7dSPeter Dunlap 	 * it is too late to release the hold -- for better or worse this
2027a6d42e7dSPeter Dunlap 	 * code doesn't wait on the refcnts during normal operation.
2028a6d42e7dSPeter Dunlap 	 * idm_task_find() is very fast and it is not a huge burden if we
2029a6d42e7dSPeter Dunlap 	 * have to do it twice.
2030a6d42e7dSPeter Dunlap 	 */
2031a6d42e7dSPeter Dunlap 	task = idm_task_find(ic, bhs->itt, bhs->ttt);
2032a6d42e7dSPeter Dunlap 	if (task == NULL) {
2033a6d42e7dSPeter Dunlap 		IDM_CONN_LOG(CE_WARN,
2034a6d42e7dSPeter Dunlap 		    "idm_sorecv_scsidata: could not find task");
2035a6d42e7dSPeter Dunlap 		return (IDM_STATUS_FAIL);
2036a6d42e7dSPeter Dunlap 	}
2037a6d42e7dSPeter Dunlap 
2038a6d42e7dSPeter Dunlap 	mutex_enter(&task->idt_mutex);
2039a6d42e7dSPeter Dunlap 	buflst	= (opcode == ISCSI_OP_SCSI_DATA_RSP) ?
2040a6d42e7dSPeter Dunlap 	    &task->idt_inbufv : &task->idt_outbufv;
2041a6d42e7dSPeter Dunlap 	pdu->isp_sorx_buf = idm_buf_find(buflst, offset);
2042a6d42e7dSPeter Dunlap 	mutex_exit(&task->idt_mutex);
2043a6d42e7dSPeter Dunlap 
2044a6d42e7dSPeter Dunlap 	if (pdu->isp_sorx_buf == NULL) {
2045a6d42e7dSPeter Dunlap 		idm_task_rele(task);
2046a6d42e7dSPeter Dunlap 		IDM_CONN_LOG(CE_WARN, "idm_sorecv_scsidata: could not find "
2047a6d42e7dSPeter Dunlap 		    "buffer for offset %x opcode=%x",
2048a6d42e7dSPeter Dunlap 		    offset, opcode);
2049a6d42e7dSPeter Dunlap 		return (IDM_STATUS_FAIL);
2050a6d42e7dSPeter Dunlap 	}
2051a6d42e7dSPeter Dunlap 
2052a6d42e7dSPeter Dunlap 	xfer_bytes = idm_fill_iov(pdu, pdu->isp_sorx_buf, offset, dlength);
2053a6d42e7dSPeter Dunlap 	ASSERT(xfer_bytes != 0);
2054a6d42e7dSPeter Dunlap 	if (xfer_bytes != dlength) {
2055a6d42e7dSPeter Dunlap 		idm_task_rele(task);
2056a6d42e7dSPeter Dunlap 		/*
2057a6d42e7dSPeter Dunlap 		 * Buffer overflow, connection error.  The PDU data is still
2058a6d42e7dSPeter Dunlap 		 * sitting in the socket so we can't use the connection
2059a6d42e7dSPeter Dunlap 		 * again until that data is drained.
2060a6d42e7dSPeter Dunlap 		 */
2061a6d42e7dSPeter Dunlap 		return (IDM_STATUS_FAIL);
2062a6d42e7dSPeter Dunlap 	}
2063a6d42e7dSPeter Dunlap 
2064a6d42e7dSPeter Dunlap 	status = idm_sorecvdata(ic, pdu);
2065a6d42e7dSPeter Dunlap 
2066a6d42e7dSPeter Dunlap 	idm_task_rele(task);
2067a6d42e7dSPeter Dunlap 
2068a6d42e7dSPeter Dunlap 	return (status);
2069a6d42e7dSPeter Dunlap }
2070a6d42e7dSPeter Dunlap 
2071a6d42e7dSPeter Dunlap static uint32_t
2072a6d42e7dSPeter Dunlap idm_fill_iov(idm_pdu_t *pdu, idm_buf_t *idb, uint32_t ro, uint32_t dlength)
2073a6d42e7dSPeter Dunlap {
2074a6d42e7dSPeter Dunlap 	uint32_t	buf_ro = ro - idb->idb_bufoffset;
2075a6d42e7dSPeter Dunlap 	uint32_t	xfer_len = min(dlength, idb->idb_buflen - buf_ro);
2076a6d42e7dSPeter Dunlap 
2077a6d42e7dSPeter Dunlap 	ASSERT(ro >= idb->idb_bufoffset);
2078a6d42e7dSPeter Dunlap 
2079a6d42e7dSPeter Dunlap 	pdu->isp_iov[pdu->isp_iovlen].iov_base	=
2080a6d42e7dSPeter Dunlap 	    (caddr_t)idb->idb_buf + buf_ro;
2081a6d42e7dSPeter Dunlap 	pdu->isp_iov[pdu->isp_iovlen].iov_len	= xfer_len;
2082a6d42e7dSPeter Dunlap 	pdu->isp_iovlen++;
2083a6d42e7dSPeter Dunlap 
2084a6d42e7dSPeter Dunlap 	return (xfer_len);
2085a6d42e7dSPeter Dunlap }
2086a6d42e7dSPeter Dunlap 
2087a6d42e7dSPeter Dunlap int
2088a6d42e7dSPeter Dunlap idm_sorecv_nonscsidata(idm_conn_t *ic, idm_pdu_t *pdu)
2089a6d42e7dSPeter Dunlap {
2090a6d42e7dSPeter Dunlap 	pdu->isp_data = kmem_alloc(pdu->isp_datalen, KM_SLEEP);
2091a6d42e7dSPeter Dunlap 	ASSERT(pdu->isp_data != NULL);
2092a6d42e7dSPeter Dunlap 
2093a6d42e7dSPeter Dunlap 	pdu->isp_databuflen = pdu->isp_datalen;
2094a6d42e7dSPeter Dunlap 	pdu->isp_iov[0].iov_base = (caddr_t)pdu->isp_data;
2095a6d42e7dSPeter Dunlap 	pdu->isp_iov[0].iov_len = pdu->isp_datalen;
2096a6d42e7dSPeter Dunlap 	pdu->isp_iovlen = 1;
2097a6d42e7dSPeter Dunlap 	/*
2098a6d42e7dSPeter Dunlap 	 * Since we are associating a new data buffer with this received
2099a6d42e7dSPeter Dunlap 	 * PDU we need to set a specific callback to free the data
2100a6d42e7dSPeter Dunlap 	 * after the PDU is processed.
2101a6d42e7dSPeter Dunlap 	 */
2102a6d42e7dSPeter Dunlap 	pdu->isp_flags |= IDM_PDU_ADDL_DATA;
2103a6d42e7dSPeter Dunlap 	pdu->isp_callback = idm_sorx_addl_pdu_cb;
2104a6d42e7dSPeter Dunlap 
2105a6d42e7dSPeter Dunlap 	return (idm_sorecvdata(ic, pdu));
2106a6d42e7dSPeter Dunlap }
2107a6d42e7dSPeter Dunlap 
2108a6d42e7dSPeter Dunlap void
2109a6d42e7dSPeter Dunlap idm_sorx_thread(void *arg)
2110a6d42e7dSPeter Dunlap {
2111a6d42e7dSPeter Dunlap 	boolean_t	conn_failure = B_FALSE;
2112a6d42e7dSPeter Dunlap 	idm_conn_t	*ic = (idm_conn_t *)arg;
2113a6d42e7dSPeter Dunlap 	idm_so_conn_t	*so_conn;
2114a6d42e7dSPeter Dunlap 	idm_pdu_t	*pdu;
2115a6d42e7dSPeter Dunlap 	idm_status_t	rc;
2116a6d42e7dSPeter Dunlap 
2117a6d42e7dSPeter Dunlap 	idm_conn_hold(ic);
2118a6d42e7dSPeter Dunlap 
2119a6d42e7dSPeter Dunlap 	mutex_enter(&ic->ic_mutex);
2120a6d42e7dSPeter Dunlap 
2121a6d42e7dSPeter Dunlap 	so_conn = ic->ic_transport_private;
2122a6d42e7dSPeter Dunlap 	so_conn->ic_rx_thread_running = B_TRUE;
2123a6d42e7dSPeter Dunlap 	so_conn->ic_rx_thread_did = so_conn->ic_rx_thread->t_did;
2124a6d42e7dSPeter Dunlap 	cv_signal(&ic->ic_cv);
2125a6d42e7dSPeter Dunlap 
2126a6d42e7dSPeter Dunlap 	while (so_conn->ic_rx_thread_running) {
2127a6d42e7dSPeter Dunlap 		mutex_exit(&ic->ic_mutex);
2128a6d42e7dSPeter Dunlap 
2129a6d42e7dSPeter Dunlap 		/*
2130a6d42e7dSPeter Dunlap 		 * Get PDU with default header size (large enough for
2131a6d42e7dSPeter Dunlap 		 * BHS plus any anticipated AHS).  PDU from
2132a6d42e7dSPeter Dunlap 		 * the cache will have all values set correctly
2133a6d42e7dSPeter Dunlap 		 * for sockets RX including callback.
2134a6d42e7dSPeter Dunlap 		 */
2135a6d42e7dSPeter Dunlap 		pdu = kmem_cache_alloc(idm.idm_sorx_pdu_cache, KM_SLEEP);
2136a6d42e7dSPeter Dunlap 		pdu->isp_ic = ic;
2137a6d42e7dSPeter Dunlap 		pdu->isp_flags = 0;
2138a6d42e7dSPeter Dunlap 		pdu->isp_transport_hdrlen = 0;
2139a6d42e7dSPeter Dunlap 
2140a6d42e7dSPeter Dunlap 		if ((rc = idm_sorecvhdr(ic, pdu)) != 0) {
2141a6d42e7dSPeter Dunlap 			/*
2142a6d42e7dSPeter Dunlap 			 * Call idm_pdu_complete so that we call the callback
2143a6d42e7dSPeter Dunlap 			 * and ensure any memory allocated in idm_sorecvhdr
2144a6d42e7dSPeter Dunlap 			 * gets freed up.
2145a6d42e7dSPeter Dunlap 			 */
2146a6d42e7dSPeter Dunlap 			idm_pdu_complete(pdu, IDM_STATUS_FAIL);
2147a6d42e7dSPeter Dunlap 
2148a6d42e7dSPeter Dunlap 			/*
2149a6d42e7dSPeter Dunlap 			 * If ic_rx_thread_running is still set then
2150a6d42e7dSPeter Dunlap 			 * this is some kind of connection problem
2151a6d42e7dSPeter Dunlap 			 * on the socket.  In this case we want to
2152a6d42e7dSPeter Dunlap 			 * generate an event.  Otherwise some other
2153a6d42e7dSPeter Dunlap 			 * thread closed the socket due to another
2154a6d42e7dSPeter Dunlap 			 * issue in which case we don't need to
2155a6d42e7dSPeter Dunlap 			 * generate an event.
2156a6d42e7dSPeter Dunlap 			 */
2157a6d42e7dSPeter Dunlap 			mutex_enter(&ic->ic_mutex);
2158a6d42e7dSPeter Dunlap 			if (so_conn->ic_rx_thread_running) {
2159a6d42e7dSPeter Dunlap 				conn_failure = B_TRUE;
2160a6d42e7dSPeter Dunlap 				so_conn->ic_rx_thread_running = B_FALSE;
2161a6d42e7dSPeter Dunlap 			}
2162a6d42e7dSPeter Dunlap 
2163a6d42e7dSPeter Dunlap 			continue;
2164a6d42e7dSPeter Dunlap 		}
2165a6d42e7dSPeter Dunlap 
2166a6d42e7dSPeter Dunlap 		/*
2167a6d42e7dSPeter Dunlap 		 * Header has been read and validated.  Now we need
2168a6d42e7dSPeter Dunlap 		 * to read the PDU data payload (if present).  SCSI data
2169a6d42e7dSPeter Dunlap 		 * need to be transferred from the socket directly into
2170a6d42e7dSPeter Dunlap 		 * the associated transfer buffer for the SCSI task.
2171a6d42e7dSPeter Dunlap 		 */
2172a6d42e7dSPeter Dunlap 		if (pdu->isp_datalen != 0) {
2173a6d42e7dSPeter Dunlap 			if ((IDM_PDU_OPCODE(pdu) == ISCSI_OP_SCSI_DATA) ||
2174a6d42e7dSPeter Dunlap 			    (IDM_PDU_OPCODE(pdu) == ISCSI_OP_SCSI_DATA_RSP)) {
2175a6d42e7dSPeter Dunlap 				rc = idm_sorecv_scsidata(ic, pdu);
2176a6d42e7dSPeter Dunlap 				/*
2177a6d42e7dSPeter Dunlap 				 * All SCSI errors are fatal to the
2178a6d42e7dSPeter Dunlap 				 * connection right now since we have no
2179a6d42e7dSPeter Dunlap 				 * place to put the data.  What we need
2180a6d42e7dSPeter Dunlap 				 * is some kind of sink to dispose of unwanted
2181a6d42e7dSPeter Dunlap 				 * SCSI data.  For example an invalid task tag
2182a6d42e7dSPeter Dunlap 				 * should not kill the connection (although
2183a6d42e7dSPeter Dunlap 				 * we may want to drop the connection).
2184a6d42e7dSPeter Dunlap 				 */
2185a6d42e7dSPeter Dunlap 			} else {
2186a6d42e7dSPeter Dunlap 				/*
2187a6d42e7dSPeter Dunlap 				 * Not data PDUs so allocate a buffer for the
2188a6d42e7dSPeter Dunlap 				 * data segment and read the remaining data.
2189a6d42e7dSPeter Dunlap 				 */
2190a6d42e7dSPeter Dunlap 				rc = idm_sorecv_nonscsidata(ic, pdu);
2191a6d42e7dSPeter Dunlap 			}
2192a6d42e7dSPeter Dunlap 			if (rc != 0) {
2193a6d42e7dSPeter Dunlap 				/*
2194a6d42e7dSPeter Dunlap 				 * Call idm_pdu_complete so that we call the
2195a6d42e7dSPeter Dunlap 				 * callback and ensure any memory allocated
2196a6d42e7dSPeter Dunlap 				 * in idm_sorecvhdr gets freed up.
2197a6d42e7dSPeter Dunlap 				 */
2198a6d42e7dSPeter Dunlap 				idm_pdu_complete(pdu, IDM_STATUS_FAIL);
2199a6d42e7dSPeter Dunlap 
2200a6d42e7dSPeter Dunlap 				/*
2201a6d42e7dSPeter Dunlap 				 * If ic_rx_thread_running is still set then
2202a6d42e7dSPeter Dunlap 				 * this is some kind of connection problem
2203a6d42e7dSPeter Dunlap 				 * on the socket.  In this case we want to
2204a6d42e7dSPeter Dunlap 				 * generate an event.  Otherwise some other
2205a6d42e7dSPeter Dunlap 				 * thread closed the socket due to another
2206a6d42e7dSPeter Dunlap 				 * issue in which case we don't need to
2207a6d42e7dSPeter Dunlap 				 * generate an event.
2208a6d42e7dSPeter Dunlap 				 */
2209a6d42e7dSPeter Dunlap 				mutex_enter(&ic->ic_mutex);
2210a6d42e7dSPeter Dunlap 				if (so_conn->ic_rx_thread_running) {
2211a6d42e7dSPeter Dunlap 					conn_failure = B_TRUE;
2212a6d42e7dSPeter Dunlap 					so_conn->ic_rx_thread_running = B_FALSE;
2213a6d42e7dSPeter Dunlap 				}
2214a6d42e7dSPeter Dunlap 				continue;
2215a6d42e7dSPeter Dunlap 			}
2216a6d42e7dSPeter Dunlap 		}
2217a6d42e7dSPeter Dunlap 
2218a6d42e7dSPeter Dunlap 		/*
2219a6d42e7dSPeter Dunlap 		 * Process RX PDU
2220a6d42e7dSPeter Dunlap 		 */
2221a6d42e7dSPeter Dunlap 		idm_pdu_rx(ic, pdu);
2222a6d42e7dSPeter Dunlap 
2223a6d42e7dSPeter Dunlap 		mutex_enter(&ic->ic_mutex);
2224a6d42e7dSPeter Dunlap 	}
2225a6d42e7dSPeter Dunlap 
2226a6d42e7dSPeter Dunlap 	mutex_exit(&ic->ic_mutex);
2227a6d42e7dSPeter Dunlap 
2228a6d42e7dSPeter Dunlap 	/*
2229a6d42e7dSPeter Dunlap 	 * If we dropped out of the RX processing loop because of
2230a6d42e7dSPeter Dunlap 	 * a socket problem or other connection failure (including
2231a6d42e7dSPeter Dunlap 	 * digest errors) then we need to generate a state machine
2232a6d42e7dSPeter Dunlap 	 * event to shut the connection down.
2233a6d42e7dSPeter Dunlap 	 * If the state machine is already in, for example, INIT_ERROR, this
2234a6d42e7dSPeter Dunlap 	 * event will get dropped, and the TX thread will never be notified
2235a6d42e7dSPeter Dunlap 	 * to shut down.  To be safe, we'll just notify it here.
2236a6d42e7dSPeter Dunlap 	 */
2237a6d42e7dSPeter Dunlap 	if (conn_failure) {
2238a6d42e7dSPeter Dunlap 		if (so_conn->ic_tx_thread_running) {
2239a6d42e7dSPeter Dunlap 			so_conn->ic_tx_thread_running = B_FALSE;
2240a6d42e7dSPeter Dunlap 			mutex_enter(&so_conn->ic_tx_mutex);
2241a6d42e7dSPeter Dunlap 			cv_signal(&so_conn->ic_tx_cv);
2242a6d42e7dSPeter Dunlap 			mutex_exit(&so_conn->ic_tx_mutex);
2243a6d42e7dSPeter Dunlap 		}
2244a6d42e7dSPeter Dunlap 
2245a6d42e7dSPeter Dunlap 		idm_conn_event(ic, CE_TRANSPORT_FAIL, rc);
2246a6d42e7dSPeter Dunlap 	}
2247a6d42e7dSPeter Dunlap 
2248a6d42e7dSPeter Dunlap 	idm_conn_rele(ic);
2249a6d42e7dSPeter Dunlap 
2250a6d42e7dSPeter Dunlap 	thread_exit();
2251a6d42e7dSPeter Dunlap }
2252a6d42e7dSPeter Dunlap 
2253a6d42e7dSPeter Dunlap /*
2254a6d42e7dSPeter Dunlap  * idm_so_tx
2255a6d42e7dSPeter Dunlap  *
2256a6d42e7dSPeter Dunlap  * This is the implementation of idm_transport_ops_t's it_tx_pdu entry
2257a6d42e7dSPeter Dunlap  * point.  By definition, it is supposed to be fast.  So, simply queue
2258a6d42e7dSPeter Dunlap  * the entry and return.  The real work is done by idm_i_so_tx() via
2259a6d42e7dSPeter Dunlap  * idm_sotx_thread().
2260a6d42e7dSPeter Dunlap  */
2261a6d42e7dSPeter Dunlap 
2262a6d42e7dSPeter Dunlap static void
2263a6d42e7dSPeter Dunlap idm_so_tx(idm_conn_t *ic, idm_pdu_t *pdu)
2264a6d42e7dSPeter Dunlap {
2265a6d42e7dSPeter Dunlap 	idm_so_conn_t *so_conn = ic->ic_transport_private;
2266a6d42e7dSPeter Dunlap 
2267a6d42e7dSPeter Dunlap 	ASSERT(pdu->isp_ic == ic);
2268a6d42e7dSPeter Dunlap 	mutex_enter(&so_conn->ic_tx_mutex);
2269a6d42e7dSPeter Dunlap 
2270a6d42e7dSPeter Dunlap 	if (!so_conn->ic_tx_thread_running) {
2271a6d42e7dSPeter Dunlap 		mutex_exit(&so_conn->ic_tx_mutex);
2272a6d42e7dSPeter Dunlap 		idm_pdu_complete(pdu, IDM_STATUS_ABORTED);
2273a6d42e7dSPeter Dunlap 		return;
2274a6d42e7dSPeter Dunlap 	}
2275a6d42e7dSPeter Dunlap 
2276a6d42e7dSPeter Dunlap 	list_insert_tail(&so_conn->ic_tx_list, (void *)pdu);
2277a6d42e7dSPeter Dunlap 	cv_signal(&so_conn->ic_tx_cv);
2278a6d42e7dSPeter Dunlap 	mutex_exit(&so_conn->ic_tx_mutex);
2279a6d42e7dSPeter Dunlap }
2280a6d42e7dSPeter Dunlap 
2281a6d42e7dSPeter Dunlap static idm_status_t
2282a6d42e7dSPeter Dunlap idm_i_so_tx(idm_pdu_t *pdu)
2283a6d42e7dSPeter Dunlap {
2284a6d42e7dSPeter Dunlap 	idm_conn_t	*ic = pdu->isp_ic;
2285a6d42e7dSPeter Dunlap 	idm_status_t	status = IDM_STATUS_SUCCESS;
2286a6d42e7dSPeter Dunlap 	uint8_t		pad[ISCSI_PAD_WORD_LEN];
2287a6d42e7dSPeter Dunlap 	int		pad_len;
2288a6d42e7dSPeter Dunlap 	uint32_t	hdr_digest_crc;
2289a6d42e7dSPeter Dunlap 	uint32_t	data_digest_crc = 0;
2290a6d42e7dSPeter Dunlap 	int		total_len = 0;
2291a6d42e7dSPeter Dunlap 	int		iovlen = 0;
2292a6d42e7dSPeter Dunlap 	struct iovec	iov[6];
2293a6d42e7dSPeter Dunlap 	idm_so_conn_t	*so_conn;
2294a6d42e7dSPeter Dunlap 
2295a6d42e7dSPeter Dunlap 	so_conn = ic->ic_transport_private;
2296a6d42e7dSPeter Dunlap 
2297a6d42e7dSPeter Dunlap 	/* Setup BHS */
2298a6d42e7dSPeter Dunlap 	iov[iovlen].iov_base	= (caddr_t)pdu->isp_hdr;
2299a6d42e7dSPeter Dunlap 	iov[iovlen].iov_len	= pdu->isp_hdrlen;
2300a6d42e7dSPeter Dunlap 	total_len		+= iov[iovlen].iov_len;
2301a6d42e7dSPeter Dunlap 	iovlen++;
2302a6d42e7dSPeter Dunlap 
2303a6d42e7dSPeter Dunlap 	/* Setup header digest */
2304a6d42e7dSPeter Dunlap 	if (((pdu->isp_flags & IDM_PDU_LOGIN_TX) == 0) &&
2305a6d42e7dSPeter Dunlap 	    (ic->ic_conn_flags & IDM_CONN_HEADER_DIGEST)) {
2306a6d42e7dSPeter Dunlap 		hdr_digest_crc = idm_crc32c(pdu->isp_hdr, pdu->isp_hdrlen);
2307a6d42e7dSPeter Dunlap 
2308a6d42e7dSPeter Dunlap 		iov[iovlen].iov_base	= (caddr_t)&hdr_digest_crc;
2309a6d42e7dSPeter Dunlap 		iov[iovlen].iov_len	= sizeof (hdr_digest_crc);
2310a6d42e7dSPeter Dunlap 		total_len		+= iov[iovlen].iov_len;
2311a6d42e7dSPeter Dunlap 		iovlen++;
2312a6d42e7dSPeter Dunlap 	}
2313a6d42e7dSPeter Dunlap 
2314a6d42e7dSPeter Dunlap 	/* Setup the data */
2315a6d42e7dSPeter Dunlap 	if (pdu->isp_datalen) {
2316a6d42e7dSPeter Dunlap 		idm_task_t		*idt;
2317a6d42e7dSPeter Dunlap 		idm_buf_t		*idb;
2318a6d42e7dSPeter Dunlap 		iscsi_data_hdr_t	*ihp;
2319a6d42e7dSPeter Dunlap 		ihp = (iscsi_data_hdr_t *)pdu->isp_hdr;
2320a6d42e7dSPeter Dunlap 		/* Write of immediate data */
2321a6d42e7dSPeter Dunlap 		if (ic->ic_ffp &&
2322*2727bb05STim Kordas 		    (IDM_PDU_OPCODE(pdu) == ISCSI_OP_SCSI_CMD ||
2323*2727bb05STim Kordas 		    IDM_PDU_OPCODE(pdu) == ISCSI_OP_SCSI_DATA)) {
2324a6d42e7dSPeter Dunlap 			idt = idm_task_find(ic, ihp->itt, ihp->ttt);
2325a6d42e7dSPeter Dunlap 			if (idt) {
2326a6d42e7dSPeter Dunlap 				mutex_enter(&idt->idt_mutex);
2327a6d42e7dSPeter Dunlap 				idb = idm_buf_find(&idt->idt_outbufv, 0);
2328a6d42e7dSPeter Dunlap 				mutex_exit(&idt->idt_mutex);
232930e7468fSPeter Dunlap 				/*
233030e7468fSPeter Dunlap 				 * If the initiator call to idm_buf_alloc
233130e7468fSPeter Dunlap 				 * failed then we can get to this point
233230e7468fSPeter Dunlap 				 * without a bound buffer.  The associated
233330e7468fSPeter Dunlap 				 * connection failure will clean things up
233430e7468fSPeter Dunlap 				 * later.  It would be nice to come up with
233530e7468fSPeter Dunlap 				 * a cleaner way to handle this.  In
233630e7468fSPeter Dunlap 				 * particular it seems absurd to look up
233730e7468fSPeter Dunlap 				 * the task and the buffer just to update
233830e7468fSPeter Dunlap 				 * this counter.
233930e7468fSPeter Dunlap 				 */
234030e7468fSPeter Dunlap 				if (idb)
234130e7468fSPeter Dunlap 					idb->idb_xfer_len += pdu->isp_datalen;
234230e7468fSPeter Dunlap 				idm_task_rele(idt);
2343a6d42e7dSPeter Dunlap 			}
2344a6d42e7dSPeter Dunlap 		}
2345a6d42e7dSPeter Dunlap 
2346a6d42e7dSPeter Dunlap 		iov[iovlen].iov_base = (caddr_t)pdu->isp_data;
2347a6d42e7dSPeter Dunlap 		iov[iovlen].iov_len  = pdu->isp_datalen;
2348a6d42e7dSPeter Dunlap 		total_len += iov[iovlen].iov_len;
2349a6d42e7dSPeter Dunlap 		iovlen++;
2350a6d42e7dSPeter Dunlap 	}
2351a6d42e7dSPeter Dunlap 
2352a6d42e7dSPeter Dunlap 	/* Setup the data pad if necessary */
2353a6d42e7dSPeter Dunlap 	pad_len = ((ISCSI_PAD_WORD_LEN -
2354a6d42e7dSPeter Dunlap 	    (pdu->isp_datalen & (ISCSI_PAD_WORD_LEN - 1))) &
2355a6d42e7dSPeter Dunlap 	    (ISCSI_PAD_WORD_LEN - 1));
2356a6d42e7dSPeter Dunlap 
2357a6d42e7dSPeter Dunlap 	if (pad_len) {
2358a6d42e7dSPeter Dunlap 		bzero(pad, sizeof (pad));
2359a6d42e7dSPeter Dunlap 		iov[iovlen].iov_base = (void *)&pad;
2360a6d42e7dSPeter Dunlap 		iov[iovlen].iov_len  = pad_len;
2361a6d42e7dSPeter Dunlap 		total_len		+= iov[iovlen].iov_len;
2362a6d42e7dSPeter Dunlap 		iovlen++;
2363a6d42e7dSPeter Dunlap 	}
2364a6d42e7dSPeter Dunlap 
2365a6d42e7dSPeter Dunlap 	/*
2366a6d42e7dSPeter Dunlap 	 * Setup the data digest if enabled.  Data-digest is not sent
2367a6d42e7dSPeter Dunlap 	 * for login-phase PDUs.
2368a6d42e7dSPeter Dunlap 	 */
2369a6d42e7dSPeter Dunlap 	if ((ic->ic_conn_flags & IDM_CONN_DATA_DIGEST) &&
2370a6d42e7dSPeter Dunlap 	    ((pdu->isp_flags & IDM_PDU_LOGIN_TX) == 0) &&
2371a6d42e7dSPeter Dunlap 	    (pdu->isp_datalen || pad_len)) {
2372a6d42e7dSPeter Dunlap 		/*
2373a6d42e7dSPeter Dunlap 		 * RFC3720/10.2.3: A zero-length Data Segment also
2374a6d42e7dSPeter Dunlap 		 * implies a zero-length data digest.
2375a6d42e7dSPeter Dunlap 		 */
2376a6d42e7dSPeter Dunlap 		if (pdu->isp_datalen) {
2377a6d42e7dSPeter Dunlap 			data_digest_crc = idm_crc32c(pdu->isp_data,
2378a6d42e7dSPeter Dunlap 			    pdu->isp_datalen);
2379a6d42e7dSPeter Dunlap 		}
2380a6d42e7dSPeter Dunlap 		if (pad_len) {
2381a6d42e7dSPeter Dunlap 			data_digest_crc = idm_crc32c_continued(&pad,
2382a6d42e7dSPeter Dunlap 			    pad_len, data_digest_crc);
2383a6d42e7dSPeter Dunlap 		}
2384a6d42e7dSPeter Dunlap 
2385a6d42e7dSPeter Dunlap 		iov[iovlen].iov_base	= (caddr_t)&data_digest_crc;
2386a6d42e7dSPeter Dunlap 		iov[iovlen].iov_len	= sizeof (data_digest_crc);
2387a6d42e7dSPeter Dunlap 		total_len		+= iov[iovlen].iov_len;
2388a6d42e7dSPeter Dunlap 		iovlen++;
2389a6d42e7dSPeter Dunlap 	}
2390a6d42e7dSPeter Dunlap 
2391a6d42e7dSPeter Dunlap 	/* Transmit the PDU */
2392a6d42e7dSPeter Dunlap 	if (idm_iov_sosend(so_conn->ic_so, &iov[0], iovlen,
2393a6d42e7dSPeter Dunlap 	    total_len) != 0) {
2394a6d42e7dSPeter Dunlap 		/* Set error status */
2395a6d42e7dSPeter Dunlap 		IDM_CONN_LOG(CE_WARN,
2396a6d42e7dSPeter Dunlap 		    "idm_so_tx: failed to transmit the PDU, so: %p ic: %p "
2397a6d42e7dSPeter Dunlap 		    "data: %p", (void *) so_conn->ic_so, (void *) ic,
2398a6d42e7dSPeter Dunlap 		    (void *) pdu->isp_data);
2399a6d42e7dSPeter Dunlap 		status = IDM_STATUS_IO;
2400a6d42e7dSPeter Dunlap 	}
2401a6d42e7dSPeter Dunlap 
2402a6d42e7dSPeter Dunlap 	/*
2403a6d42e7dSPeter Dunlap 	 * Success does not mean that the PDU actually reached the
2404a6d42e7dSPeter Dunlap 	 * remote node since it could get dropped along the way.
2405a6d42e7dSPeter Dunlap 	 */
2406a6d42e7dSPeter Dunlap 	idm_pdu_complete(pdu, status);
2407a6d42e7dSPeter Dunlap 
2408a6d42e7dSPeter Dunlap 	return (status);
2409a6d42e7dSPeter Dunlap }
2410a6d42e7dSPeter Dunlap 
2411a6d42e7dSPeter Dunlap /*
2412a6d42e7dSPeter Dunlap  * The idm_so_buf_tx_to_ini() is used by the target iSCSI layer to transmit the
2413a6d42e7dSPeter Dunlap  * Data-In PDUs using sockets. Based on the negotiated MaxRecvDataSegmentLength,
2414a6d42e7dSPeter Dunlap  * the buffer is segmented into a sequence of Data-In PDUs, ordered by DataSN.
2415a6d42e7dSPeter Dunlap  * A target can invoke this function multiple times for a single read command
2416a6d42e7dSPeter Dunlap  * (identified by the same ITT) to split the input into several sequences.
2417a6d42e7dSPeter Dunlap  *
2418a6d42e7dSPeter Dunlap  * DataSN starts with 0 for the first data PDU of an input command and advances
2419a6d42e7dSPeter Dunlap  * by 1 for each subsequent data PDU. Each sequence will have its own F bit,
2420a6d42e7dSPeter Dunlap  * which is set to 1 for the last data PDU of a sequence.
242160220f10SPriya Krishnan  * If the initiator supports phase collapse, the status bit must be set along
242260220f10SPriya Krishnan  * with the F bit to indicate that the status is shipped together with the last
242360220f10SPriya Krishnan  * Data-In PDU.
2424a6d42e7dSPeter Dunlap  *
2425a6d42e7dSPeter Dunlap  * The data PDUs within a sequence will be sent in order with the buffer offset
2426a6d42e7dSPeter Dunlap  * in increasing order. i.e. initiator and target must have negotiated the
2427a6d42e7dSPeter Dunlap  * "DataPDUInOrder" to "Yes". The order between sequences is not enforced.
2428a6d42e7dSPeter Dunlap  *
2429a6d42e7dSPeter Dunlap  * Caller holds idt->idt_mutex
2430a6d42e7dSPeter Dunlap  */
2431a6d42e7dSPeter Dunlap static idm_status_t
2432a6d42e7dSPeter Dunlap idm_so_buf_tx_to_ini(idm_task_t *idt, idm_buf_t *idb)
2433a6d42e7dSPeter Dunlap {
2434a6d42e7dSPeter Dunlap 	idm_so_conn_t	*so_conn = idb->idb_ic->ic_transport_private;
2435a6d42e7dSPeter Dunlap 	idm_pdu_t	tmppdu;
2436a6d42e7dSPeter Dunlap 
2437a6d42e7dSPeter Dunlap 	ASSERT(mutex_owned(&idt->idt_mutex));
2438a6d42e7dSPeter Dunlap 
2439a6d42e7dSPeter Dunlap 	/*
2440a6d42e7dSPeter Dunlap 	 * Put the idm_buf_t on the tx queue.  It will be transmitted by
2441a6d42e7dSPeter Dunlap 	 * idm_sotx_thread.
2442a6d42e7dSPeter Dunlap 	 */
2443a6d42e7dSPeter Dunlap 	mutex_enter(&so_conn->ic_tx_mutex);
2444a6d42e7dSPeter Dunlap 
2445a668b114SPriya Krishnan 	DTRACE_ISCSI_8(xfer__start, idm_conn_t *, idt->idt_ic,
2446a668b114SPriya Krishnan 	    uintptr_t, idb->idb_buf, uint32_t, idb->idb_bufoffset,
2447a668b114SPriya Krishnan 	    uint64_t, 0, uint32_t, 0, uint32_t, 0,
2448a668b114SPriya Krishnan 	    uint32_t, idb->idb_xfer_len, int, XFER_BUF_TX_TO_INI);
2449a668b114SPriya Krishnan 
2450a6d42e7dSPeter Dunlap 	if (!so_conn->ic_tx_thread_running) {
2451a6d42e7dSPeter Dunlap 		mutex_exit(&so_conn->ic_tx_mutex);
2452a6d42e7dSPeter Dunlap 		/*
2453a6d42e7dSPeter Dunlap 		 * Don't release idt->idt_mutex since we're supposed to hold
2454a6d42e7dSPeter Dunlap 		 * in when calling idm_buf_tx_to_ini_done
2455a6d42e7dSPeter Dunlap 		 */
2456a668b114SPriya Krishnan 		DTRACE_ISCSI_8(xfer__done, idm_conn_t *, idt->idt_ic,
2457a668b114SPriya Krishnan 		    uintptr_t, idb->idb_buf, uint32_t, idb->idb_bufoffset,
2458a668b114SPriya Krishnan 		    uint64_t, 0, uint32_t, 0, uint32_t, 0,
2459a668b114SPriya Krishnan 		    uint32_t, idb->idb_xfer_len,
2460a668b114SPriya Krishnan 		    int, XFER_BUF_TX_TO_INI);
2461a6d42e7dSPeter Dunlap 		idm_buf_tx_to_ini_done(idt, idb, IDM_STATUS_ABORTED);
2462a6d42e7dSPeter Dunlap 		return (IDM_STATUS_FAIL);
2463a6d42e7dSPeter Dunlap 	}
2464a6d42e7dSPeter Dunlap 
2465a6d42e7dSPeter Dunlap 	/*
2466a6d42e7dSPeter Dunlap 	 * Build a template for the data PDU headers we will use so that
2467a6d42e7dSPeter Dunlap 	 * the SN values will stay consistent with other PDU's we are
2468a6d42e7dSPeter Dunlap 	 * transmitting like R2T and SCSI status.
2469a6d42e7dSPeter Dunlap 	 */
2470a6d42e7dSPeter Dunlap 	bzero(&idb->idb_data_hdr_tmpl, sizeof (iscsi_hdr_t));
2471a6d42e7dSPeter Dunlap 	tmppdu.isp_hdr = &idb->idb_data_hdr_tmpl;
2472a6d42e7dSPeter Dunlap 	(*idt->idt_ic->ic_conn_ops.icb_build_hdr)(idt, &tmppdu,
2473a6d42e7dSPeter Dunlap 	    ISCSI_OP_SCSI_DATA_RSP);
2474a6d42e7dSPeter Dunlap 	idb->idb_tx_thread = B_TRUE;
2475a6d42e7dSPeter Dunlap 	list_insert_tail(&so_conn->ic_tx_list, (void *)idb);
2476a6d42e7dSPeter Dunlap 	cv_signal(&so_conn->ic_tx_cv);
2477a6d42e7dSPeter Dunlap 	mutex_exit(&so_conn->ic_tx_mutex);
2478a6d42e7dSPeter Dunlap 	mutex_exit(&idt->idt_mutex);
2479a6d42e7dSPeter Dunlap 
2480a6d42e7dSPeter Dunlap 	/*
2481a6d42e7dSPeter Dunlap 	 * Returning success here indicates the transfer was successfully
2482a6d42e7dSPeter Dunlap 	 * dispatched -- it does not mean that the transfer completed
2483a6d42e7dSPeter Dunlap 	 * successfully.
2484a6d42e7dSPeter Dunlap 	 */
2485a6d42e7dSPeter Dunlap 	return (IDM_STATUS_SUCCESS);
2486a6d42e7dSPeter Dunlap }
2487a6d42e7dSPeter Dunlap 
2488a6d42e7dSPeter Dunlap /*
2489a6d42e7dSPeter Dunlap  * The idm_so_buf_rx_from_ini() is used by the target iSCSI layer to specify the
2490a6d42e7dSPeter Dunlap  * data blocks it is ready to receive from the initiator in response to a WRITE
2491a6d42e7dSPeter Dunlap  * SCSI command. The target iSCSI layer passes the information about the desired
2492a6d42e7dSPeter Dunlap  * data blocks to the initiator in one R2T PDU. The receiving buffer, the buffer
2493a6d42e7dSPeter Dunlap  * offset and datalen are passed via the 'idb' argument.
2494a6d42e7dSPeter Dunlap  *
2495a6d42e7dSPeter Dunlap  * Scope for Prototype build:
2496a6d42e7dSPeter Dunlap  * R2Ts are required for any Data-Out PDU, i.e. initiator and target must have
2497a6d42e7dSPeter Dunlap  * negotiated the "InitialR2T" to "Yes".
2498a6d42e7dSPeter Dunlap  *
2499a6d42e7dSPeter Dunlap  * Caller holds idt->idt_mutex
2500a6d42e7dSPeter Dunlap  */
2501a6d42e7dSPeter Dunlap static idm_status_t
2502a6d42e7dSPeter Dunlap idm_so_buf_rx_from_ini(idm_task_t *idt, idm_buf_t *idb)
2503a6d42e7dSPeter Dunlap {
2504a6d42e7dSPeter Dunlap 	idm_pdu_t		*pdu;
2505a6d42e7dSPeter Dunlap 	iscsi_rtt_hdr_t		*rtt;
2506a6d42e7dSPeter Dunlap 
2507a6d42e7dSPeter Dunlap 	ASSERT(mutex_owned(&idt->idt_mutex));
2508a6d42e7dSPeter Dunlap 
2509a668b114SPriya Krishnan 	DTRACE_ISCSI_8(xfer__start, idm_conn_t *, idt->idt_ic,
2510a668b114SPriya Krishnan 	    uintptr_t, idb->idb_buf, uint32_t, idb->idb_bufoffset,
2511a668b114SPriya Krishnan 	    uint64_t, 0, uint32_t, 0, uint32_t, 0,
2512a668b114SPriya Krishnan 	    uint32_t, idb->idb_xfer_len, int, XFER_BUF_RX_FROM_INI);
2513a668b114SPriya Krishnan 
2514a6d42e7dSPeter Dunlap 	pdu = kmem_cache_alloc(idm.idm_sotx_pdu_cache, KM_SLEEP);
2515a6d42e7dSPeter Dunlap 	pdu->isp_ic = idt->idt_ic;
2516a2383ac5SPriya Krishnan 	pdu->isp_flags = IDM_PDU_SET_STATSN;
2517a6d42e7dSPeter Dunlap 	bzero(pdu->isp_hdr, sizeof (iscsi_rtt_hdr_t));
2518a6d42e7dSPeter Dunlap 
2519a2383ac5SPriya Krishnan 	/* iSCSI layer fills the TTT, ITT, ExpCmdSN, MaxCmdSN */
2520a6d42e7dSPeter Dunlap 	(*idt->idt_ic->ic_conn_ops.icb_build_hdr)(idt, pdu, ISCSI_OP_RTT_RSP);
2521a6d42e7dSPeter Dunlap 
2522a6d42e7dSPeter Dunlap 	/* set the rttsn, rtt.flags, rtt.data_offset and rtt.data_length */
2523a6d42e7dSPeter Dunlap 	rtt = (iscsi_rtt_hdr_t *)(pdu->isp_hdr);
2524a6d42e7dSPeter Dunlap 
2525a6d42e7dSPeter Dunlap 	rtt->opcode		= ISCSI_OP_RTT_RSP;
2526a6d42e7dSPeter Dunlap 	rtt->flags		= ISCSI_FLAG_FINAL;
2527a6d42e7dSPeter Dunlap 	rtt->data_offset	= htonl(idb->idb_bufoffset);
2528a6d42e7dSPeter Dunlap 	rtt->data_length	= htonl(idb->idb_xfer_len);
2529a6d42e7dSPeter Dunlap 	rtt->rttsn		= htonl(idt->idt_exp_rttsn++);
2530a6d42e7dSPeter Dunlap 
2531a6d42e7dSPeter Dunlap 	/* Keep track of buffer offsets */
2532a6d42e7dSPeter Dunlap 	idb->idb_exp_offset	= idb->idb_bufoffset;
2533a6d42e7dSPeter Dunlap 	mutex_exit(&idt->idt_mutex);
2534a6d42e7dSPeter Dunlap 
2535a6d42e7dSPeter Dunlap 	/*
253663528ae4SJames Moore 	 * Transmit the PDU.
2537a6d42e7dSPeter Dunlap 	 */
253863528ae4SJames Moore 	idm_pdu_tx(pdu);
2539a6d42e7dSPeter Dunlap 
2540a6d42e7dSPeter Dunlap 	return (IDM_STATUS_SUCCESS);
2541a6d42e7dSPeter Dunlap }
2542a6d42e7dSPeter Dunlap 
2543a6d42e7dSPeter Dunlap static idm_status_t
2544a6d42e7dSPeter Dunlap idm_so_buf_alloc(idm_buf_t *idb, uint64_t buflen)
2545a6d42e7dSPeter Dunlap {
2546cf8c0ebaSPeter Dunlap 	if ((buflen > IDM_SO_BUF_CACHE_LB) && (buflen <= IDM_SO_BUF_CACHE_UB)) {
2547cf8c0ebaSPeter Dunlap 		idb->idb_buf = kmem_cache_alloc(idm.idm_so_128k_buf_cache,
2548cf8c0ebaSPeter Dunlap 		    KM_NOSLEEP);
2549cf8c0ebaSPeter Dunlap 		idb->idb_buf_private = idm.idm_so_128k_buf_cache;
2550cf8c0ebaSPeter Dunlap 	} else {
2551cf8c0ebaSPeter Dunlap 		idb->idb_buf = kmem_alloc(buflen, KM_NOSLEEP);
2552cf8c0ebaSPeter Dunlap 		idb->idb_buf_private = NULL;
2553cf8c0ebaSPeter Dunlap 	}
2554cf8c0ebaSPeter Dunlap 
2555a6d42e7dSPeter Dunlap 	if (idb->idb_buf == NULL) {
2556a6d42e7dSPeter Dunlap 		IDM_CONN_LOG(CE_NOTE,
2557a6d42e7dSPeter Dunlap 		    "idm_so_buf_alloc: failed buffer allocation");
2558a6d42e7dSPeter Dunlap 		return (IDM_STATUS_FAIL);
2559a6d42e7dSPeter Dunlap 	}
2560cf8c0ebaSPeter Dunlap 
2561a6d42e7dSPeter Dunlap 	return (IDM_STATUS_SUCCESS);
2562a6d42e7dSPeter Dunlap }
2563a6d42e7dSPeter Dunlap 
2564a6d42e7dSPeter Dunlap /* ARGSUSED */
2565a6d42e7dSPeter Dunlap static idm_status_t
2566a6d42e7dSPeter Dunlap idm_so_buf_setup(idm_buf_t *idb)
2567a6d42e7dSPeter Dunlap {
256830e7468fSPeter Dunlap 	/* Ensure bufalloc'd flag is unset */
256930e7468fSPeter Dunlap 	idb->idb_bufalloc = B_FALSE;
257030e7468fSPeter Dunlap 
2571a6d42e7dSPeter Dunlap 	return (IDM_STATUS_SUCCESS);
2572a6d42e7dSPeter Dunlap }
2573a6d42e7dSPeter Dunlap 
2574a6d42e7dSPeter Dunlap /* ARGSUSED */
2575a6d42e7dSPeter Dunlap static void
2576a6d42e7dSPeter Dunlap idm_so_buf_teardown(idm_buf_t *idb)
2577a6d42e7dSPeter Dunlap {
2578a6d42e7dSPeter Dunlap 	/* nothing to do here */
2579a6d42e7dSPeter Dunlap }
2580a6d42e7dSPeter Dunlap 
2581a6d42e7dSPeter Dunlap static void
2582a6d42e7dSPeter Dunlap idm_so_buf_free(idm_buf_t *idb)
2583a6d42e7dSPeter Dunlap {
2584cf8c0ebaSPeter Dunlap 	if (idb->idb_buf_private == NULL) {
2585cf8c0ebaSPeter Dunlap 		kmem_free(idb->idb_buf, idb->idb_buflen);
2586cf8c0ebaSPeter Dunlap 	} else {
2587cf8c0ebaSPeter Dunlap 		kmem_cache_free(idb->idb_buf_private, idb->idb_buf);
2588cf8c0ebaSPeter Dunlap 	}
2589a6d42e7dSPeter Dunlap }
2590a6d42e7dSPeter Dunlap 
259130e7468fSPeter Dunlap static void
259230e7468fSPeter Dunlap idm_so_send_rtt_data(idm_conn_t *ic, idm_task_t *idt, idm_buf_t *idb,
259330e7468fSPeter Dunlap     uint32_t offset, uint32_t length)
259430e7468fSPeter Dunlap {
259530e7468fSPeter Dunlap 	idm_so_conn_t	*so_conn = ic->ic_transport_private;
259630e7468fSPeter Dunlap 	idm_pdu_t	tmppdu;
259730e7468fSPeter Dunlap 	idm_buf_t	*rtt_buf;
259830e7468fSPeter Dunlap 
259930e7468fSPeter Dunlap 	ASSERT(mutex_owned(&idt->idt_mutex));
260030e7468fSPeter Dunlap 
260130e7468fSPeter Dunlap 	/*
260230e7468fSPeter Dunlap 	 * Allocate a buffer to represent the RTT transfer.  We could further
260330e7468fSPeter Dunlap 	 * optimize this by allocating the buffers internally from an rtt
260430e7468fSPeter Dunlap 	 * specific buffer cache since this is socket-specific code but for
260530e7468fSPeter Dunlap 	 * now we will keep it simple.
260630e7468fSPeter Dunlap 	 */
260730e7468fSPeter Dunlap 	rtt_buf = idm_buf_alloc(ic, (uint8_t *)idb->idb_buf + offset, length);
260830e7468fSPeter Dunlap 	if (rtt_buf == NULL) {
260930e7468fSPeter Dunlap 		/*
261030e7468fSPeter Dunlap 		 * If we're in FFP then the failure was likely a resource
261130e7468fSPeter Dunlap 		 * allocation issue and we should close the connection by
261230e7468fSPeter Dunlap 		 * sending a CE_TRANSPORT_FAIL event.
261330e7468fSPeter Dunlap 		 *
261430e7468fSPeter Dunlap 		 * If we're not in FFP then idm_buf_alloc will always
261530e7468fSPeter Dunlap 		 * fail and the state is transitioning to "complete" anyway
261630e7468fSPeter Dunlap 		 * so we won't bother to send an event.
261730e7468fSPeter Dunlap 		 */
261830e7468fSPeter Dunlap 		mutex_enter(&ic->ic_state_mutex);
261930e7468fSPeter Dunlap 		if (ic->ic_ffp)
262030e7468fSPeter Dunlap 			idm_conn_event_locked(ic, CE_TRANSPORT_FAIL,
262130e7468fSPeter Dunlap 			    NULL, CT_NONE);
262230e7468fSPeter Dunlap 		mutex_exit(&ic->ic_state_mutex);
2623c158b55cSJack Meng 		mutex_exit(&idt->idt_mutex);
262430e7468fSPeter Dunlap 		return;
262530e7468fSPeter Dunlap 	}
262630e7468fSPeter Dunlap 
262730e7468fSPeter Dunlap 	rtt_buf->idb_buf_cb = NULL;
262830e7468fSPeter Dunlap 	rtt_buf->idb_cb_arg = NULL;
262930e7468fSPeter Dunlap 	rtt_buf->idb_bufoffset = offset;
263030e7468fSPeter Dunlap 	rtt_buf->idb_xfer_len = length;
263130e7468fSPeter Dunlap 	rtt_buf->idb_ic = idt->idt_ic;
263230e7468fSPeter Dunlap 	rtt_buf->idb_task_binding = idt;
263330e7468fSPeter Dunlap 
2634c158b55cSJack Meng 	/*
2635c158b55cSJack Meng 	 * The new buffer (if any) represents an additional
2636c158b55cSJack Meng 	 * reference on the task
2637c158b55cSJack Meng 	 */
2638c158b55cSJack Meng 	idm_task_hold(idt);
2639c158b55cSJack Meng 	mutex_exit(&idt->idt_mutex);
2640c158b55cSJack Meng 
264130e7468fSPeter Dunlap 	/*
264230e7468fSPeter Dunlap 	 * Put the idm_buf_t on the tx queue.  It will be transmitted by
264330e7468fSPeter Dunlap 	 * idm_sotx_thread.
264430e7468fSPeter Dunlap 	 */
264530e7468fSPeter Dunlap 	mutex_enter(&so_conn->ic_tx_mutex);
264630e7468fSPeter Dunlap 
264730e7468fSPeter Dunlap 	if (!so_conn->ic_tx_thread_running) {
264830e7468fSPeter Dunlap 		idm_buf_free(rtt_buf);
264930e7468fSPeter Dunlap 		mutex_exit(&so_conn->ic_tx_mutex);
2650c158b55cSJack Meng 		idm_task_rele(idt);
265130e7468fSPeter Dunlap 		return;
265230e7468fSPeter Dunlap 	}
265330e7468fSPeter Dunlap 
265430e7468fSPeter Dunlap 	/*
265530e7468fSPeter Dunlap 	 * Build a template for the data PDU headers we will use so that
265630e7468fSPeter Dunlap 	 * the SN values will stay consistent with other PDU's we are
265730e7468fSPeter Dunlap 	 * transmitting like R2T and SCSI status.
265830e7468fSPeter Dunlap 	 */
265930e7468fSPeter Dunlap 	bzero(&rtt_buf->idb_data_hdr_tmpl, sizeof (iscsi_hdr_t));
266030e7468fSPeter Dunlap 	tmppdu.isp_hdr = &rtt_buf->idb_data_hdr_tmpl;
266130e7468fSPeter Dunlap 	(*idt->idt_ic->ic_conn_ops.icb_build_hdr)(idt, &tmppdu,
266230e7468fSPeter Dunlap 	    ISCSI_OP_SCSI_DATA);
266330e7468fSPeter Dunlap 	rtt_buf->idb_tx_thread = B_TRUE;
266430e7468fSPeter Dunlap 	rtt_buf->idb_in_transport = B_TRUE;
266530e7468fSPeter Dunlap 	list_insert_tail(&so_conn->ic_tx_list, (void *)rtt_buf);
266630e7468fSPeter Dunlap 	cv_signal(&so_conn->ic_tx_cv);
266730e7468fSPeter Dunlap 	mutex_exit(&so_conn->ic_tx_mutex);
266830e7468fSPeter Dunlap }
266930e7468fSPeter Dunlap 
267030e7468fSPeter Dunlap static void
267130e7468fSPeter Dunlap idm_so_send_rtt_data_done(idm_task_t *idt, idm_buf_t *idb)
267230e7468fSPeter Dunlap {
267330e7468fSPeter Dunlap 	/*
267430e7468fSPeter Dunlap 	 * Don't worry about status -- we assume any error handling
267530e7468fSPeter Dunlap 	 * is performed by the caller (idm_sotx_thread).
267630e7468fSPeter Dunlap 	 */
267730e7468fSPeter Dunlap 	idb->idb_in_transport = B_FALSE;
267830e7468fSPeter Dunlap 	idm_task_rele(idt);
267930e7468fSPeter Dunlap 	idm_buf_free(idb);
268030e7468fSPeter Dunlap }
268130e7468fSPeter Dunlap 
268230e7468fSPeter Dunlap static idm_status_t
268330e7468fSPeter Dunlap idm_so_send_buf_region(idm_task_t *idt, idm_buf_t *idb,
2684a6d42e7dSPeter Dunlap     uint32_t buf_region_offset, uint32_t buf_region_length)
2685a6d42e7dSPeter Dunlap {
2686a6d42e7dSPeter Dunlap 	idm_conn_t		*ic;
2687a6d42e7dSPeter Dunlap 	uint32_t		max_dataseglen;
2688a6d42e7dSPeter Dunlap 	size_t			remainder, chunk;
2689a6d42e7dSPeter Dunlap 	uint32_t		data_offset = buf_region_offset;
2690a6d42e7dSPeter Dunlap 	iscsi_data_hdr_t	*bhs;
2691a6d42e7dSPeter Dunlap 	idm_pdu_t		*pdu;
269230e7468fSPeter Dunlap 	idm_status_t		tx_status;
2693a6d42e7dSPeter Dunlap 
2694a6d42e7dSPeter Dunlap 	ASSERT(mutex_owned(&idt->idt_mutex));
2695a6d42e7dSPeter Dunlap 
2696a6d42e7dSPeter Dunlap 	ic = idt->idt_ic;
2697a6d42e7dSPeter Dunlap 
269856261083SCharles Ting 	max_dataseglen = ic->ic_conn_params.max_xmit_dataseglen;
2699a6d42e7dSPeter Dunlap 	remainder = buf_region_length;
2700a6d42e7dSPeter Dunlap 
2701a6d42e7dSPeter Dunlap 	while (remainder) {
2702a6d42e7dSPeter Dunlap 		if (idt->idt_state != TASK_ACTIVE) {
2703a6d42e7dSPeter Dunlap 			ASSERT((idt->idt_state != TASK_IDLE) &&
2704a6d42e7dSPeter Dunlap 			    (idt->idt_state != TASK_COMPLETE));
2705a6d42e7dSPeter Dunlap 			return (IDM_STATUS_ABORTED);
2706a6d42e7dSPeter Dunlap 		}
2707a6d42e7dSPeter Dunlap 
2708a6d42e7dSPeter Dunlap 		/* check to see if we need to chunk the data */
2709a6d42e7dSPeter Dunlap 		if (remainder > max_dataseglen) {
2710a6d42e7dSPeter Dunlap 			chunk = max_dataseglen;
2711a6d42e7dSPeter Dunlap 		} else {
2712a6d42e7dSPeter Dunlap 			chunk = remainder;
2713a6d42e7dSPeter Dunlap 		}
2714a6d42e7dSPeter Dunlap 
2715a6d42e7dSPeter Dunlap 		/* Data PDU headers will always be sizeof (iscsi_hdr_t) */
2716a6d42e7dSPeter Dunlap 		pdu = kmem_cache_alloc(idm.idm_sotx_pdu_cache, KM_SLEEP);
2717a6d42e7dSPeter Dunlap 		pdu->isp_ic = ic;
271860220f10SPriya Krishnan 		pdu->isp_flags = 0;	/* initialize isp_flags */
2719a6d42e7dSPeter Dunlap 
2720a6d42e7dSPeter Dunlap 		/*
272130e7468fSPeter Dunlap 		 * We've already built a build a header template
2722a6d42e7dSPeter Dunlap 		 * to use during the transfer.  Use this template so that
2723a6d42e7dSPeter Dunlap 		 * the SN values stay consistent with any unrelated PDU's
2724a6d42e7dSPeter Dunlap 		 * being transmitted.
2725a6d42e7dSPeter Dunlap 		 */
272630e7468fSPeter Dunlap 		bcopy(&idb->idb_data_hdr_tmpl, pdu->isp_hdr,
272730e7468fSPeter Dunlap 		    sizeof (iscsi_hdr_t));
2728a6d42e7dSPeter Dunlap 
2729a6d42e7dSPeter Dunlap 		/*
2730a6d42e7dSPeter Dunlap 		 * Set DataSN, data offset, and flags in BHS
2731a6d42e7dSPeter Dunlap 		 * For the prototype build, A = 0, S = 0, U = 0
2732a6d42e7dSPeter Dunlap 		 */
2733a6d42e7dSPeter Dunlap 		bhs = (iscsi_data_hdr_t *)(pdu->isp_hdr);
2734a6d42e7dSPeter Dunlap 
2735a6d42e7dSPeter Dunlap 		bhs->datasn		= htonl(idt->idt_exp_datasn++);
2736a6d42e7dSPeter Dunlap 
2737a6d42e7dSPeter Dunlap 		hton24(bhs->dlength, chunk);
2738a6d42e7dSPeter Dunlap 		bhs->offset = htonl(idb->idb_bufoffset + data_offset);
2739a6d42e7dSPeter Dunlap 
274060220f10SPriya Krishnan 		/* setup data */
274160220f10SPriya Krishnan 		pdu->isp_data	=  (uint8_t *)idb->idb_buf + data_offset;
274260220f10SPriya Krishnan 		pdu->isp_datalen = (uint_t)chunk;
274360220f10SPriya Krishnan 
2744a6d42e7dSPeter Dunlap 		if (chunk == remainder) {
2745a6d42e7dSPeter Dunlap 			bhs->flags = ISCSI_FLAG_FINAL; /* F bit set to 1 */
274660220f10SPriya Krishnan 			/* Piggyback the status with the last data PDU */
274760220f10SPriya Krishnan 			if (idt->idt_flags & IDM_TASK_PHASECOLLAPSE_REQ) {
274860220f10SPriya Krishnan 				pdu->isp_flags |= IDM_PDU_SET_STATSN |
274960220f10SPriya Krishnan 				    IDM_PDU_ADVANCE_STATSN;
275060220f10SPriya Krishnan 				(*idt->idt_ic->ic_conn_ops.icb_update_statsn)
275160220f10SPriya Krishnan 				    (idt, pdu);
275260220f10SPriya Krishnan 				idt->idt_flags |=
275360220f10SPriya Krishnan 				    IDM_TASK_PHASECOLLAPSE_SUCCESS;
275460220f10SPriya Krishnan 
275560220f10SPriya Krishnan 			}
2756a6d42e7dSPeter Dunlap 		}
2757a6d42e7dSPeter Dunlap 
275860220f10SPriya Krishnan 		remainder	-= chunk;
275960220f10SPriya Krishnan 		data_offset	+= chunk;
276060220f10SPriya Krishnan 
2761a668b114SPriya Krishnan 		/* Instrument the data-send DTrace probe. */
2762a668b114SPriya Krishnan 		if (IDM_PDU_OPCODE(pdu) == ISCSI_OP_SCSI_DATA_RSP) {
2763a668b114SPriya Krishnan 			DTRACE_ISCSI_2(data__send,
2764a668b114SPriya Krishnan 			    idm_conn_t *, idt->idt_ic,
2765a668b114SPriya Krishnan 			    iscsi_data_rsp_hdr_t *,
2766a668b114SPriya Krishnan 			    (iscsi_data_rsp_hdr_t *)pdu->isp_hdr);
2767a668b114SPriya Krishnan 		}
2768a6d42e7dSPeter Dunlap 
2769a6d42e7dSPeter Dunlap 		/*
2770a6d42e7dSPeter Dunlap 		 * Now that we're done working with idt_exp_datasn,
2771a6d42e7dSPeter Dunlap 		 * idt->idt_state and idb->idb_bufoffset we can release
2772a6d42e7dSPeter Dunlap 		 * the task lock -- don't want to hold it across the
2773a6d42e7dSPeter Dunlap 		 * call to idm_i_so_tx since we could block.
2774a6d42e7dSPeter Dunlap 		 */
2775a6d42e7dSPeter Dunlap 		mutex_exit(&idt->idt_mutex);
2776a6d42e7dSPeter Dunlap 
2777a6d42e7dSPeter Dunlap 		/*
2778a6d42e7dSPeter Dunlap 		 * Transmit the PDU.  Call the internal routine directly
2779a6d42e7dSPeter Dunlap 		 * as there is already implicit ordering.
2780a6d42e7dSPeter Dunlap 		 */
278130e7468fSPeter Dunlap 		if ((tx_status = idm_i_so_tx(pdu)) != IDM_STATUS_SUCCESS) {
278230e7468fSPeter Dunlap 			mutex_enter(&idt->idt_mutex);
278330e7468fSPeter Dunlap 			return (tx_status);
278430e7468fSPeter Dunlap 		}
2785a6d42e7dSPeter Dunlap 
2786a6d42e7dSPeter Dunlap 		mutex_enter(&idt->idt_mutex);
278730e7468fSPeter Dunlap 		idt->idt_tx_bytes += chunk;
2788a6d42e7dSPeter Dunlap 	}
2789a6d42e7dSPeter Dunlap 
2790a6d42e7dSPeter Dunlap 	return (IDM_STATUS_SUCCESS);
2791a6d42e7dSPeter Dunlap }
2792a6d42e7dSPeter Dunlap 
2793a6d42e7dSPeter Dunlap /*
2794a6d42e7dSPeter Dunlap  * TX PDU cache
2795a6d42e7dSPeter Dunlap  */
2796a6d42e7dSPeter Dunlap /* ARGSUSED */
2797a6d42e7dSPeter Dunlap int
2798a6d42e7dSPeter Dunlap idm_sotx_pdu_constructor(void *hdl, void *arg, int flags)
2799a6d42e7dSPeter Dunlap {
2800a6d42e7dSPeter Dunlap 	idm_pdu_t	*pdu = hdl;
2801a6d42e7dSPeter Dunlap 
2802a6d42e7dSPeter Dunlap 	bzero(pdu, sizeof (idm_pdu_t));
2803a6d42e7dSPeter Dunlap 	pdu->isp_hdr = (iscsi_hdr_t *)(pdu + 1); /* Ptr arithmetic */
2804a6d42e7dSPeter Dunlap 	pdu->isp_hdrlen = sizeof (iscsi_hdr_t);
2805a6d42e7dSPeter Dunlap 	pdu->isp_callback = idm_sotx_cache_pdu_cb;
2806a6d42e7dSPeter Dunlap 	pdu->isp_magic = IDM_PDU_MAGIC;
2807a6d42e7dSPeter Dunlap 	bzero(pdu->isp_hdr, sizeof (iscsi_hdr_t));
2808a6d42e7dSPeter Dunlap 
2809a6d42e7dSPeter Dunlap 	return (0);
2810a6d42e7dSPeter Dunlap }
2811a6d42e7dSPeter Dunlap 
2812a6d42e7dSPeter Dunlap /* ARGSUSED */
2813a6d42e7dSPeter Dunlap void
2814a6d42e7dSPeter Dunlap idm_sotx_cache_pdu_cb(idm_pdu_t *pdu, idm_status_t status)
2815a6d42e7dSPeter Dunlap {
2816a6d42e7dSPeter Dunlap 	/* reset values between use */
2817a6d42e7dSPeter Dunlap 	pdu->isp_datalen = 0;
2818a6d42e7dSPeter Dunlap 
2819a6d42e7dSPeter Dunlap 	kmem_cache_free(idm.idm_sotx_pdu_cache, pdu);
2820a6d42e7dSPeter Dunlap }
2821a6d42e7dSPeter Dunlap 
2822a6d42e7dSPeter Dunlap /*
2823a6d42e7dSPeter Dunlap  * RX PDU cache
2824a6d42e7dSPeter Dunlap  */
2825a6d42e7dSPeter Dunlap /* ARGSUSED */
2826a6d42e7dSPeter Dunlap int
2827a6d42e7dSPeter Dunlap idm_sorx_pdu_constructor(void *hdl, void *arg, int flags)
2828a6d42e7dSPeter Dunlap {
2829a6d42e7dSPeter Dunlap 	idm_pdu_t	*pdu = hdl;
2830a6d42e7dSPeter Dunlap 
2831a6d42e7dSPeter Dunlap 	bzero(pdu, sizeof (idm_pdu_t));
2832a6d42e7dSPeter Dunlap 	pdu->isp_magic = IDM_PDU_MAGIC;
2833a6d42e7dSPeter Dunlap 	pdu->isp_hdr = (iscsi_hdr_t *)(pdu + 1); /* Ptr arithmetic */
2834a6d42e7dSPeter Dunlap 	pdu->isp_callback = idm_sorx_cache_pdu_cb;
2835a6d42e7dSPeter Dunlap 
2836a6d42e7dSPeter Dunlap 	return (0);
2837a6d42e7dSPeter Dunlap }
2838a6d42e7dSPeter Dunlap 
2839a6d42e7dSPeter Dunlap /* ARGSUSED */
2840a6d42e7dSPeter Dunlap static void
2841a6d42e7dSPeter Dunlap idm_sorx_cache_pdu_cb(idm_pdu_t *pdu, idm_status_t status)
2842a6d42e7dSPeter Dunlap {
2843a6d42e7dSPeter Dunlap 	pdu->isp_iovlen = 0;
2844a6d42e7dSPeter Dunlap 	pdu->isp_sorx_buf = 0;
2845a6d42e7dSPeter Dunlap 	kmem_cache_free(idm.idm_sorx_pdu_cache, pdu);
2846a6d42e7dSPeter Dunlap }
2847a6d42e7dSPeter Dunlap 
2848a6d42e7dSPeter Dunlap static void
2849a6d42e7dSPeter Dunlap idm_sorx_addl_pdu_cb(idm_pdu_t *pdu, idm_status_t status)
2850a6d42e7dSPeter Dunlap {
2851a6d42e7dSPeter Dunlap 	/*
2852a6d42e7dSPeter Dunlap 	 * We had to modify our cached RX PDU with a longer header buffer
2853a6d42e7dSPeter Dunlap 	 * and/or a longer data buffer.  Release the new buffers and fix
2854a6d42e7dSPeter Dunlap 	 * the fields back to what we would expect for a cached RX PDU.
2855a6d42e7dSPeter Dunlap 	 */
2856a6d42e7dSPeter Dunlap 	if (pdu->isp_flags & IDM_PDU_ADDL_HDR) {
2857a6d42e7dSPeter Dunlap 		kmem_free(pdu->isp_hdr, pdu->isp_hdrlen);
2858a6d42e7dSPeter Dunlap 	}
2859a6d42e7dSPeter Dunlap 	if (pdu->isp_flags & IDM_PDU_ADDL_DATA) {
2860a6d42e7dSPeter Dunlap 		kmem_free(pdu->isp_data, pdu->isp_datalen);
2861a6d42e7dSPeter Dunlap 	}
2862a6d42e7dSPeter Dunlap 	pdu->isp_hdr = (iscsi_hdr_t *)(pdu + 1);
2863a6d42e7dSPeter Dunlap 	pdu->isp_hdrlen = sizeof (iscsi_hdr_t);
2864a6d42e7dSPeter Dunlap 	pdu->isp_data = NULL;
2865a6d42e7dSPeter Dunlap 	pdu->isp_datalen = 0;
2866a6d42e7dSPeter Dunlap 	pdu->isp_sorx_buf = 0;
2867a6d42e7dSPeter Dunlap 	pdu->isp_callback = idm_sorx_cache_pdu_cb;
2868a6d42e7dSPeter Dunlap 	idm_sorx_cache_pdu_cb(pdu, status);
2869a6d42e7dSPeter Dunlap }
2870a6d42e7dSPeter Dunlap 
2871a6d42e7dSPeter Dunlap /*
2872a6d42e7dSPeter Dunlap  * This thread is only active when I/O is queued for transmit
2873a6d42e7dSPeter Dunlap  * because the socket is busy.
2874a6d42e7dSPeter Dunlap  */
2875a6d42e7dSPeter Dunlap void
2876a6d42e7dSPeter Dunlap idm_sotx_thread(void *arg)
2877a6d42e7dSPeter Dunlap {
2878a6d42e7dSPeter Dunlap 	idm_conn_t	*ic = arg;
2879a6d42e7dSPeter Dunlap 	idm_tx_obj_t	*object, *next;
2880a6d42e7dSPeter Dunlap 	idm_so_conn_t	*so_conn;
2881a6d42e7dSPeter Dunlap 	idm_status_t	status = IDM_STATUS_SUCCESS;
2882a6d42e7dSPeter Dunlap 
2883a6d42e7dSPeter Dunlap 	idm_conn_hold(ic);
2884a6d42e7dSPeter Dunlap 
2885a6d42e7dSPeter Dunlap 	mutex_enter(&ic->ic_mutex);
2886a6d42e7dSPeter Dunlap 	so_conn = ic->ic_transport_private;
2887a6d42e7dSPeter Dunlap 	so_conn->ic_tx_thread_running = B_TRUE;
2888a6d42e7dSPeter Dunlap 	so_conn->ic_tx_thread_did = so_conn->ic_tx_thread->t_did;
2889a6d42e7dSPeter Dunlap 	cv_signal(&ic->ic_cv);
2890a6d42e7dSPeter Dunlap 	mutex_exit(&ic->ic_mutex);
2891a6d42e7dSPeter Dunlap 
2892a6d42e7dSPeter Dunlap 	mutex_enter(&so_conn->ic_tx_mutex);
2893a6d42e7dSPeter Dunlap 
2894a6d42e7dSPeter Dunlap 	while (so_conn->ic_tx_thread_running) {
2895a6d42e7dSPeter Dunlap 		while (list_is_empty(&so_conn->ic_tx_list)) {
2896a6d42e7dSPeter Dunlap 			DTRACE_PROBE1(soconn__tx__sleep, idm_conn_t *, ic);
2897a6d42e7dSPeter Dunlap 			cv_wait(&so_conn->ic_tx_cv, &so_conn->ic_tx_mutex);
2898a6d42e7dSPeter Dunlap 			DTRACE_PROBE1(soconn__tx__wakeup, idm_conn_t *, ic);
2899a6d42e7dSPeter Dunlap 
2900a6d42e7dSPeter Dunlap 			if (!so_conn->ic_tx_thread_running) {
2901a6d42e7dSPeter Dunlap 				goto tx_bail;
2902a6d42e7dSPeter Dunlap 			}
2903a6d42e7dSPeter Dunlap 		}
2904a6d42e7dSPeter Dunlap 
2905a6d42e7dSPeter Dunlap 		object = (idm_tx_obj_t *)list_head(&so_conn->ic_tx_list);
2906a6d42e7dSPeter Dunlap 		list_remove(&so_conn->ic_tx_list, object);
2907a6d42e7dSPeter Dunlap 		mutex_exit(&so_conn->ic_tx_mutex);
2908a6d42e7dSPeter Dunlap 
2909a6d42e7dSPeter Dunlap 		switch (object->idm_tx_obj_magic) {
291060220f10SPriya Krishnan 		case IDM_PDU_MAGIC: {
291160220f10SPriya Krishnan 			idm_pdu_t *pdu = (idm_pdu_t *)object;
2912a6d42e7dSPeter Dunlap 			DTRACE_PROBE2(soconn__tx__pdu, idm_conn_t *, ic,
2913a6d42e7dSPeter Dunlap 			    idm_pdu_t *, (idm_pdu_t *)object);
2914a6d42e7dSPeter Dunlap 
291560220f10SPriya Krishnan 			if (pdu->isp_flags & IDM_PDU_SET_STATSN) {
291660220f10SPriya Krishnan 				/* No IDM task */
291760220f10SPriya Krishnan 				(ic->ic_conn_ops.icb_update_statsn)(NULL, pdu);
291860220f10SPriya Krishnan 			}
2919a6d42e7dSPeter Dunlap 			status = idm_i_so_tx((idm_pdu_t *)object);
2920a6d42e7dSPeter Dunlap 			break;
292160220f10SPriya Krishnan 		}
2922a6d42e7dSPeter Dunlap 		case IDM_BUF_MAGIC: {
2923a6d42e7dSPeter Dunlap 			idm_buf_t *idb = (idm_buf_t *)object;
2924a6d42e7dSPeter Dunlap 			idm_task_t *idt = idb->idb_task_binding;
2925a6d42e7dSPeter Dunlap 
2926a6d42e7dSPeter Dunlap 			DTRACE_PROBE2(soconn__tx__buf, idm_conn_t *, ic,
2927a6d42e7dSPeter Dunlap 			    idm_buf_t *, idb);
2928a6d42e7dSPeter Dunlap 
2929a6d42e7dSPeter Dunlap 			mutex_enter(&idt->idt_mutex);
2930a6d42e7dSPeter Dunlap 			status = idm_so_send_buf_region(idt,
293130e7468fSPeter Dunlap 			    idb, 0, idb->idb_xfer_len);
2932a6d42e7dSPeter Dunlap 
2933a6d42e7dSPeter Dunlap 			/*
2934a6d42e7dSPeter Dunlap 			 * TX thread owns the buffer so we expect it to
2935a6d42e7dSPeter Dunlap 			 * be "in transport"
2936a6d42e7dSPeter Dunlap 			 */
2937a6d42e7dSPeter Dunlap 			ASSERT(idb->idb_in_transport);
293830e7468fSPeter Dunlap 			if (IDM_CONN_ISTGT(ic)) {
293930e7468fSPeter Dunlap 				/*
294030e7468fSPeter Dunlap 				 * idm_buf_tx_to_ini_done releases
294130e7468fSPeter Dunlap 				 * idt->idt_mutex
294230e7468fSPeter Dunlap 				 */
2943a668b114SPriya Krishnan 				DTRACE_ISCSI_8(xfer__done,
2944a668b114SPriya Krishnan 				    idm_conn_t *, idt->idt_ic,
2945a668b114SPriya Krishnan 				    uintptr_t, idb->idb_buf,
2946a668b114SPriya Krishnan 				    uint32_t, idb->idb_bufoffset,
2947a668b114SPriya Krishnan 				    uint64_t, 0, uint32_t, 0, uint32_t, 0,
2948a668b114SPriya Krishnan 				    uint32_t, idb->idb_xfer_len,
2949a668b114SPriya Krishnan 				    int, XFER_BUF_TX_TO_INI);
295030e7468fSPeter Dunlap 				idm_buf_tx_to_ini_done(idt, idb, status);
295130e7468fSPeter Dunlap 			} else {
295230e7468fSPeter Dunlap 				idm_so_send_rtt_data_done(idt, idb);
295330e7468fSPeter Dunlap 				mutex_exit(&idt->idt_mutex);
295430e7468fSPeter Dunlap 			}
2955a6d42e7dSPeter Dunlap 			break;
2956a6d42e7dSPeter Dunlap 		}
2957a6d42e7dSPeter Dunlap 
2958a6d42e7dSPeter Dunlap 		default:
2959a6d42e7dSPeter Dunlap 			IDM_CONN_LOG(CE_WARN, "idm_sotx_thread: Unknown magic "
2960a6d42e7dSPeter Dunlap 			    "(0x%08x)", object->idm_tx_obj_magic);
2961a6d42e7dSPeter Dunlap 			status = IDM_STATUS_FAIL;
2962a6d42e7dSPeter Dunlap 		}
2963a6d42e7dSPeter Dunlap 
2964a6d42e7dSPeter Dunlap 		mutex_enter(&so_conn->ic_tx_mutex);
2965a6d42e7dSPeter Dunlap 
2966a6d42e7dSPeter Dunlap 		if (status != IDM_STATUS_SUCCESS) {
2967a6d42e7dSPeter Dunlap 			so_conn->ic_tx_thread_running = B_FALSE;
2968a6d42e7dSPeter Dunlap 			idm_conn_event(ic, CE_TRANSPORT_FAIL, status);
2969a6d42e7dSPeter Dunlap 		}
2970a6d42e7dSPeter Dunlap 	}
2971a6d42e7dSPeter Dunlap 
2972a6d42e7dSPeter Dunlap 	/*
2973a6d42e7dSPeter Dunlap 	 * Before we leave, we need to abort every item remaining in the
2974a6d42e7dSPeter Dunlap 	 * TX list.
2975a6d42e7dSPeter Dunlap 	 */
2976a6d42e7dSPeter Dunlap 
2977a6d42e7dSPeter Dunlap tx_bail:
2978a6d42e7dSPeter Dunlap 	object = (idm_tx_obj_t *)list_head(&so_conn->ic_tx_list);
2979a6d42e7dSPeter Dunlap 
2980a6d42e7dSPeter Dunlap 	while (object != NULL) {
2981a6d42e7dSPeter Dunlap 		next = list_next(&so_conn->ic_tx_list, object);
2982a6d42e7dSPeter Dunlap 
2983a6d42e7dSPeter Dunlap 		list_remove(&so_conn->ic_tx_list, object);
2984a6d42e7dSPeter Dunlap 		switch (object->idm_tx_obj_magic) {
2985a6d42e7dSPeter Dunlap 		case IDM_PDU_MAGIC:
2986a6d42e7dSPeter Dunlap 			idm_pdu_complete((idm_pdu_t *)object,
2987a6d42e7dSPeter Dunlap 			    IDM_STATUS_ABORTED);
2988a6d42e7dSPeter Dunlap 			break;
2989a6d42e7dSPeter Dunlap 
2990a6d42e7dSPeter Dunlap 		case IDM_BUF_MAGIC: {
2991a6d42e7dSPeter Dunlap 			idm_buf_t *idb = (idm_buf_t *)object;
2992a6d42e7dSPeter Dunlap 			idm_task_t *idt = idb->idb_task_binding;
2993a6d42e7dSPeter Dunlap 			mutex_exit(&so_conn->ic_tx_mutex);
2994a6d42e7dSPeter Dunlap 			mutex_enter(&idt->idt_mutex);
2995a6d42e7dSPeter Dunlap 			/*
2996a6d42e7dSPeter Dunlap 			 * TX thread owns the buffer so we expect it to
2997a6d42e7dSPeter Dunlap 			 * be "in transport"
2998a6d42e7dSPeter Dunlap 			 */
2999a6d42e7dSPeter Dunlap 			ASSERT(idb->idb_in_transport);
300030e7468fSPeter Dunlap 			if (IDM_CONN_ISTGT(ic)) {
300130e7468fSPeter Dunlap 				/*
300230e7468fSPeter Dunlap 				 * idm_buf_tx_to_ini_done releases
300330e7468fSPeter Dunlap 				 * idt->idt_mutex
300430e7468fSPeter Dunlap 				 */
3005a668b114SPriya Krishnan 				DTRACE_ISCSI_8(xfer__done,
3006a668b114SPriya Krishnan 				    idm_conn_t *, idt->idt_ic,
3007a668b114SPriya Krishnan 				    uintptr_t, idb->idb_buf,
3008a668b114SPriya Krishnan 				    uint32_t, idb->idb_bufoffset,
3009a668b114SPriya Krishnan 				    uint64_t, 0, uint32_t, 0, uint32_t, 0,
3010a668b114SPriya Krishnan 				    uint32_t, idb->idb_xfer_len,
3011a668b114SPriya Krishnan 				    int, XFER_BUF_TX_TO_INI);
301230e7468fSPeter Dunlap 				idm_buf_tx_to_ini_done(idt, idb,
301330e7468fSPeter Dunlap 				    IDM_STATUS_ABORTED);
301430e7468fSPeter Dunlap 			} else {
301530e7468fSPeter Dunlap 				idm_so_send_rtt_data_done(idt, idb);
301630e7468fSPeter Dunlap 				mutex_exit(&idt->idt_mutex);
301730e7468fSPeter Dunlap 			}
3018a6d42e7dSPeter Dunlap 			mutex_enter(&so_conn->ic_tx_mutex);
3019a6d42e7dSPeter Dunlap 			break;
3020a6d42e7dSPeter Dunlap 		}
3021a6d42e7dSPeter Dunlap 		default:
3022a6d42e7dSPeter Dunlap 			IDM_CONN_LOG(CE_WARN,
3023a6d42e7dSPeter Dunlap 			    "idm_sotx_thread: Unexpected magic "
3024a6d42e7dSPeter Dunlap 			    "(0x%08x)", object->idm_tx_obj_magic);
3025a6d42e7dSPeter Dunlap 		}
3026a6d42e7dSPeter Dunlap 
3027a6d42e7dSPeter Dunlap 		object = next;
3028a6d42e7dSPeter Dunlap 	}
3029a6d42e7dSPeter Dunlap 
3030a6d42e7dSPeter Dunlap 	mutex_exit(&so_conn->ic_tx_mutex);
3031a6d42e7dSPeter Dunlap 	idm_conn_rele(ic);
3032a6d42e7dSPeter Dunlap 	thread_exit();
3033a6d42e7dSPeter Dunlap 	/*NOTREACHED*/
3034a6d42e7dSPeter Dunlap }
3035aff4bce5Syi zhang - Sun Microsystems - Beijing China 
3036aff4bce5Syi zhang - Sun Microsystems - Beijing China static void
3037aff4bce5Syi zhang - Sun Microsystems - Beijing China idm_so_socket_set_nonblock(struct sonode *node)
3038aff4bce5Syi zhang - Sun Microsystems - Beijing China {
3039aff4bce5Syi zhang - Sun Microsystems - Beijing China 	(void) VOP_SETFL(node->so_vnode, node->so_flag,
3040aff4bce5Syi zhang - Sun Microsystems - Beijing China 	    (node->so_state | FNONBLOCK), CRED(), NULL);
3041aff4bce5Syi zhang - Sun Microsystems - Beijing China }
3042aff4bce5Syi zhang - Sun Microsystems - Beijing China 
3043aff4bce5Syi zhang - Sun Microsystems - Beijing China static void
3044aff4bce5Syi zhang - Sun Microsystems - Beijing China idm_so_socket_set_block(struct sonode *node)
3045aff4bce5Syi zhang - Sun Microsystems - Beijing China {
3046aff4bce5Syi zhang - Sun Microsystems - Beijing China 	(void) VOP_SETFL(node->so_vnode, node->so_flag,
3047aff4bce5Syi zhang - Sun Microsystems - Beijing China 	    (node->so_state & (~FNONBLOCK)), CRED(), NULL);
3048aff4bce5Syi zhang - Sun Microsystems - Beijing China }
3049bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 
3050bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 
3051bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States /*
3052bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States  * Called by kernel sockets when the connection has been accepted or
3053bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States  * rejected. In early volo, a "disconnect" callback was sent instead of
3054bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States  * "connectfailed", so we check for both.
3055bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States  */
3056bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States /* ARGSUSED */
3057bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States void
3058bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States idm_so_timed_socket_connect_cb(ksocket_t ks,
3059bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States     ksocket_callback_event_t ev, void *arg, uintptr_t info)
3060bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States {
3061bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 	idm_so_timed_socket_t	*itp = arg;
3062bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 	ASSERT(itp != NULL);
3063bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 	ASSERT(ev == KSOCKET_EV_CONNECTED ||
3064bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 	    ev == KSOCKET_EV_CONNECTFAILED ||
3065bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 	    ev == KSOCKET_EV_DISCONNECTED);
3066bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 
3067bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 	mutex_enter(&idm_so_timed_socket_mutex);
3068bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 	itp->it_callback_called = B_TRUE;
3069bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 	if (ev == KSOCKET_EV_CONNECTED) {
3070bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 		itp->it_socket_error_code = 0;
3071bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 	} else {
3072bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 		/* Make sure the error code is non-zero on error */
3073bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 		if (info == 0)
3074bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 			info = ECONNRESET;
3075bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 		itp->it_socket_error_code = (int)info;
3076bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 	}
3077bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 	cv_signal(&itp->it_cv);
3078bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 	mutex_exit(&idm_so_timed_socket_mutex);
3079bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States }
3080bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 
3081bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States int
3082bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States idm_so_timed_socket_connect(ksocket_t ks,
3083bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States     struct sockaddr_storage *sa, int sa_sz, int login_max_usec)
3084bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States {
3085bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 	clock_t			conn_login_max;
3086bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 	int			rc, nonblocking, rval;
3087bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 	idm_so_timed_socket_t	it;
3088bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 	ksocket_callbacks_t	ks_cb;
3089bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 
3090bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 	conn_login_max = ddi_get_lbolt() + drv_usectohz(login_max_usec);
3091bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 
3092bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 	/*
3093bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 	 * Set to non-block socket mode, with callback on connect
3094bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 	 * Early volo used "disconnected" instead of "connectfailed",
3095bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 	 * so set callback to look for both.
3096bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 	 */
3097bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 	bzero(&it, sizeof (it));
3098bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 	ks_cb.ksock_cb_flags = KSOCKET_CB_CONNECTED |
3099bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 	    KSOCKET_CB_CONNECTFAILED | KSOCKET_CB_DISCONNECTED;
3100bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 	ks_cb.ksock_cb_connected = idm_so_timed_socket_connect_cb;
3101bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 	ks_cb.ksock_cb_connectfailed = idm_so_timed_socket_connect_cb;
3102bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 	ks_cb.ksock_cb_disconnected = idm_so_timed_socket_connect_cb;
3103bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 	cv_init(&it.it_cv, NULL, CV_DEFAULT, NULL);
3104bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 	rc = ksocket_setcallbacks(ks, &ks_cb, &it, CRED());
3105bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 	if (rc != 0)
3106bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 		return (rc);
3107bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 
3108bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 	/* Set to non-blocking mode */
3109bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 	nonblocking = 1;
3110bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 	rc = ksocket_ioctl(ks, FIONBIO, (intptr_t)&nonblocking, &rval,
3111bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 	    CRED());
3112bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 	if (rc != 0)
3113bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 		goto cleanup;
3114bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 
3115bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 	bzero(&it, sizeof (it));
3116bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 	for (;;) {
3117bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 		/*
3118bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 		 * Warning -- in a loopback scenario, the call to
3119bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 		 * the connect_cb can occur inside the call to
3120bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 		 * ksocket_connect. Do not hold the mutex around the
3121bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 		 * call to ksocket_connect.
3122bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 		 */
3123bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 		rc = ksocket_connect(ks, (struct sockaddr *)sa, sa_sz, CRED());
3124bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 		if (rc == 0 || rc == EISCONN) {
3125bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 			/* socket success or already success */
3126bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 			rc = 0;
3127bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 			break;
3128bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 		}
3129bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 		if ((rc != EINPROGRESS) && (rc != EALREADY)) {
3130bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 			break;
3131bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 		}
3132bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 
3133bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 		/* TCP connect still in progress. See if out of time. */
3134bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 		if (ddi_get_lbolt() > conn_login_max) {
3135bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 			/*
3136bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 			 * Connection retry timeout,
3137bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 			 * failed connect to target.
3138bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 			 */
3139bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 			rc = ETIMEDOUT;
3140bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 			break;
3141bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 		}
3142bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 
3143bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 		/*
3144bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 		 * TCP connect still in progress.  Sleep until callback.
3145bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 		 * Do NOT go to sleep if the callback already occurred!
3146bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 		 */
3147bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 		mutex_enter(&idm_so_timed_socket_mutex);
3148bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 		if (!it.it_callback_called) {
3149bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 			(void) cv_timedwait(&it.it_cv,
3150bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 			    &idm_so_timed_socket_mutex, conn_login_max);
3151bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 		}
3152bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 		if (it.it_callback_called) {
3153bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 			rc = it.it_socket_error_code;
3154bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 			mutex_exit(&idm_so_timed_socket_mutex);
3155bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 			break;
3156bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 		}
3157bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 		/* If timer expires, go call ksocket_connect one last time. */
3158bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 		mutex_exit(&idm_so_timed_socket_mutex);
3159bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 	}
3160bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 
3161bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 	/* resume blocking mode */
3162bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 	nonblocking = 0;
3163aedf2b3bSsrivijitha dugganapalli 	(void) ksocket_ioctl(ks, FIONBIO, (intptr_t)&nonblocking, &rval,
3164bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 	    CRED());
3165bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States cleanup:
3166aedf2b3bSsrivijitha dugganapalli 	(void) ksocket_setcallbacks(ks, NULL, NULL, CRED());
3167bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 	cv_destroy(&it.it_cv);
3168bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 	if (rc != 0) {
3169bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 		idm_soshutdown(ks);
3170bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 	}
3171bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 	return (rc);
3172bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States }
3173bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 
3174bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 
3175bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States void
3176bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States idm_addr_to_sa(idm_addr_t *dportal, struct sockaddr_storage *sa)
3177bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States {
3178bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 	int			dp_addr_size;
3179bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 	struct sockaddr_in	*sin;
3180bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 	struct sockaddr_in6	*sin6;
3181bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 
3182bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 	/* Build sockaddr_storage for this portal (idm_addr_t) */
3183bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 	bzero(sa, sizeof (*sa));
3184bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 	dp_addr_size = dportal->a_addr.i_insize;
3185bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 	if (dp_addr_size == sizeof (struct in_addr)) {
3186bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 		/* IPv4 */
3187bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 		sa->ss_family = AF_INET;
3188bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 		sin = (struct sockaddr_in *)sa;
3189bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 		sin->sin_port = htons(dportal->a_port);
3190bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 		bcopy(&dportal->a_addr.i_addr.in4,
3191bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 		    &sin->sin_addr, sizeof (struct in_addr));
3192bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 	} else if (dp_addr_size == sizeof (struct in6_addr)) {
3193bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 		/* IPv6 */
3194bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 		sa->ss_family = AF_INET6;
3195bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 		sin6 = (struct sockaddr_in6 *)sa;
3196bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 		sin6->sin6_port = htons(dportal->a_port);
3197bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 		bcopy(&dportal->a_addr.i_addr.in6,
3198bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 		    &sin6->sin6_addr, sizeof (struct in6_addr));
3199bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 	} else {
3200bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 		ASSERT(0);
3201bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 	}
3202bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States }
3203bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 
3204bdbe8dc6SPeter Cudhea - Sun Microsystems - Burlington, MA United States 
/*
 * Return a human-readable form of a sockaddr_storage, in the form
 * [ip-address].port (for example "[127.0.0.1].3260").  This is used in
 * calls to logging functions.  If several calls to idm_sa_ntop are made
 * within the same invocation of a logging function, then each one needs
 * its own buf.
 *
 * sa	address to format; only AF_INET and AF_INET6 are understood
 * buf	caller-supplied output buffer
 * size	size of buf in bytes
 *
 * Always returns buf.  If the address family is not recognized, the address
 * cannot be converted, or buf is too small for the address plus the longest
 * possible port, buf is set to the placeholder "[0].-1" instead.
 */
const char *
idm_sa_ntop(const struct sockaddr_storage *sa,
    char *buf, size_t size)
{
	static const char bogus_ip[] = "[0].-1";
	char tmp[INET6_ADDRSTRLEN];
	const void *addr = NULL;
	uint16_t port = 0;

	/* Locate the address and port for this family. */
	switch (sa->ss_family) {
	case AF_INET6: {
		const struct sockaddr_in6 *in6 =
		    (const struct sockaddr_in6 *)sa;

		addr = &in6->sin6_addr;
		port = in6->sin6_port;
		break;
	}
	case AF_INET: {
		const struct sockaddr_in *in = (const struct sockaddr_in *)sa;

		addr = &in->sin_addr;
		port = in->sin_port;
		break;
	}
	default:
		goto err;
	}

	/* Never run strlen() over tmp unless the conversion filled it in. */
	if (inet_ntop(sa->ss_family, addr, tmp, sizeof (tmp)) == NULL)
		goto err;

	/*
	 * Require room for the brackets, the dot, a five-digit port and the
	 * terminating NUL (sizeof of the literal counts the NUL).
	 */
	if (strlen(tmp) + sizeof ("[].65535") > size)
		goto err;

	(void) snprintf(buf, size, "[%s].%u", tmp,
	    (unsigned int)ntohs(port));
	return (buf);

err:
	(void) snprintf(buf, size, "%s", bogus_ip);
	return (buf);
}
3250