1c0dd49bdSEiji Ota /*
216e76cddSagiri  * Copyright (c) 2010, Oracle and/or its affiliates. All rights reserved.
3c0dd49bdSEiji Ota  */
416e76cddSagiri 
5c0dd49bdSEiji Ota /*
616e76cddSagiri  * This file contains code imported from the OFED rds source file loop.c
716e76cddSagiri  * Oracle elects to have and use the contents of loop.c under and governed
816e76cddSagiri  * by the OpenIB.org BSD license (see below for full license text). However,
916e76cddSagiri  * the following notice accompanied the original version of this file:
10c0dd49bdSEiji Ota  */
11c0dd49bdSEiji Ota 
12c0dd49bdSEiji Ota /*
13c0dd49bdSEiji Ota  * Copyright (c) 2006 Oracle.  All rights reserved.
14c0dd49bdSEiji Ota  *
15c0dd49bdSEiji Ota  * This software is available to you under a choice of one of two
16c0dd49bdSEiji Ota  * licenses.  You may choose to be licensed under the terms of the GNU
17c0dd49bdSEiji Ota  * General Public License (GPL) Version 2, available from the file
18c0dd49bdSEiji Ota  * COPYING in the main directory of this source tree, or the
19c0dd49bdSEiji Ota  * OpenIB.org BSD license below:
20c0dd49bdSEiji Ota  *
21c0dd49bdSEiji Ota  *     Redistribution and use in source and binary forms, with or
22c0dd49bdSEiji Ota  *     without modification, are permitted provided that the following
23c0dd49bdSEiji Ota  *     conditions are met:
24c0dd49bdSEiji Ota  *
25c0dd49bdSEiji Ota  *      - Redistributions of source code must retain the above
26c0dd49bdSEiji Ota  *        copyright notice, this list of conditions and the following
27c0dd49bdSEiji Ota  *        disclaimer.
28c0dd49bdSEiji Ota  *
29c0dd49bdSEiji Ota  *      - Redistributions in binary form must reproduce the above
30c0dd49bdSEiji Ota  *        copyright notice, this list of conditions and the following
31c0dd49bdSEiji Ota  *        disclaimer in the documentation and/or other materials
32c0dd49bdSEiji Ota  *        provided with the distribution.
33c0dd49bdSEiji Ota  *
34c0dd49bdSEiji Ota  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
35c0dd49bdSEiji Ota  * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
36c0dd49bdSEiji Ota  * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
37c0dd49bdSEiji Ota  * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
38c0dd49bdSEiji Ota  * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
39c0dd49bdSEiji Ota  * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
40c0dd49bdSEiji Ota  * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
41c0dd49bdSEiji Ota  * SOFTWARE.
42c0dd49bdSEiji Ota  *
43c0dd49bdSEiji Ota  */
44c0dd49bdSEiji Ota #include <sys/rds.h>
45*94c3dad2SToomas Soome #include <sys/containerof.h>
46c0dd49bdSEiji Ota 
47c0dd49bdSEiji Ota #include <sys/ib/clients/rdsv3/rdsv3.h>
48c0dd49bdSEiji Ota #include <sys/ib/clients/rdsv3/loop.h>
49c0dd49bdSEiji Ota #include <sys/ib/clients/rdsv3/rdsv3_debug.h>
50c0dd49bdSEiji Ota 
51c0dd49bdSEiji Ota kmutex_t loop_conns_lock;
52c0dd49bdSEiji Ota list_t loop_conns;
53c0dd49bdSEiji Ota 
/*
 * This 'loopback' transport is a special case for flows that originate
 * and terminate on the same machine.
 *
 * Connection build-up notices if the destination address is thought of
 * as a local address by a transport.  At that time it decides to use the
 * loopback transport instead of the bound transport of the sending socket.
 *
 * The loopback transport's sending path just hands the sent rdsv3_message
 * straight to the receiving path via its embedded rdsv3_incoming.
 */
65c0dd49bdSEiji Ota 
66c0dd49bdSEiji Ota /*
67c0dd49bdSEiji Ota  * Usually a message transits both the sender and receiver's conns as it
68c0dd49bdSEiji Ota  * flows to the receiver.  In the loopback case, though, the receive path
69c0dd49bdSEiji Ota  * is handed the sending conn so the sense of the addresses is reversed.
70c0dd49bdSEiji Ota  */
71c0dd49bdSEiji Ota static int
rdsv3_loop_xmit(struct rdsv3_connection * conn,struct rdsv3_message * rm,unsigned int hdr_off,unsigned int sg,unsigned int off)72c0dd49bdSEiji Ota rdsv3_loop_xmit(struct rdsv3_connection *conn, struct rdsv3_message *rm,
73c0dd49bdSEiji Ota     unsigned int hdr_off, unsigned int sg,
74c0dd49bdSEiji Ota     unsigned int off)
75c0dd49bdSEiji Ota {
765d5562f5SEiji Ota 	/* Do not send cong updates to loopback */
775d5562f5SEiji Ota 	if (rm->m_inc.i_hdr.h_flags & RDSV3_FLAG_CONG_BITMAP) {
785d5562f5SEiji Ota 		rdsv3_cong_map_updated(conn->c_fcong, ~(uint64_t)0);
795d5562f5SEiji Ota 		return (sizeof (struct rdsv3_header) + RDSV3_CONG_MAP_BYTES);
805d5562f5SEiji Ota 	}
81c0dd49bdSEiji Ota 	ASSERT(!(hdr_off || sg || off));
82c0dd49bdSEiji Ota 
83c0dd49bdSEiji Ota 	RDSV3_DPRINTF4("rdsv3_loop_xmit", "Enter(conn: %p, rm: %p)", conn, rm);
84c0dd49bdSEiji Ota 
85c0dd49bdSEiji Ota 	rdsv3_inc_init(&rm->m_inc, conn, conn->c_laddr);
865d5562f5SEiji Ota 	/* For the embedded inc. Matching put is in loop_inc_free() */
875d5562f5SEiji Ota 	rdsv3_message_addref(rm);
88c0dd49bdSEiji Ota 
89c0dd49bdSEiji Ota 	rdsv3_recv_incoming(conn, conn->c_laddr, conn->c_faddr, &rm->m_inc,
90c0dd49bdSEiji Ota 	    KM_NOSLEEP);
91c0dd49bdSEiji Ota 
92c0dd49bdSEiji Ota 	rdsv3_send_drop_acked(conn, ntohll(rm->m_inc.i_hdr.h_sequence),
93c0dd49bdSEiji Ota 	    NULL);
94c0dd49bdSEiji Ota 
95c0dd49bdSEiji Ota 	rdsv3_inc_put(&rm->m_inc);
96c0dd49bdSEiji Ota 
97c0dd49bdSEiji Ota 	RDSV3_DPRINTF4("rdsv3_loop_xmit", "Return(conn: %p, rm: %p)", conn, rm);
98c0dd49bdSEiji Ota 
99c0dd49bdSEiji Ota 	return (sizeof (struct rdsv3_header) +
100c0dd49bdSEiji Ota 	    ntohl(rm->m_inc.i_hdr.h_len));
101c0dd49bdSEiji Ota }
102c0dd49bdSEiji Ota 
1035d5562f5SEiji Ota /*
1045d5562f5SEiji Ota  * See rds_loop_xmit(). Since our inc is embedded in the rm, we
1055d5562f5SEiji Ota  * make sure the rm lives at least until the inc is done.
1065d5562f5SEiji Ota  */
1075d5562f5SEiji Ota static void
rdsv3_loop_inc_free(struct rdsv3_incoming * inc)1085d5562f5SEiji Ota rdsv3_loop_inc_free(struct rdsv3_incoming *inc)
1095d5562f5SEiji Ota {
110*94c3dad2SToomas Soome 	struct rdsv3_message *rm = __containerof(inc, struct rdsv3_message,
1115d5562f5SEiji Ota 	    m_inc);
1125d5562f5SEiji Ota 	rdsv3_message_put(rm);
1135d5562f5SEiji Ota }
1145d5562f5SEiji Ota 
115c0dd49bdSEiji Ota static int
rdsv3_loop_xmit_cong_map(struct rdsv3_connection * conn,struct rdsv3_cong_map * map,unsigned long offset)116c0dd49bdSEiji Ota rdsv3_loop_xmit_cong_map(struct rdsv3_connection *conn,
117c0dd49bdSEiji Ota     struct rdsv3_cong_map *map,
118c0dd49bdSEiji Ota     unsigned long offset)
119c0dd49bdSEiji Ota {
120c0dd49bdSEiji Ota 	RDSV3_DPRINTF4("rdsv3_loop_xmit_cong_map", "Enter(conn: %p)", conn);
121c0dd49bdSEiji Ota 
122c0dd49bdSEiji Ota 	ASSERT(!offset);
123c0dd49bdSEiji Ota 	ASSERT(map == conn->c_lcong);
124c0dd49bdSEiji Ota 
125c0dd49bdSEiji Ota 	rdsv3_cong_map_updated(conn->c_fcong, ~(uint64_t)0);
126c0dd49bdSEiji Ota 
127c0dd49bdSEiji Ota 	RDSV3_DPRINTF4("rdsv3_loop_xmit_cong_map", "Return(conn: %p)", conn);
128c0dd49bdSEiji Ota 
129c0dd49bdSEiji Ota 	return (sizeof (struct rdsv3_header) + RDSV3_CONG_MAP_BYTES);
130c0dd49bdSEiji Ota }
131c0dd49bdSEiji Ota 
/*
 * recv hook for the loopback transport.  There is no work to do here, but
 * we need to at least give the thread something to succeed, so this
 * always reports success (0) and ignores conn.
 */
/* ARGSUSED */
static int
rdsv3_loop_recv(struct rdsv3_connection *conn)
{
	return (0);
}
139c0dd49bdSEiji Ota 
140cadbfdc3SEiji Ota struct rdsv3_loop_connection {
141c0dd49bdSEiji Ota 	struct list_node loop_node;
142c0dd49bdSEiji Ota 	struct rdsv3_connection *conn;
143c0dd49bdSEiji Ota };
144c0dd49bdSEiji Ota 
145c0dd49bdSEiji Ota /*
146c0dd49bdSEiji Ota  * Even the loopback transport needs to keep track of its connections,
147c0dd49bdSEiji Ota  * so it can call rdsv3_conn_destroy() on them on exit. N.B. there are
148c0dd49bdSEiji Ota  * 1+ loopback addresses (127.*.*.*) so it's not a bug to have
149c0dd49bdSEiji Ota  * multiple loopback conns allocated, although rather useless.
150c0dd49bdSEiji Ota  */
151c0dd49bdSEiji Ota /* ARGSUSED */
152c0dd49bdSEiji Ota static int
rdsv3_loop_conn_alloc(struct rdsv3_connection * conn,int gfp)153c0dd49bdSEiji Ota rdsv3_loop_conn_alloc(struct rdsv3_connection *conn, int gfp)
154c0dd49bdSEiji Ota {
155c0dd49bdSEiji Ota 	struct rdsv3_loop_connection *lc;
156c0dd49bdSEiji Ota 
157c0dd49bdSEiji Ota 	RDSV3_DPRINTF4("rdsv3_loop_conn_alloc", "Enter(conn: %p)", conn);
158c0dd49bdSEiji Ota 
159c0dd49bdSEiji Ota 	lc = kmem_zalloc(sizeof (struct rdsv3_loop_connection), KM_NOSLEEP);
1605d5562f5SEiji Ota 	if (!lc)
161c0dd49bdSEiji Ota 		return (-ENOMEM);
162c0dd49bdSEiji Ota 
163c0dd49bdSEiji Ota 	list_link_init(&lc->loop_node);
164c0dd49bdSEiji Ota 	lc->conn = conn;
165c0dd49bdSEiji Ota 	conn->c_transport_data = lc;
166c0dd49bdSEiji Ota 
167c0dd49bdSEiji Ota 	mutex_enter(&loop_conns_lock);
168c0dd49bdSEiji Ota 	list_insert_tail(&loop_conns, lc);
169c0dd49bdSEiji Ota 	mutex_exit(&loop_conns_lock);
170c0dd49bdSEiji Ota 
171c0dd49bdSEiji Ota 	RDSV3_DPRINTF4("rdsv3_loop_conn_alloc", "Return(conn: %p)", conn);
172c0dd49bdSEiji Ota 
173c0dd49bdSEiji Ota 	return (0);
174c0dd49bdSEiji Ota }
175c0dd49bdSEiji Ota 
176c0dd49bdSEiji Ota static void
rdsv3_loop_conn_free(void * arg)177c0dd49bdSEiji Ota rdsv3_loop_conn_free(void *arg)
178c0dd49bdSEiji Ota {
179c0dd49bdSEiji Ota 	struct rdsv3_loop_connection *lc = arg;
180c0dd49bdSEiji Ota 	RDSV3_DPRINTF5("rdsv3_loop_conn_free", "lc %p\n", lc);
181c0dd49bdSEiji Ota 	list_remove_node(&lc->loop_node);
182c0dd49bdSEiji Ota 	kmem_free(lc, sizeof (struct rdsv3_loop_connection));
183c0dd49bdSEiji Ota }
184c0dd49bdSEiji Ota 
/*
 * conn_connect hook for the loopback transport.  The connection is
 * reported complete right away through rdsv3_connect_complete(); always
 * returns 0.
 */
static int
rdsv3_loop_conn_connect(struct rdsv3_connection *conn)
{
	rdsv3_connect_complete(conn);

	return (0);
}
191c0dd49bdSEiji Ota 
/*
 * conn_shutdown hook for the loopback transport.  Intentionally empty:
 * this function performs no work and ignores conn.
 */
/* ARGSUSED */
static void
rdsv3_loop_conn_shutdown(struct rdsv3_connection *conn)
{
}
197c0dd49bdSEiji Ota 
198c0dd49bdSEiji Ota void
rdsv3_loop_exit(void)199c0dd49bdSEiji Ota rdsv3_loop_exit(void)
200c0dd49bdSEiji Ota {
201c0dd49bdSEiji Ota 	struct rdsv3_loop_connection *lc, *_lc;
202c0dd49bdSEiji Ota 	list_t tmp_list;
203c0dd49bdSEiji Ota 
204c0dd49bdSEiji Ota 	RDSV3_DPRINTF4("rdsv3_loop_exit", "Enter");
205c0dd49bdSEiji Ota 
206c0dd49bdSEiji Ota 	list_create(&tmp_list, sizeof (struct rdsv3_loop_connection),
207c0dd49bdSEiji Ota 	    offsetof(struct rdsv3_loop_connection, loop_node));
208c0dd49bdSEiji Ota 
209c0dd49bdSEiji Ota 	/* avoid calling conn_destroy with irqs off */
210c0dd49bdSEiji Ota 	mutex_enter(&loop_conns_lock);
211c0dd49bdSEiji Ota 	list_splice(&loop_conns, &tmp_list);
212c0dd49bdSEiji Ota 	mutex_exit(&loop_conns_lock);
213c0dd49bdSEiji Ota 
214c0dd49bdSEiji Ota 	RDSV3_FOR_EACH_LIST_NODE_SAFE(lc, _lc, &tmp_list, loop_node) {
215c0dd49bdSEiji Ota 		ASSERT(!lc->conn->c_passive);
216c0dd49bdSEiji Ota 		rdsv3_conn_destroy(lc->conn);
217c0dd49bdSEiji Ota 	}
218c0dd49bdSEiji Ota 
219c0dd49bdSEiji Ota 	list_destroy(&loop_conns);
220c0dd49bdSEiji Ota 	mutex_destroy(&loop_conns_lock);
221c0dd49bdSEiji Ota 
222c0dd49bdSEiji Ota 	RDSV3_DPRINTF4("rdsv3_loop_exit", "Return");
223c0dd49bdSEiji Ota }
224c0dd49bdSEiji Ota 
225c0dd49bdSEiji Ota /*
226c0dd49bdSEiji Ota  * This is missing .xmit_* because loop doesn't go through generic
227c0dd49bdSEiji Ota  * rdsv3_send_xmit() and doesn't call rdsv3_recv_incoming().  .listen_stop and
228c0dd49bdSEiji Ota  * .laddr_check are missing because transport.c doesn't iterate over
229c0dd49bdSEiji Ota  * rdsv3_loop_transport.
230c0dd49bdSEiji Ota  */
231c0dd49bdSEiji Ota #ifndef __lock_lint
232c0dd49bdSEiji Ota struct rdsv3_transport rdsv3_loop_transport = {
233c0dd49bdSEiji Ota 	.xmit			= rdsv3_loop_xmit,
234c0dd49bdSEiji Ota 	.xmit_cong_map		= rdsv3_loop_xmit_cong_map,
235c0dd49bdSEiji Ota 	.recv			= rdsv3_loop_recv,
236c0dd49bdSEiji Ota 	.conn_alloc		= rdsv3_loop_conn_alloc,
237c0dd49bdSEiji Ota 	.conn_free		= rdsv3_loop_conn_free,
238c0dd49bdSEiji Ota 	.conn_connect		= rdsv3_loop_conn_connect,
239c0dd49bdSEiji Ota 	.conn_shutdown		= rdsv3_loop_conn_shutdown,
240c0dd49bdSEiji Ota 	.inc_copy_to_user	= rdsv3_message_inc_copy_to_user,
2415d5562f5SEiji Ota 	.inc_free		= rdsv3_loop_inc_free,
242c0dd49bdSEiji Ota 	.t_name			= "loopback",
243c0dd49bdSEiji Ota };
244c0dd49bdSEiji Ota #else
245c0dd49bdSEiji Ota struct rdsv3_transport rdsv3_loop_transport;
246c0dd49bdSEiji Ota #endif
247