1c0dd49bdSEiji Ota /*
216e76cddSagiri  * Copyright (c) 2010, Oracle and/or its affiliates. All rights reserved.
3c0dd49bdSEiji Ota  */
416e76cddSagiri 
5c0dd49bdSEiji Ota /*
616e76cddSagiri  * This file contains code imported from the OFED rds source file info.c
716e76cddSagiri  * Oracle elects to have and use the contents of info.c under and governed
816e76cddSagiri  * by the OpenIB.org BSD license (see below for full license text). However,
916e76cddSagiri  * the following notice accompanied the original version of this file:
10c0dd49bdSEiji Ota  */
11c0dd49bdSEiji Ota 
12c0dd49bdSEiji Ota /*
13c0dd49bdSEiji Ota  * Copyright (c) 2006 Oracle.  All rights reserved.
14c0dd49bdSEiji Ota  *
15c0dd49bdSEiji Ota  * This software is available to you under a choice of one of two
16c0dd49bdSEiji Ota  * licenses.  You may choose to be licensed under the terms of the GNU
17c0dd49bdSEiji Ota  * General Public License (GPL) Version 2, available from the file
18c0dd49bdSEiji Ota  * COPYING in the main directory of this source tree, or the
19c0dd49bdSEiji Ota  * OpenIB.org BSD license below:
20c0dd49bdSEiji Ota  *
21c0dd49bdSEiji Ota  *     Redistribution and use in source and binary forms, with or
22c0dd49bdSEiji Ota  *     without modification, are permitted provided that the following
23c0dd49bdSEiji Ota  *     conditions are met:
24c0dd49bdSEiji Ota  *
25c0dd49bdSEiji Ota  *      - Redistributions of source code must retain the above
26c0dd49bdSEiji Ota  *        copyright notice, this list of conditions and the following
27c0dd49bdSEiji Ota  *        disclaimer.
28c0dd49bdSEiji Ota  *
29c0dd49bdSEiji Ota  *      - Redistributions in binary form must reproduce the above
30c0dd49bdSEiji Ota  *        copyright notice, this list of conditions and the following
31c0dd49bdSEiji Ota  *        disclaimer in the documentation and/or other materials
32c0dd49bdSEiji Ota  *        provided with the distribution.
33c0dd49bdSEiji Ota  *
34c0dd49bdSEiji Ota  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
35c0dd49bdSEiji Ota  * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
36c0dd49bdSEiji Ota  * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
37c0dd49bdSEiji Ota  * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
38c0dd49bdSEiji Ota  * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
39c0dd49bdSEiji Ota  * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
40c0dd49bdSEiji Ota  * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
41c0dd49bdSEiji Ota  * SOFTWARE.
42c0dd49bdSEiji Ota  *
43c0dd49bdSEiji Ota  */
44c0dd49bdSEiji Ota #include <sys/rds.h>
45c0dd49bdSEiji Ota 
46c0dd49bdSEiji Ota #include <sys/ib/clients/rdsv3/rdsv3.h>
47b27516f5Sagiri #include <sys/ib/clients/rdsv3/rdsv3_debug.h>
48c0dd49bdSEiji Ota 
49c0dd49bdSEiji Ota /*
 * This file implements the RDS info ioctl, rdsv3_info_ioctl() (a getsockopt()
 * call in the OFED code this file was imported from), which copies a set of
 * fixed sized structs into a user-specified buffer as a means of providing
 * read-only information about RDS.
53c0dd49bdSEiji Ota  *
54c0dd49bdSEiji Ota  * For a given information source there are a given number of fixed sized
55c0dd49bdSEiji Ota  * structs at a given time.  The structs are only copied if the user-specified
56c0dd49bdSEiji Ota  * buffer is big enough.  The destination pages that make up the buffer
57c0dd49bdSEiji Ota  * are pinned for the duration of the copy.
58c0dd49bdSEiji Ota  *
59c0dd49bdSEiji Ota  * This gives us the following benefits:
60c0dd49bdSEiji Ota  *
61c0dd49bdSEiji Ota  * - simple implementation, no copy "position" across multiple calls
62c0dd49bdSEiji Ota  * - consistent snapshot of an info source
63c0dd49bdSEiji Ota  * - atomic copy works well with whatever locking info source has
64c0dd49bdSEiji Ota  * - one portable tool to get rds info across implementations
65c0dd49bdSEiji Ota  * - long-lived tool can get info without allocating
66c0dd49bdSEiji Ota  *
67c0dd49bdSEiji Ota  * at the following costs:
68c0dd49bdSEiji Ota  *
69c0dd49bdSEiji Ota  * - info source copy must be pinned, may be "large"
70c0dd49bdSEiji Ota  */
71c0dd49bdSEiji Ota 
/*
 * rdsv3_info_lock is held by rdsv3_info_register_func() and
 * rdsv3_info_deregister_func() while they modify rdsv3_info_funcs.
 * NOTE(review): the mutex is not initialized in this file -- confirm where
 * mutex_init() is called for it.
 */
72c0dd49bdSEiji Ota static kmutex_t rdsv3_info_lock;
/*
 * Table of info functions, one slot per option in the range
 * [RDS_INFO_FIRST, RDS_INFO_LAST], indexed by (optname - RDS_INFO_FIRST).
 * A NULL slot means no function is registered for that option.
 */
73fe817b60SEiji Ota static rdsv3_info_func rdsv3_info_funcs[RDS_INFO_LAST - RDS_INFO_FIRST + 1];
74c0dd49bdSEiji Ota 
75c0dd49bdSEiji Ota void
rdsv3_info_register_func(int optname,rdsv3_info_func func)76c0dd49bdSEiji Ota rdsv3_info_register_func(int optname, rdsv3_info_func func)
77c0dd49bdSEiji Ota {
78fe817b60SEiji Ota 	int offset = optname - RDS_INFO_FIRST;
79c0dd49bdSEiji Ota 
80fe817b60SEiji Ota 	ASSERT(optname >= RDS_INFO_FIRST && optname <= RDS_INFO_LAST);
81c0dd49bdSEiji Ota 
82c0dd49bdSEiji Ota 	mutex_enter(&rdsv3_info_lock);
835d5562f5SEiji Ota 	ASSERT(!rdsv3_info_funcs[offset]);
84c0dd49bdSEiji Ota 	rdsv3_info_funcs[offset] = func;
85c0dd49bdSEiji Ota 	mutex_exit(&rdsv3_info_lock);
86c0dd49bdSEiji Ota }
87c0dd49bdSEiji Ota 
88c0dd49bdSEiji Ota /* ARGSUSED */
89c0dd49bdSEiji Ota void
rdsv3_info_deregister_func(int optname,rdsv3_info_func func)90c0dd49bdSEiji Ota rdsv3_info_deregister_func(int optname, rdsv3_info_func func)
91c0dd49bdSEiji Ota {
92fe817b60SEiji Ota 	int offset = optname - RDS_INFO_FIRST;
93c0dd49bdSEiji Ota 
94fe817b60SEiji Ota 	ASSERT(optname >= RDS_INFO_FIRST && optname <= RDS_INFO_LAST);
95c0dd49bdSEiji Ota 
96c0dd49bdSEiji Ota 	mutex_enter(&rdsv3_info_lock);
97c0dd49bdSEiji Ota 	rdsv3_info_funcs[offset] = NULL;
98c0dd49bdSEiji Ota 	mutex_exit(&rdsv3_info_lock);
99c0dd49bdSEiji Ota }
100c0dd49bdSEiji Ota 
101c0dd49bdSEiji Ota /*
102c0dd49bdSEiji Ota  * @optval points to the userspace buffer that the information snapshot
103c0dd49bdSEiji Ota  * will be copied into.
104c0dd49bdSEiji Ota  *
105c0dd49bdSEiji Ota  * This function returns -errno if there is a failure, particularly -ENOSPC
106c0dd49bdSEiji Ota  * if the given userspace buffer was not large enough to fit the snapshot.
107c0dd49bdSEiji Ota  * On success it returns the positive number of bytes of each array element
108c0dd49bdSEiji Ota  * in the snapshot.
109c0dd49bdSEiji Ota  */
110c0dd49bdSEiji Ota int
rdsv3_info_ioctl(struct rsock * sock,int optname,char * optval,int32_t * rvalp)111b27516f5Sagiri rdsv3_info_ioctl(struct rsock *sock, int optname, char *optval,
112b27516f5Sagiri     int32_t *rvalp)
113c0dd49bdSEiji Ota {
114c0dd49bdSEiji Ota 	struct rdsv3_info_iterator iter;
115c0dd49bdSEiji Ota 	struct rdsv3_info_lengths lens;
116c0dd49bdSEiji Ota 	rdsv3_info_func func;
117b27516f5Sagiri 	struct rds_info_arg arg;
118b27516f5Sagiri 	uint32_t ulen = 0, klen;
119c0dd49bdSEiji Ota 
120fe817b60SEiji Ota 	func = rdsv3_info_funcs[optname - RDS_INFO_FIRST];
121c0dd49bdSEiji Ota 	if (func == NULL) {
122b27516f5Sagiri 		RDSV3_DPRINTF2("rdsv3_info_ioctl",
123b27516f5Sagiri 		    "No Info Function, optname: %d", optname);
124b27516f5Sagiri 		return (ENOPROTOOPT);
125b27516f5Sagiri 	}
126b27516f5Sagiri 
127b27516f5Sagiri 	if (optval == NULL) {
128b27516f5Sagiri 		RDSV3_DPRINTF2("rdsv3_info_ioctl", "optval is NULL");
129b27516f5Sagiri 		return (EINVAL);
130b27516f5Sagiri 	}
131b27516f5Sagiri 	if (ddi_copyin(optval, &arg, sizeof (struct rds_info_arg), 0) != 0) {
132b27516f5Sagiri 		RDSV3_DPRINTF2("rdsv3_info_ioctl",
133b27516f5Sagiri 		    "ddi_copyin for address: 0x%p failed", optval);
134b27516f5Sagiri 		return (EFAULT);
135b27516f5Sagiri 	}
136b27516f5Sagiri 
137b27516f5Sagiri 	RDSV3_DPRINTF4("rdsv3_info_ioctl",
138b27516f5Sagiri 	    "optname: %d lenp: %llx datap: %llx", optname, arg.lenp, arg.datap);
139b27516f5Sagiri 
140*9af7e484SToomas Soome 	if (arg.lenp == (uintptr_t)NULL) {
141b27516f5Sagiri 		RDSV3_DPRINTF2("rdsv3_info_ioctl", "arg.lenp is NULL");
142b27516f5Sagiri 		return (EFAULT);
143b27516f5Sagiri 	}
144b27516f5Sagiri 
145b27516f5Sagiri 	if (ddi_copyin((void *)(uintptr_t)arg.lenp, &ulen,
146b27516f5Sagiri 	    sizeof (uint32_t), 0) != 0) {
147b27516f5Sagiri 		RDSV3_DPRINTF2("rdsv3_info_ioctl",
148b27516f5Sagiri 		    "ddi_copyin for address, lenp: 0x%p failed", arg.lenp);
149b27516f5Sagiri 		return (EFAULT);
150c0dd49bdSEiji Ota 	}
151c0dd49bdSEiji Ota 
152b27516f5Sagiri 	RDSV3_DPRINTF3("rdsv3_info_ioctl", "optname: %d len: %d datap: %p",
153b27516f5Sagiri 	    optname, ulen, arg.datap);
154b27516f5Sagiri 
155b27516f5Sagiri 	bzero(&iter, sizeof (struct rdsv3_info_iterator));
156b27516f5Sagiri 	/* a 0 len call is just trying to probe its length */
157b27516f5Sagiri 	if (ulen == 0) {
158c0dd49bdSEiji Ota 		iter.addr = NULL;
159*9af7e484SToomas Soome 	} else if (arg.datap == (uintptr_t)NULL) {
160b27516f5Sagiri 		RDSV3_DPRINTF2("rdsv3_info_ioctl",
161b27516f5Sagiri 		    "arg.datap is NULL, ulen set to: %d", ulen);
162b27516f5Sagiri 		return (EINVAL);
163c0dd49bdSEiji Ota 	} else {
164b27516f5Sagiri 		iter.addr = (char *)(uintptr_t)arg.datap;
165c0dd49bdSEiji Ota 	}
166c0dd49bdSEiji Ota 	iter.offset = 0;
167c0dd49bdSEiji Ota 
168b27516f5Sagiri 	bzero(&lens, sizeof (struct rdsv3_info_lengths));
169b27516f5Sagiri 	func(sock, ulen, &iter, &lens);
170c0dd49bdSEiji Ota 
171b27516f5Sagiri 	klen = lens.nr * lens.each;
172b27516f5Sagiri 
173b27516f5Sagiri 	if (ddi_copyout(&klen, (void *)(uintptr_t)arg.lenp,
174b27516f5Sagiri 	    sizeof (uint32_t), 0) != 0) {
175b27516f5Sagiri 		RDSV3_DPRINTF2("rdsv3_info_ioctl",
176b27516f5Sagiri 		    "ddi_copyout(%p %p) failed", &klen, arg.lenp);
177b27516f5Sagiri 		return (EFAULT);
178c0dd49bdSEiji Ota 	}
179c0dd49bdSEiji Ota 
180b27516f5Sagiri 	RDSV3_DPRINTF3("rdsv3_info_ioctl",
181b27516f5Sagiri 	    "optname: %d ulen: %d klen: %d each: %d", optname, ulen, klen,
182b27516f5Sagiri 	    lens.each);
183b27516f5Sagiri 
184b27516f5Sagiri 	if (ulen < klen) {
185b27516f5Sagiri 		return (ENOSPC);
186b27516f5Sagiri 	}
187b27516f5Sagiri 
188b27516f5Sagiri 	RDSV3_DPRINTF4("rdsv3_info_ioctl", "Return optname: %d", optname);
189b27516f5Sagiri 
190b27516f5Sagiri 	*rvalp = lens.each;
191c0dd49bdSEiji Ota 	return (0);
192c0dd49bdSEiji Ota }
193