1 /*
2  * CDDL HEADER START
3  *
4  * The contents of this file are subject to the terms of the
5  * Common Development and Distribution License (the "License").
6  * You may not use this file except in compliance with the License.
7  *
8  * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
9  * or http://www.opensolaris.org/os/licensing.
10  * See the License for the specific language governing permissions
11  * and limitations under the License.
12  *
13  * When distributing Covered Code, include this CDDL HEADER in each
14  * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
15  * If applicable, add the following below this CDDL HEADER, with the
16  * fields enclosed by brackets "[]" replaced with your own identifying
17  * information: Portions Copyright [yyyy] [name of copyright owner]
18  *
19  * CDDL HEADER END
20  */
21 /*
22  * Copyright 2006 Sun Microsystems, Inc.  All rights reserved.
23  * Use is subject to license terms.
24  */
25 
26 #pragma ident	"%Z%%M%	%I%	%E% SMI"
27 
28 #include <sys/types.h>
29 #include <sys/stream.h>
30 #define	_SUN_TPI_VERSION 2
31 #include <sys/tihdr.h>
32 #include <sys/socket.h>
33 #include <sys/xti_xtiopt.h>
34 #include <sys/xti_inet.h>
35 
36 #include <inet/common.h>
37 #include <netinet/ip6.h>
38 #include <inet/ip.h>
39 
40 #include <netinet/in.h>
41 #include <netinet/tcp.h>
42 #include <inet/optcom.h>
43 
44 
/*
 * TCP option handler entry points.  They are only declared here; their
 * definitions are not part of this file.  tcp_opt_obj, at the bottom of this
 * file, stores them as its default-value, get and set function pointers.
 */
45 extern int	tcp_opt_default(queue_t *q, int level, int name, uchar_t *ptr);
46 extern int	tcp_opt_get(queue_t *q, int level, int name, uchar_t *ptr);
47 extern int	tcp_opt_set(queue_t *q, uint_t optset_context, int level,
48     int name, uint_t inlen, uchar_t *invalp, uint_t *outlenp, uchar_t *outvalp,
49     void *thisdg_attrs, cred_t *cr, mblk_t *mblk);
50 
51 /*
52  * Table of all known options handled on a TCP protocol stack.
53  *
54  * Note: This table contains options processed by both TCP and IP levels
55  *       and is the superset of options that can be performed on a TCP over IP
56  *       stack.
 *
 * Each entry is a positional initializer with eight values.  Reading the
 * entries below, the columns are: option name, option level, two access
 * values (OA_R or OA_RW), a privilege value (OP_NP, OP_PRIVPORT, OP_CONFIG
 * or OP_RAW), property flags (OP_PASSNEXT, OP_DEF_FN, OP_VARLEN,
 * OP_NODEFAULT, or 0), a size, and a default value.
 * NOTE(review): the field names and exact meanings come from the opdes_t
 * definition, which is not in this file (presumably <inet/optcom.h>) --
 * confirm there before adding, removing or reordering columns.
 *
 * Patterns visible in the entries:
 *  - The two access columns differ only for TCP_ANONPRIVBIND, IP_UNSPEC_SRC
 *    and IPV6_UNSPEC_SRC (OA_R followed by OA_RW); those entries also use a
 *    privilege value other than OP_NP.
 *  - A default of -1 is annotated "not initialized"; it appears on every
 *    entry flagged OP_DEF_FN or OP_NODEFAULT, and on IP_NEXTHOP.
 *  - Entries flagged OP_VARLEN give 40, 255*8 or sizeof (struct in6_pktinfo)
 *    in the size column; presumably that is a maximum length -- confirm.
57  */
58 opdes_t	tcp_opt_arr[] = {
59 
/* SOL_SOCKET level options. */
60 { SO_LINGER,	SOL_SOCKET, OA_RW, OA_RW, OP_NP, OP_PASSNEXT,
61 	sizeof (struct linger), 0 },
62 
63 { SO_DEBUG,	SOL_SOCKET, OA_RW, OA_RW, OP_NP, OP_PASSNEXT, sizeof (int), 0 },
64 { SO_KEEPALIVE,	SOL_SOCKET, OA_RW, OA_RW, OP_NP, OP_PASSNEXT, sizeof (int), 0 },
65 { SO_DONTROUTE,	SOL_SOCKET, OA_RW, OA_RW, OP_NP, OP_PASSNEXT, sizeof (int), 0 },
66 { SO_USELOOPBACK, SOL_SOCKET, OA_RW, OA_RW, OP_NP, OP_PASSNEXT, sizeof (int), 0
67 	},
68 { SO_BROADCAST,	SOL_SOCKET, OA_RW, OA_RW, OP_NP, OP_PASSNEXT, sizeof (int), 0 },
69 { SO_REUSEADDR, SOL_SOCKET, OA_RW, OA_RW, OP_NP, OP_PASSNEXT, sizeof (int), 0 },
70 { SO_OOBINLINE, SOL_SOCKET, OA_RW, OA_RW, OP_NP, OP_PASSNEXT, sizeof (int), 0 },
71 { SO_TYPE,	SOL_SOCKET, OA_R, OA_R, OP_NP, OP_PASSNEXT, sizeof (int), 0 },
72 { SO_SNDBUF,	SOL_SOCKET, OA_RW, OA_RW, OP_NP, OP_PASSNEXT, sizeof (int), 0 },
73 { SO_RCVBUF,	SOL_SOCKET, OA_RW, OA_RW, OP_NP, OP_PASSNEXT, sizeof (int), 0 },
74 { SO_DGRAM_ERRIND, SOL_SOCKET, OA_RW, OA_RW, OP_NP, OP_PASSNEXT, sizeof (int), 0
75 	},
/* The only entry in this table whose property-flags value is 0. */
76 { SO_SND_COPYAVOID, SOL_SOCKET, OA_RW, OA_RW, OP_NP, 0, sizeof (int), 0 },
77 { SO_ANON_MLP, SOL_SOCKET, OA_RW, OA_RW, OP_NP, OP_PASSNEXT, sizeof (int),
78     0 },
79 { SO_MAC_EXEMPT, SOL_SOCKET, OA_RW, OA_RW, OP_NP, OP_PASSNEXT, sizeof (int),
80     0 },
/* IPPROTO_TCP level options. */
81 { TCP_NODELAY,	IPPROTO_TCP, OA_RW, OA_RW, OP_NP, OP_PASSNEXT, sizeof (int), 0
82 	},
83 { TCP_MAXSEG,	IPPROTO_TCP, OA_R, OA_R, OP_NP, OP_PASSNEXT, sizeof (uint_t),
84 	536 },
85 
86 { TCP_NOTIFY_THRESHOLD, IPPROTO_TCP, OA_RW, OA_RW, OP_NP,
87 	(OP_PASSNEXT|OP_DEF_FN), sizeof (int), -1 /* not initialized */ },
88 
89 { TCP_ABORT_THRESHOLD, IPPROTO_TCP, OA_RW, OA_RW, OP_NP,
90 	(OP_PASSNEXT|OP_DEF_FN), sizeof (int), -1 /* not initialized */ },
91 
92 { TCP_CONN_NOTIFY_THRESHOLD, IPPROTO_TCP, OA_RW, OA_RW, OP_NP,
93 	(OP_PASSNEXT|OP_DEF_FN), sizeof (int), -1 /* not initialized */ },
94 
95 { TCP_CONN_ABORT_THRESHOLD, IPPROTO_TCP, OA_RW, OA_RW, OP_NP,
96 	(OP_PASSNEXT|OP_DEF_FN), sizeof (int), -1 /* not initialized */ },
97 
98 { TCP_RECVDSTADDR, IPPROTO_TCP, OA_RW, OA_RW, OP_NP, OP_PASSNEXT, sizeof (int),
99 	0 },
100 
101 { TCP_ANONPRIVBIND, IPPROTO_TCP, OA_R, OA_RW, OP_PRIVPORT, OP_PASSNEXT,
102 	sizeof (int), 0 },
103 
104 { TCP_EXCLBIND, IPPROTO_TCP, OA_RW, OA_RW, OP_NP, OP_PASSNEXT, sizeof (int), 0
105 	},
106 
107 { TCP_INIT_CWND, IPPROTO_TCP, OA_RW, OA_RW, OP_CONFIG, OP_PASSNEXT,
108 	sizeof (int), 0 },
109 
110 { TCP_KEEPALIVE_THRESHOLD, IPPROTO_TCP, OA_RW, OA_RW, OP_NP, OP_PASSNEXT,
111 	sizeof (int), 0	},
112 
113 { TCP_KEEPALIVE_ABORT_THRESHOLD, IPPROTO_TCP, OA_RW, OA_RW, OP_NP, OP_PASSNEXT,
114 	sizeof (int), 0	},
115 
116 { TCP_CORK, IPPROTO_TCP, OA_RW, OA_RW, OP_NP, OP_PASSNEXT, sizeof (int), 0 },
117 
/* IPPROTO_IP level options. */
118 { IP_OPTIONS,	IPPROTO_IP, OA_RW, OA_RW, OP_NP,
119 	(OP_PASSNEXT|OP_VARLEN|OP_NODEFAULT),
120 	40, -1 /* not initialized */ },
121 { T_IP_OPTIONS,	IPPROTO_IP, OA_RW, OA_RW, OP_NP,
122 	(OP_PASSNEXT|OP_VARLEN|OP_NODEFAULT),
123 	40, -1 /* not initialized */ },
124 
125 { IP_TOS,	IPPROTO_IP, OA_RW, OA_RW, OP_NP, OP_PASSNEXT, sizeof (int), 0 },
126 { T_IP_TOS,	IPPROTO_IP, OA_RW, OA_RW, OP_NP, OP_PASSNEXT, sizeof (int), 0 },
127 { IP_TTL,	IPPROTO_IP, OA_RW, OA_RW, OP_NP, (OP_PASSNEXT|OP_DEF_FN),
128 	sizeof (int), -1 /* not initialized */ },
129 
130 { IP_SEC_OPT, IPPROTO_IP, OA_RW, OA_RW, OP_NP, (OP_PASSNEXT|OP_NODEFAULT),
131 	sizeof (ipsec_req_t), -1 /* not initialized */ },
132 
133 { IP_BOUND_IF, IPPROTO_IP, OA_RW, OA_RW, OP_NP, OP_PASSNEXT,
134 	sizeof (int),	0 /* no ifindex */ },
135 
136 { IP_UNSPEC_SRC, IPPROTO_IP, OA_R, OA_RW, OP_RAW, OP_PASSNEXT,
137 	sizeof (int), 0 },
138 
/*
 * IPPROTO_IPV6 level options.  Note that IP_NEXTHOP, an IPPROTO_IP level
 * option, is interleaved among them.
 */
139 { IPV6_UNICAST_HOPS, IPPROTO_IPV6, OA_RW, OA_RW, OP_NP, (OP_PASSNEXT|OP_DEF_FN),
140 	sizeof (int), -1 /* not initialized */ },
141 
142 { IPV6_BOUND_IF, IPPROTO_IPV6, OA_RW, OA_RW, OP_NP, OP_PASSNEXT,
143 	sizeof (int),	0 /* no ifindex */ },
144 
145 { IP_NEXTHOP, IPPROTO_IP, OA_RW, OA_RW, OP_CONFIG, OP_PASSNEXT,
146 	sizeof (in_addr_t),	-1 /* not initialized  */ },
147 
148 { IPV6_BOUND_PIF, IPPROTO_IPV6, OA_RW, OA_RW, OP_NP, OP_PASSNEXT,
149 	sizeof (int),	0 /* no ifindex */ },
150 
151 { IPV6_UNSPEC_SRC, IPPROTO_IPV6, OA_R, OA_RW, OP_RAW, OP_PASSNEXT,
152 	sizeof (int), 0 },
153 
154 { IPV6_PKTINFO, IPPROTO_IPV6, OA_RW, OA_RW, OP_NP,
155 	(OP_PASSNEXT|OP_NODEFAULT|OP_VARLEN),
156 	sizeof (struct in6_pktinfo), -1 /* not initialized */ },
157 { IPV6_NEXTHOP, IPPROTO_IPV6, OA_RW, OA_RW, OP_NP,
158 	(OP_PASSNEXT|OP_NODEFAULT),
159 	sizeof (sin6_t), -1 /* not initialized */ },
160 { IPV6_HOPOPTS, IPPROTO_IPV6, OA_RW, OA_RW, OP_NP,
161 	(OP_PASSNEXT|OP_VARLEN|OP_NODEFAULT), 255*8,
162 	-1 /* not initialized */ },
163 { IPV6_DSTOPTS, IPPROTO_IPV6, OA_RW, OA_RW, OP_NP,
164 	(OP_PASSNEXT|OP_VARLEN|OP_NODEFAULT), 255*8,
165 	-1 /* not initialized */ },
166 { IPV6_RTHDRDSTOPTS, IPPROTO_IPV6, OA_RW, OA_RW, OP_NP,
167 	(OP_PASSNEXT|OP_VARLEN|OP_NODEFAULT), 255*8,
168 	-1 /* not initialized */ },
169 { IPV6_RTHDR, IPPROTO_IPV6, OA_RW, OA_RW, OP_NP,
170 	(OP_PASSNEXT|OP_VARLEN|OP_NODEFAULT), 255*8,
171 	-1 /* not initialized */ },
172 { IPV6_TCLASS, IPPROTO_IPV6, OA_RW, OA_RW, OP_NP,
173 	(OP_PASSNEXT|OP_NODEFAULT),
174 	sizeof (int), -1 /* not initialized */ },
175 { IPV6_PATHMTU, IPPROTO_IPV6, OA_RW, OA_RW, OP_NP,
176 	(OP_PASSNEXT|OP_NODEFAULT),
177 	sizeof (struct ip6_mtuinfo), -1 /* not initialized */ },
178 { IPV6_USE_MIN_MTU, IPPROTO_IPV6, OA_RW, OA_RW, OP_NP, OP_PASSNEXT,
179 	sizeof (int), 0 },
180 { IPV6_V6ONLY, IPPROTO_IPV6, OA_RW, OA_RW, OP_NP, OP_PASSNEXT,
181 	sizeof (int), 0 },
182 
183 /* Enable receipt of ancillary data */
184 { IPV6_RECVPKTINFO, IPPROTO_IPV6, OA_RW, OA_RW, OP_NP, OP_PASSNEXT,
185 	sizeof (int), 0 },
186 { IPV6_RECVHOPLIMIT, IPPROTO_IPV6, OA_RW, OA_RW, OP_NP, OP_PASSNEXT,
187 	sizeof (int), 0 },
188 { IPV6_RECVHOPOPTS, IPPROTO_IPV6, OA_RW, OA_RW, OP_NP, OP_PASSNEXT,
189 	sizeof (int), 0 },
190 { _OLD_IPV6_RECVDSTOPTS, IPPROTO_IPV6, OA_RW, OA_RW, OP_NP, OP_PASSNEXT,
191 	sizeof (int), 0 },
192 { IPV6_RECVDSTOPTS, IPPROTO_IPV6, OA_RW, OA_RW, OP_NP, OP_PASSNEXT,
193 	sizeof (int), 0 },
194 { IPV6_RECVRTHDR, IPPROTO_IPV6, OA_RW, OA_RW, OP_NP, OP_PASSNEXT,
195 	sizeof (int), 0 },
196 { IPV6_RECVRTHDRDSTOPTS, IPPROTO_IPV6, OA_RW, OA_RW, OP_NP, OP_PASSNEXT,
197 	sizeof (int), 0 },
198 { IPV6_RECVTCLASS, IPPROTO_IPV6, OA_RW, OA_RW, OP_NP, OP_PASSNEXT,
199 	sizeof (int), 0 },
200 
201 { IPV6_SEC_OPT, IPPROTO_IPV6, OA_RW, OA_RW, OP_NP, (OP_PASSNEXT|OP_NODEFAULT),
202 	sizeof (ipsec_req_t), -1 /* not initialized */ },
203 { IPV6_SRC_PREFERENCES, IPPROTO_IPV6, OA_RW, OA_RW, OP_NP, OP_PASSNEXT,
204 	sizeof (uint32_t), IPV6_PREFER_SRC_DEFAULT },
205 };
206 
207 /*
208  * Table of all supported levels
209  * Note: Some levels (e.g. XTI_GENERIC) may be valid but may not have
210  * any supported options so we need this info separately.
211  *
212  * This is needed only for topmost tpi providers and is used only by
213  * XTI interfaces.
 *
 * In this file that is exactly the situation for XTI_GENERIC: it is listed
 * here, but no entry in tcp_opt_arr uses it as its level.  The other four
 * levels are the ones that appear in tcp_opt_arr.
214  */
215 optlevel_t	tcp_valid_levels_arr[] = {
216 	XTI_GENERIC,
217 	SOL_SOCKET,
218 	IPPROTO_TCP,
219 	IPPROTO_IP,
220 	IPPROTO_IPV6
221 };
222 
223 
/*
 * Sizes of the two tables above, as stored in tcp_opt_obj below, whose
 * comments describe them as counts of entries.  A_CNT is not defined in
 * this file (presumably it comes from one of the included headers).
 */
224 #define	TCP_OPT_ARR_CNT		A_CNT(tcp_opt_arr)
225 #define	TCP_VALID_LEVELS_CNT	A_CNT(tcp_valid_levels_arr)
226 
/* Defined here without an initializer; nothing in this file assigns it. */
227 uint_t tcp_max_optsize; /* initialized when TCP driver is loaded */
228 
229 /*
230  * Initialize option database object for TCP
231  *
232  * This object represents the database of options to search.  It is passed
233  * to the {sock,tpi}optcom_req() interface routines, which take care of
234  * option management and the associated methods.
 *
 * The initializer is positional: three handler function pointers, a flag,
 * then a (count, table) pair for the options and another for the valid
 * levels.  NOTE(review): the field order must match the optdb_obj_t
 * definition, which is not in this file -- confirm before changing it.
235  */
236 
237 optdb_obj_t tcp_opt_obj = {
238 	tcp_opt_default,	/* TCP default value function pointer */
239 	tcp_opt_get,		/* TCP get function pointer */
240 	tcp_opt_set,		/* TCP set function pointer */
241 	B_TRUE,			/* TCP is tpi provider */
242 	TCP_OPT_ARR_CNT,	/* TCP option database count of entries */
243 	tcp_opt_arr,		/* TCP option database */
244 	TCP_VALID_LEVELS_CNT,	/* TCP valid level count of entries */
245 	tcp_valid_levels_arr	/* TCP valid level array */
246 };
247