xref: /illumos-gate/usr/src/uts/common/inet/tcp/tcp_opt_data.c (revision 1f6352c601b7f3c744b4684ff673c813927da24c)
1 /*
2  * CDDL HEADER START
3  *
4  * The contents of this file are subject to the terms of the
5  * Common Development and Distribution License (the "License").
6  * You may not use this file except in compliance with the License.
7  *
8  * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
9  * or http://www.opensolaris.org/os/licensing.
10  * See the License for the specific language governing permissions
11  * and limitations under the License.
12  *
13  * When distributing Covered Code, include this CDDL HEADER in each
14  * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
15  * If applicable, add the following below this CDDL HEADER, with the
16  * fields enclosed by brackets "[]" replaced with your own identifying
17  * information: Portions Copyright [yyyy] [name of copyright owner]
18  *
19  * CDDL HEADER END
20  */
21 /*
22  * Copyright 2009 Sun Microsystems, Inc.  All rights reserved.
23  * Use is subject to license terms.
24  */
25 
26 #include <sys/types.h>
27 #include <sys/stream.h>
28 #define	_SUN_TPI_VERSION 2
29 #include <sys/tihdr.h>
30 #include <sys/socket.h>
31 #include <sys/xti_xtiopt.h>
32 #include <sys/xti_inet.h>
33 
34 #include <inet/common.h>
35 #include <netinet/ip6.h>
36 #include <inet/ip.h>
37 
38 #include <netinet/in.h>
39 #include <netinet/tcp.h>
40 #include <inet/optcom.h>
41 
42 
43 extern int	tcp_opt_default(queue_t *q, int level, int name, uchar_t *ptr);
44 extern int	tcp_tpi_opt_get(queue_t *q, int level, int name, uchar_t *ptr);
45 extern int	tcp_tpi_opt_set(queue_t *q, uint_t optset_context, int level,
46     int name, uint_t inlen, uchar_t *invalp, uint_t *outlenp, uchar_t *outvalp,
47     void *thisdg_attrs, cred_t *cr, mblk_t *mblk);
48 
49 /*
50  * Table of all known options handled on a TCP protocol stack.
51  *
52  * Note: This table contains options processed by both TCP and IP levels
53  *       and is the superset of options that can be performed on a TCP over IP
54  *       stack.
55  */
56 opdes_t	tcp_opt_arr[] = {
57 
58 { SO_LINGER,	SOL_SOCKET, OA_RW, OA_RW, OP_NP, OP_PASSNEXT,
59 	sizeof (struct linger), 0 },
60 
61 { SO_DEBUG,	SOL_SOCKET, OA_RW, OA_RW, OP_NP, OP_PASSNEXT, sizeof (int), 0 },
62 { SO_KEEPALIVE,	SOL_SOCKET, OA_RW, OA_RW, OP_NP, OP_PASSNEXT, sizeof (int), 0 },
63 { SO_DONTROUTE,	SOL_SOCKET, OA_RW, OA_RW, OP_NP, OP_PASSNEXT, sizeof (int), 0 },
64 { SO_USELOOPBACK, SOL_SOCKET, OA_RW, OA_RW, OP_NP, OP_PASSNEXT, sizeof (int), 0
65 	},
66 { SO_BROADCAST,	SOL_SOCKET, OA_RW, OA_RW, OP_NP, OP_PASSNEXT, sizeof (int), 0 },
67 { SO_REUSEADDR, SOL_SOCKET, OA_RW, OA_RW, OP_NP, OP_PASSNEXT, sizeof (int), 0 },
68 { SO_OOBINLINE, SOL_SOCKET, OA_RW, OA_RW, OP_NP, OP_PASSNEXT, sizeof (int), 0 },
69 { SO_TYPE,	SOL_SOCKET, OA_R, OA_R, OP_NP, OP_PASSNEXT, sizeof (int), 0 },
70 { SO_SNDBUF,	SOL_SOCKET, OA_RW, OA_RW, OP_NP, OP_PASSNEXT, sizeof (int), 0 },
71 { SO_RCVBUF,	SOL_SOCKET, OA_RW, OA_RW, OP_NP, OP_PASSNEXT, sizeof (int), 0 },
72 { SO_DGRAM_ERRIND, SOL_SOCKET, OA_RW, OA_RW, OP_NP, OP_PASSNEXT, sizeof (int), 0
73 	},
74 { SO_SND_COPYAVOID, SOL_SOCKET, OA_RW, OA_RW, OP_NP, 0, sizeof (int), 0 },
75 { SO_ANON_MLP, SOL_SOCKET, OA_RW, OA_RW, OP_NP, OP_PASSNEXT, sizeof (int),
76 	0 },
77 { SO_MAC_EXEMPT, SOL_SOCKET, OA_RW, OA_RW, OP_NP, OP_PASSNEXT, sizeof (int),
78 	0 },
79 { SO_ALLZONES, SOL_SOCKET, OA_R, OA_RW, OP_CONFIG, OP_PASSNEXT, sizeof (int),
80 	0 },
81 { SO_EXCLBIND, SOL_SOCKET, OA_RW, OA_RW, OP_NP, OP_PASSNEXT, sizeof (int), 0 },
82 
83 { SO_DOMAIN,	SOL_SOCKET, OA_R, OA_R, OP_NP, OP_PASSNEXT, sizeof (int), 0 },
84 
85 { SO_PROTOTYPE,	SOL_SOCKET, OA_R, OA_R, OP_NP, OP_PASSNEXT, sizeof (int), 0 },
86 
87 { TCP_NODELAY,	IPPROTO_TCP, OA_RW, OA_RW, OP_NP, OP_PASSNEXT, sizeof (int), 0
88 	},
89 { TCP_MAXSEG,	IPPROTO_TCP, OA_R, OA_R, OP_NP, OP_PASSNEXT, sizeof (uint_t),
90 	536 },
91 
92 { TCP_NOTIFY_THRESHOLD, IPPROTO_TCP, OA_RW, OA_RW, OP_NP,
93 	(OP_PASSNEXT|OP_DEF_FN), sizeof (int), -1 /* not initialized */ },
94 
95 { TCP_ABORT_THRESHOLD, IPPROTO_TCP, OA_RW, OA_RW, OP_NP,
96 	(OP_PASSNEXT|OP_DEF_FN), sizeof (int), -1 /* not initialized */ },
97 
98 { TCP_CONN_NOTIFY_THRESHOLD, IPPROTO_TCP, OA_RW, OA_RW, OP_NP,
99 	(OP_PASSNEXT|OP_DEF_FN), sizeof (int), -1 /* not initialized */ },
100 
101 { TCP_CONN_ABORT_THRESHOLD, IPPROTO_TCP, OA_RW, OA_RW, OP_NP,
102 	(OP_PASSNEXT|OP_DEF_FN), sizeof (int), -1 /* not initialized */ },
103 
104 { TCP_RECVDSTADDR, IPPROTO_TCP, OA_RW, OA_RW, OP_NP, OP_PASSNEXT, sizeof (int),
105 	0 },
106 
107 { TCP_ANONPRIVBIND, IPPROTO_TCP, OA_R, OA_RW, OP_PRIVPORT, OP_PASSNEXT,
108 	sizeof (int), 0 },
109 
110 { TCP_EXCLBIND, IPPROTO_TCP, OA_RW, OA_RW, OP_NP, OP_PASSNEXT, sizeof (int), 0
111 	},
112 
113 { TCP_INIT_CWND, IPPROTO_TCP, OA_RW, OA_RW, OP_CONFIG, OP_PASSNEXT,
114 	sizeof (int), 0 },
115 
116 { TCP_KEEPALIVE_THRESHOLD, IPPROTO_TCP, OA_RW, OA_RW, OP_NP, OP_PASSNEXT,
117 	sizeof (int), 0	},
118 
119 { TCP_KEEPALIVE_ABORT_THRESHOLD, IPPROTO_TCP, OA_RW, OA_RW, OP_NP, OP_PASSNEXT,
120 	sizeof (int), 0	},
121 
122 { TCP_CORK, IPPROTO_TCP, OA_RW, OA_RW, OP_NP, OP_PASSNEXT, sizeof (int), 0 },
123 
124 { IP_OPTIONS,	IPPROTO_IP, OA_RW, OA_RW, OP_NP,
125 	(OP_PASSNEXT|OP_VARLEN|OP_NODEFAULT),
126 	IP_MAX_OPT_LENGTH + IP_ADDR_LEN, -1 /* not initialized */ },
127 { T_IP_OPTIONS,	IPPROTO_IP, OA_RW, OA_RW, OP_NP,
128 	(OP_PASSNEXT|OP_VARLEN|OP_NODEFAULT),
129 	IP_MAX_OPT_LENGTH + IP_ADDR_LEN, -1 /* not initialized */ },
130 
131 { IP_TOS,	IPPROTO_IP, OA_RW, OA_RW, OP_NP, OP_PASSNEXT, sizeof (int), 0 },
132 { T_IP_TOS,	IPPROTO_IP, OA_RW, OA_RW, OP_NP, OP_PASSNEXT, sizeof (int), 0 },
133 { IP_TTL,	IPPROTO_IP, OA_RW, OA_RW, OP_NP, (OP_PASSNEXT|OP_DEF_FN),
134 	sizeof (int), -1 /* not initialized */ },
135 
136 { IP_SEC_OPT, IPPROTO_IP, OA_RW, OA_RW, OP_NP, (OP_PASSNEXT|OP_NODEFAULT),
137 	sizeof (ipsec_req_t), -1 /* not initialized */ },
138 
139 { IP_BOUND_IF, IPPROTO_IP, OA_RW, OA_RW, OP_NP, OP_PASSNEXT,
140 	sizeof (int),	0 /* no ifindex */ },
141 
142 { IP_UNSPEC_SRC, IPPROTO_IP, OA_R, OA_RW, OP_RAW, OP_PASSNEXT,
143 	sizeof (int), 0 },
144 
145 { IPV6_UNICAST_HOPS, IPPROTO_IPV6, OA_RW, OA_RW, OP_NP, (OP_PASSNEXT|OP_DEF_FN),
146 	sizeof (int), -1 /* not initialized */ },
147 
148 { IPV6_BOUND_IF, IPPROTO_IPV6, OA_RW, OA_RW, OP_NP, OP_PASSNEXT,
149 	sizeof (int),	0 /* no ifindex */ },
150 
151 { IP_NEXTHOP, IPPROTO_IP, OA_R, OA_RW, OP_CONFIG, OP_PASSNEXT,
152 	sizeof (in_addr_t),	-1 /* not initialized  */ },
153 
154 { IPV6_UNSPEC_SRC, IPPROTO_IPV6, OA_R, OA_RW, OP_RAW, OP_PASSNEXT,
155 	sizeof (int), 0 },
156 
157 { IPV6_PKTINFO, IPPROTO_IPV6, OA_RW, OA_RW, OP_NP,
158 	(OP_PASSNEXT|OP_NODEFAULT|OP_VARLEN),
159 	sizeof (struct in6_pktinfo), -1 /* not initialized */ },
160 { IPV6_NEXTHOP, IPPROTO_IPV6, OA_RW, OA_RW, OP_NP,
161 	(OP_PASSNEXT|OP_NODEFAULT),
162 	sizeof (sin6_t), -1 /* not initialized */ },
163 { IPV6_HOPOPTS, IPPROTO_IPV6, OA_RW, OA_RW, OP_NP,
164 	(OP_PASSNEXT|OP_VARLEN|OP_NODEFAULT), 255*8,
165 	-1 /* not initialized */ },
166 { IPV6_DSTOPTS, IPPROTO_IPV6, OA_RW, OA_RW, OP_NP,
167 	(OP_PASSNEXT|OP_VARLEN|OP_NODEFAULT), 255*8,
168 	-1 /* not initialized */ },
169 { IPV6_RTHDRDSTOPTS, IPPROTO_IPV6, OA_RW, OA_RW, OP_NP,
170 	(OP_PASSNEXT|OP_VARLEN|OP_NODEFAULT), 255*8,
171 	-1 /* not initialized */ },
172 { IPV6_RTHDR, IPPROTO_IPV6, OA_RW, OA_RW, OP_NP,
173 	(OP_PASSNEXT|OP_VARLEN|OP_NODEFAULT), 255*8,
174 	-1 /* not initialized */ },
175 { IPV6_TCLASS, IPPROTO_IPV6, OA_RW, OA_RW, OP_NP,
176 	(OP_PASSNEXT|OP_NODEFAULT),
177 	sizeof (int), -1 /* not initialized */ },
178 { IPV6_PATHMTU, IPPROTO_IPV6, OA_RW, OA_RW, OP_NP,
179 	(OP_PASSNEXT|OP_NODEFAULT),
180 	sizeof (struct ip6_mtuinfo), -1 /* not initialized */ },
181 { IPV6_USE_MIN_MTU, IPPROTO_IPV6, OA_RW, OA_RW, OP_NP, OP_PASSNEXT,
182 	sizeof (int), 0 },
183 { IPV6_V6ONLY, IPPROTO_IPV6, OA_RW, OA_RW, OP_NP, OP_PASSNEXT,
184 	sizeof (int), 0 },
185 
186 /* Enable receipt of ancillary data */
187 { IPV6_RECVPKTINFO, IPPROTO_IPV6, OA_RW, OA_RW, OP_NP, OP_PASSNEXT,
188 	sizeof (int), 0 },
189 { IPV6_RECVHOPLIMIT, IPPROTO_IPV6, OA_RW, OA_RW, OP_NP, OP_PASSNEXT,
190 	sizeof (int), 0 },
191 { IPV6_RECVHOPOPTS, IPPROTO_IPV6, OA_RW, OA_RW, OP_NP, OP_PASSNEXT,
192 	sizeof (int), 0 },
193 { _OLD_IPV6_RECVDSTOPTS, IPPROTO_IPV6, OA_RW, OA_RW, OP_NP, OP_PASSNEXT,
194 	sizeof (int), 0 },
195 { IPV6_RECVDSTOPTS, IPPROTO_IPV6, OA_RW, OA_RW, OP_NP, OP_PASSNEXT,
196 	sizeof (int), 0 },
197 { IPV6_RECVRTHDR, IPPROTO_IPV6, OA_RW, OA_RW, OP_NP, OP_PASSNEXT,
198 	sizeof (int), 0 },
199 { IPV6_RECVRTHDRDSTOPTS, IPPROTO_IPV6, OA_RW, OA_RW, OP_NP, OP_PASSNEXT,
200 	sizeof (int), 0 },
201 { IPV6_RECVTCLASS, IPPROTO_IPV6, OA_RW, OA_RW, OP_NP, OP_PASSNEXT,
202 	sizeof (int), 0 },
203 
204 { IPV6_SEC_OPT, IPPROTO_IPV6, OA_RW, OA_RW, OP_NP, (OP_PASSNEXT|OP_NODEFAULT),
205 	sizeof (ipsec_req_t), -1 /* not initialized */ },
206 { IPV6_SRC_PREFERENCES, IPPROTO_IPV6, OA_RW, OA_RW, OP_NP, OP_PASSNEXT,
207 	sizeof (uint32_t), IPV6_PREFER_SRC_DEFAULT },
208 };
209 
210 /*
211  * Table of all supported levels
212  * Note: Some levels (e.g. XTI_GENERIC) may be valid but may not have
213  * any supported options so we need this info separately.
214  *
215  * This is needed only for topmost tpi providers and is used only by
216  * XTI interfaces.
217  */
218 optlevel_t	tcp_valid_levels_arr[] = {
219 	XTI_GENERIC,
220 	SOL_SOCKET,
221 	IPPROTO_TCP,
222 	IPPROTO_IP,
223 	IPPROTO_IPV6
224 };
225 
226 
227 #define	TCP_OPT_ARR_CNT		A_CNT(tcp_opt_arr)
228 #define	TCP_VALID_LEVELS_CNT	A_CNT(tcp_valid_levels_arr)
229 
230 uint_t tcp_max_optsize; /* initialized when TCP driver is loaded */
231 
232 /*
233  * Initialize option database object for TCP
234  *
235  * This object represents database of options to search passed to
236  * {sock,tpi}optcom_req() interface routine to take care of option
237  * management and associated methods.
238  */
239 
240 optdb_obj_t tcp_opt_obj = {
241 	tcp_opt_default,	/* TCP default value function pointer */
242 	tcp_tpi_opt_get,	/* TCP get function pointer */
243 	tcp_tpi_opt_set,	/* TCP set function pointer */
244 	B_TRUE,			/* TCP is tpi provider */
245 	TCP_OPT_ARR_CNT,	/* TCP option database count of entries */
246 	tcp_opt_arr,		/* TCP option database */
247 	TCP_VALID_LEVELS_CNT,	/* TCP valid level count of entries */
248 	tcp_valid_levels_arr	/* TCP valid level array */
249 };
250