xref: /freebsd/sys/dev/irdma/irdma_cm.h (revision 1165fc9a526630487a1feb63daef65c5aee1a583)
1 /*-
2  * SPDX-License-Identifier: GPL-2.0 or Linux-OpenIB
3  *
4  * Copyright (c) 2015 - 2021 Intel Corporation
5  *
6  * This software is available to you under a choice of one of two
7  * licenses.  You may choose to be licensed under the terms of the GNU
8  * General Public License (GPL) Version 2, available from the file
9  * COPYING in the main directory of this source tree, or the
10  * OpenFabrics.org BSD license below:
11  *
12  *   Redistribution and use in source and binary forms, with or
13  *   without modification, are permitted provided that the following
14  *   conditions are met:
15  *
16  *    - Redistributions of source code must retain the above
17  *	copyright notice, this list of conditions and the following
18  *	disclaimer.
19  *
20  *    - Redistributions in binary form must reproduce the above
21  *	copyright notice, this list of conditions and the following
22  *	disclaimer in the documentation and/or other materials
23  *	provided with the distribution.
24  *
25  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
26  * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
27  * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
28  * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
29  * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
30  * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
31  * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
32  * SOFTWARE.
33  */
34 /*$FreeBSD$*/
35 
36 #ifndef IRDMA_CM_H
37 #define IRDMA_CM_H
38 
39 #define IRDMA_MPA_REQUEST_ACCEPT	1
40 #define IRDMA_MPA_REQUEST_REJECT	2
41 
42 /* IETF MPA -- defines */
43 #define IEFT_MPA_KEY_REQ	"MPA ID Req Frame"
44 #define IEFT_MPA_KEY_REP	"MPA ID Rep Frame"
45 #define IETF_MPA_KEY_SIZE	16
46 #define IETF_MPA_VER		1
47 #define IETF_MAX_PRIV_DATA_LEN	512
48 #define IETF_MPA_FRAME_SIZE	20
49 #define IETF_RTR_MSG_SIZE	4
50 #define IETF_MPA_V2_FLAG	0x10
51 #define SNDMARKER_SEQNMASK	0x000001ff
52 #define IRDMA_MAX_IETF_SIZE	32
53 
54 /* IETF RTR MSG Fields */
55 #define IETF_PEER_TO_PEER	0x8000
56 #define IETF_FLPDU_ZERO_LEN	0x4000
57 #define IETF_RDMA0_WRITE	0x8000
58 #define IETF_RDMA0_READ		0x4000
59 #define IETF_NO_IRD_ORD		0x3fff
60 
61 #define MAX_PORTS	65536
62 
63 #define IRDMA_PASSIVE_STATE_INDICATED	0
64 #define IRDMA_DO_NOT_SEND_RESET_EVENT	1
65 #define IRDMA_SEND_RESET_EVENT		2
66 
67 #define MAX_IRDMA_IFS	4
68 
69 #define SET_ACK		1
70 #define SET_SYN		2
71 #define SET_FIN		4
72 #define SET_RST		8
73 
74 #define TCP_OPTIONS_PADDING	3
75 
76 #define IRDMA_DEFAULT_RETRYS	64
77 #define IRDMA_DEFAULT_RETRANS	8
78 #define IRDMA_DEFAULT_TTL		0x40
79 #define IRDMA_DEFAULT_RTT_VAR		6
80 #define IRDMA_DEFAULT_SS_THRESH		0x3fffffff
81 #define IRDMA_DEFAULT_REXMIT_THRESH	8
82 
83 #define IRDMA_RETRY_TIMEOUT	HZ
84 #define IRDMA_SHORT_TIME	10
85 #define IRDMA_LONG_TIME		(2 * HZ)
86 #define IRDMA_MAX_TIMEOUT	((unsigned long)(12 * HZ))
87 
88 #define IRDMA_CM_HASHTABLE_SIZE		1024
89 #define IRDMA_CM_TCP_TIMER_INTERVAL	3000
90 #define IRDMA_CM_DEFAULT_MTU		1540
91 #define IRDMA_CM_DEFAULT_FRAME_CNT	10
92 #define IRDMA_CM_THREAD_STACK_SIZE	256
93 #define IRDMA_CM_DEFAULT_RCV_WND	64240
94 #define IRDMA_CM_DEFAULT_RCV_WND_SCALED	0x3FFFC
95 #define IRDMA_CM_DEFAULT_RCV_WND_SCALE	2
96 #define IRDMA_CM_DEFAULT_FREE_PKTS	10
97 #define IRDMA_CM_FREE_PKT_LO_WATERMARK	2
98 #define IRDMA_CM_DEFAULT_MSS		536
99 #define IRDMA_CM_DEFAULT_MPA_VER	2
100 #define IRDMA_CM_DEFAULT_SEQ		0x159bf75f
101 #define IRDMA_CM_DEFAULT_LOCAL_ID	0x3b47
102 #define IRDMA_CM_DEFAULT_SEQ2		0x18ed5740
103 #define IRDMA_CM_DEFAULT_LOCAL_ID2	0xb807
104 #define IRDMA_MAX_CM_BUF		(IRDMA_MAX_IETF_SIZE + IETF_MAX_PRIV_DATA_LEN)
105 
106 enum ietf_mpa_flags {
107 	IETF_MPA_FLAGS_REJECT  = 0x20,
108 	IETF_MPA_FLAGS_CRC     = 0x40,
109 	IETF_MPA_FLAGS_MARKERS = 0x80,
110 };
111 
112 enum irdma_timer_type {
113 	IRDMA_TIMER_TYPE_SEND,
114 	IRDMA_TIMER_TYPE_CLOSE,
115 };
116 
117 enum option_nums {
118 	OPTION_NUM_EOL,
119 	OPTION_NUM_NONE,
120 	OPTION_NUM_MSS,
121 	OPTION_NUM_WINDOW_SCALE,
122 	OPTION_NUM_SACK_PERM,
123 	OPTION_NUM_SACK,
124 	OPTION_NUM_WRITE0 = 0xbc,
125 };
126 
127 /* cm node transition states */
128 enum irdma_cm_node_state {
129 	IRDMA_CM_STATE_UNKNOWN,
130 	IRDMA_CM_STATE_INITED,
131 	IRDMA_CM_STATE_LISTENING,
132 	IRDMA_CM_STATE_SYN_RCVD,
133 	IRDMA_CM_STATE_SYN_SENT,
134 	IRDMA_CM_STATE_ONE_SIDE_ESTABLISHED,
135 	IRDMA_CM_STATE_ESTABLISHED,
136 	IRDMA_CM_STATE_ACCEPTING,
137 	IRDMA_CM_STATE_MPAREQ_SENT,
138 	IRDMA_CM_STATE_MPAREQ_RCVD,
139 	IRDMA_CM_STATE_MPAREJ_RCVD,
140 	IRDMA_CM_STATE_OFFLOADED,
141 	IRDMA_CM_STATE_FIN_WAIT1,
142 	IRDMA_CM_STATE_FIN_WAIT2,
143 	IRDMA_CM_STATE_CLOSE_WAIT,
144 	IRDMA_CM_STATE_TIME_WAIT,
145 	IRDMA_CM_STATE_LAST_ACK,
146 	IRDMA_CM_STATE_CLOSING,
147 	IRDMA_CM_STATE_LISTENER_DESTROYED,
148 	IRDMA_CM_STATE_CLOSED,
149 };
150 
151 enum mpa_frame_ver {
152 	IETF_MPA_V1 = 1,
153 	IETF_MPA_V2 = 2,
154 };
155 
156 enum mpa_frame_key {
157 	MPA_KEY_REQUEST,
158 	MPA_KEY_REPLY,
159 };
160 
161 enum send_rdma0 {
162 	SEND_RDMA_READ_ZERO  = 1,
163 	SEND_RDMA_WRITE_ZERO = 2,
164 };
165 
166 enum irdma_tcpip_pkt_type {
167 	IRDMA_PKT_TYPE_UNKNOWN,
168 	IRDMA_PKT_TYPE_SYN,
169 	IRDMA_PKT_TYPE_SYNACK,
170 	IRDMA_PKT_TYPE_ACK,
171 	IRDMA_PKT_TYPE_FIN,
172 	IRDMA_PKT_TYPE_RST,
173 };
174 
175 enum irdma_cm_listener_state {
176 	IRDMA_CM_LISTENER_PASSIVE_STATE = 1,
177 	IRDMA_CM_LISTENER_ACTIVE_STATE  = 2,
178 	IRDMA_CM_LISTENER_EITHER_STATE  = 3,
179 };
180 
181 /* CM event codes */
182 enum irdma_cm_event_type {
183 	IRDMA_CM_EVENT_UNKNOWN,
184 	IRDMA_CM_EVENT_ESTABLISHED,
185 	IRDMA_CM_EVENT_MPA_REQ,
186 	IRDMA_CM_EVENT_MPA_CONNECT,
187 	IRDMA_CM_EVENT_MPA_ACCEPT,
188 	IRDMA_CM_EVENT_MPA_REJECT,
189 	IRDMA_CM_EVENT_MPA_ESTABLISHED,
190 	IRDMA_CM_EVENT_CONNECTED,
191 	IRDMA_CM_EVENT_RESET,
192 	IRDMA_CM_EVENT_ABORTED,
193 };
194 
195 struct irdma_bth { /* Base Trasnport Header */
196 	u8 opcode;
197 	u8 flags;
198 	__be16 pkey;
199 	__be32 qpn;
200 	__be32 apsn;
201 };
202 
203 struct ietf_mpa_v1 {
204 	u8 key[IETF_MPA_KEY_SIZE];
205 	u8 flags;
206 	u8 rev;
207 	__be16 priv_data_len;
208 	u8 priv_data[];
209 };
210 
211 struct ietf_rtr_msg {
212 	__be16 ctrl_ird;
213 	__be16 ctrl_ord;
214 };
215 
216 struct ietf_mpa_v2 {
217 	u8 key[IETF_MPA_KEY_SIZE];
218 	u8 flags;
219 	u8 rev;
220 	__be16 priv_data_len;
221 	struct ietf_rtr_msg rtr_msg;
222 	u8 priv_data[];
223 };
224 
225 struct option_base {
226 	u8 optionnum;
227 	u8 len;
228 };
229 
230 struct option_mss {
231 	u8 optionnum;
232 	u8 len;
233 	__be16 mss;
234 };
235 
236 struct option_windowscale {
237 	u8 optionnum;
238 	u8 len;
239 	u8 shiftcount;
240 };
241 
242 union all_known_options {
243 	char eol;
244 	struct option_base base;
245 	struct option_mss mss;
246 	struct option_windowscale windowscale;
247 };
248 
249 struct irdma_timer_entry {
250 	struct list_head list;
251 	unsigned long timetosend; /* jiffies */
252 	struct irdma_puda_buf *sqbuf;
253 	u32 type;
254 	u32 retrycount;
255 	u32 retranscount;
256 	u32 context;
257 	u32 send_retrans;
258 	int close_when_complete;
259 };
260 
261 /* CM context params */
262 struct irdma_cm_tcp_context {
263 	u8 client;
264 	u32 loc_seq_num;
265 	u32 loc_ack_num;
266 	u32 rem_ack_num;
267 	u32 rcv_nxt;
268 	u32 loc_id;
269 	u32 rem_id;
270 	u32 snd_wnd;
271 	u32 max_snd_wnd;
272 	u32 rcv_wnd;
273 	u32 mss;
274 	u8 snd_wscale;
275 	u8 rcv_wscale;
276 };
277 
278 struct irdma_apbvt_entry {
279 	struct hlist_node hlist;
280 	u32 use_cnt;
281 	u16 port;
282 };
283 
284 struct irdma_cm_listener {
285 	struct list_head list;
286 	struct iw_cm_id *cm_id;
287 	struct irdma_cm_core *cm_core;
288 	struct irdma_device *iwdev;
289 	struct list_head child_listen_list;
290 	struct irdma_apbvt_entry *apbvt_entry;
291 	enum irdma_cm_listener_state listener_state;
292 	atomic_t refcnt;
293 	atomic_t pend_accepts_cnt;
294 	u32 loc_addr[4];
295 	u32 reused_node;
296 	int backlog;
297 	u16 loc_port;
298 	u16 vlan_id;
299 	u8 loc_mac[ETH_ALEN];
300 	u8 user_pri;
301 	u8 tos;
302 	bool qhash_set:1;
303 	bool ipv4:1;
304 };
305 
306 struct irdma_kmem_info {
307 	void *addr;
308 	u32 size;
309 };
310 
311 struct irdma_mpa_priv_info {
312 	const void *addr;
313 	u32 size;
314 };
315 
316 struct irdma_cm_node {
317 	struct irdma_qp *iwqp;
318 	struct irdma_device *iwdev;
319 	struct irdma_sc_dev *dev;
320 	struct irdma_cm_tcp_context tcp_cntxt;
321 	struct irdma_cm_core *cm_core;
322 	struct irdma_timer_entry *send_entry;
323 	struct irdma_timer_entry *close_entry;
324 	struct irdma_cm_listener *listener;
325 	struct list_head timer_entry;
326 	struct list_head reset_entry;
327 	struct list_head teardown_entry;
328 	struct irdma_apbvt_entry *apbvt_entry;
329 	struct rcu_head rcu_head;
330 	struct irdma_mpa_priv_info pdata;
331 	struct irdma_sc_ah *ah;
332 	struct irdma_kmem_info mpa_hdr;
333 	struct iw_cm_id *cm_id;
334 	struct hlist_node list;
335 	struct completion establish_comp;
336 	spinlock_t retrans_list_lock; /* protect CM node rexmit updates*/
337 	atomic_t passive_state;
338 	atomic_t refcnt;
339 	enum irdma_cm_node_state state;
340 	enum send_rdma0 send_rdma0_op;
341 	enum mpa_frame_ver mpa_frame_rev;
342 	u32 loc_addr[4], rem_addr[4];
343 	u16 loc_port, rem_port;
344 	int apbvt_set;
345 	int accept_pend;
346 	u16 vlan_id;
347 	u16 ird_size;
348 	u16 ord_size;
349 	u16 mpav2_ird_ord;
350 	u16 lsmm_size;
351 	u8 pdata_buf[IETF_MAX_PRIV_DATA_LEN];
352 	u8 loc_mac[ETH_ALEN];
353 	u8 rem_mac[ETH_ALEN];
354 	u8 user_pri;
355 	u8 tos;
356 	bool ack_rcvd:1;
357 	bool qhash_set:1;
358 	bool ipv4:1;
359 	bool snd_mark_en:1;
360 	bool rcv_mark_en:1;
361 	bool do_lpb:1;
362 	bool accelerated:1;
363 	struct ietf_mpa_v2 mpa_v2_frame;
364 };
365 
366 /* Used by internal CM APIs to pass CM information*/
367 struct irdma_cm_info {
368 	struct iw_cm_id *cm_id;
369 	u16 loc_port;
370 	u16 rem_port;
371 	u32 loc_addr[4];
372 	u32 rem_addr[4];
373 	u32 qh_qpid;
374 	u16 vlan_id;
375 	int backlog;
376 	u8 user_pri;
377 	u8 tos;
378 	bool ipv4;
379 };
380 
381 struct irdma_cm_event {
382 	enum irdma_cm_event_type type;
383 	struct irdma_cm_info cm_info;
384 	struct work_struct event_work;
385 	struct irdma_cm_node *cm_node;
386 };
387 
388 struct irdma_cm_core {
389 	struct irdma_device *iwdev;
390 	struct irdma_sc_dev *dev;
391 	struct list_head listen_list;
392 	DECLARE_HASHTABLE(cm_hash_tbl, 8);
393 	DECLARE_HASHTABLE(apbvt_hash_tbl, 8);
394 	struct timer_list tcp_timer;
395 	struct workqueue_struct *event_wq;
396 	spinlock_t ht_lock; /* protect CM node (active side) list */
397 	spinlock_t listen_list_lock; /* protect listener list */
398 	spinlock_t apbvt_lock; /*serialize apbvt add/del entries*/
399 	u64 stats_nodes_created;
400 	u64 stats_nodes_destroyed;
401 	u64 stats_listen_created;
402 	u64 stats_listen_destroyed;
403 	u64 stats_listen_nodes_created;
404 	u64 stats_listen_nodes_destroyed;
405 	u64 stats_lpbs;
406 	u64 stats_accepts;
407 	u64 stats_rejects;
408 	u64 stats_connect_errs;
409 	u64 stats_passive_errs;
410 	u64 stats_pkt_retrans;
411 	u64 stats_backlog_drops;
412 	struct irdma_puda_buf *(*form_cm_frame)(struct irdma_cm_node *cm_node,
413 						struct irdma_kmem_info *options,
414 						struct irdma_kmem_info *hdr,
415 						struct irdma_mpa_priv_info *pdata,
416 						u8 flags);
417 	int (*cm_create_ah)(struct irdma_cm_node *cm_node, bool wait);
418 	void (*cm_free_ah)(struct irdma_cm_node *cm_node);
419 };
420 
421 int irdma_schedule_cm_timer(struct irdma_cm_node *cm_node,
422 			    struct irdma_puda_buf *sqbuf,
423 			    enum irdma_timer_type type, int send_retrans,
424 			    int close_when_complete);
425 
426 static inline u8 irdma_tos2dscp(u8 tos)
427 {
428 #define IRDMA_DSCP_S 2
429 #define IRDMA_DSCP_M (0x3f << IRDMA_DSCP_S)
430 	return RS_32(tos, IRDMA_DSCP);
431 }
432 
433 int irdma_accept(struct iw_cm_id *cm_id, struct iw_cm_conn_param *conn_param);
434 int irdma_reject(struct iw_cm_id *cm_id, const void *pdata, u8 pdata_len);
435 int irdma_connect(struct iw_cm_id *cm_id, struct iw_cm_conn_param *conn_param);
436 int irdma_create_listen(struct iw_cm_id *cm_id, int backlog);
437 int irdma_destroy_listen(struct iw_cm_id *cm_id);
438 int irdma_add_arp(struct irdma_pci_f *rf, u32 *ip, u8 *mac);
439 void irdma_cm_teardown_connections(struct irdma_device *iwdev, u32 *ipaddr,
440 				   struct irdma_cm_info *nfo,
441 				   bool disconnect_all);
442 int irdma_cm_start(struct irdma_device *dev);
443 int irdma_cm_stop(struct irdma_device *dev);
444 bool irdma_ipv4_is_lpb(u32 loc_addr, u32 rem_addr);
445 bool irdma_ipv6_is_lpb(u32 *loc_addr, u32 *rem_addr);
446 int irdma_arp_table(struct irdma_pci_f *rf, u32 *ip_addr,
447 		    u8 *mac_addr, u32 action);
448 bool irdma_port_in_use(struct irdma_cm_core *cm_core, u16 port);
449 void irdma_send_ack(struct irdma_cm_node *cm_node);
450 void irdma_lpb_nop(struct irdma_sc_qp *qp);
451 void irdma_rem_ref_cm_node(struct irdma_cm_node *cm_node);
452 void irdma_add_conn_est_qh(struct irdma_cm_node *cm_node);
453 #endif /* IRDMA_CM_H */
454