xref: /linux/tools/testing/selftests/net/mptcp/mptcp_connect.sh (revision cbf658dd09419f1ef9de11b9604e950bdd5c170b)
1#!/bin/bash
2# SPDX-License-Identifier: GPL-2.0
3
4# Double quotes to prevent globbing and word splitting is recommended in new
5# code but we accept it, especially because there were too many before having
6# address all other issues detected by shellcheck.
7#shellcheck disable=SC2086
8
9. "$(dirname "${0}")/mptcp_lib.sh"
10
# Reference point for the total run time printed by display_time().
time_start=$(date +%s)

# getopts specification: a trailing ':' marks an option that takes a value.
optstring="S:R:d:e:l:r:h4cm:f:tC"
# 'ret' tracks the status of the current group of tests, 'final_ret' is the
# exit code of the whole script (see log_if_error()).
ret=0
final_ret=0
# Temporary files, created with mktemp once the prerequisites were checked.
sin=""
sout=""
cin_disconnect=""
cin=""
cout=""
capture=false
# -t value given to mptcp_connect, and the 'timeout' guarding each endpoint.
timeout_poll=30
timeout_test=$((timeout_poll * 2 + 1))
ipv6=true
ethtool_random_on=true
# Random netem settings, used unless overridden with -d / -l.
tc_delay="$((RANDOM%50))"
tc_loss=$((RANDOM%101))
testmode=""
sndbuf=0
rcvbuf=0
options_log=true
do_tcp=0
checksum=false
filesize=0
connect_per_transfer=1
# do_transfer() increments the port before each use: first one is 10000.
port=$((10000 - 1))
# Start from a known state: without this, values exported by the caller would
# be appended to by '-e' or would silently replace the random reordering.
ethtool_args=""
tc_reorder=""

# Turn the 0..100 draw into a netem loss percentage between 0.01% and 1%;
# 0 means "no loss" and leaves tc_loss empty.
if [ $tc_loss -eq 100 ];then
	tc_loss=1%
elif [ $tc_loss -ge 10 ]; then
	tc_loss=0.$tc_loss%
elif [ $tc_loss -ge 1 ]; then
	tc_loss=0.0$tc_loss%
else
	tc_loss=""
fi
47
# Print the command-line help on stdout.
usage() {
	echo "Usage: $0 [ options ]"
	echo -e "\t-h: show this help and exit"
	echo -e "\t-d: tc/netem delay in milliseconds, e.g. \"-d 10\" (default random)"
	echo -e "\t-l: tc/netem loss percentage, e.g. \"-l 0.02\" (default random)"
	# The inner quotes must be escaped, otherwise they end the string and are
	# not displayed.
	echo -e "\t-r: tc/netem reorder mode, e.g. \"-r 25% 50% gap 5\", use \"-r 0\" to disable reordering (default random)"
	echo -e "\t-e: ethtool features to disable, e.g.: \"-e tso -e gso\" (default: randomly disable any of tso/gso/gro)"
	echo -e "\t-4: IPv4 only: disable IPv6 tests (default: test both IPv4 and IPv6)"
	echo -e "\t-c: capture packets for each test using tcpdump (default: no capture)"
	echo -e "\t-f: size of file to transfer in bytes (default random)"
	echo -e "\t-S: set sndbuf value (default: use kernel default)"
	echo -e "\t-R: set rcvbuf value (default: use kernel default)"
	echo -e "\t-m: test mode (poll, sendfile; default: poll)"
	echo -e "\t-t: also run tests with TCP (use twice to non-fallback tcp)"
	echo -e "\t-C: enable the MPTCP data checksum"
}
63
# Command-line parsing: every option overrides one of the defaults set above.
while getopts "$optstring" option; do
	case "$option" in
	h)
		usage $0
		exit ${KSFT_PASS}
		;;
	d | S | R)
		# These three options share the same numeric validation.
		if ! [ $OPTARG -ge 0 ]; then
			echo "-${option} requires numeric argument, got \"$OPTARG\"" 1>&2
			exit ${KSFT_FAIL}
		fi
		case "$option" in
		d) tc_delay="$OPTARG" ;;
		S) sndbuf="$OPTARG" ;;
		R) rcvbuf="$OPTARG" ;;
		esac
		;;
	e)
		# May be repeated: each feature is accumulated as "<name> off".
		ethtool_args="$ethtool_args $OPTARG off"
		ethtool_random_on=false
		;;
	l) tc_loss="$OPTARG" ;;
	r) tc_reorder="$OPTARG" ;;
	4) ipv6=false ;;
	c) capture=true ;;
	m) testmode="$OPTARG" ;;
	f) filesize="$OPTARG" ;;
	t)
		# Counted: the number of -t selects how many TCP combinations run.
		do_tcp=$((do_tcp+1))
		;;
	C) checksum=true ;;
	\?)
		# Unknown option or missing argument, as reported by getopts.
		usage $0
		exit ${KSFT_FAIL}
		;;
	esac
done
128
# Placeholders for the namespace names handed to mptcp_lib_ns_init later on.
ns1="" ns2="" ns3="" ns4=""

# Prefix used by do_transfer() when recording the result of a transfer.
TEST_GROUP=""
135
# EXIT trap handler: drop the temporary files, then the test namespaces.
#shellcheck disable=SC2317,SC2329
cleanup()
{
	local tmpfile

	for tmpfile in "$cin_disconnect" "$cin" "$cout" "$sin" "$sout" "$capout"; do
		rm -f "$tmpfile"
	done

	mptcp_lib_ns_exit "${ns1}" "${ns2}" "${ns3}" "${ns4}"
}
147
148mptcp_lib_check_mptcp
149mptcp_lib_check_kallsyms
150mptcp_lib_check_tools ip tc
151
152sin=$(mktemp)
153sout=$(mktemp)
154cin=$(mktemp)
155cout=$(mktemp)
156capout=$(mktemp)
157cin_disconnect="$cin".disconnect
158trap cleanup EXIT
159
160mptcp_lib_ns_init ns1 ns2 ns3 ns4
161
162#  "$ns1"              ns2                    ns3                     ns4
163# ns1eth2    ns2eth1   ns2eth3      ns3eth2   ns3eth4       ns4eth3
164#                           - drop 1% ->            reorder 25%
165#                           <- TSO off -
166
167ip link add ns1eth2 netns "$ns1" type veth peer name ns2eth1 netns "$ns2"
168ip link add ns2eth3 netns "$ns2" type veth peer name ns3eth2 netns "$ns3"
169ip link add ns3eth4 netns "$ns3" type veth peer name ns4eth3 netns "$ns4"
170
171ip -net "$ns1" addr add 10.0.1.1/24 dev ns1eth2
172ip -net "$ns1" addr add dead:beef:1::1/64 dev ns1eth2 nodad
173
174ip -net "$ns1" link set ns1eth2 up
175ip -net "$ns1" route add default via 10.0.1.2
176ip -net "$ns1" route add default via dead:beef:1::2
177
178ip -net "$ns2" addr add 10.0.1.2/24 dev ns2eth1
179ip -net "$ns2" addr add dead:beef:1::2/64 dev ns2eth1 nodad
180ip -net "$ns2" link set ns2eth1 up
181
182ip -net "$ns2" addr add 10.0.2.1/24 dev ns2eth3
183ip -net "$ns2" addr add dead:beef:2::1/64 dev ns2eth3 nodad
184ip -net "$ns2" link set ns2eth3 up
185ip -net "$ns2" route add default via 10.0.2.2
186ip -net "$ns2" route add default via dead:beef:2::2
187ip netns exec "$ns2" sysctl -q net.ipv4.ip_forward=1
188ip netns exec "$ns2" sysctl -q net.ipv6.conf.all.forwarding=1
189
190ip -net "$ns3" addr add 10.0.2.2/24 dev ns3eth2
191ip -net "$ns3" addr add dead:beef:2::2/64 dev ns3eth2 nodad
192ip -net "$ns3" link set ns3eth2 up
193
194ip -net "$ns3" addr add 10.0.3.2/24 dev ns3eth4
195ip -net "$ns3" addr add dead:beef:3::2/64 dev ns3eth4 nodad
196ip -net "$ns3" link set ns3eth4 up
197ip -net "$ns3" route add default via 10.0.2.1
198ip -net "$ns3" route add default via dead:beef:2::1
199ip netns exec "$ns3" sysctl -q net.ipv4.ip_forward=1
200ip netns exec "$ns3" sysctl -q net.ipv6.conf.all.forwarding=1
201
202ip -net "$ns4" addr add 10.0.3.1/24 dev ns4eth3
203ip -net "$ns4" addr add dead:beef:3::1/64 dev ns4eth3 nodad
204ip -net "$ns4" link set ns4eth3 up
205ip -net "$ns4" route add default via 10.0.3.2
206ip -net "$ns4" route add default via dead:beef:3::2
207
# -C: turn on the MPTCP data checksum in all the namespaces.
if $checksum; then
	for i in "$ns1" "$ns2" "$ns3" "$ns4";do
		ip netns exec $i sysctl -q net.mptcp.checksum_enabled=1
	done
fi

# -c: the capture files are prefixed with the name of ns1 minus its first
# four characters (presumably the random suffix picked by mptcp_lib_ns_init).
if $capture; then
	rndh="${ns1:4}"
	mptcp_lib_pr_info "Packet capture files will have this prefix: ${rndh}-"
fi
218
# Apply "ethtool -K" settings to a device of a namespace.
#   $1: namespace, $2: device, $3: settings, e.g. "tso off gso off"
# Failures are ignored silently; a message is only printed on success.
set_ethtool_flags() {
	local netns="$1"
	local iface="$2"
	local features="$3"

	# Not an error if ethtool is missing or the feature cannot be changed.
	ip netns exec $netns ethtool -K $iface $features 2>/dev/null || return 0

	mptcp_lib_pr_info "set $netns dev $iface: ethtool -K $features"
}
228
# Disable a random subset of tso/gso/gro on a device.
#   $1: namespace, $2: device
# The three low bits of one random draw select the features to turn off;
# nothing is done when none of them is set.
set_random_ethtool_flags() {
	local rnd=$RANDOM
	local features=""

	if (( rnd & 1 )); then
		features="tso off"
	fi
	if (( rnd & 2 )); then
		features="${features} gso off"
	fi
	if (( rnd & 4 )); then
		features="${features} gro off"
	fi

	if [ -n "${features}" ]; then
		set_ethtool_flags "$1" "$2" "${features}"
	fi
}
245
# Offload settings of the ns3 <-> ns4 facing devices: the features given
# with -e when there are some, a random selection otherwise.
if ! $ethtool_random_on; then
	set_ethtool_flags "$ns3" ns3eth2 "$ethtool_args"
	set_ethtool_flags "$ns4" ns4eth3 "$ethtool_args"
else
	set_random_ethtool_flags "$ns3" ns3eth2
	set_random_ethtool_flags "$ns4" ns4eth3
fi
253
# Print a test title with a wider title column, for the tests not displaying
# a duration. All arguments are handed over to mptcp_lib_print_title.
print_larger_title() {
	local -r wide_format="%02u %-69s"

	# The format is only overridden for the duration of this call.
	MPTCP_LIB_TEST_FORMAT="${wide_format}" mptcp_lib_print_title "$@"
}
259
# Check that net.mptcp.enabled=0 prevents the creation of MPTCP sockets.
#
# A dedicated namespace is used, and removed on every exit path: cleanup()
# only knows about ns1..ns4.
# Globals:  cin (read), ret (set to KSFT_FAIL on failure)
# Returns:  0 on success, 1 on failure
check_mptcp_disabled()
{
	local disabled_ns
	mptcp_lib_ns_init disabled_ns

	print_larger_title "New MPTCP socket can be blocked via sysctl"

	# mainly to cover more code
	if ! ip netns exec ${disabled_ns} sysctl net.mptcp >/dev/null; then
		mptcp_lib_ns_exit "${disabled_ns}"
		mptcp_lib_pr_fail "not able to list net.mptcp sysctl knobs"
		mptcp_lib_result_fail "not able to list net.mptcp sysctl knobs"
		ret=${KSFT_FAIL}
		return 1
	fi

	# net.mptcp.enabled should be enabled by default
	if [ "$(ip netns exec ${disabled_ns} sysctl net.mptcp.enabled | awk '{ print $3 }')" -ne 1 ]; then
		mptcp_lib_ns_exit "${disabled_ns}"
		mptcp_lib_pr_fail "net.mptcp.enabled sysctl is not 1 by default"
		mptcp_lib_result_fail "net.mptcp.enabled sysctl is not 1 by default"
		ret=${KSFT_FAIL}
		return 1
	fi
	ip netns exec ${disabled_ns} sysctl -q net.mptcp.enabled=0

	# The socket creation is expected to fail: err is set to 1 when the
	# expected error message is found. LC_ALL=C avoids a translated message.
	local err=0
	LC_ALL=C ip netns exec ${disabled_ns} ./mptcp_connect -p 10000 -s MPTCP 127.0.0.1 < "$cin" 2>&1 | \
		grep -q "^socket: Protocol not available$" && err=1
	mptcp_lib_ns_exit "${disabled_ns}"

	if [ ${err} -eq 0 ]; then
		mptcp_lib_pr_fail "New MPTCP socket cannot be blocked via sysctl"
		mptcp_lib_result_fail "New MPTCP socket cannot be blocked via sysctl"
		ret=${KSFT_FAIL}
		return 1
	fi

	mptcp_lib_pr_ok
	mptcp_lib_result_pass "New MPTCP socket can be blocked via sysctl"
	return 0
}
300
# Send one ping from a namespace to an address owned by another one.
#   $1: namespace owning the address (only used in the error message)
#   $2: namespace sending the ping
#   $3: address to ping; IPv6 addresses are skipped when IPv6 is disabled
# Globals:  ipv6 (read), ret (set to KSFT_FAIL on failure)
# Returns:  0 on success or when skipped, 1 when the ping failed
do_ping()
{
	local listener_ns="$1"
	local connector_ns="$2"
	local connect_addr="$3"
	local ping_args="-q -c 1"
	local rc=0

	if mptcp_lib_is_v6 "${connect_addr}"; then
		$ipv6 || return 0
		ping_args="${ping_args} -6"
	fi

	ip netns exec ${connector_ns} ping ${ping_args} $connect_addr >/dev/null || rc=1

	if [ $rc -ne 0 ] ; then
		# The ping is sent from the connector namespace: report that one as
		# the source, not the namespace owning the address.
		mptcp_lib_pr_fail "$connector_ns -> $listener_ns ($connect_addr) connectivity"
		ret=${KSFT_FAIL}

		return 1
	fi

	return 0
}
325
# Run one transfer between a listener and a connector, then validate the
# exit codes, the data received on both sides and the MIB counters.
#   $1: namespace of the listener (server)
#   $2: namespace of the connector (client)
#   $3: protocol used by the client (MPTCP or TCP)
#   $4: protocol used by the server (MPTCP or TCP)
#   $5: address the client connects to
#   $6: address the server listens on
#   $7: extra arguments for both mptcp_connect instances
# Globals read: rcvbuf, sndbuf, testmode, capture, rndh, checksum, sin, cin,
#               timeout_test, timeout_poll, connect_per_transfer, TEST_GROUP
# Globals written: port (incremented), options_log, content of sout, cout
#               and capout
# Returns: 0 when the transfer and all the checks passed, non-zero otherwise
do_transfer()
{
	local listener_ns="$1"
	local connector_ns="$2"
	local cl_proto="$3"
	local srv_proto="$4"
	local connect_addr="$5"
	local local_addr="$6"
	local extra_args="$7"

	# a new port for each transfer
	port=$((port + 1))

	if [ "$rcvbuf" -gt 0 ]; then
		extra_args+=" -R $rcvbuf"
	fi

	if [ "$sndbuf" -gt 0 ]; then
		extra_args+=" -S $sndbuf"
	fi

	if [ -n "$testmode" ]; then
		extra_args+=" -m $testmode"
	fi

	# the extra options are only displayed with the very first transfer
	if [ -n "$extra_args" ] && $options_log; then
		mptcp_lib_pr_info "extra options: $extra_args"
	fi
	options_log=false

	# start from empty output files
	:> "$cout"
	:> "$sout"
	:> "$capout"

	local addr_port
	addr_port=$(printf "%s:%d" ${connect_addr} ${port})
	local pretty_title
	pretty_title="$(printf "%.3s %-5s -> %.3s (%-20s) %-5s" ${connector_ns} ${cl_proto} ${listener_ns} ${addr_port} ${srv_proto})"
	mptcp_lib_print_title "${pretty_title}"

	# same info without the padding, for the recorded results
	local tap_title="${connector_ns:0:3} ${cl_proto} -> ${listener_ns:0:3} (${addr_port}) ${srv_proto}"

	if $capture; then
		local capuser
		if [ -z $SUDO_USER ] ; then
			capuser=""
		else
			capuser="-Z $SUDO_USER"
		fi

		local capfile="${rndh}-${connector_ns:0:3}-${listener_ns:0:3}-${cl_proto}-${srv_proto}-${connect_addr}-${port}"
		local capopt="-i any -s 65535 -B 32768 ${capuser}"

		ip netns exec ${listener_ns}  tcpdump ${capopt} -w "${capfile}-listener.pcap"  >> "${capout}" 2>&1 &
		local cappid_listener=$!

		ip netns exec ${connector_ns} tcpdump ${capopt} -w "${capfile}-connector.pcap" >> "${capout}" 2>&1 &
		local cappid_connector=$!

		# give tcpdump some time to start
		sleep 1
	fi

	# reset the nstat history of each namespace
	NSTAT_HISTORY=/tmp/${listener_ns}.nstat ip netns exec ${listener_ns} \
		nstat -n
	if [ ${listener_ns} != ${connector_ns} ]; then
		NSTAT_HISTORY=/tmp/${connector_ns}.nstat ip netns exec ${connector_ns} \
			nstat -n
	fi

	# counters before the transfer
	local stat_synrx_last_l
	local stat_ackrx_last_l
	local stat_cookietx_last
	local stat_cookierx_last
	local stat_csum_err_s
	local stat_csum_err_c
	local stat_tcpfb_last_l
	stat_synrx_last_l=$(mptcp_lib_get_counter "${listener_ns}" "MPTcpExtMPCapableSYNRX")
	stat_ackrx_last_l=$(mptcp_lib_get_counter "${listener_ns}" "MPTcpExtMPCapableACKRX")
	stat_cookietx_last=$(mptcp_lib_get_counter "${listener_ns}" "TcpExtSyncookiesSent")
	stat_cookierx_last=$(mptcp_lib_get_counter "${listener_ns}" "TcpExtSyncookiesRecv")
	stat_csum_err_s=$(mptcp_lib_get_counter "${listener_ns}" "MPTcpExtDataCsumErr")
	stat_csum_err_c=$(mptcp_lib_get_counter "${connector_ns}" "MPTcpExtDataCsumErr")
	stat_tcpfb_last_l=$(mptcp_lib_get_counter "${listener_ns}" "MPTcpExtMPCapableFallbackACK")

	# server: sends "$sin", stores what it receives in "$sout"
	timeout ${timeout_test} \
		ip netns exec ${listener_ns} \
			./mptcp_connect -t ${timeout_poll} -l -p $port -s ${srv_proto} \
				$extra_args $local_addr < "$sin" > "$sout" &
	local spid=$!

	mptcp_lib_wait_local_port_listen "${listener_ns}" "${port}"

	# client: sends "$cin", stores what it receives in "$cout"
	local start
	start=$(date +%s%3N)
	timeout ${timeout_test} \
		ip netns exec ${connector_ns} \
			./mptcp_connect -t ${timeout_poll} -p $port -s ${cl_proto} \
				$extra_args $connect_addr < "$cin" > "$cout" &
	local cpid=$!

	wait $cpid
	local retc=$?
	wait $spid
	local rets=$?

	local stop
	stop=$(date +%s%3N)

	if $capture; then
		sleep 1
		kill ${cappid_listener}
		kill ${cappid_connector}
	fi

	# TCP and MPTCP counters modified during the transfer, for the error report
	NSTAT_HISTORY=/tmp/${listener_ns}.nstat ip netns exec ${listener_ns} \
		nstat | grep Tcp > /tmp/${listener_ns}.out
	if [ ${listener_ns} != ${connector_ns} ]; then
		NSTAT_HISTORY=/tmp/${connector_ns}.nstat ip netns exec ${connector_ns} \
			nstat | grep Tcp > /tmp/${connector_ns}.out
	fi

	local duration
	duration=$((stop-start))
	printf "(duration %05sms) " "${duration}"
	if [ ${rets} -ne 0 ] || [ ${retc} -ne 0 ]; then
		mptcp_lib_pr_fail "client exit code $retc, server $rets"
		mptcp_lib_pr_err_stats "${listener_ns}" "${connector_ns}" "${port}" \
			"/tmp/${listener_ns}.out" "/tmp/${connector_ns}.out"

		echo
		cat "$capout"
		mptcp_lib_result_fail "${TEST_GROUP}: ${tap_title}"
		return 1
	fi

	# from here, retc/rets hold the result of the checks of each side
	mptcp_lib_check_transfer $sin $cout "file received by client"
	retc=$?
	mptcp_lib_check_transfer $cin $sout "file received by server"
	rets=$?

	# counters after the transfer
	local extra=""
	local stat_synrx_now_l
	local stat_ackrx_now_l
	local stat_cookietx_now
	local stat_cookierx_now
	local stat_ooo_now
	local stat_tcpfb_now_l
	stat_synrx_now_l=$(mptcp_lib_get_counter "${listener_ns}" "MPTcpExtMPCapableSYNRX")
	stat_ackrx_now_l=$(mptcp_lib_get_counter "${listener_ns}" "MPTcpExtMPCapableACKRX")
	stat_cookietx_now=$(mptcp_lib_get_counter "${listener_ns}" "TcpExtSyncookiesSent")
	stat_cookierx_now=$(mptcp_lib_get_counter "${listener_ns}" "TcpExtSyncookiesRecv")
	stat_ooo_now=$(mptcp_lib_get_counter "${listener_ns}" "TcpExtTCPOFOQueue")
	stat_tcpfb_now_l=$(mptcp_lib_get_counter "${listener_ns}" "MPTcpExtMPCapableFallbackACK")

	# MPC SYN and ACK are only expected when both sides use MPTCP
	local expect_synrx=$((stat_synrx_last_l))
	local expect_ackrx=$((stat_ackrx_last_l))

	local cookies
	cookies=$(ip netns exec ${listener_ns} sysctl net.ipv4.tcp_syncookies)
	cookies=${cookies##*=}

	if [ ${cl_proto} = "MPTCP" ] && [ ${srv_proto} = "MPTCP" ]; then
		expect_synrx=$((stat_synrx_last_l+connect_per_transfer))
		expect_ackrx=$((stat_ackrx_last_l+connect_per_transfer))
	fi

	if [ ${stat_synrx_now_l} -lt ${expect_synrx} ]; then
		mptcp_lib_pr_fail "lower MPC SYN rx (${stat_synrx_now_l})" \
				  "than expected (${expect_synrx})"
		retc=1
	fi
	# Missing MPC ACKs are only an error without out-of-order packets:
	# with some, the fallback is tolerated and only noted.
	if [ ${stat_ackrx_now_l} -lt ${expect_ackrx} ]; then
		if [ ${stat_ooo_now} -eq 0 ]; then
			mptcp_lib_pr_fail "lower MPC ACK rx (${stat_ackrx_now_l})" \
					  "than expected (${expect_ackrx})"
			rets=1
		else
			extra+=" [ Note ] fallback due to TCP OoO"
		fi
	fi

	if $checksum; then
		local csum_err_s
		local csum_err_c
		csum_err_s=$(mptcp_lib_get_counter "${listener_ns}" "MPTcpExtDataCsumErr")
		csum_err_c=$(mptcp_lib_get_counter "${connector_ns}" "MPTcpExtDataCsumErr")

		local csum_err_s_nr=$((csum_err_s - stat_csum_err_s))
		if [ $csum_err_s_nr -gt 0 ]; then
			mptcp_lib_pr_fail "server got ${csum_err_s_nr} data checksum error[s]"
			rets=1
		fi

		local csum_err_c_nr=$((csum_err_c - stat_csum_err_c))
		if [ $csum_err_c_nr -gt 0 ]; then
			mptcp_lib_pr_fail "client got ${csum_err_c_nr} data checksum error[s]"
			retc=1
		fi
	fi

	if [ ${stat_ooo_now} -eq 0 ] && [ ${stat_tcpfb_last_l} -ne ${stat_tcpfb_now_l} ]; then
		mptcp_lib_pr_fail "unexpected fallback to TCP"
		rets=1
	fi

	# syncookies: forced when the sysctl is set to 2, not expected otherwise;
	# unexpected values only produce warnings
	if [ $cookies -eq 2 ];then
		if [ $stat_cookietx_last -ge $stat_cookietx_now ] ;then
			extra+=" WARN: CookieSent: did not advance"
		fi
		if [ $stat_cookierx_last -ge $stat_cookierx_now ] ;then
			extra+=" WARN: CookieRecv: did not advance"
		fi
	else
		if [ $stat_cookietx_last -ne $stat_cookietx_now ] ;then
			extra+=" WARN: CookieSent: changed"
		fi
		if [ $stat_cookierx_last -ne $stat_cookierx_now ] ;then
			extra+=" WARN: CookieRecv: changed"
		fi
	fi

	if [ ${stat_synrx_now_l} -gt ${expect_synrx} ]; then
		extra+=" WARN: SYNRX: expect ${expect_synrx},"
		extra+=" got ${stat_synrx_now_l} (probably retransmissions)"
	fi
	if [ ${stat_ackrx_now_l} -gt ${expect_ackrx} ]; then
		extra+=" WARN: ACKRX: expect ${expect_ackrx},"
		extra+=" got ${stat_ackrx_now_l} (probably retransmissions)"
	fi

	# "${extra:1}" drops the leading space of the accumulated notes
	if [ $retc -eq 0 ] && [ $rets -eq 0 ]; then
		mptcp_lib_pr_ok "${extra:1}"
		mptcp_lib_result_pass "${TEST_GROUP}: ${tap_title}"
	else
		if [ -n "${extra}" ]; then
			mptcp_lib_print_warn "${extra:1}"
		fi
		mptcp_lib_result_fail "${TEST_GROUP}: ${tap_title}"
	fi

	cat "$capout"
	[ $retc -eq 0 ] && [ $rets -eq 0 ]
}
567
# Create a file filled with random data.
#   $1: path of the file
#   $2: who will send it, only used in the message
# The size is $filesize when set (-f), otherwise a random value between
# MINSIZE (included) and MAXSIZE (excluded).
make_file()
{
	local name=$1
	local who=$2
	local SIZE=$filesize
	local ksize
	local rem

	if [ $SIZE -eq 0 ]; then
		local MAXSIZE=$((1024 * 1024 * 8))
		local MINSIZE=$((1024 * 256))

		# The modulo is applied before adding MINSIZE: the result cannot
		# wrap below the minimum, nor be 0.
		SIZE=$((MINSIZE + (RANDOM * RANDOM) % (MAXSIZE - MINSIZE)))
	fi

	# whole KB written by the helper, the remaining bytes appended with dd
	ksize=$((SIZE / 1024))
	rem=$((SIZE - (ksize * 1024)))

	mptcp_lib_make_file $name 1024 $ksize
	dd if=/dev/urandom conv=notrunc of="$name" oflag=append bs=1 count=$rem 2> /dev/null

	echo "Created $name (size $(stat -c "%s" "$name") B) containing data sent by $who"
}
591
# Run the transfers between two namespaces for one address.
#   $1: listener namespace, $2: connector namespace, $3: address to connect to
#   $4: 1 to allow both ends in the same namespace, 0 to skip that case
#   $5: extra arguments for do_transfer (optional)
# MPTCP <-> MPTCP is always tested. The TCP fallback combinations are added
# with -t or when both ends share the namespace; plain TCP needs -t twice.
# Stops at the first failing transfer: its status is stored in 'ret' and 1 is
# returned.
run_tests_lo()
{
	local listener_ns="$1"
	local connector_ns="$2"
	local connect_addr="$3"
	local loopback="$4"
	local extra_args="$5"
	local local_addr="0.0.0.0"
	local protos="MPTCP:MPTCP"
	local pair
	local lret

	# skip if test programs are running inside same netns for subsequent runs.
	if [ $loopback -eq 0 ] && [ ${listener_ns} = ${connector_ns} ]; then
		return 0
	fi

	if mptcp_lib_is_v6 "${connect_addr}"; then
		# skip if we don't want v6
		$ipv6 || return 0
		local_addr="::"
	fi

	# don't bother testing fallback tcp except for loopback case.
	if [ $do_tcp -ne 0 ] || [ ${listener_ns} = ${connector_ns} ]; then
		protos+=" MPTCP:TCP TCP:MPTCP"
		if [ $do_tcp -gt 1 ]; then
			protos+=" TCP:TCP"
		fi
	fi

	# each item is "<client proto>:<server proto>"
	for pair in ${protos}; do
		do_transfer ${listener_ns} ${connector_ns} ${pair%%:*} ${pair##*:} \
			    ${connect_addr} ${local_addr} "${extra_args}"
		lret=$?
		if [ $lret -ne 0 ]; then
			ret=$lret
			return 1
		fi
	done

	return 0
}
661
# Same as run_tests_lo, without the loopback case and without extra options.
#   $1: listener namespace, $2: connector namespace, $3: address to connect to
run_tests()
{
	local listener=$1
	local connector=$2
	local address=$3

	run_tests_lo ${listener} ${connector} ${address} 0
}
666
# Transparent proxy test: ns1 connects to an address that is not owned by
# ns2, where nft tproxy rules divert the connection to a local listener.
#   $1: address to connect to
#   $2: name of the test, also used as TEST_GROUP
# The test is skipped when the kernel, nft or the routing setup do not allow
# it. Returns 1 -- and sets 'ret' -- when the transfer failed.
run_test_transparent()
{
	local connect_addr="$1"
	local msg="$2"

	local connector_ns="$ns1"
	local listener_ns="$ns2"
	local lret=0
	local r6flag=""
	local local_addr="0.0.0.0"

	TEST_GROUP="${msg}"

	if mptcp_lib_is_v6 "${connect_addr}"; then
		# skip if we don't want v6
		$ipv6 || return 0
		local_addr="::"
		r6flag="-6"
	fi

	# IP(V6)_TRANSPARENT has been added after TOS support which came with
	# the required infrastructure in MPTCP sockopt code. To support TOS, the
	# following function has been exported (T). Not great but better than
	# checking for a specific kernel version.
	if ! mptcp_lib_kallsyms_has "T __ip_sock_set_tos$"; then
		mptcp_lib_pr_skip "${msg} not supported by the kernel"
		mptcp_lib_result_skip "${TEST_GROUP}"
		return
	fi

	# Packets for port 20000 are marked and diverted to the local listener.
	if ! ip netns exec "$listener_ns" nft -f /dev/stdin <<"EOF"
flush ruleset
table inet mangle {
	chain divert {
		type filter hook prerouting priority -150;

		meta l4proto tcp socket transparent 1 meta mark set 1 accept
		tcp dport 20000 tproxy to :20000 meta mark set 1 accept
	}
}
EOF
	then
		mptcp_lib_pr_skip "$msg, could not load nft ruleset"
		mptcp_lib_fail_if_expected_feature "nft rules"
		mptcp_lib_result_skip "${TEST_GROUP}"
		return
	fi

	# Marked packets use table 100 ...
	ip -net "$listener_ns" $r6flag rule add fwmark 1 lookup 100 || {
		ip netns exec "$listener_ns" nft flush ruleset
		mptcp_lib_pr_skip "$msg, ip $r6flag rule failed"
		mptcp_lib_fail_if_expected_feature "ip rule"
		mptcp_lib_result_skip "${TEST_GROUP}"
		return
	}

	# ... where any destination is delivered locally.
	ip -net "$listener_ns" route add local $local_addr/0 dev lo table 100 || {
		ip netns exec "$listener_ns" nft flush ruleset
		ip -net "$listener_ns" $r6flag rule del fwmark 1 lookup 100
		mptcp_lib_pr_skip "$msg, ip route add local $local_addr failed"
		mptcp_lib_fail_if_expected_feature "ip route"
		mptcp_lib_result_skip "${TEST_GROUP}"
		return
	}

	mptcp_lib_pr_info "test $msg"

	# do_transfer increments the port first: 20000 is used, as in the ruleset
	port=$((20000 - 1))
	local extra_args="-o TRANSPARENT"
	do_transfer ${listener_ns} ${connector_ns} MPTCP MPTCP \
		    ${connect_addr} ${local_addr} "${extra_args}"
	lret=$?

	# undo the setup, whatever the result
	ip netns exec "$listener_ns" nft flush ruleset
	ip -net "$listener_ns" $r6flag rule del fwmark 1 lookup 100
	ip -net "$listener_ns" route del local $local_addr/0 dev lo table 100

	if [ $lret -eq 0 ]; then
		mptcp_lib_pr_info "$msg pass"
		return 0
	fi

	mptcp_lib_pr_fail "$msg, mptcp connection error"
	ret=$lret
	return 1
}
758
# Loopback transfers in ns1, IPv4 then IPv6, using the given peek mode.
#   $1: peek mode, given to mptcp_connect with -P
run_tests_peekmode()
{
	local peekmode="$1"
	local peek_addr

	TEST_GROUP="peek mode: ${peekmode}"
	mptcp_lib_pr_info "with peek mode: ${peekmode}"

	for peek_addr in 10.0.1.1 dead:beef:1::1; do
		run_tests_lo "$ns1" "$ns1" "${peek_addr}" 1 "-P ${peekmode}"
	done
}
768
# Transfers from ns2 to ns1 using TCP Fast Open over MPTCP, when the kernel
# supports it. net.ipv4.tcp_fastopen is switched on for the duration of the
# test (2 on the listener side, 1 on the connector side), then reset to 0.
run_tests_mptfo()
{
	local tfo_addr

	TEST_GROUP="MPTFO"

	if ! mptcp_lib_kallsyms_has "mptcp_fastopen_"; then
		mptcp_lib_pr_skip "TFO not supported by the kernel"
		mptcp_lib_result_skip "${TEST_GROUP}"
		return
	fi

	mptcp_lib_pr_info "with MPTFO start"
	ip netns exec "$ns1" sysctl -q net.ipv4.tcp_fastopen=2
	ip netns exec "$ns2" sysctl -q net.ipv4.tcp_fastopen=1

	for tfo_addr in 10.0.1.1 dead:beef:1::1; do
		# Each address is tested twice in a row -- presumably the first
		# connection is needed to get a TFO cookie, TODO confirm.
		run_tests_lo "$ns1" "$ns2" "${tfo_addr}" 0 "-o MPTFO"
		run_tests_lo "$ns1" "$ns2" "${tfo_addr}" 0 "-o MPTFO"
	done

	ip netns exec "$ns1" sysctl -q net.ipv4.tcp_fastopen=0
	ip netns exec "$ns2" sysctl -q net.ipv4.tcp_fastopen=0
	mptcp_lib_pr_info "with MPTFO end"
}
793
# Loopback transfers in ns1 with three connections per transfer (-I 3), when
# the kernel supports the full disconnection.
# Both sides send a file made of three copies of the client input, while the
# original client input is handed to mptcp_connect with -i. The globals
# modified for that are restored before returning.
run_tests_disconnect()
{
	local saved_cin=$cin
	local saved_sin=$sin
	local tripled="$cin".disconnect

	TEST_GROUP="full disconnect"

	if ! mptcp_lib_kallsyms_has "mptcp_pm_data_reset$"; then
		mptcp_lib_pr_skip "Full disconnect not supported"
		mptcp_lib_result_skip "${TEST_GROUP}"
		return
	fi

	cat $cin $cin $cin > "${tripled}"

	# force do_transfer to cope with the multiple transmissions
	sin="${tripled}"
	cin="${tripled}"
	cin_disconnect="$saved_cin"
	connect_per_transfer=3

	mptcp_lib_pr_info "disconnect"
	run_tests_lo "$ns1" "$ns1" 10.0.1.1 1 "-I 3 -i $saved_cin"
	run_tests_lo "$ns1" "$ns1" dead:beef:1::1 1 "-I 3 -i $saved_cin"

	# restore previous status
	sin=$saved_sin
	cin=$saved_cin
	cin_disconnect="$cin".disconnect
	connect_per_transfer=1
}
825
# Print the number of seconds elapsed since the script was started.
# Globals:  time_start (read), time_end and time_run (written)
display_time()
{
	time_end=$(date +%s)
	time_run=$((time_end - time_start))

	printf 'Time: %s seconds\n' "${time_run}"
}
833
# Report a failure of the last group of tests, if any.
#   $1: message to display
# When 'ret' is not 0, it is saved in 'final_ret' and reset, so the next
# group starts from a clean state.
# Returns:  0 when there was no error, the saved status otherwise
log_if_error()
{
	local msg="$1"

	if ! [ ${ret} -ne 0 ]; then
		return 0
	fi

	mptcp_lib_pr_fail "${msg}"

	final_ret=${ret}
	ret=${KSFT_PASS}

	return ${final_ret}
}
847
# Same as log_if_error, but an error is fatal: the elapsed time and the
# results are printed, then the script exits with the error code.
stop_if_error()
{
	log_if_error "${@}" && return 0

	display_time
	mptcp_lib_result_print_all_tap
	exit ${final_ret}
}
856
# Random payloads: "$cin" is sent by the clients, "$sin" by the servers.
make_file "$cin" "client"
make_file "$sin" "server"

mptcp_lib_subtests_last_ts_reset

# No need to continue if MPTCP sockets cannot be controlled via sysctl.
check_mptcp_disabled

stop_if_error "The kernel configuration is not valid for MPTCP"

# Every address of the topology has to be reachable from each namespace,
# before adding any netem impairment. The first argument of do_ping is the
# namespace owning the address, the second one sends the ping.
print_larger_title "Validating network environment with pings"
for sender in "$ns1" "$ns2" "$ns3" "$ns4";do
	do_ping "$ns1" $sender 10.0.1.1
	do_ping "$ns1" $sender dead:beef:1::1

	do_ping "$ns2" $sender 10.0.1.2
	do_ping "$ns2" $sender dead:beef:1::2
	do_ping "$ns2" $sender 10.0.2.1
	do_ping "$ns2" $sender dead:beef:2::1

	do_ping "$ns3" $sender 10.0.2.2
	do_ping "$ns3" $sender dead:beef:2::2
	do_ping "$ns3" $sender 10.0.3.2
	do_ping "$ns3" $sender dead:beef:3::2

	do_ping "$ns4" $sender 10.0.3.1
	do_ping "$ns4" $sender dead:beef:3::1
done

# One result for all the pings: do_ping sets 'ret' when one of them fails.
mptcp_lib_result_code "${ret}" "ping tests"

stop_if_error "Could not even run ping tests"
mptcp_lib_pr_ok
889
# Impair ns2eth3 with random loss plus delay. Nothing is installed on this
# device -- not even the delay -- when there is no loss to apply.
# NOTE(review): tc_info still mentions the loss and the delay in that case.
[ -n "$tc_loss" ] && tc -net "$ns2" qdisc add dev ns2eth3 root netem loss random $tc_loss delay ${tc_delay}ms
tc_info="loss of $tc_loss "
test "$tc_delay" -gt 0 && tc_info+="delay $tc_delay ms "

reorder_delay=$((tc_delay / 4))

# Turn the reordering request into netem arguments.
# Globals:  reorder_delay (read), tc_reorder (read: value of -r if any,
#           written: netem arguments or empty), tc_info (appended)
# Without -r, random percentages are picked. Reordering is only enabled with
# a non-zero delay: netem needs one, and a bare "-r" value without the
# "reorder" keyword must never reach tc.
set_tc_reorder()
{
	local reorder1
	local reorder2

	if [ -z "${tc_reorder}" ]; then
		reorder1=$((RANDOM%10))
		reorder1=$((100 - reorder1))
		reorder2=$((RANDOM%100))

		if [ $reorder_delay -gt 0 ] && [ $reorder1 -lt 100 ] && [ $reorder2 -gt 0 ]; then
			tc_reorder="reorder ${reorder1}% ${reorder2}%"
			tc_info+="$tc_reorder with delay ${reorder_delay}ms "
		fi
	elif [ "$tc_reorder" = "0" ];then
		tc_reorder=""
	elif [ "$reorder_delay" -gt 0 ];then
		# reordering requires some delay
		tc_reorder="reorder $tc_reorder"
		tc_info+="$tc_reorder with delay ${reorder_delay}ms "
	else
		# reorder_delay is a quarter of the delay: 0 below 4ms
		mptcp_lib_pr_info "Ignoring reorder '$tc_reorder': it requires a delay of at least 4ms"
		tc_reorder=""
	fi
}
set_tc_reorder

mptcp_lib_pr_info "Using ${tc_info}on ns3eth4"

tc -net "$ns3" qdisc add dev ns3eth4 root netem delay ${reorder_delay}ms $tc_reorder
916
# Loopback transfers in ns1: a failure here is fatal, the other tests are
# not worth being launched.
TEST_GROUP="loopback v4"
run_tests_lo "$ns1" "$ns1" 10.0.1.1 1
stop_if_error "Could not even run loopback test"

TEST_GROUP="loopback v6"
run_tests_lo "$ns1" "$ns1" dead:beef:1::1 1
stop_if_error "Could not even run loopback v6 test"

# Each namespace connects to every address of the topology. run_tests skips
# the cases where the listener and the sender are the same namespace.
TEST_GROUP="multihosts"
for sender in $ns1 $ns2 $ns3 $ns4;do
	# ns1<->ns2 is not subject to reordering/tc delays. Use it to test
	# mptcp syncookie support.
	if [ $sender = $ns1 ]; then
		ip netns exec "$ns2" sysctl -q net.ipv4.tcp_syncookies=2
	else
		ip netns exec "$ns2" sysctl -q net.ipv4.tcp_syncookies=1
	fi

	run_tests "$ns1" $sender 10.0.1.1
	run_tests "$ns1" $sender dead:beef:1::1

	run_tests "$ns2" $sender 10.0.1.2
	run_tests "$ns2" $sender dead:beef:1::2
	run_tests "$ns2" $sender 10.0.2.1
	run_tests "$ns2" $sender dead:beef:2::1

	run_tests "$ns3" $sender 10.0.2.2
	run_tests "$ns3" $sender dead:beef:2::2
	run_tests "$ns3" $sender 10.0.3.2
	run_tests "$ns3" $sender dead:beef:3::2

	run_tests "$ns4" $sender 10.0.3.1
	run_tests "$ns4" $sender dead:beef:3::1

	# not fatal: the error is recorded and the next sender is tested
	log_if_error "Tests with $sender as a sender have failed"
done

run_tests_peekmode "saveWithPeek"
run_tests_peekmode "saveAfterPeek"
log_if_error "Tests with peek mode have failed"

# MPTFO (MultiPath TCP Fastopen tests)
run_tests_mptfo
log_if_error "Tests with MPTFO have failed"

# connect to ns4 ip address, ns2 should intercept/proxy
run_test_transparent 10.0.3.1 "tproxy ipv4"
run_test_transparent dead:beef:3::1 "tproxy ipv6"
log_if_error "Tests with tproxy have failed"

run_tests_disconnect
log_if_error "Tests of the full disconnection have failed"

# final_ret holds the last error recorded by log_if_error, 0 if none
display_time
mptcp_lib_result_print_all_tap
exit ${final_ret}
973