2 # SPDX-License-Identifier: GPL-2.0
# Option letters accepted by the getopts loop; a letter followed by ':' takes
# an argument.
6 optstring="S:R:d:e:l:r:h4cm:f:t"
# Per-process timeout: twice the poll timeout plus one.
15 timeout_test=$((timeout_poll * 2 + 1))
# Switched to false in the option loop right after a feature is appended to
# ethtool_args; while true, ethtool features are disabled at random.
17 ethtool_random_on=true
# Default netem delay (later used with an "ms" suffix): random value 0..49.
18 tc_delay="$((RANDOM%50))"
# Default netem loss: random value 0..100.
19 tc_loss=$((RANDOM%101))
# Branch on the magnitude of the random loss value; the branch bodies are not
# part of this excerpt.
27 if [ $tc_loss -eq 100 ];then
29 elif [ $tc_loss -ge 10 ]; then
31 elif [ $tc_loss -ge 1 ]; then
# Option help text, one line per supported option.
# NOTE(review): the synopsis advertises "-a", which is not among the letters
# in optstring - confirm the intended synopsis.
38 echo "Usage: $0 [ -a ]"
39 echo -e "\t-d: tc/netem delay in milliseconds, e.g. \"-d 10\" (default random)"
40 echo -e "\t-l: tc/netem loss percentage, e.g. \"-l 0.02\" (default random)"
# The quotes around "-r 0" are escaped so that they stay inside the string and
# are printed as part of the help text instead of terminating it.
41 echo -e "\t-r: tc/netem reorder mode, e.g. \"-r 25% 50% gap 5\", use \"-r 0\" to disable reordering (default random)"
42 echo -e "\t-e: ethtool features to disable, e.g.: \"-e tso -e gso\" (default: randomly disable any of tso/gso/gro)"
43 echo -e "\t-4: IPv4 only: disable IPv6 tests (default: test both IPv4 and IPv6)"
44 echo -e "\t-c: capture packets for each test using tcpdump (default: no capture)"
45 echo -e "\t-f: size of file to transfer in bytes (default random)"
46 echo -e "\t-S: set sndbuf value (default: use kernel default)"
47 echo -e "\t-R: set rcvbuf value (default: use kernel default)"
48 echo -e "\t-m: test mode (poll, sendfile; default: poll)"
49 echo -e "\t-t: also run tests with TCP (use twice to non-fallback tcp)"
# Parse the command line according to $optstring. The case labels and the
# else/fi/done lines are not part of this excerpt.
52 while getopts "$optstring" option;do
# Numeric validation: the -ge test only succeeds for an integer >= 0; the
# message below is presumably printed on the failing branch.
59 if [ $OPTARG -ge 0 ];then
62 echo "-d requires numeric argument, got \"$OPTARG\"" 1>&2
# Each requested feature is appended as "<feature> off", and random feature
# selection is turned off.
67 ethtool_args="$ethtool_args $OPTARG off"
68 ethtool_random_on=false
# Same numeric validation for the send buffer size ...
83 if [ $OPTARG -ge 0 ];then
86 echo "-S requires numeric argument, got \"$OPTARG\"" 1>&2
# ... and for the receive buffer size.
91 if [ $OPTARG -ge 0 ];then
94 echo "-R requires numeric argument, got \"$OPTARG\"" 1>&2
# Random suffix: $sec printed in hex, a dash, and a random string generated by
# mktemp -u (no file is created).
115 rndh=$(printf %x $sec)-$(mktemp -u XXXXXX)
# Remove the per-namespace nstat history and output files kept in /tmp.
130 for netns in "$ns1" "$ns2" "$ns3" "$ns4";do
132 rm -f /tmp/$netns.{nstat,out}
# Probe for the ip tool; the SKIP message is presumably printed when the probe
# fails (the test of its exit status is not part of this excerpt).
136 ip -Version > /dev/null 2>&1
138 echo "SKIP: Could not run test without ip tool"
# Create the four namespaces (exit with $ksft_skip if that fails) and bring up
# the loopback device in each.
149 for i in "$ns1" "$ns2" "$ns3" "$ns4";do
150 ip netns add $i || exit $ksft_skip
151 ip -net $i link set lo up
155 # ns1eth2 ns2eth1 ns2eth3 ns3eth2 ns3eth4 ns4eth3
156 # - drop 1% -> reorder 25%
# Three veth pairs chain the namespaces: ns1 <-> ns2 <-> ns3 <-> ns4.
159 ip link add ns1eth2 netns "$ns1" type veth peer name ns2eth1 netns "$ns2"
160 ip link add ns2eth3 netns "$ns2" type veth peer name ns3eth2 netns "$ns3"
161 ip link add ns3eth4 netns "$ns3" type veth peer name ns4eth3 netns "$ns4"
# ns1: one interface, default routes (IPv4 and IPv6) via ns2.
163 ip -net "$ns1" addr add 10.0.1.1/24 dev ns1eth2
164 ip -net "$ns1" addr add dead:beef:1::1/64 dev ns1eth2 nodad
166 ip -net "$ns1" link set ns1eth2 up
167 ip -net "$ns1" route add default via 10.0.1.2
168 ip -net "$ns1" route add default via dead:beef:1::2
# ns2: interface facing ns1 ...
170 ip -net "$ns2" addr add 10.0.1.2/24 dev ns2eth1
171 ip -net "$ns2" addr add dead:beef:1::2/64 dev ns2eth1 nodad
172 ip -net "$ns2" link set ns2eth1 up
# ... and interface facing ns3; default routes via ns3, forwarding enabled for
# both address families.
174 ip -net "$ns2" addr add 10.0.2.1/24 dev ns2eth3
175 ip -net "$ns2" addr add dead:beef:2::1/64 dev ns2eth3 nodad
176 ip -net "$ns2" link set ns2eth3 up
177 ip -net "$ns2" route add default via 10.0.2.2
178 ip -net "$ns2" route add default via dead:beef:2::2
179 ip netns exec "$ns2" sysctl -q net.ipv4.ip_forward=1
180 ip netns exec "$ns2" sysctl -q net.ipv6.conf.all.forwarding=1
# ns3: interface facing ns2 ...
182 ip -net "$ns3" addr add 10.0.2.2/24 dev ns3eth2
183 ip -net "$ns3" addr add dead:beef:2::2/64 dev ns3eth2 nodad
184 ip -net "$ns3" link set ns3eth2 up
# ... and interface facing ns4; default routes via ns2, forwarding enabled for
# both address families.
186 ip -net "$ns3" addr add 10.0.3.2/24 dev ns3eth4
187 ip -net "$ns3" addr add dead:beef:3::2/64 dev ns3eth4 nodad
188 ip -net "$ns3" link set ns3eth4 up
189 ip -net "$ns3" route add default via 10.0.2.1
190 ip -net "$ns3" route add default via dead:beef:2::1
191 ip netns exec "$ns3" sysctl -q net.ipv4.ip_forward=1
192 ip netns exec "$ns3" sysctl -q net.ipv6.conf.all.forwarding=1
# ns4: one interface, default routes (IPv4 and IPv6) via ns3.
194 ip -net "$ns4" addr add 10.0.3.1/24 dev ns4eth3
195 ip -net "$ns4" addr add dead:beef:3::1/64 dev ns4eth3 nodad
196 ip -net "$ns4" link set ns4eth3 up
197 ip -net "$ns4" route add default via 10.0.3.2
198 ip -net "$ns4" route add default via dead:beef:3::2
# Run "ethtool -K" on a device inside a namespace and log the change when it
# succeeded. Callers pass namespace, device and flag string; the assignments
# of ns, dev and flags are not part of this excerpt.
200 set_ethtool_flags() {
# ethtool's own error output is discarded; only success is reported.
205 ip netns exec $ns ethtool -K $dev $flags 2>/dev/null
206 [ $? -eq 0 ] && echo "INFO: set $ns dev $dev: ethtool -K $flags"
# Disable a random subset of tso/gso/gro on the device given as $2 in the
# namespace given as $1. The value r is assigned on a line that is not part of
# this excerpt.
209 set_random_ethtool_flags() {
# The three lowest bits of r each select one feature.
213 local pick1=$((r & 1))
214 local pick2=$((r & 2))
215 local pick3=$((r & 4))
217 [ $pick1 -ne 0 ] && flags="tso off"
218 [ $pick2 -ne 0 ] && flags="$flags gso off"
219 [ $pick3 -ne 0 ] && flags="$flags gro off"
# Nothing selected: leave the device untouched.
221 [ -z "$flags" ] && return
223 set_ethtool_flags "$1" "$2" "$flags"
# Apply ethtool settings to ns3eth2 and ns4eth3: a random selection while
# ethtool_random_on is true; the calls using $ethtool_args are presumably the
# else branch (the else/fi lines are not part of this excerpt).
226 if $ethtool_random_on;then
227 set_random_ethtool_flags "$ns3" ns3eth2
228 set_random_ethtool_flags "$ns4" ns4eth3
230 set_ethtool_flags "$ns3" ns3eth2 "$ethtool_args"
231 set_ethtool_flags "$ns4" ns4eth3 "$ethtool_args"
# Fragment of the file-comparison helpers; the function headers are not part
# of this excerpt (presumably print_file_err followed by check_transfer).
237 echo "Trailing bytes are: "
# Byte-wise comparison of the sent and received file; cmp's own output is
# discarded and only its exit status is used.
247 cmp "$in" "$out" > /dev/null 2>&1
248 if [ $? -ne 0 ] ;then
249 echo "[ FAIL ] $what does not match (in, out):"
251 print_file_err "$out"
# Check, in a throw-away namespace, that net.mptcp.enabled is 1 by default and
# that setting it to 0 prevents the creation of MPTCP sockets.
259 check_mptcp_disabled()
# NOTE(review): $sech is not assigned anywhere in this excerpt; if it is unset
# it expands to nothing. Possibly $rndh was meant - confirm.
262 disabled_ns="ns_disabled-$sech-$(mktemp -u XXXXXX)"
263 ip netns add ${disabled_ns} || exit $ksft_skip
265 # net.mptcp.enabled should be enabled by default
266 if [ "$(ip netns exec ${disabled_ns} sysctl net.mptcp.enabled | awk '{ print $3 }')" -ne 1 ]; then
267 echo -e "net.mptcp.enabled sysctl is not 1 by default\t\t[ FAIL ]"
271 ip netns exec ${disabled_ns} sysctl -q net.mptcp.enabled=0
# err becomes 1 when mptcp_connect reports the expected socket() failure;
# LC_ALL=C keeps the error text in the form grep looks for.
274 LC_ALL=C ip netns exec ${disabled_ns} ./mptcp_connect -p 10000 -s MPTCP 127.0.0.1 < "$cin" 2>&1 | \
275 grep -q "^socket: Protocol not available$" && err=1
276 ip netns delete ${disabled_ns}
# err still 0 means the expected error message never appeared.
278 if [ ${err} -eq 0 ]; then
279 echo -e "New MPTCP socket cannot be blocked via sysctl\t\t[ FAIL ]"
284 echo -e "New MPTCP socket can be blocked via sysctl\t\t[ OK ]"
# Run "mptcp_connect -u" in a throw-away namespace and report whether the
# TCP_ULP "mptcp" setsockopt is allowed or blocked.
288 check_mptcp_ulp_setsockopt()
# NOTE(review): $sech is not assigned anywhere in this excerpt; if it is unset
# it expands to nothing. Possibly $rndh was meant - confirm.
291 t="ns_ulp-$sech-$(mktemp -u XXXXXX)"
293 ip netns add ${t} || exit $ksft_skip
# A non-zero exit status of mptcp_connect is reported as the FAIL case.
294 if ! ip netns exec ${t} ./mptcp_connect -u -p 10000 -s TCP 127.0.0.1 2>&1; then
295 printf "setsockopt(..., TCP_ULP, \"mptcp\", ...) allowed\t[ FAIL ]\n"
299 printf "setsockopt(..., TCP_ULP, \"mptcp\", ...) blocked\t[ OK ]\n"
# Body of the ping helper (called as do_ping further down; its header is not
# part of this excerpt).
# $1: listener namespace (used here only in the failure message)
# $2: namespace the ping is sent from
# $3: address to ping
314 local listener_ns="$1"
315 local connector_ns="$2"
316 local connect_addr="$3"
# One quiet ping per check.
317 local ping_args="-q -c 1"
# IPv6 targets need ping's -6 switch.
319 if is_v6 "${connect_addr}"; then
321 ping_args="${ping_args} -6"
324 ip netns exec ${connector_ns} ping ${ping_args} $connect_addr >/dev/null
325 if [ $? -ne 0 ] ; then
326 echo "$listener_ns -> $connect_addr connectivity [ FAIL ]" 1>&2
# Read one MIB counter with nstat inside a namespace (called as
# get_mib_counter elsewhere; header and loop body are not part of this
# excerpt). The second field of each nstat output line is read into "count".
335 # $1: ns, $2: MIB counter
338 local listener_ns="${1}"
342 ip netns exec "${listener_ns}" \
343 nstat -z -a "${mib}" | \
345 while read a count c rest; do
# Poll /proc/net/tcp* inside the namespace given as $1 until a socket bound to
# the requested port shows up in the state the awk filter looks for (0A), for
# at most 10 rounds. The assignment of "port" and the rest of the loop body
# are not part of this excerpt.
351 wait_local_port_listen()
353 local listener_ns="${1}"
# /proc/net/tcp* prints ports as 4-digit upper-case hex.
358 port_hex="$(printf "%04X" "${port}")"
359 for i in $(seq 10); do
# awk exits 0 as soon as field 2 ends in ":<port_hex>" and field 4 matches 0A,
# otherwise 1.
360 ip netns exec "${listener_ns}" cat /proc/net/tcp* | \
361 awk "BEGIN {rc=1} {if (\$2 ~ /:${port_hex}\$/ && \$4 ~ /0A/) {rc=0; exit}} END {exit rc}" &&
# Body of the transfer helper (called as do_transfer elsewhere; its header and
# several lines are not part of this excerpt). It starts a listening
# mptcp_connect in one namespace and a connecting one in another, compares the
# transferred files and checks MIB counters.
# $1: listener namespace, $2: connector namespace
# $3/$4: presumably client and server protocol (cl_proto/srv_proto; their
#        assignments are not visible here)
# $5: address to connect to, $6: local address for the listener
# $7: extra mptcp_connect arguments
369 local listener_ns="$1"
370 local connector_ns="$2"
373 local connect_addr="$5"
374 local local_addr="$6"
375 local extra_args="$7"
# Every transfer gets its own port, counted up from 10000.
378 port=$((10000+$TEST_COUNT))
379 TEST_COUNT=$((TEST_COUNT+1))
# Forward the buffer-size and test-mode settings to mptcp_connect.
381 if [ "$rcvbuf" -gt 0 ]; then
382 extra_args="$extra_args -R $rcvbuf"
385 if [ "$sndbuf" -gt 0 ]; then
386 extra_args="$extra_args -S $sndbuf"
389 if [ -n "$testmode" ]; then
390 extra_args="$extra_args -m $testmode"
393 if [ -n "$extra_args" ] && $options_log; then
394 echo "INFO: extra options: $extra_args"
# Header of the per-test result line; namespace names are cut to 3 characters.
403 addr_port=$(printf "%s:%d" ${connect_addr} ${port})
404 printf "%.3s %-5s -> %.3s (%-20s) %-5s\t" ${connector_ns} ${cl_proto} ${listener_ns} ${addr_port} ${srv_proto}
# Packet capture: tcpdump runs in the background in both namespaces and its
# PIDs are kept so the captures can be stopped after the transfer. With
# SUDO_USER set, tcpdump is told to switch to that user (-Z).
408 if [ -z $SUDO_USER ] ; then
411 capuser="-Z $SUDO_USER"
414 local capfile="${rndh}-${connector_ns:0:3}-${listener_ns:0:3}-${cl_proto}-${srv_proto}-${connect_addr}-${port}"
415 local capopt="-i any -s 65535 -B 32768 ${capuser}"
417 ip netns exec ${listener_ns} tcpdump ${capopt} -w "${capfile}-listener.pcap" >> "${capout}" 2>&1 &
418 local cappid_listener=$!
420 ip netns exec ${connector_ns} tcpdump ${capopt} -w "${capfile}-connector.pcap" >> "${capout}" 2>&1 &
421 local cappid_connector=$!
# Per-namespace nstat history files live in /tmp; the continuation lines of
# the two commands below are not part of this excerpt.
426 NSTAT_HISTORY=/tmp/${listener_ns}.nstat ip netns exec ${listener_ns} \
428 if [ ${listener_ns} != ${connector_ns} ]; then
429 NSTAT_HISTORY=/tmp/${connector_ns}.nstat ip netns exec ${connector_ns} \
433 local stat_synrx_last_l=$(get_mib_counter "${listener_ns}" "MPTcpExtMPCapableSYNRX")
434 local stat_ackrx_last_l=$(get_mib_counter "${listener_ns}" "MPTcpExtMPCapableACKRX")
435 local stat_cookietx_last=$(get_mib_counter "${listener_ns}" "TcpExtSyncookiesSent")
436 local stat_cookierx_last=$(get_mib_counter "${listener_ns}" "TcpExtSyncookiesRecv")
# Listener: runs in the background under "timeout", reads $sin and writes what
# it receives to $sout.
438 timeout ${timeout_test} \
439 ip netns exec ${listener_ns} \
440 ./mptcp_connect -t ${timeout_poll} -l -p $port -s ${srv_proto} \
441 $extra_args $local_addr < "$sin" > "$sout" &
# Do not start the connector before the listening socket exists.
444 wait_local_port_listen "${listener_ns}" "${port}"
# Connector: reads $cin and writes what it receives to $cout.
448 timeout ${timeout_test} \
449 ip netns exec ${connector_ns} \
450 ./mptcp_connect -t ${timeout_poll} -p $port -s ${cl_proto} \
451 $extra_args $connect_addr < "$cin" > "$cout" &
# Stop the packet captures.
464 kill ${cappid_listener}
465 kill ${cappid_connector}
# Save the Tcp-related nstat lines of each namespace for the failure report.
468 NSTAT_HISTORY=/tmp/${listener_ns}.nstat ip netns exec ${listener_ns} \
469 nstat | grep Tcp > /tmp/${listener_ns}.out
470 if [ ${listener_ns} != ${connector_ns} ]; then
471 NSTAT_HISTORY=/tmp/${connector_ns}.nstat ip netns exec ${connector_ns} \
472 nstat | grep Tcp > /tmp/${connector_ns}.out
476 duration=$((stop-start))
477 printf "(duration %05sms) " "${duration}"
# Either side failing: print exit codes, socket state and saved counters.
478 if [ ${rets} -ne 0 ] || [ ${retc} -ne 0 ]; then
479 echo "[ FAIL ] client exit code $retc, server $rets" 1>&2
480 echo -e "\nnetns ${listener_ns} socket stat for ${port}:" 1>&2
481 ip netns exec ${listener_ns} ss -Menita 1>&2 -o "sport = :$port"
482 cat /tmp/${listener_ns}.out
483 echo -e "\nnetns ${connector_ns} socket stat for ${port}:" 1>&2
484 ip netns exec ${connector_ns} ss -Menita 1>&2 -o "dport = :$port"
485 [ ${listener_ns} != ${connector_ns} ] && cat /tmp/${connector_ns}.out
# Each side must have received exactly what the other side sent.
492 check_transfer $sin $cout "file received by client"
494 check_transfer $cin $sout "file received by server"
# Counters after the transfer, compared against the snapshot taken before it.
497 local stat_synrx_now_l=$(get_mib_counter "${listener_ns}" "MPTcpExtMPCapableSYNRX")
498 local stat_ackrx_now_l=$(get_mib_counter "${listener_ns}" "MPTcpExtMPCapableACKRX")
499 local stat_cookietx_now=$(get_mib_counter "${listener_ns}" "TcpExtSyncookiesSent")
500 local stat_cookierx_now=$(get_mib_counter "${listener_ns}" "TcpExtSyncookiesRecv")
501 local stat_ooo_now=$(get_mib_counter "${listener_ns}" "TcpExtTCPOFOQueue")
# By default the MP_CAPABLE counters are expected not to move ...
503 expect_synrx=$((stat_synrx_last_l))
504 expect_ackrx=$((stat_ackrx_last_l))
# Keep only the value after the last '=' of the sysctl output.
506 cookies=$(ip netns exec ${listener_ns} sysctl net.ipv4.tcp_syncookies)
507 cookies=${cookies##*=}
# ... and to advance by one when both ends use MPTCP.
509 if [ ${cl_proto} = "MPTCP" ] && [ ${srv_proto} = "MPTCP" ]; then
510 expect_synrx=$((stat_synrx_last_l+1))
511 expect_ackrx=$((stat_ackrx_last_l+1))
514 if [ ${stat_synrx_now_l} -lt ${expect_synrx} ]; then
515 printf "[ FAIL ] lower MPC SYN rx (%d) than expected (%d)\n" \
516 "${stat_synrx_now_l}" "${expect_synrx}" 1>&2
# NOTE(review): the outer test already requires stat_ooo_now to be 0, so the
# inner test on the next line is always true when it is reached; any
# alternative branch of the inner test (the OoO note below?) could then never
# run - confirm the intended condition.
519 if [ ${stat_ackrx_now_l} -lt ${expect_ackrx} -a ${stat_ooo_now} -eq 0 ]; then
520 if [ ${stat_ooo_now} -eq 0 ]; then
521 printf "[ FAIL ] lower MPC ACK rx (%d) than expected (%d)\n" \
522 "${stat_ackrx_now_l}" "${expect_ackrx}" 1>&2
525 printf "[ Note ] fallback due to TCP OoO"
529 if [ $retc -eq 0 ] && [ $rets -eq 0 ]; then
# With tcp_syncookies=2 the cookie counters must advance; the "changed"
# warnings below are presumably the branch for other settings.
533 if [ $cookies -eq 2 ];then
534 if [ $stat_cookietx_last -ge $stat_cookietx_now ] ;then
535 printf " WARN: CookieSent: did not advance"
537 if [ $stat_cookierx_last -ge $stat_cookierx_now ] ;then
538 printf " WARN: CookieRecv: did not advance"
541 if [ $stat_cookietx_last -ne $stat_cookietx_now ] ;then
542 printf " WARN: CookieSent: changed"
544 if [ $stat_cookierx_last -ne $stat_cookierx_now ] ;then
545 printf " WARN: CookieRecv: changed"
# More MP_CAPABLE packets than expected only produce a warning.
549 if [ ${stat_synrx_now_l} -gt ${expect_synrx} ]; then
550 printf " WARN: SYNRX: expect %d, got %d (probably retransmissions)" \
551 "${expect_synrx}" "${stat_synrx_now_l}"
553 if [ ${stat_ackrx_now_l} -gt ${expect_ackrx} ]; then
554 printf " WARN: ACKRX: expect %d, got %d (probably retransmissions)" \
555 "${expect_ackrx}" "${stat_ackrx_now_l}"
# Exit status of this test: success only when both ret codes are 0.
560 [ $retc -eq 0 ] && [ $rets -eq 0 ]
# Body of the payload generator (called as make_file elsewhere; its header and
# the assignments of "name" and "who" are not part of this excerpt). Fills
# "$name" with SIZE bytes from /dev/urandom followed by an end-marker line.
# A SIZE of 0 requests a random size.
571 if [ $SIZE -eq 0 ]; then
572 local MAXSIZE=$((1024 * 1024 * 8))
573 local MINSIZE=$((1024 * 256))
575 SIZE=$(((RANDOM * RANDOM + MINSIZE) % MAXSIZE))
# Write whole KiB blocks first, then the remaining bytes one by one.
578 ksize=$((SIZE / 1024))
579 rem=$((SIZE - (ksize * 1024)))
581 dd if=/dev/urandom of="$name" bs=1024 count=$ksize 2> /dev/null
# oflag=append makes the remainder extend the file; with conv=notrunc alone dd
# writes at offset 0 and overwrites the first $rem bytes, leaving the file
# shorter than SIZE.
582 dd if=/dev/urandom conv=notrunc of="$name" oflag=append bs=1 count=$rem 2> /dev/null
583 echo -e "\nMPTCP_TEST_FILE_END_MARKER" >> "$name"
585 echo "Created $name (size $(du -b "$name")) containing data sent by $who"
# Body of run_tests_lo (its header and several lines are not part of this
# excerpt). Runs do_transfer for one listener/connector/address combination:
# always MPTCP to MPTCP, and further protocol combinations depending on
# $do_tcp.
# $1: listener namespace, $2: connector namespace, $3: address to connect to
# $4: presumably the loopback flag (its assignment is not visible here)
# $5: extra arguments handed on to do_transfer
590 local listener_ns="$1"
591 local connector_ns="$2"
592 local connect_addr="$3"
594 local extra_args="$5"
597 # skip if test programs are running inside same netns for subsequent runs.
598 if [ $loopback -eq 0 ] && [ ${listener_ns} = ${connector_ns} ]; then
602 # skip if we don't want v6
603 if ! $ipv6 && is_v6 "${connect_addr}"; then
608 if is_v6 "${connect_addr}"; then
614 do_transfer ${listener_ns} ${connector_ns} MPTCP MPTCP \
615 ${connect_addr} ${local_addr} "${extra_args}"
617 if [ $lret -ne 0 ]; then
622 if [ $do_tcp -eq 0 ]; then
623 # don't bother testing fallback tcp except for loopback case.
624 if [ ${listener_ns} != ${connector_ns} ]; then
# Mixed combinations: MPTCP on one end, plain TCP on the other.
629 do_transfer ${listener_ns} ${connector_ns} MPTCP TCP \
630 ${connect_addr} ${local_addr} "${extra_args}"
632 if [ $lret -ne 0 ]; then
637 do_transfer ${listener_ns} ${connector_ns} TCP MPTCP \
638 ${connect_addr} ${local_addr} "${extra_args}"
640 if [ $lret -ne 0 ]; then
# Plain TCP on both ends only when do_tcp is greater than 1.
645 if [ $do_tcp -gt 1 ] ;then
646 do_transfer ${listener_ns} ${connector_ns} TCP TCP \
647 ${connect_addr} ${local_addr} "${extra_args}"
649 if [ $lret -ne 0 ]; then
# Forward the first three arguments to run_tests_lo with 0 as fourth argument
# (the main loop passes 1 when it calls run_tests_lo directly).
660 run_tests_lo $1 $2 $3 0
# Repeat the ns1-to-ns1 tests, IPv4 then IPv6, handing "-P <peekmode>" on as
# extra arguments. The assignment of peekmode is not part of this excerpt.
667 echo "INFO: with peek mode: ${peekmode}"
668 run_tests_lo "$ns1" "$ns1" 10.0.1.1 1 "-P ${peekmode}"
669 run_tests_lo "$ns1" "$ns1" dead:beef:1::1 1 "-P ${peekmode}"
# Generate the payload sent by the client ($cin) and by the server ($sin),
# then run the TCP_ULP setsockopt check.
672 make_file "$cin" "client"
673 make_file "$sin" "server"
677 check_mptcp_ulp_setsockopt
# Sanity check of the topology: from every namespace, ping every IPv4 and
# IPv6 address configured in ns1..ns4.
679 echo "INFO: validating network environment with pings"
680 for sender in "$ns1" "$ns2" "$ns3" "$ns4";do
681 do_ping "$ns1" $sender 10.0.1.1
682 do_ping "$ns1" $sender dead:beef:1::1
684 do_ping "$ns2" $sender 10.0.1.2
685 do_ping "$ns2" $sender dead:beef:1::2
686 do_ping "$ns2" $sender 10.0.2.1
687 do_ping "$ns2" $sender dead:beef:2::1
689 do_ping "$ns3" $sender 10.0.2.2
690 do_ping "$ns3" $sender dead:beef:2::2
691 do_ping "$ns3" $sender 10.0.3.2
692 do_ping "$ns3" $sender dead:beef:3::2
694 do_ping "$ns4" $sender 10.0.3.1
695 do_ping "$ns4" $sender dead:beef:3::1
# Loss and delay are applied with netem on ns2eth3.
698 [ -n "$tc_loss" ] && tc -net "$ns2" qdisc add dev ns2eth3 root netem loss random $tc_loss delay ${tc_delay}ms
699 echo -n "INFO: Using loss of $tc_loss "
700 test "$tc_delay" -gt 0 && echo -n "delay $tc_delay ms "
# The reordering link uses a quarter of the delay (integer division).
702 reorder_delay=$(($tc_delay / 4))
# No reorder setting given: pick random percentages, reorder1 in 91..100 and
# reorder2 in 0..99.
704 if [ -z "${tc_reorder}" ]; then
705 reorder1=$((RANDOM%10))
706 reorder1=$((100 - reorder1))
707 reorder2=$((RANDOM%100))
# Random reordering is only configured with a non-zero delay, reorder1 below
# 100 and reorder2 above 0.
709 if [ $reorder_delay -gt 0 ] && [ $reorder1 -lt 100 ] && [ $reorder2 -gt 0 ]; then
710 tc_reorder="reorder ${reorder1}% ${reorder2}%"
711 echo -n "$tc_reorder with delay ${reorder_delay}ms "
# A value of "0" is handled separately (branch body not part of this excerpt;
# the help text describes "-r 0" as disabling reordering).
713 elif [ "$tc_reorder" = "0" ];then
715 elif [ "$reorder_delay" -gt 0 ];then
716 # reordering requires some delay
717 tc_reorder="reorder $tc_reorder"
718 echo -n "$tc_reorder with delay ${reorder_delay}ms "
# Delay and reordering are applied with netem on ns3eth4.
723 tc -net "$ns3" qdisc add dev ns3eth4 root netem delay ${reorder_delay}ms $tc_reorder
# Main test loop: every namespace takes the connecting role once. The
# namespace names are quoted like in the other loops over ns1..ns4.
725 for sender in "$ns1" "$ns2" "$ns3" "$ns4";do
# Tests against ns1 first, IPv4 then IPv6, calling run_tests_lo directly with
# 1 as fourth argument; a failure here is reported as a basic setup problem.
726 run_tests_lo "$ns1" "$sender" 10.0.1.1 1
727 if [ $ret -ne 0 ] ;then
728 echo "FAIL: Could not even run loopback test" 1>&2
731 run_tests_lo "$ns1" $sender dead:beef:1::1 1
732 if [ $ret -ne 0 ] ;then
# Diagnostics go to stderr, like the IPv4 message above ("2>&1" would have
# sent this message to stdout).
733 echo "FAIL: Could not even run loopback v6 test" 1>&2
737 # ns1<->ns2 is not subject to reordering/tc delays. Use it to test
738 # mptcp syncookie support.
739 if [ "$sender" = "$ns1" ]; then
740 ip netns exec "$ns2" sysctl -q net.ipv4.tcp_syncookies=2
742 ip netns exec "$ns2" sysctl -q net.ipv4.tcp_syncookies=1
# Listener in ns2, on both of its links.
745 run_tests "$ns2" $sender 10.0.1.2
746 run_tests "$ns2" $sender dead:beef:1::2
747 run_tests "$ns2" $sender 10.0.2.1
748 run_tests "$ns2" $sender dead:beef:2::1
# Listener in ns3, on both of its links.
750 run_tests "$ns3" $sender 10.0.2.2
751 run_tests "$ns3" $sender dead:beef:2::2
752 run_tests "$ns3" $sender 10.0.3.2
753 run_tests "$ns3" $sender dead:beef:3::2
# Listener in ns4.
755 run_tests "$ns4" $sender 10.0.3.1
756 run_tests "$ns4" $sender dead:beef:3::1
# Additional runs for the two peek modes.
759 run_tests_peekmode "saveWithPeek"
760 run_tests_peekmode "saveAfterPeek"
# Report the elapsed time; time_start and time_end are assigned on lines that
# are not part of this excerpt.
763 time_run=$((time_end-time_start))
765 echo "Time: ${time_run} seconds"