test/nvmf: Restart target between shutdown tests

For RDMA, it seems we may have to wait out some timeouts to reset all of the connections to make this test work reliably. Instead, just restart the target for each test. If there's a way to force close all of the connections properly in the future we can go back to running these all on a single target. Change-Id: If79257349007765dc16bacebf810312a025d70a3 Signed-off-by: Ben Walker <benjamin.walker@intel.com> Reviewed-on: https://review.spdk.io/gerrit/c/spdk/spdk/+/1609 Community-CI: Broadcom CI Tested-by: SPDK CI Jenkins <sys_sgci@intel.com> Reviewed-by: Shuhei Matsumoto <shuhei.matsumoto.xt@hitachi.com> Reviewed-by: Jim Harris <james.r.harris@intel.com> Reviewed-by: Aleksey Marchuk <alexeymar@mellanox.com>
2020-03-31 11:01:08 -07:00 · 2020-03-31 11:01:08 -07:00 · 5dfd4f261f
commit 5dfd4f261f
parent f76cf58294
1 changed files with 55 additions and 40 deletions
--- a/test/nvmf/target/shutdown.sh
+++ b/test/nvmf/target/shutdown.sh
@ -10,98 +10,8 @@ MALLOC_BLOCK_SIZE=512
 rpc_py="$rootdir/scripts/rpc.py"
-function waitforio() {
+function starttarget() {
-	# $1 = RPC socket
+	# Start the target
 	if [ -z "$1" ]; then
 		exit 1
 	fi
 	# $2 = bdev name
 	if [ -z "$2" ]; then
 		exit 1
 	fi
 	local ret=1
 	local i
 	for (( i = 10; i != 0; i-- )); do
 		read_io_count=$($rpc_py -s $1 bdev_get_iostat -b $2 | jq -r '.bdevs[0].num_read_ops')
 		# A few I/O will happen during initial examine.  So wait until at least 100 I/O
 		#  have completed to know that bdevperf is really generating the I/O.
 		if [ $read_io_count -ge 100 ]; then
 			ret=0
 			break
 		fi
 		sleep 0.25
 	done
 	return $ret
 }
 # Test 1: Kill the initiator unexpectedly with no I/O outstanding
 function nvmf_shutdown_tc1 {
 	# Run bdev_svc, which connects but does not issue I/O
 	$rootdir/test/app/bdev_svc/bdev_svc -m 0x1 -i 1 -r /var/tmp/bdevperf.sock -c $testdir/bdevperf.conf &
 	perfpid=$!
 	waitforlisten $perfpid /var/tmp/bdevperf.sock
 	$rpc_py -s /var/tmp/bdevperf.sock framework_wait_init
 	# Kill bdev_svc
 	kill -9 $perfpid || true
 	rm -f /var/run/spdk_bdev1
 	# Verify the target stays up
 	sleep 1
 	kill -0 $nvmfpid
 	# Connect with bdevperf and confirm it works
 	$rootdir/test/bdev/bdevperf/bdevperf -r /var/tmp/bdevperf.sock -c $testdir/bdevperf.conf -q 64 -o 65536 -w verify -t 1
 	# We have seen the latent failure that the test 2 will see that the target is still finishing
 	# tearing down the qpair when connecting it.  As a workaround, leave a few seconds here to wait
 	# for the completion.
 	sleep 2
 }
 # Test 2: Kill initiator unexpectedly with I/O outstanding
 function nvmf_shutdown_tc2 {
 	# Run bdevperf
 	$rootdir/test/bdev/bdevperf/bdevperf -r /var/tmp/bdevperf.sock -c $testdir/bdevperf.conf -q 64 -o 65536 -w verify -t 10 &
 	perfpid=$!
 	waitforlisten $perfpid /var/tmp/bdevperf.sock
 	$rpc_py -s /var/tmp/bdevperf.sock framework_wait_init
 	waitforio /var/tmp/bdevperf.sock Nvme1n1
 	# Kill bdevperf half way through
 	killprocess $perfpid
 	# Verify the target stays up
 	sleep 1
 	kill -0 $nvmfpid
 }
 # Test 3: Kill the target unexpectedly with I/O outstanding
 function nvmf_shutdown_tc3 {
 	# Run bdevperf
 	$rootdir/test/bdev/bdevperf/bdevperf -r /var/tmp/bdevperf.sock -c $testdir/bdevperf.conf -q 64 -o 65536 -w verify -t 10 &
 	perfpid=$!
 	waitforlisten $perfpid /var/tmp/bdevperf.sock
 	$rpc_py -s /var/tmp/bdevperf.sock framework_wait_init
 	# Expand the trap to clean up bdevperf if something goes wrong
 	trap 'process_shm --id $NVMF_APP_SHM_ID; kill -9 $perfpid || true; nvmftestfini; exit 1' SIGINT SIGTERM EXIT
 	waitforio /var/tmp/bdevperf.sock Nvme1n1
 	# Kill the target half way through
 	killprocess $nvmfpid
 	nvmfpid=
 	# Verify bdevperf exits successfully
 	sleep 1
 	# TODO: Right now the NVMe-oF initiator will not correctly detect broken connections
 	# and so it will never shut down. Just kill it.
 	kill -9 $perfpid || true
 }
 nvmftestinit
 	nvmfappstart "-m 0x1E"
 	$rpc_py nvmf_create_transport $NVMF_TRANSPORT_OPTS -u 8192
@ -134,13 +44,118 @@ done
 	$rpc_py < $testdir/rpcs.txt
 	timing_exit create_subsystems
 }
 function stoptarget() {
 	rm -f ./local-job0-0-verify.state
 	rm -rf $testdir/bdevperf.conf
 	rm -rf $testdir/rpcs.txt
 	nvmftestfini
 }
 function waitforio() {
 	# $1 = RPC socket
 	if [ -z "$1" ]; then
 		exit 1
 	fi
 	# $2 = bdev name
 	if [ -z "$2" ]; then
 		exit 1
 	fi
 	local ret=1
 	local i
 	for (( i = 10; i != 0; i-- )); do
 		read_io_count=$($rpc_py -s $1 bdev_get_iostat -b $2 | jq -r '.bdevs[0].num_read_ops')
 		# A few I/O will happen during initial examine.  So wait until at least 100 I/O
 		#  have completed to know that bdevperf is really generating the I/O.
 		if [ $read_io_count -ge 100 ]; then
 			ret=0
 			break
 		fi
 		sleep 0.25
 	done
 	return $ret
 }
 # Test 1: Kill the initiator unexpectedly with no I/O outstanding
 function nvmf_shutdown_tc1 {
 	starttarget
 	# Run bdev_svc, which connects but does not issue I/O
 	$rootdir/test/app/bdev_svc/bdev_svc -m 0x1 -i 1 -r /var/tmp/bdevperf.sock -c $testdir/bdevperf.conf &
 	perfpid=$!
 	waitforlisten $perfpid /var/tmp/bdevperf.sock
 	$rpc_py -s /var/tmp/bdevperf.sock framework_wait_init
 	# Kill bdev_svc
 	kill -9 $perfpid || true
 	rm -f /var/run/spdk_bdev1
 	# Verify the target stays up
 	sleep 1
 	kill -0 $nvmfpid
 	# Connect with bdevperf and confirm it works
 	$rootdir/test/bdev/bdevperf/bdevperf -r /var/tmp/bdevperf.sock -c $testdir/bdevperf.conf -q 64 -o 65536 -w verify -t 1
 	stoptarget
 }
 # Test 2: Kill initiator unexpectedly with I/O outstanding
 function nvmf_shutdown_tc2 {
 	starttarget
 	# Run bdevperf
 	$rootdir/test/bdev/bdevperf/bdevperf -r /var/tmp/bdevperf.sock -c $testdir/bdevperf.conf -q 64 -o 65536 -w verify -t 10 &
 	perfpid=$!
 	waitforlisten $perfpid /var/tmp/bdevperf.sock
 	$rpc_py -s /var/tmp/bdevperf.sock framework_wait_init
 	waitforio /var/tmp/bdevperf.sock Nvme1n1
 	# Kill bdevperf half way through
 	killprocess $perfpid
 	# Verify the target stays up
 	sleep 1
 	kill -0 $nvmfpid
 	stoptarget
 }
 # Test 3: Kill the target unexpectedly with I/O outstanding
 function nvmf_shutdown_tc3 {
 	starttarget
 	# Run bdevperf
 	$rootdir/test/bdev/bdevperf/bdevperf -r /var/tmp/bdevperf.sock -c $testdir/bdevperf.conf -q 64 -o 65536 -w verify -t 10 &
 	perfpid=$!
 	waitforlisten $perfpid /var/tmp/bdevperf.sock
 	$rpc_py -s /var/tmp/bdevperf.sock framework_wait_init
 	# Expand the trap to clean up bdevperf if something goes wrong
 	trap 'process_shm --id $NVMF_APP_SHM_ID; kill -9 $perfpid || true; nvmftestfini; exit 1' SIGINT SIGTERM EXIT
 	waitforio /var/tmp/bdevperf.sock Nvme1n1
 	# Kill the target half way through
 	killprocess $nvmfpid
 	nvmfpid=
 	# Verify bdevperf exits successfully
 	sleep 1
 	# TODO: Right now the NVMe-oF initiator will not correctly detect broken connections
 	# and so it will never shut down. Just kill it.
 	kill -9 $perfpid || true
 	stoptarget
 }
 nvmftestinit
 run_test "nvmf_shutdown_tc1" nvmf_shutdown_tc1
 run_test "nvmf_shutdown_tc2" nvmf_shutdown_tc2
 run_test "nvmf_shutdown_tc3" nvmf_shutdown_tc3
 rm -f ./local-job0-0-verify.state
 rm -rf $testdir/bdevperf.conf
 rm -rf $testdir/rpcs.txt
 trap - SIGINT SIGTERM EXIT
 nvmftestfini