mirror of
https://github.com/drwetter/testssl.sh.git
synced 2025-01-03 23:39:45 +01:00
Improvements to mass testing in parallel
This PR provides improvements to `run_mass_testing_parallel()`. Currently, `run_mass_testing_parallel()` treats `$MAX_PARALLEL` as the maximum difference between the number of the test whose results were last processed and the number of the most recently started test. This means that test #40 will not be started until the results of test #20 have been processed. I've encountered situations in which tests 21 though 39 have completed, but test #20 is still running, and so no new tests are started. This PR fixes the problem by checking the status of all running child tests to see if any are complete, rather than just looking at `$NEXT_PARALLEL_TEST_TO_FINISH`. This prevents one slow child test (or a few slow child tests) from slowing up the entire mass testing process. This PR also changes the basis for determining whether a slow child process should be killed. Rather than waiting `$MAX_WAIT_TEST` seconds from the time that the parent started waiting (which is rather arbitrary), it kills the process if `$MAX_WAIT_TEST` seconds have passed since the child test was started. Given this, and that the above change makes it less likely that a slow child test will slow up the overall testing, I increased `$MAX_WAIT_TEST` from 600 seconds to 1200 seconds. I added some `debugme` statements that provide feedback on the status of testing, but in non-debug mode there may be a perception issue. If one test (e.g., test #20) is very slow, testssl.sh will not display any results from later tests until the slow test finishes, even though testssl.sh will continue running new tests in the background. The user, seeing no output from testssl.sh for an extended period of time, may think that testssl.sh has frozen, even though it is really just holding back on displaying the later results so that the results will be displayed in the order in which the tests were started.
This commit is contained in:
parent
2936a42bc7
commit
55df788937
73
testssl.sh
73
testssl.sh
@ -305,9 +305,9 @@ SERVER_COUNTER=0 # Counter for multiple servers
|
||||
|
||||
########### Global variables for parallel mass testing
|
||||
readonly PARALLEL_SLEEP=1 # Time to sleep after starting each test
|
||||
readonly MAX_WAIT_TEST=600 # Maximum time to wait for a test to complete
|
||||
readonly MAX_WAIT_TEST=1200 # Maximum time (in seconds) to wait for a test to complete
|
||||
readonly MAX_PARALLEL=20 # Maximum number of tests to run in parallel
|
||||
declare -a -i PARALLEL_TESTING_PID=() # process id for each child test
|
||||
declare -a -i PARALLEL_TESTING_PID=() # process id for each child test (or 0 to indicate test has already completed)
|
||||
declare -a PARALLEL_TESTING_CMDLINE=() # command line for each child test
|
||||
declare -i NR_PARALLEL_TESTS=0 # number of parallel tests run
|
||||
declare -i NEXT_PARALLEL_TEST_TO_FINISH=0 # number of parallel tests that have completed and have been processed
|
||||
@ -11311,7 +11311,8 @@ cleanup () {
|
||||
# to be killed before $TEMPDIR is deleted. Otherwise, error messages
|
||||
# will be created if testssl.sh is stopped before all testing is complete.
|
||||
while [[ $NEXT_PARALLEL_TEST_TO_FINISH -lt $NR_PARALLEL_TESTS ]]; do
|
||||
if ps ${PARALLEL_TESTING_PID[NEXT_PARALLEL_TEST_TO_FINISH]} >/dev/null ; then
|
||||
if [[ ${PARALLEL_TESTING_PID[NEXT_PARALLEL_TEST_TO_FINISH]} -ne 0 ]] && \
|
||||
ps ${PARALLEL_TESTING_PID[NEXT_PARALLEL_TEST_TO_FINISH]} >/dev/null ; then
|
||||
kill ${PARALLEL_TESTING_PID[NEXT_PARALLEL_TEST_TO_FINISH]} >&2 2>/dev/null
|
||||
wait ${PARALLEL_TESTING_PID[NEXT_PARALLEL_TEST_TO_FINISH]} 2>/dev/null # make sure pid terminated, see wait(1p)
|
||||
else
|
||||
@ -12246,6 +12247,9 @@ get_next_message_testing_parallel_result() {
|
||||
#FIXME: not called/tested yet
|
||||
run_mass_testing_parallel() {
|
||||
local cmdline=""
|
||||
local -i i nr_active_tests=0
|
||||
local -a -i start_time=()
|
||||
local -i curr_time
|
||||
|
||||
if [[ ! -r "$FNAME" ]] && $IKNOW_FNAME; then
|
||||
fatal "Can't read file \"$FNAME\"" "2"
|
||||
@ -12269,32 +12273,73 @@ run_mass_testing_parallel() {
|
||||
CHILD_MASS_TESTING=true "$0" "${MASS_TESTING_CMDLINE[@]}" > "$TEMPDIR/term_output_$(printf "%08d" $NR_PARALLEL_TESTS).log" &
|
||||
fi
|
||||
PARALLEL_TESTING_PID[NR_PARALLEL_TESTS]=$!
|
||||
start_time[NR_PARALLEL_TESTS]=$(date +%s)
|
||||
debugme echo "Started test #$NR_PARALLEL_TESTS"
|
||||
NR_PARALLEL_TESTS+=1
|
||||
nr_active_tests+=1
|
||||
sleep $PARALLEL_SLEEP
|
||||
# Get the results of any completed tests
|
||||
while [[ $NEXT_PARALLEL_TEST_TO_FINISH -lt $NR_PARALLEL_TESTS ]]; do
|
||||
if ! ps ${PARALLEL_TESTING_PID[NEXT_PARALLEL_TEST_TO_FINISH]} >/dev/null ; then
|
||||
if [[ ${PARALLEL_TESTING_PID[NEXT_PARALLEL_TEST_TO_FINISH]} -eq 0 ]]; then
|
||||
get_next_message_testing_parallel_result
|
||||
NEXT_PARALLEL_TEST_TO_FINISH+=1
|
||||
elif ! ps ${PARALLEL_TESTING_PID[NEXT_PARALLEL_TEST_TO_FINISH]} >/dev/null ; then
|
||||
debugme echo "Test #$NEXT_PARALLEL_TEST_TO_FINISH complete"
|
||||
get_next_message_testing_parallel_result
|
||||
NEXT_PARALLEL_TEST_TO_FINISH+=1
|
||||
nr_active_tests=$nr_active_tests-1
|
||||
else
|
||||
break
|
||||
fi
|
||||
done
|
||||
if [[ $NR_PARALLEL_TESTS-$NEXT_PARALLEL_TEST_TO_FINISH -ge $MAX_PARALLEL ]]; then
|
||||
# The maximum number of tests that may be run in parallel has
|
||||
# been reached. Need to wait for one to finish before starting
|
||||
# another.
|
||||
wait_kill ${PARALLEL_TESTING_PID[NEXT_PARALLEL_TEST_TO_FINISH]} $MAX_WAIT_TEST
|
||||
[[ $? -eq 0 ]] && get_next_message_testing_parallel_result
|
||||
NEXT_PARALLEL_TEST_TO_FINISH+=1
|
||||
if [[ $nr_active_tests -ge $MAX_PARALLEL ]]; then
|
||||
curr_time=$(date +%s)
|
||||
while true; do
|
||||
# Check to see if any test completed
|
||||
for (( i=NEXT_PARALLEL_TEST_TO_FINISH; i < NR_PARALLEL_TESTS; i++ )); do
|
||||
if [[ ${PARALLEL_TESTING_PID[i]} -ne 0 ]] && \
|
||||
! ps ${PARALLEL_TESTING_PID[i]} >/dev/null ; then
|
||||
PARALLEL_TESTING_PID[i]=0
|
||||
nr_active_tests=$nr_active_tests-1
|
||||
debugme echo "Test #$i complete"
|
||||
break
|
||||
fi
|
||||
done
|
||||
[[ $nr_active_tests -lt $MAX_PARALLEL ]] && break
|
||||
if [[ $curr_time-${start_time[NEXT_PARALLEL_TEST_TO_FINISH]} -ge $MAX_WAIT_TEST ]]; then
|
||||
# No test completed in the allocated time, so the first one to
|
||||
# start will be killed.
|
||||
kill ${PARALLEL_TESTING_PID[NEXT_PARALLEL_TEST_TO_FINISH]} >&2 2>/dev/null
|
||||
wait ${PARALLEL_TESTING_PID[NEXT_PARALLEL_TEST_TO_FINISH]} 2>/dev/null # make sure pid terminated, see wait(1p)
|
||||
debugme echo "Test #$NEXT_PARALLEL_TEST_TO_FINISH stopped"
|
||||
NEXT_PARALLEL_TEST_TO_FINISH+=1
|
||||
nr_active_tests=$nr_active_tests-1
|
||||
break
|
||||
fi
|
||||
debugme echo "Waiting for test #$NEXT_PARALLEL_TEST_TO_FINISH"
|
||||
sleep 1
|
||||
curr_time+=1
|
||||
done
|
||||
fi
|
||||
done < "$FNAME"
|
||||
|
||||
# Wait for remaining tests to finish
|
||||
curr_time=$(date +%s)
|
||||
while [[ $NEXT_PARALLEL_TEST_TO_FINISH -lt $NR_PARALLEL_TESTS ]]; do
|
||||
wait_kill ${PARALLEL_TESTING_PID[NEXT_PARALLEL_TEST_TO_FINISH]} $MAX_WAIT_TEST
|
||||
[[ $? -eq 0 ]] && get_next_message_testing_parallel_result
|
||||
NEXT_PARALLEL_TEST_TO_FINISH+=1
|
||||
if [[ ${PARALLEL_TESTING_PID[NEXT_PARALLEL_TEST_TO_FINISH]} -eq 0 ]] || \
|
||||
! ps ${PARALLEL_TESTING_PID[NEXT_PARALLEL_TEST_TO_FINISH]} >/dev/null ; then
|
||||
get_next_message_testing_parallel_result
|
||||
NEXT_PARALLEL_TEST_TO_FINISH+=1
|
||||
elif [[ $curr_time-${start_time[NEXT_PARALLEL_TEST_TO_FINISH]} -ge $MAX_WAIT_TEST ]]; then
|
||||
kill ${PARALLEL_TESTING_PID[NEXT_PARALLEL_TEST_TO_FINISH]} >&2 2>/dev/null
|
||||
wait ${PARALLEL_TESTING_PID[NEXT_PARALLEL_TEST_TO_FINISH]} 2>/dev/null # make sure pid terminated, see wait(1p)
|
||||
debugme echo "Test #$NEXT_PARALLEL_TEST_TO_FINISH stopped"
|
||||
NEXT_PARALLEL_TEST_TO_FINISH+=1
|
||||
else
|
||||
debugme echo "Waiting for test #$NEXT_PARALLEL_TEST_TO_FINISH"
|
||||
sleep 1
|
||||
curr_time+=1
|
||||
fi
|
||||
done
|
||||
return $?
|
||||
}
|
||||
|
Loading…
Reference in New Issue
Block a user