blob: 035f39b7e0b6b999ac22dd931ea76866d3d0337b [file] [log] [blame]
#!/usr/bin/expect
############################################################################
# Purpose: Stress test of stdin broadcast
#
# Output: "TEST: #.#" followed by "SUCCESS" if test was successful, OR
# "FAILURE: ..." otherwise with an explanation of the failure, OR
# anything else indicates a failure mode that must be investigated.
#
# Note: This script generates and then deletes files in the working directory
# named test9.1.input and test9.1.output
############################################################################
# Copyright (C) 2002 The Regents of the University of California.
# Produced at Lawrence Livermore National Laboratory (cf, DISCLAIMER).
# Written by Morris Jette <jette1@llnl.gov>
# UCRL-CODE-226842.
#
# This file is part of SLURM, a resource management program.
# For details, see <http://www.llnl.gov/linux/slurm/>.
#
# SLURM is free software; you can redistribute it and/or modify it under
# the terms of the GNU General Public License as published by the Free
# Software Foundation; either version 2 of the License, or (at your option)
# any later version.
#
# SLURM is distributed in the hope that it will be useful, but WITHOUT ANY
# WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
# FOR A PARTICULAR PURPOSE. See the GNU General Public License for more
# details.
#
# You should have received a copy of the GNU General Public License along
# with SLURM; if not, write to the Free Software Foundation, Inc.,
# 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
############################################################################
# Load the shared definitions this script relies on (helper procs and
# variables such as max_stress_tasks are not defined in this file).
source ./globals

# Test identity and the names derived from it
set test_id     "9.1"
set job_name    "test${test_id}"
set file_in     "test${test_id}.input"
set file_out    "test${test_id}.output"

# Run parameters
set exit_code   0
set cycle_count 100
set other_opts  "-O"
set task_cnt    $max_stress_tasks

# Node-count range handed to srun via -N; the range depends on which
# system type the test_bluegene / test_xcpu helpers report.
if {[test_bluegene]} {
    set node_cnt 1-2048
} elseif {[test_xcpu]} {
    set node_cnt 1-1
} else {
    set node_cnt 1-6
}

print_header $test_id
# run_cat_job input_file output_file
#
# Spawn one srun job that runs $bin_cat with its stdin taken from
# input_file and its stdout written to output_file (stderr is discarded),
# then wait for srun to finish. Any existing output_file is removed first.
#
# Returns 1 if srun prints "Unable to contact" or does not reach eof
# within the expect timeout; otherwise returns whatever wait_for_file
# returns for output_file (the caller treats 0 as success).
#
# On both failure paths the spawned srun is killed, its spawn id is closed
# and the process is reaped, so that repeated calls do not accumulate open
# ptys or zombie processes.
proc run_cat_job { input_file output_file } {
    global bin_cat bin_rm job_name srun node_cnt other_opts task_cnt timeout

    exec $bin_rm -f $output_file
    set srun_pid [spawn $srun --job-name=$job_name --input=$input_file --output=$output_file --error=/dev/null -n$task_cnt -N$node_cnt $other_opts -t1 $bin_cat - ]
    expect {
        -re "Unable to contact" {
            send_user "\nFAILURE: slurm appears to be down\n"
            # Same cleanup as the timeout path: do not leave srun running
            # or its pty open when bailing out early.
            slow_kill $srun_pid
            catch {close}
            catch {wait -nowait}
            return 1
        }
        timeout {
            send_user "\nFAILURE: srun not responding\n"
            slow_kill $srun_pid
            # A process killed from outside is not closed implicitly by
            # expect; close the spawn id and reap without blocking.
            catch {close}
            catch {wait -nowait}
            return 1
        }
        eof {
            # srun exited on its own; collect it
            wait
        }
    }
    return [wait_for_file $output_file]
}
#
# Create a sizable text file and compute the number of output lines one
# job is expected to produce: the input line count times the task count.
#
exec $bin_rm -f $file_in $file_out
exec $bin_cat /etc/hosts >$file_in
exec $bin_cat /etc/passwd >>$file_in
set stdin_lines [get_line_cnt $file_in]
# Braced so that expr parses the expression itself and the operand values
# are not substituted a second time.
set stdout_target [expr {$stdin_lines * $task_cnt}]

#
# Run cycle_count jobs to copy job input to job output and compare sizes.
# A failed cycle marks the whole test as failed but does not stop the
# remaining cycles.
#
set success_cnt 0
set timeout $max_job_delay
for {set inx 0} {$inx < $cycle_count} {incr inx} {
    if {[run_cat_job $file_in $file_out]} {
        set exit_code 1
        continue
    }

    set stdout_lines [get_line_cnt $file_out]
    if {$stdout_lines != $stdout_target} {
        # Wait one second and recount once before declaring the
        # output incomplete.
        exec $bin_sleep 1
        set stdout_lines [get_line_cnt $file_out]
    }

    if {$stdout_lines == $stdout_target} {
        incr success_cnt
    } else {
        send_user "\nFAILURE: stdout is incomplete\n"
        set exit_code 1
    }
}

# Remove the scratch files, then report the overall result
exec $bin_rm -f $file_in $file_out
if {$exit_code == 0} {
    send_user "\nSUCCESS\n"
} else {
    send_user "\nFAILURE: Only $success_cnt of $cycle_count"
    send_user " copy tests passed\n"
}
exit $exit_code