| #!/usr/bin/expect |
| ############################################################################ |
| # Purpose: Stress test of stdin broadcast |
| # |
| # Output: "TEST: #.#" followed by "SUCCESS" if test was successful, OR |
| # "FAILURE: ..." otherwise with an explanation of the failure, OR |
| # anything else indicates a failure mode that must be investigated. |
| # |
| # Note: This script generates and then deletes files in the working directory |
| # named test9.1.input and test9.1.output |
| ############################################################################ |
| # Copyright (C) 2002 The Regents of the University of California. |
| # Produced at Lawrence Livermore National Laboratory (cf, DISCLAIMER). |
| # Written by Morris Jette <jette1@llnl.gov> |
| # UCRL-CODE-226842. |
| # |
| # This file is part of SLURM, a resource management program. |
| # For details, see <http://www.llnl.gov/linux/slurm/>. |
| # |
| # SLURM is free software; you can redistribute it and/or modify it under |
| # the terms of the GNU General Public License as published by the Free |
| # Software Foundation; either version 2 of the License, or (at your option) |
| # any later version. |
| # |
| # SLURM is distributed in the hope that it will be useful, but WITHOUT ANY |
| # WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS |
| # FOR A PARTICULAR PURPOSE. See the GNU General Public License for more |
| # details. |
| # |
| # You should have received a copy of the GNU General Public License along |
| # with SLURM; if not, write to the Free Software Foundation, Inc., |
| # 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA. |
| ############################################################################ |
| source ./globals |
| |
# Identity of this test and the scratch file / job names derived from it
set test_id     "9.1"
set job_name    "test$test_id"
set file_in     "test$test_id.input"
set file_out    "test$test_id.output"

# Number of srun iterations, tasks per iteration, and the overall result
set cycle_count 100
set task_cnt    $max_stress_tasks
set exit_code   0

# Node-count range passed to srun via -N; the value depends on what
# test_bluegene and test_xcpu report for this system
if { [test_bluegene] } {
    set node_cnt 1-2048
} elseif { [test_xcpu] } {
    set node_cnt 1-1
} else {
    set node_cnt 1-6
}

# Additional srun options appended to every invocation
set other_opts "-O"

print_header $test_id
| |
# Execute an srun job to cat input_file to output_file, wait for completion
#
# Arguments:
#   input_file  - file passed to srun as --input
#   output_file - file passed to srun as --output; removed before the run
#
# Returns 1 if slurm cannot be contacted or srun does not respond within
# the global timeout; otherwise returns the result of wait_for_file on
# output_file (0 on successful completion, per the original contract --
# wait_for_file is defined outside this file).
#
# On both failure paths the connection to the spawned srun is closed and
# the child is reaped without blocking, so repeated calls do not pile up
# open spawn ids and unreaped processes.
proc run_cat_job { input_file output_file } {
    global bin_cat bin_rm job_name srun node_cnt other_opts task_cnt timeout
    exec $bin_rm -f $output_file

    set srun_pid [spawn $srun --job-name=$job_name --input=$input_file --output=$output_file --error=/dev/null -n$task_cnt -N$node_cnt $other_opts -t1 $bin_cat - ]
    expect {
        -re "Unable to contact" {
            send_user "\nFAILURE: slurm appears to be down\n"
            # Release the spawn id; -nowait avoids blocking if srun is
            # still retrying, and catch tolerates an already-closed id
            catch {close}
            catch {wait -nowait}
            return 1
        }
        timeout {
            send_user "\nFAILURE: srun not responding\n"
            slow_kill $srun_pid
            # slow_kill only signals the process; still release the
            # spawn id and let the child be reaped when it exits
            catch {close}
            catch {wait -nowait}
            return 1
        }
        eof {
            # srun has closed its output; reap it before checking the file
            wait
        }
    }

    return [wait_for_file $output_file]
}
| |
#
# Create a sizable text file
#
exec $bin_rm -f $file_in $file_out
exec $bin_cat /etc/hosts >$file_in
exec $bin_cat /etc/passwd >>$file_in
set stdin_lines [get_line_cnt $file_in]
# The output is expected to hold one copy of the input per task.
# The expression is braced so it is parsed once and its operands are
# not substituted a second time by expr.
set stdout_target [expr {$stdin_lines * $task_cnt}]

#
# Run cycle_count jobs to copy job input to job output and compare sizes
#
set success_cnt 0
set timeout $max_job_delay
for {set inx 0} {$inx < $cycle_count} {incr inx} {
    # A job that could not be run counts as a failure, but the remaining
    # cycles are still attempted
    if {[run_cat_job $file_in $file_out]} {
        set exit_code 1
        continue
    }
    set stdout_lines [get_line_cnt $file_out]
    if {$stdout_lines != $stdout_target} {
        # Give the output one more second to finish arriving, then recount
        exec $bin_sleep 1
        set stdout_lines [get_line_cnt $file_out]
    }
    if {$stdout_lines != $stdout_target} {
        send_user "\nFAILURE: stdout is incomplete\n"
        set exit_code 1
    } else {
        incr success_cnt
    }
}
# Scratch files are removed regardless of the outcome
exec $bin_rm -f $file_in $file_out

if {$exit_code == 0} {
    send_user "\nSUCCESS\n"
} else {
    send_user "\nFAILURE: Only $success_cnt of $cycle_count"
    send_user " copy tests passed\n"
}
exit $exit_code