blob: 9b7130295a853b1dccf65e8cb3889ebcab3a3a04 [file] [log] [blame]
#!/usr/bin/env expect
############################################################################
# Purpose: Test of Slurm functionality
# Verify srun behaves when its controlling terminal disappears.
############################################################################
# Copyright (C) 2006 The Regents of the University of California.
# Produced at Lawrence Livermore National Laboratory (cf, DISCLAIMER).
# Written by Christopher J. Morrone <morrone2@llnl.gov>
# CODE-OCEC-09-009. All rights reserved.
#
# This file is part of Slurm, a resource management program.
# For details, see <https://slurm.schedmd.com/>.
# Please also read the included file: DISCLAIMER.
#
# Slurm is free software; you can redistribute it and/or modify it under
# the terms of the GNU General Public License as published by the Free
# Software Foundation; either version 2 of the License, or (at your option)
# any later version.
#
# Slurm is distributed in the hope that it will be useful, but WITHOUT ANY
# WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
# FOR A PARTICULAR PURPOSE. See the GNU General Public License for more
# details.
#
# You should have received a copy of the GNU General Public License along
# with Slurm; if not, write to the Free Software Foundation, Inc.,
# 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
############################################################################
source ./globals
set test_script "$test_dir/job_script"
set job_id 0
#
# Create a test script to be launch by srun
#
make_bash_script $test_script {
echo "Running"
sleep 5
for ((i = 0; i < 100; i++)); do
cat /etc/hosts
done
}
proc cleanup {} {
global job_id
cancel_job $job_id
}
#
# Launch the test script
#
set timeout $max_job_delay
set step_id 0
set job_running 0
spawn $srun --unbuffered -v -n1 -t1 $test_script
expect {
-re "launching StepId=(($number)\\.$re_word_str)" {
set step_id $expect_out(1,string)
set job_id $expect_out(2,string)
exp_continue
}
"Running" {
set job_running 1
}
timeout {
fail "Failed to launch test program through srun"
}
eof {
wait
}
}
if {$job_id == 0 || $job_running == 0} {
fail "Failed to launch test program through srun"
}
#
# Kill srun's stdio streams
#
log_debug "Test saw step id $step_id"
set file [exp_open]
close $file
#
# Lets see if the job step finishes normally
#
set running "seed"
set i 0
while {$running ne ""} {
set running [exec $squeue --noheader --states=running --steps=$step_id]
sleep 1
if {$i == 30} {
cancel_job $job_id
sleep 5
exec kill -9 $srun_pid
fail "Job step is not completing"
}
incr i 1
}
log_debug "Test sees step is gone, srun should have exited as well"
#
# And finally check to see if srun is still hanging around (it should
# have exited by now) and job has completed
#
if [catch {exec kill -0 $srun_pid}] {
log_debug "Srun command is terminated, as desired"
} else {
fail "srun is still running after job exits!"
}
spawn $squeue --noheader --jobs=$job_id
expect {
-re "R" {
fail "Job not completed!"
}
timeout {
fail "squeue not responding"
}
eof {
wait
}
}