#!/usr/bin/env expect
############################################################################
# Purpose: Test of Slurm functionality
# Validate that the mcs plugin (mcs/user) is OK with sbatch
############################################################################
# Copyright (C) 2015 CEA/DAM/DIF
# Written by Aline Roy <aline.roy@cea.fr>
#
# This file is part of Slurm, a resource management program.
# For details, see <https://slurm.schedmd.com/>.
# Please also read the included file: DISCLAIMER.
#
# Slurm is free software; you can redistribute it and/or modify it under
# the terms of the GNU General Public License as published by the Free
# Software Foundation; either version 2 of the License, or (at your option)
# any later version.
#
# Slurm is distributed in the hope that it will be useful, but WITHOUT ANY
# WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
# FOR A PARTICULAR PURPOSE. See the GNU General Public License for more
# details.
#
# You should have received a copy of the GNU General Public License along
# with Slurm; if not, write to the Free Software Foundation, Inc.
# 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
############################################################################
source ./globals
# Test-wide state shared by the sections below and by cleanup.
# job_id holds the most recently submitted job (0 means "none").
set cwd         [$bin_pwd]
set config_path {}
set tmp_job     "${test_dir}/script"
set job_id      0

# The test edits slurm.conf, so bail out early when not running as SlurmUser.
if {![is_super_user]} {
	skip "This test can't be run except as SlurmUser"
}

# Locate slurm.conf and save it; cleanup restores it with restore_conf.
set config_path [get_conf_path]
set config_file "${config_path}/slurm.conf"
save_conf $config_file
proc cleanup {} {
	# Undo what the test changed: cancel the job recorded in job_id,
	# put back the saved slurm.conf and call reconfigure afterwards.
	global job_id
	global config_file

	cancel_job $job_id
	restore_conf $config_file
	reconfigure
}
log_info "---Checking sbatch uses mcs-label only for some jobs (ondemand,select mode)---"

#
# Change the slurm.conf MCSParameters and MCSPlugin
# test with ondemand,select
#
# Remove any existing MCSPlugin/MCSParameters/PrivateData lines before
# appending the values under test. The sed script uses the POSIX class
# [[:space:]]: an unquoted "\s" is reduced to a plain "s" by Tcl backslash
# substitution, which would leave lines padded with blanks in place.
foreach mcs_conf_key {MCSPlugin MCSParameters PrivateData} {
	exec $bin_sed -i "/^\[\[:space:\]\]*${mcs_conf_key}\[\[:space:\]\]*=/Id" $config_file
}
exec $bin_echo -e "\nMCSPlugin=mcs/user" >> $config_file
exec $bin_echo MCSParameters=ondemand,select,privatedata >> $config_file
exec $bin_echo PrivateData=jobs,nodes >> $config_file
reconfigure -fail

#
# verify slurm conf parameters MCS
#
set found 0
spawn -noecho $bin_bash -c "exec $scontrol show config | $bin_grep MCS"
expect {
	# Accept any amount of whitespace around "=" so that column padding
	# in the scontrol output does not defeat the match.
	-re {MCSPlugin\s*=\s*mcs/user} {
		log_debug " MCSPlugin=mcs/user OK"
		set found 1
		exp_continue
	}
	timeout {
		fail "scontrol is not responding"
	}
	eof {
		wait
	}
}
if {$found == 0} {
	fail "MCSPlugin parameter in scontrol show config is not mcs/user"
}
###### Check that sbatch fails with a bad mcs-label ######
log_info "---Checking sbatch fails with a bad mcs-label ---"
set timeout $max_job_delay
make_bash_script $tmp_job "sleep 30"

# Track both outcomes so the check really asserts the rejection instead of
# only logging it when it happens to occur.
set bad_label_rejected 0
set bad_label_job_id   0
spawn $sbatch -N1 --mcs-label=foo -t10 $tmp_job
expect {
	-re "Batch job submission failed: Invalid mcs_label specified" {
		log_debug "This error is expected, no worries"
		set bad_label_rejected 1
		exp_continue
	}
	-re "Submitted batch job ($number)" {
		set bad_label_job_id $expect_out(1,string)
		exp_continue
	}
	timeout {
		fail "sbatch not responding"
	}
	eof {
		wait
	}
}
if {$bad_label_job_id != 0} {
	# Record the stray job in job_id, which is what cleanup cancels
	set job_id $bad_label_job_id
	fail "sbatch accepted a job with an invalid mcs-label"
}
if {!$bad_label_rejected} {
	fail "sbatch did not reject the invalid mcs-label"
}
###### Check that sbatch uses mcs-label=user ######
log_info "---Checking sbatch uses mcs-label=user---"
make_bash_script $tmp_job "sleep 30"

# Start from "no job" so the submission check below is meaningful
set job_id 0
spawn $sbatch -N1 -o/dev/null --exclusive=mcs -t10 $tmp_job
expect {
	-re "Submitted batch job ($number)" {
		set job_id $expect_out(1,string)
		exp_continue
	}
	timeout {
		fail "sbatch is not responding"
	}
	eof {
		wait
	}
}
if {$job_id == 0} {
	fail "Job was not submitted"
}
wait_for_job -fail $job_id "RUNNING"

# The job is expected to carry the submitting user's name as its MCS label
set user_name [get_my_user_name]
set found 0
spawn $squeue --jobs=$job_id --noheader -O "mcslabel"
expect {
	# Parentheses are escaped so the literal text "(null)" is matched;
	# unescaped they form a capture group that matches any "null".
	-re {\(null\)} {
		log_debug "NO MCS-label for this job : this is not expected"
		exp_continue
	}
	-re "$user_name" {
		log_debug "MCS-label OK for this job"
		set found 1
		exp_continue
	}
	timeout {
		fail "squeue is not responding"
	}
	eof {
		wait
	}
}
if {$found == 0} {
	fail "Job was submitted with a bad mcs-label"
}
cancel_job $job_id
# Submit again, this time naming the MCS label explicitly on the command line
make_bash_script $tmp_job "sleep 30"
set job_id 0
spawn $sbatch -N1 --mcs-label=$user_name --exclusive=mcs -o/dev/null -t10 $tmp_job
expect {
	-re "Submitted batch job ($number)" {
		set job_id $expect_out(1,string)
		exp_continue
	}
	eof {
		wait
	}
	timeout {
		fail "sbatch is not responding"
	}
}
if {!$job_id} {
	fail "Job was not submitted"
}
wait_for_job -fail $job_id "RUNNING"

# The label reported by squeue must be the user name
set label_seen 0
spawn $squeue --jobs=$job_id --noheader -O "mcslabel"
expect {
	-re "$user_name" {
		log_debug "MCS-label OK for this job"
		set label_seen 1
		exp_continue
	}
	-re "Invalid job format specification" {
		fail "Invalid job format specification mcslabel"
	}
	eof {
		wait
	}
	timeout {
		fail "squeue is not responding"
	}
}
if {!$label_seen} {
	fail "Job was submitted with a bad mcs-label"
}

# If accounting is configured, test mcs-label in sacct
set acct_storage_type [get_config_param "AccountingStorageType"]
if {$acct_storage_type eq "accounting_storage/slurmdbd"} {
	subtest {![wait_for_command_match "$sacct -j $job_id --allocations --format McsLabel --parsable2 --noheader" $user_name]} "Verify MCS-label in sacct"
} else {
	subskip "Test needs AccountingStorageType=accounting_storage/slurmdbd to verify MCS-labels in sacct"
}

# Find out which node the job landed on
set node 0
set node_seen 0
spawn $squeue --jobs=$job_id --noheader -O "nodelist"
expect {
	-re "($re_word_str)" {
		set node $expect_out(1,string)
		log_debug "Node for this job : $node"
		set node_seen 1
	}
	eof {
		wait
	}
	timeout {
		fail "squeue is not responding"
	}
}
if {!$node_seen} {
	fail "No node found in squeue command"
}

#
# verify MCS of nodes
#
set node_label_seen 0
spawn -noecho $bin_bash -c "exec $scontrol show node=$node | $bin_grep MCS"
expect {
	-re "MCS_label=$user_name" {
		log_debug "mcs_label OK for node $node"
		set node_label_seen 1
		exp_continue
	}
	eof {
		wait
	}
	timeout {
		fail "scontrol is not responding"
	}
}
if {!$node_label_seen} {
	fail "Job was submitted with node with bad mcs-label"
}
cancel_job $job_id
#
# Change the slurm.conf MCSParameters and MCSPlugin
# test with enforced,noselect
#
log_info "---Checking sbatch uses mcs-label with all jobs (enforced,noselect mode)---"
# Remove any existing MCSPlugin/MCSParameters/PrivateData lines before
# appending the values under test. The sed script uses the POSIX class
# [[:space:]]: an unquoted "\s" is reduced to a plain "s" by Tcl backslash
# substitution, which would leave lines padded with blanks in place.
foreach mcs_conf_key {MCSPlugin MCSParameters PrivateData} {
	exec $bin_sed -i "/^\[\[:space:\]\]*${mcs_conf_key}\[\[:space:\]\]*=/Id" $config_file
}
exec $bin_echo -e "\nMCSPlugin=mcs/user" >> $config_file
exec $bin_echo MCSParameters=enforced,noselect,privatedata >> $config_file
exec $bin_echo PrivateData=jobs,nodes >> $config_file
reconfigure -fail

###### Check that sbatch uses mcs-label=user ######
log_info "---Checking sbatch uses mcs-label=user---"
make_bash_script $tmp_job "sleep 30"

# Reset job_id: otherwise it still holds the id of the previous job and the
# "Job was not submitted" check below could never trigger.
set job_id 0
spawn $sbatch -N1 -o/dev/null -t1 $tmp_job
expect {
	-re "Submitted batch job ($number)" {
		set job_id $expect_out(1,string)
		exp_continue
	}
	timeout {
		fail "sbatch is not responding"
	}
	eof {
		wait
	}
}
if {$job_id == 0} {
	fail "Job was not submitted"
}
wait_for_job -fail $job_id "RUNNING"

# No --exclusive=mcs was given, yet the job must still show the user name
# as its label in this mode.
set found 0
spawn $squeue --jobs=$job_id --noheader -O "mcslabel"
expect {
	-re "$user_name" {
		log_debug "MCS-label OK for this job"
		set found 1
		exp_continue
	}
	# Parentheses are escaped so the literal text "(null)" is matched
	-re {\(null\)} {
		fail "NO MCS-label for this job"
	}
	timeout {
		fail "squeue is not responding"
	}
	eof {
		wait
	}
}
if {$found == 0} {
	fail "Job was submitted with a bad mcs-label"
}

# Find out which node the job landed on
set found 0
set node 0
spawn $squeue --jobs=$job_id --noheader -O "nodelist"
expect {
	-re "($re_word_str)" {
		set node $expect_out(1,string)
		log_debug "Node for this job : $node"
		set found 1
	}
	timeout {
		fail "squeue is not responding"
	}
	eof {
		wait
	}
}
if {$found == 0} {
	fail "No node found in squeue command"
}

#
# verify MCS of nodes
#
# With noselect the node itself must not be tagged with the user's label
spawn -noecho $bin_bash -c "exec $scontrol show node=$node | $bin_grep MCS"
expect {
	-re "MCS_label=$user_name" {
		fail "An mcs_label is found for this job. It was not expected"
	}
	-re "MCS_label=N/A" {
		log_debug "No mcs_label for this node. It was expected"
	}
	timeout {
		fail "scontrol is not responding"
	}
	eof {
		wait
	}
}
cancel_job $job_id
#
# Change the slurm.conf MCSParameters and MCSPlugin
# test with ondemand,noselect
#
log_info "---Checking sbatch doesn't use mcs-label on filter (ondemand,noselect mode)---"
# Remove any existing MCSPlugin/MCSParameters/PrivateData lines before
# appending the values under test. The sed script uses the POSIX class
# [[:space:]]: an unquoted "\s" is reduced to a plain "s" by Tcl backslash
# substitution, which would leave lines padded with blanks in place.
foreach mcs_conf_key {MCSPlugin MCSParameters PrivateData} {
	exec $bin_sed -i "/^\[\[:space:\]\]*${mcs_conf_key}\[\[:space:\]\]*=/Id" $config_file
}
exec $bin_echo -e "\nMCSPlugin=mcs/user" >> $config_file
exec $bin_echo MCSParameters=ondemand,noselect,privatedata >> $config_file
exec $bin_echo PrivateData=jobs,nodes >> $config_file
reconfigure -fail

###### Check that sbatch with --exclusive=mcs uses mcs-label=user ######
log_info "---Checking sbatch uses --exclusive=mcs ---"
make_bash_script $tmp_job "sleep 30"

# Reset job_id: otherwise it still holds the id of the previous job and the
# "Job was not submitted" check below could never trigger.
set job_id 0
spawn $sbatch -N1 --exclusive=mcs -o/dev/null -t10 $tmp_job
expect {
	-re "Submitted batch job ($number)" {
		set job_id $expect_out(1,string)
		exp_continue
	}
	timeout {
		fail "sbatch is not responding"
	}
	eof {
		wait
	}
}
if {$job_id == 0} {
	fail "Job was not submitted"
}
wait_for_job -fail $job_id "RUNNING"

# The job asked for --exclusive=mcs, so it must show the user name as label
set found 0
spawn $squeue --jobs=$job_id --noheader -O "mcslabel"
expect {
	-re "$user_name" {
		log_debug "MCS-label OK for this job"
		set found 1
		exp_continue
	}
	# Parentheses are escaped so the literal text "(null)" is matched
	-re {\(null\)} {
		fail "NO MCS-label for this job"
	}
	timeout {
		fail "squeue is not responding"
	}
	eof {
		wait
	}
}
if {$found == 0} {
	fail "Job was submitted with a bad mcs-label"
}

# Find out which node the job landed on
set found 0
set node 0
spawn $squeue --jobs=$job_id --noheader -O "nodelist"
expect {
	-re "($re_word_str)" {
		set node $expect_out(1,string)
		log_debug "Node for this job : $node"
		set found 1
	}
	timeout {
		fail "squeue is not responding"
	}
	eof {
		wait
	}
}
if {$found == 0} {
	fail "No node found in squeue command"
}

#
# verify MCS of nodes
#
# With noselect the node itself must not be tagged with the user's label
spawn -noecho $bin_bash -c "exec $scontrol show node=$node | $bin_grep MCS"
expect {
	-re "MCS_label=$user_name" {
		fail "An mcs_label is found for this job. It was not expected"
	}
	-re "MCS_label=N/A" {
		log_debug "No mcs_label for this node. It was expected"
	}
	timeout {
		fail "scontrol is not responding"
	}
	eof {
		wait
	}
}
cancel_job $job_id
###### Check that sbatch doesn't use mcs-label ######
# The job is submitted without --exclusive=mcs and without --mcs-label, so
# the log line says so instead of repeating the message of the previous step.
log_info "---Checking sbatch without --exclusive=mcs doesn't use mcs-label ---"
make_bash_script $tmp_job "sleep 30"
set job_id 0
spawn $sbatch -N1 -o/dev/null -t10 $tmp_job
expect {
	-re "Submitted batch job ($number)" {
		set job_id $expect_out(1,string)
		exp_continue
	}
	timeout {
		fail "sbatch is not responding"
	}
	eof {
		wait
	}
}
if {$job_id == 0} {
	fail "job was not submitted"
}
wait_for_job -fail $job_id "RUNNING"

# Here "found" records the unwanted outcome: a label equal to the user name
set found 0
spawn $squeue --jobs=$job_id --noheader -O "mcslabel"
expect {
	# Parentheses are escaped so the literal text "(null)" is matched;
	# unescaped they form a capture group that matches any "null".
	-re {\(null\)} {
		log_debug "NO MCS-label for this job : this is expected"
		exp_continue
	}
	-re "$user_name" {
		log_debug "A MCS-label for this job : this is not expected"
		set found 1
		exp_continue
	}
	timeout {
		fail "squeue is not responding"
	}
	eof {
		wait
	}
}
if {$found == 1} {
	fail "Job was submitted with a bad mcs-label"
}
cancel_job $job_id
wait_for_job -fail $job_id "DONE"
log_info "---Checking sbatch uses mcs-label for all jobs (enforced,select mode)---"

#
# Change the slurm.conf MCSParameters and MCSPlugin
# test with enforced,select
#
# Remove any existing MCSPlugin/MCSParameters/PrivateData lines before
# appending the values under test. The sed script uses the POSIX class
# [[:space:]]: an unquoted "\s" is reduced to a plain "s" by Tcl backslash
# substitution, which would leave lines padded with blanks in place.
foreach mcs_conf_key {MCSPlugin MCSParameters PrivateData} {
	exec $bin_sed -i "/^\[\[:space:\]\]*${mcs_conf_key}\[\[:space:\]\]*=/Id" $config_file
}
exec $bin_echo -e "\nMCSPlugin=mcs/user" >> $config_file
exec $bin_echo MCSParameters=enforced,select,privatedata >> $config_file
exec $bin_echo PrivateData=jobs,nodes >> $config_file
reconfigure -fail

###### Check that sbatch uses mcs-label=user ######
log_info "---Checking sbatch with no --exclusive=mcs ---"
make_bash_script $tmp_job "sleep 30"
set job_id 0
spawn $sbatch -N1 -o/dev/null -t20 $tmp_job
expect {
	-re "Submitted batch job ($number)" {
		set job_id $expect_out(1,string)
		exp_continue
	}
	timeout {
		fail "sbatch is not responding"
	}
	eof {
		wait
	}
}
if {$job_id == 0} {
	fail "Job was not submitted"
}
wait_for_job -fail $job_id "RUNNING"

# Even without --exclusive=mcs the job must show the user name as its label
set found 0
spawn $squeue --jobs=$job_id --noheader -O "mcslabel"
expect {
	# Parentheses are escaped so the literal text "(null)" is matched;
	# unescaped they form a capture group that matches any "null".
	-re {\(null\)} {
		log_debug "NO MCS-label for this job : this is not expected"
		exp_continue
	}
	-re "$user_name" {
		log_debug "MCS-label OK for this job"
		set found 1
		exp_continue
	}
	timeout {
		fail "squeue is not responding"
	}
	eof {
		wait
	}
}
if {$found == 0} {
	fail "Job was submitted with a bad mcs-label"
}

# Find out which node the job landed on
set found 0
set node 0
spawn $squeue --jobs=$job_id --noheader -O "nodelist"
expect {
	-re "($re_word_str)" {
		set node $expect_out(1,string)
		log_debug "Node for this job : $node"
		set found 1
	}
	timeout {
		fail "squeue is not responding"
	}
	eof {
		wait
	}
}
if {$found == 0} {
	fail "No node found in squeue command"
}

#
# verify MCS of nodes
#
# With select the node is expected to be tagged with the user's label
set found 0
spawn -noecho $bin_bash -c "exec $scontrol show node=$node | $bin_grep MCS"
expect {
	-re "MCS_label=$user_name" {
		log_debug "mcs_label OK for node $node"
		set found 1
		exp_continue
	}
	timeout {
		fail "scontrol is not responding"
	}
	eof {
		wait
	}
}
if {$found == 0} {
	fail "Job was submitted with node with bad mcs-label"
}