1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176
|
#!/usr/bin/env expect
############################################################################
# Purpose: Validate sbatch hetjob environment variables.
#
# Reqs:    1. The slurmdbd accounting storage type is in use and slurmdbd is up.
#          2. The controllers are up and running.
############################################################################
# Copyright (C) 2017 SchedMD LLC.
# Written by Isaac Hartung <ihartung@schedmd.com>
#
# This file is part of Slurm, a resource management program.
# For details, see <https://slurm.schedmd.com/>.
# Please also read the included file: DISCLAIMER.
#
# Slurm is free software; you can redistribute it and/or modify it under
# the terms of the GNU General Public License as published by the Free
# Software Foundation; either version 2 of the License, or (at your option)
# any later version.
#
# Slurm is distributed in the hope that it will be useful, but WITHOUT ANY
# WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
# FOR A PARTICULAR PURPOSE. See the GNU General Public License for more
# details.
#
# You should have received a copy of the GNU General Public License along
# with Slurm; if not, write to the Free Software Foundation, Inc.,
# 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
############################################################################
source ./globals

# Batch script and job output locations, plus the id of the submitted job
# (0 until a job has been submitted).
set file_in  "$test_dir/input"
set file_out "$test_dir/output"
set job_id   0

# Prerequisite: the backfill scheduler must be configured
if {[get_config_param "SchedulerType"] ne "sched/backfill"} {
	skip "This test requires SchedulerType = sched/backfill"
}

# Prerequisite: the default partition must offer at least three nodes
set node_count [get_partition_param [default_partition] "TotalNodes"]
if {$node_count < 3} {
	skip "Insufficient nodes in default partition ($node_count < 3)"
}
#
# Submit the batch script $file_in with sbatch (1 minute time limit, output
# written to $file_out) and store the reported job id in the global job_id.
# job_id is reset to 0 before the submission.
#
# Calls skip if sbatch prints "Batch job submission failed".
# Calls fail if sbatch times out or if the "Submitted batch job" line is not
# seen exactly once.
#
proc sbatch {} {
	global number sbatch file_in file_out job_id

	set matches 0
	set job_id 0
	set command "$sbatch -t1 -o $file_out $file_in"

	# Require a non-digit after the id: with a trailing ".+" the regex could
	# backtrack on a partially received number and capture a truncated id.
	# NOTE(review): assumes $number (from ./globals) matches a run of
	# decimal digits -- confirm.
	set regex "Submitted batch job ($number)\[^0-9\]"

	spawn {*}$command
	expect {
		-re "Batch job submission failed" {
			skip "Unable to execute test due to system configuration"
		}
		-re "$regex" {
			incr matches
			set job_id $expect_out(1,string)
			# Keep reading until eof so that the sbatch process is
			# waited for instead of being left unreaped.
			exp_continue
		}
		timeout {
			fail "sbatch not responding"
		}
		eof {
			wait
		}
	}

	if {$matches != 1} {
		fail "Batch submit failure"
	}
}
#
# Verify that the job output file contains exactly one match of a pattern.
#
# value - regular expression searched for in $file_out
#
# Calls fail unless the pattern is matched exactly once.
#
proc test_env {value} {
	global bin_cat file_out

	set hits 0

	# Do not echo the file contents to stdout while scanning them
	log_user 0
	spawn $bin_cat $file_out
	expect {
		-re "$value" {
			incr hits
			exp_continue
		}
		eof {
			wait
		}
	}
	log_user 1

	if {$hits == 1} {
		return
	}
	fail "Output of env $value incorrect ($hits != 1)"
}
#
# Cancel the job recorded in the global job_id.
#
proc cleanup {} {
	cancel_job $::job_id
}
# Start test

# Batch script with three hetjob components, each with its own CPU, memory
# and task request. The script body only dumps its environment.
make_bash_script $file_in "#SBATCH --cpus-per-task=4 --mem-per-cpu=10 --ntasks=1
#SBATCH hetjob
#SBATCH --cpus-per-task=2 --mem-per-cpu=2 --ntasks=1 -t1
#SBATCH hetjob
#SBATCH --cpus-per-task=1 --mem-per-cpu=6 --ntasks=1 -t1
env"

log_info "\n################################################################\n"
log_info "Submit hetjob and verify environment variables in the batch output"
log_info "\n################################################################\n"

sbatch
if {$job_id == 0} {
	fail "Error submitting job ($job_id)"
}

#
# Check for desired output
#
wait_for_job -fail $job_id DONE
wait_for_file -fail $file_out

# Regex suffix anchoring a pattern at the end of an output line, so that an
# expected value such as "=1" is not also satisfied by "=10" or "=16".
# The optional \r covers both plain "\n" and "\r\n" line endings.
set line_end {\r?\n}

# SLURM_HET_SIZE must be reported exactly once with the component count.
# log_user is left enabled here, so the env output is echoed once.
set matches 0
spawn $bin_cat $file_out
expect {
	-re "SLURM_HET_SIZE=3$line_end" {
		#once
		incr matches
		exp_continue
	}
	eof {
		wait
	}
}
if {$matches != 1} {
	fail "Output of env SLURM_HET_SIZE=3 incorrect ($matches != 1)"
}

# SLURM_JOB_PARTITION_HET_GROUP must appear three times in the output
set matches 0
log_user 0
spawn $bin_cat $file_out
expect {
	-re "SLURM_JOB_PARTITION_HET_GROUP" {
		#three
		incr matches
		exp_continue
	}
	eof {
		wait
	}
}
log_user 1
if {$matches != 3} {
	fail "Output of env SLURM_JOB_PARTITION_HET_GROUP incorrect ($matches != 3)"
}

# Per-component values requested in the batch script (exact matches)
test_env "SLURM_CPUS_PER_TASK_HET_GROUP_0=4$line_end"
test_env "SLURM_CPUS_PER_TASK_HET_GROUP_1=2$line_end"
test_env "SLURM_CPUS_PER_TASK_HET_GROUP_2=1$line_end"

# Only the id reported by sbatch is known here; for the other two
# components just check that the variable is present.
test_env "SLURM_JOB_ID_HET_GROUP_0=$job_id$line_end"
test_env "SLURM_JOB_ID_HET_GROUP_1="
test_env "SLURM_JOB_ID_HET_GROUP_2="

test_env "SLURM_MEM_PER_CPU_HET_GROUP_0=10$line_end"
test_env "SLURM_MEM_PER_CPU_HET_GROUP_1=2$line_end"
test_env "SLURM_MEM_PER_CPU_HET_GROUP_2=6$line_end"

test_env "SLURM_NTASKS_HET_GROUP_0=1$line_end"
test_env "SLURM_NTASKS_HET_GROUP_1=1$line_end"
test_env "SLURM_NTASKS_HET_GROUP_2=1$line_end"
|