Skip to content
Snippets Groups Projects
Commit 87e647bd authored by jette's avatar jette
Browse files

Fix for timing issue in job steps now that slurm is much faster

(at initiating pending job steps), interrupt-driven rather than
retry-based.
parent 1967d512
No related branches found
No related tags found
No related merge requests found
......@@ -35,6 +35,7 @@ source ./globals
set test_id "1.14"
set exit_code 0
set file_in "test$test_id.input"
set file_in2 "test$test_id.input2"
set file_out "test$test_id.output"
set job_id 0
set sleep_secs 10
......@@ -59,19 +60,23 @@ if {[test_launch_poe]} {
# Run one more step than allocated CPUs and make sure it waits
# The "sleep 2" is meant to ensure the earlier job steps start first
#
exec $bin_rm -f $file_in $file_out
exec $bin_rm -f $file_in $file_in2 $file_out
make_bash_script $file_in "
echo tasks_per_node=\$SLURM_TASKS_PER_NODE
inx=0
while \[ \$inx -lt \$SLURM_TASKS_PER_NODE \]
do
$srun --exclusive -n1 sleep $sleep_secs &
$srun --exclusive -n1 $bin_sleep $sleep_secs &
inx=\$((inx+1))
done
$bin_sleep 2
$srun -v --exclusive -n1 $scontrol show steps &
$srun -v --exclusive -n1 $file_in2 &
wait
"
make_bash_script $file_in2 "
$bin_sleep 2
$scontrol show steps
"
#
# Spawn a job via sbatch
......@@ -147,11 +152,11 @@ make_bash_script $file_in "
inx=0
while \[ \$inx -lt \$SLURM_TASKS_PER_NODE \]
do
$srun --exclusive -n1 sleep $sleep_secs &
$srun --exclusive -n1 $bin_sleep $sleep_secs &
inx=\$((inx+1))
done
$bin_sleep 2
$srun -v --exclusive -n1 --immediate $scontrol show steps &
$srun -v --exclusive -n1 --immediate $file_in2 &
wait
"
......@@ -218,7 +223,7 @@ if { $matches != 1 } {
}
if {$exit_code == 0} {
exec $bin_rm -f $file_in $file_out
exec $bin_rm -f $file_in $file_in2 $file_out
send_user "\nSUCCESS\n"
}
exit $exit_code
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment