Skip to content
Snippets Groups Projects
Commit 6cb7ef77 authored by Morris Jette
Browse files

Merge branch 'slurm-15.08'

parents 6128db25 14ba53b2
No related branches found
No related tags found
No related merge requests found
...@@ -46,6 +46,7 @@ documents those changes that are of interest to users and administrators. ...@@ -46,6 +46,7 @@ documents those changes that are of interest to users and administrators.
node. node.
-- Don't requeue RPC going out from slurmctld to DOWN nodes (can generate -- Don't requeue RPC going out from slurmctld to DOWN nodes (can generate
repeating communication errors). repeating communication errors).
-- Propagate sbatch "--dist=plane=#" option to srun.
* Changes in Slurm 15.08.1 * Changes in Slurm 15.08.1
========================== ==========================
...@@ -506,6 +507,7 @@ documents those changes that are of interest to users and administrators. ...@@ -506,6 +507,7 @@ documents those changes that are of interest to users and administrators.
race condition of the node suspend and ping logic. race condition of the node suspend and ping logic.
-- Don't requeue RPC going out from slurmctld to DOWN nodes (can generate -- Don't requeue RPC going out from slurmctld to DOWN nodes (can generate
repeating communication errors). repeating communication errors).
-- Propagate sbatch "--dist=plane=#" option to srun.
* Changes in Slurm 14.11.9 * Changes in Slurm 14.11.9
========================== ==========================
......
...@@ -14,7 +14,7 @@ cluster. ...@@ -14,7 +14,7 @@ cluster.
Good responsiveness and throughput can be achieved while you only pay for the Good responsiveness and throughput can be achieved while you only pay for the
resources needed.</p> resources needed.</p>
<p>The rest of this document describes details abou. Slurm's infrastructure that <p>The rest of this document describes details about Slurm's infrastructure that
can be used to support Elastic Computing.</p> can be used to support Elastic Computing.</p>
<p>Slurm's Elastic Computing logic relies heavily upon the existing power save <p>Slurm's Elastic Computing logic relies heavily upon the existing power save
......
...@@ -256,9 +256,14 @@ task_dist_states_t verify_dist_type(const char *arg, uint32_t *plane_size) ...@@ -256,9 +256,14 @@ task_dist_states_t verify_dist_type(const char *arg, uint32_t *plane_size)
} else { } else {
/* -m plane=<plane_size> */ /* -m plane=<plane_size> */
dist_str = strchr(tok, '='); dist_str = strchr(tok, '=');
if (dist_str != NULL) { if (!dist_str)
*plane_size = atoi(dist_str + 1); dist_str = getenv("SLURM_DIST_PLANESIZE");
else {
len = dist_str - tok; len = dist_str - tok;
dist_str++;
}
if (dist_str) {
*plane_size = atoi(dist_str);
plane_dist = true; plane_dist = true;
} }
} }
......
...@@ -1939,7 +1939,7 @@ proc test_select_type { } { ...@@ -1939,7 +1939,7 @@ proc test_select_type { } {
# #
# Purpose: Determine SelectTypeParameters being used # Purpose: Determine SelectTypeParameters being used
# #
# Returns value of SelectTypeParameters # Returns 1 if "type" (input) is found, 0 otherwise
# #
################################################################ ################################################################
......
...@@ -68,6 +68,20 @@ if {[test_select_type_params "CR_CPU"]} { ...@@ -68,6 +68,20 @@ if {[test_select_type_params "CR_CPU"]} {
set cr_cpu 1 set cr_cpu 1
} }
log_user 0
set job_mem_opt "--comment=no_mem"
spawn -noecho $bin_bash -c "exec $scontrol show config | $bin_grep SelectTypeParameters"
expect {
-re "MEMORY" {
set job_mem_opt "--mem-per-cpu=4"
exp_continue
}
eof {
wait
}
}
log_user 1
proc cr_core_cpu { node } { proc cr_core_cpu { node } {
global cr_cpu cr_core core_cnt socket_cnt scontrol number exit_code global cr_cpu cr_core core_cnt socket_cnt scontrol number exit_code
...@@ -147,11 +161,11 @@ proc delete_part {part} { ...@@ -147,11 +161,11 @@ proc delete_part {part} {
} }
proc sub_job { job shared part } { proc sub_job { job shared part } {
global sbatch file_in number job_id exit_code global sbatch file_in number job_id exit_code job_mem_opt
set job_id 0 set job_id 0
if { $shared } { if { $shared } {
spawn $sbatch -a$job -t1 -p$part --share -o/dev/null $file_in spawn $sbatch -a$job -t1 $job_mem_opt -p$part --share -o/dev/null $file_in
expect { expect {
-re "Submitted batch job ($number)" { -re "Submitted batch job ($number)" {
set job_id $expect_out(1,string) set job_id $expect_out(1,string)
...@@ -166,7 +180,7 @@ proc sub_job { job shared part } { ...@@ -166,7 +180,7 @@ proc sub_job { job shared part } {
} }
} }
} else { } else {
spawn $sbatch -a$job -t1 -p$part -o/dev/null $file_in spawn $sbatch -a$job -t1 $job_mem_opt -p$part -o/dev/null $file_in
expect { expect {
-re "Submitted batch job ($number)" { -re "Submitted batch job ($number)" {
set job_id $expect_out(1,string) set job_id $expect_out(1,string)
......
...@@ -56,7 +56,7 @@ if {![test_select_type_params "Memory"]} { ...@@ -56,7 +56,7 @@ if {![test_select_type_params "Memory"]} {
} elseif {[test_launch_poe]} { } elseif {[test_launch_poe]} {
set mem_per_step 200 set mem_per_step 200
} else { } else {
set mem_per_step 1 set mem_per_step 4
} }
# #
......
0% Loading. Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment