diff --git a/doc/man/man5/slurm.conf.5 b/doc/man/man5/slurm.conf.5 index 1e3748f1959812ed4a31e24fecabf0f4c4148115..20a0c9af661d6362b846c31425f396cde0db63e0 100644 --- a/doc/man/man5/slurm.conf.5 +++ b/doc/man/man5/slurm.conf.5 @@ -1310,7 +1310,7 @@ and resumes communications). A DOWN node will become available for use upon registration with a valid configuration only if it was set DOWN due to being non\-responsive. If the node was set DOWN for any other reason (low memory, prolog failure, -epilog failure, silently rebooting, etc.), its state will not automatically +epilog failure, unexpected reboot, etc.), its state will not automatically be changed. .TP \fB2\fR diff --git a/src/slurmctld/node_mgr.c b/src/slurmctld/node_mgr.c index c27e4238665ae6bd9938b6d88f4ce1c90c673e93..edc8dec5b6f3f70ae62443ff8b35757075198ba7 100644 --- a/src/slurmctld/node_mgr.c +++ b/src/slurmctld/node_mgr.c @@ -1718,9 +1718,9 @@ extern int validate_node_specs(slurm_node_registration_status_msg_t *reg_msg) node_ptr->reason_uid = slurm_get_slurm_user_id(); node_ptr->reason = xstrdup( - "Node silently failed and came back"); + "Node unexpectedly rebooted"); } - info("Node %s silently failed and came back", + info("Node %s unexpectedly rebooted", reg_msg->node_name); _make_node_down(node_ptr, now); kill_running_job_by_node_name(reg_msg->node_name); @@ -1790,8 +1790,8 @@ static front_end_record_t * _front_end_reg( (front_end_ptr->boot_time > front_end_ptr->last_response) && (slurmctld_conf.ret2service != 2)) { set_front_end_down(front_end_ptr, - "Front end silently failed and came back"); - info("Front end %s silently failed and came back", + "Front end unexpectedly rebooted"); + info("Front end %s unexpectedly rebooted", reg_msg->node_name); reg_msg->job_count = 0; }