From b6e99ea80011d1e3911e1ba2ae62143a90c5deab Mon Sep 17 00:00:00 2001 From: Moe Jette <jette1@llnl.gov> Date: Tue, 26 Sep 2006 16:45:21 +0000 Subject: [PATCH] Report a job's exit status in "scontrol show job". --- NEWS | 1 + doc/man/man1/scontrol.1 | 10 ++++++++-- slurm/slurm.h.in | 1 + src/api/job_info.c | 12 ++++++++++-- src/common/slurm_protocol_pack.c | 1 + src/slurmctld/job_mgr.c | 1 + src/slurmctld/slurmctld.h | 3 ++- 7 files changed, 24 insertions(+), 5 deletions(-) diff --git a/NEWS b/NEWS index a1345c7b217..caec6a36367 100644 --- a/NEWS +++ b/NEWS @@ -17,6 +17,7 @@ documents those changes that are of interest to users and admins. -- Removed addresses from slurm_step_layout_t -- Added new job field, "comment". Set by srun, salloc and sbatch. See with "scontrol show job". Used in sched/wiki2. + -- Report a job's exit status in "scontrol show job". * Changes in SLURM 1.2.0-pre2 ============================= diff --git a/doc/man/man1/scontrol.1 b/doc/man/man1/scontrol.1 index ccec95e2eba..3552eb4e28a 100644 --- a/doc/man/man1/scontrol.1 +++ b/doc/man/man1/scontrol.1 @@ -1,4 +1,4 @@ -.TH SCONTROL "1" "May 2006" "scontrol 1.2" "Slurm components" +.TH SCONTROL "1" "September 2006" "scontrol 1.2" "Slurm components" .SH "NAME" scontrol \- Used view and modify Slurm configuration and state. @@ -180,7 +180,7 @@ Display the version number of scontrol being executed. \fI!!\fP Repeat the last command executed. .TP -\fBSPECIFICATIONS FOR UPDATE COMMAND, JOBS\fR +\fBSPECIFICATIONS FOR SHOW AND UPDATE COMMANDS, JOBS\fR .TP \fIAccount\fP=<account> Account name to be changed for this job's resource use. @@ -194,6 +194,12 @@ Possible values are"YES" and "NO". Defer job's initiation until specified job_id completes. Cancel dependency with job_id value of "0", "Depedency=0". .TP +\fIExitCode\fP=<exit>:<sig> +Exit status reported for the job by the wait() function. +The first number is the exit code, typically as set by the exit() function. +The second number of the signal that caused the process to terminate if +it was terminated by a signal. +.TP \fIFeatures\fP=<features> Set the job's required features on nodes specified value. Multiple values may be comma separated if all features are required (AND operation) or diff --git a/slurm/slurm.h.in b/slurm/slurm.h.in index 9f6e44ed0cb..abbf1043257 100644 --- a/slurm/slurm.h.in +++ b/slurm/slurm.h.in @@ -470,6 +470,7 @@ typedef struct job_info { * start_range_2, .., -1 */ char *features; /* comma separated list of required features */ uint32_t dependency; /* defer until specified job completes */ + uint32_t exit_code; /* exit code for job (status from wait call) */ char *account; /* charge to specified account */ uint16_t wait_reason; /* reason job still pending, see * slurm.h:enum job_wait_reason */ diff --git a/src/api/job_info.c b/src/api/job_info.c index 92e007e51a5..5597d95d04e 100644 --- a/src/api/job_info.c +++ b/src/api/job_info.c @@ -47,6 +47,7 @@ #include <stdlib.h> #include <string.h> #include <sys/types.h> +#include <sys/wait.h> #include <time.h> #include <slurm/slurm.h> @@ -117,6 +118,7 @@ slurm_sprint_job_info ( job_info_t * job_ptr, int one_liner ) char tmp_line[128]; uint16_t quarter = (uint16_t) NO_VAL; uint16_t nodecard = (uint16_t) NO_VAL; + uint16_t term_sig = 0; char *out = NULL; #ifdef HAVE_BG @@ -178,9 +180,15 @@ slurm_sprint_job_info ( job_info_t * job_ptr, int one_liner ) if (job_ptr->time_limit == INFINITE) sprintf(tmp_line, "UNLIMITED"); else if (job_ptr->time_limit == NO_VAL) - sprintf(tmp_line, "Partition_Limit"); + sprintf(tmp_line, "Partition_Limit "); else - sprintf(tmp_line, "%u", job_ptr->time_limit); + sprintf(tmp_line, "%u ", job_ptr->time_limit); + xstrcat(out, tmp_line); + if (WIFSIGNALED(job_ptr->exit_code)) + term_sig = WTERMSIG(job_ptr->exit_code); + snprintf(tmp_line, sizeof(tmp_line), + "ExitCode=%u:%u", + WEXITSTATUS(job_ptr->exit_code), term_sig); xstrcat(out, tmp_line); if (one_liner) xstrcat(out, " "); diff --git a/src/common/slurm_protocol_pack.c b/src/common/slurm_protocol_pack.c index d33e191dd71..941b0d7a2f4 100644 --- a/src/common/slurm_protocol_pack.c +++ b/src/common/slurm_protocol_pack.c @@ -1929,6 +1929,7 @@ _unpack_job_info_members(job_info_t * job, Buf buffer) safe_unpackstr_xmalloc(&job->network, &uint16_tmp, buffer); safe_unpackstr_xmalloc(&job->comment, &uint16_tmp, buffer); safe_unpack32(&job->dependency, buffer); + safe_unpack32(&job->exit_code, buffer); safe_unpackstr_xmalloc(&job->name, &uint16_tmp, buffer); safe_unpackstr_xmalloc(&job->alloc_node, &uint16_tmp, buffer); diff --git a/src/slurmctld/job_mgr.c b/src/slurmctld/job_mgr.c index e1a37ddefb0..6e612e28ede 100644 --- a/src/slurmctld/job_mgr.c +++ b/src/slurmctld/job_mgr.c @@ -2797,6 +2797,7 @@ void pack_job(struct job_record *dump_job_ptr, Buf buffer) packstr(dump_job_ptr->network, buffer); packstr(dump_job_ptr->comment, buffer); pack32((uint32_t)dump_job_ptr->dependency, buffer); + pack32((uint32_t)dump_job_ptr->exit_code, buffer); packstr(dump_job_ptr->name, buffer); packstr(dump_job_ptr->alloc_node, buffer); diff --git a/src/slurmctld/slurmctld.h b/src/slurmctld/slurmctld.h index 67ecc367373..6566915f976 100644 --- a/src/slurmctld/slurmctld.h +++ b/src/slurmctld/slurmctld.h @@ -356,7 +356,8 @@ struct job_record { uint16_t mail_type; /* see MAIL_JOB_* in slurm.h */ char *mail_user; /* user to get e-mail notification */ uint32_t requid; /* requester user ID */ - uint32_t exit_code; /* exit code for the job */ + uint32_t exit_code; /* exit code for job (status from + * wait call) */ }; struct step_record { -- GitLab