Skip to content
Snippets Groups Projects
Commit 136fdc76 authored by Moe Jette's avatar Moe Jette
Browse files

add calls to slurm_attr_init() before calls to pthread_create()

in order to get a decent stack size (~2k per thread on AIX).
parent 60659648
No related branches found
No related tags found
No related merge requests found
...@@ -100,6 +100,7 @@ extern allocation_msg_thread_t *slurm_allocation_msg_thr_create( ...@@ -100,6 +100,7 @@ extern allocation_msg_thread_t *slurm_allocation_msg_thr_create(
uint16_t *port, uint16_t *port,
const slurm_allocation_callbacks_t *callbacks) const slurm_allocation_callbacks_t *callbacks)
{ {
pthread_attr_t attr;
int sock = -1; int sock = -1;
eio_obj_t *obj; eio_obj_t *obj;
struct allocation_msg_thread *msg_thr = NULL; struct allocation_msg_thread *msg_thr = NULL;
...@@ -133,13 +134,16 @@ extern allocation_msg_thread_t *slurm_allocation_msg_thr_create( ...@@ -133,13 +134,16 @@ extern allocation_msg_thread_t *slurm_allocation_msg_thr_create(
msg_thr->handle = eio_handle_create(); msg_thr->handle = eio_handle_create();
eio_new_initial_obj(msg_thr->handle, obj); eio_new_initial_obj(msg_thr->handle, obj);
pthread_mutex_lock(&msg_thr_start_lock); pthread_mutex_lock(&msg_thr_start_lock);
if (pthread_create(&msg_thr->id, NULL, slurm_attr_init(&attr);
if (pthread_create(&msg_thr->id, &attr,
_msg_thr_internal, (void *)msg_thr->handle) != 0) { _msg_thr_internal, (void *)msg_thr->handle) != 0) {
error("pthread_create of message thread: %m"); error("pthread_create of message thread: %m");
slurm_attr_destroy(&attr);
eio_handle_destroy(msg_thr->handle); eio_handle_destroy(msg_thr->handle);
xfree(msg_thr); xfree(msg_thr);
return NULL; return NULL;
} }
slurm_attr_destroy(&attr);
/* Wait until the message thread has blocked signals /* Wait until the message thread has blocked signals
before continuing. */ before continuing. */
pthread_cond_wait(&msg_thr_start_cond, &msg_thr_start_lock); pthread_cond_wait(&msg_thr_start_cond, &msg_thr_start_lock);
......
...@@ -560,22 +560,20 @@ struct step_launch_state *step_launch_state_create(slurm_step_ctx_t *ctx) ...@@ -560,22 +560,20 @@ struct step_launch_state *step_launch_state_create(slurm_step_ctx_t *ctx)
slurm_step_layout_t *layout = ctx->step_resp->step_layout; slurm_step_layout_t *layout = ctx->step_resp->step_layout;
sls = xmalloc(sizeof(struct step_launch_state)); sls = xmalloc(sizeof(struct step_launch_state));
if (sls != NULL) { sls->slurmctld_socket_fd = -1;
sls->slurmctld_socket_fd = -1; sls->tasks_requested = layout->task_cnt;
sls->tasks_requested = layout->task_cnt; sls->tasks_started = bit_alloc(layout->task_cnt);
sls->tasks_started = bit_alloc(layout->task_cnt); sls->tasks_exited = bit_alloc(layout->task_cnt);
sls->tasks_exited = bit_alloc(layout->task_cnt); sls->layout = layout;
sls->layout = layout; sls->resp_port = NULL;
sls->resp_port = NULL; sls->abort = false;
sls->abort = false; sls->abort_action_taken = false;
sls->abort_action_taken = false; sls->mpi_info->jobid = ctx->step_req->job_id;
sls->mpi_info->jobid = ctx->step_req->job_id; sls->mpi_info->stepid = ctx->step_resp->job_step_id;
sls->mpi_info->stepid = ctx->step_resp->job_step_id; sls->mpi_info->step_layout = layout;
sls->mpi_info->step_layout = layout; sls->mpi_state = NULL;
sls->mpi_state = NULL; pthread_mutex_init(&sls->lock, NULL);
pthread_mutex_init(&sls->lock, NULL); pthread_cond_init(&sls->cond, NULL);
pthread_cond_init(&sls->cond, NULL);
}
return sls; return sls;
} }
...@@ -621,7 +619,8 @@ static int _msg_thr_create(struct step_launch_state *sls, int num_nodes) ...@@ -621,7 +619,8 @@ static int _msg_thr_create(struct step_launch_state *sls, int num_nodes)
int sock = -1; int sock = -1;
short port = -1; short port = -1;
eio_obj_t *obj; eio_obj_t *obj;
int i; int i, rc = SLURM_SUCCESS;
pthread_attr_t attr;
debug("Entering _msg_thr_create()"); debug("Entering _msg_thr_create()");
slurm_uid = (uid_t) slurm_get_slurm_user_id(); slurm_uid = (uid_t) slurm_get_slurm_user_id();
...@@ -646,12 +645,15 @@ static int _msg_thr_create(struct step_launch_state *sls, int num_nodes) ...@@ -646,12 +645,15 @@ static int _msg_thr_create(struct step_launch_state *sls, int num_nodes)
eio_new_initial_obj(sls->msg_handle, obj); eio_new_initial_obj(sls->msg_handle, obj);
} }
slurm_attr_init(&attr);
if (pthread_create(&sls->msg_thread, NULL, if (pthread_create(&sls->msg_thread, NULL,
_msg_thr_internal, (void *)sls) != 0) { _msg_thr_internal, (void *)sls) != 0) {
error("pthread_create of message thread: %m"); error("pthread_create of message thread: %m");
return SLURM_ERROR;
rc = SLURM_ERROR;
} }
return SLURM_SUCCESS; slurm_attr_destroy(&attr);
return rc;
} }
static bool _message_socket_readable(eio_obj_t *obj) static bool _message_socket_readable(eio_obj_t *obj)
......
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment