Skip to content
GitLab
Explore
Sign in
Primary navigation
Search or go to…
Project
S
Slurm
Manage
Activity
Members
Labels
Plan
Issues
Issue boards
Milestones
Code
Merge requests
Repository
Branches
Commits
Tags
Repository graph
Compare revisions
Snippets
Build
Pipelines
Jobs
Pipeline schedules
Artifacts
Deploy
Releases
Package registry
Model registry
Operate
Environments
Terraform modules
Monitor
Incidents
Service Desk
Analyze
Value stream analytics
Contributor analytics
CI/CD analytics
Repository analytics
Model experiments
Help
Help
Support
GitLab documentation
Compare GitLab plans
Community forum
Contribute to GitLab
Provide feedback
Terms and privacy
Keyboard shortcuts
?
Snippets
Groups
Projects
Show more breadcrumbs
tud-zih-energy
Slurm
Commits
57788a07
Commit
57788a07
authored
11 years ago
by
David Gloe
Committed by
Danny Auble
11 years ago
Browse files
Options
Downloads
Patches
Plain Diff
CRAY - Move port functions to new file
parent
44673064
No related branches found
No related tags found
No related merge requests found
Changes
2
Hide whitespace changes
Inline
Side-by-side
Showing
2 changed files
src/plugins/switch/cray/ports.c
+153
-0
153 additions, 0 deletions
src/plugins/switch/cray/ports.c
src/plugins/switch/cray/switch_cray.c
+2
-98
2 additions, 98 deletions
src/plugins/switch/cray/switch_cray.c
with
155 additions
and
98 deletions
src/plugins/switch/cray/ports.c
0 → 100644
+
153
−
0
View file @
57788a07
/*****************************************************************************\
* ports.c - Library for managing a switch on a Cray system.
*****************************************************************************
* Copyright (C) 2014 SchedMD LLC
* Copyright 2014 Cray Inc. All Rights Reserved.
* Written by David Gloe <c16817@cray.com>
*
* This file is part of SLURM, a resource management program.
* For details, see <http://slurm.schedmd.com/>.
* Please also read the included file: DISCLAIMER.
*
* SLURM is free software; you can redistribute it and/or modify it under
* the terms of the GNU General Public License as published by the Free
* Software Foundation; either version 2 of the License, or (at your option)
* any later version.
*
* In addition, as a special exception, the copyright holders give permission
* to link the code of portions of this program with the OpenSSL library under
* certain conditions as described in each individual source file, and
* distribute linked combinations including the two. You must obey the GNU
* General Public License in all respects for all of the code used other than
* OpenSSL. If you modify file(s) with this exception, you may extend this
* exception to your version of the file(s), but you are not obligated to do
* so. If you do not wish to do so, delete this exception statement from your
* version. If you delete this exception statement from all source files in
* the program, then also delete it here.
*
* SLURM is distributed in the hope that it will be useful, but WITHOUT ANY
* WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
* FOR A PARTICULAR PURPOSE. See the GNU General Public License for more
* details.
*
* You should have received a copy of the GNU General Public License along
* with SLURM; if not, write to the Free Software Foundation, Inc.,
* 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
\*****************************************************************************/
#include
"switch_cray.h"
#ifdef HAVE_NATIVE_CRAY
#include
<unistd.h>
// Global variables
/*
 * Bitmap of reserved ports. assign_port() sets bit N when it hands out
 * port (MIN_PORT + N), and release_port() clears it again.
 * Defined as NULL here; it is not allocated anywhere in this file
 * (presumably allocated during plugin initialization -- TODO confirm).
 */
bitstr_t
*
port_resv
=
NULL
;
/*
 * Index (not the real port number) of the port most recently handed out
 * by assign_port(); the next search starts at the following index.
 */
uint32_t
last_alloc_port
=
0
;
/*
 * Held by assign_port() and release_port() around every access they make
 * to port_resv and last_alloc_port.
 */
pthread_mutex_t
port_mutex
=
PTHREAD_MUTEX_INITIALIZER
;
/*
 * Function: assign_port
 * Description:
 *  Looks for and assigns the next free port.  This port is used by Cray's
 *  PMI for its communications to manage its control tree.
 *
 *  To avoid port conflicts, this function selects a large range of
 *  ports within the middle of the port range where it assumes no
 *  ports are used.  No special precautions are taken to handle a
 *  selected port already in use by some other non-SLURM component
 *  on the node.
 *
 *  The search starts just after the most recently assigned index and
 *  wraps around at PORT_CNT.  After every complete sweep of the table
 *  the mutex is dropped for one second so that other threads get a
 *  chance to release ports.  After ATTEMPTS complete sweeps without
 *  finding a free entry the call fails.
 *
 * Parameters:
 *  real_port - OUT: receives the assigned port number (table index plus
 *              MIN_PORT).  Left untouched on failure.
 *
 * Returns:
 *  0 on success and -1 on failure (NULL argument, reserved port table
 *  not allocated, or no free port found).
 */
int assign_port(uint32_t *real_port)
{
	int port, attempts = 0;

	if (!real_port) {
		CRAY_ERR("real_port address was NULL.");
		return -1;
	}

	pthread_mutex_lock(&port_mutex);

	/*
	 * port_resv is defined as NULL in this file; refuse to touch the
	 * table until it has been allocated.
	 */
	if (!port_resv) {
		pthread_mutex_unlock(&port_mutex);
		CRAY_ERR("Reserved port table is not allocated.");
		return -1;
	}

	/*
	 * Ports is an index into the reserved port table.
	 * The ports range from 0 up to PORT_CNT.
	 */
	last_alloc_port++;
	port = last_alloc_port % PORT_CNT;

	/*
	 * Find an unreserved port to assign.
	 * Abandon the attempt if we've been through the available ports
	 * ATTEMPTS number of times.
	 */
	while (bit_test(port_resv, port)) {
		port = (port + 1) % PORT_CNT;
		attempts++;

		if ((attempts / PORT_CNT) >= ATTEMPTS) {
			/* Release the lock before logging the failure. */
			pthread_mutex_unlock(&port_mutex);
			CRAY_ERR("No free ports among %d ports. "
				 "Went through entire port list %d times",
				 PORT_CNT, ATTEMPTS);
			return -1;
		}

		if ((attempts % PORT_CNT) == 0) {
			/*
			 * Each time through give other threads a chance
			 * to release ports.  The loop condition re-tests
			 * the current entry once the lock is held again.
			 */
			pthread_mutex_unlock(&port_mutex);
			sleep(1);
			pthread_mutex_lock(&port_mutex);
		}
	}

	bit_set(port_resv, port);
	last_alloc_port = port;
	pthread_mutex_unlock(&port_mutex);

	/*
	 * The port index must be scaled up by the MIN_PORT.
	 */
	*real_port = port + MIN_PORT;
	return 0;
}
/*
 * Function: release_port
 * Description:
 *  Release a port previously handed out by assign_port() by clearing
 *  its bit in the reserved port table.
 *
 * Parameters:
 *  real_port - IN: the real port number (table index plus MIN_PORT).
 *
 * Returns:
 *  0 on success and -1 on failure (port outside MIN_PORT..MAX_PORT, or
 *  the port was not marked as reserved).
 */
int release_port(uint32_t real_port)
{
	uint32_t port;
	int rc = 0;

	/*
	 * NOTE(review): assign_port() hands out indices in [0, PORT_CNT).
	 * If PORT_CNT is (MAX_PORT - MIN_PORT + 1), port MAX_PORT can be
	 * assigned but is rejected here and would never be released --
	 * confirm against the PORT_CNT definition.
	 */
	if ((real_port < MIN_PORT) || (real_port >= MAX_PORT)) {
		CRAY_ERR("Port %" PRIu32 " outside of valid range %" PRIu32
			 " : %" PRIu32, real_port, (uint32_t) MIN_PORT,
			 (uint32_t) MAX_PORT);
		return -1;
	}

	/* Convert the real port number back into a table index. */
	port = real_port - MIN_PORT;

	pthread_mutex_lock(&port_mutex);
	/* An unallocated table has no reserved ports at all. */
	if (port_resv && bit_test(port_resv, port))
		bit_clear(port_resv, port);
	else
		rc = -1;
	pthread_mutex_unlock(&port_mutex);

	if (rc != 0) {
		/* real_port is a uint32_t, so it must not be printed with %d */
		CRAY_ERR("Attempting to release port %" PRIu32 ","
			 " but it was not reserved.", real_port);
	}

	return rc;
}
#endif
This diff is collapsed.
Click to expand it.
src/plugins/switch/cray/switch_cray.c
+
2
−
98
View file @
57788a07
...
...
@@ -580,7 +580,7 @@ int switch_p_build_jobinfo(switch_jobinfo_t *switch_job,
/*
* Get a unique port for PMI communications
*/
rc
=
_
assign_port
(
&
port
);
rc
=
assign_port
(
&
port
);
if
(
rc
<
0
)
{
info
(
"(%s: %d: %s) assign_port failed"
,
THIS_FILE
,
__LINE__
,
__FUNCTION__
);
...
...
@@ -1434,7 +1434,7 @@ extern int switch_p_job_step_complete(switch_jobinfo_t *jobinfo,
* Release the reserved PMI port
* If this fails, do not exit with an error.
*/
rc
=
_
release_port
(
job
->
port
);
rc
=
release_port
(
job
->
port
);
if
(
rc
!=
0
)
{
error
(
"(%s: %d: %s) Releasing port %"
PRIu32
" failed."
,
THIS_FILE
,
__LINE__
,
__FUNCTION__
,
job
->
port
);
...
...
@@ -1591,102 +1591,6 @@ static int _get_cpu_total(void)
return
total
;
}
/*
* Function: assign_port
* Description:
* Looks for and assigns the next free port. This port is used by Cray's
* PMI for its communications to manage its control tree.
*
* To avoid port conflicts, this function selects a large range of
* ports within the middle of the port range where it assumes no
* ports are used. No special precautions are taken to handle a
* selected port already in use by some other non-SLURM component
* on the node.
*
* If there are no free ports, then it loops through the entire table
* ATTEMPTS number of times before declaring a failure.
*
* Returns:
* 0 on success and -1 on failure.
*/
static
int
_assign_port
(
uint32_t
*
real_port
)
{
int
port
,
tmp
,
attempts
=
0
;
if
(
!
real_port
)
{
error
(
"(%s: %d: %s) real_port address was NULL."
,
THIS_FILE
,
__LINE__
,
__FUNCTION__
);
return
-
1
;
}
/*
* Ports is an index into the reserved port table.
* The ports range from 0 up to PORT_CNT.
*/
port
=
++
last_alloc_port
%
PORT_CNT
;
/*
* Find an unreserved port to assign.
* Abandon the attempt if we've been through the available ports ATTEMPT
* number of times
*/
while
(
port_resv
[
port
]
==
1
)
{
tmp
=
++
port
%
PORT_CNT
;
port
=
tmp
;
attempts
++
;
if
((
attempts
/
PORT_CNT
)
>=
ATTEMPTS
)
{
error
(
"(%s: %d: %s) No free ports among %d ports. "
" Went through entire port list %d times"
,
THIS_FILE
,
__LINE__
,
__FUNCTION__
,
PORT_CNT
,
ATTEMPTS
);
return
-
1
;
}
}
port_resv
[
port
]
=
1
;
last_alloc_port
=
port
;
/*
* The port index must be scaled up by the MIN_PORT.
*/
*
real_port
=
(
port
+
MIN_PORT
);
return
0
;
}
/*
* Function: release_port
* Description:
* Release the port.
*
* Returns:
* 0 on success and -1 on failure.
*/
static
int
_release_port
(
uint32_t
real_port
)
{
uint32_t
port
;
if
((
real_port
<
MIN_PORT
)
||
(
real_port
>=
MAX_PORT
))
{
error
(
"(%s: %d: %s) Port %"
PRIu32
"outside of valid range %"
PRIu32
": %"
PRIu32
,
THIS_FILE
,
__LINE__
,
__FUNCTION__
,
real_port
,
MIN_PORT
,
MAX_PORT
);
return
-
1
;
}
port
=
real_port
-
MIN_PORT
;
if
(
port_resv
[
port
])
{
port_resv
[
port
]
=
0
;
}
else
{
error
(
"(%s: %d: %s) Attempting to release port %d,"
" but it was not reserved."
,
THIS_FILE
,
__LINE__
,
__FUNCTION__
,
real_port
);
return
-
1
;
}
return
0
;
}
/*
* Function: _free_alpsc_pe_info
* Description:
...
...
This diff is collapsed.
Click to expand it.
Preview
0%
Loading
Try again
or
attach a new file
.
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Save comment
Cancel
Please
register
or
sign in
to comment