blob: 46d481ee54d5434a30b37e2631515686da362d9a [file] [log] [blame]
/*****************************************************************************\
* opt.c - options processing for srun
* $Id$
*****************************************************************************
* Copyright (C) 2002-2006 The Regents of the University of California.
* Produced at Lawrence Livermore National Laboratory (cf, DISCLAIMER).
* Written by Mark Grondona <grondona1@llnl.gov>, et. al.
* UCRL-CODE-217948.
*
* This file is part of SLURM, a resource management program.
* For details, see <http://www.llnl.gov/linux/slurm/>.
*
* SLURM is free software; you can redistribute it and/or modify it under
* the terms of the GNU General Public License as published by the Free
* Software Foundation; either version 2 of the License, or (at your option)
* any later version.
*
* In addition, as a special exception, the copyright holders give permission
* to link the code of portions of this program with the OpenSSL library under
* certain conditions as described in each individual source file, and
* distribute linked combinations including the two. You must obey the GNU
* General Public License in all respects for all of the code used other than
* OpenSSL. If you modify file(s) with this exception, you may extend this
* exception to your version of the file(s), but you are not obligated to do
* so. If you do not wish to do so, delete this exception statement from your
* version. If you delete this exception statement from all source files in
* the program, then also delete it here.
*
* SLURM is distributed in the hope that it will be useful, but WITHOUT ANY
* WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
* FOR A PARTICULAR PURPOSE. See the GNU General Public License for more
* details.
*
* You should have received a copy of the GNU General Public License along
* with SLURM; if not, write to the Free Software Foundation, Inc.,
* 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
\*****************************************************************************/
#if HAVE_CONFIG_H
# include "config.h"
#endif
#include <string.h> /* strcpy, strncasecmp */
#ifdef HAVE_STRINGS_H
# include <strings.h>
#endif
#ifndef _GNU_SOURCE
# define _GNU_SOURCE
#endif
#if HAVE_GETOPT_H
# include <getopt.h>
#else
# include "src/common/getopt.h"
#endif
#include <fcntl.h>
#include <stdarg.h> /* va_start */
#include <stdio.h>
#include <stdlib.h> /* getenv */
#include <pwd.h> /* getpwuid */
#include <ctype.h> /* isdigit */
#include <sys/param.h> /* MAXPATHLEN */
#include <sys/stat.h>
#include <unistd.h>
#include <sys/stat.h>
#include <sys/types.h>
#include <sys/utsname.h>
#include "src/common/list.h"
#include "src/common/log.h"
#include "src/common/parse_time.h"
#include "src/common/slurm_protocol_api.h"
#include "src/common/slurm_protocol_interface.h"
#include "src/common/uid.h"
#include "src/common/xmalloc.h"
#include "src/common/xstring.h"
#include "src/common/slurm_rlimits_info.h"
#include "src/common/plugstack.h"
#include "src/common/optz.h"
#include "src/srun/opt.h"
#include "src/srun/attach.h"
#include "src/common/mpi.h"
/* generic OPT_ definitions -- mainly for use with env vars */
#define OPT_NONE 0x00
#define OPT_INT 0x01
#define OPT_STRING 0x02
#define OPT_DISTRIB 0x04
#define OPT_NODES 0x05
#define OPT_OVERCOMMIT 0x06
#define OPT_CORE 0x07
#define OPT_CONN_TYPE 0x08
#define OPT_NO_ROTATE 0x0a
#define OPT_GEOMETRY 0x0b
#define OPT_MPI 0x0c
#define OPT_CPU_BIND 0x0d
#define OPT_MEM_BIND 0x0e
#define OPT_MULTI 0x0f
#define OPT_EXCLUSIVE 0x10
/* generic getopt_long flags, integers and *not* valid characters */
#define LONG_OPT_HELP 0x100
#define LONG_OPT_USAGE 0x101
#define LONG_OPT_XTO 0x102
#define LONG_OPT_LAUNCH 0x103
#define LONG_OPT_TIMEO 0x104
#define LONG_OPT_JOBID 0x105
#define LONG_OPT_TMP 0x106
#define LONG_OPT_MEM 0x107
#define LONG_OPT_MINCPU 0x108
#define LONG_OPT_CONT 0x109
#define LONG_OPT_UID 0x10a
#define LONG_OPT_GID 0x10b
#define LONG_OPT_MPI 0x10c
#define LONG_OPT_CORE 0x10e
#define LONG_OPT_NOSHELL 0x10f
#define LONG_OPT_DEBUG_TS 0x110
#define LONG_OPT_CONNTYPE 0x111
#define LONG_OPT_TEST_ONLY 0x113
#define LONG_OPT_NETWORK 0x114
#define LONG_OPT_EXCLUSIVE 0x115
#define LONG_OPT_PROPAGATE 0x116
#define LONG_OPT_PROLOG 0x117
#define LONG_OPT_EPILOG 0x118
#define LONG_OPT_BEGIN 0x119
#define LONG_OPT_MAIL_TYPE 0x11a
#define LONG_OPT_MAIL_USER 0x11b
#define LONG_OPT_TASK_PROLOG 0x11c
#define LONG_OPT_TASK_EPILOG 0x11d
#define LONG_OPT_NICE 0x11e
#define LONG_OPT_CPU_BIND 0x11f
#define LONG_OPT_MEM_BIND 0x120
#define LONG_OPT_CTRL_COMM_IFHN 0x121
#define LONG_OPT_MULTI 0x122
#define LONG_OPT_COMMENT 0x123
#define LONG_OPT_GET_USER_ENV 0x145
/*---- forward declarations of static functions ----*/
typedef struct env_vars env_vars_t;
/* return command name from its full path name */
static char * _base_name(char* command);
static List _create_path_list(void);
/* Get a decimal integer from arg */
static int _get_int(const char *arg, const char *what);
static void _help(void);
/* load a multi-program configuration file */
static void _load_multi(int *argc, char **argv);
/* fill in default options */
static void _opt_default(void);
/* set options based upon env vars */
static void _opt_env(void);
static void _opt_args(int argc, char **argv);
/* list known options and their settings */
static void _opt_list(void);
/* verify options sanity */
static bool _opt_verify(void);
static void _print_version(void);
static void _process_env_var(env_vars_t *e, const char *val);
static uint16_t _parse_mail_type(const char *arg);
static char *_print_mail_type(const uint16_t type);
/* search PATH for command returns full path */
static char *_search_path(char *, bool, int);
static long _to_bytes(const char *arg);
static bool _under_parallel_debugger(void);
static void _usage(void);
static bool _valid_node_list(char **node_list_pptr);
static enum task_dist_states _verify_dist_type(const char *arg);
static bool _verify_node_count(const char *arg, int *min, int *max);
static int _verify_cpu_bind(const char *arg, char **cpu_bind,
cpu_bind_type_t *cpu_bind_type);
static int _verify_geometry(const char *arg, uint16_t *geometry);
static int _verify_mem_bind(const char *arg, char **mem_bind,
mem_bind_type_t *mem_bind_type);
static int _verify_conn_type(const char *arg);
/*---[ end forward declarations of static functions ]---------------------*/
int initialize_and_process_args(int argc, char *argv[])
{
/* initialize option defaults */
_opt_default();
/* initialize options with env vars */
_opt_env();
/* initialize options with argv */
_opt_args(argc, argv);
if (_verbose > 3)
_opt_list();
return 1;
}
static void _print_version(void)
{
printf("%s %s\n", PACKAGE, SLURM_VERSION);
}
/*
* If the node list supplied is a file name, translate that into
* a list of nodes, we orphan the data pointed to
* RET true if the node list is a valid one
*/
static bool _valid_node_list(char **node_list_pptr)
{
char *nodelist = NULL;
if (strchr(*node_list_pptr, '/') == NULL)
return true; /* not a file name */
/* If we are using Arbitrary and we specified the number of
procs to use then we need exactly this many since we are
saying, lay it out this way! Same for max and min nodes.
Other than that just read in as many in the hostfile */
if(opt.distribution == SLURM_DIST_ARBITRARY) {
if(opt.nprocs_set)
nodelist = slurm_read_hostfile(*node_list_pptr,
opt.nprocs);
else if(opt.max_nodes)
nodelist = slurm_read_hostfile(*node_list_pptr,
opt.max_nodes);
else if(opt.min_nodes)
nodelist = slurm_read_hostfile(*node_list_pptr,
opt.min_nodes);
} else
nodelist = slurm_read_hostfile(*node_list_pptr, NO_VAL);
if (nodelist == NULL)
return false;
xfree(*node_list_pptr);
*node_list_pptr = xstrdup(nodelist);
free(nodelist);
return true;
}
/*
* verify that a distribution type in arg is of a known form
* returns the task_dist_states or SLURM_DIST_UNKNOWN
*/
static enum task_dist_states _verify_dist_type(const char *arg)
{
int len = strlen(arg);
enum task_dist_states result = SLURM_DIST_UNKNOWN;
if (strncasecmp(arg, "cyclic", len) == 0)
result = SLURM_DIST_CYCLIC;
else if (strncasecmp(arg, "block", len) == 0)
result = SLURM_DIST_BLOCK;
else if ((strncasecmp(arg, "arbitrary", len) == 0) ||
(strncasecmp(arg, "hostfile", len) == 0))
result = SLURM_DIST_ARBITRARY;
return result;
}
/*
* verify that a connection type in arg is of known form
* returns the connection_type or -1 if not recognized
*/
static int _verify_conn_type(const char *arg)
{
int len = strlen(arg);
if (!strncasecmp(arg, "MESH", len))
return SELECT_MESH;
else if (!strncasecmp(arg, "TORUS", len))
return SELECT_TORUS;
else if (!strncasecmp(arg, "NAV", len))
return SELECT_NAV;
error("invalid --conn-type argument %s ignored.", arg);
return -1;
}
/*
* verify geometry arguments, must have proper count
* returns -1 on error, 0 otherwise
*/
static int _verify_geometry(const char *arg, uint16_t *geometry)
{
char* token, *delimiter = ",x", *next_ptr;
int i, rc = 0;
char* geometry_tmp = xstrdup(arg);
char* original_ptr = geometry_tmp;
token = strtok_r(geometry_tmp, delimiter, &next_ptr);
for (i=0; i<SYSTEM_DIMENSIONS; i++) {
if (token == NULL) {
error("insufficient dimensions in --geometry");
rc = -1;
break;
}
geometry[i] = (uint16_t)atoi(token);
if (geometry[i] == 0 || geometry[i] == (uint16_t)NO_VAL) {
error("invalid --geometry argument");
rc = -1;
break;
}
geometry_tmp = next_ptr;
token = strtok_r(geometry_tmp, delimiter, &next_ptr);
}
if (token != NULL) {
error("too many dimensions in --geometry");
rc = -1;
}
if (original_ptr)
xfree(original_ptr);
return rc;
}
/*
* verify cpu_bind arguments
* returns -1 on error, 0 otherwise
*/
static int _verify_cpu_bind(const char *arg, char **cpu_bind,
cpu_bind_type_t *cpu_bind_type)
{
char *buf = xstrdup(arg);
char *pos = buf;
/* we support different launch policy names
* we also allow a verbose setting to be specified
* --cpu_bind=v
* --cpu_bind=rank,v
* --cpu_bind=rank
* --cpu_bind={MAP_CPU|MAP_MASK}:0,1,2,3,4
*/
if (*pos) {
/* parse --cpu_bind command line arguments */
bool fl_cpubind_verbose = 0;
char *cmd_line_affinity = NULL;
char *cmd_line_mapping = NULL;
char *mappos = strchr(pos,':');
if (!mappos) {
mappos = strchr(pos,'=');
}
if (strncasecmp(pos, "quiet", 5) == 0) {
fl_cpubind_verbose=0;
pos+=5;
} else if (*pos=='q' || *pos=='Q') {
fl_cpubind_verbose=0;
pos++;
}
if (strncasecmp(pos, "verbose", 7) == 0) {
fl_cpubind_verbose=1;
pos+=7;
} else if (*pos=='v' || *pos=='V') {
fl_cpubind_verbose=1;
pos++;
}
if (*pos==',') {
pos++;
}
if (*pos) {
char *vpos=NULL;
cmd_line_affinity = pos;
if (((vpos=strstr(pos,",q")) !=0 ) ||
((vpos=strstr(pos,",Q")) !=0 )) {
*vpos='\0';
fl_cpubind_verbose=0;
}
if (((vpos=strstr(pos,",v")) !=0 ) ||
((vpos=strstr(pos,",V")) !=0 )) {
*vpos='\0';
fl_cpubind_verbose=1;
}
}
if (mappos) {
*mappos='\0';
mappos++;
cmd_line_mapping=mappos;
}
/* convert parsed command line args into interface */
if (cmd_line_mapping) {
xfree(*cpu_bind);
*cpu_bind = xstrdup(cmd_line_mapping);
}
if (fl_cpubind_verbose) {
*cpu_bind_type |= CPU_BIND_VERBOSE;
}
if (cmd_line_affinity) {
*cpu_bind_type &= CPU_BIND_VERBOSE; /* clear any
* previous type */
if ((strcasecmp(cmd_line_affinity, "no") == 0) ||
(strcasecmp(cmd_line_affinity, "none") == 0)) {
*cpu_bind_type |= CPU_BIND_NONE;
} else if (strcasecmp(cmd_line_affinity, "rank") == 0) {
*cpu_bind_type |= CPU_BIND_RANK;
} else if ((strcasecmp(cmd_line_affinity, "map_cpu") == 0) ||
(strcasecmp(cmd_line_affinity, "mapcpu") == 0)) {
*cpu_bind_type |= CPU_BIND_MAPCPU;
} else if ((strcasecmp(cmd_line_affinity, "mask_cpu") == 0) ||
(strcasecmp(cmd_line_affinity, "maskcpu") == 0)) {
*cpu_bind_type |= CPU_BIND_MASKCPU;
} else {
error("unrecognized --cpu_bind argument \"%s\"",
cmd_line_affinity);
xfree(buf);
return 1;
}
}
}
xfree(buf);
return 0;
}
/*
* verify mem_bind arguments
* returns -1 on error, 0 otherwise
*/
static int _verify_mem_bind(const char *arg, char **mem_bind,
mem_bind_type_t *mem_bind_type)
{
char *buf = xstrdup(arg);
char *pos = buf;
/* we support different launch policy names
* we also allow a verbose setting to be specified
* --mem_bind=v
* --mem_bind=rank,v
* --mem_bind=rank
* --mem_bind={MAP_CPU|MAP_MASK}:0,1,2,3,4
*/
if (*pos) {
/* parse --mem_bind command line arguments */
bool fl_membind_verbose = 0;
char *cmd_line_affinity = NULL;
char *cmd_line_mapping = NULL;
char *mappos = strchr(pos,':');
if (!mappos) {
mappos = strchr(pos,'=');
}
if (strncasecmp(pos, "quiet", 5) == 0) {
fl_membind_verbose = 0;
pos+=5;
} else if (*pos=='q' || *pos=='Q') {
fl_membind_verbose = 0;
pos++;
}
if (strncasecmp(pos, "verbose", 7) == 0) {
fl_membind_verbose = 1;
pos+=7;
} else if (*pos=='v' || *pos=='V') {
fl_membind_verbose = 1;
pos++;
}
if (*pos==',') {
pos++;
}
if (*pos) {
char *vpos=NULL;
cmd_line_affinity = pos;
if (((vpos=strstr(pos,",q")) !=0 ) ||
((vpos=strstr(pos,",Q")) !=0 )) {
*vpos='\0';
fl_membind_verbose = 0;
}
if (((vpos=strstr(pos,",v")) !=0 ) ||
((vpos=strstr(pos,",V")) !=0 )) {
*vpos='\0';
fl_membind_verbose = 1;
}
}
if (mappos) {
*mappos='\0';
mappos++;
cmd_line_mapping=mappos;
}
/* convert parsed command line args into interface */
if (cmd_line_mapping) {
xfree(*mem_bind);
*mem_bind = xstrdup(cmd_line_mapping);
}
if (fl_membind_verbose) {
*mem_bind_type |= MEM_BIND_VERBOSE;
}
if (cmd_line_affinity) {
*mem_bind_type &= MEM_BIND_VERBOSE; /* clear any
* previous type */
if ((strcasecmp(cmd_line_affinity, "no") == 0) ||
(strcasecmp(cmd_line_affinity, "none") == 0)) {
*mem_bind_type |= MEM_BIND_NONE;
} else if (strcasecmp(cmd_line_affinity, "rank") == 0) {
*mem_bind_type |= MEM_BIND_RANK;
} else if (strcasecmp(cmd_line_affinity, "local") == 0) {
*mem_bind_type |= MEM_BIND_LOCAL;
} else if ((strcasecmp(cmd_line_affinity, "map_mem") == 0) ||
(strcasecmp(cmd_line_affinity, "mapmem") == 0)) {
*mem_bind_type |= MEM_BIND_MAPCPU;
} else if ((strcasecmp(cmd_line_affinity, "mask_mem") == 0) ||
(strcasecmp(cmd_line_affinity, "maskmem") == 0)) {
*mem_bind_type |= MEM_BIND_MASKCPU;
} else {
error("unrecognized --mem_bind argument \"%s\"",
cmd_line_affinity);
xfree(buf);
return 1;
}
}
}
xfree(buf);
return 0;
}
/*
* verify that a node count in arg is of a known form (count or min-max)
* OUT min, max specified minimum and maximum node counts
* RET true if valid
*/
static bool
_verify_node_count(const char *arg, int *min_nodes, int *max_nodes)
{
char *end_ptr;
double val1, val2;
val1 = strtod(arg, &end_ptr);
if (end_ptr[0] == 'k' || end_ptr[0] == 'K') {
val1 *= 1024;
end_ptr++;
}
if (end_ptr[0] == '\0') {
*min_nodes = val1;
return true;
}
if (end_ptr[0] != '-')
return false;
val2 = strtod(&end_ptr[1], &end_ptr);
if (end_ptr[0] == 'k' || end_ptr[0] == 'K') {
val2 *= 1024;
end_ptr++;
}
if (end_ptr[0] == '\0') {
*min_nodes = val1;
*max_nodes = val2;
return true;
} else
return false;
}
/* return command name from its full path name */
static char * _base_name(char* command)
{
char *char_ptr, *name;
int i;
if (command == NULL)
return NULL;
char_ptr = strrchr(command, (int)'/');
if (char_ptr == NULL)
char_ptr = command;
else
char_ptr++;
i = strlen(char_ptr);
name = xmalloc(i+1);
strcpy(name, char_ptr);
return name;
}
/*
* _to_bytes(): verify that arg is numeric with optional "G" or "M" at end
* if "G" or "M" is there, multiply by proper power of 2 and return
* number in bytes
*/
static long _to_bytes(const char *arg)
{
char *buf;
char *endptr;
int end;
int multiplier = 1;
long result;
buf = xstrdup(arg);
end = strlen(buf) - 1;
if (isdigit(buf[end])) {
result = strtol(buf, &endptr, 10);
if (*endptr != '\0')
result = -result;
} else {
switch (toupper(buf[end])) {
case 'G':
multiplier = 1024;
break;
case 'M':
/* do nothing */
break;
default:
multiplier = -1;
}
buf[end] = '\0';
result = multiplier * strtol(buf, &endptr, 10);
if (*endptr != '\0')
result = -result;
}
return result;
}
/*
* print error message to stderr with opt.progname prepended
*/
#undef USE_ARGERROR
#if USE_ARGERROR
static void argerror(const char *msg, ...)
{
va_list ap;
char buf[256];
va_start(ap, msg);
vsnprintf(buf, sizeof(buf), msg, ap);
fprintf(stderr, "%s: %s\n",
opt.progname ? opt.progname : "srun", buf);
va_end(ap);
}
#else
# define argerror error
#endif /* USE_ARGERROR */
/*
* _opt_default(): used by initialize_and_process_args to set defaults
*/
static void _opt_default()
{
char buf[MAXPATHLEN + 1];
struct passwd *pw;
int i;
char hostname[64];
if ((pw = getpwuid(getuid())) != NULL) {
strncpy(opt.user, pw->pw_name, MAX_USERNAME);
opt.uid = pw->pw_uid;
} else
error("who are you?");
opt.gid = getgid();
if ((getcwd(buf, MAXPATHLEN)) == NULL)
fatal("getcwd failed: %m");
opt.cwd = xstrdup(buf);
opt.cwd_set = false;
opt.progname = NULL;
opt.nprocs = 1;
opt.nprocs_set = false;
opt.cpus_per_task = 1;
opt.cpus_set = false;
opt.min_nodes = 1;
opt.max_nodes = 0;
opt.nodes_set = false;
opt.cpu_bind_type = 0;
opt.cpu_bind = NULL;
opt.mem_bind_type = 0;
opt.mem_bind = NULL;
opt.time_limit = -1;
opt.partition = NULL;
opt.max_threads = MAX_THREADS;
opt.job_name = NULL;
opt.job_name_set = false;
opt.jobid = NO_VAL;
opt.jobid_set = false;
opt.dependency = NO_VAL;
opt.account = NULL;
opt.distribution = SLURM_DIST_UNKNOWN;
opt.ofname = NULL;
opt.ifname = NULL;
opt.efname = NULL;
opt.core_type = CORE_DEFAULT;
opt.labelio = false;
opt.unbuffered = false;
opt.overcommit = false;
opt.batch = false;
opt.share = false;
opt.no_kill = false;
opt.kill_bad_exit = false;
opt.immediate = false;
opt.allocate = false;
opt.noshell = false;
opt.attach = NULL;
opt.join = false;
opt.max_wait = slurm_get_wait_time();
opt.quit_on_intr = false;
opt.disable_status = false;
opt.test_only = false;
opt.quiet = 0;
_verbose = 0;
opt.slurmd_debug = LOG_LEVEL_QUIET;
/* constraint default (-1 is no constraint) */
opt.mincpus = -1;
opt.realmem = -1;
opt.tmpdisk = -1;
opt.hold = false;
opt.constraints = NULL;
opt.contiguous = false;
opt.exclusive = false;
opt.nodelist = NULL;
opt.exc_nodes = NULL;
opt.max_launch_time = 120;/* 120 seconds to launch job */
opt.max_exit_timeout= 60; /* Warn user 60 seconds after task exit */
/* Default launch msg timeout */
opt.msg_timeout = SLURM_MESSAGE_TIMEOUT_SEC_STATIC;
for (i=0; i<SYSTEM_DIMENSIONS; i++)
opt.geometry[i] = (uint16_t) NO_VAL;
opt.no_rotate = false;
opt.conn_type = -1;
opt.euid = (uid_t) -1;
opt.egid = (gid_t) -1;
opt.propagate = NULL; /* propagate specific rlimits */
opt.prolog = slurm_get_srun_prolog();
opt.epilog = slurm_get_srun_epilog();
opt.task_prolog = NULL;
opt.task_epilog = NULL;
mode = MODE_NORMAL;
getnodename(hostname, sizeof(hostname));
opt.ctrl_comm_ifhn = xstrdup(hostname);
/*
* Reset some default values if running under a parallel debugger
*/
if ((opt.parallel_debug = _under_parallel_debugger())) {
opt.max_launch_time = 120;
opt.max_threads = 1;
opt.msg_timeout = 15;
}
opt.get_user_env = false;
}
/*---[ env var processing ]-----------------------------------------------*/
/*
* try to use a similar scheme as popt.
*
* in order to add a new env var (to be processed like an option):
*
* define a new entry into env_vars[], if the option is a simple int
* or string you may be able to get away with adding a pointer to the
* option to set. Otherwise, process var based on "type" in _opt_env.
*/
struct env_vars {
const char *var;
int type;
void *arg;
void *set_flag;
};
env_vars_t env_vars[] = {
{"SLURM_ACCOUNT", OPT_STRING, &opt.account, NULL },
{"SLURMD_DEBUG", OPT_INT, &opt.slurmd_debug, NULL },
{"SLURM_CPUS_PER_TASK", OPT_INT, &opt.cpus_per_task, &opt.cpus_set },
{"SLURM_CONN_TYPE", OPT_CONN_TYPE, NULL, NULL },
{"SLURM_CORE_FORMAT", OPT_CORE, NULL, NULL },
{"SLURM_CPU_BIND", OPT_CPU_BIND, NULL, NULL },
{"SLURM_MEM_BIND", OPT_MEM_BIND, NULL, NULL },
{"SLURM_DEPENDENCY", OPT_INT, &opt.dependency, NULL },
{"SLURM_DISTRIBUTION", OPT_DISTRIB, NULL, NULL },
{"SLURM_GEOMETRY", OPT_GEOMETRY, NULL, NULL },
{"SLURM_IMMEDIATE", OPT_INT, &opt.immediate, NULL },
{"SLURM_JOB_NAME", OPT_STRING, &opt.job_name, &opt.job_name_set},
{"SLURM_JOBID", OPT_INT, &opt.jobid, NULL },
{"SLURM_KILL_BAD_EXIT", OPT_INT, &opt.kill_bad_exit, NULL },
{"SLURM_LABELIO", OPT_INT, &opt.labelio, NULL },
{"SLURM_NNODES", OPT_NODES, NULL, NULL },
{"SLURM_NO_ROTATE", OPT_NO_ROTATE, NULL, NULL },
{"SLURM_NPROCS", OPT_INT, &opt.nprocs, &opt.nprocs_set},
{"SLURM_OVERCOMMIT", OPT_OVERCOMMIT, NULL, NULL },
{"SLURM_EXCLUSIVE", OPT_EXCLUSIVE, NULL, NULL },
{"SLURM_PARTITION", OPT_STRING, &opt.partition, NULL },
{"SLURM_REMOTE_CWD", OPT_STRING, &opt.cwd, NULL },
{"SLURM_STDERRMODE", OPT_STRING, &opt.efname, NULL },
{"SLURM_STDINMODE", OPT_STRING, &opt.ifname, NULL },
{"SLURM_STDOUTMODE", OPT_STRING, &opt.ofname, NULL },
{"SLURM_TIMELIMIT", OPT_INT, &opt.time_limit, NULL },
{"SLURM_WAIT", OPT_INT, &opt.max_wait, NULL },
{"SLURM_DISABLE_STATUS",OPT_INT, &opt.disable_status,NULL },
{"SLURM_MPI_TYPE", OPT_MPI, NULL, NULL },
{"SLURM_SRUN_COMM_IFHN",OPT_STRING, &opt.ctrl_comm_ifhn,NULL },
{"SLURM_SRUN_MULTI", OPT_MULTI, NULL, NULL },
{"SLURM_UNBUFFEREDIO", OPT_INT, &opt.unbuffered, NULL },
{"SLURM_WORKING_DIR", OPT_STRING, &opt.cwd, &opt.cwd_set },
{NULL, 0, NULL, NULL}
};
/*
* _opt_env(): used by initialize_and_process_args to set options via
* environment variables. See comments above for how to
* extend srun to process different vars
*/
static void _opt_env()
{
char *val = NULL;
env_vars_t *e = env_vars;
while (e->var) {
if ((val = getenv(e->var)) != NULL)
_process_env_var(e, val);
e++;
}
}
static void
_process_env_var(env_vars_t *e, const char *val)
{
char *end = NULL;
enum task_dist_states dt;
debug2("now processing env var %s=%s", e->var, val);
if (e->set_flag) {
*((bool *) e->set_flag) = true;
}
switch (e->type) {
case OPT_STRING:
*((char **) e->arg) = xstrdup(val);
break;
case OPT_INT:
if (val != NULL) {
*((int *) e->arg) = (int) strtol(val, &end, 10);
if (!(end && *end == '\0'))
error("%s=%s invalid. ignoring...", e->var, val);
}
break;
case OPT_DISTRIB:
dt = _verify_dist_type(val);
if (dt == SLURM_DIST_UNKNOWN) {
error("\"%s=%s\" -- invalid distribution type. "
"ignoring...", e->var, val);
} else
opt.distribution = dt;
break;
case OPT_CPU_BIND:
if (_verify_cpu_bind(val, &opt.cpu_bind,
&opt.cpu_bind_type))
exit(1);
break;
case OPT_MEM_BIND:
if (_verify_mem_bind(val, &opt.mem_bind,
&opt.mem_bind_type))
exit(1);
break;
case OPT_NODES:
opt.nodes_set = _verify_node_count( val,
&opt.min_nodes,
&opt.max_nodes );
if (opt.nodes_set == false) {
error("\"%s=%s\" -- invalid node count. ignoring...",
e->var, val);
}
break;
case OPT_OVERCOMMIT:
opt.overcommit = true;
break;
case OPT_EXCLUSIVE:
opt.exclusive = true;
break;
case OPT_CORE:
opt.core_type = core_format_type (val);
break;
case OPT_CONN_TYPE:
opt.conn_type = _verify_conn_type(val);
break;
case OPT_NO_ROTATE:
opt.no_rotate = true;
break;
case OPT_GEOMETRY:
if (_verify_geometry(val, opt.geometry)) {
error("\"%s=%s\" -- invalid geometry, ignoring...",
e->var, val);
}
break;
case OPT_MPI:
if (srun_mpi_init((char *)val) == SLURM_ERROR) {
fatal("\"%s=%s\" -- invalid MPI type, "
"--mpi=list for acceptable types.",
e->var, val);
}
break;
default:
/* do nothing */
break;
}
}
/*
* Get a decimal integer from arg.
*
* Returns the integer on success, exits program on failure.
*
*/
static int
_get_int(const char *arg, const char *what)
{
char *p;
long int result = strtol(arg, &p, 10);
if ((*p != '\0') || (result < 0L)) {
error ("Invalid numeric value \"%s\" for %s.", arg, what);
exit(1);
}
if (result > INT_MAX) {
error ("Numeric argument (%ld) to big for %s.", result, what);
}
return (int) result;
}
void set_options(const int argc, char **argv, int first)
{
int opt_char, option_index = 0;
struct utsname name;
static struct option long_options[] = {
{"attach", required_argument, 0, 'a'},
{"allocate", no_argument, 0, 'A'},
{"batch", no_argument, 0, 'b'},
{"cpus-per-task", required_argument, 0, 'c'},
{"constraint", required_argument, 0, 'C'},
{"slurmd-debug", required_argument, 0, 'd'},
{"chdir", required_argument, 0, 'D'},
{"error", required_argument, 0, 'e'},
{"geometry", required_argument, 0, 'g'},
{"hold", no_argument, 0, 'H'},
{"input", required_argument, 0, 'i'},
{"immediate", no_argument, 0, 'I'},
{"join", no_argument, 0, 'j'},
{"job-name", required_argument, 0, 'J'},
{"no-kill", no_argument, 0, 'k'},
{"kill-on-bad-exit", no_argument, 0, 'K'},
{"label", no_argument, 0, 'l'},
{"distribution", required_argument, 0, 'm'},
{"ntasks", required_argument, 0, 'n'},
{"nodes", required_argument, 0, 'N'},
{"output", required_argument, 0, 'o'},
{"overcommit", no_argument, 0, 'O'},
{"partition", required_argument, 0, 'p'},
{"dependency", required_argument, 0, 'P'},
{"quit-on-interrupt", no_argument, 0, 'q'},
{"quiet", no_argument, 0, 'Q'},
{"relative", required_argument, 0, 'r'},
{"no-rotate", no_argument, 0, 'R'},
{"share", no_argument, 0, 's'},
{"time", required_argument, 0, 't'},
{"threads", required_argument, 0, 'T'},
{"unbuffered", no_argument, 0, 'u'},
{"account", required_argument, 0, 'U'},
{"verbose", no_argument, 0, 'v'},
{"version", no_argument, 0, 'V'},
{"nodelist", required_argument, 0, 'w'},
{"wait", required_argument, 0, 'W'},
{"exclude", required_argument, 0, 'x'},
{"disable-status", no_argument, 0, 'X'},
{"no-allocate", no_argument, 0, 'Z'},
{"contiguous", no_argument, 0, LONG_OPT_CONT},
{"exclusive", no_argument, 0, LONG_OPT_EXCLUSIVE},
{"cpu_bind", required_argument, 0, LONG_OPT_CPU_BIND},
{"mem_bind", required_argument, 0, LONG_OPT_MEM_BIND},
{"core", required_argument, 0, LONG_OPT_CORE},
{"mincpus", required_argument, 0, LONG_OPT_MINCPU},
{"mem", required_argument, 0, LONG_OPT_MEM},
{"mpi", required_argument, 0, LONG_OPT_MPI},
{"no-shell", no_argument, 0, LONG_OPT_NOSHELL},
{"tmp", required_argument, 0, LONG_OPT_TMP},
{"jobid", required_argument, 0, LONG_OPT_JOBID},
{"msg-timeout", required_argument, 0, LONG_OPT_TIMEO},
{"max-launch-time", required_argument, 0, LONG_OPT_LAUNCH},
{"max-exit-timeout", required_argument, 0, LONG_OPT_XTO},
{"uid", required_argument, 0, LONG_OPT_UID},
{"gid", required_argument, 0, LONG_OPT_GID},
{"debugger-test", no_argument, 0, LONG_OPT_DEBUG_TS},
{"help", no_argument, 0, LONG_OPT_HELP},
{"usage", no_argument, 0, LONG_OPT_USAGE},
{"conn-type", required_argument, 0, LONG_OPT_CONNTYPE},
{"test-only", no_argument, 0, LONG_OPT_TEST_ONLY},
{"network", required_argument, 0, LONG_OPT_NETWORK},
{"propagate", optional_argument, 0, LONG_OPT_PROPAGATE},
{"prolog", required_argument, 0, LONG_OPT_PROLOG},
{"epilog", required_argument, 0, LONG_OPT_EPILOG},
{"begin", required_argument, 0, LONG_OPT_BEGIN},
{"mail-type", required_argument, 0, LONG_OPT_MAIL_TYPE},
{"mail-user", required_argument, 0, LONG_OPT_MAIL_USER},
{"task-prolog", required_argument, 0, LONG_OPT_TASK_PROLOG},
{"task-epilog", required_argument, 0, LONG_OPT_TASK_EPILOG},
{"nice", optional_argument, 0, LONG_OPT_NICE},
{"ctrl-comm-ifhn", required_argument, 0, LONG_OPT_CTRL_COMM_IFHN},
{"multi-prog", no_argument, 0, LONG_OPT_MULTI},
{"comment", required_argument, 0, LONG_OPT_COMMENT},
{"get-user-env", no_argument, 0, LONG_OPT_GET_USER_ENV},
{NULL, 0, 0, 0}
};
char *opt_string = "+a:Abc:C:d:D:e:g:Hi:IjJ:kKlm:n:N:"
"o:Op:P:qQr:R:st:T:uU:vVw:W:x:XZ";
struct option *optz = spank_option_table_create (long_options);
if (!optz) {
error ("Unable to create option table");
exit (1);
}
if(opt.progname == NULL)
opt.progname = xbasename(argv[0]);
else if(!first)
argv[0] = opt.progname;
else
error("opt.progname is set but it is the first time through.");
optind = 0;
while((opt_char = getopt_long(argc, argv, opt_string,
optz, &option_index)) != -1) {
switch (opt_char) {
case (int)'?':
if(first) {
fprintf(stderr, "Try \"srun --help\" for more "
"information\n");
exit(1);
}
break;
case (int)'a':
if(first) {
if (opt.allocate || opt.batch) {
error("can only specify one mode: "
"allocate, attach or batch.");
exit(1);
}
mode = MODE_ATTACH;
opt.attach = strdup(optarg);
} else {
error("Option '%c' can only be set "
"from srun commandline.", opt_char);
}
break;
case (int)'A':
if(first) {
if (opt.attach || opt.batch) {
error("can only specify one mode: "
"allocate, attach or batch.");
exit(1);
}
mode = MODE_ALLOCATE;
opt.allocate = true;
} else {
error("Option '%c' can only be set "
"from srun commandline.", opt_char);
}
break;
case (int)'b':
if(first) {
if (opt.allocate || opt.attach) {
error("can only specify one mode: "
"allocate, attach or batch.");
exit(1);
}
mode = MODE_BATCH;
opt.batch = true;
} else {
error("Option '%c' can only be set "
"from srun commandline.", opt_char);
}
break;
case (int)'c':
if(!first && opt.cpus_set)
break;
opt.cpus_set = true;
opt.cpus_per_task =
_get_int(optarg, "cpus-per-task");
break;
case (int)'C':
if(!first && opt.constraints)
break;
xfree(opt.constraints);
opt.constraints = xstrdup(optarg);
break;
case (int)'d':
if(!first && opt.slurmd_debug)
break;
opt.slurmd_debug =
_get_int(optarg, "slurmd-debug");
break;
case (int)'D':
if(!first && opt.cwd_set)
break;
opt.cwd_set = true;
xfree(opt.cwd);
opt.cwd = xstrdup(optarg);
break;
case (int)'e':
if(!first && opt.efname)
break;
xfree(opt.efname);
if (strncasecmp(optarg, "none", (size_t) 4) == 0)
opt.efname = xstrdup("/dev/null");
else
opt.efname = xstrdup(optarg);
break;
case (int)'g':
if(!first && opt.geometry)
break;
if (_verify_geometry(optarg, opt.geometry))
exit(1);
break;
case (int)'H':
opt.hold = true;
break;
case (int)'i':
if(!first && opt.ifname)
break;
xfree(opt.ifname);
opt.ifname = xstrdup(optarg);
break;
case (int)'I':
opt.immediate = true;
break;
case (int)'j':
opt.join = true;
break;
case (int)'J':
if(!first && opt.job_name_set)
break;
opt.job_name_set = true;
xfree(opt.job_name);
opt.job_name = xstrdup(optarg);
break;
case (int)'k':
opt.no_kill = true;
break;
case (int)'K':
opt.kill_bad_exit = true;
break;
case (int)'l':
opt.labelio = true;
break;
case (int)'m':
if(!first && opt.distribution)
break;
opt.distribution = _verify_dist_type(optarg);
if (opt.distribution == SLURM_DIST_UNKNOWN) {
error("distribution type `%s' "
"is not recognized", optarg);
exit(1);
}
break;
case (int)'n':
if(!first && opt.nprocs_set)
break;
opt.nprocs_set = true;
opt.nprocs =
_get_int(optarg, "number of tasks");
break;
case (int)'N':
if(!first && opt.nodes_set)
break;
opt.nodes_set =
_verify_node_count(optarg,
&opt.min_nodes,
&opt.max_nodes);
if (opt.nodes_set == false) {
error("invalid node count `%s'",
optarg);
exit(1);
}
break;
case (int)'o':
if(!first && opt.ofname)
break;
xfree(opt.ofname);
if (strncasecmp(optarg, "none", (size_t) 4) == 0)
opt.ofname = xstrdup("/dev/null");
else
opt.ofname = xstrdup(optarg);
break;
case (int)'O':
opt.overcommit = true;
break;
case (int)'p':
if(!first && opt.partition)
break;
xfree(opt.partition);
opt.partition = xstrdup(optarg);
break;
case (int)'P':
if(!first && opt.dependency)
break;
opt.dependency = _get_int(optarg, "dependency");
break;
case (int)'q':
opt.quit_on_intr = true;
break;
case (int) 'Q':
if(!first && opt.quiet)
break;
opt.quiet++;
break;
case (int)'r':
if(!first && opt.relative)
break;
xfree(opt.relative);
opt.relative = xstrdup(optarg);
break;
case (int)'R':
opt.no_rotate = true;
break;
case (int)'s':
opt.share = true;
break;
case (int)'t':
if(!first && opt.time_limit)
break;
opt.time_limit = _get_int(optarg, "time");
break;
case (int)'T':
if(!first && opt.max_threads)
break;
opt.max_threads =
_get_int(optarg, "max_threads");
break;
case (int)'u':
opt.unbuffered = true;
break;
case (int)'U':
if(!first && opt.account)
break;
xfree(opt.account);
opt.account = xstrdup(optarg);
break;
case (int)'v':
if(!first && _verbose)
break;
_verbose++;
break;
case (int)'V':
_print_version();
exit(0);
break;
case (int)'w':
if(!first && opt.nodelist)
break;
xfree(opt.nodelist);
opt.nodelist = xstrdup(optarg);
#ifdef HAVE_BG
info("\tThe nodelist option should only be used if\n"
"\tthe block you are asking for can be created.\n"
"\tPlease consult smap before using this option\n"
"\tor your job may be stuck with no way to run.");
#endif
break;
case (int)'W':
opt.max_wait = _get_int(optarg, "wait");
break;
case (int)'x':
xfree(opt.exc_nodes);
opt.exc_nodes = xstrdup(optarg);
if (!_valid_node_list(&opt.exc_nodes))
exit(1);
break;
case (int)'X':
opt.disable_status = true;
break;
case (int)'Z':
opt.no_alloc = true;
uname(&name);
if (strcasecmp(name.sysname, "AIX") == 0)
opt.network = xstrdup("ip");
break;
case LONG_OPT_CONT:
opt.contiguous = true;
break;
case LONG_OPT_EXCLUSIVE:
opt.exclusive = true;
break;
case LONG_OPT_CPU_BIND:
if (_verify_cpu_bind(optarg, &opt.cpu_bind,
&opt.cpu_bind_type))
exit(1);
break;
case LONG_OPT_MEM_BIND:
if (_verify_mem_bind(optarg, &opt.mem_bind,
&opt.mem_bind_type))
exit(1);
break;
case LONG_OPT_CORE:
opt.core_type = core_format_type (optarg);
if (opt.core_type == CORE_INVALID)
error ("--core=\"%s\" Invalid -- ignoring.\n",
optarg);
break;
case LONG_OPT_MINCPU:
opt.mincpus = _get_int(optarg, "mincpus");
break;
case LONG_OPT_MEM:
opt.realmem = (int) _to_bytes(optarg);
if (opt.realmem < 0) {
error("invalid memory constraint %s",
optarg);
exit(1);
}
break;
case LONG_OPT_MPI:
if (srun_mpi_init((char *)optarg) == SLURM_ERROR) {
fatal("\"--mpi=%s\" -- long invalid MPI type, "
"--mpi=list for acceptable types.",
optarg);
}
break;
case LONG_OPT_NOSHELL:
opt.noshell = true;
break;
case LONG_OPT_TMP:
opt.tmpdisk = _to_bytes(optarg);
if (opt.tmpdisk < 0) {
error("invalid tmp value %s", optarg);
exit(1);
}
break;
case LONG_OPT_JOBID:
opt.jobid = _get_int(optarg, "jobid");
opt.jobid_set = true;
break;
case LONG_OPT_TIMEO:
opt.msg_timeout =
_get_int(optarg, "msg-timeout");
break;
case LONG_OPT_LAUNCH:
opt.max_launch_time =
_get_int(optarg, "max-launch-time");
break;
case LONG_OPT_XTO:
opt.max_exit_timeout =
_get_int(optarg, "max-exit-timeout");
break;
case LONG_OPT_UID:
opt.euid = uid_from_string (optarg);
if (opt.euid == (uid_t) -1)
fatal ("--uid=\"%s\" invalid", optarg);
break;
case LONG_OPT_GID:
opt.egid = gid_from_string (optarg);
if (opt.egid == (gid_t) -1)
fatal ("--gid=\"%s\" invalid", optarg);
break;
case LONG_OPT_DEBUG_TS:
opt.debugger_test = true;
/* make other parameters look like debugger
* is really attached */
opt.parallel_debug = true;
MPIR_being_debugged = 1;
opt.max_launch_time = 120;
opt.max_threads = 1;
opt.msg_timeout = 15;
break;
case LONG_OPT_HELP:
_help();
exit(0);
case LONG_OPT_USAGE:
_usage();
exit(0);
case LONG_OPT_CONNTYPE:
opt.conn_type = _verify_conn_type(optarg);
break;
case LONG_OPT_TEST_ONLY:
opt.test_only = true;
break;
case LONG_OPT_NETWORK:
xfree(opt.network);
opt.network = xstrdup(optarg);
#ifdef HAVE_AIX
setenv("SLURM_NETWORK", opt.network, 1);
#endif
break;
case LONG_OPT_PROPAGATE:
xfree(opt.propagate);
if (optarg) opt.propagate = xstrdup(optarg);
else opt.propagate = xstrdup("ALL");
break;
case LONG_OPT_PROLOG:
xfree(opt.prolog);
opt.prolog = xstrdup(optarg);
break;
case LONG_OPT_EPILOG:
xfree(opt.epilog);
opt.epilog = xstrdup(optarg);
break;
case LONG_OPT_BEGIN:
opt.begin = parse_time(optarg);
break;
case LONG_OPT_MAIL_TYPE:
opt.mail_type |= _parse_mail_type(optarg);
if (opt.mail_type == 0)
fatal("--mail-type=%s invalid", optarg);
break;
case LONG_OPT_MAIL_USER:
xfree(opt.mail_user);
opt.mail_user = xstrdup(optarg);
break;
case LONG_OPT_TASK_PROLOG:
xfree(opt.task_prolog);
opt.task_prolog = xstrdup(optarg);
break;
case LONG_OPT_TASK_EPILOG:
xfree(opt.task_epilog);
opt.task_epilog = xstrdup(optarg);
break;
case LONG_OPT_NICE:
if (optarg)
opt.nice = strtol(optarg, NULL, 10);
else
opt.nice = 100;
if (abs(opt.nice) > NICE_OFFSET) {
error("Invalid nice value, must be between "
"-%d and %d", NICE_OFFSET, NICE_OFFSET);
exit(1);
}
break;
case LONG_OPT_CTRL_COMM_IFHN:
xfree(opt.ctrl_comm_ifhn);
opt.ctrl_comm_ifhn = xstrdup(optarg);
break;
case LONG_OPT_MULTI:
opt.multi_prog = true;
break;
case LONG_OPT_COMMENT:
/* Use account for Moab until job comment field
* is actually available in slurm v1.2 */
if(!first && opt.account)
break;
xfree(opt.account);
opt.account = xstrdup(optarg);
break;
case LONG_OPT_GET_USER_ENV:
opt.get_user_env = true;
break;
default:
if (spank_process_option (opt_char, optarg) < 0) {
exit (1);
}
}
}
if (!first) {
if (!_opt_verify())
exit(1);
if (_verbose > 3)
_opt_list();
}
spank_option_table_destroy (optz);
}
/* Load the multi_prog config file into argv, pass the entire file contents
* in order to avoid having to read the file on every node. We could parse
* the infomration here too for loading the MPIR records for TotalView */
static void _load_multi(int *argc, char **argv)
{
int config_fd, data_read = 0, i;
struct stat stat_buf;
char *data_buf;
if ((config_fd = open(argv[0], O_RDONLY)) == -1) {
error("Could not open multi_prog config file %s",
argv[0]);
exit(1);
}
if (fstat(config_fd, &stat_buf) == -1) {
error("Could not stat multi_prog config file %s",
argv[0]);
exit(1);
}
if (stat_buf.st_size > 60000) {
error("Multi_prog config file %s is too large",
argv[0]);
exit(1);
}
data_buf = xmalloc(stat_buf.st_size + 1);
while ((i = read(config_fd, &data_buf[data_read], stat_buf.st_size
- data_read)) != 0) {
if (i < 0) {
error("Error reading multi_prog config file %s",
argv[0]);
exit(1);
} else
data_read += i;
}
close(config_fd);
for (i=1; i<*argc; i++)
xfree(argv[i]);
argv[1] = data_buf;
*argc = 2;
}
/*
* _opt_args() : set options via commandline args and popt
*/
static void _opt_args(int argc, char **argv)
{
int i;
char **rest = NULL;
set_options(argc, argv, 1);
#ifdef HAVE_AIX
if (opt.network == NULL) {
opt.network = "us,sn_all,bulk_xfer";
setenv("SLURM_NETWORK", opt.network, 1);
}
#endif
remote_argc = 0;
if (optind < argc) {
rest = argv + optind;
while (rest[remote_argc] != NULL)
remote_argc++;
}
remote_argv = (char **) xmalloc((remote_argc + 1) * sizeof(char *));
for (i = 0; i < remote_argc; i++)
remote_argv[i] = xstrdup(rest[i]);
remote_argv[i] = NULL; /* End of argv's (for possible execv) */
if (opt.multi_prog) {
if (remote_argc < 1) {
error("configuration file not specified");
exit(1);
}
_load_multi(&remote_argc, remote_argv);
}
else if (remote_argc > 0) {
char *fullpath;
char *cmd = remote_argv[0];
bool search_cwd = (opt.batch || opt.allocate);
int mode = (search_cwd) ? R_OK : R_OK | X_OK;
if ((fullpath = _search_path(cmd, search_cwd, mode))) {
xfree(remote_argv[0]);
remote_argv[0] = fullpath;
}
}
if (!_opt_verify())
exit(1);
}
/*
* _opt_verify : perform some post option processing verification
*
*/
static bool _opt_verify(void)
{
bool verified = true;
/*
* Do not set slurmd debug level higher than DEBUG2,
* as DEBUG3 is used for slurmd IO operations, which
* are not appropriate to be sent back to srun. (because
* these debug messages cause the generation of more
* debug messages ad infinitum)
*/
if (opt.slurmd_debug + LOG_LEVEL_ERROR > LOG_LEVEL_DEBUG2)
opt.slurmd_debug = LOG_LEVEL_DEBUG2 - LOG_LEVEL_ERROR;
if (opt.quiet && _verbose) {
error ("don't specify both --verbose (-v) and --quiet (-Q)");
verified = false;
}
if (opt.no_alloc && !opt.nodelist) {
error("must specify a node list with -Z, --no-allocate.");
verified = false;
}
if (opt.no_alloc && opt.exc_nodes) {
error("can not specify --exclude list with -Z, --no-allocate.");
verified = false;
}
if (opt.no_alloc && opt.relative) {
error("do not specify -r,--relative with -Z,--no-allocate.");
verified = false;
}
if (opt.relative && (opt.exc_nodes || opt.nodelist)) {
error("-r,--relative not allowed with "
"-w,--nodelist or -x,--exclude.");
verified = false;
}
if (opt.mincpus < opt.cpus_per_task)
opt.mincpus = opt.cpus_per_task;
if ((opt.job_name == NULL) && (remote_argc > 0))
opt.job_name = _base_name(remote_argv[0]);
if(!opt.nodelist) {
if((opt.nodelist = xstrdup(getenv("SLURM_HOSTFILE")))) {
/* make sure the file being read in has a / in
it to make sure it is a file in the
valid_node_list function */
if(!strstr(opt.nodelist, "/")) {
char *add_slash = xstrdup("./");
xstrcat(add_slash, opt.nodelist);
xfree(opt.nodelist);
opt.nodelist = add_slash;
}
opt.distribution = SLURM_DIST_ARBITRARY;
if (!_valid_node_list(&opt.nodelist)) {
error("Failure getting NodeNames from "
"hostfile");
exit(1);
} else {
debug("loaded nodes (%s) from hostfile",
opt.nodelist);
}
}
} else
if (!_valid_node_list(&opt.nodelist))
exit(1);
/* now if max is set make sure we have <= max_nodes in the
* nodelist but only if it isn't arbitrary since the user has
* laid it out how it should be so don't mess with it print an
* error later if it doesn't work the way they wanted */
if(opt.max_nodes && opt.nodelist
&& opt.distribution != SLURM_DIST_ARBITRARY) {
hostlist_t hl = hostlist_create(opt.nodelist);
int count = hostlist_count(hl);
if(count > opt.max_nodes) {
int i = 0;
char buf[8192];
count -= opt.max_nodes;
while(i<count) {
char *name = hostlist_pop(hl);
if(name)
free(name);
else
break;
i++;
}
hostlist_ranged_string(hl, sizeof(buf), buf);
xfree(opt.nodelist);
opt.nodelist = xstrdup(buf);
}
hostlist_destroy(hl);
}
if (mode == MODE_ATTACH) { /* attach to a running job */
if (opt.nodes_set || opt.cpus_set || opt.nprocs_set) {
error("do not specific a node allocation "
"with --attach (-a)");
verified = false;
}
/* if (constraints_given()) {
* error("do not specify any constraints with "
* "--attach (-a)");
* verified = false;
*}
*/
} else { /* mode != MODE_ATTACH */
if ((remote_argc == 0) && (mode != MODE_ALLOCATE)) {
error("must supply remote command");
verified = false;
}
/* check for realistic arguments */
if (opt.nprocs <= 0) {
error("%s: invalid number of processes (-n %d)",
opt.progname, opt.nprocs);
verified = false;
}
if (opt.cpus_per_task <= 0) {
error("%s: invalid number of cpus per task (-c %d)\n",
opt.progname, opt.cpus_per_task);
verified = false;
}
if ((opt.min_nodes <= 0) || (opt.max_nodes < 0) ||
(opt.max_nodes && (opt.min_nodes > opt.max_nodes))) {
error("%s: invalid number of nodes (-N %d-%d)\n",
opt.progname, opt.min_nodes, opt.max_nodes);
verified = false;
}
core_format_enable (opt.core_type);
/* massage the numbers */
if(opt.distribution == SLURM_DIST_ARBITRARY
&& !opt.nprocs_set && opt.nodelist) {
hostlist_t hl = hostlist_create(opt.nodelist);
opt.nprocs = hostlist_count(hl);
hostlist_destroy(hl);
opt.nprocs_set = true;
} else if (opt.nodes_set && !opt.nprocs_set) {
/* 1 proc / node default */
opt.nprocs = opt.min_nodes;
} else if (opt.nodes_set && opt.nprocs_set) {
/*
* make sure # of procs >= min_nodes
*/
if (opt.nprocs < opt.min_nodes) {
info ("Warning: can't run %d processes on %d "
"nodes, setting nnodes to %d",
opt.nprocs, opt.min_nodes, opt.nprocs);
opt.min_nodes = opt.nprocs;
if ( opt.max_nodes
&& (opt.min_nodes > opt.max_nodes) )
opt.max_nodes = opt.min_nodes;
}
} /* else if (opt.nprocs_set && !opt.nodes_set) */
}
if (opt.max_threads <= 0) { /* set default */
error("Thread value invalid, reset to 1");
opt.max_threads = 1;
} else if (opt.max_threads > MAX_THREADS) {
error("Thread value exceeds defined limit, reset to %d",
MAX_THREADS);
}
if (opt.labelio && opt.unbuffered) {
error("Do not specify both -l (--label) and "
"-u (--unbuffered)");
exit(1);
}
/*
* --wait always overrides hidden max_exit_timeout
*/
if (opt.max_wait)
opt.max_exit_timeout = opt.max_wait;
if (opt.time_limit == 0)
opt.time_limit = INFINITE;
if ((opt.euid != (uid_t) -1) && (opt.euid != opt.uid))
opt.uid = opt.euid;
if ((opt.egid != (gid_t) -1) && (opt.egid != opt.gid))
opt.gid = opt.egid;
if ((opt.egid != (gid_t) -1) && (opt.egid != opt.gid))
opt.gid = opt.egid;
if (opt.noshell && !opt.allocate) {
error ("--no-shell only valid with -A (--allocate)");
verified = false;
}
if (opt.propagate && parse_rlimits( opt.propagate, PROPAGATE_RLIMITS)) {
error( "--propagate=%s is not valid.", opt.propagate );
verified = false;
}
return verified;
}
static uint16_t _parse_mail_type(const char *arg)
{
uint16_t rc;
if (strcasecmp(arg, "BEGIN") == 0)
rc = MAIL_JOB_BEGIN;
else if (strcasecmp(arg, "END") == 0)
rc = MAIL_JOB_END;
else if (strcasecmp(arg, "FAIL") == 0)
rc = MAIL_JOB_FAIL;
else if (strcasecmp(arg, "ALL") == 0)
rc = MAIL_JOB_BEGIN | MAIL_JOB_END | MAIL_JOB_FAIL;
else
rc = 0; /* failure */
return rc;
}
static char *_print_mail_type(const uint16_t type)
{
if (type == 0)
return "NONE";
if (type == MAIL_JOB_BEGIN)
return "BEGIN";
if (type == MAIL_JOB_END)
return "END";
if (type == MAIL_JOB_FAIL)
return "FAIL";
if (type == (MAIL_JOB_BEGIN | MAIL_JOB_END | MAIL_JOB_FAIL))
return "ALL";
return "MULTIPLE";
}
static void
_freeF(void *data)
{
xfree(data);
}
static List
_create_path_list(void)
{
List l = list_create(_freeF);
char *path = xstrdup(getenv("PATH"));
char *c, *lc;
if (!path) {
verbose("No PATH environment variable");
return l;
}
c = lc = path;
while (*c != '\0') {
if (*c == ':') {
/* nullify and push token onto list */
*c = '\0';
if (lc != NULL && strlen(lc) > 0)
list_append(l, xstrdup(lc));
lc = ++c;
} else
c++;
}
if (strlen(lc) > 0)
list_append(l, xstrdup(lc));
xfree(path);
return l;
}
static char *
_search_path(char *cmd, bool check_current_dir, int access_mode)
{
List l = _create_path_list();
ListIterator i = NULL;
char *path, *fullpath = NULL;
if ( (cmd[0] == '.' || cmd[0] == '/')
&& (access(cmd, access_mode) == 0 ) ) {
if (cmd[0] == '.')
xstrfmtcat(fullpath, "%s/", opt.cwd);
xstrcat(fullpath, cmd);
goto done;
}
if (check_current_dir)
list_prepend(l, xstrdup(opt.cwd));
i = list_iterator_create(l);
while ((path = list_next(i))) {
xstrfmtcat(fullpath, "%s/%s", path, cmd);
if (access(fullpath, access_mode) == 0)
goto done;
xfree(fullpath);
fullpath = NULL;
}
done:
list_destroy(l);
return fullpath;
}
/* helper function for printing options
*
* warning: returns pointer to memory allocated on the stack.
*/
static char *print_constraints()
{
char *buf = xstrdup("");
if (opt.mincpus > 0)
xstrfmtcat(buf, "mincpus=%d ", opt.mincpus);
if (opt.realmem > 0)
xstrfmtcat(buf, "mem=%dM ", opt.realmem);
if (opt.tmpdisk > 0)
xstrfmtcat(buf, "tmp=%ld ", opt.tmpdisk);
if (opt.contiguous == true)
xstrcat(buf, "contiguous ");
if (opt.exclusive == true)
xstrcat(buf, "exclusive ");
if (opt.nodelist != NULL)
xstrfmtcat(buf, "nodelist=%s ", opt.nodelist);
if (opt.exc_nodes != NULL)
xstrfmtcat(buf, "exclude=%s ", opt.exc_nodes);
if (opt.constraints != NULL)
xstrfmtcat(buf, "constraints=`%s' ", opt.constraints);
return buf;
}
static char *
print_commandline()
{
int i;
char buf[256];
buf[0] = '\0';
for (i = 0; i < remote_argc; i++)
snprintf(buf, 256, "%s", remote_argv[i]);
return xstrdup(buf);
}
static char *
print_geometry()
{
int i;
char buf[32], *rc = NULL;
if ((SYSTEM_DIMENSIONS == 0)
|| (opt.geometry[0] == (uint16_t)NO_VAL))
return NULL;
for (i=0; i<SYSTEM_DIMENSIONS; i++) {
if (i > 0)
snprintf(buf, sizeof(buf), "x%u", opt.geometry[i]);
else
snprintf(buf, sizeof(buf), "%u", opt.geometry[i]);
xstrcat(rc, buf);
}
return rc;
}
#define tf_(b) (b == true) ? "true" : "false"
static void _opt_list()
{
char *str;
info("defined options for program `%s'", opt.progname);
info("--------------- ---------------------");
info("user : `%s'", opt.user);
info("uid : %ld", (long) opt.uid);
info("gid : %ld", (long) opt.gid);
info("cwd : %s", opt.cwd);
info("nprocs : %d %s", opt.nprocs,
opt.nprocs_set ? "(set)" : "(default)");
info("cpus_per_task : %d %s", opt.cpus_per_task,
opt.cpus_set ? "(set)" : "(default)");
if (opt.max_nodes)
info("nodes : %d-%d", opt.min_nodes, opt.max_nodes);
else {
info("nodes : %d %s", opt.min_nodes,
opt.nodes_set ? "(set)" : "(default)");
}
info("jobid : %u %s", opt.jobid,
opt.jobid_set ? "(set)" : "(default)");
info("partition : %s",
opt.partition == NULL ? "default" : opt.partition);
info("job name : `%s'", opt.job_name);
info("distribution : %s", format_task_dist_states(opt.distribution));
info("cpu_bind : %s",
opt.cpu_bind == NULL ? "default" : opt.cpu_bind);
info("mem_bind : %s",
opt.mem_bind == NULL ? "default" : opt.mem_bind);
info("core format : %s", core_format_name (opt.core_type));
info("verbose : %d", _verbose);
info("slurmd_debug : %d", opt.slurmd_debug);
info("immediate : %s", tf_(opt.immediate));
info("label output : %s", tf_(opt.labelio));
info("unbuffered IO : %s", tf_(opt.unbuffered));
info("allocate : %s", tf_(opt.allocate));
info("attach : `%s'", opt.attach);
info("overcommit : %s", tf_(opt.overcommit));
info("batch : %s", tf_(opt.batch));
info("threads : %d", opt.max_threads);
if (opt.time_limit == INFINITE)
info("time_limit : INFINITE");
else
info("time_limit : %d", opt.time_limit);
info("wait : %d", opt.max_wait);
if (opt.nice)
info("nice : %d", opt.nice);
info("account : %s", opt.account);
if (opt.dependency == NO_VAL)
info("dependency : none");
else
info("dependency : %u", opt.dependency);
str = print_constraints();
info("constraints : %s", str);
xfree(str);
if (opt.conn_type >= 0)
info("conn_type : %u", opt.conn_type);
str = print_geometry();
info("geometry : %s", str);
xfree(str);
info("rotate : %s", opt.no_rotate ? "yes" : "no");
info("network : %s", opt.network);
info("propagate : %s",
opt.propagate == NULL ? "NONE" : opt.propagate);
if (opt.begin) {
char time_str[32];
slurm_make_time_str(&opt.begin, time_str, sizeof(time_str));
info("begin : %s", time_str);
}
info("prolog : %s", opt.prolog);
info("epilog : %s", opt.epilog);
info("mail_type : %s", _print_mail_type(opt.mail_type));
info("mail_user : %s", opt.mail_user);
info("task_prolog : %s", opt.task_prolog);
info("task_epilog : %s", opt.task_epilog);
info("ctrl_comm_ifhn : %s", opt.ctrl_comm_ifhn);
info("multi_prog : %s", opt.multi_prog ? "yes" : "no");
str = print_commandline();
info("remote command : `%s'", str);
xfree(str);
}
/* Determine if srun is under the control of a parallel debugger or not */
static bool _under_parallel_debugger (void)
{
return (MPIR_being_debugged != 0);
}
static void _usage(void)
{
printf(
"Usage: srun [-N nnodes] [-n ntasks] [-i in] [-o out] [-e err]\n"
" [-c ncpus] [-r n] [-p partition] [--hold] [-t minutes]\n"
" [-D path] [--immediate] [--overcommit] [--no-kill]\n"
" [--share] [--label] [--unbuffered] [-m dist] [-J jobname]\n"
" [--jobid=id] [--batch] [--verbose] [--slurmd_debug=#]\n"
" [--core=type] [-T threads] [-W sec] [--attach] [--join] \n"
" [--contiguous] [--mincpus=n] [--mem=MB] [--tmp=MB] [-C list]\n"
" [--mpi=type] [--account=name] [--dependency=jobid]\n"
" [--kill-on-bad-exit] [--propagate[=rlimits] ]\n"
" [--cpu_bind=...] [--mem_bind=...]\n"
#ifdef HAVE_BG /* Blue gene specific options */
" [--geometry=XxYxZ] [--conn-type=type] [--no-rotate]\n"
#endif
" [--mail-type=type] [--mail-user=user][--nice[=value]]\n"
" [--prolog=fname] [--epilog=fname]\n"
" [--task-prolog=fname] [--task-epilog=fname]\n"
" [--ctrl-comm-ifhn=addr] [--multi-prog]\n"
" [-w hosts...] [-x hosts...] executable [args...]\n");
}
static void _help(void)
{
printf (
"Usage: srun [OPTIONS...] executable [args...]\n"
"\n"
"Parallel run options:\n"
" -n, --ntasks=ntasks number of tasks to run\n"
" -N, --nodes=N number of nodes on which to run (N = min[-max])\n"
" -c, --cpus-per-task=ncpus number of cpus required per task\n"
" -i, --input=in location of stdin redirection\n"
" -o, --output=out location of stdout redirection\n"
" -e, --error=err location of stderr redirection\n"
" -r, --relative=n run job step relative to node n of allocation\n"
" -p, --partition=partition partition requested\n"
" -H, --hold submit job in held state\n"
" -t, --time=minutes time limit\n"
" -D, --chdir=path change remote current working directory\n"
" -I, --immediate exit if resources are not immediately available\n"
" -O, --overcommit overcommit resources\n"
" -k, --no-kill do not kill job on node failure\n"
" -K, --kill-on-bad-exit kill the job if any task terminates with a\n"
" non-zero exit code\n"
" -s, --share share nodes with other jobs\n"
" -l, --label prepend task number to lines of stdout/err\n"
" -u, --unbuffered do not line-buffer stdout/err\n"
" -m, --distribution=type distribution method for processes to nodes\n"
" (type = block|cyclic|arbitrary)\n"
" -J, --job-name=jobname name of job\n"
" --jobid=id run under already allocated job\n"
" --mpi=type type of MPI being used\n"
" -b, --batch submit as batch job for later execution\n"
" -T, --threads=threads set srun launch fanout\n"
" -W, --wait=sec seconds to wait after first task exits\n"
" before killing job\n"
" -q, --quit-on-interrupt quit on single Ctrl-C\n"
" -X, --disable-status Disable Ctrl-C status feature\n"
" -v, --verbose verbose mode (multiple -v's increase verbosity)\n"
" -Q, --quiet quiet mode (suppress informational messages)\n"
" -d, --slurmd-debug=level slurmd debug level\n"
" --core=type change default corefile format type\n"
" (type=\"list\" to list of valid formats)\n"
" -P, --dependency=jobid defer job until specified jobid completes\n"
" --nice[=value] decrease secheduling priority by value\n"
" -U, --account=name charge job to specified account\n"
" --propagate[=rlimits] propagate all [or specific list of] rlimits\n"
" --mpi=type specifies version of MPI to use\n"
" --prolog=program run \"program\" before launching job step\n"
" --epilog=program run \"program\" after launching job step\n"
" --task-prolog=program run \"program\" before launching task\n"
" --task-epilog=program run \"program\" after launching task\n"
" --begin=time defer job until HH:MM DD/MM/YY\n"
" --mail-type=type notify on state change: BEGIN, END, FAIL or ALL\n"
" --mail-user=user who to send email notification for job state changes\n"
" --ctrl-comm-ifhn=addr interface hostname for PMI communications from srun\n"
" --multi-prog if set the program name specified is the\n"
" configuration specification for multiple programs\n"
" --get-user-env used by Moab. See srun man page.\n"
"\n"
"Allocate only:\n"
" -A, --allocate allocate resources and spawn a shell\n"
" --no-shell don't spawn shell in allocate mode\n"
"\n"
"Attach to running job:\n"
" -a, --attach=jobid attach to running job with specified id\n"
" -j, --join when used with --attach, allow forwarding of\n"
" signals and stdin.\n"
"\n"
"Constraint options:\n"
" --mincpus=n minimum number of cpus per node\n"
" --mem=MB minimum amount of real memory\n"
" --tmp=MB minimum amount of temporary disk\n"
" --contiguous demand a contiguous range of nodes\n"
" -C, --constraint=list specify a list of constraints\n"
" -w, --nodelist=hosts... request a specific list of hosts\n"
" -x, --exclude=hosts... exclude a specific list of hosts\n"
" -Z, --no-allocate don't allocate nodes (must supply -w)\n"
"\n"
"Consumable resources related options:\n"
" --exclusive allocate nodes in exclusive mode when\n"
" cpu consumable resource is enabled\n"
"\n"
"Affinity/Multi-core options: (when the task/affinity plugin is enabled)\n"
" --cpu_bind= Bind tasks to CPUs\n"
" q[uiet], quietly bind before task runs (default)\n"
" v[erbose], verbosely report binding before task runs\n"
" no[ne] don't bind tasks to CPUs (default)\n"
" rank bind by task rank\n"
" map_cpu:<list> bind by mapping CPU IDs to tasks as specified\n"
" where <list> is <cpuid1>,<cpuid2>,...<cpuidN>\n"
" mask_cpu:<list> bind by setting CPU masks on tasks as specified\n"
" where <list> is <mask1>,<mask2>,...<maskN>\n"
" --mem_bind= Bind tasks to memory\n"
" q[uiet], quietly bind before task runs (default)\n"
" v[erbose], verbosely report binding before task runs\n"
" no[ne] don't bind tasks to memory (default)\n"
" rank bind by task rank\n"
" local bind to memory local to processor\n"
" map_mem:<list> bind by mapping memory of CPU IDs to tasks as specified\n"
" where <list> is <cpuid1>,<cpuid2>,...<cpuidN>\n"
" mask_mem:<list> bind by setting menory of CPU masks on tasks as specified\n"
" where <list> is <mask1>,<mask2>,...<maskN>\n");
printf("\n");
spank_print_options (stdout, 6, 30);
printf("\n");
printf(
#ifdef HAVE_AIX /* AIX/Federation specific options */
"AIX related options:\n"
" --network=type communication protocol to be used\n"
"\n"
#endif
#ifdef HAVE_BG /* Blue gene specific options */
"Blue Gene related options:\n"
" -g, --geometry=XxYxZ geometry constraints of the job\n"
" -R, --no-rotate disable geometry rotation\n"
" --conn-type=type constraint on type of connection, MESH or TORUS\n"
" if not set, then tries to fit TORUS else MESH\n"
"\n"
#endif
"Help options:\n"
" --help show this help message\n"
" --usage display brief usage message\n"
"\n"
"Other options:\n"
" -V, --version output version information and exit\n"
"\n"
);
}