blob: 5e37d15a01d70f5a25259bee3854ad84da44f051 [file] [log] [blame] [edit]
/*****************************************************************************\
* state_control.c - state control common functions
*****************************************************************************
* Copyright (C) 2017 SchedMD LLC.
* Written by Alejandro Sanchez <alex@schedmd.com>
*
* This file is part of Slurm, a resource management program.
* For details, see <https://slurm.schedmd.com/>.
* Please also read the included file: DISCLAIMER.
*
* Slurm is free software; you can redistribute it and/or modify it under
* the terms of the GNU General Public License as published by the Free
* Software Foundation; either version 2 of the License, or (at your option)
* any later version.
*
* In addition, as a special exception, the copyright holders give permission
* to link the code of portions of this program with the OpenSSL library under
* certain conditions as described in each individual source file, and
* distribute linked combinations including the two. You must obey the GNU
* General Public License in all respects for all of the code used other than
* OpenSSL. If you modify file(s) with this exception, you may extend this
* exception to your version of the file(s), but you are not obligated to do
* so. If you do not wish to do so, delete this exception statement from your
* version. If you delete this exception statement from all source files in
* the program, then also delete it here.
*
* Slurm is distributed in the hope that it will be useful, but WITHOUT ANY
* WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
* FOR A PARTICULAR PURPOSE. See the GNU General Public License for more
* details.
*
* You should have received a copy of the GNU General Public License along
* with Slurm; if not, write to the Free Software Foundation, Inc.,
* 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
\*****************************************************************************/
#include <ctype.h>
#include <limits.h> /* For LONG_MAX */
#include "src/common/state_control.h"
#include "src/common/working_cluster.h"
#include "src/common/xmalloc.h"
#include "src/common/xstring.h"
extern char *state_control_watts_to_str(uint32_t watts)
{
char *str = NULL;
if ((watts == NO_VAL) || (watts == 0))
xstrcat(str, "n/a");
else if (watts == INFINITE)
xstrcat(str, "INFINITE");
else if ((watts % 1000000) == 0)
xstrfmtcat(str, "%uM", watts / 1000000);
else if ((watts % 1000) == 0)
xstrfmtcat(str, "%uK", watts / 1000);
else
xstrfmtcat(str, "%u", watts);
return str;
}
extern uint32_t state_control_parse_resv_watts(char *watts_str,
resv_desc_msg_t *resv_msg_ptr,
char **err_msg)
{
resv_msg_ptr->resv_watts = 0;
char *end_ptr = NULL;
if (!xstrcasecmp(watts_str, "n/a") || !xstrcasecmp(watts_str, "none"))
return SLURM_SUCCESS;
if (!xstrcasecmp(watts_str, "INFINITE")) {
resv_msg_ptr->resv_watts = INFINITE;
return SLURM_SUCCESS;
}
resv_msg_ptr->resv_watts = (uint32_t)strtoul(watts_str, &end_ptr, 10);
if ((end_ptr[0] == 'k') || (end_ptr[0] == 'K')) {
resv_msg_ptr->resv_watts *= 1000;
} else if ((end_ptr[0] == 'm') || (end_ptr[0] == 'M')) {
resv_msg_ptr->resv_watts *= 1000000;
} else if (end_ptr[0] != '\0') {
if (err_msg)
xstrfmtcat(*err_msg, "Invalid Watts value: %s",
watts_str);
resv_msg_ptr->resv_watts = NO_VAL;
return SLURM_ERROR;
}
return SLURM_SUCCESS;
}
extern int state_control_configured_tres(char *type)
{
int i, cc;
int rc = SLURM_ERROR;
assoc_mgr_info_request_msg_t req;
assoc_mgr_info_msg_t *msg = NULL;
memset(&req, 0, sizeof(assoc_mgr_info_request_msg_t));
cc = slurm_load_assoc_mgr_info(&req, &msg);
if (cc != SLURM_SUCCESS) {
slurm_perror("slurm_load_assoc_mgr_info error");
goto cleanup;
}
for (i = 0; i < msg->tres_cnt; ++i) {
if (!xstrcasecmp(msg->tres_names[i], type)) {
rc = SLURM_SUCCESS;
goto cleanup;
}
}
cleanup:
slurm_free_assoc_mgr_info_msg(msg);
return rc;
}
extern int state_control_corecnt_supported(void)
{
uint32_t select_type = slurmdb_setup_plugin_id_select();
if ((select_type != SELECT_PLUGIN_CONS_RES) &&
(select_type != SELECT_PLUGIN_CONS_TRES) &&
(select_type != SELECT_PLUGIN_CRAY_CONS_RES) &&
(select_type != SELECT_PLUGIN_CRAY_CONS_TRES))
return SLURM_ERROR;
return SLURM_SUCCESS;
}
extern int state_control_parse_resv_corecnt(resv_desc_msg_t *resv_msg_ptr,
char *val, int *free_tres_corecnt,
bool from_tres, char **err_msg)
{
char *endptr = NULL, *core_cnt, *tok, *ptrptr = NULL;
int node_inx = 0;
/*
* CoreCnt and TRES=cpu= might appear within the same request,
* so we free the first and realloc the second.
*/
if (*free_tres_corecnt)
xfree(resv_msg_ptr->core_cnt);
core_cnt = xstrdup(val);
tok = strtok_r(core_cnt, ",", &ptrptr);
while (tok) {
xrealloc(resv_msg_ptr->core_cnt,
sizeof(uint32_t) * (node_inx + 2));
*free_tres_corecnt = 1;
resv_msg_ptr->core_cnt[node_inx] =
strtol(tok, &endptr, 10);
if ((endptr == NULL) ||
(endptr[0] != '\0') ||
(tok[0] == '\0')) {
if (err_msg) {
if (from_tres)
xstrfmtcat(*err_msg,
"Invalid TRES core count %s",
val);
else
xstrfmtcat(*err_msg,
"Invalid core count %s",
val);
}
xfree(core_cnt);
return SLURM_ERROR;
}
node_inx++;
tok = strtok_r(NULL, ",", &ptrptr);
}
xfree(core_cnt);
return SLURM_SUCCESS;
}
extern int parse_resv_nodecnt(resv_desc_msg_t *resv_msg_ptr, char *val,
int *free_tres_nodecnt, bool from_tres,
char **err_msg)
{
char *endptr = NULL, *node_cnt, *tok, *ptrptr = NULL;
int node_inx = 0;
long node_cnt_l;
int ret_code = SLURM_SUCCESS;
/*
* NodeCnt and TRES=node= might appear within the same request,
* so we free the first and realloc the second.
*/
if (*free_tres_nodecnt)
xfree(resv_msg_ptr->node_cnt);
node_cnt = xstrdup(val);
tok = strtok_r(node_cnt, ",", &ptrptr);
while (tok) {
xrealloc(resv_msg_ptr->node_cnt,
sizeof(uint32_t) * (node_inx + 2));
*free_tres_nodecnt = 1;
/*
* Use temporary variable to check for negative or huge values
* since resv_msg_ptr->node_cnt is uint32_t.
*/
node_cnt_l = strtol(tok, &endptr, 10);
if ((node_cnt_l < 0) || (node_cnt_l == LONG_MAX)) {
ret_code = SLURM_ERROR;
break;
} else {
resv_msg_ptr->node_cnt[node_inx] = node_cnt_l;
}
if ((endptr != NULL) &&
((endptr[0] == 'k') ||
(endptr[0] == 'K'))) {
resv_msg_ptr->node_cnt[node_inx] *= 1024;
} else if ((endptr != NULL) &&
((endptr[0] == 'm') ||
(endptr[0] == 'M'))) {
resv_msg_ptr->node_cnt[node_inx] *= 1024 * 1024;
} else if ((endptr == NULL) ||
(endptr[0] != '\0') ||
(tok[0] == '\0')) {
ret_code = SLURM_ERROR;
break;
}
node_inx++;
tok = strtok_r(NULL, ",", &ptrptr);
}
if (ret_code != SLURM_SUCCESS) {
if (err_msg) {
xfree(*err_msg);
if (from_tres) {
xstrfmtcat(*err_msg,
"Invalid TRES node count %s", val);
} else {
xstrfmtcat(*err_msg,
"Invalid node count %s", val);
}
} else {
info("%s: Invalid node count (%s)", __func__, tok);
}
}
xfree(node_cnt);
return ret_code;
}
extern int state_control_parse_resv_tres(char *val,
resv_desc_msg_t *resv_msg_ptr,
int *free_tres_license,
int *free_tres_bb,
int *free_tres_corecnt,
int *free_tres_nodecnt,
char **err_msg)
{
int i, ret, len;
char *tres_bb = NULL, *tres_license = NULL,
*tres_corecnt = NULL, *tres_nodecnt = NULL,
*token, *type = NULL, *saveptr1 = NULL,
*value_str = NULL, *name = NULL, *compound = NULL,
*tmp = NULL;
bool discard, first;
*free_tres_license = 0;
*free_tres_bb = 0;
*free_tres_corecnt = 0;
*free_tres_nodecnt = 0;
token = strtok_r(val, ",", &saveptr1);
while (token) {
compound = strtok_r(token, "=", &value_str);
if (!compound || !value_str || !*value_str) {
xstrfmtcat(*err_msg, "invalid TRES '%s'", token);
goto error;
}
if (strchr(compound, '/')) {
tmp = xstrdup(compound);
type = strtok_r(tmp, "/", &name);
} else
type = compound;
if (state_control_configured_tres(compound) != SLURM_SUCCESS) {
xstrfmtcat(*err_msg,
"couldn't identify configured TRES '%s'",
compound);
goto error;
}
if (!xstrcasecmp(type, "license")) {
if (tres_license && tres_license[0] != '\0')
xstrcatchar(tres_license, ',');
xstrfmtcat(tres_license, "%s:%s", name, value_str);
token = strtok_r(NULL, ",", &saveptr1);
} else if (xstrcasecmp(type, "bb") == 0) {
if (tres_bb && tres_bb[0] != '\0')
xstrcatchar(tres_bb, ',');
xstrfmtcat(tres_bb, "%s:%s", name, value_str);
token = strtok_r(NULL, ",", &saveptr1);
} else if (xstrcasecmp(type, "cpu") == 0) {
first = true;
discard = false;
do {
len = strlen(value_str);
for (i = 0; i < len; i++) {
if (!isdigit(value_str[i])) {
if (first) {
xstrfmtcat(*err_msg,
"invalid TRES cpu value '%s'",
value_str);
goto error;
} else
discard = true;
break;
}
}
first = false;
if (!discard) {
if (tres_corecnt && tres_corecnt[0]
!= '\0')
xstrcatchar(tres_corecnt, ',');
xstrcat(tres_corecnt, value_str);
token = strtok_r(NULL, ",", &saveptr1);
value_str = token;
}
} while (!discard && token);
} else if (xstrcasecmp(type, "node") == 0) {
if (tres_nodecnt && tres_nodecnt[0] != '\0')
xstrcatchar(tres_nodecnt, ',');
xstrcat(tres_nodecnt, value_str);
token = strtok_r(NULL, ",", &saveptr1);
} else {
xstrfmtcat(*err_msg, "TRES type '%s' not supported with reservations",
compound);
goto error;
}
}
if (tres_corecnt && tres_corecnt[0] != '\0') {
/* only have this on a cons_res machine */
ret = state_control_corecnt_supported();
if (ret != SLURM_SUCCESS) {
xstrfmtcat(*err_msg, "CoreCnt or CPUCnt is only supported when SelectType includes select/cons_res or SelectTypeParameters includes OTHER_CONS_RES on a Cray.");
goto error;
}
ret = state_control_parse_resv_corecnt(resv_msg_ptr,
tres_corecnt,
free_tres_corecnt, true,
err_msg);
xfree(tres_corecnt);
if (ret != SLURM_SUCCESS)
goto error;
}
if (tres_nodecnt && tres_nodecnt[0] != '\0') {
ret = parse_resv_nodecnt(resv_msg_ptr, tres_nodecnt,
free_tres_nodecnt, true, err_msg);
xfree(tres_nodecnt);
if (ret != SLURM_SUCCESS)
goto error;
}
if (tres_license && tres_license[0] != '\0') {
resv_msg_ptr->licenses = tres_license;
*free_tres_license = 1;
}
if (tres_bb && tres_bb[0] != '\0') {
resv_msg_ptr->burst_buffer = tres_bb;
*free_tres_bb = 1;
}
xfree(tmp);
return SLURM_SUCCESS;
error:
xfree(tmp);
xfree(tres_nodecnt);
xfree(tres_corecnt);
return SLURM_ERROR;
}