blob: a5944e33d1216c926060dba14971e75f6e979ac9 [file] [log] [blame] [edit]
/*****************************************************************************\
* resv_reports.c - functions for generating reservation reports
* from accounting infrastructure.
*****************************************************************************
*
* Copyright (C) 2008 Lawrence Livermore National Security.
* Produced at Lawrence Livermore National Laboratory (cf, DISCLAIMER).
* Written by Danny Auble <da@llnl.gov>
* CODE-OCEC-09-009. All rights reserved.
*
* This file is part of SLURM, a resource management program.
* For details, see <http://slurm.schedmd.com/>.
* Please also read the included file: DISCLAIMER.
*
* SLURM is free software; you can redistribute it and/or modify it under
* the terms of the GNU General Public License as published by the Free
* Software Foundation; either version 2 of the License, or (at your option)
* any later version.
*
* In addition, as a special exception, the copyright holders give permission
* to link the code of portions of this program with the OpenSSL library under
* certain conditions as described in each individual source file, and
* distribute linked combinations including the two. You must obey the GNU
* General Public License in all respects for all of the code used other than
* OpenSSL. If you modify file(s) with this exception, you may extend this
* exception to your version of the file(s), but you are not obligated to do
* so. If you do not wish to do so, delete this exception statement from your
* version. If you delete this exception statement from all source files in
* the program, then also delete it here.
*
* SLURM is distributed in the hope that it will be useful, but WITHOUT ANY
* WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
* FOR A PARTICULAR PURPOSE. See the GNU General Public License for more
* details.
*
* You should have received a copy of the GNU General Public License along
* with SLURM; if not, write to the Free Software Foundation, Inc.,
* 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
\*****************************************************************************/
#include "cluster_reports.h"
/*
 * Identifiers for the columns the reservation report can print.  A value
 * is stored in print_field_t.type by _setup_print_fields_list() and is
 * switched on in resv_utilization() to pick the datum handed to the
 * field's print routine.
 */
enum {
PRINT_RESV_NAME, /* reservation name */
PRINT_RESV_CLUSTER, /* cluster of the reservation */
PRINT_RESV_CPUS, /* cpu count of the reservation */
PRINT_RESV_ACPU, /* allocated seconds, printed against the total */
PRINT_RESV_DCPU, /* down seconds, printed against the total */
PRINT_RESV_ICPU, /* idle seconds (total - allocated - down) */
PRINT_RESV_NODES, /* nodes string of the reservation */
PRINT_RESV_ASSOCS, /* associations string of the reservation */
PRINT_RESV_START, /* reservation start time */
PRINT_RESV_END, /* reservation end time */
PRINT_RESV_FLAGS, /* NOTE: no format keyword in this file selects it */
PRINT_RESV_TIME, /* wall-clock length (end - start) in seconds */
PRINT_RESV_CPUTIME, /* wall-clock length multiplied by the cpu count */
};
/*
 * Grouping modes for a report.
 * NOTE(review): nothing in the visible part of this file references this
 * type; presumably it mirrors a definition used by another report --
 * confirm before relying on or removing it.
 */
typedef enum {
GROUP_BY_ACCOUNT,
GROUP_BY_ACCOUNT_JOB_SIZE,
GROUP_BY_ACCOUNT_JOB_SIZE_DURATION,
GROUP_BY_USER,
GROUP_BY_USER_JOB_SIZE,
GROUP_BY_USER_JOB_SIZE_DURATION,
GROUP_BY_NONE
} report_grouping_t;
/*
 * Columns selected for the report currently being printed.  Created in
 * resv_utilization() (or lazily in _setup_print_fields_list()), filled by
 * _setup_print_fields_list(), and destroyed and reset to NULL at the end
 * of resv_utilization().
 */
static List print_fields_list = NULL; /* types are of print_field_t */
/*
 * _set_resv_cond - translate "keyword=value" style arguments into a
 *	reservation query condition.
 *
 * IN/OUT start   - index of the first argument to look at; on return it
 *		    holds the index at which processing stopped (argc, or
 *		    the offending argument when a duplicate Nodes= is seen)
 * IN argc/argv   - argument vector
 * IN/OUT resv_cond - condition to fill in; with_usage is forced to 1 and
 *		    cluster_list is created if missing
 * IN format_list - if not NULL, receives the values given with Format=
 *
 * An argument without '=' is "all_clusters" (or a prefix of it) or else a
 * reservation name.  Keywords are matched case-insensitively on the typed
 * prefix, and the first branch that matches wins, so branch order matters.
 *
 * RET 1 if a Names/Clusters/End/Flags/Ids/Nodes/Start option was seen,
 *     0 otherwise, SLURM_ERROR if resv_cond is NULL.
 */
static int _set_resv_cond(int *start, int argc, char *argv[],
			  slurmdb_reservation_cond_t *resv_cond,
			  List format_list)
{
	int idx;
	int cond_set = 0;
	int use_all_clusters = all_clusters_flag;
	time_t t_begin, t_finish;

	if (!resv_cond) {
		error("We need an slurmdb_reservation_cond to call this");
		return SLURM_ERROR;
	}

	resv_cond->with_usage = 1;

	if (!resv_cond->cluster_list)
		resv_cond->cluster_list = list_create(slurm_destroy_char);

	for (idx = *start; idx < argc; idx++) {
		char *arg = argv[idx];
		int val_off = parse_option_end(arg);
		int key_len = 0;
		int min1, min2;
		char *value;

		if (val_off) {
			/* keyword is what precedes the '='; also accept
			 * a doubled "==" before the value */
			key_len = val_off - 1;
			if (arg[val_off] == '=')
				val_off++;
		} else {
			key_len = strlen(arg);
		}

		/* number of characters compared, with the minimum
		 * abbreviation length the individual keywords require */
		min1 = MAX(key_len, 1);
		min2 = MAX(key_len, 2);
		value = arg + val_off;

		if (!val_off && !strncasecmp(arg, "all_clusters", min1)) {
			use_all_clusters = 1;
		} else if (!val_off || !strncasecmp(arg, "Names", min1)) {
			/* a bare word is treated as a reservation name */
			if (!resv_cond->name_list)
				resv_cond->name_list =
					list_create(slurm_destroy_char);
			slurm_addto_char_list(resv_cond->name_list, value);
			cond_set = 1;
		} else if (!strncasecmp(arg, "Clusters", min1)) {
			slurm_addto_char_list(resv_cond->cluster_list, value);
			cond_set = 1;
		} else if (!strncasecmp(arg, "End", min1)) {
			resv_cond->time_end = parse_time(value, 1);
			cond_set = 1;
		} else if (!strncasecmp(arg, "Flags", min2)) {
			/* FIX ME: make flags work here */
			//resv_cond->flags = parse_resv_flags(argv[i]+end);
			cond_set = 1;
		} else if (!strncasecmp(arg, "Format", min2)) {
			if (format_list)
				slurm_addto_char_list(format_list, value);
		} else if (!strncasecmp(arg, "Ids", min1)) {
			if (!resv_cond->id_list)
				resv_cond->id_list =
					list_create(slurm_destroy_char);
			slurm_addto_char_list(resv_cond->id_list, value);
			cond_set = 1;
		} else if (!strncasecmp(arg, "Nodes", min1)) {
			if (resv_cond->nodes) {
				/* only one Nodes= is accepted; stop parsing */
				error("You already specified nodes '%s' "
				      " combine your request into 1 nodes=.",
				      resv_cond->nodes);
				exit_code = 1;
				break;
			}
			resv_cond->nodes = xstrdup(value);
			cond_set = 1;
		} else if (!strncasecmp(arg, "Start", min1)) {
			resv_cond->time_start = parse_time(value, 1);
			cond_set = 1;
		} else {
			exit_code = 1;
			fprintf(stderr," Unknown condition: %s\n"
				"Use keyword set to modify value\n", arg);
		}
	}
	*start = idx;

	/* no cluster requested and not "all clusters": fall back to the
	 * cluster name returned by slurm_get_cluster_name() */
	if (!use_all_clusters && !list_count(resv_cond->cluster_list)) {
		char *this_cluster = slurm_get_cluster_name();
		if (this_cluster)
			list_append(resv_cond->cluster_list, this_cluster);
	}

	/* Normalize the time window through time_t temporaries instead of
	 * handing the struct members to the helper directly; the original
	 * author observed the condition getting corrupted on some 64 bit
	 * machines otherwise.
	 */
	t_begin = resv_cond->time_start;
	t_finish = resv_cond->time_end;
	slurmdb_report_set_start_end_time(&t_begin, &t_finish);
	resv_cond->time_start = t_begin;
	resv_cond->time_end = t_finish;

	return cond_set;
}
/*
 * _setup_print_fields_list - turn the user's format keywords into
 *	print_field_t entries appended to print_fields_list.
 *
 * IN format_list - list of char * keywords.  A keyword may carry a
 *		    "%<width>" suffix; a non-zero width replaces the
 *		    column's default length.  The '%' is overwritten with
 *		    '\0' in place, so the strings in format_list are
 *		    modified.
 *
 * Keywords are matched case-insensitively on the typed prefix (most need
 * at least two characters, "down" and "idle" one); the first matching
 * branch wins.  Unknown keywords set exit_code, are reported on stderr
 * and skipped.
 *
 * RET SLURM_ERROR if format_list is NULL or empty, else SLURM_SUCCESS.
 */
static int _setup_print_fields_list(List format_list)
{
	ListIterator itr = NULL;
	print_field_t *field = NULL;
	char *object = NULL;
	int time_len = 9;

	if (!format_list || !list_count(format_list)) {
		exit_code=1;
		fprintf(stderr, " we need a format list "
			"to set up the print.\n");
		return SLURM_ERROR;
	}

	if (!print_fields_list)
		print_fields_list = list_create(destroy_print_field);

	/* The Allocated/Down/Idle columns share one default width, which
	 * is larger for the "*_PER" time formats.  It does not change
	 * while the list is processed, so work it out once.
	 */
	if (time_format == SLURMDB_REPORT_TIME_SECS_PER
	    || time_format == SLURMDB_REPORT_TIME_MINS_PER
	    || time_format == SLURMDB_REPORT_TIME_HOURS_PER)
		time_len = 20;

	itr = list_iterator_create(format_list);
	while ((object = list_next(itr))) {
		char *tmp_char = NULL;
		int command_len = 0;
		int newlen = 0;

		/* split off an optional "%<width>" suffix ("\%" is not a
		 * valid C escape sequence, a plain "%" is what is meant) */
		if ((tmp_char = strstr(object, "%"))) {
			newlen = atoi(tmp_char+1);
			tmp_char[0] = '\0';
		}

		command_len = strlen(object);

		field = xmalloc(sizeof(print_field_t));
		if (!strncasecmp("allocated", object,
				 MAX(command_len, 2))) {
			field->type = PRINT_RESV_ACPU;
			field->name = xstrdup("Allocated");
			field->len = time_len;
			field->print_routine = slurmdb_report_print_time;
		} else if (!strncasecmp("Associations",
					object, MAX(command_len, 2))) {
			field->type = PRINT_RESV_ASSOCS;
			field->name = xstrdup("Associations");
			field->len = 15;
			field->print_routine = print_fields_str;
		} else if (!strncasecmp("Cluster", object,
					MAX(command_len, 2))) {
			field->type = PRINT_RESV_CLUSTER;
			field->name = xstrdup("Cluster");
			field->len = 9;
			field->print_routine = print_fields_str;
		} else if (!strncasecmp("cpucount", object,
					MAX(command_len, 2))) {
			field->type = PRINT_RESV_CPUS;
			field->name = xstrdup("CPU count");
			field->len = 9;
			field->print_routine = print_fields_uint;
		} else if (!strncasecmp("down", object, MAX(command_len, 1))) {
			field->type = PRINT_RESV_DCPU;
			field->name = xstrdup("Down");
			field->len = time_len;
			field->print_routine = slurmdb_report_print_time;
		} else if (!strncasecmp("idle", object, MAX(command_len, 1))) {
			field->type = PRINT_RESV_ICPU;
			field->name = xstrdup("Idle");
			field->len = time_len;
			field->print_routine = slurmdb_report_print_time;
		} else if (!strncasecmp("Nodes", object, MAX(command_len, 2))) {
			field->type = PRINT_RESV_NODES;
			field->name = xstrdup("Nodes");
			field->len = 15;
			field->print_routine = print_fields_str;
		} else if (!strncasecmp("Name", object,
					MAX(command_len, 2))) {
			field->type = PRINT_RESV_NAME;
			field->name = xstrdup("Name");
			field->len = 9;
			field->print_routine = print_fields_str;
		} else if (!strncasecmp("Start", object,
					MAX(command_len, 2))) {
			field->type = PRINT_RESV_START;
			field->name = xstrdup("Start");
			field->len = 19;
			field->print_routine = print_fields_date;
		} else if (!strncasecmp("End", object,
					MAX(command_len, 2))) {
			field->type = PRINT_RESV_END;
			field->name = xstrdup("End");
			field->len = 19;
			field->print_routine = print_fields_date;
		} else if (!strncasecmp("TotalTime", object,
					MAX(command_len, 2))) {
			field->type = PRINT_RESV_TIME;
			field->name = xstrdup("TotalTime");
			field->len = 9;
			field->print_routine = print_fields_time_from_secs;
		} else if (!strncasecmp("CPUTime", object,
					MAX(command_len, 2))) {
			field->type = PRINT_RESV_CPUTIME;
			field->name = xstrdup("CPUTime");
			field->len = 9;
			field->print_routine = print_fields_time_from_secs;
		} else {
			exit_code=1;
			fprintf(stderr, " Unknown field '%s'\n", object);
			xfree(field);
			continue;
		}

		/* a user supplied width overrides the default */
		if (newlen)
			field->len = newlen;

		list_append(print_fields_list, field);
	}
	list_iterator_destroy(itr);

	return SLURM_SUCCESS;
}
/*
 * _get_resv_list - build a reservation condition from the arguments,
 *	query the database and, when headers are enabled, print the
 *	report banner.
 *
 * IN argc/argv    - arguments handed to _set_resv_cond()
 * IN report_name  - title printed in the banner
 * IN format_list  - receives any Format= values found in argv
 *
 * RET the list returned by slurmdb_reservations_get(), or NULL when the
 *     query fails (exit_code is set to 1 and a message is written to
 *     stderr).  The temporary condition is destroyed on every path.
 */
static List _get_resv_list(int argc, char *argv[],
			   char *report_name, List format_list)
{
	slurmdb_reservation_cond_t *resv_cond =
		xmalloc(sizeof(slurmdb_reservation_cond_t));
	int i=0;
	List resv_list = NULL;

	resv_cond->with_usage = 1;

	_set_resv_cond(&i, argc, argv, resv_cond, format_list);

	resv_list = slurmdb_reservations_get(db_conn, resv_cond);
	if (!resv_list) {
		exit_code=1;
		fprintf(stderr, " Problem with resv query.\n");
	} else if (print_fields_have_header) {
		char start_char[20];
		char end_char[20];
		time_t my_start = resv_cond->time_start;
		/* the banner shows the last second before time_end */
		time_t my_end = resv_cond->time_end-1;

		slurm_make_time_str(&my_start,
				    start_char, sizeof(start_char));
		slurm_make_time_str(&my_end,
				    end_char, sizeof(end_char));
		printf("----------------------------------------"
		       "----------------------------------------\n");
		printf("%s %s - %s\n",
		       report_name, start_char, end_char);
		switch(time_format) {
		case SLURMDB_REPORT_TIME_PERCENT:
			printf("Time reported in %s\n", time_format_string);
			break;
		default:
			printf("Time reported in CPU %s\n", time_format_string);
			break;
		}
		printf("----------------------------------------"
		       "----------------------------------------\n");
	}

	/* single exit: the condition used to leak when the query failed */
	slurmdb_destroy_reservation_cond(resv_cond);

	return resv_list;
}
/*
 * resv_utilization - print the "Reservation Utilization" report.
 *
 * IN argc/argv - report options, parsed by _get_resv_list() /
 *		  _set_resv_cond()
 *
 * Records sharing a reservation id are merged into one line, the merged
 * lines are sorted with sort_reservations_dec() and one row per
 * reservation is printed using the columns selected with Format= (the
 * default is "Cl,name,start,end,al,i").  Reservations whose merged
 * duration is not positive are skipped.
 *
 * RET always SLURM_SUCCESS; a failed query is reported through the
 *     global exit_code by _get_resv_list().
 */
extern int resv_utilization(int argc, char *argv[])
{
	int rc = SLURM_SUCCESS;
	ListIterator itr = NULL;
	ListIterator tot_itr = NULL;
	ListIterator itr2 = NULL;
	slurmdb_reservation_rec_t *resv = NULL;
	slurmdb_reservation_rec_t *tot_resv = NULL;
	print_field_t *field = NULL;
	int32_t total_time = 0;
	List resv_list = NULL;
	List tot_resv_list = NULL;
	List format_list = list_create(slurm_destroy_char);
	int field_count = 0;

	print_fields_list = list_create(destroy_print_field);

	if (!(resv_list = _get_resv_list(argc, argv,
					 "Reservation Utilization",
					 format_list)))
		goto end_it;

	if (!list_count(format_list))
		slurm_addto_char_list(format_list,
				      "Cl,name,start,end,al,i");

	_setup_print_fields_list(format_list);
	list_destroy(format_list);
	format_list = NULL;	/* already released, see end_it */

	/* we will just use the pointers returned from the
	   get_resv_list here, so don't remove them
	*/
	tot_resv_list = list_create(NULL);

	itr = list_iterator_create(resv_list);
	tot_itr = list_iterator_create(tot_resv_list);
	itr2 = list_iterator_create(print_fields_list);

	print_fields_header(print_fields_list);

	field_count = list_count(print_fields_list);

	/* compress all the reservations into a single reservation.
	   Since reservations can have multiple entries like if the
	   node count changes or something after the reservation
	   starts.  Here we collapse them into 1 record.
	*/
	while ((resv = list_next(itr))) {
		while ((tot_resv = list_next(tot_itr))) {
			if (tot_resv->id == resv->id) {
				/* get an average of cpus if the
				   reservation changes we will just
				   get an average.
				*/
				tot_resv->cpus += resv->cpus;
				tot_resv->cpus /= 2;
				tot_resv->alloc_secs += resv->alloc_secs;
				tot_resv->down_secs += resv->down_secs;
				if (resv->time_start < tot_resv->time_start)
					tot_resv->time_start = resv->time_start;
				if (resv->time_end > tot_resv->time_end)
					tot_resv->time_end = resv->time_end;
				break;
			}
		}
		/* tot_resv is NULL here when no record with this id
		 * was found, i.e. this is the first one seen */
		if (!tot_resv)
			list_append(tot_resv_list, resv);

		list_iterator_reset(tot_itr);
	}

	list_sort(tot_resv_list, (ListCmpF)sort_reservations_dec);
	list_iterator_reset(tot_itr);

	while ((tot_resv = list_next(tot_itr))) {
		uint64_t idle_secs = 0, total_reported = 0, used_secs = 0;
		int curr_inx = 1;

		total_time = tot_resv->time_end - tot_resv->time_start;
		if (total_time <= 0)
			continue;

		/* Widen before multiplying: casting the finished product
		 * cannot undo an overflow that already happened in the
		 * narrower type.  total_time is known to be positive.
		 */
		total_reported = (uint64_t)total_time * tot_resv->cpus;

		/* The averaged cpu count can make the reported total
		 * smaller than what was actually used; report no idle
		 * time then instead of a wrapped-around unsigned value.
		 */
		used_secs = (uint64_t)tot_resv->alloc_secs
			+ tot_resv->down_secs;
		if (used_secs < total_reported)
			idle_secs = total_reported - used_secs;
		else
			idle_secs = 0;

		while ((field = list_next(itr2))) {
			/* tells the print routine this is the last column */
			int last = (curr_inx == field_count);

			switch(field->type) {
			case PRINT_RESV_NAME:
				field->print_routine(field,
						     tot_resv->name,
						     last);
				break;
			case PRINT_RESV_CLUSTER:
				field->print_routine(field,
						     tot_resv->cluster,
						     last);
				break;
			case PRINT_RESV_CPUS:
				field->print_routine(field,
						     tot_resv->cpus,
						     last);
				break;
			case PRINT_RESV_ACPU:
				field->print_routine(field,
						     tot_resv->alloc_secs,
						     total_reported,
						     last);
				break;
			case PRINT_RESV_DCPU:
				field->print_routine(field,
						     tot_resv->down_secs,
						     total_reported,
						     last);
				break;
			case PRINT_RESV_ICPU:
				field->print_routine(field,
						     idle_secs,
						     total_reported,
						     last);
				break;
			case PRINT_RESV_NODES:
				field->print_routine(field,
						     tot_resv->nodes,
						     last);
				break;
			case PRINT_RESV_ASSOCS:
				field->print_routine(field,
						     tot_resv->assocs,
						     last);
				break;
			case PRINT_RESV_START:
				field->print_routine(field,
						     tot_resv->time_start,
						     last);
				break;
			case PRINT_RESV_END:
				field->print_routine(field,
						     tot_resv->time_end,
						     last);
				break;
			case PRINT_RESV_TIME:
				field->print_routine(field,
						     (uint64_t)total_time,
						     last);
				break;
			case PRINT_RESV_CPUTIME:
				field->print_routine(field,
						     total_reported,
						     last);
				break;
			default:
				field->print_routine(
					field, NULL,
					last);
				break;
			}
			curr_inx++;
		}
		list_iterator_reset(itr2);
		printf("\n");
	}

	list_iterator_destroy(tot_itr);
	list_iterator_destroy(itr2);
	list_iterator_destroy(itr);

end_it:
	/* still set only when the query failed before the format list
	 * was consumed; it used to leak on that path */
	if (format_list) {
		list_destroy(format_list);
		format_list = NULL;
	}

	if (resv_list) {
		list_destroy(resv_list);
		resv_list = NULL;
	}

	if (tot_resv_list) {
		list_destroy(tot_resv_list);
		tot_resv_list = NULL;
	}

	if (print_fields_list) {
		list_destroy(print_fields_list);
		print_fields_list = NULL;
	}

	return rc;
}