| /*****************************************************************************\ |
| * Test gres.conf and system GPU normalization and merging logic. |
| ***************************************************************************** |
| * Copyright (C) SchedMD LLC. |
| * |
| * This file is part of Slurm, a resource management program. |
| * For details, see <https://slurm.schedmd.com/>. |
| * Please also read the included file: DISCLAIMER. |
| * |
| * Slurm is free software; you can redistribute it and/or modify it under |
| * the terms of the GNU General Public License as published by the Free |
| * Software Foundation; either version 2 of the License, or (at your option) |
| * any later version. |
| * |
| * In addition, as a special exception, the copyright holders give permission |
| * to link the code of portions of this program with the OpenSSL library under |
| * certain conditions as described in each individual source file, and |
| * distribute linked combinations including the two. You must obey the GNU |
| * General Public License in all respects for all of the code used other than |
| * OpenSSL. If you modify file(s) with this exception, you may extend this |
| * exception to your version of the file(s), but you are not obligated to do |
| * so. If you do not wish to do so, delete this exception statement from your |
| * version. If you delete this exception statement from all source files in |
| * the program, then also delete it here. |
| * |
| * Slurm is distributed in the hope that it will be useful, but WITHOUT ANY |
| * WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS |
| * FOR A PARTICULAR PURPOSE. See the GNU General Public License for more |
| * details. |
| * |
| * You should have received a copy of the GNU General Public License along |
| * with Slurm; if not, write to the Free Software Foundation, Inc., |
| * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA. |
| \*****************************************************************************/ |
| |
| #include <sys/stat.h> |
| #include "src/interfaces/gres.h" |
| #include "src/common/read_config.h" |
| #include "src/interfaces/select.h" |
| #include "src/common/xstring.h" |
| |
| /* |
| * test39.18.prog <etc_dir> <nodename> <conf_gres> [<debug_level>] |
| * |
| * etc_dir The directory containing slurm.conf, gres.conf, and |
| * fake_gpus.conf. |
| * nodename The name of the node. |
| * conf_gres A string indicating the GRES ostensibly parsed from a |
| * slurm.conf for the node. E.g., `gpu:4`. |
| * debug_level (optional) A number representing the log_level_t the program |
| * should use. If unspecified, defaults to LOG_LEVEL_INFO. |
| * LOG_LEVEL_INFO is the lowest log level allowed. |
| * Note that debug, debug2, and debug3 may produce too much output |
| * and cause expect to fail to parse things properly. This will |
| * show up as a test failure. Only use debug+ when debugging and |
| * developing tests, and NOT when running the tests in production. |
| * |
| * Note that slurm.conf only needs to specify the following fields: |
| * ControlMachine=test_machine |
| * ClusterName=test_cluster |
| * GresTypes=gpu,mps,nic,mic,tmpdisk |
| * |
| * The actual GRES for the node is specified in conf_gres, not slurm.conf. This |
| * makes it so we don't need to re-create the slurm.conf each time we run this |
| * test runner program. |
| * |
| * However, gres.conf and fake_gpus.conf do need to be re-created for each test. |
| */ |
| int main(int argc, char *argv[]) |
| { |
| log_options_t opts = LOG_OPTS_STDERR_ONLY; |
| int rc; |
| char *etc_dir = NULL; |
| char *node_name = NULL; |
| char *slurm_conf_gres_str = NULL; |
| char *slurm_conf = NULL; |
| char *gres_conf = NULL; |
| char *fake_gpus_conf = NULL; |
| struct stat stat_buf; |
| list_t *gres_list = NULL; |
| log_level_t debug_level = LOG_LEVEL_INFO; |
| |
| if (argc < 4) { |
| printf("FAILURE: Not enough arguments!\n"); |
| exit(1); |
| } |
| |
| if (argc > 5) { |
| printf("FAILURE: Too many arguments!\n"); |
| exit(1); |
| } |
| |
| etc_dir = argv[1]; |
| node_name = argv[2]; |
| slurm_conf_gres_str = argv[3]; |
| if (argc == 5) |
| debug_level = atoi(argv[4]); |
| |
| if (debug_level < LOG_LEVEL_INFO) { |
| printf("FAILURE: LOG_LEVEL_INFO is the lowest log level allowed!\n"); |
| exit(1); |
| } |
| |
| xstrfmtcat(slurm_conf, "%s/%s", etc_dir, "slurm.conf"); |
| xstrfmtcat(gres_conf, "%s/%s", etc_dir, "gres.conf"); |
| xstrfmtcat(fake_gpus_conf, "%s/%s", etc_dir, "fake_gpus.conf"); |
| |
| if (stat(slurm_conf, &stat_buf) != 0) { |
| printf("FAILURE: Could not find slurm_conf file at %s\n", |
| slurm_conf); |
| exit(1); |
| } |
| if (stat(gres_conf, &stat_buf) != 0) { |
| printf("FAILURE: Could not find gres_conf file at %s\n", |
| gres_conf); |
| exit(1); |
| } |
| if (stat(fake_gpus_conf, &stat_buf) != 0) { |
| printf("FAILURE: Could not find fake_gpus_conf file at %s\n", |
| fake_gpus_conf); |
| exit(1); |
| } |
| printf("slurm_conf: %s\n", slurm_conf); |
| printf("gres_conf: %s\n", gres_conf); |
| printf("fake_gpus_conf: %s\n", fake_gpus_conf); |
| |
| opts.stderr_level = debug_level; |
| log_init(argv[0], opts, SYSLOG_FACILITY_USER, NULL); |
| |
| // Override where Slurm looks for conf files |
| setenv("SLURM_CONF", slurm_conf, 1); |
| |
| slurm_init(NULL); |
| |
| if (select_g_init() != SLURM_SUCCESS) |
| fatal("failed to initialize node selection plugin"); |
| |
| // Initialize GRES info (from slurm.conf) |
| gres_init_node_config(slurm_conf_gres_str, &gres_list); |
| rc = gres_g_node_config_load(4, node_name, gres_list, NULL, NULL); |
| FREE_NULL_LIST(gres_list); |
| if (rc != SLURM_SUCCESS) { |
| slurm_perror("FAILURE: gres_node_config_load"); |
| exit(1); |
| } |
| |
| /* |
| * You'll have to reconfigure Slurm with --enable-memory-leak-debug to eliminate |
| * all "possibly lost" blocks and to see the full call stack of valgrind memory |
| * errors inside plugins. See plugin_unload() in src/common/plugin.c |
| */ |
| #ifdef USING_VALGRIND |
| // Clean up for valgrind |
| slurm_conf_destroy(); |
| gres_fini(); |
| select_g_fini(); |
| log_fini(); |
| xfree(slurm_conf); |
| xfree(gres_conf); |
| xfree(fake_gpus_conf); |
| #endif |
| |
| printf("Test ran to completion\n"); |
| exit(0); |
| } |