| /*****************************************************************************\ |
| * other_select.h - Define other select plugin needed for cray since |
| * it can leverage other plugins. |
| ***************************************************************************** |
| * Copyright (C) 2010 Lawrence Livermore National Security. |
| * Produced at Lawrence Livermore National Laboratory (cf, DISCLAIMER). |
| * Written by Danny Auble <da@llnl.gov> |
| * CODE-OCEC-09-009. All rights reserved. |
| * |
| * This file is part of SLURM, a resource management program. |
| * For details, see <https://computing.llnl.gov/linux/slurm/>. |
| * Please also read the included file: DISCLAIMER. |
| * |
| * SLURM is free software; you can redistribute it and/or modify it under |
| * the terms of the GNU General Public License as published by the Free |
| * Software Foundation; either version 2 of the License, or (at your option) |
| * any later version. |
| * |
| * In addition, as a special exception, the copyright holders give permission |
| * to link the code of portions of this program with the OpenSSL library under |
| * certain conditions as described in each individual source file, and |
| * distribute linked combinations including the two. You must obey the GNU |
| * General Public License in all respects for all of the code used other than |
| * OpenSSL. If you modify file(s) with this exception, you may extend this |
| * exception to your version of the file(s), but you are not obligated to do |
| * so. If you do not wish to do so, delete this exception statement from your |
| * version. If you delete this exception statement from all source files in |
| * the program, then also delete it here. |
| * |
| * SLURM is distributed in the hope that it will be useful, but WITHOUT ANY |
| * WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS |
| * FOR A PARTICULAR PURPOSE. See the GNU General Public License for more |
| * details. |
| * |
| * You should have received a copy of the GNU General Public License along |
| * with SLURM; if not, write to the Free Software Foundation, Inc., |
| * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA. |
| \*****************************************************************************/ |
| |
| #ifndef _CRAY_OTHER_SELECT_H |
| #define _CRAY_OTHER_SELECT_H |
| |
| #include <slurm/slurm.h> |
| #include <slurm/slurm_errno.h> |
| |
| #include "src/common/slurm_xlator.h" /* Must be first */ |
| #include "src/common/list.h" |
| #include "src/slurmctld/slurmctld.h" |
| |
| /* |
| * Initialize context for the "other" node selection plugin, i.e. the |
| * select plugin that the cray plugin leverages. |
| * RET int status code. NOTE(review): presumably SLURM_SUCCESS or |
| * SLURM_ERROR like other calls declared in this header - confirm. |
| */ |
| extern int other_select_init(void); |
| |
| /* |
| * Terminate the "other" select plugin and free all associated memory. |
| * RET int status code (exact values are not documented in this header) |
| */ |
| extern int other_select_fini(void); |
| |
| /* |
| * Save any global state information. |
| * IN dir_name - directory into which the data can be stored |
| * RET int status code (exact values are not documented in this header) |
| */ |
| extern int other_state_save(char *dir_name); |
| |
| /* |
| * Initialize context for the node selection plugin and |
| * restore any global state information. |
| * IN dir_name - directory from which the data can be restored |
| * RET int status code (exact values are not documented in this header) |
| */ |
| extern int other_state_restore(char *dir_name); |
| |
| /* |
| * Note the initialization of job records, issued upon restart of |
| * slurmctld and used to synchronize any job state. |
| * IN job_list - list of job records. NOTE(review): the element type is |
| * not visible here, presumably struct job_record - confirm. |
| */ |
| extern int other_job_init(List job_list); |
| |
| /* |
| * Note re/initialization of node record data structure. |
| * IN node_ptr - current node data |
| * IN node_cnt - number of node entries |
| */ |
| extern int other_node_init(struct node_record *node_ptr, int node_cnt); |
| |
| /* |
| * Note re/initialization of partition record data structure. |
| * IN part_list - list of partition records |
| * NOTE(review): the function is named "block_init" but is documented in |
| * terms of partitions - confirm the two terms mean the same thing here. |
| */ |
| extern int other_block_init(List part_list); |
| |
| /* |
| * Update a specific block (usually because something has gone wrong). |
| * IN block_desc_ptr - information about the block |
| * RET int status code (exact values are not documented in this header) |
| */ |
| extern int other_update_block(update_block_msg_t *block_desc_ptr); |
| |
| /* |
| * Update specific sub nodes (usually because something has gone wrong). |
| * IN block_desc_ptr - information about the block |
| * RET int status code (exact values are not documented in this header) |
| */ |
| extern int other_update_sub_node(update_block_msg_t *block_desc_ptr); |
| |
| /* |
| * Get select data from a plugin. |
| * IN dinfo - type of data to get |
| * (see enum select_plugindata_info) |
| * IN job_ptr - pointer to the job that's related to this query (may be NULL) |
| * IN/OUT data - the data to get. NOTE(review): the pointee type presumably |
| * depends on dinfo - confirm. |
| * NOTE(review): this comment used to document a "node_pts" node record |
| * argument; no such parameter exists in this prototype. |
| */ |
| extern int other_get_info_from_plugin(enum select_plugindata_info dinfo, |
| struct job_record *job_ptr, |
| void *data); |
| |
| /* |
| * Update a node's configuration. This happens when a node registers with |
| * more resources than originally configured (e.g. memory). |
| * IN index - index into the node record list |
| * RETURN SLURM_SUCCESS on success || SLURM_ERROR otherwise |
| */ |
| extern int other_update_node_config(int index); |
| |
| /* |
| * Update a node's state in the plugin. This should happen when a node is |
| * drained or put into a down state and then changed back. |
| * IN index - index into the node record list |
| * IN state - state to update to |
| * RETURN SLURM_SUCCESS on success || SLURM_ERROR otherwise |
| */ |
| extern int other_update_node_state(int index, uint16_t state); |
| |
| /* |
| * Alter the node count for a job given the type of system we are on. |
| * IN type - kind of alteration requested (see enum select_node_cnt) |
| * IN/OUT data - object to alter. NOTE(review): this comment used to name |
| * the argument "job_desc - current job desc"; the pointee type |
| * presumably depends on type - confirm. |
| */ |
| extern int other_alter_node_cnt(enum select_node_cnt type, void *data); |
| |
| /* |
| * Select the "best" nodes for given job from those available |
| * IN/OUT job_ptr - pointer to job being considered for initiation, |
| * sets start_time when job expected to start |
| * IN/OUT bitmap - map of nodes being considered for allocation on input, |
| * map of nodes actually to be assigned on output |
| * IN min_nodes - minimum number of nodes to allocate to job |
| * IN max_nodes - maximum number of nodes to allocate to job |
| * IN req_nodes - requested (or desired) count of nodes |
| * IN mode - SELECT_MODE_RUN_NOW: try to schedule job now |
| * SELECT_MODE_TEST_ONLY: test if job can ever run |
| * SELECT_MODE_WILL_RUN: determine when and where job can run |
| * IN preemptee_candidates - List of pointers to jobs which can be preempted |
| * IN/OUT preemptee_job_list - Pointer to list of job pointers. These are the |
| * jobs to be preempted to initiate the pending job. Not set |
| * if mode=SELECT_MODE_TEST_ONLY or input pointer is NULL. |
| * Existing list is appended to. |
| * RET zero on success, EINVAL otherwise |
| */ |
| extern int other_job_test(struct job_record *job_ptr, bitstr_t *bitmap, |
| uint32_t min_nodes, uint32_t max_nodes, |
| uint32_t req_nodes, uint16_t mode, |
| List preemptee_candidates, |
| List *preemptee_job_list); |
| |
| /* |
| * Note that initiation of a job is about to begin. Called immediately |
| * after other_job_test(). Executed from slurmctld. |
| * IN job_ptr - pointer to job being initiated |
| * RET int status code (exact values are not documented in this header) |
| */ |
| extern int other_job_begin(struct job_record *job_ptr); |
| |
| /* |
| * Determine if a job is ready to execute per the node select plugin. |
| * IN job_ptr - pointer to job being tested |
| * RET -1 on error, 1 if ready to execute, 0 otherwise |
| */ |
| extern int other_job_ready(struct job_record *job_ptr); |
| |
| /* |
| * Modify internal data structures for a job that has changed size. |
| * Only job shrinking is supported for now. |
| * IN job_ptr - the job that changed size |
| * IN node_ptr - NOTE(review): undocumented; presumably the node being |
| * removed from the job - confirm. |
| * RET: 0 or an error code |
| */ |
| extern int other_job_resized(struct job_record *job_ptr, |
| struct node_record *node_ptr); |
| |
| /* |
| * Note that termination of a job is starting. Executed from slurmctld. |
| * IN job_ptr - pointer to job being terminated |
| * RET int status code (exact values are not documented in this header) |
| */ |
| extern int other_job_fini(struct job_record *job_ptr); |
| |
| /* |
| * Suspend a job. Executed from slurmctld. |
| * IN job_ptr - pointer to the job being suspended |
| * RET SLURM_SUCCESS or an error code |
| */ |
| extern int other_job_suspend(struct job_record *job_ptr); |
| |
| /* |
| * Resume a job. Executed from slurmctld. |
| * IN job_ptr - pointer to the job being resumed |
| * RET SLURM_SUCCESS or an error code |
| */ |
| extern int other_job_resume(struct job_record *job_ptr); |
| |
| /* allocate storage for a select job credential |
| * RET jobinfo - storage for a select job credential |
| * NOTE: storage must be freed using other_select_jobinfo_free |
| */ |
| extern select_jobinfo_t *other_select_jobinfo_alloc(void); |
| |
| /* free storage previously allocated for a select job credential |
| * (see other_select_jobinfo_alloc) |
| * IN jobinfo - the select job credential to be freed |
| * RET - slurm error code |
| */ |
| extern int other_select_jobinfo_free(select_jobinfo_t *jobinfo); |
| |
| /* fill in a previously allocated select job credential |
| * IN/OUT jobinfo - updated select job credential |
| * IN data_type - type of data to enter into job credential |
| * (see enum select_jobdata_type) |
| * IN data - the data to enter into job credential |
| * RET int status code (exact values are not documented in this header) |
| */ |
| extern int other_select_jobinfo_set(select_jobinfo_t *jobinfo, |
| enum select_jobdata_type data_type, |
| void *data); |
| |
| /* get data from a select job credential |
| * IN jobinfo - the select job credential to read from |
| * IN data_type - type of data to get from job credential |
| * (see enum select_jobdata_type) |
| * OUT data - the data to get from job credential, caller must xfree |
| * data for data_type == SELECT_JOBDATA_PART_ID |
| * RET int status code (exact values are not documented in this header) |
| */ |
| extern int other_select_jobinfo_get(select_jobinfo_t *jobinfo, |
| enum select_jobdata_type data_type, |
| void *data); |
| |
| /* copy a select job credential |
| * IN jobinfo - the select job credential to be copied |
| * RET - the copy, or NULL on failure |
| * NOTE: the returned value must be freed using other_select_jobinfo_free |
| */ |
| extern select_jobinfo_t *other_select_jobinfo_copy( |
| select_jobinfo_t *jobinfo); |
| |
| /* pack a select job credential into a buffer in machine independent form |
| * IN jobinfo - the select job credential to be saved |
| * IN/OUT buffer - buffer to which the select credential is appended |
| * IN protocol_version - slurm protocol version of client |
| * RET - slurm error code |
| */ |
| extern int other_select_jobinfo_pack(select_jobinfo_t *jobinfo, |
| Buf buffer, |
| uint16_t protocol_version); |
| |
| /* unpack a select job credential from a buffer |
| * OUT jobinfo - the select job credential read |
| * IN buffer - buffer with select credential, read from its current |
| * pointer location |
| * IN protocol_version - slurm protocol version of client |
| * RET - slurm error code |
| * NOTE: the value returned in jobinfo must be freed using |
| * other_select_jobinfo_free |
| */ |
| extern int other_select_jobinfo_unpack(select_jobinfo_t **jobinfo, |
| Buf buffer, |
| uint16_t protocol_version); |
| |
| /* write select job info to a caller-supplied string buffer |
| * IN jobinfo - a select job credential |
| * OUT buf - location to write job info contents |
| * IN size - byte size of buf |
| * IN mode - print mode, see enum select_print_mode |
| * RET - the string, same as buf |
| */ |
| extern char *other_select_jobinfo_sprint(select_jobinfo_t *jobinfo, |
| char *buf, size_t size, int mode); |
| |
| /* write select job info to a string |
| * IN jobinfo - a select job credential |
| * IN mode - print mode, see enum select_print_mode |
| * RET - the string. NOTE(review): this prototype takes no buf argument |
| * (the old comment was copied from other_select_jobinfo_sprint), so |
| * the string is presumably newly allocated and must be xfree'd by |
| * the caller - confirm. |
| */ |
| extern char *other_select_jobinfo_xstrdup(select_jobinfo_t *jobinfo, |
| int mode); |
| |
| /*******************************************************\ |
| * NODE-SPECIFIC SELECT CREDENTIAL MANAGEMENT FUNCTIONS * |
| \*******************************************************/ |
| /* NOTE(review): contract is not documented in this header. Presumably the |
| * node-info counterpart of other_select_jobinfo_pack (packs nodeinfo |
| * into buffer for the given protocol_version) - confirm against the |
| * implementation. |
| */ |
| extern int other_select_nodeinfo_pack(select_nodeinfo_t *nodeinfo, |
| Buf buffer, |
| uint16_t protocol_version); |
| /* NOTE(review): contract is not documented in this header. Presumably the |
| * node-info counterpart of other_select_jobinfo_unpack (reads *nodeinfo |
| * from buffer for the given protocol_version) - confirm against the |
| * implementation, including who frees *nodeinfo. |
| */ |
| extern int other_select_nodeinfo_unpack(select_nodeinfo_t **nodeinfo, |
| Buf buffer, |
| uint16_t protocol_version); |
| /* NOTE(review): undocumented. Presumably allocates a select_nodeinfo_t that |
| * must be released with other_select_nodeinfo_free; the meaning of |
| * size is not visible here - confirm. |
| */ |
| extern select_nodeinfo_t *other_select_nodeinfo_alloc(uint32_t size); |
| /* NOTE(review): undocumented. Presumably frees a select_nodeinfo_t obtained |
| * from other_select_nodeinfo_alloc or other_select_nodeinfo_unpack and |
| * returns a slurm error code - confirm. |
| */ |
| extern int other_select_nodeinfo_free(select_nodeinfo_t *nodeinfo); |
| /* NOTE(review): undocumented. Presumably refreshes the select node info of |
| * all nodes; how last_query_time is used is not visible here - confirm. |
| */ |
| extern int other_select_nodeinfo_set_all(time_t last_query_time); |
| /* NOTE(review): undocumented. Presumably updates select node info for the |
| * nodes associated with job_ptr - confirm. |
| */ |
| extern int other_select_nodeinfo_set(struct job_record *job_ptr); |
| /* NOTE(review): undocumented. Presumably reads one item from nodeinfo: |
| * dinfo selects the item (see enum select_nodedata_type), state |
| * qualifies it by node state, and the result is stored through data |
| * - confirm against the implementation. |
| */ |
| extern int other_select_nodeinfo_get(select_nodeinfo_t *nodeinfo, |
| enum select_nodedata_type dinfo, |
| enum node_states state, |
| void *data); |
| |
| |
| /******************************************************\ |
| * NODE-SELECT PLUGIN SPECIFIC INFORMATION FUNCTIONS * |
| \******************************************************/ |
| |
| /* pack node-select plugin specific information into a buffer in |
| * machine independent form |
| * IN last_query_time - time of latest information consumer has |
| * IN show_flags - flags to control information output |
| * OUT buffer - location to hold the data, consumer must free |
| * IN protocol_version - slurm protocol version of client |
| * RET - slurm error code |
| */ |
| extern int other_pack_select_info(time_t last_query_time, uint16_t show_flags, |
| Buf *buffer, uint16_t protocol_version); |
| |
| /* Note reconfiguration or change in partition configuration. |
| * RET int status code (exact values are not documented in this header) */ |
| extern int other_reconfigure(void); |
| |
| #endif /* _CRAY_OTHER_SELECT_H */ |