| /*****************************************************************************\ |
| * oracle.c - Infrastructure for the bf_topopt/"oracle" subsystem |
| * |
| * The oracle() function controls job start delays based on |
| * fragmentation costs, optimizing job placement for efficiency. |
| * |
| ***************************************************************************** |
| * Copyright (C) SchedMD LLC. |
| * |
| * This file is part of Slurm, a resource management program. |
| * For details, see <https://slurm.schedmd.com/>. |
| * Please also read the included file: DISCLAIMER. |
| * |
| * Slurm is free software; you can redistribute it and/or modify it under |
| * the terms of the GNU General Public License as published by the Free |
| * Software Foundation; either version 2 of the License, or (at your option) |
| * any later version. |
| * |
| * In addition, as a special exception, the copyright holders give permission |
| * to link the code of portions of this program with the OpenSSL library under |
| * certain conditions as described in each individual source file, and |
| * distribute linked combinations including the two. You must obey the GNU |
| * General Public License in all respects for all of the code used other than |
| * OpenSSL. If you modify file(s) with this exception, you may extend this |
| * exception to your version of the file(s), but you are not obligated to do |
| * so. If you do not wish to do so, delete this exception statement from your |
| * version. If you delete this exception statement from all source files in |
| * the program, then also delete it here. |
| * |
| * Slurm is distributed in the hope that it will be useful, but WITHOUT ANY |
| * WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS |
| * FOR A PARTICULAR PURPOSE. See the GNU General Public License for more |
| * details. |
| * |
| * You should have received a copy of the GNU General Public License along |
| * with Slurm; if not, write to the Free Software Foundation, Inc., |
| * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA. |
| \*****************************************************************************/ |
| |
| #include "src/interfaces/topology.h" |
| |
| #include "backfill.h" |
| #include "oracle.h" |
| |
| int bf_topopt_iterations; |
| |
| static bf_slot_t *slots; |
| int used_slots; |
| |
| static int _get_bitmap_from_nspace(node_space_map_t *node_space, |
| time_t start_time, bitstr_t *out_bitmap, |
| uint32_t *fragmentation) |
| { |
| int j = 0; |
| while (true) { |
| if ((node_space[j].end_time > start_time) && |
| (node_space[j].begin_time <= start_time)) { |
| bit_copybits(out_bitmap, |
| node_space[j].avail_bitmap); |
| *fragmentation = node_space[j].fragmentation; |
| |
| return SLURM_SUCCESS; |
| } |
| |
| if ((j = node_space[j].next) == 0) |
| return SLURM_ERROR; |
| } |
| } |
| |
| static void _add_slot(job_record_t *job_ptr, bitstr_t *job_bitmap, |
| uint32_t time_limit, uint32_t boot_time, |
| node_space_map_t *node_space) |
| { |
| bf_slot_t *new_slot; |
| uint32_t previous_cluster_score; |
| int rc; |
| |
| if (used_slots >= bf_topopt_iterations) |
| return; |
| |
| new_slot = &(slots[used_slots]); |
| |
| |
| rc = _get_bitmap_from_nspace(node_space, job_ptr->start_time, |
| new_slot->cluster_bitmap, |
| &previous_cluster_score); |
| if (rc == SLURM_SUCCESS) { |
| bit_and_not(new_slot->cluster_bitmap, new_slot->job_bitmap); |
| new_slot->cluster_score = |
| topology_g_get_fragmentation(new_slot->cluster_bitmap); |
| |
| COPY_BITMAP(new_slot->job_bitmap, job_bitmap); |
| |
| COPY_BITMAP(new_slot->job_mask, job_bitmap); |
| |
| if (IS_JOB_WHOLE_TOPO(job_ptr)) |
| topology_g_whole_topo(new_slot->job_mask, |
| job_ptr->part_ptr->topology_idx); |
| |
| bit_not(new_slot->job_mask); |
| |
| new_slot->job_score = |
| topology_g_get_fragmentation(new_slot->job_mask); |
| new_slot->start = job_ptr->start_time; |
| new_slot->boot_time = boot_time; |
| new_slot->time_limit = time_limit; |
| |
| log_flag(BACKFILL, "%pJ add slot:%d start_time:%ld previous_cluster_score:%u cluster_score:%u job_score:%u", |
| job_ptr, used_slots, new_slot->start, |
| previous_cluster_score, new_slot->cluster_score, |
| new_slot->job_score); |
| |
| (used_slots)++; |
| } |
| |
| return; |
| } |
| |
| void init_oracle(void) |
| { |
| slots = xcalloc(bf_topopt_iterations, sizeof(bf_slot_t)); |
| for (int i = 0; i < bf_topopt_iterations; i++) { |
| slots[i].job_bitmap = bit_alloc(node_record_count); |
| slots[i].job_mask = bit_alloc(node_record_count); |
| slots[i].cluster_bitmap = bit_alloc(node_record_count); |
| } |
| } |
| |
| void fini_oracle(void) |
| { |
| for (int i = 0; i < bf_topopt_iterations; i++) { |
| FREE_NULL_BITMAP(slots[i].job_bitmap); |
| FREE_NULL_BITMAP(slots[i].job_mask); |
| FREE_NULL_BITMAP(slots[i].cluster_bitmap); |
| } |
| xfree(slots); |
| } |
| |
| /* |
| * Select the "best" slot for given job from those available |
| * IN/OUT job_ptr - pointer to job being considered |
| * IN/OUT job_bitmap - map of nodes being considered for allocation on input, |
| * map of nodes choose to allocation on output |
| * IN later_start |
| * IN/OUT time_limit - time_limit of job |
| * IN/OUT boot_time - boot_time of job |
| * IN node_space |
| * RET true - When we should check the later start of the job |
| * false if we want to start/plan. |
| */ |
| |
| bool oracle(job_record_t *job_ptr, bitstr_t *job_bitmap, time_t later_start, |
| uint32_t *time_limit, uint32_t *boot_time, |
| node_space_map_t *node_space) |
| { |
| /* |
| * Always if possible add a new slot to slots array |
| */ |
| if (used_slots < bf_topopt_iterations) |
| _add_slot(job_ptr, job_bitmap, *time_limit, *boot_time, |
| node_space); |
| |
| /* |
| * The code below is only an example implementation |
| */ |
| |
| /* |
| * Check later if later_start set and we have space in slots array |
| */ |
| if (later_start && used_slots < bf_topopt_iterations) |
| return true; |
| |
| if (used_slots > 0) { |
| int best_slot = 0; |
| |
| /* |
| * Find slot with minimal job_score |
| */ |
| for (int i = 1; i < used_slots; i++) |
| if (slots[best_slot].job_score > slots[i].job_score) |
| best_slot = i; |
| |
| /* |
| * Set start_time and job_bitmap according to the 'best' slot |
| */ |
| job_ptr->start_time = slots[best_slot].start; |
| bit_copybits(job_bitmap, slots[best_slot].job_bitmap); |
| *time_limit = slots[best_slot].time_limit; |
| *boot_time = slots[best_slot].boot_time; |
| log_flag(BACKFILL, "%pJ use:%u start_time: %ld", |
| job_ptr, best_slot, job_ptr->start_time); |
| } |
| |
| return false; |
| } |