| /*****************************************************************************\ |
| * as_ext_dbd.c - External Database connections |
| ***************************************************************************** |
| * Copyright (C) SchedMD LLC. |
| * |
| * This file is part of Slurm, a resource management program. |
| * For details, see <https://slurm.schedmd.com/>. |
| * Please also read the included file: DISCLAIMER. |
| * |
| * Slurm is free software; you can redistribute it and/or modify it under |
| * the terms of the GNU General Public License as published by the Free |
| * Software Foundation; either version 2 of the License, or (at your option) |
| * any later version. |
| * |
| * In addition, as a special exception, the copyright holders give permission |
| * to link the code of portions of this program with the OpenSSL library under |
| * certain conditions as described in each individual source file, and |
| * distribute linked combinations including the two. You must obey the GNU |
| * General Public License in all respects for all of the code used other than |
| * OpenSSL. If you modify file(s) with this exception, you may extend this |
| * exception to your version of the file(s), but you are not obligated to do |
| * so. If you do not wish to do so, delete this exception statement from your |
| * version. If you delete this exception statement from all source files in |
| * the program, then also delete it here. |
| * |
| * Slurm is distributed in the hope that it will be useful, but WITHOUT ANY |
| * WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS |
| * FOR A PARTICULAR PURPOSE. See the GNU General Public License for more |
| * details. |
| * |
| * You should have received a copy of the GNU General Public License along |
| * with Slurm; if not, write to the Free Software Foundation, Inc., |
| * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA. |
| \*****************************************************************************/ |
| |
| #include "src/common/slurm_xlator.h" |
| |
| #include "src/interfaces/accounting_storage.h" |
| |
| #if HAVE_SYS_PRCTL_H |
| # include <sys/prctl.h> |
| #endif |
| |
| #include "dbd_conn.h" |
| #include "as_ext_dbd.h" |
| |
| static list_t *ext_conns_list; |
| static pthread_t ext_thread_tid = 0; |
| static time_t ext_shutdown = 0; |
| |
| extern int clusteracct_storage_p_register_ctld(void *db_conn, uint16_t port); |
| |
| static pthread_mutex_t ext_conns_mutex = PTHREAD_MUTEX_INITIALIZER; |
| |
| static pthread_cond_t ext_thread_cond = PTHREAD_COND_INITIALIZER; |
| static pthread_mutex_t ext_thread_mutex = PTHREAD_MUTEX_INITIALIZER; |
| |
| static void _destroy_external_host_conns(void *object) |
| { |
| persist_conn_t *conn = object; |
| /* |
| * Don't call dbd_conn_close() to prevent DBD_FINI being sent to |
| * external DBDs. |
| */ |
| slurm_persist_conn_destroy(conn); |
| } |
| |
| /* don't connect now as it will block the ctld */ |
| extern persist_conn_t *_create_slurmdbd_conn(char *host, int port) |
| { |
| uint16_t persist_conn_flags = PERSIST_FLAG_EXT_DBD; |
| persist_conn_t *dbd_conn = |
| dbd_conn_open(&persist_conn_flags, NULL, host, port); |
| |
| dbd_conn->shutdown = &ext_shutdown; |
| |
| if ((clusteracct_storage_p_register_ctld(dbd_conn, |
| slurm_conf.slurmctld_port) == |
| ESLURM_ACCESS_DENIED)) { |
| error("Not allowed to register to external cluster, not going to try again."); |
| dbd_conn_close(&dbd_conn); |
| dbd_conn = NULL; |
| } |
| |
| return dbd_conn; |
| } |
| |
| static int _find_ext_conn(void *x, void *key) |
| { |
| persist_conn_t *selected_conn = x; |
| persist_conn_t *query_conn = key; |
| |
| if (!xstrcmp(selected_conn->rem_host, query_conn->rem_host) && |
| (selected_conn->rem_port == query_conn->rem_port)) |
| return 1; |
| |
| return 0; |
| } |
| |
| static void _create_ext_conns(void) |
| { |
| char *ext_hosts; |
| char *tok = NULL, *save_ptr = NULL; |
| list_t *new_list = list_create(_destroy_external_host_conns); |
| |
| if ((ext_hosts = xstrdup(slurm_conf.accounting_storage_ext_host))) |
| tok = strtok_r(ext_hosts, ",", &save_ptr); |
| while (ext_hosts && tok) { |
| persist_conn_t *dbd_conn, tmp_conn = {0}; |
| char *colon = xstrstr(tok, ":"); |
| int port = slurm_conf.accounting_storage_port; |
| if (colon) { |
| *(colon++) = '\0'; |
| port = strtol(colon, NULL, 10); |
| } |
| |
| tmp_conn.rem_host = tok; |
| tmp_conn.rem_port = port; |
| |
| /* |
| * Transfer existing connections to new list so that existing |
| * connections are preserved and old can be removed. |
| */ |
| if (!ext_conns_list || |
| !(dbd_conn = list_remove_first(ext_conns_list, |
| _find_ext_conn, |
| &tmp_conn))) |
| dbd_conn = _create_slurmdbd_conn(tok, port); |
| |
| if (dbd_conn) |
| list_append(new_list, dbd_conn); |
| |
| tok = strtok_r(NULL, ",", &save_ptr); |
| } |
| xfree(ext_hosts); |
| |
| /* Remove old connections we don't service now by freeing the list */ |
| FREE_NULL_LIST(ext_conns_list); |
| if (list_count(new_list)) |
| ext_conns_list = new_list; |
| else |
| FREE_NULL_LIST(new_list); |
| } |
| |
| static int _for_each_check_ext_conn(void *x, void *arg) |
| { |
| bool delete = false; |
| persist_conn_t *dbd_conn = x; |
| |
| if (slurm_persist_conn_writeable(dbd_conn) == -1) { |
| int rc; |
| slurm_persist_conn_reopen(dbd_conn); |
| |
| /* slurm_persist_send_msg will reconnect */ |
| rc = clusteracct_storage_p_register_ctld( |
| dbd_conn, slurm_conf.slurmctld_port); |
| if (rc == ESLURM_ACCESS_DENIED) { |
| error("Not allowed to register to external cluster, not going to try again."); |
| delete = true; |
| } |
| } |
| |
| return delete; |
| } |
| |
| static void _check_ext_conns() |
| { |
| slurm_mutex_lock(&ext_conns_mutex); |
| if (!ext_conns_list) { |
| slurm_mutex_unlock(&ext_conns_mutex); |
| return; |
| } |
| |
| /* Use list_delete_all() to be able to delete within the lock */ |
| list_delete_all(ext_conns_list, _for_each_check_ext_conn, NULL); |
| slurm_mutex_unlock(&ext_conns_mutex); |
| } |
| |
| static void *_ext_thread(void *x) |
| { |
| struct timespec ts = {0, 0}; |
| |
| #if HAVE_SYS_PRCTL_H |
| if (prctl(PR_SET_NAME, "ext_dbd", NULL, NULL, NULL) < 0) { |
| error("%s: cannot set my name to %s %m", __func__, "ext_dbd"); |
| } |
| #endif |
| |
| while (!ext_shutdown) { |
| _check_ext_conns(); |
| |
| ts.tv_sec = time(NULL) + 5; |
| slurm_mutex_lock(&ext_thread_mutex); |
| if (!ext_shutdown) |
| slurm_cond_timedwait(&ext_thread_cond, |
| &ext_thread_mutex, &ts); |
| slurm_mutex_unlock(&ext_thread_mutex); |
| } |
| |
| return NULL; |
| } |
| |
| static void _create_ext_thread(void) |
| { |
| ext_shutdown = 0; |
| |
| slurm_mutex_lock(&ext_thread_mutex); |
| slurm_thread_create(&ext_thread_tid, _ext_thread, NULL); |
| slurm_mutex_unlock(&ext_thread_mutex); |
| } |
| |
| static void _destroy_ext_thread(void) |
| { |
| ext_shutdown = time(NULL); |
| |
| slurm_mutex_lock(&ext_thread_mutex); |
| slurm_cond_broadcast(&ext_thread_cond); |
| slurm_mutex_unlock(&ext_thread_mutex); |
| |
| slurm_thread_join(ext_thread_tid); |
| } |
| |
| extern void ext_dbd_init(void) |
| { |
| if (!running_in_slurmctld()) |
| return; |
| |
| slurm_mutex_lock(&ext_conns_mutex); |
| _create_ext_conns(); |
| if (ext_conns_list) |
| _create_ext_thread(); |
| slurm_mutex_unlock(&ext_conns_mutex); |
| } |
| |
| extern void ext_dbd_fini(void) |
| { |
| if (!running_in_slurmctld()) |
| return; |
| |
| _destroy_ext_thread(); |
| |
| slurm_mutex_lock(&ext_conns_mutex); |
| FREE_NULL_LIST(ext_conns_list); |
| slurm_mutex_unlock(&ext_conns_mutex); |
| } |
| |
| extern void ext_dbd_reconfig(void) |
| { |
| bool create = false, destroy = false; |
| |
| if (!running_in_slurmctld()) |
| return; |
| |
| slurm_mutex_lock(&ext_conns_mutex); |
| _create_ext_conns(); |
| if (ext_thread_tid && !ext_conns_list) |
| destroy = true; |
| else if (!ext_thread_tid && ext_conns_list) |
| create = true; |
| slurm_mutex_unlock(&ext_conns_mutex); |
| |
| if (destroy) |
| _destroy_ext_thread(); |
| else if (create) |
| _create_ext_thread(); |
| } |