/* ctdb_control protocol code Copyright (C) Andrew Tridgell 2007 This program is free software; you can redistribute it and/or modify it under the terms of the GNU General Public License as published by the Free Software Foundation; either version 3 of the License, or (at your option) any later version. This program is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details. You should have received a copy of the GNU General Public License along with this program; if not, see . */ #include "includes.h" #include "lib/events/events.h" #include "lib/tdb/include/tdb.h" #include "system/network.h" #include "system/filesys.h" #include "system/wait.h" #include "../include/ctdb_private.h" #include "lib/util/dlinklist.h" #include "db_wrap.h" struct ctdb_control_state { struct ctdb_context *ctdb; uint32_t reqid; ctdb_control_callback_fn_t callback; void *private_data; unsigned flags; }; /* dump talloc memory hierarchy, returning it as a blob to the client */ int32_t ctdb_dump_memory(struct ctdb_context *ctdb, TDB_DATA *outdata) { /* dump to a file, then send the file as a blob */ FILE *f; long fsize; f = tmpfile(); if (f == NULL) { DEBUG(DEBUG_ERR,(__location__ " Unable to open tmpfile - %s\n", strerror(errno))); return -1; } talloc_report_full(NULL, f); fsize = ftell(f); rewind(f); outdata->dptr = talloc_size(outdata, fsize); CTDB_NO_MEMORY(ctdb, outdata->dptr); outdata->dsize = fread(outdata->dptr, 1, fsize, f); fclose(f); if (outdata->dsize != fsize) { DEBUG(DEBUG_ERR,(__location__ " Unable to read tmpfile\n")); return -1; } return 0; } /* process a control request */ static int32_t ctdb_control_dispatch(struct ctdb_context *ctdb, struct ctdb_req_control *c, TDB_DATA indata, TDB_DATA *outdata, uint32_t srcnode, const char **errormsg, bool *async_reply) { uint32_t opcode = c->opcode; uint64_t srvid = c->srvid; uint32_t client_id = c->client_id; switch (opcode) { case CTDB_CONTROL_PROCESS_EXISTS: { CHECK_CONTROL_DATA_SIZE(sizeof(pid_t)); return kill(*(pid_t *)indata.dptr, 0); } case CTDB_CONTROL_SET_DEBUG: { CHECK_CONTROL_DATA_SIZE(sizeof(int32_t)); LogLevel = *(int32_t *)indata.dptr; return 0; } case CTDB_CONTROL_GET_DEBUG: { CHECK_CONTROL_DATA_SIZE(0); outdata->dptr = (uint8_t *)&LogLevel; outdata->dsize = sizeof(LogLevel); return 0; } case CTDB_CONTROL_STATISTICS: { CHECK_CONTROL_DATA_SIZE(0); ctdb->statistics.memory_used = talloc_total_size(NULL); ctdb->statistics.frozen = (ctdb->freeze_mode == CTDB_FREEZE_FROZEN); ctdb->statistics.recovering = (ctdb->recovery_mode == CTDB_RECOVERY_ACTIVE); outdata->dptr = (uint8_t *)&ctdb->statistics; outdata->dsize = sizeof(ctdb->statistics); return 0; } case CTDB_CONTROL_GET_ALL_TUNABLES: { CHECK_CONTROL_DATA_SIZE(0); outdata->dptr = (uint8_t *)&ctdb->tunable; outdata->dsize = sizeof(ctdb->tunable); return 0; } case CTDB_CONTROL_DUMP_MEMORY: { CHECK_CONTROL_DATA_SIZE(0); return ctdb_dump_memory(ctdb, outdata); } case CTDB_CONTROL_STATISTICS_RESET: { CHECK_CONTROL_DATA_SIZE(0); ZERO_STRUCT(ctdb->statistics); return 0; } case CTDB_CONTROL_GETVNNMAP: return ctdb_control_getvnnmap(ctdb, opcode, indata, outdata); case CTDB_CONTROL_GET_DBMAP: return ctdb_control_getdbmap(ctdb, opcode, indata, outdata); case CTDB_CONTROL_GET_NODEMAP: return ctdb_control_getnodemap(ctdb, opcode, indata, outdata); case CTDB_CONTROL_RELOAD_NODES_FILE: CHECK_CONTROL_DATA_SIZE(0); return ctdb_control_reload_nodes_file(ctdb, opcode); case CTDB_CONTROL_SETVNNMAP: return ctdb_control_setvnnmap(ctdb, opcode, indata, outdata); case CTDB_CONTROL_PULL_DB: CHECK_CONTROL_DATA_SIZE(sizeof(struct ctdb_control_pulldb)); return ctdb_control_pull_db(ctdb, indata, outdata); case CTDB_CONTROL_SET_DMASTER: CHECK_CONTROL_DATA_SIZE(sizeof(struct ctdb_control_set_dmaster)); return ctdb_control_set_dmaster(ctdb, indata); case CTDB_CONTROL_PUSH_DB: return ctdb_control_push_db(ctdb, indata); case CTDB_CONTROL_GET_RECMODE: { return ctdb->recovery_mode; } case CTDB_CONTROL_SET_RECMASTER: { CHECK_CONTROL_DATA_SIZE(sizeof(uint32_t)); if (ctdb->freeze_mode != CTDB_FREEZE_FROZEN) { DEBUG(DEBUG_NOTICE,("Attempt to set recmaster when not frozen\n")); return -1; } ctdb->recovery_master = ((uint32_t *)(&indata.dptr[0]))[0]; return 0; } case CTDB_CONTROL_GET_RECMASTER: return ctdb->recovery_master; case CTDB_CONTROL_GET_PID: return getpid(); case CTDB_CONTROL_GET_PNN: return ctdb->pnn; case CTDB_CONTROL_PING: CHECK_CONTROL_DATA_SIZE(0); return ctdb->statistics.num_clients; case CTDB_CONTROL_GET_DBNAME: { uint32_t db_id; struct ctdb_db_context *ctdb_db; CHECK_CONTROL_DATA_SIZE(sizeof(db_id)); db_id = *(uint32_t *)indata.dptr; ctdb_db = find_ctdb_db(ctdb, db_id); if (ctdb_db == NULL) return -1; outdata->dptr = discard_const(ctdb_db->db_name); outdata->dsize = strlen(ctdb_db->db_name)+1; return 0; } case CTDB_CONTROL_GETDBPATH: { uint32_t db_id; struct ctdb_db_context *ctdb_db; CHECK_CONTROL_DATA_SIZE(sizeof(db_id)); db_id = *(uint32_t *)indata.dptr; ctdb_db = find_ctdb_db(ctdb, db_id); if (ctdb_db == NULL) return -1; outdata->dptr = discard_const(ctdb_db->db_path); outdata->dsize = strlen(ctdb_db->db_path)+1; return 0; } case CTDB_CONTROL_DB_ATTACH: return ctdb_control_db_attach(ctdb, indata, outdata, false); case CTDB_CONTROL_DB_ATTACH_PERSISTENT: return ctdb_control_db_attach(ctdb, indata, outdata, true); case CTDB_CONTROL_SET_CALL: { struct ctdb_control_set_call *sc = (struct ctdb_control_set_call *)indata.dptr; CHECK_CONTROL_DATA_SIZE(sizeof(struct ctdb_control_set_call)); return ctdb_daemon_set_call(ctdb, sc->db_id, sc->fn, sc->id); } case CTDB_CONTROL_TRAVERSE_START: CHECK_CONTROL_DATA_SIZE(sizeof(struct ctdb_traverse_start)); return ctdb_control_traverse_start(ctdb, indata, outdata, srcnode); case CTDB_CONTROL_TRAVERSE_ALL: return ctdb_control_traverse_all(ctdb, indata, outdata); case CTDB_CONTROL_TRAVERSE_DATA: return ctdb_control_traverse_data(ctdb, indata, outdata); case CTDB_CONTROL_REGISTER_SRVID: return daemon_register_message_handler(ctdb, client_id, srvid); case CTDB_CONTROL_DEREGISTER_SRVID: return daemon_deregister_message_handler(ctdb, client_id, srvid); case CTDB_CONTROL_ENABLE_SEQNUM: CHECK_CONTROL_DATA_SIZE(sizeof(uint32_t)); return ctdb_ltdb_enable_seqnum(ctdb, *(uint32_t *)indata.dptr); case CTDB_CONTROL_UPDATE_SEQNUM: CHECK_CONTROL_DATA_SIZE(sizeof(uint32_t)); return ctdb_ltdb_update_seqnum(ctdb, *(uint32_t *)indata.dptr, srcnode); case CTDB_CONTROL_FREEZE: CHECK_CONTROL_DATA_SIZE(0); return ctdb_control_freeze(ctdb, c, async_reply); case CTDB_CONTROL_THAW: CHECK_CONTROL_DATA_SIZE(0); return ctdb_control_thaw(ctdb); case CTDB_CONTROL_SET_RECMODE: CHECK_CONTROL_DATA_SIZE(sizeof(uint32_t)); return ctdb_control_set_recmode(ctdb, c, indata, async_reply, errormsg); case CTDB_CONTROL_GET_MONMODE: CHECK_CONTROL_DATA_SIZE(0); return ctdb_monitoring_mode(ctdb); case CTDB_CONTROL_ENABLE_MONITOR: CHECK_CONTROL_DATA_SIZE(0); ctdb_enable_monitoring(ctdb); return 0; case CTDB_CONTROL_RUN_EVENTSCRIPTS: return ctdb_run_eventscripts(ctdb, c, indata, async_reply); case CTDB_CONTROL_DISABLE_MONITOR: CHECK_CONTROL_DATA_SIZE(0); ctdb_disable_monitoring(ctdb); return 0; case CTDB_CONTROL_SHUTDOWN: ctdb_stop_recoverd(ctdb); ctdb_stop_keepalive(ctdb); ctdb_stop_monitoring(ctdb); ctdb_release_all_ips(ctdb); ctdb->methods->shutdown(ctdb); ctdb_event_script(ctdb, "shutdown"); DEBUG(DEBUG_NOTICE,("Received SHUTDOWN command. Stopping CTDB daemon.\n")); exit(0); case CTDB_CONTROL_TAKEOVER_IP: CHECK_CONTROL_DATA_SIZE(sizeof(struct ctdb_public_ip)); return ctdb_control_takeover_ip(ctdb, c, indata, async_reply); case CTDB_CONTROL_RELEASE_IP: CHECK_CONTROL_DATA_SIZE(sizeof(struct ctdb_public_ip)); return ctdb_control_release_ip(ctdb, c, indata, async_reply); case CTDB_CONTROL_GET_PUBLIC_IPS: CHECK_CONTROL_DATA_SIZE(0); return ctdb_control_get_public_ips(ctdb, c, outdata); case CTDB_CONTROL_TCP_CLIENT: CHECK_CONTROL_DATA_SIZE(sizeof(struct ctdb_control_tcp)); return ctdb_control_tcp_client(ctdb, client_id, indata); case CTDB_CONTROL_STARTUP: CHECK_CONTROL_DATA_SIZE(0); return ctdb_control_startup(ctdb, srcnode); case CTDB_CONTROL_TCP_ADD: CHECK_CONTROL_DATA_SIZE(sizeof(struct ctdb_control_tcp_vnn)); return ctdb_control_tcp_add(ctdb, indata); case CTDB_CONTROL_SET_TUNABLE: return ctdb_control_set_tunable(ctdb, indata); case CTDB_CONTROL_GET_TUNABLE: return ctdb_control_get_tunable(ctdb, indata, outdata); case CTDB_CONTROL_LIST_TUNABLES: return ctdb_control_list_tunables(ctdb, outdata); case CTDB_CONTROL_MODIFY_FLAGS: CHECK_CONTROL_DATA_SIZE(sizeof(struct ctdb_node_modflags)); return ctdb_control_modflags(ctdb, indata); case CTDB_CONTROL_KILL_TCP: CHECK_CONTROL_DATA_SIZE(sizeof(struct ctdb_control_killtcp)); return ctdb_control_kill_tcp(ctdb, indata); case CTDB_CONTROL_GET_TCP_TICKLE_LIST: CHECK_CONTROL_DATA_SIZE(sizeof(struct sockaddr_in)); return ctdb_control_get_tcp_tickle_list(ctdb, indata, outdata); case CTDB_CONTROL_SET_TCP_TICKLE_LIST: /* data size is verified in the called function */ return ctdb_control_set_tcp_tickle_list(ctdb, indata); case CTDB_CONTROL_REGISTER_SERVER_ID: CHECK_CONTROL_DATA_SIZE(sizeof(struct ctdb_server_id)); return ctdb_control_register_server_id(ctdb, client_id, indata); case CTDB_CONTROL_UNREGISTER_SERVER_ID: CHECK_CONTROL_DATA_SIZE(sizeof(struct ctdb_server_id)); return ctdb_control_unregister_server_id(ctdb, indata); case CTDB_CONTROL_CHECK_SERVER_ID: CHECK_CONTROL_DATA_SIZE(sizeof(struct ctdb_server_id)); return ctdb_control_check_server_id(ctdb, indata); case CTDB_CONTROL_GET_SERVER_ID_LIST: CHECK_CONTROL_DATA_SIZE(0); return ctdb_control_get_server_id_list(ctdb, outdata); case CTDB_CONTROL_PERSISTENT_STORE: return ctdb_control_persistent_store(ctdb, c, indata, async_reply); case CTDB_CONTROL_UPDATE_RECORD: return ctdb_control_update_record(ctdb, c, indata, async_reply); case CTDB_CONTROL_SEND_GRATIOUS_ARP: return ctdb_control_send_gratious_arp(ctdb, indata); case CTDB_CONTROL_TRANSACTION_START: CHECK_CONTROL_DATA_SIZE(sizeof(uint32_t)); return ctdb_control_transaction_start(ctdb, *(uint32_t *)indata.dptr); case CTDB_CONTROL_TRANSACTION_COMMIT: CHECK_CONTROL_DATA_SIZE(sizeof(uint32_t)); return ctdb_control_transaction_commit(ctdb, *(uint32_t *)indata.dptr); case CTDB_CONTROL_WIPE_DATABASE: CHECK_CONTROL_DATA_SIZE(sizeof(struct ctdb_control_wipe_database)); return ctdb_control_wipe_database(ctdb, indata); case CTDB_CONTROL_UPTIME: return ctdb_control_uptime(ctdb, outdata); case CTDB_CONTROL_START_RECOVERY: return ctdb_control_start_recovery(ctdb, c, async_reply); case CTDB_CONTROL_END_RECOVERY: return ctdb_control_end_recovery(ctdb, c, async_reply); case CTDB_CONTROL_GET_RECLOCK_FILE: CHECK_CONTROL_DATA_SIZE(0); return ctdb_control_get_reclock_file(ctdb, outdata); case CTDB_CONTROL_TRY_DELETE_RECORDS: return ctdb_control_try_delete_records(ctdb, indata, outdata); case CTDB_CONTROL_ADD_PUBLIC_IP: return ctdb_control_add_public_address(ctdb, indata); case CTDB_CONTROL_DEL_PUBLIC_IP: return ctdb_control_del_public_address(ctdb, indata); default: DEBUG(DEBUG_CRIT,(__location__ " Unknown CTDB control opcode %u\n", opcode)); return -1; } } /* send a reply for a ctdb control */ void ctdb_request_control_reply(struct ctdb_context *ctdb, struct ctdb_req_control *c, TDB_DATA *outdata, int32_t status, const char *errormsg) { struct ctdb_reply_control *r; size_t len; /* some controls send no reply */ if (c->flags & CTDB_CTRL_FLAG_NOREPLY) { return; } len = offsetof(struct ctdb_reply_control, data) + (outdata?outdata->dsize:0); if (errormsg) { len += strlen(errormsg); } r = ctdb_transport_allocate(ctdb, ctdb, CTDB_REPLY_CONTROL, len, struct ctdb_reply_control); CTDB_NO_MEMORY_VOID(ctdb, r); r->hdr.destnode = c->hdr.srcnode; r->hdr.reqid = c->hdr.reqid; r->status = status; r->datalen = outdata?outdata->dsize:0; if (outdata && outdata->dsize) { memcpy(&r->data[0], outdata->dptr, outdata->dsize); } if (errormsg) { r->errorlen = strlen(errormsg); memcpy(&r->data[r->datalen], errormsg, r->errorlen); } ctdb_queue_packet(ctdb, &r->hdr); talloc_free(r); } /* called when a CTDB_REQ_CONTROL packet comes in */ void ctdb_request_control(struct ctdb_context *ctdb, struct ctdb_req_header *hdr) { struct ctdb_req_control *c = (struct ctdb_req_control *)hdr; TDB_DATA data, *outdata; int32_t status; bool async_reply = False; const char *errormsg = NULL; data.dptr = &c->data[0]; data.dsize = c->datalen; outdata = talloc_zero(c, TDB_DATA); status = ctdb_control_dispatch(ctdb, c, data, outdata, hdr->srcnode, &errormsg, &async_reply); if (!async_reply) { ctdb_request_control_reply(ctdb, c, outdata, status, errormsg); } } /* called when a CTDB_REPLY_CONTROL packet comes in */ void ctdb_reply_control(struct ctdb_context *ctdb, struct ctdb_req_header *hdr) { struct ctdb_reply_control *c = (struct ctdb_reply_control *)hdr; TDB_DATA data; struct ctdb_control_state *state; const char *errormsg = NULL; state = ctdb_reqid_find(ctdb, hdr->reqid, struct ctdb_control_state); if (state == NULL) { DEBUG(DEBUG_ERR,("pnn %u Invalid reqid %u in ctdb_reply_control\n", ctdb->pnn, hdr->reqid)); return; } if (hdr->reqid != state->reqid) { /* we found a record but it was the wrong one */ DEBUG(DEBUG_ERR, ("Dropped orphaned control reply with reqid:%u\n", hdr->reqid)); return; } data.dptr = &c->data[0]; data.dsize = c->datalen; if (c->errorlen) { errormsg = talloc_strndup(state, (char *)&c->data[c->datalen], c->errorlen); } /* make state a child of the packet, so it goes away when the packet is freed. */ talloc_steal(hdr, state); state->callback(ctdb, c->status, data, errormsg, state->private_data); } static int ctdb_control_destructor(struct ctdb_control_state *state) { ctdb_reqid_remove(state->ctdb, state->reqid); return 0; } /* handle a timeout of a control */ static void ctdb_control_timeout(struct event_context *ev, struct timed_event *te, struct timeval t, void *private_data) { struct ctdb_control_state *state = talloc_get_type(private_data, struct ctdb_control_state); TALLOC_CTX *tmp_ctx = talloc_new(ev); state->ctdb->statistics.timeouts.control++; talloc_steal(tmp_ctx, state); state->callback(state->ctdb, -1, tdb_null, "ctdb_control timed out", state->private_data); talloc_free(tmp_ctx); } /* send a control message to a node */ int ctdb_daemon_send_control(struct ctdb_context *ctdb, uint32_t destnode, uint64_t srvid, uint32_t opcode, uint32_t client_id, uint32_t flags, TDB_DATA data, ctdb_control_callback_fn_t callback, void *private_data) { struct ctdb_req_control *c; struct ctdb_control_state *state; size_t len; if (((destnode == CTDB_BROADCAST_VNNMAP) || (destnode == CTDB_BROADCAST_ALL) || (destnode == CTDB_BROADCAST_CONNECTED)) && !(flags & CTDB_CTRL_FLAG_NOREPLY)) { DEBUG(DEBUG_CRIT,("Attempt to broadcast control without NOREPLY\n")); return -1; } if (destnode != CTDB_BROADCAST_VNNMAP && destnode != CTDB_BROADCAST_ALL && destnode != CTDB_BROADCAST_CONNECTED && (!ctdb_validate_pnn(ctdb, destnode) || (ctdb->nodes[destnode]->flags & NODE_FLAGS_DISCONNECTED))) { if (!(flags & CTDB_CTRL_FLAG_NOREPLY)) { callback(ctdb, -1, tdb_null, "ctdb_control to disconnected node", private_data); } return 0; } /* the state is made a child of private_data if possible. This means any reply will be discarded if the private_data goes away */ state = talloc(private_data?private_data:ctdb, struct ctdb_control_state); CTDB_NO_MEMORY(ctdb, state); state->reqid = ctdb_reqid_new(ctdb, state); state->callback = callback; state->private_data = private_data; state->ctdb = ctdb; state->flags = flags; talloc_set_destructor(state, ctdb_control_destructor); len = offsetof(struct ctdb_req_control, data) + data.dsize; c = ctdb_transport_allocate(ctdb, state, CTDB_REQ_CONTROL, len, struct ctdb_req_control); CTDB_NO_MEMORY(ctdb, c); talloc_set_name_const(c, "ctdb_req_control packet"); c->hdr.destnode = destnode; c->hdr.reqid = state->reqid; c->opcode = opcode; c->client_id = client_id; c->flags = flags; c->srvid = srvid; c->datalen = data.dsize; if (data.dsize) { memcpy(&c->data[0], data.dptr, data.dsize); } ctdb_queue_packet(ctdb, &c->hdr); if (flags & CTDB_CTRL_FLAG_NOREPLY) { talloc_free(state); return 0; } if (ctdb->tunable.control_timeout) { event_add_timed(ctdb->ev, state, timeval_current_ofs(ctdb->tunable.control_timeout, 0), ctdb_control_timeout, state); } talloc_free(c); return 0; }