/* ctdb control tool Copyright (C) Andrew Tridgell 2007 This program is free software; you can redistribute it and/or modify it under the terms of the GNU General Public License as published by the Free Software Foundation; either version 2 of the License, or (at your option) any later version. This program is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details. You should have received a copy of the GNU General Public License along with this program; if not, write to the Free Software Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA. */ #include "includes.h" #include "lib/events/events.h" #include "system/filesys.h" #include "system/network.h" #include "popt.h" #include "cmdline.h" #include "../include/ctdb.h" #include "../include/ctdb_private.h" static void usage(void); static struct { int timelimit; uint32_t vnn; int machinereadable; } options; #define TIMELIMIT() timeval_current_ofs(options.timelimit, 0) /* see if a process exists */ static int control_process_exists(struct ctdb_context *ctdb, int argc, const char **argv) { uint32_t vnn, pid; int ret; if (argc < 1) { usage(); } if (sscanf(argv[0], "%u:%u", &vnn, &pid) != 2) { printf("Badly formed vnn:pid\n"); return -1; } ret = ctdb_ctrl_process_exists(ctdb, vnn, pid); if (ret == 0) { printf("%u:%u exists\n", vnn, pid); } else { printf("%u:%u does not exist\n", vnn, pid); } return ret; } /* display statistics structure */ static void show_statistics(struct ctdb_statistics *s) { TALLOC_CTX *tmp_ctx = talloc_new(NULL); int i; const char *prefix=NULL; int preflen=0; const struct { const char *name; uint32_t offset; } fields[] = { #define STATISTICS_FIELD(n) { #n, offsetof(struct ctdb_statistics, n) } STATISTICS_FIELD(num_clients), STATISTICS_FIELD(frozen), STATISTICS_FIELD(recovering), STATISTICS_FIELD(client_packets_sent), STATISTICS_FIELD(client_packets_recv), STATISTICS_FIELD(node_packets_sent), STATISTICS_FIELD(node_packets_recv), STATISTICS_FIELD(keepalive_packets_sent), STATISTICS_FIELD(keepalive_packets_recv), STATISTICS_FIELD(node.req_call), STATISTICS_FIELD(node.reply_call), STATISTICS_FIELD(node.req_dmaster), STATISTICS_FIELD(node.reply_dmaster), STATISTICS_FIELD(node.reply_error), STATISTICS_FIELD(node.req_message), STATISTICS_FIELD(node.req_control), STATISTICS_FIELD(node.reply_control), STATISTICS_FIELD(client.req_call), STATISTICS_FIELD(client.req_message), STATISTICS_FIELD(client.req_control), STATISTICS_FIELD(timeouts.call), STATISTICS_FIELD(timeouts.control), STATISTICS_FIELD(timeouts.traverse), STATISTICS_FIELD(total_calls), STATISTICS_FIELD(pending_calls), STATISTICS_FIELD(lockwait_calls), STATISTICS_FIELD(pending_lockwait_calls), STATISTICS_FIELD(memory_used), STATISTICS_FIELD(max_hop_count), }; printf("CTDB version %u\n", CTDB_VERSION); for (i=0;imax_call_latency); printf(" %-30s %.6f sec\n", "max_lockwait_latency", s->max_lockwait_latency); talloc_free(tmp_ctx); } /* display remote ctdb statistics combined from all nodes */ static int control_statistics_all(struct ctdb_context *ctdb) { int ret, i; struct ctdb_statistics statistics; uint32_t *nodes; uint32_t num_nodes; nodes = ctdb_get_connected_nodes(ctdb, TIMELIMIT(), ctdb, &num_nodes); CTDB_NO_MEMORY(ctdb, nodes); ZERO_STRUCT(statistics); for (i=0;inum;i++){ printf(":%d:%s:%d:%d:%d:\n", nodemap->nodes[i].vnn, inet_ntoa(nodemap->nodes[i].sin.sin_addr), !!(nodemap->nodes[i].flags&NODE_FLAGS_DISCONNECTED), !!(nodemap->nodes[i].flags&NODE_FLAGS_UNHEALTHY), !!(nodemap->nodes[i].flags&NODE_FLAGS_PERMANENTLY_DISABLED)); } return 0; } printf("Number of nodes:%d\n", nodemap->num); for(i=0;inum;i++){ static const struct { uint32_t flag; const char *name; } flag_names[] = { { NODE_FLAGS_DISCONNECTED, "DISCONNECTED" }, { NODE_FLAGS_PERMANENTLY_DISABLED, "DISABLED" }, { NODE_FLAGS_BANNED, "BANNED" }, { NODE_FLAGS_UNHEALTHY, "UNHEALTHY" }, }; char *flags_str = NULL; int j; for (j=0;jnodes[i].flags & flag_names[j].flag) { if (flags_str == NULL) { flags_str = talloc_strdup(ctdb, flag_names[j].name); } else { flags_str = talloc_asprintf_append(flags_str, "|%s", flag_names[j].name); } CTDB_NO_MEMORY_FATAL(ctdb, flags_str); } } if (flags_str == NULL) { flags_str = talloc_strdup(ctdb, "OK"); CTDB_NO_MEMORY_FATAL(ctdb, flags_str); } printf("vnn:%d %-16s %s%s\n", nodemap->nodes[i].vnn, inet_ntoa(nodemap->nodes[i].sin.sin_addr), flags_str, nodemap->nodes[i].vnn == myvnn?" (THIS NODE)":""); talloc_free(flags_str); } ret = ctdb_ctrl_getvnnmap(ctdb, TIMELIMIT(), options.vnn, ctdb, &vnnmap); if (ret != 0) { printf("Unable to get vnnmap from node %u\n", options.vnn); return ret; } printf("Generation:%d\n",vnnmap->generation); printf("Size:%d\n",vnnmap->size); for(i=0;isize;i++){ printf("hash:%d lmaster:%d\n", i, vnnmap->map[i]); } ret = ctdb_ctrl_getrecmode(ctdb, TIMELIMIT(), options.vnn, &recmode); if (ret != 0) { printf("Unable to get recmode from node %u\n", options.vnn); return ret; } printf("Recovery mode:%s (%d)\n",recmode==CTDB_RECOVERY_NORMAL?"NORMAL":"RECOVERY",recmode); ret = ctdb_ctrl_getrecmaster(ctdb, TIMELIMIT(), options.vnn, &recmaster); if (ret != 0) { printf("Unable to get recmaster from node %u\n", options.vnn); return ret; } printf("Recovery master:%d\n",recmaster); return 0; } /* kill a tcp connection */ static int kill_tcp(struct ctdb_context *ctdb, int argc, const char **argv) { int i, ret; struct sockaddr_in src, dst; if (argc < 2) { usage(); } if (!parse_ip_port(argv[0], &src)) { printf("Bad IP:port '%s'\n", argv[1]); return -1; } if (!parse_ip_port(argv[1], &dst)) { printf("Bad IP:port '%s'\n", argv[1]); return -1; } for (i=0;i<5;i++) { ret = ctdb_sys_kill_tcp(ctdb->ev, &src, &dst); printf("ret:%d\n", ret); if (ret==0) { return 0; } } return -1; } /* send a tcp tickle ack */ static int tickle_tcp(struct ctdb_context *ctdb, int argc, const char **argv) { int ret; struct sockaddr_in src, dst; if (argc < 2) { usage(); } if (!parse_ip_port(argv[0], &src)) { printf("Bad IP:port '%s'\n", argv[1]); return -1; } if (!parse_ip_port(argv[1], &dst)) { printf("Bad IP:port '%s'\n", argv[1]); return -1; } ret = ctdb_sys_send_tcp(&src, &dst, 0, 0, 0); if (ret==0) { return 0; } printf("Error while sending tickle ack\n"); return -1; } /* display public ip status */ static int control_ip(struct ctdb_context *ctdb, int argc, const char **argv) { int i, ret; struct ctdb_all_public_ips *ips; uint32_t myvnn; myvnn = ctdb_ctrl_getvnn(ctdb, TIMELIMIT(), options.vnn); ret = ctdb_ctrl_get_public_ips(ctdb, TIMELIMIT(), options.vnn, ctdb, &ips); if (ret != 0) { printf("Unable to get public ips from node %u\n", options.vnn); return ret; } if(options.machinereadable){ printf(":Public IP:Node:\n"); for(i=0;inum;i++){ printf(":%s:%d:\n", inet_ntoa(ips->ips[i].sin.sin_addr), ips->ips[i].takeover_vnn); } return 0; } printf("Number of nodes:%d\n", ips->num); for(i=0;inum;i++){ printf("%-16s %d\n", inet_ntoa(ips->ips[i].sin.sin_addr), ips->ips[i].takeover_vnn); } return 0; } /* display pid of a ctdb daemon */ static int control_getpid(struct ctdb_context *ctdb, int argc, const char **argv) { uint32_t pid; int ret; ret = ctdb_ctrl_getpid(ctdb, TIMELIMIT(), options.vnn, &pid); if (ret != 0) { printf("Unable to get daemon pid from node %u\n", options.vnn); return ret; } printf("Pid:%d\n", pid); return 0; } /* disable a remote node */ static int control_disable(struct ctdb_context *ctdb, int argc, const char **argv) { int ret; ret = ctdb_ctrl_modflags(ctdb, TIMELIMIT(), options.vnn, NODE_FLAGS_PERMANENTLY_DISABLED, 0); if (ret != 0) { printf("Unable to disable node %u\n", options.vnn); return ret; } return 0; } /* enable a disabled remote node */ static int control_enable(struct ctdb_context *ctdb, int argc, const char **argv) { int ret; ret = ctdb_ctrl_modflags(ctdb, TIMELIMIT(), options.vnn, 0, NODE_FLAGS_PERMANENTLY_DISABLED); if (ret != 0) { printf("Unable to enable node %u\n", options.vnn); return ret; } return 0; } /* ban a node from the cluster */ static int control_ban(struct ctdb_context *ctdb, int argc, const char **argv) { int ret; uint32_t recmaster; struct ctdb_ban_info b; TDB_DATA data; uint32_t ban_time; if (argc < 1) { usage(); } ban_time = strtoul(argv[0], NULL, 0); ret = ctdb_ctrl_getrecmaster(ctdb, TIMELIMIT(), options.vnn, &recmaster); if (ret != 0) { DEBUG(0,("Failed to find the recmaster\n")); return -1; } b.vnn = options.vnn; b.ban_time = ban_time; data.dptr = (uint8_t *)&b; data.dsize = sizeof(b); ret = ctdb_send_message(ctdb, recmaster, CTDB_SRVID_BAN_NODE, data); if (ret != 0) { DEBUG(0,("Failed to tell the recmaster to ban node %u\n", options.vnn)); return -1; } return 0; } /* unban a node from the cluster */ static int control_unban(struct ctdb_context *ctdb, int argc, const char **argv) { int ret; uint32_t recmaster; TDB_DATA data; ret = ctdb_ctrl_getrecmaster(ctdb, TIMELIMIT(), options.vnn, &recmaster); if (ret != 0) { DEBUG(0,("Failed to find the recmaster\n")); return -1; } data.dptr = (uint8_t *)&options.vnn; data.dsize = sizeof(uint32_t); ret = ctdb_send_message(ctdb, recmaster, CTDB_SRVID_UNBAN_NODE, data); if (ret != 0) { DEBUG(0,("Failed to tell the recmaster to unban node %u\n", options.vnn)); return -1; } return 0; } /* shutdown a daemon */ static int control_shutdown(struct ctdb_context *ctdb, int argc, const char **argv) { int ret; ret = ctdb_ctrl_shutdown(ctdb, TIMELIMIT(), options.vnn); if (ret != 0) { printf("Unable to shutdown node %u\n", options.vnn); return ret; } return 0; } /* trigger a recovery */ static int control_recover(struct ctdb_context *ctdb, int argc, const char **argv) { int ret; ret = ctdb_ctrl_freeze(ctdb, TIMELIMIT(), options.vnn); if (ret != 0) { printf("Unable to freeze node\n"); return ret; } ret = ctdb_ctrl_setrecmode(ctdb, TIMELIMIT(), options.vnn, CTDB_RECOVERY_ACTIVE); if (ret != 0) { printf("Unable to set recovery mode\n"); return ret; } return 0; } /* display monitoring mode of a remote node */ static int control_getmonmode(struct ctdb_context *ctdb, int argc, const char **argv) { uint32_t monmode; int ret; ret = ctdb_ctrl_getmonmode(ctdb, TIMELIMIT(), options.vnn, &monmode); if (ret != 0) { printf("Unable to get monmode from node %u\n", options.vnn); return ret; } printf("Monitoring mode:%s (%d)\n",monmode==CTDB_MONITORING_ACTIVE?"ACTIVE":"DISABLED",monmode); return 0; } /* set the monitoring mode of a remote node */ static int control_setmonmode(struct ctdb_context *ctdb, int argc, const char **argv) { uint32_t monmode; int ret; if (argc < 1) { usage(); } monmode = strtoul(argv[0], NULL, 0); ret = ctdb_ctrl_setmonmode(ctdb, TIMELIMIT(), options.vnn, monmode); if (ret != 0) { printf("Unable to set monmode on node %u\n", options.vnn); return ret; } return 0; } /* display remote list of keys/data for a db */ static int control_catdb(struct ctdb_context *ctdb, int argc, const char **argv) { const char *db_name; struct ctdb_db_context *ctdb_db; int ret; if (argc < 1) { usage(); } db_name = argv[0]; ctdb_db = ctdb_attach(ctdb, db_name); if (ctdb_db == NULL) { DEBUG(0,("Unable to attach to database '%s'\n", db_name)); return -1; } /* traverse and dump the cluster tdb */ ret = ctdb_dump_db(ctdb_db, stdout); if (ret == -1) { printf("Unable to dump database\n"); return -1; } talloc_free(ctdb_db); printf("Dumped %d records\n", ret); return 0; } /* display a list of the databases on a remote ctdb */ static int control_getdbmap(struct ctdb_context *ctdb, int argc, const char **argv) { int i, ret; struct ctdb_dbid_map *dbmap=NULL; ret = ctdb_ctrl_getdbmap(ctdb, TIMELIMIT(), options.vnn, ctdb, &dbmap); if (ret != 0) { printf("Unable to get dbids from node %u\n", options.vnn); return ret; } printf("Number of databases:%d\n", dbmap->num); for(i=0;inum;i++){ const char *path; const char *name; ctdb_ctrl_getdbpath(ctdb, TIMELIMIT(), options.vnn, dbmap->dbids[i], ctdb, &path); ctdb_ctrl_getdbname(ctdb, TIMELIMIT(), options.vnn, dbmap->dbids[i], ctdb, &name); printf("dbid:0x%08x name:%s path:%s\n", dbmap->dbids[i], name, path); } return 0; } /* ping a node */ static int control_ping(struct ctdb_context *ctdb, int argc, const char **argv) { int ret; struct timeval tv = timeval_current(); ret = ctdb_ctrl_ping(ctdb, options.vnn); if (ret == -1) { printf("Unable to get ping response from node %u\n", options.vnn); } else { printf("response from %u time=%.6f sec (%d clients)\n", options.vnn, timeval_elapsed(&tv), ret); } return 0; } /* get a tunable */ static int control_getvar(struct ctdb_context *ctdb, int argc, const char **argv) { const char *name; uint32_t value; int ret; if (argc < 1) { usage(); } name = argv[0]; ret = ctdb_ctrl_get_tunable(ctdb, TIMELIMIT(), options.vnn, name, &value); if (ret == -1) { printf("Unable to get tunable variable '%s'\n", name); return -1; } printf("%-19s = %u\n", name, value); return 0; } /* set a tunable */ static int control_setvar(struct ctdb_context *ctdb, int argc, const char **argv) { const char *name; uint32_t value; int ret; if (argc < 2) { usage(); } name = argv[0]; value = strtoul(argv[1], NULL, 0); ret = ctdb_ctrl_set_tunable(ctdb, TIMELIMIT(), options.vnn, name, value); if (ret == -1) { printf("Unable to set tunable variable '%s'\n", name); return -1; } return 0; } /* list all tunables */ static int control_listvars(struct ctdb_context *ctdb, int argc, const char **argv) { uint32_t count; const char **list; int ret, i; ret = ctdb_ctrl_list_tunables(ctdb, TIMELIMIT(), options.vnn, ctdb, &list, &count); if (ret == -1) { printf("Unable to list tunable variables\n"); return -1; } for (i=0;i"}, { "setvar", control_setvar, true, "set a tunable variable", " "}, { "listvars", control_listvars, true, "list tunable variables"}, { "statistics", control_statistics, false, "show statistics" }, { "statisticsreset", control_statistics_reset, true, "reset statistics"}, { "ip", control_ip, true, "show which public ip's that ctdb manages" }, { "process-exists", control_process_exists, true, "check if a process exists on a node", ""}, { "getdbmap", control_getdbmap, true, "show the database map" }, { "catdb", control_catdb, true, "dump a database" , ""}, { "getmonmode", control_getmonmode, true, "show monitoring mode" }, { "setmonmode", control_setmonmode, true, "set monitoring mode", "<0|1>" }, { "setdebug", control_setdebug, true, "set debug level", "" }, { "getdebug", control_getdebug, true, "get debug level" }, { "attach", control_attach, true, "attach to a database", "" }, { "dumpmemory", control_dumpmemory, true, "dump memory map to logs" }, { "getpid", control_getpid, true, "get ctdbd process ID" }, { "disable", control_disable, true, "disable a nodes public IP" }, { "enable", control_enable, true, "enable a nodes public IP" }, { "ban", control_ban, true, "ban a node from the cluster", ""}, { "unban", control_unban, true, "unban a node from the cluster" }, { "shutdown", control_shutdown, true, "shutdown ctdbd" }, { "recover", control_recover, true, "force recovery" }, { "freeze", control_freeze, true, "freeze all databases" }, { "thaw", control_thaw, true, "thaw all databases" }, { "killtcp", kill_tcp, false, "kill a tcp connection", " " }, { "tickle", tickle_tcp, false, "send a tcp tickle ack", " " }, }; /* show usage message */ static void usage(void) { int i; printf( "Usage: ctdb [options] \n" \ "Options:\n" \ " -n choose node number, or 'all' (defaults to local node)\n" " -Y generate machinereadable output\n" " -t set timelimit for control in seconds (default %u)\n", options.timelimit); printf("Controls:\n"); for (i=0;i