2 ctdb_control protocol code
4 Copyright (C) Andrew Tridgell 2007
6 This program is free software; you can redistribute it and/or modify
7 it under the terms of the GNU General Public License as published by
8 the Free Software Foundation; either version 3 of the License, or
9 (at your option) any later version.
11 This program is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 GNU General Public License for more details.
16 You should have received a copy of the GNU General Public License
17 along with this program; if not, see <http://www.gnu.org/licenses/>.
20 #include "lib/events/events.h"
21 #include "lib/tdb/include/tdb.h"
22 #include "system/network.h"
23 #include "system/filesys.h"
24 #include "system/wait.h"
25 #include "../include/ctdb_private.h"
26 #include "lib/util/dlinklist.h"
/*
 * Bookkeeping for one outstanding control request.
 * NOTE(review): only two members are visible in this extract; other code in
 * this file also uses state->reqid, state->flags and state->private_data.
 */
30 struct ctdb_control_state {
/* daemon context; the destructor hands it to ctdb_reqid_remove() */
31 struct ctdb_context *ctdb;
/* called with the reply's status, data and error text, or with -1 on timeout */
33 ctdb_control_callback_fn_t callback;
40 /* Dump the talloc memory hierarchy and return it to the client as a blob. */
/*
 * Write a full talloc report to a temporary file, then read the file back
 * into outdata so that it can be sent as the reply payload.
 *
 * ctdb    - daemon context, used by the CTDB_NO_MEMORY() check
 * outdata - receives the report; dptr is allocated as a talloc child of
 *           outdata and dsize is set to the number of bytes read
 *
 * NOTE(review): the declarations of f and fsize, the code that opens and
 * measures the file, and all return statements are not visible in this
 * extract.
 */
42 int32_t ctdb_dump_memory(struct ctdb_context *ctdb, TDB_DATA *outdata)
44 /* dump to a file, then send the file as a blob */
/* logged when the temporary file could not be opened; errno supplies the reason */
49 DEBUG(DEBUG_ERR,(__location__ " Unable to open tmpfile - %s\n", strerror(errno)));
/* report is requested for the NULL context and written to f */
52 talloc_report_full(NULL, f);
/* buffer of fsize bytes, owned by outdata */
55 outdata->dptr = talloc_size(outdata, fsize);
56 CTDB_NO_MEMORY(ctdb, outdata->dptr);
/* dsize records how many bytes fread() actually delivered */
57 outdata->dsize = fread(outdata->dptr, 1, fsize, f);
/* a short read is reported as an error */
59 if (outdata->dsize != fsize) {
60 DEBUG(DEBUG_ERR,(__location__ " Unable to read tmpfile\n"));
68 /* Process a control request. */
/*
 * Dispatch one control request to the code selected by c->opcode and return
 * the resulting int32_t status.  Reply payloads are handed back through
 * outdata; errormsg and async_reply are forwarded to the handlers that take
 * them.
 *
 * Most cases call CHECK_CONTROL_DATA_SIZE() with the expected payload size
 * before touching indata.  That macro and all ctdb_control_*() handlers are
 * defined outside this extract.
 *
 * NOTE(review): parts of the parameter list, the switch statement itself,
 * the default label and many return statements are not visible in this
 * extract, so do not infer fall-through from adjacent case labels here.
 */
70 static int32_t ctdb_control_dispatch(struct ctdb_context *ctdb,
71 struct ctdb_req_control *c,
73 TDB_DATA *outdata, uint32_t srcnode,
74 const char **errormsg,
/* copy the request fields that the cases below refer to */
77 uint32_t opcode = c->opcode;
78 uint64_t srvid = c->srvid;
79 uint32_t client_id = c->client_id;
82 case CTDB_CONTROL_PROCESS_EXISTS: {
83 CHECK_CONTROL_DATA_SIZE(sizeof(pid_t));
/* signal 0 sends nothing; kill()'s own result becomes the control status */
84 return kill(*(pid_t *)indata.dptr, 0);
87 case CTDB_CONTROL_SET_DEBUG: {
88 CHECK_CONTROL_DATA_SIZE(sizeof(int32_t));
89 LogLevel = *(int32_t *)indata.dptr;
93 case CTDB_CONTROL_GET_DEBUG: {
94 CHECK_CONTROL_DATA_SIZE(0);
/* the reply points directly at LogLevel; no copy is made here */
95 outdata->dptr = (uint8_t *)&LogLevel;
96 outdata->dsize = sizeof(LogLevel);
100 case CTDB_CONTROL_STATISTICS: {
101 CHECK_CONTROL_DATA_SIZE(0);
/* refresh the derived fields before exposing the statistics struct */
102 ctdb->statistics.memory_used = talloc_total_size(NULL);
103 ctdb->statistics.frozen = (ctdb->freeze_mode == CTDB_FREEZE_FROZEN);
104 ctdb->statistics.recovering = (ctdb->recovery_mode == CTDB_RECOVERY_ACTIVE);
105 outdata->dptr = (uint8_t *)&ctdb->statistics;
106 outdata->dsize = sizeof(ctdb->statistics);
110 case CTDB_CONTROL_GET_ALL_TUNABLES: {
111 CHECK_CONTROL_DATA_SIZE(0);
112 outdata->dptr = (uint8_t *)&ctdb->tunable;
113 outdata->dsize = sizeof(ctdb->tunable);
117 case CTDB_CONTROL_DUMP_MEMORY: {
118 CHECK_CONTROL_DATA_SIZE(0);
119 return ctdb_dump_memory(ctdb, outdata);
122 case CTDB_CONTROL_STATISTICS_RESET: {
123 CHECK_CONTROL_DATA_SIZE(0);
124 ZERO_STRUCT(ctdb->statistics);
128 case CTDB_CONTROL_GETVNNMAP:
129 return ctdb_control_getvnnmap(ctdb, opcode, indata, outdata);
131 case CTDB_CONTROL_GET_DBMAP:
132 return ctdb_control_getdbmap(ctdb, opcode, indata, outdata);
134 case CTDB_CONTROL_GET_NODEMAP:
135 return ctdb_control_getnodemap(ctdb, opcode, indata, outdata);
137 case CTDB_CONTROL_RELOAD_NODES_FILE:
138 CHECK_CONTROL_DATA_SIZE(0);
139 return ctdb_control_reload_nodes_file(ctdb, opcode);
141 case CTDB_CONTROL_SETVNNMAP:
142 return ctdb_control_setvnnmap(ctdb, opcode, indata, outdata);
144 case CTDB_CONTROL_PULL_DB:
145 CHECK_CONTROL_DATA_SIZE(sizeof(struct ctdb_control_pulldb));
146 return ctdb_control_pull_db(ctdb, indata, outdata);
148 case CTDB_CONTROL_SET_DMASTER:
149 CHECK_CONTROL_DATA_SIZE(sizeof(struct ctdb_control_set_dmaster));
150 return ctdb_control_set_dmaster(ctdb, indata);
152 case CTDB_CONTROL_PUSH_DB:
153 return ctdb_control_push_db(ctdb, indata);
155 case CTDB_CONTROL_GET_RECMODE: {
/* the current recovery mode is returned as the status value */
156 return ctdb->recovery_mode;
159 case CTDB_CONTROL_SET_RECMASTER: {
160 CHECK_CONTROL_DATA_SIZE(sizeof(uint32_t));
/* a request made while not frozen is logged; NOTE(review): what happens next is not visible here */
161 if (ctdb->freeze_mode != CTDB_FREEZE_FROZEN) {
162 DEBUG(DEBUG_NOTICE,("Attempt to set recmaster when not frozen\n"));
/* the new recovery master is the first uint32_t of the payload */
165 ctdb->recovery_master = ((uint32_t *)(&indata.dptr[0]))[0];
169 case CTDB_CONTROL_GET_RECMASTER:
170 return ctdb->recovery_master;
/*
 * NOTE(review): the embedded numbering skips lines after each of the next
 * two labels, so GET_PID and GET_PNN presumably have their own bodies that
 * are not visible here - confirm before reading this as fall-through.
 */
172 case CTDB_CONTROL_GET_PID:
175 case CTDB_CONTROL_GET_PNN:
178 case CTDB_CONTROL_PING:
179 CHECK_CONTROL_DATA_SIZE(0);
/* the status value is the current client count */
180 return ctdb->statistics.num_clients;
182 case CTDB_CONTROL_GET_DBNAME: {
184 struct ctdb_db_context *ctdb_db;
186 CHECK_CONTROL_DATA_SIZE(sizeof(db_id));
187 db_id = *(uint32_t *)indata.dptr;
188 ctdb_db = find_ctdb_db(ctdb, db_id);
189 if (ctdb_db == NULL) return -1;
/* reply references the database's own name string, NUL terminator included */
190 outdata->dptr = discard_const(ctdb_db->db_name);
191 outdata->dsize = strlen(ctdb_db->db_name)+1;
195 case CTDB_CONTROL_GETDBPATH: {
197 struct ctdb_db_context *ctdb_db;
199 CHECK_CONTROL_DATA_SIZE(sizeof(db_id));
200 db_id = *(uint32_t *)indata.dptr;
201 ctdb_db = find_ctdb_db(ctdb, db_id);
202 if (ctdb_db == NULL) return -1;
/* reply references the database's own path string, NUL terminator included */
203 outdata->dptr = discard_const(ctdb_db->db_path);
204 outdata->dsize = strlen(ctdb_db->db_path)+1;
/* the final argument distinguishes a normal attach (false) from a persistent one (true) */
208 case CTDB_CONTROL_DB_ATTACH:
209 return ctdb_control_db_attach(ctdb, indata, outdata, srvid, false);
211 case CTDB_CONTROL_DB_ATTACH_PERSISTENT:
212 return ctdb_control_db_attach(ctdb, indata, outdata, srvid, true);
214 case CTDB_CONTROL_SET_CALL: {
/* sc is only cast here; it is not dereferenced until after the size check */
215 struct ctdb_control_set_call *sc =
216 (struct ctdb_control_set_call *)indata.dptr;
217 CHECK_CONTROL_DATA_SIZE(sizeof(struct ctdb_control_set_call));
218 return ctdb_daemon_set_call(ctdb, sc->db_id, sc->fn, sc->id);
221 case CTDB_CONTROL_TRAVERSE_START:
222 CHECK_CONTROL_DATA_SIZE(sizeof(struct ctdb_traverse_start));
223 return ctdb_control_traverse_start(ctdb, indata, outdata, srcnode);
225 case CTDB_CONTROL_TRAVERSE_ALL:
226 return ctdb_control_traverse_all(ctdb, indata, outdata);
228 case CTDB_CONTROL_TRAVERSE_DATA:
229 return ctdb_control_traverse_data(ctdb, indata, outdata);
231 case CTDB_CONTROL_REGISTER_SRVID:
232 return daemon_register_message_handler(ctdb, client_id, srvid);
234 case CTDB_CONTROL_DEREGISTER_SRVID:
235 return daemon_deregister_message_handler(ctdb, client_id, srvid);
237 case CTDB_CONTROL_ENABLE_SEQNUM:
238 CHECK_CONTROL_DATA_SIZE(sizeof(uint32_t));
239 return ctdb_ltdb_enable_seqnum(ctdb, *(uint32_t *)indata.dptr);
241 case CTDB_CONTROL_UPDATE_SEQNUM:
242 CHECK_CONTROL_DATA_SIZE(sizeof(uint32_t));
243 return ctdb_ltdb_update_seqnum(ctdb, *(uint32_t *)indata.dptr, srcnode);
/* handlers that receive async_reply are given the chance to defer the reply themselves */
245 case CTDB_CONTROL_FREEZE:
246 CHECK_CONTROL_DATA_SIZE(0);
247 return ctdb_control_freeze(ctdb, c, async_reply);
249 case CTDB_CONTROL_THAW:
250 CHECK_CONTROL_DATA_SIZE(0);
251 return ctdb_control_thaw(ctdb);
253 case CTDB_CONTROL_SET_RECMODE:
254 CHECK_CONTROL_DATA_SIZE(sizeof(uint32_t));
255 return ctdb_control_set_recmode(ctdb, c, indata, async_reply, errormsg);
257 case CTDB_CONTROL_GET_MONMODE:
258 CHECK_CONTROL_DATA_SIZE(0);
259 return ctdb_monitoring_mode(ctdb);
261 case CTDB_CONTROL_ENABLE_MONITOR:
262 CHECK_CONTROL_DATA_SIZE(0);
263 ctdb_enable_monitoring(ctdb);
266 case CTDB_CONTROL_RUN_EVENTSCRIPTS:
267 return ctdb_run_eventscripts(ctdb, c, indata, async_reply);
269 case CTDB_CONTROL_DISABLE_MONITOR:
270 CHECK_CONTROL_DATA_SIZE(0);
271 ctdb_disable_monitoring(ctdb);
274 case CTDB_CONTROL_SHUTDOWN:
/*
 * Shutdown order as written: stop recoverd, keepalive and monitoring,
 * release all IPs, call methods->shutdown() when methods is set, then run
 * the "shutdown" event script and log.
 */
275 ctdb_stop_recoverd(ctdb);
276 ctdb_stop_keepalive(ctdb);
277 ctdb_stop_monitoring(ctdb);
278 ctdb_release_all_ips(ctdb);
279 if (ctdb->methods != NULL) {
280 ctdb->methods->shutdown(ctdb);
282 ctdb_event_script(ctdb, "shutdown");
283 DEBUG(DEBUG_NOTICE,("Received SHUTDOWN command. Stopping CTDB daemon.\n"));
286 case CTDB_CONTROL_TAKEOVER_IP:
287 CHECK_CONTROL_DATA_SIZE(sizeof(struct ctdb_public_ip));
288 return ctdb_control_takeover_ip(ctdb, c, indata, async_reply);
290 case CTDB_CONTROL_RELEASE_IP:
291 CHECK_CONTROL_DATA_SIZE(sizeof(struct ctdb_public_ip));
292 return ctdb_control_release_ip(ctdb, c, indata, async_reply);
294 case CTDB_CONTROL_GET_PUBLIC_IPS:
295 CHECK_CONTROL_DATA_SIZE(0);
296 return ctdb_control_get_public_ips(ctdb, c, outdata);
298 case CTDB_CONTROL_TCP_CLIENT:
299 CHECK_CONTROL_DATA_SIZE(sizeof(struct ctdb_control_tcp));
300 return ctdb_control_tcp_client(ctdb, client_id, indata);
302 case CTDB_CONTROL_STARTUP:
303 CHECK_CONTROL_DATA_SIZE(0);
304 return ctdb_control_startup(ctdb, srcnode);
306 case CTDB_CONTROL_TCP_ADD:
307 CHECK_CONTROL_DATA_SIZE(sizeof(struct ctdb_control_tcp_vnn));
308 return ctdb_control_tcp_add(ctdb, indata);
310 case CTDB_CONTROL_SET_TUNABLE:
311 return ctdb_control_set_tunable(ctdb, indata);
313 case CTDB_CONTROL_GET_TUNABLE:
314 return ctdb_control_get_tunable(ctdb, indata, outdata);
316 case CTDB_CONTROL_LIST_TUNABLES:
317 return ctdb_control_list_tunables(ctdb, outdata);
319 case CTDB_CONTROL_MODIFY_FLAGS:
320 CHECK_CONTROL_DATA_SIZE(sizeof(struct ctdb_node_modflags));
321 return ctdb_control_modflags(ctdb, indata);
323 case CTDB_CONTROL_KILL_TCP:
324 CHECK_CONTROL_DATA_SIZE(sizeof(struct ctdb_control_killtcp));
325 return ctdb_control_kill_tcp(ctdb, indata);
327 case CTDB_CONTROL_GET_TCP_TICKLE_LIST:
328 CHECK_CONTROL_DATA_SIZE(sizeof(struct sockaddr_in));
329 return ctdb_control_get_tcp_tickle_list(ctdb, indata, outdata);
331 case CTDB_CONTROL_SET_TCP_TICKLE_LIST:
332 /* data size is verified in the called function */
333 return ctdb_control_set_tcp_tickle_list(ctdb, indata);
335 case CTDB_CONTROL_REGISTER_SERVER_ID:
336 CHECK_CONTROL_DATA_SIZE(sizeof(struct ctdb_server_id));
337 return ctdb_control_register_server_id(ctdb, client_id, indata);
339 case CTDB_CONTROL_UNREGISTER_SERVER_ID:
340 CHECK_CONTROL_DATA_SIZE(sizeof(struct ctdb_server_id));
341 return ctdb_control_unregister_server_id(ctdb, indata);
343 case CTDB_CONTROL_CHECK_SERVER_ID:
344 CHECK_CONTROL_DATA_SIZE(sizeof(struct ctdb_server_id));
345 return ctdb_control_check_server_id(ctdb, indata);
347 case CTDB_CONTROL_GET_SERVER_ID_LIST:
348 CHECK_CONTROL_DATA_SIZE(0);
349 return ctdb_control_get_server_id_list(ctdb, outdata);
351 case CTDB_CONTROL_PERSISTENT_STORE:
352 return ctdb_control_persistent_store(ctdb, c, indata, async_reply);
354 case CTDB_CONTROL_UPDATE_RECORD:
355 return ctdb_control_update_record(ctdb, c, indata, async_reply);
357 case CTDB_CONTROL_SEND_GRATIOUS_ARP:
358 return ctdb_control_send_gratious_arp(ctdb, indata);
/* for the transaction controls the uint32_t payload is passed straight to the handler */
360 case CTDB_CONTROL_TRANSACTION_START:
361 CHECK_CONTROL_DATA_SIZE(sizeof(uint32_t));
362 return ctdb_control_transaction_start(ctdb, *(uint32_t *)indata.dptr);
364 case CTDB_CONTROL_TRANSACTION_COMMIT:
365 CHECK_CONTROL_DATA_SIZE(sizeof(uint32_t));
366 return ctdb_control_transaction_commit(ctdb, *(uint32_t *)indata.dptr);
368 case CTDB_CONTROL_WIPE_DATABASE:
369 CHECK_CONTROL_DATA_SIZE(sizeof(struct ctdb_control_wipe_database));
370 return ctdb_control_wipe_database(ctdb, indata);
372 case CTDB_CONTROL_UPTIME:
373 return ctdb_control_uptime(ctdb, outdata);
375 case CTDB_CONTROL_START_RECOVERY:
376 return ctdb_control_start_recovery(ctdb, c, async_reply);
378 case CTDB_CONTROL_END_RECOVERY:
379 return ctdb_control_end_recovery(ctdb, c, async_reply);
381 case CTDB_CONTROL_GET_RECLOCK_FILE:
382 CHECK_CONTROL_DATA_SIZE(0);
383 return ctdb_control_get_reclock_file(ctdb, outdata);
385 case CTDB_CONTROL_TRY_DELETE_RECORDS:
386 return ctdb_control_try_delete_records(ctdb, indata, outdata);
388 case CTDB_CONTROL_ADD_PUBLIC_IP:
389 return ctdb_control_add_public_address(ctdb, indata);
391 case CTDB_CONTROL_DEL_PUBLIC_IP:
392 return ctdb_control_del_public_address(ctdb, indata);
394 case CTDB_CONTROL_GET_CAPABILITIES:
395 return ctdb_control_get_capabilities(ctdb, outdata);
397 case CTDB_CONTROL_START_PERSISTENT_UPDATE:
398 return ctdb_control_start_persistent_update(ctdb, c, indata);
400 case CTDB_CONTROL_CANCEL_PERSISTENT_UPDATE:
401 return ctdb_control_cancel_persistent_update(ctdb, c, indata);
/* logs the unrecognised opcode; NOTE(review): the label and return around this line are not visible */
404 DEBUG(DEBUG_CRIT,(__location__ " Unknown CTDB control opcode %u\n", opcode));
410 /* Send a reply for a ctdb control. */
/*
 * Build a CTDB_REPLY_CONTROL packet for request c and queue it back to the
 * node the request came from.
 *
 * ctdb     - daemon context
 * c        - the request being answered; supplies destination node, reqid,
 *            flags and opcode
 * outdata  - optional reply payload (may be NULL, see the ?: tests below)
 * status   - control status; NOTE(review): where it is stored in the reply
 *            is not visible in this extract
 * errormsg - error text appended after the payload
 *
 * NOTE(review): the declaration of len, any NULL guard around the errormsg
 * handling and the early return for NOREPLY are not visible in this extract.
 */
412 void ctdb_request_control_reply(struct ctdb_context *ctdb, struct ctdb_req_control *c,
413 TDB_DATA *outdata, int32_t status, const char *errormsg)
415 struct ctdb_reply_control *r;
418 /* some controls send no reply */
419 if (c->flags & CTDB_CTRL_FLAG_NOREPLY) {
/* packet size: fixed part up to data[], plus the payload ... */
423 len = offsetof(struct ctdb_reply_control, data) + (outdata?outdata->dsize:0);
/* ... plus the error text, without a NUL terminator */
425 len += strlen(errormsg);
427 r = ctdb_transport_allocate(ctdb, ctdb, CTDB_REPLY_CONTROL, len, struct ctdb_reply_control);
428 CTDB_NO_MEMORY_VOID(ctdb, r);
/* route the reply to the requester and echo its reqid */
430 r->hdr.destnode = c->hdr.srcnode;
431 r->hdr.reqid = c->hdr.reqid;
433 r->datalen = outdata?outdata->dsize:0;
434 if (outdata && outdata->dsize) {
435 memcpy(&r->data[0], outdata->dptr, outdata->dsize);
/* the error text is stored immediately after the payload bytes */
438 r->errorlen = strlen(errormsg);
439 memcpy(&r->data[r->datalen], errormsg, r->errorlen);
442 ctdb_queue_packet_opcode(ctdb, &r->hdr, c->opcode);
448 /* Called when a CTDB_REQ_CONTROL packet comes in. */
/*
 * Handle an incoming control request: wrap its payload in a TDB_DATA, run
 * it through ctdb_control_dispatch() and send the reply.
 *
 * ctdb - daemon context
 * hdr  - the received packet, reinterpreted as struct ctdb_req_control
 *
 * NOTE(review): the declaration of status and any test of async_reply
 * before the reply is sent are not visible in this extract.
 */
450 void ctdb_request_control(struct ctdb_context *ctdb, struct ctdb_req_header *hdr)
452 struct ctdb_req_control *c = (struct ctdb_req_control *)hdr;
453 TDB_DATA data, *outdata;
455 bool async_reply = False;
456 const char *errormsg = NULL;
/* data aliases the payload inside the packet; nothing is copied */
458 data.dptr = &c->data[0];
459 data.dsize = c->datalen;
/*
 * zeroed reply descriptor, allocated as a talloc child of the request.
 * NOTE(review): no NULL check on this allocation is visible before it is
 * passed to the dispatcher.
 */
461 outdata = talloc_zero(c, TDB_DATA);
463 status = ctdb_control_dispatch(ctdb, c, data, outdata, hdr->srcnode,
464 &errormsg, &async_reply);
467 ctdb_request_control_reply(ctdb, c, outdata, status, errormsg);
472 /* Called when a CTDB_REPLY_CONTROL packet comes in. */
/*
 * Handle an incoming control reply: look up the pending state by reqid,
 * extract payload and error text from the packet, re-parent the state onto
 * the packet with talloc_steal() and invoke the stored callback with the
 * reply's status, data and error text.
 *
 * ctdb - daemon context
 * hdr  - the received packet, reinterpreted as struct ctdb_reply_control
 *
 * NOTE(review): the declaration of data, the conditions guarding the two
 * DEBUG calls' return paths and the condition around the errormsg copy are
 * not visible in this extract.  The last comment in this function is also
 * cut off here and has no visible terminator.
 */
474 void ctdb_reply_control(struct ctdb_context *ctdb, struct ctdb_req_header *hdr)
476 struct ctdb_reply_control *c = (struct ctdb_reply_control *)hdr;
478 struct ctdb_control_state *state;
479 const char *errormsg = NULL;
/* find the pending request this reply belongs to */
481 state = ctdb_reqid_find(ctdb, hdr->reqid, struct ctdb_control_state);
483 DEBUG(DEBUG_ERR,("pnn %u Invalid reqid %u in ctdb_reply_control\n",
484 ctdb->pnn, hdr->reqid));
488 if (hdr->reqid != state->reqid) {
489 /* we found a record but it was the wrong one */
490 DEBUG(DEBUG_ERR, ("Dropped orphaned control reply with reqid:%u\n", hdr->reqid));
/* data aliases the payload inside the packet; nothing is copied */
494 data.dptr = &c->data[0];
495 data.dsize = c->datalen;
/* the error text follows the payload; copy errorlen bytes of it into a string owned by state */
497 errormsg = talloc_strndup(state,
498 (char *)&c->data[c->datalen], c->errorlen);
501 /* make state a child of the packet, so it goes away when the packet
503 talloc_steal(hdr, state);
505 state->callback(ctdb, c->status, data, errormsg, state->private_data);
/*
 * Destructor for a control state (installed with talloc_set_destructor() in
 * ctdb_daemon_send_control): removes the state's reqid from the context.
 * NOTE(review): the return statement is not visible in this extract.
 */
508 static int ctdb_control_destructor(struct ctdb_control_state *state)
510 ctdb_reqid_remove(state->ctdb, state->reqid);
515 /* Handle a timeout of a control. */
/*
 * Timed-event handler for a control that received no reply in time
 * (registered via event_add_timed() in ctdb_daemon_send_control).
 *
 * ev, te, t    - event context, timed event and time supplied by the event
 *                loop; only ev is used in the visible lines
 * private_data - the struct ctdb_control_state of the pending control
 */
517 static void ctdb_control_timeout(struct event_context *ev, struct timed_event *te,
518 struct timeval t, void *private_data)
520 struct ctdb_control_state *state = talloc_get_type(private_data, struct ctdb_control_state);
/* scratch context parented to the event context */
521 TALLOC_CTX *tmp_ctx = talloc_new(ev);
523 state->ctdb->statistics.timeouts.control++;
/* re-parent state so that freeing tmp_ctx below also frees state, after the callback has run */
525 talloc_steal(tmp_ctx, state);
/* report the timeout: status -1, empty data, fixed error text */
527 state->callback(state->ctdb, -1, tdb_null,
528 "ctdb_control timed out",
529 state->private_data);
530 talloc_free(tmp_ctx);
535 /* Send a control message to a node. */
/*
 * Build a CTDB_REQ_CONTROL packet and queue it for destnode, recording a
 * ctdb_control_state so that a later reply or timeout can be delivered to
 * callback.
 *
 * ctdb      - daemon context
 * destnode  - target node number or one of the CTDB_BROADCAST_* values
 * srvid     - NOTE(review): its use is not visible in this extract
 * opcode    - NOTE(review): its use is not visible in this extract
 * client_id - stored in the request packet
 * callback  - stored in the state; also called directly with status -1 when
 *             the target is invalid or disconnected and a reply is expected
 *
 * NOTE(review): the remaining parameters (flags, data and private_data are
 * used below), the declaration of len, the return statements and the end of
 * the function are not visible in this extract.
 */
537 int ctdb_daemon_send_control(struct ctdb_context *ctdb, uint32_t destnode,
538 uint64_t srvid, uint32_t opcode, uint32_t client_id,
541 ctdb_control_callback_fn_t callback,
544 struct ctdb_req_control *c;
545 struct ctdb_control_state *state;
/* a broadcast destination combined with an expected reply is flagged as critical */
548 if (((destnode == CTDB_BROADCAST_VNNMAP) ||
549 (destnode == CTDB_BROADCAST_ALL) ||
550 (destnode == CTDB_BROADCAST_CONNECTED)) &&
551 !(flags & CTDB_CTRL_FLAG_NOREPLY)) {
552 DEBUG(DEBUG_CRIT,("Attempt to broadcast control without NOREPLY\n"));
/* a non-broadcast target must be a valid pnn that is not marked disconnected */
556 if (destnode != CTDB_BROADCAST_VNNMAP &&
557 destnode != CTDB_BROADCAST_ALL &&
558 destnode != CTDB_BROADCAST_CONNECTED &&
559 (!ctdb_validate_pnn(ctdb, destnode) ||
560 (ctdb->nodes[destnode]->flags & NODE_FLAGS_DISCONNECTED))) {
/* when a reply is expected, the failure is reported through the callback */
561 if (!(flags & CTDB_CTRL_FLAG_NOREPLY)) {
562 callback(ctdb, -1, tdb_null, "ctdb_control to disconnected node", private_data);
567 /* the state is made a child of private_data if possible. This means any reply
568 will be discarded if the private_data goes away */
569 state = talloc(private_data?private_data:ctdb, struct ctdb_control_state);
570 CTDB_NO_MEMORY(ctdb, state);
/* the reqid ties a later reply packet back to this state */
572 state->reqid = ctdb_reqid_new(ctdb, state);
573 state->callback = callback;
574 state->private_data = private_data;
576 state->flags = flags;
/* the destructor removes the reqid again when state is freed */
578 talloc_set_destructor(state, ctdb_control_destructor);
/* packet size: fixed part up to data[], plus the payload */
580 len = offsetof(struct ctdb_req_control, data) + data.dsize;
/* the packet is allocated with state as its talloc parent */
581 c = ctdb_transport_allocate(ctdb, state, CTDB_REQ_CONTROL, len,
582 struct ctdb_req_control);
583 CTDB_NO_MEMORY(ctdb, c);
584 talloc_set_name_const(c, "ctdb_req_control packet");
586 c->hdr.destnode = destnode;
587 c->hdr.reqid = state->reqid;
589 c->client_id = client_id;
592 c->datalen = data.dsize;
594 memcpy(&c->data[0], data.dptr, data.dsize);
597 ctdb_queue_packet(ctdb, &c->hdr);
/* NOTE(review): the body of this NOREPLY branch is not visible in this extract */
599 if (flags & CTDB_CTRL_FLAG_NOREPLY) {
/* a timeout is armed only when the control_timeout tunable is non-zero; state is passed both as the event's context and as the handler's private data */
604 if (ctdb->tunable.control_timeout) {
605 event_add_timed(ctdb->ev, state,
606 timeval_current_ofs(ctdb->tunable.control_timeout, 0),
607 ctdb_control_timeout, state);