/*
   ctdb_control protocol code

   Copyright (C) Andrew Tridgell  2007

   This program is free software; you can redistribute it and/or modify
   it under the terms of the GNU General Public License as published by
   the Free Software Foundation; either version 2 of the License, or
   (at your option) any later version.

   This program is distributed in the hope that it will be useful,
   but WITHOUT ANY WARRANTY; without even the implied warranty of
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
   GNU General Public License for more details.

   You should have received a copy of the GNU General Public License
   along with this program; if not, write to the Free Software
   Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
*/
21 #include "lib/events/events.h"
22 #include "lib/tdb/include/tdb.h"
23 #include "system/network.h"
24 #include "system/filesys.h"
25 #include "system/wait.h"
26 #include "../include/ctdb_private.h"
27 #include "lib/util/dlinklist.h"
30 struct ctdb_control_state {
31 struct ctdb_context *ctdb;
33 ctdb_control_callback_fn_t callback;
39 process a control request
41 static int32_t ctdb_control_dispatch(struct ctdb_context *ctdb,
42 struct ctdb_req_control *c,
44 TDB_DATA *outdata, uint32_t srcnode,
45 const char **errormsg,
48 uint32_t opcode = c->opcode;
49 uint64_t srvid = c->srvid;
50 uint32_t client_id = c->client_id;
53 case CTDB_CONTROL_PROCESS_EXISTS: {
54 CHECK_CONTROL_DATA_SIZE(sizeof(pid_t));
55 return kill(*(pid_t *)indata.dptr, 0);
58 case CTDB_CONTROL_SET_DEBUG: {
59 CHECK_CONTROL_DATA_SIZE(sizeof(uint32_t));
60 LogLevel = *(uint32_t *)indata.dptr;
64 case CTDB_CONTROL_GET_DEBUG: {
65 CHECK_CONTROL_DATA_SIZE(0);
66 outdata->dptr = (uint8_t *)&LogLevel;
67 outdata->dsize = sizeof(LogLevel);
71 case CTDB_CONTROL_STATISTICS: {
72 CHECK_CONTROL_DATA_SIZE(0);
73 ctdb->statistics.memory_used = talloc_total_size(ctdb);
74 ctdb->statistics.frozen = (ctdb->freeze_mode == CTDB_FREEZE_FROZEN);
75 ctdb->statistics.recovering = (ctdb->recovery_mode == CTDB_RECOVERY_ACTIVE);
76 outdata->dptr = (uint8_t *)&ctdb->statistics;
77 outdata->dsize = sizeof(ctdb->statistics);
81 case CTDB_CONTROL_GET_ALL_TUNABLES: {
82 CHECK_CONTROL_DATA_SIZE(0);
83 outdata->dptr = (uint8_t *)&ctdb->tunable;
84 outdata->dsize = sizeof(ctdb->tunable);
88 case CTDB_CONTROL_DUMP_MEMORY: {
89 CHECK_CONTROL_DATA_SIZE(0);
90 talloc_report_full(ctdb, stdout);
94 case CTDB_CONTROL_STATISTICS_RESET: {
95 CHECK_CONTROL_DATA_SIZE(0);
96 ZERO_STRUCT(ctdb->statistics);
100 case CTDB_CONTROL_GETVNNMAP:
101 return ctdb_control_getvnnmap(ctdb, opcode, indata, outdata);
103 case CTDB_CONTROL_GET_DBMAP:
104 return ctdb_control_getdbmap(ctdb, opcode, indata, outdata);
106 case CTDB_CONTROL_GET_NODEMAP:
107 return ctdb_control_getnodemap(ctdb, opcode, indata, outdata);
109 case CTDB_CONTROL_SETVNNMAP:
110 return ctdb_control_setvnnmap(ctdb, opcode, indata, outdata);
112 case CTDB_CONTROL_PULL_DB:
113 CHECK_CONTROL_DATA_SIZE(sizeof(struct ctdb_control_pulldb));
114 return ctdb_control_pull_db(ctdb, indata, outdata);
116 case CTDB_CONTROL_SET_DMASTER:
117 CHECK_CONTROL_DATA_SIZE(sizeof(struct ctdb_control_set_dmaster));
118 return ctdb_control_set_dmaster(ctdb, indata);
120 case CTDB_CONTROL_PUSH_DB:
121 return ctdb_control_push_db(ctdb, indata);
123 case CTDB_CONTROL_GET_RECMODE: {
124 return ctdb->recovery_mode;
127 case CTDB_CONTROL_SET_RECMASTER: {
128 CHECK_CONTROL_DATA_SIZE(sizeof(uint32_t));
129 if (ctdb->freeze_mode != CTDB_FREEZE_FROZEN) {
130 DEBUG(0,("Attempt to set recmaster when not frozen\n"));
133 ctdb->recovery_master = ((uint32_t *)(&indata.dptr[0]))[0];
137 case CTDB_CONTROL_GET_RECMASTER:
138 return ctdb->recovery_master;
140 case CTDB_CONTROL_GET_PID:
143 case CTDB_CONTROL_GET_VNN:
146 case CTDB_CONTROL_PING:
147 CHECK_CONTROL_DATA_SIZE(0);
148 return ctdb->statistics.num_clients;
150 case CTDB_CONTROL_GET_DBNAME: {
152 struct ctdb_db_context *ctdb_db;
154 CHECK_CONTROL_DATA_SIZE(sizeof(db_id));
155 db_id = *(uint32_t *)indata.dptr;
156 ctdb_db = find_ctdb_db(ctdb, db_id);
157 if (ctdb_db == NULL) return -1;
158 outdata->dptr = discard_const(ctdb_db->db_name);
159 outdata->dsize = strlen(ctdb_db->db_name)+1;
163 case CTDB_CONTROL_GETDBPATH: {
165 struct ctdb_db_context *ctdb_db;
167 CHECK_CONTROL_DATA_SIZE(sizeof(db_id));
168 db_id = *(uint32_t *)indata.dptr;
169 ctdb_db = find_ctdb_db(ctdb, db_id);
170 if (ctdb_db == NULL) return -1;
171 outdata->dptr = discard_const(ctdb_db->db_path);
172 outdata->dsize = strlen(ctdb_db->db_path)+1;
176 case CTDB_CONTROL_DB_ATTACH:
177 return ctdb_control_db_attach(ctdb, indata, outdata);
179 case CTDB_CONTROL_SET_CALL: {
180 struct ctdb_control_set_call *sc =
181 (struct ctdb_control_set_call *)indata.dptr;
182 CHECK_CONTROL_DATA_SIZE(sizeof(struct ctdb_control_set_call));
183 return ctdb_daemon_set_call(ctdb, sc->db_id, sc->fn, sc->id);
186 case CTDB_CONTROL_TRAVERSE_START:
187 CHECK_CONTROL_DATA_SIZE(sizeof(struct ctdb_traverse_start));
188 return ctdb_control_traverse_start(ctdb, indata, outdata, srcnode);
190 case CTDB_CONTROL_TRAVERSE_ALL:
191 return ctdb_control_traverse_all(ctdb, indata, outdata);
193 case CTDB_CONTROL_TRAVERSE_DATA:
194 return ctdb_control_traverse_data(ctdb, indata, outdata);
196 case CTDB_CONTROL_REGISTER_SRVID:
197 return daemon_register_message_handler(ctdb, client_id, srvid);
199 case CTDB_CONTROL_DEREGISTER_SRVID:
200 return daemon_deregister_message_handler(ctdb, client_id, srvid);
202 case CTDB_CONTROL_ENABLE_SEQNUM:
203 CHECK_CONTROL_DATA_SIZE(sizeof(uint32_t));
204 return ctdb_ltdb_enable_seqnum(ctdb, *(uint32_t *)indata.dptr);
206 case CTDB_CONTROL_UPDATE_SEQNUM:
207 CHECK_CONTROL_DATA_SIZE(sizeof(uint32_t));
208 return ctdb_ltdb_update_seqnum(ctdb, *(uint32_t *)indata.dptr, srcnode);
210 case CTDB_CONTROL_FREEZE:
211 CHECK_CONTROL_DATA_SIZE(0);
212 return ctdb_control_freeze(ctdb, c, async_reply);
214 case CTDB_CONTROL_THAW:
215 CHECK_CONTROL_DATA_SIZE(0);
216 return ctdb_control_thaw(ctdb);
218 case CTDB_CONTROL_SET_RECMODE:
219 CHECK_CONTROL_DATA_SIZE(sizeof(uint32_t));
220 return ctdb_control_set_recmode(ctdb, c, indata, async_reply, errormsg);
222 case CTDB_CONTROL_SET_MONMODE:
223 CHECK_CONTROL_DATA_SIZE(sizeof(uint32_t));
224 ctdb->monitoring_mode = *(uint32_t *)indata.dptr;
227 case CTDB_CONTROL_GET_MONMODE:
228 return ctdb->monitoring_mode;
230 case CTDB_CONTROL_SHUTDOWN:
231 ctdb_release_all_ips(ctdb);
232 ctdb->methods->shutdown(ctdb);
233 ctdb_event_script(ctdb, "shutdown");
234 DEBUG(0,("shutting down\n"));
237 case CTDB_CONTROL_MAX_RSN:
238 CHECK_CONTROL_DATA_SIZE(sizeof(uint32_t));
239 return ctdb_control_max_rsn(ctdb, indata, outdata);
241 case CTDB_CONTROL_SET_RSN_NONEMPTY:
242 CHECK_CONTROL_DATA_SIZE(sizeof(struct ctdb_control_set_rsn_nonempty));
243 return ctdb_control_set_rsn_nonempty(ctdb, indata, outdata);
245 case CTDB_CONTROL_TAKEOVER_IP:
246 CHECK_CONTROL_DATA_SIZE(sizeof(struct ctdb_public_ip));
247 return ctdb_control_takeover_ip(ctdb, c, indata, async_reply);
249 case CTDB_CONTROL_RELEASE_IP:
250 CHECK_CONTROL_DATA_SIZE(sizeof(struct ctdb_public_ip));
251 return ctdb_control_release_ip(ctdb, c, indata, async_reply);
253 case CTDB_CONTROL_GET_PUBLIC_IPS:
254 CHECK_CONTROL_DATA_SIZE(0);
255 return ctdb_control_get_public_ips(ctdb, c, outdata);
257 case CTDB_CONTROL_DELETE_LOW_RSN:
258 CHECK_CONTROL_DATA_SIZE(sizeof(struct ctdb_control_delete_low_rsn));
259 return ctdb_control_delete_low_rsn(ctdb, indata, outdata);
261 case CTDB_CONTROL_TCP_CLIENT:
262 CHECK_CONTROL_DATA_SIZE(sizeof(struct ctdb_control_tcp));
263 return ctdb_control_tcp_client(ctdb, client_id, srcnode, indata);
265 case CTDB_CONTROL_STARTUP:
266 CHECK_CONTROL_DATA_SIZE(0);
267 return ctdb_control_startup(ctdb, srcnode);
269 case CTDB_CONTROL_TCP_ADD:
270 CHECK_CONTROL_DATA_SIZE(sizeof(struct ctdb_control_tcp_vnn));
271 return ctdb_control_tcp_add(ctdb, indata);
273 case CTDB_CONTROL_TCP_REMOVE:
274 CHECK_CONTROL_DATA_SIZE(sizeof(struct ctdb_control_tcp_vnn));
275 return ctdb_control_tcp_remove(ctdb, indata);
277 case CTDB_CONTROL_SET_TUNABLE:
278 return ctdb_control_set_tunable(ctdb, indata);
280 case CTDB_CONTROL_GET_TUNABLE:
281 return ctdb_control_get_tunable(ctdb, indata, outdata);
283 case CTDB_CONTROL_LIST_TUNABLES:
284 return ctdb_control_list_tunables(ctdb, outdata);
286 case CTDB_CONTROL_MODIFY_FLAGS:
287 CHECK_CONTROL_DATA_SIZE(sizeof(struct ctdb_node_modflags));
288 return ctdb_control_modflags(ctdb, indata);
291 DEBUG(0,(__location__ " Unknown CTDB control opcode %u\n", opcode));
298 send a reply for a ctdb control
300 void ctdb_request_control_reply(struct ctdb_context *ctdb, struct ctdb_req_control *c,
301 TDB_DATA *outdata, int32_t status, const char *errormsg)
303 struct ctdb_reply_control *r;
306 /* some controls send no reply */
307 if (c->flags & CTDB_CTRL_FLAG_NOREPLY) {
311 len = offsetof(struct ctdb_reply_control, data) + (outdata?outdata->dsize:0);
313 len += strlen(errormsg);
315 r = ctdb_transport_allocate(ctdb, ctdb, CTDB_REPLY_CONTROL, len, struct ctdb_reply_control);
316 CTDB_NO_MEMORY_VOID(ctdb, r);
318 r->hdr.destnode = c->hdr.srcnode;
319 r->hdr.reqid = c->hdr.reqid;
321 r->datalen = outdata?outdata->dsize:0;
322 if (outdata && outdata->dsize) {
323 memcpy(&r->data[0], outdata->dptr, outdata->dsize);
326 r->errorlen = strlen(errormsg);
327 memcpy(&r->data[r->datalen], errormsg, r->errorlen);
330 ctdb_queue_packet(ctdb, &r->hdr);
336 called when a CTDB_REQ_CONTROL packet comes in
338 void ctdb_request_control(struct ctdb_context *ctdb, struct ctdb_req_header *hdr)
340 struct ctdb_req_control *c = (struct ctdb_req_control *)hdr;
341 TDB_DATA data, *outdata;
343 bool async_reply = False;
344 const char *errormsg = NULL;
346 data.dptr = &c->data[0];
347 data.dsize = c->datalen;
349 outdata = talloc_zero(c, TDB_DATA);
351 status = ctdb_control_dispatch(ctdb, c, data, outdata, hdr->srcnode,
352 &errormsg, &async_reply);
355 ctdb_request_control_reply(ctdb, c, outdata, status, errormsg);
360 called when a CTDB_REPLY_CONTROL packet comes in
362 void ctdb_reply_control(struct ctdb_context *ctdb, struct ctdb_req_header *hdr)
364 struct ctdb_reply_control *c = (struct ctdb_reply_control *)hdr;
366 struct ctdb_control_state *state;
367 const char *errormsg = NULL;
369 state = ctdb_reqid_find(ctdb, hdr->reqid, struct ctdb_control_state);
371 DEBUG(0,("vnn %u Invalid reqid %u in ctdb_reply_control\n",
372 ctdb->vnn, hdr->reqid));
376 if (hdr->reqid != state->reqid) {
377 /* we found a record but it was the wrong one */
378 DEBUG(0, ("Dropped orphaned control reply with reqid:%u\n", hdr->reqid));
382 data.dptr = &c->data[0];
383 data.dsize = c->datalen;
385 errormsg = talloc_strndup(state,
386 (char *)&c->data[c->datalen], c->errorlen);
389 /* make state a child of the packet, so it goes away when the packet
391 talloc_steal(hdr, state);
393 state->callback(ctdb, c->status, data, errormsg, state->private_data);
396 static int ctdb_control_destructor(struct ctdb_control_state *state)
398 ctdb_reqid_remove(state->ctdb, state->reqid);
403 handle a timeout of a control
405 static void ctdb_control_timeout(struct event_context *ev, struct timed_event *te,
406 struct timeval t, void *private_data)
408 struct ctdb_control_state *state = talloc_get_type(private_data, struct ctdb_control_state);
409 TALLOC_CTX *tmp_ctx = talloc_new(ev);
411 state->ctdb->statistics.timeouts.control++;
413 talloc_steal(tmp_ctx, state);
415 state->callback(state->ctdb, -1, tdb_null,
416 "ctdb_control timed out",
417 state->private_data);
418 talloc_free(tmp_ctx);
423 send a control message to a node
425 int ctdb_daemon_send_control(struct ctdb_context *ctdb, uint32_t destnode,
426 uint64_t srvid, uint32_t opcode, uint32_t client_id,
429 ctdb_control_callback_fn_t callback,
432 struct ctdb_req_control *c;
433 struct ctdb_control_state *state;
436 if (((destnode == CTDB_BROADCAST_VNNMAP) || (destnode == CTDB_BROADCAST_VNNMAP)) && !(flags & CTDB_CTRL_FLAG_NOREPLY)) {
437 DEBUG(0,("Attempt to broadcast control without NOREPLY\n"));
441 if (destnode != CTDB_BROADCAST_VNNMAP && destnode != CTDB_BROADCAST_ALL &&
442 (!ctdb_validate_vnn(ctdb, destnode) ||
443 (ctdb->nodes[destnode]->flags & NODE_FLAGS_DISCONNECTED))) {
444 if (!(flags & CTDB_CTRL_FLAG_NOREPLY)) {
445 callback(ctdb, -1, tdb_null, "ctdb_control to disconnected node", private_data);
450 /* the state is made a child of private_data if possible. This means any reply
451 will be discarded if the private_data goes away */
452 state = talloc(private_data?private_data:ctdb, struct ctdb_control_state);
453 CTDB_NO_MEMORY(ctdb, state);
455 state->reqid = ctdb_reqid_new(ctdb, state);
456 state->callback = callback;
457 state->private_data = private_data;
459 state->flags = flags;
461 talloc_set_destructor(state, ctdb_control_destructor);
463 len = offsetof(struct ctdb_req_control, data) + data.dsize;
464 c = ctdb_transport_allocate(ctdb, state, CTDB_REQ_CONTROL, len,
465 struct ctdb_req_control);
466 CTDB_NO_MEMORY(ctdb, c);
467 talloc_set_name_const(c, "ctdb_req_control packet");
469 c->hdr.destnode = destnode;
470 c->hdr.reqid = state->reqid;
472 c->client_id = client_id;
475 c->datalen = data.dsize;
477 memcpy(&c->data[0], data.dptr, data.dsize);
480 ctdb_queue_packet(ctdb, &c->hdr);
482 if (flags & CTDB_CTRL_FLAG_NOREPLY) {
487 if (ctdb->tunable.control_timeout) {
488 event_add_timed(ctdb->ev, state,
489 timeval_current_ofs(ctdb->tunable.control_timeout, 0),
490 ctdb_control_timeout, state);