959705de6e3c0859b88b75943a97eac78b44e38d
[vlendec/samba-autobuild/.git] / ctdb / server / ctdb_control.c
1 /* 
2    ctdb_control protocol code
3
4    Copyright (C) Andrew Tridgell  2007
5
6    This program is free software; you can redistribute it and/or modify
7    it under the terms of the GNU General Public License as published by
8    the Free Software Foundation; either version 3 of the License, or
9    (at your option) any later version.
10    
11    This program is distributed in the hope that it will be useful,
12    but WITHOUT ANY WARRANTY; without even the implied warranty of
13    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
14    GNU General Public License for more details.
15    
16    You should have received a copy of the GNU General Public License
17    along with this program; if not, see <http://www.gnu.org/licenses/>.
18 */
19 #include "includes.h"
20 #include "lib/events/events.h"
21 #include "lib/tdb/include/tdb.h"
22 #include "system/network.h"
23 #include "system/filesys.h"
24 #include "system/wait.h"
25 #include "../include/ctdb_private.h"
26 #include "lib/util/dlinklist.h"
27 #include "db_wrap.h"
28
29
30 struct ctdb_control_state {
31         struct ctdb_context *ctdb;
32         uint32_t reqid;
33         ctdb_control_callback_fn_t callback;
34         void *private_data;
35         unsigned flags;
36 };
37
38
39 /*
40   process a control request
41  */
42 static int32_t ctdb_control_dispatch(struct ctdb_context *ctdb, 
43                                      struct ctdb_req_control *c,
44                                      TDB_DATA indata,
45                                      TDB_DATA *outdata, uint32_t srcnode,
46                                      const char **errormsg,
47                                      bool *async_reply)
48 {
49         uint32_t opcode = c->opcode;
50         uint64_t srvid = c->srvid;
51         uint32_t client_id = c->client_id;
52
53         switch (opcode) {
54         case CTDB_CONTROL_PROCESS_EXISTS: {
55                 CHECK_CONTROL_DATA_SIZE(sizeof(pid_t));
56                 return kill(*(pid_t *)indata.dptr, 0);
57         }
58
59         case CTDB_CONTROL_SET_DEBUG: {
60                 CHECK_CONTROL_DATA_SIZE(sizeof(uint32_t));
61                 LogLevel = *(uint32_t *)indata.dptr;
62                 return 0;
63         }
64
65         case CTDB_CONTROL_GET_DEBUG: {
66                 CHECK_CONTROL_DATA_SIZE(0);
67                 outdata->dptr = (uint8_t *)&LogLevel;
68                 outdata->dsize = sizeof(LogLevel);
69                 return 0;
70         }
71
72         case CTDB_CONTROL_STATISTICS: {
73                 CHECK_CONTROL_DATA_SIZE(0);
74                 ctdb->statistics.memory_used = talloc_total_size(ctdb);
75                 ctdb->statistics.frozen = (ctdb->freeze_mode == CTDB_FREEZE_FROZEN);
76                 ctdb->statistics.recovering = (ctdb->recovery_mode == CTDB_RECOVERY_ACTIVE);
77                 outdata->dptr = (uint8_t *)&ctdb->statistics;
78                 outdata->dsize = sizeof(ctdb->statistics);
79                 return 0;
80         }
81
82         case CTDB_CONTROL_GET_ALL_TUNABLES: {
83                 CHECK_CONTROL_DATA_SIZE(0);
84                 outdata->dptr = (uint8_t *)&ctdb->tunable;
85                 outdata->dsize = sizeof(ctdb->tunable);
86                 return 0;
87         }
88
89         case CTDB_CONTROL_DUMP_MEMORY: {
90                 CHECK_CONTROL_DATA_SIZE(0);
91                 talloc_report_full(ctdb, stdout);
92                 return 0;
93         }
94
95         case CTDB_CONTROL_STATISTICS_RESET: {
96                 CHECK_CONTROL_DATA_SIZE(0);
97                 ZERO_STRUCT(ctdb->statistics);
98                 return 0;
99         }
100
101         case CTDB_CONTROL_GETVNNMAP:
102                 return ctdb_control_getvnnmap(ctdb, opcode, indata, outdata);
103
104         case CTDB_CONTROL_GET_DBMAP:
105                 return ctdb_control_getdbmap(ctdb, opcode, indata, outdata);
106
107         case CTDB_CONTROL_GET_NODEMAP:
108                 return ctdb_control_getnodemap(ctdb, opcode, indata, outdata);
109
110         case CTDB_CONTROL_SETVNNMAP:
111                 return ctdb_control_setvnnmap(ctdb, opcode, indata, outdata);
112
113         case CTDB_CONTROL_PULL_DB: 
114                 CHECK_CONTROL_DATA_SIZE(sizeof(struct ctdb_control_pulldb));
115                 return ctdb_control_pull_db(ctdb, indata, outdata);
116
117         case CTDB_CONTROL_SET_DMASTER: 
118                 CHECK_CONTROL_DATA_SIZE(sizeof(struct ctdb_control_set_dmaster));
119                 return ctdb_control_set_dmaster(ctdb, indata);
120
121         case CTDB_CONTROL_PUSH_DB:
122                 return ctdb_control_push_db(ctdb, indata);
123
124         case CTDB_CONTROL_GET_RECMODE: {
125                 return ctdb->recovery_mode;
126         }
127
128         case CTDB_CONTROL_SET_RECMASTER: {
129                 CHECK_CONTROL_DATA_SIZE(sizeof(uint32_t));
130                 if (ctdb->freeze_mode != CTDB_FREEZE_FROZEN) {
131                         DEBUG(0,("Attempt to set recmaster when not frozen\n"));
132                         return -1;
133                 }
134                 ctdb->recovery_master = ((uint32_t *)(&indata.dptr[0]))[0];
135                 return 0;
136         }
137
138         case CTDB_CONTROL_GET_RECMASTER:
139                 return ctdb->recovery_master;
140
141         case CTDB_CONTROL_GET_PID:
142                 return getpid();
143
144         case CTDB_CONTROL_GET_PNN:
145                 return ctdb->pnn;
146
147         case CTDB_CONTROL_PING:
148                 CHECK_CONTROL_DATA_SIZE(0);
149                 return ctdb->statistics.num_clients;
150
151         case CTDB_CONTROL_GET_DBNAME: {
152                 uint32_t db_id;
153                 struct ctdb_db_context *ctdb_db;
154
155                 CHECK_CONTROL_DATA_SIZE(sizeof(db_id));
156                 db_id = *(uint32_t *)indata.dptr;
157                 ctdb_db = find_ctdb_db(ctdb, db_id);
158                 if (ctdb_db == NULL) return -1;
159                 outdata->dptr = discard_const(ctdb_db->db_name);
160                 outdata->dsize = strlen(ctdb_db->db_name)+1;
161                 return 0;
162         }
163
164         case CTDB_CONTROL_GETDBPATH: {
165                 uint32_t db_id;
166                 struct ctdb_db_context *ctdb_db;
167
168                 CHECK_CONTROL_DATA_SIZE(sizeof(db_id));
169                 db_id = *(uint32_t *)indata.dptr;
170                 ctdb_db = find_ctdb_db(ctdb, db_id);
171                 if (ctdb_db == NULL) return -1;
172                 outdata->dptr = discard_const(ctdb_db->db_path);
173                 outdata->dsize = strlen(ctdb_db->db_path)+1;
174                 return 0;
175         }
176
177         case CTDB_CONTROL_DB_ATTACH:
178                 return ctdb_control_db_attach(ctdb, indata, outdata, false);
179
180         case CTDB_CONTROL_DB_ATTACH_PERSISTENT:
181                 return ctdb_control_db_attach(ctdb, indata, outdata, true);
182
183         case CTDB_CONTROL_SET_CALL: {
184                 struct ctdb_control_set_call *sc = 
185                         (struct ctdb_control_set_call *)indata.dptr;
186                 CHECK_CONTROL_DATA_SIZE(sizeof(struct ctdb_control_set_call));
187                 return ctdb_daemon_set_call(ctdb, sc->db_id, sc->fn, sc->id);
188         }
189
190         case CTDB_CONTROL_TRAVERSE_START:
191                 CHECK_CONTROL_DATA_SIZE(sizeof(struct ctdb_traverse_start));
192                 return ctdb_control_traverse_start(ctdb, indata, outdata, srcnode);
193
194         case CTDB_CONTROL_TRAVERSE_ALL:
195                 return ctdb_control_traverse_all(ctdb, indata, outdata);
196
197         case CTDB_CONTROL_TRAVERSE_DATA:
198                 return ctdb_control_traverse_data(ctdb, indata, outdata);
199
200         case CTDB_CONTROL_REGISTER_SRVID:
201                 return daemon_register_message_handler(ctdb, client_id, srvid);
202
203         case CTDB_CONTROL_DEREGISTER_SRVID:
204                 return daemon_deregister_message_handler(ctdb, client_id, srvid);
205
206         case CTDB_CONTROL_ENABLE_SEQNUM:
207                 CHECK_CONTROL_DATA_SIZE(sizeof(uint32_t));
208                 return ctdb_ltdb_enable_seqnum(ctdb, *(uint32_t *)indata.dptr);
209
210         case CTDB_CONTROL_UPDATE_SEQNUM:
211                 CHECK_CONTROL_DATA_SIZE(sizeof(uint32_t));              
212                 return ctdb_ltdb_update_seqnum(ctdb, *(uint32_t *)indata.dptr, srcnode);
213
214         case CTDB_CONTROL_FREEZE:
215                 CHECK_CONTROL_DATA_SIZE(0);
216                 return ctdb_control_freeze(ctdb, c, async_reply);
217
218         case CTDB_CONTROL_THAW:
219                 CHECK_CONTROL_DATA_SIZE(0);
220                 return ctdb_control_thaw(ctdb);
221
222         case CTDB_CONTROL_SET_RECMODE:
223                 CHECK_CONTROL_DATA_SIZE(sizeof(uint32_t));              
224                 return ctdb_control_set_recmode(ctdb, c, indata, async_reply, errormsg);
225
226         case CTDB_CONTROL_SET_MONMODE:
227                 CHECK_CONTROL_DATA_SIZE(sizeof(uint32_t));              
228                 ctdb->monitoring_mode = *(uint32_t *)indata.dptr;
229                 return 0;
230
231         case CTDB_CONTROL_GET_MONMODE: 
232                 return ctdb->monitoring_mode;
233
234         case CTDB_CONTROL_SHUTDOWN:
235                 ctdb_release_all_ips(ctdb);
236                 ctdb->methods->shutdown(ctdb);
237                 ctdb_event_script(ctdb, "shutdown");
238                 DEBUG(0,("Received SHUTDOWN command. Stopping CTDB daemon.\n"));
239                 exit(0);
240
241         case CTDB_CONTROL_MAX_RSN: 
242                 CHECK_CONTROL_DATA_SIZE(sizeof(uint32_t));
243                 return ctdb_control_max_rsn(ctdb, indata, outdata);
244
245         case CTDB_CONTROL_SET_RSN_NONEMPTY: 
246                 CHECK_CONTROL_DATA_SIZE(sizeof(struct ctdb_control_set_rsn_nonempty));
247                 return ctdb_control_set_rsn_nonempty(ctdb, indata, outdata);
248
249         case CTDB_CONTROL_TAKEOVER_IP:
250                 CHECK_CONTROL_DATA_SIZE(sizeof(struct ctdb_public_ip));
251                 return ctdb_control_takeover_ip(ctdb, c, indata, async_reply);
252
253         case CTDB_CONTROL_RELEASE_IP:
254                 CHECK_CONTROL_DATA_SIZE(sizeof(struct ctdb_public_ip));
255                 return ctdb_control_release_ip(ctdb, c, indata, async_reply);
256
257         case CTDB_CONTROL_GET_PUBLIC_IPS:
258                 CHECK_CONTROL_DATA_SIZE(0);
259                 return ctdb_control_get_public_ips(ctdb, c, outdata);
260
261         case CTDB_CONTROL_DELETE_LOW_RSN: 
262                 CHECK_CONTROL_DATA_SIZE(sizeof(struct ctdb_control_delete_low_rsn));
263                 return ctdb_control_delete_low_rsn(ctdb, indata, outdata);
264
265         case CTDB_CONTROL_TCP_CLIENT: 
266                 CHECK_CONTROL_DATA_SIZE(sizeof(struct ctdb_control_tcp));
267                 return ctdb_control_tcp_client(ctdb, client_id, indata);
268
269         case CTDB_CONTROL_STARTUP: 
270                 CHECK_CONTROL_DATA_SIZE(0);
271                 return ctdb_control_startup(ctdb, srcnode);
272
273         case CTDB_CONTROL_TCP_ADD: 
274                 CHECK_CONTROL_DATA_SIZE(sizeof(struct ctdb_control_tcp_vnn));
275                 return ctdb_control_tcp_add(ctdb, indata);
276
277         case CTDB_CONTROL_SET_TUNABLE:
278                 return ctdb_control_set_tunable(ctdb, indata);
279
280         case CTDB_CONTROL_GET_TUNABLE:
281                 return ctdb_control_get_tunable(ctdb, indata, outdata);
282
283         case CTDB_CONTROL_LIST_TUNABLES:
284                 return ctdb_control_list_tunables(ctdb, outdata);
285
286         case CTDB_CONTROL_MODIFY_FLAGS:
287                 CHECK_CONTROL_DATA_SIZE(sizeof(struct ctdb_node_modflags));
288                 return ctdb_control_modflags(ctdb, indata);
289
290         case CTDB_CONTROL_KILL_TCP: 
291                 CHECK_CONTROL_DATA_SIZE(sizeof(struct ctdb_control_killtcp));
292                 return ctdb_control_kill_tcp(ctdb, indata);
293
294         case CTDB_CONTROL_GET_TCP_TICKLE_LIST:
295                 CHECK_CONTROL_DATA_SIZE(sizeof(struct sockaddr_in));
296                 return ctdb_control_get_tcp_tickle_list(ctdb, indata, outdata);
297
298         case CTDB_CONTROL_SET_TCP_TICKLE_LIST:
299                 /* data size is verified in the called function */
300                 return ctdb_control_set_tcp_tickle_list(ctdb, indata);
301
302         case CTDB_CONTROL_REGISTER_SERVER_ID: 
303                 CHECK_CONTROL_DATA_SIZE(sizeof(struct ctdb_server_id));
304                 return ctdb_control_register_server_id(ctdb, client_id, indata);
305
306         case CTDB_CONTROL_UNREGISTER_SERVER_ID: 
307                 CHECK_CONTROL_DATA_SIZE(sizeof(struct ctdb_server_id));
308                 return ctdb_control_unregister_server_id(ctdb, indata);
309
310         case CTDB_CONTROL_CHECK_SERVER_ID: 
311                 CHECK_CONTROL_DATA_SIZE(sizeof(struct ctdb_server_id));
312                 return ctdb_control_check_server_id(ctdb, indata);
313
314         case CTDB_CONTROL_GET_SERVER_ID_LIST:
315                 CHECK_CONTROL_DATA_SIZE(0);
316                 return ctdb_control_get_server_id_list(ctdb, outdata);
317
318         case CTDB_CONTROL_PERSISTENT_STORE:
319                 return ctdb_control_persistent_store(ctdb, c, indata, async_reply);
320
321         case CTDB_CONTROL_UPDATE_RECORD:
322                 return ctdb_control_update_record(ctdb, c, indata, async_reply);
323
324         case CTDB_CONTROL_SEND_GRATIOUS_ARP:
325                 return ctdb_control_send_gratious_arp(ctdb, indata);
326
327         default:
328                 DEBUG(0,(__location__ " Unknown CTDB control opcode %u\n", opcode));
329                 return -1;
330         }
331 }
332
333
334 /*
335   send a reply for a ctdb control
336  */
337 void ctdb_request_control_reply(struct ctdb_context *ctdb, struct ctdb_req_control *c,
338                                 TDB_DATA *outdata, int32_t status, const char *errormsg)
339 {
340         struct ctdb_reply_control *r;
341         size_t len;
342         
343         /* some controls send no reply */
344         if (c->flags & CTDB_CTRL_FLAG_NOREPLY) {
345                 return;
346         }
347
348         len = offsetof(struct ctdb_reply_control, data) + (outdata?outdata->dsize:0);
349         if (errormsg) {
350                 len += strlen(errormsg);
351         }
352         r = ctdb_transport_allocate(ctdb, ctdb, CTDB_REPLY_CONTROL, len, struct ctdb_reply_control);
353         CTDB_NO_MEMORY_VOID(ctdb, r);
354
355         r->hdr.destnode     = c->hdr.srcnode;
356         r->hdr.reqid        = c->hdr.reqid;
357         r->status           = status;
358         r->datalen          = outdata?outdata->dsize:0;
359         if (outdata && outdata->dsize) {
360                 memcpy(&r->data[0], outdata->dptr, outdata->dsize);
361         }
362         if (errormsg) {
363                 r->errorlen = strlen(errormsg);
364                 memcpy(&r->data[r->datalen], errormsg, r->errorlen);
365         }
366         
367         ctdb_queue_packet(ctdb, &r->hdr);       
368
369         talloc_free(r);
370 }
371
372 /*
373   called when a CTDB_REQ_CONTROL packet comes in
374 */
375 void ctdb_request_control(struct ctdb_context *ctdb, struct ctdb_req_header *hdr)
376 {
377         struct ctdb_req_control *c = (struct ctdb_req_control *)hdr;
378         TDB_DATA data, *outdata;
379         int32_t status;
380         bool async_reply = False;
381         const char *errormsg = NULL;
382
383         data.dptr = &c->data[0];
384         data.dsize = c->datalen;
385
386         outdata = talloc_zero(c, TDB_DATA);
387
388         status = ctdb_control_dispatch(ctdb, c, data, outdata, hdr->srcnode, 
389                                        &errormsg, &async_reply);
390
391         if (!async_reply) {
392                 ctdb_request_control_reply(ctdb, c, outdata, status, errormsg);
393         }
394 }
395
396 /*
397   called when a CTDB_REPLY_CONTROL packet comes in
398 */
399 void ctdb_reply_control(struct ctdb_context *ctdb, struct ctdb_req_header *hdr)
400 {
401         struct ctdb_reply_control *c = (struct ctdb_reply_control *)hdr;
402         TDB_DATA data;
403         struct ctdb_control_state *state;
404         const char *errormsg = NULL;
405
406         state = ctdb_reqid_find(ctdb, hdr->reqid, struct ctdb_control_state);
407         if (state == NULL) {
408                 DEBUG(0,("pnn %u Invalid reqid %u in ctdb_reply_control\n",
409                          ctdb->pnn, hdr->reqid));
410                 return;
411         }
412
413         if (hdr->reqid != state->reqid) {
414                 /* we found a record  but it was the wrong one */
415                 DEBUG(0, ("Dropped orphaned control reply with reqid:%u\n", hdr->reqid));
416                 return;
417         }
418
419         data.dptr = &c->data[0];
420         data.dsize = c->datalen;
421         if (c->errorlen) {
422                 errormsg = talloc_strndup(state, 
423                                           (char *)&c->data[c->datalen], c->errorlen);
424         }
425
426         /* make state a child of the packet, so it goes away when the packet
427            is freed. */
428         talloc_steal(hdr, state);
429
430         state->callback(ctdb, c->status, data, errormsg, state->private_data);
431 }
432
433 static int ctdb_control_destructor(struct ctdb_control_state *state)
434 {
435         ctdb_reqid_remove(state->ctdb, state->reqid);
436         return 0;
437 }
438
439 /*
440   handle a timeout of a control
441  */
442 static void ctdb_control_timeout(struct event_context *ev, struct timed_event *te, 
443                        struct timeval t, void *private_data)
444 {
445         struct ctdb_control_state *state = talloc_get_type(private_data, struct ctdb_control_state);
446         TALLOC_CTX *tmp_ctx = talloc_new(ev);
447
448         state->ctdb->statistics.timeouts.control++;
449
450         talloc_steal(tmp_ctx, state);
451
452         state->callback(state->ctdb, -1, tdb_null,
453                         "ctdb_control timed out", 
454                         state->private_data);
455         talloc_free(tmp_ctx);
456 }
457
458
459 /*
460   send a control message to a node
461  */
462 int ctdb_daemon_send_control(struct ctdb_context *ctdb, uint32_t destnode,
463                              uint64_t srvid, uint32_t opcode, uint32_t client_id,
464                              uint32_t flags,
465                              TDB_DATA data,
466                              ctdb_control_callback_fn_t callback,
467                              void *private_data)
468 {
469         struct ctdb_req_control *c;
470         struct ctdb_control_state *state;
471         size_t len;
472
473         if (((destnode == CTDB_BROADCAST_VNNMAP) || 
474              (destnode == CTDB_BROADCAST_ALL) ||
475              (destnode == CTDB_BROADCAST_CONNECTED)) && 
476             !(flags & CTDB_CTRL_FLAG_NOREPLY)) {
477                 DEBUG(0,("Attempt to broadcast control without NOREPLY\n"));
478                 return -1;
479         }
480
481         if (destnode != CTDB_BROADCAST_VNNMAP && 
482             destnode != CTDB_BROADCAST_ALL && 
483             destnode != CTDB_BROADCAST_CONNECTED && 
484             (!ctdb_validate_pnn(ctdb, destnode) || 
485              (ctdb->nodes[destnode]->flags & NODE_FLAGS_DISCONNECTED))) {
486                 if (!(flags & CTDB_CTRL_FLAG_NOREPLY)) {
487                         callback(ctdb, -1, tdb_null, "ctdb_control to disconnected node", private_data);
488                 }
489                 return 0;
490         }
491
492         /* the state is made a child of private_data if possible. This means any reply
493            will be discarded if the private_data goes away */
494         state = talloc(private_data?private_data:ctdb, struct ctdb_control_state);
495         CTDB_NO_MEMORY(ctdb, state);
496
497         state->reqid = ctdb_reqid_new(ctdb, state);
498         state->callback = callback;
499         state->private_data = private_data;
500         state->ctdb = ctdb;
501         state->flags = flags;
502
503         talloc_set_destructor(state, ctdb_control_destructor);
504
505         len = offsetof(struct ctdb_req_control, data) + data.dsize;
506         c = ctdb_transport_allocate(ctdb, state, CTDB_REQ_CONTROL, len, 
507                                     struct ctdb_req_control);
508         CTDB_NO_MEMORY(ctdb, c);
509         talloc_set_name_const(c, "ctdb_req_control packet");
510
511         c->hdr.destnode     = destnode;
512         c->hdr.reqid        = state->reqid;
513         c->opcode           = opcode;
514         c->client_id        = client_id;
515         c->flags            = flags;
516         c->srvid            = srvid;
517         c->datalen          = data.dsize;
518         if (data.dsize) {
519                 memcpy(&c->data[0], data.dptr, data.dsize);
520         }
521
522         ctdb_queue_packet(ctdb, &c->hdr);       
523
524         if (flags & CTDB_CTRL_FLAG_NOREPLY) {
525                 talloc_free(state);
526                 return 0;
527         }
528
529         if (ctdb->tunable.control_timeout) {
530                 event_add_timed(ctdb->ev, state, 
531                                 timeval_current_ofs(ctdb->tunable.control_timeout, 0), 
532                                 ctdb_control_timeout, state);
533         }
534
535         talloc_free(c);
536         return 0;
537 }