Make Samba 3 and Samba 4 both use the same single copy of libreplace.
[kai/samba.git] / source4 / cluster / ctdb / server / ctdb_control.c
1 /* 
2    ctdb_control protocol code
3
4    Copyright (C) Andrew Tridgell  2007
5
6    This program is free software; you can redistribute it and/or modify
7    it under the terms of the GNU General Public License as published by
8    the Free Software Foundation; either version 3 of the License, or
9    (at your option) any later version.
10    
11    This program is distributed in the hope that it will be useful,
12    but WITHOUT ANY WARRANTY; without even the implied warranty of
13    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
14    GNU General Public License for more details.
15    
16    You should have received a copy of the GNU General Public License
17    along with this program; if not, see <http://www.gnu.org/licenses/>.
18 */
19 #include "includes.h"
20 #include "lib/events/events.h"
21 #include "lib/tdb/include/tdb.h"
22 #include "system/network.h"
23 #include "system/filesys.h"
24 #include "system/wait.h"
25 #include "../include/ctdb_private.h"
26 #include "lib/util/dlinklist.h"
27
28 struct ctdb_control_state {
29         struct ctdb_context *ctdb;
30         uint32_t reqid;
31         ctdb_control_callback_fn_t callback;
32         void *private_data;
33         unsigned flags;
34 };
35
36 /*
37   process a control request

  Dispatches on c->opcode. Simple controls are answered inline; the rest
  are forwarded to the matching ctdb_control_*() / daemon_*() /
  ctdb_ltdb_*() handler.

  ctdb        - daemon context
  c           - the incoming control request packet
  indata      - request payload
  outdata     - receives the reply payload, if any. Several cases point it
                straight at live daemon state (LogLevel, ctdb->statistics,
                ctdb->tunable, database name/path strings) instead of
                making a copy
  srcnode     - node the request came from
  errormsg    - handed to handlers that can report an error string
  async_reply - handed to handlers that may defer their reply

  Returns the status of the control, -1 for an unknown opcode. Note that
  several "get" style controls return the requested value itself as the
  status instead of using outdata.

  NOTE(review): CHECK_CONTROL_DATA_SIZE() is defined outside this file;
  it presumably returns an error from this function when indata.dsize
  does not match the expected size -- confirm against its definition.
38  */
39 static int32_t ctdb_control_dispatch(struct ctdb_context *ctdb, 
40                                      struct ctdb_req_control *c,
41                                      TDB_DATA indata,
42                                      TDB_DATA *outdata, uint32_t srcnode,
43                                      const char **errormsg,
44                                      bool *async_reply)
45 {
46         uint32_t opcode = c->opcode;
47         uint64_t srvid = c->srvid;
48         uint32_t client_id = c->client_id;
49
50         switch (opcode) {
51         case CTDB_CONTROL_PROCESS_EXISTS: {
52                 CHECK_CONTROL_DATA_SIZE(sizeof(pid_t));
                   /* signal 0 delivers nothing; kill() only performs its
                      existence/permission check and that result is the status */
53                 return kill(*(pid_t *)indata.dptr, 0);
54         }
55
56         case CTDB_CONTROL_SET_DEBUG: {
57                 CHECK_CONTROL_DATA_SIZE(sizeof(uint32_t));
58                 LogLevel = *(uint32_t *)indata.dptr;
59                 return 0;
60         }
61
62         case CTDB_CONTROL_GET_DEBUG: {
63                 CHECK_CONTROL_DATA_SIZE(0);
                   /* the reply points at the global itself, not at a copy */
64                 outdata->dptr = (uint8_t *)&LogLevel;
65                 outdata->dsize = sizeof(LogLevel);
66                 return 0;
67         }
68
69         case CTDB_CONTROL_STATISTICS: {
70                 CHECK_CONTROL_DATA_SIZE(0);
                   /* refresh the computed fields before exposing the struct */
71                 ctdb->statistics.memory_used = talloc_total_size(ctdb);
72                 ctdb->statistics.frozen = (ctdb->freeze_mode == CTDB_FREEZE_FROZEN);
73                 ctdb->statistics.recovering = (ctdb->recovery_mode == CTDB_RECOVERY_ACTIVE);
74                 outdata->dptr = (uint8_t *)&ctdb->statistics;
75                 outdata->dsize = sizeof(ctdb->statistics);
76                 return 0;
77         }
78
79         case CTDB_CONTROL_GET_ALL_TUNABLES: {
80                 CHECK_CONTROL_DATA_SIZE(0);
81                 outdata->dptr = (uint8_t *)&ctdb->tunable;
82                 outdata->dsize = sizeof(ctdb->tunable);
83                 return 0;
84         }
85
86         case CTDB_CONTROL_DUMP_MEMORY: {
87                 CHECK_CONTROL_DATA_SIZE(0);
                   /* the report is written to this process's stdout; nothing
                      is placed in outdata */
88                 talloc_report_full(ctdb, stdout);
89                 return 0;
90         }
91
92         case CTDB_CONTROL_STATISTICS_RESET: {
93                 CHECK_CONTROL_DATA_SIZE(0);
94                 ZERO_STRUCT(ctdb->statistics);
95                 return 0;
96         }
97
98         case CTDB_CONTROL_GETVNNMAP:
99                 return ctdb_control_getvnnmap(ctdb, opcode, indata, outdata);
100
101         case CTDB_CONTROL_GET_DBMAP:
102                 return ctdb_control_getdbmap(ctdb, opcode, indata, outdata);
103
104         case CTDB_CONTROL_GET_NODEMAP:
105                 return ctdb_control_getnodemap(ctdb, opcode, indata, outdata);
106
107         case CTDB_CONTROL_SETVNNMAP:
108                 return ctdb_control_setvnnmap(ctdb, opcode, indata, outdata);
109
110         case CTDB_CONTROL_PULL_DB: 
111                 CHECK_CONTROL_DATA_SIZE(sizeof(struct ctdb_control_pulldb));
112                 return ctdb_control_pull_db(ctdb, indata, outdata);
113
114         case CTDB_CONTROL_SET_DMASTER: 
115                 CHECK_CONTROL_DATA_SIZE(sizeof(struct ctdb_control_set_dmaster));
116                 return ctdb_control_set_dmaster(ctdb, indata);
117
118         case CTDB_CONTROL_PUSH_DB:
                    /* no size check here; indata is passed to the handler as is */
119                 return ctdb_control_push_db(ctdb, indata);
120
121         case CTDB_CONTROL_GET_RECMODE: {
                    /* the mode value itself is the returned status */
122                 return ctdb->recovery_mode;
123         }
124
125         case CTDB_CONTROL_SET_RECMASTER: {
126                 CHECK_CONTROL_DATA_SIZE(sizeof(uint32_t));
                    /* refused unless the daemon is currently frozen */
127                 if (ctdb->freeze_mode != CTDB_FREEZE_FROZEN) {
128                         DEBUG(0,("Attempt to set recmaster when not frozen\n"));
129                         return -1;
130                 }
131                 ctdb->recovery_master = ((uint32_t *)(&indata.dptr[0]))[0];
132                 return 0;
133         }
134
135         case CTDB_CONTROL_GET_RECMASTER:
136                 return ctdb->recovery_master;
137
138         case CTDB_CONTROL_GET_PID:
139                 return getpid();
140
141         case CTDB_CONTROL_GET_VNN:
142                 return ctdb->vnn;
143
144         case CTDB_CONTROL_PING:
145                 CHECK_CONTROL_DATA_SIZE(0);
                    /* the status carries the current client count */
146                 return ctdb->statistics.num_clients;
147
148         case CTDB_CONTROL_GET_DBNAME: {
149                 uint32_t db_id;
150                 struct ctdb_db_context *ctdb_db;
151
152                 CHECK_CONTROL_DATA_SIZE(sizeof(db_id));
153                 db_id = *(uint32_t *)indata.dptr;
154                 ctdb_db = find_ctdb_db(ctdb, db_id);
155                 if (ctdb_db == NULL) return -1;
                    /* reply is the database's own name string, including
                       its terminating NUL */
156                 outdata->dptr = discard_const(ctdb_db->db_name);
157                 outdata->dsize = strlen(ctdb_db->db_name)+1;
158                 return 0;
159         }
160
161         case CTDB_CONTROL_GETDBPATH: {
162                 uint32_t db_id;
163                 struct ctdb_db_context *ctdb_db;
164
165                 CHECK_CONTROL_DATA_SIZE(sizeof(db_id));
166                 db_id = *(uint32_t *)indata.dptr;
167                 ctdb_db = find_ctdb_db(ctdb, db_id);
168                 if (ctdb_db == NULL) return -1;
                    /* reply is the database's own path string, including
                       its terminating NUL */
169                 outdata->dptr = discard_const(ctdb_db->db_path);
170                 outdata->dsize = strlen(ctdb_db->db_path)+1;
171                 return 0;
172         }
173
174         case CTDB_CONTROL_DB_ATTACH:
175                 return ctdb_control_db_attach(ctdb, indata, outdata);
176
177         case CTDB_CONTROL_SET_CALL: {
                    /* sc is only formed here; it is not dereferenced until
                       after the size check */
178                 struct ctdb_control_set_call *sc = 
179                         (struct ctdb_control_set_call *)indata.dptr;
180                 CHECK_CONTROL_DATA_SIZE(sizeof(struct ctdb_control_set_call));
181                 return ctdb_daemon_set_call(ctdb, sc->db_id, sc->fn, sc->id);
182         }
183
184         case CTDB_CONTROL_TRAVERSE_START:
185                 CHECK_CONTROL_DATA_SIZE(sizeof(struct ctdb_traverse_start));
186                 return ctdb_control_traverse_start(ctdb, indata, outdata, srcnode);
187
188         case CTDB_CONTROL_TRAVERSE_ALL:
189                 return ctdb_control_traverse_all(ctdb, indata, outdata);
190
191         case CTDB_CONTROL_TRAVERSE_DATA:
192                 return ctdb_control_traverse_data(ctdb, indata, outdata);
193
194         case CTDB_CONTROL_REGISTER_SRVID:
195                 return daemon_register_message_handler(ctdb, client_id, srvid);
196
197         case CTDB_CONTROL_DEREGISTER_SRVID:
198                 return daemon_deregister_message_handler(ctdb, client_id, srvid);
199
200         case CTDB_CONTROL_ENABLE_SEQNUM:
201                 CHECK_CONTROL_DATA_SIZE(sizeof(uint32_t));
202                 return ctdb_ltdb_enable_seqnum(ctdb, *(uint32_t *)indata.dptr);
203
204         case CTDB_CONTROL_UPDATE_SEQNUM:
205                 CHECK_CONTROL_DATA_SIZE(sizeof(uint32_t));              
206                 return ctdb_ltdb_update_seqnum(ctdb, *(uint32_t *)indata.dptr, srcnode);
207
208         case CTDB_CONTROL_FREEZE:
209                 CHECK_CONTROL_DATA_SIZE(0);
210                 return ctdb_control_freeze(ctdb, c, async_reply);
211
212         case CTDB_CONTROL_THAW:
213                 CHECK_CONTROL_DATA_SIZE(0);
214                 return ctdb_control_thaw(ctdb);
215
216         case CTDB_CONTROL_SET_RECMODE:
217                 CHECK_CONTROL_DATA_SIZE(sizeof(uint32_t));              
218                 return ctdb_control_set_recmode(ctdb, c, indata, async_reply, errormsg);
219
220         case CTDB_CONTROL_SET_MONMODE:
221                 CHECK_CONTROL_DATA_SIZE(sizeof(uint32_t));              
222                 ctdb->monitoring_mode = *(uint32_t *)indata.dptr;
223                 return 0;
224
225         case CTDB_CONTROL_GET_MONMODE: 
226                 return ctdb->monitoring_mode;
227
228         case CTDB_CONTROL_SHUTDOWN:
                    /* does not return: the process exits here, so this
                       function produces no status for the control */
229                 ctdb_release_all_ips(ctdb);
230                 ctdb->methods->shutdown(ctdb);
231                 ctdb_event_script(ctdb, "shutdown");
232                 DEBUG(0,("shutting down\n"));
233                 exit(0);
234
235         case CTDB_CONTROL_MAX_RSN: 
236                 CHECK_CONTROL_DATA_SIZE(sizeof(uint32_t));
237                 return ctdb_control_max_rsn(ctdb, indata, outdata);
238
239         case CTDB_CONTROL_SET_RSN_NONEMPTY: 
240                 CHECK_CONTROL_DATA_SIZE(sizeof(struct ctdb_control_set_rsn_nonempty));
241                 return ctdb_control_set_rsn_nonempty(ctdb, indata, outdata);
242
243         case CTDB_CONTROL_TAKEOVER_IP:
244                 CHECK_CONTROL_DATA_SIZE(sizeof(struct ctdb_public_ip));
245                 return ctdb_control_takeover_ip(ctdb, c, indata, async_reply);
246
247         case CTDB_CONTROL_RELEASE_IP:
248                 CHECK_CONTROL_DATA_SIZE(sizeof(struct ctdb_public_ip));
249                 return ctdb_control_release_ip(ctdb, c, indata, async_reply);
250
251         case CTDB_CONTROL_GET_PUBLIC_IPS:
252                 CHECK_CONTROL_DATA_SIZE(0);
253                 return ctdb_control_get_public_ips(ctdb, c, outdata);
254
255         case CTDB_CONTROL_DELETE_LOW_RSN: 
256                 CHECK_CONTROL_DATA_SIZE(sizeof(struct ctdb_control_delete_low_rsn));
257                 return ctdb_control_delete_low_rsn(ctdb, indata, outdata);
258
259         case CTDB_CONTROL_TCP_CLIENT: 
260                 CHECK_CONTROL_DATA_SIZE(sizeof(struct ctdb_control_tcp));
261                 return ctdb_control_tcp_client(ctdb, client_id, srcnode, indata);
262
263         case CTDB_CONTROL_STARTUP: 
264                 CHECK_CONTROL_DATA_SIZE(0);
265                 return ctdb_control_startup(ctdb, srcnode);
266
267         case CTDB_CONTROL_TCP_ADD: 
268                 CHECK_CONTROL_DATA_SIZE(sizeof(struct ctdb_control_tcp_vnn));
269                 return ctdb_control_tcp_add(ctdb, indata);
270
271         case CTDB_CONTROL_TCP_REMOVE: 
272                 CHECK_CONTROL_DATA_SIZE(sizeof(struct ctdb_control_tcp_vnn));
273                 return ctdb_control_tcp_remove(ctdb, indata);
274
275         case CTDB_CONTROL_SET_TUNABLE:
276                 return ctdb_control_set_tunable(ctdb, indata);
277
278         case CTDB_CONTROL_GET_TUNABLE:
279                 return ctdb_control_get_tunable(ctdb, indata, outdata);
280
281         case CTDB_CONTROL_LIST_TUNABLES:
282                 return ctdb_control_list_tunables(ctdb, outdata);
283
284         case CTDB_CONTROL_MODIFY_FLAGS:
285                 CHECK_CONTROL_DATA_SIZE(sizeof(struct ctdb_node_modflags));
286                 return ctdb_control_modflags(ctdb, indata);
287
288         default:
289                 DEBUG(0,(__location__ " Unknown CTDB control opcode %u\n", opcode));
290                 return -1;
291         }
292 }
293
294
295 /*
296   send a reply for a ctdb control
297  */
298 void ctdb_request_control_reply(struct ctdb_context *ctdb, struct ctdb_req_control *c,
299                                 TDB_DATA *outdata, int32_t status, const char *errormsg)
300 {
301         struct ctdb_reply_control *r;
302         size_t len;
303         
304         /* some controls send no reply */
305         if (c->flags & CTDB_CTRL_FLAG_NOREPLY) {
306                 return;
307         }
308
309         len = offsetof(struct ctdb_reply_control, data) + (outdata?outdata->dsize:0);
310         if (errormsg) {
311                 len += strlen(errormsg);
312         }
313         r = ctdb_transport_allocate(ctdb, ctdb, CTDB_REPLY_CONTROL, len, struct ctdb_reply_control);
314         CTDB_NO_MEMORY_VOID(ctdb, r);
315
316         r->hdr.destnode     = c->hdr.srcnode;
317         r->hdr.reqid        = c->hdr.reqid;
318         r->status           = status;
319         r->datalen          = outdata?outdata->dsize:0;
320         if (outdata && outdata->dsize) {
321                 memcpy(&r->data[0], outdata->dptr, outdata->dsize);
322         }
323         if (errormsg) {
324                 r->errorlen = strlen(errormsg);
325                 memcpy(&r->data[r->datalen], errormsg, r->errorlen);
326         }
327         
328         ctdb_queue_packet(ctdb, &r->hdr);       
329
330         talloc_free(r);
331 }
332
333 /*
334   called when a CTDB_REQ_CONTROL packet comes in
335 */
336 void ctdb_request_control(struct ctdb_context *ctdb, struct ctdb_req_header *hdr)
337 {
338         struct ctdb_req_control *c = (struct ctdb_req_control *)hdr;
339         TDB_DATA data, *outdata;
340         int32_t status;
341         bool async_reply = False;
342         const char *errormsg = NULL;
343
344         data.dptr = &c->data[0];
345         data.dsize = c->datalen;
346
347         outdata = talloc_zero(c, TDB_DATA);
348
349         status = ctdb_control_dispatch(ctdb, c, data, outdata, hdr->srcnode, 
350                                        &errormsg, &async_reply);
351
352         if (!async_reply) {
353                 ctdb_request_control_reply(ctdb, c, outdata, status, errormsg);
354         }
355 }
356
357 /*
358   called when a CTDB_REPLY_CONTROL packet comes in
359 */
360 void ctdb_reply_control(struct ctdb_context *ctdb, struct ctdb_req_header *hdr)
361 {
362         struct ctdb_reply_control *c = (struct ctdb_reply_control *)hdr;
363         TDB_DATA data;
364         struct ctdb_control_state *state;
365         const char *errormsg = NULL;
366
367         state = ctdb_reqid_find(ctdb, hdr->reqid, struct ctdb_control_state);
368         if (state == NULL) {
369                 DEBUG(0,("vnn %u Invalid reqid %u in ctdb_reply_control\n",
370                          ctdb->vnn, hdr->reqid));
371                 return;
372         }
373
374         if (hdr->reqid != state->reqid) {
375                 /* we found a record  but it was the wrong one */
376                 DEBUG(0, ("Dropped orphaned control reply with reqid:%u\n", hdr->reqid));
377                 return;
378         }
379
380         data.dptr = &c->data[0];
381         data.dsize = c->datalen;
382         if (c->errorlen) {
383                 errormsg = talloc_strndup(state, 
384                                           (char *)&c->data[c->datalen], c->errorlen);
385         }
386
387         /* make state a child of the packet, so it goes away when the packet
388            is freed. */
389         talloc_steal(hdr, state);
390
391         state->callback(ctdb, c->status, data, errormsg, state->private_data);
392 }
393
394 static int ctdb_control_destructor(struct ctdb_control_state *state)
395 {
396         ctdb_reqid_remove(state->ctdb, state->reqid);
397         return 0;
398 }
399
400 /*
401   handle a timeout of a control
402  */
403 static void ctdb_control_timeout(struct event_context *ev, struct timed_event *te, 
404                        struct timeval t, void *private_data)
405 {
406         struct ctdb_control_state *state = talloc_get_type(private_data, struct ctdb_control_state);
407         TALLOC_CTX *tmp_ctx = talloc_new(ev);
408
409         state->ctdb->statistics.timeouts.control++;
410
411         talloc_steal(tmp_ctx, state);
412
413         state->callback(state->ctdb, -1, tdb_null,
414                         "ctdb_control timed out", 
415                         state->private_data);
416         talloc_free(tmp_ctx);
417 }
418
419
420 /*
421   send a control message to a node
422  */
423 int ctdb_daemon_send_control(struct ctdb_context *ctdb, uint32_t destnode,
424                              uint64_t srvid, uint32_t opcode, uint32_t client_id,
425                              uint32_t flags,
426                              TDB_DATA data,
427                              ctdb_control_callback_fn_t callback,
428                              void *private_data)
429 {
430         struct ctdb_req_control *c;
431         struct ctdb_control_state *state;
432         size_t len;
433
434         if (((destnode == CTDB_BROADCAST_VNNMAP) || 
435              (destnode == CTDB_BROADCAST_ALL) ||
436              (destnode == CTDB_BROADCAST_CONNECTED)) && 
437             !(flags & CTDB_CTRL_FLAG_NOREPLY)) {
438                 DEBUG(0,("Attempt to broadcast control without NOREPLY\n"));
439                 return -1;
440         }
441
442         if (destnode != CTDB_BROADCAST_VNNMAP && 
443             destnode != CTDB_BROADCAST_ALL && 
444             destnode != CTDB_BROADCAST_CONNECTED && 
445             (!ctdb_validate_vnn(ctdb, destnode) || 
446              (ctdb->nodes[destnode]->flags & NODE_FLAGS_DISCONNECTED))) {
447                 if (!(flags & CTDB_CTRL_FLAG_NOREPLY)) {
448                         callback(ctdb, -1, tdb_null, "ctdb_control to disconnected node", private_data);
449                 }
450                 return 0;
451         }
452
453         /* the state is made a child of private_data if possible. This means any reply
454            will be discarded if the private_data goes away */
455         state = talloc(private_data?private_data:ctdb, struct ctdb_control_state);
456         CTDB_NO_MEMORY(ctdb, state);
457
458         state->reqid = ctdb_reqid_new(ctdb, state);
459         state->callback = callback;
460         state->private_data = private_data;
461         state->ctdb = ctdb;
462         state->flags = flags;
463
464         talloc_set_destructor(state, ctdb_control_destructor);
465
466         len = offsetof(struct ctdb_req_control, data) + data.dsize;
467         c = ctdb_transport_allocate(ctdb, state, CTDB_REQ_CONTROL, len, 
468                                     struct ctdb_req_control);
469         CTDB_NO_MEMORY(ctdb, c);
470         talloc_set_name_const(c, "ctdb_req_control packet");
471
472         c->hdr.destnode     = destnode;
473         c->hdr.reqid        = state->reqid;
474         c->opcode           = opcode;
475         c->client_id        = client_id;
476         c->flags            = flags;
477         c->srvid            = srvid;
478         c->datalen          = data.dsize;
479         if (data.dsize) {
480                 memcpy(&c->data[0], data.dptr, data.dsize);
481         }
482
483         ctdb_queue_packet(ctdb, &c->hdr);       
484
485         if (flags & CTDB_CTRL_FLAG_NOREPLY) {
486                 talloc_free(state);
487                 return 0;
488         }
489
490         if (ctdb->tunable.control_timeout) {
491                 event_add_timed(ctdb->ev, state, 
492                                 timeval_current_ofs(ctdb->tunable.control_timeout, 0), 
493                                 ctdb_control_timeout, state);
494         }
495
496         talloc_free(c);
497         return 0;
498 }