4 Copyright (C) Andrew Tridgell 2006
6 This program is free software; you can redistribute it and/or modify
7 it under the terms of the GNU General Public License as published by
8 the Free Software Foundation; either version 3 of the License, or
9 (at your option) any later version.
11 This program is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 GNU General Public License for more details.
16 You should have received a copy of the GNU General Public License
17 along with this program; if not, see <http://www.gnu.org/licenses/>.
22 #include "system/network.h"
23 #include "system/filesys.h"
24 #include "system/wait.h"
25 #include "system/shmem.h"
26 #include "../include/ctdb_private.h"
29 return error string for last error
31 const char *ctdb_errstr(struct ctdb_context *ctdb)
38 remember an error message
40 void ctdb_set_error(struct ctdb_context *ctdb, const char *fmt, ...)
43 talloc_free(ctdb->err_msg);
45 ctdb->err_msg = talloc_vasprintf(ctdb, fmt, ap);
46 DEBUG(DEBUG_ERR,("ctdb error: %s\n", ctdb->err_msg));
51 a fatal internal error occurred - no hope for recovery
53 void ctdb_fatal(struct ctdb_context *ctdb, const char *msg)
55 DEBUG(DEBUG_ALERT,("ctdb fatal error: %s\n", msg));
60 like ctdb_fatal() but a core/backtrace would not be useful
62 void ctdb_die(struct ctdb_context *ctdb, const char *msg)
64 DEBUG(DEBUG_ALERT,("ctdb exiting with error: %s\n", msg));
68 /* Invoke an external program to do some sort of tracing on the CTDB
69 * process. This might block for a little while. The external
70 * program is specified by the environment variable
71 * CTDB_EXTERNAL_TRACE. This program should take one argument: the
72 * pid of the process to trace. Commonly, the program would be a
73 * wrapper script around gcore.
75 void ctdb_external_trace(void)
78 const char * t = getenv("CTDB_EXTERNAL_TRACE");
85 cmd = talloc_asprintf(NULL, "%s %lu", t, (unsigned long) getpid());
86 DEBUG(DEBUG_WARNING,("begin external trace: %s\n", cmd));
88 DEBUG(DEBUG_WARNING,("end external trace: %s\n", cmd));
95 int ctdb_parse_address(struct ctdb_context *ctdb,
96 TALLOC_CTX *mem_ctx, const char *str,
97 struct ctdb_address *address)
102 se = getservbyname("ctdb", "tcp");
105 address->address = talloc_strdup(mem_ctx, str);
106 CTDB_NO_MEMORY(ctdb, address->address);
109 address->port = CTDB_PORT;
111 address->port = ntohs(se->s_port);
118 check if two addresses are the same
120 bool ctdb_same_address(struct ctdb_address *a1, struct ctdb_address *a2)
122 return strcmp(a1->address, a2->address) == 0 && a1->port == a2->port;
127 hash function for mapping data to a VNN - taken from tdb
129 uint32_t ctdb_hash(const TDB_DATA *key)
131 return tdb_jenkins_hash(discard_const(key));
135 a type checking variant of idr_find
137 static void *_idr_find_type(struct idr_context *idp, int id, const char *type, const char *location)
139 void *p = idr_find(idp, id);
140 if (p && talloc_check_name(p, type) == NULL) {
141 DEBUG(DEBUG_ERR,("%s idr_find_type expected type %s but got %s\n",
142 location, type, talloc_get_name(p)));
148 uint32_t ctdb_reqid_new(struct ctdb_context *ctdb, void *state)
150 int id = idr_get_new_above(ctdb->idr, state, ctdb->lastid+1, INT_MAX);
152 DEBUG(DEBUG_DEBUG, ("Reqid wrap!\n"));
153 id = idr_get_new(ctdb->idr, state, INT_MAX);
159 void *_ctdb_reqid_find(struct ctdb_context *ctdb, uint32_t reqid, const char *type, const char *location)
163 p = _idr_find_type(ctdb->idr, reqid, type, location);
165 DEBUG(DEBUG_WARNING, ("Could not find idr:%u\n",reqid));
172 void ctdb_reqid_remove(struct ctdb_context *ctdb, uint32_t reqid)
176 ret = idr_remove(ctdb->idr, reqid);
178 DEBUG(DEBUG_ERR, ("Removing idr that does not exist\n"));
184 form a ctdb_rec_data record from a key/data pair
186 note that header may be NULL. If not NULL then it is included in the data portion, placed immediately before the record data and counted in datalen
189 struct ctdb_rec_data *ctdb_marshall_record(TALLOC_CTX *mem_ctx, uint32_t reqid,
191 struct ctdb_ltdb_header *header,
195 struct ctdb_rec_data *d;
197 length = offsetof(struct ctdb_rec_data, data) + key.dsize +
198 data.dsize + (header?sizeof(*header):0);
199 d = (struct ctdb_rec_data *)talloc_size(mem_ctx, length);
205 d->keylen = key.dsize;
206 memcpy(&d->data[0], key.dptr, key.dsize);
208 d->datalen = data.dsize + sizeof(*header);
209 memcpy(&d->data[key.dsize], header, sizeof(*header));
210 memcpy(&d->data[key.dsize+sizeof(*header)], data.dptr, data.dsize);
212 d->datalen = data.dsize;
213 memcpy(&d->data[key.dsize], data.dptr, data.dsize);
219 /* helper function for marshalling multiple records */
220 struct ctdb_marshall_buffer *ctdb_marshall_add(TALLOC_CTX *mem_ctx,
221 struct ctdb_marshall_buffer *m,
225 struct ctdb_ltdb_header *header,
228 struct ctdb_rec_data *r;
229 size_t m_size, r_size;
230 struct ctdb_marshall_buffer *m2;
232 r = ctdb_marshall_record(mem_ctx, reqid, key, header, data);
239 m = talloc_zero_size(mem_ctx, offsetof(struct ctdb_marshall_buffer, data));
246 m_size = talloc_get_size(m);
247 r_size = talloc_get_size(r);
249 m2 = talloc_realloc_size(mem_ctx, m, m_size + r_size);
255 memcpy(m_size + (uint8_t *)m2, r, r_size);
264 /* we've finished marshalling, return a data blob with the marshalled records */
265 TDB_DATA ctdb_marshall_finish(struct ctdb_marshall_buffer *m)
268 data.dptr = (uint8_t *)m;
269 data.dsize = talloc_get_size(m);
274 loop over a marshalling buffer
276 - pass r==NULL to start
277 - loop the number of times indicated by m->count
279 struct ctdb_rec_data *ctdb_marshall_loop_next(struct ctdb_marshall_buffer *m, struct ctdb_rec_data *r,
281 struct ctdb_ltdb_header *header,
282 TDB_DATA *key, TDB_DATA *data)
285 r = (struct ctdb_rec_data *)&m->data[0];
287 r = (struct ctdb_rec_data *)(r->length + (uint8_t *)r);
295 key->dptr = &r->data[0];
296 key->dsize = r->keylen;
299 data->dptr = &r->data[r->keylen];
300 data->dsize = r->datalen;
301 if (header != NULL) {
302 data->dptr += sizeof(*header);
303 data->dsize -= sizeof(*header);
307 if (header != NULL) {
308 if (r->datalen < sizeof(*header)) {
311 *header = *(struct ctdb_ltdb_header *)&r->data[r->keylen];
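318 This is used to canonicalize a ctdb_sock_addr structure: an IPv4-mapped IPv6 address (::ffff:a.b.c.d) is rewritten as a plain AF_INET address with the same port; any other address is copied unchanged.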
320 void ctdb_canonicalize_ip(const ctdb_sock_addr *ip, ctdb_sock_addr *cip)
322 char prefix[12] = { 0,0,0,0,0,0,0,0,0,0,0xff,0xff };
324 memcpy(cip, ip, sizeof (*cip));
326 if ( (ip->sa.sa_family == AF_INET6)
327 && !memcmp(&ip->ip6.sin6_addr, prefix, 12)) {
328 memset(cip, 0, sizeof(*cip));
329 #ifdef HAVE_SOCK_SIN_LEN
330 cip->ip.sin_len = sizeof(*cip);
332 cip->ip.sin_family = AF_INET;
333 cip->ip.sin_port = ip->ip6.sin6_port;
334 memcpy(&cip->ip.sin_addr, &ip->ip6.sin6_addr.s6_addr[12], 4);
338 bool ctdb_same_ip(const ctdb_sock_addr *tip1, const ctdb_sock_addr *tip2)
340 ctdb_sock_addr ip1, ip2;
342 ctdb_canonicalize_ip(tip1, &ip1);
343 ctdb_canonicalize_ip(tip2, &ip2);
345 if (ip1.sa.sa_family != ip2.sa.sa_family) {
349 switch (ip1.sa.sa_family) {
351 return ip1.ip.sin_addr.s_addr == ip2.ip.sin_addr.s_addr;
353 return !memcmp(&ip1.ip6.sin6_addr.s6_addr[0],
354 &ip2.ip6.sin6_addr.s6_addr[0],
357 DEBUG(DEBUG_ERR, (__location__ " CRITICAL Can not compare sockaddr structures of type %u\n", ip1.sa.sa_family));
365 compare two ctdb_sock_addr structures; they match only if both the IP address and the port are equal
367 bool ctdb_same_sockaddr(const ctdb_sock_addr *ip1, const ctdb_sock_addr *ip2)
369 return ctdb_same_ip(ip1, ip2) && ip1->ip.sin_port == ip2->ip.sin_port;
372 char *ctdb_addr_to_str(ctdb_sock_addr *addr)
374 static char cip[128] = "";
376 switch (addr->sa.sa_family) {
378 inet_ntop(addr->ip.sin_family, &addr->ip.sin_addr, cip, sizeof(cip));
381 inet_ntop(addr->ip6.sin6_family, &addr->ip6.sin6_addr, cip, sizeof(cip));
384 DEBUG(DEBUG_ERR, (__location__ " ERROR, unknown family %u\n", addr->sa.sa_family));
385 ctdb_external_trace();
391 unsigned ctdb_addr_to_port(ctdb_sock_addr *addr)
393 switch (addr->sa.sa_family) {
395 return ntohs(addr->ip.sin_port);
398 return ntohs(addr->ip6.sin6_port);
401 DEBUG(DEBUG_ERR, (__location__ " ERROR, unknown family %u\n", addr->sa.sa_family));
407 /* we don't lock future pages here; it would increase the chance that
408 * we'd fail to mmap later on. */
409 void ctdb_lockdown_memory(bool valgrinding)
411 #if defined(HAVE_MLOCKALL) && !defined(_AIX_)
412 /* Extra stack, please! */
414 memset(dummy, 0, sizeof(dummy));
420 /* Ignore when running in local daemons mode */
425 /* Avoid compiler optimizing out dummy. */
426 mlock(dummy, sizeof(dummy));
427 if (mlockall(MCL_CURRENT) != 0) {
428 DEBUG(DEBUG_WARNING,("Failed to lockdown memory: %s'\n",
434 const char *ctdb_eventscript_call_names[] = {
451 /* Runstate handling */
453 enum ctdb_runstate runstate;
456 { CTDB_RUNSTATE_UNKNOWN, "UNKNOWN" },
457 { CTDB_RUNSTATE_INIT, "INIT" },
458 { CTDB_RUNSTATE_SETUP, "SETUP" },
459 { CTDB_RUNSTATE_FIRST_RECOVERY, "FIRST_RECOVERY" },
460 { CTDB_RUNSTATE_STARTUP, "STARTUP" },
461 { CTDB_RUNSTATE_RUNNING, "RUNNING" },
462 { CTDB_RUNSTATE_SHUTDOWN, "SHUTDOWN" },
466 const char *runstate_to_string(enum ctdb_runstate runstate)
469 for (i=0; runstate_map[i].label != NULL ; i++) {
470 if (runstate_map[i].runstate == runstate) {
471 return runstate_map[i].label;
475 return runstate_map[0].label;
478 enum ctdb_runstate runstate_from_string(const char *label)
481 for (i=0; runstate_map[i].label != NULL; i++) {
482 if (strcasecmp(runstate_map[i].label, label) == 0) {
483 return runstate_map[i].runstate;
487 return CTDB_RUNSTATE_UNKNOWN;
490 void ctdb_set_runstate(struct ctdb_context *ctdb, enum ctdb_runstate runstate)
492 if (runstate <= ctdb->runstate) {
493 ctdb_fatal(ctdb, "runstate must always increase");
496 DEBUG(DEBUG_NOTICE,("Set runstate to %s (%d)\n",
497 runstate_to_string(runstate), runstate));
498 ctdb->runstate = runstate;
501 void ctdb_mkdir_p_or_die(struct ctdb_context *ctdb, const char *dir, int mode)
505 ret = mkdir_p(dir, mode);
508 ("ctdb exiting with error: "
509 "failed to create directory \"%s\" (%s)\n",
510 dir, strerror(errno)));