s4-dsdb: Add documentation link for Tombstone Reanimation
[Samba.git] / ctdb / common / ctdb_util.c
blob137e0a8a095d2146fd383f45729b0770aa2afdc0
1 /*
2 ctdb utility code
4 Copyright (C) Andrew Tridgell 2006
6 This program is free software; you can redistribute it and/or modify
7 it under the terms of the GNU General Public License as published by
8 the Free Software Foundation; either version 3 of the License, or
9 (at your option) any later version.
11 This program is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 GNU General Public License for more details.
16 You should have received a copy of the GNU General Public License
17 along with this program; if not, see <http://www.gnu.org/licenses/>.
20 #include "includes.h"
21 #include "tdb.h"
22 #include "system/network.h"
23 #include "system/filesys.h"
24 #include "system/wait.h"
25 #include "../include/ctdb_private.h"
28 return error string for last error
30 const char *ctdb_errstr(struct ctdb_context *ctdb)
32 return ctdb->err_msg;
37 remember an error message
39 void ctdb_set_error(struct ctdb_context *ctdb, const char *fmt, ...)
41 va_list ap;
42 talloc_free(ctdb->err_msg);
43 va_start(ap, fmt);
44 ctdb->err_msg = talloc_vasprintf(ctdb, fmt, ap);
45 DEBUG(DEBUG_ERR,("ctdb error: %s\n", ctdb->err_msg));
46 va_end(ap);
50 a fatal internal error occurred - no hope for recovery
52 void ctdb_fatal(struct ctdb_context *ctdb, const char *msg)
54 DEBUG(DEBUG_ALERT,("ctdb fatal error: %s\n", msg));
55 abort();
59 like ctdb_fatal() but a core/backtrace would not be useful
61 void ctdb_die(struct ctdb_context *ctdb, const char *msg)
63 DEBUG(DEBUG_ALERT,("ctdb exiting with error: %s\n", msg));
64 exit(1);
67 /* Invoke an external program to do some sort of tracing on the CTDB
68 * process. This might block for a little while. The external
69 * program is specified by the environment variable
70 * CTDB_EXTERNAL_TRACE. This program should take one argument: the
71 * pid of the process to trace. Commonly, the program would be a
72 * wrapper script around gcore.
74 void ctdb_external_trace(void)
76 int ret;
77 const char * t = getenv("CTDB_EXTERNAL_TRACE");
78 char * cmd;
80 if (t == NULL) {
81 return;
84 cmd = talloc_asprintf(NULL, "%s %lu", t, (unsigned long) getpid());
85 DEBUG(DEBUG_WARNING,("begin external trace: %s\n", cmd));
86 ret = system(cmd);
87 if (ret == -1) {
88 DEBUG(DEBUG_ERR,
89 ("external trace command \"%s\" failed\n", cmd));
91 DEBUG(DEBUG_WARNING,("end external trace: %s\n", cmd));
92 talloc_free(cmd);
96 parse a IP:port pair
98 int ctdb_parse_address(struct ctdb_context *ctdb,
99 TALLOC_CTX *mem_ctx, const char *str,
100 struct ctdb_address *address)
102 struct servent *se;
103 ctdb_sock_addr addr;
105 setservent(0);
106 se = getservbyname("ctdb", "tcp");
107 endservent();
109 /* Parse IP address and re-convert to string. This ensure correct
110 * string form for IPv6 addresses.
112 if (! parse_ip(str, NULL, 0, &addr)) {
113 return -1;
116 address->address = talloc_strdup(mem_ctx, ctdb_addr_to_str(&addr));
117 CTDB_NO_MEMORY(ctdb, address->address);
119 if (se == NULL) {
120 address->port = CTDB_PORT;
121 } else {
122 address->port = ntohs(se->s_port);
124 return 0;
129 check if two addresses are the same
131 bool ctdb_same_address(struct ctdb_address *a1, struct ctdb_address *a2)
133 return strcmp(a1->address, a2->address) == 0 && a1->port == a2->port;
138 hash function for mapping data to a VNN - taken from tdb
140 uint32_t ctdb_hash(const TDB_DATA *key)
142 return tdb_jenkins_hash(discard_const(key));
146 a type checking varient of idr_find
148 static void *_idr_find_type(struct idr_context *idp, int id, const char *type, const char *location)
150 void *p = idr_find(idp, id);
151 if (p && talloc_check_name(p, type) == NULL) {
152 DEBUG(DEBUG_ERR,("%s idr_find_type expected type %s but got %s\n",
153 location, type, talloc_get_name(p)));
154 return NULL;
156 return p;
159 uint32_t ctdb_reqid_new(struct ctdb_context *ctdb, void *state)
161 int id = idr_get_new_above(ctdb->idr, state, ctdb->lastid+1, INT_MAX);
162 if (id < 0) {
163 DEBUG(DEBUG_DEBUG, ("Reqid wrap!\n"));
164 id = idr_get_new(ctdb->idr, state, INT_MAX);
166 ctdb->lastid = id;
167 return id;
170 void *_ctdb_reqid_find(struct ctdb_context *ctdb, uint32_t reqid, const char *type, const char *location)
172 void *p;
174 p = _idr_find_type(ctdb->idr, reqid, type, location);
175 if (p == NULL) {
176 DEBUG(DEBUG_WARNING, ("Could not find idr:%u\n",reqid));
179 return p;
183 void ctdb_reqid_remove(struct ctdb_context *ctdb, uint32_t reqid)
185 int ret;
187 ret = idr_remove(ctdb->idr, reqid);
188 if (ret != 0) {
189 DEBUG(DEBUG_ERR, ("Removing idr that does not exist\n"));
194 static uint32_t ctdb_marshall_record_size(TDB_DATA key,
195 struct ctdb_ltdb_header *header,
196 TDB_DATA data)
198 return offsetof(struct ctdb_rec_data, data) + key.dsize +
199 data.dsize + (header ? sizeof(*header) : 0);
202 static void ctdb_marshall_record_copy(struct ctdb_rec_data *rec,
203 uint32_t reqid,
204 TDB_DATA key,
205 struct ctdb_ltdb_header *header,
206 TDB_DATA data,
207 uint32_t length)
209 uint32_t offset;
211 rec->length = length;
212 rec->reqid = reqid;
213 rec->keylen = key.dsize;
214 memcpy(&rec->data[0], key.dptr, key.dsize);
215 offset = key.dsize;
217 if (header) {
218 rec->datalen = data.dsize + sizeof(*header);
219 memcpy(&rec->data[offset], header, sizeof(*header));
220 offset += sizeof(*header);
221 } else {
222 rec->datalen = data.dsize;
224 memcpy(&rec->data[offset], data.dptr, data.dsize);
228 form a ctdb_rec_data record from a key/data pair
230 note that header may be NULL. If not NULL then it is included in the data portion
231 of the record
233 struct ctdb_rec_data *ctdb_marshall_record(TALLOC_CTX *mem_ctx, uint32_t reqid,
234 TDB_DATA key,
235 struct ctdb_ltdb_header *header,
236 TDB_DATA data)
238 size_t length;
239 struct ctdb_rec_data *d;
241 length = ctdb_marshall_record_size(key, header, data);
243 d = (struct ctdb_rec_data *)talloc_size(mem_ctx, length);
244 if (d == NULL) {
245 return NULL;
248 ctdb_marshall_record_copy(d, reqid, key, header, data, length);
249 return d;
253 /* helper function for marshalling multiple records */
254 struct ctdb_marshall_buffer *ctdb_marshall_add(TALLOC_CTX *mem_ctx,
255 struct ctdb_marshall_buffer *m,
256 uint64_t db_id,
257 uint32_t reqid,
258 TDB_DATA key,
259 struct ctdb_ltdb_header *header,
260 TDB_DATA data)
262 struct ctdb_rec_data *r;
263 struct ctdb_marshall_buffer *m2;
264 uint32_t length, offset;
266 length = ctdb_marshall_record_size(key, header, data);
268 if (m == NULL) {
269 offset = offsetof(struct ctdb_marshall_buffer, data);
270 m2 = talloc_zero_size(mem_ctx, offset + length);
271 } else {
272 offset = talloc_get_size(m);
273 m2 = talloc_realloc_size(mem_ctx, m, offset + length);
275 if (m2 == NULL) {
276 TALLOC_FREE(m);
277 return NULL;
280 if (m == NULL) {
281 m2->db_id = db_id;
284 r = (struct ctdb_rec_data *)((uint8_t *)m2 + offset);
285 ctdb_marshall_record_copy(r, reqid, key, header, data, length);
286 m2->count++;
288 return m2;
291 /* we've finished marshalling, return a data blob with the marshalled records */
292 TDB_DATA ctdb_marshall_finish(struct ctdb_marshall_buffer *m)
294 TDB_DATA data;
295 data.dptr = (uint8_t *)m;
296 data.dsize = talloc_get_size(m);
297 return data;
301 loop over a marshalling buffer
303 - pass r==NULL to start
304 - loop the number of times indicated by m->count
306 struct ctdb_rec_data *ctdb_marshall_loop_next(struct ctdb_marshall_buffer *m, struct ctdb_rec_data *r,
307 uint32_t *reqid,
308 struct ctdb_ltdb_header *header,
309 TDB_DATA *key, TDB_DATA *data)
311 if (r == NULL) {
312 r = (struct ctdb_rec_data *)&m->data[0];
313 } else {
314 r = (struct ctdb_rec_data *)(r->length + (uint8_t *)r);
317 if (reqid != NULL) {
318 *reqid = r->reqid;
321 if (key != NULL) {
322 key->dptr = &r->data[0];
323 key->dsize = r->keylen;
325 if (data != NULL) {
326 data->dptr = &r->data[r->keylen];
327 data->dsize = r->datalen;
328 if (header != NULL) {
329 data->dptr += sizeof(*header);
330 data->dsize -= sizeof(*header);
334 if (header != NULL) {
335 if (r->datalen < sizeof(*header)) {
336 return NULL;
338 memcpy(header, &r->data[r->keylen], sizeof(*header));
341 return r;
345 This is used to canonicalize a ctdb_sock_addr structure.
347 void ctdb_canonicalize_ip(const ctdb_sock_addr *ip, ctdb_sock_addr *cip)
349 char prefix[12] = { 0,0,0,0,0,0,0,0,0,0,0xff,0xff };
351 memcpy(cip, ip, sizeof (*cip));
353 if ( (ip->sa.sa_family == AF_INET6)
354 && !memcmp(&ip->ip6.sin6_addr, prefix, 12)) {
355 memset(cip, 0, sizeof(*cip));
356 #ifdef HAVE_SOCK_SIN_LEN
357 cip->ip.sin_len = sizeof(*cip);
358 #endif
359 cip->ip.sin_family = AF_INET;
360 cip->ip.sin_port = ip->ip6.sin6_port;
361 memcpy(&cip->ip.sin_addr, &ip->ip6.sin6_addr.s6_addr[12], 4);
365 bool ctdb_same_ip(const ctdb_sock_addr *tip1, const ctdb_sock_addr *tip2)
367 ctdb_sock_addr ip1, ip2;
369 ctdb_canonicalize_ip(tip1, &ip1);
370 ctdb_canonicalize_ip(tip2, &ip2);
372 if (ip1.sa.sa_family != ip2.sa.sa_family) {
373 return false;
376 switch (ip1.sa.sa_family) {
377 case AF_INET:
378 return ip1.ip.sin_addr.s_addr == ip2.ip.sin_addr.s_addr;
379 case AF_INET6:
380 return !memcmp(&ip1.ip6.sin6_addr.s6_addr[0],
381 &ip2.ip6.sin6_addr.s6_addr[0],
382 16);
383 default:
384 DEBUG(DEBUG_ERR, (__location__ " CRITICAL Can not compare sockaddr structures of type %u\n", ip1.sa.sa_family));
385 return false;
388 return true;
392 compare two ctdb_sock_addr structures
394 bool ctdb_same_sockaddr(const ctdb_sock_addr *ip1, const ctdb_sock_addr *ip2)
396 return ctdb_same_ip(ip1, ip2) && ip1->ip.sin_port == ip2->ip.sin_port;
399 char *ctdb_addr_to_str(ctdb_sock_addr *addr)
401 static char cip[128] = "";
403 switch (addr->sa.sa_family) {
404 case AF_INET:
405 inet_ntop(addr->ip.sin_family, &addr->ip.sin_addr, cip, sizeof(cip));
406 break;
407 case AF_INET6:
408 inet_ntop(addr->ip6.sin6_family, &addr->ip6.sin6_addr, cip, sizeof(cip));
409 break;
410 default:
411 DEBUG(DEBUG_ERR, (__location__ " ERROR, unknown family %u\n", addr->sa.sa_family));
412 ctdb_external_trace();
415 return cip;
418 unsigned ctdb_addr_to_port(ctdb_sock_addr *addr)
420 switch (addr->sa.sa_family) {
421 case AF_INET:
422 return ntohs(addr->ip.sin_port);
423 break;
424 case AF_INET6:
425 return ntohs(addr->ip6.sin6_port);
426 break;
427 default:
428 DEBUG(DEBUG_ERR, (__location__ " ERROR, unknown family %u\n", addr->sa.sa_family));
431 return 0;
435 const char *ctdb_eventscript_call_names[] = {
436 "init",
437 "setup",
438 "startup",
439 "startrecovery",
440 "recovered",
441 "takeip",
442 "releaseip",
443 "stopped",
444 "monitor",
445 "status",
446 "shutdown",
447 "reload",
448 "updateip",
449 "ipreallocated"
452 /* Runstate handling */
453 static struct {
454 enum ctdb_runstate runstate;
455 const char * label;
456 } runstate_map[] = {
457 { CTDB_RUNSTATE_UNKNOWN, "UNKNOWN" },
458 { CTDB_RUNSTATE_INIT, "INIT" },
459 { CTDB_RUNSTATE_SETUP, "SETUP" },
460 { CTDB_RUNSTATE_FIRST_RECOVERY, "FIRST_RECOVERY" },
461 { CTDB_RUNSTATE_STARTUP, "STARTUP" },
462 { CTDB_RUNSTATE_RUNNING, "RUNNING" },
463 { CTDB_RUNSTATE_SHUTDOWN, "SHUTDOWN" },
464 { -1, NULL },
467 const char *runstate_to_string(enum ctdb_runstate runstate)
469 int i;
470 for (i=0; runstate_map[i].label != NULL ; i++) {
471 if (runstate_map[i].runstate == runstate) {
472 return runstate_map[i].label;
476 return runstate_map[0].label;
479 enum ctdb_runstate runstate_from_string(const char *label)
481 int i;
482 for (i=0; runstate_map[i].label != NULL; i++) {
483 if (strcasecmp(runstate_map[i].label, label) == 0) {
484 return runstate_map[i].runstate;
488 return CTDB_RUNSTATE_UNKNOWN;
491 void ctdb_set_runstate(struct ctdb_context *ctdb, enum ctdb_runstate runstate)
493 if (runstate <= ctdb->runstate) {
494 ctdb_fatal(ctdb, "runstate must always increase");
497 DEBUG(DEBUG_NOTICE,("Set runstate to %s (%d)\n",
498 runstate_to_string(runstate), runstate));
499 ctdb->runstate = runstate;
502 /* Convert arbitrary data to 4-byte boundary padded uint32 array */
503 uint32_t *ctdb_key_to_idkey(TALLOC_CTX *mem_ctx, TDB_DATA key)
505 uint32_t idkey_size, *k;
507 idkey_size = 1 + (key.dsize + sizeof(uint32_t)-1) / sizeof(uint32_t);
509 k = talloc_zero_array(mem_ctx, uint32_t, idkey_size);
510 if (k == NULL) {
511 return NULL;
514 k[0] = idkey_size;
515 memcpy(&k[1], key.dptr, key.dsize);
517 return k;