4 Copyright (C) Andrew Tridgell 2006
6 This program is free software; you can redistribute it and/or modify
7 it under the terms of the GNU General Public License as published by
8 the Free Software Foundation; either version 3 of the License, or
9 (at your option) any later version.
11 This program is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 GNU General Public License for more details.
16 You should have received a copy of the GNU General Public License
17 along with this program; if not, see <http://www.gnu.org/licenses/>.
21 #include "system/network.h"
22 #include "system/filesys.h"
23 #include "system/wait.h"
27 #include "lib/util/debug.h"
28 #include "lib/util/samba_util.h"
30 #include "ctdb_private.h"
32 #include "protocol/protocol_util.h"
34 #include "common/reqid.h"
35 #include "common/system.h"
36 #include "common/common.h"
37 #include "common/logging.h"
40 return error string for last error
42 const char *ctdb_errstr(struct ctdb_context
*ctdb
)
49 remember an error message
51 void ctdb_set_error(struct ctdb_context
*ctdb
, const char *fmt
, ...)
54 talloc_free(ctdb
->err_msg
);
56 ctdb
->err_msg
= talloc_vasprintf(ctdb
, fmt
, ap
);
57 DEBUG(DEBUG_ERR
,("ctdb error: %s\n", ctdb
->err_msg
));
62 a fatal internal error occurred - no hope for recovery
64 void ctdb_fatal(struct ctdb_context
*ctdb
, const char *msg
)
66 DEBUG(DEBUG_ALERT
,("ctdb fatal error: %s\n", msg
));
71 like ctdb_fatal() but a core/backtrace would not be useful
73 void ctdb_die(struct ctdb_context
*ctdb
, const char *msg
)
75 DEBUG(DEBUG_ALERT
,("ctdb exiting with error: %s\n", msg
));
79 /* Set the path of a helper program from envvar, falling back to
80 * dir/file if envvar unset. type is a string to print in log
81 * messages. helper is assumed to point to a statically allocated
82 * array of size bytes, initialised to "". If file is NULL don't fall
83 * back if envvar is unset. If dir is NULL and envvar is unset (but
84 * file is not NULL) then this is an error. Returns true if helper is
85 * set, either previously or this time. */
86 bool ctdb_set_helper(const char *type
, char *helper
, size_t size
,
88 const char *dir
, const char *file
)
93 if (helper
[0] != '\0') {
100 if (strlen(t
) >= size
) {
102 ("Unable to set %s - path too long\n", type
));
106 strncpy(helper
, t
, size
);
107 } else if (file
== NULL
) {
109 } else if (dir
== NULL
) {
111 ("Unable to set %s - dir is NULL\n", type
));
116 ret
= snprintf(helper
, size
, "%s/%s", dir
, file
);
117 if (ret
< 0 || (size_t)ret
>= size
) {
119 ("Unable to set %s - path too long\n", type
));
124 if (stat(helper
, &st
) != 0) {
126 ("Unable to set %s \"%s\" - %s\n",
127 type
, helper
, strerror(errno
)));
130 if (!(st
.st_mode
& S_IXUSR
)) {
132 ("Unable to set %s \"%s\" - not executable\n",
138 ("Set %s to \"%s\"\n", type
, helper
));
145 int ctdb_parse_address(TALLOC_CTX
*mem_ctx
, const char *str
,
146 ctdb_sock_addr
*address
)
153 se
= getservbyname("ctdb", "tcp");
159 port
= ntohs(se
->s_port
);
162 ret
= ctdb_sock_addr_from_string(str
, address
, false);
166 ctdb_sock_addr_set_port(address
, port
);
173 check if two addresses are the same
175 bool ctdb_same_address(ctdb_sock_addr
*a1
, ctdb_sock_addr
*a2
)
177 return ctdb_same_ip(a1
, a2
) &&
178 ctdb_addr_to_port(a1
) == ctdb_addr_to_port(a2
);
183 hash function for mapping data to a VNN - taken from tdb
185 uint32_t ctdb_hash(const TDB_DATA
*key
)
187 return tdb_jenkins_hash(discard_const(key
));
191 static uint32_t ctdb_marshall_record_size(TDB_DATA key
,
192 struct ctdb_ltdb_header
*header
,
195 return offsetof(struct ctdb_rec_data_old
, data
) + key
.dsize
+
196 data
.dsize
+ (header
? sizeof(*header
) : 0);
199 static void ctdb_marshall_record_copy(struct ctdb_rec_data_old
*rec
,
202 struct ctdb_ltdb_header
*header
,
208 rec
->length
= length
;
210 rec
->keylen
= key
.dsize
;
211 memcpy(&rec
->data
[0], key
.dptr
, key
.dsize
);
215 rec
->datalen
= data
.dsize
+ sizeof(*header
);
216 memcpy(&rec
->data
[offset
], header
, sizeof(*header
));
217 offset
+= sizeof(*header
);
219 rec
->datalen
= data
.dsize
;
221 memcpy(&rec
->data
[offset
], data
.dptr
, data
.dsize
);
225 form a ctdb_rec_data record from a key/data pair
227 note that header may be NULL. If not NULL then it is included in the data portion
230 struct ctdb_rec_data_old
*ctdb_marshall_record(TALLOC_CTX
*mem_ctx
,
233 struct ctdb_ltdb_header
*header
,
237 struct ctdb_rec_data_old
*d
;
239 length
= ctdb_marshall_record_size(key
, header
, data
);
241 d
= (struct ctdb_rec_data_old
*)talloc_size(mem_ctx
, length
);
246 ctdb_marshall_record_copy(d
, reqid
, key
, header
, data
, length
);
251 /* helper function for marshalling multiple records */
252 struct ctdb_marshall_buffer
*ctdb_marshall_add(TALLOC_CTX
*mem_ctx
,
253 struct ctdb_marshall_buffer
*m
,
257 struct ctdb_ltdb_header
*header
,
260 struct ctdb_rec_data_old
*r
;
261 struct ctdb_marshall_buffer
*m2
;
262 uint32_t length
, offset
;
264 length
= ctdb_marshall_record_size(key
, header
, data
);
267 offset
= offsetof(struct ctdb_marshall_buffer
, data
);
268 m2
= talloc_zero_size(mem_ctx
, offset
+ length
);
270 offset
= talloc_get_size(m
);
271 m2
= talloc_realloc_size(mem_ctx
, m
, offset
+ length
);
282 r
= (struct ctdb_rec_data_old
*)((uint8_t *)m2
+ offset
);
283 ctdb_marshall_record_copy(r
, reqid
, key
, header
, data
, length
);
289 /* we've finished marshalling, return a data blob with the marshalled records */
290 TDB_DATA
ctdb_marshall_finish(struct ctdb_marshall_buffer
*m
)
293 data
.dptr
= (uint8_t *)m
;
294 data
.dsize
= talloc_get_size(m
);
299 loop over a marshalling buffer
301 - pass r==NULL to start
302 - loop the number of times indicated by m->count
304 struct ctdb_rec_data_old
*ctdb_marshall_loop_next(
305 struct ctdb_marshall_buffer
*m
,
306 struct ctdb_rec_data_old
*r
,
308 struct ctdb_ltdb_header
*header
,
309 TDB_DATA
*key
, TDB_DATA
*data
)
312 r
= (struct ctdb_rec_data_old
*)&m
->data
[0];
314 r
= (struct ctdb_rec_data_old
*)(r
->length
+ (uint8_t *)r
);
322 key
->dptr
= &r
->data
[0];
323 key
->dsize
= r
->keylen
;
326 data
->dptr
= &r
->data
[r
->keylen
];
327 data
->dsize
= r
->datalen
;
328 if (header
!= NULL
) {
329 data
->dptr
+= sizeof(*header
);
330 data
->dsize
-= sizeof(*header
);
334 if (header
!= NULL
) {
335 if (r
->datalen
< sizeof(*header
)) {
338 memcpy(header
, &r
->data
[r
->keylen
], sizeof(*header
));
345 This is used to canonicalize a ctdb_sock_addr structure.
347 void ctdb_canonicalize_ip(const ctdb_sock_addr
*ip
, ctdb_sock_addr
*cip
)
351 if (ip
->sa
.sa_family
== AF_INET6
) {
352 const char prefix
[12] = { 0,0,0,0,0,0,0,0,0,0,0xff,0xff };
353 if (memcmp(&ip
->ip6
.sin6_addr
, prefix
, sizeof(prefix
)) == 0) {
354 /* Copy IPv4-mapped IPv6 addresses as IPv4 */
355 cip
->ip
.sin_family
= AF_INET
;
356 #ifdef HAVE_SOCK_SIN_LEN
357 cip
->ip
.sin_len
= sizeof(ctdb_sock_addr
);
359 cip
->ip
.sin_port
= ip
->ip6
.sin6_port
;
360 memcpy(&cip
->ip
.sin_addr
,
361 &ip
->ip6
.sin6_addr
.s6_addr
[12],
362 sizeof(cip
->ip
.sin_addr
));
364 cip
->ip6
.sin6_family
= AF_INET6
;
365 #ifdef HAVE_SOCK_SIN6_LEN
366 cip
->ip6
.sin6_len
= sizeof(ctdb_sock_addr
);
368 cip
->ip6
.sin6_port
= ip
->ip6
.sin6_port
;
369 memcpy(&cip
->ip6
.sin6_addr
,
371 sizeof(cip
->ip6
.sin6_addr
));
377 if (ip
->sa
.sa_family
== AF_INET
) {
378 cip
->ip
.sin_family
= AF_INET
;
379 #ifdef HAVE_SOCK_SIN_LEN
380 cip
->ip
.sin_len
= sizeof(ctdb_sock_addr
);
382 cip
->ip
.sin_port
= ip
->ip
.sin_port
;
383 memcpy(&cip
->ip
.sin_addr
,
385 sizeof(ip
->ip
.sin_addr
));
391 bool ctdb_same_ip(const ctdb_sock_addr
*tip1
, const ctdb_sock_addr
*tip2
)
393 ctdb_sock_addr ip1
, ip2
;
395 ctdb_canonicalize_ip(tip1
, &ip1
);
396 ctdb_canonicalize_ip(tip2
, &ip2
);
398 if (ip1
.sa
.sa_family
!= ip2
.sa
.sa_family
) {
402 switch (ip1
.sa
.sa_family
) {
404 return ip1
.ip
.sin_addr
.s_addr
== ip2
.ip
.sin_addr
.s_addr
;
406 return !memcmp(&ip1
.ip6
.sin6_addr
.s6_addr
[0],
407 &ip2
.ip6
.sin6_addr
.s6_addr
[0],
410 DEBUG(DEBUG_ERR
, (__location__
" CRITICAL Can not compare sockaddr structures of type %u\n", ip1
.sa
.sa_family
));
418 compare two ctdb_sock_addr structures
420 bool ctdb_same_sockaddr(const ctdb_sock_addr
*ip1
, const ctdb_sock_addr
*ip2
)
422 return ctdb_same_ip(ip1
, ip2
) && ip1
->ip
.sin_port
== ip2
->ip
.sin_port
;
425 char *ctdb_addr_to_str(ctdb_sock_addr
*addr
)
427 static char cip
[128] = "";
429 switch (addr
->sa
.sa_family
) {
431 inet_ntop(addr
->ip
.sin_family
, &addr
->ip
.sin_addr
, cip
, sizeof(cip
));
434 inet_ntop(addr
->ip6
.sin6_family
, &addr
->ip6
.sin6_addr
, cip
, sizeof(cip
));
437 DEBUG(DEBUG_ERR
, (__location__
" ERROR, unknown family %u\n", addr
->sa
.sa_family
));
443 unsigned ctdb_addr_to_port(ctdb_sock_addr
*addr
)
445 switch (addr
->sa
.sa_family
) {
447 return ntohs(addr
->ip
.sin_port
);
450 return ntohs(addr
->ip6
.sin6_port
);
453 DEBUG(DEBUG_ERR
, (__location__
" ERROR, unknown family %u\n", addr
->sa
.sa_family
));
459 /* Add a node to a node map with given address and flags */
460 static bool node_map_add(TALLOC_CTX
*mem_ctx
,
461 const char *nstr
, uint32_t flags
,
462 struct ctdb_node_map_old
**node_map
)
467 struct ctdb_node_and_flags
*n
;
469 /* Might as well do this before trying to allocate memory */
470 if (ctdb_parse_address(mem_ctx
, nstr
, &addr
) == -1) {
474 num
= (*node_map
)->num
+ 1;
475 s
= offsetof(struct ctdb_node_map_old
, nodes
) +
476 num
* sizeof(struct ctdb_node_and_flags
);
477 *node_map
= talloc_realloc_size(mem_ctx
, *node_map
, s
);
478 if (*node_map
== NULL
) {
479 DEBUG(DEBUG_ERR
, (__location__
" Out of memory\n"));
483 n
= &(*node_map
)->nodes
[(*node_map
)->num
];
485 n
->pnn
= (*node_map
)->num
;
493 /* Read a nodes file into a node map */
494 struct ctdb_node_map_old
*ctdb_read_nodes_file(TALLOC_CTX
*mem_ctx
,
500 struct ctdb_node_map_old
*ret
;
502 /* Allocate node map header */
503 ret
= talloc_zero_size(mem_ctx
, offsetof(struct ctdb_node_map_old
, nodes
));
505 DEBUG(DEBUG_ERR
, (__location__
" Out of memory\n"));
509 lines
= file_lines_load(nlist
, &nlines
, 0, mem_ctx
);
511 DEBUG(DEBUG_ERR
, ("Failed to read nodes file \"%s\"\n", nlist
));
514 while (nlines
> 0 && strcmp(lines
[nlines
-1], "") == 0) {
518 for (i
=0; i
< nlines
; i
++) {
524 /* strip leading spaces */
525 while((*node
== ' ') || (*node
== '\t')) {
532 ((node
[len
-1] == ' ') || (node
[len
-1] == '\t')))
542 /* A "deleted" node is a node that is
543 commented out in the nodes file. This is
544 used instead of removing a line, which
545 would cause subsequent nodes to change
547 flags
= NODE_FLAGS_DELETED
;
548 node
= discard_const("0.0.0.0");
552 if (!node_map_add(mem_ctx
, node
, flags
, &ret
)) {
563 struct ctdb_node_map_old
*
564 ctdb_node_list_to_map(struct ctdb_node
**nodes
, uint32_t num_nodes
,
569 struct ctdb_node_map_old
*node_map
;
571 size
= offsetof(struct ctdb_node_map_old
, nodes
) +
572 num_nodes
* sizeof(struct ctdb_node_and_flags
);
573 node_map
= (struct ctdb_node_map_old
*)talloc_zero_size(mem_ctx
, size
);
574 if (node_map
== NULL
) {
576 (__location__
" Failed to allocate nodemap array\n"));
580 node_map
->num
= num_nodes
;
581 for (i
=0; i
<num_nodes
; i
++) {
582 node_map
->nodes
[i
].addr
= nodes
[i
]->address
;
583 node_map
->nodes
[i
].pnn
= nodes
[i
]->pnn
;
584 node_map
->nodes
[i
].flags
= nodes
[i
]->flags
;
590 const char *ctdb_eventscript_call_names
[] = {
607 /* Runstate handling */
609 enum ctdb_runstate runstate
;
612 { CTDB_RUNSTATE_UNKNOWN
, "UNKNOWN" },
613 { CTDB_RUNSTATE_INIT
, "INIT" },
614 { CTDB_RUNSTATE_SETUP
, "SETUP" },
615 { CTDB_RUNSTATE_FIRST_RECOVERY
, "FIRST_RECOVERY" },
616 { CTDB_RUNSTATE_STARTUP
, "STARTUP" },
617 { CTDB_RUNSTATE_RUNNING
, "RUNNING" },
618 { CTDB_RUNSTATE_SHUTDOWN
, "SHUTDOWN" },
622 const char *runstate_to_string(enum ctdb_runstate runstate
)
625 for (i
=0; runstate_map
[i
].label
!= NULL
; i
++) {
626 if (runstate_map
[i
].runstate
== runstate
) {
627 return runstate_map
[i
].label
;
631 return runstate_map
[0].label
;
634 enum ctdb_runstate
runstate_from_string(const char *label
)
637 for (i
=0; runstate_map
[i
].label
!= NULL
; i
++) {
638 if (strcasecmp(runstate_map
[i
].label
, label
) == 0) {
639 return runstate_map
[i
].runstate
;
643 return CTDB_RUNSTATE_UNKNOWN
;
646 void ctdb_set_runstate(struct ctdb_context
*ctdb
, enum ctdb_runstate runstate
)
648 DEBUG(DEBUG_NOTICE
,("Set runstate to %s (%d)\n",
649 runstate_to_string(runstate
), runstate
));
651 if (runstate
<= ctdb
->runstate
) {
652 ctdb_fatal(ctdb
, "runstate must always increase");
655 ctdb
->runstate
= runstate
;
658 /* Convert arbitrary data to 4-byte boundary padded uint32 array */
659 uint32_t *ctdb_key_to_idkey(TALLOC_CTX
*mem_ctx
, TDB_DATA key
)
661 uint32_t idkey_size
, *k
;
663 idkey_size
= 1 + (key
.dsize
+ sizeof(uint32_t)-1) / sizeof(uint32_t);
665 k
= talloc_zero_array(mem_ctx
, uint32_t, idkey_size
);
671 memcpy(&k
[1], key
.dptr
, key
.dsize
);