4 Copyright (C) Andrew Tridgell 2006
6 This program is free software; you can redistribute it and/or modify
7 it under the terms of the GNU General Public License as published by
8 the Free Software Foundation; either version 3 of the License, or
9 (at your option) any later version.
11 This program is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 GNU General Public License for more details.
16 You should have received a copy of the GNU General Public License
17 along with this program; if not, see <http://www.gnu.org/licenses/>.
21 #include "system/network.h"
22 #include "system/filesys.h"
23 #include "system/wait.h"
27 #include "lib/util/debug.h"
28 #include "lib/util/samba_util.h"
30 #include "ctdb_private.h"
32 #include "protocol/protocol_util.h"
34 #include "common/reqid.h"
35 #include "common/system.h"
36 #include "common/common.h"
37 #include "common/logging.h"
40 return error string for last error
42 const char *ctdb_errstr(struct ctdb_context
*ctdb
)
49 remember an error message
51 void ctdb_set_error(struct ctdb_context
*ctdb
, const char *fmt
, ...)
54 talloc_free(ctdb
->err_msg
);
56 ctdb
->err_msg
= talloc_vasprintf(ctdb
, fmt
, ap
);
57 DEBUG(DEBUG_ERR
,("ctdb error: %s\n", ctdb
->err_msg
));
62 a fatal internal error occurred - no hope for recovery
64 void ctdb_fatal(struct ctdb_context
*ctdb
, const char *msg
)
66 DEBUG(DEBUG_ALERT
,("ctdb fatal error: %s\n", msg
));
71 like ctdb_fatal() but a core/backtrace would not be useful
73 void ctdb_die(struct ctdb_context
*ctdb
, const char *msg
)
75 DEBUG(DEBUG_ALERT
,("ctdb exiting with error: %s\n", msg
));
79 /* Set the path of a helper program from envvar, falling back to
80 * dir/file if envvar unset. type is a string to print in log
81 * messages. helper is assumed to point to a statically allocated
82 * array of size bytes, initialised to "". If file is NULL don't fall
83 * back if envvar is unset. If dir is NULL and envvar is unset (but
84 * file is not NULL) then this is an error. Returns true if helper is
85 * set, either previously or this time. */
86 bool ctdb_set_helper(const char *type
, char *helper
, size_t size
,
88 const char *dir
, const char *file
)
93 if (helper
[0] != '\0') {
100 if (strlen(t
) >= size
) {
102 ("Unable to set %s - path too long\n", type
));
106 strncpy(helper
, t
, size
);
107 } else if (file
== NULL
) {
109 } else if (dir
== NULL
) {
111 ("Unable to set %s - dir is NULL\n", type
));
114 if (snprintf(helper
, size
, "%s/%s", dir
, file
) >= size
) {
116 ("Unable to set %s - path too long\n", type
));
121 if (stat(helper
, &st
) != 0) {
123 ("Unable to set %s \"%s\" - %s\n",
124 type
, helper
, strerror(errno
)));
127 if (!(st
.st_mode
& S_IXUSR
)) {
129 ("Unable to set %s \"%s\" - not executable\n",
135 ("Set %s to \"%s\"\n", type
, helper
));
142 int ctdb_parse_address(TALLOC_CTX
*mem_ctx
, const char *str
,
143 ctdb_sock_addr
*address
)
150 se
= getservbyname("ctdb", "tcp");
156 port
= ntohs(se
->s_port
);
159 ret
= ctdb_sock_addr_from_string(str
, address
, false);
163 ctdb_sock_addr_set_port(address
, port
);
170 check if two addresses are the same
172 bool ctdb_same_address(ctdb_sock_addr
*a1
, ctdb_sock_addr
*a2
)
174 return ctdb_same_ip(a1
, a2
) &&
175 ctdb_addr_to_port(a1
) == ctdb_addr_to_port(a2
);
180 hash function for mapping data to a VNN - taken from tdb
182 uint32_t ctdb_hash(const TDB_DATA
*key
)
184 return tdb_jenkins_hash(discard_const(key
));
188 static uint32_t ctdb_marshall_record_size(TDB_DATA key
,
189 struct ctdb_ltdb_header
*header
,
192 return offsetof(struct ctdb_rec_data_old
, data
) + key
.dsize
+
193 data
.dsize
+ (header
? sizeof(*header
) : 0);
196 static void ctdb_marshall_record_copy(struct ctdb_rec_data_old
*rec
,
199 struct ctdb_ltdb_header
*header
,
205 rec
->length
= length
;
207 rec
->keylen
= key
.dsize
;
208 memcpy(&rec
->data
[0], key
.dptr
, key
.dsize
);
212 rec
->datalen
= data
.dsize
+ sizeof(*header
);
213 memcpy(&rec
->data
[offset
], header
, sizeof(*header
));
214 offset
+= sizeof(*header
);
216 rec
->datalen
= data
.dsize
;
218 memcpy(&rec
->data
[offset
], data
.dptr
, data
.dsize
);
222 form a ctdb_rec_data record from a key/data pair
224 note that header may be NULL. If not NULL then it is included in the data portion
227 struct ctdb_rec_data_old
*ctdb_marshall_record(TALLOC_CTX
*mem_ctx
,
230 struct ctdb_ltdb_header
*header
,
234 struct ctdb_rec_data_old
*d
;
236 length
= ctdb_marshall_record_size(key
, header
, data
);
238 d
= (struct ctdb_rec_data_old
*)talloc_size(mem_ctx
, length
);
243 ctdb_marshall_record_copy(d
, reqid
, key
, header
, data
, length
);
248 /* helper function for marshalling multiple records */
249 struct ctdb_marshall_buffer
*ctdb_marshall_add(TALLOC_CTX
*mem_ctx
,
250 struct ctdb_marshall_buffer
*m
,
254 struct ctdb_ltdb_header
*header
,
257 struct ctdb_rec_data_old
*r
;
258 struct ctdb_marshall_buffer
*m2
;
259 uint32_t length
, offset
;
261 length
= ctdb_marshall_record_size(key
, header
, data
);
264 offset
= offsetof(struct ctdb_marshall_buffer
, data
);
265 m2
= talloc_zero_size(mem_ctx
, offset
+ length
);
267 offset
= talloc_get_size(m
);
268 m2
= talloc_realloc_size(mem_ctx
, m
, offset
+ length
);
279 r
= (struct ctdb_rec_data_old
*)((uint8_t *)m2
+ offset
);
280 ctdb_marshall_record_copy(r
, reqid
, key
, header
, data
, length
);
286 /* we've finished marshalling, return a data blob with the marshalled records */
287 TDB_DATA
ctdb_marshall_finish(struct ctdb_marshall_buffer
*m
)
290 data
.dptr
= (uint8_t *)m
;
291 data
.dsize
= talloc_get_size(m
);
296 loop over a marshalling buffer
298 - pass r==NULL to start
299 - loop the number of times indicated by m->count
301 struct ctdb_rec_data_old
*ctdb_marshall_loop_next(
302 struct ctdb_marshall_buffer
*m
,
303 struct ctdb_rec_data_old
*r
,
305 struct ctdb_ltdb_header
*header
,
306 TDB_DATA
*key
, TDB_DATA
*data
)
309 r
= (struct ctdb_rec_data_old
*)&m
->data
[0];
311 r
= (struct ctdb_rec_data_old
*)(r
->length
+ (uint8_t *)r
);
319 key
->dptr
= &r
->data
[0];
320 key
->dsize
= r
->keylen
;
323 data
->dptr
= &r
->data
[r
->keylen
];
324 data
->dsize
= r
->datalen
;
325 if (header
!= NULL
) {
326 data
->dptr
+= sizeof(*header
);
327 data
->dsize
-= sizeof(*header
);
331 if (header
!= NULL
) {
332 if (r
->datalen
< sizeof(*header
)) {
335 memcpy(header
, &r
->data
[r
->keylen
], sizeof(*header
));
342 This is used to canonicalize a ctdb_sock_addr structure.
344 void ctdb_canonicalize_ip(const ctdb_sock_addr
*ip
, ctdb_sock_addr
*cip
)
348 if (ip
->sa
.sa_family
== AF_INET6
) {
349 const char prefix
[12] = { 0,0,0,0,0,0,0,0,0,0,0xff,0xff };
350 if (memcmp(&ip
->ip6
.sin6_addr
, prefix
, sizeof(prefix
)) == 0) {
351 /* Copy IPv4-mapped IPv6 addresses as IPv4 */
352 cip
->ip
.sin_family
= AF_INET
;
353 #ifdef HAVE_SOCK_SIN_LEN
354 cip
->ip
.sin_len
= sizeof(ctdb_sock_addr
);
356 cip
->ip
.sin_port
= ip
->ip6
.sin6_port
;
357 memcpy(&cip
->ip
.sin_addr
,
358 &ip
->ip6
.sin6_addr
.s6_addr
[12],
359 sizeof(cip
->ip
.sin_addr
));
361 cip
->ip6
.sin6_family
= AF_INET6
;
362 #ifdef HAVE_SOCK_SIN6_LEN
363 cip
->ip6
.sin6_len
= sizeof(ctdb_sock_addr
);
365 cip
->ip6
.sin6_port
= ip
->ip6
.sin6_port
;
366 memcpy(&cip
->ip6
.sin6_addr
,
368 sizeof(cip
->ip6
.sin6_addr
));
374 if (ip
->sa
.sa_family
== AF_INET
) {
375 cip
->ip
.sin_family
= AF_INET
;
376 #ifdef HAVE_SOCK_SIN_LEN
377 cip
->ip
.sin_len
= sizeof(ctdb_sock_addr
);
379 cip
->ip
.sin_port
= ip
->ip
.sin_port
;
380 memcpy(&cip
->ip
.sin_addr
,
382 sizeof(ip
->ip
.sin_addr
));
388 bool ctdb_same_ip(const ctdb_sock_addr
*tip1
, const ctdb_sock_addr
*tip2
)
390 ctdb_sock_addr ip1
, ip2
;
392 ctdb_canonicalize_ip(tip1
, &ip1
);
393 ctdb_canonicalize_ip(tip2
, &ip2
);
395 if (ip1
.sa
.sa_family
!= ip2
.sa
.sa_family
) {
399 switch (ip1
.sa
.sa_family
) {
401 return ip1
.ip
.sin_addr
.s_addr
== ip2
.ip
.sin_addr
.s_addr
;
403 return !memcmp(&ip1
.ip6
.sin6_addr
.s6_addr
[0],
404 &ip2
.ip6
.sin6_addr
.s6_addr
[0],
407 DEBUG(DEBUG_ERR
, (__location__
" CRITICAL Can not compare sockaddr structures of type %u\n", ip1
.sa
.sa_family
));
415 compare two ctdb_sock_addr structures
417 bool ctdb_same_sockaddr(const ctdb_sock_addr
*ip1
, const ctdb_sock_addr
*ip2
)
419 return ctdb_same_ip(ip1
, ip2
) && ip1
->ip
.sin_port
== ip2
->ip
.sin_port
;
422 char *ctdb_addr_to_str(ctdb_sock_addr
*addr
)
424 static char cip
[128] = "";
426 switch (addr
->sa
.sa_family
) {
428 inet_ntop(addr
->ip
.sin_family
, &addr
->ip
.sin_addr
, cip
, sizeof(cip
));
431 inet_ntop(addr
->ip6
.sin6_family
, &addr
->ip6
.sin6_addr
, cip
, sizeof(cip
));
434 DEBUG(DEBUG_ERR
, (__location__
" ERROR, unknown family %u\n", addr
->sa
.sa_family
));
440 unsigned ctdb_addr_to_port(ctdb_sock_addr
*addr
)
442 switch (addr
->sa
.sa_family
) {
444 return ntohs(addr
->ip
.sin_port
);
447 return ntohs(addr
->ip6
.sin6_port
);
450 DEBUG(DEBUG_ERR
, (__location__
" ERROR, unknown family %u\n", addr
->sa
.sa_family
));
456 /* Add a node to a node map with given address and flags */
457 static bool node_map_add(TALLOC_CTX
*mem_ctx
,
458 const char *nstr
, uint32_t flags
,
459 struct ctdb_node_map_old
**node_map
)
464 struct ctdb_node_and_flags
*n
;
466 /* Might as well do this before trying to allocate memory */
467 if (ctdb_parse_address(mem_ctx
, nstr
, &addr
) == -1) {
471 num
= (*node_map
)->num
+ 1;
472 s
= offsetof(struct ctdb_node_map_old
, nodes
) +
473 num
* sizeof(struct ctdb_node_and_flags
);
474 *node_map
= talloc_realloc_size(mem_ctx
, *node_map
, s
);
475 if (*node_map
== NULL
) {
476 DEBUG(DEBUG_ERR
, (__location__
" Out of memory\n"));
480 n
= &(*node_map
)->nodes
[(*node_map
)->num
];
482 n
->pnn
= (*node_map
)->num
;
490 /* Read a nodes file into a node map */
491 struct ctdb_node_map_old
*ctdb_read_nodes_file(TALLOC_CTX
*mem_ctx
,
497 struct ctdb_node_map_old
*ret
;
499 /* Allocate node map header */
500 ret
= talloc_zero_size(mem_ctx
, offsetof(struct ctdb_node_map_old
, nodes
));
502 DEBUG(DEBUG_ERR
, (__location__
" Out of memory\n"));
506 lines
= file_lines_load(nlist
, &nlines
, 0, mem_ctx
);
508 DEBUG(DEBUG_ERR
, ("Failed to read nodes file \"%s\"\n", nlist
));
511 while (nlines
> 0 && strcmp(lines
[nlines
-1], "") == 0) {
515 for (i
=0; i
< nlines
; i
++) {
521 /* strip leading spaces */
522 while((*node
== ' ') || (*node
== '\t')) {
529 ((node
[len
-1] == ' ') || (node
[len
-1] == '\t')))
539 /* A "deleted" node is a node that is
540 commented out in the nodes file. This is
541 used instead of removing a line, which
542 would cause subsequent nodes to change
544 flags
= NODE_FLAGS_DELETED
;
545 node
= discard_const("0.0.0.0");
549 if (!node_map_add(mem_ctx
, node
, flags
, &ret
)) {
560 struct ctdb_node_map_old
*
561 ctdb_node_list_to_map(struct ctdb_node
**nodes
, uint32_t num_nodes
,
566 struct ctdb_node_map_old
*node_map
;
568 size
= offsetof(struct ctdb_node_map_old
, nodes
) +
569 num_nodes
* sizeof(struct ctdb_node_and_flags
);
570 node_map
= (struct ctdb_node_map_old
*)talloc_zero_size(mem_ctx
, size
);
571 if (node_map
== NULL
) {
573 (__location__
" Failed to allocate nodemap array\n"));
577 node_map
->num
= num_nodes
;
578 for (i
=0; i
<num_nodes
; i
++) {
579 node_map
->nodes
[i
].addr
= nodes
[i
]->address
;
580 node_map
->nodes
[i
].pnn
= nodes
[i
]->pnn
;
581 node_map
->nodes
[i
].flags
= nodes
[i
]->flags
;
587 const char *ctdb_eventscript_call_names
[] = {
604 /* Runstate handling */
606 enum ctdb_runstate runstate
;
609 { CTDB_RUNSTATE_UNKNOWN
, "UNKNOWN" },
610 { CTDB_RUNSTATE_INIT
, "INIT" },
611 { CTDB_RUNSTATE_SETUP
, "SETUP" },
612 { CTDB_RUNSTATE_FIRST_RECOVERY
, "FIRST_RECOVERY" },
613 { CTDB_RUNSTATE_STARTUP
, "STARTUP" },
614 { CTDB_RUNSTATE_RUNNING
, "RUNNING" },
615 { CTDB_RUNSTATE_SHUTDOWN
, "SHUTDOWN" },
619 const char *runstate_to_string(enum ctdb_runstate runstate
)
622 for (i
=0; runstate_map
[i
].label
!= NULL
; i
++) {
623 if (runstate_map
[i
].runstate
== runstate
) {
624 return runstate_map
[i
].label
;
628 return runstate_map
[0].label
;
631 enum ctdb_runstate
runstate_from_string(const char *label
)
634 for (i
=0; runstate_map
[i
].label
!= NULL
; i
++) {
635 if (strcasecmp(runstate_map
[i
].label
, label
) == 0) {
636 return runstate_map
[i
].runstate
;
640 return CTDB_RUNSTATE_UNKNOWN
;
643 void ctdb_set_runstate(struct ctdb_context
*ctdb
, enum ctdb_runstate runstate
)
645 DEBUG(DEBUG_NOTICE
,("Set runstate to %s (%d)\n",
646 runstate_to_string(runstate
), runstate
));
648 if (runstate
<= ctdb
->runstate
) {
649 ctdb_fatal(ctdb
, "runstate must always increase");
652 ctdb
->runstate
= runstate
;
655 /* Convert arbitrary data to 4-byte boundary padded uint32 array */
656 uint32_t *ctdb_key_to_idkey(TALLOC_CTX
*mem_ctx
, TDB_DATA key
)
658 uint32_t idkey_size
, *k
;
660 idkey_size
= 1 + (key
.dsize
+ sizeof(uint32_t)-1) / sizeof(uint32_t);
662 k
= talloc_zero_array(mem_ctx
, uint32_t, idkey_size
);
668 memcpy(&k
[1], key
.dptr
, key
.dsize
);