4 Copyright (C) Andrew Tridgell 2006
6 This program is free software; you can redistribute it and/or modify
7 it under the terms of the GNU General Public License as published by
8 the Free Software Foundation; either version 3 of the License, or
9 (at your option) any later version.
11 This program is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 GNU General Public License for more details.
16 You should have received a copy of the GNU General Public License
17 along with this program; if not, see <http://www.gnu.org/licenses/>.
22 #include "system/network.h"
23 #include "system/filesys.h"
24 #include "system/wait.h"
25 #include "system/shmem.h"
26 #include "../include/ctdb_private.h"
29 return error string for last error
/*
 * Accessor for the most recent error message of a ctdb context.
 *
 * NOTE(review): the function body is not visible in this extract;
 * presumably it returns ctdb->err_msg, the field that ctdb_set_error()
 * writes - confirm against the full file.
 */
31 const char *ctdb_errstr(struct ctdb_context
*ctdb
)
38 remember an error message
40 void ctdb_set_error(struct ctdb_context
*ctdb
, const char *fmt
, ...)
43 talloc_free(ctdb
->err_msg
);
45 ctdb
->err_msg
= talloc_vasprintf(ctdb
, fmt
, ap
);
46 DEBUG(DEBUG_ERR
,("ctdb error: %s\n", ctdb
->err_msg
));
51 a fatal internal error occurred - no hope for recovery
/*
 * Report an unrecoverable internal error.
 *
 * Logs msg at DEBUG_ALERT with the prefix "ctdb fatal error: ".
 * ctdb is not referenced by the visible code.
 *
 * NOTE(review): the statement that actually terminates the process is
 * not visible in this extract; the description of ctdb_die() suggests
 * this variant is expected to leave a core/backtrace - confirm.
 */
53 void ctdb_fatal(struct ctdb_context
*ctdb
, const char *msg
)
55 DEBUG(DEBUG_ALERT
,("ctdb fatal error: %s\n", msg
));
60 like ctdb_fatal() but a core/backtrace would not be useful
/*
 * Report an error that ends the process, for cases where a
 * core/backtrace would not be useful.
 *
 * Logs msg at DEBUG_ALERT with the prefix "ctdb exiting with error: ".
 * ctdb is not referenced by the visible code.
 *
 * NOTE(review): the statement that ends the process is not visible in
 * this extract; presumably a plain exit with a non-zero status - confirm.
 */
62 void ctdb_die(struct ctdb_context
*ctdb
, const char *msg
)
64 DEBUG(DEBUG_ALERT
,("ctdb exiting with error: %s\n", msg
));
68 /* Invoke an external program to do some sort of tracing on the CTDB
69 * process. This might block for a little while. The external
70 * program is specified by the environment variable
71 * CTDB_EXTERNAL_TRACE. This program should take one argument: the
72 * pid of the process to trace. Commonly, the program would be a
73 * wrapper script around gcore.
/*
 * Build and log the external trace command for the current process.
 *
 * The command line is "<CTDB_EXTERNAL_TRACE> <pid>", allocated with
 * talloc_asprintf() on the NULL context, and is logged at
 * DEBUG_WARNING both before and after the trace step.
 *
 * NOTE(review): the lines between the visible statements are missing
 * from this extract. Presumably they return early when the environment
 * variable is unset, run the command between the two log messages and
 * free cmd afterwards - confirm. Also confirm that a NULL result from
 * talloc_asprintf() is handled.
 */
75 void ctdb_external_trace(void)
/* program to run; getenv() yields NULL when the variable is unset */
78 const char * t
= getenv("CTDB_EXTERNAL_TRACE");
/* the single argument handed to the program is our own pid */
85 cmd
= talloc_asprintf(NULL
, "%s %lu", t
, (unsigned long) getpid());
86 DEBUG(DEBUG_WARNING
,("begin external trace: %s\n", cmd
));
88 DEBUG(DEBUG_WARNING
,("end external trace: %s\n", cmd
));
/*
 * Fill *address from an address string.
 *
 * str is duplicated verbatim with talloc_strdup() on mem_ctx and stored
 * as address->address; the visible code does not parse a port out of
 * str. The port comes either from the "ctdb"/"tcp" services entry
 * (converted from network byte order) or from CTDB_PORT.
 *
 * NOTE(review): the condition choosing between the two port
 * assignments and the return statement are not visible in this
 * extract. Presumably CTDB_PORT is the fallback when getservbyname()
 * returns NULL and the function returns 0 on success - confirm.
 */
95 int ctdb_parse_address(struct ctdb_context
*ctdb
,
96 TALLOC_CTX
*mem_ctx
, const char *str
,
97 struct ctdb_address
*address
)
/* look up a configured port for the "ctdb" service over tcp */
102 se
= getservbyname("ctdb", "tcp");
105 address
->address
= talloc_strdup(mem_ctx
, str
);
/* allocation-failure check on the duplicated string */
106 CTDB_NO_MEMORY(ctdb
, address
->address
);
/* built-in default port */
109 address
->port
= CTDB_PORT
;
/* port from the services database, converted to host byte order */
111 address
->port
= ntohs(se
->s_port
);
118 check if two addresses are the same
120 bool ctdb_same_address(struct ctdb_address
*a1
, struct ctdb_address
*a2
)
122 return strcmp(a1
->address
, a2
->address
) == 0 && a1
->port
== a2
->port
;
127 hash function for mapping data to a VNN - taken from tdb
129 uint32_t ctdb_hash(const TDB_DATA
*key
)
131 return tdb_jenkins_hash(discard_const(key
));
135 a type checking variant of idr_find
137 static void *_idr_find_type(struct idr_context
*idp
, int id
, const char *type
, const char *location
)
139 void *p
= idr_find(idp
, id
);
140 if (p
&& talloc_check_name(p
, type
) == NULL
) {
141 DEBUG(DEBUG_ERR
,("%s idr_find_type expected type %s but got %s\n",
142 location
, type
, talloc_get_name(p
)));
/*
 * Allocate a request id for state in the context's idr tree.
 *
 * The first attempt asks for an id above ctdb->lastid (limit INT_MAX).
 * The second attempt asks for any free id and is accompanied by the
 * "Reqid wrap!" debug message.
 *
 * NOTE(review): the condition guarding the second attempt and the tail
 * of the function are not visible in this extract. Presumably the
 * retry happens when the first call fails, ctdb->lastid is updated to
 * the new id, and the id is returned - confirm.
 */
148 uint32_t ctdb_reqid_new(struct ctdb_context
*ctdb
, void *state
)
/* prefer ids above the last one handed out */
150 int id
= idr_get_new_above(ctdb
->idr
, state
, ctdb
->lastid
+1, INT_MAX
);
152 DEBUG(DEBUG_DEBUG
, ("Reqid wrap!\n"));
/* fall back to any free id */
153 id
= idr_get_new(ctdb
->idr
, state
, INT_MAX
);
159 void *_ctdb_reqid_find(struct ctdb_context
*ctdb
, uint32_t reqid
, const char *type
, const char *location
)
163 p
= _idr_find_type(ctdb
->idr
, reqid
, type
, location
);
165 DEBUG(DEBUG_WARNING
, ("Could not find idr:%u\n",reqid
));
172 void ctdb_reqid_remove(struct ctdb_context
*ctdb
, uint32_t reqid
)
176 ret
= idr_remove(ctdb
->idr
, reqid
);
178 DEBUG(DEBUG_ERR
, ("Removing idr that does not exist\n"));
184 form a ctdb_rec_data record from a key/data pair
186 note that header may be NULL. If not NULL then it is included in the data portion
/*
 * Build a single ctdb_rec_data record from a key/data pair.
 *
 * The record is one talloc_size() allocation on mem_ctx. Its payload
 * (d->data) holds the key bytes first, then, when header is non-NULL,
 * a raw copy of *header, then the data bytes. d->keylen is the key
 * size; d->datalen is the data size plus sizeof(*header) when a header
 * is included.
 *
 * NOTE(review): the key and data parameters, the allocation-failure
 * check, any other field assignments and the return statement are not
 * visible in this extract - confirm against the full file.
 * NOTE(review): the length sum is not checked for overflow in the
 * visible code.
 */
189 struct ctdb_rec_data
*ctdb_marshall_record(TALLOC_CTX
*mem_ctx
, uint32_t reqid
,
191 struct ctdb_ltdb_header
*header
,
195 struct ctdb_rec_data
*d
;
/* fixed part of the record + key + data (+ header when present) */
197 length
= offsetof(struct ctdb_rec_data
, data
) + key
.dsize
+
198 data
.dsize
+ (header
?sizeof(*header
):0);
199 d
= (struct ctdb_rec_data
*)talloc_size(mem_ctx
, length
);
/* the key always sits at the start of the payload */
205 d
->keylen
= key
.dsize
;
206 memcpy(&d
->data
[0], key
.dptr
, key
.dsize
);
/* with a header: payload is key | header | data */
208 d
->datalen
= data
.dsize
+ sizeof(*header
);
209 memcpy(&d
->data
[key
.dsize
], header
, sizeof(*header
));
210 memcpy(&d
->data
[key
.dsize
+sizeof(*header
)], data
.dptr
, data
.dsize
);
/* without a header: payload is key | data */
212 d
->datalen
= data
.dsize
;
213 memcpy(&d
->data
[key
.dsize
], data
.dptr
, data
.dsize
);
219 /* helper function for marshalling multiple records */
/*
 * Append one marshalled record to a marshall buffer.
 *
 * A record is built with ctdb_marshall_record() and its bytes are
 * copied to the end of the buffer, which is grown with
 * talloc_realloc_size() by the record's talloc size. Sizes come from
 * talloc_get_size(), so the buffer's talloc size is its logical
 * length. A fresh buffer is a zeroed allocation covering only the
 * fixed part of struct ctdb_marshall_buffer.
 *
 * NOTE(review): several parameters, the condition under which the
 * fresh buffer is created (presumably m == NULL), all failure checks,
 * any bookkeeping on the buffer, the release of the temporary record
 * and the return statement are not visible in this extract - confirm
 * against the full file.
 */
220 struct ctdb_marshall_buffer
*ctdb_marshall_add(TALLOC_CTX
*mem_ctx
,
221 struct ctdb_marshall_buffer
*m
,
225 struct ctdb_ltdb_header
*header
,
228 struct ctdb_rec_data
*r
;
229 size_t m_size
, r_size
;
230 struct ctdb_marshall_buffer
*m2
;
/* build the stand-alone record first */
232 r
= ctdb_marshall_record(mem_ctx
, reqid
, key
, header
, data
);
/* empty buffer: just the fixed part, zero-filled */
239 m
= talloc_zero_size(mem_ctx
, offsetof(struct ctdb_marshall_buffer
, data
));
246 m_size
= talloc_get_size(m
);
247 r_size
= talloc_get_size(r
);
/* grow the buffer by exactly the size of the new record */
249 m2
= talloc_realloc_size(mem_ctx
, m
, m_size
+ r_size
);
/* the new record goes where the old buffer ended */
255 memcpy(m_size
+ (uint8_t *)m2
, r
, r_size
);
264 /* we've finished marshalling, return a data blob with the marshalled records */
265 TDB_DATA
ctdb_marshall_finish(struct ctdb_marshall_buffer
*m
)
268 data
.dptr
= (uint8_t *)m
;
269 data
.dsize
= talloc_get_size(m
);
274 loop over a marshalling buffer
276 - pass r==NULL to start
277 - loop the number of times indicated by m->count
/*
 * Step to the next record of a marshall buffer and unpack it.
 *
 * The first record is at m->data[0]; each following record is found
 * r->length bytes after the current one. key is pointed at the start
 * of the record payload with size r->keylen. data is pointed just past
 * the key with size r->datalen, and is moved past the header when
 * header is non-NULL. When header is non-NULL it also receives a copy
 * of the header stored after the key. The returned pointers refer into
 * the buffer; nothing is copied except the header.
 *
 * NOTE(review): the r == NULL test selecting the first record, the
 * guards around the key/data assignments, one parameter line, and the
 * return statements are not visible in this extract - confirm.
 * NOTE(review): data->dsize is reduced by sizeof(*header) before the
 * r->datalen < sizeof(*header) check appears, so dsize can wrap for a
 * short record.
 * NOTE(review): the header is read through a cast pointer into the
 * byte payload; its alignment depends on keylen - consider memcpy().
 */
279 struct ctdb_rec_data
*ctdb_marshall_loop_next(struct ctdb_marshall_buffer
*m
, struct ctdb_rec_data
*r
,
281 struct ctdb_ltdb_header
*header
,
282 TDB_DATA
*key
, TDB_DATA
*data
)
/* first record of the buffer */
285 r
= (struct ctdb_rec_data
*)&m
->data
[0];
/* advance by the current record's total length */
287 r
= (struct ctdb_rec_data
*)(r
->length
+ (uint8_t *)r
);
295 key
->dptr
= &r
->data
[0];
296 key
->dsize
= r
->keylen
;
/* data follows the key inside the payload */
299 data
->dptr
= &r
->data
[r
->keylen
];
300 data
->dsize
= r
->datalen
;
/* caller asked for the header: skip it in the data view */
301 if (header
!= NULL
) {
302 data
->dptr
+= sizeof(*header
);
303 data
->dsize
-= sizeof(*header
);
307 if (header
!= NULL
) {
/* record too short to contain a header */
308 if (r
->datalen
< sizeof(*header
)) {
311 *header
= *(struct ctdb_ltdb_header
*)&r
->data
[r
->keylen
];
318 This is used to canonicalize a ctdb_sock_addr structure.
320 void ctdb_canonicalize_ip(const ctdb_sock_addr
*ip
, ctdb_sock_addr
*cip
)
322 char prefix
[12] = { 0,0,0,0,0,0,0,0,0,0,0xff,0xff };
324 memcpy(cip
, ip
, sizeof (*cip
));
326 if ( (ip
->sa
.sa_family
== AF_INET6
)
327 && !memcmp(&ip
->ip6
.sin6_addr
, prefix
, 12)) {
328 memset(cip
, 0, sizeof(*cip
));
329 #ifdef HAVE_SOCK_SIN_LEN
330 cip
->ip
.sin_len
= sizeof(*cip
);
332 cip
->ip
.sin_family
= AF_INET
;
333 cip
->ip
.sin_port
= ip
->ip6
.sin6_port
;
334 memcpy(&cip
->ip
.sin_addr
, &ip
->ip6
.sin6_addr
.s6_addr
[12], 4);
338 bool ctdb_same_ip(const ctdb_sock_addr
*tip1
, const ctdb_sock_addr
*tip2
)
340 ctdb_sock_addr ip1
, ip2
;
342 ctdb_canonicalize_ip(tip1
, &ip1
);
343 ctdb_canonicalize_ip(tip2
, &ip2
);
345 if (ip1
.sa
.sa_family
!= ip2
.sa
.sa_family
) {
349 switch (ip1
.sa
.sa_family
) {
351 return ip1
.ip
.sin_addr
.s_addr
== ip2
.ip
.sin_addr
.s_addr
;
353 return !memcmp(&ip1
.ip6
.sin6_addr
.s6_addr
[0],
354 &ip2
.ip6
.sin6_addr
.s6_addr
[0],
357 DEBUG(DEBUG_ERR
, (__location__
" CRITICAL Can not compare sockaddr structures of type %u\n", ip1
.sa
.sa_family
));
365 compare two ctdb_sock_addr structures
367 bool ctdb_same_sockaddr(const ctdb_sock_addr
*ip1
, const ctdb_sock_addr
*ip2
)
369 return ctdb_same_ip(ip1
, ip2
) && ip1
->ip
.sin_port
== ip2
->ip
.sin_port
;
372 char *ctdb_addr_to_str(ctdb_sock_addr
*addr
)
374 static char cip
[128] = "";
376 switch (addr
->sa
.sa_family
) {
378 inet_ntop(addr
->ip
.sin_family
, &addr
->ip
.sin_addr
, cip
, sizeof(cip
));
381 inet_ntop(addr
->ip6
.sin6_family
, &addr
->ip6
.sin6_addr
, cip
, sizeof(cip
));
384 DEBUG(DEBUG_ERR
, (__location__
" ERROR, unknown family %u\n", addr
->sa
.sa_family
));
385 ctdb_external_trace();
/*
 * Return the port of addr in host byte order.
 *
 * The port is read from the sockaddr_in or sockaddr_in6 view according
 * to addr->sa.sa_family; an unknown family is logged at DEBUG_ERR.
 *
 * NOTE(review): the case labels and the value returned for an unknown
 * family are not visible in this extract - confirm (presumably 0).
 */
391 unsigned ctdb_addr_to_port(ctdb_sock_addr
*addr
)
393 switch (addr
->sa
.sa_family
) {
/* IPv4 view */
395 return ntohs(addr
->ip
.sin_port
);
/* IPv6 view */
398 return ntohs(addr
->ip6
.sin6_port
);
401 DEBUG(DEBUG_ERR
, (__location__
" ERROR, unknown family %u\n", addr
->sa
.sa_family
));
407 /* we don't lock future pages here; it would increase the chance that
408 * we'd fail to mmap later on. */
/*
 * Lock the process's currently mapped memory with mlockall(MCL_CURRENT).
 *
 * Only compiled in when HAVE_MLOCKALL is defined and _AIX_ is not.
 * A stack buffer (dummy) is zero-filled and passed to mlock() before
 * the mlockall() call. A failing mlockall() is only logged at
 * DEBUG_WARNING.
 *
 * NOTE(review): the declaration of dummy, the early-exit conditions
 * (presumably including the valgrinding flag and the "local daemons
 * mode" case named in the comment below) and the tail of the warning
 * are not visible in this extract - confirm.
 * NOTE(review): the warning's format string contains a stray
 * apostrophe after %s.
 */
409 void ctdb_lockdown_memory(bool valgrinding
)
411 #if defined(HAVE_MLOCKALL) && !defined(_AIX_)
412 /* Extra stack, please! */
414 memset(dummy
, 0, sizeof(dummy
));
420 /* Ignore when running in local daemons mode */
425 /* Avoid compiler optimizing out dummy. */
426 mlock(dummy
, sizeof(dummy
));
/* current pages only; future mappings are deliberately not locked */
427 if (mlockall(MCL_CURRENT
) != 0) {
428 DEBUG(DEBUG_WARNING
,("Failed to lockdown memory: %s'\n",
/*
 * Table of event script call names, as strings.
 *
 * NOTE(review): the initialiser entries are not visible in this
 * extract; presumably the array is indexed by the event script call
 * enumeration - confirm against the full file.
 */
434 const char *ctdb_eventscript_call_names
[] = {
451 /* Runstate handling */
/*
 * Mapping between runstate values and their printable labels, used by
 * runstate_to_string() and runstate_from_string(). Both scan it until
 * an entry with a NULL label, and the first entry (UNKNOWN) is the
 * fallback label of runstate_to_string().
 *
 * NOTE(review): the struct header, the label member, the table name
 * line and the terminating entry are not visible in this extract.
 */
453 enum ctdb_runstate runstate
;
456 { CTDB_RUNSTATE_UNKNOWN
, "UNKNOWN" },
457 { CTDB_RUNSTATE_INIT
, "INIT" },
458 { CTDB_RUNSTATE_SETUP
, "SETUP" },
459 { CTDB_RUNSTATE_FIRST_RECOVERY
, "FIRST_RECOVERY" },
460 { CTDB_RUNSTATE_STARTUP
, "STARTUP" },
461 { CTDB_RUNSTATE_RUNNING
, "RUNNING" },
462 { CTDB_RUNSTATE_SHUTDOWN
, "SHUTDOWN" },
466 const char *runstate_to_string(enum ctdb_runstate runstate
)
469 for (i
=0; runstate_map
[i
].label
!= NULL
; i
++) {
470 if (runstate_map
[i
].runstate
== runstate
) {
471 return runstate_map
[i
].label
;
475 return runstate_map
[0].label
;
478 enum ctdb_runstate
runstate_from_string(const char *label
)
481 for (i
=0; runstate_map
[i
].label
!= NULL
; i
++) {
482 if (strcasecmp(runstate_map
[i
].label
, label
) == 0) {
483 return runstate_map
[i
].runstate
;
487 return CTDB_RUNSTATE_UNKNOWN
;
490 void ctdb_set_runstate(struct ctdb_context
*ctdb
, enum ctdb_runstate runstate
)
492 if (runstate
<= ctdb
->runstate
) {
493 ctdb_fatal(ctdb
, "runstate must always increase");
496 DEBUG(DEBUG_NOTICE
,("Set runstate to %s (%d)\n",
497 runstate_to_string(runstate
), runstate
));
498 ctdb
->runstate
= runstate
;
501 void ctdb_mkdir_p_or_die(struct ctdb_context
*ctdb
, const char *dir
, int mode
)
505 ret
= mkdir_p(dir
, mode
);
508 ("ctdb exiting with error: "
509 "failed to create directory \"%s\" (%s)\n",
510 dir
, strerror(errno
)));