3 # Run commands on CTDB nodes.
5 # See http://ctdb.samba.org/ for more information about CTDB.
7 # Copyright (C) Martin Schwenke 2008
9 # Based on an earlier script by Andrew Tridgell and Ronnie Sahlberg.
11 # Copyright (C) Andrew Tridgell 2007
13 # This program is free software; you can redistribute it and/or modify
14 # it under the terms of the GNU General Public License as published by
15 # the Free Software Foundation; either version 3 of the License, or
16 # (at your option) any later version.
18 # This program is distributed in the hope that it will be useful,
19 # but WITHOUT ANY WARRANTY; without even the implied warranty of
20 # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
21 # GNU General Public License for more details.
23 # You should have received a copy of the GNU General Public License
24 # along with this program; if not, see <http://www.gnu.org/licenses/>.
31 Usage: onnode [OPTION] ... <NODES> <COMMAND> ...
33 -c Run in current working directory on specified nodes.
34 -f Specify nodes file, overrides CTDB_NODES_FILE.
35 -i Keep standard input open - the default is to close it.
36 -n Allow nodes to be specified by name.
37 -o <prefix> Save standard output from each node to file <prefix>.<ip>
38 -p Run command in parallel on specified nodes.
39 -P Push given files to nodes instead of running commands.
40 -q Do not print node addresses (overrides -v).
41 -v Print node address even for a single node.
42 <NODES> "all", "any", "ok" (or "healthy"), "con" (or "connected"),
43 "rm" (or "recmaster"), "lvs" (or "lvsmaster"),
44 "natgw" (or "natgwlist"); or
45 a node number (0 base); or
46 a hostname (if -n is specified); or
47 list (comma separated) of <NODES>; or
48 range (hyphen separated) of node numbers.
56 echo "Invalid <nodespec>" >&2 ; echo >&2
70 if [ -z "$CTDB_BASE" ] ; then
71 CTDB_BASE
="/usr/local/etc/ctdb"
74 .
"${CTDB_BASE}/functions"
79 # $POSIXLY_CORRECT means that the command passed to onnode can
80 # take options and getopt won't reorder things to make them
83 # Not on the previous line - local returns 0!
84 temp
=$
(POSIXLY_CORRECT
=1 getopt
-n "$prog" -o "cf:hno:pqvPi" -l help -- "$@")
92 -c) current
=true
; shift ;;
93 -f) CTDB_NODES_FILE
="$2" ; shift 2 ;;
94 -n) names_ok
=true
; shift ;;
95 -o) prefix
="$2" ; shift 2 ;;
96 -p) parallel
=true
; shift ;;
97 -q) quiet
=true
; shift ;;
98 -v) verbose
=true
; shift ;;
99 -P) push
=true
; shift ;;
100 -i) stdin
=true
; shift ;;
102 -h|
--help|
*) usage
;; # Shouldn't happen, so this is reasonable.
106 [ $# -lt 2 ] && usage
108 nodespec
="$1" ; shift
119 if [ -n "$node" -a "$node" != "#DEAD" ] ; then
122 echo "${prog}: \"node ${n}\" does not exist" >&2
129 # Subshell avoids hacks to restore $IFS.
134 *-*) seq "${i%-*}" "${i#*-}" 2>/dev
/null || invalid_nodespec
;;
135 # Separate lines for readability.
136 all|any|ok|healthy|con|connected
) echo "$i" ;;
137 rm|recmaster|lvs|lvsmaster|natgw|natgwlist
) echo "$i" ;;
139 [ $i -gt -1 ] 2>/dev
/null ||
$names_ok || invalid_nodespec
146 ctdb_status_output
="" # cache
147 get_nodes_with_status
()
152 if [ -z "$ctdb_status_output" ] ; then
153 ctdb_status_output
=$
(ctdb
-X status
2>&1)
154 if [ $?
-ne 0 ] ; then
155 echo "${prog}: unable to get status of CTDB nodes" >&2
156 echo "$ctdb_status_output" >&2
161 ctdb_status_output
="${ctdb_status_output#*${nl}}"
167 while IFS
="" read i
; do
169 set -- $i # split line on colons
170 shift # line starts with : so 1st field is empty
171 local pnn
="$1" ; shift
172 local ip
="$1" ; shift
176 # If any bit is 1, don't match this address.
179 [ "$s" != "1" ] ||
continue 2
183 # If disconnected bit is not 0, don't match this address.
184 [ "$1" = "0" ] ||
continue
190 echo_nth
"$pnn" $all_nodes
191 done <<<"$ctdb_status_output"
195 ctdb_props
="" # cache
196 get_node_with_property
()
202 if [ "${ctdb_props##:${prop}:}" = "$ctdb_props" ] ; then
204 prop_node
=$
(ctdb
"$prop" -X 2>/dev
/null
)
205 if [ $?
-eq 0 ] ; then
206 if [ "$prop" = "natgwlist" ] ; then
207 prop_node
="${prop_node%% *}" # 1st word
208 if [ "$prop_node" = "-1" ] ; then
209 # This works around natgwlist returning 0 even
210 # when there's no natgw.
214 # We only want the first line.
217 prop_node
="${prop_node%%${nl}*}"
223 if [ -n "$prop_node" ] ; then
225 ctdb_props
="${ctdb_props}${ctdb_props:+ }:${prop}:${prop_node}"
229 prop_node
="${ctdb_props##:${prop}:}"
230 prop_node
="${prop_node%% *}"
233 if [ -n "$prop_node" ] ; then
234 echo_nth
"$prop_node" $all_nodes
236 echo "${prog}: No ${prop} available" >&2
241 get_any_available_node
()
245 # We do a recursive onnode to find which nodes are up and running.
246 local out
=$
($0 -pq all ctdb pnn
2>&1)
249 local pnn
="${line#PNN:}"
250 if [ "$pnn" != "$line" ] ; then
251 echo_nth
"$pnn" $all_nodes
254 # Else must be an error message from a down node.
263 if [ -n "$CTDB_NODES_SOCKETS" ] ; then
264 all_nodes
="$CTDB_NODES_SOCKETS"
266 local f
="${CTDB_BASE}/nodes"
267 if [ -n "$CTDB_NODES_FILE" ] ; then
269 if [ ! -e "$f" -a "${f#/}" = "$f" ] ; then
270 # $f is relative, try in $CTDB_BASE
271 f
="${CTDB_BASE}/${f}"
273 elif [ -n "$CTDB_NODES" ] ; then
277 if [ ! -r "$f" ] ; then
278 echo "${prog}: unable to open nodes file \"${f}\"" >&2
282 all_nodes
=$
(sed -e 's@#.*@@g' -e 's@ *@@g' -e 's@^$@#DEAD@' "$f")
287 for n
in $
(parse_nodespec
"$1") ; do
288 [ $?
!= 0 ] && exit 1 # Required to catch exit in above subshell.
291 echo "${all_nodes//#DEAD/}"
294 get_any_available_node
"$all_nodes" ||
exit 1
297 get_nodes_with_status
"$all_nodes" "healthy" ||
exit 1
300 get_nodes_with_status
"$all_nodes" "connected" ||
exit 1
303 get_node_with_property
"$all_nodes" "recmaster" ||
exit 1
306 get_node_with_property
"$all_nodes" "lvsmaster" ||
exit 1
309 get_node_with_property
"$all_nodes" "natgwlist" ||
exit 1
311 [0-9]|
[0-9][0-9]|
[0-9][0-9][0-9])
312 echo_nth
$n $all_nodes
315 $names_ok || invalid_nodespec
328 $verbose && echo "Pushing $f"
330 /*) rsync
"$f" "[${host}]:${f}" ;;
331 *) rsync
"${PWD}/${f}" "[${host}]:${PWD}/${f}" ;;
338 CTDB_SOCKET
="$1" sh
-c "$2" 3>/dev
/null
343 if [ -n "$prefix" ] ; then
344 cat >"${prefix}.${n//\//_}"
345 elif $verbose && $parallel ; then
354 if $verbose && $parallel ; then
361 ######################################################################
370 $current && command="cd $PWD && $command"
372 if [ -n "$CTDB_NODES_SOCKETS" ] ; then
376 # Could "2>/dev/null || true" but want to see errors from typos in file.
377 [ -r "${CTDB_BASE}/onnode.conf" ] && .
"${CTDB_BASE}/onnode.conf"
378 [ -n "$SSH" ] || SSH
=ssh
379 if [ "$SSH" = "ssh" ] ; then
380 if $parallel ||
! $stdin ; then
384 : # rsh? All bets are off!
389 ######################################################################
391 nodes
=$
(get_nodes
"$nodespec")
392 [ $?
!= 0 ] && exit 1 # Required to catch exit in above subshell.
397 # If $nodes contains a space or a newline then assume multiple nodes.
400 [ "$nodes" != "${nodes%[ ${nl}]*}" ] && verbose
=true
404 trap 'kill -TERM $pids 2>/dev/null' INT TERM
405 # There's a small race here where the kill can fail if no processes
406 # have been added to $pids and the script is interrupted. However,
407 # the part of the window where it matter is very small.
410 set -o pipefail
2>/dev
/null
412 { exec 3>&1 ; { $SSH $ssh_opts $EXTRA_SSH_OPTS $n "$command" | stdout_filter
>&3 ; } 2>&1 | stderr_filter
; } &
416 echo >&2 ; echo ">> NODE: $n <<" >&2
419 { exec 3>&1 ; { $SSH $ssh_opts $EXTRA_SSH_OPTS $n "$command" | stdout_filter
>&3 ; } 2>&1 | stderr_filter
; }
420 [ $?
= 0 ] || retcode
=$?
427 [ $?
= 0 ] || retcode
=$?