1 # utility functions for ctdb event scripts
# Put the standard system binary directories ahead of whatever PATH was
# inherited from the caller.
3 PATH=/bin:/usr/bin:/usr/sbin:/sbin:$PATH
5 #######################################
6 # pull in a system config file, if any
10 foo="${service_config:-${service_name}}"
11 if [ -n "$foo" ] ; then
14 elif [ "$1" != "ctdb" ] ; then
19 if [ -f /etc/sysconfig/$1 ]; then
21 elif [ -f /etc/default/$1 ]; then
23 elif [ -f $CTDB_BASE/sysconfig/$1 ]; then
24 . $CTDB_BASE/sysconfig/$1
28 ##############################################################
29 # determine on what type of system (init style) we are running
31 # only do detection if not already set:
32 test "x$CTDB_INIT_STYLE" != "x" && return
34 if [ -x /sbin/startproc ]; then
35 CTDB_INIT_STYLE="suse"
36 elif [ -x /sbin/start-stop-daemon ]; then
37 CTDB_INIT_STYLE="debian"
39 CTDB_INIT_STYLE="redhat"
43 ######################################################
44 # simulate /sbin/service on platforms that don't have it
49 # do nothing, when no service was specified
50 [ -z "$_service_name" ] && return
52 if [ -x /sbin/service ]; then
53 /sbin/service "$_service_name" "$_op"
54 elif [ -x /etc/init.d/$_service_name ]; then
55 /etc/init.d/$_service_name "$_op"
56 elif [ -x /etc/rc.d/init.d/$_service_name ]; then
57 /etc/rc.d/init.d/$_service_name "$_op"
61 ######################################################
62 # simulate /sbin/service (niced) on platforms that don't have it
67 # do nothing, when no service was specified
68 [ -z "$_service_name" ] && return
70 if [ -x /sbin/service ]; then
71 nice /sbin/service "$_service_name" "$_op"
72 elif [ -x /etc/init.d/$_service_name ]; then
73 nice /etc/init.d/$_service_name "$_op"
74 elif [ -x /etc/rc.d/init.d/$_service_name ]; then
75 nice /etc/rc.d/init.d/$_service_name "$_op"
79 ######################################################
80 # wait for a command to return a zero exit status
81 # usage: ctdb_wait_command SERVICE_NAME <command>
82 ######################################################
86 [ -z "$wait_cmd" ] && return;
88 echo "Waiting for service $service_name to start"
89 while [ $all_ok -eq 0 ]; do
90 $wait_cmd > /dev/null 2>&1 && all_ok=1
91 ctdb status > /dev/null 2>&1 || {
92 echo "ctdb daemon has died. Exiting wait for $service_name"
95 [ $all_ok -eq 1 ] || sleep 1
97 echo "Local service $service_name is up"
101 ######################################################
102 # wait for a set of tcp ports
103 # usage: ctdb_wait_tcp_ports SERVICE_NAME <ports...>
104 ######################################################
105 ctdb_wait_tcp_ports() {
109 [ -z "$wait_ports" ] && return;
111 echo "Waiting for tcp service $service_name to start"
112 while [ $all_ok -eq 0 ]; do
114 for p in $wait_ports; do
115 if [ -x /usr/bin/netcat ]; then
116 /usr/bin/netcat -z 127.0.0.1 $p > /dev/null || all_ok=0
117 elif [ -x /usr/bin/nc ]; then
118 /usr/bin/nc -z 127.0.0.1 $p > /dev/null || all_ok=0
119 elif [ -x /usr/bin/netstat ]; then
120 (netstat -a -n | egrep "0.0.0.0:$p[[:space:]]*LISTEN" > /dev/null) || all_ok=0
121 elif [ -x /bin/netstat ]; then
122 (netstat -a -n | egrep "0.0.0.0:$p[[:space:]]*LISTEN" > /dev/null) || all_ok=0
124 echo "No tool to check tcp ports availabe. can not check in ctdb_wait_tcp_ports"
128 [ $all_ok -eq 1 ] || sleep 1
129 ctdb status > /dev/null 2>&1 || {
130 echo "ctdb daemon has died. Exiting tcp wait $service_name"
134 echo "Local tcp services for $service_name are up"
138 ######################################################
139 # check that an rpc server is registered with portmap
140 # and responding to requests
141 # usage: ctdb_check_rpc SERVICE_NAME PROGNUM VERSION
142 ######################################################
147 rpcinfo -u localhost $prognum $version > /dev/null || {
148 echo "ERROR: $progname not responding to rpc requests"
153 ######################################################
154 # check that a set of directories is available
155 # return 1 on a missing directory
156 # usage: ctdb_check_directories_probe SERVICE_NAME <directories...>
157 ######################################################
158 ctdb_check_directories_probe() {
159 while IFS="" read d ; do
165 [ -d "${d}/." ] || return 1
170 ######################################################
171 # check that a set of directories is available
172 # usage: ctdb_check_directories SERVICE_NAME <directories...>
173 ######################################################
174 ctdb_check_directories() {
175 n="${1:-${service_name}}"
176 ctdb_check_directories_probe || {
177 echo "ERROR: $n directory \"$d\" not available"
182 ######################################################
183 # check a set of tcp ports
184 # usage: ctdb_check_tcp_ports <ports...>
185 ######################################################
186 ctdb_check_tcp_ports() {
189 if ! netstat -a -t -n | grep -q "0\.0\.0\.0:$p .*LISTEN" ; then
190 if ! netstat -a -t -n | grep -q ":::$p .*LISTEN" ; then
191 echo "ERROR: $service_name tcp port $p is not responding"
198 ######################################################
199 # check a unix socket
200 # usage: ctdb_check_unix_socket SERVICE_NAME <socket_path>
201 ######################################################
202 ctdb_check_unix_socket() {
204 [ -z "$socket_path" ] && return
206 if ! netstat --unix -a -n | grep -q "^unix.*LISTEN.*${socket_path}$"; then
207 echo "ERROR: $service_name socket $socket_path not found"
212 ######################################################
213 # check a command returns zero status
214 # usage: ctdb_check_command SERVICE_NAME <command>
215 ######################################################
216 ctdb_check_command() {
219 [ -z "$wait_cmd" ] && return;
220 $wait_cmd > /dev/null 2>&1 || {
221 echo "ERROR: $service_name - $wait_cmd returned error"
226 ################################################
227 # kill off any TCP connections with the given IP
228 ################################################
229 kill_tcp_connections() {
234 connfile="$CTDB_VARDIR/state/connections.$_IP"
235 netstat -tn |egrep "^tcp.*[[:space:]]+$_IP:.*ESTABLISHED" | awk '{print $4" "$5}' > $connfile
236 netstat -tn |egrep "^tcp.*[[:space:]]+::ffff:$_IP:.*ESTABLISHED" | awk '{print $4" "$5}' >> $connfile
238 while read dest src; do
239 srcip=`echo $src | sed -e "s/:[^:]*$//"`
240 srcport=`echo $src | sed -e "s/^.*://"`
241 destip=`echo $dest | sed -e "s/:[^:]*$//"`
242 destport=`echo $dest | sed -e "s/^.*://"`
243 echo "Killing TCP connection $srcip:$srcport $destip:$destport"
244 ctdb killtcp $srcip:$srcport $destip:$destport >/dev/null 2>&1 || _failed=1
246 # we only do one-way killtcp for CIFS
248 # for all others we do 2-way
250 ctdb killtcp $destip:$destport $srcip:$srcport >/dev/null 2>&1 || _failed=1
253 _killcount=`expr $_killcount + 1`
257 [ $_failed = 0 ] || {
258 echo "Failed to send killtcp control"
261 [ $_killcount -gt 0 ] || {
265 while netstat -tn |egrep "^tcp.*[[:space:]]+$_IP:.*ESTABLISHED" > /dev/null; do
267 _count=`expr $_count + 1`
268 [ $_count -gt 3 ] && {
269 echo "Timed out killing tcp connections for IP $_IP"
273 echo "killed $_killcount TCP connections to released IP $_IP"
276 ##################################################################
277 # kill off the local end for any TCP connections with the given IP
278 ##################################################################
279 kill_tcp_connections_local_only() {
284 connfile="$CTDB_VARDIR/state/connections.$_IP"
285 netstat -tn |egrep "^tcp.*[[:space:]]+$_IP:.*ESTABLISHED" | awk '{print $4" "$5}' > $connfile
286 netstat -tn |egrep "^tcp.*[[:space:]]+::ffff:$_IP:.*ESTABLISHED" | awk '{print $4" "$5}' >> $connfile
288 while read dest src; do
289 srcip=`echo $src | sed -e "s/:[^:]*$//"`
290 srcport=`echo $src | sed -e "s/^.*://"`
291 destip=`echo $dest | sed -e "s/:[^:]*$//"`
292 destport=`echo $dest | sed -e "s/^.*://"`
293 echo "Killing TCP connection $srcip:$srcport $destip:$destport"
294 ctdb killtcp $srcip:$srcport $destip:$destport >/dev/null 2>&1 || _failed=1
295 _killcount=`expr $_killcount + 1`
299 [ $_failed = 0 ] || {
300 echo "Failed to send killtcp control"
303 [ $_killcount -gt 0 ] || {
307 while netstat -tn |egrep "^tcp.*[[:space:]]+$_IP:.*ESTABLISHED" > /dev/null; do
309 _count=`expr $_count + 1`
310 [ $_count -gt 3 ] && {
311 echo "Timed out killing tcp connections for IP $_IP"
315 echo "killed $_killcount TCP connections to released IP $_IP"
318 ##################################################################
319 # tickle any TCP connections with the given IP
320 ##################################################################
321 tickle_tcp_connections() {
326 connfile="$CTDB_VARDIR/state/connections.$_IP"
327 netstat -tn |egrep "^tcp.*[[:space:]]+$_IP:.*ESTABLISHED" | awk '{print $4" "$5}' > $connfile
328 netstat -tn |egrep "^tcp.*[[:space:]]+::ffff:$_IP:.*ESTABLISHED" | awk '{print $4" "$5}' >> $connfile
330 while read dest src; do
331 srcip=`echo $src | sed -e "s/:[^:]*$//"`
332 srcport=`echo $src | sed -e "s/^.*://"`
333 destip=`echo $dest | sed -e "s/:[^:]*$//"`
334 destport=`echo $dest | sed -e "s/^.*://"`
335 echo "Tickle TCP connection $srcip:$srcport $destip:$destport"
336 ctdb tickle $srcip:$srcport $destip:$destport >/dev/null 2>&1 || _failed=1
337 echo "Tickle TCP connection $destip:$destport $srcip:$srcport"
338 ctdb tickle $destip:$destport $srcip:$srcport >/dev/null 2>&1 || _failed=1
342 [ $_failed = 0 ] || {
343 echo "Failed to send tickle control"
348 ########################################################
349 # start/stop the nfs service on different platforms
350 ########################################################
353 [ -x /etc/init.d/nfsserver ] && {
356 [ -x /etc/init.d/nfslock ] && {
364 service nfsserver start
367 service nfsserver stop > /dev/null 2>&1
370 service nfsserver restart
377 service nfslock start
381 service nfs stop > /dev/null 2>&1
382 service nfslock stop > /dev/null 2>&1
385 service nfslock restart
391 echo "Unknown platform. NFS is not supported with ctdb"
397 ########################################################
398 # start/stop the nfs lockmanager service on different platforms
399 ########################################################
400 startstop_nfslock() {
402 [ -x /etc/init.d/nfsserver ] && {
405 [ -x /etc/init.d/nfslock ] && {
411 # on SLES there is no service for the lock manager,
412 # so instead we just shut down/restart nfs
415 service nfsserver start
418 service nfsserver stop > /dev/null 2>&1
421 service nfsserver stop
422 service nfsserver start
429 service nfslock start
432 service nfslock stop > /dev/null 2>&1
436 service nfslock start
441 echo "Unknown platform. NFS locking is not supported with ctdb"
447 # prefer delete_ip_from_iface() together with add_ip_to_iface();
448 # remove_ip should be removed in the future
450 local _ip_maskbits=$1
452 local _ip=`echo "$_ip_maskbits" | cut -d '/' -f1`
453 local _maskbits=`echo "$_ip_maskbits" | cut -d '/' -f2`
455 delete_ip_from_iface "$_iface" "$_ip" "$_maskbits"
464 local _state_dir="$CTDB_VARDIR/state/interface_modify"
465 local _lockfile="$_state_dir/$_iface.flock"
466 local _readd_base="$_state_dir/$_iface.readd.d"
468 mkdir -p $_state_dir || {
470 echo "Failed to mkdir -p $_state_dir - $ret"
474 test -f $_lockfile || {
478 flock --timeout 30 $_lockfile $CTDB_BASE/interface_modify.sh add "$_iface" "$_ip" "$_maskbits" "$_readd_base"
482 delete_ip_from_iface()
487 local _state_dir="$CTDB_VARDIR/state/interface_modify"
488 local _lockfile="$_state_dir/$_iface.flock"
489 local _readd_base="$_state_dir/$_iface.readd.d"
491 mkdir -p $_state_dir || {
493 echo "Failed to mkdir -p $_state_dir - $ret"
497 test -f $_lockfile || {
501 flock --timeout 30 $_lockfile $CTDB_BASE/interface_modify.sh delete "$_iface" "$_ip" "$_maskbits" "$_readd_base"
505 setup_iface_ip_readd_script()
510 local _readd_script=$4
511 local _state_dir="$CTDB_VARDIR/state/interface_modify"
512 local _lockfile="$_state_dir/$_iface.flock"
513 local _readd_base="$_state_dir/$_iface.readd.d"
515 mkdir -p $_state_dir || {
517 echo "Failed to mkdir -p $_state_dir - $ret"
521 test -f $_lockfile || {
525 flock --timeout 30 $_lockfile $CTDB_BASE/interface_modify.sh readd_script "$_iface" "$_ip" "$_maskbits" "$_readd_base" "$_readd_script"
529 ########################################################
530 # some simple logic for counting events - per eventscript
531 # usage: ctdb_counter_init
533 # ctdb_check_counter_limit <limit>
534 # ctdb_check_counter_limit succeeds when count >= <limit>
535 ########################################################
536 _ctdb_counter_common () {
537 _counter_file="$ctdb_fail_dir/$service_name"
538 mkdir -p "${_counter_file%/*}" # dirname
540 ctdb_counter_init () {
545 ctdb_counter_incr () {
549 echo -n 1 >> "$_counter_file"
551 ctdb_check_counter_limit () {
554 _limit="${1:-${service_fail_limit}}"
558 _size=$(stat -c "%s" "$_counter_file" 2>/dev/null || echo 0)
559 if [ $_size -ge $_limit ] ; then
560 echo "ERROR: more than $_limit consecutive failures for $service_name, marking cluster unhealthy"
562 elif [ $_size -gt 0 -a -z "$_quiet" ] ; then
563 echo "WARNING: less than $_limit consecutive failures ($_size) for $service_name, not unhealthy yet"
566 ########################################################
# Spool directory layout shared by the helpers in this file:
#   ctdb_status_dir - per-script / per-service status files
#                     (unhealthy, banned, reconfigure)
#   ctdb_fail_dir   - per-service failure counter files
#   ctdb_active_dir - per-service markers tested by ctdb_start_stop_service
568 ctdb_spool_dir="/var/spool/ctdb"
569 ctdb_status_dir="$ctdb_spool_dir/status"
570 ctdb_fail_dir="$ctdb_spool_dir/failcount"
571 ctdb_active_dir="$ctdb_spool_dir/active"
575 echo "node is \"$1\", \"${script_name}\" reports problem: $(cat $2)"
580 if [ -r "$ctdb_status_dir/$script_name/unhealthy" ] ; then
581 log_status_cat "unhealthy" "$ctdb_status_dir/$script_name/unhealthy"
583 elif [ -r "$ctdb_status_dir/$script_name/banned" ] ; then
584 log_status_cat "banned" "$ctdb_status_dir/$script_name/banned"
593 d="$ctdb_status_dir/$script_name"
600 for i in "banned" "unhealthy" ; do
607 ctdb_service_needs_reconfigure ()
609 [ -e "$ctdb_status_dir/$service_name/reconfigure" ]
612 ctdb_service_set_reconfigure ()
614 d="$ctdb_status_dir/$service_name"
619 ctdb_service_unset_reconfigure ()
621 rm -f "$ctdb_status_dir/$service_name/reconfigure"
624 ctdb_service_reconfigure ()
626 if [ -n "$service_reconfigure" ] ; then
627 eval $service_reconfigure
629 service "$service_name" restart
631 ctdb_service_unset_reconfigure
635 ctdb_compat_managed_service ()
637 if [ "$1" = "yes" ] ; then
642 is_ctdb_managed_service ()
644 t=" $CTDB_MANAGED_SERVICES "
646 ctdb_compat_managed_service "$CTDB_MANAGES_VSFTPD" "vsftpd"
647 ctdb_compat_managed_service "$CTDB_MANAGES_SAMBA" "samba"
648 ctdb_compat_managed_service "$CTDB_MANAGES_SCP" "scp"
649 ctdb_compat_managed_service "$CTDB_MANAGES_WINDBIND" "windbind"
650 ctdb_compat_managed_service "$CTDB_MANAGES_HTTPD" "httpd"
651 ctdb_compat_managed_service "$CTDB_MANAGES_ISCSI" "iscsi"
652 ctdb_compat_managed_service "$CTDB_MANAGES_CLAMD" "clamd"
653 ctdb_compat_managed_service "$CTDB_MANAGES_NFS" "nfs"
655 # Returns 0 if "<space>$service_name<space>" appears in $t
656 [ "${t#* ${service_name} }" != "${t}" ]
659 ctdb_start_stop_service ()
661 _active="$ctdb_active_dir/$service_name"
663 if is_ctdb_managed_service ; then
664 if ! [ -e "$_active" ] ; then
665 echo "Starting service $service_name"
666 ctdb_service_start || exit $?
667 mkdir -p "$ctdb_active_dir"
671 elif ! is_ctdb_managed_service ; then
672 if [ -e "$_active" ] ; then
673 echo "Stopping service $service_name"
674 ctdb_service_stop || exit $?
681 ctdb_service_start ()
683 if [ -n "$service_start" ] ; then
686 service "$service_name" start
693 if [ -n "$service_stop" ] ; then
696 service "$service_name" stop
700 ctdb_standard_event_handler ()
715 ipv4_host_addr_to_net_addr()
720 local HOST0=$(echo $HOST | awk -F . '{print $4}')
721 local HOST1=$(echo $HOST | awk -F . '{print $3}')
722 local HOST2=$(echo $HOST | awk -F . '{print $2}')
723 local HOST3=$(echo $HOST | awk -F . '{print $1}')
725 local HOST_NUM=$(( $HOST0 + $HOST1 * 256 + $HOST2 * (256 ** 2) + $HOST3 * (256 ** 3) ))
727 local MASK_NUM=$(( ( (2**32 - 1) * (2**(32 - $MASKBITS)) ) & (2**32 - 1) ))
729 local NET_NUM=$(( $HOST_NUM & $MASK_NUM))
731 local NET0=$(( $NET_NUM & 255 ))
732 local NET1=$(( ($NET_NUM & (255 * 256)) / 256 ))
733 local NET2=$(( ($NET_NUM & (255 * 256**2)) / 256**2 ))
734 local NET3=$(( ($NET_NUM & (255 * 256**3)) / 256**3 ))
736 echo "$NET3.$NET2.$NET1.$NET0"
739 ipv4_maskbits_to_net_mask()
743 local MASK_NUM=$(( ( (2**32 - 1) * (2**(32 - $MASKBITS)) ) & (2**32 - 1) ))
745 local MASK0=$(( $MASK_NUM & 255 ))
746 local MASK1=$(( ($MASK_NUM & (255 * 256)) / 256 ))
747 local MASK2=$(( ($MASK_NUM & (255 * 256**2)) / 256**2 ))
748 local MASK3=$(( ($MASK_NUM & (255 * 256**3)) / 256**3 ))
750 echo "$MASK3.$MASK2.$MASK1.$MASK0"
758 local N=`echo $ADDR | sed -e 's/[0-9][0-9]*\.[0-9][0-9]*\.[0-9][0-9]*\.[0-9][0-9]*//'`
759 test -n "$N" && fail=1
761 local ADDR0=$(echo $ADDR | awk -F . '{print $4}')
762 local ADDR1=$(echo $ADDR | awk -F . '{print $3}')
763 local ADDR2=$(echo $ADDR | awk -F . '{print $2}')
764 local ADDR3=$(echo $ADDR | awk -F . '{print $1}')
766 test "$ADDR0" -gt 255 && fail=1
767 test "$ADDR1" -gt 255 && fail=1
768 test "$ADDR2" -gt 255 && fail=1
769 test "$ADDR3" -gt 255 && fail=1
771 test x"$fail" != x"0" && {
772 #echo "IPv4: '$ADDR' is not a valid address"
779 # iptables doesn't like being re-entered, so flock-wrap it.
782 flock -w 30 /var/ctdb/iptables-ctdb.flock /sbin/iptables "$@"
785 ########################################################
787 ########################################################
789 # Temporary directory for tickles.
790 tickledir="$CTDB_VARDIR/state/tickles"
791 mkdir -p "$tickledir"
797 mkdir -p "$tickledir" # Just in case
800 _pnn=$(ctdb pnn) ; _pnn=${_pnn#PNN:}
802 # What public IPs do I hold?
803 _ips=$(ctdb -Y ip | awk -F: -v pnn=$_pnn '$3 == pnn {print $2}')
805 # IPs as a regexp choice
806 _ipschoice="($(echo $_ips | sed -e 's/ /|/g' -e 's/\./\\\\./g'))"
808 # Record connections to our public IPs in a temporary file
809 _my_connections="${tickledir}/${_port}.connections"
810 rm -f "$_my_connections"
812 awk -v destpat="^${_ipschoice}:${_port}\$" \
813 '$1 == "tcp" && $6 == "ESTABLISHED" && $4 ~ destpat {print $5, $4}' |
814 sort >"$_my_connections"
816 # Record our current tickles in a temporary file
817 _my_tickles="${tickledir}/${_port}.tickles"
820 ctdb -Y gettickles $_i $_port |
821 awk -F: 'NR > 1 { printf "%s:%s %s:%s\n", $2, $3, $4, $5 }'
825 # Add tickles for connections that we haven't already got tickles for
826 comm -23 "$_my_connections" "$_my_tickles" |
827 while read _src _dst ; do
828 ctdb addtickle $_src $_dst
831 # Remove tickles for connections that are no longer there
832 comm -13 "$_my_connections" "$_my_tickles" |
833 while read _src _dst ; do
834 ctdb deltickle $_src $_dst
837 rm -f "$_my_connections" "$_my_tickles"
840 ########################################################
841 # load a site local config file
842 ########################################################
844 [ -x $CTDB_BASE/rc.local ] && {
845 . $CTDB_BASE/rc.local
848 [ -d $CTDB_BASE/rc.local.d ] && {
849 for i in $CTDB_BASE/rc.local.d/* ; do
850 [ -x "$i" ] && . "$i"
# Default names, derived from how the script was invoked: $0 with any
# leading directory components stripped.
854 script_name="${0##*/}" # basename
855 service_name="$script_name" # default is just the script name