When memory allocations for recovery fails,
[metze/ctdb/wip.git] / config / ctdb.init
1 #!/bin/sh
2 #
3 ##############################
4 # ctdb:                        Starts the clustered tdb daemon
5 #
6 # chkconfig:           - 90 01
7 #
8 # description:                 Starts and stops the clustered tdb daemon
9 # pidfile:             /var/run/ctdbd/ctdbd.pid
10 #
11
12 ### BEGIN INIT INFO
13 # Provides:            ctdb
14 # Required-Start:      $network
15 # Required-Stop:       $network
16 # Default-Stop:
17 # Default-Start:       3 5
18 # Short-Description:   start and stop ctdb service
19 # Description:         initscript for the ctdb service
20 ### END INIT INFO
21
22 # Source function library.
23 if [ -f /etc/init.d/functions ] ; then
24     . /etc/init.d/functions
25 elif [ -f /etc/rc.d/init.d/functions ] ; then
26     . /etc/rc.d/init.d/functions
27 fi
28
29 [ -f /etc/rc.status ] && {
30     . /etc/rc.status
31     rc_reset
32     LC_ALL=en_US.UTF-8
33 }
34
35 # Avoid using root's TMPDIR
36 unset TMPDIR
37
38 [ -z "$CTDB_BASE" ] && {
39     export CTDB_BASE="/etc/ctdb"
40 }
41
42 . $CTDB_BASE/functions
43 loadconfig network
44 loadconfig ctdb
45
46 # check networking is up (for redhat)
47 [ "$NETWORKING" = "no" ] && exit 0
48
49 detect_init_style
50 export CTDB_INIT_STYLE
51
52 ctdbd=${CTDBD:-/usr/sbin/ctdbd}
53
54 if [ "$CTDB_VALGRIND" = "yes" ]; then
55     init_style="valgrind"
56 else
57     init_style="$CTDB_INIT_STYLE"
58 fi
59
60 build_ctdb_options () {
61
62     maybe_set () {
63         # If the 2nd arg is null then return - don't set anything.
64         # Else if the 3rd arg is set and it doesn't match the 2nd arg
65         # then return
66         [ -z "$2" -o \( -n "$3" -a "$3" != "$2" \) ] && return
67
68         val="$2"
69         case "$1" in
70             --*) sep="=" ;;
71             -*)  sep=" " ;;
72         esac
73         # For these options we're only passing a value-less flag.
74         [ -n "$3" ] && {
75             val=""
76             sep=""
77         }
78
79         CTDB_OPTIONS="${CTDB_OPTIONS}${CTDB_OPTIONS:+ }${1}${sep}${val}"
80     }
81
82     [ -z "$CTDB_RECOVERY_LOCK" ] && {
83         echo "No recovery lock specified. Starting CTDB without split brain prevention"
84     }
85     maybe_set "--reclock"                "$CTDB_RECOVERY_LOCK"
86
87     # build up CTDB_OPTIONS variable from optional parameters
88     maybe_set "--logfile"                "$CTDB_LOGFILE"
89     maybe_set "--nlist"                  "$CTDB_NODES"
90     maybe_set "--socket"                 "$CTDB_SOCKET"
91     maybe_set "--public-addresses"       "$CTDB_PUBLIC_ADDRESSES"
92     maybe_set "--public-interface"       "$CTDB_PUBLIC_INTERFACE"
93     maybe_set "--dbdir"                  "$CTDB_DBDIR"
94     maybe_set "--dbdir-persistent"       "$CTDB_DBDIR_PERSISTENT"
95     maybe_set "--event-script-dir"       "$CTDB_EVENT_SCRIPT_DIR"
96     maybe_set "--transport"              "$CTDB_TRANSPORT"
97     maybe_set "-d"                       "$CTDB_DEBUGLEVEL"
98     maybe_set "--notification-script"    "$CTDB_NOTIFY_SCRIPT"
99     maybe_set "--start-as-disabled"      "$CTDB_START_AS_DISABLED"    "yes"
100     maybe_set "--start-as-stopped "      "$CTDB_START_AS_STOPPED"     "yes"
101     maybe_set "--no-recmaster"           "$CTDB_CAPABILITY_RECMASTER" "no"
102     maybe_set "--no-lmaster"             "$CTDB_CAPABILITY_LMASTER"   "no"
103     maybe_set "--lvs --single-public-ip" "$CTDB_LVS_PUBLIC_IP"
104     maybe_set "--script-log-level"       "$CTDB_SCRIPT_LOG_LEVEL"
105     maybe_set "--syslog"                 "$CTDB_SYSLOG"               "yes"
106     maybe_set "--max-persistent-check-errors" "$CTDB_MAX_PERSISTENT_CHECK_ERRORS"
107 }
108
109 check_tdb () {
110         local PDBASE=$1
111
112         local TDBTOOL_HAS_CHECK=`echo "help" | /usr/bin/tdbtool | grep check | wc -l`
113
114         test x"$TDBTOOL_HAS_CHECK" = x"1" && {
115                 #
116                 # Note tdbtool always exits with 0
117                 #
118                 local OK=`/usr/bin/tdbtool $PDBASE check | grep "Database integrity is OK" | wc -l`
119                 test x"$OK" = x"1" || {
120                         return 1;
121                 }
122
123                 return 0;
124         }
125
126         /usr/bin/tdbdump $PDBASE >/dev/null 2>/dev/null || {
127                 return $?;
128         }
129
130         return 0;
131 }
132
133 check_persistent_databases () {
134     PERSISTENT_DB_DIR="${CTDB_DBDIR:-/var/ctdb}/persistent"
135     mkdir -p $PERSISTENT_DB_DIR 2>/dev/null
136     local ERRCOUNT=$CTDB_MAX_PERSISTENT_CHECK_ERRORS
137
138     test -z "$ERRCOUNT" && {
139         ERRCOUNT="0"
140     }
141     test x"$ERRCOUNT" != x"0" && {
142         return 0;
143     }
144     for PDBASE in `ls $PERSISTENT_DB_DIR/*.tdb.[0-9] 2>/dev/null`; do
145         check_tdb $PDBASE || {
146             echo "Persistent database $PDBASE is corrupted! CTDB will not start."
147             return 1
148         }
149     done
150 }
151
152 set_ctdb_variables () {
153     # set any tunables from the config file
154     set | grep ^CTDB_SET_ | cut -d_ -f3- | 
155     while read v; do
156         varname=`echo $v | cut -d= -f1`
157         value=`echo $v | cut -d= -f2`
158         ctdb setvar $varname $value || RETVAL=1
159     done || exit 1
160 }
161
162 set_retval() {
163     return $1
164 }
165
166 ctdbd=${CTDBD:-/usr/sbin/ctdbd}
167
168 start() {
169     echo -n $"Starting ctdbd service: "
170
171     ctdb ping >/dev/null 2>&1 && {
172         echo $"CTDB is already running"
173         return 1
174     }
175
176     build_ctdb_options
177
178     check_persistent_databases || return $?
179
180     if [ yes == "$CTDB_SUPPRESS_COREFILE" ]; then
181         ulimit -c 0
182     else
183         ulimit -c unlimited
184     fi
185
186     case $init_style in
187         valgrind)
188             valgrind -q --log-file=/var/log/ctdb_valgrind \
189                 $ctdbd --valgrinding $CTDB_OPTIONS
190             RETVAL=$?
191             echo
192             ;;
193         suse)
194             startproc $ctdbd $CTDB_OPTIONS
195             rc_status -v
196             RETVAL=$?
197             ;;
198         redhat)
199             daemon $ctdbd $CTDB_OPTIONS
200             RETVAL=$?
201             echo
202             [ $RETVAL -eq 0 ] && touch /var/lock/subsys/ctdb || RETVAL=1
203             ;;
204         debian)
205             start-stop-daemon --start --quiet --background \
206                 --exec $ctdbd -- $CTDB_OPTIONS
207             RETVAL=$?
208             ;;
209     esac
210
211     sleep 1
212
213     set_ctdb_variables
214
215     return $RETVAL
216 }       
217
218 stop() {
219     echo -n $"Shutting down ctdbd service: "
220     pkill -0 -f $ctdbd || {
221         echo -n "  Warning: ctdbd not running ! "
222         case $init_style in
223             suse)
224                 rc_status -v
225                 ;;
226             redhat)
227                 echo ""
228                 ;;
229         esac
230         return 0
231     }
232     ctdb shutdown >/dev/null 2>&1
233     RETVAL=$?
234     count=0
235     while pkill -0 -f $ctdbd ; do
236         sleep 1
237         count=$(($count + 1))
238         [ $count -gt 10 ] && {
239             echo -n $"killing ctdbd "
240             pkill -9 -f $ctdbd
241             pkill -9 -f $CTDB_BASE/events.d/
242         }
243     done
244     case $init_style in
245         suse)
246             # re-set the return code to the recorded RETVAL in order
247             # to print the correct status message
248             set_retval $RETVAL
249             rc_status -v
250             ;;
251         redhat)
252             [ $RETVAL -eq 0 ] && success || failure
253             [ $RETVAL -eq 0 ] && rm -f /var/lock/subsys/ctdb
254             echo ""
255             ;;
256     esac
257     return $RETVAL
258 }
259
260 restart() {
261     stop
262     start
263 }       
264
265 status() {
266     echo -n $"Checking for ctdbd service: "
267     ctdb ping >/dev/null 2>&1 || {
268         RETVAL=$?
269         echo -n "  ctdbd not running. "
270         case $init_style in
271             suse)
272                 set_retval $RETVAL
273                 rc_status -v
274                 ;;
275             redhat)
276                 echo ""
277                 ;;
278         esac
279         return $RETVAL
280     }
281     echo ""
282     ctdb status
283 }
284
285
286 case "$1" in
287     start)
288         start
289         ;;
290     stop)
291         stop
292         ;;
293     restart|reload)
294         restart
295         ;;
296     status)
297         status
298         ;;
299     condrestart)
300         ctdb status > /dev/null && restart || :
301         ;;
302     cron)
303         # used from cron to auto-restart ctdb
304         ctdb status > /dev/null || restart
305         ;;
306     *)
307         echo $"Usage: $0 {start|stop|restart|status|cron|condrestart}"
308         exit 1
309 esac
310
311 exit $?