ctdb/config/functions

   1 # Hey Emacs, this is a -*- shell-script -*- !!!
   2
   3 # utility functions for ctdb event scripts
   4
   # Put the standard system directories at the front of the search path.
   PATH=/bin:/usr/bin:/usr/sbin:/sbin:$PATH

   # Default CTDB_VARDIR: use /var/lib/ctdb when that directory exists,
   # otherwise /var/ctdb.  A value that is already set is left alone.
   if [ -z "$CTDB_VARDIR" ] ; then
       if [ -d "/var/lib/ctdb" ] ; then
           CTDB_VARDIR="/var/lib/ctdb"
       else
           CTDB_VARDIR="/var/ctdb"
       fi
       export CTDB_VARDIR
   fi

   # Default CTDB_ETCDIR to /etc unless it is already set.
   if [ -z "$CTDB_ETCDIR" ] ; then
       CTDB_ETCDIR="/etc"
       export CTDB_ETCDIR
   fi
  17
  #######################################
  # Pull in a system config file, if any.
  #
  # usage: _loadconfig [NAME]
  #
  # With no NAME, $service_config (or, failing that, $service_name) is
  # loaded via loadconfig().  The "ctdb" configuration is always loaded
  # before any other NAME.  NAME is looked up, in order, in
  # $CTDB_ETCDIR/sysconfig, $CTDB_ETCDIR/default and $CTDB_BASE/sysconfig;
  # the first file found is sourced into the current shell.
  _loadconfig() {

      if [ -z "$1" ] ; then
          _config="${service_config:-${service_name}}"
          if [ -n "$_config" ] ; then
              loadconfig "$_config"
              return
          fi
      fi

      if [ "$1" != "ctdb" ] ; then
          loadconfig "ctdb"
      fi

      if [ -z "$1" ] ; then
          return
      fi

      # Paths are quoted so that a configuration directory containing
      # whitespace or glob characters is still handled correctly.
      if [ -f "$CTDB_ETCDIR/sysconfig/$1" ]; then
          . "$CTDB_ETCDIR/sysconfig/$1"
      elif [ -f "$CTDB_ETCDIR/default/$1" ]; then
          . "$CTDB_ETCDIR/default/$1"
      elif [ -f "$CTDB_BASE/sysconfig/$1" ]; then
          . "$CTDB_BASE/sysconfig/$1"
      fi
  }
  46
  # Load configuration by forwarding all arguments to _loadconfig().
  loadconfig ()
  {
      _loadconfig "$@"
  }
  50
  51 ##############################################################
  52
  # Emit debug output, but only when CTDB_SCRIPT_DEBUGLEVEL (default 2)
  # is at least 4.  The level can be overridden by setting it in a
  # configuration file.
  #
  # usage: debug [MESSAGE ...]
  debug ()
  {
      [ ${CTDB_SCRIPT_DEBUGLEVEL:-2} -ge 4 ] || return 0

      # Arguments take precedence and are echoed as a single line.
      if [ -n "$1" ] ; then
          echo "DEBUG: $*"
          return
      fi

      # No arguments: prefix every line of stdin instead, which lets
      # callers pass lots of debug via a here document or a pipe.
      # Nothing is read when stdin is a terminal.
      if ! tty -s ; then
          sed -e 's@^@DEBUG: @'
      fi
  }
  68
  # Print a message on stdout and terminate the current (sub)shell.
  # $1 is the message, $2 is the exit status (default 1).
  die ()
  {
      echo "$1"
      exit ${2:-1}
  }
  77
  # Log the given message, or stdin when no message is given, to either
  # syslog or a CTDB log file.
  #
  # usage: script_log TAG [MESSAGE ...]
  #
  # TAG is passed to logger (prefixed with "ctdbd: ") if syslog is in use.
  # Syslog is used when CTDB_SYSLOG is "yes", when CTDB_LOGFILE is empty,
  # or when CTDB_OPTIONS contains "--syslog".  Otherwise the message is
  # appended to $CTDB_LOGFILE.
  script_log ()
  {
      _tag="$1" ; shift

      _using_syslog=false
      if [ "$CTDB_SYSLOG" = "yes" ] || [ -z "$CTDB_LOGFILE" ] ; then
          _using_syslog=true
      fi
      case "$CTDB_OPTIONS" in
          *--syslog*) _using_syslog=true ;;
      esac

      if $_using_syslog ; then
          if [ -n "$*" ] ; then
              # Pass the message as one quoted word so that it is not
              # glob-expanded against the current directory.
              logger -t "ctdbd: ${_tag}" "$*"
          else
              # No message: logger is invoked without one, leaving
              # stdin available to it.
              logger -t "ctdbd: ${_tag}"
          fi
      else
          {
              if [ -n "$*" ] ; then
                  echo "$*"
              else
                  cat
              fi
          } >>"${CTDB_LOGFILE:-/var/log/log.ctdb}"
      fi
  }
 104
 # When things are run in the background in an eventscript their output
 # might get lost.  This runs the given command in the background with
 # stdin from /dev/null and feeds its combined stdout/stderr to
 # script_log(), tagged with "${script_name}&".  Always returns 0.
 background_with_logging ()
 {
     {
         "$@" 2>&1 </dev/null | script_log "${script_name}&"
     } &

     return 0
 }
 116
 ##############################################################
 # Check the number of arguments for different events.
 #
 # usage: ctdb_check_args "$@"
 #
 # $1 is the event name.  takeip/releaseip need 4 arguments in total,
 # updateip needs 5.  On a mismatch an error is printed and the script
 # exits with status 1.  Other events are not checked.
 ctdb_check_args ()
 {
     case "$1" in
         takeip|releaseip)
             [ $# != 4 ] || return 0
             echo "ERROR: must supply interface, IP and maskbits"
             exit 1
             ;;
         updateip)
             [ $# != 5 ] || return 0
             echo "ERROR: must supply old interface, new interface, IP and maskbits"
             exit 1
             ;;
     esac
 }
 136
 ##############################################################
 # Determine on what type of system (init style) we are running.
 #
 # Sets CTDB_INIT_STYLE to "suse", "debian" or "redhat" depending on
 # which helper binary is executable.  A value that is already set is
 # kept as is.
 detect_init_style() {
     # An explicit setting always wins - skip detection.
     if [ -n "$CTDB_INIT_STYLE" ] ; then
         return
     fi

     CTDB_INIT_STYLE="redhat"
     if [ -x /sbin/startproc ]; then
         CTDB_INIT_STYLE="suse"
     elif [ -x /sbin/start-stop-daemon ]; then
         CTDB_INIT_STYLE="debian"
     fi
 }
 151
 ######################################################
 # Simulate /sbin/service on platforms that don't have it.
 # _service() makes it easier to hook the service() function for
 # testing.
 #
 # usage: _service SERVICE_NAME OPERATION
 #
 # The command is prefixed with $_nice, which the callers in this file
 # set to either "" or "nice".
 _service ()
 {
     _service_name="$1"
     _op="$2"

     # Do nothing when no service was specified.
     if [ -z "$_service_name" ] ; then
         return
     fi

     # Prefer /sbin/service, then fall back to running the init script
     # directly from one of the usual locations.
     if [ -x /sbin/service ]; then
         $_nice /sbin/service "$_service_name" "$_op"
         return
     fi
     if [ -x $CTDB_ETCDIR/init.d/$_service_name ]; then
         $_nice $CTDB_ETCDIR/init.d/$_service_name "$_op"
         return
     fi
     if [ -x $CTDB_ETCDIR/rc.d/init.d/$_service_name ]; then
         $_nice $CTDB_ETCDIR/rc.d/init.d/$_service_name "$_op"
     fi
 }
 172
 # Run a service operation at normal priority: clears $_nice and hands
 # all arguments to _service().
 service()
 {
     _nice=""

     _service "$@"
 }
 178
 ######################################################
 # Simulate /sbin/service (niced) on platforms that don't have it.
 # Sets $_nice to "nice" and hands all arguments to _service().
 nice_service()
 {
     _nice="nice"

     _service "$@"
 }
 186
 ######################################################
 # Wrapper around /proc/ settings to allow them to be hooked
 # for testing.
 #
 # usage: set_proc PATH VALUE
 #
 # PATH is relative to /proc/, VALUE is the value written to it.
 set_proc ()
 {
     echo "$2" >"/proc/$1"
 }
 195
 ######################################################
 # Wrapper around getting file contents from /proc/ to allow
 # this to be hooked for testing.
 #
 # usage: get_proc PATH
 #
 # PATH is relative to /proc/; the file contents go to stdout.
 get_proc ()
 {
     cat "/proc/$1"
 }
 204
 ######################################################
 # Check that an RPC service is healthy.  A certain number of
 # failures is tolerated before the configured actions are run.
 #
 # usage: nfs_check_rpc_service SERVICE_NAME [ triple ...]
 #
 # Each triple is a set of 3 arguments: a comparison operator, a
 # fail count limit and an action string.
 #
 # For example:
 #
 #       nfs_check_rpc_service "lockd" \
 #           -ge 15 "verbose restart unhealthy" \
 #           -eq 10 "restart:bs"
 #
 # says that if lockd is down for 15 iterations then do a verbose
 # restart of lockd and mark the node unhealthy.  Before this, after
 # 10 iterations of failure, the service is restarted silently in the
 # background.  Order is important: the number of failures needs to
 # be specified in reverse order because processing stops after the
 # first condition that is true.
 ######################################################
 nfs_check_rpc_service ()
 {
     _prog_name="$1" ; shift

     # Service is up (or not applicable): nothing more to do.
     _nfs_check_rpc_common "$_prog_name" && return

     # Walk the remaining arguments three at a time until one of the
     # triples fires or no complete triple is left.
     until [ -z "$3" ] ; do
         _nfs_check_rpc_action "$1" "$2" "$3" && break
         shift 3
     done
 }
 244
 # The new way of doing things...
 #
 # Check every RPC service that has a file named NN.<service>.check in
 # $CTDB_BASE/nfs-rpc-checks.d/.  For a service that is down, each line
 # of its file ("operator limit actions...") is tried in turn via
 # _nfs_check_rpc_action() until one of the limits is hit.  Lines whose
 # first field starts with '#' are skipped.
 nfs_check_rpc_services ()
 {
     # Files must end with .check - avoids editor backups, RPM fu, ...
     for _f in "${CTDB_BASE}/nfs-rpc-checks.d/"[0-9][0-9].*.check ; do
         # When nothing matches, the shell hands back the unexpanded
         # pattern.  Skip it rather than treating the pattern as the
         # name of an RPC program.
         [ -f "$_f" ] || continue

         _t="${_f%.check}"
         _prog_name="${_t##*/[0-9][0-9].}"

         if _nfs_check_rpc_common "$_prog_name" ; then
             # This RPC service is up, check next service...
             continue
         fi

         # Check each line in the file in turn until one of the limit
         # checks is hit...
         while read _cmp _lim _rest ; do
             # Skip comments
             case "$_cmp" in
                 \#*) continue ;;
             esac

             if _nfs_check_rpc_action "$_cmp" "$_lim" "$_rest" ; then
                 # Limit was hit on this line, no further checking...
                 break
             fi
         done <"$_f"
     done
 }
 273
 # Common part of the RPC service checks.
 #
 # usage: _nfs_check_rpc_common PROG_NAME
 #
 # Sets up the globals used by _nfs_check_rpc_action() for PROG_NAME
 # (_rpc_prog, _version, _restart, _opts, _service_name), then checks
 # the service with ctdb_check_rpc().  On success the failure counter
 # is reset and 0 is returned; on failure the counter is incremented
 # and 1 is returned.  An unknown PROG_NAME exits the script.
 _nfs_check_rpc_common ()
 {
     _prog_name="$1"

     # Some platforms don't have separate programs for all services.
     # If there is no rpc.statd then report the service as fine.
     if [ "$_prog_name" = "statd" ] ; then
         which "rpc.${_prog_name}" >/dev/null 2>&1 || return 0
     fi

     # Defaults, overridden per program below.
     _rpc_prog="$_prog_name"
     _version=1
     _restart=""
     _opts=""

     case "$_prog_name" in
         nfsd)
             _rpc_prog=nfs
             _version=3
             _restart="echo 'Trying to restart NFS service'; startstop_nfs restart"
             ;;
         mountd)
             _opts="${MOUNTD_PORT:+ -p ${MOUNTD_PORT}}"
             ;;
         rquotad)
             _opts="${RQUOTAD_PORT:+ -p ${RQUOTAD_PORT}}"
             ;;
         lockd)
             _rpc_prog=nlockmgr
             _version=4
             _restart="echo 'Trying to restart lock manager service'; startstop_nfslock restart"
             ;;
         statd)
             _rpc_prog=status
             _opts="${STATD_HOSTNAME:+ -n ${STATD_HOSTNAME}}"
             _opts="${_opts}${STATD_PORT:+ -p ${STATD_PORT}}"
             _opts="${_opts}${STATD_OUTGOING_PORT:+ -o ${STATD_OUTGOING_PORT}}"
             ;;
         *)
             echo "Internal error: unknown RPC program \"$_prog_name\"."
             exit 1
     esac

     _service_name="nfs_${_prog_name}"

     if ! ctdb_check_rpc "$_rpc_prog" $_version >/dev/null ; then
         # Another consecutive failure.
         ctdb_counter_incr "$_service_name"
         return 1
     fi

     # Service answered: start counting from scratch.
     ctdb_counter_init "$_service_name"
     return 0
 }
 329
 # Run the actions of one (operator, limit, actions) triple if the
 # failure counter of $_service_name satisfies "count OPERATOR LIMIT".
 #
 # usage: _nfs_check_rpc_action OPERATOR LIMIT ACTIONS
 #
 # ACTIONS is a whitespace separated list of:
 #   verbose          - print the output of the last RPC check
 #   restart[:FLAGS]  - restart the service; FLAGS may contain
 #                      q (quiet), s (stealthy) and b (background)
 #   unhealthy        - exit the script with status 1
 #
 # Returns 1 when the limit was not hit, 0 after running the actions.
 # Relies on the globals set by _nfs_check_rpc_common().
 _nfs_check_rpc_action ()
 {
     _cmp="$1"
     _limit="$2"
     _actions="$3"

     # In "quiet" mode ctdb_check_counter succeeds while the comparison
     # does not hold, which means this triple does not apply.
     ctdb_check_counter "quiet" "$_cmp" "$_limit" "$_service_name" && return 1

     for _action in $_actions ; do
         case "$_action" in
             verbose)
                 echo "$ctdb_check_rpc_out"
                 ;;
             restart|restart:*)
                 # No explicit command specified, construct rpc command.
                 if [ -z "$_restart" ] ; then
                     _p="rpc.${_prog_name}"
                     _restart="echo 'Trying to restart $_prog_name [${_p}${_opts}]'; killall -q -9 $_p; $_p $_opts"
                 fi

                 # Extract the restart flags; there may not have been
                 # a colon, in which case there are none.
                 case "$_action" in
                     restart:*) _flags="${_action#restart:}" ;;
                     *)         _flags="" ;;
                 esac

                 # q=quiet - everything to /dev/null
                 case "$_flags" in
                     *q*) _restart="{ ${_restart} ; } >/dev/null 2>&1" ;;
                 esac
                 # s=stealthy - last command to /dev/null
                 case "$_flags" in
                     *s*) _restart="${_restart} >/dev/null 2>&1" ;;
                 esac
                 # b=background - the whole thing, easy and reliable
                 case "$_flags" in
                     *b*) _restart="{ ${_restart} ; } &" ;;
                 esac

                 # Do it!
                 eval "${_restart}"
                 ;;
             unhealthy)
                 exit 1
                 ;;
             *)
                 echo "Internal error: unknown action \"$_action\"."
                 exit 1
         esac
     done

     return 0
 }
 385
 ######################################################
 # Check that an RPC server answers a UDP request on localhost,
 # using "rpcinfo -u".
 #
 # usage: ctdb_check_rpc SERVICE_NAME VERSION
 #
 # The rpcinfo output is kept in $ctdb_check_rpc_out.  On failure it
 # is prefixed with an error line, printed, and 1 is returned.
 ######################################################
 ctdb_check_rpc ()
 {
     progname="$1"
     version="$2"

     ctdb_check_rpc_out=$(rpcinfo -u localhost $progname $version 2>&1) && return 0

     ctdb_check_rpc_out="ERROR: $progname failed RPC check:
$ctdb_check_rpc_out"
     echo "$ctdb_check_rpc_out"
     return 1
 }
 403
 ######################################################
 # Ensure $service_name is set; otherwise die() with an
 # internal error message.
 assert_service_name ()
 {
     if [ -z "$service_name" ] ; then
         die "INTERNAL ERROR: \$service_name not set"
     fi
 }
 410
 ######################################################
 # Check that a set of directories is available.
 #
 # Directories are read from stdin, one per line.  Lines containing
 # a '%' are skipped.  Returns 1 at the first missing directory,
 # leaving its name in $d for the caller.
 ######################################################
 ctdb_check_directories_probe()
 {
     # -r keeps backslashes in directory names intact; the empty IFS
     # preserves leading and trailing whitespace.
     while IFS="" read -r d ; do
         case "$d" in
             *%*)
                 continue
                 ;;
             *)
                 [ -d "${d}/." ] || return 1
         esac
     done
 }
 428
 ######################################################
 # Check that a set of directories is available.
 #
 # Directories are read from stdin.  If one of them is missing an
 # error naming it is printed and the script exits with status 1.
 ######################################################
 ctdb_check_directories()
 {
     # On failure the probe leaves the offending directory in $d.
     if ! ctdb_check_directories_probe ; then
         echo "ERROR: $service_name directory \"$d\" not available"
         exit 1
     fi
 }
 440
 441 ######################################################
 442 # check a set of tcp ports
 443 # usage: ctdb_check_tcp_ports <ports...>
 444 ######################################################
 445
 # A flag file is created when a service is initially started.  It is
 # deleted the first time TCP port checks for that service succeed.
 # Until then ctdb_check_tcp_ports() prints a more subtle "error"
 # message if a port check fails.
 #
 # This helper insists on $service_name being set and stores the path
 # of that flag file in $_ctdb_service_started_file.
 _ctdb_check_tcp_common ()
 {
     assert_service_name

     _ctdb_service_started_file="${ctdb_fail_dir}/${service_name}.started"
 }
 455
 # Create the "service started" flag file for $service_name, making
 # its parent directory first if necessary.
 ctdb_check_tcp_init ()
 {
     _ctdb_check_tcp_common

     # ${...%/*} strips the final path component, i.e. dirname.
     mkdir -p "${_ctdb_service_started_file%/*}"
     touch "$_ctdb_service_started_file"
 }
 462
 # Check that something is listening on each of the given TCP ports.
 #
 # The checkers named in CTDB_TCP_PORT_CHECKERS are tried in order; for
 # each NAME the function ctdb_check_tcp_ports_NAME is called with the
 # ports.  Checker status 0 means all ports are fine, 1 means a port
 # (left in $_p by the checker) is not responding, and 127 means the
 # checker is unavailable so the next one is tried.
 #
 # Returns 0 or 1 accordingly, or 127 if no checker worked.  Exits the
 # script if no ports are given.
 ctdb_check_tcp_ports()
 {
     if [ -z "$1" ] ; then
         echo "INTERNAL ERROR: ctdb_check_tcp_ports - no ports specified"
         exit 1
     fi

     # Set default value for CTDB_TCP_PORT_CHECKERS if unset.
     # If any of these defaults are unsupported then this variable can
     # be overridden in /etc/sysconfig/ctdb or via a file in
     # /etc/ctdb/rc.local.d/.
     : ${CTDB_TCP_PORT_CHECKERS:=ctdb nmap netstat}

     for _c in $CTDB_TCP_PORT_CHECKERS ; do
         ctdb_check_tcp_ports_$_c "$@"
         _ctdb_check_tcp_ports_rc=$?

         if [ $_ctdb_check_tcp_ports_rc -eq 0 ] ; then
             # All ports are up: the service has finished starting.
             _ctdb_check_tcp_common
             rm -f "$_ctdb_service_started_file"
             return 0
         elif [ $_ctdb_check_tcp_ports_rc -eq 1 ] ; then
             _ctdb_check_tcp_common
             if [ -f "$_ctdb_service_started_file" ] ; then
                 # Ports have never been seen up since the service was
                 # started, so be gentle.
                 echo "INFO: $service_name tcp port $_p is not responding"
             else
                 echo "ERROR: $service_name tcp port $_p is not responding"
                 debug <<EOF
$ctdb_check_tcp_ports_debug
EOF
             fi

             return 1
         elif [ $_ctdb_check_tcp_ports_rc -eq 127 ] ; then
             debug <<EOF
ctdb_check_ports - checker $_c not implemented
output from checker was:
$ctdb_check_tcp_ports_debug
EOF
         fi
         # Any other status: silently move on to the next checker.
     done

     echo "INTERNAL ERROR: ctdb_check_ports - no working checkers in CTDB_TCP_PORT_CHECKERS=\"$CTDB_TCP_PORT_CHECKERS\""

     return 127
 }
 513
 # TCP port checker based on "netstat -l -t -n".
 #
 # A port passes if netstat shows a LISTEN socket on 0.0.0.0 or ::
 # for it.  Returns 0 if all ports pass, 1 at the first port that does
 # not (left in $_p), or 127 if netstat could not be run.  Diagnostic
 # output is left in $ctdb_check_tcp_ports_debug.
 ctdb_check_tcp_ports_netstat ()
 {
     _cmd='netstat -l -t -n'
     _ns=$($_cmd 2>&1)
     if [ $? -eq 127 ] ; then
         # netstat probably not installed - unlikely?
         ctdb_check_tcp_ports_debug="$_ns"
         return 127
     fi

     for _p ; do  # process each function argument (port)
         _found=false
         for _a in '0\.0\.0\.0' '::' ; do
             _pat="[[:space:]]${_a}:${_p}[[:space:]]+[^[:space:]]+[[:space:]]+LISTEN"
             if echo "$_ns" | grep -E -q "$_pat" ; then
                 # We matched the port, no need to try other addresses
                 _found=true
                 break
             fi
         done

         if ! $_found ; then
             # We didn't match the port, so flag an error.
             ctdb_check_tcp_ports_debug="$_cmd shows this output:
$_ns"
             return 1
         fi
     done

     return 0
 }
 541
 # TCP port checker based on nmap's grepable output (-oG).
 #
 # Returns 0 if every port is reported open on 127.0.0.1, 1 at the
 # first port that is not (left in $_p), or 127 if nmap could not be
 # run.  Diagnostic output is left in $ctdb_check_tcp_ports_debug.
 ctdb_check_tcp_ports_nmap ()
 {
     # nmap wants a comma-separated list of ports
     _ports=""
     for _p ; do
         _ports="${_ports:+${_ports},}${_p}"
     done

     _cmd="nmap -n -oG - -PS 127.0.0.1 -p $_ports"

     _nmap_out=$($_cmd 2>&1)
     if [ $? -eq 127 ] ; then
         # nmap probably not installed
         ctdb_check_tcp_ports_debug="$_nmap_out"
         return 127
     fi

     # get the port-related output
     _port_info=$(echo "$_nmap_out" | sed -n -r -e 's@^.*Ports:[[:space:]]@@p')

     for _p ; do
         # looking for something like this:
         #  445/open/tcp//microsoft-ds///
         # possibly followed by a comma
         _t="$_p/open/tcp//"
         case "$_port_info" in
             # The info we're after must be either at the beginning of
             # the string or it must follow a space.
             $_t*|*\ $_t*) continue ;;
         esac

         # Nope, flag an error...
         ctdb_check_tcp_ports_debug="$_cmd shows this output:
$_nmap_out"
         return 1
     done

     return 0
 }
 581
 # TCP port checker that uses the "ctdb checktcpport" command.
 # This is very cheap.
 #
 # For each port: exit status 98 from the command means the port could
 # not be bound, i.e. something is listening; status 0 means the bind
 # succeeded, i.e. nothing is listening.  Returns 0 if all ports are in
 # use, 1 at the first free port (left in $_p), and 127 on any other
 # status (the command is assumed not to be implemented).
 ctdb_check_tcp_ports_ctdb ()
 {
     for _p ; do  # process each function argument (port)
         _cmd="ctdb checktcpport $_p"
         _out=$($_cmd 2>&1)
         _ret=$?

         if [ "$_ret" = "98" ] ; then
             # Couldn't bind, something already listening, next port...
             continue
         fi

         if [ "$_ret" = "0" ] ; then
             ctdb_check_tcp_ports_debug="\"$_cmd\" was able to bind to port"
             return 1
         fi

         ctdb_check_tcp_ports_debug="$_cmd (exited with $_ret) with output:
$_out"
         # assume not implemented
         return 127
     done

     return 0
 }
 609
 ######################################################
 # Check that a unix socket is listening.
 #
 # usage: ctdb_check_unix_socket <socket_path>
 #
 # Looks for a LISTEN entry ending in <socket_path> in the output of
 # "netstat --unix -a -n".  Prints an error (using $service_name) and
 # returns 1 if there is none.  An empty path is not checked.
 ######################################################
 ctdb_check_unix_socket() {
     socket_path="$1"
     if [ -z "$socket_path" ] ; then
         return
     fi

     netstat --unix -a -n | grep -q "^unix.*LISTEN.*${socket_path}$" && return 0

     echo "ERROR: $service_name socket $socket_path not found"
     return 1
 }
 623
 ######################################################
 # Check that a command returns zero status.
 #
 # usage: ctdb_check_command <command> [args...]
 #
 # The command's stdout and stderr are captured.  On failure an error
 # is printed, the captured output goes to debug() and the script
 # exits with status 1.
 ######################################################
 ctdb_check_command ()
 {
     if ! _out=$("$@" 2>&1) ; then
         echo "ERROR: $* returned error"
         echo "$_out" | debug
         exit 1
     fi
 }
 636
 ################################################
 # Kill off any TCP connections with the given IP.
 #
 # usage: kill_tcp_connections IP [oneway]
 #
 # Each established connection is killed with "ctdb killtcp", in both
 # directions unless "oneway" was given or the local port is a CIFS
 # port (139, 445).  Afterwards the connection list is polled, about
 # once a second, until it is empty or the attempt times out.
 ################################################
 kill_tcp_connections ()
 {
     _ip="$1"

     case "$2" in
         oneway) _oneway=true ;;
         *)      _oneway=false ;;
     esac

     # Everything after the pipe runs in a subshell, so the "return"s
     # below only leave that subshell.
     get_tcp_connections_for_ip "$_ip" | {
         _killcount=0
         _failed=false

         while read dest src; do
             echo "Killing TCP connection $src $dest"
             if ! ctdb killtcp $src $dest >/dev/null 2>&1 ; then
                 _failed=true
             fi

             # we only do one-way killtcp for CIFS
             _destport="${dest##*:}"
             if [ "$_destport" = "139" ] || [ "$_destport" = "445" ] ; then
                 __oneway=true
             else
                 __oneway=$_oneway
             fi

             if ! $__oneway ; then
                 if ! ctdb killtcp $dest $src >/dev/null 2>&1 ; then
                     _failed=true
                 fi
             fi

             _killcount=$((_killcount + 1))
         done

         if $_failed ; then
             echo "Failed to send killtcp control"
             return
         fi
         [ $_killcount -eq 0 ] && return

         # Wait for the connections to disappear, giving up after the
         # list has been seen non-empty more than 3 times.
         _count=0
         until [ -z "$(get_tcp_connections_for_ip $_ip)" ] ; do
             _count=$((_count + 1))
             if [ $_count -gt 3 ] ; then
                 echo "Timed out killing tcp connections for IP $_ip"
                 return
             fi

             sleep 1
         done

         echo "Killed $_killcount TCP connections to released IP $_ip"
     }
 }
 694
 ##################################################################
 # Kill off the local end for any TCP connections with the given IP.
 #
 # usage: kill_tcp_connections_local_only IP
 #
 # Same as kill_tcp_connections() in "oneway" mode.
 ##################################################################
 kill_tcp_connections_local_only ()
 {
     kill_tcp_connections "$1" "oneway"
 }
 702
 ##################################################################
 # Tickle any TCP connections with the given IP.
 #
 # usage: tickle_tcp_connections IP
 #
 # Runs "ctdb tickle" in both directions for every established
 # connection and reports if any of the tickles could not be sent.
 ##################################################################
 tickle_tcp_connections ()
 {
     _ip="$1"

     get_tcp_connections_for_ip "$_ip" | {
         _failed=false

         while read dest src; do
             echo "Tickle TCP connection $src $dest"
             if ! ctdb tickle $src $dest >/dev/null 2>&1 ; then
                 _failed=true
             fi

             echo "Tickle TCP connection $dest $src"
             if ! ctdb tickle $dest $src >/dev/null 2>&1 ; then
                 _failed=true
             fi
         done

         if $_failed ; then
             echo "Failed to send tickle control"
         fi
     }
 }
 726
 # Print the established TCP connections whose local address is the
 # given IP, one per line, as "<local addr:port> <remote addr:port>".
 #
 # usage: get_tcp_connections_for_ip IP
 #
 # Connections are taken from "netstat -tn".  The local address may be
 # given either as IP or as the IPv4-mapped form ::ffff:IP.
 get_tcp_connections_for_ip ()
 {
     _ip="$1"

     # The IP is quoted so that it always reaches awk as the value of
     # a single -v assignment.
     netstat -tn | awk -v ip="$_ip" '
         index($1, "tcp") == 1 &&
         (index($4, ip ":") == 1 || index($4, "::ffff:" ip ":") == 1) &&
         $6 == "ESTABLISHED" {
             print $4" "$5
         }'
 }
 737
 ########################################################
 # Start/stop the Ganesha nfs service.
 #
 # usage: startstop_ganesha start|stop|restart
 #
 # The service is called nfs-ganesha-$CTDB_CLUSTER_FILESYSTEM_TYPE.
 # Any other operation is ignored.
 ########################################################
 startstop_ganesha()
 {
     _service_name="nfs-ganesha-$CTDB_CLUSTER_FILESYSTEM_TYPE"
     case "$1" in
         start|stop|restart)
             service "$_service_name" "$1"
             ;;
     esac
 }
 756
 ########################################################
 # Start/stop the nfs service on different platforms.
 #
 # usage: startstop_nfs start|stop|restart
 #
 # The platform is "rhel" if an nfslock init script is executable,
 # else "sles" if an nfsserver init script is executable.  On any
 # other platform an error is printed and the script exits.
 ########################################################
 startstop_nfs() {
     # nfslock is tested first because rhel takes precedence when both
     # init scripts are present.
     if [ -x $CTDB_ETCDIR/init.d/nfslock ] ; then
         PLATFORM="rhel"
     elif [ -x $CTDB_ETCDIR/init.d/nfsserver ] ; then
         PLATFORM="sles"
     else
         PLATFORM="unknown"
     fi

     case "$PLATFORM:$1" in
         sles:start)
             service nfsserver start
             ;;
         sles:stop)
             service nfsserver stop > /dev/null 2>&1
             ;;
         sles:restart)
             set_proc "fs/nfsd/threads" 0
             service nfsserver stop > /dev/null 2>&1
             pkill -9 nfsd
             service nfsserver start
             ;;
         rhel:start)
             service nfslock start
             service nfs start
             ;;
         rhel:stop)
             service nfs stop
             service nfslock stop
             ;;
         rhel:restart)
             set_proc "fs/nfsd/threads" 0
             service nfs stop > /dev/null 2>&1
             service nfslock stop > /dev/null 2>&1
             pkill -9 nfsd
             service nfslock start
             service nfs start
             ;;
         sles:*|rhel:*)
             # Unrecognised operation on a known platform: do nothing.
             ;;
         *)
             echo "Unknown platform. NFS is not supported with ctdb"
             exit 1
             ;;
     esac
 }
 812
 ########################################################
 # Start/stop the nfs lockmanager service on different platforms.
 #
 # usage: startstop_nfslock start|stop|restart
 #
 # Platform detection is the same as in startstop_nfs().  On an
 # unknown platform an error is printed and the script exits.
 ########################################################
 startstop_nfslock() {
     # nfslock is tested first because rhel takes precedence when both
     # init scripts are present.
     if [ -x $CTDB_ETCDIR/init.d/nfslock ] ; then
         PLATFORM="rhel"
     elif [ -x $CTDB_ETCDIR/init.d/nfsserver ] ; then
         PLATFORM="sles"
     else
         PLATFORM="unknown"
     fi

     case "$PLATFORM:$1" in
         # for sles there is no service for lockmanager
         # so we instead just shutdown/restart nfs
         sles:start)
             service nfsserver start
             ;;
         sles:stop)
             service nfsserver stop > /dev/null 2>&1
             ;;
         sles:restart)
             service nfsserver stop
             service nfsserver start
             ;;
         rhel:start)
             service nfslock start
             ;;
         rhel:stop)
             service nfslock stop > /dev/null 2>&1
             ;;
         rhel:restart)
             service nfslock stop
             service nfslock start
             ;;
         sles:*|rhel:*)
             # Unrecognised operation on a known platform: do nothing.
             ;;
         *)
             echo "Unknown platform. NFS locking is not supported with ctdb"
             exit 1
             ;;
     esac
 }
 862
 # Bring an interface up and add an IP address to it, while holding a
 # per-interface lock.
 #
 # usage: add_ip_to_iface IFACE IP MASKBITS
 #
 # Returns non-zero if the lock cannot be taken within 30 seconds or
 # if either "ip" command fails.
 add_ip_to_iface()
 {
     _iface=$1
     _ip=$2
     _maskbits=$3

     # Make sure the lock file and its directory exist.
     _lockfile="${CTDB_VARDIR}/state/interface_modify_${_iface}.flock"
     mkdir -p "${_lockfile%/*}" # dirname
     if [ ! -f "$_lockfile" ] ; then
         touch "$_lockfile"
     fi

     (
         # Note: use of return/exit/die() below only gets us out of the
         # sub-shell, which is actually what we want.  That is, the
         # function should just return non-zero.

         # The lock is taken on fd 0, which is the lock file.
         if ! flock --timeout 30 0 ; then
             die "add_ip_to_iface: unable to get lock for ${_iface}"
         fi

         # Ensure interface is up
         if ! ip link set "$_iface" up ; then
             die "Failed to bringup interface $_iface"
         fi

         if ! ip addr add "$_ip/$_maskbits" brd + dev "$_iface" ; then
             die "Failed to add $_ip/$_maskbits on dev $_iface"
         fi
     ) <"$_lockfile"

     # Do nothing here - return above only gets us out of the subshell
     # and doing anything here will affect the return code.
 }
 892
 # Remove an IP address from an interface while holding a
 # per-interface lock, re-adding any secondary addresses that go away
 # as a side effect.
 #
 # usage: delete_ip_from_iface IFACE IP MASKBITS
 #
 # Returns non-zero if the lock cannot be taken within 30 seconds, if
 # the address cannot be deleted, or if a secondary cannot be re-added.
 delete_ip_from_iface()
 {
     _iface=$1
     _ip=$2
     _maskbits=$3

     # Make sure the lock file and its directory exist.
     _lockfile="${CTDB_VARDIR}/state/interface_modify_${_iface}.flock"
     mkdir -p "${_lockfile%/*}" # dirname
     if [ ! -f "$_lockfile" ] ; then
         touch "$_lockfile"
     fi

     (
         # Note: use of exit/die() below only gets us out of the
         # sub-shell, which is actually what we want.  That is, the
         # function should just return non-zero.

         # The lock is taken on fd 0, which is the lock file.
         if ! flock --timeout 30 0 ; then
             die "delete_ip_from_iface: unable to get lock for ${_iface}"
         fi

         _im="$_ip/$_maskbits"  # shorthand for readability

         # "ip addr del" will delete all secondary IPs if this is the
         # primary.  To work around this _very_ annoying behaviour we
         # have to keep a record of the secondaries and re-add them
         # afterwards.  Yuck!

         _secondaries=""
         if ip addr list dev "$_iface" primary | grep -Fq "inet $_im " ; then
             _secondaries=$(ip addr list dev "$_iface" secondary |
                 awk '$1 == "inet" { print $2 }')
         fi

         _rc=0
         if ! ip addr del "$_im" dev "$_iface" ; then
             echo "Failed to del $_ip on dev $_iface"
             _rc=1
         fi

         # Nothing happens here when there were no secondaries.
         for _i in $_secondaries; do
             if ip addr list dev "$_iface" | grep -Fq "inet $_i" ; then
                 echo "Kept secondary $_i on dev $_iface"
                 continue
             fi

             echo "Re-adding secondary address $_i to dev $_iface"
             if ! ip addr add $_i brd + dev $_iface ; then
                 echo "Failed to re-add address $_i to dev $_iface"
                 _rc=1
             fi
         done

         exit $_rc
     ) <"$_lockfile"

     # Do nothing here - exit above only gets us out of the subshell
     # and doing anything here will affect the return code.
 }
 950
 # If the given IP is hosted then print 2 items: maskbits and iface.
 #
 # usage: ip_maskbits_iface IP
 #
 # The items are taken from the "inet" lines of "ip addr show to IP/32":
 # maskbits is whatever follows the last "/" of the second field, iface
 # is the last field.  Nothing is printed if there is no such line.
 ip_maskbits_iface ()
 {
     _addr="$1"

     # sub() is used rather than gensub() because the latter is a gawk
     # extension that other awk implementations do not provide.
     ip addr show to "${_addr}/32" 2>/dev/null |
         awk '$1 == "inet" { sub(".*/", "", $2); print $2, $NF }'
 }
 959
 # Remove the given address from whichever interface hosts it.
 #
 # usage: drop_ip IP[/MASKBITS] [LOG_TAG]
 #
 # Any maskbits given are ignored; the real maskbits and interface come
 # from ip_maskbits_iface().  If LOG_TAG is given the removal is logged
 # via script_log().  Nothing is done if the address is not hosted.
 drop_ip ()
 {
     _addr="${1%/*}"  # Remove optional maskbits
     _log_tag="$2"

     # Positional parameters become: maskbits, interface.
     set -- $(ip_maskbits_iface $_addr)
     [ -n "$1" ] || return 0

     _maskbits="$1"
     _iface="$2"
     if [ -n "$_log_tag" ] ; then
         script_log "$_log_tag" \
             "Removing public address $_addr/$_maskbits from device $_iface"
     fi
     ip addr del $_addr/$_maskbits dev $_iface >/dev/null 2>&1
 }
 976
 977 drop_all_public_ips ()
 978 {
 979     _log_tag="$1"
 980
 981     while read _ip _x ; do
 982         drop_ip "$_ip" "$_log_tag"
 983     done <"${CTDB_PUBLIC_ADDRESSES:-/dev/null}"
 984 }
 985
 986 ########################################################
 987 # some simple logic for counting events - per eventscript
# usage: ctdb_counter_init [<service>]
#        ctdb_counter_incr [<service>]
#        ctdb_check_counter [<msg> [<op> [<limit> [<service>]]]]
# ctdb_check_counter fails when "count <op> <limit>" is true (by
# default when count >= $service_fail_limit)
 992 ########################################################
 993 _ctdb_counter_common () {
 994     _service_name="${1:-${service_name:-${script_name}}}"
 995     _counter_file="$ctdb_fail_dir/$_service_name"
 996     mkdir -p "${_counter_file%/*}" # dirname
 997 }
 998 ctdb_counter_init () {
 999     _ctdb_counter_common "$1"
1000
1001     >"$_counter_file"
1002 }
# Increment a failure counter by one.
#
# $1 - optional counter name, resolved by _ctdb_counter_common
#
# Counting is unary: the count is the size of the counter file in
# bytes, so exactly one byte must be appended per increment.
ctdb_counter_incr ()
{
    _ctdb_counter_common "$1"

    # printf rather than "echo -n": the handling of -n by echo is
    # implementation-defined, and an echo that prints "-n 1" plus a
    # newline would add several bytes per increment.
    printf '1' >>"$_counter_file"
}
# Compare a failure counter against a limit.
#
# $1 - "error" (default): on a hit print an error and exit 1;
#      anything else: on a hit silently return 1
# $2 - integer comparison operator understood by test (default: -ge)
# $3 - limit (default: $service_fail_limit)
# $4 - optional counter name, resolved by _ctdb_counter_common
#
# Returns 0 when "count <op> limit" does not hold.
ctdb_check_counter ()
{
    _msg="${1:-error}"  # "error"  - anything else is silent on fail
    _op="${2:--ge}"  # an integer operator supported by test
    _limit="${3:-${service_fail_limit}}"

    # Drop the arguments consumed above.  A plain "shift 3" fails when
    # fewer than 3 arguments were given: some shells abort the script,
    # others shift nothing and leave the message in $1, which would
    # then be mistaken for the counter name below.
    if [ $# -le 3 ] ; then
        shift $#
    else
        shift 3
    fi
    _ctdb_counter_common "$1"

    # unary counting!  A missing counter file counts as 0.
    _size=$(stat -c "%s" "$_counter_file" 2>/dev/null || echo 0)
    if [ "$_size" "$_op" "$_limit" ] ; then
        if [ "$_msg" = "error" ] ; then
            echo "ERROR: $_limit consecutive failures for $_service_name, marking node unhealthy"
            exit 1
        else
            return 1
        fi
    fi
}
1027
1028 ########################################################
1029
1030 ctdb_status_dir="$CTDB_VARDIR/status"
1031 ctdb_fail_dir="$CTDB_VARDIR/failcount"
1032
# Create the state directory for a service and record its path in
# $service_state_dir.
#
# $1 - optional service name (default: $service_name)
#
# Exits with status 1, after printing a message, if the directory
# cannot be created.
ctdb_setup_service_state_dir ()
{
    service_state_dir="${CTDB_VARDIR}/state/${1:-${service_name}}"

    if ! mkdir -p "$service_state_dir" ; then
        echo "Error creating state dir \"$service_state_dir\""
        exit 1
    fi
}
1041
1042 ########################################################
1043 # Managed status history, for auto-start/stop
1044
1045 ctdb_managed_dir="$CTDB_VARDIR/managed_history"
1046
# Set $_ctdb_managed_file to the "managed" marker file for the current
# $service_name.
_ctdb_managed_common ()
{
    _ctdb_managed_file="${ctdb_managed_dir}/${service_name}"
}
1051
# Record that the current service is managed by creating (or
# touching) its marker file under $ctdb_managed_dir.
ctdb_service_managed ()
{
    # The directory may not exist yet on first use.
    mkdir -p "${ctdb_managed_dir}"

    _ctdb_managed_common
    touch "${_ctdb_managed_file}"
}
1058
# Forget that the current service was managed by removing its marker
# file.  A missing marker is not an error.
ctdb_service_unmanaged ()
{
    _ctdb_managed_common
    rm -f "${_ctdb_managed_file}"
}
1064
# Succeed if a marker file exists for the current service, i.e.
# ctdb_service_managed has been called for it and
# ctdb_service_unmanaged has not been called since.
is_ctdb_previously_managed_service ()
{
    _ctdb_managed_common
    test -f "${_ctdb_managed_file}"
}
1070
1071 ########################################################
1072 # Check and set status
1073
# Print a one-line report of a problem recorded in a status file.
#
# $1 - node state to mention in the message (e.g. "unhealthy")
# $2 - path of the file whose contents describe the problem
log_status_cat ()
{
    # The path is quoted so that a status directory containing
    # whitespace or glob characters is still read as a single file.
    echo "node is \"$1\", \"${script_name}\" reports problem: $(cat "$2")"
}
1078
# Report any status previously recorded for this script.
#
# Returns 1 (after logging) if a readable "unhealthy" file exists for
# $script_name, 2 (after logging) if a readable "banned" file exists,
# and 0 otherwise.  "unhealthy" takes precedence over "banned".
ctdb_checkstatus ()
{
    if [ -r "${ctdb_status_dir}/${script_name}/unhealthy" ] ; then
        log_status_cat "unhealthy" "$ctdb_status_dir/$script_name/unhealthy"
        return 1
    fi

    if [ -r "${ctdb_status_dir}/${script_name}/banned" ] ; then
        log_status_cat "banned" "$ctdb_status_dir/$script_name/banned"
        return 2
    fi

    return 0
}
1091
# Record or clear the status of this script.
#
# $1 - "unhealthy" or "banned" to record that state; any other value
#      clears both recorded states
# $2 - when recording: file whose contents are copied into the
#      status file
ctdb_setstatus ()
{
    d="${ctdb_status_dir}/${script_name}"

    if [ "$1" = "unhealthy" ] || [ "$1" = "banned" ] ; then
        # The status file is named after the state being recorded.
        mkdir -p "$d"
        cat "$2" >"$d/$1"
    else
        for i in "banned" "unhealthy" ; do
            rm -f "$d/$i"
        done
    fi
}
1107
1108 ##################################################################
1109 # Reconfigure a service on demand
1110
# Set up the variables shared by the reconfigure helpers:
#   $_d                             - status directory of $service_name
#                                     (created if missing)
#   $_ctdb_service_reconfigure_flag - the "reconfigure" flag file in it
_ctdb_service_reconfigure_common ()
{
    _d="${ctdb_status_dir}/${service_name}"
    mkdir -p "${_d}"
    _ctdb_service_reconfigure_flag="${_d}/reconfigure"
}
1117
# Succeed if the reconfigure flag file exists for the current service.
ctdb_service_needs_reconfigure ()
{
    _ctdb_service_reconfigure_common
    test -e "${_ctdb_service_reconfigure_flag}"
}
1123
# Schedule a reconfigure of the current service by creating (or
# truncating) its reconfigure flag file.
ctdb_service_set_reconfigure ()
{
    _ctdb_service_reconfigure_common
    >"${_ctdb_service_reconfigure_flag}"
}
1129
# Cancel any scheduled reconfigure of the current service by removing
# its reconfigure flag file.  A missing flag is not an error.
ctdb_service_unset_reconfigure ()
{
    _ctdb_service_reconfigure_common
    rm -f "${_ctdb_service_reconfigure_flag}"
}
1135
# Reconfigure the current service now.
#
# Clears the reconfigure flag, runs service_reconfigure and, if that
# succeeds, resets the failure counter.  If service_reconfigure fails
# its exit status is returned and the counter is left alone.
ctdb_service_reconfigure ()
{
    echo "Reconfiguring service \"${service_name}\"..."
    ctdb_service_unset_reconfigure

    if service_reconfigure ; then
        ctdb_counter_init
    else
        # $? still holds the status of service_reconfigure here.
        return $?
    fi
}
1143
# Default service_reconfigure() function does nothing and succeeds.
# It is the hook invoked by ctdb_service_reconfigure.
service_reconfigure ()
{
    return 0
}
1149
# Try to claim the per-service reconfigure lock for this event.
#
# The lock file holds the name of the event that claimed it on the
# first line, followed by one PID per line.  Returns 1 if any PID
# recorded there, other than our own, still exists; otherwise records
# $event_name and our PID in the lock file and returns 0.
ctdb_reconfigure_try_lock ()
{
    _ctdb_service_reconfigure_common
    _lock="${_d}/reconfigure_lock"
    mkdir -p "${_lock%/*}" # dirname
    touch "$_lock"

    (
        # Serialise access: the lock file is this subshell's stdin.
        flock 0
        # This is overkill but will work if we need to extend this to
        # allow certain events to run multiple times in parallel
        # (e.g. takeip) and write multiple PIDs to the file.
        read _locker_event
        if [ -n "$_locker_event" ] ; then
            while read _pid ; do
                # Separate tests joined with && instead of the
                # obsolescent "-a", which can be parsed ambiguously.
                if [ -n "$_pid" ] && [ "$_pid" != "$$" ] && \
                    kill -0 "$_pid" 2>/dev/null ; then
                    exit 1
                fi
            done
        fi

        printf "%s\n%s\n" "$event_name" $$ >"$_lock"
        exit 0
    ) <"$_lock"
}
1176
# Re-emit the result that "ctdb scriptstatus -Y" reports for this
# script's monitor event: print the recorded output and exit with the
# recorded code.  TIMEDOUT is replayed as exit code 1 and DISABLED as
# exit code 0, each with an explanatory prefix on the output.
#
# This function does not return - it always exits.
ctdb_replay_monitor_status ()
{
    echo "Replaying previous status for this script due to reconfigure..."
    # Leading colon (':') is missing in some versions...
    _out=$(ctdb scriptstatus -Y | grep -E "^:?monitor:${script_name}:")
    # Output looks like this:
    # :monitor:60.nfs:1:ERROR:1314764004.030861:1314764004.035514:foo bar:
    # This is the cheapest way of getting fields in the middle.
    # The subshell splits on ':' and echo rejoins the fields with
    # spaces, which are then split again into positional parameters.
    set -- $(IFS=":" ; echo $_out)
    _code="$3"
    _status="$4"
    # The error output field can include colons so we'll try to
    # preserve them.  The weak checking at the beginning tries to make
    # this work for both broken (no leading ':') and fixed output.
    _out="${_out%:}"
    # Strip everything up to and including the 2nd timestamp field.
    _err_out="${_out#*monitor:${script_name}:*:*:*:*:}"
    case "$_status" in
        OK) : ;;  # Do nothing special.
        TIMEDOUT)
            # Recast this as an error, since we can't exit with the
            # correct negative number.
            _code=1
            _err_out="[Replay of TIMEDOUT scriptstatus - note incorrect return code.] ${_err_out}"
            ;;
        DISABLED)
            # Recast this as an OK, since we can't exit with the
            # correct negative number.
            _code=0
            _err_out="[Replay of DISABLED scriptstatus - note incorrect return code.] ${_err_out}"
            ;;
        *) : ;;  # Must be ERROR, do nothing special.
    esac
    echo "$_err_out"
    exit $_code
}
1212
# Run, defer or replay around a pending service reconfigure, depending
# on $event_name and on whether the reconfigure lock can be taken.
#
# Only the monitor, ipreallocated and reconfigure events are handled;
# for any other event this returns 0 immediately.  Several paths exit
# the calling script instead of returning.
ctdb_service_check_reconfigure ()
{
    assert_service_name

    # Events we do not care about are left entirely to the caller.
    if [ "$event_name" != "monitor" ] && \
        [ "$event_name" != "ipreallocated" ] && \
        [ "$event_name" != "reconfigure" ] ; then
        return 0
    fi

    if ! ctdb_reconfigure_try_lock ; then
        # Somebody else is running an event we must not collide with,
        # so tread carefully.
        case "$event_name" in
            reconfigure)
                # Ask the caller to retry later.
                exit 2
                ;;
            ipreallocated)
                # Leave any scheduled reconfigure pending and let the
                # eventscript carry on with the rest of the
                # ipreallocated event.  This assumes the event does
                # not depend on the scheduled reconfigure, which holds
                # for the current code.
                return 0
                ;;
            monitor)
                # A reconfigure is most likely in progress, so the
                # service may be unstable.  Leave any scheduled
                # reconfigure pending and replay the previous monitor
                # status, which is the best information available.
                ctdb_replay_monitor_status
                ;;
        esac
        return
    fi

    # We hold the lock: no other event covered by this function is
    # running, so it is safe to reconfigure.
    case "$event_name" in
        reconfigure)
            (ctdb_service_reconfigure)
            exit $?
            ;;
        ipreallocated)
            if ctdb_service_needs_reconfigure ; then
                ctdb_service_reconfigure
            fi
            ;;
        monitor)
            if ctdb_service_needs_reconfigure ; then
                ctdb_service_reconfigure
                # The service may not have settled after the
                # reconfigure, so replay the previous status rather
                # than monitoring it now.
                ctdb_replay_monitor_status
            fi
            ;;
    esac
}
1275
1276 ##################################################################
1277 # Does CTDB manage this service? - and associated auto-start/stop
1278
# Backward-compatibility helper: append a service to
# $CTDB_MANAGED_SERVICES when its legacy option is enabled.
#
# $1 - value of the legacy option; only "yes" enables the service
# $2 - service name; it is only appended when it equals $service_name
ctdb_compat_managed_service ()
{
    [ "$1" = "yes" ] || return 0
    [ "$2" = "$service_name" ] || return 0

    CTDB_MANAGED_SERVICES="${CTDB_MANAGED_SERVICES} $2"
}
1285
# Succeed if $service_name is listed in $CTDB_MANAGED_SERVICES, either
# directly or after the legacy per-service options have been folded
# into that list.
is_ctdb_managed_service ()
{
    assert_service_name

    # Pad the list with spaces so that only whole words can match.
    t=" $CTDB_MANAGED_SERVICES "
    case "$t" in
        *" "${service_name}" "*) return 0 ;;
    esac

    # Not listed: fold in the legacy options for backward
    # compatibility and look again.
    ctdb_compat_managed_service "$CTDB_MANAGES_VSFTPD"   "vsftpd"
    ctdb_compat_managed_service "$CTDB_MANAGES_SAMBA"    "samba"
    ctdb_compat_managed_service "$CTDB_MANAGES_SCP"      "scp"
    ctdb_compat_managed_service "$CTDB_MANAGES_WINBIND"  "winbind"
    ctdb_compat_managed_service "$CTDB_MANAGES_HTTPD"    "apache2"
    ctdb_compat_managed_service "$CTDB_MANAGES_HTTPD"    "httpd"
    ctdb_compat_managed_service "$CTDB_MANAGES_ISCSI"    "iscsi"
    ctdb_compat_managed_service "$CTDB_MANAGES_CLAMD"    "clamd"
    ctdb_compat_managed_service "$CTDB_MANAGES_NFS"      "nfs"
    ctdb_compat_managed_service "$CTDB_MANAGES_NFS"      "nfs-ganesha-gpfs"

    t=" $CTDB_MANAGED_SERVICES "
    case "$t" in
        *" "${service_name}" "*) return 0 ;;
        *) return 1 ;;
    esac
}
1317
# Start or stop the current service on request, or automatically when
# its managed state has changed.
#
# The service-start/service-stop pseudo-events start/stop the service
# directly; they are refused (via die) if the service is managed or
# if $CTDB_SERVICE_AUTOSTARTSTOP is "yes".  On the monitor event, and
# only with $CTDB_SERVICE_AUTOSTARTSTOP set to "yes", a newly managed
# service is started and a no longer managed one is stopped.
# Whenever a start or stop is attempted the calling script exits with
# the resulting status.
ctdb_start_stop_service ()
{
    assert_service_name

    case "$event_name" in
        service-start)
            is_ctdb_managed_service && \
                die 'service-start event not permitted when service is managed'
            [ "$CTDB_SERVICE_AUTOSTARTSTOP" = "yes" ] && \
                die 'service-start event not permitted with $CTDB_SERVICE_AUTOSTARTSTOP = yes'
            ctdb_service_start
            exit $?
            ;;
        service-stop)
            is_ctdb_managed_service && \
                die 'service-stop event not permitted when service is managed'
            [ "$CTDB_SERVICE_AUTOSTARTSTOP" = "yes" ] && \
                die 'service-stop event not permitted with $CTDB_SERVICE_AUTOSTARTSTOP = yes'
            ctdb_service_stop
            exit $?
            ;;
    esac

    # Automatic start/stop happens only when configured, and only
    # during monitor events.
    if [ "$CTDB_SERVICE_AUTOSTARTSTOP" != "yes" ] ; then
        return 0
    fi
    if [ "$event_name" != "monitor" ] ; then
        return 0
    fi

    if is_ctdb_managed_service ; then
        # Managed now and managed before: nothing to do.
        if is_ctdb_previously_managed_service ; then
            return 0
        fi
        echo "Starting service \"$service_name\" - now managed"
        background_with_logging ctdb_service_start
        exit $?
    fi

    # Not managed now and not managed before: nothing to do.
    if ! is_ctdb_previously_managed_service ; then
        return 0
    fi
    echo "Stopping service \"$service_name\" - no longer managed"
    background_with_logging ctdb_service_stop
    exit $?
}
1367
# Start the current service.
#
# The service is marked as managed before the start is attempted, so
# the mark remains even if service_start fails.  On failure the status
# of service_start is returned; on success the failure counter is
# reset and ctdb_check_tcp_init is run.
ctdb_service_start ()
{
    ctdb_service_managed

    if service_start ; then
        ctdb_counter_init
        ctdb_check_tcp_init
    else
        # $? still holds the status of service_start here.
        return $?
    fi
}
1378
# Stop the current service: drop its "managed" marker, then run
# service_stop, whose status is returned.
ctdb_service_stop ()
{
    ctdb_service_unmanaged

    service_stop
}
1384
1385 # Default service_start() and service_stop() functions.
1386
1387 # These may be overridden in an eventscript.  When overriding, the
1388 # following convention must be followed.  If these functions are
1389 # called with no arguments then they may use internal logic to
1390 # determine whether the service is managed and, therefore, whether
1391 # they should take any action.  However, if the service name is
1392 # specified as an argument then an attempt must be made to start or
1393 # stop the service.  This is because the auto-start/stop code calls
1394 # them with the service name as an argument.
# Default start hook: start $service_name via the "service" command.
service_start ()
{
    service "${service_name}" start
}
1399
# Default stop hook: stop $service_name via the "service" command.
service_stop ()
{
    service "${service_name}" stop
}
1404
1405 ##################################################################
1406
# Handle the events that every eventscript treats the same way.
#
# $1 - event name
#   status    - exit with the status of ctdb_checkstatus
#   setstatus - pass the remaining arguments to ctdb_setstatus and
#               exit with its status
# Any other event returns to the caller without doing anything.
ctdb_standard_event_handler ()
{
    if [ "$1" = "status" ] ; then
        ctdb_checkstatus
        exit
    elif [ "$1" = "setstatus" ] ; then
        shift
        ctdb_setstatus "$@"
        exit
    fi
}
1421
# iptables doesn't like being re-entered, so flock-wrap it.
#
# Runs /sbin/iptables with the given arguments while holding a lock
# on $CTDB_VARDIR/iptables-ctdb.flock, waiting at most 30 seconds for
# the lock.  The lock path is quoted so that a $CTDB_VARDIR containing
# whitespace is passed to flock as a single argument.
iptables()
{
    flock -w 30 "$CTDB_VARDIR/iptables-ctdb.flock" /sbin/iptables "$@"
}
1427
# AIX (and perhaps others?) doesn't have mktemp
#
# Minimal replacement, defined only when no mktemp command is found.
# Usage: mktemp [-d]
#   -d  create a directory instead of a file
# Creates the file or directory under ${TMPDIR:-/tmp} with a umask of
# 077 and prints its path.  Returns non-zero, printing nothing, if it
# could not be created.  Any other arguments are ignored.
if ! command -v mktemp >/dev/null 2>&1 ; then
    mktemp ()
    {
        _dir=false
        if [ "$1" = "-d" ] ; then
            _dir=true
            shift
        fi
        _d="${TMPDIR:-/tmp}"
        # First 10 hex digits of an MD5 over some random bytes.
        _hex10=$(dd if=/dev/urandom count=20 2>/dev/null | \
            md5sum | \
            sed -e 's@\(..........\).*@\1@')
        _t="${_d}/tmp.${_hex10}"
        (
            umask 077
            if $_dir ; then
                mkdir "$_t"
            else
                # noclobber: fail instead of truncating an existing
                # file or following a symlink planted at this path.
                set -C
                >"$_t"
            fi
        ) || return 1
        echo "$_t"
    }
fi
1453
1454 ########################################################
1455 # tickle handling
1456 ########################################################
1457
# Bring the tickle list held by ctdb into line with the established
# TCP connections to this node's public IPs on a given port.
#
# $1 - local TCP port to consider
#
# Connections seen by netstat that have no tickle are added with
# "ctdb addtickle"; tickles with no matching connection are removed
# with "ctdb deltickle".  Scratch files are kept in
# $CTDB_VARDIR/state/tickles and removed at the end.
update_tickles ()
{
        _port="$1"

        tickledir="$CTDB_VARDIR/state/tickles"
        mkdir -p "$tickledir"

        # Who am I?
        # (the "PNN:" prefix is stripped from the output of "ctdb pnn")
        _pnn=$(ctdb pnn) ; _pnn=${_pnn#PNN:}

        # What public IPs do I hold?
        # (colon-separated field 2 of lines whose field 3 is our PNN)
        _ips=$(ctdb -Y ip | awk -F: -v pnn=$_pnn '$3 == pnn {print $2}')

        # IPs as a regexp choice
        # Spaces become '|' and each '.' is preceded by 2 backslashes;
        # presumably awk's -v escape processing reduces these to one,
        # leaving a literal dot in the regexp - TODO confirm.
        _ipschoice="($(echo $_ips | sed -e 's/ /|/g' -e 's/\./\\\\./g'))"

        # Record connections to our public IPs in a temporary file
        # Each line is "<remote addr:port> <local addr:port>".
        _my_connections="${tickledir}/${_port}.connections"
        rm -f "$_my_connections"
        netstat -tn |
        awk -v destpat="^${_ipschoice}:${_port}\$" \
          '$1 == "tcp" && $6 == "ESTABLISHED" && $4 ~ destpat {print $5, $4}' |
        sort >"$_my_connections"

        # Record our current tickles in a temporary file
        # The first line of gettickles output is skipped and the rest
        # is reformatted as two "<addr>:<port>" pairs per line so that
        # it can be compared with the connections file.
        _my_tickles="${tickledir}/${_port}.tickles"
        rm -f "$_my_tickles"
        for _i in $_ips ; do
                ctdb -Y gettickles $_i $_port |
                awk -F: 'NR > 1 { printf "%s:%s %s:%s\n", $2, $3, $4, $5 }'
        done |
        sort >"$_my_tickles"

        # Add tickles for connections that we haven't already got tickles for
        # (comm -23: lines only in the connections file)
        comm -23 "$_my_connections" "$_my_tickles" |
        while read _src _dst ; do
                ctdb addtickle $_src $_dst
        done

        # Remove tickles for connections that are no longer there
        # (comm -13: lines only in the tickles file)
        comm -13 "$_my_connections" "$_my_tickles" |
        while read _src _dst ; do
                ctdb deltickle $_src $_dst
        done

        rm -f "$_my_connections" "$_my_tickles"
}
1505
1506 ########################################################
1507 # load a site local config file
1508 ########################################################
1509
# Source site-local customisations, in this order:
#   1. the file named by $CTDB_RC_LOCAL, if set and executable
#   2. $CTDB_BASE/rc.local, if executable
#   3. every executable file in $CTDB_BASE/rc.local.d
# Paths are quoted so that a $CTDB_BASE containing whitespace or glob
# characters still refers to the intended files.
if [ -n "$CTDB_RC_LOCAL" ] && [ -x "$CTDB_RC_LOCAL" ] ; then
        . "$CTDB_RC_LOCAL"
fi

if [ -x "$CTDB_BASE/rc.local" ] ; then
        . "$CTDB_BASE/rc.local"
fi

if [ -d "$CTDB_BASE/rc.local.d" ] ; then
        for i in "$CTDB_BASE"/rc.local.d/* ; do
                [ -x "$i" ] && . "$i"
        done
fi
1523
1524 script_name="${0##*/}"       # basename
1525 service_fail_limit=1
1526 event_name="$1"