System Downages

        vienna berlin moscow warsaw munich milan athens2

// misscritsys, group-style entry: the member list is not spelled out here
// but pulled in from the included systems file (presumably the
// mission-critical hosts, going by the name -- TODO confirm)
misscritsys
        members
#include <systems/misscritsys_systems.cfg>

// second entry named misscritsys, this time without a members keyword: its
// body is just the contents of the same included file.  The emergency alarm
// script matches host names against a macro of this name; presumably this is
// that macro and it belongs to a different config file than the group-style
// entry of the same name -- TODO confirm
misscritsys
#  include <systems/misscritsys_systems.cfg>

// EMERGENCY alert schedule.  The timing line has five cron-style fields and
// is chosen per host: hosts for which misscritsys holds get the four-value
// list, all other hosts the two-value list.
// NOTE(review): presumably the first field is minutes of the hour, i.e. four
// runs per hour versus two -- confirm against the PIKT timing documentation.
EMERGENCY               // things that require immediate attention

#if misscritsys
        timing          10,25,40,55 * * * *
#else
        timing          10,40 * * * *
#endif

// paging switch: the emergency down-system alarm wraps its pager command in
// an ifdef on this name, so this setting decides whether that command is
// part of the installed script
page TRUE               // if TRUE, then issue pages, else keep silent

///////////////////////////////////////////////////////////////////////////////

#if piktmaster

// SysDownEmergency -- emergency-level alarm, present only under the
// piktmaster guard.  Takes a host name from field 1 of every input record,
// pings it once, and reports hosts that do not answer: by mail for every
// host, and additionally by pager for hosts listed in the misscritsys macro.
SysDownEmergency

        init
                status active
                level emergency
                task "Detect system crashes, or systems going off the network"
                input file "=hostinfo_obj"
                dat $host 1
                // ignore the rest of the fields in HostInfo.obj
                // records are keyed on the host name (presumably this is
                // what ties the remembered state below to the same host
                // from run to run -- TODO confirm)
                keys $host

        begin
                // ping timeout; only the solaris/sunos ping form uses it
                set $timeout = "20"     // yes, string var here
                // the three set macros are defined elsewhere; presumably
                // they load the time values the reboot-period test needs
                =set_timenow
                =set_hr
                =set_dow
                // bypass weekly reboot period
                if =reboot_period
                        quit
                endif

        rule    // exclude systems known to be down
                // both sides are padded with blanks so that a host name
                // only matches as a whole word of the downsys list
                if " =downsys " =~ " $host "
                        next
                endif

        rule    // report if system goes down; repeat only if system goes up
                // then back down again; for certain mission-critical systems,
                // report every time (issue repeated nagmail), also page but
                // just once per downage incident
                //
                // The ping test is picked per operating system.  The linux,
                // freebsd and hpux forms send one packet, keep the
                // second-to-last output line (tail -2, then head -1) and
                // look for 0% packet loss; the leading blank in the pattern
                // keeps 100% packet loss from matching.  The solaris/sunos
                // form looks for the words is alive instead.
                // NOTE(review): no branch exists for any other operating
                // system, so there the if header below would be missing.
#  if linux | freebsd
                if $command("=ping -c 1 $host | =tail -2 | =head -1")
                        =~ " 0% packet loss"
#  elif hpux
                if $command("=ping $host -n 1 | =tail -2 | =head -1")
                        =~ " 0% packet loss"
#  elif solaris | sunos
                if $command("=ping $host $timeout") =~ "is alive"
#  endif
                        // host answered: record it as up
                        set $state = "+"
                else
                        // host did not answer: record it as down
                        set $state = "-"
                        // mission-critical hosts: mail on every run while
                        // the host is down
                        if " =misscritsys " =~ " $host "
                                output mail "$host is down, or off the network"
#  ifdef page
                                // page only when no earlier state is on
                                // record or the state differs from it
                                // (presumably the percent-prefixed variable
                                // is the value from the previous run), i.e.
                                // once per downage incident
                                //
                                // NOTE(review): the recipient names used to
                                // end in stray backslashes, the last one
                                // directly in front of the closing quote,
                                // which left the command string unterminated.
                                // The backslashes are removed here.  The
                                // addresses look truncated -- confirm that
                                // these bare names resolve as mail aliases
                                // or restore the full pager addresses.
                                if    ! #defined(%state)
                                   || $state ne %state
                                        exec wait "echo '$host is down' |
                                                   =mailx -s '$host is down'
                                                   pagemozart
                                                   pagebrahms
                                                   pageliszt"
                                endif
#  endifdef
                        // all other hosts: mail only on the same
                        // new-or-changed state condition
                        elseif    ! #defined(%state)
                               || $state ne %state
                                output mail "$host is down, or off the network"
                        endif
                endif

#endif  // piktmaster

///////////////////////////////////////////////////////////////////////////////

#if piktmaster

// SysDownWarning -- warning-level alarm, present only under the piktmaster
// guard.  Takes a host name from field 1 of every input record, pings it
// once, and mails a report for each host that does not answer.  No state is
// kept in this script, so a host that stays down is reported on every run.
SysDownWarning

        init
                status active
                level warning
                task "Detect systems down or off the network"
                input file "=hostinfo_obj"
                dat $host 1
                // ignore the rest of the fields in HostInfo.obj

        begin
                // ping timeout; only the solaris/sunos ping form uses it
                set $timeout = "20"     // yes, string var here

        rule    // report if system doesn't respond to ping
                // The ping test is picked per operating system.  The linux,
                // freebsd and hpux forms send one packet, keep the
                // second-to-last output line (tail -2, then head -1) and
                // look for 0% packet loss; the leading blank in the pattern
                // keeps 100% packet loss from matching.  The solaris/sunos
                // form looks for the words is alive instead.
                // NOTE(review): no branch exists for any other operating
                // system, so there the if header below would be missing.
#  if linux | freebsd
                if $command("=ping -c 1 $host | =tail -2 | =head -1")
                        =~ " 0% packet loss"
#  elif hpux
                if $command("=ping $host -n 1 | =tail -2 | =head -1")
                        =~ " 0% packet loss"
#  elif solaris | sunos
                if $command("=ping $host $timeout") =~ "is alive"
#  endif
                        // do nothing
                else
                        // no answer: send the report
                        output mail "$host is down, or off the network"
                endif

#endif  // piktmaster

///////////////////////////////////////////////////////////////////////////////