But of course, here's the fping.monitor I ended up with.

#!/usr/bin/perl
#
# Return a list of hosts which are not reachable via ICMP echo
#
# Jim Trocki, [EMAIL PROTECTED]
#
# $Id: fping.monitor 1.7 Mon, 27 Aug 2001 14:22:45 -0400 trockij $
#
#    Copyright (C) 1998, Jim Trocki
#
#    This program is free software; you can redistribute it and/or modify
#    it under the terms of the GNU General Public License as published by
#    the Free Software Foundation; either version 2 of the License, or
#    (at your option) any later version.
#
#    This program is distributed in the hope that it will be useful,
#    but WITHOUT ANY WARRANTY; without even the implied warranty of
#    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
#    GNU General Public License for more details.
#
#    You should have received a copy of the GNU General Public License
#    along with this program; if not, write to the Free Software
#    Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
#
use strict;

use Getopt::Std;

# Command-line switches, keyed by option letter.  -r, -s and -t take a value;
# -a, -h and -T are flags.
my %opt;

# getopts returns false for an unknown switch or a missing option argument
# (it has already warned on stderr).  Stop here with a non-zero status rather
# than run the monitor with a half-parsed configuration.
getopts ("ahr:s:t:T", \%opt)
    or die "fping.monitor: invalid command line options, use -h for usage\n";

# Print the command-line synopsis on stdout and terminate the program with
# a zero exit status.  Takes no arguments and never returns.
sub usage
{
    my @help = (
        'usage: fping.monitor [-a] [-r num] [-s num] [-t num] [-T] host [host...]',
        '',
        '    -a          only report failure if all hosts are unreachable',
        '    -r num      retry "num" times for each host before reporting failure',
        '    -s num      consider hosts which respond in over "num" msecs failures',
        '    -t num      wait "num" msecs before sending retries',
        '    -T          traceroute to each failed host. CAUTION: this may cause',
        '                this monitor to hang for a very long time',
        '',
    );

    # Every entry, including the trailing empty one, becomes one output line.
    print map { "$_\n" } @help;

    exit 0;
}

usage if ($opt{"h"});

# Settings handed to fping.  The retry count uses a defined-ness test so that
# an explicit "-r 0" (no retries) is honoured instead of being replaced by
# the default; the timeout keeps its fallback for any false value.
my $TIMEOUT = $opt{"t"} || 2000;
my $RETRIES = defined $opt{"r"} ? $opt{"r"} : 3;

# fping's argument vector, kept as a list so it can be exec'ed without a
# shell.  $CMD is the same command as a string, used in error messages.
my @FPING_ARGV = ("fping", "-e", "-r", $RETRIES, "-t", $TIMEOUT);
my $CMD = "fping -e -r $RETRIES -t $TIMEOUT";
my $START_TIME = time;
my $END_TIME;

# Nothing to check: succeed quietly.
exit 0 if (@ARGV == 0);

# Fork a child whose stdout is the read end of IN, then exec fping in list
# form.  No shell is involved, so metacharacters in host names or option
# values are passed to fping literally instead of being interpreted.
my $fping_pid = open (IN, "-|");
defined $fping_pid ||
        die "could not open pipe to fping: $!\n";

if ($fping_pid == 0)
{
    # Child: send stderr down the same pipe so the parent sees fping's
    # diagnostics interleaved with its normal output.
    open (STDERR, ">&STDOUT");

    # exec only returns on failure.  The message then travels down the pipe
    # and the parent reports it together with the 127 exit status.
    exec (@FPING_ARGV, @ARGV)
        or print "could not exec fping: $!\n";
    exit 127;
}

my @unreachable;
my @alive;
my @slow;
my @other_prob;         # details for other per-host problems
my @error;              # other errors which I'll give non-zero exit for
my @icmp;               # ICMP messages output by fping
my %addr_unknown;

my %want_host = map { $_ => 1 } @ARGV;  # hosts fping hasn't output yet

# Number of reports each host may still legitimately produce: one per time it
# was named on the command line.  This allows a host listed twice to be
# reported twice, while still flagging output about hosts nobody asked for.
my %reports_expected;
$reports_expected{$_}++ for @ARGV;

# Note that fping has reported on $host: it is no longer outstanding, and a
# report beyond what was asked for is recorded as an error.  $kind is the
# word used in the error message ("reachable", "unreachable", "unknown").
my $note_report = sub
{
    my ($kind, $host) = @_;

    delete $want_host{$host};
    push @error, "$kind host `${host}' wasn't asked for"
        if --$reports_expected{$host} < 0;
};

# Classify every line fping printed.  The specific patterns are tried before
# the loose "unreachable" test so that a host whose *name* happens to contain
# "unreachable" is not misfiled when it is in fact alive or unresolvable.
while (<IN>)
{
    chomp;

    # host is alive (1.23 ms)
    if (/^(\S+) is alive \((\S+)/)
    {
        my ($host, $rtt) = ($1, $2);
        $note_report->("reachable", $host);

        # With -s, a host that answers too slowly counts as a failure.
        if ($opt{"s"} && $rtt > $opt{"s"})
        {
            push (@slow, [$host, $rtt]);
        }

        else
        {
            push (@alive, [$host, $rtt]);
        }
    }

    elsif (/^(\S+)\s+address\s+not\s+found/)
    {
        my $host = $1;
        $addr_unknown{$host} = 1;
        push @other_prob, "$host address not found";
        push @unreachable, $host;
        $note_report->("unknown", $host);
    }

    # ICMP Host Unreachable from 1.2.3.4 for ICMP Echo sent to 2.4.6.8
    # (among others)

    elsif (/^ICMP (.*) for ICMP Echo sent to (\S+)/)
    {
        push @icmp, $_;
    }

    elsif (/^(\S+).*unreachable/)
    {
        my $host = $1;
        push (@unreachable, $host);
        $note_report->("unreachable", $host);
    }

    else
    {
        push @error, "unidentified output from fping: [$_]";
    }
}

# Any requested host that fping never mentioned is treated as unreachable.
# Sorted so that the report order is stable from run to run.
for my $host (sort keys %want_host) {
    push @other_prob, "$host not listed in fping's output";
    push @unreachable, $host;
}

# Closing the pipe waits for fping and stores its wait status in $?.
close (IN);
my $wait_status = $?;

$END_TIME = time;

my $retval = $wait_status >> 8;         # fping's exit code
my $signal = $wait_status & 127;        # non-zero if a signal killed it

if ($signal)
{
    # The exit code is meaningless (and zero) when fping did not exit on its
    # own, so this must not be mistaken for a clean run.
    push @error, "fping was killed by signal $signal";
}

elsif ($retval < 3)
{
    # do nothing: these codes are passed through as the monitor's own status
}

elsif ($retval == 3)
{
    push @error, "fping: invalid cmdline arguments [$CMD @ARGV]";
}

elsif ($retval == 4)
{
    push @error, "fping: system call failure";
}

else
{
    push @error, "unknown return code ($retval) from fping";
}

# Horizontal rule used above and below every section title.
my $rule = '------------------------------------------------------------------------------';

# Print a section heading: a blank line, then the title between two rules.
my $banner = sub
{
    my ($title) = @_;
    print "\n$rule\n$title\n$rule\n";
};

# First output line is the summary: either a fixed marker when something
# unexpected happened, or the sorted names of all failed (unreachable or
# slow) hosts.  The line is empty when nothing failed.
if (@error)
{
    print "unusual errors\n";
}
else
{
    my @slow_names = map { $_->[0] } @slow;
    my @fail = sort (@unreachable, @slow_names);
    print "@fail\n";
}

# Timing details.
print "\n";
print "start time: ", scalar (localtime ($START_TIME)), "\n";
print "end time  : ", scalar (localtime ($END_TIME)), "\n";
print "duration  : ", $END_TIME - $START_TIME, " seconds\n";

# Detail sections, each printed only when it has something to show.
if (@error)
{
    $banner->("unusual errors");
    print map { "$_\n" } @error;
}

if (@unreachable)
{
    $banner->("unreachable hosts");
    print map { "$_\n" } @unreachable;

    if (@other_prob)
    {
        print "\nother problems:\n";
        print map { "$_\n" } @other_prob;
    }
}

if (@icmp)
{
    $banner->("ICMP messages");
    print map { "$_\n" } @icmp;
}

if (@slow)
{
    $banner->("slow hosts (response time which exceeds $opt{s}ms)");

    for my $entry (@slow)
    {
        my ($name, $rtt) = @{$entry};
        printf ("%-40s %.2f ms\n", $name, $rtt);
    }
}

if (@alive)
{
    $banner->("reachable hosts                          rtt");

    for my $entry (@alive)
    {
        my ($name, $rtt) = @{$entry};
        printf ("%-40s %.2f ms\n", $name, $rtt);
    }
}

#
# traceroute
#
# With -T, run traceroute for every unreachable host whose address could be
# resolved.  traceroute is exec'ed in list form, without a shell, so a host
# name is always passed as a single literal argument.
if ($opt{"T"} && @unreachable)
{
    # Flush what has been printed so far and keep stdout unbuffered, so the
    # report stays ahead of traceroute's output and the forked child does not
    # inherit (and later re-emit) buffered text.
    local $| = 1;

    my $header_output = 0;
    foreach my $host (@unreachable)
    {
        next if $addr_unknown{$host};
        print $header_output++ ? "\n" : <<EOF;

------------------------------------------------------------------------------
traceroute to unreachable hosts
------------------------------------------------------------------------------
EOF

        my $pid = fork;
        if (!defined $pid)
        {
            print "could not fork for traceroute: $!\n";
            next;
        }

        if ($pid == 0)
        {
            # Child: merge stderr into stdout, as the report is read from
            # stdout only, then become traceroute.
            open (STDERR, ">&STDOUT");
            exec ("traceroute", "-w", "3", $host)
                or print "could not exec traceroute: $!\n";
            exit 127;
        }

        waitpid ($pid, 0);
    }
}

# Unexpected conditions always fail the monitor.
exit 1 if @error;

#
# fail only if all hosts do not respond
#
if ($opt{"a"})
{
    exit(@alive ? 0 : 1);
}

# A host slower than the -s threshold is a failure.
exit 1 if @slow;

# Pass a non-zero fping status straight through.
exit $retval if $retval;

# fping reported success, but hosts it never mentioned have been added to
# @unreachable and listed as failed in the output; the exit status has to
# agree with that report.
exit(@unreachable ? 1 : 0);

-- 
Roderick Schertler
[EMAIL PROTECTED]

Reply via email to