User Tools

Site Tools


mysql_monitoring

Replication Nagios monitoring

simply use this to monitor mysql replication from nagios

#!/usr/bin/perl -w
# Originally downloaded from nagios exchange http://exchange.nagios.org/components/com_mtree/attachment.php?link_id=1937&cf_id=24
# 
# Fixed check for slave IO and Slave SQL
# k2patel <k2patel\@hotmail.com>.
 
 
use strict;
use Getopt::Long;
use DBI;
 
# Set DEFAULT inputs
my $options = { 
	'master' => 'localhost', 'slave' => 'localhost',
	'dbuser' => 'replication', 'dbpass' => 'testing',
	'port' => 3306, 'crit' => 100000, 'warn' => 10000,
	'debug' => 0
};
GetOptions($options, "master=s", "slave=s", "port=i", "dbuser=s", "dbpass=s",
	"crit=i", "warn=i", "debug=i", "help");
my $max_binlog;
 
if (defined $options->{'help'}) {
	print <<HELP;
$0: check replication between mysql databases
 
 $0 [ --master <host> ] [ --slave <host> ] 
 [ --crit <positions> ] [ --warn <positions> ] [ --dbuser <user> ] 
 [ --dbpass <pass> ]
 
  --master <host>    - MySQL instance running as a master server
  --slave <host>     - MySQL instance running as a slave server
  --port <port>      - port number MySQL is listening on
  --crit <positions> - Number of binlog positions for critical state
  --warn <positions> - Number of binlog positions for warning state
  --dbuser <user>    - Username with File and Process privs to check status
  --dbpass <pass>    - Password for above user
  --help	     - This help page
 
The user that is testing must be the same on all instances, eg:
  GRANT File, Process on *.* TO repl_test\@192.168.0.% IDENTIFIED BY <pass>
 
Note: Any mysqldump tables (for backups) may lock large tables for a long 
time. If you dump from your slave for this, then your master will gallop 
away from your slave, and the difference will become large. The trick is to 
set crit above this differnce and warn below.
 
(c) 2004 Fotango. James Bromberger <jbromberger\@fotango.com>.
(c) 2006 Some changes by Robert Klikics <robert\@klikics.de>.
(c) 2010 Several fixes by Joe DeCello <jdecello\@hotmail.com>.
(c) 2010 Slave_IO and Slave_SQL added by Joe DeCello <jdecello\@hotmail.com>.
 
HELP
exit;
}
 
my $status = "";
my $severity = 0; # OK, 1 is WARNING, 2 is CRITICAL
 
my $master_ref = get_replication_status($options->{'master'}, 'master');
my $slave_ref = get_replication_status($options->{'slave'}, 'slave');
 
my $return;
 
$return = check_slave_IO ($slave_ref);
$severity = $return if ($return > $severity);
 
$return = check_slave_SQL ($slave_ref);
$severity = $return if ($return > $severity);
 
$return = compare_replication_status($master_ref, $slave_ref);
$severity = $return if ($return > $severity);
 
my $output = $status;
if ($severity >= 2) {
	print "CRITICAL: $output\n";
	exit 2; # CRITICAL
} elsif ($severity == 1) {
	print "WARN: $output\n";
	exit 1; # WARNING
} else {
	print "OK: $output\n";
	exit 0;
}
 
#TODO - check for these too
#Last_Error:
#Seconds_Behind_Master: 0
 
# end of main
 
###############
# Subroutines #
###############
 
sub get_replication_status {
	my $host = shift;
	my $role = shift;
	require Carp;
	Carp::cluck "host" if !defined $host;
	Carp::cluck "port" if !defined $options->{'port'};
	Carp::cluck "dbuser" if !defined $options->{'dbuser'};
	Carp::cluck "dbpass" if !defined $options->{'dbpass'};
	my $dbh = DBI->connect("DBI:mysql:host=$host;port=$options->{'port'}",
		$options->{'dbuser'}, $options->{'dbpass'});
	if (not $dbh) {
		print "UNKNOWN: cannot connect to $host";
		exit 3;
	}
 
	if (lc ($role) eq 'master') {
		my $sql1 = "show variables like 'max_binlog_size'";
		my $sth1 = $dbh->prepare($sql1);
		my $res1 = $sth1->execute;
		my $ref1 = $sth1->fetchrow_hashref;
		$max_binlog = $ref1->{'Value'};
	}
	my $sql = sprintf "SHOW %s STATUS", $role;
	my $sth = $dbh->prepare($sql);
	my $res = $sth->execute;
	if (not $res) {
		die "No results";
	}
	my $ref = $sth->fetchrow_hashref;
	$sth->finish;
	if ($options->{'debug'}) {
		print "$host:\n";
		print join (', ', map { sprintf " %s: %s", $_, $ref->{$_} }
			keys %{$ref}) . "\n";
	}
	$dbh->disconnect;
	return $ref;
}
 
#Check Delta between Master and Slave log/POS
sub compare_replication_status {
	my ($a, $b) = @_;
	my ($master, $slave);
	if (defined($a->{'File'})) {
		$master = $a;
		$slave = $b;
	} elsif (defined($b->{'File'})) {
		$master = $b;
		$slave = $a;
	}
	$master->{'File_No'} = $1 if ($master->{'File'} =~ /(\d+)$/);
	$slave->{'File_No'} = $1 
		if ($slave->{'Relay_Master_Log_File'} =~ /(\d+)$/);
 
	my $diff = ($master->{'File_No'} - $slave->{'File_No'}) * $max_binlog;
 
	printf "Master: %d Slave: %d\n", $master->{'Position'}, 
		$slave->{'Exec_Master_Log_Pos'} if $options->{'debug'};
 
	$diff+= $master->{'Position'} - $slave->{'Exec_Master_Log_Pos'};
	my $state = sprintf "Master: %d/%d  Slave: %d/%d  Diff: %d/%d", 
		$master->{'File_No'}, $master->{'Position'}, 
		$slave->{'File_No'}, $slave->{'Exec_Master_Log_Pos'}, 
		($diff/$max_binlog), ($diff % $max_binlog);
	$status .= "$state  ";
	if ($diff >= $options->{'crit'}) {
		return 2; # CRITICAL
	} elsif ($diff >= $options->{'warn'}) {
		return 1; # WARNING
	}
	return 0;
}
 
#Check for these too
#Slave_IO_Running: Yes
 
sub check_slave_IO {
        my $slave = shift @_;
        printf "Slave_SQL_Running: %s \n",
                $slave->{'Slave_IO_Running'},
                if $options->{'debug'};
        my $state = "Slave_IO_Running: ".$slave->{Slave_IO_Running};
        $status .= "$state  ";
        if ($slave->{Slave_IO_Running} eq 'No') {
                        return 2; # CRITICAL
                }
                else {
                        return 0; # OK
                }
        }
#Slave_SQL_Running: Yes	
        sub check_slave_SQL {
        my $slave = shift @_;
 
        printf "Slave_SQL_Running: %s \n",
                $slave->{'Slave_SQL_Running'},
                if $options->{'debug'};
        my $state = "Slave_SQL_Running: ".$slave->{Slave_SQL_Running};
        $status .= "$state  ";
        if ($slave->{Slave_SQL_Running} eq 'No') {
						return 2; # CRITICAL
                }
                else {
                        return 0; # OK
                }
        }
# end of subroutines
 
# END
mysql_monitoring.txt · Last modified: 2020/08/10 02:35 (external edit)