4rwer2 发表于 2014-9-17 08:52:39

nagios监控mysql(check_mysql)及内存使用率(check_mem)

一、监控本地(localhost)内存

1、上传监控脚本 check_mem 到/usr/local/nagios/libexec

1
2
# chown -R nagios.nagios check_mem
# chmod +x check_mem




2、修改commands配置

1
2
3
4
5
# vim /usr/local/nagios/etc/objects/commands.cfg
# Command object "check_mem": runs the check_mem plugin found under $USER1$.
# $ARG1$ is passed as the warning threshold (-w) and $ARG2$ as the critical
# threshold (-c); both are supplied by the service's check_command line.
# NOTE(review): $USER1$ is presumably the plugin directory
# (/usr/local/nagios/libexec) set in resource.cfg - confirm.
define command{
      command_name      check_mem
      command_line      $USER1$/check_mem -w $ARG1$ -c $ARG2$
      }




3、修改localhost.cfg


1
2
3
4
5
6
7
# vim /usr/local/nagios/etc/objects/localhost.cfg
# Service "check_mem" on localhost, based on the local-service template.
# check_command arguments are separated by "!": 20 becomes $ARG1$ (warning)
# and 10 becomes $ARG2$ (critical) of the check_mem command.
define service{
      use                           local-service
      host_name                     localhost
      service_description             check_mem
      check_command                   check_mem!20!10
      }




4、重启nagios服务


1
# service nagios restart




5、check_mem 脚本

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
#!/bin/bash
#
# check_mem - Nagios plugin that reports free memory as a percentage of total.
#
# Usage:
#   check_mem [-w|--warning] <percent free> [-c|--critical] <percent free>
#
# Both thresholds are non-negative integer percentages of FREE memory, and
# the warning threshold must be strictly greater than the critical one
# (for example: -w 20 -c 10).
#
# "Free" is total minus used, both taken from the second line of `free -m`.
#
# Output:      one status line on stdout (plus a usage line on errors).
# Exit status: 0 OK, 1 WARNING, 2 CRITICAL,
#              3 UNKNOWN (bad arguments or unreadable `free` output).

readonly STATE_OK=0
readonly STATE_WARNING=1
readonly STATE_CRITICAL=2
readonly STATE_UNKNOWN=3

readonly PROGNAME="${0##*/}"
readonly USAGE="${PROGNAME} [-w|--warning]<percent free> [-c|--critical]<percent free>"
# Captured up front because argument parsing shifts the parameters away.
readonly INVOCATION="${PROGNAME} $*"

#######################################
# Report a usage problem and exit with the UNKNOWN state.
# The message goes on the first output line because that is the line Nagios
# displays; a misconfigured check must never be reported as OK.
# Arguments: $1 - description of the problem
# Outputs:   status line and usage line on stdout
#######################################
die_unknown() {
  printf 'UNKNOWN - %s\n' "$1"
  printf 'Usage: %s\n' "${USAGE}"
  exit "${STATE_UNKNOWN}"
}

#######################################
# Test whether a value is a non-empty string of decimal digits.
# Arguments: $1 - value to test
# Returns:   0 if it is, non-zero otherwise
#######################################
is_uint() {
  [[ "$1" =~ ^[0-9]+$ ]]
}

#######################################
# Parse the thresholds, measure memory, print the status line and exit
# with the matching Nagios state.
# Arguments: the script's command-line arguments
#######################################
main() {
  local warning="" critical=""
  local total="" used="" free_mb percent

  if (( $# < 4 )); then
    die_unknown "Wrong Syntax: ${INVOCATION}"
  fi

  while (( $# > 0 )); do
    case "$1" in
      -w|--warning)
        shift
        warning="${1-}"
        ;;
      -c|--critical)
        shift
        critical="${1-}"
        ;;
    esac
    # $# may already be 0 here when an option was given without a value.
    (( $# > 0 )) && shift
  done

  # Validate before doing arithmetic: the values come from the command line
  # and arithmetic contexts would otherwise evaluate arbitrary expressions.
  if ! is_uint "${warning}" || ! is_uint "${critical}"; then
    die_unknown "Wrong Syntax: ${INVOCATION}"
  fi
  # 10# forces base 10 so a value such as "08" is not rejected as bad octal.
  warning=$(( 10#${warning} ))
  critical=$(( 10#${critical} ))
  if (( warning <= critical )); then
    die_unknown "WARNING threshold must be greater than CRITICAL: ${INVOCATION}"
  fi

  # Read total and used from a single `free -m` run so both numbers belong
  # to the same snapshot (line 2: column 2 = total, column 3 = used).
  read -r total used < <(free -m | awk 'NR == 2 { print $2, $3 }')
  if ! is_uint "${total}" || ! is_uint "${used}" || (( total == 0 )); then
    printf 'UNKNOWN - could not read memory statistics from free\n'
    exit "${STATE_UNKNOWN}"
  fi

  free_mb=$(( total - used ))
  # Integer division rounds down, same as truncating at the decimal point.
  percent=$(( free_mb * 100 / total ))

  if (( percent <= critical )); then
    printf 'CRITICAL - %s MB (%s%%) Free Memory\n' "${free_mb}" "${percent}"
    exit "${STATE_CRITICAL}"
  fi
  if (( percent <= warning )); then
    printf 'WARNING - %s MB (%s%%) Free Memory\n' "${free_mb}" "${percent}"
    exit "${STATE_WARNING}"
  fi
  printf 'OK - %s MB (%s%%) Free Memory\n' "${free_mb}" "${percent}"
  exit "${STATE_OK}"
}

main "$@"




二、监控客户端内存使用情况

1、上传监控脚本 check_mem 到/usr/local/nagios/libexec

1
2
# chown -R nagios.nagios check_mem
# chmod +x check_mem




2、修改nrpe.cfg

1
2
3
4
5
6
7
8
9
# vim /usr/local/nagios/etc/nrpe.cfg
command=/usr/local/nagios/libexec/check_users -w 3 -c 5
command=/usr/local/nagios/libexec/check_load -w 15,10,5 -c 30,25,20
command=/usr/local/nagios/libexec/check_disk -w 10% -c 5% -p /dev/xvda
command=/usr/local/nagios/libexec/check_procs -w 5 -c 10 -s Z
command=/usr/local/nagios/libexec/check_procs -w 150 -c 200
command=/usr/local/nagios/libexec/check_disk -w 10% -c 5% -p /dev/xvdb2
command=/usr/local/nagios/libexec/check_swap -w 20% -c 10%
command[check_mem]=/usr/bin/sudo /usr/local/nagios/libexec/check_mem -w 20 -c 10   #增加此行




3、在nagios服务器端增加监控服务

1
2
3
4
5
6
7
# vim /usr/local/nagios/etc/servers/192.168.200.111.cfg
# Service "check_mem" for host 192.168.200.111, based on generic-service.
# The check is delegated to the client through check_nrpe, which is asked to
# run the command named check_mem from the client's nrpe.cfg.
# NOTE(review): assumes a check_nrpe command is already defined on the
# Nagios server - confirm.
define service{
      use                           generic-service
      host_name                     192.168.200.111
      service_description             check_mem
      check_command                   check_nrpe!check_mem
      }




三、排错

1、NRPE: Unable to read output
(1)为nagios用户增加sudo权限

1
2
# visudo
nagios ALL=(ALL) NOPASSWD: /usr/local/nagios/libexec/check_mem




(2)注释掉以下行,表示不需要控制终端

1
2
# visudo
#Defaults    requiretty





四、nagios监控mysql
1、check_mysql
    nagios监控mysql使用的是 check_mysql 这个插件,需要在nagios服务器上先安装mysql-devel,然后再重新编译安装nagios-plugins,这样才会出现check_mysql。否则即使copy了一份,也照样用不了。
2、编译或重新编译 nagios-plugins

1
2
3
4
#yum -y install mysql-devel
#cd nagios-plugins-2.0.3
#./configure --with-nagios-user=nagios --with-nagios-group=nagios
#make && make install




3、查看 check_mysql

1
# ls /usr/local/nagios/libexec/check_mysql




4、建立专用数据库

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
# mysql -uroot -p
mysql> create database nagios_monitor;

mysql> grant select on nagios_monitor.* to nagios@'%' identified by '123qaz!@#';
Query OK, 0 rows affected (0.00 sec)

mysql> flush privileges;
Query OK, 0 rows affected (0.00 sec)

mysql> select User,Password,Host from mysql.user;
+--------+-------------------------------------------+--------------+
| User   | Password                                  | Host         |
+--------+-------------------------------------------+--------------+
| root   | *B9627CB37815863D1E98D0C41E0233A772355E2B | localhost    |
| root   | *B9627CB37815863D1E98D0C41E0233A772355E2B | 127.0.0.1    |
| root   | *B9627CB37815863D1E98D0C41E0233A772355E2B | ::1          |
| cacti  | *BC3E1F14C7940F9C8BCDB05A38385754BB55CD64 | localhost    |
| nagios | *BC3E1F14C7940F9C8BCDB05A38385754BB55CD64 | %            |
+--------+-------------------------------------------+--------------+
8 rows in set (0.00 sec)




5、check 一下

1
2
3
4
5
6
7
8
# /usr/local/nagios/libexec/check_mysql -H 192.168.200.105 -unagios -dnagios_monitor -p '123qaz!@#'
# 报了一个错
/usr/local/nagios/libexec/check_mysql: error while loading shared libraries: libmysqlclient.so.18: cannot open shared object file: No such file or directory
# 解决:
ln -sv /usr/local/mysql/lib/libmysqlclient.so.18 /usr/lib64/libmysqlclient.so.18
# 再重新测试
# /usr/local/nagios/libexec/check_mysql -H 192.168.200.111 -unagios -dnagios_monitor -p '123qaz!@#'
Uptime: 13991  Threads: 5  Questions: 1242101  Slow queries: 0  Opens: 159  Flush tables: 1  Open tables: 60  Queries per second avg: 88.778|Connections=315c;;; Open_files=85;;; Open_tables=60;;; Qcache_free_memory=16285768;;; Qcache_hits=1210926c;;; Qcache_inserts=16654c;;; Qcache_lowmem_prunes=0c;;; Qcache_not_cached=2c;;; Qcache_queries_in_cache=283;;; Queries=1242101c;;; Questions=1242101c;;; Table_locks_waited=2c;;; Threads_connected=5;;; Threads_running=1;;; Uptime=13991c;;;




6、监控localhost

(1)修改 commands.cfg

1
2
3
4
5
# vim /usr/local/nagios/etc/objects/commands.cfg
# Command object "check_mysql": runs the check_mysql plugin against the
# address of the host being checked ($HOSTADDRESS$), logging in as user
# "nagios" to database "nagios_monitor".
# NOTE(review): the password is embedded in plain text on the command line;
# consider moving it to a protected resource-file macro - confirm what the
# installation supports.
define command{
      command_name check_mysql
      command_line $USER1$/check_mysql -H $HOSTADDRESS$ -unagios -dnagios_monitor -p123qaz!@#
}




(2)修改 localhost.cfg

1
2
3
4
5
6
7
# vim /usr/local/nagios/etc/objects/localhost.cfg
# Service "check_mysql" on localhost, based on the local-service template.
# It invokes the check_mysql command without arguments; the connection
# parameters are fixed in that command's command_line.
define service{
      use                           local-service
      host_name                     localhost
      service_description             check_mysql
      check_command                   check_mysql
      }




(3)重启 nagios


1
# service nagios restart




7、监控客户端
(1)check 一下


1
# /usr/local/nagios/libexec/check_mysql -H 192.168.200.111 -unagios -dnagios_monitor -p'123qaz!@#'




(2)客户端修改 nrpe.cfg

1
2
# vim /usr/local/nagios/etc/nrpe.cfg
command[check_mysql]=/usr/local/nagios/libexec/check_mysql -H 192.168.200.111 -unagios -dnagios_monitor -p123qaz!@#




(3)重启 nrpe

1
2
# killall nrpe
# /usr/local/nagios/bin/nrpe -c /usr/local/nagios/etc/nrpe.cfg -d




(4)服务端定义服务

1
2
3
4
5
6
7
# vim /usr/local/nagios/etc/servers/192.168.200.111.cfg
# Service "check_mysql" for host 192.168.200.111, based on generic-service.
# The check is delegated to the client through check_nrpe, which is asked to
# run the command named check_mysql from the client's nrpe.cfg.
# NOTE(review): assumes a check_nrpe command is already defined on the
# Nagios server - confirm.
define service{
      use                           generic-service
      host_name                     192.168.200.111
      service_description             check_mysql
      check_command                   check_nrpe!check_mysql
      }




(5)重启 nagios 服务


1
# service nagios restart



页: [1]
查看完整版本: nagios监控mysql(check_mysql)及内存使用率(check_mem)