一、监控本地(localhost)内存
1、上传监控脚本 check_mem 到/usr/local/nagios/libexec
1
2
|
# chown -R nagios.nagios check_mem
# chmod +x check_mem
|
2、修改commands配置
1
2
3
4
5
|
# vim /usr/local/nagios/etc/objects/commands.cfg
define command {
    command_name    check_mem
    command_line    $USER1$/check_mem -w $ARG1$ -c $ARG2$
}
|
3、修改localhost.cfg
1
2
3
4
5
6
7
|
# vim /usr/local/nagios/etc/objects/localhost.cfg
define service{
    use                     local-service
    host_name               localhost
    service_description     check_mem
    check_command           check_mem!20!10
}
|
4、重启nagios服务
1
|
# service nagios restart |
5、check_mem 脚本
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
|
#!/bin/bash
#
# check_mem - Nagios plugin that reports the percentage of free memory.
#
# Usage:
#   check_mem [-w|--warning] <percent free> [-c|--critical] <percent free>
#
# "Free" is computed as (total - used), both taken in MB from the second
# line of `free -m`. The result is compared against the two thresholds:
#   percent <= critical  -> CRITICAL (exit 2)
#   percent <= warning   -> WARNING  (exit 1)
#   otherwise            -> OK       (exit 0)
# Any invocation or data-collection problem exits 3 (UNKNOWN) so that the
# monitoring server never mistakes a broken check for a healthy host.

readonly STATE_OK=0
readonly STATE_WARNING=1
readonly STATE_CRITICAL=2
readonly STATE_UNKNOWN=3

readonly PROGNAME=${0##*/}
# Command line exactly as invoked, captured before argument parsing shifts it away.
readonly INVOCATION="${PROGNAME} $*"
readonly USAGE="${PROGNAME} [-w|--warning]<percent free> [-c|--critical]<percent free>"
readonly THRESHOLD_USAGE="WARNING threshold must be greater than CRITICAL: ${INVOCATION}"

#######################################
# Print an error message plus the usage line and exit UNKNOWN.
# The message goes first on stdout because that is the line the
# monitoring server displays as the check result.
# Arguments: $1 - message to print
#######################################
usage_error() {
  printf '%s\nUsage: %s\n' "$1" "$USAGE"
  exit "$STATE_UNKNOWN"
}

main() {
  local warning="" critical=""
  local total="" used="" free_mb percent

  # Both options and their values are mandatory: at least four words.
  (( $# >= 4 )) || usage_error "Wrong Syntax: ${INVOCATION}"

  # Read the thresholds; unrecognised words are skipped.
  while (( $# > 0 )); do
    case "$1" in
      -w | --warning)
        warning=${2-}
        (( $# > 1 )) && shift
        ;;
      -c | --critical)
        critical=${2-}
        (( $# > 1 )) && shift
        ;;
    esac
    shift
  done

  # Thresholds must be plain non-negative integers before they are used
  # in arithmetic.
  if [[ ! "$warning" =~ ^[0-9]+$ || ! "$critical" =~ ^[0-9]+$ ]]; then
    usage_error "Thresholds must be whole numbers: ${INVOCATION}"
  fi
  # Force base 10 so a value such as "08" is not parsed as invalid octal.
  warning=$(( 10#$warning ))
  critical=$(( 10#$critical ))

  # WARNING must trigger strictly before CRITICAL.
  (( warning > critical )) || usage_error "$THRESHOLD_USAGE"

  # One call to free(1); columns 2 and 3 of its second line are the total
  # and used figures in MB. LC_ALL=C keeps the layout locale-independent.
  read -r total used < <(LC_ALL=C free -m | awk 'NR == 2 { print $2, $3 }')
  if [[ ! "$total" =~ ^[0-9]+$ || ! "$used" =~ ^[0-9]+$ ]] || (( total == 0 )); then
    echo "UNKNOWN - unable to read memory statistics from free"
    exit "$STATE_UNKNOWN"
  fi

  free_mb=$(( total - used ))
  # Integer percentage of free memory, truncated toward zero.
  percent=$(( free_mb * 100 / total ))

  if (( percent <= critical )); then
    echo "CRITICAL - $free_mb MB ($percent%) Free Memory"
    exit "$STATE_CRITICAL"
  fi
  if (( percent <= warning )); then
    echo "WARNING - $free_mb MB ($percent%) Free Memory"
    exit "$STATE_WARNING"
  fi
  echo "OK - $free_mb MB ($percent%) Free Memory"
  exit "$STATE_OK"
}

main "$@"
二、监控客户端内存使用情况
1、上传监控脚本 check_mem 到/usr/local/nagios/libexec
1
2
|
# chown -R nagios.nagios check_mem
# chmod +x check_mem
|
2、修改nrpe.cfg
1
2
3
4
5
6
7
8
9
|
# vim /usr/local/nagios/etc/nrpe.cfg
command[check_users]=/usr/local/nagios/libexec/check_users -w 3 -c 5
command[check_load]=/usr/local/nagios/libexec/check_load -w 15,10,5 -c 30,25,20
command[check_xvda]=/usr/local/nagios/libexec/check_disk -w 10% -c 5% -p /dev/xvda
command[check_zombie_procs]=/usr/local/nagios/libexec/check_procs -w 5 -c 10 -s Z
command[check_total_procs]=/usr/local/nagios/libexec/check_procs -w 150 -c 200
command[check_xvdb2]=/usr/local/nagios/libexec/check_disk -w 10% -c 5% -p /dev/xvdb2
command[check_swap]=/usr/local/nagios/libexec/check_swap -w 20% -c 10%
command[check_mem]=/usr/bin/sudo /usr/local/nagios/libexec/check_mem -w 20 -c 10 #增加此行
|
3、在nagios服务器端增加监控服务
1
2
3
4
5
6
7
|
# vim /usr/local/nagios/etc/servers/192.168.200.111.cfg
define service{
    use                     generic-service
    host_name               192.168.200.111
    service_description     check_mem
    check_command           check_nrpe!check_mem
}
|
三、排错
1、NRPE: Unable to read output
(1)为nagios用户增加sudo权限
1
2
|
# visudo
nagios ALL=(ALL) NOPASSWD: /usr/local/nagios/libexec/check_mem
|
(2)注释掉以下行,表示不需要控制终端
1
2
|
# visudo
#Defaults requiretty
|
四、nagios监控mysql
1、check_mysql
nagios监控mysql使用的是 check_mysql 这个插件,需要在nagios服务器上先安装mysql-devel,然后再重新安装nagios-plugin,这样才会出现check_mysql。否则即使copy了一份,也照样用不了。
2、编译或重新编译 nagios-plugin
1
2
3
4
|
# yum -y install mysql-devel
# cd nagios-plugins-2.0.3
# ./configure --with-nagios-user=nagios --with-nagios-group=nagios
# make && make install
|
3、查看 check_mysql
1
|
# ls /usr/local/nagios/libexec/check_mysql |
4、建立专用数据库
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
|
# mysql -uroot -p
mysql> create database nagios_monitor;
mysql> grant select on nagios_monitor.* to nagios@'%' identified by '123qaz!@#';
Query OK, 0 rows affected (0.00 sec)
mysql> flush privileges;
Query OK, 0 rows affected (0.00 sec)
mysql> select User,Password,Host from mysql.user;
+--------+-------------------------------------------+--------------+
| User   | Password                                  | Host         |
+--------+-------------------------------------------+--------------+
| root   | *B9627CB37815863D1E98D0C41E0233A772355E2B | localhost    |
| root   | *B9627CB37815863D1E98D0C41E0233A772355E2B | 127.0.0.1    |
| root   | *B9627CB37815863D1E98D0C41E0233A772355E2B | ::1          |
| cacti  | *BC3E1F14C7940F9C8BCDB05A38385754BB55CD64 | localhost    |
| nagios | *BC3E1F14C7940F9C8BCDB05A38385754BB55CD64 | %            |
+--------+-------------------------------------------+--------------+
8 rows in set (0.00 sec)
|
5、check 一下
1
2
3
4
5
6
7
8
|
# /usr/local/nagios/libexec/check_mysql -H 192.168.200.105 -unagios -dnagios_monitor -p 123qaz!@#
# 报了一个错
/usr/local/nagios/libexec/check_mysql: error while loading shared libraries: libmysqlclient.so.18: cannot open shared object file: No such file or directory
# 解决:
ln -sv /usr/local/mysql/lib/libmysqlclient.so.18 /usr/lib64/libmysqlclient.so.18
# 再重新测试
# /usr/local/nagios/libexec/check_mysql -H 192.168.200.111 -unagios -dnagios_monitor -p 123qaz!@#
Uptime: 13991 Threads: 5 Questions: 1242101 Slow queries: 0 Opens: 159 Flush tables: 1 Open tables: 60 Queries per second avg: 88.778|Connections=315c;;; Open_files=85;;; Open_tables=60;;; Qcache_free_memory=16285768;;; Qcache_hits=1210926c;;; Qcache_inserts=16654c;;; Qcache_lowmem_prunes=0c;;; Qcache_not_cached=2c;;; Qcache_queries_in_cache=283;;; Queries=1242101c;;; Questions=1242101c;;; Table_locks_waited=2c;;; Threads_connected=5;;; Threads_running=1;;; Uptime=13991c;;;
|
6、监控localhost
(1)修改 commands.cfg
1
2
3
4
5
|
# vim /usr/local/nagios/etc/objects/commands.cfg
define command {
    command_name    check_mysql
    command_line    $USER1$/check_mysql -H $HOSTADDRESS$ -unagios -dnagios_monitor -p123qaz!@#
}
|
(2)修改 localhost.cfg
1
2
3
4
5
6
7
|
# vim /usr/local/nagios/etc/objects/localhost.cfg
define service{
    use                     local-service
    host_name               localhost
    service_description     check_mysql
    check_command           check_mysql
}
|
(3)重启 nagios
1
|
# service nagios restart |
7、监控客户端
(1)check 一下
1
|
# /usr/local/nagios/libexec/check_mysql -H 192.168.200.111 -unagios -dnagios_monitor -p123qaz!@# |
(2)客户端修改 nrpe.cfg
1
2
|
# vim /usr/local/nagios/etc/nrpe.cfg
command[check_mysql]=/usr/local/nagios/libexec/check_mysql -H 192.168.200.111 -unagios -dnagios_monitor -p123qaz!@#
|
(3)重启 nrpe
1
2
|
# killall nrpe
# /usr/local/nagios/bin/nrpe -c /usr/local/nagios/etc/nrpe.cfg -d
|
(4)服务端定义服务
1
2
3
4
5
6
7
|
# vim /usr/local/nagios/etc/servers/192.168.200.111.cfg
define service{
    use                     generic-service
    host_name               192.168.200.111
    service_description     check_mysql
    check_command           check_nrpe!check_mysql
}
|
(5)重启 nagios 服务
1
|
# service nagios restart |
本文转自 nmshuishui 51CTO博客,原文链接:http://blog.51cto.com/nmshuishui/1553445,如需转载请自行联系原作者