在nagios服务端(nhserver2,192.168.5.10)安装nrpe
tar xvfz nrpe-2.13.tar.gz
cd nrpe-2.13
./configure
make all
make install-plugin
make install-daemon
make install-daemon-config
yum install xinetd
make install-xinetd
[root@nhserver2 ~]# vim /usr/local/nagios/etc/nrpe.cfg
allowed_hosts=127.0.0.1,192.168.5.10
[root@nhserver2 ~]# vim /etc/xinetd.d/nrpe
# default: on
# description: NRPE (Nagios Remote Plugin Executor)
#
# xinetd service entry that starts /usr/local/nagios/bin/nrpe in --inetd
# mode, as user/group nagios, for stream connections on port 5666.
#
# xinetd only treats a line as a comment when '#' is its first non-blank
# character. A trailing "# ..." after a value is read as part of the value,
# so every note in this file sits on a line of its own.
#
# NOTE(review): xinetd normally resolves the service name through
# /etc/services; confirm that an "nrpe 5666/tcp" entry exists there.
service nrpe
{
        flags           = REUSE
        socket_type     = stream
        port            = 5666
        wait            = no
        user            = nagios
        group           = nagios
        server          = /usr/local/nagios/bin/nrpe
        server_args     = -c /usr/local/nagios/etc/nrpe.cfg --inetd
        log_on_failure  += USERID
        disable         = no
        # Client addresses allowed to connect. Original note: this IP can be
        # left unchanged, it is the local machine.
        only_from       = 127.0.0.1 192.168.5.10
}
[root@nhserver2 ~]# /usr/local/nagios/libexec/check_nrpe -H localhost
NRPE v2.12
[root@nhserver2 ~]# /usr/local/nagios/libexec/check_nrpe -H 192.168.5.10 #192.168.5.10为nagios服务器的ip
NRPE v2.12
[root@nhserver2 ~]# /usr/local/nagios/libexec/check_nrpe -H 192.168.5.110 #192.168.5.110还未开机
Connection refused or timed out
[root@nhserver2 ~]# /usr/local/nagios/libexec/check_nrpe -H 192.168.5.110 #192.168.5.110开机
CHECK_NRPE: Error - Could not complete SSL handshake.
[root@nhserver2 ~]# service xinetd restart #重启nrpe服务
=========================================================================================================================
在192.168.5.110被监控端安装nrpe
1.安装nrpe依赖包
yum -y install gcc glibc glibc-common openssl openssl-devel
2.安装nagios-plugin
useradd nagios
wget -O nagios-plugins-1.4.15.tar.gz http://sourceforge.net/projects/nagiosplug/files/nagiosplug/1.4.15/nagios-plugins-1.4.15.tar.gz/download
tar zxf nagios-plugins-1.4.15.tar.gz && cd nagios-plugins-1.4.15
./configure --with-nagios-user=nagios --with-nagios-group=nagios
make
make install
chown -R nagios.nagios /usr/local/nagios
3.安装nrpe
wget http://nchc.dl.sourceforge.net/project/nagios/nrpe-2.x/nrpe-2.12/nrpe-2.12.tar.gz
tar zxf nrpe-2.12.tar.gz && cd nrpe-2.12
./configure
make all
make install-plugin
make install-daemon
make install-daemon-config
4.启动nrpe并设置开机自启动
/usr/local/nagios/bin/nrpe -c /usr/local/nagios/etc/nrpe.cfg -d
echo "/usr/local/nagios/bin/nrpe -c /usr/local/nagios/etc/nrpe.cfg -d" >> /etc/rc.d/rc.local
[root@nhserver1 ~]# vim /usr/local/nagios/etc/nrpe.cfg
# 将nagios的服务端IP加上(nrpe.cfg不支持行尾注释,注释必须单独成行)
allowed_hosts=127.0.0.1,192.168.5.10
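(可选)如果被监控端改用xinetd方式运行nrpe,而不是第4步的守护进程方式,需先执行 yum install xinetd 和 make install-xinetd,再编辑下面的配置;两种方式都监听5666端口,只能二选一
[root@nhserver1 ~]# vim /etc/xinetd.d/nrpe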
# default: on
# description: NRPE (Nagios Remote Plugin Executor)
#
# xinetd service entry that starts /usr/local/nagios/bin/nrpe in --inetd
# mode, as user/group nagios, for stream connections on port 5666.
#
# xinetd only treats a line as a comment when '#' is its first non-blank
# character. A trailing "# ..." after a value is read as part of the value,
# so every note in this file sits on a line of its own.
service nrpe
{
        flags           = REUSE
        socket_type     = stream
        port            = 5666
        wait            = no
        user            = nagios
        group           = nagios
        server          = /usr/local/nagios/bin/nrpe
        server_args     = -c /usr/local/nagios/etc/nrpe.cfg --inetd
        log_on_failure  += USERID
        disable         = no
        # Client addresses allowed to connect; add the Nagios server's IP
        # (192.168.5.10) here.
        only_from       = 127.0.0.1 192.168.5.10
}
============== 在nagios服务端测试 ====================
[root@nhserver2 ~]# /usr/local/nagios/libexec/check_nrpe -H 192.168.5.110
NRPE v2.12
=================================================================
要在被监控端192.168.5.110加入自定义的脚本
[root@nhserver1 libexec]# vim /usr/local/nagios/libexec/nh_check_users
#!/bin/bash
# for nrpe check user
#
# NRPE plugin: counts the lines printed by `who` and maps the count to a
# Nagios status.
#
# Thresholds:  count <= 3  -> OK
#              count 4..6  -> WARNING
#              count > 6   -> CRITICAL
# Output:      one status line on stdout.
# Exit status: 0 OK, 1 WARNING, 2 CRITICAL, 3 UNKNOWN (count unavailable).

# Without pipefail the pipeline status is that of `wc`, so a failing or
# missing `who` would be reported as "0 users" and therefore OK.
set -o pipefail

if ! user_count=$(who | wc -l); then
  echo "UNKNOWN,cannot determine current user count"
  exit 3
fi

if (( user_count <= 3 )); then
  echo "OK,current user is.$user_count"
  exit 0
elif (( user_count > 6 )); then
  echo "CRITICAL,current user is.$user_count"
  exit 2
else
  echo "WARNING,current user is.$user_count"
  exit 1
fi
将该脚本的属主和属组设置为nagios,并赋予可执行权限
[root@nhserver1 libexec]# chown nagios.nagios /usr/local/nagios/libexec/nh_check_users
[root@nhserver1 libexec]# chmod 755 /usr/local/nagios/libexec/nh_check_users
在NRPE上加入该自定义命令
[root@nhserver1 libexec]# vim /usr/local/nagios/etc/nrpe.cfg
command[nh_check_users]=/usr/local/nagios/libexec/nh_check_users
在服务端192.168.5.10上测试,直接使用命令行
[root@nhserver2 libexec]# /usr/local/nagios/libexec/check_nrpe -H 192.168.5.110 -c nh_check_users
OK,current user is.1
=========================================================================
在服务端192.168.5.10的nagios中加入对自定义脚本的监控
[root@nhserver2 objects]# cd /usr/local/nagios/etc/objects
[root@nhserver2 objects]# vim hosts_192.168.5.110.cfg
# Host object for the monitored machine 192.168.5.110; host_name, alias and
# address are all set to that IP.
# Remaining settings are inherited from the "linux-server" template, which
# is not defined in this file.
define host{
use linux-server
host_name 192.168.5.110
alias 192.168.5.110
address 192.168.5.110
}
# Host group "nh_linuxs"; its only member listed here is host 192.168.5.110.
define hostgroup{
hostgroup_name nh_linuxs
alias nh_linuxs
members 192.168.5.110
}
# Service on host 192.168.5.110 that runs the "check-host-alive" command.
# Inherits from the "local-service" template (not defined in this file).
# max_check_attempts is 5; normal/retry check intervals are 3 and 2 and the
# notification interval is 10, all in Nagios time units (presumably minutes
# with the default interval_length - confirm in nagios.cfg).
# Checks and notifications both use the "24x7" time period.
define service{
use local-service
host_name 192.168.5.110
service_description check-host-alive
check_command check-host-alive
max_check_attempts 5
normal_check_interval 3
retry_check_interval 2
check_period 24x7
notification_interval 10
notification_period 24x7
}
# Service "SSH" on host 192.168.5.110, checked with the "check_ssh" command.
# Inherits from the "local-service" template (not defined in this file).
# max_check_attempts is 5; normal/retry check intervals are 3 and 2 and the
# notification interval is 10, all in Nagios time units (presumably minutes
# with the default interval_length - confirm in nagios.cfg).
# Checks and notifications both use the "24x7" time period.
define service{
use local-service
host_name 192.168.5.110
service_description SSH
check_command check_ssh
max_check_attempts 5
normal_check_interval 3
retry_check_interval 2
check_period 24x7
notification_interval 10
notification_period 24x7
}
# Service "check_nrpe_check_users" on host 192.168.5.110.
# The check command is "check_nrpe" with the single argument
# "nh_check_users", the same name used for the command[nh_check_users]
# entry added to nrpe.cfg on the monitored host.
# NOTE(review): a "check_nrpe" command object is not defined in this file;
# confirm one exists (e.g. in commands.cfg) that passes the argument to
# check_nrpe via -c.
# Inherits from the "local-service" template (not defined in this file).
# Checks and notifications both use the "24x7" time period.
define service{
use local-service
host_name 192.168.5.110
service_description check_nrpe_check_users
check_command check_nrpe!nh_check_users
max_check_attempts 5
normal_check_interval 3
retry_check_interval 2
check_period 24x7
notification_interval 10
notification_period 24x7
}
执行下面的reload重新加载配置后,过一会儿在nagios中就能观察到check_nrpe_check_users自定义服务的状态了,"OK,current user is.1".
[root@nhserver2 objects]# service nagios reload
Host | Service | Status | Last Check | Duration | Attempt | Status Information
192.168.5.110
SSH
OK 04-04-2014 20:22:01 0d 0h 1m 56s 1/5 SSH OK - OpenSSH_5.3 (protocol 2.0)
check-host-alive
OK 04-04-2014 20:22:50 0d 0h 2m 56s 1/5 PING OK - Packet loss = 0%, RTA = 0.61 ms
check_nrpe_check_users
OK 04-04-2014 20:23:38 0d 0h 0m 19s 1/5 OK,current user is.1