nagios监控服务器 10.1.7.110
linux客户端服 10.1.7.120
windows客户端 10.1.7.119
1创建nagios组和账号
root@nagios ~]# useradd -m nagios
[root@nagios ~]# groupadd nagcmd
[root@nagios ~]# groupadd nagcmd
[root@nagios ~]# usermod -a -G nagcmd nagios
[root@nagios ~]# usermod -a -G nagcmd apache
2编译安装
[root@nagios ~]# tar xvf nagios-3.2.0.tar.gz
[root@nagios ~]# cd nagios-3.2.0
[root@nagios nagios-3.2.0]# less Makefile
[root@nagios nagios-3.2.0]# ./configure --with-command-group=nagcmd\ --with-nagios-user=nagios\ --with-nagios-group=nagios
[root@nagios nagios-3.2.0]# make all
[root@nagios nagios-3.2.0]# make install
[root@nagios nagios-3.2.0]# make install-init
[root@nagios nagios-3.2.0]# make install-config
[root@nagios nagios-3.2.0]# make install-commandmode
[root@nagios nagios-3.2.0]# make install-webconf
3为nagios设置web验证密码
root@nagios nagios-3.2.0]# htpasswd -c usr/local/nagios/etc/htpasswd.users nagiosadmin
5设置nagios的开机启动
root@nagios ~]# chkconfig --add nagios
[root@nagios ~]# chkconfig nagios on
6修改selinux
[root@nagios nagios-3.2.0]# cat /etc/sysconfig/selinux
# This file controls the state of SELinux on the system.
# SELINUX= disable:
二 安装nagios的插件 nagios-plugin
[root@nagios ~]# tar xvf nagios-plugins-1.4.14.tar.gz
[root@nagios ~]# cd nagios-plugins-1.4.14
[root@nagios nagios-plugins-1.4.14]# ./configure --prefix=/usr/local/nagios/ --with-nagios-user=nagios --with-nagios-group=nagios
[root@nagios nagios-plugins-1.4.14]# make && make install
检查主机是佛存在
[root@nagios ~]# cd /usr/local/nagios/etc/
[root@nagios etc]# ls -l
总计 76
-rw-rw-r-- 1 nagios nagios 11408 05-18 16:46 cgi.cfg
-rw-r--r-- 1 root root 26 05-18 19:16 htpasswd.users
-rw-rw-r-- 1 nagios nagios 44020 05-18 18:53 nagios.cfg
-rw-r--r-- 1 nagios nagios 7207 05-18 19:33 nrpe.cfg
drwxrwxr-x 2 nagios nagios 4096 05-18 20:06 objects
-rw-rw---- 1 nagios nagios 1340 05-18 16:46 resource.cfg
[root@nagios etc]#
2主配置文件nagios。cfg配置
[root@nagios etc]# vim nagios.cfg
cfg_file=/usr/local/nagios/etc/objects/commands.cfg
cfg_file=/usr/local/nagios/etc/objects/contacts.cfg
cfg_file=/usr/local/nagios/etc/objects/contactgroups.cfg
cfg_file=/usr/local/nagios/etc/objects/hosts.cfg
cfg_file=/usr/local/nagios/etc/objects/hostgroups.cfg
cfg_file=/usr/local/nagios/etc/objects/services.cfg
cfg_file=/usr/local/nagios/etc/objects/timeperiods.cfg
cfg_file=/usr/local/nagios/etc/objects/templates.cfg
# Definitions for monitoring the local (Linux) host
#cfg_file=/usr/local/nagios/etc/objects/localhost.cfg //注释掉此行
3主机定义文件配置
define host{
host_name Nagios-server
alias Nagios server
address 10.1.7.110
check_command check-host-alive
check_interval 5
retry_interval 1
max_check_attempts 5
check_period 24x7
process_perf_data 0
retain_nonstatus_information 0
contact_groups sagroup
notification_interval 30
notification_period 24x7
notification_options d,u,r
}
define host{
host_name client-server
alias client server
address 10.1.7.120
check_command check-host-alive
check_interval 5
retry_interval 1
max_check_attempts 5
check_period 24x7
process_perf_data 0
retain_nonstatus_information 0
contact_groups sagroup
notification_interval 30
notification_period 24x7
notification_options d,u,r
}
3主机组定义文件配置
[root@nagios etc]# vim objects/hostgroups.cfg
define hostgroup {
hostgroup_name Sysem-Admin
alias system Admin
members Nagios-server,client-server,windows-server
}
~
4服务定义文件配置
[root@nagios etc]# vim objects/services.cfg
define service{
host_name Nagios-server
service_description check-host-alive
check_period 24x7
max_check_attempts 4
normal_check_interval 3
retry_check_interval 2
contact_groups sagroup
notification_interval 10
notification_period 24x7
notification_options w,c,u,r
check_command check-host-alive
}
define service{
host_name client-server
service_description check-host-alive
check_period 24x7
max_check_attempts 4
normal_check_interval 3
retry_check_interval 2
contact_groups sagroup
notification_interval 10
notification_period 24x7
notification_options w,c,u,r
check_command check-host-alive
}
5联系人定义文件配置
[root@nagios etc]# vim objects/contacts.cfg
define contact{
contact_name nagiosadmin ; Short name of user
use generic-contact ; Inherit default values from generic-contact template (defined above)
alias Nagios Admin ; Full name of user
service_notification_period 24x7
host_notification_period 24x7
service_notification_options w,u,c,r
host_notification_options d,u,r
service_notification_commands notify-service-by-email
host_notification_commands notify-host-by-email
email [email protected]
6联系组定义文件配置
[root@nagios etc]# vim objects/contactgroups.cfg
define contactgroup {
contactgroup_name sagroup
alias system administrator group
members nagiosadmin
}
7修改目录所有者
~
[root@nagios etc]# chown -R nagios.nagios objects/
8检查配置文件是否正却
[root@nagios etc]# /usr/local/nagios/bin/nagios -v /usr/local/nagios/etc/nagios.cfg
Total Warnings: 0
Total Errors: 0
9启动nagios服务
[root@nagios etc]# etc/init.d/httpd restart
[root@nagios etc]# /etc/init.d/nagios start
10 测试功能
http://10.1.7.110/nagios/ 输入 nagiosadmin 密码 accp
三 使用nagios监控linux客户端
1 nagios监控服务器的配置
[root@nagios ~]# tar zxvf nrpe-2.12.tar.gz
[root@nagios ~]# cd nrpe-2.12
[root@nagios nrpe-2.12]# ./configure && make all
[root@nagios nrpe-2.12]# make install-plugin
[root@nagios nrpe-2.12]# make install-daemon
[root@nagios nrpe-2.12]# make install-daemon-config
[root@nagios nrpe-2.12]# make install-xinetd
2 配置
[root@nagios nrpe-2.12]# vim /etc/xinetd.d/nrpe
server = /usr/local/nagios/bin/nrpe
server_args = -c /usr/local/nagios/etc/nrpe.cfg --inetd
log_on_failure += USERID
disable = no
only_from = 127.0.0.1,10.1.7.120,10.1.7.119
3 添加端口
[root@nagios nrpe-2.12]# vim /etc/services
nrpe 5666/tcp #nrpe
4 重新启动 xinetd服务
[root@nagios nrpe-2.12]# /etc/init.d/xinetd restart
[root@nagios nrpe-2.12]# netstat -na | grep 5666
以上步骤要到客户机上做 1--4
5修改配置文件commands.cfg加入对nrpe的支持
[root@nagios ~]# vim /usr/local/nagios/etc/objects/commands.cfg
#nrpe set
define command {
command_name check_nrpe
command_line /usr/local/nagios/libexec/check_nrpe -H $ HOSTADDRESS$ -c $ ARG1$
}
检查nrpe命令那些可用
[root@nagios ~]# cat /usr/local/nagios/etc/nrpe.cfg
command[check_users]=/usr/local/nagios/libexec/check_users -w 5 -c 10
command[check_load]=/usr/local/nagios/libexec/check_load -w 15,10,5 -c 30,25,20
command[check_hda1]=/usr/local/nagios/libexec/check_disk -w 20% -c 10% -p /dev/hda1
command[check_zombie_procs]=/usr/local/nagios/libexec/check_procs -w 5 -c 10 -s Z
command[check_total_procs]=/usr/local/nagios/libexec/check_procs -w 150 -c 200
7 使用命令监控客户端
[root@nagios ~]# vim /usr/local/nagios/etc/objects/services.cfg
define service{
host_name Nagios-server
service_description check-users
check_period 24x7
max_check_attempts 4
normal_check_interval 3
retry_check_interval 2
contact_groups sagroup
notification_interval 10
notification_period 24x7
notification_options w,c,u,r
check_command check-nrpe!check_users
}
define service{
host_name Nagios-server
service_description check-load
check_period 24x7
max_check_attempts 4
normal_check_interval 3
retry_check_interval 2
contact_groups sagroup
notification_interval 10
notification_period 24x7
notification_options w,c,u,r
check_command check-nrpe!check_load
}
define service{
host_name Nagios-server
service_description check-total-procs
check_period 24x7
max_check_attempts 4
normal_check_interval 3
retry_check_interval 2
contact_groups sagroup
notification_interval 10
notification_period 24x7
notification_options w,c,u,r
check_command check-total_procs
}