linux 5.4 nagios监控搭建

nagios监控服务器   10.1.7.110

linux客户端服      10.1.7.120

windows客户端      10.1.7.119

1创建nagios组和账号

root@nagios ~]# useradd -m nagios
[root@nagios ~]# groupadd nagcmd
[root@nagios ~]# groupadd nagcmd
[root@nagios ~]# usermod -a -G nagcmd nagios
[root@nagios ~]# usermod -a -G nagcmd apache

2编译安装
[root@nagios ~]# tar xvf nagios-3.2.0.tar.gz
[root@nagios ~]# cd nagios-3.2.0
[root@nagios nagios-3.2.0]# less Makefile
[root@nagios nagios-3.2.0]# ./configure --with-command-group=nagcmd\ --with-nagios-user=nagios\ --with-nagios-group=nagios
[root@nagios nagios-3.2.0]# make all
[root@nagios nagios-3.2.0]# make install
[root@nagios nagios-3.2.0]# make install-init
[root@nagios nagios-3.2.0]# make install-config
[root@nagios nagios-3.2.0]# make install-commandmode
[root@nagios nagios-3.2.0]# make install-webconf

3为nagios设置web验证密码
root@nagios nagios-3.2.0]# htpasswd -c usr/local/nagios/etc/htpasswd.users nagiosadmin

5设置nagios的开机启动
root@nagios ~]# chkconfig --add nagios
[root@nagios ~]# chkconfig nagios on

6修改selinux
[root@nagios nagios-3.2.0]# cat /etc/sysconfig/selinux
# This file controls the state of SELinux on the system.
# SELINUX= disable:


二  安装nagios的插件 nagios-plugin

[root@nagios ~]# tar xvf nagios-plugins-1.4.14.tar.gz
[root@nagios ~]# cd nagios-plugins-1.4.14
[root@nagios nagios-plugins-1.4.14]# ./configure --prefix=/usr/local/nagios/ --with-nagios-user=nagios --with-nagios-group=nagios
[root@nagios nagios-plugins-1.4.14]# make && make install

检查主机是佛存在
[root@nagios ~]# cd /usr/local/nagios/etc/
[root@nagios etc]# ls -l
总计 76
-rw-rw-r-- 1 nagios nagios 11408 05-18 16:46 cgi.cfg
-rw-r--r-- 1 root   root      26 05-18 19:16 htpasswd.users
-rw-rw-r-- 1 nagios nagios 44020 05-18 18:53 nagios.cfg
-rw-r--r-- 1 nagios nagios  7207 05-18 19:33 nrpe.cfg
drwxrwxr-x 2 nagios nagios  4096 05-18 20:06 objects
-rw-rw---- 1 nagios nagios  1340 05-18 16:46 resource.cfg
[root@nagios etc]#

2主配置文件nagios。cfg配置
[root@nagios etc]# vim nagios.cfg
cfg_file=/usr/local/nagios/etc/objects/commands.cfg
cfg_file=/usr/local/nagios/etc/objects/contacts.cfg
cfg_file=/usr/local/nagios/etc/objects/contactgroups.cfg
cfg_file=/usr/local/nagios/etc/objects/hosts.cfg
cfg_file=/usr/local/nagios/etc/objects/hostgroups.cfg
cfg_file=/usr/local/nagios/etc/objects/services.cfg
cfg_file=/usr/local/nagios/etc/objects/timeperiods.cfg
cfg_file=/usr/local/nagios/etc/objects/templates.cfg
# Definitions for monitoring the local (Linux) host
#cfg_file=/usr/local/nagios/etc/objects/localhost.cfg  //注释掉此行

3主机定义文件配置
define host{
        host_name Nagios-server
        alias Nagios server
        address 10.1.7.110
        check_command check-host-alive
        check_interval 5
        retry_interval 1
        max_check_attempts 5
        check_period 24x7
        process_perf_data 0
        retain_nonstatus_information 0
        contact_groups sagroup
        notification_interval 30
        notification_period 24x7
        notification_options d,u,r
}


define host{
        host_name client-server
        alias client server
        address 10.1.7.120
        check_command check-host-alive
        check_interval 5
        retry_interval 1
        max_check_attempts 5
        check_period 24x7
        process_perf_data 0
        retain_nonstatus_information 0
        contact_groups sagroup
        notification_interval 30
        notification_period 24x7
        notification_options d,u,r
}

3主机组定义文件配置
[root@nagios etc]# vim objects/hostgroups.cfg
define hostgroup {
        hostgroup_name Sysem-Admin
        alias system Admin
        members Nagios-server,client-server,windows-server
}
~
4服务定义文件配置
[root@nagios etc]# vim objects/services.cfg

define service{
        host_name Nagios-server
        service_description check-host-alive
        check_period 24x7
        max_check_attempts 4
        normal_check_interval 3
        retry_check_interval 2
        contact_groups sagroup
        notification_interval 10
        notification_period 24x7
        notification_options w,c,u,r
        check_command check-host-alive
}

define service{
        host_name client-server
        service_description check-host-alive
        check_period 24x7
        max_check_attempts 4
        normal_check_interval 3
        retry_check_interval 2
        contact_groups sagroup
        notification_interval 10
        notification_period 24x7
        notification_options w,c,u,r
        check_command check-host-alive
}

5联系人定义文件配置

 


[root@nagios etc]# vim objects/contacts.cfg

define contact{
        contact_name                    nagiosadmin             ; Short name of user
        use                             generic-contact         ; Inherit default values from generic-contact template (defined above)
        alias                           Nagios Admin            ; Full name of user
        service_notification_period 24x7
        host_notification_period 24x7
        service_notification_options w,u,c,r

        host_notification_options d,u,r
        service_notification_commands notify-service-by-email
        host_notification_commands notify-host-by-email
        email                           [email protected]

6联系组定义文件配置
[root@nagios etc]# vim objects/contactgroups.cfg

define contactgroup {
       contactgroup_name sagroup
       alias system administrator group
       members nagiosadmin
}
7修改目录所有者

~
[root@nagios etc]# chown -R nagios.nagios objects/

8检查配置文件是否正却

[root@nagios etc]# /usr/local/nagios/bin/nagios -v /usr/local/nagios/etc/nagios.cfg
Total Warnings: 0
Total Errors:   0

9启动nagios服务
[root@nagios etc]# etc/init.d/httpd restart
[root@nagios etc]# /etc/init.d/nagios start

10 测试功能
http://10.1.7.110/nagios/ 输入 nagiosadmin 密码 accp

 

三 使用nagios监控linux客户端

1  nagios监控服务器的配置

[root@nagios ~]# tar zxvf nrpe-2.12.tar.gz
[root@nagios ~]# cd nrpe-2.12
[root@nagios nrpe-2.12]# ./configure && make all
[root@nagios nrpe-2.12]# make install-plugin
[root@nagios nrpe-2.12]# make install-daemon
[root@nagios nrpe-2.12]# make install-daemon-config
[root@nagios nrpe-2.12]# make install-xinetd

 


2 配置
[root@nagios nrpe-2.12]# vim /etc/xinetd.d/nrpe


        server          = /usr/local/nagios/bin/nrpe
        server_args     = -c /usr/local/nagios/etc/nrpe.cfg --inetd
        log_on_failure  += USERID
        disable         = no
        only_from       = 127.0.0.1,10.1.7.120,10.1.7.119

3 添加端口

[root@nagios nrpe-2.12]# vim /etc/services

nrpe            5666/tcp                          #nrpe

4 重新启动 xinetd服务

[root@nagios nrpe-2.12]# /etc/init.d/xinetd restart
[root@nagios nrpe-2.12]# netstat -na | grep 5666

以上步骤要到客户机上做 1--4

5修改配置文件commands.cfg加入对nrpe的支持
[root@nagios ~]# vim /usr/local/nagios/etc/objects/commands.cfg

#nrpe set
define command {
        command_name check_nrpe
command_line /usr/local/nagios/libexec/check_nrpe -H $ HOSTADDRESS$ -c $ ARG1$
}

检查nrpe命令那些可用
[root@nagios ~]# cat /usr/local/nagios/etc/nrpe.cfg

command[check_users]=/usr/local/nagios/libexec/check_users -w 5 -c 10
command[check_load]=/usr/local/nagios/libexec/check_load -w 15,10,5 -c 30,25,20
command[check_hda1]=/usr/local/nagios/libexec/check_disk -w 20% -c 10% -p /dev/hda1
command[check_zombie_procs]=/usr/local/nagios/libexec/check_procs -w 5 -c 10 -s Z
command[check_total_procs]=/usr/local/nagios/libexec/check_procs -w 150 -c 200

7 使用命令监控客户端
[root@nagios ~]# vim /usr/local/nagios/etc/objects/services.cfg

define service{
        host_name Nagios-server
        service_description check-users
        check_period 24x7
        max_check_attempts 4
        normal_check_interval 3
        retry_check_interval 2
        contact_groups sagroup
        notification_interval 10
        notification_period 24x7
        notification_options w,c,u,r
        check_command check-nrpe!check_users
}

define service{
        host_name Nagios-server
        service_description check-load
        check_period 24x7
        max_check_attempts 4
        normal_check_interval 3
        retry_check_interval 2
        contact_groups sagroup
        notification_interval 10
        notification_period 24x7
        notification_options w,c,u,r
        check_command check-nrpe!check_load
}

define service{
        host_name Nagios-server
        service_description check-total-procs
        check_period 24x7
        max_check_attempts 4
        normal_check_interval 3
        retry_check_interval 2
        contact_groups sagroup
        notification_interval 10
        notification_period 24x7
        notification_options w,c,u,r
        check_command check-total_procs
}


你可能感兴趣的:(linux,服务器,客户端,监控,账号)