博客
关于我
强烈建议你试试无所不能的chatGPT,快点击我
nagios 监控 nginx
阅读量:6450 次
发布时间:2019-06-23

本文共 7630 字,大约阅读时间需要 25 分钟。

   1.在被控端执行操作:把check_nginx插件放进/usr/local/nagios/libexec,并且授权属主和属组为nagios(这点非常关键)

[root@Jiechao libexec]# ll check_nginx 
-rwxr-xr-x 1 nagios nagios 7636 Oct 23 22:48 check_nginx

2.vi /usr/local/nagios/etc/nrpe.cfg

添加这行:command[check_nginx]=/usr/local/nagios/libexec/check_nginx -w 15000 -c 20000

3.重启Nrpe:

killall -9 nrpe
/usr/local/nagios/bin/nrpe -c /usr/local/nagios/etc/nrpe.cfg -d

4.被控端执行操作测试:

[root@Jiechao libexec]# ./check_nginx -H 192.168.0.100 -P 80 -p /var/run/ -n nginx.pid -s nginx_status -o /tmp/ -w 15000 -c 20000
OK - nginx is running. 1 requests per second, 1 connections per second (1.00 requests per connection) | 'reqpsec'=1 'conpsec'=1 'conpreq'=1.00 ]
--------------------------------------------------------------------------------------------------------------------------------------------------
下面在Nagios Server端操作:
1.vi /usr/local/nagios/etc/objects/service.cfg
添加:
define service{
use generic-service
host_name Nagios-server,Nagios-client
service_description check_nginx
check_command check_nrpe!check_nginx
max_check_attempts 3
normal_check_interval 3
retry_check_interval 3
check_period 24x7
notification_interval 5
notification_period 24x7
notification_options w,u,c,r
contact_groups admins
process_perf_data 1
action_url /nagios/pnp/index.php?host=$HOSTNAME$&srv=$SERVICEDESC$
}
添加完,保存退出,重启Nagios即可。
/etc/init.d/nagios relaod
/etc/init.d/nagios restart

2.测试:/usr/local/nagios/libexec/check_nrpe -H 192.168.0.100 -c check_nginx

OK - nginx is running. 1 requests per second, 1 connections per second (1.00 requests per connection) | 'reqpsec'=1 'conpsec'=1 'conpreq'=1.00 ]

#---------------------192.168.0.100是我被控端的ip地址------------------------------------------------------

下面是一些注意的地方--
1、关于nginx.pid
     --在nginx.conf一定要加上,如:pid    /opt/nginx.pid
2、如果出现以下提示.
    --UNKNOWN - Local copy/copies of nginx_status is empty.
    --可能就是在你的nginx.conf没有配置状态监控,如
    server
  {
    listen  80;
    server_name  IP | 域名;
    location /nginx_status {
    stub_status on;
    access_log   off;
    }
  }
   
3.需要更改check_nginx 一个地方:
把hostname="localhost"改为:你需要监控的主机ip。
如:hostname="192.168.0.100"

 

check_nginx 脚本

 

 #!/bin/sh

PROGNAME=`basename $0`

VERSION="Version 1.0,"
AUTHOR="2009, Mike Adolphs ()"

ST_OK=0

ST_WR=1
ST_CR=2
ST_UK=3
hostname="192.168.0.100"
port=80
path_pid=/var/run
name_pid="nginx.pid"
status_page="nginx_status"
output_dir=/tmp
pid_check=1
secure=0

print_version() {

    echo "$VERSION $AUTHOR"
}

print_help() {

    print_version $PROGNAME $VERSION
    echo ""
    echo "$PROGNAME is a Nagios plugin to check whether nginx is running."
    echo "It also parses the nginx's status page to get requests and"
    echo "connections per second as well as requests per connection. You"
    echo "may have to alter your nginx configuration so that the plugin"
    echo "can access the server's status page."
    echo "The plugin is highly configurable for this reason. See below for"
    echo "available options."
    echo ""
    echo "$PROGNAME -H localhost -P 80 -p /var/run -n nginx.pid "
 echo "  -s nginx_statut -o /tmp [-w INT] [-c INT] [-S] [-N]"
    echo ""
    echo "Options:"
    echo "  -H/--hostname)"
    echo "     Defines the hostname. Default is: localhost"
    echo "  -P/--port)"
    echo "     Defines the port. Default is: 80"
    echo "  -p/--path-pid)"
    echo "     Path where nginx's pid file is being stored. You might need"
    echo "     to alter this path according to your distribution. Default"
    echo "     is: /var/run"
    echo "  -n/--name_pid)"
    echo "     Name of the pid file. Default is: nginx.pid"
    echo "  -N/--no-pid-check)"
    echo "     Turn this on, if you don't want to check for a pid file"
    echo "     whether nginx is running, e.g. when you're checking a"
    echo "     remote server. Default is: off"
    echo "  -s/--status-page)"
    echo "     Name of the server's status page defined in the location"
    echo "     directive of your nginx configuration. Default is:"
    echo "     nginx_status"
    echo "  -o/--output-directory)"
    echo "     Specifies where to write the tmp-file that the check creates."
    echo "     Default is: /tmp"
    echo "  -S/--secure)"
    echo "     In case your server is only reachable via SSL, use this"
    echo "     this switch to use HTTPS instead of HTTP. Default is: off"
    echo "  -w/--warning)"
    echo "     Sets a warning level for requests per second. Default is: off"
    echo "  -c/--critical)"
    echo "     Sets a critical level for requests per second. Default is:"
 echo "     off"
    exit $ST_UK
}

while test -n "$1"; do

    case "$1" in
        -help|-h)
            print_help
            exit $ST_UK
            ;;
        --version|-v)
            print_version $PROGNAME $VERSION
            exit $ST_UK
            ;;
        --hostname|-H)
            hostname=$2
            shift
            ;;
        --port|-P)
            port=$2
            shift
            ;;
        --path-pid|-p)
            path_pid=$2
            shift
            ;;
        --name-pid|-n)
            name_pid=$2
            shift
            ;;
        --no-pid-check|-N)
            pid_check=0
            ;;
        --status-page|-s)
            status_page=$2
            shift
            ;;
        --output-directory|-o)
            output_dir=$2
            shift
            ;;
        --secure|-S)
            secure=1
            ;;
        --warning|-w)
            warning=$2
            shift
            ;;
        --critical|-c)
            critical=$2
            shift
            ;;
        *)
            echo "Unknown argument: $1"
            print_help
            exit $ST_UK
            ;;
        esac
    shift
done

get_wcdiff() {

    if [ ! -z "$warning" -a ! -z "$critical" ]
    then
        wclvls=1

        if [ ${warning} -gt ${critical} ]

        then
            wcdiff=1
        fi
    elif [ ! -z "$warning" -a -z "$critical" ]
    then
        wcdiff=2
    elif [ -z "$warning" -a ! -z "$critical" ]
    then
        wcdiff=3
    fi
}

val_wcdiff() {

    if [ "$wcdiff" = 1 ]
    then
        echo "Please adjust your warning/critical thresholds. The warning \
must be lower than the critical level!"
        exit $ST_UK
    elif [ "$wcdiff" = 2 ]
    then
        echo "Please also set a critical value when you want to use \
warning/critical thresholds!"
        exit $ST_UK
    elif [ "$wcdiff" = 3 ]
    then
        echo "Please also set a warning value when you want to use \
warning/critical thresholds!"
        exit $ST_UK
    fi
}

check_pid() {

    if [ -f "$path_pid/$name_pid" ]
    then
        retval=0
    else
        retval=1
    fi
}

get_status() {

    if [ "$secure" = 1 ]
    then
        wget --no-check-certificate -q -t 3 -T 3 \
} -O ${output_dir}/nginx-status.1
        sleep 1
        wget --no-check-certificate -q -t 3 -T 3 \
} -O ${output_dir}/nginx-status.2
    else        
        wget -q -t 3 -T 3 } \
-O ${output_dir}/nginx-status.1
        sleep 1
        wget -q -t 3 -T 3 } \
-O ${output_dir}/nginx-status.2
    fi

    stat_output1=`stat -c %s ${output_dir}/nginx-status.1`

    stat_output2=`stat -c %s ${output_dir}/nginx-status.2`
    if [ "$stat_output1" = 0 -o "$stat_output2" = 0 ]
    then
        echo "UNKNOWN - Local copy/copies of $status_page is empty."
    exit $ST_UK
    fi
}

get_vals() {

    tmp1_reqpsec=`grep '^ ' ${output_dir}/nginx-status.1|awk '{print $3}'`
    tmp2_reqpsec=`grep '^ ' ${output_dir}/nginx-status.2|awk '{print $3}'`
    reqpsec=`expr $tmp2_reqpsec - $tmp1_reqpsec`

    tmp1_conpsec=`grep '^ ' ${output_dir}/nginx-status.1|awk '{print $2}'`

    tmp2_conpsec=`grep '^ ' ${output_dir}/nginx-status.2|awk '{print $2}'`
    conpsec=`expr $tmp2_conpsec - $tmp1_conpsec`

    reqpcon=`echo "scale=2; $reqpsec / $conpsec" | bc -l`

    if [ "$reqpcon" = ".99" ]
    then
        reqpcon="1.00"
    fi
}

do_output() {

    output="nginx is running. $reqpsec requests per second, $conpsec \
connections per second ($reqpcon requests per connection)"
}

do_perfdata() {

    perfdata="'reqpsec'=$reqpsec 'conpsec'=$conpsec 'conpreq'=$reqpcon"
}

# Here we go!

get_wcdiff
val_wcdiff

if [ ${pid_check} = 1 ]

then
    check_pid
    if [ "$retval" = 1 ]
    then
        echo "There's no pid file for nginx. Is nginx running? Please \
also make sure whether your pid path and name is correct."
        exit $ST_CR
    fi
fi

get_status

get_vals
do_output
do_perfdata

if [ -n "$warning" -a -n "$critical" ]

then
    if [ "$reqpsec" -ge "$warning" -a "$reqpsec" -lt "$critical" ]
    then
        echo "WARNING - ${output} | ${perfdata}"
 exit $ST_WR
    elif [ "$reqpsec" -ge "$critical" ]
    then
        echo "CRITICAL - ${output} | ${perfdata}"
 exit $ST_CR
    else
        echo "OK - ${output} | ${perfdata} ]"
 exit $ST_OK
    fi
else
    echo "OK - ${output} | ${perfdata}"
    exit $ST_OK
fi

原文链接:http://blog.163.com/ly_89/blog/static/186902299201222111738667/

      本文转自独弹古调  51CTO博客,原文链接:http://blog.51cto.com/hunkz/1657526,如需转载请自行联系原作者

你可能感兴趣的文章
python locals globals
查看>>
JEECG快速开发框架学习
查看>>
组合数据类型
查看>>
Hibernate在线考试系统 03
查看>>
redis底层数据结构
查看>>
Java集合四大家族的故事(四)——Map家族的LinkedHashMap
查看>>
android获取APK签名信息及MD5指纹
查看>>
Linux常用命令
查看>>
数据库高速缓冲区(database buffer cahce)
查看>>
Shell脚本首枚
查看>>
JDK BitSet实现原理
查看>>
Hbase Replication 介绍
查看>>
Nginx配置服务器静态文件支持跨域访问
查看>>
iOS 获取本地视频的缩略图
查看>>
Ubuntu 安装QQ
查看>>
【Android学习笔记】二、创建项目 安装卸载apk
查看>>
show virtual keyboard
查看>>
【转载】Linux升级安装GCC
查看>>
TCPDUMP命令详解
查看>>
value-ref, key-ref, ref local, ref bean
查看>>