|
|
@@ -0,0 +1,247 @@
|
|
|
+# 此监控类型所属类别:service-应用服务监控 db-数据库监控 custom-自定义监控 os-操作系统监控
|
|
|
+category: os
|
|
|
+# 监控应用类型(与文件名保持一致) eg: linux windows tomcat mysql aws...
|
|
|
+app: centos
|
|
|
+name:
|
|
|
+ zh-CN: Centos Linux
|
|
|
+ en-US: Centos Linux
|
|
|
+# 参数映射map. type是参数类型: 0-number数字, 1-string明文字符串, 2-secret加密字符串
|
|
|
+# 强制固定必须参数 - host
|
|
|
+configmap:
|
|
|
+ - key: host
|
|
|
+ type: 1
|
|
|
+ - key: port
|
|
|
+ type: 0
|
|
|
+ - key: username
|
|
|
+ type: 1
|
|
|
+ - key: password
|
|
|
+ type: 2
|
|
|
+ - key: timeout
|
|
|
+ type: 0
|
|
|
+# 指标组列表
|
|
|
+metrics:
|
|
|
+# 第一个监控指标组 basic
|
|
|
+# 注意:内置监控指标有 (responseTime - 响应时间)
|
|
|
+ - name: basic
|
|
|
+ # 指标组调度优先级(0-127)越小优先级越高,优先级低的指标组会等优先级高的指标组采集完成后才会被调度,相同优先级的指标组会并行调度采集
|
|
|
+ # 优先级为0的指标组为可用性指标组,即它会被首先调度,采集成功才会继续调度其它指标组,采集失败则中断调度
|
|
|
+ priority: 0
|
|
|
+ # 指标组中的具体监控指标
|
|
|
+ fields:
|
|
|
+ # 指标信息 包括 field名称 type字段类型:0-number数字,1-string字符串 instance是否为实例主键 unit:指标单位
|
|
|
+ - field: hostname
|
|
|
+ type: 1
|
|
|
+ instance: true
|
|
|
+ - field: version
|
|
|
+ type: 1
|
|
|
+ - field: uptime
|
|
|
+ type: 1
|
|
|
+# 监控采集使用协议 eg: sql, ssh, http, telnet, wmi, snmp, sdk
|
|
|
+ protocol: ssh
|
|
|
+# 当protocol为http协议时具体的采集配置
|
|
|
+ ssh:
|
|
|
+ # 主机host: ipv4 ipv6 域名
|
|
|
+ host: ^_^host^_^
|
|
|
+ # 端口
|
|
|
+ port: ^_^port^_^
|
|
|
+ username: ^_^username^_^
|
|
|
+ password: ^_^password^_^
|
|
|
+ timeout: ^_^timeout^_^
|
|
|
+ script: (uname -r ; hostname ; uptime | awk -F "," '{print $1}' | sed "s/ //g") | sed ":a;N;s/\n/^/g;ta" | awk -F '^' 'BEGIN{print "version hostname uptime"} {print $1, $2, $3}'
|
|
|
+ # 响应数据解析方式:oneRow, multiRow
|
|
|
+ parseType: multiRow
|
|
|
+
|
|
|
+ - name: cpu
|
|
|
+ priority: 1
|
|
|
+ fields:
|
|
|
+ # 指标信息 包括 field名称 type字段类型:0-number数字,1-string字符串 instance是否为实例主键 unit:指标单位
|
|
|
+ - field: info
|
|
|
+ type: 1
|
|
|
+ - field: cores
|
|
|
+ type: 0
|
|
|
+ unit: 核数
|
|
|
+ - field: interrupt
|
|
|
+ type: 0
|
|
|
+ unit: 个数
|
|
|
+ - field: load
|
|
|
+ type: 1
|
|
|
+ - field: context_switch
|
|
|
+ type: 0
|
|
|
+ unit: 个数
|
|
|
+ - field: usage
|
|
|
+ type: 0
|
|
|
+ unit: '%'
|
|
|
+ # (非必须)监控指标别名,与上面的指标名映射。用于采集接口数据字段不直接是最终指标名称,需要此别名做映射转换
|
|
|
+ aliasFields:
|
|
|
+ - info
|
|
|
+ - cores
|
|
|
+ - interrupt
|
|
|
+ - load
|
|
|
+ - context_switch
|
|
|
+ - idle
|
|
|
+ # (非必须)指标计算表达式,与上面的别名一起作用,计算出最终需要的指标值
|
|
|
+ # eg: cores=core1+core2, usage=usage, waitTime=allTime-runningTime
|
|
|
+ calculates:
|
|
|
+ - info=info
|
|
|
+ - cores=cores
|
|
|
+ - interrupt=interrupt
|
|
|
+ - load=load
|
|
|
+ - context_switch=context_switch
|
|
|
+ - usage=100-idle
|
|
|
+ # 监控采集使用协议 eg: sql, ssh, http, telnet, wmi, snmp, sdk
|
|
|
+ protocol: ssh
|
|
|
+ # 当protocol为http协议时具体的采集配置
|
|
|
+ ssh:
|
|
|
+ # 主机host: ipv4 ipv6 域名
|
|
|
+ host: ^_^host^_^
|
|
|
+ # 端口
|
|
|
+ port: ^_^port^_^
|
|
|
+ username: ^_^username^_^
|
|
|
+ password: ^_^password^_^
|
|
|
+ timeout: ^_^timeout^_^
|
|
|
+ script: "LANG=C lscpu | awk -F: '/Model name/ {print $2}';awk '/processor/{core++} END{print core}' /proc/cpuinfo;uptime | sed 's/,/ /g' | awk '{for(i=NF-2;i<=NF;i++)print $i }' | xargs;vmstat 1 1 | awk 'NR==3{print $11}';vmstat 1 1 | awk 'NR==3{print $12}';vmstat 1 1 | awk 'NR==3{print $15}'"
|
|
|
+ parseType: oneRow
|
|
|
+
|
|
|
+ - name: memory
|
|
|
+ priority: 2
|
|
|
+ fields:
|
|
|
+ # 指标信息 包括 field名称 type字段类型:0-number数字,1-string字符串 instance是否为实例主键 unit:指标单位
|
|
|
+ - field: total
|
|
|
+ type: 0
|
|
|
+ unit: Mb
|
|
|
+ - field: used
|
|
|
+ type: 0
|
|
|
+ unit: Mb
|
|
|
+ - field: free
|
|
|
+ type: 0
|
|
|
+ unit: Mb
|
|
|
+ - field: buff_cache
|
|
|
+ type: 0
|
|
|
+ unit: Mb
|
|
|
+ - field: available
|
|
|
+ type: 0
|
|
|
+ unit: Mb
|
|
|
+ - field: usage
|
|
|
+ type: 0
|
|
|
+ unit: '%'
|
|
|
+ # (非必须)监控指标别名,与上面的指标名映射。用于采集接口数据字段不直接是最终指标名称,需要此别名做映射转换
|
|
|
+ aliasFields:
|
|
|
+ - total
|
|
|
+ - used
|
|
|
+ - free
|
|
|
+ - buff_cache
|
|
|
+ - available
|
|
|
+ # (非必须)指标计算表达式,与上面的别名一起作用,计算出最终需要的指标值
|
|
|
+ # eg: cores=core1+core2, usage=usage, waitTime=allTime-runningTime
|
|
|
+ calculates:
|
|
|
+ - total=total
|
|
|
+ - used=used
|
|
|
+ - free=free
|
|
|
+ - buff_cache=buff_cache
|
|
|
+ - available=available
|
|
|
+ - usage=(used / total) * 100
|
|
|
+ # 监控采集使用协议 eg: sql, ssh, http, telnet, wmi, snmp, sdk
|
|
|
+ protocol: ssh
|
|
|
+ # 当protocol为http协议时具体的采集配置
|
|
|
+ ssh:
|
|
|
+ # 主机host: ipv4 ipv6 域名
|
|
|
+ host: ^_^host^_^
|
|
|
+ # 端口
|
|
|
+ port: ^_^port^_^
|
|
|
+ username: ^_^username^_^
|
|
|
+ password: ^_^password^_^
|
|
|
+ timeout: ^_^timeout^_^
|
|
|
+ script: free -m | grep Mem | awk 'BEGIN{print "total used free buff_cache available"} {print $2,$3,$4,$6,$7}'
|
|
|
+ parseType: multiRow
|
|
|
+
|
|
|
+ - name: disk
|
|
|
+ priority: 3
|
|
|
+ fields:
|
|
|
+ # 指标信息 包括 field名称 type字段类型:0-number数字,1-string字符串 instance是否为实例主键 unit:指标单位
|
|
|
+ - field: disk_num
|
|
|
+ type: 0
|
|
|
+ unit: 块数
|
|
|
+ - field: partition_num
|
|
|
+ type: 0
|
|
|
+ unit: 分区数
|
|
|
+ - field: block_write
|
|
|
+ type: 0
|
|
|
+ unit: 块数
|
|
|
+ - field: block_read
|
|
|
+ type: 0
|
|
|
+ unit: 块数
|
|
|
+ - field: write_rate
|
|
|
+ type: 0
|
|
|
+ unit: iops
|
|
|
+ # 监控采集使用协议 eg: sql, ssh, http, telnet, wmi, snmp, sdk
|
|
|
+ protocol: ssh
|
|
|
+ # 当protocol为http协议时具体的采集配置
|
|
|
+ ssh:
|
|
|
+ # 主机host: ipv4 ipv6 域名
|
|
|
+ host: ^_^host^_^
|
|
|
+ # 端口
|
|
|
+ port: ^_^port^_^
|
|
|
+ username: ^_^username^_^
|
|
|
+ password: ^_^password^_^
|
|
|
+ timeout: ^_^timeout^_^
|
|
|
+ script: vmstat -D | awk 'NR==1{print $1}';vmstat -D | awk 'NR==2{print $1}';vmstat 1 1 | awk 'NR==3{print $10}';vmstat 1 1 | awk 'NR==3{print $9}';vmstat 1 1 | awk 'NR==3{print $16}'
|
|
|
+ parseType: oneRow
|
|
|
+
|
|
|
+ - name: interface
|
|
|
+ priority: 4
|
|
|
+ fields:
|
|
|
+ # 指标信息 包括 field名称 type字段类型:0-number数字,1-string字符串 instance是否为实例主键 unit:指标单位
|
|
|
+ - field: interface_name
|
|
|
+ type: 1
|
|
|
+ instance: true
|
|
|
+ - field: receive_bytes
|
|
|
+ type: 0
|
|
|
+ unit: byte
|
|
|
+ - field: transmit_bytes
|
|
|
+ type: 0
|
|
|
+ unit: byte
|
|
|
+ # 监控采集使用协议 eg: sql, ssh, http, telnet, wmi, snmp, sdk
|
|
|
+ protocol: ssh
|
|
|
+ # 当protocol为http协议时具体的采集配置
|
|
|
+ ssh:
|
|
|
+ # 主机host: ipv4 ipv6 域名
|
|
|
+ host: ^_^host^_^
|
|
|
+ # 端口
|
|
|
+ port: ^_^port^_^
|
|
|
+ username: ^_^username^_^
|
|
|
+ password: ^_^password^_^
|
|
|
+ timeout: ^_^timeout^_^
|
|
|
+ script: cat /proc/net/dev | tail -n +3 | awk 'BEGIN{ print "interface_name receive_bytes transmit_bytes"} {print $1,$2,$10}'
|
|
|
+ parseType: multiRow
|
|
|
+
|
|
|
+ - name: disk_free
|
|
|
+ priority: 5
|
|
|
+ fields:
|
|
|
+ # 指标信息 包括 field名称 type字段类型:0-number数字,1-string字符串 instance是否为实例主键 unit:指标单位
|
|
|
+ - field: filesystem
|
|
|
+ type: 1
|
|
|
+ - field: used
|
|
|
+ type: 0
|
|
|
+ unit: Mb
|
|
|
+ - field: available
|
|
|
+ type: 0
|
|
|
+ unit: Mb
|
|
|
+ - field: usage
|
|
|
+ type: 0
|
|
|
+ unit: '%'
|
|
|
+ - field: mounted
|
|
|
+ type: 1
|
|
|
+ instance: true
|
|
|
+ # 监控采集使用协议 eg: sql, ssh, http, telnet, wmi, snmp, sdk
|
|
|
+ protocol: ssh
|
|
|
+ # 当protocol为http协议时具体的采集配置
|
|
|
+ ssh:
|
|
|
+ # 主机host: ipv4 ipv6 域名
|
|
|
+ host: ^_^host^_^
|
|
|
+ # 端口
|
|
|
+ port: ^_^port^_^
|
|
|
+ username: ^_^username^_^
|
|
|
+ password: ^_^password^_^
|
|
|
+ timeout: ^_^timeout^_^
|
|
|
+ script: df -m | tail -n +2 | awk 'BEGIN{ print "filesystem used available usage mounted"} {print $1,$3,$4,$5,$6}'
|
|
|
+ parseType: multiRow
|