您的位置:首页 > 运维架构

监控资料收集整理

2017-12-02 20:02 330 查看
细说Redis监控和告警(待完善)

Redis性能问题排查解决手册(七)

美团在Redis上踩过的一些坑-目录

Redis监控和预警

Redis的info命令详解

互联网企业级监控系统实践

Open-falcon Agent模块rpc通信过程

IT运维监控解决方案介绍

Open-Falcon 监控系统监控 MySQL/Redis/MongoDB 状态监控

ganglia-原理介绍(一)

基于OpenStack云资源监控系统设计与实现

Opentsdb简介(一)

时间序列数据的存储和计算 - 开源时序数据库解析

OpenTsdb 核心设计

OpenTSDB设计解读

时序数据库InfluxDB使用详解

InfluxDB和MySQL的读写对比测试

InfluxDB引擎浅析

使用graphite来监控业务系统

Python性能监控Graphite

#!/usr/bin/python
#-*- coding:utf-8 -*-

import json
import time
import socket
import os
import re
import sys
import commands
import urllib2, base64

class RedisStats:
# 如果你是自己编译部署到redis,请将下面的值替换为你到redis-cli路径
_redis_cli = '/usr/local/redis/bin/redis-cli'
_stat_regex = re.compile(ur'(\w+):([0-9]+\.?[0-9]*)\r')

def __init__(self,  port='6379', passwd=None, host='127.0.0.1'):
self._cmd = '%s -h %s -p %s info' % (self._redis_cli, host, port)
if passwd not in ['', None]:
self._cmd = '%s -h %s -p %s -a %s info' % (self._redis_cli, host, port, passwd)

def stats(self):
' Return a dict containing redis stats '
info = commands.getoutput(self._cmd)
print 'begin info***************'
print info
print 'end info***************'
print '       '
return dict(self._stat_regex.findall(info))

def main():
ip = socket.gethostname()
timestamp = int(time.time())
step = 60
# inst_list中保存了redis配置文件列表,程序将从这些配置中读取port和password,建议使用动态发现的方法获得,如:
# inst_list = [ i for i in commands.getoutput("find  /etc/ -name 'redis*.conf'" ).split('\n') ]
#insts_list = [ '/etc/redis/redis.conf' ]
insts_list = [ '/usr/local/redis/etc/redis.conf' ]
p = []

monit_keys = [
('connected_clients','GAUGE'),
('blocked_clients','GAUGE'),
('used_memory','GAUGE'),
('used_memory_rss','GAUGE'),
('mem_fragmentation_ratio','GAUGE'),
('total_commands_processed','COUNTER'),
('rejected_connections','COUNTER'),
('expired_keys','COUNTER'),
('evicted_keys','COUNTER'),
('keyspace_hits','COUNTER'),
('keyspace_misses','COUNTER'),
('keyspace_hit_ratio','GAUGE'),
]

for inst in insts_list:
port = commands.getoutput("sed -n 's/^port *\([0-9]\{4,5\}\)/\\1/p' %s" % inst)
passwd = commands.getoutput("sed -n 's/^requirepass *\([^ ]*\)/\\1/p' %s" % inst)
metric = "redis"
endpoint = ip
tags = 'port=%s' % port

try:
conn = RedisStats(port, passwd)
stats = conn.stats()
print 'begin stats'
print stats
print 'end stats'
except Exception,e:
continue

for key,vtype in monit_keys:
print key,vtype
#一些老版本的redis中info输出的信息很少,如果缺少一些我们需要采集的key就跳过
if key not in stats.keys():
continue
#计算命中率
if key == 'keyspace_hit_ratio':
try:
value = float(stats['keyspace_hits'])/(int(stats['keyspace_hits']) + int(stats['keyspace_misses']))
except ZeroDivisionError:
value = 0
#碎片率是浮点数
elif key == 'mem_fragmentation_ratio':
value = float(stats[key])
else:
#其他的都采集成counter,int
try:
value = int(stats[key])
except:
continue

i = {
'Metric': '%s.%s' % (metric, key),
'Endpoint': endpoint,
'Timestamp': timestamp,
'Step': step,
'Value': value,
'CounterType': vtype,
'TAGS': tags
}
p.append(i)

print json.dumps(p, sort_keys=True,indent=4)
method = "POST"
handler = urllib2.HTTPHandler()
opener = urllib2.build_opener(handler)
url = 'http://127.0.0.1:1988/v1/push'
request = urllib2.Request(url, data=json.dumps(p) )
request.add_header("Content-Type",'application/json')
request.get_method = lambda: method
try:
connection = opener.open(request)
except urllib2.HTTPError,e:
connection = e

# check. Substitute with appropriate HTTP code.
if connection.code == 200:
print connection.read()
else:
print '{"err":1,"msg":"%s"}' % connection
if __name__ == '__main__':
proc = commands.getoutput(' ps -ef|grep %s|grep -v grep|wc -l ' % os.path.basename(sys.argv[0]))
sys.stdout.flush()
if int(proc) < 5:
main()
内容来自用户分享和网络整理,不保证内容的准确性,如有侵权内容,可联系管理员处理 点击这里给我发消息
标签: