一、ServerStatus 介绍

ServerStatus 是一个酷炫高逼格的云探针、云监控、服务器云监控、多服务器探针~。 ServerStatus开源地址:https://github.com/cppla/ServerStatus ### 特性 + 使用 Rust 完全重写 Server、Client,单个执行文件部署 + 支持上下线和简单自定义规则告警 (Telegram、 Wechat、 Email、 Webhook) + 支持 http 协议上报,可以方便部署到各免费容器服务和配合 cf 等优化上报链路 + 支持 vnstat 统计月流量,重启不丢流量数据 + 支持 Railway 快速部署 + 支持 Systemd 开机自启

ServerStatus一个酷炫的云监控神器 - 图1

二、检查宿主机系统版本

  1. cat /etc/os-release

三、检查本地 Docker 环境

检查 Docker 服务状态
  1. // 1) 低版本 Docker 安装
  2. yum install docker -y
  3. ----
  4. // < '推荐' >
  5. // 2) 高版本 Docker 安装
  6. curl -fsSL https://get.docker.com/ | sh
  7. ----
  8. // 关闭防火墙
  9. systemctl disable --now firewalld
  10. setenforce 0
  11. // 启用 Docker
  12. systemctl enable --now docker
检查 Docker 配置信息
  1. docker info
开启 IPv4 forwarding
  1. echo "net.ipv4.ip_forward=1" >> /etc/sysctl.conf
  2. systemctl restart network
  3. sysctl net.ipv4.ip_forward

四、安装 Docker-compose

下载 Docker-compose 二进制包
  1. curl -L https://github.com/docker/compose/releases/download/v2.2.2/docker-compose-linux-x86_64 -o /usr/local/bin/docker-compose
给文件增加执行权限
  1. chmod +x /usr/local/bin/docker-compose
检查 Docker-compose 版本
  1. docker-compose -v

五、下载 ServerStatus 镜像

  1. docker pull stilleshan/serverstatus

六、使用 Docker-cli 部署

  1. mkdir /docker/ServerStatus/server -p && cd /docker/ServerStatus/server
  1. ( 省略 )
  2. docker run -d --name=serverstatus --restart=always \
  3. -p 8888:80 \
  4. -p 35601:35601 \
  5. -v /docker/ServerStatus/server/config.json:/ServerStatus/server/config.json \
  6. stilleshan/serverstatus

七、下载 ServerStatus 安装文件

创建数据目录
  1. mkdir /docker/ServerStatus/server -p && cd /docker/ServerStatus/server
下载安装文件
  1. yum install git -y
  1. git clone https://github.com/stilleshan/ServerStatus.git
  1. [root@localhost ServerStatus]# ls
  2. config.json docker-compose.yml Dockerfile README.md screenshot.jpg status.sh web
查看 Docker-compose.yaml 文件
  1. [root@localhost ServerStatus]# vim docker-compose.yml
  2. version: "3"
  3. services:
  4. serverstatus:
  5. image: stilleshan/serverstatus
  6. container_name: serverstatus
  7. ports:
  8. - 8888:80
  9. - 35601:35601
  10. volumes:
  11. # - ./web:/usr/share/nginx/html
  12. - ./config.json:/ServerStatus/server/config.json
  13. environment:
  14. TZ: Asia/Shanghai
  15. restart: always
创建 ServerStatus 容器
  1. docker-compose up -d
查看 ServerStatus 容器状态
  1. docker ps

ServerStatus一个酷炫的云监控神器 - 图2

八、访问 ServerStatus 服务端

ServerStatus一个酷炫的云监控神器 - 图3

九、客户端安装

修改 status-client.py
  1. [root@node01 ~] vim status-client.py
  2. # -*- coding: utf-8 -*-
  3. SERVER = "192.168.80.8" # 填写服务器地址
  4. PORT = 35601
  5. USER = "admin" # 设置账号 ( 待会需要在服务端填写 )
  6. PASSWORD = "admin" # 设置密码 ( 待会需要在服务端填写 )
  7. INTERVAL = 1 # 更新间隔, 单位: 秒
  8. import socket
  9. import time
  10. import string
  11. import math
  12. import re
  13. import os
  14. import json
  15. import subprocess
  16. import collections
  17. import platform
  18. def get_uptime():
  19. f = open('/proc/uptime', 'r')
  20. uptime = f.readline()
  21. f.close()
  22. uptime = uptime.split('.', 2)
  23. time = int(uptime[0])
  24. return int(time)
  25. def get_memory():
  26. re_parser = re.compile(r'^(?P<key>\S*):\s*(?P<value>\d*)\s*kB')
  27. result = dict()
  28. for line in open('/proc/meminfo'):
  29. match = re_parser.match(line)
  30. if not match:
  31. continue;
  32. key, value = match.groups(['key', 'value'])
  33. result[key] = int(value)
  34. MemTotal = float(result['MemTotal'])
  35. MemFree = float(result['MemFree'])
  36. Cached = float(result['Cached'])
  37. MemUsed = MemTotal - (Cached + MemFree)
  38. SwapTotal = float(result['SwapTotal'])
  39. SwapFree = float(result['SwapFree'])
  40. return int(MemTotal), int(MemUsed), int(SwapTotal), int(SwapFree)
  41. def get_hdd():
  42. p = subprocess.check_output(['df', '-Tlm', '--total', '-t', 'ext4', '-t', 'ext3', '-t', 'ext2', '-t', 'reiserfs', '-t', 'jfs', '-t', 'ntfs', '-t', 'fat32', '-t', 'btrfs', '-t', 'fuseblk', '-t', 'zfs', '-t', 'simfs', '-t', 'xfs']).decode("Utf-8")
  43. total = p.splitlines()[-1]
  44. used = total.split()[3]
  45. size = total.split()[2]
  46. return int(size), int(used)
  47. def get_load():
  48. system = platform.linux_distribution()
  49. if system[0][:6] == "CentOS":
  50. if system[1][0] == "6":
  51. tmp_load = os.popen("netstat -anp |grep ESTABLISHED |grep tcp |grep '::ffff:' |awk '{print $5}' |awk -F ':' '{print $4}' |sort -u |grep -E -o '([0-9]{1,3}[\.]){3}[0-9]{1,3}' |wc -l").read()
  52. else:
  53. tmp_load = os.popen("netstat -anp |grep ESTABLISHED |grep tcp6 |awk '{print $5}' |awk -F ':' '{print $1}' |sort -u |grep -E -o '([0-9]{1,3}[\.]){3}[0-9]{1,3}' |wc -l").read()
  54. else:
  55. tmp_load = os.popen("netstat -anp |grep ESTABLISHED |grep tcp6 |awk '{print $5}' |awk -F ':' '{print $1}' |sort -u |grep -E -o '([0-9]{1,3}[\.]){3}[0-9]{1,3}' |wc -l").read()
  56. return float(tmp_load)
  57. #return os.getloadavg()[0]
  58. def get_time():
  59. stat_file = file("/proc/stat", "r")
  60. time_list = stat_file.readline().split(' ')[2:6]
  61. stat_file.close()
  62. for i in range(len(time_list)) :
  63. time_list[i] = int(time_list[i])
  64. return time_list
  65. def delta_time():
  66. x = get_time()
  67. time.sleep(INTERVAL)
  68. y = get_time()
  69. for i in range(len(x)):
  70. y[i]-=x[i]
  71. return y
  72. def get_cpu():
  73. t = delta_time()
  74. st = sum(t)
  75. if st == 0:
  76. st = 1
  77. result = 100-(t[len(t)-1]*100.00/st)
  78. return round(result)
  79. class Traffic:
  80. def __init__(self):
  81. self.rx = collections.deque(maxlen=10)
  82. self.tx = collections.deque(maxlen=10)
  83. def get(self):
  84. f = open('/proc/net/dev', 'r')
  85. net_dev = f.readlines()
  86. f.close()
  87. avgrx = 0; avgtx = 0
  88. for dev in net_dev[2:]:
  89. dev = dev.split(':')
  90. if dev[0].strip() == "lo" or dev[0].find("tun") > -1:
  91. continue
  92. dev = dev[1].split()
  93. avgrx += int(dev[0])
  94. avgtx += int(dev[8])
  95. self.rx.append(avgrx)
  96. self.tx.append(avgtx)
  97. avgrx = 0; avgtx = 0
  98. l = len(self.rx)
  99. for x in range(l - 1):
  100. avgrx += self.rx[x+1] - self.rx[x]
  101. avgtx += self.tx[x+1] - self.tx[x]
  102. avgrx = int(avgrx / l / INTERVAL)
  103. avgtx = int(avgtx / l / INTERVAL)
  104. return avgrx, avgtx
  105. def liuliang():
  106. NET_IN = 0
  107. NET_OUT = 0
  108. with open('/proc/net/dev') as f:
  109. for line in f.readlines():
  110. netinfo = re.findall('([^\s]+):[\s]{0,}(\d+)\s+(\d+)\s+(\d+)\s+(\d+)\s+(\d+)\s+(\d+)\s+(\d+)\s+(\d+)\s+(\d+)\s+(\d+)\s+(\d+)', line)
  111. if netinfo:
  112. if netinfo[0][0] == 'lo' or 'tun' in netinfo[0][0] or netinfo[0][1]=='0' or netinfo[0][9]=='0':
  113. continue
  114. else:
  115. NET_IN += int(netinfo[0][1])
  116. NET_OUT += int(netinfo[0][9])
  117. return NET_IN, NET_OUT
  118. def get_network(ip_version):
  119. if(ip_version == 4):
  120. HOST = "192.168.80.18" # 客户端地址
  121. elif(ip_version == 6):
  122. HOST = "ipv6.google.com"
  123. try:
  124. s = socket.create_connection((HOST, 80), 2)
  125. return True
  126. except:
  127. pass
  128. return False
  129. if __name__ == '__main__':
  130. socket.setdefaulttimeout(30)
  131. while 1:
  132. try:
  133. print("Connecting...")
  134. s = socket.socket(socket.AF_INET, socket.SOCK_STREAM)
  135. s.connect((SERVER, PORT))
  136. data = s.recv(1024)
  137. if data.find("Authentication required") > -1:
  138. s.send(USER + ':' + PASSWORD + '\n')
  139. data = s.recv(1024)
  140. if data.find("Authentication successful") < 0:
  141. print(data)
  142. raise socket.error
  143. else:
  144. print(data)
  145. raise socket.error
  146. print(data)
  147. data = s.recv(1024)
  148. print(data)
  149. timer = 0
  150. check_ip = 0
  151. if data.find("IPv4") > -1:
  152. check_ip = 6
  153. elif data.find("IPv6") > -1:
  154. check_ip = 4
  155. else:
  156. print(data)
  157. raise socket.error
  158. traffic = Traffic()
  159. traffic.get()
  160. while 1:
  161. CPU = get_cpu()
  162. NetRx, NetTx = traffic.get()
  163. NET_IN, NET_OUT = liuliang()
  164. Uptime = get_uptime()
  165. Load = get_load()
  166. MemoryTotal, MemoryUsed, SwapTotal, SwapFree = get_memory()
  167. HDDTotal, HDDUsed = get_hdd()
  168. array = {}
  169. if not timer:
  170. array['online' + str(check_ip)] = get_network(check_ip)
  171. timer = 10
  172. else:
  173. timer -= 1*INTERVAL
  174. array['uptime'] = Uptime
  175. array['load'] = Load
  176. array['memory_total'] = MemoryTotal
  177. array['memory_used'] = MemoryUsed
  178. array['swap_total'] = SwapTotal
  179. array['swap_used'] = SwapTotal - SwapFree
  180. array['hdd_total'] = HDDTotal
  181. array['hdd_used'] = HDDUsed
  182. array['cpu'] = CPU
  183. array['network_rx'] = NetRx
  184. array['network_tx'] = NetTx
  185. array['network_in'] = NET_IN
  186. array['network_out'] = NET_OUT
  187. s.send("update " + json.dumps(array) + "\n")
  188. except KeyboardInterrupt:
  189. raise
  190. except socket.error:
  191. print("Disconnected...")
  192. # keep on trying after a disconnect
  193. s.close()
  194. time.sleep(3)
  195. except Exception as e:
  196. print("Caught Exception:", e)
  197. s.close()
  198. time.sleep(3)
在客户端运行 status-client.py 脚本
  1. [root@node01 ~] python status-client.py &
  2. [1] 105194
服务端配置 修改 config.json 文件,必须配置项为 username/password/host
  1. [root@server ServerStatus] vim config.json
  2. {"servers":
  3. [
  4. {
  5. "username": "admin", # 客户端账号
  6. "password": "admin", # 客户端密码
  7. "name": "腾讯云-上海",
  8. "type": "KVM",
  9. "host": "192.168.80.18", # 填写客户端 IP 地址
  10. "location": "CN",
  11. "disabled": false
  12. },
  13. {
  14. "username": "2",
  15. "password": "xxx",
  16. "name": "阿里云-香港",
  17. "type": "KVM",
  18. "host": "None",
  19. "location": "HK",
  20. "disabled": false
  21. },
  22. {
  23. "username": "3",
  24. "password": "xxxx",
  25. "name": "谷歌云-日本",
  26. "type": "KVM",
  27. "host": "None",
  28. "location": "JP",
  29. "disabled": false
  30. }
  31. ]
  32. }
在 Web 监控页查看效果

ServerStatus一个酷炫的云监控神器 - 图4

大功告成~