完善中央与边缘部署、远程写入与监控文档
- 增加中央与边缘完整配置和部署脚本
- 引入 VictoriaMetrics 数据源与 remote_write 故障排查说明
- 新增 edge-agent 配置脚本、ONVIF 自建 exporter 与 ping 监控示例

Co-authored-by: Cursor <cursoragent@cursor.com>
This commit is contained in:
49
central-server/alert_rules.yml
Normal file
49
central-server/alert_rules.yml
Normal file
@@ -0,0 +1,49 @@
|
||||
---
# Prometheus alerting rules.
# Two rule groups are defined:
#   - onvif_alerts:   availability, temperature and storage of ONVIF devices
#   - network_alerts: reachability and latency of ping-probed network devices
groups:
  - name: onvif_alerts
    rules:
      # Fires when a target in the "onvif-devices" job has reported up == 0
      # (scrape failed) continuously for 1 minute.
      - alert: ONVIFDeviceDown
        expr: up{job="onvif-devices"} == 0
        for: 1m
        labels:
          severity: critical
        annotations:
          summary: "ONVIF设备离线"
          description: "ONVIF设备 {{ $labels.instance }} 已离线超过1分钟"

      # Fires when the reported device temperature stays above 70 for
      # 2 minutes. The annotation renders the value as degrees Celsius.
      - alert: ONVIFDeviceHighTemperature
        expr: onvif_device_temperature > 70
        for: 2m
        labels:
          severity: warning
        annotations:
          summary: "ONVIF设备温度过高"
          description: "设备 {{ $labels.instance }} 温度达到 {{ $value }}°C"

      # Fires when storage usage stays above 90 percent for 5 minutes,
      # i.e. the device is running out of free space.
      - alert: ONVIFDeviceLowStorage
        expr: onvif_storage_usage_percent > 90
        for: 5m
        labels:
          severity: warning
        annotations:
          summary: "ONVIF设备存储空间不足"
          description: "设备 {{ $labels.instance }} 存储使用率达到 {{ $value }}%"

  - name: network_alerts
    rules:
      # Fires when the ping probe of a target has failed for 2 minutes.
      - alert: NetworkDeviceDown
        expr: probe_success{job="network-ping"} == 0
        for: 2m
        labels:
          severity: critical
        annotations:
          summary: "网络设备离线"
          description: "网络设备 {{ $labels.instance }} 无法ping通"

      # Fires when a probe takes longer than 1 second for 5 minutes.
      # The probe_success == 1 guard restricts this to reachable targets:
      # a failed probe still reports a duration (up to the probe timeout),
      # which would otherwise raise a bogus latency alert on top of
      # NetworkDeviceDown.
      # NOTE(review): assumes these metrics come from blackbox_exporter;
      # confirm against the "network-ping" scrape job.
      - alert: HighNetworkLatency
        expr: >-
          probe_duration_seconds{job="network-ping"} > 1
          and
          probe_success{job="network-ping"} == 1
        for: 5m
        labels:
          severity: warning
        annotations:
          summary: "网络延迟过高"
          description: "设备 {{ $labels.instance }} 延迟达到 {{ $value }}秒"
|
||||
Reference in New Issue
Block a user