mirror of
https://github.com/logos-messaging/logos-messaging-simulator.git
synced 2026-05-21 17:49:26 +00:00
Having first alert working
This commit is contained in:
parent
8551bffaf0
commit
722c58ab8b
@ -1,49 +1,11 @@
|
|||||||
---
|
|
||||||
groups:
|
groups:
|
||||||
- name: waku
|
- name: waku
|
||||||
rules:
|
rules:
|
||||||
- alert: HighNimWakuNodeTraffic
|
|
||||||
expr: >
|
|
||||||
abs(
|
|
||||||
netdata_net_net_kilobits_persec_average{
|
|
||||||
family!~"^(wg|veth|br|docker).*",
|
|
||||||
fleet=~"(shards|waku|status|wakuv2)\\..*"
|
|
||||||
}) > 40000
|
|
||||||
for: 5m
|
|
||||||
annotations:
|
|
||||||
summary: "Too high traffic for {{ $labels.instance }}"
|
|
||||||
description: "Host {{ $labels.instance }} running nim-waku has {{ $labels.dimension }} traffic higher 40Mbps"
|
|
||||||
|
|
||||||
- alert: HighNimWakuMemUsage
|
- alert: HighNimWakuMemUsage
|
||||||
expr: >
|
expr: >
|
||||||
nim_gc_mem_bytes{
|
nim_gc_mem_bytes{} > 1073741824
|
||||||
fleet=~"(shards|waku|status|wakuv2)\\..*"
|
|
||||||
} > 1073741824
|
|
||||||
for: 5m
|
for: 5m
|
||||||
annotations:
|
annotations:
|
||||||
summary: "Too high memory usage for {{ $labels.instance }}"
|
summary: "Too high memory usage for {{ $labels.instance }}"
|
||||||
description: "Host {{ $labels.instance }} running nim-waku has GC memory usage higher 1GB"
|
description: "Host {{ $labels.instance }} running nim-waku has GC memory usage higher 1GB"
|
||||||
current_value: "{{ $value }}"
|
|
||||||
|
|
||||||
- alert: HighNimWakuNodeOpenSockets
|
|
||||||
expr: >
|
|
||||||
netdata_ipv4_sockstat_tcp_sockets_sockets_average{
|
|
||||||
fleet=~"(shards|waku|status|wakuv2)\\..*"
|
|
||||||
} > 300
|
|
||||||
for: 5m
|
|
||||||
annotations:
|
|
||||||
summary: "Too high open sockets for {{ $labels.instance }}"
|
|
||||||
description: "Host {{ $labels.instance }} running nim-waku has more than 300 open sockets"
|
|
||||||
current_value: "{{ $value }}"
|
|
||||||
|
|
||||||
- record: job:waku_libp2p_peers
|
|
||||||
expr: libp2p_peers{fleet=~"(shards|waku|status|wakuv2)\\..*"}
|
|
||||||
|
|
||||||
- alert: NimWakuPeersDecrease
|
|
||||||
expr: >
|
|
||||||
(job:waku_libp2p_peers / avg_over_time(job:waku_libp2p_peers[12h])) < 0.50
|
|
||||||
for: 15m
|
|
||||||
annotations:
|
|
||||||
summary: "Drop of libp2p_peers on {{ $labels.instance }}"
|
|
||||||
description: "Host {{ $labels.instance }} running nim-waku has more than 50% drop of peers compared to 12h average"
|
|
||||||
current_value: "{{ $value }}"
|
current_value: "{{ $value }}"
|
||||||
@ -10,6 +10,9 @@ alerting:
|
|||||||
static_configs:
|
static_configs:
|
||||||
- targets: [ 'alertmanager:9093' ]
|
- targets: [ 'alertmanager:9093' ]
|
||||||
|
|
||||||
|
rule_files:
|
||||||
|
- "./alert-rules.yml"
|
||||||
|
|
||||||
scrape_configs:
|
scrape_configs:
|
||||||
- job_name: cadvisor
|
- job_name: cadvisor
|
||||||
scrape_interval: 5s
|
scrape_interval: 5s
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user