diff --git a/prometheus/prometheus/config/reles/node_rules.yml b/prometheus/prometheus/config/reles/node_rules.yml index 134801c..bb337d4 100644 --- a/prometheus/prometheus/config/reles/node_rules.yml +++ b/prometheus/prometheus/config/reles/node_rules.yml @@ -40,23 +40,23 @@ groups: - alert: 网络流入 - expr: ((sum(rate (node_network_receive_bytes_total{device!~'tap.*|veth.*|br.*|docker.*|virbr*|lo*'}[5m])) by (instance,job)) / 100) > 102400 + expr: ((sum(rate (node_network_receive_bytes_total{device!~'tap.*|veth.*|br.*|docker.*|virbr*|lo*'}[15m])) by (instance,job)) / 100) > 202400 for: 1m labels: severity: 严重告警 annotations: summary: "{{$labels.instance}} 流入网络带宽过高,请尽快处理!" - description: "{{$labels.instance}} 流入网络带宽持续1分钟高于100M. RX带宽使用量{{$value}}." + description: "{{$labels.instance}} 流入网络带宽持续1分钟高于200M. RX带宽使用量{{$value | printf \"%.2f\"}}." - alert: 网络流出 - expr: ((sum(rate (node_network_transmit_bytes_total{device!~'tap.*|veth.*|br.*|docker.*|virbr*|lo*'}[5m])) by (instance,job)) / 100) > 102400 + expr: ((sum(rate (node_network_transmit_bytes_total{device!~'tap.*|veth.*|br.*|docker.*|virbr*|lo*'}[15m])) by (instance,job)) / 100) > 202400 for: 1m labels: severity: 严重告警 annotations: summary: "{{$labels.instance}} 流出网络带宽过高,请尽快处理!" - description: "{{$labels.instance}} 流出网络带宽持15分钟高于100M. RX带宽使用量{$value}}." - + description: "{{$labels.instance}} 流出网络带宽持15分钟高于200M. RX带宽使用量{{$value | printf \"%.2f\"}}." + - alert: TCP连接数 expr: node_netstat_Tcp_CurrEstab > 10000 for: 1m