about summary refs log tree commit diff
path: root/modules/nixos/monitoring/rules/nginx.yaml
blob: 59229a88aa83804bf042ae9b249c9f25429959b6 (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
---
# Prometheus alerting rules for NGINX: HTTP 4xx/5xx error ratios and
# 99th-percentile request latency.
groups:
  - name: Nginx

    rules:
      # Fires when more than 5% of the requests handled by one instance ended
      # with a 4xx status over the last minute, sustained for one minute.
      - alert: NginxHighHttp4xxErrorRate
        # Both sides of the ratio are aggregated by `instance`. A bare sum()
        # drops every label, which left $labels.instance in the summary empty.
        # With no traffic the division yields NaN, and NaN > 5 is false, so
        # idle instances do not fire.
        expr: >-
          sum by (instance) (rate(nginx_http_requests_total{status=~"^4.."}[1m]))
          / sum by (instance) (rate(nginx_http_requests_total[1m])) * 100
          > 5
        for: 1m
        labels:
          severity: critical
        annotations:
          summary: NGINX high HTTP 4xx error rate (instance {{ $labels.instance }})
          description: |-
            Too many HTTP requests with status 4xx (> 5%).

              VALUE = {{ $value }}
              LABELS = {{ $labels }}

      # Fires when more than 5% of the requests handled by one instance ended
      # with a 5xx status over the last minute, sustained for one minute.
      - alert: NginxHighHttp5xxErrorRate
        # Both sides of the ratio are aggregated by `instance`. A bare sum()
        # drops every label, which left $labels.instance in the summary empty.
        # With no traffic the division yields NaN, and NaN > 5 is false, so
        # idle instances do not fire.
        expr: >-
          sum by (instance) (rate(nginx_http_requests_total{status=~"^5.."}[1m]))
          / sum by (instance) (rate(nginx_http_requests_total[1m])) * 100
          > 5
        for: 1m
        labels:
          severity: critical
        annotations:
          summary: NGINX high HTTP 5xx error rate (instance {{ $labels.instance }})
          description: |-
            Too many HTTP requests with status 5xx (> 5%).

              VALUE = {{ $value }}
              LABELS = {{ $labels }}

      # Fires when the 99th-percentile request duration for a host/node pair
      # stays above 3 seconds for two minutes.
      - alert: NginxLatencyHigh
        # `le` must survive the aggregation: histogram_quantile() reads the
        # bucket upper bounds from that label and cannot compute a quantile
        # once it has been summed away.
        expr: >-
          histogram_quantile(0.99,
            sum(rate(nginx_http_request_duration_seconds_bucket[2m])) by (host, node, le))
          > 3
        for: 2m
        labels:
          severity: warning
        annotations:
          # Only `host` and `node` remain after the aggregation above, so the
          # summary names those instead of the dropped `instance` label.
          summary: NGINX high latency (host {{ $labels.host }}, node {{ $labels.node }})
          description: |-
            NGINX 99% latency is higher than 3 seconds.

              VALUE = {{ $value }}
              LABELS = {{ $labels }}

Consider giving Nix/NixOS a try! <3