mirror of
https://github.com/VictoriaMetrics/VictoriaMetrics.git
synced 2024-12-11 14:53:49 +00:00
8441375da2
* vmalert: add `debug` mode for alerting rules Debug information includes alerts state changes and requests sent to the datasource. Debug can be enabled only on rule's level. It might be useful for debugging unexpected behaviour of alerting rule. https://github.com/VictoriaMetrics/VictoriaMetrics/issues/3025 Signed-off-by: hagen1778 <roman@victoriametrics.com> * vmalert: review fixes Signed-off-by: hagen1778 <roman@victoriametrics.com> * Update app/vmalert/alerting.go Co-authored-by: Aliaksandr Valialkin <valyala@victoriametrics.com> * vmalert: go fmt Signed-off-by: hagen1778 <roman@victoriametrics.com> Signed-off-by: hagen1778 <roman@victoriametrics.com> Co-authored-by: Aliaksandr Valialkin <valyala@victoriametrics.com>
61 lines
No EOL
2 KiB
Text
61 lines
No EOL
2 KiB
Text
groups:
  # One rule group. interval, concurrency, limit, headers and params are
  # group-level keys that sit beside the `rules` list.
  - name: TestGroup
    interval: 5s
    concurrency: 2
    limit: 1000
    headers:
      # Quoted: the value contains ": ", which a plain scalar would turn
      # into a nested mapping.
      - "MyHeader: foo"
    params:
      denyPartialResponse: ["true"]
    rules:
      - alert: Conns
        expr: sum(vm_tcplistener_conns) by(instance) > 1
        for: 3m
        # Rule-level debug mode: logs alert state changes and the requests
        # sent to the datasource.
        debug: true
        annotations:
          # Multi-line plain scalar: YAML folds the continuation lines into
          # the first one, joined by single spaces.
          summary: Too high connection number for {{$labels.instance}}
            {{ with printf "sum(vm_tcplistener_conns{instance=%q})" .Labels.instance | query }}
            {{ . | first | value }}
            {{ end }}
          description: "It is {{ $value }} connections for {{$labels.instance}}"
      - alert: ExampleAlertAlwaysFiring
        # Plain scalar continued on the next line; parsed as
        # "sum by(job) (up == 1)".
        expr: sum by(job)
          (up == 1)
        labels:
          job: '{{ $labels.job }}'
          dynamic: '{{ $x := query "up" | first | value }}{{ if eq 1.0 $x }}one{{ else }}unknown{{ end }}'
        annotations:
          description: Job {{ $labels.job }} is up!
          external: cluster-{{ $externalLabels.cluster }}; replica-{{ $externalLabels.replica }}
          summary: All instances up {{ range query "up" }}
            {{ . | label "instance" }}
            {{ end }}
      - record: handler:requests:rate5m
        expr: sum(rate(prometheus_http_requests_total[5m])) by (handler)
        labels:
          # Label values are strings; quoted so no parser types this as a
          # boolean.
          recording: "true"
      # The next two rules intentionally share a record name and expression;
      # they differ only in the `env` label.
      - record: code:requests:rate5m
        expr: sum(rate(promhttp_metric_handler_requests_total[5m])) by (code)
        labels:
          env: dev
          recording: "true"
      - record: code:requests:rate5m
        expr: sum(rate(promhttp_metric_handler_requests_total[5m])) by (code)
        labels:
          env: staging
          recording: "true"
      - record: successful_requests:ratio_rate5m
        labels:
          recording: "true"
        # `|2` fixes the block's content indent at two columns past this
        # mapping, so extra leading spaces on a line stay in the expression.
        # NOTE(review): the exact leading whitespace of the three lines below
        # was not recoverable; PromQL ignores it, but confirm against the
        # upstream fixture.
        expr: |2
            sum(code:requests:rate5m{code="200"})
          /
            sum(code:requests:rate5m)
      - record: code:requests:slo
        labels:
          recording: "true"
        # The expression is the text "0.95"; quoted so it is not typed as a
        # float.
        expr: "0.95"
      - record: time:current
        labels:
          recording: "true"
        expr: time()