From b367a3618365f09598dd8b2709da988dd8bfdb96 Mon Sep 17 00:00:00 2001 From: "Marco Maurer (-Kilchhofer)" <mkilchhofer@users.noreply.github.com> Date: Tue, 3 Sep 2024 10:26:19 +0200 Subject: [PATCH] deployment/alerts: add missing description for VMagent alerts (#6921) The 3 alerts for VMagent: - `RejectedRemoteWriteDataBlocksAreDropped` - `TooManyScrapeErrors` - `TooManyWriteErrors` were missing the description annotation. I moved the summary to description and added a generic summary to these alerts. ### Checklist The following checks are **mandatory**: - [x] My change adheres to [VictoriaMetrics contributing guidelines](https://docs.victoriametrics.com/contributing/). Signed-off-by: Marco Maurer <marco.kilchhofer@gmail.com> (cherry picked from commit f17fca718d45196cdefb2a924a248f89e9e09d4e) --- deployment/docker/alerts-vmagent.yml | 11 +++++++---- 1 file changed, 7 insertions(+), 4 deletions(-) diff --git a/deployment/docker/alerts-vmagent.yml b/deployment/docker/alerts-vmagent.yml index 15d522a7fc..bab461a855 100644 --- a/deployment/docker/alerts-vmagent.yml +++ b/deployment/docker/alerts-vmagent.yml @@ -27,8 +27,9 @@ groups: severity: warning annotations: dashboard: "http://localhost:3000/d/G7Z9GzMGz?viewPanel=79&var-instance={{ $labels.instance }}" - summary: "Job \"{{ $labels.job }}\" on instance {{ $labels.instance }} drops the rejected by - remote-write server data blocks. Check the logs to find the reason for rejects." + summary: "Vmagent is dropping data blocks that are rejected by remote storage" + description: "Job \"{{ $labels.job }}\" on instance {{ $labels.instance }} drops the rejected by + remote-write server data blocks. Check the logs to find the reason for rejects." 
- alert: TooManyScrapeErrors expr: increase(vm_promscrape_scrapes_failed_total[5m]) > 0 @@ -37,7 +38,8 @@ groups: severity: warning annotations: dashboard: "http://localhost:3000/d/G7Z9GzMGz?viewPanel=31&var-instance={{ $labels.instance }}" - summary: "Job \"{{ $labels.job }}\" on instance {{ $labels.instance }} fails to scrape targets for last 15m" + summary: "Vmagent fails to scrape one or more targets" + description: "Job \"{{ $labels.job }}\" on instance {{ $labels.instance }} fails to scrape targets for last 15m" - alert: TooManyWriteErrors expr: | @@ -49,7 +51,8 @@ groups: severity: warning annotations: dashboard: "http://localhost:3000/d/G7Z9GzMGz?viewPanel=77&var-instance={{ $labels.instance }}" - summary: "Job \"{{ $labels.job }}\" on instance {{ $labels.instance }} responds with errors to write requests for last 15m." + summary: "Vmagent responds with too many errors on data ingestion protocols" + description: "Job \"{{ $labels.job }}\" on instance {{ $labels.instance }} responds with errors to write requests for last 15m." - alert: TooManyRemoteWriteErrors expr: rate(vmagent_remotewrite_retries_count_total[5m]) > 0