View in alerts dashboard
|
[4] Firing
|
Labels
alertname = SystemdUnitCrashLoop cluster = misc instance = wdqs2016:9100 job = node name = wdqs-blazegraph.service prometheus = ops severity = warning site = codfw source = prometheus team = search-platform
Annotations
dashboard = https://grafana.wikimedia.org/d/g-AaZRFWk/systemd-status description = wdqs-blazegraph.service has had 21.357642857142856 restarts in the last 10m runbook = TODO summary = wdqs-blazegraph.service crashloop on wdqs2016:9100
Source
|
Labels
alertname = SystemdUnitCrashLoop cluster = misc instance = wdqs2016:9100 job = node name = wdqs-categories.service prometheus = ops severity = warning site = codfw source = prometheus team = search-platform
Annotations
dashboard = https://grafana.wikimedia.org/d/g-AaZRFWk/systemd-status description = wdqs-categories.service has had 18.984571428571428 restarts in the last 10m runbook = TODO summary = wdqs-categories.service crashloop on wdqs2016:9100
Source
|
Labels
alertname = SystemdUnitCrashLoop cluster = misc instance = wdqs2018:9100 job = node name = wdqs-blazegraph.service prometheus = ops severity = warning site = codfw source = prometheus team = search-platform
Annotations
dashboard = https://grafana.wikimedia.org/d/g-AaZRFWk/systemd-status description = wdqs-blazegraph.service has had 33.84074333333333 restarts in the last 10m runbook = TODO summary = wdqs-blazegraph.service crashloop on wdqs2018:9100
Source
|
Labels
alertname = SystemdUnitCrashLoop cluster = misc instance = wdqs2020:9100 job = node name = wdqs-blazegraph.service prometheus = ops severity = warning site = codfw source = prometheus team = search-platform
Annotations
dashboard = https://grafana.wikimedia.org/d/g-AaZRFWk/systemd-status description = wdqs-blazegraph.service has had 15.944522222222222 restarts in the last 10m runbook = TODO summary = wdqs-blazegraph.service crashloop on wdqs2020:9100
Source
|