24 alerts for alertname=SystemdUnitFailed team=search-platform
View in alerts dashboard
[24] Firing
Labels
alertname = SystemdUnitFailed
instance = wdqs1011:9100
name = load-dcatap-weekly.service
prometheus = ops
severity = critical
site = eqiad
source = prometheus
team = search-platform
Annotations
dashboard = https://grafana.wikimedia.org/d/g-AaZRFWk/systemd-status
description = load-dcatap-weekly.service on wdqs1011:9100
runbook = https://wikitech.wikimedia.org/wiki/Monitoring/check_systemd_state
summary = load-dcatap-weekly.service on wdqs1011:9100
Source
Labels
alertname = SystemdUnitFailed
instance = wdqs1012:9100
name = load-dcatap-weekly.service
prometheus = ops
severity = critical
site = eqiad
source = prometheus
team = search-platform
Annotations
dashboard = https://grafana.wikimedia.org/d/g-AaZRFWk/systemd-status
description = load-dcatap-weekly.service on wdqs1012:9100
runbook = https://wikitech.wikimedia.org/wiki/Monitoring/check_systemd_state
summary = load-dcatap-weekly.service on wdqs1012:9100
Source
Labels
alertname = SystemdUnitFailed
instance = wdqs1013:9100
name = load-dcatap-weekly.service
prometheus = ops
severity = critical
site = eqiad
source = prometheus
team = search-platform
Annotations
dashboard = https://grafana.wikimedia.org/d/g-AaZRFWk/systemd-status
description = load-dcatap-weekly.service on wdqs1013:9100
runbook = https://wikitech.wikimedia.org/wiki/Monitoring/check_systemd_state
summary = load-dcatap-weekly.service on wdqs1013:9100
Source
Labels
alertname = SystemdUnitFailed
instance = wdqs1014:9100
name = load-dcatap-weekly.service
prometheus = ops
severity = critical
site = eqiad
source = prometheus
team = search-platform
Annotations
dashboard = https://grafana.wikimedia.org/d/g-AaZRFWk/systemd-status
description = load-dcatap-weekly.service on wdqs1014:9100
runbook = https://wikitech.wikimedia.org/wiki/Monitoring/check_systemd_state
summary = load-dcatap-weekly.service on wdqs1014:9100
Source
Labels
alertname = SystemdUnitFailed
instance = wdqs1015:9100
name = load-dcatap-weekly.service
prometheus = ops
severity = critical
site = eqiad
source = prometheus
team = search-platform
Annotations
dashboard = https://grafana.wikimedia.org/d/g-AaZRFWk/systemd-status
description = load-dcatap-weekly.service on wdqs1015:9100
runbook = https://wikitech.wikimedia.org/wiki/Monitoring/check_systemd_state
summary = load-dcatap-weekly.service on wdqs1015:9100
Source
Labels
alertname = SystemdUnitFailed
instance = wdqs1016:9100
name = load-dcatap-weekly.service
prometheus = ops
severity = critical
site = eqiad
source = prometheus
team = search-platform
Annotations
dashboard = https://grafana.wikimedia.org/d/g-AaZRFWk/systemd-status
description = load-dcatap-weekly.service on wdqs1016:9100
runbook = https://wikitech.wikimedia.org/wiki/Monitoring/check_systemd_state
summary = load-dcatap-weekly.service on wdqs1016:9100
Source
Labels
alertname = SystemdUnitFailed
instance = wdqs1017:9100
name = load-dcatap-weekly.service
prometheus = ops
severity = critical
site = eqiad
source = prometheus
team = search-platform
Annotations
dashboard = https://grafana.wikimedia.org/d/g-AaZRFWk/systemd-status
description = load-dcatap-weekly.service on wdqs1017:9100
runbook = https://wikitech.wikimedia.org/wiki/Monitoring/check_systemd_state
summary = load-dcatap-weekly.service on wdqs1017:9100
Source
Labels
alertname = SystemdUnitFailed
instance = wdqs1021:9100
name = load-dcatap-weekly.service
prometheus = ops
severity = critical
site = eqiad
source = prometheus
team = search-platform
Annotations
dashboard = https://grafana.wikimedia.org/d/g-AaZRFWk/systemd-status
description = load-dcatap-weekly.service on wdqs1021:9100
runbook = https://wikitech.wikimedia.org/wiki/Monitoring/check_systemd_state
summary = load-dcatap-weekly.service on wdqs1021:9100
Source
Labels
alertname = SystemdUnitFailed
instance = wdqs1022:9100
name = load-dcatap-weekly.service
prometheus = ops
severity = critical
site = eqiad
source = prometheus
team = search-platform
Annotations
dashboard = https://grafana.wikimedia.org/d/g-AaZRFWk/systemd-status
description = load-dcatap-weekly.service on wdqs1022:9100
runbook = https://wikitech.wikimedia.org/wiki/Monitoring/check_systemd_state
summary = load-dcatap-weekly.service on wdqs1022:9100
Source
Labels
alertname = SystemdUnitFailed
instance = wdqs1025:9100
name = load-dcatap-weekly.service
prometheus = ops
severity = critical
site = eqiad
source = prometheus
team = search-platform
Annotations
dashboard = https://grafana.wikimedia.org/d/g-AaZRFWk/systemd-status
description = load-dcatap-weekly.service on wdqs1025:9100
runbook = https://wikitech.wikimedia.org/wiki/Monitoring/check_systemd_state
summary = load-dcatap-weekly.service on wdqs1025:9100
Source
Labels
alertname = SystemdUnitFailed
instance = wdqs1026:9100
name = load-dcatap-weekly.service
prometheus = ops
severity = critical
site = eqiad
source = prometheus
team = search-platform
Annotations
dashboard = https://grafana.wikimedia.org/d/g-AaZRFWk/systemd-status
description = load-dcatap-weekly.service on wdqs1026:9100
runbook = https://wikitech.wikimedia.org/wiki/Monitoring/check_systemd_state
summary = load-dcatap-weekly.service on wdqs1026:9100
Source
Labels
alertname = SystemdUnitFailed
instance = wdqs2007:9100
name = load-dcatap-weekly.service
prometheus = ops
severity = critical
site = codfw
source = prometheus
team = search-platform
Annotations
dashboard = https://grafana.wikimedia.org/d/g-AaZRFWk/systemd-status
description = load-dcatap-weekly.service on wdqs2007:9100
runbook = https://wikitech.wikimedia.org/wiki/Monitoring/check_systemd_state
summary = load-dcatap-weekly.service on wdqs2007:9100
Source
Labels
alertname = SystemdUnitFailed
instance = wdqs2008:9100
name = load-dcatap-weekly.service
prometheus = ops
severity = critical
site = codfw
source = prometheus
team = search-platform
Annotations
dashboard = https://grafana.wikimedia.org/d/g-AaZRFWk/systemd-status
description = load-dcatap-weekly.service on wdqs2008:9100
runbook = https://wikitech.wikimedia.org/wiki/Monitoring/check_systemd_state
summary = load-dcatap-weekly.service on wdqs2008:9100
Source
Labels
alertname = SystemdUnitFailed
instance = wdqs2010:9100
name = load-dcatap-weekly.service
prometheus = ops
severity = critical
site = codfw
source = prometheus
team = search-platform
Annotations
dashboard = https://grafana.wikimedia.org/d/g-AaZRFWk/systemd-status
description = load-dcatap-weekly.service on wdqs2010:9100
runbook = https://wikitech.wikimedia.org/wiki/Monitoring/check_systemd_state
summary = load-dcatap-weekly.service on wdqs2010:9100
Source
Labels
alertname = SystemdUnitFailed
instance = wdqs2011:9100
name = load-dcatap-weekly.service
prometheus = ops
severity = critical
site = codfw
source = prometheus
team = search-platform
Annotations
dashboard = https://grafana.wikimedia.org/d/g-AaZRFWk/systemd-status
description = load-dcatap-weekly.service on wdqs2011:9100
runbook = https://wikitech.wikimedia.org/wiki/Monitoring/check_systemd_state
summary = load-dcatap-weekly.service on wdqs2011:9100
Source
Labels
alertname = SystemdUnitFailed
instance = wdqs2012:9100
name = load-dcatap-weekly.service
prometheus = ops
severity = critical
site = codfw
source = prometheus
team = search-platform
Annotations
dashboard = https://grafana.wikimedia.org/d/g-AaZRFWk/systemd-status
description = load-dcatap-weekly.service on wdqs2012:9100
runbook = https://wikitech.wikimedia.org/wiki/Monitoring/check_systemd_state
summary = load-dcatap-weekly.service on wdqs2012:9100
Source
Labels
alertname = SystemdUnitFailed
instance = wdqs2013:9100
name = load-dcatap-weekly.service
prometheus = ops
severity = critical
site = codfw
source = prometheus
team = search-platform
Annotations
dashboard = https://grafana.wikimedia.org/d/g-AaZRFWk/systemd-status
description = load-dcatap-weekly.service on wdqs2013:9100
runbook = https://wikitech.wikimedia.org/wiki/Monitoring/check_systemd_state
summary = load-dcatap-weekly.service on wdqs2013:9100
Source
Labels
alertname = SystemdUnitFailed
instance = wdqs2014:9100
name = load-dcatap-weekly.service
prometheus = ops
severity = critical
site = codfw
source = prometheus
team = search-platform
Annotations
dashboard = https://grafana.wikimedia.org/d/g-AaZRFWk/systemd-status
description = load-dcatap-weekly.service on wdqs2014:9100
runbook = https://wikitech.wikimedia.org/wiki/Monitoring/check_systemd_state
summary = load-dcatap-weekly.service on wdqs2014:9100
Source
Labels
alertname = SystemdUnitFailed
instance = wdqs2015:9100
name = load-dcatap-weekly.service
prometheus = ops
severity = critical
site = codfw
source = prometheus
team = search-platform
Annotations
dashboard = https://grafana.wikimedia.org/d/g-AaZRFWk/systemd-status
description = load-dcatap-weekly.service on wdqs2015:9100
runbook = https://wikitech.wikimedia.org/wiki/Monitoring/check_systemd_state
summary = load-dcatap-weekly.service on wdqs2015:9100
Source
Labels
alertname = SystemdUnitFailed
instance = wdqs2018:9100
name = load-dcatap-weekly.service
prometheus = ops
severity = critical
site = codfw
source = prometheus
team = search-platform
Annotations
dashboard = https://grafana.wikimedia.org/d/g-AaZRFWk/systemd-status
description = load-dcatap-weekly.service on wdqs2018:9100
runbook = https://wikitech.wikimedia.org/wiki/Monitoring/check_systemd_state
summary = load-dcatap-weekly.service on wdqs2018:9100
Source
Labels
alertname = SystemdUnitFailed
instance = wdqs2019:9100
name = load-dcatap-weekly.service
prometheus = ops
severity = critical
site = codfw
source = prometheus
team = search-platform
Annotations
dashboard = https://grafana.wikimedia.org/d/g-AaZRFWk/systemd-status
description = load-dcatap-weekly.service on wdqs2019:9100
runbook = https://wikitech.wikimedia.org/wiki/Monitoring/check_systemd_state
summary = load-dcatap-weekly.service on wdqs2019:9100
Source
Labels
alertname = SystemdUnitFailed
instance = wdqs2020:9100
name = load-dcatap-weekly.service
prometheus = ops
severity = critical
site = codfw
source = prometheus
team = search-platform
Annotations
dashboard = https://grafana.wikimedia.org/d/g-AaZRFWk/systemd-status
description = load-dcatap-weekly.service on wdqs2020:9100
runbook = https://wikitech.wikimedia.org/wiki/Monitoring/check_systemd_state
summary = load-dcatap-weekly.service on wdqs2020:9100
Source
Labels
alertname = SystemdUnitFailed
instance = wdqs2021:9100
name = load-dcatap-weekly.service
prometheus = ops
severity = critical
site = codfw
source = prometheus
team = search-platform
Annotations
dashboard = https://grafana.wikimedia.org/d/g-AaZRFWk/systemd-status
description = load-dcatap-weekly.service on wdqs2021:9100
runbook = https://wikitech.wikimedia.org/wiki/Monitoring/check_systemd_state
summary = load-dcatap-weekly.service on wdqs2021:9100
Source
Labels
alertname = SystemdUnitFailed
instance = wdqs2022:9100
name = load-dcatap-weekly.service
prometheus = ops
severity = critical
site = codfw
source = prometheus
team = search-platform
Annotations
dashboard = https://grafana.wikimedia.org/d/g-AaZRFWk/systemd-status
description = load-dcatap-weekly.service on wdqs2022:9100
runbook = https://wikitech.wikimedia.org/wiki/Monitoring/check_systemd_state
summary = load-dcatap-weekly.service on wdqs2022:9100
Source