15 alerts for alertname=SystemdUnitFailed team=search-platform
View in alerts dashboard
[15] Firing
Labels
alertname = SystemdUnitFailed
instance = elastic2037:9100
name = clean-confd-rundir.service
prometheus = ops
severity = critical
site = codfw
source = prometheus
team = search-platform
Annotations
dashboard = https://grafana.wikimedia.org/d/g-AaZRFWk/systemd-status
description = clean-confd-rundir.service on elastic2037:9100
runbook = https://wikitech.wikimedia.org/wiki/Monitoring/check_systemd_state
summary = clean-confd-rundir.service on elastic2037:9100
Source
Labels
alertname = SystemdUnitFailed
instance = elastic2037:9100
name = confd_prometheus_metrics.service
prometheus = ops
severity = critical
site = codfw
source = prometheus
team = search-platform
Annotations
dashboard = https://grafana.wikimedia.org/d/g-AaZRFWk/systemd-status
description = confd_prometheus_metrics.service on elastic2037:9100
runbook = https://wikitech.wikimedia.org/wiki/Monitoring/check_systemd_state
summary = confd_prometheus_metrics.service on elastic2037:9100
Source
Labels
alertname = SystemdUnitFailed
instance = elastic2037:9100
name = elasticsearch-disable-readahead.service
prometheus = ops
severity = critical
site = codfw
source = prometheus
team = search-platform
Annotations
dashboard = https://grafana.wikimedia.org/d/g-AaZRFWk/systemd-status
description = elasticsearch-disable-readahead.service on elastic2037:9100
runbook = https://wikitech.wikimedia.org/wiki/Monitoring/check_systemd_state
summary = elasticsearch-disable-readahead.service on elastic2037:9100
Source
Labels
alertname = SystemdUnitFailed
instance = elastic2037:9100
name = elasticsearch_7@production-search-codfw.service
prometheus = ops
severity = critical
site = codfw
source = prometheus
team = search-platform
Annotations
dashboard = https://grafana.wikimedia.org/d/g-AaZRFWk/systemd-status
description = elasticsearch_7@production-search-codfw.service on elastic2037:9100
runbook = https://wikitech.wikimedia.org/wiki/Monitoring/check_systemd_state
summary = elasticsearch_7@production-search-codfw.service on elastic2037:9100
Source
Labels
alertname = SystemdUnitFailed
instance = elastic2037:9100
name = elasticsearch_7@production-search-omega-codfw.service
prometheus = ops
severity = critical
site = codfw
source = prometheus
team = search-platform
Annotations
dashboard = https://grafana.wikimedia.org/d/g-AaZRFWk/systemd-status
description = elasticsearch_7@production-search-omega-codfw.service on elastic2037:9100
runbook = https://wikitech.wikimedia.org/wiki/Monitoring/check_systemd_state
summary = elasticsearch_7@production-search-omega-codfw.service on elastic2037:9100
Source
Labels
alertname = SystemdUnitFailed
instance = elastic2037:9100
name = export_smart_data_dump.service
prometheus = ops
severity = critical
site = codfw
source = prometheus
team = search-platform
Annotations
dashboard = https://grafana.wikimedia.org/d/g-AaZRFWk/systemd-status
description = export_smart_data_dump.service on elastic2037:9100
runbook = https://wikitech.wikimedia.org/wiki/Monitoring/check_systemd_state
summary = export_smart_data_dump.service on elastic2037:9100
Source
Labels
alertname = SystemdUnitFailed
instance = elastic2037:9100
name = prometheus-debian-version-textfile.service
prometheus = ops
severity = critical
site = codfw
source = prometheus
team = search-platform
Annotations
dashboard = https://grafana.wikimedia.org/d/g-AaZRFWk/systemd-status
description = prometheus-debian-version-textfile.service on elastic2037:9100
runbook = https://wikitech.wikimedia.org/wiki/Monitoring/check_systemd_state
summary = prometheus-debian-version-textfile.service on elastic2037:9100
Source
Labels
alertname = SystemdUnitFailed
instance = elastic2037:9100
name = prometheus-dpkg-success-textfile.service
prometheus = ops
severity = critical
site = codfw
source = prometheus
team = search-platform
Annotations
dashboard = https://grafana.wikimedia.org/d/g-AaZRFWk/systemd-status
description = prometheus-dpkg-success-textfile.service on elastic2037:9100
runbook = https://wikitech.wikimedia.org/wiki/Monitoring/check_systemd_state
summary = prometheus-dpkg-success-textfile.service on elastic2037:9100
Source
Labels
alertname = SystemdUnitFailed
instance = elastic2037:9100
name = prometheus-elasticsearch-exporter-9200.service
prometheus = ops
severity = critical
site = codfw
source = prometheus
team = search-platform
Annotations
dashboard = https://grafana.wikimedia.org/d/g-AaZRFWk/systemd-status
description = prometheus-elasticsearch-exporter-9200.service on elastic2037:9100
runbook = https://wikitech.wikimedia.org/wiki/Monitoring/check_systemd_state
summary = prometheus-elasticsearch-exporter-9200.service on elastic2037:9100
Source
Labels
alertname = SystemdUnitFailed
instance = elastic2037:9100
name = prometheus-elasticsearch-exporter-9400.service
prometheus = ops
severity = critical
site = codfw
source = prometheus
team = search-platform
Annotations
dashboard = https://grafana.wikimedia.org/d/g-AaZRFWk/systemd-status
description = prometheus-elasticsearch-exporter-9400.service on elastic2037:9100
runbook = https://wikitech.wikimedia.org/wiki/Monitoring/check_systemd_state
summary = prometheus-elasticsearch-exporter-9400.service on elastic2037:9100
Source
Labels
alertname = SystemdUnitFailed
instance = elastic2037:9100
name = prometheus-ipmi-exporter.service
prometheus = ops
severity = critical
site = codfw
source = prometheus
team = search-platform
Annotations
dashboard = https://grafana.wikimedia.org/d/g-AaZRFWk/systemd-status
description = prometheus-ipmi-exporter.service on elastic2037:9100
runbook = https://wikitech.wikimedia.org/wiki/Monitoring/check_systemd_state
summary = prometheus-ipmi-exporter.service on elastic2037:9100
Source
Labels
alertname = SystemdUnitFailed
instance = elastic2037:9100
name = prometheus-nic-firmware-textfile.service
prometheus = ops
severity = critical
site = codfw
source = prometheus
team = search-platform
Annotations
dashboard = https://grafana.wikimedia.org/d/g-AaZRFWk/systemd-status
description = prometheus-nic-firmware-textfile.service on elastic2037:9100
runbook = https://wikitech.wikimedia.org/wiki/Monitoring/check_systemd_state
summary = prometheus-nic-firmware-textfile.service on elastic2037:9100
Source
Labels
alertname = SystemdUnitFailed
instance = elastic2037:9100
name = prometheus-puppet-agent-stats.service
prometheus = ops
severity = critical
site = codfw
source = prometheus
team = search-platform
Annotations
dashboard = https://grafana.wikimedia.org/d/g-AaZRFWk/systemd-status
description = prometheus-puppet-agent-stats.service on elastic2037:9100
runbook = https://wikitech.wikimedia.org/wiki/Monitoring/check_systemd_state
summary = prometheus-puppet-agent-stats.service on elastic2037:9100
Source
Labels
alertname = SystemdUnitFailed
instance = elastic2037:9100
name = prometheus_intel_microcode.service
prometheus = ops
severity = critical
site = codfw
source = prometheus
team = search-platform
Annotations
dashboard = https://grafana.wikimedia.org/d/g-AaZRFWk/systemd-status
description = prometheus_intel_microcode.service on elastic2037:9100
runbook = https://wikitech.wikimedia.org/wiki/Monitoring/check_systemd_state
summary = prometheus_intel_microcode.service on elastic2037:9100
Source
Labels
alertname = SystemdUnitFailed
instance = elastic2037:9100
name = user@24320.service
prometheus = ops
severity = critical
site = codfw
source = prometheus
team = search-platform
Annotations
dashboard = https://grafana.wikimedia.org/d/g-AaZRFWk/systemd-status
description = user@24320.service on elastic2037:9100
runbook = https://wikitech.wikimedia.org/wiki/Monitoring/check_systemd_state
summary = user@24320.service on elastic2037:9100
Source