View in alerts dashboard
|
[15] Firing
|
Labels
alertname = SystemdUnitFailed instance = elastic2037:9100 name = clean-confd-rundir.service prometheus = ops severity = critical site = codfw source = prometheus team = search-platform
Annotations
dashboard = https://grafana.wikimedia.org/d/g-AaZRFWk/systemd-status description = clean-confd-rundir.service on elastic2037:9100 runbook = https://wikitech.wikimedia.org/wiki/Monitoring/check_systemd_state summary = clean-confd-rundir.service on elastic2037:9100
Source
|
Labels
alertname = SystemdUnitFailed instance = elastic2037:9100 name = confd_prometheus_metrics.service prometheus = ops severity = critical site = codfw source = prometheus team = search-platform
Annotations
dashboard = https://grafana.wikimedia.org/d/g-AaZRFWk/systemd-status description = confd_prometheus_metrics.service on elastic2037:9100 runbook = https://wikitech.wikimedia.org/wiki/Monitoring/check_systemd_state summary = confd_prometheus_metrics.service on elastic2037:9100
Source
|
Labels
alertname = SystemdUnitFailed instance = elastic2037:9100 name = elasticsearch-disable-readahead.service prometheus = ops severity = critical site = codfw source = prometheus team = search-platform
Annotations
dashboard = https://grafana.wikimedia.org/d/g-AaZRFWk/systemd-status description = elasticsearch-disable-readahead.service on elastic2037:9100 runbook = https://wikitech.wikimedia.org/wiki/Monitoring/check_systemd_state summary = elasticsearch-disable-readahead.service on elastic2037:9100
Source
|
Labels
alertname = SystemdUnitFailed instance = elastic2037:9100 name = elasticsearch_7@production-search-codfw.service prometheus = ops severity = critical site = codfw source = prometheus team = search-platform
Annotations
dashboard = https://grafana.wikimedia.org/d/g-AaZRFWk/systemd-status description = elasticsearch_7@production-search-codfw.service on elastic2037:9100 runbook = https://wikitech.wikimedia.org/wiki/Monitoring/check_systemd_state summary = elasticsearch_7@production-search-codfw.service on elastic2037:9100
Source
|
Labels
alertname = SystemdUnitFailed instance = elastic2037:9100 name = elasticsearch_7@production-search-omega-codfw.service prometheus = ops severity = critical site = codfw source = prometheus team = search-platform
Annotations
dashboard = https://grafana.wikimedia.org/d/g-AaZRFWk/systemd-status description = elasticsearch_7@production-search-omega-codfw.service on elastic2037:9100 runbook = https://wikitech.wikimedia.org/wiki/Monitoring/check_systemd_state summary = elasticsearch_7@production-search-omega-codfw.service on elastic2037:9100
Source
|
Labels
alertname = SystemdUnitFailed instance = elastic2037:9100 name = export_smart_data_dump.service prometheus = ops severity = critical site = codfw source = prometheus team = search-platform
Annotations
dashboard = https://grafana.wikimedia.org/d/g-AaZRFWk/systemd-status description = export_smart_data_dump.service on elastic2037:9100 runbook = https://wikitech.wikimedia.org/wiki/Monitoring/check_systemd_state summary = export_smart_data_dump.service on elastic2037:9100
Source
|
Labels
alertname = SystemdUnitFailed instance = elastic2037:9100 name = prometheus-debian-version-textfile.service prometheus = ops severity = critical site = codfw source = prometheus team = search-platform
Annotations
dashboard = https://grafana.wikimedia.org/d/g-AaZRFWk/systemd-status description = prometheus-debian-version-textfile.service on elastic2037:9100 runbook = https://wikitech.wikimedia.org/wiki/Monitoring/check_systemd_state summary = prometheus-debian-version-textfile.service on elastic2037:9100
Source
|
Labels
alertname = SystemdUnitFailed instance = elastic2037:9100 name = prometheus-dpkg-success-textfile.service prometheus = ops severity = critical site = codfw source = prometheus team = search-platform
Annotations
dashboard = https://grafana.wikimedia.org/d/g-AaZRFWk/systemd-status description = prometheus-dpkg-success-textfile.service on elastic2037:9100 runbook = https://wikitech.wikimedia.org/wiki/Monitoring/check_systemd_state summary = prometheus-dpkg-success-textfile.service on elastic2037:9100
Source
|
Labels
alertname = SystemdUnitFailed instance = elastic2037:9100 name = prometheus-elasticsearch-exporter-9200.service prometheus = ops severity = critical site = codfw source = prometheus team = search-platform
Annotations
dashboard = https://grafana.wikimedia.org/d/g-AaZRFWk/systemd-status description = prometheus-elasticsearch-exporter-9200.service on elastic2037:9100 runbook = https://wikitech.wikimedia.org/wiki/Monitoring/check_systemd_state summary = prometheus-elasticsearch-exporter-9200.service on elastic2037:9100
Source
|
Labels
alertname = SystemdUnitFailed instance = elastic2037:9100 name = prometheus-elasticsearch-exporter-9400.service prometheus = ops severity = critical site = codfw source = prometheus team = search-platform
Annotations
dashboard = https://grafana.wikimedia.org/d/g-AaZRFWk/systemd-status description = prometheus-elasticsearch-exporter-9400.service on elastic2037:9100 runbook = https://wikitech.wikimedia.org/wiki/Monitoring/check_systemd_state summary = prometheus-elasticsearch-exporter-9400.service on elastic2037:9100
Source
|
Labels
alertname = SystemdUnitFailed instance = elastic2037:9100 name = prometheus-ipmi-exporter.service prometheus = ops severity = critical site = codfw source = prometheus team = search-platform
Annotations
dashboard = https://grafana.wikimedia.org/d/g-AaZRFWk/systemd-status description = prometheus-ipmi-exporter.service on elastic2037:9100 runbook = https://wikitech.wikimedia.org/wiki/Monitoring/check_systemd_state summary = prometheus-ipmi-exporter.service on elastic2037:9100
Source
|
Labels
alertname = SystemdUnitFailed instance = elastic2037:9100 name = prometheus-nic-firmware-textfile.service prometheus = ops severity = critical site = codfw source = prometheus team = search-platform
Annotations
dashboard = https://grafana.wikimedia.org/d/g-AaZRFWk/systemd-status description = prometheus-nic-firmware-textfile.service on elastic2037:9100 runbook = https://wikitech.wikimedia.org/wiki/Monitoring/check_systemd_state summary = prometheus-nic-firmware-textfile.service on elastic2037:9100
Source
|
Labels
alertname = SystemdUnitFailed instance = elastic2037:9100 name = prometheus-puppet-agent-stats.service prometheus = ops severity = critical site = codfw source = prometheus team = search-platform
Annotations
dashboard = https://grafana.wikimedia.org/d/g-AaZRFWk/systemd-status description = prometheus-puppet-agent-stats.service on elastic2037:9100 runbook = https://wikitech.wikimedia.org/wiki/Monitoring/check_systemd_state summary = prometheus-puppet-agent-stats.service on elastic2037:9100
Source
|
Labels
alertname = SystemdUnitFailed instance = elastic2037:9100 name = prometheus_intel_microcode.service prometheus = ops severity = critical site = codfw source = prometheus team = search-platform
Annotations
dashboard = https://grafana.wikimedia.org/d/g-AaZRFWk/systemd-status description = prometheus_intel_microcode.service on elastic2037:9100 runbook = https://wikitech.wikimedia.org/wiki/Monitoring/check_systemd_state summary = prometheus_intel_microcode.service on elastic2037:9100
Source
|
Labels
alertname = SystemdUnitFailed instance = elastic2037:9100 name = user@24320.service prometheus = ops severity = critical site = codfw source = prometheus team = search-platform
Annotations
dashboard = https://grafana.wikimedia.org/d/g-AaZRFWk/systemd-status description = user@24320.service on elastic2037:9100 runbook = https://wikitech.wikimedia.org/wiki/Monitoring/check_systemd_state summary = user@24320.service on elastic2037:9100
Source
|