1 alert for alertname=MaintainKubeusersDown project=tools
View in Alertmanager
[1] Resolved
Labels
alertname = MaintainKubeusersDown
instance = k8s.tools.eqiad1.wikimedia.cloud:6443
job = k8s-maintain-kubeusers
pod_label_app = maintain-kubeusers
pod_label_pod_template_hash = 844bc84845
pod_name = maintain-kubeusers-844bc84845-47ln8
project = tools
service = toolforge, maintain-kubeusers
severity = critical
source = prometheus
team = wmcs
Annotations
description = maintain-kubeusers is not getting its data into Prometheus. The daemon might be down or unresponsive. As a result, Toolforge might be unable to create new accounts, renew certificates, etc.
runbook = https://wikitech.wikimedia.org/wiki/Portal:Toolforge/Admin/Runbooks/MaintainKubeusersDown
summary = maintain-kubeusers is down
Source