1 alert for alertname=MaintainKubeusersHang project=tools
View in Alertmanager
[1] Resolved
Labels
alertname = MaintainKubeusersHang
instance = k8s.tools.eqiad1.wikimedia.cloud:6443
job = k8s-maintain-kubeusers
pod_label_app = maintain-kubeusers
pod_label_pod_template_hash = 5f7f944f8
pod_name = maintain-kubeusers-5f7f944f8-bf7sz
project = tools
service = toolforge, maintain-kubeusers
severity = critical
source = prometheus
team = wmcs
Annotations
description = The last finished run of maintain-kubeusers is very old. The daemon might be down or unresponsive. As a result, Toolforge might be unable to create new accounts, renew certificates, etc.
runbook = https://wikitech.wikimedia.org/wiki/Portal:Toolforge/Admin/Runbooks/MaintainKubeusersDown
summary = maintain-kubeusers last finished run is 28.63M minutes old
Source