1 alert for alertname=MaintainKubeusersHang project=tools
View in Alertmanager
[1] Resolved
Labels
alertname = MaintainKubeusersHang
instance = k8s.tools.eqiad1.wikimedia.cloud:6443
job = k8s-maintain-kubeusers
pod_label_app = maintain-kubeusers
pod_label_pod_template_hash = 767c48c4cb
pod_name = maintain-kubeusers-767c48c4cb-kx789
project = tools
service = toolforge, maintain-kubeusers
severity = critical
source = prometheus
team = wmcs
Annotations
description = The last finished run of maintain-kubeusers is very old. The daemon might be down or unresponsive. As a result, Toolforge might be unable to create new accounts, renew certificates, or perform related tasks.
runbook = https://wikitech.wikimedia.org/wiki/Portal:Toolforge/Admin/Runbooks/MaintainKubeusersDown
summary = maintain-kubeusers last finished run is 28.66M minutes old
Source