Common information
- dashboard: https://grafana.wikimedia.org/d/g-AaZRFWk/systemd-status
- runbook: https://wikitech.wikimedia.org/wiki/Monitoring/check_systemd_state
- alertname: SystemdUnitFailed
- prometheus: ops
- severity: critical
- source: prometheus
- team: collaboration-services
Firing alerts
- dashboard: https://grafana.wikimedia.org/d/g-AaZRFWk/systemd-status
- description: backup-restore.service on gitlab1003:9100
- runbook: https://wikitech.wikimedia.org/wiki/Monitoring/check_systemd_state
- summary: backup-restore.service on gitlab1003:9100
- alertname: SystemdUnitFailed
- instance: gitlab1003:9100
- name: backup-restore.service
- prometheus: ops
- severity: critical
- site: eqiad
- source: prometheus
- team: collaboration-services
- Source
- dashboard: https://grafana.wikimedia.org/d/g-AaZRFWk/systemd-status
- description: backup-restore.service on gitlab1004:9100
- runbook: https://wikitech.wikimedia.org/wiki/Monitoring/check_systemd_state
- summary: backup-restore.service on gitlab1004:9100
- alertname: SystemdUnitFailed
- instance: gitlab1004:9100
- name: backup-restore.service
- prometheus: ops
- severity: critical
- site: eqiad
- source: prometheus
- team: collaboration-services
- Source
- dashboard: https://grafana.wikimedia.org/d/g-AaZRFWk/systemd-status
- description: prometheus-apache-exporter.service on planet2003:9100
- runbook: https://wikitech.wikimedia.org/wiki/Monitoring/check_systemd_state
- summary: prometheus-apache-exporter.service on planet2003:9100
- alertname: SystemdUnitFailed
- instance: planet2003:9100
- name: prometheus-apache-exporter.service
- prometheus: ops
- severity: critical
- site: codfw
- source: prometheus
- team: collaboration-services
- Source
- dashboard: https://grafana.wikimedia.org/d/g-AaZRFWk/systemd-status
- description: wmf_auto_restart_prometheus-apache-exporter.service on planet2003:9100
- runbook: https://wikitech.wikimedia.org/wiki/Monitoring/check_systemd_state
- summary: wmf_auto_restart_prometheus-apache-exporter.service on planet2003:9100
- alertname: SystemdUnitFailed
- instance: planet2003:9100
- name: wmf_auto_restart_prometheus-apache-exporter.service
- prometheus: ops
- severity: critical
- site: codfw
- source: prometheus
- team: collaboration-services
- Source
- dashboard: https://grafana.wikimedia.org/d/g-AaZRFWk/systemd-status
- description: prometheus-apache-exporter.service on planet1003:9100
- runbook: https://wikitech.wikimedia.org/wiki/Monitoring/check_systemd_state
- summary: prometheus-apache-exporter.service on planet1003:9100
- alertname: SystemdUnitFailed
- instance: planet1003:9100
- name: prometheus-apache-exporter.service
- prometheus: ops
- severity: critical
- site: eqiad
- source: prometheus
- team: collaboration-services
- Source
- dashboard: https://grafana.wikimedia.org/d/g-AaZRFWk/systemd-status
- description: wmf_auto_restart_prometheus-apache-exporter.service on planet1003:9100
- runbook: https://wikitech.wikimedia.org/wiki/Monitoring/check_systemd_state
- summary: wmf_auto_restart_prometheus-apache-exporter.service on planet1003:9100
- alertname: SystemdUnitFailed
- instance: planet1003:9100
- name: wmf_auto_restart_prometheus-apache-exporter.service
- prometheus: ops
- severity: critical
- site: eqiad
- source: prometheus
- team: collaboration-services
- Source