feat: Add rule for Kubernetes Job not starting (#436)

This commit is contained in:
sipr-invivo 2024-10-28 22:24:10 +01:00 committed by GitHub
parent f9e683896f
commit bb75cb2c68
No known key found for this signature in database
GPG key ID: B5690EEEBB952194

View file

@@ -2044,6 +2044,11 @@ groups:
description: "Job {{ $labels.namespace }}/{{ $labels.job_name }} failed to complete" description: "Job {{ $labels.namespace }}/{{ $labels.job_name }} failed to complete"
query: "kube_job_status_failed > 0" query: "kube_job_status_failed > 0"
severity: warning severity: warning
# Alert rule: matches a Job whose active, failed and succeeded status gauges
# are all 0 while more than 600 seconds (the 10 minutes named in the
# description) have elapsed since the value of kube_job_status_start_time.
- name: Kubernetes Job not starting
  summary: 'Kubernetes Job not starting ({{ $labels.namespace }}/{{ $labels.job_name }})'
  description: 'Job {{ $labels.namespace }}/{{ $labels.job_name }} did not start for 10 minutes'
  # Folded scalar: the lines below are joined with single spaces into one
  # expression, with no trailing newline.
  query: >-
    kube_job_status_active == 0
    and kube_job_status_failed == 0
    and kube_job_status_succeeded == 0
    and (time() - kube_job_status_start_time) > 600
  severity: warning
- name: Kubernetes CronJob suspended - name: Kubernetes CronJob suspended
summary: Kubernetes CronJob suspended ({{ $labels.namespace }}/{{ $labels.cronjob }}) summary: Kubernetes CronJob suspended ({{ $labels.namespace }}/{{ $labels.cronjob }})
description: "CronJob {{ $labels.namespace }}/{{ $labels.cronjob }} is suspended" description: "CronJob {{ $labels.namespace }}/{{ $labels.cronjob }} is suspended"