keps/sig-apps/3329-retriable-and-non-retriable-failures/kep.yaml (41 lines of code) (raw):
title: Retriable and non-retriable Pod failures for Jobs
kep-number: 3329
authors:
- "@mimowo"
owning-sig: sig-apps
participating-sigs:
- sig-scheduling
- sig-node
status: implementable
creation-date: 2022-06-07
reviewers:
- "@liggitt"
- "@bobbypage"
- "@SergeyKanzhelev"
approvers:
- "@soltysh"
- "@alculquicondor"
- "@deads2k"
- "@dchen1107"
# The target maturity stage in the current dev cycle for this KEP.
stage: beta
# The most recent milestone for which work toward delivery of this KEP has been
# done. This can be the current (upcoming) milestone, if it is being actively
# worked on.
latest-milestone: "v1.27"
# The milestone at which this feature was, or is targeted to be, at each stage.
milestone:
alpha: "v1.25"
beta: "v1.26"
stable: "v1.29"
# The following PRR answers are required at alpha release
# List the feature gate name and the components for which it must be enabled
feature-gates:
- name: PodDisruptionConditions
components:
- kube-apiserver
- kube-controller-manager
- kube-scheduler
- kubelet
- name: JobPodFailurePolicy
components:
- kube-apiserver
- kube-controller-manager
disable-supported: true
# The following PRR answers are required at beta release
metrics:
- job_sync_duration_seconds
- job_finished_total
- job_pod_failure_total