Source code for airflow.providers.cncf.kubernetes.operators.job

# Licensed to the Apache Software Foundation (ASF) under one
# or more contributor license agreements.  See the NOTICE file
# distributed with this work for additional information
# regarding copyright ownership.  The ASF licenses this file
# to you under the Apache License, Version 2.0 (the
# "License"); you may not use this file except in compliance
# with the License.  You may obtain a copy of the License at
#
#   http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing,
# software distributed under the License is distributed on an
# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
# KIND, either express or implied.  See the License for the
# specific language governing permissions and limitations
# under the License.
"""Executes a Kubernetes Job."""

from __future__ import annotations

import copy
import json
import logging
import os
import sys
import warnings
from collections.abc import Sequence
from functools import cached_property
from typing import TYPE_CHECKING, Any, Literal

from kubernetes.client import BatchV1Api, Configuration, models as k8s
from kubernetes.client.api_client import ApiClient
from kubernetes.client.rest import ApiException

from airflow.exceptions import AirflowProviderDeprecationWarning
from airflow.providers.cncf.kubernetes.hooks.kubernetes import KubernetesHook
from airflow.providers.cncf.kubernetes.kubernetes_helper_functions import (
    POD_NAME_MAX_LENGTH,
    add_unique_suffix,
    create_unique_id,
)
from airflow.providers.cncf.kubernetes.operators.pod import KubernetesPodOperator
from airflow.providers.cncf.kubernetes.pod_generator import PodGenerator, merge_objects
from airflow.providers.cncf.kubernetes.triggers.job import KubernetesJobTrigger
from airflow.providers.cncf.kubernetes.utils.pod_manager import EMPTY_XCOM_RESULT, OnKillAction
from airflow.providers.cncf.kubernetes.version_compat import AIRFLOW_V_3_1_PLUS
from airflow.providers.common.compat.sdk import AirflowException, TaskDeferred, conf
from airflow.utils import yaml

if AIRFLOW_V_3_1_PLUS:
    from airflow.sdk import BaseOperator
else:
    from airflow.models import BaseOperator

if TYPE_CHECKING:
    from airflow.sdk import Context


[docs]
# Module-level logger, used where no operator instance (and therefore no
# ``self.log``) is available, e.g. inside static helpers.
log = logging.getLogger(__name__)



[docs]
# Prefix prepended to every Job name produced by
# ``KubernetesJobOperator.build_job_request_obj``.
JOB_NAME_PREFIX = "job-"




[docs]
class KubernetesJobOperator(KubernetesPodOperator):
    """
    Executes a Kubernetes Job.

    .. seealso::
        For more information on how to use this operator, take a look at the guide:
        :ref:`howto/operator:KubernetesJobOperator`

    .. note::
        If you use `Google Kubernetes Engine <https://cloud.google.com/kubernetes-engine/>`__
        and Airflow is not running in the same cluster, consider using
        :class:`~airflow.providers.google.cloud.operators.kubernetes_engine.GKEStartJobOperator`, which
        simplifies the authorization process.

    :param job_template_file: path to job template file (templated)
    :param full_job_spec: The complete Job specification (a ``V1Job`` object)
    :param backoff_limit: Specifies the number of retries before marking this job failed. Defaults to 6
    :param completion_mode: CompletionMode specifies how Pod completions are tracked. It can be `NonIndexed` (default) or `Indexed`.
    :param completions: Specifies the desired number of successfully finished pods the job should be run with.
    :param manual_selector: manualSelector controls generation of pod labels and pod selectors.
    :param parallelism: Specifies the maximum desired number of pods the job should run at any given time.
        The value here must be >=1 if wait_until_job_complete=True. Default value is 1
    :param selector: The selector of this V1JobSpec.
    :param suspend: Suspend specifies whether the Job controller should create Pods or not.
    :param ttl_seconds_after_finished: ttlSecondsAfterFinished limits the lifetime of a Job that has finished execution (either Complete or Failed).
    :param wait_until_job_complete: Whether to wait until the started job has finished execution (either
        Complete or Failed). Default is False.
    :param job_poll_interval: Interval in seconds between polling the job status. Default is 10.
        Used if the parameter `wait_until_job_complete` set True.
    :param deferrable: Run operator in the deferrable mode. Note that the parameter
        `wait_until_job_complete` must be set True.
    :param on_kill_propagation_policy: Whether and how garbage collection will be performed. Default is 'Foreground'.
        Acceptable values are:
        'Orphan' - orphan the dependents;
        'Background' - allow the garbage collector to delete the dependents in the background;
        'Foreground' - a cascading policy that deletes all dependents in the foreground.
        Default value is 'Foreground'.
    :param discover_pods_retry_number: Maximum number of retries (after the first attempt) of
        list_namespaced_pod when discovering already running pods.
    :param unwrap_single: Unwrap single result from the pod. For example, when set to `True` - if the XCom
        result should be `['res']`, the final result would be `'res'`. Default is True to support backward
        compatibility.
    """


[docs]
    # The parent operator's templated fields plus ``job_template_file``. The names
    # are merged through a set union, so duplicates collapse and the order of the
    # resulting tuple is not guaranteed.
    template_fields: Sequence[str] = tuple({"job_template_file"} | set(KubernetesPodOperator.template_fields))


    def __init__(
        self,
        *,
        job_template_file: str | None = None,
        full_job_spec: k8s.V1Job | None = None,
        backoff_limit: int | None = None,
        completion_mode: str | None = None,
        completions: int | None = None,
        manual_selector: bool | None = None,
        parallelism: int = 1,
        selector: k8s.V1LabelSelector | None = None,
        suspend: bool | None = None,
        ttl_seconds_after_finished: int | None = None,
        wait_until_job_complete: bool = False,
        job_poll_interval: float = 10,
        deferrable: bool = conf.getboolean("operators", "default_deferrable", fallback=False),
        on_kill_propagation_policy: Literal["Foreground", "Background", "Orphan"] = "Foreground",
        discover_pods_retry_number: int = 3,
        unwrap_single: bool = True,
        **kwargs,
    ) -> None:
        """
        Store the Job-specific settings and forward everything else to the parent operator.

        All parameters are keyword-only and are described in the class docstring.
        Any keyword argument not listed in the signature is passed unchanged to
        ``KubernetesPodOperator.__init__``.
        """
        # Backing attribute written by the ``pod`` property setter. It is created
        # before the parent initializer runs.
        # NOTE(review): presumably the parent initializer assigns ``self.pod``,
        # which is routed through that setter - confirm against the parent class.
        self._pod = None
        super().__init__(**kwargs)

        # Sources the Job definition can be built from.
        self.job_template_file = job_template_file
        self.full_job_spec = full_job_spec

        # Populated by ``execute``: the request that was built and the Job object
        # tracked for waiting and ``on_kill``.
        self.job_request_obj: k8s.V1Job | None = None
        self.job: k8s.V1Job | None = None

        # Values copied into the ``V1JobSpec`` by ``build_job_request_obj``.
        self.backoff_limit = backoff_limit
        self.completion_mode = completion_mode
        self.completions = completions
        self.manual_selector = manual_selector
        self.parallelism = parallelism
        self.selector = selector
        self.suspend = suspend
        self.ttl_seconds_after_finished = ttl_seconds_after_finished

        # Execution behaviour of the operator itself.
        self.wait_until_job_complete = wait_until_job_complete
        self.job_poll_interval = job_poll_interval
        self.deferrable = deferrable
        self.on_kill_propagation_policy = on_kill_propagation_policy
        self.discover_pods_retry_number = discover_pods_retry_number
        self.unwrap_single = unwrap_single


    @property

[docs]
    def pod(self):
        """
        Return the first entry of ``self.pods``, or ``None`` when it is empty.

        Deprecated accessor: every read emits an
        ``AirflowProviderDeprecationWarning`` pointing callers to ``pods``.
        """
        warnings.warn(
            "`pod` parameter is deprecated, please use `pods`",
            AirflowProviderDeprecationWarning,
            stacklevel=2,
        )
        if self.pods:
            return self.pods[0]
        return None


    @pod.setter
    def pod(self, value):
        # Only records the value on the private ``_pod`` attribute. The ``pod``
        # getter does not read it; it derives its result from ``self.pods``.
        self._pod = value

    @cached_property
    def _incluster_namespace(self):
        """
        Return the content of the service-account namespace file, if any.

        :return: the text of ``/var/run/secrets/kubernetes.io/serviceaccount/namespace``,
            or ``None`` when the file does not exist or is empty.
        """
        from pathlib import Path

        namespace_file = Path("/var/run/secrets/kubernetes.io/serviceaccount/namespace")
        if not namespace_file.exists():
            return None
        # An empty file is treated the same as a missing one.
        return namespace_file.read_text() or None

    @cached_property

[docs]
    def hook(self) -> KubernetesHook:
        """Build a ``KubernetesHook`` from this operator's connection settings."""
        return KubernetesHook(
            conn_id=self.kubernetes_conn_id,
            in_cluster=self.in_cluster,
            config_file=self.config_file,
            cluster_context=self.cluster_context,
        )


    @cached_property

[docs]
    def job_client(self) -> BatchV1Api:
        """Return the hook's ``batch_v1_client``, used here to delete Jobs in ``on_kill``."""
        return self.hook.batch_v1_client



[docs]
    def create_job(self, job_request_obj: k8s.V1Job) -> k8s.V1Job:
        """
        Submit the Job through the hook.

        :param job_request_obj: the Job definition to create.
        :return: the same ``job_request_obj`` that was passed in; whatever the
            hook's ``create_job`` returns is not used.
        """
        job_as_yaml = yaml.safe_dump(job_request_obj.to_dict())
        self.log.debug("Starting job:\n%s", job_as_yaml)

        self.hook.create_job(job=job_request_obj)
        return job_request_obj



[docs]
    def execute(self, context: Context):
        """
        Create the Kubernetes Job and, optionally, wait for it to finish.

        The Job name and namespace are always pushed to XCom under ``job_name``
        and ``job_namespace``. When ``wait_until_job_complete`` is set, the Job's
        pods are discovered via ``get_pods`` and the task either defers
        (``deferrable=True``) or blocks until the Job has finished, optionally
        collecting XCom results and container logs on the way. The Job object is
        pushed to XCom under ``job`` unless the task deferred.

        :param context: task context; ``context["ti"]`` is used to push XComs.
        :return: the collected XCom result(s) when both ``wait_until_job_complete``
            and ``do_xcom_push`` are set (a single result is unwrapped when
            ``unwrap_single`` is true); otherwise ``None``.
        :raises AirflowException: if ``parallelism`` is below 1 while
            ``wait_until_job_complete`` is set, or if the finished Job is reported
            as failed by the hook.
        """
        self.name = self._set_name(self.name)
        # Inconsistent flag combinations are only reported, not rejected.
        if self.deferrable and not self.wait_until_job_complete:
            self.log.warning(
                "Deferrable mode is available only with parameter `wait_until_job_complete=True`. "
                "Please, set it up."
            )
        if (self.get_logs or self.do_xcom_push) and not self.wait_until_job_complete:
            self.log.warning(
                "Getting Logs and pushing to XCom are available only with parameter `wait_until_job_complete=True`. "
                "Please, set it up."
            )
        if self.parallelism is None:
            warnings.warn(
                "parallelism should be set explicitly. Defaulting to 1.",
                AirflowProviderDeprecationWarning,
                stacklevel=2,
            )
            self.parallelism = 1
        elif self.wait_until_job_complete and self.parallelism < 1:
            # get_pods() will raise an error if parallelism = 0
            raise AirflowException("parallelism cannot be less than 1 with `wait_until_job_complete=True`.")
        self.job_request_obj = self.build_job_request_obj(context)
        self.job = self.create_job(  # must set `self.job` for `on_kill`
            job_request_obj=self.job_request_obj
        )

        ti = context["ti"]
        ti.xcom_push(key="job_name", value=self.job.metadata.name)
        ti.xcom_push(key="job_namespace", value=self.job.metadata.namespace)

        try:
            if self.wait_until_job_complete:
                # ``self.pod_request_obj`` was set by build_job_request_obj above.
                self.pods: Sequence[k8s.V1Pod] = self.get_pods(
                    pod_request_obj=self.pod_request_obj, context=context
                )

                if self.deferrable:
                    self.execute_deferrable()
                    # execute_deferrable raises TaskDeferred; cleanup is handled
                    # by execute_complete on resume.
                    return

                if self.do_xcom_push:
                    # XCom values are read from every pod before waiting on the
                    # Job itself. ``xcom_result`` is only bound under this flag;
                    # the return statement below is guarded by the same flag.
                    xcom_result = []
                    for pod in self.pods:
                        self.pod_manager.await_container_completion(
                            pod=pod, container_name=self.base_container_name
                        )
                        self.pod_manager.await_xcom_sidecar_container_start(pod=pod)
                        xcom_result.append(self.extract_xcom(pod=pod))
                # Replace the locally built Job with the object returned by the
                # hook once the Job has finished.
                self.job = self.hook.wait_until_job_complete(
                    job_name=self.job.metadata.name,
                    namespace=self.job.metadata.namespace,
                    job_poll_interval=self.job_poll_interval,
                )
                if self.get_logs:
                    for pod in self.pods:
                        self.pod_manager.fetch_requested_container_logs(
                            pod=pod,
                            containers=self.container_logs,
                            follow_logs=True,
                        )

            ti.xcom_push(key="job", value=self.job.to_dict())
            if self.wait_until_job_complete:
                # ``is_job_failed`` returns a truthy error message for a failed Job.
                if error_message := self.hook.is_job_failed(job=self.job):
                    raise AirflowException(
                        f"Kubernetes job '{self.job.metadata.name}' is failed with error '{error_message}'"
                    )
                if self.do_xcom_push:
                    return xcom_result[0] if self.unwrap_single and len(xcom_result) == 1 else xcom_result
        finally:
            # Runs on success and on failure; the helper itself skips the work
            # when the in-flight exception is TaskDeferred.
            self._cleanup_monitoring_pods(context)



[docs]
    def execute_deferrable(self):
        """
        Defer the task to a ``KubernetesJobTrigger`` that watches the created Job.

        Requires ``self.job`` and a non-empty ``self.pods`` to be set already
        (``execute`` does this). The task resumes in ``execute_complete``.
        """
        job_metadata = self.job.metadata
        trigger = KubernetesJobTrigger(
            job_name=job_metadata.name,
            job_namespace=job_metadata.namespace,
            pod_names=[pod.metadata.name for pod in self.pods],
            # The namespace of the first pod is used for all pods.
            pod_namespace=self.pods[0].metadata.namespace,
            base_container_name=self.base_container_name,
            kubernetes_conn_id=self.kubernetes_conn_id,
            cluster_context=self.cluster_context,
            config_file=self.config_file,
            in_cluster=self.in_cluster,
            poll_interval=self.job_poll_interval,
            get_logs=self.get_logs,
            do_xcom_push=self.do_xcom_push,
        )
        self.defer(trigger=trigger, method_name="execute_complete")



[docs]
    def execute_complete(self, context: Context, event: dict, **kwargs):
        """
        Resume the task after the deferred trigger has fired.

        Reads the following keys from ``event``: ``job``, ``status``, ``message``
        (only on error), ``pod_names``, ``pod_namespace`` / ``namespace`` and
        ``xcom_result`` (only when ``do_xcom_push`` is set).

        :param context: task context; ``context["ti"]`` is used to push the ``job`` XCom.
        :param event: payload emitted by the trigger.
        :return: the parsed XCom result(s) when ``do_xcom_push`` is set (a single
            result is unwrapped when ``unwrap_single`` is true); otherwise ``None``.
        :raises AirflowException: with ``event["message"]`` when ``event["status"]``
            is ``"error"``.
        """
        # Resolve monitoring pods up front so the log-retrieval path and the
        # cleanup path in the finally block share the same lookup (no double
        # ``hook.get_pod`` calls).
        pods_by_name: dict[str, k8s.V1Pod] = {}
        event_job = event.get("job")
        job_namespace = (
            event_job.get("metadata", {}).get("namespace") if isinstance(event_job, dict) else None
        )
        # Namespace precedence: explicit pod namespace, then the generic
        # ``namespace`` key, then the namespace recorded on the Job itself.
        pod_namespace = event.get("pod_namespace") or event.get("namespace") or job_namespace
        # Pods whose lookup failed for a reason other than 404; they still get a
        # deletion attempt during cleanup. Pods that returned 404 are neither
        # resolved nor recorded here.
        unresolved_pods: list[tuple[str, str]] = []
        for pod_name in event.get("pod_names") or []:
            if not pod_namespace:
                self.log.warning(
                    "Skipping pod %s lookup because no pod namespace was provided in trigger event.",
                    pod_name,
                )
                continue
            try:
                pod = self.hook.get_pod(pod_name, pod_namespace)
            except ApiException as e:
                if e.status == 404:
                    self.log.warning(
                        "Pod %s in namespace %s not found (possibly deleted).",
                        pod_name,
                        pod_namespace,
                    )
                else:
                    self.log.warning(
                        "Failed to retrieve pod %s in namespace %s: %s. Skipping.",
                        pod_name,
                        pod_namespace,
                        e,
                    )
                    unresolved_pods.append((pod_name, pod_namespace))
                continue
            except Exception as e:
                self.log.warning(
                    "Failed to retrieve pod %s in namespace %s: %s. Skipping.",
                    pod_name,
                    pod_namespace,
                    e,
                )
                unresolved_pods.append((pod_name, pod_namespace))
                continue
            if pod is not None:
                pods_by_name[pod_name] = pod

        try:
            ti = context["ti"]
            # The Job is pushed before the status check, so it is available in
            # XCom even when the task fails below.
            ti.xcom_push(key="job", value=event["job"])
            if event["status"] == "error":
                raise AirflowException(event["message"])

            if self.get_logs:
                for pod_name in event.get("pod_names") or []:
                    if pod_name not in pods_by_name:
                        # Pod was reported by the trigger but missing now (e.g. 404)
                        self.log.warning("Skipping log retrieval for pod %s (not found).", pod_name)
                        continue
                    self._write_logs(pods_by_name[pod_name])

            if self.do_xcom_push:
                xcom_results: list[Any | None] = []
                for xcom_result in event["xcom_result"]:
                    # The empty-result sentinel maps to ``None`` instead of being parsed.
                    if isinstance(xcom_result, str) and xcom_result.rstrip() == EMPTY_XCOM_RESULT:
                        self.log.info("xcom result file is empty.")
                        xcom_results.append(None)
                        continue
                    self.log.info("xcom result: \n%s", xcom_result)
                    xcom_results.append(json.loads(xcom_result))
                return xcom_results[0] if self.unwrap_single and len(xcom_results) == 1 else xcom_results
        finally:
            # Always clean up, whether the body returned or raised.
            self._cleanup_monitoring_pods_from_dict(
                context, pods_by_name, unresolved_pods=unresolved_pods, event_status=event.get("status")
            )


    @staticmethod

[docs]
    def deserialize_job_template_file(path: str) -> k8s.V1Job:
        """
        Build a ``V1Job`` from a YAML template file.

        This relies on the private ``_ApiClient__deserialize_model`` method of the
        kubernetes client because no public equivalent is available; see
        https://github.com/kubernetes-client/python/issues/977.

        If ``path`` does not exist, a warning is logged and ``None`` is handed to
        the deserializer instead of the parsed file content.

        :param path: Path to the file
        :return: a kubernetes.client.models.V1Job
        """
        job_dict = None
        if os.path.exists(path):
            with open(path) as template_stream:
                job_dict = yaml.safe_load(template_stream)
        else:
            log.warning("Template file %s does not exist", path)

        deserializer = ApiClient(configuration=Configuration())
        return deserializer._ApiClient__deserialize_model(job_dict, k8s.V1Job)



[docs]
    def on_kill(self) -> None:
        """
        Delete the created Job and, unless told to keep them, its monitoring pods.

        The Job is deleted with ``on_kill_propagation_policy`` and, when set,
        ``termination_grace_period``. Pod deletion is skipped entirely when
        ``on_kill_action`` is ``OnKillAction.KEEP_POD``; otherwise each pod in
        ``self.pods`` is deleted and ``ApiException`` errors are logged rather
        than raised.
        """
        self._killed = True

        job = self.job
        if job:
            delete_kwargs = {
                "name": job.metadata.name,
                "namespace": job.metadata.namespace,
                "propagation_policy": self.on_kill_propagation_policy,
            }
            grace_period = self.termination_grace_period
            if grace_period is not None:
                delete_kwargs["grace_period_seconds"] = grace_period
            self.job_client.delete_namespaced_job(**delete_kwargs)

        if self.on_kill_action == OnKillAction.KEEP_POD:
            self.log.info(
                "Skipping monitoring pod deletion since on_kill_action is set to %r.",
                self.on_kill_action.value,
            )
            return

        # Monitoring pods discovered via get_pods() have no ownerReferences and
        # are not reaped by the Job's foreground cascade. Delete them directly.
        # ``self.pods`` only exists once execute() has discovered pods.
        monitoring_pods = getattr(self, "pods", None) or []
        for monitoring_pod in monitoring_pods:
            try:
                self.pod_manager.delete_pod(monitoring_pod)
            except ApiException:
                self.log.exception(
                    "Unable to delete monitoring pod %s",
                    getattr(monitoring_pod.metadata, "name", "<unknown>"),
                )


    def _cleanup_monitoring_pods(self, context: Context) -> None:
        """
        Apply ``post_complete_action`` to every monitoring pod in ``self.pods``.

        This is a best-effort side effect intended to be called from a
        ``finally`` block: a failure while refreshing or cleaning up one pod is
        logged as a warning and never replaces the exception that is already
        propagating (for instance the ``AirflowException`` raised for a failed
        Job). ``on_finish_action`` handling comes from the inherited
        ``post_complete_action``.
        """
        # When execute() is being left via TaskDeferred the trigger still needs
        # the monitoring pods, so nothing is cleaned up here; execute_complete()
        # takes care of it on resume.
        if isinstance(sys.exc_info()[1], TaskDeferred):
            return

        monitoring_pods = getattr(self, "pods", None) or []
        for monitoring_pod in monitoring_pods:
            # Prefer a freshly fetched copy of the pod; fall back to the object
            # we already hold if it cannot be identified or fetched.
            latest_pod = monitoring_pod
            try:
                name = getattr(monitoring_pod.metadata, "name", None)
                namespace = getattr(monitoring_pod.metadata, "namespace", None)
                if name and namespace:
                    fetched = self.hook.get_pod(name=name, namespace=namespace)
                    latest_pod = fetched or monitoring_pod
            except Exception:
                latest_pod = monitoring_pod

            try:
                self.post_complete_action(
                    pod=monitoring_pod,
                    remote_pod=latest_pod,
                    context=context,
                    result=None,
                )
            except Exception:
                # cleanup() can raise AirflowException for failed pods, and the
                # k8s client can raise transport errors. For the Job operator we
                # prefer the Job-level failure (or the original exception) to
                # propagate instead of any per-pod cleanup error.
                self.log.warning(
                    "Error while cleaning up monitoring pod %s",
                    getattr(monitoring_pod.metadata, "name", "<unknown>"),
                    exc_info=True,
                )

    def _cleanup_monitoring_pods_from_dict(
        self,
        context: Context,
        pods_by_name: dict[str, k8s.V1Pod],
        *,
        unresolved_pods: list[tuple[str, str]] | None = None,
        event_status: str | None = None,
    ) -> None:
        """
        Clean up the monitoring pods reported by the trigger event.

        Pods in ``pods_by_name`` go through ``post_complete_action``; errors are
        logged as warnings and never mask an in-flight exception. For every
        ``(name, namespace)`` pair in ``unresolved_pods`` a minimal placeholder
        pod is built and passed to ``process_pod_deletion`` with ``reraise=False``.

        :param context: task context forwarded to ``post_complete_action``.
        :param pods_by_name: pods that were successfully looked up, keyed by name.
        :param unresolved_pods: pods that could not be looked up.
        :param event_status: trigger status; ``"success"`` and ``"error"`` are
            mapped to the placeholder phases ``"Succeeded"`` and ``"Failed"``,
            anything else to ``None``.
        """
        for name, resolved_pod in pods_by_name.items():
            try:
                self.post_complete_action(
                    pod=resolved_pod, remote_pod=resolved_pod, context=context, result=None
                )
            except Exception:
                self.log.warning(
                    "Error while cleaning up monitoring pod %s",
                    name,
                    exc_info=True,
                )

        # Phase assigned to the placeholder pods built below.
        if event_status == "success":
            placeholder_phase = "Succeeded"
        elif event_status == "error":
            placeholder_phase = "Failed"
        else:
            placeholder_phase = None

        for name, namespace in unresolved_pods or []:
            placeholder_meta = k8s.V1ObjectMeta(name=name, namespace=namespace)
            placeholder_status = k8s.V1PodStatus(phase=placeholder_phase)
            placeholder_pod = k8s.V1Pod(metadata=placeholder_meta, status=placeholder_status)
            self.process_pod_deletion(placeholder_pod, reraise=False)


[docs]
    def build_job_request_obj(self, context: Context | None = None) -> k8s.V1Job:
        """
        Return V1Job object based on job template file, full job spec, and other operator parameters.

        The V1Job attributes are derived (in order of precedence) from operator params, full job spec, job
        template file.

        As a side effect the pod request built by the parent operator is stored on
        ``self.pod_request_obj``.

        :param context: task context, forwarded to the parent's ``build_pod_request_obj``.
        :return: the reconciled Job, with a ``job-`` prefixed name and a namespace set.
        """
        self.log.debug("Creating job for KubernetesJobOperator task %s", self.task_id)
        # Pick the base template: file (optionally overlaid with the full spec),
        # else the full spec alone, else an empty Job.
        if self.job_template_file:
            self.log.debug("Job template file found, will parse for base job")
            job_template = self.deserialize_job_template_file(self.job_template_file)
            if self.full_job_spec:
                job_template = self.reconcile_jobs(job_template, self.full_job_spec)
        elif self.full_job_spec:
            job_template = self.full_job_spec
        else:
            job_template = k8s.V1Job(metadata=k8s.V1ObjectMeta())

        # The pod definition comes from the parent operator; only its metadata
        # and spec are embedded in the Job's pod template.
        pod_template = super().build_pod_request_obj(context)
        pod_template_spec = k8s.V1PodTemplateSpec(
            metadata=pod_template.metadata,
            spec=pod_template.spec,
        )
        # Kept for execute(), which passes it to get_pods().
        self.pod_request_obj = pod_template

        # Job assembled purely from operator parameters.
        job = k8s.V1Job(
            api_version="batch/v1",
            kind="Job",
            metadata=k8s.V1ObjectMeta(
                namespace=self.namespace,
                labels=self.labels,
                name=self.name,
                annotations=self.annotations,
            ),
            spec=k8s.V1JobSpec(
                active_deadline_seconds=self.active_deadline_seconds,
                backoff_limit=self.backoff_limit,
                completion_mode=self.completion_mode,
                completions=self.completions,
                manual_selector=self.manual_selector,
                parallelism=self.parallelism,
                selector=self.selector,
                suspend=self.suspend,
                template=pod_template_spec,
                ttl_seconds_after_finished=self.ttl_seconds_after_finished,
            ),
        )

        # The template is the base; the operator-built Job is the client side
        # whose values take precedence.
        job = self.reconcile_jobs(job_template, job)

        # Account for job name prefix when generating/truncating the name
        max_base_length = POD_NAME_MAX_LENGTH - len(JOB_NAME_PREFIX)

        if not job.metadata.name:
            job.metadata.name = create_unique_id(
                task_id=self.task_id, unique=self.random_name_suffix, max_length=max_base_length
            )
        elif self.random_name_suffix:
            # user has supplied job name, we're just adding suffix
            job.metadata.name = add_unique_suffix(name=job.metadata.name, max_len=max_base_length)

        job.metadata.name = f"{JOB_NAME_PREFIX}{job.metadata.name}"

        # Namespace fallback chain: operator argument, hook, in-cluster service
        # account file, then "default".
        if not job.metadata.namespace:
            hook_namespace = self.hook.get_namespace()
            job_namespace = self.namespace or hook_namespace or self._incluster_namespace or "default"
            job.metadata.namespace = job_namespace

        self.log.info("Building job %s ", job.metadata.name)

        return job


    @staticmethod

[docs]
    def reconcile_jobs(base_job: k8s.V1Job, client_job: k8s.V1Job | None) -> k8s.V1Job:
        """
        Merge two Kubernetes Job objects.

        The merge is not a plain recursive one because some fields are
        overwritten while others are concatenated; spec and metadata are
        therefore reconciled by dedicated helpers first.

        :param base_job: supplies the defaults; its attributes are kept unless the
            client job provides its own value.
        :param client_job: the job the client wants to create; when ``None`` the
            base job is returned unchanged.
        :return: the merged job
        """
        if client_job is None:
            return base_job

        # Work on a deep copy so the caller's ``client_job`` is left untouched.
        merged_job = copy.deepcopy(client_job)
        merged_job.spec = KubernetesJobOperator.reconcile_job_specs(base_job.spec, merged_job.spec)
        merged_job.metadata = PodGenerator.reconcile_metadata(base_job.metadata, merged_job.metadata)
        return merge_objects(base_job, merged_job)


    @staticmethod

[docs]
    def reconcile_job_specs(
        base_spec: k8s.V1JobSpec | None, client_spec: k8s.V1JobSpec | None
    ) -> k8s.V1JobSpec | None:
        """
        Merge two Kubernetes JobSpec objects.

        When both specs are present, the pod template's spec and metadata on
        ``client_spec`` are reconciled in place before the specs are merged.

        :param base_spec: supplies the defaults; its attributes are kept unless
            the client spec provides its own value.
        :param client_spec: the spec the client wants to create.
        :return: the merged spec, the only spec that was given, or ``None`` when
            neither was given.
        """
        if base_spec and client_spec:
            base_template = base_spec.template
            client_template = client_spec.template
            client_template.spec = PodGenerator.reconcile_specs(base_template.spec, client_template.spec)
            client_template.metadata = PodGenerator.reconcile_metadata(
                base_template.metadata, client_template.metadata
            )
            return merge_objects(base_spec, client_spec)

        # At most one of the two specs is usable from here on.
        if base_spec:
            return base_spec
        return client_spec or None



[docs]
    def get_pods(
        self, pod_request_obj: k8s.V1Pod, context: Context, *, exclude_checked: bool = True
    ) -> Sequence[k8s.V1Pod]:
        """
        Return the pods that match this task's label selector.

        Pods are listed in the namespace of ``pod_request_obj``. The listing is
        repeated, without any pause, until the number of pods found equals
        ``parallelism`` or ``discover_pods_retry_number + 1`` calls have been made.

        :param pod_request_obj: only its ``metadata.namespace`` is used.
        :param context: task context used to build the label selector and for logging.
        :param exclude_checked: forwarded to ``_build_find_pod_label_selector``.
        :return: the pods returned by the last listing.
        :raises AirflowException: if no pod was found.
        """
        label_selector = self._build_find_pod_label_selector(context, exclude_checked=exclude_checked)
        namespace = pod_request_obj.metadata.namespace

        found_pods: Sequence[k8s.V1Pod] = []
        attempts: int = 0
        while attempts <= self.discover_pods_retry_number and len(found_pods) != self.parallelism:
            listing = self.client.list_namespaced_pod(
                namespace=namespace,
                label_selector=label_selector,
            )
            found_pods = listing.items
            attempts += 1

        if len(found_pods) == 0:
            raise AirflowException(f"No pods running with labels {label_selector}")

        for found_pod in found_pods:
            self.log_matching_pod(pod=found_pod, context=context)

        return found_pods





[docs]
class KubernetesDeleteJobOperator(BaseOperator):
    """
    Delete a Kubernetes Job.

    .. seealso::
        For more information on how to use this operator, take a look at the guide:
        :ref:`howto/operator:KubernetesDeleteJobOperator`

    :param name: name of the Job.
    :param namespace: the namespace to run within kubernetes.
    :param kubernetes_conn_id: The :ref:`kubernetes connection id <howto/connection:kubernetes>`
        for the Kubernetes cluster.
    :param config_file: The path to the Kubernetes config file. (templated)
        If not specified, default value is ``~/.kube/config``
    :param in_cluster: run kubernetes client with in_cluster configuration.
    :param cluster_context: context that points to kubernetes cluster.
        Ignored when in_cluster is True. If None, current-context is used. (templated)
    :param delete_on_status: Condition for performing delete operation depending on the job status. Values:
        ``None`` - delete the job regardless of its status, "Complete" - delete only successfully completed
        jobs, "Failed" - delete only failed jobs. (default: ``None``)
    :param wait_for_completion: Whether to wait for the job to complete. (default: ``False``)
    :param poll_interval: Interval in seconds between polling the job status. Used when the `delete_on_status`
        parameter is set. (default: 10.0)
    """


[docs]
    template_fields: Sequence[str] = (
        "config_file",
        "name",
        "namespace",
        "cluster_context",
    )


    def __init__(
        self,
        *,
        name: str,
        namespace: str,
        kubernetes_conn_id: str | None = KubernetesHook.default_conn_name,
        config_file: str | None = None,
        in_cluster: bool | None = None,
        cluster_context: str | None = None,
        delete_on_status: str | None = None,
        wait_for_completion: bool = False,
        poll_interval: float = 10.0,
        **kwargs,
    ) -> None:
        """
        Store the settings of the Job to delete; remaining kwargs go to ``BaseOperator``.

        All parameters are keyword-only and are described in the class docstring.
        ``delete_on_status`` is validated in ``execute``, not here.
        """
        super().__init__(**kwargs)

        # Identity of the Job to delete.
        self.name = name
        self.namespace = namespace

        # Connection settings handed to ``KubernetesHook``.
        self.kubernetes_conn_id = kubernetes_conn_id
        self.config_file = config_file
        self.in_cluster = in_cluster
        self.cluster_context = cluster_context

        # Deletion behaviour.
        self.delete_on_status = delete_on_status
        self.wait_for_completion = wait_for_completion
        self.poll_interval = poll_interval


    @cached_property

[docs]
    def hook(self) -> KubernetesHook:
        """Build a ``KubernetesHook`` from this operator's connection settings."""
        kubernetes_hook = KubernetesHook(
            conn_id=self.kubernetes_conn_id,
            in_cluster=self.in_cluster,
            config_file=self.config_file,
            cluster_context=self.cluster_context,
        )
        return kubernetes_hook


    @cached_property

[docs]
    def client(self) -> BatchV1Api:
        """Return the hook's ``batch_v1_client``, used by ``execute`` to delete the Job."""
        return self.hook.batch_v1_client



[docs]
    def execute(self, context: Context):
        """
        Delete the Job, optionally waiting for it to finish and filtering on its status.

        The Job is fetched (or waited for when ``wait_for_completion`` is set) and
        then deleted if ``delete_on_status`` is ``None``, or if it is
        ``"Complete"`` / ``"Failed"`` and the hook reports the Job as successful /
        failed respectively. Otherwise deletion is skipped and logged. A 404 from
        the Kubernetes API is logged and treated as "nothing to delete".

        :param context: task context (unused).
        :raises AirflowException: if ``delete_on_status`` is not one of
            ``"Complete"``, ``"Failed"`` or ``None``.
        :raises ApiException: for any Kubernetes API error other than 404.
        """
        try:
            if self.delete_on_status not in ("Complete", "Failed", None):
                # Interpolate the value into the message. Passing it as a second
                # positional argument would leave a literal "%s" in the text,
                # because exceptions do not apply %-formatting to their args.
                raise AirflowException(
                    "The `delete_on_status` parameter must be one of 'Complete', 'Failed' or None. "
                    f"The current value is {self.delete_on_status!s}"
                )

            if self.wait_for_completion:
                job = self.hook.wait_until_job_complete(
                    job_name=self.name, namespace=self.namespace, job_poll_interval=self.poll_interval
                )
            else:
                job = self.hook.get_job_status(job_name=self.name, namespace=self.namespace)

            if (
                self.delete_on_status is None
                or (self.delete_on_status == "Complete" and self.hook.is_job_successful(job=job))
                or (self.delete_on_status == "Failed" and self.hook.is_job_failed(job=job))
            ):
                self.log.info("Deleting kubernetes Job: %s", self.name)
                self.client.delete_namespaced_job(name=self.name, namespace=self.namespace)
                self.log.info("Kubernetes job was deleted.")
            else:
                self.log.info(
                    "Deletion of the job %s was skipped due to settings of on_status=%s",
                    self.name,
                    self.delete_on_status,
                )
        except ApiException as e:
            if e.status != 404:
                # Re-raise the active exception as-is.
                raise
            self.log.info("The Kubernetes job %s does not exist.", self.name)





[docs]
class KubernetesPatchJobOperator(BaseOperator):
    """
    Update a Kubernetes Job.

    .. seealso::
        For more information on how to use this operator, take a look at the guide:
        :ref:`howto/operator:KubernetesPatchJobOperator`

    :param name: name of the Job
    :param namespace: the namespace to run within kubernetes
    :param body: Job json object with parameters for update
        https://kubernetes.io/docs/reference/generated/kubernetes-api/v1.25/#job-v1-batch
        e.g. ``{"spec": {"suspend": True}}``
    :param kubernetes_conn_id: The :ref:`kubernetes connection id <howto/connection:kubernetes>`
        for the Kubernetes cluster.
    :param config_file: The path to the Kubernetes config file. (templated)
        If not specified, default value is ``~/.kube/config``
    :param in_cluster: run kubernetes client with in_cluster configuration.
    :param cluster_context: context that points to kubernetes cluster.
        Ignored when in_cluster is True. If None, current-context is used. (templated)
    """


[docs]
    template_fields: Sequence[str] = (
        "config_file",
        "name",
        "namespace",
        "body",
        "cluster_context",
    )


    def __init__(
        self,
        *,
        name: str,
        namespace: str,
        body: object,
        kubernetes_conn_id: str | None = KubernetesHook.default_conn_name,
        config_file: str | None = None,
        in_cluster: bool | None = None,
        cluster_context: str | None = None,
        **kwargs,
    ) -> None:
        """
        Store the settings of the Job to patch; remaining kwargs go to ``BaseOperator``.

        All parameters are keyword-only and are described in the class docstring.
        """
        super().__init__(**kwargs)

        # Identity of the Job to patch and the patch payload.
        self.name = name
        self.namespace = namespace
        self.body = body

        # Connection settings handed to ``KubernetesHook``.
        self.kubernetes_conn_id = kubernetes_conn_id
        self.config_file = config_file
        self.in_cluster = in_cluster
        self.cluster_context = cluster_context


    @cached_property

[docs]
    def hook(self) -> KubernetesHook:
        """Build a ``KubernetesHook`` from this operator's connection settings."""
        kubernetes_hook = KubernetesHook(
            conn_id=self.kubernetes_conn_id,
            in_cluster=self.in_cluster,
            config_file=self.config_file,
            cluster_context=self.cluster_context,
        )
        return kubernetes_hook



[docs]
    def execute(self, context: Context) -> dict:
        """
        Patch the named Job with ``self.body`` through the hook.

        :param context: task context (unused).
        :return: the object returned by the hook, converted with ``V1Job.to_dict``.
        """
        self.log.info("Updating existing Job: %s", self.name)
        patched_job = self.hook.patch_namespaced_job(
            job_name=self.name,
            namespace=self.namespace,
            body=self.body,
        )
        self.log.info("Job was updated.")
        return k8s.V1Job.to_dict(patched_job)