Source code for airflow.providers.airbyte.operators.airbyte
## Licensed to the Apache Software Foundation (ASF) under one# or more contributor license agreements. See the NOTICE file# distributed with this work for additional information# regarding copyright ownership. The ASF licenses this file# to you under the Apache License, Version 2.0 (the# "License"); you may not use this file except in compliance# with the License. You may obtain a copy of the License at## http://www.apache.org/licenses/LICENSE-2.0## Unless required by applicable law or agreed to in writing,# software distributed under the License is distributed on an# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY# KIND, either express or implied. See the License for the# specific language governing permissions and limitations# under the License.from__future__importannotationsimporttimefromcollections.abcimportSequencefromtypingimportTYPE_CHECKING,Anyfromairbyte_api.modelsimportJobStatusEnumfromairflow.configurationimportconffromairflow.exceptionsimportAirflowExceptionfromairflow.modelsimportBaseOperatorfromairflow.providers.airbyte.hooks.airbyteimportAirbyteHookfromairflow.providers.airbyte.triggers.airbyteimportAirbyteSyncTriggerifTYPE_CHECKING:fromairflow.utils.contextimportContext
class AirbyteTriggerSyncOperator(BaseOperator):
    """
    Submit a job to an Airbyte server to run an integration process between your source and destination.

    .. seealso::
        For more information on how to use this operator, take a look at the guide:
        :ref:`howto/operator:AirbyteTriggerSyncOperator`

    :param airbyte_conn_id: Optional. The name of the Airflow connection to get connection
        information for Airbyte. Defaults to "airbyte_default".
    :param connection_id: Required. The Airbyte ConnectionId UUID between a source and destination.
    :param asynchronous: Optional. Flag to get job_id after submitting the job to the Airbyte API.
        This is useful for submitting long running jobs and waiting on them asynchronously using the
        AirbyteJobSensor. Defaults to False.
    :param deferrable: Run operator in the deferrable mode. In this mode the trigger is created with
        a fixed poll interval of 60 seconds.
    :param api_version: Optional. Airbyte API version. Defaults to "v1".
    :param wait_seconds: Optional. Number of seconds between checks. Only used when ``asynchronous``
        and ``deferrable`` are both False. Defaults to 3 seconds.
    :param timeout: Optional. The amount of time, in seconds, to wait for the request to complete.
        Only used when ``asynchronous`` is False. Defaults to 3600 seconds (or 1 hour).
    """

    def execute(self, context: Context) -> Any:
        """
        Create an Airbyte job and, unless running asynchronously, wait for it to finish.

        :param context: Airflow task context; not read by this method.
        :return: The Airbyte job id in asynchronous mode and after a blocking wait; ``None`` when
            deferrable mode finds the job already succeeded right after submission.
        :raises AirflowException: In deferrable mode, when the freshly submitted job is already
            failed, cancelled, or in a state this operator does not recognise.
        """
        hook = AirbyteHook(airbyte_conn_id=self.airbyte_conn_id, api_version=self.api_version)
        job_object = hook.submit_sync_connection(connection_id=self.connection_id)
        # Stored on the instance so that on_kill can cancel the job later.
        self.job_id = job_object.job_id
        state = job_object.status
        # Absolute deadline handed to the trigger in deferrable mode.
        end_time = time.time() + self.timeout

        self.log.info("Job %s was submitted to Airbyte Server", self.job_id)

        if self.asynchronous:
            self.log.info("Async Task returning job_id %s", self.job_id)
            return self.job_id

        if not self.deferrable:
            # Blocking mode: the hook polls until the job finishes or the timeout elapses.
            hook.wait_for_job(job_id=self.job_id, wait_seconds=self.wait_seconds, timeout=self.timeout)
        elif state in (JobStatusEnum.RUNNING, JobStatusEnum.PENDING, JobStatusEnum.INCOMPLETE):
            # NOTE(review): presumably defer() raises to suspend the task, so the final
            # return below is not reached on this path -- confirm against BaseOperator.
            self.defer(
                timeout=self.execution_timeout,
                trigger=AirbyteSyncTrigger(
                    conn_id=self.airbyte_conn_id,
                    job_id=self.job_id,
                    end_time=end_time,
                    poll_interval=60,
                ),
                method_name="execute_complete",
            )
        elif state == JobStatusEnum.SUCCEEDED:
            self.log.info("Job %s completed successfully", self.job_id)
            # NOTE(review): returns None here while the blocking path returns the job id;
            # kept as-is to preserve behaviour -- confirm whether this is intended.
            return None
        elif state == JobStatusEnum.FAILED:
            raise AirflowException(f"Job failed:\n{self.job_id}")
        elif state == JobStatusEnum.CANCELLED:
            raise AirflowException(f"Job was cancelled:\n{self.job_id}")
        else:
            raise AirflowException(
                f"Encountered unexpected state `{state}` for job_id `{self.job_id}`"
            )

        return self.job_id

    def execute_complete(self, context: Context, event: Any = None) -> None:
        """
        Invoke this callback when the trigger fires; return immediately.

        Relies on trigger to throw an exception, otherwise it assumes execution was successful.

        :param context: Airflow task context; not read by this method.
        :param event: Payload from the trigger. It is subscripted with ``"status"`` and, on error,
            ``"message"``, so a mapping with those keys is expected.
        :raises AirflowException: When ``event["status"]`` equals ``"error"``.
        """
        if event["status"] == "error":
            raise AirflowException(event["message"])

        self.log.info("%s completed successfully.", self.task_id)
        return None

    def on_kill(self):
        """
        Cancel the job if task is cancelled.

        Does nothing when no job id has been recorded yet, e.g. when the task is killed
        before ``execute`` managed to submit the job.
        """
        # getattr guards against on_kill running before execute() assigned job_id.
        job_id = getattr(self, "job_id", None)
        if not job_id:
            return

        # Only build the hook once we know there is something to cancel.
        hook = AirbyteHook(airbyte_conn_id=self.airbyte_conn_id, api_version=self.api_version)
        self.log.info("on_kill: cancel the airbyte Job %s", job_id)
        hook.cancel_job(job_id)