Source code for tests.system.google.cloud.dataflow.example_dataflow_native_python
#
# Licensed to the Apache Software Foundation (ASF) under one
# or more contributor license agreements. See the NOTICE file
# distributed with this work for additional information
# regarding copyright ownership. The ASF licenses this file
# to you under the Apache License, Version 2.0 (the
# "License"); you may not use this file except in compliance
# with the License. You may obtain a copy of the License at
#
#   http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing,
# software distributed under the License is distributed on an
# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
# KIND, either express or implied. See the License for the
# specific language governing permissions and limitations
# under the License.
"""Example Airflow DAG for testing Google Dataflow Beam Pipeline Operator with Python."""

from __future__ import annotations

import os
from datetime import datetime

from airflow.models.dag import DAG
from airflow.providers.apache.beam.hooks.beam import BeamRunnerType
from airflow.providers.apache.beam.operators.beam import BeamRunPythonPipelineOperator
from airflow.providers.google.cloud.operators.dataflow import DataflowStopJobOperator
from airflow.providers.google.cloud.operators.gcs import GCSCreateBucketOperator, GCSDeleteBucketOperator
from airflow.utils.trigger_rule import TriggerRule
# NOTE(review): this excerpt does not show where GCS_PYTHON_SCRIPT, GCS_OUTPUT,
# LOCATION, BUCKET_NAME, create_bucket and dag are defined. The task definitions
# below presumably belong inside the DAG's context-manager body -- confirm against
# the full file and re-indent accordingly.

# Task that submits the Python pipeline file with the Dataflow runner.
# [START howto_operator_start_python_job]
start_python_job = BeamRunPythonPipelineOperator(
    runner=BeamRunnerType.DataflowRunner,
    task_id="start_python_job",
    py_file=GCS_PYTHON_SCRIPT,
    py_options=[],
    pipeline_options={
        "output": GCS_OUTPUT,
    },
    py_requirements=["apache-beam[gcp]==2.59.0"],
    py_interpreter="python3",
    py_system_site_packages=False,
    dataflow_config={"location": LOCATION, "job_name": "start_python_job"},
)
# [END howto_operator_start_python_job]

# Same pipeline options, but the target is given as a module name together with
# the "-m" interpreter option, and no runner or dataflow_config is passed, so the
# operator falls back to its default runner.
start_python_job_local = BeamRunPythonPipelineOperator(
    task_id="start_python_job_local",
    py_file="apache_beam.examples.wordcount",
    py_options=["-m"],
    pipeline_options={
        "output": GCS_OUTPUT,
    },
    py_requirements=["apache-beam[gcp]==2.59.0"],
    py_interpreter="python3",
    py_system_site_packages=False,
)

# NOTE(review): the prefix "start-python-pipeline" below does not obviously match
# the job_name "start_python_job" configured on start_python_job -- confirm which
# Dataflow jobs this task is expected to stop.
# [START howto_operator_stop_dataflow_job]
stop_dataflow_job = DataflowStopJobOperator(
    task_id="stop_dataflow_job",
    location=LOCATION,
    job_name_prefix="start-python-pipeline",
)
# [END howto_operator_stop_dataflow_job]

# Teardown task: TriggerRule.ALL_DONE is set so it is not skipped when an
# upstream task fails.
delete_bucket = GCSDeleteBucketOperator(
    task_id="delete_bucket", bucket_name=BUCKET_NAME, trigger_rule=TriggerRule.ALL_DONE
)

(
    # TEST SETUP
    create_bucket
    # TEST BODY
    >> start_python_job
    >> start_python_job_local
    >> stop_dataflow_job
    # TEST TEARDOWN
    >> delete_bucket
)

from tests_common.test_utils.watcher import watcher

# This test needs watcher in order to properly mark success/failure
# when "teardown" task with trigger rule is part of the DAG
list(dag.tasks) >> watcher()

from tests_common.test_utils.system_tests import get_test_run  # noqa: E402

# Needed to run the example DAG with pytest (see: tests/system/README.md#run_via_pytest)