# Source code for tests.system.google.cloud.dataproc.example_dataproc_batch_persistent
# Licensed to the Apache Software Foundation (ASF) under one
# or more contributor license agreements.  See the NOTICE file
# distributed with this work for additional information
# regarding copyright ownership.  The ASF licenses this file
# to you under the Apache License, Version 2.0 (the
# "License"); you may not use this file except in compliance
# with the License.  You may obtain a copy of the License at
#
#   http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing,
# software distributed under the License is distributed on an
# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
# KIND, either express or implied.  See the License for the
# specific language governing permissions and limitations
# under the License.
"""Example Airflow DAG for Dataproc batch operators."""

from __future__ import annotations

import os
from datetime import datetime

from google.api_core.retry import Retry

from airflow.models.dag import DAG
from airflow.providers.google.cloud.operators.dataproc import (
    ClusterGenerator,
    DataprocCreateBatchOperator,
    DataprocCreateClusterOperator,
    DataprocDeleteBatchOperator,
    DataprocDeleteClusterOperator,
)
from airflow.providers.google.cloud.operators.gcs import GCSCreateBucketOperator, GCSDeleteBucketOperator
from airflow.utils.trigger_rule import TriggerRule

from providers.tests.system.google import DEFAULT_GCP_SYSTEM_TEST_PROJECT_ID
# NOTE(review): `dag`, `create_bucket` and the UPPER_CASE constants referenced below
# are not defined in this excerpt. Presumably these statements belong inside a
# `with DAG(...) as dag:` block -- confirm and re-indent accordingly when merging.

# [START how_to_cloud_dataproc_create_cluster_for_persistent_history_server]
create_cluster = DataprocCreateClusterOperator(
    task_id="create_cluster_for_phs",
    project_id=PROJECT_ID,
    cluster_config=CLUSTER_GENERATOR_CONFIG_FOR_PHS,
    region=REGION,
    cluster_name=CLUSTER_NAME,
    retry=Retry(maximum=100.0, initial=10.0, multiplier=1.0),
    num_retries_if_resource_is_not_ready=3,
)
# [END how_to_cloud_dataproc_create_cluster_for_persistent_history_server]

# [START how_to_cloud_dataproc_create_batch_operator_with_persistent_history_server]
create_batch = DataprocCreateBatchOperator(
    task_id="create_batch_with_phs",
    project_id=PROJECT_ID,
    region=REGION,
    batch=BATCH_CONFIG_WITH_PHS,
    batch_id=BATCH_ID,
    result_retry=Retry(maximum=100.0, initial=10.0, multiplier=1.0),
    num_retries_if_resource_is_not_ready=3,
)
# [END how_to_cloud_dataproc_create_batch_operator_with_persistent_history_server]

# Teardown tasks use TriggerRule.ALL_DONE so they run once upstream tasks have
# finished, whether those tasks succeeded or failed.
delete_batch = DataprocDeleteBatchOperator(
    task_id="delete_batch",
    project_id=PROJECT_ID,
    region=REGION,
    batch_id=BATCH_ID,
    trigger_rule=TriggerRule.ALL_DONE,
)

delete_cluster = DataprocDeleteClusterOperator(
    task_id="delete_cluster",
    project_id=PROJECT_ID,
    cluster_name=CLUSTER_NAME,
    region=REGION,
    trigger_rule=TriggerRule.ALL_DONE,
)

delete_bucket = GCSDeleteBucketOperator(
    task_id="delete_bucket", bucket_name=BUCKET_NAME, trigger_rule=TriggerRule.ALL_DONE
)

(
    # TEST SETUP
    create_bucket
    >> create_cluster
    # TEST BODY
    >> create_batch
    # TEST TEARDOWN
    >> delete_batch
    >> delete_cluster
    >> delete_bucket
)

from tests_common.test_utils.watcher import watcher

# This test needs watcher in order to properly mark success/failure
# when "teardown" task with trigger rule is part of the DAG
list(dag.tasks) >> watcher()

from tests_common.test_utils.system_tests import get_test_run  # noqa: E402

# Needed to run the example DAG with pytest (see: tests/system/README.md#run_via_pytest)