Source code for
# Licensed to the Apache Software Foundation (ASF) under one
# or more contributor license agreements.  See the NOTICE file
# distributed with this work for additional information
# regarding copyright ownership.  The ASF licenses this file
# to you under the Apache License, Version 2.0 (the
# "License"); you may not use this file except in compliance
# with the License.  You may obtain a copy of the License at
#
#   http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing,
# software distributed under the License is distributed on an
# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
# KIND, either express or implied.  See the License for the
# specific language governing permissions and limitations
# under the License.
# NOTE(review): the import lines that followed the header were truncated during
# extraction; only the tail ", BaseAwsLink" of one import survived -- restore
# the missing imports from the upstream file.
from airflow.utils.helpers import exactly_one
class EmrClusterLink(BaseAwsLink):
    """Link helper, built on ``BaseAwsLink``, for constructing the AWS EMR Cluster link."""
def get_log_uri(
    *,
    cluster: dict[str, Any] | None = None,
    emr_client: boto3.client = None,
    job_flow_id: str | None = None,
) -> str | None:
    """
    Retrieve the S3 URI of the EMR job logs.

    Exactly one source of cluster information must be supplied: either the
    output of a ``describe_cluster`` call, or both an EMR client and a
    ``job_flow_id`` (in which case ``describe_cluster`` is called here).

    :param cluster: Output of a ``describe_cluster`` call; its ``"Cluster"``
        entry is inspected.
    :param emr_client: EMR client used to call ``describe_cluster`` when
        ``cluster`` is not given.
    :param job_flow_id: Passed as ``ClusterId`` to ``describe_cluster`` when
        ``cluster`` is not given.
    :return: The parts returned by ``S3Hook.parse_s3_url`` for the cluster's
        ``LogUri`` joined with ``"/"``, or ``None`` when the cluster
        description has no ``LogUri`` key.
    :raises AirflowException: If neither or both sources of cluster
        information are provided.
    """
    has_description = bool(cluster)
    can_describe = emr_client and job_flow_id
    if not exactly_one(has_description, can_describe):
        raise AirflowException(
            "Requires either the output of a describe_cluster call or both an EMR Client and a job_flow_id."
        )

    # Prefer the caller-supplied description; only hit the API when it is absent.
    description = cluster if cluster else emr_client.describe_cluster(ClusterId=job_flow_id)
    details = description["Cluster"]

    if "LogUri" in details:
        return "/".join(S3Hook.parse_s3_url(details["LogUri"]))
    return None