Source code for airflow.providers.google.cloud.fs.gcs

# Licensed to the Apache Software Foundation (ASF) under one
# or more contributor license agreements.  See the NOTICE file
# distributed with this work for additional information
# regarding copyright ownership.  The ASF licenses this file
# to you under the Apache License, Version 2.0 (the
# "License"); you may not use this file except in compliance
# with the License.  You may obtain a copy of the License at
#
#   http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing,
# software distributed under the License is distributed on an
# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
# KIND, either express or implied.  See the License for the
# specific language governing permissions and limitations
# under the License.
from __future__ import annotations

from typing import TYPE_CHECKING

from airflow.providers.google.common.hooks.base_google import GoogleBaseHook

if TYPE_CHECKING:
    from fsspec import AbstractFileSystem

# Keys under which GCS filesystem options are stored. ``get_fs`` in this module
# reads several of them from the Google hook's ``extras`` mapping.
GCS_TOKEN = "gcs.oauth2.token"
GCS_TOKEN_EXPIRES_AT_MS = "gcs.oauth2.token-expires-at"
GCS_PROJECT_ID = "gcs.project-id"
GCS_ACCESS = "gcs.access"
GCS_CONSISTENCY = "gcs.consistency"
GCS_CACHE_TIMEOUT = "gcs.cache-timeout"
GCS_REQUESTER_PAYS = "gcs.requester-pays"
GCS_SESSION_KWARGS = "gcs.session-kwargs"
GCS_ENDPOINT = "gcs.endpoint"
GCS_DEFAULT_LOCATION = "gcs.default-bucket-location"
GCS_VERSION_AWARE = "gcs.version-aware"

# Presumably the URL schemes this filesystem is registered for -- confirm
# against the code that consumes ``schemes``.
schemes = ["gs", "gcs"]
def get_fs(conn_id: str | None) -> AbstractFileSystem:
    """
    Build a ``GCSFileSystem`` for the given Airflow connection.

    When ``conn_id`` is ``None`` the filesystem is constructed with no
    arguments. Otherwise a ``GoogleBaseHook`` is created for the connection;
    the project id and credentials token come from the hook, and the remaining
    options are read from the hook's ``extras`` under the ``gcs.*`` keys
    defined in this module.

    :param conn_id: Airflow connection id, or ``None`` to construct the
        filesystem without any connection-derived settings.
    :return: the configured ``GCSFileSystem`` instance.
    """
    # https://gcsfs.readthedocs.io/en/latest/api.html#gcsfs.core.GCSFileSystem
    from gcsfs import GCSFileSystem

    if conn_id is None:
        return GCSFileSystem()

    g = GoogleBaseHook(gcp_conn_id=conn_id)
    creds = g.get_credentials()

    # The extra may arrive as a real boolean (e.g. JSON ``true``) rather than
    # the string "true"/"false"; coerce to str first so ``.lower()`` cannot
    # raise AttributeError. String values behave exactly as before.
    version_aware = str(g.extras.get(GCS_VERSION_AWARE, "false")).lower() == "true"

    # NOTE(review): ``creds.token`` is passed through as-is; whether it is
    # already populated at this point is not visible from this function --
    # confirm against the credentials type returned by the hook.
    return GCSFileSystem(
        project=g.project_id,
        access=g.extras.get(GCS_ACCESS, "full_control"),
        token=creds.token,
        consistency=g.extras.get(GCS_CONSISTENCY, "none"),
        cache_timeout=g.extras.get(GCS_CACHE_TIMEOUT),
        requester_pays=g.extras.get(GCS_REQUESTER_PAYS, False),
        session_kwargs=g.extras.get(GCS_SESSION_KWARGS, {}),
        endpoint_url=g.extras.get(GCS_ENDPOINT),
        default_location=g.extras.get(GCS_DEFAULT_LOCATION),
        version_aware=version_aware,
    )

Was this entry helpful?