Source code for airflow.providers.common.sql.datafusion.base
# Licensed to the Apache Software Foundation (ASF) under one
# or more contributor license agreements. See the NOTICE file
# distributed with this work for additional information
# regarding copyright ownership. The ASF licenses this file
# to you under the Apache License, Version 2.0 (the
# "License"); you may not use this file except in compliance
# with the License. You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing,
# software distributed under the License is distributed on an
# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
# KIND, either express or implied. See the License for the
# specific language governing permissions and limitations
# under the License.
from __future__ import annotations
from abc import ABC, abstractmethod
from typing import TYPE_CHECKING, Any
from airflow.utils.log.logging_mixin import LoggingMixin
if TYPE_CHECKING:
from datafusion import SessionContext
from airflow.providers.common.sql.config import (
ConnectionConfig,
DataSourceConfig,
FormatType,
StorageType,
)
[docs]
class ObjectStorageProvider(LoggingMixin, ABC):
"""Abstract base class for object storage providers."""
@property
[docs]
def get_storage_type(self) -> StorageType:
"""Return storage type handled by this provider (e.g., 's3', 'gcs', 'local')."""
raise NotImplementedError
@abstractmethod
[docs]
def create_object_store(self, path: str, connection_config: ConnectionConfig | None = None) -> Any:
"""Create and return a DataFusion object store instance."""
raise NotImplementedError
@abstractmethod
[docs]
def get_scheme(self) -> str:
"""Return URL scheme for this storage type (e.g., 's3://', 'gs://')."""
raise NotImplementedError
[docs]
def get_bucket(self, path: str) -> str | None:
"""Extract the bucket name from the given path."""
if path and path.startswith(self.get_scheme()):
path_parts = path[len(self.get_scheme()) :].split("/", 1)
return path_parts[0]
return None