Source code for camel.storages.object_storages.google_cloud
# ========= Copyright 2023-2024 @ CAMEL-AI.org. All Rights Reserved. =========
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# ========= Copyright 2023-2024 @ CAMEL-AI.org. All Rights Reserved. =========
from pathlib import Path, PurePath
from typing import Tuple
from warnings import warn
from camel.loaders import File, create_file_from_raw_bytes
from camel.storages.object_storages.base import BaseObjectStorage
[docs]
class GoogleCloudStorage(BaseObjectStorage):
    r"""A class to connect to Google Cloud Storage. It will connect to one
    bucket in the storage account.

    Note that Google Cloud Storage does not support api key authentication.
    Therefore, before using this class, you need to log in with gcloud command
    line tool and save the credentials first.

    Args:
        bucket_name (str): The name of the bucket.
        create_if_not_exists (bool, optional): Whether to create the bucket if
            it does not exist. Defaults to True.
        anonymous (bool, optional): Whether to use anonymous access. Defaults
            to False.

    Raises:
        FileNotFoundError: If the bucket does not exist and
            `create_if_not_exists` is False.
        PermissionError: If checking or creating the bucket raises
            `google.auth.exceptions.InvalidOperation`.

    References:
        https://cloud.google.com/storage

        https://cloud.google.com/docs/authentication/api-keys
    """

    def __init__(
        self,
        bucket_name: str,
        create_if_not_exists: bool = True,
        anonymous: bool = False,
    ) -> None:
        # Local import: google-cloud-storage is only required once an
        # instance is actually constructed.
        from google.cloud import storage

        self.create_if_not_exists = create_if_not_exists

        if anonymous:
            client = storage.Client.create_anonymous_client()
        else:
            client = storage.Client()

        # NOTE: despite its name, `_client` holds the bucket handle, not the
        # storage client; every method below operates on this bucket.
        self._client = client.bucket(bucket_name)

        self._prepare_and_check()

    @staticmethod
    def canonicalize_path(file_path: PurePath) -> Tuple[str, str]:
        r"""Canonicalize the path for Google Cloud Storage.

        Args:
            file_path (PurePath): The path to be canonicalized.

        Returns:
            Tuple[str, str]: The canonicalized file key and file name.
        """
        # The key is the POSIX form of the path (forward slashes); the file
        # name is the final path component.
        return file_path.as_posix(), file_path.name

    def _prepare_and_check(self) -> None:
        r"""Check privileges and existence of the bucket.

        If the bucket is missing and `create_if_not_exists` is set, the
        bucket is created and a warning is emitted.

        Raises:
            FileNotFoundError: If the bucket does not exist and
                `create_if_not_exists` is False.
            PermissionError: If the existence check or the creation raises
                `google.auth.exceptions.InvalidOperation`.
        """
        from google.auth.exceptions import InvalidOperation

        try:
            if not self._client.exists():
                if not self.create_if_not_exists:
                    raise FileNotFoundError(
                        f"Failed to access bucket {self._client.name}: "
                        f"Not found."
                    )
                self._client.create()
                warn(
                    f"Bucket {self._client.name} not found. Automatically "
                    f"created."
                )
        except InvalidOperation as err:
            # Chain the original error so the root cause stays visible in
            # the traceback.
            raise PermissionError(
                f"Failed to access bucket {self._client.name}: No permission."
            ) from err

    def _require_blob(self, file_key: str):
        r"""Fetch an existing blob from the bucket or fail loudly.

        Args:
            file_key (str): The path to the object in the bucket.

        Returns:
            The blob handle returned by the bucket's `get_blob`.

        Raises:
            FileNotFoundError: If `get_blob` returns None, i.e. the object
                does not exist in the bucket.
        """
        blob = self._client.get_blob(file_key)
        if blob is None:
            # `get_blob` signals a missing object with None; without this
            # check callers would hit an AttributeError on NoneType.
            raise FileNotFoundError(
                f"Failed to access object {file_key} in bucket "
                f"{self._client.name}: Not found."
            )
        return blob

    def _put_file(self, file_key: str, file: File) -> None:
        r"""Put a file to the GCloud bucket.

        Args:
            file_key (str): The path to the object in the bucket.
            file (File): The file to be uploaded.
        """
        self._client.blob(file_key).upload_from_string(file.raw_bytes)

    def _get_file(self, file_key: str, filename: str) -> File:
        r"""Get a file from the GCloud bucket.

        Args:
            file_key (str): The path to the object in the bucket.
            filename (str): The name of the file.

        Returns:
            File: The object from the GCloud bucket.

        Raises:
            FileNotFoundError: If the object does not exist in the bucket.
        """
        raw_bytes = self._require_blob(file_key).download_as_bytes()
        return create_file_from_raw_bytes(raw_bytes, filename)

    def _upload_file(
        self, local_file_path: Path, remote_file_key: str
    ) -> None:
        r"""Upload a local file to the GCloud bucket.

        Args:
            local_file_path (Path): The path to the local file to be uploaded.
            remote_file_key (str): The path to the object in the bucket.
        """
        # The storage API documents the filename argument as `str`.
        self._client.blob(remote_file_key).upload_from_filename(
            str(local_file_path)
        )

    def _download_file(
        self, local_file_path: Path, remote_file_key: str
    ) -> None:
        r"""Download a file from the GCloud bucket to the local system.

        Args:
            local_file_path (Path): The path to the local file to be saved.
            remote_file_key (str): The key of the object in the bucket.

        Raises:
            FileNotFoundError: If the object does not exist in the bucket.
        """
        # The storage API documents the filename argument as `str`.
        self._require_blob(remote_file_key).download_to_filename(
            str(local_file_path)
        )

    def _object_exists(self, file_key: str) -> bool:
        r"""Check if the object exists in the GCloud bucket.

        Args:
            file_key (str): The key of the object in the bucket.

        Returns:
            bool: Whether the object exists in the bucket.
        """
        return self._client.blob(file_key).exists()