mirror of
https://github.com/langgenius/dify.git
synced 2024-11-16 11:42:29 +08:00
86 lines
3.0 KiB
Python
86 lines
3.0 KiB
Python
import logging
|
|
from collections.abc import Generator
|
|
|
|
import boto3
|
|
from botocore.client import Config
|
|
from botocore.exceptions import ClientError
|
|
|
|
from configs import dify_config
|
|
from extensions.storage.base_storage import BaseStorage
|
|
|
|
logger = logging.getLogger(__name__)
|
|
|
|
|
|
class AwsS3Storage(BaseStorage):
|
|
"""Implementation for Amazon Web Services S3 storage."""
|
|
|
|
def __init__(self):
|
|
super().__init__()
|
|
self.bucket_name = dify_config.S3_BUCKET_NAME
|
|
if dify_config.S3_USE_AWS_MANAGED_IAM:
|
|
logger.info("Using AWS managed IAM role for S3")
|
|
|
|
session = boto3.Session()
|
|
region_name = dify_config.S3_REGION
|
|
self.client = session.client(service_name="s3", region_name=region_name)
|
|
else:
|
|
logger.info("Using ak and sk for S3")
|
|
|
|
self.client = boto3.client(
|
|
"s3",
|
|
aws_secret_access_key=dify_config.S3_SECRET_KEY,
|
|
aws_access_key_id=dify_config.S3_ACCESS_KEY,
|
|
endpoint_url=dify_config.S3_ENDPOINT,
|
|
region_name=dify_config.S3_REGION,
|
|
config=Config(s3={"addressing_style": dify_config.S3_ADDRESS_STYLE}),
|
|
)
|
|
# create bucket
|
|
try:
|
|
self.client.head_bucket(Bucket=self.bucket_name)
|
|
except ClientError as e:
|
|
# if bucket not exists, create it
|
|
if e.response["Error"]["Code"] == "404":
|
|
self.client.create_bucket(Bucket=self.bucket_name)
|
|
# if bucket is not accessible, pass, maybe the bucket is existing but not accessible
|
|
elif e.response["Error"]["Code"] == "403":
|
|
pass
|
|
else:
|
|
# other error, raise exception
|
|
raise
|
|
|
|
def save(self, filename, data):
|
|
self.client.put_object(Bucket=self.bucket_name, Key=filename, Body=data)
|
|
|
|
def load_once(self, filename: str) -> bytes:
|
|
try:
|
|
data = self.client.get_object(Bucket=self.bucket_name, Key=filename)["Body"].read()
|
|
except ClientError as ex:
|
|
if ex.response["Error"]["Code"] == "NoSuchKey":
|
|
raise FileNotFoundError("File not found")
|
|
else:
|
|
raise
|
|
return data
|
|
|
|
def load_stream(self, filename: str) -> Generator:
|
|
try:
|
|
response = self.client.get_object(Bucket=self.bucket_name, Key=filename)
|
|
yield from response["Body"].iter_chunks()
|
|
except ClientError as ex:
|
|
if ex.response["Error"]["Code"] == "NoSuchKey":
|
|
raise FileNotFoundError("File not found")
|
|
else:
|
|
raise
|
|
|
|
def download(self, filename, target_filepath):
|
|
self.client.download_file(self.bucket_name, filename, target_filepath)
|
|
|
|
def exists(self, filename):
|
|
try:
|
|
self.client.head_object(Bucket=self.bucket_name, Key=filename)
|
|
return True
|
|
except:
|
|
return False
|
|
|
|
def delete(self, filename):
|
|
self.client.delete_object(Bucket=self.bucket_name, Key=filename)
|