123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687 |
- import logging
- from collections.abc import Generator
- import boto3 # type: ignore
- from botocore.client import Config # type: ignore
- from botocore.exceptions import ClientError # type: ignore
- from configs import dify_config
- from extensions.storage.base_storage import BaseStorage
- logger = logging.getLogger(__name__)
- class AwsS3Storage(BaseStorage):
- """Implementation for Amazon Web Services S3 storage."""
- def __init__(self):
- super().__init__()
- self.bucket_name = dify_config.S3_BUCKET_NAME
- if dify_config.S3_USE_AWS_MANAGED_IAM:
- logger.info("Using AWS managed IAM role for S3")
- session = boto3.Session()
- region_name = dify_config.S3_REGION
- self.client = session.client(service_name="s3", region_name=region_name)
- else:
- logger.info("Using ak and sk for S3")
- self.client = boto3.client(
- "s3",
- aws_secret_access_key=dify_config.S3_SECRET_KEY,
- aws_access_key_id=dify_config.S3_ACCESS_KEY,
- endpoint_url=dify_config.S3_ENDPOINT,
- region_name=dify_config.S3_REGION,
- config=Config(s3={"addressing_style": dify_config.S3_ADDRESS_STYLE}),
- )
- # create bucket
- try:
- self.client.head_bucket(Bucket=self.bucket_name)
- except ClientError as e:
- # if bucket not exists, create it
- if e.response["Error"]["Code"] == "404":
- self.client.create_bucket(Bucket=self.bucket_name)
- # if bucket is not accessible, pass, maybe the bucket is existing but not accessible
- elif e.response["Error"]["Code"] == "403":
- pass
- else:
- # other error, raise exception
- raise
- def save(self, filename, data):
- self.client.put_object(Bucket=self.bucket_name, Key=filename, Body=data)
- def load_once(self, filename: str) -> bytes:
- try:
- data: bytes = self.client.get_object(Bucket=self.bucket_name, Key=filename)["Body"].read()
- except ClientError as ex:
- if ex.response["Error"]["Code"] == "NoSuchKey":
- raise FileNotFoundError("File not found")
- else:
- raise
- return data
- def load_stream(self, filename: str) -> Generator:
- try:
- response = self.client.get_object(Bucket=self.bucket_name, Key=filename)
- yield from response["Body"].iter_chunks()
- except ClientError as ex:
- if ex.response["Error"]["Code"] == "NoSuchKey":
- raise FileNotFoundError("file not found")
- elif "reached max retries" in str(ex):
- raise ValueError("please do not request the same file too frequently")
- else:
- raise
- def download(self, filename, target_filepath):
- self.client.download_file(self.bucket_name, filename, target_filepath)
- def exists(self, filename):
- try:
- self.client.head_object(Bucket=self.bucket_name, Key=filename)
- return True
- except:
- return False
- def delete(self, filename):
- self.client.delete_object(Bucket=self.bucket_name, Key=filename)
|