| 12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788 | import loggingfrom collections.abc import Generatorimport boto3from botocore.client import Configfrom botocore.exceptions import ClientErrorfrom configs import dify_configfrom extensions.storage.base_storage import BaseStoragelogger = logging.getLogger(__name__)class AwsS3Storage(BaseStorage):    """Implementation for Amazon Web Services S3 storage."""    def __init__(self):        super().__init__()        self.bucket_name = dify_config.S3_BUCKET_NAME        if dify_config.S3_USE_AWS_MANAGED_IAM:            logger.info("Using AWS managed IAM role for S3")            session = boto3.Session()            region_name = dify_config.S3_REGION            self.client = session.client(service_name="s3", region_name=region_name)        else:            logger.info("Using ak and sk for S3")            self.client = boto3.client(                "s3",                aws_secret_access_key=dify_config.S3_SECRET_KEY,                aws_access_key_id=dify_config.S3_ACCESS_KEY,                endpoint_url=dify_config.S3_ENDPOINT,                region_name=dify_config.S3_REGION,                config=Config(s3={"addressing_style": dify_config.S3_ADDRESS_STYLE}),            )        # create bucket        try:            self.client.head_bucket(Bucket=self.bucket_name)        except ClientError as e:            # if bucket not exists, create it            if e.response["Error"]["Code"] == "404":                self.client.create_bucket(Bucket=self.bucket_name)            # if bucket is not accessible, pass, maybe the bucket is existing but not accessible            elif e.response["Error"]["Code"] == "403":                pass            else:                # other error, raise exception                raise    def save(self, filename, data):        self.client.put_object(Bucket=self.bucket_name, Key=filename, Body=data)    def load_once(self, filename: str) -> bytes:        try:            data = self.client.get_object(Bucket=self.bucket_name, Key=filename)["Body"].read()        except ClientError as ex:            if ex.response["Error"]["Code"] == "NoSuchKey":                raise FileNotFoundError("File not found")            else:                raise        return data    def load_stream(self, filename: str) -> Generator:        def generate(filename: str = filename) -> Generator:            try:                response = self.client.get_object(Bucket=self.bucket_name, Key=filename)                yield from response["Body"].iter_chunks()            except ClientError as ex:                if ex.response["Error"]["Code"] == "NoSuchKey":                    raise FileNotFoundError("File not found")                else:                    raise        return generate()    def download(self, filename, target_filepath):        self.client.download_file(self.bucket_name, filename, target_filepath)    def exists(self, filename):        try:            self.client.head_object(Bucket=self.bucket_name, Key=filename)            return True        except:            return False    def delete(self, filename):        self.client.delete_object(Bucket=self.bucket_name, Key=filename)
 |