mirror of
				https://github.com/langgenius/dify.git
				synced 2025-10-24 23:48:40 +00:00 
			
		
		
		
	
		
			
				
	
	
		
			88 lines
		
	
	
		
			3.2 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
			
		
		
	
	
			88 lines
		
	
	
		
			3.2 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
| import logging
 | |
| from collections.abc import Generator
 | |
| 
 | |
| import boto3  # type: ignore
 | |
| from botocore.client import Config  # type: ignore
 | |
| from botocore.exceptions import ClientError  # type: ignore
 | |
| 
 | |
| from configs import dify_config
 | |
| from extensions.storage.base_storage import BaseStorage
 | |
| 
 | |
| logger = logging.getLogger(__name__)
 | |
| 
 | |
| 
 | |
| class AwsS3Storage(BaseStorage):
 | |
|     """Implementation for Amazon Web Services S3 storage."""
 | |
| 
 | |
|     def __init__(self):
 | |
|         super().__init__()
 | |
|         self.bucket_name = dify_config.S3_BUCKET_NAME
 | |
|         if dify_config.S3_USE_AWS_MANAGED_IAM:
 | |
|             logger.info("Using AWS managed IAM role for S3")
 | |
| 
 | |
|             session = boto3.Session()
 | |
|             region_name = dify_config.S3_REGION
 | |
|             self.client = session.client(service_name="s3", region_name=region_name)
 | |
|         else:
 | |
|             logger.info("Using ak and sk for S3")
 | |
| 
 | |
|             self.client = boto3.client(
 | |
|                 "s3",
 | |
|                 aws_secret_access_key=dify_config.S3_SECRET_KEY,
 | |
|                 aws_access_key_id=dify_config.S3_ACCESS_KEY,
 | |
|                 endpoint_url=dify_config.S3_ENDPOINT,
 | |
|                 region_name=dify_config.S3_REGION,
 | |
|                 config=Config(s3={"addressing_style": dify_config.S3_ADDRESS_STYLE}),
 | |
|             )
 | |
|         # create bucket
 | |
|         try:
 | |
|             self.client.head_bucket(Bucket=self.bucket_name)
 | |
|         except ClientError as e:
 | |
|             # if bucket not exists, create it
 | |
|             if e.response["Error"]["Code"] == "404":
 | |
|                 self.client.create_bucket(Bucket=self.bucket_name)
 | |
|             # if bucket is not accessible, pass, maybe the bucket is existing but not accessible
 | |
|             elif e.response["Error"]["Code"] == "403":
 | |
|                 pass
 | |
|             else:
 | |
|                 # other error, raise exception
 | |
|                 raise
 | |
| 
 | |
|     def save(self, filename, data):
 | |
|         self.client.put_object(Bucket=self.bucket_name, Key=filename, Body=data)
 | |
| 
 | |
|     def load_once(self, filename: str) -> bytes:
 | |
|         try:
 | |
|             data: bytes = self.client.get_object(Bucket=self.bucket_name, Key=filename)["Body"].read()
 | |
|         except ClientError as ex:
 | |
|             if ex.response["Error"]["Code"] == "NoSuchKey":
 | |
|                 raise FileNotFoundError("File not found")
 | |
|             else:
 | |
|                 raise
 | |
|         return data
 | |
| 
 | |
|     def load_stream(self, filename: str) -> Generator:
 | |
|         try:
 | |
|             response = self.client.get_object(Bucket=self.bucket_name, Key=filename)
 | |
|             yield from response["Body"].iter_chunks()
 | |
|         except ClientError as ex:
 | |
|             if ex.response["Error"]["Code"] == "NoSuchKey":
 | |
|                 raise FileNotFoundError("file not found")
 | |
|             elif "reached max retries" in str(ex):
 | |
|                 raise ValueError("please do not request the same file too frequently")
 | |
|             else:
 | |
|                 raise
 | |
| 
 | |
|     def download(self, filename, target_filepath):
 | |
|         self.client.download_file(self.bucket_name, filename, target_filepath)
 | |
| 
 | |
|     def exists(self, filename):
 | |
|         try:
 | |
|             self.client.head_object(Bucket=self.bucket_name, Key=filename)
 | |
|             return True
 | |
|         except:
 | |
|             return False
 | |
| 
 | |
|     def delete(self, filename):
 | |
|         self.client.delete_object(Bucket=self.bucket_name, Key=filename)
 | 
