import base64
import hashlib
from collections.abc import Generator

from baidubce.auth.bce_credentials import BceCredentials
from baidubce.bce_client_configuration import BceClientConfiguration
from baidubce.exception import BceHttpClientError
from baidubce.services.bos.bos_client import BosClient

from configs import dify_config
from extensions.storage.base_storage import BaseStorage


										 |  |  | class BaiduObsStorage(BaseStorage): | 
					
						
							|  |  |  |     """Implementation for Baidu OBS storage.""" | 
					
						
							| 
									
										
										
										
											2024-10-07 11:09:27 +08:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2024-10-22 11:01:32 +08:00
										 |  |  |     def __init__(self): | 
					
						
							|  |  |  |         super().__init__() | 
					
						
							|  |  |  |         self.bucket_name = dify_config.BAIDU_OBS_BUCKET_NAME | 
					
						
							| 
									
										
										
										
											2024-10-07 11:09:27 +08:00
										 |  |  |         client_config = BceClientConfiguration( | 
					
						
							|  |  |  |             credentials=BceCredentials( | 
					
						
							| 
									
										
										
										
											2024-10-22 11:01:32 +08:00
										 |  |  |                 access_key_id=dify_config.BAIDU_OBS_ACCESS_KEY, | 
					
						
							|  |  |  |                 secret_access_key=dify_config.BAIDU_OBS_SECRET_KEY, | 
					
						
							| 
									
										
										
										
											2024-10-07 11:09:27 +08:00
										 |  |  |             ), | 
					
						
							| 
									
										
										
										
											2024-10-22 11:01:32 +08:00
										 |  |  |             endpoint=dify_config.BAIDU_OBS_ENDPOINT, | 
					
						
							| 
									
										
										
										
											2024-10-07 11:09:27 +08:00
										 |  |  |         ) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         self.client = BosClient(config=client_config) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     def save(self, filename, data): | 
					
						
							|  |  |  |         md5 = hashlib.md5() | 
					
						
							|  |  |  |         md5.update(data) | 
					
						
							|  |  |  |         content_md5 = base64.standard_b64encode(md5.digest()) | 
					
						
							|  |  |  |         self.client.put_object( | 
					
						
							|  |  |  |             bucket_name=self.bucket_name, key=filename, data=data, content_length=len(data), content_md5=content_md5 | 
					
						
							|  |  |  |         ) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     def load_once(self, filename: str) -> bytes: | 
					
						
							|  |  |  |         response = self.client.get_object(bucket_name=self.bucket_name, key=filename) | 
					
						
							|  |  |  |         return response.data.read() | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     def load_stream(self, filename: str) -> Generator: | 
					
						
							| 
									
										
										
										
											2024-10-25 10:11:25 +08:00
										 |  |  |         response = self.client.get_object(bucket_name=self.bucket_name, key=filename).data | 
					
						
							|  |  |  |         while chunk := response.read(4096): | 
					
						
							|  |  |  |             yield chunk | 
					
						
							| 
									
										
										
										
											2024-10-07 11:09:27 +08:00
										 |  |  | 
 | 
					
						
							|  |  |  |     def download(self, filename, target_filepath): | 
					
						
							|  |  |  |         self.client.get_object_to_file(bucket_name=self.bucket_name, key=filename, file_name=target_filepath) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     def exists(self, filename): | 
					
						
							|  |  |  |         res = self.client.get_object_meta_data(bucket_name=self.bucket_name, key=filename) | 
					
						
							|  |  |  |         if res is None: | 
					
						
							|  |  |  |             return False | 
					
						
							|  |  |  |         return True | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     def delete(self, filename): | 
					
						
							|  |  |  |         self.client.delete_object(bucket_name=self.bucket_name, key=filename) |