| 
									
										
										
										
											2024-10-21 10:43:49 +08:00
										 |  |  | import base64 | 
					
						
							| 
									
										
										
										
											2024-12-24 18:38:51 +08:00
										 |  |  | from collections.abc import Mapping | 
					
						
							| 
									
										
										
										
											2024-10-21 10:43:49 +08:00
										 |  |  | 
 | 
					
						
							|  |  |  | from configs import dify_config | 
					
						
							|  |  |  | from core.helper import ssrf_proxy | 
					
						
							| 
									
										
										
										
											2024-11-22 16:30:22 +08:00
										 |  |  | from core.model_runtime.entities import ( | 
					
						
							|  |  |  |     AudioPromptMessageContent, | 
					
						
							|  |  |  |     DocumentPromptMessageContent, | 
					
						
							|  |  |  |     ImagePromptMessageContent, | 
					
						
							|  |  |  |     VideoPromptMessageContent, | 
					
						
							|  |  |  | ) | 
					
						
							| 
									
										
										
										
											2025-04-22 16:17:55 +08:00
										 |  |  | from core.model_runtime.entities.message_entities import PromptMessageContentUnionTypes | 
					
						
							| 
									
										
										
										
											2025-04-30 17:28:02 +08:00
										 |  |  | from core.tools.signature import sign_tool_file | 
					
						
							| 
									
										
										
										
											2024-10-21 10:43:49 +08:00
										 |  |  | from extensions.ext_storage import storage | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | from . import helpers | 
					
						
							|  |  |  | from .enums import FileAttribute | 
					
						
							|  |  |  | from .models import File, FileTransferMethod, FileType | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | def get_attr(*, file: File, attr: FileAttribute): | 
					
						
							|  |  |  |     match attr: | 
					
						
							|  |  |  |         case FileAttribute.TYPE: | 
					
						
							|  |  |  |             return file.type.value | 
					
						
							|  |  |  |         case FileAttribute.SIZE: | 
					
						
							|  |  |  |             return file.size | 
					
						
							|  |  |  |         case FileAttribute.NAME: | 
					
						
							|  |  |  |             return file.filename | 
					
						
							|  |  |  |         case FileAttribute.MIME_TYPE: | 
					
						
							|  |  |  |             return file.mime_type | 
					
						
							|  |  |  |         case FileAttribute.TRANSFER_METHOD: | 
					
						
							|  |  |  |             return file.transfer_method.value | 
					
						
							|  |  |  |         case FileAttribute.URL: | 
					
						
							| 
									
										
										
										
											2024-11-11 08:56:19 +08:00
										 |  |  |             return file.remote_url | 
					
						
							| 
									
										
										
										
											2024-10-21 10:43:49 +08:00
										 |  |  |         case FileAttribute.EXTENSION: | 
					
						
							|  |  |  |             return file.extension | 
					
						
							| 
									
										
										
										
											2025-03-21 20:57:02 +08:00
										 |  |  |         case FileAttribute.RELATED_ID: | 
					
						
							|  |  |  |             return file.related_id | 
					
						
							| 
									
										
										
										
											2024-10-21 10:43:49 +08:00
										 |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2024-11-08 18:13:24 +08:00
										 |  |  | def to_prompt_message_content( | 
					
						
							|  |  |  |     f: File, | 
					
						
							|  |  |  |     /, | 
					
						
							|  |  |  |     *, | 
					
						
							| 
									
										
										
										
											2024-11-22 16:30:22 +08:00
										 |  |  |     image_detail_config: ImagePromptMessageContent.DETAIL | None = None, | 
					
						
							| 
									
										
										
										
											2025-04-22 16:17:55 +08:00
										 |  |  | ) -> PromptMessageContentUnionTypes: | 
					
						
							| 
									
										
										
										
											2024-12-17 15:01:38 +08:00
										 |  |  |     if f.extension is None: | 
					
						
							|  |  |  |         raise ValueError("Missing file extension") | 
					
						
							|  |  |  |     if f.mime_type is None: | 
					
						
							|  |  |  |         raise ValueError("Missing file mime_type") | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     params = { | 
					
						
							|  |  |  |         "base64_data": _get_encoded_string(f) if dify_config.MULTIMODAL_SEND_FORMAT == "base64" else "", | 
					
						
							|  |  |  |         "url": _to_url(f) if dify_config.MULTIMODAL_SEND_FORMAT == "url" else "", | 
					
						
							|  |  |  |         "format": f.extension.removeprefix("."), | 
					
						
							|  |  |  |         "mime_type": f.mime_type, | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  |     if f.type == FileType.IMAGE: | 
					
						
							|  |  |  |         params["detail"] = image_detail_config or ImagePromptMessageContent.DETAIL.LOW | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2025-04-22 16:17:55 +08:00
										 |  |  |     prompt_class_map: Mapping[FileType, type[PromptMessageContentUnionTypes]] = { | 
					
						
							| 
									
										
										
										
											2024-12-17 15:01:38 +08:00
										 |  |  |         FileType.IMAGE: ImagePromptMessageContent, | 
					
						
							|  |  |  |         FileType.AUDIO: AudioPromptMessageContent, | 
					
						
							|  |  |  |         FileType.VIDEO: VideoPromptMessageContent, | 
					
						
							|  |  |  |         FileType.DOCUMENT: DocumentPromptMessageContent, | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     try: | 
					
						
							| 
									
										
										
										
											2024-12-24 18:38:51 +08:00
										 |  |  |         return prompt_class_map[f.type].model_validate(params) | 
					
						
							| 
									
										
										
										
											2024-12-17 15:01:38 +08:00
										 |  |  |     except KeyError: | 
					
						
							|  |  |  |         raise ValueError(f"file type {f.type} is not supported") | 
					
						
							| 
									
										
										
										
											2024-10-21 10:43:49 +08:00
										 |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | def download(f: File, /): | 
					
						
							| 
									
										
										
										
											2025-07-09 14:27:49 +08:00
										 |  |  |     if f.transfer_method in ( | 
					
						
							|  |  |  |         FileTransferMethod.TOOL_FILE, | 
					
						
							|  |  |  |         FileTransferMethod.LOCAL_FILE, | 
					
						
							|  |  |  |         FileTransferMethod.DATASOURCE_FILE, | 
					
						
							|  |  |  |     ): | 
					
						
							| 
									
										
										
										
											2024-12-20 14:12:50 +08:00
										 |  |  |         return _download_file_content(f._storage_key) | 
					
						
							|  |  |  |     elif f.transfer_method == FileTransferMethod.REMOTE_URL: | 
					
						
							|  |  |  |         response = ssrf_proxy.get(f.remote_url, follow_redirects=True) | 
					
						
							|  |  |  |         response.raise_for_status() | 
					
						
							|  |  |  |         return response.content | 
					
						
							|  |  |  |     raise ValueError(f"unsupported transfer method: {f.transfer_method}") | 
					
						
							| 
									
										
										
										
											2024-10-21 10:43:49 +08:00
										 |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | def _download_file_content(path: str, /): | 
					
						
							|  |  |  |     """
 | 
					
						
							|  |  |  |     Download and return the contents of a file as bytes. | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     This function loads the file from storage and ensures it's in bytes format. | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     Args: | 
					
						
							|  |  |  |         path (str): The path to the file in storage. | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     Returns: | 
					
						
							|  |  |  |         bytes: The contents of the file as a bytes object. | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     Raises: | 
					
						
							|  |  |  |         ValueError: If the loaded file is not a bytes object. | 
					
						
							|  |  |  |     """
 | 
					
						
							|  |  |  |     data = storage.load(path, stream=False) | 
					
						
							|  |  |  |     if not isinstance(data, bytes): | 
					
						
							|  |  |  |         raise ValueError(f"file {path} is not a bytes object") | 
					
						
							|  |  |  |     return data | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | def _get_encoded_string(f: File, /): | 
					
						
							|  |  |  |     match f.transfer_method: | 
					
						
							|  |  |  |         case FileTransferMethod.REMOTE_URL: | 
					
						
							| 
									
										
										
										
											2024-11-08 13:22:52 +08:00
										 |  |  |             response = ssrf_proxy.get(f.remote_url, follow_redirects=True) | 
					
						
							| 
									
										
										
										
											2024-10-21 10:43:49 +08:00
										 |  |  |             response.raise_for_status() | 
					
						
							| 
									
										
										
										
											2024-11-22 16:30:22 +08:00
										 |  |  |             data = response.content | 
					
						
							| 
									
										
										
										
											2024-10-21 10:43:49 +08:00
										 |  |  |         case FileTransferMethod.LOCAL_FILE: | 
					
						
							| 
									
										
										
										
											2024-12-20 14:12:50 +08:00
										 |  |  |             data = _download_file_content(f._storage_key) | 
					
						
							| 
									
										
										
										
											2024-10-21 10:43:49 +08:00
										 |  |  |         case FileTransferMethod.TOOL_FILE: | 
					
						
							| 
									
										
										
										
											2024-12-20 14:12:50 +08:00
										 |  |  |             data = _download_file_content(f._storage_key) | 
					
						
							| 
									
										
										
										
											2024-11-22 16:30:22 +08:00
										 |  |  | 
 | 
					
						
							|  |  |  |     encoded_string = base64.b64encode(data).decode("utf-8") | 
					
						
							|  |  |  |     return encoded_string | 
					
						
							| 
									
										
										
										
											2024-10-21 10:43:49 +08:00
										 |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | def _to_url(f: File, /): | 
					
						
							|  |  |  |     if f.transfer_method == FileTransferMethod.REMOTE_URL: | 
					
						
							|  |  |  |         if f.remote_url is None: | 
					
						
							|  |  |  |             raise ValueError("Missing file remote_url") | 
					
						
							|  |  |  |         return f.remote_url | 
					
						
							|  |  |  |     elif f.transfer_method == FileTransferMethod.LOCAL_FILE: | 
					
						
							|  |  |  |         if f.related_id is None: | 
					
						
							|  |  |  |             raise ValueError("Missing file related_id") | 
					
						
							| 
									
										
										
										
											2024-12-10 10:56:49 +08:00
										 |  |  |         return f.remote_url or helpers.get_signed_file_url(upload_file_id=f.related_id) | 
					
						
							| 
									
										
										
										
											2024-10-21 10:43:49 +08:00
										 |  |  |     elif f.transfer_method == FileTransferMethod.TOOL_FILE: | 
					
						
							|  |  |  |         # add sign url | 
					
						
							|  |  |  |         if f.related_id is None or f.extension is None: | 
					
						
							|  |  |  |             raise ValueError("Missing file related_id or extension") | 
					
						
							| 
									
										
										
										
											2025-04-30 17:28:02 +08:00
										 |  |  |         return sign_tool_file(tool_file_id=f.related_id, extension=f.extension) | 
					
						
							| 
									
										
										
										
											2024-10-21 10:43:49 +08:00
										 |  |  |     else: | 
					
						
							|  |  |  |         raise ValueError(f"Unsupported transfer method: {f.transfer_method}") |