| 
									
										
										
										
											2024-02-05 18:48:30 +08:00
										 |  |  | """
 | 
					
						
							|  |  |  | Proxy requests to avoid SSRF | 
					
						
							|  |  |  | """
 | 
					
						
							| 
									
										
										
										
											2024-09-10 17:00:20 +08:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2024-07-25 13:10:39 +08:00
										 |  |  | import logging | 
					
						
							|  |  |  | import time | 
					
						
							| 
									
										
										
										
											2024-02-05 18:48:30 +08:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2024-06-24 16:14:59 +08:00
										 |  |  | import httpx | 
					
						
							| 
									
										
										
										
											2024-02-06 13:21:13 +08:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2024-11-08 09:33:12 +08:00
										 |  |  | from configs import dify_config | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | SSRF_DEFAULT_MAX_RETRIES = dify_config.SSRF_DEFAULT_MAX_RETRIES | 
					
						
							| 
									
										
										
										
											2024-02-05 18:48:30 +08:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2025-03-14 11:05:37 +09:00
										 |  |  | HTTP_REQUEST_NODE_SSL_VERIFY = True  # Default value for HTTP_REQUEST_NODE_SSL_VERIFY is True | 
					
						
							|  |  |  | try: | 
					
						
							|  |  |  |     HTTP_REQUEST_NODE_SSL_VERIFY = dify_config.HTTP_REQUEST_NODE_SSL_VERIFY | 
					
						
							|  |  |  |     http_request_node_ssl_verify_lower = str(HTTP_REQUEST_NODE_SSL_VERIFY).lower() | 
					
						
							|  |  |  |     if http_request_node_ssl_verify_lower == "true": | 
					
						
							|  |  |  |         HTTP_REQUEST_NODE_SSL_VERIFY = True | 
					
						
							|  |  |  |     elif http_request_node_ssl_verify_lower == "false": | 
					
						
							|  |  |  |         HTTP_REQUEST_NODE_SSL_VERIFY = False | 
					
						
							|  |  |  |     else: | 
					
						
							|  |  |  |         raise ValueError("Invalid value. HTTP_REQUEST_NODE_SSL_VERIFY should be 'True' or 'False'") | 
					
						
							|  |  |  | except NameError: | 
					
						
							|  |  |  |     HTTP_REQUEST_NODE_SSL_VERIFY = True | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2024-07-25 13:10:39 +08:00
										 |  |  | BACKOFF_FACTOR = 0.5 | 
					
						
							|  |  |  | STATUS_FORCELIST = [429, 500, 502, 503, 504] | 
					
						
							| 
									
										
										
										
											2024-06-24 16:14:59 +08:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2024-09-10 17:00:20 +08:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2024-12-21 21:22:47 +08:00
										 |  |  | class MaxRetriesExceededError(ValueError): | 
					
						
							| 
									
										
										
										
											2024-12-11 14:22:42 +08:00
										 |  |  |     """Raised when the maximum number of retries is exceeded.""" | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     pass | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2024-07-25 13:10:39 +08:00
										 |  |  | def make_request(method, url, max_retries=SSRF_DEFAULT_MAX_RETRIES, **kwargs): | 
					
						
							| 
									
										
										
										
											2024-07-25 20:50:26 +08:00
										 |  |  |     if "allow_redirects" in kwargs: | 
					
						
							|  |  |  |         allow_redirects = kwargs.pop("allow_redirects") | 
					
						
							|  |  |  |         if "follow_redirects" not in kwargs: | 
					
						
							|  |  |  |             kwargs["follow_redirects"] = allow_redirects | 
					
						
							| 
									
										
										
										
											2024-09-10 17:00:20 +08:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2024-11-06 08:50:57 +08:00
										 |  |  |     if "timeout" not in kwargs: | 
					
						
							|  |  |  |         kwargs["timeout"] = httpx.Timeout( | 
					
						
							| 
									
										
										
										
											2024-11-08 09:33:12 +08:00
										 |  |  |             timeout=dify_config.SSRF_DEFAULT_TIME_OUT, | 
					
						
							|  |  |  |             connect=dify_config.SSRF_DEFAULT_CONNECT_TIME_OUT, | 
					
						
							|  |  |  |             read=dify_config.SSRF_DEFAULT_READ_TIME_OUT, | 
					
						
							|  |  |  |             write=dify_config.SSRF_DEFAULT_WRITE_TIME_OUT, | 
					
						
							| 
									
										
										
										
											2024-11-06 08:50:57 +08:00
										 |  |  |         ) | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2024-07-25 13:10:39 +08:00
										 |  |  |     retries = 0 | 
					
						
							|  |  |  |     while retries <= max_retries: | 
					
						
							|  |  |  |         try: | 
					
						
							| 
									
										
										
										
											2024-11-08 09:33:12 +08:00
										 |  |  |             if dify_config.SSRF_PROXY_ALL_URL: | 
					
						
							| 
									
										
										
										
											2025-03-14 11:05:37 +09:00
										 |  |  |                 with httpx.Client(proxy=dify_config.SSRF_PROXY_ALL_URL, verify=HTTP_REQUEST_NODE_SSL_VERIFY) as client: | 
					
						
							| 
									
										
										
										
											2024-10-21 10:43:49 +08:00
										 |  |  |                     response = client.request(method=method, url=url, **kwargs) | 
					
						
							| 
									
										
										
										
											2025-02-05 12:10:27 +07:00
										 |  |  |             elif dify_config.SSRF_PROXY_HTTP_URL and dify_config.SSRF_PROXY_HTTPS_URL: | 
					
						
							|  |  |  |                 proxy_mounts = { | 
					
						
							|  |  |  |                     "http://": httpx.HTTPTransport(proxy=dify_config.SSRF_PROXY_HTTP_URL), | 
					
						
							|  |  |  |                     "https://": httpx.HTTPTransport(proxy=dify_config.SSRF_PROXY_HTTPS_URL), | 
					
						
							|  |  |  |                 } | 
					
						
							| 
									
										
										
										
											2025-03-14 11:05:37 +09:00
										 |  |  |                 with httpx.Client(mounts=proxy_mounts, verify=HTTP_REQUEST_NODE_SSL_VERIFY) as client: | 
					
						
							| 
									
										
										
										
											2024-10-21 10:43:49 +08:00
										 |  |  |                     response = client.request(method=method, url=url, **kwargs) | 
					
						
							| 
									
										
										
										
											2024-07-25 13:10:39 +08:00
										 |  |  |             else: | 
					
						
							| 
									
										
										
										
											2025-03-14 11:05:37 +09:00
										 |  |  |                 with httpx.Client(verify=HTTP_REQUEST_NODE_SSL_VERIFY) as client: | 
					
						
							| 
									
										
										
										
											2024-10-21 10:43:49 +08:00
										 |  |  |                     response = client.request(method=method, url=url, **kwargs) | 
					
						
							| 
									
										
										
										
											2024-06-24 16:14:59 +08:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2024-07-25 13:10:39 +08:00
										 |  |  |             if response.status_code not in STATUS_FORCELIST: | 
					
						
							|  |  |  |                 return response | 
					
						
							|  |  |  |             else: | 
					
						
							|  |  |  |                 logging.warning(f"Received status code {response.status_code} for URL {url} which is in the force list") | 
					
						
							| 
									
										
										
										
											2024-06-24 16:14:59 +08:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2024-07-25 13:10:39 +08:00
										 |  |  |         except httpx.RequestError as e: | 
					
						
							|  |  |  |             logging.warning(f"Request to URL {url} failed on attempt {retries + 1}: {e}") | 
					
						
							| 
									
										
										
										
											2024-12-23 14:32:11 +08:00
										 |  |  |             if max_retries == 0: | 
					
						
							|  |  |  |                 raise | 
					
						
							| 
									
										
										
										
											2024-06-24 16:14:59 +08:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2024-07-25 13:10:39 +08:00
										 |  |  |         retries += 1 | 
					
						
							|  |  |  |         if retries <= max_retries: | 
					
						
							|  |  |  |             time.sleep(BACKOFF_FACTOR * (2 ** (retries - 1))) | 
					
						
							| 
									
										
										
										
											2024-12-11 14:22:42 +08:00
										 |  |  |     raise MaxRetriesExceededError(f"Reached maximum retries ({max_retries}) for URL {url}") | 
					
						
							| 
									
										
										
										
											2024-06-24 16:14:59 +08:00
										 |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2024-07-25 13:10:39 +08:00
										 |  |  | def get(url, max_retries=SSRF_DEFAULT_MAX_RETRIES, **kwargs): | 
					
						
							| 
									
										
										
										
											2024-09-10 17:00:20 +08:00
										 |  |  |     return make_request("GET", url, max_retries=max_retries, **kwargs) | 
					
						
							| 
									
										
										
										
											2024-06-24 16:14:59 +08:00
										 |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2024-07-25 13:10:39 +08:00
										 |  |  | def post(url, max_retries=SSRF_DEFAULT_MAX_RETRIES, **kwargs): | 
					
						
							| 
									
										
										
										
											2024-09-10 17:00:20 +08:00
										 |  |  |     return make_request("POST", url, max_retries=max_retries, **kwargs) | 
					
						
							| 
									
										
										
										
											2024-06-24 16:14:59 +08:00
										 |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2024-07-25 13:10:39 +08:00
										 |  |  | def put(url, max_retries=SSRF_DEFAULT_MAX_RETRIES, **kwargs): | 
					
						
							| 
									
										
										
										
											2024-09-10 17:00:20 +08:00
										 |  |  |     return make_request("PUT", url, max_retries=max_retries, **kwargs) | 
					
						
							| 
									
										
										
										
											2024-07-25 13:10:39 +08:00
										 |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | def patch(url, max_retries=SSRF_DEFAULT_MAX_RETRIES, **kwargs): | 
					
						
							| 
									
										
										
										
											2024-09-10 17:00:20 +08:00
										 |  |  |     return make_request("PATCH", url, max_retries=max_retries, **kwargs) | 
					
						
							| 
									
										
										
										
											2024-07-25 13:10:39 +08:00
										 |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | def delete(url, max_retries=SSRF_DEFAULT_MAX_RETRIES, **kwargs): | 
					
						
							| 
									
										
										
										
											2024-09-10 17:00:20 +08:00
										 |  |  |     return make_request("DELETE", url, max_retries=max_retries, **kwargs) | 
					
						
							| 
									
										
										
										
											2024-07-25 13:10:39 +08:00
										 |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | def head(url, max_retries=SSRF_DEFAULT_MAX_RETRIES, **kwargs): | 
					
						
							| 
									
										
										
										
											2024-09-10 17:00:20 +08:00
										 |  |  |     return make_request("HEAD", url, max_retries=max_retries, **kwargs) |