From d03bffab8b431a8a97fb0542a91ba25fd87bab03 Mon Sep 17 00:00:00 2001
From: x110
Date: Sun, 19 Nov 2023 19:32:09 +0400
Subject: [PATCH] Promptnode timeout (#6282)

---
 haystack/nodes/prompt/invocation_layer/chatgpt.py     | 12 +++++++++---
 haystack/nodes/prompt/invocation_layer/open_ai.py     |  2 ++
 haystack/nodes/prompt/prompt_model.py                 |  3 +++
 haystack/nodes/prompt/prompt_node.py                  |  2 ++
 haystack/utils/openai_utils.py                        |  4 +++-
 ...d-timeout-arg-to-promptnode-de11f17733344052.yaml  |  4 ++++
 6 files changed, 23 insertions(+), 4 deletions(-)
 create mode 100644 releasenotes/notes/add-timeout-arg-to-promptnode-de11f17733344052.yaml

diff --git a/haystack/nodes/prompt/invocation_layer/chatgpt.py b/haystack/nodes/prompt/invocation_layer/chatgpt.py
index f3e1a3ef6..65c2df779 100644
--- a/haystack/nodes/prompt/invocation_layer/chatgpt.py
+++ b/haystack/nodes/prompt/invocation_layer/chatgpt.py
@@ -33,6 +33,7 @@ class ChatGPTInvocationLayer(OpenAIInvocationLayer):
         model_name_or_path: str = "gpt-3.5-turbo",
         max_length: Optional[int] = 500,
         api_base: str = "https://api.openai.com/v1",
+        timeout: Optional[float] = None,
         **kwargs,
     ):
         """
@@ -48,7 +49,7 @@ class ChatGPTInvocationLayer(OpenAIInvocationLayer):
         sensitive content using the [OpenAI Moderation API](https://platform.openai.com/docs/guides/moderation) if set.
         If the input or answers are flagged, an empty list is returned in place of the answers.
         """
-        super().__init__(api_key, model_name_or_path, max_length, api_base=api_base, **kwargs)
+        super().__init__(api_key, model_name_or_path, max_length, api_base=api_base, timeout=timeout, **kwargs)

     def _extract_token(self, event_data: Dict[str, Any]):
         delta = event_data["choices"][0]["delta"]
@@ -192,12 +193,17 @@ class ChatGPTInvocationLayer(OpenAIInvocationLayer):
         extra_payload = {"messages": messages}
         payload = {**base_payload, **extra_payload}
         if not stream:
-            response = openai_request(url=self.url, headers=self.headers, payload=payload)
+            response = openai_request(url=self.url, headers=self.headers, payload=payload, timeout=self.timeout)
             _check_openai_finish_reason(result=response, payload=payload)
             assistant_response = [choice["message"]["content"].strip() for choice in response["choices"]]
         else:
             response = openai_request(
-                url=self.url, headers=self.headers, payload=payload, read_response=False, stream=True
+                url=self.url,
+                headers=self.headers,
+                payload=payload,
+                timeout=self.timeout,
+                read_response=False,
+                stream=True,
             )
             handler: TokenStreamingHandler = kwargs_with_defaults.pop("stream_handler", DefaultTokenStreamingHandler())
             assistant_response = self._process_streaming_response(response=response, stream_handler=handler)
diff --git a/haystack/nodes/prompt/invocation_layer/open_ai.py b/haystack/nodes/prompt/invocation_layer/open_ai.py
index 85bae198b..825da2623 100644
--- a/haystack/nodes/prompt/invocation_layer/open_ai.py
+++ b/haystack/nodes/prompt/invocation_layer/open_ai.py
@@ -37,6 +37,7 @@ class OpenAIInvocationLayer(PromptModelInvocationLayer):
         max_length: Optional[int] = 100,
         api_base: str = "https://api.openai.com/v1",
         openai_organization: Optional[str] = None,
+        timeout: Optional[float] = None,
         **kwargs,
     ):
         """
@@ -66,6 +67,7 @@ class OpenAIInvocationLayer(PromptModelInvocationLayer):
         self.api_key = api_key
         self.api_base = api_base
         self.openai_organization = openai_organization
+        self.timeout = timeout

         # 16 is the default length for answers from OpenAI shown in the docs
         # here, https://platform.openai.com/docs/api-reference/completions/create.
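With the two invocation-layer changes above, a caller-supplied timeout is stored on the layer and forwarded to every `openai_request` call, for streaming and non-streaming requests alike. A minimal sketch of the intended usage follows; it imports the class by the module path shown in the diff, and the API key is a placeholder:

```python
from haystack.nodes.prompt.invocation_layer.chatgpt import ChatGPTInvocationLayer

# Construct the layer with a per-layer timeout (seconds). With this patch
# applied, the value is forwarded as openai_request(..., timeout=self.timeout).
layer = ChatGPTInvocationLayer(
    api_key="sk-...",  # placeholder
    model_name_or_path="gpt-3.5-turbo",
    timeout=15.0,
)

# invoke() issues the actual OpenAI call; it now aborts after 15 s instead
# of waiting on the library-wide default.
answers = layer.invoke(prompt="What is the capital of France?")
```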
diff --git a/haystack/nodes/prompt/prompt_model.py b/haystack/nodes/prompt/prompt_model.py
index 437b0fdc4..47ce1ee98 100644
--- a/haystack/nodes/prompt/prompt_model.py
+++ b/haystack/nodes/prompt/prompt_model.py
@@ -36,6 +36,7 @@ class PromptModel(BaseComponent):
         model_name_or_path: str = "google/flan-t5-base",
         max_length: Optional[int] = 100,
         api_key: Optional[str] = None,
+        timeout: Optional[float] = None,
         use_auth_token: Optional[Union[str, bool]] = None,
         use_gpu: Optional[bool] = None,
         devices: Optional[List[Union[str, "torch.device"]]] = None,
@@ -63,6 +64,7 @@
         self.model_name_or_path = model_name_or_path
         self.max_length = max_length
         self.api_key = api_key
+        self.timeout = timeout
         self.use_auth_token = use_auth_token
         self.use_gpu = use_gpu
         self.devices = devices
@@ -75,6 +77,7 @@
     ) -> PromptModelInvocationLayer:
         kwargs = {
             "api_key": self.api_key,
+            "timeout": self.timeout,
             "use_auth_token": self.use_auth_token,
             "use_gpu": self.use_gpu,
             "devices": self.devices,
diff --git a/haystack/nodes/prompt/prompt_node.py b/haystack/nodes/prompt/prompt_node.py
index 2360d5b44..92ec069ac 100644
--- a/haystack/nodes/prompt/prompt_node.py
+++ b/haystack/nodes/prompt/prompt_node.py
@@ -57,6 +57,7 @@ class PromptNode(BaseComponent):
         output_variable: Optional[str] = None,
         max_length: Optional[int] = 100,
         api_key: Optional[str] = None,
+        timeout: Optional[float] = None,
         use_auth_token: Optional[Union[str, bool]] = None,
         use_gpu: Optional[bool] = None,
         devices: Optional[List[Union[str, "torch.device"]]] = None,
@@ -113,6 +114,7 @@
             model_name_or_path=model_name_or_path,
             max_length=max_length,
             api_key=api_key,
+            timeout=timeout,
             use_auth_token=use_auth_token,
             use_gpu=use_gpu,
             devices=devices,
diff --git a/haystack/utils/openai_utils.py b/haystack/utils/openai_utils.py
index c42024eb2..25de13e50 100644
--- a/haystack/utils/openai_utils.py
+++ b/haystack/utils/openai_utils.py
@@ -112,7 +112,7 @@ def openai_request(
     url: str,
     headers: Dict,
     payload: Dict,
-    timeout: Union[float, Tuple[float, float]] = OPENAI_TIMEOUT,
+    timeout: Optional[Union[float, Tuple[float, float]]] = None,
     read_response: Optional[bool] = True,
     **kwargs,
 ):
@@ -124,6 +124,8 @@
     :param timeout: The timeout length of the request. The default is 30s.
     :param read_response: Whether to read the response as JSON. The default is True.
     """
+    if timeout is None:
+        timeout = OPENAI_TIMEOUT
     response = requests.request("POST", url, headers=headers, data=json.dumps(payload), timeout=timeout, **kwargs)
     if read_response:
         json_response = json.loads(response.text)
diff --git a/releasenotes/notes/add-timeout-arg-to-promptnode-de11f17733344052.yaml b/releasenotes/notes/add-timeout-arg-to-promptnode-de11f17733344052.yaml
new file mode 100644
index 000000000..c1ff4630c
--- /dev/null
+++ b/releasenotes/notes/add-timeout-arg-to-promptnode-de11f17733344052.yaml
@@ -0,0 +1,4 @@
+---
+enhancements:
+  - |
+    Introduces a new timeout keyword argument in PromptNode, fixing issue #5380 and giving users control over the timeout of individual calls to OpenAI.
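End to end, the new argument threads through PromptNode → PromptModel → invocation layer → `openai_request`, with `None` falling back to the module-level `OPENAI_TIMEOUT` default (30 s), so existing callers keep the old behaviour. A minimal usage sketch, assuming an OpenAI model and a placeholder key:

```python
from haystack.nodes import PromptNode

# With the patch applied, each request to the OpenAI API now times out
# after 10 seconds; omitting `timeout` keeps the previous 30 s default.
prompt_node = PromptNode(
    model_name_or_path="gpt-3.5-turbo",
    api_key="sk-...",  # placeholder
    timeout=10.0,
)

result = prompt_node("What is the capital of France?")
print(result)
```

Note that `PromptNode` itself annotates `timeout` as a plain float, while `openai_request` additionally accepts a `(connect, read)` tuple for callers that reach it directly.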