deepset-ai · masci · May 15, 2024 · Apr 30, 2024 · Apr 30, 2024 · May 6, 2024
@@ -2,6 +2,7 @@
 #
 # SPDX-License-Identifier: Apache-2.0
 
+import os
 from typing import Any, Dict, List, Optional, Tuple
 
 from openai import OpenAI
@@ -49,6 +50,9 @@ def __init__(
  """
  Create a OpenAIDocumentEmbedder component.
 
+ By setting the 'OPENAI_TIMEOUT' and 'OPENAI_MAX_RETRIES' environment variables, you can change the timeout and max_retries parameters in the OpenAI client.
+
+
  :param api_key:
  The OpenAI API key.
  :param model:
@@ -86,7 +90,13 @@ def __init__(
  self.meta_fields_to_embed = meta_fields_to_embed or []
  self.embedding_separator = embedding_separator
 
- self.client = OpenAI(api_key=api_key.resolve_value(), organization=organization, base_url=api_base_url)
+ self.client = OpenAI(
+ api_key=api_key.resolve_value(),
+ organization=organization,
+ base_url=api_base_url,
+ timeout=float(os.environ.get("OPENAI_TIMEOUT", 30)),
+ max_retries=int(os.environ.get("OPENAI_MAX_RETRIES", 5)),
+ )
 
  def _get_telemetry_data(self) -> Dict[str, Any]:
  """

@@ -2,13 +2,17 @@
 #
 # SPDX-License-Identifier: Apache-2.0
 
+import os
 from typing import Any, Dict, List, Optional
 
 from openai import OpenAI
 
 from haystack import component, default_from_dict, default_to_dict
 from haystack.utils import Secret, deserialize_secrets_inplace
 
+OPENAI_TIMEOUT = float(os.environ.get("OPENAI_TIMEOUT", 30))  # read once at import; was wrongly keyed on OPENAI_API_KEY
+OPENAI_MAX_RETRIES = int(os.environ.get("OPENAI_MAX_RETRIES", 5))  # read once at import
+
 
 @component
 class OpenAITextEmbedder:
@@ -44,6 +48,8 @@ def __init__(
  """
  Create an OpenAITextEmbedder component.
 
+ By setting the 'OPENAI_TIMEOUT' and 'OPENAI_MAX_RETRIES' environment variables, you can change the timeout and max_retries parameters in the OpenAI client.
+
  :param api_key:
  The OpenAI API key.
  :param model:
@@ -69,7 +75,13 @@ def __init__(
  self.suffix = suffix
  self.api_key = api_key
 
- self.client = OpenAI(api_key=api_key.resolve_value(), organization=organization, base_url=api_base_url)
+ self.client = OpenAI(
+ api_key=api_key.resolve_value(),
+ organization=organization,
+ base_url=api_base_url,
+ timeout=float(os.environ.get("OPENAI_TIMEOUT", 30)),
+ max_retries=int(os.environ.get("OPENAI_MAX_RETRIES", 5)),
+ )
 
  def _get_telemetry_data(self) -> Dict[str, Any]:
  """

@@ -4,6 +4,7 @@
 
 import copy
 import json
+import os
 from typing import Any, Callable, Dict, List, Optional, Union
 
 from openai import OpenAI, Stream
@@ -82,6 +83,8 @@ def __init__(
  Creates an instance of OpenAIChatGenerator. Unless specified otherwise in the `model`, this is for OpenAI's
  GPT-3.5 model.
 
+ By setting the 'OPENAI_TIMEOUT' and 'OPENAI_MAX_RETRIES' environment variables, you can change the timeout and max_retries parameters in the OpenAI client.
+
  :param api_key: The OpenAI API key.
  :param model: The name of the model to use.
  :param streaming_callback: A callback function that is called when a new token is received from the stream.
@@ -115,7 +118,13 @@ def __init__(
  self.streaming_callback = streaming_callback
  self.api_base_url = api_base_url
  self.organization = organization
- self.client = OpenAI(api_key=api_key.resolve_value(), organization=organization, base_url=api_base_url)
+ self.client = OpenAI(
+ api_key=api_key.resolve_value(),
+ organization=organization,
+ base_url=api_base_url,
+ timeout=float(os.environ.get("OPENAI_TIMEOUT", 30)),
+ max_retries=int(os.environ.get("OPENAI_MAX_RETRIES", 5)),
+ )
 
  def _get_telemetry_data(self) -> Dict[str, Any]:
  """

@@ -2,6 +2,7 @@
 #
 # SPDX-License-Identifier: Apache-2.0
 
+import os
 from typing import Any, Callable, Dict, List, Optional, Union
 
 from openai import OpenAI, Stream
@@ -64,6 +65,9 @@ def __init__(
  """
  Creates an instance of OpenAIGenerator. Unless specified otherwise in the `model`, this is for OpenAI's GPT-3.5 model.
 
+ By setting the 'OPENAI_TIMEOUT' and 'OPENAI_MAX_RETRIES' environment variables, you can change the timeout and max_retries parameters in the OpenAI client.
+
+
  :param api_key: The OpenAI API key.
  :param model: The name of the model to use.
  :param streaming_callback: A callback function that is called when a new token is received from the stream.
@@ -101,7 +105,13 @@ def __init__(
 
  self.api_base_url = api_base_url
  self.organization = organization
- self.client = OpenAI(api_key=api_key.resolve_value(), organization=organization, base_url=api_base_url)
+ self.client = OpenAI(
+ api_key=api_key.resolve_value(),
+ organization=organization,
+ base_url=api_base_url,
+ timeout=float(os.environ.get("OPENAI_TIMEOUT", 30)),
+ max_retries=int(os.environ.get("OPENAI_MAX_RETRIES", 5)),
+ )
 
  def _get_telemetry_data(self) -> Dict[str, Any]:
  """

@@ -12,6 +12,10 @@
 
 logger = logging.getLogger(__name__)
 
+# Any remote API (OpenAI, Cohere etc.)
+HAYSTACK_REMOTE_API_BACKOFF_SEC = "HAYSTACK_REMOTE_API_BACKOFF_SEC"
+HAYSTACK_REMOTE_API_MAX_RETRIES = "HAYSTACK_REMOTE_API_MAX_RETRIES"
+HAYSTACK_REMOTE_API_TIMEOUT_SEC = "HAYSTACK_REMOTE_API_TIMEOUT_SEC"
 
 # This value cannot change during the lifetime of the process
 _IS_DOCKER_CACHE = None

@@ -0,0 +1,9 @@
+---
+highlights: >
+ Add support for the 'OPENAI_TIMEOUT' and 'OPENAI_MAX_RETRIES' environment variables to the OpenAI components.
+enhancements:
+ - |
+ You can now set the timeout and max_retries parameters of the OpenAI client through the 'OPENAI_TIMEOUT' and 'OPENAI_MAX_RETRIES' environment variables.
+issues:
+ - |
+ 7610
@@ -29,6 +29,7 @@ class TestOpenAIDocumentEmbedder:
  def test_init_default(self, monkeypatch):
  monkeypatch.setenv("OPENAI_API_KEY", "fake-api-key")
  embedder = OpenAIDocumentEmbedder()
+ assert embedder.api_key.resolve_value() == "fake-api-key"
  assert embedder.model == "text-embedding-ada-002"
  assert embedder.organization is None
  assert embedder.prefix == ""
@@ -37,10 +38,14 @@ def test_init_default(self, monkeypatch):
  assert embedder.progress_bar is True
  assert embedder.meta_fields_to_embed == []
  assert embedder.embedding_separator == "\n"
+ assert embedder.client.max_retries == 5
+ assert embedder.client.timeout == 30
 
- def test_init_with_parameters(self):
+ def test_init_with_parameters(self, monkeypatch):
+ monkeypatch.setenv("OPENAI_TIMEOUT", "100")
+ monkeypatch.setenv("OPENAI_MAX_RETRIES", "10")
  embedder = OpenAIDocumentEmbedder(
- api_key=Secret.from_token("fake-api-key"),
+ api_key=Secret.from_token("fake-api-key-2"),
  model="model",
  organization="my-org",
  prefix="prefix",
@@ -50,6 +55,7 @@ def test_init_with_parameters(self):
  meta_fields_to_embed=["test_field"],
  embedding_separator=" | ",
  )
+ assert embedder.api_key.resolve_value() == "fake-api-key-2"
  assert embedder.organization == "my-org"
  assert embedder.model == "model"
  assert embedder.prefix == "prefix"
@@ -58,6 +64,8 @@ def test_init_with_parameters(self):
  assert embedder.progress_bar is False
  assert embedder.meta_fields_to_embed == ["test_field"]
  assert embedder.embedding_separator == " | "
+ assert embedder.client.max_retries == 10
+ assert embedder.client.timeout == 100
 
  def test_init_fail_wo_api_key(self, monkeypatch):
  monkeypatch.delenv("OPENAI_API_KEY", raising=False)

@@ -20,8 +20,12 @@ def test_init_default(self, monkeypatch):
  assert embedder.organization is None
  assert embedder.prefix == ""
  assert embedder.suffix == ""
+ assert embedder.client.timeout == 30
+ assert embedder.client.max_retries == 5
 
- def test_init_with_parameters(self):
+ def test_init_with_parameters(self, monkeypatch):
+ monkeypatch.setenv("OPENAI_TIMEOUT", "100")
+ monkeypatch.setenv("OPENAI_MAX_RETRIES", "10")
  embedder = OpenAITextEmbedder(
  api_key=Secret.from_token("fake-api-key"),
  model="model",
@@ -36,6 +40,8 @@ def test_init_with_parameters(self):
  assert embedder.organization == "fake-organization"
  assert embedder.prefix == "prefix"
  assert embedder.suffix == "suffix"
+ assert embedder.client.timeout == 100
+ assert embedder.client.max_retries == 10
 
  def test_init_fail_wo_api_key(self, monkeypatch):
  monkeypatch.delenv("OPENAI_API_KEY", raising=False)

@@ -29,13 +29,17 @@ def test_init_default(self, monkeypatch):
  assert component.model == "gpt-3.5-turbo"
  assert component.streaming_callback is None
  assert not component.generation_kwargs
+ assert component.client.timeout == 30
+ assert component.client.max_retries == 5
 
  def test_init_fail_wo_api_key(self, monkeypatch):
  monkeypatch.delenv("OPENAI_API_KEY", raising=False)
  with pytest.raises(ValueError, match="None of the .* environment variables are set"):
  OpenAIChatGenerator()
 
- def test_init_with_parameters(self):
+ def test_init_with_parameters(self, monkeypatch):
+ monkeypatch.setenv("OPENAI_TIMEOUT", "100")
+ monkeypatch.setenv("OPENAI_MAX_RETRIES", "10")
  component = OpenAIChatGenerator(
  api_key=Secret.from_token("test-api-key"),
  model="gpt-4",
@@ -47,6 +51,8 @@ def test_init_with_parameters(self):
  assert component.model == "gpt-4"
  assert component.streaming_callback is print_streaming_chunk
  assert component.generation_kwargs == {"max_tokens": 10, "some_test_param": "test-params"}
+ assert component.client.timeout == 100
+ assert component.client.max_retries == 10
 
  def test_to_dict_default(self, monkeypatch):
  monkeypatch.setenv("OPENAI_API_KEY", "test-api-key")

@@ -22,13 +22,17 @@ def test_init_default(self, monkeypatch):
  assert component.model == "gpt-3.5-turbo"
  assert component.streaming_callback is None
  assert not component.generation_kwargs
+ assert component.client.timeout == 30
+ assert component.client.max_retries == 5
 
  def test_init_fail_wo_api_key(self, monkeypatch):
  monkeypatch.delenv("OPENAI_API_KEY", raising=False)
  with pytest.raises(ValueError, match="None of the .* environment variables are set"):
  OpenAIGenerator()
 
- def test_init_with_parameters(self):
+ def test_init_with_parameters(self, monkeypatch):
+ monkeypatch.setenv("OPENAI_TIMEOUT", "100")
+ monkeypatch.setenv("OPENAI_MAX_RETRIES", "10")
  component = OpenAIGenerator(
  api_key=Secret.from_token("test-api-key"),
  model="gpt-4",
@@ -40,6 +44,8 @@ def test_init_with_parameters(self):
  assert component.model == "gpt-4"
  assert component.streaming_callback is print_streaming_chunk
  assert component.generation_kwargs == {"max_tokens": 10, "some_test_param": "test-params"}
+ assert component.client.timeout == 100
+ assert component.client.max_retries == 10
 
  def test_to_dict_default(self, monkeypatch):
  monkeypatch.setenv("OPENAI_API_KEY", "test-api-key")