haystack/test/components/generators/conftest.py

# SPDX-FileCopyrightText: 2022-present deepset GmbH <info@deepset.ai>
#
# SPDX-License-Identifier: Apache-2.0
from datetime import datetime
from typing import Iterator
from unittest.mock import MagicMock, patch, AsyncMock

import pytest
from openai import AsyncStream, Stream
from openai.types.chat import ChatCompletion, ChatCompletionChunk
from openai.types.chat import chat_completion_chunk


@pytest.fixture
def mock_auto_tokenizer():
    """
    Patch `transformers.AutoTokenizer.from_pretrained` and yield the tokenizer mock it returns.

    While the fixture is active, `from_pretrained` is replaced (with `autospec=True`) by a mock whose return
    value is a single `MagicMock`. That same `MagicMock` is what the fixture yields, so a test holds the exact
    object that any call to the patched `from_pretrained` hands back.
    """
    tokenizer_double = MagicMock()

    with patch("transformers.AutoTokenizer.from_pretrained", autospec=True) as from_pretrained_patch:
        from_pretrained_patch.return_value = tokenizer_double
        yield tokenizer_double


class OpenAIMockStream(Stream[ChatCompletionChunk]):
    """
    `Stream` subclass used as a test double: iterating it produces one predefined `ChatCompletionChunk`.
    """

    def __init__(self, mock_chunk: ChatCompletionChunk, client=None, *args, **kwargs):
        """
        Store the chunk to emit and initialize the parent `Stream`.

        :param mock_chunk: The chunk that `__stream__` yields.
        :param client: Client forwarded to the parent initializer; a `MagicMock` is substituted when falsy.
        :param args: Extra positional arguments forwarded to the parent initializer.
        :param kwargs: Extra keyword arguments forwarded to the parent initializer.
        """
        # A missing (or otherwise falsy) client is replaced by a MagicMock stand-in.
        if not client:
            client = MagicMock()
        super().__init__(*args, client=client, **kwargs)
        self.mock_chunk = mock_chunk

    def __stream__(self) -> Iterator[ChatCompletionChunk]:
        # The stored chunk is the only item this stream ever emits.
        yield self.mock_chunk


class OpenAIAsyncMockStream(AsyncStream[ChatCompletionChunk]):
    """
    `AsyncStream` subclass used as a test double: async iteration produces one predefined chunk.

    The parent initializer is not invoked; the instance only stores the chunk and implements the
    async-iterator protocol (`__aiter__` / `__anext__`) itself.
    """

    def __init__(self, mock_chunk: ChatCompletionChunk):
        """
        :param mock_chunk: The chunk returned by the first `__anext__` call.
        """
        self.mock_chunk = mock_chunk

    def __aiter__(self):
        # The instance acts as its own async iterator.
        return self

    async def __anext__(self):
        # `_done` is only created by the first call, so its presence means the chunk was already delivered.
        if hasattr(self, "_done"):
            raise StopAsyncIteration
        self._done = True
        return self.mock_chunk


@pytest.fixture
def openai_mock_stream():
    """
    Provide the `OpenAIMockStream` class so tests can instantiate mock streams around chunks of their choosing.
    """
    stream_factory = OpenAIMockStream
    return stream_factory


@pytest.fixture
def openai_mock_stream_async():
    """
    Provide the `OpenAIAsyncMockStream` class so tests can instantiate async mock streams around chunks of
    their choosing.
    """
    async_stream_factory = OpenAIAsyncMockStream
    return async_stream_factory


@pytest.fixture
def openai_mock_chat_completion():
    """
    Patch the synchronous OpenAI chat-completions `create` method so it returns a canned `ChatCompletion`.

    The canned response holds a single assistant choice ("Hello world!") plus fixed token usage. The patched
    `create` mock itself is yielded, which lets tests inspect how it was called.
    """
    # Assemble the canned response up front; it does not depend on the patch being active.
    assistant_choice = {
        "finish_reason": "stop",
        "logprobs": None,
        "index": 0,
        "message": {"content": "Hello world!", "role": "assistant"},
    }
    token_usage = {"prompt_tokens": 57, "completion_tokens": 40, "total_tokens": 97}
    canned_response = ChatCompletion(
        id="foo",
        model="gpt-4",
        object="chat.completion",
        choices=[assistant_choice],
        created=int(datetime.now().timestamp()),
        usage=token_usage,
    )

    with patch("openai.resources.chat.completions.Completions.create") as mock_chat_completion_create:
        mock_chat_completion_create.return_value = canned_response
        yield mock_chat_completion_create


@pytest.fixture
async def openai_mock_async_chat_completion():
    """
    Patch the asynchronous OpenAI chat-completions `create` method so awaiting it returns a canned
    `ChatCompletion`.

    The replacement is an `AsyncMock`; its return value is a response with a single assistant choice
    ("Hello world!") plus fixed token usage. The patched mock is yielded so tests can inspect its calls.
    """
    # NOTE(review): being an async generator, this fixture presumably relies on an async-aware pytest plugin
    # to drive it — confirm against the project's pytest configuration.
    assistant_choice = {
        "finish_reason": "stop",
        "logprobs": None,
        "index": 0,
        "message": {"content": "Hello world!", "role": "assistant"},
    }
    token_usage = {"prompt_tokens": 57, "completion_tokens": 40, "total_tokens": 97}
    canned_response = ChatCompletion(
        id="foo",
        model="gpt-4",
        object="chat.completion",
        choices=[assistant_choice],
        created=int(datetime.now().timestamp()),
        usage=token_usage,
    )

    async_create_target = "openai.resources.chat.completions.AsyncCompletions.create"
    with patch(async_create_target, new_callable=AsyncMock) as mock_chat_completion_create:
        mock_chat_completion_create.return_value = canned_response
        yield mock_chat_completion_create


@pytest.fixture
def openai_mock_chat_completion_chunk():
    """
    Patch the synchronous OpenAI chat-completions `create` method so it returns a one-chunk mock stream.

    The stream is an `OpenAIMockStream` wrapping a single `ChatCompletionChunk` whose delta carries the
    assistant content "Hello" and whose `usage` is `None`. The patched `create` mock is yielded.
    """
    # Build the chunk from the inside out: delta -> choice -> chunk.
    assistant_delta = chat_completion_chunk.ChoiceDelta(content="Hello", role="assistant")
    only_choice = chat_completion_chunk.Choice(
        finish_reason="stop",
        logprobs=None,
        index=0,
        delta=assistant_delta,
    )
    canned_chunk = ChatCompletionChunk(
        id="foo",
        model="gpt-4",
        object="chat.completion.chunk",
        choices=[only_choice],
        created=int(datetime.now().timestamp()),
        usage=None,
    )

    with patch("openai.resources.chat.completions.Completions.create") as mock_chat_completion_create:
        single_chunk_stream = OpenAIMockStream(canned_chunk, cast_to=None, response=None, client=None)
        mock_chat_completion_create.return_value = single_chunk_stream
        yield mock_chat_completion_create


@pytest.fixture
async def openai_mock_async_chat_completion_chunk():
    """
    Patch the asynchronous OpenAI chat-completions `create` method so awaiting it returns a one-chunk
    async mock stream.

    The replacement is an `AsyncMock` whose return value is an `OpenAIAsyncMockStream` wrapping a single
    `ChatCompletionChunk` (assistant content "Hello", `usage` set to `None`). The patched mock is yielded.
    """
    # NOTE(review): being an async generator, this fixture presumably relies on an async-aware pytest plugin
    # to drive it — confirm against the project's pytest configuration.
    assistant_delta = chat_completion_chunk.ChoiceDelta(content="Hello", role="assistant")
    only_choice = chat_completion_chunk.Choice(
        finish_reason="stop",
        logprobs=None,
        index=0,
        delta=assistant_delta,
    )
    canned_chunk = ChatCompletionChunk(
        id="foo",
        model="gpt-4",
        object="chat.completion.chunk",
        choices=[only_choice],
        created=int(datetime.now().timestamp()),
        usage=None,
    )

    async_create_target = "openai.resources.chat.completions.AsyncCompletions.create"
    with patch(async_create_target, new_callable=AsyncMock) as mock_chat_completion_create:
        mock_chat_completion_create.return_value = OpenAIAsyncMockStream(canned_chunk)
        yield mock_chat_completion_create
chore: add license header to all modules (#7675) * add license header to modules * check license header at linting time 2024-05-09 15:40:36 +02:00			`# SPDX-FileCopyrightText: 2022-present deepset GmbH <info@deepset.ai>`
			`#`
			`# SPDX-License-Identifier: Apache-2.0`
feat: Update OpenAI Python Client in Haystack 2.x (#6584) * Update openai python client * Add release note * Consolidate multiple mock_chat_completion into one * Ensure all components have api_base_url, organization params * Update tests * Enable function calling * Oversight * Minor fixes, add streaming test mocks * Apply suggestions from code review Co-authored-by: Daria Fokina <daria.fokina@deepset.ai> * metadata -> meta --------- Co-authored-by: Massimiliano Pippi <mpippi@gmail.com> Co-authored-by: Daria Fokina <daria.fokina@deepset.ai> 2023-12-21 16:21:24 +01:00			`from datetime import datetime`
			`from typing import Iterator`
Add `run_async` to `OpenAIChatGenerator` (#8880) * Implememntation of run_async (wip) * Add missing tests ; Move async tests to test_openai_async.py * Add release note * Update docstring * Alignments with haystack-experimental implementation * Lint: removed unused imports * Update haystack/components/generators/chat/openai.py Co-authored-by: Stefano Fiorucci <stefanofiorucci@gmail.com> --------- Co-authored-by: Stefano Fiorucci <stefanofiorucci@gmail.com> 2025-02-20 17:51:46 +01:00			`from unittest.mock import MagicMock, patch, AsyncMock`
feat: Add `HuggingFaceTGIChatGenerator` Haystack 2.x component (#6199) * Add ChatHuggingFaceTGIGenerator * Add release note --------- Co-authored-by: Daria Fokina <daria.fokina@deepset.ai> Co-authored-by: Stefano Fiorucci <44616784+anakin87@users.noreply.github.com> 2023-11-06 09:48:45 +01:00
			`import pytest`
Add `run_async` to `OpenAIChatGenerator` (#8880) * Implememntation of run_async (wip) * Add missing tests ; Move async tests to test_openai_async.py * Add release note * Update docstring * Alignments with haystack-experimental implementation * Lint: removed unused imports * Update haystack/components/generators/chat/openai.py Co-authored-by: Stefano Fiorucci <stefanofiorucci@gmail.com> --------- Co-authored-by: Stefano Fiorucci <stefanofiorucci@gmail.com> 2025-02-20 17:51:46 +01:00			`from openai import AsyncStream, Stream`
fix: allow support for `include_usage` in streaming using OpenAIChatGenerator (#8968) * fix error in handling usage completion chunk 2025-03-05 22:30:26 +05:00			`from openai.types.chat import ChatCompletion, ChatCompletionChunk`
feat: support for tools in `OpenAIChatGenerator` (#8666) * move chatmsg>openai conversion to chatmsg dataclass * implementation and tests cleanup * release note * try fixing azure chat generator * add serde test for toolinvoker * small fix 2024-12-20 15:20:54 +01:00			`from openai.types.chat import chat_completion_chunk`
feat: Add `HuggingFaceTGIChatGenerator` Haystack 2.x component (#6199) * Add ChatHuggingFaceTGIGenerator * Add release note --------- Co-authored-by: Daria Fokina <daria.fokina@deepset.ai> Co-authored-by: Stefano Fiorucci <44616784+anakin87@users.noreply.github.com> 2023-11-06 09:48:45 +01:00

			`@pytest.fixture`
			`def mock_auto_tokenizer():`
			`"""`
			`In the original mock_auto_tokenizer fixture, we were mocking the transformers.AutoTokenizer.from_pretrained`
			`method directly, but we were not providing a return value for this method. Therefore, when from_pretrained`
			`was called within HuggingFaceTGIChatGenerator, it returned None because that's the default behavior of a`
			`MagicMock object when a return value isn't specified.`

			`We will update the mock_auto_tokenizer fixture to return a MagicMock object when from_pretrained is called`
			`in another PR. For now, we will use this fixture to mock the AutoTokenizer.from_pretrained method.`
			`"""`

			`with patch("transformers.AutoTokenizer.from_pretrained", autospec=True) as mock_from_pretrained:`
			`mock_tokenizer = MagicMock()`
			`mock_from_pretrained.return_value = mock_tokenizer`
			`yield mock_tokenizer`
feat: Update OpenAI Python Client in Haystack 2.x (#6584) * Update openai python client * Add release note * Consolidate multiple mock_chat_completion into one * Ensure all components have api_base_url, organization params * Update tests * Enable function calling * Oversight * Minor fixes, add streaming test mocks * Apply suggestions from code review Co-authored-by: Daria Fokina <daria.fokina@deepset.ai> * metadata -> meta --------- Co-authored-by: Massimiliano Pippi <mpippi@gmail.com> Co-authored-by: Daria Fokina <daria.fokina@deepset.ai> 2023-12-21 16:21:24 +01:00

feat: support for tools in `OpenAIChatGenerator` (#8666) * move chatmsg>openai conversion to chatmsg dataclass * implementation and tests cleanup * release note * try fixing azure chat generator * add serde test for toolinvoker * small fix 2024-12-20 15:20:54 +01:00			`class OpenAIMockStream(Stream[ChatCompletionChunk]):`
			`def __init__(self, mock_chunk: ChatCompletionChunk, client=None, *args, **kwargs):`
			`client = client or MagicMock()`
			`super().__init__(client=client, *args, **kwargs)`
			`self.mock_chunk = mock_chunk`

			`def __stream__(self) -> Iterator[ChatCompletionChunk]:`
			`yield self.mock_chunk`


Add `run_async` to `OpenAIChatGenerator` (#8880) * Implememntation of run_async (wip) * Add missing tests ; Move async tests to test_openai_async.py * Add release note * Update docstring * Alignments with haystack-experimental implementation * Lint: removed unused imports * Update haystack/components/generators/chat/openai.py Co-authored-by: Stefano Fiorucci <stefanofiorucci@gmail.com> --------- Co-authored-by: Stefano Fiorucci <stefanofiorucci@gmail.com> 2025-02-20 17:51:46 +01:00			`class OpenAIAsyncMockStream(AsyncStream[ChatCompletionChunk]):`
			`def __init__(self, mock_chunk: ChatCompletionChunk):`
			`self.mock_chunk = mock_chunk`

			`def __aiter__(self):`
			`return self`

			`async def __anext__(self):`
			`# Only yield once, then stop iteration`
			`if not hasattr(self, "_done"):`
			`self._done = True`
			`return self.mock_chunk`
			`raise StopAsyncIteration`


feat: Update OpenAI Python Client in Haystack 2.x (#6584) * Update openai python client * Add release note * Consolidate multiple mock_chat_completion into one * Ensure all components have api_base_url, organization params * Update tests * Enable function calling * Oversight * Minor fixes, add streaming test mocks * Apply suggestions from code review Co-authored-by: Daria Fokina <daria.fokina@deepset.ai> * metadata -> meta --------- Co-authored-by: Massimiliano Pippi <mpippi@gmail.com> Co-authored-by: Daria Fokina <daria.fokina@deepset.ai> 2023-12-21 16:21:24 +01:00			`@pytest.fixture`
feat: support for tools in `OpenAIChatGenerator` (#8666) * move chatmsg>openai conversion to chatmsg dataclass * implementation and tests cleanup * release note * try fixing azure chat generator * add serde test for toolinvoker * small fix 2024-12-20 15:20:54 +01:00			`def openai_mock_stream():`
feat: Update OpenAI Python Client in Haystack 2.x (#6584) * Update openai python client * Add release note * Consolidate multiple mock_chat_completion into one * Ensure all components have api_base_url, organization params * Update tests * Enable function calling * Oversight * Minor fixes, add streaming test mocks * Apply suggestions from code review Co-authored-by: Daria Fokina <daria.fokina@deepset.ai> * metadata -> meta --------- Co-authored-by: Massimiliano Pippi <mpippi@gmail.com> Co-authored-by: Daria Fokina <daria.fokina@deepset.ai> 2023-12-21 16:21:24 +01:00			`"""`
feat: support for tools in `OpenAIChatGenerator` (#8666) * move chatmsg>openai conversion to chatmsg dataclass * implementation and tests cleanup * release note * try fixing azure chat generator * add serde test for toolinvoker * small fix 2024-12-20 15:20:54 +01:00			`Fixture that returns a function to create MockStream instances with custom chunks`
			`"""`
			`return OpenAIMockStream`


Add `run_async` to `OpenAIChatGenerator` (#8880) * Implememntation of run_async (wip) * Add missing tests ; Move async tests to test_openai_async.py * Add release note * Update docstring * Alignments with haystack-experimental implementation * Lint: removed unused imports * Update haystack/components/generators/chat/openai.py Co-authored-by: Stefano Fiorucci <stefanofiorucci@gmail.com> --------- Co-authored-by: Stefano Fiorucci <stefanofiorucci@gmail.com> 2025-02-20 17:51:46 +01:00			`@pytest.fixture`
			`def openai_mock_stream_async():`
			`"""`
			`Fixture that returns a function to create AsyncMockStream instances with custom chunks`
			`"""`
			`return OpenAIAsyncMockStream`


feat: support for tools in `OpenAIChatGenerator` (#8666) * move chatmsg>openai conversion to chatmsg dataclass * implementation and tests cleanup * release note * try fixing azure chat generator * add serde test for toolinvoker * small fix 2024-12-20 15:20:54 +01:00			`@pytest.fixture`
			`def openai_mock_chat_completion():`
			`"""`
			`Mock the OpenAI API completion response and reuse it for tests`
feat: Update OpenAI Python Client in Haystack 2.x (#6584) * Update openai python client * Add release note * Consolidate multiple mock_chat_completion into one * Ensure all components have api_base_url, organization params * Update tests * Enable function calling * Oversight * Minor fixes, add streaming test mocks * Apply suggestions from code review Co-authored-by: Daria Fokina <daria.fokina@deepset.ai> * metadata -> meta --------- Co-authored-by: Massimiliano Pippi <mpippi@gmail.com> Co-authored-by: Daria Fokina <daria.fokina@deepset.ai> 2023-12-21 16:21:24 +01:00			`"""`
feat: support for tools in `OpenAIChatGenerator` (#8666) * move chatmsg>openai conversion to chatmsg dataclass * implementation and tests cleanup * release note * try fixing azure chat generator * add serde test for toolinvoker * small fix 2024-12-20 15:20:54 +01:00			`with patch("openai.resources.chat.completions.Completions.create") as mock_chat_completion_create:`
			`completion = ChatCompletion(`
			`id="foo",`
			`model="gpt-4",`
			`object="chat.completion",`
			`choices=[`
			`{`
			`"finish_reason": "stop",`
			`"logprobs": None,`
			`"index": 0,`
			`"message": {"content": "Hello world!", "role": "assistant"},`
			`}`
			`],`
			`created=int(datetime.now().timestamp()),`
			`usage={"prompt_tokens": 57, "completion_tokens": 40, "total_tokens": 97},`
			`)`

			`mock_chat_completion_create.return_value = completion`
			`yield mock_chat_completion_create`
feat: Update OpenAI Python Client in Haystack 2.x (#6584) * Update openai python client * Add release note * Consolidate multiple mock_chat_completion into one * Ensure all components have api_base_url, organization params * Update tests * Enable function calling * Oversight * Minor fixes, add streaming test mocks * Apply suggestions from code review Co-authored-by: Daria Fokina <daria.fokina@deepset.ai> * metadata -> meta --------- Co-authored-by: Massimiliano Pippi <mpippi@gmail.com> Co-authored-by: Daria Fokina <daria.fokina@deepset.ai> 2023-12-21 16:21:24 +01:00

Add `run_async` to `OpenAIChatGenerator` (#8880) * Implememntation of run_async (wip) * Add missing tests ; Move async tests to test_openai_async.py * Add release note * Update docstring * Alignments with haystack-experimental implementation * Lint: removed unused imports * Update haystack/components/generators/chat/openai.py Co-authored-by: Stefano Fiorucci <stefanofiorucci@gmail.com> --------- Co-authored-by: Stefano Fiorucci <stefanofiorucci@gmail.com> 2025-02-20 17:51:46 +01:00			`@pytest.fixture`
			`async def openai_mock_async_chat_completion():`
			`"""`
			`Mock the OpenAI API completion response and reuse it for async tests`
			`"""`
			`with patch(`
			`"openai.resources.chat.completions.AsyncCompletions.create", new_callable=AsyncMock`
			`) as mock_chat_completion_create:`
			`completion = ChatCompletion(`
			`id="foo",`
			`model="gpt-4",`
			`object="chat.completion",`
			`choices=[`
			`{`
			`"finish_reason": "stop",`
			`"logprobs": None,`
			`"index": 0,`
			`"message": {"content": "Hello world!", "role": "assistant"},`
			`}`
			`],`
			`created=int(datetime.now().timestamp()),`
			`usage={"prompt_tokens": 57, "completion_tokens": 40, "total_tokens": 97},`
			`)`

			`mock_chat_completion_create.return_value = completion`
			`yield mock_chat_completion_create`


feat: support for tools in `OpenAIChatGenerator` (#8666) * move chatmsg>openai conversion to chatmsg dataclass * implementation and tests cleanup * release note * try fixing azure chat generator * add serde test for toolinvoker * small fix 2024-12-20 15:20:54 +01:00			`@pytest.fixture`
			`def openai_mock_chat_completion_chunk():`
			`"""`
			`Mock the OpenAI API completion chunk response and reuse it for tests`
			`"""`
feat: Update OpenAI Python Client in Haystack 2.x (#6584) * Update openai python client * Add release note * Consolidate multiple mock_chat_completion into one * Ensure all components have api_base_url, organization params * Update tests * Enable function calling * Oversight * Minor fixes, add streaming test mocks * Apply suggestions from code review Co-authored-by: Daria Fokina <daria.fokina@deepset.ai> * metadata -> meta --------- Co-authored-by: Massimiliano Pippi <mpippi@gmail.com> Co-authored-by: Daria Fokina <daria.fokina@deepset.ai> 2023-12-21 16:21:24 +01:00
			`with patch("openai.resources.chat.completions.Completions.create") as mock_chat_completion_create:`
			`completion = ChatCompletionChunk(`
			`id="foo",`
			`model="gpt-4",`
			`object="chat.completion.chunk",`
			`choices=[`
feat: support for tools in `OpenAIChatGenerator` (#8666) * move chatmsg>openai conversion to chatmsg dataclass * implementation and tests cleanup * release note * try fixing azure chat generator * add serde test for toolinvoker * small fix 2024-12-20 15:20:54 +01:00			`chat_completion_chunk.Choice(`
			`finish_reason="stop",`
			`logprobs=None,`
			`index=0,`
			`delta=chat_completion_chunk.ChoiceDelta(content="Hello", role="assistant"),`
feat: Update OpenAI Python Client in Haystack 2.x (#6584) * Update openai python client * Add release note * Consolidate multiple mock_chat_completion into one * Ensure all components have api_base_url, organization params * Update tests * Enable function calling * Oversight * Minor fixes, add streaming test mocks * Apply suggestions from code review Co-authored-by: Daria Fokina <daria.fokina@deepset.ai> * metadata -> meta --------- Co-authored-by: Massimiliano Pippi <mpippi@gmail.com> Co-authored-by: Daria Fokina <daria.fokina@deepset.ai> 2023-12-21 16:21:24 +01:00			`)`
			`],`
			`created=int(datetime.now().timestamp()),`
fix: allow support for `include_usage` in streaming using OpenAIChatGenerator (#8968) * fix error in handling usage completion chunk 2025-03-05 22:30:26 +05:00			`usage=None,`
feat: Update OpenAI Python Client in Haystack 2.x (#6584) * Update openai python client * Add release note * Consolidate multiple mock_chat_completion into one * Ensure all components have api_base_url, organization params * Update tests * Enable function calling * Oversight * Minor fixes, add streaming test mocks * Apply suggestions from code review Co-authored-by: Daria Fokina <daria.fokina@deepset.ai> * metadata -> meta --------- Co-authored-by: Massimiliano Pippi <mpippi@gmail.com> Co-authored-by: Daria Fokina <daria.fokina@deepset.ai> 2023-12-21 16:21:24 +01:00			`)`
feat: support for tools in `OpenAIChatGenerator` (#8666) * move chatmsg>openai conversion to chatmsg dataclass * implementation and tests cleanup * release note * try fixing azure chat generator * add serde test for toolinvoker * small fix 2024-12-20 15:20:54 +01:00			`mock_chat_completion_create.return_value = OpenAIMockStream(`
			`completion, cast_to=None, response=None, client=None`
			`)`
feat: Update OpenAI Python Client in Haystack 2.x (#6584) * Update openai python client * Add release note * Consolidate multiple mock_chat_completion into one * Ensure all components have api_base_url, organization params * Update tests * Enable function calling * Oversight * Minor fixes, add streaming test mocks * Apply suggestions from code review Co-authored-by: Daria Fokina <daria.fokina@deepset.ai> * metadata -> meta --------- Co-authored-by: Massimiliano Pippi <mpippi@gmail.com> Co-authored-by: Daria Fokina <daria.fokina@deepset.ai> 2023-12-21 16:21:24 +01:00			`yield mock_chat_completion_create`
Add `run_async` to `OpenAIChatGenerator` (#8880) * Implememntation of run_async (wip) * Add missing tests ; Move async tests to test_openai_async.py * Add release note * Update docstring * Alignments with haystack-experimental implementation * Lint: removed unused imports * Update haystack/components/generators/chat/openai.py Co-authored-by: Stefano Fiorucci <stefanofiorucci@gmail.com> --------- Co-authored-by: Stefano Fiorucci <stefanofiorucci@gmail.com> 2025-02-20 17:51:46 +01:00

			`@pytest.fixture`
			`async def openai_mock_async_chat_completion_chunk():`
			`"""`
			`Mock the OpenAI API completion chunk response and reuse it for async tests`
			`"""`
			`with patch(`
			`"openai.resources.chat.completions.AsyncCompletions.create", new_callable=AsyncMock`
			`) as mock_chat_completion_create:`
			`completion = ChatCompletionChunk(`
			`id="foo",`
			`model="gpt-4",`
			`object="chat.completion.chunk",`
			`choices=[`
			`chat_completion_chunk.Choice(`
			`finish_reason="stop",`
			`logprobs=None,`
			`index=0,`
			`delta=chat_completion_chunk.ChoiceDelta(content="Hello", role="assistant"),`
			`)`
			`],`
			`created=int(datetime.now().timestamp()),`
fix: allow support for `include_usage` in streaming using OpenAIChatGenerator (#8968) * fix error in handling usage completion chunk 2025-03-05 22:30:26 +05:00			`usage=None,`
Add `run_async` to `OpenAIChatGenerator` (#8880) * Implememntation of run_async (wip) * Add missing tests ; Move async tests to test_openai_async.py * Add release note * Update docstring * Alignments with haystack-experimental implementation * Lint: removed unused imports * Update haystack/components/generators/chat/openai.py Co-authored-by: Stefano Fiorucci <stefanofiorucci@gmail.com> --------- Co-authored-by: Stefano Fiorucci <stefanofiorucci@gmail.com> 2025-02-20 17:51:46 +01:00			`)`
			`mock_chat_completion_create.return_value = OpenAIAsyncMockStream(completion)`
			`yield mock_chat_completion_create`