# haystack/test/conftest.py

# SPDX-FileCopyrightText: 2022-present deepset GmbH <info@deepset.ai>
#
# SPDX-License-Identifier: Apache-2.0
from datetime import datetime
from pathlib import Path
from test.tracing.utils import SpyingTracer
from typing import Generator
from unittest.mock import Mock, patch

import pytest
from openai.types.chat import ChatCompletion, ChatCompletionMessage
from openai.types.chat.chat_completion import Choice

from haystack import tracing
from haystack.testing.test_utils import set_all_seeds

# NOTE(review): presumably fixes the random seeds so test runs are
# reproducible — confirm against haystack.testing.test_utils.set_all_seeds
set_all_seeds(0)

# Tracing is disabled by default to avoid failures in CI
tracing.disable_tracing()


@pytest.fixture()
def mock_tokenizer():
    """
    Provide a stand-in tokenizer that treats whitespace-separated words as tokens.

    ``encode`` splits the given text with ``str.split()`` and ``decode`` joins
    the given tokens back together with single spaces.
    """

    def _encode(text):
        return text.split()

    def _decode(tokens):
        return " ".join(tokens)

    fake_tokenizer = Mock()
    fake_tokenizer.encode = _encode
    fake_tokenizer.decode = _decode
    return fake_tokenizer


@pytest.fixture()
def test_files_path():
    """
    Return the path of the ``test_files`` directory located next to this module.
    """
    this_module = Path(__file__)
    return this_module.parent.joinpath("test_files")


@pytest.fixture
def mock_chat_completion():
    """
    Patch the OpenAI chat completions ``create`` method with a canned response.

    While the fixture is active, ``Completions.create`` is replaced by a mock
    returning a ``ChatCompletion`` with a single assistant choice. The mock
    itself is yielded so tests can inspect how it was called.
    """
    with patch("openai.resources.chat.completions.Completions.create") as mock_chat_completion_create:
        assistant_message = ChatCompletionMessage(content="Hello world!", role="assistant")
        single_choice = Choice(
            finish_reason="stop",
            logprobs=None,
            index=0,
            message=assistant_message,
        )
        token_usage = {"prompt_tokens": 57, "completion_tokens": 40, "total_tokens": 97}

        mock_chat_completion_create.return_value = ChatCompletion(
            id="foo",
            model="gpt-4",
            object="chat.completion",
            choices=[single_choice],
            created=int(datetime.now().timestamp()),
            usage=token_usage,
        )
        yield mock_chat_completion_create


@pytest.fixture(autouse=True)
def request_blocker(request: pytest.FixtureRequest, monkeypatch):
    """
    Guard against accidental HTTP traffic; applied automatically to all tests.

    Tests carrying the ``integration`` marker are left untouched. For every
    other test, ``urllib3``'s ``HTTPConnectionPool.urlopen`` is replaced with a
    function that raises ``RuntimeError`` describing the request that was about
    to be made.
    """
    is_integration = request.node.get_closest_marker("integration") is not None
    if not is_integration:

        def _refuse_request(self, method, url, *args, **kwargs):
            raise RuntimeError(f"The test was about to {method} {self.scheme}://{self.host}{url}")

        monkeypatch.setattr("urllib3.connectionpool.HTTPConnectionPool.urlopen", _refuse_request)


@pytest.fixture()
def spying_tracer() -> Generator[SpyingTracer, None, None]:
    """
    Enable tracing with a fresh ``SpyingTracer`` and hand it to the test.

    Tracing is disabled again after the test so that other tests are not
    affected.
    """
    spy = SpyingTracer()
    tracing.enable_tracing(spy)

    yield spy

    # Teardown: switch tracing back off once the test is done
    tracing.disable_tracing()
chore: add license header to all modules (#7675) * add license header to modules * check license header at linting time 2024-05-09 15:40:36 +02:00			`# SPDX-FileCopyrightText: 2022-present deepset GmbH <info@deepset.ai>`
			`#`
			`# SPDX-License-Identifier: Apache-2.0`
feat: Update OpenAI Python Client in Haystack 2.x (#6584) * Update openai python client * Add release note * Consolidate multiple mock_chat_completion into one * Ensure all components have api_base_url, organization params * Update tests * Enable function calling * Oversight * Minor fixes, add streaming test mocks * Apply suggestions from code review Co-authored-by: Daria Fokina <daria.fokina@deepset.ai> * metadata -> meta --------- Co-authored-by: Massimiliano Pippi <mpippi@gmail.com> Co-authored-by: Daria Fokina <daria.fokina@deepset.ai> 2023-12-21 16:21:24 +01:00			`from datetime import datetime`
Improve dependency management (#1994) * Fist attempt at using setup.cfg for dependency management * Trying the new package on the CI and in Docker too * Add composite extras_require * Add the safe_import function for document store imports and add some try-catch statements on rest_api and ui imports * Fix bug on class import and rephrase error message * Introduce typing for optional modules and add type: ignore in sparse.py * Include importlib_metadata backport for py3.7 * Add colab group to extra_requires * Fix pillow version * Fix grpcio * Separate out the crawler as another extra * Make paths relative in rest_api and ui * Update the test matrix in the CI * Add try catch statements around the optional imports too to account for direct imports * Never mix direct deps with self-references and add ES deps to the base install * Refactor several paths in tests to make them insensitive to the execution path * Include tstadel review and re-introduce Milvus1 in the tests suite, to fix * Wrap pdf conversion utils into safe_import * Update some tutorials and rever Milvus1 as default for now, see #2067 * Fix mypy config Co-authored-by: github-actions[bot] <41898282+github-actions[bot]@users.noreply.github.com> 2022-01-26 18:12:55 +01:00			`from pathlib import Path`
ci: Skip collection of `test_json_schema.py` to fix CI failures (#7353) * Skip collection of test_json_schema.py to fix CI failures * mock chroma instance * revert --------- Co-authored-by: Massimiliano Pippi <mpippi@gmail.com> 2024-03-13 16:59:26 +01:00			`from test.tracing.utils import SpyingTracer`
feat: implement pipeline tracing (#7046) * feat: implement pipeline tracing * tests: improve test setup for spying tracer * feat: implement util for type coercion * fix: trace a after checking pipeline output * docs: add release notes * docs: drop unused imports * refactor: simplify getting raw span * refactor: implement `ProxyTracer` 2024-02-22 12:52:04 +01:00			`from typing import Generator`
feat: Update OpenAI Python Client in Haystack 2.x (#6584) * Update openai python client * Add release note * Consolidate multiple mock_chat_completion into one * Ensure all components have api_base_url, organization params * Update tests * Enable function calling * Oversight * Minor fixes, add streaming test mocks * Apply suggestions from code review Co-authored-by: Daria Fokina <daria.fokina@deepset.ai> * metadata -> meta --------- Co-authored-by: Massimiliano Pippi <mpippi@gmail.com> Co-authored-by: Daria Fokina <daria.fokina@deepset.ai> 2023-12-21 16:21:24 +01:00			`from unittest.mock import Mock, patch`

Add test for Elasticsearch document store (#88) 2020-05-04 18:00:07 +02:00			`import pytest`
feat: Update OpenAI Python Client in Haystack 2.x (#6584) * Update openai python client * Add release note * Consolidate multiple mock_chat_completion into one * Ensure all components have api_base_url, organization params * Update tests * Enable function calling * Oversight * Minor fixes, add streaming test mocks * Apply suggestions from code review Co-authored-by: Daria Fokina <daria.fokina@deepset.ai> * metadata -> meta --------- Co-authored-by: Massimiliano Pippi <mpippi@gmail.com> Co-authored-by: Daria Fokina <daria.fokina@deepset.ai> 2023-12-21 16:21:24 +01:00			`from openai.types.chat import ChatCompletion, ChatCompletionMessage`
			`from openai.types.chat.chat_completion import Choice`
Add Longform-QA (LFQA), Seq2SeqGenerator for generative QA and Retribert Retriever (#1086) * Integrate LFQA with Haystack * Integrate LFQA with Haystack - unit tests * Properly initialize conftest default value for vector_dim * Update PR after inital feedback * Fix conftest.py import * Seq2SeqGenerator uses Callables instead of subclasses for custom model input * Update docstring * Fix Callable use * Add LFQA tutorials * Improve type error reporting for invalid input converter Callable * Generate docstrings * Format comments in tutorial script * Generate tutorial md * Add usage page Co-authored-by: Malte Pietsch <malte.pietsch@deepset.ai> Co-authored-by: brandenchan <brandenchan@icloud.com> 2021-06-14 17:53:43 +02:00
feat: implement pipeline tracing (#7046) * feat: implement pipeline tracing * tests: improve test setup for spying tracer * feat: implement util for type coercion * fix: trace a after checking pipeline output * docs: add release notes * docs: drop unused imports * refactor: simplify getting raw span * refactor: implement `ProxyTracer` 2024-02-22 12:52:04 +01:00			`from haystack import tracing`
Fix all tests 2023-11-24 14:48:43 +01:00			`from haystack.testing.test_utils import set_all_seeds`
Add test for Elasticsearch document store (#88) 2020-05-04 18:00:07 +02:00
Remove preview folder in test/ --------- Co-authored-by: Silvano Cerza <silvanocerza@gmail.com> 2023-11-24 11:52:55 +01:00			`set_all_seeds(0)`
Introduce readonly DCDocumentStore (without labels support) (#1991) * minimal DCDocumentStore * support filters * implement get_documents_by_id * handle not existing documents * add docstrings * auth added * add tests * generate docs * Add latest docstring and tutorial changes * add responses to dev dependencies * fix tests * support query() and quey_by_embedding() * Add latest docstring and tutorial changes * query tests added * read api_key and api_endpoint from env * Add latest docstring and tutorial changes * support query() and quey_by_embedding() * query tests added * Add latest docstring and tutorial changes * Add latest docstring and tutorial changes * support dynamic similarity and return_embedding values * Add latest docstring and tutorial changes * adjust KeywordDocumentStore description * refactoring * Add latest docstring and tutorial changes * implement get_document_count and raise on all not implemented methods * Add latest docstring and tutorial changes * don't use abbreviation DC in comments and errors * Add latest docstring and tutorial changes * docstring added to KeywordDocumentStore * Add latest docstring and tutorial changes * enhanced api key set * split tests into two parts * change setup.py in order to work around build cache * added link * Add latest docstring and tutorial changes * rename DCDocumentStore to DeepsetCloudDocumentStore * Add latest docstring and tutorial changes * remove dc.py * reinsert link to docs * fix imports * Add latest docstring and tutorial changes * better test structure Co-authored-by: github-actions[bot] <41898282+github-actions[bot]@users.noreply.github.com> Co-authored-by: ArzelaAscoIi <kristof.herrmann@rwth-aachen.de> 2022-01-25 20:36:28 +01:00
Disable tracing when running tests (#7934) 2024-06-26 12:32:05 +02:00			`# Tracing is disable by default to avoid failures in CI`
			`tracing.disable_tracing()`

test: add meta fields for meta_config to be used during testing (#3021) * added meta fields for meta_config to be used during realtime testing of PineconeDocumentStore * Add documentation on metadata filtering in docstring * docs Co-authored-by: Sara Zan <sara.zanzottera@deepset.ai> 2022-08-12 09:27:56 +01:00
Remove preview folder in test/ --------- Co-authored-by: Silvano Cerza <silvanocerza@gmail.com> 2023-11-24 11:52:55 +01:00			`@pytest.fixture()`
			`def mock_tokenizer():`
test: add version deprecation fixture (#3851) * add fixture * Update test/conftest.py * remove +2 and add tests * few typos * more cases * Update test/conftest.py 2023-01-16 15:36:14 +01:00			`"""`
Remove preview folder in test/ --------- Co-authored-by: Silvano Cerza <silvanocerza@gmail.com> 2023-11-24 11:52:55 +01:00			`Tokenizes the string by splitting on spaces.`
test: add version deprecation fixture (#3851) * add fixture * Update test/conftest.py * remove +2 and add tests * few typos * more cases * Update test/conftest.py 2023-01-16 15:36:14 +01:00			`"""`
Remove preview folder in test/ --------- Co-authored-by: Silvano Cerza <silvanocerza@gmail.com> 2023-11-24 11:52:55 +01:00			`tokenizer = Mock()`
			`tokenizer.encode = lambda text: text.split()`
			`tokenizer.decode = lambda tokens: " ".join(tokens)`
			`return tokenizer`
chore: block all HTTP requests in CI (#5088) 2023-06-13 14:52:24 +02:00

Remove preview folder in test/ --------- Co-authored-by: Silvano Cerza <silvanocerza@gmail.com> 2023-11-24 11:52:55 +01:00			`@pytest.fixture()`
			`def test_files_path():`
			`return Path(__file__).parent / "test_files"`
test: Add fixture to block requests in tests (#6585) * Add fixture to block requests in tests * Mark tests making requests as integration 2023-12-21 08:51:54 +01:00

feat: Update OpenAI Python Client in Haystack 2.x (#6584) * Update openai python client * Add release note * Consolidate multiple mock_chat_completion into one * Ensure all components have api_base_url, organization params * Update tests * Enable function calling * Oversight * Minor fixes, add streaming test mocks * Apply suggestions from code review Co-authored-by: Daria Fokina <daria.fokina@deepset.ai> * metadata -> meta --------- Co-authored-by: Massimiliano Pippi <mpippi@gmail.com> Co-authored-by: Daria Fokina <daria.fokina@deepset.ai> 2023-12-21 16:21:24 +01:00			`@pytest.fixture`
			`def mock_chat_completion():`
			`"""`
			`Mock the OpenAI API completion response and reuse it for tests`
			`"""`
			`with patch("openai.resources.chat.completions.Completions.create") as mock_chat_completion_create:`
			`completion = ChatCompletion(`
			`id="foo",`
			`model="gpt-4",`
			`object="chat.completion",`
			`choices=[`
			`Choice(`
			`finish_reason="stop",`
			`logprobs=None,`
			`index=0,`
			`message=ChatCompletionMessage(content="Hello world!", role="assistant"),`
			`)`
			`],`
			`created=int(datetime.now().timestamp()),`
			`usage={"prompt_tokens": 57, "completion_tokens": 40, "total_tokens": 97},`
			`)`

			`mock_chat_completion_create.return_value = completion`
			`yield mock_chat_completion_create`


test: Add fixture to block requests in tests (#6585) * Add fixture to block requests in tests * Mark tests making requests as integration 2023-12-21 08:51:54 +01:00			`@pytest.fixture(autouse=True)`
			`def request_blocker(request: pytest.FixtureRequest, monkeypatch):`
			`"""`
			`This fixture is applied automatically to all tests.`
			`Those that are not marked as integration will have the requests module`
			`monkeypatched to avoid making HTTP requests by mistake.`
			`"""`
			`marker = request.node.get_closest_marker("integration")`
			`if marker is not None:`
			`return`

			`def urlopen_mock(self, method, url, args, *kwargs):`
			`raise RuntimeError(f"The test was about to {method} {self.scheme}://{self.host}{url}")`

			`monkeypatch.setattr("urllib3.connectionpool.HTTPConnectionPool.urlopen", urlopen_mock)`
feat: implement pipeline tracing (#7046) * feat: implement pipeline tracing * tests: improve test setup for spying tracer * feat: implement util for type coercion * fix: trace a after checking pipeline output * docs: add release notes * docs: drop unused imports * refactor: simplify getting raw span * refactor: implement `ProxyTracer` 2024-02-22 12:52:04 +01:00

			`@pytest.fixture()`
			`def spying_tracer() -> Generator[SpyingTracer, None, None]:`
			`tracer = SpyingTracer()`
			`tracing.enable_tracing(tracer)`

			`yield tracer`

			`# Make sure to disable tracing after the test to avoid affecting other tests`
			`tracing.disable_tracing()`