From 1456f06b2dfc85f64ba2cf83c03d981d1fc04b54 Mon Sep 17 00:00:00 2001 From: cragwolfe Date: Fri, 18 Aug 2023 10:06:17 -0700 Subject: [PATCH] chore: skip consistently failing test in main (#1150) The reason this test is failing is that the API is returning "fast" results when "hi_res" is requested, which is being tracked in this ticket: https://github.com/Unstructured-IO/unstructured-api/issues/188 . This failure was only showing up on the `main` branch, per the commented-out `pytest` skips. --- test_unstructured/partition/test_api.py | 21 +++++++++++++++------ 1 file changed, 15 insertions(+), 6 deletions(-) diff --git a/test_unstructured/partition/test_api.py b/test_unstructured/partition/test_api.py index 9176f15ed..d74589f2f 100644 --- a/test_unstructured/partition/test_api.py +++ b/test_unstructured/partition/test_api.py @@ -96,17 +96,26 @@ def test_partition_via_api_raises_with_bad_response(monkeypatch): partition_via_api(filename=filename) -@pytest.mark.skipif(skip_outside_ci, reason="Skipping test run outside of CI") -@pytest.mark.skipif(skip_not_on_main, reason="Skipping test run outside of main branch") +@pytest.mark.skip( + reason="API is returning fast for auto, see " + "https://github.com/Unstructured-IO/unstructured-api/issues/188", +) +# @pytest.mark.skipif(skip_outside_ci, reason="Skipping test run outside of CI") +# @pytest.mark.skipif(skip_not_on_main, reason="Skipping test run outside of main branch") def test_partition_via_api_with_no_strategy(): filename = os.path.join(DIRECTORY, "..", "..", "example-docs", "layout-parser-paper-fast.jpg") - elements_no_strategy = partition_via_api(filename=filename, api_key=get_api_key()) + elements_no_strategy = partition_via_api( + filename=filename, + strategy="auto", + api_key=get_api_key(), + ) elements_hi_res = partition_via_api(filename=filename, strategy="hi_res", api_key=get_api_key()) - # confirm that hi_res strategy was not passed as defaukt to partition by comparing outputs - assert 
elements_no_strategy[0].text.startswith("arXiv") - assert elements_hi_res[0].text.startswith("LayoutParser") + # confirm that hi_res strategy was not passed as default to partition by comparing outputs + # FIXME(crag): elements_hi_res[4].text is 'sacon oot barvard o', the fast output. + # should be 'Harvard University {melissadell,jacob carlson}@fas.harvard.edu' (as of writing) + assert elements_no_strategy[4].text != elements_hi_res[4].text @pytest.mark.skipif(skip_outside_ci, reason="Skipping test run outside of CI")