import pytest from haystack.preprocessor import utils from haystack.preprocessor.cleaning import clean_wiki_text @pytest.mark.tika def test_convert_files_to_dicts(xpdf_fixture): documents = utils.convert_files_to_dicts(dir_path="samples", clean_func=clean_wiki_text, split_paragraphs=True) assert documents and len(documents) > 0 @pytest.mark.tika def test_tika_convert_files_to_dicts(tika_fixture): documents = utils.tika_convert_files_to_dicts(dir_path="samples", clean_func=clean_wiki_text, split_paragraphs=True) assert documents and len(documents) > 0