import pytest

from haystack.utils.preprocessing import convert_files_to_dicts, tika_convert_files_to_dicts
from haystack.utils.cleaning import clean_wiki_text


def test_convert_files_to_dicts():
    """Check that ``convert_files_to_dicts`` yields a non-empty result.

    The converter is run on the ``samples`` directory (a relative path)
    with ``clean_wiki_text`` as the cleaning function and paragraph
    splitting enabled.
    """
    converted = convert_files_to_dicts(
        dir_path="samples",
        clean_func=clean_wiki_text,
        split_paragraphs=True,
    )
    # The result must be truthy and report a positive length.
    assert converted
    assert len(converted) > 0


@pytest.mark.tika
def test_tika_convert_files_to_dicts():
    """Check that ``tika_convert_files_to_dicts`` yields a non-empty result.

    Uses the same arguments as the non-Tika test: the ``samples``
    directory, ``clean_wiki_text`` and paragraph splitting enabled.
    """
    # NOTE(review): the ``tika`` marker presumably lets this test be
    # selected or skipped depending on Tika availability; confirm against
    # the project's pytest configuration.
    converted = tika_convert_files_to_dicts(
        dir_path="samples",
        clean_func=clean_wiki_text,
        split_paragraphs=True,
    )
    # The result must be truthy and report a positive length.
    assert converted
    assert len(converted) > 0