import os import json import pytest import unstructured.utils as utils @pytest.fixture def input_data(): return [ {"text": "This is a sentence."}, {"text": "This is another sentence.", "meta": {"score": 0.1}}, ] @pytest.fixture def output_jsonl_file(tmp_path): return os.path.join(tmp_path, "output.jsonl") @pytest.fixture def input_jsonl_file(tmp_path, input_data): file_path = os.path.join(tmp_path, "input.jsonl") with open(file_path, "w+") as input_file: input_file.writelines([json.dumps(obj) + "\n" for obj in input_data]) return file_path def test_save_as_jsonl(input_data, output_jsonl_file): utils.save_as_jsonl(input_data, output_jsonl_file) with open(output_jsonl_file, "r") as output_file: file_data = [json.loads(line) for line in output_file] assert file_data == input_data def test_read_as_jsonl(input_jsonl_file, input_data): file_data = utils.read_from_jsonl(input_jsonl_file) assert file_data == input_data