2025-05-21 11:27:34 -05:00

46 lines
1.3 KiB
Python

import pytest
from datahub.ingestion.run.pipeline import Pipeline
from datahub.testing import mce_helpers
@pytest.mark.integration
def test_excel(pytestconfig, tmp_path, mock_time):
test_resources_dir = pytestconfig.rootpath / "tests/integration/excel"
test_files = "tests/integration/excel/data/*.xlsx"
# Run the metadata ingestion pipeline.
pipeline = Pipeline.create(
{
"run_id": "excel-test",
"source": {
"type": "excel",
"config": {
"path_list": [
str(test_files),
],
"profiling": {
"enabled": True,
},
},
},
"sink": {
"type": "file",
"config": {
"filename": f"{tmp_path}/excel_file_test.json",
},
},
}
)
pipeline.run()
pipeline.raise_from_status()
mce_helpers.check_golden_file(
pytestconfig,
output_path=tmp_path / "excel_file_test.json",
golden_path=test_resources_dir / "excel_file_test_golden.json",
ignore_paths=[
r"root\[\d+\]\['aspect'\]\['json'\]\['fieldProfiles'\]\[\d+\]\['sampleValues'\]",
],
)