PaddleOCR/tests/pipelines/test_ocr.py
Lin Manhui 3d03ca5500
[Breaking][Feat] New PaddleOCR inference package (#15046)
* Init new paddleocr

* Remove unused dependency

* Fix typos

* Fix

* Add doc understanding modules

* Fix package finding

* Normalize name

* Fix setting bugs

* Fix setting bug

* Support single model inference

* Add PP-ChatOCRv4-doc

* Add pp_chatocrv4_doc tests

* Enable MKL-DNN when available

* add seal_text_detection modules

* add layout_detection and table_cells_detection modules

* add testing scripts

* Fix desc

* add text_image_unwarping and table_structure_recognition modules

* add formula_recognition and doc_vlm modules

* update formula_recognition default_model_name

* add MKLDNN_BLOCKLIST

* update MKLDNN log

* add seal rec pipeline

* fix sth

* fix sth

* add doc preprocessor pipeline

* fix sth

* add doc understanding

* add table_rec_v2, ppstructurev3, formula_rec pipelines

* move test files

* forward kwargs to pipeline.predict

* clean test files

* Add missing kwargs

* Fix typo

* Fix typo

* rerun CI

* update mkldnn BLOCKLIST

* update

* update warning message

* fix cli args

* update PIPELINE_MKLDNN_BLOCKLIST

* update  of  workflow

* skip resource_intensive tests

* update config

* skip ppdocbee test_predict_params

---------

Co-authored-by: zhangyue66 <zhangyue66@baidu.com>
Co-authored-by: zhangzelun <zhangzelun@baidu.com>
2025-05-04 15:59:02 +08:00

114 lines
3.9 KiB
Python

import pytest
from paddleocr import PaddleOCR
from ..testing_utils import (
TEST_DATA_DIR,
check_simple_inference_result,
check_wrapper_simple_inference_param_forwarding,
)
@pytest.fixture(scope="module")
def ocr_engine() -> PaddleOCR:
return PaddleOCR()
# TODO: Should we separate unit tests and integration tests?
@pytest.mark.parametrize(
"image_path",
[
TEST_DATA_DIR / "table.jpg",
],
)
def test_predict(ocr_engine: PaddleOCR, image_path: str) -> None:
"""
Test PaddleOCR's OCR functionality.
Args:
ocr_engine: An instance of `PaddleOCR`.
image_path: Path to the image to be processed.
"""
result = ocr_engine.predict(str(image_path))
check_simple_inference_result(result)
res = result[0]
assert len(res["dt_polys"]) > 0
assert isinstance(res["rec_texts"], list)
assert len(res["rec_texts"]) > 0
for text in res["rec_texts"]:
assert isinstance(text, str)
# TODO: Also check passing `None`
@pytest.mark.parametrize(
"params",
[
{"use_doc_orientation_classify": False},
{"use_doc_unwarping": False},
{"use_textline_orientation": False},
{"text_det_limit_side_len": 640, "text_det_limit_type": "min"},
{"text_det_thresh": 0.5},
{"text_det_box_thresh": 0.3},
{"text_det_unclip_ratio": 3.0},
{"text_rec_score_thresh": 0.5},
],
)
def test_predict_params(
monkeypatch,
ocr_engine: PaddleOCR,
params: dict,
) -> None:
check_wrapper_simple_inference_param_forwarding(
monkeypatch,
ocr_engine,
"paddlex_pipeline",
"dummy_path",
params,
)
# TODO: Test init params
def test_lang_and_ocr_version():
ocr_engine = PaddleOCR(lang="ch", ocr_version="PP-OCRv4")
assert ocr_engine._params["text_detection_model_name"] == "PP-OCRv4_mobile_det"
assert ocr_engine._params["text_recognition_model_name"] == "PP-OCRv4_mobile_rec"
ocr_engine = PaddleOCR(lang="en", ocr_version="PP-OCRv4")
assert ocr_engine._params["text_detection_model_name"] == "PP-OCRv4_mobile_det"
assert ocr_engine._params["text_recognition_model_name"] == "en_PP-OCRv4_mobile_rec"
ocr_engine = PaddleOCR(lang="ch", ocr_version="PP-OCRv3")
assert ocr_engine._params["text_detection_model_name"] == "PP-OCRv3_mobile_det"
assert ocr_engine._params["text_recognition_model_name"] == "PP-OCRv3_mobile_rec"
ocr_engine = PaddleOCR(lang="en", ocr_version="PP-OCRv3")
assert ocr_engine._params["text_detection_model_name"] == "PP-OCRv3_mobile_det"
assert ocr_engine._params["text_recognition_model_name"] == "en_PP-OCRv3_mobile_rec"
ocr_engine = PaddleOCR(lang="fr", ocr_version="PP-OCRv3")
assert ocr_engine._params["text_detection_model_name"] == "PP-OCRv3_mobile_det"
assert (
ocr_engine._params["text_recognition_model_name"] == "latin_PP-OCRv3_mobile_rec"
)
ocr_engine = PaddleOCR(lang="ar", ocr_version="PP-OCRv3")
assert ocr_engine._params["text_detection_model_name"] == "PP-OCRv3_mobile_det"
assert (
ocr_engine._params["text_recognition_model_name"]
== "arabic_PP-OCRv3_mobile_rec"
)
ocr_engine = PaddleOCR(lang="ru", ocr_version="PP-OCRv3")
assert ocr_engine._params["text_detection_model_name"] == "PP-OCRv3_mobile_det"
assert (
ocr_engine._params["text_recognition_model_name"]
== "cyrillic_PP-OCRv3_mobile_rec"
)
ocr_engine = PaddleOCR(lang="hi", ocr_version="PP-OCRv3")
assert ocr_engine._params["text_detection_model_name"] == "PP-OCRv3_mobile_det"
assert (
ocr_engine._params["text_recognition_model_name"]
== "devanagari_PP-OCRv3_mobile_rec"
)
ocr_engine = PaddleOCR(lang="japan", ocr_version="PP-OCRv3")
assert ocr_engine._params["text_detection_model_name"] == "PP-OCRv3_mobile_det"
assert (
ocr_engine._params["text_recognition_model_name"] == "japan_PP-OCRv3_mobile_rec"
)