mirror of
https://github.com/Unstructured-IO/unstructured.git
synced 2025-11-30 17:20:06 +00:00
roman/update language kwarg partition ingest (#1605)
### Description
Change the partition kwarg from `ocr_languages` to `languages`.
Closes out https://github.com/Unstructured-IO/unstructured/issues/1588
This commit is contained in:
parent
ad59a879cc
commit
4d6492391c
@ -1,4 +1,4 @@
|
|||||||
## 0.10.19-dev1
|
## 0.10.19-dev2
|
||||||
|
|
||||||
### Enhancements
|
### Enhancements
|
||||||
|
|
||||||
|
|||||||
@ -1 +1 @@
|
|||||||
__version__ = "0.10.19-dev1" # pragma: no cover
|
__version__ = "0.10.19-dev2" # pragma: no cover
|
||||||
|
|||||||
@ -107,10 +107,11 @@ def process_documents(
|
|||||||
verbose: bool,
|
verbose: bool,
|
||||||
dest_doc_connector: t.Optional[BaseDestinationConnector] = None,
|
dest_doc_connector: t.Optional[BaseDestinationConnector] = None,
|
||||||
) -> None:
|
) -> None:
|
||||||
|
languages = partition_config.ocr_languages.split("+") if partition_config.ocr_languages else []
|
||||||
process_document_with_partition_args = partial(
|
process_document_with_partition_args = partial(
|
||||||
process_document,
|
process_document,
|
||||||
strategy=partition_config.strategy,
|
strategy=partition_config.strategy,
|
||||||
ocr_languages=partition_config.ocr_languages,
|
languages=languages,
|
||||||
encoding=partition_config.encoding,
|
encoding=partition_config.encoding,
|
||||||
pdf_infer_table_structure=partition_config.pdf_infer_table_structure,
|
pdf_infer_table_structure=partition_config.pdf_infer_table_structure,
|
||||||
)
|
)
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user