"""Tests for ``unstructured.partition.common.normalize_layout_element``."""

from unstructured_inference.inference.layout import LayoutElement
from unstructured.documents.elements import CheckBox, FigureCaption, NarrativeText, Text, Title
import unstructured.partition.common as common
def test_normalize_layout_element_dict():
    """A dict whose type is "Title" is normalized into a ``Title`` element."""
    layout_element = {
        "type": "Title",
        "coordinates": [[1, 2], [3, 4], [5, 6], [7, 8]],
        "text": "Some lovely text",
    }
    element = common.normalize_layout_element(layout_element)
    # The expected element carries the same text and coordinates as the input;
    # the first point is [1, 2], matching what was passed in.
    assert element == Title(text="Some lovely text", coordinates=[[1, 2], [3, 4], [5, 6], [7, 8]])
def test_normalize_layout_element_dict_caption():
    """A dict whose type is "Figure" is normalized into a ``FigureCaption``."""
    layout_element = {
        "type": "Figure",
        "coordinates": [[1, 2], [3, 4], [5, 6], [7, 8]],
        "text": "Some lovely text",
    }
    element = common.normalize_layout_element(layout_element)
    # The expected element carries the same text and coordinates as the input;
    # the first point is [1, 2], matching what was passed in.
    assert element == FigureCaption(
        text="Some lovely text",
        coordinates=[[1, 2], [3, 4], [5, 6], [7, 8]],
    )
def test_normalize_layout_element_dict_misc():
    """A dict whose type is "Misc" is normalized into a plain ``Text`` element."""
    layout_element = {
        "type": "Misc",
        "coordinates": [[1, 2], [3, 4], [5, 6], [7, 8]],
        "text": "Some lovely text",
    }
    element = common.normalize_layout_element(layout_element)
    # The expected element carries the same text and coordinates as the input;
    # the first point is [1, 2], matching what was passed in.
    assert element == Text(text="Some lovely text", coordinates=[[1, 2], [3, 4], [5, 6], [7, 8]])
def test_normalize_layout_element_layout_element():
    """A ``LayoutElement`` of type "Text" is normalized into ``NarrativeText``."""
    layout_element = LayoutElement(
        type="Text",
        coordinates=[[1, 2], [3, 4], [5, 6], [7, 8]],
        text="Some lovely text",
    )
    element = common.normalize_layout_element(layout_element)
    # The expected element carries the same text and coordinates as the input;
    # the first point is [1, 2], matching what was passed in.
    assert element == NarrativeText(
        text="Some lovely text",
        coordinates=[[1, 2], [3, 4], [5, 6], [7, 8]],
    )
def test_normalize_layout_element_checked_box():
    """A ``LayoutElement`` of type "Checked" becomes a checked ``CheckBox``."""
    expected = CheckBox(checked=True, coordinates=[[1, 2], [3, 4], [5, 6], [7, 8]])
    actual = common.normalize_layout_element(
        LayoutElement(
            type="Checked",
            coordinates=[[1, 2], [3, 4], [5, 6], [7, 8]],
            text="",
        )
    )
    assert actual == expected
def test_normalize_layout_element_unchecked_box():
    """A ``LayoutElement`` of type "Unchecked" becomes an unchecked ``CheckBox``."""
    expected = CheckBox(checked=False, coordinates=[[1, 2], [3, 4], [5, 6], [7, 8]])
    actual = common.normalize_layout_element(
        LayoutElement(
            type="Unchecked",
            coordinates=[[1, 2], [3, 4], [5, 6], [7, 8]],
            text="",
        )
    )
    assert actual == expected