mirror of
https://github.com/Unstructured-IO/unstructured.git
synced 2025-06-27 02:30:08 +00:00

**Summary** Improve expression in auto-partition tests and fix xfails and skips. Add issues for the two hard-fails where xfail needed to stay.
127 lines
4.3 KiB
JSON
127 lines
4.3 KiB
JSON
[
|
|
{
|
|
"element_id": "a06d2d9e65212d4aa955c3ab32950ffa",
|
|
"metadata": {
|
|
"category_depth": 0,
|
|
"file_directory": "unstructured/example-docs",
|
|
"filename": "simple.docx",
|
|
"filetype": "application/vnd.openxmlformats-officedocument.wordprocessingml.document",
|
|
"languages": [
|
|
"eng"
|
|
],
|
|
"last_modified": "2024-07-06T16:44:51"
|
|
},
|
|
"text": "These are a few of my favorite things:",
|
|
"type": "Title"
|
|
},
|
|
{
|
|
"element_id": "b334c93e9b1cbca3b6f6d78ce8bc2484",
|
|
"metadata": {
|
|
"category_depth": 0,
|
|
"file_directory": "unstructured/example-docs",
|
|
"filename": "simple.docx",
|
|
"filetype": "application/vnd.openxmlformats-officedocument.wordprocessingml.document",
|
|
"languages": [
|
|
"eng"
|
|
],
|
|
"last_modified": "2024-07-06T16:44:51",
|
|
"parent_id": "a06d2d9e65212d4aa955c3ab32950ffa"
|
|
},
|
|
"text": "Parrots",
|
|
"type": "ListItem"
|
|
},
|
|
{
|
|
"element_id": "76469ecb9f1459943c8d8cca1a550b5a",
|
|
"metadata": {
|
|
"category_depth": 0,
|
|
"file_directory": "unstructured/example-docs",
|
|
"filename": "simple.docx",
|
|
"filetype": "application/vnd.openxmlformats-officedocument.wordprocessingml.document",
|
|
"languages": [
|
|
"eng"
|
|
],
|
|
"last_modified": "2024-07-06T16:44:51",
|
|
"parent_id": "a06d2d9e65212d4aa955c3ab32950ffa"
|
|
},
|
|
"text": "Hockey",
|
|
"type": "ListItem"
|
|
},
|
|
{
|
|
"element_id": "261fac731945a138415adc2dd4434b17",
|
|
"metadata": {
|
|
"category_depth": 0,
|
|
"file_directory": "unstructured/example-docs",
|
|
"filename": "simple.docx",
|
|
"filetype": "application/vnd.openxmlformats-officedocument.wordprocessingml.document",
|
|
"languages": [
|
|
"eng"
|
|
],
|
|
"last_modified": "2024-07-06T16:44:51"
|
|
},
|
|
"text": "Analysis",
|
|
"type": "Title"
|
|
},
|
|
{
|
|
"element_id": "95f392d32c5271bfdb30eaef45921e59",
|
|
"metadata": {
|
|
"category_depth": 0,
|
|
"file_directory": "unstructured/example-docs",
|
|
"filename": "simple.docx",
|
|
"filetype": "application/vnd.openxmlformats-officedocument.wordprocessingml.document",
|
|
"languages": [
|
|
"eng"
|
|
],
|
|
"last_modified": "2024-07-06T16:44:51",
|
|
"parent_id": "261fac731945a138415adc2dd4434b17"
|
|
},
|
|
"text": "This is my first thought. This is my second thought.",
|
|
"type": "NarrativeText"
|
|
},
|
|
{
|
|
"element_id": "0de25bd6f0d74bc4f909f2678f385736",
|
|
"metadata": {
|
|
"category_depth": 0,
|
|
"file_directory": "unstructured/example-docs",
|
|
"filename": "simple.docx",
|
|
"filetype": "application/vnd.openxmlformats-officedocument.wordprocessingml.document",
|
|
"languages": [
|
|
"eng"
|
|
],
|
|
"last_modified": "2024-07-06T16:44:51",
|
|
"parent_id": "261fac731945a138415adc2dd4434b17"
|
|
},
|
|
"text": "This is my third thought.",
|
|
"type": "NarrativeText"
|
|
},
|
|
{
|
|
"element_id": "f296a3bc8a901f19199fda1da92829b6",
|
|
"metadata": {
|
|
"category_depth": 0,
|
|
"file_directory": "unstructured/example-docs",
|
|
"filename": "simple.docx",
|
|
"filetype": "application/vnd.openxmlformats-officedocument.wordprocessingml.document",
|
|
"languages": [
|
|
"eng"
|
|
],
|
|
"last_modified": "2024-07-06T16:44:51",
|
|
"parent_id": "261fac731945a138415adc2dd4434b17"
|
|
},
|
|
"text": "2023",
|
|
"type": "UncategorizedText"
|
|
},
|
|
{
|
|
"element_id": "78c62edbc674fdca0f6a0e3ffb459f86",
|
|
"metadata": {
|
|
"category_depth": 0,
|
|
"file_directory": "unstructured/example-docs",
|
|
"filename": "simple.docx",
|
|
"filetype": "application/vnd.openxmlformats-officedocument.wordprocessingml.document",
|
|
"languages": [
|
|
"eng"
|
|
],
|
|
"last_modified": "2024-07-06T16:44:51"
|
|
},
|
|
"text": "DOYLESTOWN, PA 18901",
|
|
"type": "Address"
|
|
}
|
|
] |