mirror of
https://github.com/Unstructured-IO/unstructured.git
synced 2025-11-25 14:50:06 +00:00
also removes mimetype when base64 is not included in image metadata --------- Co-authored-by: ryannikolaidis <ryannikolaidis@users.noreply.github.com>
815 lines
25 KiB
JSON
815 lines
25 KiB
JSON
[
|
|
{
|
|
"element_id": "1672cd06afcef46532e0c1ac6d1ef3e4",
|
|
"metadata": {
|
|
"data_source": {
|
|
"date_created": "2023-07-09T12:56:40.842000",
|
|
"date_modified": "2023-07-09T12:57:59.173000",
|
|
"record_locator": {
|
|
"page_id": "1605989",
|
|
"url": "https://unstructured-ingest-test.atlassian.net"
|
|
},
|
|
"url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/1605989",
|
|
"version": "1"
|
|
},
|
|
"filetype": "text/html",
|
|
"languages": [
|
|
"eng",
|
|
"fra"
|
|
]
|
|
},
|
|
"text": "testtext3 testtext3 testtext3 testtext3 testtext3 testtext3 testtext3 testtext3 testtext3 testtext3",
|
|
"type": "UncategorizedText"
|
|
},
|
|
{
|
|
"element_id": "ef1707e2cadf95400b688c2ea15f6657",
|
|
"metadata": {
|
|
"data_source": {
|
|
"date_created": "2023-07-09T12:56:40.842000",
|
|
"date_modified": "2023-07-09T12:57:59.173000",
|
|
"record_locator": {
|
|
"page_id": "1605989",
|
|
"url": "https://unstructured-ingest-test.atlassian.net"
|
|
},
|
|
"url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/1605989",
|
|
"version": "1"
|
|
},
|
|
"filetype": "text/html",
|
|
"languages": [
|
|
"eng",
|
|
"fra"
|
|
]
|
|
},
|
|
"text": "testtext3 testtext3 testtext3 testtext3 testtext3 testtext3 testtext3 testtext3 testtext3 testtext3",
|
|
"type": "UncategorizedText"
|
|
},
|
|
{
|
|
"element_id": "23332b5a74f166672eda00916897d09c",
|
|
"metadata": {
|
|
"data_source": {
|
|
"date_created": "2023-07-09T12:56:40.842000",
|
|
"date_modified": "2023-07-09T12:57:59.173000",
|
|
"record_locator": {
|
|
"page_id": "1605989",
|
|
"url": "https://unstructured-ingest-test.atlassian.net"
|
|
},
|
|
"url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/1605989",
|
|
"version": "1"
|
|
},
|
|
"filetype": "text/html",
|
|
"languages": [
|
|
"eng",
|
|
"fra"
|
|
]
|
|
},
|
|
"text": "testtext3 testtext3 testtext3 testtext3 testtext3 testtext3 testtext3 testtext3 testtext3 testtext3",
|
|
"type": "UncategorizedText"
|
|
},
|
|
{
|
|
"element_id": "00290c97c096654a5ad758c1aa963b8b",
|
|
"metadata": {
|
|
"data_source": {
|
|
"date_created": "2023-07-09T12:56:40.842000",
|
|
"date_modified": "2023-07-09T12:57:59.173000",
|
|
"record_locator": {
|
|
"page_id": "1605989",
|
|
"url": "https://unstructured-ingest-test.atlassian.net"
|
|
},
|
|
"url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/1605989",
|
|
"version": "1"
|
|
},
|
|
"filetype": "text/html",
|
|
"languages": [
|
|
"eng",
|
|
"fra"
|
|
]
|
|
},
|
|
"text": "testtext3 testtext3 testtext3 testtext3 testtext3 testtext3 testtext3 testtext3 testtext3 testtext3",
|
|
"type": "UncategorizedText"
|
|
},
|
|
{
|
|
"element_id": "252751d6be961b05b423171e53612340",
|
|
"metadata": {
|
|
"data_source": {
|
|
"date_created": "2023-07-09T12:56:40.842000",
|
|
"date_modified": "2023-07-09T12:57:59.173000",
|
|
"record_locator": {
|
|
"page_id": "1605989",
|
|
"url": "https://unstructured-ingest-test.atlassian.net"
|
|
},
|
|
"url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/1605989",
|
|
"version": "1"
|
|
},
|
|
"filetype": "text/html",
|
|
"languages": [
|
|
"eng",
|
|
"fra"
|
|
]
|
|
},
|
|
"text": "testtext3 testtext3 testtext3 testtext3 testtext3 testtext3 testtext3 testtext3 testtext3 testtext3",
|
|
"type": "UncategorizedText"
|
|
},
|
|
{
|
|
"element_id": "9d9ce8fac05e0a6064fc173f51f886b5",
|
|
"metadata": {
|
|
"data_source": {
|
|
"date_created": "2023-07-09T12:56:40.842000",
|
|
"date_modified": "2023-07-09T12:57:59.173000",
|
|
"record_locator": {
|
|
"page_id": "1605989",
|
|
"url": "https://unstructured-ingest-test.atlassian.net"
|
|
},
|
|
"url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/1605989",
|
|
"version": "1"
|
|
},
|
|
"filetype": "text/html",
|
|
"languages": [
|
|
"eng",
|
|
"fra"
|
|
]
|
|
},
|
|
"text": "testtext3 testtext3 testtext3 testtext3 testtext3 testtext3 testtext3 testtext3 testtext3 testtext3",
|
|
"type": "UncategorizedText"
|
|
},
|
|
{
|
|
"element_id": "bcce1169cfd0d24990e5dcf9a1f4417c",
|
|
"metadata": {
|
|
"data_source": {
|
|
"date_created": "2023-07-09T12:56:40.842000",
|
|
"date_modified": "2023-07-09T12:57:59.173000",
|
|
"record_locator": {
|
|
"page_id": "1605989",
|
|
"url": "https://unstructured-ingest-test.atlassian.net"
|
|
},
|
|
"url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/1605989",
|
|
"version": "1"
|
|
},
|
|
"filetype": "text/html",
|
|
"languages": [
|
|
"eng",
|
|
"fra"
|
|
]
|
|
},
|
|
"text": "testtext3 testtext3 testtext3 testtext3 testtext3 testtext3 testtext3 testtext3 testtext3 testtext3",
|
|
"type": "UncategorizedText"
|
|
},
|
|
{
|
|
"element_id": "bef3930174a53244d9333aba98d6ef37",
|
|
"metadata": {
|
|
"data_source": {
|
|
"date_created": "2023-07-09T12:56:40.842000",
|
|
"date_modified": "2023-07-09T12:57:59.173000",
|
|
"record_locator": {
|
|
"page_id": "1605989",
|
|
"url": "https://unstructured-ingest-test.atlassian.net"
|
|
},
|
|
"url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/1605989",
|
|
"version": "1"
|
|
},
|
|
"filetype": "text/html",
|
|
"languages": [
|
|
"eng",
|
|
"fra"
|
|
]
|
|
},
|
|
"text": "testtext3 testtext3 testtext3 testtext3 testtext3 testtext3 testtext3 testtext3 testtext3 testtext3",
|
|
"type": "UncategorizedText"
|
|
},
|
|
{
|
|
"element_id": "40aa9fc4d7bc2522da02123e07615fd1",
|
|
"metadata": {
|
|
"data_source": {
|
|
"date_created": "2023-07-09T12:56:40.842000",
|
|
"date_modified": "2023-07-09T12:57:59.173000",
|
|
"record_locator": {
|
|
"page_id": "1605989",
|
|
"url": "https://unstructured-ingest-test.atlassian.net"
|
|
},
|
|
"url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/1605989",
|
|
"version": "1"
|
|
},
|
|
"filetype": "text/html",
|
|
"languages": [
|
|
"eng",
|
|
"fra"
|
|
]
|
|
},
|
|
"text": "testtext3 testtext3 testtext3 testtext3 testtext3 testtext3 testtext3 testtext3 testtext3 testtext3",
|
|
"type": "UncategorizedText"
|
|
},
|
|
{
|
|
"element_id": "f284f9398e8b26287f59b01df3f87395",
|
|
"metadata": {
|
|
"data_source": {
|
|
"date_created": "2023-07-09T12:56:40.842000",
|
|
"date_modified": "2023-07-09T12:57:59.173000",
|
|
"record_locator": {
|
|
"page_id": "1605989",
|
|
"url": "https://unstructured-ingest-test.atlassian.net"
|
|
},
|
|
"url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/1605989",
|
|
"version": "1"
|
|
},
|
|
"filetype": "text/html",
|
|
"languages": [
|
|
"eng",
|
|
"fra"
|
|
]
|
|
},
|
|
"text": "testtext3 testtext3 testtext3 testtext3 testtext3 testtext3 testtext3 testtext3 testtext3 testtext3",
|
|
"type": "UncategorizedText"
|
|
},
|
|
{
|
|
"element_id": "6da438b97512b144f96de65bcb35c380",
|
|
"metadata": {
|
|
"data_source": {
|
|
"date_created": "2023-07-09T12:56:40.842000",
|
|
"date_modified": "2023-07-09T12:57:59.173000",
|
|
"record_locator": {
|
|
"page_id": "1605989",
|
|
"url": "https://unstructured-ingest-test.atlassian.net"
|
|
},
|
|
"url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/1605989",
|
|
"version": "1"
|
|
},
|
|
"filetype": "text/html",
|
|
"languages": [
|
|
"eng",
|
|
"fra"
|
|
]
|
|
},
|
|
"text": "testtext3 testtext3 testtext3 testtext3 testtext3 testtext3 testtext3 testtext3 testtext3 testtext3",
|
|
"type": "UncategorizedText"
|
|
},
|
|
{
|
|
"element_id": "a3d7fbfb7e7cb92f6c2c809be1aa6a67",
|
|
"metadata": {
|
|
"data_source": {
|
|
"date_created": "2023-07-09T12:56:40.842000",
|
|
"date_modified": "2023-07-09T12:57:59.173000",
|
|
"record_locator": {
|
|
"page_id": "1605989",
|
|
"url": "https://unstructured-ingest-test.atlassian.net"
|
|
},
|
|
"url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/1605989",
|
|
"version": "1"
|
|
},
|
|
"filetype": "text/html",
|
|
"languages": [
|
|
"eng",
|
|
"fra"
|
|
]
|
|
},
|
|
"text": "testtext3 testtext3 testtext3 testtext3 testtext3 testtext3 testtext3 testtext3 testtext3 testtext3",
|
|
"type": "UncategorizedText"
|
|
},
|
|
{
|
|
"element_id": "6780aadfc4e2332b6da7302971e7744e",
|
|
"metadata": {
|
|
"data_source": {
|
|
"date_created": "2023-07-09T12:56:40.842000",
|
|
"date_modified": "2023-07-09T12:57:59.173000",
|
|
"record_locator": {
|
|
"page_id": "1605989",
|
|
"url": "https://unstructured-ingest-test.atlassian.net"
|
|
},
|
|
"url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/1605989",
|
|
"version": "1"
|
|
},
|
|
"filetype": "text/html",
|
|
"languages": [
|
|
"eng",
|
|
"fra"
|
|
]
|
|
},
|
|
"text": "testtext3 testtext3 testtext3 testtext3 testtext3 testtext3 testtext3 testtext3 testtext3 testtext3",
|
|
"type": "UncategorizedText"
|
|
},
|
|
{
|
|
"element_id": "ca6e8673360d0f9a946786edc086f26e",
|
|
"metadata": {
|
|
"data_source": {
|
|
"date_created": "2023-07-09T12:56:40.842000",
|
|
"date_modified": "2023-07-09T12:57:59.173000",
|
|
"record_locator": {
|
|
"page_id": "1605989",
|
|
"url": "https://unstructured-ingest-test.atlassian.net"
|
|
},
|
|
"url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/1605989",
|
|
"version": "1"
|
|
},
|
|
"filetype": "text/html",
|
|
"languages": [
|
|
"eng",
|
|
"fra"
|
|
]
|
|
},
|
|
"text": "testtext3 testtext3 testtext3 testtext3 testtext3 testtext3 testtext3 testtext3 testtext3 testtext3",
|
|
"type": "UncategorizedText"
|
|
},
|
|
{
|
|
"element_id": "f8085d2948c73dfb968f7b221f3e8fab",
|
|
"metadata": {
|
|
"data_source": {
|
|
"date_created": "2023-07-09T12:56:40.842000",
|
|
"date_modified": "2023-07-09T12:57:59.173000",
|
|
"record_locator": {
|
|
"page_id": "1605989",
|
|
"url": "https://unstructured-ingest-test.atlassian.net"
|
|
},
|
|
"url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/1605989",
|
|
"version": "1"
|
|
},
|
|
"filetype": "text/html",
|
|
"image_url": "https://unstructured-ingest-test.atlassian.net/wiki/download/thumbnails/1605989/image-20230709-015203.png?version=1&modificationDate=1688907429067&cacheVersion=1&api=v2&width=680&height=259",
|
|
"languages": [
|
|
"eng",
|
|
"fra"
|
|
]
|
|
},
|
|
"text": "",
|
|
"type": "Image"
|
|
},
|
|
{
|
|
"element_id": "48d494bb12fd182b0106bff99dd2e3be",
|
|
"metadata": {
|
|
"data_source": {
|
|
"date_created": "2023-07-09T12:56:40.842000",
|
|
"date_modified": "2023-07-09T12:57:59.173000",
|
|
"record_locator": {
|
|
"page_id": "1605989",
|
|
"url": "https://unstructured-ingest-test.atlassian.net"
|
|
},
|
|
"url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/1605989",
|
|
"version": "1"
|
|
},
|
|
"filetype": "text/html",
|
|
"languages": [
|
|
"eng",
|
|
"fra"
|
|
]
|
|
},
|
|
"text": "Testdoc3 List Item 1",
|
|
"type": "UncategorizedText"
|
|
},
|
|
{
|
|
"element_id": "3f1b3ecb6515a47b94579cf7de892f09",
|
|
"metadata": {
|
|
"data_source": {
|
|
"date_created": "2023-07-09T12:56:40.842000",
|
|
"date_modified": "2023-07-09T12:57:59.173000",
|
|
"record_locator": {
|
|
"page_id": "1605989",
|
|
"url": "https://unstructured-ingest-test.atlassian.net"
|
|
},
|
|
"url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/1605989",
|
|
"version": "1"
|
|
},
|
|
"filetype": "text/html",
|
|
"languages": [
|
|
"eng",
|
|
"fra"
|
|
]
|
|
},
|
|
"text": "Testdoc3 List Item 1 Nested Item A",
|
|
"type": "UncategorizedText"
|
|
},
|
|
{
|
|
"element_id": "171423f703a966d2616837ed489f6975",
|
|
"metadata": {
|
|
"data_source": {
|
|
"date_created": "2023-07-09T12:56:40.842000",
|
|
"date_modified": "2023-07-09T12:57:59.173000",
|
|
"record_locator": {
|
|
"page_id": "1605989",
|
|
"url": "https://unstructured-ingest-test.atlassian.net"
|
|
},
|
|
"url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/1605989",
|
|
"version": "1"
|
|
},
|
|
"filetype": "text/html",
|
|
"languages": [
|
|
"eng",
|
|
"fra"
|
|
]
|
|
},
|
|
"text": "Testdoc3 List Item 1 Nested Item B",
|
|
"type": "UncategorizedText"
|
|
},
|
|
{
|
|
"element_id": "87daeeb71306ae76a90c0e6ccac0dd47",
|
|
"metadata": {
|
|
"data_source": {
|
|
"date_created": "2023-07-09T12:56:40.842000",
|
|
"date_modified": "2023-07-09T12:57:59.173000",
|
|
"record_locator": {
|
|
"page_id": "1605989",
|
|
"url": "https://unstructured-ingest-test.atlassian.net"
|
|
},
|
|
"url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/1605989",
|
|
"version": "1"
|
|
},
|
|
"filetype": "text/html",
|
|
"languages": [
|
|
"eng",
|
|
"fra"
|
|
]
|
|
},
|
|
"text": "Testdoc3 List Item 2",
|
|
"type": "UncategorizedText"
|
|
},
|
|
{
|
|
"element_id": "c4d15cc61c5d6a3f2350f758b82e487f",
|
|
"metadata": {
|
|
"data_source": {
|
|
"date_created": "2023-07-09T12:56:40.842000",
|
|
"date_modified": "2023-07-09T12:57:59.173000",
|
|
"record_locator": {
|
|
"page_id": "1605989",
|
|
"url": "https://unstructured-ingest-test.atlassian.net"
|
|
},
|
|
"url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/1605989",
|
|
"version": "1"
|
|
},
|
|
"filetype": "text/html",
|
|
"languages": [
|
|
"eng",
|
|
"fra"
|
|
]
|
|
},
|
|
"text": "Testdoc3 List Item 3",
|
|
"type": "UncategorizedText"
|
|
},
|
|
{
|
|
"element_id": "e069a6333ef83f6f250880a500439da3",
|
|
"metadata": {
|
|
"data_source": {
|
|
"date_created": "2023-07-09T12:56:40.842000",
|
|
"date_modified": "2023-07-09T12:57:59.173000",
|
|
"record_locator": {
|
|
"page_id": "1605989",
|
|
"url": "https://unstructured-ingest-test.atlassian.net"
|
|
},
|
|
"url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/1605989",
|
|
"version": "1"
|
|
},
|
|
"filetype": "text/html",
|
|
"languages": [
|
|
"eng",
|
|
"fra"
|
|
]
|
|
},
|
|
"text": "Testdoc3 List Item 4",
|
|
"type": "UncategorizedText"
|
|
},
|
|
{
|
|
"element_id": "2f030590e85c72dd4a2fc739cc05affe",
|
|
"metadata": {
|
|
"data_source": {
|
|
"date_created": "2023-07-09T12:56:40.842000",
|
|
"date_modified": "2023-07-09T12:57:59.173000",
|
|
"record_locator": {
|
|
"page_id": "1605989",
|
|
"url": "https://unstructured-ingest-test.atlassian.net"
|
|
},
|
|
"url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/1605989",
|
|
"version": "1"
|
|
},
|
|
"filetype": "text/html",
|
|
"languages": [
|
|
"eng",
|
|
"fra"
|
|
]
|
|
},
|
|
"text": "Testdoc3 List Item 5",
|
|
"type": "UncategorizedText"
|
|
},
|
|
{
|
|
"element_id": "2db738cf60bf0471df90b6141fc6a8e5",
|
|
"metadata": {
|
|
"data_source": {
|
|
"date_created": "2023-07-09T12:56:40.842000",
|
|
"date_modified": "2023-07-09T12:57:59.173000",
|
|
"record_locator": {
|
|
"page_id": "1605989",
|
|
"url": "https://unstructured-ingest-test.atlassian.net"
|
|
},
|
|
"url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/1605989",
|
|
"version": "1"
|
|
},
|
|
"filetype": "text/html",
|
|
"languages": [
|
|
"eng",
|
|
"fra"
|
|
],
|
|
"link_texts": [
|
|
"This is the link for unstructured . io."
|
|
],
|
|
"link_urls": [
|
|
"https://www.unstructured.io/"
|
|
]
|
|
},
|
|
"text": "This is the link for unstructured . io.",
|
|
"type": "NarrativeText"
|
|
},
|
|
{
|
|
"element_id": "ab3005ca05b4f48396361646916154b4",
|
|
"metadata": {
|
|
"data_source": {
|
|
"date_created": "2023-07-09T12:56:40.842000",
|
|
"date_modified": "2023-07-09T12:57:59.173000",
|
|
"record_locator": {
|
|
"page_id": "1605989",
|
|
"url": "https://unstructured-ingest-test.atlassian.net"
|
|
},
|
|
"url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/1605989",
|
|
"version": "1"
|
|
},
|
|
"filetype": "text/html",
|
|
"languages": [
|
|
"eng",
|
|
"fra"
|
|
]
|
|
},
|
|
"text": "Testdoc3 Checklist Item 1",
|
|
"type": "ListItem"
|
|
},
|
|
{
|
|
"element_id": "ac70c0a823f0a1d56777036e77e77fd9",
|
|
"metadata": {
|
|
"data_source": {
|
|
"date_created": "2023-07-09T12:56:40.842000",
|
|
"date_modified": "2023-07-09T12:57:59.173000",
|
|
"record_locator": {
|
|
"page_id": "1605989",
|
|
"url": "https://unstructured-ingest-test.atlassian.net"
|
|
},
|
|
"url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/1605989",
|
|
"version": "1"
|
|
},
|
|
"filetype": "text/html",
|
|
"languages": [
|
|
"eng",
|
|
"fra"
|
|
]
|
|
},
|
|
"text": "Testdoc3 Checklist Item 2 (checked)",
|
|
"type": "ListItem"
|
|
},
|
|
{
|
|
"element_id": "099fca1cec6f3eaa5f71ed9c2ed235e4",
|
|
"metadata": {
|
|
"data_source": {
|
|
"date_created": "2023-07-09T12:56:40.842000",
|
|
"date_modified": "2023-07-09T12:57:59.173000",
|
|
"record_locator": {
|
|
"page_id": "1605989",
|
|
"url": "https://unstructured-ingest-test.atlassian.net"
|
|
},
|
|
"url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/1605989",
|
|
"version": "1"
|
|
},
|
|
"filetype": "text/html",
|
|
"languages": [
|
|
"eng",
|
|
"fra"
|
|
]
|
|
},
|
|
"text": "Testdoc3 Checklist Item 3",
|
|
"type": "ListItem"
|
|
},
|
|
{
|
|
"element_id": "85d4a299ad3ee61201530bf0030808b1",
|
|
"metadata": {
|
|
"data_source": {
|
|
"date_created": "2023-07-09T12:56:40.842000",
|
|
"date_modified": "2023-07-09T12:57:59.173000",
|
|
"record_locator": {
|
|
"page_id": "1605989",
|
|
"url": "https://unstructured-ingest-test.atlassian.net"
|
|
},
|
|
"url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/1605989",
|
|
"version": "1"
|
|
},
|
|
"filetype": "text/html",
|
|
"languages": [
|
|
"eng",
|
|
"fra"
|
|
]
|
|
},
|
|
"text": "😃 😃 😃 😃 😃 😃 😃 😃 😃 😃 😃 😃",
|
|
"type": "UncategorizedText"
|
|
},
|
|
{
|
|
"element_id": "a1a4f27d3b3cc32777e25b3bb0766083",
|
|
"metadata": {
|
|
"data_source": {
|
|
"date_created": "2023-07-09T12:56:40.842000",
|
|
"date_modified": "2023-07-09T12:57:59.173000",
|
|
"record_locator": {
|
|
"page_id": "1605989",
|
|
"url": "https://unstructured-ingest-test.atlassian.net"
|
|
},
|
|
"url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/1605989",
|
|
"version": "1"
|
|
},
|
|
"emphasized_text_contents": [
|
|
"Testdoc3 bold text"
|
|
],
|
|
"emphasized_text_tags": [
|
|
"b"
|
|
],
|
|
"filetype": "text/html",
|
|
"languages": [
|
|
"eng",
|
|
"fra"
|
|
]
|
|
},
|
|
"text": "Testdoc3 bold text",
|
|
"type": "NarrativeText"
|
|
},
|
|
{
|
|
"element_id": "976749a5d532d1f18195d61fe8c04be3",
|
|
"metadata": {
|
|
"data_source": {
|
|
"date_created": "2023-07-09T12:56:40.842000",
|
|
"date_modified": "2023-07-09T12:57:59.173000",
|
|
"record_locator": {
|
|
"page_id": "1605989",
|
|
"url": "https://unstructured-ingest-test.atlassian.net"
|
|
},
|
|
"url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/1605989",
|
|
"version": "1"
|
|
},
|
|
"emphasized_text_contents": [
|
|
"Testdoc3 italic text"
|
|
],
|
|
"emphasized_text_tags": [
|
|
"i"
|
|
],
|
|
"filetype": "text/html",
|
|
"languages": [
|
|
"eng",
|
|
"fra"
|
|
]
|
|
},
|
|
"text": "Testdoc3 italic text",
|
|
"type": "UncategorizedText"
|
|
},
|
|
{
|
|
"element_id": "079d83c4a7622c70baab0336e3128ec4",
|
|
"metadata": {
|
|
"data_source": {
|
|
"date_created": "2023-07-09T12:56:40.842000",
|
|
"date_modified": "2023-07-09T12:57:59.173000",
|
|
"record_locator": {
|
|
"page_id": "1605989",
|
|
"url": "https://unstructured-ingest-test.atlassian.net"
|
|
},
|
|
"url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/1605989",
|
|
"version": "1"
|
|
},
|
|
"filetype": "text/html",
|
|
"languages": [
|
|
"eng",
|
|
"fra"
|
|
]
|
|
},
|
|
"text": "Testdoc3 Heading 1 Sized Text",
|
|
"type": "Title"
|
|
},
|
|
{
|
|
"element_id": "68e58e6fec19f4ec291fd5bcca3dadd8",
|
|
"metadata": {
|
|
"data_source": {
|
|
"date_created": "2023-07-09T12:56:40.842000",
|
|
"date_modified": "2023-07-09T12:57:59.173000",
|
|
"record_locator": {
|
|
"page_id": "1605989",
|
|
"url": "https://unstructured-ingest-test.atlassian.net"
|
|
},
|
|
"url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/1605989",
|
|
"version": "1"
|
|
},
|
|
"filetype": "text/html",
|
|
"languages": [
|
|
"eng",
|
|
"fra"
|
|
]
|
|
},
|
|
"text": "Testdoc3 Heading 2 Sized Text",
|
|
"type": "Title"
|
|
},
|
|
{
|
|
"element_id": "8dbaefc9dcf7af80f14871cdd2b0c1d6",
|
|
"metadata": {
|
|
"data_source": {
|
|
"date_created": "2023-07-09T12:56:40.842000",
|
|
"date_modified": "2023-07-09T12:57:59.173000",
|
|
"record_locator": {
|
|
"page_id": "1605989",
|
|
"url": "https://unstructured-ingest-test.atlassian.net"
|
|
},
|
|
"url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/1605989",
|
|
"version": "1"
|
|
},
|
|
"filetype": "text/html",
|
|
"languages": [
|
|
"eng",
|
|
"fra"
|
|
]
|
|
},
|
|
"text": "Testdoc3 Heading 3 Sized Text",
|
|
"type": "Title"
|
|
},
|
|
{
|
|
"element_id": "2ca9400f81b794c7d595f9bcd719b18a",
|
|
"metadata": {
|
|
"data_source": {
|
|
"date_created": "2023-07-09T12:56:40.842000",
|
|
"date_modified": "2023-07-09T12:57:59.173000",
|
|
"record_locator": {
|
|
"page_id": "1605989",
|
|
"url": "https://unstructured-ingest-test.atlassian.net"
|
|
},
|
|
"url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/1605989",
|
|
"version": "1"
|
|
},
|
|
"filetype": "text/html",
|
|
"languages": [
|
|
"eng",
|
|
"fra"
|
|
]
|
|
},
|
|
"text": "Testdoc3 Heading 4 Sized Text",
|
|
"type": "Title"
|
|
},
|
|
{
|
|
"element_id": "191672694e36e804e20214e8c9bd2d44",
|
|
"metadata": {
|
|
"data_source": {
|
|
"date_created": "2023-07-09T12:56:40.842000",
|
|
"date_modified": "2023-07-09T12:57:59.173000",
|
|
"record_locator": {
|
|
"page_id": "1605989",
|
|
"url": "https://unstructured-ingest-test.atlassian.net"
|
|
},
|
|
"url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/1605989",
|
|
"version": "1"
|
|
},
|
|
"filetype": "text/html",
|
|
"languages": [
|
|
"eng",
|
|
"fra"
|
|
]
|
|
},
|
|
"text": "Testdoc3 Heading 5 Sized Text",
|
|
"type": "Title"
|
|
},
|
|
{
|
|
"element_id": "10d98c7ebc4b2cd6e5508aa9563cc788",
|
|
"metadata": {
|
|
"data_source": {
|
|
"date_created": "2023-07-09T12:56:40.842000",
|
|
"date_modified": "2023-07-09T12:57:59.173000",
|
|
"record_locator": {
|
|
"page_id": "1605989",
|
|
"url": "https://unstructured-ingest-test.atlassian.net"
|
|
},
|
|
"url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/1605989",
|
|
"version": "1"
|
|
},
|
|
"filetype": "text/html",
|
|
"languages": [
|
|
"eng",
|
|
"fra"
|
|
],
|
|
"text_as_html": "<table><tr><td>Testdoc3 Table: Column 1 Row 0</td><td>Testdoc3 Table: Column 2 Row 0</td><td>Testdoc3 Table: Column 3 Row 0</td></tr><tr><td>Testdoc3 Table: Column 1 Row 1</td><td>Testdoc3 Table: Column 2 Row 1</td><td>Testdoc3 Table: Column 3 Row 1</td></tr><tr><td>Testdoc3 Table: Column 1 Row 2</td><td>Testdoc3 Table: Column 2 Row 2</td><td>Testdoc3 Table: Column 3 Row 2</td></tr></table>"
|
|
},
|
|
"text": "Testdoc3 Table: Column 1 Row 0 Testdoc3 Table: Column 2 Row 0 Testdoc3 Table: Column 3 Row 0 Testdoc3 Table: Column 1 Row 1 Testdoc3 Table: Column 2 Row 1 Testdoc3 Table: Column 3 Row 1 Testdoc3 Table: Column 1 Row 2 Testdoc3 Table: Column 2 Row 2 Testdoc3 Table: Column 3 Row 2",
|
|
"type": "Table"
|
|
},
|
|
{
|
|
"element_id": "45b142b9287e8ebadbc1dfb48ee5245a",
|
|
"metadata": {
|
|
"data_source": {
|
|
"date_created": "2023-07-09T12:56:40.842000",
|
|
"date_modified": "2023-07-09T12:57:59.173000",
|
|
"record_locator": {
|
|
"page_id": "1605989",
|
|
"url": "https://unstructured-ingest-test.atlassian.net"
|
|
},
|
|
"url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/1605989",
|
|
"version": "1"
|
|
},
|
|
"filetype": "text/html",
|
|
"image_url": "https://unstructured-ingest-test.atlassian.net/wiki/download/thumbnails/1605989/image-20230709-020021.png?version=1&modificationDate=1688907429074&cacheVersion=1&api=v2&width=475&height=236",
|
|
"languages": [
|
|
"eng",
|
|
"fra"
|
|
]
|
|
},
|
|
"text": "",
|
|
"type": "Image"
|
|
}
|
|
] |