mirror of
				https://github.com/Unstructured-IO/unstructured.git
				synced 2025-10-24 22:41:05 +00:00 
			
		
		
		
	 542d442699
			
		
	
	
		542d442699
		
			
		
	
	
	
	
		
			
			### Summary Rip off page_number metadata fields until we have page counting for all kinds of html files (not just limited to news articles with multiple `<article>` tag) ### Test Unit tests `test_add_chunking_strategy_on_partition_html_respects_multipage` and `test_add_chunking_strategy_title_on_partition_auto_respects_multipage` removed since they relay on the `page_number` fields from the SEC html file - now test moved to mock test for chunk_by_title -> revisit those tests when we find test file for this Also changed the element ids from partition outputs for html files - element id change due to page number change (in element id hashing) -> todo ticket: update other deterministic element id tests per crag's comment --------- Co-authored-by: ryannikolaidis <1208590+ryannikolaidis@users.noreply.github.com> Co-authored-by: yuming-long <yuming-long@users.noreply.github.com>
		
			
				
	
	
		
			1025 lines
		
	
	
		
			28 KiB
		
	
	
	
		
			JSON
		
	
	
	
	
	
			
		
		
	
	
			1025 lines
		
	
	
		
			28 KiB
		
	
	
	
		
			JSON
		
	
	
	
	
	
| [
 | |
|   {
 | |
|     "element_id": "af28136055ec3b58ec92da684eabe972",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000",
 | |
|         "record_locator": {
 | |
|           "page_id": "229477",
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net"
 | |
|         },
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1"
 | |
|       },
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ]
 | |
|     },
 | |
|     "text": "Welcome to your team space!",
 | |
|     "type": "Title"
 | |
|   },
 | |
|   {
 | |
|     "element_id": "637226363ce2403ca3a797b8e400b470",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000",
 | |
|         "record_locator": {
 | |
|           "page_id": "229477",
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net"
 | |
|         },
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1"
 | |
|       },
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ]
 | |
|     },
 | |
|     "text": "We've added some suggestions and placeholders. Everything is customizable.",
 | |
|     "type": "ListItem"
 | |
|   },
 | |
|   {
 | |
|     "element_id": "1827a210ba924c56e275c47f4dcc8680",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000",
 | |
|         "record_locator": {
 | |
|           "page_id": "229477",
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net"
 | |
|         },
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1"
 | |
|       },
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ],
 | |
|       "link_start_indexes": [
 | |
|         32,
 | |
|         55,
 | |
|         79
 | |
|       ],
 | |
|       "link_texts": [
 | |
|         "Template - Project plan",
 | |
|         "Template - Meeting notes",
 | |
|         "Template - Weekly status report"
 | |
|       ],
 | |
|       "link_urls": [
 | |
|         "/wiki/spaces/MFS/pages/1540126/Template+-+Project+plan",
 | |
|         "/wiki/spaces/MFS/pages/1605928/Template+-+Meeting+notes",
 | |
|         "/wiki/spaces/MFS/pages/1605942/Template+-+Weekly+status+report"
 | |
|       ]
 | |
|     },
 | |
|     "text": "Get started with page templates:Template - Project planTemplate - Meeting notesTemplate - Weekly status report",
 | |
|     "type": "ListItem"
 | |
|   },
 | |
|   {
 | |
|     "element_id": "74ac57479647bf966333f308343d489e",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000",
 | |
|         "record_locator": {
 | |
|           "page_id": "229477",
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net"
 | |
|         },
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1"
 | |
|       },
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ],
 | |
|       "link_start_indexes": [
 | |
|         10
 | |
|       ],
 | |
|       "link_texts": [
 | |
|         "Get the most out of your team space"
 | |
|       ],
 | |
|       "link_urls": [
 | |
|         "/wiki/spaces/MFS/pages/1605956/Get+the+most+out+of+your+team+space"
 | |
|       ]
 | |
|     },
 | |
|     "text": "Check out Get the most out of your team space for more tips.",
 | |
|     "type": "ListItem"
 | |
|   },
 | |
|   {
 | |
|     "element_id": "42b26823e7d33c417844e3d9866cad89",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000",
 | |
|         "record_locator": {
 | |
|           "page_id": "229477",
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net"
 | |
|         },
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1"
 | |
|       },
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ]
 | |
|     },
 | |
|     "text": "About",
 | |
|     "type": "Title"
 | |
|   },
 | |
|   {
 | |
|     "element_id": "cf2be0c50ea0ff66bb1dfb0497c453e7",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000",
 | |
|         "record_locator": {
 | |
|           "page_id": "229477",
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net"
 | |
|         },
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1"
 | |
|       },
 | |
|       "emphasized_text_contents": [
 | |
|         "What is your team all about?",
 | |
|         "What is your team all about?"
 | |
|       ],
 | |
|       "emphasized_text_tags": [
 | |
|         "em",
 | |
|         "span"
 | |
|       ],
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ]
 | |
|     },
 | |
|     "text": "What is your team all about?",
 | |
|     "type": "NarrativeText"
 | |
|   },
 | |
|   {
 | |
|     "element_id": "53d259755e03050e0d88ddd6660a5e6c",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000",
 | |
|         "record_locator": {
 | |
|           "page_id": "229477",
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net"
 | |
|         },
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1"
 | |
|       },
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ]
 | |
|     },
 | |
|     "text": "Mission and vision",
 | |
|     "type": "Title"
 | |
|   },
 | |
|   {
 | |
|     "element_id": "a725e33535aa3530fe16f61a8417afd7",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000",
 | |
|         "record_locator": {
 | |
|           "page_id": "229477",
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net"
 | |
|         },
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1"
 | |
|       },
 | |
|       "emphasized_text_contents": [
 | |
|         "What is your team's mission? What is your vision?",
 | |
|         "What is your team's mission? What is your vision?"
 | |
|       ],
 | |
|       "emphasized_text_tags": [
 | |
|         "em",
 | |
|         "span"
 | |
|       ],
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ]
 | |
|     },
 | |
|     "text": "What is your team's mission? What is your vision?",
 | |
|     "type": "NarrativeText"
 | |
|   },
 | |
|   {
 | |
|     "element_id": "885d987a2a3077b6d014c1db0fa59252",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000",
 | |
|         "record_locator": {
 | |
|           "page_id": "229477",
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net"
 | |
|         },
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1"
 | |
|       },
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ]
 | |
|     },
 | |
|     "text": "Meet the team",
 | |
|     "type": "Title"
 | |
|   },
 | |
|   {
 | |
|     "element_id": "b578d6f9d0e812f6130f14d79a2c9c97",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000",
 | |
|         "record_locator": {
 | |
|           "page_id": "229477",
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net"
 | |
|         },
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1"
 | |
|       },
 | |
|       "emphasized_text_contents": [
 | |
|         "Add team members to your space.",
 | |
|         "Add team members to your space."
 | |
|       ],
 | |
|       "emphasized_text_tags": [
 | |
|         "em",
 | |
|         "span"
 | |
|       ],
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ]
 | |
|     },
 | |
|     "text": "Add team members to your space.",
 | |
|     "type": "Title"
 | |
|   },
 | |
|   {
 | |
|     "element_id": "7428e6a9256f6030b2137d082c7ffd27",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000",
 | |
|         "record_locator": {
 | |
|           "page_id": "229477",
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net"
 | |
|         },
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1"
 | |
|       },
 | |
|       "emphasized_text_contents": [
 | |
|         "Team member"
 | |
|       ],
 | |
|       "emphasized_text_tags": [
 | |
|         "span"
 | |
|       ],
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ]
 | |
|     },
 | |
|     "text": "Team member",
 | |
|     "type": "Title"
 | |
|   },
 | |
|   {
 | |
|     "element_id": "6aaa4f81530815729e63c057ee8606b5",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000",
 | |
|         "record_locator": {
 | |
|           "page_id": "229477",
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net"
 | |
|         },
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1"
 | |
|       },
 | |
|       "emphasized_text_contents": [
 | |
|         "Role"
 | |
|       ],
 | |
|       "emphasized_text_tags": [
 | |
|         "span"
 | |
|       ],
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ]
 | |
|     },
 | |
|     "text": "Role",
 | |
|     "type": "Title"
 | |
|   },
 | |
|   {
 | |
|     "element_id": "9c3c330b00ee89060e13303f5e02bcba",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000",
 | |
|         "record_locator": {
 | |
|           "page_id": "229477",
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net"
 | |
|         },
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1"
 | |
|       },
 | |
|       "emphasized_text_contents": [
 | |
|         "Responsibility"
 | |
|       ],
 | |
|       "emphasized_text_tags": [
 | |
|         "span"
 | |
|       ],
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ]
 | |
|     },
 | |
|     "text": "Responsibility",
 | |
|     "type": "Title"
 | |
|   },
 | |
|   {
 | |
|     "element_id": "8e206800f74b037f87bc91ce09a66587",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000",
 | |
|         "record_locator": {
 | |
|           "page_id": "229477",
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net"
 | |
|         },
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1"
 | |
|       },
 | |
|       "emphasized_text_contents": [
 | |
|         "Team member"
 | |
|       ],
 | |
|       "emphasized_text_tags": [
 | |
|         "span"
 | |
|       ],
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ]
 | |
|     },
 | |
|     "text": "Team member",
 | |
|     "type": "Title"
 | |
|   },
 | |
|   {
 | |
|     "element_id": "2c4cc93ed9393b0f05a3e564c436e13e",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000",
 | |
|         "record_locator": {
 | |
|           "page_id": "229477",
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net"
 | |
|         },
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1"
 | |
|       },
 | |
|       "emphasized_text_contents": [
 | |
|         "Role"
 | |
|       ],
 | |
|       "emphasized_text_tags": [
 | |
|         "span"
 | |
|       ],
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ]
 | |
|     },
 | |
|     "text": "Role",
 | |
|     "type": "Title"
 | |
|   },
 | |
|   {
 | |
|     "element_id": "554c2527470d9fea2aaf8cefd8aa8ffc",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000",
 | |
|         "record_locator": {
 | |
|           "page_id": "229477",
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net"
 | |
|         },
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1"
 | |
|       },
 | |
|       "emphasized_text_contents": [
 | |
|         "Responsibility"
 | |
|       ],
 | |
|       "emphasized_text_tags": [
 | |
|         "span"
 | |
|       ],
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ]
 | |
|     },
 | |
|     "text": "Responsibility",
 | |
|     "type": "Title"
 | |
|   },
 | |
|   {
 | |
|     "element_id": "feb3b3be79c77e3d661dc3fa522de26f",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000",
 | |
|         "record_locator": {
 | |
|           "page_id": "229477",
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net"
 | |
|         },
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1"
 | |
|       },
 | |
|       "emphasized_text_contents": [
 | |
|         "Team member"
 | |
|       ],
 | |
|       "emphasized_text_tags": [
 | |
|         "span"
 | |
|       ],
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ]
 | |
|     },
 | |
|     "text": "Team member",
 | |
|     "type": "Title"
 | |
|   },
 | |
|   {
 | |
|     "element_id": "5a73ff028549542468675768deee0430",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000",
 | |
|         "record_locator": {
 | |
|           "page_id": "229477",
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net"
 | |
|         },
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1"
 | |
|       },
 | |
|       "emphasized_text_contents": [
 | |
|         "Role"
 | |
|       ],
 | |
|       "emphasized_text_tags": [
 | |
|         "span"
 | |
|       ],
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ]
 | |
|     },
 | |
|     "text": "Role",
 | |
|     "type": "Title"
 | |
|   },
 | |
|   {
 | |
|     "element_id": "94d211691238a7f3f74db151876c6734",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000",
 | |
|         "record_locator": {
 | |
|           "page_id": "229477",
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net"
 | |
|         },
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1"
 | |
|       },
 | |
|       "emphasized_text_contents": [
 | |
|         "Responsibility"
 | |
|       ],
 | |
|       "emphasized_text_tags": [
 | |
|         "span"
 | |
|       ],
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ]
 | |
|     },
 | |
|     "text": "Responsibility",
 | |
|     "type": "Title"
 | |
|   },
 | |
|   {
 | |
|     "element_id": "819971206479a68fc2c9b189efb456bc",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000",
 | |
|         "record_locator": {
 | |
|           "page_id": "229477",
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net"
 | |
|         },
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1"
 | |
|       },
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ]
 | |
|     },
 | |
|     "text": "Contact us",
 | |
|     "type": "Title"
 | |
|   },
 | |
|   {
 | |
|     "element_id": "c8a0d091f295537e075e91a05c5b9700",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000",
 | |
|         "record_locator": {
 | |
|           "page_id": "229477",
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net"
 | |
|         },
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1"
 | |
|       },
 | |
|       "emphasized_text_contents": [
 | |
|         "How can someone reach out to your team?",
 | |
|         "How can someone reach out to your team?"
 | |
|       ],
 | |
|       "emphasized_text_tags": [
 | |
|         "em",
 | |
|         "span"
 | |
|       ],
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ]
 | |
|     },
 | |
|     "text": "How can someone reach out to your team?",
 | |
|     "type": "NarrativeText"
 | |
|   },
 | |
|   {
 | |
|     "element_id": "55d2e1480c9b0daa291da9bb125ed991",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000",
 | |
|         "record_locator": {
 | |
|           "page_id": "229477",
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net"
 | |
|         },
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1"
 | |
|       },
 | |
|       "emphasized_text_contents": [
 | |
|         "team@email.com"
 | |
|       ],
 | |
|       "emphasized_text_tags": [
 | |
|         "span"
 | |
|       ],
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ],
 | |
|       "link_start_indexes": [
 | |
|         0
 | |
|       ],
 | |
|       "link_texts": [
 | |
|         null
 | |
|       ],
 | |
|       "link_urls": [
 | |
|         "mailto:team@email.com"
 | |
|       ]
 | |
|     },
 | |
|     "text": "team@email.com",
 | |
|     "type": "ListItem"
 | |
|   },
 | |
|   {
 | |
|     "element_id": "8cdf7c104c621a61684afb22e1a12ae6",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000",
 | |
|         "record_locator": {
 | |
|           "page_id": "229477",
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net"
 | |
|         },
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1"
 | |
|       },
 | |
|       "emphasized_text_contents": [
 | |
|         "Tickets"
 | |
|       ],
 | |
|       "emphasized_text_tags": [
 | |
|         "span"
 | |
|       ],
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ]
 | |
|     },
 | |
|     "text": "Tickets",
 | |
|     "type": "ListItem"
 | |
|   },
 | |
|   {
 | |
|     "element_id": "184e1ab78f1ad23cbd87e4051a2e44ba",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000",
 | |
|         "record_locator": {
 | |
|           "page_id": "229477",
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net"
 | |
|         },
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1"
 | |
|       },
 | |
|       "emphasized_text_contents": [
 | |
|         "Jira board"
 | |
|       ],
 | |
|       "emphasized_text_tags": [
 | |
|         "span"
 | |
|       ],
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ]
 | |
|     },
 | |
|     "text": "Jira board",
 | |
|     "type": "ListItem"
 | |
|   },
 | |
|   {
 | |
|     "element_id": "b11108036b6d8a3c5beff0ba72018fbf",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000",
 | |
|         "record_locator": {
 | |
|           "page_id": "229477",
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net"
 | |
|         },
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1"
 | |
|       },
 | |
|       "emphasized_text_contents": [
 | |
|         "#channel"
 | |
|       ],
 | |
|       "emphasized_text_tags": [
 | |
|         "span"
 | |
|       ],
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ]
 | |
|     },
 | |
|     "text": "#channel",
 | |
|     "type": "ListItem"
 | |
|   },
 | |
|   {
 | |
|     "element_id": "bec770c2e66ae2747664908931bc34bb",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000",
 | |
|         "record_locator": {
 | |
|           "page_id": "229477",
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net"
 | |
|         },
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1"
 | |
|       },
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ]
 | |
|     },
 | |
|     "text": "Important Pages",
 | |
|     "type": "Title"
 | |
|   },
 | |
|   {
 | |
|     "element_id": "5c143a6e4a05107f68ef13d7da7cd3ed",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000",
 | |
|         "record_locator": {
 | |
|           "page_id": "229477",
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net"
 | |
|         },
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1"
 | |
|       },
 | |
|       "emphasized_text_contents": [
 | |
|         "List them here",
 | |
|         "List them here"
 | |
|       ],
 | |
|       "emphasized_text_tags": [
 | |
|         "em",
 | |
|         "span"
 | |
|       ],
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ]
 | |
|     },
 | |
|     "text": "List them here",
 | |
|     "type": "NarrativeText"
 | |
|   },
 | |
|   {
 | |
|     "element_id": "656e2cc40d11fdc4906f2dd580a19c6a",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000",
 | |
|         "record_locator": {
 | |
|           "page_id": "229477",
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net"
 | |
|         },
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1"
 | |
|       },
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ]
 | |
|     },
 | |
|     "text": "",
 | |
|     "type": "ListItem"
 | |
|   },
 | |
|   {
 | |
|     "element_id": "618b555629238a470093892056791c8d",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000",
 | |
|         "record_locator": {
 | |
|           "page_id": "229477",
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net"
 | |
|         },
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1"
 | |
|       },
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ]
 | |
|     },
 | |
|     "text": "",
 | |
|     "type": "ListItem"
 | |
|   },
 | |
|   {
 | |
|     "element_id": "fb61fd8022c3b78d934d1407834e5409",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000",
 | |
|         "record_locator": {
 | |
|           "page_id": "229477",
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net"
 | |
|         },
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1"
 | |
|       },
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ]
 | |
|     },
 | |
|     "text": "",
 | |
|     "type": "ListItem"
 | |
|   },
 | |
|   {
 | |
|     "element_id": "68accd9d0365712f54b96da661cce03d",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000",
 | |
|         "record_locator": {
 | |
|           "page_id": "229477",
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net"
 | |
|         },
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1"
 | |
|       },
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ]
 | |
|     },
 | |
|     "text": "Onboarding FAQs",
 | |
|     "type": "Title"
 | |
|   },
 | |
|   {
 | |
|     "element_id": "35aa0d02a38ad72c0ca0534155dbdeb8",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000",
 | |
|         "record_locator": {
 | |
|           "page_id": "229477",
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net"
 | |
|         },
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1"
 | |
|       },
 | |
|       "emphasized_text_contents": [
 | |
|         "Add resources for new hires",
 | |
|         "Add resources for new hires"
 | |
|       ],
 | |
|       "emphasized_text_tags": [
 | |
|         "em",
 | |
|         "span"
 | |
|       ],
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ]
 | |
|     },
 | |
|     "text": "Add resources for new hires",
 | |
|     "type": "Title"
 | |
|   },
 | |
|   {
 | |
|     "element_id": "ea538f1ebdd2ced67e8c86dcf50bc164",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000",
 | |
|         "record_locator": {
 | |
|           "page_id": "229477",
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net"
 | |
|         },
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1"
 | |
|       },
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ]
 | |
|     },
 | |
|     "text": "Meeting notes",
 | |
|     "type": "Title"
 | |
|   },
 | |
|   {
 | |
|     "element_id": "6f4ae84a8d8a1d9005384f35e2ce793c",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000",
 | |
|         "record_locator": {
 | |
|           "page_id": "229477",
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net"
 | |
|         },
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1"
 | |
|       },
 | |
|       "emphasized_text_contents": [
 | |
|         "Add links to meeting notes",
 | |
|         "Add links to meeting notes"
 | |
|       ],
 | |
|       "emphasized_text_tags": [
 | |
|         "em",
 | |
|         "span"
 | |
|       ],
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ]
 | |
|     },
 | |
|     "text": "Add links to meeting notes",
 | |
|     "type": "NarrativeText"
 | |
|   },
 | |
|   {
 | |
|     "element_id": "9616030a71ad0e0654b28e61578d0443",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000",
 | |
|         "record_locator": {
 | |
|           "page_id": "229477",
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net"
 | |
|         },
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1"
 | |
|       },
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ]
 | |
|     },
 | |
|     "text": "Team goals",
 | |
|     "type": "Title"
 | |
|   },
 | |
|   {
 | |
|     "element_id": "d81cb76df56721595c0495e4f5e6094f",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000",
 | |
|         "record_locator": {
 | |
|           "page_id": "229477",
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net"
 | |
|         },
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1"
 | |
|       },
 | |
|       "emphasized_text_contents": [
 | |
|         "List them here",
 | |
|         "List them here"
 | |
|       ],
 | |
|       "emphasized_text_tags": [
 | |
|         "em",
 | |
|         "span"
 | |
|       ],
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ]
 | |
|     },
 | |
|     "text": "List them here",
 | |
|     "type": "NarrativeText"
 | |
|   },
 | |
|   {
 | |
|     "element_id": "46c3bd98dbea47cb63923597c929b932",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000",
 | |
|         "record_locator": {
 | |
|           "page_id": "229477",
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net"
 | |
|         },
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1"
 | |
|       },
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ]
 | |
|     },
 | |
|     "text": "Team news",
 | |
|     "type": "Title"
 | |
|   },
 | |
|   {
 | |
|     "element_id": "1558d5e9d97c1cbb5cbb5cb2b077f83d",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000",
 | |
|         "record_locator": {
 | |
|           "page_id": "229477",
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net"
 | |
|         },
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1"
 | |
|       },
 | |
|       "emphasized_text_contents": [
 | |
|         "Create a blog post to share team news. It will automatically appear here once it's published.",
 | |
|         "Create a blog post to share team news. It will automatically appear here once it's published."
 | |
|       ],
 | |
|       "emphasized_text_tags": [
 | |
|         "em",
 | |
|         "span"
 | |
|       ],
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ]
 | |
|     },
 | |
|     "text": "Create a blog post to share team news. It will automatically appear here once it's published.",
 | |
|     "type": "NarrativeText"
 | |
|   },
 | |
|   {
 | |
|     "element_id": "c281ed85f2e1125c9aaf318fd5178d4d",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000",
 | |
|         "record_locator": {
 | |
|           "page_id": "229477",
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net"
 | |
|         },
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1"
 | |
|       },
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ]
 | |
|     },
 | |
|     "text": "Blog stream",
 | |
|     "type": "Title"
 | |
|   },
 | |
|   {
 | |
|     "element_id": "4b401fd3bc190fce17f70000e0164772",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000",
 | |
|         "record_locator": {
 | |
|           "page_id": "229477",
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net"
 | |
|         },
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1"
 | |
|       },
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ]
 | |
|     },
 | |
|     "text": "Create a blog post to share news and announcements with your team and company.",
 | |
|     "type": "NarrativeText"
 | |
|   }
 | |
| ] |