mirror of
				https://github.com/Unstructured-IO/unstructured.git
				synced 2025-10-25 15:03:54 +00:00 
			
		
		
		
	 135aa65906
			
		
	
	
		135aa65906
		
			
		
	
	
	
	
		
			
			### Description * If the contents of a doc were updated by the process of reading/downloading it, this was not being persisted. To fix this, the data being passed around was updated to use a multiprocessing safe dict rather than the json string. Now that dict is updated after the `get_file` method is called. * Wikipedia connector was updated to use a static filename rather than one requiring a call to fetch data. * The read config param `re_download` was not being leveraged by the source node, this was fixed. * Added fix: chunking and embedding order reversed so chunking runs before embeddings --------- Co-authored-by: ryannikolaidis <1208590+ryannikolaidis@users.noreply.github.com> Co-authored-by: rbiseck3 <rbiseck3@users.noreply.github.com>
		
			
				
	
	
		
			1054 lines
		
	
	
		
			29 KiB
		
	
	
	
		
			JSON
		
	
	
	
	
	
			
		
		
	
	
			1054 lines
		
	
	
		
			29 KiB
		
	
	
	
		
			JSON
		
	
	
	
	
	
| [
 | |
|   {
 | |
|     "type": "Title",
 | |
|     "element_id": "8a15fc1eef0a58dbead47b882dbcdd24",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1",
 | |
|         "record_locator": {
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net",
 | |
|           "page_id": "229477"
 | |
|         },
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000"
 | |
|       },
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ],
 | |
|       "page_number": 1
 | |
|     },
 | |
|     "text": "Welcome to your team space!"
 | |
|   },
 | |
|   {
 | |
|     "type": "ListItem",
 | |
|     "element_id": "a621b19bad2c2be0cfe54534c90ab126",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1",
 | |
|         "record_locator": {
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net",
 | |
|           "page_id": "229477"
 | |
|         },
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000"
 | |
|       },
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ],
 | |
|       "page_number": 1
 | |
|     },
 | |
|     "text": "We've added some suggestions and placeholders. Everything is customizable."
 | |
|   },
 | |
|   {
 | |
|     "type": "ListItem",
 | |
|     "element_id": "2a2f2d2dcdde9622cd6972a774138f61",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1",
 | |
|         "record_locator": {
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net",
 | |
|           "page_id": "229477"
 | |
|         },
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000"
 | |
|       },
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ],
 | |
|       "page_number": 1,
 | |
|       "link_urls": [
 | |
|         "/wiki/spaces/MFS/pages/1540126/Template+-+Project+plan",
 | |
|         "/wiki/spaces/MFS/pages/1605928/Template+-+Meeting+notes",
 | |
|         "/wiki/spaces/MFS/pages/1605942/Template+-+Weekly+status+report"
 | |
|       ],
 | |
|       "link_texts": [
 | |
|         "Template - Project plan",
 | |
|         "Template - Meeting notes",
 | |
|         "Template - Weekly status report"
 | |
|       ]
 | |
|     },
 | |
|     "text": "Get started with page templates:Template - Project planTemplate - Meeting notesTemplate - Weekly status report"
 | |
|   },
 | |
|   {
 | |
|     "type": "ListItem",
 | |
|     "element_id": "84b8c34eea80326420f9b3e5b939497c",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1",
 | |
|         "record_locator": {
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net",
 | |
|           "page_id": "229477"
 | |
|         },
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000"
 | |
|       },
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ],
 | |
|       "page_number": 1,
 | |
|       "link_urls": [
 | |
|         "/wiki/spaces/MFS/pages/1605956/Get+the+most+out+of+your+team+space"
 | |
|       ],
 | |
|       "link_texts": [
 | |
|         "Get the most out of your team space"
 | |
|       ]
 | |
|     },
 | |
|     "text": "Check out Get the most out of your team space for more tips."
 | |
|   },
 | |
|   {
 | |
|     "type": "Title",
 | |
|     "element_id": "4efca0d10c5feb8e9b35eb1d994f2905",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1",
 | |
|         "record_locator": {
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net",
 | |
|           "page_id": "229477"
 | |
|         },
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000"
 | |
|       },
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ],
 | |
|       "page_number": 1
 | |
|     },
 | |
|     "text": "About"
 | |
|   },
 | |
|   {
 | |
|     "type": "NarrativeText",
 | |
|     "element_id": "7c7300ac1a16ec290de2442ba09763c1",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1",
 | |
|         "record_locator": {
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net",
 | |
|           "page_id": "229477"
 | |
|         },
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000"
 | |
|       },
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ],
 | |
|       "page_number": 1,
 | |
|       "emphasized_text_contents": [
 | |
|         "What is your team all about?",
 | |
|         "What is your team all about?"
 | |
|       ],
 | |
|       "emphasized_text_tags": [
 | |
|         "em",
 | |
|         "span"
 | |
|       ]
 | |
|     },
 | |
|     "text": "What is your team all about?"
 | |
|   },
 | |
|   {
 | |
|     "type": "Title",
 | |
|     "element_id": "d416dc3ddd2f2ba48ad2bb784b808856",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1",
 | |
|         "record_locator": {
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net",
 | |
|           "page_id": "229477"
 | |
|         },
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000"
 | |
|       },
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ],
 | |
|       "page_number": 1
 | |
|     },
 | |
|     "text": "Mission and vision"
 | |
|   },
 | |
|   {
 | |
|     "type": "NarrativeText",
 | |
|     "element_id": "0d9db833ea5d982786604025ab277aa6",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1",
 | |
|         "record_locator": {
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net",
 | |
|           "page_id": "229477"
 | |
|         },
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000"
 | |
|       },
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ],
 | |
|       "page_number": 1,
 | |
|       "emphasized_text_contents": [
 | |
|         "What is your team's mission? What is your vision?",
 | |
|         "What is your team's mission? What is your vision?"
 | |
|       ],
 | |
|       "emphasized_text_tags": [
 | |
|         "em",
 | |
|         "span"
 | |
|       ]
 | |
|     },
 | |
|     "text": "What is your team's mission? What is your vision?"
 | |
|   },
 | |
|   {
 | |
|     "type": "Title",
 | |
|     "element_id": "ecfdb98aaa881aa6cff78b56f2b1e4bc",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1",
 | |
|         "record_locator": {
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net",
 | |
|           "page_id": "229477"
 | |
|         },
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000"
 | |
|       },
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ],
 | |
|       "page_number": 1
 | |
|     },
 | |
|     "text": "Meet the team"
 | |
|   },
 | |
|   {
 | |
|     "type": "Title",
 | |
|     "element_id": "44a4aebe327cd902d50cc9462de55db4",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1",
 | |
|         "record_locator": {
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net",
 | |
|           "page_id": "229477"
 | |
|         },
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000"
 | |
|       },
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ],
 | |
|       "page_number": 1,
 | |
|       "emphasized_text_contents": [
 | |
|         "Add team members to your space.",
 | |
|         "Add team members to your space."
 | |
|       ],
 | |
|       "emphasized_text_tags": [
 | |
|         "em",
 | |
|         "span"
 | |
|       ]
 | |
|     },
 | |
|     "text": "Add team members to your space."
 | |
|   },
 | |
|   {
 | |
|     "type": "Title",
 | |
|     "element_id": "8062dbb50d1094a8047ec09c9e013d4b",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1",
 | |
|         "record_locator": {
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net",
 | |
|           "page_id": "229477"
 | |
|         },
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000"
 | |
|       },
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ],
 | |
|       "page_number": 1,
 | |
|       "emphasized_text_contents": [
 | |
|         "Team member"
 | |
|       ],
 | |
|       "emphasized_text_tags": [
 | |
|         "span"
 | |
|       ]
 | |
|     },
 | |
|     "text": "Team member"
 | |
|   },
 | |
|   {
 | |
|     "type": "Title",
 | |
|     "element_id": "14736a2eb9f4159f4b6b86f192c3c222",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1",
 | |
|         "record_locator": {
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net",
 | |
|           "page_id": "229477"
 | |
|         },
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000"
 | |
|       },
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ],
 | |
|       "page_number": 1,
 | |
|       "emphasized_text_contents": [
 | |
|         "Role"
 | |
|       ],
 | |
|       "emphasized_text_tags": [
 | |
|         "span"
 | |
|       ]
 | |
|     },
 | |
|     "text": "Role"
 | |
|   },
 | |
|   {
 | |
|     "type": "Title",
 | |
|     "element_id": "c91217be093ab3d9bc1ce3917ed89c8c",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1",
 | |
|         "record_locator": {
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net",
 | |
|           "page_id": "229477"
 | |
|         },
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000"
 | |
|       },
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ],
 | |
|       "page_number": 1,
 | |
|       "emphasized_text_contents": [
 | |
|         "Responsibility"
 | |
|       ],
 | |
|       "emphasized_text_tags": [
 | |
|         "span"
 | |
|       ]
 | |
|     },
 | |
|     "text": "Responsibility"
 | |
|   },
 | |
|   {
 | |
|     "type": "Title",
 | |
|     "element_id": "8062dbb50d1094a8047ec09c9e013d4b",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1",
 | |
|         "record_locator": {
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net",
 | |
|           "page_id": "229477"
 | |
|         },
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000"
 | |
|       },
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ],
 | |
|       "page_number": 1,
 | |
|       "emphasized_text_contents": [
 | |
|         "Team member"
 | |
|       ],
 | |
|       "emphasized_text_tags": [
 | |
|         "span"
 | |
|       ]
 | |
|     },
 | |
|     "text": "Team member"
 | |
|   },
 | |
|   {
 | |
|     "type": "Title",
 | |
|     "element_id": "14736a2eb9f4159f4b6b86f192c3c222",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1",
 | |
|         "record_locator": {
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net",
 | |
|           "page_id": "229477"
 | |
|         },
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000"
 | |
|       },
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ],
 | |
|       "page_number": 1,
 | |
|       "emphasized_text_contents": [
 | |
|         "Role"
 | |
|       ],
 | |
|       "emphasized_text_tags": [
 | |
|         "span"
 | |
|       ]
 | |
|     },
 | |
|     "text": "Role"
 | |
|   },
 | |
|   {
 | |
|     "type": "Title",
 | |
|     "element_id": "c91217be093ab3d9bc1ce3917ed89c8c",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1",
 | |
|         "record_locator": {
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net",
 | |
|           "page_id": "229477"
 | |
|         },
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000"
 | |
|       },
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ],
 | |
|       "page_number": 1,
 | |
|       "emphasized_text_contents": [
 | |
|         "Responsibility"
 | |
|       ],
 | |
|       "emphasized_text_tags": [
 | |
|         "span"
 | |
|       ]
 | |
|     },
 | |
|     "text": "Responsibility"
 | |
|   },
 | |
|   {
 | |
|     "type": "Title",
 | |
|     "element_id": "8062dbb50d1094a8047ec09c9e013d4b",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1",
 | |
|         "record_locator": {
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net",
 | |
|           "page_id": "229477"
 | |
|         },
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000"
 | |
|       },
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ],
 | |
|       "page_number": 1,
 | |
|       "emphasized_text_contents": [
 | |
|         "Team member"
 | |
|       ],
 | |
|       "emphasized_text_tags": [
 | |
|         "span"
 | |
|       ]
 | |
|     },
 | |
|     "text": "Team member"
 | |
|   },
 | |
|   {
 | |
|     "type": "Title",
 | |
|     "element_id": "14736a2eb9f4159f4b6b86f192c3c222",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1",
 | |
|         "record_locator": {
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net",
 | |
|           "page_id": "229477"
 | |
|         },
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000"
 | |
|       },
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ],
 | |
|       "page_number": 1,
 | |
|       "emphasized_text_contents": [
 | |
|         "Role"
 | |
|       ],
 | |
|       "emphasized_text_tags": [
 | |
|         "span"
 | |
|       ]
 | |
|     },
 | |
|     "text": "Role"
 | |
|   },
 | |
|   {
 | |
|     "type": "Title",
 | |
|     "element_id": "c91217be093ab3d9bc1ce3917ed89c8c",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1",
 | |
|         "record_locator": {
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net",
 | |
|           "page_id": "229477"
 | |
|         },
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000"
 | |
|       },
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ],
 | |
|       "page_number": 1,
 | |
|       "emphasized_text_contents": [
 | |
|         "Responsibility"
 | |
|       ],
 | |
|       "emphasized_text_tags": [
 | |
|         "span"
 | |
|       ]
 | |
|     },
 | |
|     "text": "Responsibility"
 | |
|   },
 | |
|   {
 | |
|     "type": "Title",
 | |
|     "element_id": "47aaf31b83d6bfd705b80bcd5b6269be",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1",
 | |
|         "record_locator": {
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net",
 | |
|           "page_id": "229477"
 | |
|         },
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000"
 | |
|       },
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ],
 | |
|       "page_number": 1
 | |
|     },
 | |
|     "text": "Contact us"
 | |
|   },
 | |
|   {
 | |
|     "type": "NarrativeText",
 | |
|     "element_id": "1c3db10eee185bd74b4a3de5e3175939",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1",
 | |
|         "record_locator": {
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net",
 | |
|           "page_id": "229477"
 | |
|         },
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000"
 | |
|       },
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ],
 | |
|       "page_number": 1,
 | |
|       "emphasized_text_contents": [
 | |
|         "How can someone reach out to your team?",
 | |
|         "How can someone reach out to your team?"
 | |
|       ],
 | |
|       "emphasized_text_tags": [
 | |
|         "em",
 | |
|         "span"
 | |
|       ]
 | |
|     },
 | |
|     "text": "How can someone reach out to your team?"
 | |
|   },
 | |
|   {
 | |
|     "type": "ListItem",
 | |
|     "element_id": "74abeee66eab3921cf03757abdb8d5e6",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1",
 | |
|         "record_locator": {
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net",
 | |
|           "page_id": "229477"
 | |
|         },
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000"
 | |
|       },
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ],
 | |
|       "page_number": 1,
 | |
|       "link_urls": [
 | |
|         "mailto:team@email.com"
 | |
|       ],
 | |
|       "link_texts": [
 | |
|         null
 | |
|       ],
 | |
|       "emphasized_text_contents": [
 | |
|         "team@email.com"
 | |
|       ],
 | |
|       "emphasized_text_tags": [
 | |
|         "span"
 | |
|       ]
 | |
|     },
 | |
|     "text": "team@email.com"
 | |
|   },
 | |
|   {
 | |
|     "type": "ListItem",
 | |
|     "element_id": "3d131368b43397ff5fbe0a9bf62c0f79",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1",
 | |
|         "record_locator": {
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net",
 | |
|           "page_id": "229477"
 | |
|         },
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000"
 | |
|       },
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ],
 | |
|       "page_number": 1,
 | |
|       "emphasized_text_contents": [
 | |
|         "Tickets"
 | |
|       ],
 | |
|       "emphasized_text_tags": [
 | |
|         "span"
 | |
|       ]
 | |
|     },
 | |
|     "text": "Tickets"
 | |
|   },
 | |
|   {
 | |
|     "type": "ListItem",
 | |
|     "element_id": "d54a2001284ac19f58ad73a62674244a",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1",
 | |
|         "record_locator": {
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net",
 | |
|           "page_id": "229477"
 | |
|         },
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000"
 | |
|       },
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ],
 | |
|       "page_number": 1,
 | |
|       "emphasized_text_contents": [
 | |
|         "Jira board"
 | |
|       ],
 | |
|       "emphasized_text_tags": [
 | |
|         "span"
 | |
|       ]
 | |
|     },
 | |
|     "text": "Jira board"
 | |
|   },
 | |
|   {
 | |
|     "type": "ListItem",
 | |
|     "element_id": "195a10e63a336aa995e242c92f17b756",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1",
 | |
|         "record_locator": {
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net",
 | |
|           "page_id": "229477"
 | |
|         },
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000"
 | |
|       },
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ],
 | |
|       "page_number": 1,
 | |
|       "emphasized_text_contents": [
 | |
|         "#channel"
 | |
|       ],
 | |
|       "emphasized_text_tags": [
 | |
|         "span"
 | |
|       ]
 | |
|     },
 | |
|     "text": "#channel"
 | |
|   },
 | |
|   {
 | |
|     "type": "Title",
 | |
|     "element_id": "c8b321a3bf39a57de24aac4cca6605a0",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1",
 | |
|         "record_locator": {
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net",
 | |
|           "page_id": "229477"
 | |
|         },
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000"
 | |
|       },
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ],
 | |
|       "page_number": 1
 | |
|     },
 | |
|     "text": "Important Pages"
 | |
|   },
 | |
|   {
 | |
|     "type": "NarrativeText",
 | |
|     "element_id": "43770d73ac7c6d8d1a38dd0c13fa8607",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1",
 | |
|         "record_locator": {
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net",
 | |
|           "page_id": "229477"
 | |
|         },
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000"
 | |
|       },
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ],
 | |
|       "page_number": 1,
 | |
|       "emphasized_text_contents": [
 | |
|         "List them here",
 | |
|         "List them here"
 | |
|       ],
 | |
|       "emphasized_text_tags": [
 | |
|         "em",
 | |
|         "span"
 | |
|       ]
 | |
|     },
 | |
|     "text": "List them here"
 | |
|   },
 | |
|   {
 | |
|     "type": "ListItem",
 | |
|     "element_id": "e3b0c44298fc1c149afbf4c8996fb924",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1",
 | |
|         "record_locator": {
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net",
 | |
|           "page_id": "229477"
 | |
|         },
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000"
 | |
|       },
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ],
 | |
|       "page_number": 1
 | |
|     },
 | |
|     "text": ""
 | |
|   },
 | |
|   {
 | |
|     "type": "ListItem",
 | |
|     "element_id": "e3b0c44298fc1c149afbf4c8996fb924",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1",
 | |
|         "record_locator": {
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net",
 | |
|           "page_id": "229477"
 | |
|         },
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000"
 | |
|       },
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ],
 | |
|       "page_number": 1
 | |
|     },
 | |
|     "text": ""
 | |
|   },
 | |
|   {
 | |
|     "type": "ListItem",
 | |
|     "element_id": "e3b0c44298fc1c149afbf4c8996fb924",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1",
 | |
|         "record_locator": {
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net",
 | |
|           "page_id": "229477"
 | |
|         },
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000"
 | |
|       },
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ],
 | |
|       "page_number": 1
 | |
|     },
 | |
|     "text": ""
 | |
|   },
 | |
|   {
 | |
|     "type": "Title",
 | |
|     "element_id": "86d353b1f4a6a63ab4577d94ba9d4fea",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1",
 | |
|         "record_locator": {
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net",
 | |
|           "page_id": "229477"
 | |
|         },
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000"
 | |
|       },
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ],
 | |
|       "page_number": 1
 | |
|     },
 | |
|     "text": "Onboarding FAQs"
 | |
|   },
 | |
|   {
 | |
|     "type": "Title",
 | |
|     "element_id": "2dd5afc718ccdf97d484020d740d20ce",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1",
 | |
|         "record_locator": {
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net",
 | |
|           "page_id": "229477"
 | |
|         },
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000"
 | |
|       },
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ],
 | |
|       "page_number": 1,
 | |
|       "emphasized_text_contents": [
 | |
|         "Add resources for new hires",
 | |
|         "Add resources for new hires"
 | |
|       ],
 | |
|       "emphasized_text_tags": [
 | |
|         "em",
 | |
|         "span"
 | |
|       ]
 | |
|     },
 | |
|     "text": "Add resources for new hires"
 | |
|   },
 | |
|   {
 | |
|     "type": "Title",
 | |
|     "element_id": "9e6c24f51918063b7c8514b3040ef52b",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1",
 | |
|         "record_locator": {
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net",
 | |
|           "page_id": "229477"
 | |
|         },
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000"
 | |
|       },
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ],
 | |
|       "page_number": 1
 | |
|     },
 | |
|     "text": "Meeting notes"
 | |
|   },
 | |
|   {
 | |
|     "type": "NarrativeText",
 | |
|     "element_id": "518cd477daaec831ad223c1d2e6b790f",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1",
 | |
|         "record_locator": {
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net",
 | |
|           "page_id": "229477"
 | |
|         },
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000"
 | |
|       },
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ],
 | |
|       "page_number": 1,
 | |
|       "emphasized_text_contents": [
 | |
|         "Add links to meeting notes",
 | |
|         "Add links to meeting notes"
 | |
|       ],
 | |
|       "emphasized_text_tags": [
 | |
|         "em",
 | |
|         "span"
 | |
|       ]
 | |
|     },
 | |
|     "text": "Add links to meeting notes"
 | |
|   },
 | |
|   {
 | |
|     "type": "Title",
 | |
|     "element_id": "f47e8394cbf0d8338b3dad5f95bcac3e",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1",
 | |
|         "record_locator": {
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net",
 | |
|           "page_id": "229477"
 | |
|         },
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000"
 | |
|       },
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ],
 | |
|       "page_number": 1
 | |
|     },
 | |
|     "text": "Team goals"
 | |
|   },
 | |
|   {
 | |
|     "type": "NarrativeText",
 | |
|     "element_id": "43770d73ac7c6d8d1a38dd0c13fa8607",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1",
 | |
|         "record_locator": {
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net",
 | |
|           "page_id": "229477"
 | |
|         },
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000"
 | |
|       },
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ],
 | |
|       "page_number": 1,
 | |
|       "emphasized_text_contents": [
 | |
|         "List them here",
 | |
|         "List them here"
 | |
|       ],
 | |
|       "emphasized_text_tags": [
 | |
|         "em",
 | |
|         "span"
 | |
|       ]
 | |
|     },
 | |
|     "text": "List them here"
 | |
|   },
 | |
|   {
 | |
|     "type": "Title",
 | |
|     "element_id": "c3a1dd0877d734e8ec68983d0cf737ce",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1",
 | |
|         "record_locator": {
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net",
 | |
|           "page_id": "229477"
 | |
|         },
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000"
 | |
|       },
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ],
 | |
|       "page_number": 1
 | |
|     },
 | |
|     "text": "Team news"
 | |
|   },
 | |
|   {
 | |
|     "type": "NarrativeText",
 | |
|     "element_id": "b2c91194db5ddc5e5b30240fbe5386d5",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1",
 | |
|         "record_locator": {
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net",
 | |
|           "page_id": "229477"
 | |
|         },
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000"
 | |
|       },
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ],
 | |
|       "page_number": 1,
 | |
|       "emphasized_text_contents": [
 | |
|         "Create a blog post to share team news. It will automatically appear here once it's published.",
 | |
|         "Create a blog post to share team news. It will automatically appear here once it's published."
 | |
|       ],
 | |
|       "emphasized_text_tags": [
 | |
|         "em",
 | |
|         "span"
 | |
|       ]
 | |
|     },
 | |
|     "text": "Create a blog post to share team news. It will automatically appear here once it's published."
 | |
|   },
 | |
|   {
 | |
|     "type": "Title",
 | |
|     "element_id": "903f4f48016cafdf332e01f2d004487f",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1",
 | |
|         "record_locator": {
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net",
 | |
|           "page_id": "229477"
 | |
|         },
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000"
 | |
|       },
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ],
 | |
|       "page_number": 1
 | |
|     },
 | |
|     "text": "Blog stream"
 | |
|   },
 | |
|   {
 | |
|     "type": "NarrativeText",
 | |
|     "element_id": "cfe366b5f8c8991d1e2af6e507e35a4e",
 | |
|     "metadata": {
 | |
|       "data_source": {
 | |
|         "url": "https://unstructured-ingest-test.atlassian.net/wiki/rest/api/content/229477",
 | |
|         "version": "1",
 | |
|         "record_locator": {
 | |
|           "url": "https://unstructured-ingest-test.atlassian.net",
 | |
|           "page_id": "229477"
 | |
|         },
 | |
|         "date_created": "2023-06-30T17:25:25.504000",
 | |
|         "date_modified": "2023-06-30T17:25:30.898000"
 | |
|       },
 | |
|       "filetype": "text/html",
 | |
|       "languages": [
 | |
|         "eng"
 | |
|       ],
 | |
|       "page_number": 1
 | |
|     },
 | |
|     "text": "Create a blog post to share news and announcements with your team and company."
 | |
|   }
 | |
| ] |