mirror of
https://github.com/Unstructured-IO/unstructured.git
synced 2026-01-04 03:03:55 +00:00
feat: save file id for all fsspec connectors if present (#3405)
### Description If the id value exists in the stats response from fsspec, save it as a `file_id` field in the metadata being persisted on each element. --------- Co-authored-by: ryannikolaidis <1208590+ryannikolaidis@users.noreply.github.com> Co-authored-by: rbiseck3 <rbiseck3@users.noreply.github.com>
This commit is contained in:
parent
0eb461acc2
commit
1df7908f03
@ -1,4 +1,4 @@
|
||||
## 0.15.0-dev15
|
||||
## 0.15.0-dev16
|
||||
|
||||
### Enhancements
|
||||
|
||||
|
||||
@ -14,7 +14,8 @@
|
||||
"version": "83125548004193369404829885052395764226",
|
||||
"record_locator": {
|
||||
"protocol": "box",
|
||||
"remote_file_path": "box://utic-test-ingest-fixtures"
|
||||
"remote_file_path": "box://utic-test-ingest-fixtures",
|
||||
"file_id": "1255888824139"
|
||||
},
|
||||
"date_created": "1688874451.0",
|
||||
"date_modified": "1688874451.0"
|
||||
@ -41,7 +42,8 @@
|
||||
"version": "83125548004193369404829885052395764226",
|
||||
"record_locator": {
|
||||
"protocol": "box",
|
||||
"remote_file_path": "box://utic-test-ingest-fixtures"
|
||||
"remote_file_path": "box://utic-test-ingest-fixtures",
|
||||
"file_id": "1255888824139"
|
||||
},
|
||||
"date_created": "1688874451.0",
|
||||
"date_modified": "1688874451.0"
|
||||
@ -68,7 +70,8 @@
|
||||
"version": "83125548004193369404829885052395764226",
|
||||
"record_locator": {
|
||||
"protocol": "box",
|
||||
"remote_file_path": "box://utic-test-ingest-fixtures"
|
||||
"remote_file_path": "box://utic-test-ingest-fixtures",
|
||||
"file_id": "1255888824139"
|
||||
},
|
||||
"date_created": "1688874451.0",
|
||||
"date_modified": "1688874451.0"
|
||||
@ -89,7 +92,8 @@
|
||||
"version": "83125548004193369404829885052395764226",
|
||||
"record_locator": {
|
||||
"protocol": "box",
|
||||
"remote_file_path": "box://utic-test-ingest-fixtures"
|
||||
"remote_file_path": "box://utic-test-ingest-fixtures",
|
||||
"file_id": "1255888824139"
|
||||
},
|
||||
"date_created": "1688874451.0",
|
||||
"date_modified": "1688874451.0"
|
||||
@ -110,7 +114,8 @@
|
||||
"version": "83125548004193369404829885052395764226",
|
||||
"record_locator": {
|
||||
"protocol": "box",
|
||||
"remote_file_path": "box://utic-test-ingest-fixtures"
|
||||
"remote_file_path": "box://utic-test-ingest-fixtures",
|
||||
"file_id": "1255888824139"
|
||||
},
|
||||
"date_created": "1688874451.0",
|
||||
"date_modified": "1688874451.0"
|
||||
@ -131,7 +136,8 @@
|
||||
"version": "83125548004193369404829885052395764226",
|
||||
"record_locator": {
|
||||
"protocol": "box",
|
||||
"remote_file_path": "box://utic-test-ingest-fixtures"
|
||||
"remote_file_path": "box://utic-test-ingest-fixtures",
|
||||
"file_id": "1255888824139"
|
||||
},
|
||||
"date_created": "1688874451.0",
|
||||
"date_modified": "1688874451.0"
|
||||
@ -152,7 +158,8 @@
|
||||
"version": "83125548004193369404829885052395764226",
|
||||
"record_locator": {
|
||||
"protocol": "box",
|
||||
"remote_file_path": "box://utic-test-ingest-fixtures"
|
||||
"remote_file_path": "box://utic-test-ingest-fixtures",
|
||||
"file_id": "1255888824139"
|
||||
},
|
||||
"date_created": "1688874451.0",
|
||||
"date_modified": "1688874451.0"
|
||||
@ -173,7 +180,8 @@
|
||||
"version": "83125548004193369404829885052395764226",
|
||||
"record_locator": {
|
||||
"protocol": "box",
|
||||
"remote_file_path": "box://utic-test-ingest-fixtures"
|
||||
"remote_file_path": "box://utic-test-ingest-fixtures",
|
||||
"file_id": "1255888824139"
|
||||
},
|
||||
"date_created": "1688874451.0",
|
||||
"date_modified": "1688874451.0"
|
||||
@ -194,7 +202,8 @@
|
||||
"version": "83125548004193369404829885052395764226",
|
||||
"record_locator": {
|
||||
"protocol": "box",
|
||||
"remote_file_path": "box://utic-test-ingest-fixtures"
|
||||
"remote_file_path": "box://utic-test-ingest-fixtures",
|
||||
"file_id": "1255888824139"
|
||||
},
|
||||
"date_created": "1688874451.0",
|
||||
"date_modified": "1688874451.0"
|
||||
@ -215,7 +224,8 @@
|
||||
"version": "83125548004193369404829885052395764226",
|
||||
"record_locator": {
|
||||
"protocol": "box",
|
||||
"remote_file_path": "box://utic-test-ingest-fixtures"
|
||||
"remote_file_path": "box://utic-test-ingest-fixtures",
|
||||
"file_id": "1255888824139"
|
||||
},
|
||||
"date_created": "1688874451.0",
|
||||
"date_modified": "1688874451.0"
|
||||
@ -236,7 +246,8 @@
|
||||
"version": "83125548004193369404829885052395764226",
|
||||
"record_locator": {
|
||||
"protocol": "box",
|
||||
"remote_file_path": "box://utic-test-ingest-fixtures"
|
||||
"remote_file_path": "box://utic-test-ingest-fixtures",
|
||||
"file_id": "1255888824139"
|
||||
},
|
||||
"date_created": "1688874451.0",
|
||||
"date_modified": "1688874451.0"
|
||||
@ -257,7 +268,8 @@
|
||||
"version": "83125548004193369404829885052395764226",
|
||||
"record_locator": {
|
||||
"protocol": "box",
|
||||
"remote_file_path": "box://utic-test-ingest-fixtures"
|
||||
"remote_file_path": "box://utic-test-ingest-fixtures",
|
||||
"file_id": "1255888824139"
|
||||
},
|
||||
"date_created": "1688874451.0",
|
||||
"date_modified": "1688874451.0"
|
||||
@ -278,7 +290,8 @@
|
||||
"version": "83125548004193369404829885052395764226",
|
||||
"record_locator": {
|
||||
"protocol": "box",
|
||||
"remote_file_path": "box://utic-test-ingest-fixtures"
|
||||
"remote_file_path": "box://utic-test-ingest-fixtures",
|
||||
"file_id": "1255888824139"
|
||||
},
|
||||
"date_created": "1688874451.0",
|
||||
"date_modified": "1688874451.0"
|
||||
@ -299,7 +312,8 @@
|
||||
"version": "83125548004193369404829885052395764226",
|
||||
"record_locator": {
|
||||
"protocol": "box",
|
||||
"remote_file_path": "box://utic-test-ingest-fixtures"
|
||||
"remote_file_path": "box://utic-test-ingest-fixtures",
|
||||
"file_id": "1255888824139"
|
||||
},
|
||||
"date_created": "1688874451.0",
|
||||
"date_modified": "1688874451.0"
|
||||
@ -321,7 +335,8 @@
|
||||
"version": "83125548004193369404829885052395764226",
|
||||
"record_locator": {
|
||||
"protocol": "box",
|
||||
"remote_file_path": "box://utic-test-ingest-fixtures"
|
||||
"remote_file_path": "box://utic-test-ingest-fixtures",
|
||||
"file_id": "1255888824139"
|
||||
},
|
||||
"date_created": "1688874451.0",
|
||||
"date_modified": "1688874451.0"
|
||||
|
||||
@ -14,7 +14,8 @@
|
||||
"version": "77943175838335685751163845636763163681",
|
||||
"record_locator": {
|
||||
"protocol": "box",
|
||||
"remote_file_path": "box://utic-test-ingest-fixtures"
|
||||
"remote_file_path": "box://utic-test-ingest-fixtures",
|
||||
"file_id": "1255892530552"
|
||||
},
|
||||
"date_created": "1688874401.0",
|
||||
"date_modified": "1688874401.0"
|
||||
|
||||
@ -14,7 +14,8 @@
|
||||
"version": "293680985726204769765169474511274942733",
|
||||
"record_locator": {
|
||||
"protocol": "box",
|
||||
"remote_file_path": "box://utic-test-ingest-fixtures"
|
||||
"remote_file_path": "box://utic-test-ingest-fixtures",
|
||||
"file_id": "1255884723846"
|
||||
},
|
||||
"date_created": "1688874389.0",
|
||||
"date_modified": "1688874389.0"
|
||||
|
||||
@ -14,7 +14,8 @@
|
||||
"version": "309546934335254463247992132065898582121",
|
||||
"record_locator": {
|
||||
"protocol": "box",
|
||||
"remote_file_path": "box://utic-test-ingest-fixtures"
|
||||
"remote_file_path": "box://utic-test-ingest-fixtures",
|
||||
"file_id": "1255894255490"
|
||||
},
|
||||
"date_created": "1688874428.0",
|
||||
"date_modified": "1688874428.0"
|
||||
@ -36,7 +37,8 @@
|
||||
"version": "309546934335254463247992132065898582121",
|
||||
"record_locator": {
|
||||
"protocol": "box",
|
||||
"remote_file_path": "box://utic-test-ingest-fixtures"
|
||||
"remote_file_path": "box://utic-test-ingest-fixtures",
|
||||
"file_id": "1255894255490"
|
||||
},
|
||||
"date_created": "1688874428.0",
|
||||
"date_modified": "1688874428.0"
|
||||
@ -58,7 +60,8 @@
|
||||
"version": "309546934335254463247992132065898582121",
|
||||
"record_locator": {
|
||||
"protocol": "box",
|
||||
"remote_file_path": "box://utic-test-ingest-fixtures"
|
||||
"remote_file_path": "box://utic-test-ingest-fixtures",
|
||||
"file_id": "1255894255490"
|
||||
},
|
||||
"date_created": "1688874428.0",
|
||||
"date_modified": "1688874428.0"
|
||||
@ -80,7 +83,8 @@
|
||||
"version": "309546934335254463247992132065898582121",
|
||||
"record_locator": {
|
||||
"protocol": "box",
|
||||
"remote_file_path": "box://utic-test-ingest-fixtures"
|
||||
"remote_file_path": "box://utic-test-ingest-fixtures",
|
||||
"file_id": "1255894255490"
|
||||
},
|
||||
"date_created": "1688874428.0",
|
||||
"date_modified": "1688874428.0"
|
||||
@ -102,7 +106,8 @@
|
||||
"version": "309546934335254463247992132065898582121",
|
||||
"record_locator": {
|
||||
"protocol": "box",
|
||||
"remote_file_path": "box://utic-test-ingest-fixtures"
|
||||
"remote_file_path": "box://utic-test-ingest-fixtures",
|
||||
"file_id": "1255894255490"
|
||||
},
|
||||
"date_created": "1688874428.0",
|
||||
"date_modified": "1688874428.0"
|
||||
@ -124,7 +129,8 @@
|
||||
"version": "309546934335254463247992132065898582121",
|
||||
"record_locator": {
|
||||
"protocol": "box",
|
||||
"remote_file_path": "box://utic-test-ingest-fixtures"
|
||||
"remote_file_path": "box://utic-test-ingest-fixtures",
|
||||
"file_id": "1255894255490"
|
||||
},
|
||||
"date_created": "1688874428.0",
|
||||
"date_modified": "1688874428.0"
|
||||
@ -146,7 +152,8 @@
|
||||
"version": "309546934335254463247992132065898582121",
|
||||
"record_locator": {
|
||||
"protocol": "box",
|
||||
"remote_file_path": "box://utic-test-ingest-fixtures"
|
||||
"remote_file_path": "box://utic-test-ingest-fixtures",
|
||||
"file_id": "1255894255490"
|
||||
},
|
||||
"date_created": "1688874428.0",
|
||||
"date_modified": "1688874428.0"
|
||||
@ -168,7 +175,8 @@
|
||||
"version": "309546934335254463247992132065898582121",
|
||||
"record_locator": {
|
||||
"protocol": "box",
|
||||
"remote_file_path": "box://utic-test-ingest-fixtures"
|
||||
"remote_file_path": "box://utic-test-ingest-fixtures",
|
||||
"file_id": "1255894255490"
|
||||
},
|
||||
"date_created": "1688874428.0",
|
||||
"date_modified": "1688874428.0"
|
||||
@ -190,7 +198,8 @@
|
||||
"version": "309546934335254463247992132065898582121",
|
||||
"record_locator": {
|
||||
"protocol": "box",
|
||||
"remote_file_path": "box://utic-test-ingest-fixtures"
|
||||
"remote_file_path": "box://utic-test-ingest-fixtures",
|
||||
"file_id": "1255894255490"
|
||||
},
|
||||
"date_created": "1688874428.0",
|
||||
"date_modified": "1688874428.0"
|
||||
@ -212,7 +221,8 @@
|
||||
"version": "309546934335254463247992132065898582121",
|
||||
"record_locator": {
|
||||
"protocol": "box",
|
||||
"remote_file_path": "box://utic-test-ingest-fixtures"
|
||||
"remote_file_path": "box://utic-test-ingest-fixtures",
|
||||
"file_id": "1255894255490"
|
||||
},
|
||||
"date_created": "1688874428.0",
|
||||
"date_modified": "1688874428.0"
|
||||
@ -234,7 +244,8 @@
|
||||
"version": "309546934335254463247992132065898582121",
|
||||
"record_locator": {
|
||||
"protocol": "box",
|
||||
"remote_file_path": "box://utic-test-ingest-fixtures"
|
||||
"remote_file_path": "box://utic-test-ingest-fixtures",
|
||||
"file_id": "1255894255490"
|
||||
},
|
||||
"date_created": "1688874428.0",
|
||||
"date_modified": "1688874428.0"
|
||||
@ -256,7 +267,8 @@
|
||||
"version": "309546934335254463247992132065898582121",
|
||||
"record_locator": {
|
||||
"protocol": "box",
|
||||
"remote_file_path": "box://utic-test-ingest-fixtures"
|
||||
"remote_file_path": "box://utic-test-ingest-fixtures",
|
||||
"file_id": "1255894255490"
|
||||
},
|
||||
"date_created": "1688874428.0",
|
||||
"date_modified": "1688874428.0"
|
||||
@ -278,7 +290,8 @@
|
||||
"version": "309546934335254463247992132065898582121",
|
||||
"record_locator": {
|
||||
"protocol": "box",
|
||||
"remote_file_path": "box://utic-test-ingest-fixtures"
|
||||
"remote_file_path": "box://utic-test-ingest-fixtures",
|
||||
"file_id": "1255894255490"
|
||||
},
|
||||
"date_created": "1688874428.0",
|
||||
"date_modified": "1688874428.0"
|
||||
|
||||
@ -14,7 +14,8 @@
|
||||
"version": "134700592086487568162605251521926324397",
|
||||
"record_locator": {
|
||||
"protocol": "dropbox",
|
||||
"remote_file_path": "dropbox://test-input/"
|
||||
"remote_file_path": "dropbox://test-input/",
|
||||
"file_id": "id:De4ZYtDd-JoAAAAAAAAACQ"
|
||||
}
|
||||
}
|
||||
}
|
||||
@ -39,7 +40,8 @@
|
||||
"version": "134700592086487568162605251521926324397",
|
||||
"record_locator": {
|
||||
"protocol": "dropbox",
|
||||
"remote_file_path": "dropbox://test-input/"
|
||||
"remote_file_path": "dropbox://test-input/",
|
||||
"file_id": "id:De4ZYtDd-JoAAAAAAAAACQ"
|
||||
}
|
||||
}
|
||||
}
|
||||
@ -64,7 +66,8 @@
|
||||
"version": "134700592086487568162605251521926324397",
|
||||
"record_locator": {
|
||||
"protocol": "dropbox",
|
||||
"remote_file_path": "dropbox://test-input/"
|
||||
"remote_file_path": "dropbox://test-input/",
|
||||
"file_id": "id:De4ZYtDd-JoAAAAAAAAACQ"
|
||||
}
|
||||
}
|
||||
}
|
||||
@ -83,7 +86,8 @@
|
||||
"version": "134700592086487568162605251521926324397",
|
||||
"record_locator": {
|
||||
"protocol": "dropbox",
|
||||
"remote_file_path": "dropbox://test-input/"
|
||||
"remote_file_path": "dropbox://test-input/",
|
||||
"file_id": "id:De4ZYtDd-JoAAAAAAAAACQ"
|
||||
}
|
||||
}
|
||||
}
|
||||
@ -102,7 +106,8 @@
|
||||
"version": "134700592086487568162605251521926324397",
|
||||
"record_locator": {
|
||||
"protocol": "dropbox",
|
||||
"remote_file_path": "dropbox://test-input/"
|
||||
"remote_file_path": "dropbox://test-input/",
|
||||
"file_id": "id:De4ZYtDd-JoAAAAAAAAACQ"
|
||||
}
|
||||
}
|
||||
}
|
||||
@ -121,7 +126,8 @@
|
||||
"version": "134700592086487568162605251521926324397",
|
||||
"record_locator": {
|
||||
"protocol": "dropbox",
|
||||
"remote_file_path": "dropbox://test-input/"
|
||||
"remote_file_path": "dropbox://test-input/",
|
||||
"file_id": "id:De4ZYtDd-JoAAAAAAAAACQ"
|
||||
}
|
||||
}
|
||||
}
|
||||
@ -140,7 +146,8 @@
|
||||
"version": "134700592086487568162605251521926324397",
|
||||
"record_locator": {
|
||||
"protocol": "dropbox",
|
||||
"remote_file_path": "dropbox://test-input/"
|
||||
"remote_file_path": "dropbox://test-input/",
|
||||
"file_id": "id:De4ZYtDd-JoAAAAAAAAACQ"
|
||||
}
|
||||
}
|
||||
}
|
||||
@ -159,7 +166,8 @@
|
||||
"version": "134700592086487568162605251521926324397",
|
||||
"record_locator": {
|
||||
"protocol": "dropbox",
|
||||
"remote_file_path": "dropbox://test-input/"
|
||||
"remote_file_path": "dropbox://test-input/",
|
||||
"file_id": "id:De4ZYtDd-JoAAAAAAAAACQ"
|
||||
}
|
||||
}
|
||||
}
|
||||
@ -178,7 +186,8 @@
|
||||
"version": "134700592086487568162605251521926324397",
|
||||
"record_locator": {
|
||||
"protocol": "dropbox",
|
||||
"remote_file_path": "dropbox://test-input/"
|
||||
"remote_file_path": "dropbox://test-input/",
|
||||
"file_id": "id:De4ZYtDd-JoAAAAAAAAACQ"
|
||||
}
|
||||
}
|
||||
}
|
||||
@ -197,7 +206,8 @@
|
||||
"version": "134700592086487568162605251521926324397",
|
||||
"record_locator": {
|
||||
"protocol": "dropbox",
|
||||
"remote_file_path": "dropbox://test-input/"
|
||||
"remote_file_path": "dropbox://test-input/",
|
||||
"file_id": "id:De4ZYtDd-JoAAAAAAAAACQ"
|
||||
}
|
||||
}
|
||||
}
|
||||
@ -216,7 +226,8 @@
|
||||
"version": "134700592086487568162605251521926324397",
|
||||
"record_locator": {
|
||||
"protocol": "dropbox",
|
||||
"remote_file_path": "dropbox://test-input/"
|
||||
"remote_file_path": "dropbox://test-input/",
|
||||
"file_id": "id:De4ZYtDd-JoAAAAAAAAACQ"
|
||||
}
|
||||
}
|
||||
}
|
||||
@ -235,7 +246,8 @@
|
||||
"version": "134700592086487568162605251521926324397",
|
||||
"record_locator": {
|
||||
"protocol": "dropbox",
|
||||
"remote_file_path": "dropbox://test-input/"
|
||||
"remote_file_path": "dropbox://test-input/",
|
||||
"file_id": "id:De4ZYtDd-JoAAAAAAAAACQ"
|
||||
}
|
||||
}
|
||||
}
|
||||
@ -254,7 +266,8 @@
|
||||
"version": "134700592086487568162605251521926324397",
|
||||
"record_locator": {
|
||||
"protocol": "dropbox",
|
||||
"remote_file_path": "dropbox://test-input/"
|
||||
"remote_file_path": "dropbox://test-input/",
|
||||
"file_id": "id:De4ZYtDd-JoAAAAAAAAACQ"
|
||||
}
|
||||
}
|
||||
}
|
||||
@ -273,7 +286,8 @@
|
||||
"version": "134700592086487568162605251521926324397",
|
||||
"record_locator": {
|
||||
"protocol": "dropbox",
|
||||
"remote_file_path": "dropbox://test-input/"
|
||||
"remote_file_path": "dropbox://test-input/",
|
||||
"file_id": "id:De4ZYtDd-JoAAAAAAAAACQ"
|
||||
}
|
||||
}
|
||||
}
|
||||
@ -293,7 +307,8 @@
|
||||
"version": "134700592086487568162605251521926324397",
|
||||
"record_locator": {
|
||||
"protocol": "dropbox",
|
||||
"remote_file_path": "dropbox://test-input/"
|
||||
"remote_file_path": "dropbox://test-input/",
|
||||
"file_id": "id:De4ZYtDd-JoAAAAAAAAACQ"
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
@ -14,7 +14,8 @@
|
||||
"version": "67356979305728150851855820427694668063",
|
||||
"record_locator": {
|
||||
"protocol": "dropbox",
|
||||
"remote_file_path": "dropbox://test-input/"
|
||||
"remote_file_path": "dropbox://test-input/",
|
||||
"file_id": "id:De4ZYtDd-JoAAAAAAAAACw"
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
@ -14,7 +14,8 @@
|
||||
"version": "145453788782335405288844961545898675998",
|
||||
"record_locator": {
|
||||
"protocol": "dropbox",
|
||||
"remote_file_path": "dropbox://test-input/"
|
||||
"remote_file_path": "dropbox://test-input/",
|
||||
"file_id": "id:De4ZYtDd-JoAAAAAAAAADQ"
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
@ -14,7 +14,8 @@
|
||||
"version": "26035320120182381452247268381589958225",
|
||||
"record_locator": {
|
||||
"protocol": "dropbox",
|
||||
"remote_file_path": "dropbox://test-input/"
|
||||
"remote_file_path": "dropbox://test-input/",
|
||||
"file_id": "id:De4ZYtDd-JoAAAAAAAAACA"
|
||||
}
|
||||
}
|
||||
}
|
||||
@ -34,7 +35,8 @@
|
||||
"version": "26035320120182381452247268381589958225",
|
||||
"record_locator": {
|
||||
"protocol": "dropbox",
|
||||
"remote_file_path": "dropbox://test-input/"
|
||||
"remote_file_path": "dropbox://test-input/",
|
||||
"file_id": "id:De4ZYtDd-JoAAAAAAAAACA"
|
||||
}
|
||||
}
|
||||
}
|
||||
@ -54,7 +56,8 @@
|
||||
"version": "26035320120182381452247268381589958225",
|
||||
"record_locator": {
|
||||
"protocol": "dropbox",
|
||||
"remote_file_path": "dropbox://test-input/"
|
||||
"remote_file_path": "dropbox://test-input/",
|
||||
"file_id": "id:De4ZYtDd-JoAAAAAAAAACA"
|
||||
}
|
||||
}
|
||||
}
|
||||
@ -74,7 +77,8 @@
|
||||
"version": "26035320120182381452247268381589958225",
|
||||
"record_locator": {
|
||||
"protocol": "dropbox",
|
||||
"remote_file_path": "dropbox://test-input/"
|
||||
"remote_file_path": "dropbox://test-input/",
|
||||
"file_id": "id:De4ZYtDd-JoAAAAAAAAACA"
|
||||
}
|
||||
}
|
||||
}
|
||||
@ -94,7 +98,8 @@
|
||||
"version": "26035320120182381452247268381589958225",
|
||||
"record_locator": {
|
||||
"protocol": "dropbox",
|
||||
"remote_file_path": "dropbox://test-input/"
|
||||
"remote_file_path": "dropbox://test-input/",
|
||||
"file_id": "id:De4ZYtDd-JoAAAAAAAAACA"
|
||||
}
|
||||
}
|
||||
}
|
||||
@ -114,7 +119,8 @@
|
||||
"version": "26035320120182381452247268381589958225",
|
||||
"record_locator": {
|
||||
"protocol": "dropbox",
|
||||
"remote_file_path": "dropbox://test-input/"
|
||||
"remote_file_path": "dropbox://test-input/",
|
||||
"file_id": "id:De4ZYtDd-JoAAAAAAAAACA"
|
||||
}
|
||||
}
|
||||
}
|
||||
@ -134,7 +140,8 @@
|
||||
"version": "26035320120182381452247268381589958225",
|
||||
"record_locator": {
|
||||
"protocol": "dropbox",
|
||||
"remote_file_path": "dropbox://test-input/"
|
||||
"remote_file_path": "dropbox://test-input/",
|
||||
"file_id": "id:De4ZYtDd-JoAAAAAAAAACA"
|
||||
}
|
||||
}
|
||||
}
|
||||
@ -154,7 +161,8 @@
|
||||
"version": "26035320120182381452247268381589958225",
|
||||
"record_locator": {
|
||||
"protocol": "dropbox",
|
||||
"remote_file_path": "dropbox://test-input/"
|
||||
"remote_file_path": "dropbox://test-input/",
|
||||
"file_id": "id:De4ZYtDd-JoAAAAAAAAACA"
|
||||
}
|
||||
}
|
||||
}
|
||||
@ -174,7 +182,8 @@
|
||||
"version": "26035320120182381452247268381589958225",
|
||||
"record_locator": {
|
||||
"protocol": "dropbox",
|
||||
"remote_file_path": "dropbox://test-input/"
|
||||
"remote_file_path": "dropbox://test-input/",
|
||||
"file_id": "id:De4ZYtDd-JoAAAAAAAAACA"
|
||||
}
|
||||
}
|
||||
}
|
||||
@ -194,7 +203,8 @@
|
||||
"version": "26035320120182381452247268381589958225",
|
||||
"record_locator": {
|
||||
"protocol": "dropbox",
|
||||
"remote_file_path": "dropbox://test-input/"
|
||||
"remote_file_path": "dropbox://test-input/",
|
||||
"file_id": "id:De4ZYtDd-JoAAAAAAAAACA"
|
||||
}
|
||||
}
|
||||
}
|
||||
@ -214,7 +224,8 @@
|
||||
"version": "26035320120182381452247268381589958225",
|
||||
"record_locator": {
|
||||
"protocol": "dropbox",
|
||||
"remote_file_path": "dropbox://test-input/"
|
||||
"remote_file_path": "dropbox://test-input/",
|
||||
"file_id": "id:De4ZYtDd-JoAAAAAAAAACA"
|
||||
}
|
||||
}
|
||||
}
|
||||
@ -234,7 +245,8 @@
|
||||
"version": "26035320120182381452247268381589958225",
|
||||
"record_locator": {
|
||||
"protocol": "dropbox",
|
||||
"remote_file_path": "dropbox://test-input/"
|
||||
"remote_file_path": "dropbox://test-input/",
|
||||
"file_id": "id:De4ZYtDd-JoAAAAAAAAACA"
|
||||
}
|
||||
}
|
||||
}
|
||||
@ -254,7 +266,8 @@
|
||||
"version": "26035320120182381452247268381589958225",
|
||||
"record_locator": {
|
||||
"protocol": "dropbox",
|
||||
"remote_file_path": "dropbox://test-input/"
|
||||
"remote_file_path": "dropbox://test-input/",
|
||||
"file_id": "id:De4ZYtDd-JoAAAAAAAAACA"
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
@ -14,7 +14,8 @@
|
||||
"version": "199523943725186047835150971481714294476",
|
||||
"record_locator": {
|
||||
"protocol": "gs",
|
||||
"remote_file_path": "gs://utic-test-ingest-fixtures/"
|
||||
"remote_file_path": "gs://utic-test-ingest-fixtures/",
|
||||
"file_id": "utic-test-ingest-fixtures/ideas-page.html/1687304971036821"
|
||||
},
|
||||
"date_created": "1687304971.038",
|
||||
"date_modified": "1687304971.038"
|
||||
|
||||
@ -13,7 +13,8 @@
|
||||
"version": "180263070579038859328651626981788275889",
|
||||
"record_locator": {
|
||||
"protocol": "gs",
|
||||
"remote_file_path": "gs://utic-test-ingest-fixtures/"
|
||||
"remote_file_path": "gs://utic-test-ingest-fixtures/",
|
||||
"file_id": "utic-test-ingest-fixtures/nested-1/fake-text.txt/1687304893301804"
|
||||
},
|
||||
"date_created": "1687304893.303",
|
||||
"date_modified": "1687304893.303"
|
||||
@ -34,7 +35,8 @@
|
||||
"version": "180263070579038859328651626981788275889",
|
||||
"record_locator": {
|
||||
"protocol": "gs",
|
||||
"remote_file_path": "gs://utic-test-ingest-fixtures/"
|
||||
"remote_file_path": "gs://utic-test-ingest-fixtures/",
|
||||
"file_id": "utic-test-ingest-fixtures/nested-1/fake-text.txt/1687304893301804"
|
||||
},
|
||||
"date_created": "1687304893.303",
|
||||
"date_modified": "1687304893.303"
|
||||
@ -55,7 +57,8 @@
|
||||
"version": "180263070579038859328651626981788275889",
|
||||
"record_locator": {
|
||||
"protocol": "gs",
|
||||
"remote_file_path": "gs://utic-test-ingest-fixtures/"
|
||||
"remote_file_path": "gs://utic-test-ingest-fixtures/",
|
||||
"file_id": "utic-test-ingest-fixtures/nested-1/fake-text.txt/1687304893301804"
|
||||
},
|
||||
"date_created": "1687304893.303",
|
||||
"date_modified": "1687304893.303"
|
||||
@ -76,7 +79,8 @@
|
||||
"version": "180263070579038859328651626981788275889",
|
||||
"record_locator": {
|
||||
"protocol": "gs",
|
||||
"remote_file_path": "gs://utic-test-ingest-fixtures/"
|
||||
"remote_file_path": "gs://utic-test-ingest-fixtures/",
|
||||
"file_id": "utic-test-ingest-fixtures/nested-1/fake-text.txt/1687304893301804"
|
||||
},
|
||||
"date_created": "1687304893.303",
|
||||
"date_modified": "1687304893.303"
|
||||
@ -97,7 +101,8 @@
|
||||
"version": "180263070579038859328651626981788275889",
|
||||
"record_locator": {
|
||||
"protocol": "gs",
|
||||
"remote_file_path": "gs://utic-test-ingest-fixtures/"
|
||||
"remote_file_path": "gs://utic-test-ingest-fixtures/",
|
||||
"file_id": "utic-test-ingest-fixtures/nested-1/fake-text.txt/1687304893301804"
|
||||
},
|
||||
"date_created": "1687304893.303",
|
||||
"date_modified": "1687304893.303"
|
||||
@ -118,7 +123,8 @@
|
||||
"version": "180263070579038859328651626981788275889",
|
||||
"record_locator": {
|
||||
"protocol": "gs",
|
||||
"remote_file_path": "gs://utic-test-ingest-fixtures/"
|
||||
"remote_file_path": "gs://utic-test-ingest-fixtures/",
|
||||
"file_id": "utic-test-ingest-fixtures/nested-1/fake-text.txt/1687304893301804"
|
||||
},
|
||||
"date_created": "1687304893.303",
|
||||
"date_modified": "1687304893.303"
|
||||
|
||||
@ -14,7 +14,8 @@
|
||||
"version": "310890354306462681752199911957569001015",
|
||||
"record_locator": {
|
||||
"protocol": "gs",
|
||||
"remote_file_path": "gs://utic-test-ingest-fixtures/"
|
||||
"remote_file_path": "gs://utic-test-ingest-fixtures/",
|
||||
"file_id": "utic-test-ingest-fixtures/nested-1/nested/ideas-page.html/1687304893748677"
|
||||
},
|
||||
"date_created": "1687304893.75",
|
||||
"date_modified": "1687304893.75"
|
||||
|
||||
@ -13,7 +13,8 @@
|
||||
"version": "198731266903969902154134165613731741332",
|
||||
"record_locator": {
|
||||
"protocol": "gs",
|
||||
"remote_file_path": "gs://utic-test-ingest-fixtures/"
|
||||
"remote_file_path": "gs://utic-test-ingest-fixtures/",
|
||||
"file_id": "utic-test-ingest-fixtures/nested-2/fake-text.txt/1687304904189941"
|
||||
},
|
||||
"date_created": "1687304904.192",
|
||||
"date_modified": "1687304904.192"
|
||||
@ -34,7 +35,8 @@
|
||||
"version": "198731266903969902154134165613731741332",
|
||||
"record_locator": {
|
||||
"protocol": "gs",
|
||||
"remote_file_path": "gs://utic-test-ingest-fixtures/"
|
||||
"remote_file_path": "gs://utic-test-ingest-fixtures/",
|
||||
"file_id": "utic-test-ingest-fixtures/nested-2/fake-text.txt/1687304904189941"
|
||||
},
|
||||
"date_created": "1687304904.192",
|
||||
"date_modified": "1687304904.192"
|
||||
@ -55,7 +57,8 @@
|
||||
"version": "198731266903969902154134165613731741332",
|
||||
"record_locator": {
|
||||
"protocol": "gs",
|
||||
"remote_file_path": "gs://utic-test-ingest-fixtures/"
|
||||
"remote_file_path": "gs://utic-test-ingest-fixtures/",
|
||||
"file_id": "utic-test-ingest-fixtures/nested-2/fake-text.txt/1687304904189941"
|
||||
},
|
||||
"date_created": "1687304904.192",
|
||||
"date_modified": "1687304904.192"
|
||||
@ -76,7 +79,8 @@
|
||||
"version": "198731266903969902154134165613731741332",
|
||||
"record_locator": {
|
||||
"protocol": "gs",
|
||||
"remote_file_path": "gs://utic-test-ingest-fixtures/"
|
||||
"remote_file_path": "gs://utic-test-ingest-fixtures/",
|
||||
"file_id": "utic-test-ingest-fixtures/nested-2/fake-text.txt/1687304904189941"
|
||||
},
|
||||
"date_created": "1687304904.192",
|
||||
"date_modified": "1687304904.192"
|
||||
@ -97,7 +101,8 @@
|
||||
"version": "198731266903969902154134165613731741332",
|
||||
"record_locator": {
|
||||
"protocol": "gs",
|
||||
"remote_file_path": "gs://utic-test-ingest-fixtures/"
|
||||
"remote_file_path": "gs://utic-test-ingest-fixtures/",
|
||||
"file_id": "utic-test-ingest-fixtures/nested-2/fake-text.txt/1687304904189941"
|
||||
},
|
||||
"date_created": "1687304904.192",
|
||||
"date_modified": "1687304904.192"
|
||||
@ -118,7 +123,8 @@
|
||||
"version": "198731266903969902154134165613731741332",
|
||||
"record_locator": {
|
||||
"protocol": "gs",
|
||||
"remote_file_path": "gs://utic-test-ingest-fixtures/"
|
||||
"remote_file_path": "gs://utic-test-ingest-fixtures/",
|
||||
"file_id": "utic-test-ingest-fixtures/nested-2/fake-text.txt/1687304904189941"
|
||||
},
|
||||
"date_created": "1687304904.192",
|
||||
"date_modified": "1687304904.192"
|
||||
|
||||
@ -14,7 +14,8 @@
|
||||
"version": "113813498010717860141768546590661839404",
|
||||
"record_locator": {
|
||||
"protocol": "gs",
|
||||
"remote_file_path": "gs://utic-test-ingest-fixtures/"
|
||||
"remote_file_path": "gs://utic-test-ingest-fixtures/",
|
||||
"file_id": "utic-test-ingest-fixtures/nested-2/nested/ideas-page.html/1687304904584421"
|
||||
},
|
||||
"date_created": "1687304904.586",
|
||||
"date_modified": "1687304904.586"
|
||||
|
||||
@ -15,7 +15,8 @@
|
||||
"version": "25646232132200560657189097157576319365",
|
||||
"record_locator": {
|
||||
"protocol": "gs",
|
||||
"remote_file_path": "gs://utic-test-ingest-fixtures/"
|
||||
"remote_file_path": "gs://utic-test-ingest-fixtures/",
|
||||
"file_id": "utic-test-ingest-fixtures/nested-2/stanley-cups.xlsx/1687304904970987"
|
||||
},
|
||||
"date_created": "1687304904.973",
|
||||
"date_modified": "1687304904.973"
|
||||
@ -39,7 +40,8 @@
|
||||
"version": "25646232132200560657189097157576319365",
|
||||
"record_locator": {
|
||||
"protocol": "gs",
|
||||
"remote_file_path": "gs://utic-test-ingest-fixtures/"
|
||||
"remote_file_path": "gs://utic-test-ingest-fixtures/",
|
||||
"file_id": "utic-test-ingest-fixtures/nested-2/stanley-cups.xlsx/1687304904970987"
|
||||
},
|
||||
"date_created": "1687304904.973",
|
||||
"date_modified": "1687304904.973"
|
||||
@ -62,7 +64,8 @@
|
||||
"version": "25646232132200560657189097157576319365",
|
||||
"record_locator": {
|
||||
"protocol": "gs",
|
||||
"remote_file_path": "gs://utic-test-ingest-fixtures/"
|
||||
"remote_file_path": "gs://utic-test-ingest-fixtures/",
|
||||
"file_id": "utic-test-ingest-fixtures/nested-2/stanley-cups.xlsx/1687304904970987"
|
||||
},
|
||||
"date_created": "1687304904.973",
|
||||
"date_modified": "1687304904.973"
|
||||
@ -86,7 +89,8 @@
|
||||
"version": "25646232132200560657189097157576319365",
|
||||
"record_locator": {
|
||||
"protocol": "gs",
|
||||
"remote_file_path": "gs://utic-test-ingest-fixtures/"
|
||||
"remote_file_path": "gs://utic-test-ingest-fixtures/",
|
||||
"file_id": "utic-test-ingest-fixtures/nested-2/stanley-cups.xlsx/1687304904970987"
|
||||
},
|
||||
"date_created": "1687304904.973",
|
||||
"date_modified": "1687304904.973"
|
||||
|
||||
@ -1 +1 @@
|
||||
__version__ = "0.15.0-dev15" # pragma: no cover
|
||||
__version__ = "0.15.0-dev16" # pragma: no cover
|
||||
|
||||
@ -187,6 +187,9 @@ class FsspecIndexer(Indexer):
|
||||
"protocol": self.index_config.protocol,
|
||||
"remote_file_path": self.index_config.remote_url,
|
||||
}
|
||||
file_stat = self.fs.stat(path=path)
|
||||
if file_id := file_stat.get("id"):
|
||||
record_locator["file_id"] = file_id
|
||||
if metadata:
|
||||
record_locator["metadata"] = metadata
|
||||
return DataSourceMetadata(
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user