feat: save file id for all fsspec connectors if present (#3405)

### Description

If the id value exists in the stats response from fsspec, save it as a
`file_id` field in the metadata being persisted on each element.

---------

Co-authored-by: ryannikolaidis <1208590+ryannikolaidis@users.noreply.github.com>
Co-authored-by: rbiseck3 <rbiseck3@users.noreply.github.com>
This commit is contained in:
Roman Isecke 2024-07-19 09:30:21 -04:00 committed by GitHub
parent 0eb461acc2
commit 1df7908f03
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194
17 changed files with 163 additions and 81 deletions

View File

@ -1,4 +1,4 @@
## 0.15.0-dev15
## 0.15.0-dev16
### Enhancements

View File

@ -14,7 +14,8 @@
"version": "83125548004193369404829885052395764226",
"record_locator": {
"protocol": "box",
"remote_file_path": "box://utic-test-ingest-fixtures"
"remote_file_path": "box://utic-test-ingest-fixtures",
"file_id": "1255888824139"
},
"date_created": "1688874451.0",
"date_modified": "1688874451.0"
@ -41,7 +42,8 @@
"version": "83125548004193369404829885052395764226",
"record_locator": {
"protocol": "box",
"remote_file_path": "box://utic-test-ingest-fixtures"
"remote_file_path": "box://utic-test-ingest-fixtures",
"file_id": "1255888824139"
},
"date_created": "1688874451.0",
"date_modified": "1688874451.0"
@ -68,7 +70,8 @@
"version": "83125548004193369404829885052395764226",
"record_locator": {
"protocol": "box",
"remote_file_path": "box://utic-test-ingest-fixtures"
"remote_file_path": "box://utic-test-ingest-fixtures",
"file_id": "1255888824139"
},
"date_created": "1688874451.0",
"date_modified": "1688874451.0"
@ -89,7 +92,8 @@
"version": "83125548004193369404829885052395764226",
"record_locator": {
"protocol": "box",
"remote_file_path": "box://utic-test-ingest-fixtures"
"remote_file_path": "box://utic-test-ingest-fixtures",
"file_id": "1255888824139"
},
"date_created": "1688874451.0",
"date_modified": "1688874451.0"
@ -110,7 +114,8 @@
"version": "83125548004193369404829885052395764226",
"record_locator": {
"protocol": "box",
"remote_file_path": "box://utic-test-ingest-fixtures"
"remote_file_path": "box://utic-test-ingest-fixtures",
"file_id": "1255888824139"
},
"date_created": "1688874451.0",
"date_modified": "1688874451.0"
@ -131,7 +136,8 @@
"version": "83125548004193369404829885052395764226",
"record_locator": {
"protocol": "box",
"remote_file_path": "box://utic-test-ingest-fixtures"
"remote_file_path": "box://utic-test-ingest-fixtures",
"file_id": "1255888824139"
},
"date_created": "1688874451.0",
"date_modified": "1688874451.0"
@ -152,7 +158,8 @@
"version": "83125548004193369404829885052395764226",
"record_locator": {
"protocol": "box",
"remote_file_path": "box://utic-test-ingest-fixtures"
"remote_file_path": "box://utic-test-ingest-fixtures",
"file_id": "1255888824139"
},
"date_created": "1688874451.0",
"date_modified": "1688874451.0"
@ -173,7 +180,8 @@
"version": "83125548004193369404829885052395764226",
"record_locator": {
"protocol": "box",
"remote_file_path": "box://utic-test-ingest-fixtures"
"remote_file_path": "box://utic-test-ingest-fixtures",
"file_id": "1255888824139"
},
"date_created": "1688874451.0",
"date_modified": "1688874451.0"
@ -194,7 +202,8 @@
"version": "83125548004193369404829885052395764226",
"record_locator": {
"protocol": "box",
"remote_file_path": "box://utic-test-ingest-fixtures"
"remote_file_path": "box://utic-test-ingest-fixtures",
"file_id": "1255888824139"
},
"date_created": "1688874451.0",
"date_modified": "1688874451.0"
@ -215,7 +224,8 @@
"version": "83125548004193369404829885052395764226",
"record_locator": {
"protocol": "box",
"remote_file_path": "box://utic-test-ingest-fixtures"
"remote_file_path": "box://utic-test-ingest-fixtures",
"file_id": "1255888824139"
},
"date_created": "1688874451.0",
"date_modified": "1688874451.0"
@ -236,7 +246,8 @@
"version": "83125548004193369404829885052395764226",
"record_locator": {
"protocol": "box",
"remote_file_path": "box://utic-test-ingest-fixtures"
"remote_file_path": "box://utic-test-ingest-fixtures",
"file_id": "1255888824139"
},
"date_created": "1688874451.0",
"date_modified": "1688874451.0"
@ -257,7 +268,8 @@
"version": "83125548004193369404829885052395764226",
"record_locator": {
"protocol": "box",
"remote_file_path": "box://utic-test-ingest-fixtures"
"remote_file_path": "box://utic-test-ingest-fixtures",
"file_id": "1255888824139"
},
"date_created": "1688874451.0",
"date_modified": "1688874451.0"
@ -278,7 +290,8 @@
"version": "83125548004193369404829885052395764226",
"record_locator": {
"protocol": "box",
"remote_file_path": "box://utic-test-ingest-fixtures"
"remote_file_path": "box://utic-test-ingest-fixtures",
"file_id": "1255888824139"
},
"date_created": "1688874451.0",
"date_modified": "1688874451.0"
@ -299,7 +312,8 @@
"version": "83125548004193369404829885052395764226",
"record_locator": {
"protocol": "box",
"remote_file_path": "box://utic-test-ingest-fixtures"
"remote_file_path": "box://utic-test-ingest-fixtures",
"file_id": "1255888824139"
},
"date_created": "1688874451.0",
"date_modified": "1688874451.0"
@ -321,7 +335,8 @@
"version": "83125548004193369404829885052395764226",
"record_locator": {
"protocol": "box",
"remote_file_path": "box://utic-test-ingest-fixtures"
"remote_file_path": "box://utic-test-ingest-fixtures",
"file_id": "1255888824139"
},
"date_created": "1688874451.0",
"date_modified": "1688874451.0"

View File

@ -14,7 +14,8 @@
"version": "77943175838335685751163845636763163681",
"record_locator": {
"protocol": "box",
"remote_file_path": "box://utic-test-ingest-fixtures"
"remote_file_path": "box://utic-test-ingest-fixtures",
"file_id": "1255892530552"
},
"date_created": "1688874401.0",
"date_modified": "1688874401.0"

View File

@ -14,7 +14,8 @@
"version": "293680985726204769765169474511274942733",
"record_locator": {
"protocol": "box",
"remote_file_path": "box://utic-test-ingest-fixtures"
"remote_file_path": "box://utic-test-ingest-fixtures",
"file_id": "1255884723846"
},
"date_created": "1688874389.0",
"date_modified": "1688874389.0"

View File

@ -14,7 +14,8 @@
"version": "309546934335254463247992132065898582121",
"record_locator": {
"protocol": "box",
"remote_file_path": "box://utic-test-ingest-fixtures"
"remote_file_path": "box://utic-test-ingest-fixtures",
"file_id": "1255894255490"
},
"date_created": "1688874428.0",
"date_modified": "1688874428.0"
@ -36,7 +37,8 @@
"version": "309546934335254463247992132065898582121",
"record_locator": {
"protocol": "box",
"remote_file_path": "box://utic-test-ingest-fixtures"
"remote_file_path": "box://utic-test-ingest-fixtures",
"file_id": "1255894255490"
},
"date_created": "1688874428.0",
"date_modified": "1688874428.0"
@ -58,7 +60,8 @@
"version": "309546934335254463247992132065898582121",
"record_locator": {
"protocol": "box",
"remote_file_path": "box://utic-test-ingest-fixtures"
"remote_file_path": "box://utic-test-ingest-fixtures",
"file_id": "1255894255490"
},
"date_created": "1688874428.0",
"date_modified": "1688874428.0"
@ -80,7 +83,8 @@
"version": "309546934335254463247992132065898582121",
"record_locator": {
"protocol": "box",
"remote_file_path": "box://utic-test-ingest-fixtures"
"remote_file_path": "box://utic-test-ingest-fixtures",
"file_id": "1255894255490"
},
"date_created": "1688874428.0",
"date_modified": "1688874428.0"
@ -102,7 +106,8 @@
"version": "309546934335254463247992132065898582121",
"record_locator": {
"protocol": "box",
"remote_file_path": "box://utic-test-ingest-fixtures"
"remote_file_path": "box://utic-test-ingest-fixtures",
"file_id": "1255894255490"
},
"date_created": "1688874428.0",
"date_modified": "1688874428.0"
@ -124,7 +129,8 @@
"version": "309546934335254463247992132065898582121",
"record_locator": {
"protocol": "box",
"remote_file_path": "box://utic-test-ingest-fixtures"
"remote_file_path": "box://utic-test-ingest-fixtures",
"file_id": "1255894255490"
},
"date_created": "1688874428.0",
"date_modified": "1688874428.0"
@ -146,7 +152,8 @@
"version": "309546934335254463247992132065898582121",
"record_locator": {
"protocol": "box",
"remote_file_path": "box://utic-test-ingest-fixtures"
"remote_file_path": "box://utic-test-ingest-fixtures",
"file_id": "1255894255490"
},
"date_created": "1688874428.0",
"date_modified": "1688874428.0"
@ -168,7 +175,8 @@
"version": "309546934335254463247992132065898582121",
"record_locator": {
"protocol": "box",
"remote_file_path": "box://utic-test-ingest-fixtures"
"remote_file_path": "box://utic-test-ingest-fixtures",
"file_id": "1255894255490"
},
"date_created": "1688874428.0",
"date_modified": "1688874428.0"
@ -190,7 +198,8 @@
"version": "309546934335254463247992132065898582121",
"record_locator": {
"protocol": "box",
"remote_file_path": "box://utic-test-ingest-fixtures"
"remote_file_path": "box://utic-test-ingest-fixtures",
"file_id": "1255894255490"
},
"date_created": "1688874428.0",
"date_modified": "1688874428.0"
@ -212,7 +221,8 @@
"version": "309546934335254463247992132065898582121",
"record_locator": {
"protocol": "box",
"remote_file_path": "box://utic-test-ingest-fixtures"
"remote_file_path": "box://utic-test-ingest-fixtures",
"file_id": "1255894255490"
},
"date_created": "1688874428.0",
"date_modified": "1688874428.0"
@ -234,7 +244,8 @@
"version": "309546934335254463247992132065898582121",
"record_locator": {
"protocol": "box",
"remote_file_path": "box://utic-test-ingest-fixtures"
"remote_file_path": "box://utic-test-ingest-fixtures",
"file_id": "1255894255490"
},
"date_created": "1688874428.0",
"date_modified": "1688874428.0"
@ -256,7 +267,8 @@
"version": "309546934335254463247992132065898582121",
"record_locator": {
"protocol": "box",
"remote_file_path": "box://utic-test-ingest-fixtures"
"remote_file_path": "box://utic-test-ingest-fixtures",
"file_id": "1255894255490"
},
"date_created": "1688874428.0",
"date_modified": "1688874428.0"
@ -278,7 +290,8 @@
"version": "309546934335254463247992132065898582121",
"record_locator": {
"protocol": "box",
"remote_file_path": "box://utic-test-ingest-fixtures"
"remote_file_path": "box://utic-test-ingest-fixtures",
"file_id": "1255894255490"
},
"date_created": "1688874428.0",
"date_modified": "1688874428.0"

View File

@ -14,7 +14,8 @@
"version": "134700592086487568162605251521926324397",
"record_locator": {
"protocol": "dropbox",
"remote_file_path": "dropbox://test-input/"
"remote_file_path": "dropbox://test-input/",
"file_id": "id:De4ZYtDd-JoAAAAAAAAACQ"
}
}
}
@ -39,7 +40,8 @@
"version": "134700592086487568162605251521926324397",
"record_locator": {
"protocol": "dropbox",
"remote_file_path": "dropbox://test-input/"
"remote_file_path": "dropbox://test-input/",
"file_id": "id:De4ZYtDd-JoAAAAAAAAACQ"
}
}
}
@ -64,7 +66,8 @@
"version": "134700592086487568162605251521926324397",
"record_locator": {
"protocol": "dropbox",
"remote_file_path": "dropbox://test-input/"
"remote_file_path": "dropbox://test-input/",
"file_id": "id:De4ZYtDd-JoAAAAAAAAACQ"
}
}
}
@ -83,7 +86,8 @@
"version": "134700592086487568162605251521926324397",
"record_locator": {
"protocol": "dropbox",
"remote_file_path": "dropbox://test-input/"
"remote_file_path": "dropbox://test-input/",
"file_id": "id:De4ZYtDd-JoAAAAAAAAACQ"
}
}
}
@ -102,7 +106,8 @@
"version": "134700592086487568162605251521926324397",
"record_locator": {
"protocol": "dropbox",
"remote_file_path": "dropbox://test-input/"
"remote_file_path": "dropbox://test-input/",
"file_id": "id:De4ZYtDd-JoAAAAAAAAACQ"
}
}
}
@ -121,7 +126,8 @@
"version": "134700592086487568162605251521926324397",
"record_locator": {
"protocol": "dropbox",
"remote_file_path": "dropbox://test-input/"
"remote_file_path": "dropbox://test-input/",
"file_id": "id:De4ZYtDd-JoAAAAAAAAACQ"
}
}
}
@ -140,7 +146,8 @@
"version": "134700592086487568162605251521926324397",
"record_locator": {
"protocol": "dropbox",
"remote_file_path": "dropbox://test-input/"
"remote_file_path": "dropbox://test-input/",
"file_id": "id:De4ZYtDd-JoAAAAAAAAACQ"
}
}
}
@ -159,7 +166,8 @@
"version": "134700592086487568162605251521926324397",
"record_locator": {
"protocol": "dropbox",
"remote_file_path": "dropbox://test-input/"
"remote_file_path": "dropbox://test-input/",
"file_id": "id:De4ZYtDd-JoAAAAAAAAACQ"
}
}
}
@ -178,7 +186,8 @@
"version": "134700592086487568162605251521926324397",
"record_locator": {
"protocol": "dropbox",
"remote_file_path": "dropbox://test-input/"
"remote_file_path": "dropbox://test-input/",
"file_id": "id:De4ZYtDd-JoAAAAAAAAACQ"
}
}
}
@ -197,7 +206,8 @@
"version": "134700592086487568162605251521926324397",
"record_locator": {
"protocol": "dropbox",
"remote_file_path": "dropbox://test-input/"
"remote_file_path": "dropbox://test-input/",
"file_id": "id:De4ZYtDd-JoAAAAAAAAACQ"
}
}
}
@ -216,7 +226,8 @@
"version": "134700592086487568162605251521926324397",
"record_locator": {
"protocol": "dropbox",
"remote_file_path": "dropbox://test-input/"
"remote_file_path": "dropbox://test-input/",
"file_id": "id:De4ZYtDd-JoAAAAAAAAACQ"
}
}
}
@ -235,7 +246,8 @@
"version": "134700592086487568162605251521926324397",
"record_locator": {
"protocol": "dropbox",
"remote_file_path": "dropbox://test-input/"
"remote_file_path": "dropbox://test-input/",
"file_id": "id:De4ZYtDd-JoAAAAAAAAACQ"
}
}
}
@ -254,7 +266,8 @@
"version": "134700592086487568162605251521926324397",
"record_locator": {
"protocol": "dropbox",
"remote_file_path": "dropbox://test-input/"
"remote_file_path": "dropbox://test-input/",
"file_id": "id:De4ZYtDd-JoAAAAAAAAACQ"
}
}
}
@ -273,7 +286,8 @@
"version": "134700592086487568162605251521926324397",
"record_locator": {
"protocol": "dropbox",
"remote_file_path": "dropbox://test-input/"
"remote_file_path": "dropbox://test-input/",
"file_id": "id:De4ZYtDd-JoAAAAAAAAACQ"
}
}
}
@ -293,7 +307,8 @@
"version": "134700592086487568162605251521926324397",
"record_locator": {
"protocol": "dropbox",
"remote_file_path": "dropbox://test-input/"
"remote_file_path": "dropbox://test-input/",
"file_id": "id:De4ZYtDd-JoAAAAAAAAACQ"
}
}
}

View File

@ -14,7 +14,8 @@
"version": "67356979305728150851855820427694668063",
"record_locator": {
"protocol": "dropbox",
"remote_file_path": "dropbox://test-input/"
"remote_file_path": "dropbox://test-input/",
"file_id": "id:De4ZYtDd-JoAAAAAAAAACw"
}
}
}

View File

@ -14,7 +14,8 @@
"version": "145453788782335405288844961545898675998",
"record_locator": {
"protocol": "dropbox",
"remote_file_path": "dropbox://test-input/"
"remote_file_path": "dropbox://test-input/",
"file_id": "id:De4ZYtDd-JoAAAAAAAAADQ"
}
}
}

View File

@ -14,7 +14,8 @@
"version": "26035320120182381452247268381589958225",
"record_locator": {
"protocol": "dropbox",
"remote_file_path": "dropbox://test-input/"
"remote_file_path": "dropbox://test-input/",
"file_id": "id:De4ZYtDd-JoAAAAAAAAACA"
}
}
}
@ -34,7 +35,8 @@
"version": "26035320120182381452247268381589958225",
"record_locator": {
"protocol": "dropbox",
"remote_file_path": "dropbox://test-input/"
"remote_file_path": "dropbox://test-input/",
"file_id": "id:De4ZYtDd-JoAAAAAAAAACA"
}
}
}
@ -54,7 +56,8 @@
"version": "26035320120182381452247268381589958225",
"record_locator": {
"protocol": "dropbox",
"remote_file_path": "dropbox://test-input/"
"remote_file_path": "dropbox://test-input/",
"file_id": "id:De4ZYtDd-JoAAAAAAAAACA"
}
}
}
@ -74,7 +77,8 @@
"version": "26035320120182381452247268381589958225",
"record_locator": {
"protocol": "dropbox",
"remote_file_path": "dropbox://test-input/"
"remote_file_path": "dropbox://test-input/",
"file_id": "id:De4ZYtDd-JoAAAAAAAAACA"
}
}
}
@ -94,7 +98,8 @@
"version": "26035320120182381452247268381589958225",
"record_locator": {
"protocol": "dropbox",
"remote_file_path": "dropbox://test-input/"
"remote_file_path": "dropbox://test-input/",
"file_id": "id:De4ZYtDd-JoAAAAAAAAACA"
}
}
}
@ -114,7 +119,8 @@
"version": "26035320120182381452247268381589958225",
"record_locator": {
"protocol": "dropbox",
"remote_file_path": "dropbox://test-input/"
"remote_file_path": "dropbox://test-input/",
"file_id": "id:De4ZYtDd-JoAAAAAAAAACA"
}
}
}
@ -134,7 +140,8 @@
"version": "26035320120182381452247268381589958225",
"record_locator": {
"protocol": "dropbox",
"remote_file_path": "dropbox://test-input/"
"remote_file_path": "dropbox://test-input/",
"file_id": "id:De4ZYtDd-JoAAAAAAAAACA"
}
}
}
@ -154,7 +161,8 @@
"version": "26035320120182381452247268381589958225",
"record_locator": {
"protocol": "dropbox",
"remote_file_path": "dropbox://test-input/"
"remote_file_path": "dropbox://test-input/",
"file_id": "id:De4ZYtDd-JoAAAAAAAAACA"
}
}
}
@ -174,7 +182,8 @@
"version": "26035320120182381452247268381589958225",
"record_locator": {
"protocol": "dropbox",
"remote_file_path": "dropbox://test-input/"
"remote_file_path": "dropbox://test-input/",
"file_id": "id:De4ZYtDd-JoAAAAAAAAACA"
}
}
}
@ -194,7 +203,8 @@
"version": "26035320120182381452247268381589958225",
"record_locator": {
"protocol": "dropbox",
"remote_file_path": "dropbox://test-input/"
"remote_file_path": "dropbox://test-input/",
"file_id": "id:De4ZYtDd-JoAAAAAAAAACA"
}
}
}
@ -214,7 +224,8 @@
"version": "26035320120182381452247268381589958225",
"record_locator": {
"protocol": "dropbox",
"remote_file_path": "dropbox://test-input/"
"remote_file_path": "dropbox://test-input/",
"file_id": "id:De4ZYtDd-JoAAAAAAAAACA"
}
}
}
@ -234,7 +245,8 @@
"version": "26035320120182381452247268381589958225",
"record_locator": {
"protocol": "dropbox",
"remote_file_path": "dropbox://test-input/"
"remote_file_path": "dropbox://test-input/",
"file_id": "id:De4ZYtDd-JoAAAAAAAAACA"
}
}
}
@ -254,7 +266,8 @@
"version": "26035320120182381452247268381589958225",
"record_locator": {
"protocol": "dropbox",
"remote_file_path": "dropbox://test-input/"
"remote_file_path": "dropbox://test-input/",
"file_id": "id:De4ZYtDd-JoAAAAAAAAACA"
}
}
}

View File

@ -14,7 +14,8 @@
"version": "199523943725186047835150971481714294476",
"record_locator": {
"protocol": "gs",
"remote_file_path": "gs://utic-test-ingest-fixtures/"
"remote_file_path": "gs://utic-test-ingest-fixtures/",
"file_id": "utic-test-ingest-fixtures/ideas-page.html/1687304971036821"
},
"date_created": "1687304971.038",
"date_modified": "1687304971.038"

View File

@ -13,7 +13,8 @@
"version": "180263070579038859328651626981788275889",
"record_locator": {
"protocol": "gs",
"remote_file_path": "gs://utic-test-ingest-fixtures/"
"remote_file_path": "gs://utic-test-ingest-fixtures/",
"file_id": "utic-test-ingest-fixtures/nested-1/fake-text.txt/1687304893301804"
},
"date_created": "1687304893.303",
"date_modified": "1687304893.303"
@ -34,7 +35,8 @@
"version": "180263070579038859328651626981788275889",
"record_locator": {
"protocol": "gs",
"remote_file_path": "gs://utic-test-ingest-fixtures/"
"remote_file_path": "gs://utic-test-ingest-fixtures/",
"file_id": "utic-test-ingest-fixtures/nested-1/fake-text.txt/1687304893301804"
},
"date_created": "1687304893.303",
"date_modified": "1687304893.303"
@ -55,7 +57,8 @@
"version": "180263070579038859328651626981788275889",
"record_locator": {
"protocol": "gs",
"remote_file_path": "gs://utic-test-ingest-fixtures/"
"remote_file_path": "gs://utic-test-ingest-fixtures/",
"file_id": "utic-test-ingest-fixtures/nested-1/fake-text.txt/1687304893301804"
},
"date_created": "1687304893.303",
"date_modified": "1687304893.303"
@ -76,7 +79,8 @@
"version": "180263070579038859328651626981788275889",
"record_locator": {
"protocol": "gs",
"remote_file_path": "gs://utic-test-ingest-fixtures/"
"remote_file_path": "gs://utic-test-ingest-fixtures/",
"file_id": "utic-test-ingest-fixtures/nested-1/fake-text.txt/1687304893301804"
},
"date_created": "1687304893.303",
"date_modified": "1687304893.303"
@ -97,7 +101,8 @@
"version": "180263070579038859328651626981788275889",
"record_locator": {
"protocol": "gs",
"remote_file_path": "gs://utic-test-ingest-fixtures/"
"remote_file_path": "gs://utic-test-ingest-fixtures/",
"file_id": "utic-test-ingest-fixtures/nested-1/fake-text.txt/1687304893301804"
},
"date_created": "1687304893.303",
"date_modified": "1687304893.303"
@ -118,7 +123,8 @@
"version": "180263070579038859328651626981788275889",
"record_locator": {
"protocol": "gs",
"remote_file_path": "gs://utic-test-ingest-fixtures/"
"remote_file_path": "gs://utic-test-ingest-fixtures/",
"file_id": "utic-test-ingest-fixtures/nested-1/fake-text.txt/1687304893301804"
},
"date_created": "1687304893.303",
"date_modified": "1687304893.303"

View File

@ -14,7 +14,8 @@
"version": "310890354306462681752199911957569001015",
"record_locator": {
"protocol": "gs",
"remote_file_path": "gs://utic-test-ingest-fixtures/"
"remote_file_path": "gs://utic-test-ingest-fixtures/",
"file_id": "utic-test-ingest-fixtures/nested-1/nested/ideas-page.html/1687304893748677"
},
"date_created": "1687304893.75",
"date_modified": "1687304893.75"

View File

@ -13,7 +13,8 @@
"version": "198731266903969902154134165613731741332",
"record_locator": {
"protocol": "gs",
"remote_file_path": "gs://utic-test-ingest-fixtures/"
"remote_file_path": "gs://utic-test-ingest-fixtures/",
"file_id": "utic-test-ingest-fixtures/nested-2/fake-text.txt/1687304904189941"
},
"date_created": "1687304904.192",
"date_modified": "1687304904.192"
@ -34,7 +35,8 @@
"version": "198731266903969902154134165613731741332",
"record_locator": {
"protocol": "gs",
"remote_file_path": "gs://utic-test-ingest-fixtures/"
"remote_file_path": "gs://utic-test-ingest-fixtures/",
"file_id": "utic-test-ingest-fixtures/nested-2/fake-text.txt/1687304904189941"
},
"date_created": "1687304904.192",
"date_modified": "1687304904.192"
@ -55,7 +57,8 @@
"version": "198731266903969902154134165613731741332",
"record_locator": {
"protocol": "gs",
"remote_file_path": "gs://utic-test-ingest-fixtures/"
"remote_file_path": "gs://utic-test-ingest-fixtures/",
"file_id": "utic-test-ingest-fixtures/nested-2/fake-text.txt/1687304904189941"
},
"date_created": "1687304904.192",
"date_modified": "1687304904.192"
@ -76,7 +79,8 @@
"version": "198731266903969902154134165613731741332",
"record_locator": {
"protocol": "gs",
"remote_file_path": "gs://utic-test-ingest-fixtures/"
"remote_file_path": "gs://utic-test-ingest-fixtures/",
"file_id": "utic-test-ingest-fixtures/nested-2/fake-text.txt/1687304904189941"
},
"date_created": "1687304904.192",
"date_modified": "1687304904.192"
@ -97,7 +101,8 @@
"version": "198731266903969902154134165613731741332",
"record_locator": {
"protocol": "gs",
"remote_file_path": "gs://utic-test-ingest-fixtures/"
"remote_file_path": "gs://utic-test-ingest-fixtures/",
"file_id": "utic-test-ingest-fixtures/nested-2/fake-text.txt/1687304904189941"
},
"date_created": "1687304904.192",
"date_modified": "1687304904.192"
@ -118,7 +123,8 @@
"version": "198731266903969902154134165613731741332",
"record_locator": {
"protocol": "gs",
"remote_file_path": "gs://utic-test-ingest-fixtures/"
"remote_file_path": "gs://utic-test-ingest-fixtures/",
"file_id": "utic-test-ingest-fixtures/nested-2/fake-text.txt/1687304904189941"
},
"date_created": "1687304904.192",
"date_modified": "1687304904.192"

View File

@ -14,7 +14,8 @@
"version": "113813498010717860141768546590661839404",
"record_locator": {
"protocol": "gs",
"remote_file_path": "gs://utic-test-ingest-fixtures/"
"remote_file_path": "gs://utic-test-ingest-fixtures/",
"file_id": "utic-test-ingest-fixtures/nested-2/nested/ideas-page.html/1687304904584421"
},
"date_created": "1687304904.586",
"date_modified": "1687304904.586"

View File

@ -15,7 +15,8 @@
"version": "25646232132200560657189097157576319365",
"record_locator": {
"protocol": "gs",
"remote_file_path": "gs://utic-test-ingest-fixtures/"
"remote_file_path": "gs://utic-test-ingest-fixtures/",
"file_id": "utic-test-ingest-fixtures/nested-2/stanley-cups.xlsx/1687304904970987"
},
"date_created": "1687304904.973",
"date_modified": "1687304904.973"
@ -39,7 +40,8 @@
"version": "25646232132200560657189097157576319365",
"record_locator": {
"protocol": "gs",
"remote_file_path": "gs://utic-test-ingest-fixtures/"
"remote_file_path": "gs://utic-test-ingest-fixtures/",
"file_id": "utic-test-ingest-fixtures/nested-2/stanley-cups.xlsx/1687304904970987"
},
"date_created": "1687304904.973",
"date_modified": "1687304904.973"
@ -62,7 +64,8 @@
"version": "25646232132200560657189097157576319365",
"record_locator": {
"protocol": "gs",
"remote_file_path": "gs://utic-test-ingest-fixtures/"
"remote_file_path": "gs://utic-test-ingest-fixtures/",
"file_id": "utic-test-ingest-fixtures/nested-2/stanley-cups.xlsx/1687304904970987"
},
"date_created": "1687304904.973",
"date_modified": "1687304904.973"
@ -86,7 +89,8 @@
"version": "25646232132200560657189097157576319365",
"record_locator": {
"protocol": "gs",
"remote_file_path": "gs://utic-test-ingest-fixtures/"
"remote_file_path": "gs://utic-test-ingest-fixtures/",
"file_id": "utic-test-ingest-fixtures/nested-2/stanley-cups.xlsx/1687304904970987"
},
"date_created": "1687304904.973",
"date_modified": "1687304904.973"

View File

@ -1 +1 @@
__version__ = "0.15.0-dev15" # pragma: no cover
__version__ = "0.15.0-dev16" # pragma: no cover

View File

@ -187,6 +187,9 @@ class FsspecIndexer(Indexer):
"protocol": self.index_config.protocol,
"remote_file_path": self.index_config.remote_url,
}
file_stat = self.fs.stat(path=path)
if file_id := file_stat.get("id"):
record_locator["file_id"] = file_id
if metadata:
record_locator["metadata"] = metadata
return DataSourceMetadata(