mirror of
https://github.com/Unstructured-IO/unstructured.git
synced 2025-09-12 18:20:22 +00:00
bugfix: google drive connector metadata safegaurds (#3407)
### Description At times, the google drive response doens't have some of the metadata we're grabbing to populate the `FileData` metadata. This is fine, but without the added safegaurds, this can cause a `KeyError`.
This commit is contained in:
parent
e99e5a8abd
commit
5d387030eb
@ -129,15 +129,15 @@ class GoogleDriveIndexer(Indexer):
|
|||||||
def map_file_data(f: dict) -> FileData:
|
def map_file_data(f: dict) -> FileData:
|
||||||
file_id = f["id"]
|
file_id = f["id"]
|
||||||
filename = f.pop("name")
|
filename = f.pop("name")
|
||||||
url = f.pop("webContentLink")
|
url = f.pop("webContentLink", None)
|
||||||
version = f.pop("version", None)
|
version = f.pop("version", None)
|
||||||
permissions = f.pop("permissions", None)
|
permissions = f.pop("permissions", None)
|
||||||
date_created_str = f.pop("createdTime")
|
date_created_str = f.pop("createdTime", None)
|
||||||
date_created_dt = parser.parse(date_created_str)
|
date_created_dt = parser.parse(date_created_str) if date_created_str else None
|
||||||
date_modified_str = f.pop("modifiedTime")
|
date_modified_str = f.pop("modifiedTime", None)
|
||||||
parent_path = f.pop("parent_path", None)
|
parent_path = f.pop("parent_path", None)
|
||||||
parent_root_path = f.pop("parent_root_path", None)
|
parent_root_path = f.pop("parent_root_path", None)
|
||||||
date_modified_dt = parser.parse(date_modified_str)
|
date_modified_dt = parser.parse(date_modified_str) if date_modified_str else None
|
||||||
if (
|
if (
|
||||||
parent_path
|
parent_path
|
||||||
and isinstance(parent_path, str)
|
and isinstance(parent_path, str)
|
||||||
|
Loading…
x
Reference in New Issue
Block a user