From 726ee0f6b87cf473b067044e28adb490ddfc2569 Mon Sep 17 00:00:00 2001 From: Tamas Nemeth Date: Fri, 23 Jun 2023 09:12:50 +0200 Subject: [PATCH] fix(ingest/csv-enricher): Adding extra check in csv enricher to ignore non-urn urns (#8169) Co-authored-by: Pedro Silva --- .../src/datahub/ingestion/source/csv_enricher.py | 10 +++++++--- 1 file changed, 7 insertions(+), 3 deletions(-) diff --git a/metadata-ingestion/src/datahub/ingestion/source/csv_enricher.py b/metadata-ingestion/src/datahub/ingestion/source/csv_enricher.py index 869d5a0254..1e9879f599 100644 --- a/metadata-ingestion/src/datahub/ingestion/source/csv_enricher.py +++ b/metadata-ingestion/src/datahub/ingestion/source/csv_enricher.py @@ -546,7 +546,9 @@ class CSVEnricherSource(Source): term_urns: List[str] = terms_array_string.split(self.config.array_delimiter) term_associations: List[GlossaryTermAssociationClass] = [ - GlossaryTermAssociationClass(term) for term in term_urns + GlossaryTermAssociationClass(term) + for term in term_urns + if term.startswith("urn:li:") ] return term_associations @@ -559,7 +561,7 @@ class CSVEnricherSource(Source): tag_urns: List[str] = tags_array_string.split(self.config.array_delimiter) tag_associations: List[TagAssociationClass] = [ - TagAssociationClass(tag) for tag in tag_urns + TagAssociationClass(tag) for tag in tag_urns if tag.startswith("urn:li:") ] return tag_associations @@ -582,7 +584,9 @@ class CSVEnricherSource(Source): owner_urns: List[str] = owners_array_string.split(self.config.array_delimiter) owners: List[OwnerClass] = [ - OwnerClass(owner_urn, type=ownership_type) for owner_urn in owner_urns + OwnerClass(owner_urn, type=ownership_type) + for owner_urn in owner_urns + if owner_urn.startswith("urn:li:") ] return owners