from datahub.metadata.urns import DatasetUrn from datahub.sdk.main_client import DataHubClient client = DataHubClient.from_env() client.lineage.add_dataset_copy_lineage( upstream=DatasetUrn(platform="postgres", name="customer_data"), downstream=DatasetUrn(platform="snowflake", name="customer_info"), column_lineage="auto_fuzzy", ) # by default, the column lineage is "auto_fuzzy", which will match similar field names. # can also be "auto_strict" for strict matching. # can also be a dict mapping upstream fields to downstream fields. # e.g. # column_lineage={ # "customer_id": ["id"], # "full_name": ["first_name", "last_name"], # }