mirror of
https://github.com/datahub-project/datahub.git
synced 2025-07-03 23:28:11 +00:00
19 lines
657 B
Python
19 lines
657 B
Python
from datahub.metadata.urns import DatasetUrn
|
|
from datahub.sdk.main_client import DataHubClient
|
|
|
|
# Create the DataHub client via DataHubClient.from_env().
client = DataHubClient.from_env()

# Name both ends of the copy up front so the lineage call reads as
# "upstream -> downstream".
upstream_urn = DatasetUrn(platform="postgres", name="customer_data")
downstream_urn = DatasetUrn(platform="snowflake", name="customer_info")

# Register dataset-level copy lineage between the two datasets, passing
# "auto_fuzzy" as the column-lineage mode.
client.lineage.add_dataset_copy_lineage(
    upstream=upstream_urn,
    downstream=downstream_urn,
    column_lineage="auto_fuzzy",
)
|
|
# By default, column_lineage is "auto_fuzzy", which matches fields with similar names.
|
|
# It can also be "auto_strict" for strict matching.
|
|
# It can also be a dict mapping upstream fields to downstream fields,
|
|
# e.g.
|
|
# column_lineage={
|
|
# "customer_id": ["id"],
|
|
# "full_name": ["first_name", "last_name"],
|
|
# }
|