mirror of
https://github.com/open-metadata/OpenMetadata.git
synced 2025-10-02 04:13:17 +00:00
128 lines
4.5 KiB
Python
128 lines
4.5 KiB
Python
# Copyright 2025 Collate
|
|
# Licensed under the Collate Community License, Version 1.0 (the "License");
|
|
# you may not use this file except in compliance with the License.
|
|
# You may obtain a copy of the License at
|
|
# https://github.com/open-metadata/OpenMetadata/blob/main/ingestion/LICENSE
|
|
# Unless required by applicable law or agreed to in writing, software
|
|
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
# See the License for the specific language governing permissions and
|
|
# limitations under the License.
|
|
|
|
"""
|
|
Helpers module for db sources
|
|
"""
|
|
|
|
import traceback
|
|
from typing import Iterable, List, Union
|
|
|
|
from metadata.generated.schema.api.lineage.addLineage import AddLineageRequest
|
|
from metadata.generated.schema.entity.data.table import Table
|
|
from metadata.generated.schema.entity.services.databaseService import (
|
|
DatabaseServiceType,
|
|
)
|
|
from metadata.generated.schema.type.entityLineage import Source as LineageSource
|
|
from metadata.ingestion.api.models import Either
|
|
from metadata.ingestion.lineage.models import ConnectionTypeDialectMapper
|
|
from metadata.ingestion.lineage.parser import LINEAGE_PARSING_TIMEOUT, LineageParser
|
|
from metadata.ingestion.lineage.sql_lineage import (
|
|
get_lineage_by_query,
|
|
get_lineage_via_table_entity,
|
|
)
|
|
from metadata.ingestion.ometa.ometa_api import OpenMetadata
|
|
from metadata.ingestion.source.models import TableView
|
|
from metadata.utils import fqn
|
|
from metadata.utils.logger import utils_logger
|
|
|
|
# Module-level logger used by the helpers in this file for warnings and debug traces.
logger = utils_logger()
|
|
|
|
# Schema name that get_view_lineage substitutes when the view belongs to a Postgres service.
PUBLIC_SCHEMA = "public"
|
|
|
|
|
|
def get_host_from_host_port(uri: str) -> str:
    """
    Extract the host part of a "host:port" string.

    Everything before the first ":" is returned, so "localhost:9000"
    gives "localhost". A value that contains no ":" is returned unchanged.
    """
    host, _sep, _rest = uri.partition(":")
    return host
|
|
|
|
|
|
def get_view_lineage(
    view: TableView,
    metadata: OpenMetadata,
    service_names: Union[str, List[str]],
    connection_type: str,
    timeout_seconds: int = LINEAGE_PARSING_TIMEOUT,
) -> Iterable[Either[AddLineageRequest]]:
    """
    Method to generate view lineage
    Now supports cross-database lineage by accepting a list of service names.

    Args:
        view: view whose definition is parsed to derive lineage.
        metadata: OpenMetadata client used to build the view FQN and to fetch
            the view's table entity.
        service_names: a single service name or a list of them. The first
            entry is used to look up the view's own table entity; the whole
            list is forwarded to the lineage helpers.
        connection_type: converted with ``str()`` and mapped to a SQL dialect.
        timeout_seconds: forwarded to the parser and to the lineage helpers.

    Yields:
        The items produced by ``get_lineage_by_query`` when the parser finds
        both source and target tables, otherwise the items produced by
        ``get_lineage_via_table_entity``.

    Nothing is yielded (a warning is logged instead) when the view has no
    definition, when the view's table entity cannot be fetched, or when any
    exception is raised while parsing or building the lineage.
    """
    if isinstance(service_names, str):
        service_names = [service_names]
    table_name = view.table_name
    schema_name = view.schema_name
    db_name = view.db_name
    schema_fallback = False
    view_definition = view.view_definition
    table_fqn = fqn.build(
        metadata,
        entity_type=Table,
        service_name=service_names[0],  # Use first service for table entity lookup
        database_name=db_name,
        schema_name=schema_name,
        table_name=table_name,
    )

    # Bail out before fetching the table entity: without a definition there
    # is nothing to parse, so the lookup would be wasted work.
    if not view_definition:
        logger.warning(f"View definition for view {table_fqn} not available")
        return

    table_entity: Union[Table, None] = metadata.get_by_name(
        entity=Table,
        fqn=table_fqn,
    )

    # The lookup may come back empty. Report that explicitly instead of
    # letting the attribute access below fail and be logged as a query
    # parsing problem.
    if table_entity is None:
        logger.warning(
            f"Table entity for view {table_fqn} not found, skipping view lineage"
        )
        return

    try:
        connection_type = str(connection_type)
        dialect = ConnectionTypeDialectMapper.dialect_of(connection_type)
        lineage_parser = LineageParser(
            view_definition, dialect, timeout_seconds=timeout_seconds
        )

        if table_entity.serviceType == DatabaseServiceType.Postgres:
            # For Postgres, if schema is not defined, we need to use the public schema
            # NOTE(review): the override is applied to every Postgres view,
            # whatever view.schema_name holds; schema_fallback=True is passed
            # on to the lineage helpers - confirm how they use it.
            schema_name = PUBLIC_SCHEMA
            schema_fallback = True

        # "or []" keeps "yield from" valid if a helper returns None.
        if lineage_parser.source_tables and lineage_parser.target_tables:
            yield from get_lineage_by_query(
                metadata,
                query=view_definition,
                service_names=service_names,
                database_name=db_name,
                schema_name=schema_name,
                dialect=dialect,
                timeout_seconds=timeout_seconds,
                lineage_source=LineageSource.ViewLineage,
                schema_fallback=schema_fallback,
            ) or []

        else:
            yield from get_lineage_via_table_entity(
                metadata,
                table_entity=table_entity,
                service_names=service_names,
                database_name=db_name,
                schema_name=schema_name,
                query=view_definition,
                dialect=dialect,
                timeout_seconds=timeout_seconds,
                lineage_source=LineageSource.ViewLineage,
                schema_fallback=schema_fallback,
            ) or []
    except Exception as exc:
        # Best-effort: a failure on one view must not abort the caller, so
        # the error is logged and the generator simply ends.
        logger.debug(traceback.format_exc())
        logger.warning(
            f"Could not parse query [{view_definition}] ingesting lineage failed: {exc}"
        )
|