2025-04-03 10:39:47 +05:30

57 lines
2.0 KiB
Python

# Copyright 2025 Collate
# Licensed under the Collate Community License, Version 1.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
# https://github.com/open-metadata/OpenMetadata/blob/main/ingestion/LICENSE
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
from airflow import DAG
# these are params only used in the DAG factory, not in the tasks
from openmetadata_managed_apis.utils.logger import workflow_logger
from openmetadata_managed_apis.workflows.ingestion.registry import build_registry
from metadata.generated.schema.entity.services.ingestionPipelines.ingestionPipeline import (
IngestionPipeline,
)
# Module-level logger; used below to record build errors before they are raised.
logger = workflow_logger()
class WorkflowBuilder:
    """
    Builds the Airflow DAG for a single ingestion pipeline.

    The pipeline's ``pipelineType`` value is looked up in ``build_registry``
    to find the function that creates the DAG.

    :param ingestion_pipeline: pipeline definition the DAG is built from
    """

    def __init__(self, ingestion_pipeline: IngestionPipeline) -> None:
        self.airflow_pipeline = ingestion_pipeline
        # The pipeline name is kept as the DAG name.
        self.dag_name: str = self.airflow_pipeline.name.root

    def build(self) -> DAG:
        """
        Generates a DAG from the ingestion pipeline.

        :returns: the DAG produced by the build function registered for
            the pipeline type
        :raises ValueError: if no build function is registered for the
            pipeline type, or if the build function does not return a DAG
        """
        dag_type = self.airflow_pipeline.pipelineType.value

        build_fn = build_registry.registry.get(dag_type)
        if not build_fn:
            msg = f"Cannot find build function for {dag_type} in {build_registry.registry}"
            logger.error(msg)
            raise ValueError(msg)

        dag = build_fn(self.airflow_pipeline)
        if not isinstance(dag, DAG):
            # Not every callable has __name__ (e.g. functools.partial); fall
            # back to repr so the intended ValueError is raised instead of
            # an AttributeError from building the message.
            fn_name = getattr(build_fn, "__name__", repr(build_fn))
            msg = f"Invalid return type from {fn_name} when building {dag_type}."
            logger.error(msg)
            raise ValueError(msg)

        return dag