Ignoring revisions in .git-blame-ignore-revs. Click here to bypass and see the normal blame view.

57 lines
2.0 KiB
Python
Raw Normal View History

# Copyright 2021 Collate
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
# http://www.apache.org/licenses/LICENSE-2.0
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
from airflow import DAG
# these are params only used in the DAG factory, not in the tasks
from openmetadata_managed_apis.utils.logger import workflow_logger
from openmetadata_managed_apis.workflows.ingestion.registry import build_registry
from metadata.generated.schema.entity.services.ingestionPipelines.ingestionPipeline import (
IngestionPipeline,
)
logger = workflow_logger()
class WorkflowBuilder:
    """
    Generates a DAG from an ingestion pipeline definition.

    The pipeline's ``pipelineType`` value selects a build function from
    ``build_registry``; that function is called with the pipeline and is
    expected to return a DAG.

    :param ingestion_pipeline: pipeline definition the DAG is built from
    """

    def __init__(self, ingestion_pipeline: IngestionPipeline) -> None:
        self.airflow_pipeline = ingestion_pipeline
        # The pipeline name is a wrapper object; its ``__root__`` attribute
        # is what gets stored as the DAG name.
        self.dag_name: str = self.airflow_pipeline.name.__root__

    def build(self) -> DAG:
        """
        Generates the DAG for the configured ingestion pipeline.

        :returns: the DAG produced by the build function registered for
            the pipeline type
        :raises ValueError: if no build function is registered for the
            pipeline type, or if the build function returns something
            that is not a DAG
        """
        dag_type = self.airflow_pipeline.pipelineType.value

        build_fn = build_registry.registry.get(dag_type)
        if not build_fn:
            msg = f"Cannot find build function for {dag_type} in {build_registry.registry}"
            logger.error(msg)
            raise ValueError(msg)

        dag = build_fn(self.airflow_pipeline)
        if not isinstance(dag, DAG):
            # Registered callables are not guaranteed to expose ``__name__``
            # (e.g. functools.partial objects); fall back to repr() so the
            # intended ValueError is raised instead of an AttributeError.
            fn_name = getattr(build_fn, "__name__", repr(build_fn))
            msg = f"Invalid return type from {fn_name} when building {dag_type}."
            logger.error(msg)
            raise ValueError(msg)

        return dag