| 
									
										
										
										
											2023-11-13 08:58:38 +01:00
										 |  |  | #  Copyright 2021 Collate | 
					
						
							|  |  |  | #  Licensed under the Apache License, Version 2.0 (the "License"); | 
					
						
							|  |  |  | #  you may not use this file except in compliance with the License. | 
					
						
							|  |  |  | #  You may obtain a copy of the License at | 
					
						
							|  |  |  | #  http://www.apache.org/licenses/LICENSE-2.0 | 
					
						
							|  |  |  | #  Unless required by applicable law or agreed to in writing, software | 
					
						
							|  |  |  | #  distributed under the License is distributed on an "AS IS" BASIS, | 
					
						
							|  |  |  | #  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | 
					
						
							|  |  |  | #  See the License for the specific language governing permissions and | 
					
						
							|  |  |  | #  limitations under the License. | 
					
						
							|  |  |  | """
 | 
					
						
							|  |  |  | Generic Workflow entrypoint to execute Applications | 
					
						
							|  |  |  | """
 | 
					
						
							|  |  |  | import json | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | from airflow import DAG | 
					
						
							|  |  |  | from openmetadata_managed_apis.utils.logger import set_operator_logger | 
					
						
							|  |  |  | from openmetadata_managed_apis.workflows.ingestion.common import ( | 
					
						
							|  |  |  |     build_dag, | 
					
						
							|  |  |  |     build_workflow_config_property, | 
					
						
							|  |  |  | ) | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2023-11-28 06:25:33 +05:30
										 |  |  | from metadata.generated.schema.entity.applications.configuration.applicationConfig import ( | 
					
						
							| 
									
										
										
										
											2023-11-13 08:58:38 +01:00
										 |  |  |     AppConfig, | 
					
						
							| 
									
										
										
										
											2024-01-31 18:51:09 -08:00
										 |  |  |     PrivateConfig, | 
					
						
							| 
									
										
										
										
											2023-11-13 08:58:38 +01:00
										 |  |  | ) | 
					
						
							|  |  |  | from metadata.generated.schema.entity.services.ingestionPipelines.ingestionPipeline import ( | 
					
						
							|  |  |  |     IngestionPipeline, | 
					
						
							|  |  |  | ) | 
					
						
							|  |  |  | from metadata.generated.schema.metadataIngestion.application import ( | 
					
						
							|  |  |  |     OpenMetadataApplicationConfig, | 
					
						
							|  |  |  | ) | 
					
						
							|  |  |  | from metadata.generated.schema.metadataIngestion.applicationPipeline import ( | 
					
						
							|  |  |  |     ApplicationPipeline, | 
					
						
							|  |  |  | ) | 
					
						
							|  |  |  | from metadata.workflow.application import ApplicationWorkflow | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | def application_workflow(workflow_config: OpenMetadataApplicationConfig): | 
					
						
							|  |  |  |     """
 | 
					
						
							|  |  |  |     Task that creates and runs the ingestion workflow. | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     The workflow_config gets cooked form the incoming | 
					
						
							|  |  |  |     ingestionPipeline. | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     This is the callable used to create the PythonOperator | 
					
						
							|  |  |  |     """
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     set_operator_logger(workflow_config) | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2025-02-25 17:51:49 +01:00
										 |  |  |     config = json.loads( | 
					
						
							|  |  |  |         workflow_config.model_dump_json(exclude_defaults=False, mask_secrets=False) | 
					
						
							|  |  |  |     ) | 
					
						
							| 
									
										
										
										
											2023-11-13 08:58:38 +01:00
										 |  |  |     workflow = ApplicationWorkflow.create(config) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     workflow.execute() | 
					
						
							|  |  |  |     workflow.raise_from_status() | 
					
						
							| 
									
										
										
										
											2024-07-29 09:20:34 +02:00
										 |  |  |     workflow.print_status() | 
					
						
							| 
									
										
										
										
											2023-11-13 08:58:38 +01:00
										 |  |  |     workflow.stop() | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | def build_application_workflow_config( | 
					
						
							|  |  |  |     ingestion_pipeline: IngestionPipeline, | 
					
						
							|  |  |  | ) -> OpenMetadataApplicationConfig: | 
					
						
							|  |  |  |     """
 | 
					
						
							|  |  |  |     Given an airflow_pipeline, prepare the workflow config JSON | 
					
						
							|  |  |  |     """
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     # Here we have an application pipeline, so the Source Config is of type ApplicationPipeline | 
					
						
							|  |  |  |     application_pipeline_conf: ApplicationPipeline = ( | 
					
						
							|  |  |  |         ingestion_pipeline.sourceConfig.config | 
					
						
							|  |  |  |     ) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     application_workflow_config = OpenMetadataApplicationConfig( | 
					
						
							|  |  |  |         sourcePythonClass=application_pipeline_conf.sourcePythonClass, | 
					
						
							|  |  |  |         # We pass the generic class and let each app cast the actual object | 
					
						
							|  |  |  |         appConfig=AppConfig( | 
					
						
							| 
									
										
										
										
											2024-06-05 21:18:37 +02:00
										 |  |  |             root=application_pipeline_conf.appConfig.root, | 
					
						
							| 
									
										
										
										
											2024-01-31 18:51:09 -08:00
										 |  |  |         ) | 
					
						
							|  |  |  |         if application_pipeline_conf.appConfig | 
					
						
							|  |  |  |         else None, | 
					
						
							|  |  |  |         appPrivateConfig=PrivateConfig( | 
					
						
							| 
									
										
										
										
											2024-06-05 21:18:37 +02:00
										 |  |  |             root=application_pipeline_conf.appPrivateConfig.root | 
					
						
							| 
									
										
										
										
											2024-01-31 18:51:09 -08:00
										 |  |  |         ) | 
					
						
							|  |  |  |         if application_pipeline_conf.appPrivateConfig | 
					
						
							|  |  |  |         else None, | 
					
						
							| 
									
										
										
										
											2023-11-13 08:58:38 +01:00
										 |  |  |         workflowConfig=build_workflow_config_property(ingestion_pipeline), | 
					
						
							| 
									
										
										
										
											2024-06-05 21:18:37 +02:00
										 |  |  |         ingestionPipelineFQN=ingestion_pipeline.fullyQualifiedName.root, | 
					
						
							| 
									
										
										
										
											2023-11-13 08:58:38 +01:00
										 |  |  |     ) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     return application_workflow_config | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | def build_application_dag(ingestion_pipeline: IngestionPipeline) -> DAG: | 
					
						
							|  |  |  |     """
 | 
					
						
							|  |  |  |     Build a simple metadata workflow DAG | 
					
						
							|  |  |  |     """
 | 
					
						
							|  |  |  |     application_workflow_config = build_application_workflow_config(ingestion_pipeline) | 
					
						
							|  |  |  |     dag = build_dag( | 
					
						
							|  |  |  |         task_name="application_task", | 
					
						
							|  |  |  |         ingestion_pipeline=ingestion_pipeline, | 
					
						
							|  |  |  |         workflow_config=application_workflow_config, | 
					
						
							|  |  |  |         workflow_fn=application_workflow, | 
					
						
							|  |  |  |     ) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     return dag |