2024-06-18 15:53:06 +02:00 
										
									 
								 
							 
							
								
							 
							
								 
							
							
								---
							 
						 
					
						
							
								
									
										
										
										
											2025-06-20 19:46:38 +05:30 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								title: Airflow Connector | OpenMetadata Workflow Orchestration
							 
						 
					
						
							
								
									
										
										
										
											2025-07-03 17:39:09 +05:30 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								description: Connect Apache Airflow to OpenMetadata effortlessly. Complete setup guide, configuration steps, and pipeline metadata extraction for seamless data lineage tracking.
							 
						 
					
						
							
								
									
										
										
										
											2024-06-18 15:53:06 +02:00 
										
									 
								 
							 
							
								
							 
							
								 
							
							
								slug: /connectors/pipeline/airflow
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								---
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								{% connectorDetailsHeader
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								name="Airflow"
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								stage="PROD"
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								platform="OpenMetadata"
							 
						 
					
						
							
								
									
										
										
										
											2025-03-13 13:58:04 +05:30 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								availableFeatures=["Pipelines", "Pipeline Status", "Lineage", "Owners", "Usage"]
							 
						 
					
						
							
								
									
										
										
										
											2024-06-18 15:53:06 +02:00 
										
									 
								 
							 
							
								
							 
							
								 
							
							
								unavailableFeatures=["Tags"]
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								/ %}
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								In this section, we provide guides and references to use the Airflow connector.
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								Configure and schedule Airflow metadata workflow from the OpenMetadata UI:
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								
							 
						 
					
						
							
								
									
										
										
										
											2025-05-06 15:17:48 +05:30 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								- [Troubleshooting](/connectors/pipeline/airflow/troubleshooting)
						 
					
						
							
								
									
										
										
										
											2025-04-04 13:59:31 +05:30 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								
							 
						 
					
						
							
								
									
										
										
										
											2025-04-18 08:42:17 +02:00 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								{% partial file="/v1.8/connectors/ingestion-modes-tiles.md" variables={yamlPath: "/connectors/pipeline/airflow/yaml"} /%}
							 
						 
					
						
							
								
									
										
										
										
											2024-06-18 15:53:06 +02:00 
										
									 
								 
							 
							
								
							 
							
								 
							
							
								
							 
						 
					
						
							
								
									
										
										
										
											2025-05-16 15:14:55 +05:30 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								{% tilesContainer %}
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								{% tile
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								    title="MWAA"
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								    description="Run the ingestion framework externally!"
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								    link="/deployment/ingestion/external/mwaa"
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								  / %}
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								{% tile
							 
						 
					
						
							
								
									
										
										
										
											2025-07-17 18:23:04 +05:30 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								    title="GCP Composer"
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								    description="Run the ingestion from GCP Composer."
							 
						 
					
						
							
								
									
										
										
										
											2025-05-16 15:14:55 +05:30 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								    link="/deployment/ingestion/external/gcs-composer"
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								  / %}
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								{% /tilesContainer %}
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								
							 
						 
					
						
							
								
									
										
										
										
											2024-06-18 15:53:06 +02:00 
										
									 
								 
							 
							
								
							 
							
								 
							
							
								## Requirements
  
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								{% note %}
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								We only support officially supported Airflow versions. 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								You can check the version list [here](https://airflow.apache.org/docs/apache-airflow/stable/installation/supported-versions.html).
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								{% /note %}
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								## Metadata Ingestion
  
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								{% partial 
							 
						 
					
						
							
								
									
										
										
										
											2025-04-18 08:42:17 +02:00 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								  file="/v1.8/connectors/metadata-ingestion-ui.md" 
							 
						 
					
						
							
								
									
										
										
										
											2024-06-18 15:53:06 +02:00 
										
									 
								 
							 
							
								
							 
							
								 
							
							
								  variables={
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								    connector: "Airflow", 
							 
						 
					
						
							
								
									
										
										
										
											2025-04-18 08:42:17 +02:00 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								    selectServicePath: "/images/v1.8/connectors/airflow/select-service.png",
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								    addNewServicePath: "/images/v1.8/connectors/airflow/add-new-service.png",
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								    serviceConnectionPath: "/images/v1.8/connectors/airflow/service-connection.png",
							 
						 
					
						
							
								
									
										
										
										
											2024-06-18 15:53:06 +02:00 
										
									 
								 
							 
							
								
							 
							
								 
							
							
								} 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								/%}
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								{% stepsContainer %}
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								{% extraContent parentTagName="stepsContainer" %}
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								#### Connection Details
  
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								-  **Host and Port**: URL to the Airflow instance. 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								- **Number of Status**: Number of statuses to look back on in every ingestion (e.g., past executions of a DAG).
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								- **Connection**: Airflow metadata database connection. See these [docs](https://airflow.apache.org/docs/apache-airflow/stable/howto/set-up-database.html)
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								  for supported backends.
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								In terms of `connection`, we support the following selections:
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								- `backend`: Should not be used from the UI. This is only applicable when ingesting Airflow metadata locally
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								    by running the ingestion from a DAG. It will use the current Airflow SQLAlchemy connection to extract the data.
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								- `MySQL`, `Postgres`, and `SQLite`: Pass the required credentials to reach each of these services. We
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								    will create a connection to the pointed database and read Airflow data from there.
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								{% /extraContent %}
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								
							 
						 
					
						
							
								
									
										
										
										
											2025-04-18 08:42:17 +02:00 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								{% partial file="/v1.8/connectors/test-connection.md" /%}
							 
						 
					
						
							
								
									
										
										
										
											2024-06-18 15:53:06 +02:00 
										
									 
								 
							 
							
								
							 
							
								 
							
							
								
							 
						 
					
						
							
								
									
										
										
										
											2025-04-18 08:42:17 +02:00 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								{% partial file="/v1.8/connectors/pipeline/configure-ingestion.md" /%}
							 
						 
					
						
							
								
									
										
										
										
											2024-06-18 15:53:06 +02:00 
										
									 
								 
							 
							
								
							 
							
								 
							
							
								
							 
						 
					
						
							
								
									
										
										
										
											2025-04-18 08:42:17 +02:00 
										
									 
								 
							 
							
								
									
										 
								
							 
							
								 
							
							
								{% partial file="/v1.8/connectors/ingestion-schedule-and-deploy.md" /%}
							 
						 
					
						
							
								
									
										
										
										
											2024-06-18 15:53:06 +02:00 
										
									 
								 
							 
							
								
							 
							
								 
							
							
								
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							
							
								{% /stepsContainer %}