| 
									
										
										
										
											2025-04-03 10:39:47 +05:30
										 |  |  | #  Copyright 2025 Collate | 
					
						
							|  |  |  | #  Licensed under the Collate Community License, Version 1.0 (the "License"); | 
					
						
							| 
									
										
										
										
											2022-07-18 18:50:27 +02:00
										 |  |  | #  you may not use this file except in compliance with the License. | 
					
						
							|  |  |  | #  You may obtain a copy of the License at | 
					
						
							| 
									
										
										
										
											2025-04-03 10:39:47 +05:30
										 |  |  | #  https://github.com/open-metadata/OpenMetadata/blob/main/ingestion/LICENSE | 
					
						
							| 
									
										
										
										
											2022-07-18 18:50:27 +02:00
										 |  |  | #  Unless required by applicable law or agreed to in writing, software | 
					
						
							|  |  |  | #  distributed under the License is distributed on an "AS IS" BASIS, | 
					
						
							|  |  |  | #  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | 
					
						
							|  |  |  | #  See the License for the specific language governing permissions and | 
					
						
							|  |  |  | #  limitations under the License. | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | """
 | 
					
						
							|  |  |  | Query parser utils tests | 
					
						
							|  |  |  | """
 | 
					
						
							|  |  |  | import json | 
					
						
							| 
									
										
										
										
											2024-07-26 16:45:34 +02:00
										 |  |  | import os.path | 
					
						
							| 
									
										
										
										
											2022-07-18 18:50:27 +02:00
										 |  |  | from unittest import TestCase | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2023-08-30 15:49:42 +02:00
										 |  |  | from metadata.workflow.usage import UsageWorkflow | 
					
						
							| 
									
										
										
										
											2022-07-18 18:50:27 +02:00
										 |  |  | 
 | 
					
						
# JSON definition of the usage workflow exercised by the test in this module.
# It is parsed with ``json.loads`` before being handed to ``UsageWorkflow``.
#   - source: a "custom-database" service whose ``sourcePythonClass`` is
#     ``SampleUsageSource``; ``sampleDataFolder`` is a repository-relative
#     path that the test rewrites relative to this file before running.
#   - processor: "query-parser" with an empty config.
#   - stage / bulkSink: both use the same ``/tmp/sample_usage`` filename.
#   - workflowConfig: points at ``http://localhost:8585/api``.
# NOTE(review): the embedded JWT looks like a development admin token for a
# local server -- confirm it is not a real credential.
config = """
{
  "source": {
    "type": "custom-database",
    "serviceName": "sample_data",
    "serviceConnection": {
      "config": {
        "type": "CustomDatabase",
        "sourcePythonClass": "metadata.ingestion.source.database.sample_usage.SampleUsageSource",
        "connectionOptions": {
          "sampleDataFolder": "ingestion/examples/sample_data"
        }
      }
    },
    "sourceConfig": {
      "config":{
        "type": "DatabaseUsage"
      }
    }
  },
  "processor": {
    "type": "query-parser",
    "config": {}
  },
  "stage": {
    "type": "table-usage",
    "config": {
      "filename": "/tmp/sample_usage"
    }
  },
  "bulkSink": {
    "type": "metadata-usage",
    "config": {
      "filename": "/tmp/sample_usage"
    }
  },
  "workflowConfig": {
    "openMetadataServerConfig": {
      "hostPort": "http://localhost:8585/api",
      "authProvider": "openmetadata",
      "securityConfig": {
        "jwtToken": "eyJraWQiOiJHYjM4OWEtOWY3Ni1nZGpzLWE5MmotMDI0MmJrOTQzNTYiLCJ0eXAiOiJKV1QiLCJhbGciOiJSUzI1NiJ9.eyJzdWIiOiJhZG1pbiIsImlzQm90IjpmYWxzZSwiaXNzIjoib3Blbi1tZXRhZGF0YS5vcmciLCJpYXQiOjE2NjM5Mzg0NjIsImVtYWlsIjoiYWRtaW5Ab3Blbm1ldGFkYXRhLm9yZyJ9.tS8um_5DKu7HgzGBzS1VTA5uUjKWOCU0B_j08WXBiEC0mr0zNREkqVfwFDD-d24HlNEbrqioLsBuFRiwIWKc1m_ZlVQbG7P36RUxhuv2vbSp80FKyNM-Tj93FDzq91jsyNmsQhyNv_fNr3TXfzzSPjHt8Go0FMMP66weoKMgW2PbXlhVKwEuXUHyakLLzewm9UMeQaEiRzhiTMU3UkLXcKbYEJJvfNFcLwSl9W8JCO_l0Yj3ud-qt_nQYEZwqW6u5nfdQllN133iikV4fM5QZsMCnm8Rq1mvLR0y9bmJiD7fwM1tmJ791TUWqmKaTnP49U493VanKpUAfzIiOiIbhg"
      }
    }
  }
}
"""
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | class QueryParserTest(TestCase): | 
					
						
							|  |  |  |     def test_join_count(self): | 
					
						
							|  |  |  |         """
 | 
					
						
							|  |  |  |         Check the join count | 
					
						
							|  |  |  |         """
 | 
					
						
							|  |  |  |         expected_result = { | 
					
						
							| 
									
										
										
										
											2025-03-14 13:37:40 +05:30
										 |  |  |             "shopify.raw_product_catalog": 5, | 
					
						
							|  |  |  |             "dim_customer": 4, | 
					
						
							|  |  |  |             "fact_order": 4, | 
					
						
							|  |  |  |             "shopify.fact_sale": 5, | 
					
						
							| 
									
										
										
										
											2025-03-17 11:33:50 +05:30
										 |  |  |             "shopify.raw_customer": 11, | 
					
						
							| 
									
										
										
										
											2022-07-18 18:50:27 +02:00
										 |  |  |         } | 
					
						
							| 
									
										
										
										
											2024-07-26 16:45:34 +02:00
										 |  |  |         config_dict = json.loads(config) | 
					
						
							|  |  |  |         config_dict["source"]["serviceConnection"]["config"]["connectionOptions"][ | 
					
						
							|  |  |  |             "sampleDataFolder" | 
					
						
							|  |  |  |         ] = ( | 
					
						
							|  |  |  |             os.path.dirname(__file__) | 
					
						
							|  |  |  |             + "/../../../" | 
					
						
							|  |  |  |             + config_dict["source"]["serviceConnection"]["config"]["connectionOptions"][ | 
					
						
							|  |  |  |                 "sampleDataFolder" | 
					
						
							|  |  |  |             ] | 
					
						
							|  |  |  |         ) | 
					
						
							|  |  |  |         workflow = UsageWorkflow.create(config_dict) | 
					
						
							| 
									
										
										
										
											2022-07-18 18:50:27 +02:00
										 |  |  |         workflow.execute() | 
					
						
							|  |  |  |         table_usage_map = {} | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2023-08-30 15:49:42 +02:00
										 |  |  |         # UsageWorkflow has the steps (processor, stage, bulk_sink) | 
					
						
							|  |  |  |         for key, value in workflow.steps[1].table_usage.items(): | 
					
						
							| 
									
										
										
										
											2022-07-18 18:50:27 +02:00
										 |  |  |             table_usage_map[key[0]] = value.count | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         for table_name, expected_count in expected_result.items(): | 
					
						
							|  |  |  |             try: | 
					
						
							|  |  |  |                 self.assertEqual(table_usage_map[table_name], expected_count) | 
					
						
							| 
									
										
										
										
											2023-08-30 15:49:42 +02:00
										 |  |  |             except KeyError: | 
					
						
							| 
									
										
										
										
											2022-07-18 18:50:27 +02:00
										 |  |  |                 self.assertTrue(False) | 
					
						
							|  |  |  |         workflow.stop() |