diff --git a/ingestion/src/metadata/profiler/processor/sample_data_handler.py b/ingestion/src/metadata/profiler/processor/sample_data_handler.py index e6410daeac0..2536682a5d0 100644 --- a/ingestion/src/metadata/profiler/processor/sample_data_handler.py +++ b/ingestion/src/metadata/profiler/processor/sample_data_handler.py @@ -17,8 +17,6 @@ from datetime import datetime from functools import singledispatch from io import BytesIO -import pandas as pd - from metadata.clients.aws_client import AWSClient from metadata.generated.schema.entity.data.table import Table, TableData from metadata.generated.schema.security.credentials.awsCredentials import AWSCredentials @@ -44,6 +42,8 @@ def upload_sample_data(data: TableData, profiler_interface: ProfilerInterface) - """ Upload Sample data to storage config """ + import pandas as pd # pylint: disable=import-outside-toplevel + try: sample_storage_config = profiler_interface.storage_config if not sample_storage_config: diff --git a/ingestion/tests/cli_e2e/test_cli_athena.py b/ingestion/tests/cli_e2e/test_cli_athena.py index 348c1f3d06a..becd6a37a58 100644 --- a/ingestion/tests/cli_e2e/test_cli_athena.py +++ b/ingestion/tests/cli_e2e/test_cli_athena.py @@ -60,7 +60,7 @@ class AthenaCliTest(CliCommonDB.TestSuite): return 7 def inserted_rows_count(self) -> int: - return 100 + return 50 def view_column_lineage_count(self) -> int: pass diff --git a/ingestion/tests/cli_e2e/test_cli_datalake_s3.py b/ingestion/tests/cli_e2e/test_cli_datalake_s3.py index 8428567f505..80a035a2dda 100644 --- a/ingestion/tests/cli_e2e/test_cli_datalake_s3.py +++ b/ingestion/tests/cli_e2e/test_cli_datalake_s3.py @@ -58,7 +58,7 @@ class DatalakeCliTest(CliCommonDB.TestSuite): return 7 def inserted_rows_count(self) -> int: - return 100 + return 50 def view_column_lineage_count(self) -> int: pass diff --git a/ingestion/tests/cli_e2e/test_cli_redshift.py b/ingestion/tests/cli_e2e/test_cli_redshift.py index d9f473e0b66..e90af0ab776 100644 --- a/ingestion/tests/cli_e2e/test_cli_redshift.py +++ b/ingestion/tests/cli_e2e/test_cli_redshift.py @@ -83,7 +83,7 @@ class RedshiftCliTest(CliCommonDB.TestSuite, SQACommonMethods): return 5 def inserted_rows_count(self) -> int: - return 100 + return 50 def view_column_lineage_count(self) -> int: """