Fix #432: Added Redash Connector (#444)

* added redash connector

* added redash connector

* Added Redash Connector

* minor changes

Co-authored-by: parthp2107 <parth.panchal@deuexsoultions.com>
Co-authored-by: parthp2107 <parth@getcollate.io>
This commit is contained in:
parthp2107 2021-09-22 15:09:24 +05:30 committed by GitHub
parent d961948946
commit 06810cdec1
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23
3 changed files with 156 additions and 1 deletions

View File

@ -0,0 +1,28 @@
{
"source": {
"type": "redash",
"config": {
"api_key": "api_key",
"uri": "http://localhost:5000",
"service_name": "redash"
}
},
"sink": {
"type": "metadata-rest",
"config": {}
},
"metadata_server": {
"type": "metadata-server",
"config": {
"api_endpoint": "http://localhost:8585/api",
"auth_provider_type": "no-auth"
}
},
"cron": {
"minute": "*/5",
"hour": null,
"day": null,
"month": null,
"day_of_week": null
}
}

View File

@ -92,7 +92,8 @@ plugins: Dict[str, Set[str]] = {
"pii-processor": pii_requirements,
"presto": {"pyhive~=0.6.3"},
"postgres": {"pymysql>=1.0.2", "psycopg2-binary", "GeoAlchemy2"},
"redshift": {"sqlalchemy-redshift", "GeoAlchemy2", "psycopg2-binary"},
"redash": {"redash-toolbelt==0.1.4"},
"redshift": {"sqlalchemy-redshift", "psycopg2-binary", "GeoAlchemy2"},
"redshift-usage": {"sqlalchemy-redshift", "psycopg2-binary", "GeoAlchemy2"},
"scheduler": scheduler_requirements,
"data-profiler": {"openmetadata-data-profiler"},

View File

@ -0,0 +1,126 @@
# Licensed to the Apache Software Foundation (ASF) under one or more
# contributor license agreements. See the NOTICE file distributed with
# this work for additional information regarding copyright ownership.
# The ASF licenses this file to You under the Apache License, Version 2.0
# (the "License"); you may not use this file except in compliance with
# the License. You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
import uuid
from dataclasses import dataclass
from dataclasses import field
from typing import List, Iterable
import requests
from metadata.generated.schema.entity.data.chart import Chart
from metadata.generated.schema.type.entityReference import EntityReference
from metadata.ingestion.api.common import ConfigModel, Record, WorkflowContext
from metadata.ingestion.api.source import Source
from metadata.ingestion.api.source import SourceStatus
from metadata.ingestion.models.table_metadata import Dashboard
from metadata.ingestion.ometa.openmetadata_rest import MetadataServerConfig
from redash_toolbelt import Redash
from metadata.utils.helpers import get_dashboard_service_or_create
from metadata.generated.schema.entity.services.dashboardService import DashboardServiceType
class RedashSourceConfig(ConfigModel):
    """Connection settings consumed by the Redash ingestion source."""

    # Base URL of the Redash instance; defaults to a local install.
    uri: str = "http://localhost:5000"
    # Optional user name; empty unless the workflow config supplies one.
    username: str = ""
    # Redash API key (required, no default).
    api_key: str
    # Name of the dashboard service entry (required, no default).
    service_name: str
    # Service type label; defaults to "Redash".
    service_type: str = "Redash"
@dataclass
class RedashSourceStatus(SourceStatus):
    """Running counters kept by the Redash source while it produces records."""

    # How many items have been reported as scanned so far.
    items_scanned: int = 0
    # Items that were reported as dropped, in the order they were reported.
    filtered: List[str] = field(default_factory=list)

    def item_scanned_status(self) -> None:
        """Bump the scanned-item counter by one."""
        self.items_scanned = self.items_scanned + 1

    def item_dropped_status(self, item: str) -> None:
        """Record ``item`` in the list of filtered items."""
        self.filtered.extend((item,))
class RedashSource(Source):
    """Ingestion source that emits Redash charts and dashboards as records.

    Charts are built from the visualizations attached to each Redash query;
    dashboards are built from the Redash dashboard listing. Both are linked
    to the dashboard service obtained in ``__init__``.
    """

    config: RedashSourceConfig
    metadata_config: MetadataServerConfig
    status: RedashSourceStatus
    platform = "redash"

    def __init__(
        self,
        config: RedashSourceConfig,
        metadata_config: MetadataServerConfig,
        ctx: WorkflowContext,
    ):
        """Set up the Redash client and look up (or create) the dashboard service.

        Args:
            config: Redash connection settings.
            metadata_config: Settings for the metadata server.
            ctx: Workflow context forwarded to the base ``Source``.
        """
        super().__init__(ctx)
        self.config = config
        self.metadata_config = metadata_config
        self.status = RedashSourceStatus()
        self.client = Redash(self.config.uri, self.config.api_key)
        self.service = get_dashboard_service_or_create(
            config.service_name,
            DashboardServiceType.Redash.name,
            config.username,
            config.api_key,
            config.uri,
            metadata_config,
        )

    @classmethod
    def create(cls, config_dict: dict, metadata_config_dict: dict, ctx: WorkflowContext):
        """Alternate constructor: parse the raw config dicts and build the source."""
        config = RedashSourceConfig.parse_obj(config_dict)
        metadata_config = MetadataServerConfig.parse_obj(metadata_config_dict)
        return cls(config, metadata_config, ctx)

    def prepare(self):
        """No preparation is needed for this source."""
        pass

    def next_record(self) -> Iterable[Record]:
        """Yield every chart first, then every dashboard."""
        yield from self.get_redash_charts()
        yield from self.get_redash_dashboard()

    def get_redash_charts(self) -> Iterable[Chart]:
        """Yield one ``Chart`` per visualization of each listed Redash query.

        The chart takes its name and display name from the owning query and
        its type and description from the visualization.
        """
        # The Redash REST API authenticates through this header; without it the
        # per-query request is sent unauthenticated.
        auth_headers = {"Authorization": f"Key {self.config.api_key}"}
        # NOTE(review): queries() is called without paging arguments, so
        # presumably only the first page of results is read - confirm.
        for query_info in self.client.queries()["results"]:
            query_id = query_info["id"]
            query_name = query_info["name"]
            query_data = requests.get(
                f"{self.config.uri}/api/queries/{query_id}",
                headers=auth_headers,
            ).json()
            # The query payload lists its charts under the lowercase key.
            for visualization in query_data.get("visualizations", []):
                yield Chart(
                    id=uuid.uuid4(),
                    name=query_id,
                    displayName=query_name,
                    chartType=visualization.get("type", ""),
                    service=EntityReference(id=self.service.id, type="dashboardService"),
                    # A missing or null description becomes an empty string.
                    description=visualization.get("description") or "",
                )

    def get_redash_dashboard(self) -> Iterable[Dashboard]:
        """Yield one ``Dashboard`` per listed Redash dashboard that has an id.

        The description is the text of the last widget carrying non-empty
        text, or an empty string when no widget has any.
        """
        for dashboard_info in self.client.dashboards()["results"]:
            dashboard_id = dashboard_info["id"]
            if dashboard_id is None:
                continue
            self.status.item_scanned_status()
            dashboard_data = self.client.dashboard(dashboard_id)
            dashboard_url = f"{self.config.uri}/dashboard/{dashboard_data.get('slug', '')}"
            # Reset per dashboard so a widget-less dashboard neither fails on an
            # unbound name nor inherits the previous dashboard's text.
            dashboard_description = ""
            for widget in dashboard_data.get("widgets", []):
                widget_text = widget.get("text")
                if widget_text:
                    dashboard_description = widget_text
            # Fresh list per record so yielded dashboards never share state.
            charts: List[Chart] = []
            yield Dashboard(
                id=uuid.uuid4(),
                name=dashboard_id,
                displayName=dashboard_info["name"],
                description=dashboard_description,
                charts=charts,
                usageSummary=None,
                service=EntityReference(id=self.service.id, type="dashboardService"),
                url=dashboard_url,
            )

    def get_status(self) -> SourceStatus:
        """Return the status object tracking scanned and filtered items."""
        return self.status