mirror of
https://github.com/open-metadata/OpenMetadata.git
synced 2025-07-13 03:59:45 +00:00

* Add multiple owners * Multi Ownership * Issue #17012: Multi User/Team Ownership * Issue #17012: Multi User/Team Ownership * Issue #17012: Multi User/Team Ownership - Fix Tests - Part 1 * Issue #17012: Multi User/Team Ownership - Fix Tests - Part 2 * Issue #17012: Multi User/Team Ownership - Fix Tests - Part 3 * Issue #17012: Multi User/Team Ownership - Fix Tests - Part 4 * Issue #17012: Multi User/Team Ownership - Fix Tests - Part 5 * Issue #17012: Multi User/Team Ownership - Fix Tests - Part 6 * Issue #17012: Multi User/Team Ownership - Fix Tests - Part 7 * Issue #17012: Multi User/Team Ownership - Fix Tests - Part 8 * Add Migrations for Owner Thread * update ingestion for multi owner * fix pytests * fixed checkstyle * Add Alert Name to Publishers (#17108) * Add Alert Name to Publishers * Fix Test * Add Bound to Setuptools (#17105) * Minor: fixed testSummaryGraph issue (#17115) * feat: updated multi pipeline ui as per new mock (#17106) * feat: updated multi pipeline ui as per new mock * translation sync * fixed failing unit test * fixed playwright test * fixed viewService click issue * sorted pipeline based on test case length * Added domo federated dataset support (#17061) * fix usernames (#17122) * Doc: Updated Doris & Redshift Docs (#17123) Co-authored-by: Prajwal Pandit <prajwalpandit@Prajwals-MacBook-Air.local> * Fix #12677: Added Synapse Connector - docs and side docs (#17041) * Fix #17098: Fixed case sensitive partition column name in Bigquery (#17104) * Fixed case sensitive partiion col name bigquery * update test * #13876: change placement of comment and close button in task approval workflow (#17044) * change placment of comment and close button in task approval workflow * minor change * playwright test for the close and comment function * supported ref in activityFeedEditor * fix playwright test * added playwright test for data steward * fix the test for the data streward user * fix the close button not showing if task has no suggestions and icon 
fixes * fix sonar issue * change glossary and add suggestion button to dropdown button * fix the glossary failure due to button change * icon change for add tag and description * fix glossary cypress failure due to button chnages * changes as per comments * MINOR: docs links fix (#17125) * alation link fix * dbt yaml config source link fix * bigquery doc fix * Explore tree feedbacks (#17078) * fix explore design * update switcher icon * show menu when search query exists * fix selection of active service * fix type error * fix tests * fix tests * fix tests * MINOR: Databricks view TableType fix (#17124) * Minor: fixed AUT test (#17128) * Fix #16692: Override Lineage Support for View & Dashboard Lineage (#17064) * #17065: fix the tags not rendering in selector after selection in edit tags task (#17107) * fix the tags not rendering in selector after selection in edit tags taks * added playwright test * minor changes * minor fix * fix the tags not updating in edit and accept tag * fix explore type changes for collate (#17131) * MINOR: changed log level to debug (#17126) * changed log level to debug * fixed type * changed type to optional * Get feed and count data of soft deleted user (#17135) * Doc: Adding OIDC Docs (#17139) Co-authored-by: Prajwal Pandit <prajwalpandit@Prajwals-MacBook-Air.local> * Doc: Updating Profiler Workflow Docs URL (#17140) Co-authored-by: Prajwal Pandit <prajwalpandit@Prajwals-MacBook-Air.local> * fix playwright and cypress (#17138) * Minor: fixed edit modal issue for sql test case (#17132) * Minor: fixed edit modal issue for sql test case * fixed test * Minor: Added whats new content for 1.4.6 release (#17148) * MINOR [GEN-799]: add option to disable manual trigger using scheduleType (#17031) * fix: raise for triggering system app * added scheduleType ScheduledOrManual * minor: remove "service" field from required properties in createAPIEndpoint schema (#17147) * initial commit multi ownership * update glossary and other entities * update 
owners * fix version pages * fix tests * Update entity_extension to move owner to array (#17200) * fix tests * fix api page errors * fix owner label design * locales * fix owners in elastic search source * fix types * fix tests * fix tests * Updated CustomMetric owner to entityReferenceList. (#17211) * Fix owners field in search mappings * fix search aggregates * fix inherited label * Issue #17012: Multi User/Team Ownership - Fix Tests - Part 9 * Fix QUeries * Fix Mysql Queries * Typo * fix tests * fix tests * fix tests * fix advanced search constants * fix service ingestion tests * fix tests --------- Co-authored-by: mohitdeuex <mohit.y@deuexsolutions.com> Co-authored-by: Onkar Ravgan <onkar.10r@gmail.com> Co-authored-by: Mohit Yadav <105265192+mohityadav766@users.noreply.github.com> Co-authored-by: Ayush Shah <ayush@getcollate.io> Co-authored-by: Shailesh Parmar <shailesh.parmar.webdev@gmail.com> Co-authored-by: k.nakagaki <141020064+nakaken-churadata@users.noreply.github.com> Co-authored-by: Prajwal214 <167504578+Prajwal214@users.noreply.github.com> Co-authored-by: Prajwal Pandit <prajwalpandit@Prajwals-MacBook-Air.local> Co-authored-by: Suman Maharana <sumanmaharana786@gmail.com> Co-authored-by: Ashish Gupta <ashish@getcollate.io> Co-authored-by: harshsoni2024 <64592571+harshsoni2024@users.noreply.github.com> Co-authored-by: Karan Hotchandani <33024356+karanh37@users.noreply.github.com> Co-authored-by: Mayur Singal <39544459+ulixius9@users.noreply.github.com> Co-authored-by: Imri Paran <imri.paran@gmail.com> Co-authored-by: sonika-shah <58761340+sonika-shah@users.noreply.github.com> Co-authored-by: Sachin Chaurasiya <sachinchaurasiyachotey87@gmail.com> Co-authored-by: karanh37 <karanh37@gmail.com> Co-authored-by: Siddhant <86899184+Siddhanttimeline@users.noreply.github.com>
447 lines
15 KiB
Python
447 lines
15 KiB
Python
# Copyright 2021 Collate
|
|
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
# you may not use this file except in compliance with the License.
|
|
# You may obtain a copy of the License at
|
|
# http://www.apache.org/licenses/LICENSE-2.0
|
|
# Unless required by applicable law or agreed to in writing, software
|
|
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
# See the License for the specific language governing permissions and
|
|
# limitations under the License.
|
|
|
|
"""
|
|
OpenMetadata high-level API Model test
|
|
"""
|
|
import uuid
|
|
from unittest import TestCase
|
|
|
|
from metadata.generated.schema.api.data.createDatabase import CreateDatabaseRequest
|
|
from metadata.generated.schema.api.data.createDatabaseSchema import (
|
|
CreateDatabaseSchemaRequest,
|
|
)
|
|
from metadata.generated.schema.api.data.createMlModel import CreateMlModelRequest
|
|
from metadata.generated.schema.api.data.createTable import CreateTableRequest
|
|
from metadata.generated.schema.api.services.createDatabaseService import (
|
|
CreateDatabaseServiceRequest,
|
|
)
|
|
from metadata.generated.schema.api.services.createMlModelService import (
|
|
CreateMlModelServiceRequest,
|
|
)
|
|
from metadata.generated.schema.api.teams.createUser import CreateUserRequest
|
|
from metadata.generated.schema.entity.data.mlmodel import (
|
|
FeatureSource,
|
|
FeatureSourceDataType,
|
|
FeatureType,
|
|
MlFeature,
|
|
MlHyperParameter,
|
|
MlModel,
|
|
)
|
|
from metadata.generated.schema.entity.data.table import Column, DataType, Table
|
|
from metadata.generated.schema.entity.services.connections.database.common.basicAuth import (
|
|
BasicAuth,
|
|
)
|
|
from metadata.generated.schema.entity.services.connections.database.mysqlConnection import (
|
|
MysqlConnection,
|
|
)
|
|
from metadata.generated.schema.entity.services.connections.metadata.openMetadataConnection import (
|
|
OpenMetadataConnection,
|
|
)
|
|
from metadata.generated.schema.entity.services.connections.mlmodel.mlflowConnection import (
|
|
MlflowConnection,
|
|
)
|
|
from metadata.generated.schema.entity.services.databaseService import (
|
|
DatabaseConnection,
|
|
DatabaseService,
|
|
DatabaseServiceType,
|
|
)
|
|
from metadata.generated.schema.entity.services.mlmodelService import (
|
|
MlModelConnection,
|
|
MlModelService,
|
|
MlModelServiceType,
|
|
)
|
|
from metadata.generated.schema.security.client.openMetadataJWTClientConfig import (
|
|
OpenMetadataJWTClientConfig,
|
|
)
|
|
from metadata.generated.schema.type.entityLineage import EntitiesEdge
|
|
from metadata.generated.schema.type.entityReference import EntityReference
|
|
from metadata.generated.schema.type.entityReferenceList import EntityReferenceList
|
|
from metadata.ingestion.ometa.ometa_api import OpenMetadata
|
|
|
|
|
|
class OMetaModelTest(TestCase):
    """
    Integration tests for MlModel entities through the high-level OpenMetadata API.

    Run this integration test with the local API available.
    Install the ingestion package before running the tests.

    NOTE: the class body itself talks to the server (health check and user
    creation), so merely importing/collecting this module requires the API
    at ``http://localhost:8585/api`` to be reachable.
    """

    # Names shared by the fixtures below, so the service, the model and the
    # expected fully qualified name cannot drift apart.
    SERVICE_NAME = "test-model-service"
    MODEL_NAME = "test-model"

    server_config = OpenMetadataConnection(
        hostPort="http://localhost:8585/api",
        authProvider="openmetadata",
        securityConfig=OpenMetadataJWTClientConfig(
            # The JWT payload names the `admin` user. Presumably this is the
            # default local-development token -- TODO confirm; never reuse it
            # against a real deployment.
            jwtToken="eyJraWQiOiJHYjM4OWEtOWY3Ni1nZGpzLWE5MmotMDI0MmJrOTQzNTYiLCJ0eXAiOiJKV1QiLCJhbGciOiJSUzI1NiJ9.eyJzdWIiOiJhZG1pbiIsImlzQm90IjpmYWxzZSwiaXNzIjoib3Blbi1tZXRhZGF0YS5vcmciLCJpYXQiOjE2NjM5Mzg0NjIsImVtYWlsIjoiYWRtaW5Ab3Blbm1ldGFkYXRhLm9yZyJ9.tS8um_5DKu7HgzGBzS1VTA5uUjKWOCU0B_j08WXBiEC0mr0zNREkqVfwFDD-d24HlNEbrqioLsBuFRiwIWKc1m_ZlVQbG7P36RUxhuv2vbSp80FKyNM-Tj93FDzq91jsyNmsQhyNv_fNr3TXfzzSPjHt8Go0FMMP66weoKMgW2PbXlhVKwEuXUHyakLLzewm9UMeQaEiRzhiTMU3UkLXcKbYEJJvfNFcLwSl9W8JCO_l0Yj3ud-qt_nQYEZwqW6u5nfdQllN133iikV4fM5QZsMCnm8Rq1mvLR0y9bmJiD7fwM1tmJ791TUWqmKaTnP49U493VanKpUAfzIiOiIbhg"
        ),
    )
    metadata = OpenMetadata(server_config)

    # Executed while the class body is evaluated: abort before any test runs
    # if the health check does not pass.
    assert metadata.health_check()

    # User that the update test assigns as owner of the model.
    user = metadata.create_or_update(
        data=CreateUserRequest(name="random-user", email="random@user.com"),
    )
    owners = EntityReferenceList(root=[EntityReference(id=user.id, type="user")])

    # Request describing the MlModel service that hosts every model created here.
    service = CreateMlModelServiceRequest(
        name=SERVICE_NAME,
        serviceType=MlModelServiceType.Mlflow,
        connection=MlModelConnection(
            config=MlflowConnection(
                trackingUri="http://localhost:1234",
                registryUri="http://localhost:4321",
            )
        ),
    )

    @classmethod
    def setUpClass(cls) -> None:
        """
        Prepare ingredients: create the service and build the shared fixtures.

        Sets ``cls.service_entity`` (the created service), ``cls.create`` (the
        request reused by the tests) and ``cls.entity`` (a local MlModel holding
        the expected name, algorithm and fully qualified name).
        """
        cls.service_entity = cls.metadata.create_or_update(data=cls.service)
        cls.service_reference = EntityReference(
            id=cls.service_entity.id,
            # Use the name of the service that was actually created.
            name=cls.SERVICE_NAME,
            type="mlmodelService",
        )

        cls.create = CreateMlModelRequest(
            name=cls.MODEL_NAME,
            algorithm="algo",
            service=cls.service_entity.fullyQualifiedName,
        )

        # Never sent to the server: only used as the expected values in assertions.
        cls.entity = MlModel(
            id=uuid.uuid4(),
            name=cls.MODEL_NAME,
            algorithm="algo",
            fullyQualifiedName=f"{cls.SERVICE_NAME}.{cls.MODEL_NAME}",
            service=cls.service_reference,
        )

    @classmethod
    def tearDownClass(cls) -> None:
        """
        Clean up: hard-delete the MlModel service and, recursively, its models.
        """
        service_id = str(
            cls.metadata.get_by_name(
                entity=MlModelService, fqn=cls.SERVICE_NAME
            ).id.root
        )

        cls.metadata.delete(
            entity=MlModelService,
            entity_id=service_id,
            recursive=True,
            hard_delete=True,
        )

    def test_create(self):
        """
        We can create a Model and we receive it back as Entity
        """
        res = self.metadata.create_or_update(data=self.create)

        self.assertEqual(res.name, self.entity.name)
        self.assertEqual(res.algorithm, self.entity.algorithm)
        self.assertIsNone(res.owners)

    def test_update(self):
        """
        Updating it properly changes its properties
        """
        res_create = self.metadata.create_or_update(data=self.create)

        # Re-send the same request with the owners added.
        updated = self.create.model_dump(exclude_unset=True)
        updated["owners"] = self.owners
        updated_entity = CreateMlModelRequest(**updated)

        res = self.metadata.create_or_update(data=updated_entity)

        # Same entity (same ID, same algorithm); only the owners have changed
        self.assertEqual(res.algorithm, updated_entity.algorithm)
        self.assertEqual(res_create.id, res.id)
        self.assertEqual(res.owners.root[0].id, self.user.id)

        # Getting without owner field does not return it by default
        res_none = self.metadata.get_by_name(
            entity=MlModel, fqn=self.entity.fullyQualifiedName
        )
        self.assertIsNone(res_none.owners)

        # We can request specific fields to be added
        res_owner = self.metadata.get_by_name(
            entity=MlModel,
            fqn=self.entity.fullyQualifiedName,
            fields=["owners", "followers"],
        )
        self.assertEqual(res_owner.owners.root[0].id, self.user.id)

    def test_get_name(self):
        """
        We can fetch a model by name and get it back as Entity
        """
        self.metadata.create_or_update(data=self.create)

        res = self.metadata.get_by_name(
            entity=MlModel, fqn=self.entity.fullyQualifiedName
        )
        self.assertEqual(res.name, self.entity.name)

    def test_get_id(self):
        """
        We can fetch a model by ID and get it back as Entity
        """
        self.metadata.create_or_update(data=self.create)

        # First pick up by name
        res_name = self.metadata.get_by_name(
            entity=MlModel, fqn=self.entity.fullyQualifiedName
        )
        # Then fetch by ID
        res = self.metadata.get_by_id(entity=MlModel, entity_id=res_name.id)

        self.assertEqual(res_name.id, res.id)

    def test_list(self):
        """
        We can list all our models
        """
        self.metadata.create_or_update(data=self.create)

        res = self.metadata.list_entities(entity=MlModel)

        # Fetch our test model. We have already inserted it, so we should find it
        data = next(
            (ent for ent in res.entities if ent.name == self.entity.name), None
        )
        self.assertIsNotNone(data)

    def test_delete(self):
        """
        We can delete a model by ID
        """
        self.metadata.create_or_update(data=self.create)

        # Find by name
        res_name = self.metadata.get_by_name(
            entity=MlModel, fqn=self.entity.fullyQualifiedName
        )
        # Then fetch by ID
        res_id = self.metadata.get_by_id(
            entity=MlModel, entity_id=str(res_name.id.root)
        )

        # Delete
        self.metadata.delete(entity=MlModel, entity_id=str(res_id.id.root))

        # Then we should not find it
        res = self.metadata.list_entities(entity=MlModel)

        leftover = next(
            (
                ent
                for ent in res.entities
                if ent.fullyQualifiedName == self.entity.fullyQualifiedName
            ),
            None,
        )
        self.assertIsNone(leftover)

    def test_mlmodel_properties(self):
        """
        Check that we can create models with MLFeatures and MLHyperParams

        We can add lineage information
        """
        service = CreateDatabaseServiceRequest(
            name="test-service-table-ml",
            serviceType=DatabaseServiceType.Mysql,
            connection=DatabaseConnection(
                config=MysqlConnection(
                    username="username",
                    authType=BasicAuth(
                        password="password",
                    ),
                    hostPort="http://localhost:1234",
                )
            ),
        )
        service_entity = self.metadata.create_or_update(data=service)

        # Register the teardown immediately so the database service (and its
        # database, schema and tables) is removed even if an assertion fails.
        self.addCleanup(
            self.metadata.delete,
            entity=DatabaseService,
            entity_id=service_entity.id,
            recursive=True,
            hard_delete=True,
        )

        create_db = CreateDatabaseRequest(
            name="test-db-ml",
            service=service_entity.fullyQualifiedName,
        )
        create_db_entity = self.metadata.create_or_update(data=create_db)

        create_schema = CreateDatabaseSchemaRequest(
            name="test-schema-ml",
            database=create_db_entity.fullyQualifiedName,
        )
        create_schema_entity = self.metadata.create_or_update(data=create_schema)

        # Two source tables referenced by the model's feature sources.
        create_table1 = CreateTableRequest(
            name="test-ml",
            databaseSchema=create_schema_entity.fullyQualifiedName,
            columns=[Column(name="education", dataType=DataType.STRING)],
        )
        table1_entity = self.metadata.create_or_update(data=create_table1)

        create_table2 = CreateTableRequest(
            name="another_test-ml",
            databaseSchema=create_schema_entity.fullyQualifiedName,
            columns=[Column(name="age", dataType=DataType.INT)],
        )
        table2_entity = self.metadata.create_or_update(data=create_table2)

        model = CreateMlModelRequest(
            name="test-model-lineage",
            algorithm="algo",
            mlFeatures=[
                MlFeature(
                    name="age",
                    dataType=FeatureType.numerical,
                    featureSources=[
                        FeatureSource(
                            name="age",
                            dataType=FeatureSourceDataType.integer,
                            dataSource=self.metadata.get_entity_reference(
                                entity=Table, fqn=table2_entity.fullyQualifiedName
                            ),
                        )
                    ],
                ),
                MlFeature(
                    name="persona",
                    dataType=FeatureType.categorical,
                    featureSources=[
                        FeatureSource(
                            name="age",
                            dataType=FeatureSourceDataType.integer,
                            dataSource=self.metadata.get_entity_reference(
                                entity=Table, fqn=table2_entity.fullyQualifiedName
                            ),
                        ),
                        FeatureSource(
                            name="education",
                            dataType=FeatureSourceDataType.string,
                            dataSource=self.metadata.get_entity_reference(
                                entity=Table, fqn=table1_entity.fullyQualifiedName
                            ),
                        ),
                        # This source has no dataSource.
                        FeatureSource(
                            name="city", dataType=FeatureSourceDataType.string
                        ),
                    ],
                    featureAlgorithm="PCA",
                ),
            ],
            mlHyperParameters=[
                MlHyperParameter(name="regularisation", value="0.5"),
                MlHyperParameter(name="random", value="hello"),
            ],
            target="myTarget",
            service=self.service_entity.fullyQualifiedName,
        )

        res: MlModel = self.metadata.create_or_update(data=model)

        self.assertIsNotNone(res.mlFeatures)
        self.assertIsNotNone(res.mlHyperParameters)

        expected_nodes = {str(table1_entity.id.root), str(table2_entity.id.root)}

        # Lineage will be created just by ingesting the model.
        # Alternatively, we could manually send lineage via `add_mlmodel_lineage`
        # E.g., lineage = self.metadata.add_mlmodel_lineage(model=res)
        lineage = self.metadata.get_lineage_by_id(
            entity=MlModel, entity_id=str(res.id.root)
        )

        nodes = {node["id"] for node in lineage["nodes"]}
        self.assertEqual(nodes, expected_nodes)

        # If we delete the lineage, the `add_mlmodel_lineage` will take care of it too
        for edge in lineage.get("upstreamEdges") or []:
            self.metadata.delete_lineage_edge(
                edge=EntitiesEdge(
                    fromEntity=EntityReference(id=edge["fromEntity"], type="table"),
                    toEntity=EntityReference(id=edge["toEntity"], type="mlmodel"),
                )
            )

        self.metadata.add_mlmodel_lineage(model=res)

        lineage = self.metadata.get_lineage_by_id(
            entity=MlModel, entity_id=str(res.id.root)
        )

        nodes = {node["id"] for node in lineage["nodes"]}
        self.assertEqual(nodes, expected_nodes)

    def test_list_versions(self):
        """
        test list MLmodel entity versions
        """
        self.metadata.create_or_update(data=self.create)

        # Find by name
        res_name = self.metadata.get_by_name(
            entity=MlModel, fqn=self.entity.fullyQualifiedName
        )

        res = self.metadata.get_list_entity_versions(
            entity=MlModel, entity_id=res_name.id.root
        )
        self.assertTrue(res)

    def test_get_entity_version(self):
        """
        test get MLModel entity version
        """
        self.metadata.create_or_update(data=self.create)

        # Find by name
        res_name = self.metadata.get_by_name(
            entity=MlModel, fqn=self.entity.fullyQualifiedName
        )
        res = self.metadata.get_entity_version(
            entity=MlModel, entity_id=res_name.id.root, version=0.1
        )

        # check we get the correct version requested and the correct entity ID
        self.assertEqual(res.version.root, 0.1)
        self.assertEqual(res.id, res_name.id)

    def test_get_entity_ref(self):
        """
        test get EntityReference
        """
        res = self.metadata.create_or_update(data=self.create)
        entity_ref = self.metadata.get_entity_reference(
            entity=MlModel, fqn=res.fullyQualifiedName
        )

        self.assertEqual(res.id, entity_ref.id)
|