113 lines
3.3 KiB
Python
Raw Normal View History

2023-10-26 10:34:08 +08:00
# -*- coding: utf-8 -*-
# Copyright 2023 Ant Group CO., Ltd.
2023-10-26 10:34:08 +08:00
#
# Licensed under the Apache License, Version 2.0 (the "License"); you may not use this file except
# in compliance with the License. You may obtain a copy of the License at
2023-10-26 10:34:08 +08:00
#
# http://www.apache.org/licenses/LICENSE-2.0
2023-10-26 10:34:08 +08:00
#
# Unless required by applicable law or agreed to in writing, software distributed under the License
# is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express
# or implied.
2023-10-26 10:34:08 +08:00
2023-12-18 14:30:59 +08:00
from knext.client.model.builder_job import BuilderJob
from knext.api.component import SPGTypeMapping
from knext.api.component import (
2023-12-21 10:52:47 +08:00
CSVReader,
KGWriter,
2023-12-19 11:11:47 +08:00
RelationMapping
2023-11-21 15:17:02 +08:00
)
2023-12-19 11:11:47 +08:00
from knext.examples.riskmining.schema.riskmining_schema_helper import RiskMining
2023-10-26 10:34:08 +08:00
class Person(BuilderJob):
    """Builder job that loads ``Person.csv`` into the RiskMining ``Person`` type."""

    def build(self):
        """Assemble the reader -> mapping -> writer chain for person records.

        Returns:
            The object produced by chaining the CSV reader, the SPG type
            mapping and the KG writer with the ``>>`` operator.
        """
        # NOTE(review): start_row=2 presumably skips a header line in the CSV;
        # confirm against CSVReader's row-numbering convention.
        reader = CSVReader(
            local_path="./builder/job/data/Person.csv",
            columns=["id", "name", "age", "hasPhone"],
            start_row=2,
        )

        # Each CSV column is bound to the schema property of the same name.
        # The mapping is rebound after every call so the result matches the
        # fluent chain regardless of what add_field returns.
        person_mapping = SPGTypeMapping(spg_type_name=RiskMining.Person.__typename__)
        person_mapping = person_mapping.add_field("id", RiskMining.Person.id)
        person_mapping = person_mapping.add_field("name", RiskMining.Person.name)
        person_mapping = person_mapping.add_field("age", RiskMining.Person.age)
        person_mapping = person_mapping.add_field(
            "hasPhone", RiskMining.Person.hasPhone
        )

        writer = KGWriter()

        return reader >> person_mapping >> writer
class PersonFundTrans(BuilderJob):
    """Builder job that loads ``Person -fundTrans-> Person`` relations from CSV."""

    def build(self):
        """Assemble the reader -> mapping -> writer chain for fundTrans edges.

        Returns:
            The object produced by chaining the CSV reader, the relation
            mapping and the KG writer with the ``>>`` operator.
        """
        # NOTE(review): start_row=2 presumably skips a header line in the CSV;
        # confirm against CSVReader's row-numbering convention.
        reader = CSVReader(
            local_path="./builder/job/data/Person_fundTrans_Person.csv",
            columns=["src", "dst", "transDate", "transAmt"],
            start_row=2,
        )

        relation = RelationMapping(
            subject_name=RiskMining.Person.__typename__,
            predicate_name="fundTrans",
            object_name=RiskMining.Person.__typename__,
        )
        # (CSV column, target field) pairs, applied in declaration order.
        field_pairs = (
            ("src", "srcId"),
            ("dst", "dstId"),
            ("transDate", "transDate"),
            ("transAmt", "transAmt"),
        )
        for csv_column, target_field in field_pairs:
            relation = relation.add_field(csv_column, target_field)

        writer = KGWriter()

        return reader >> relation >> writer
class PersonHasDevice(BuilderJob):
    """Builder job that loads ``Person -hasDevice-> Device`` relations from CSV."""

    def build(self):
        """Assemble the reader -> mapping -> writer chain for hasDevice edges.

        Returns:
            The object produced by chaining the CSV reader, the relation
            mapping and the KG writer with the ``>>`` operator.
        """
        # NOTE(review): start_row=2 presumably skips a header line in the CSV;
        # confirm against CSVReader's row-numbering convention.
        reader = CSVReader(
            local_path="./builder/job/data/Person_hasDevice_Device.csv",
            columns=["src", "dst"],
            start_row=2,
        )

        relation = RelationMapping(
            subject_name=RiskMining.Person.__typename__,
            predicate_name="hasDevice",
            object_name=RiskMining.Device.__typename__,
        )
        # (CSV column, target field) pairs, applied in declaration order.
        for csv_column, target_field in (("src", "srcId"), ("dst", "dstId")):
            relation = relation.add_field(csv_column, target_field)

        writer = KGWriter()

        return reader >> relation >> writer
class PersonHoldShare(BuilderJob):
    """Builder job that loads ``Person -holdShare-> Company`` relations from CSV."""

    def build(self):
        """Assemble the reader -> mapping -> writer chain for holdShare edges.

        Returns:
            The object produced by chaining the CSV reader, the relation
            mapping and the KG writer with the ``>>`` operator.
        """
        # NOTE(review): start_row=2 presumably skips a header line in the CSV;
        # confirm against CSVReader's row-numbering convention.
        reader = CSVReader(
            local_path="./builder/job/data/Person_holdShare_Company.csv",
            columns=["src", "dst"],
            start_row=2,
        )

        relation = RelationMapping(
            subject_name=RiskMining.Person.__typename__,
            predicate_name="holdShare",
            object_name=RiskMining.Company.__typename__,
        )
        # (CSV column, target field) pairs, applied in declaration order.
        for csv_column, target_field in (("src", "srcId"), ("dst", "dstId")):
            relation = relation.add_field(csv_column, target_field)

        writer = KGWriter()

        return reader >> relation >> writer