2023-12-21 10:52:47 +08:00

62 lines
1.8 KiB
Python

# -*- coding: utf-8 -*-
# Copyright 2023 Ant Group CO., Ltd.
#
# Licensed under the Apache License, Version 2.0 (the "License"); you may not use this file except
# in compliance with the License. You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software distributed under the License
# is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express
# or implied.
from knext.client.model.builder_job import BuilderJob
from knext.api.component import (
CSVReader,
KGWriter,
SPGTypeMapping,
)
from schema.supplychain_schema_helper import SupplyChain
class Product(BuilderJob):
    """Builder job that loads ``Product.csv`` into the ``SupplyChain.Product`` type.

    The CSV column ``fullname`` is mapped to the type's ``id`` and
    ``belongToIndustry`` is mapped to the property of the same name. The
    ``hasSupplyChain`` column is declared for the reader but is not mapped
    by this job.
    """

    # Read by the job framework; presumably the worker parallelism for this
    # job -- confirm against BuilderJob.
    parallelism = 6

    def build(self):
        """Assemble and return the ``reader >> mapping >> writer`` chain."""
        csv_columns = ["fullname", "belongToIndustry", "hasSupplyChain"]
        reader = CSVReader(
            local_path="./builder/job/data/Product.csv",
            columns=csv_columns,
            # Presumably skips a header row -- confirm against CSVReader.
            start_row=2,
        )

        # Build the field mapping step by step instead of one chained expression.
        product_type = SupplyChain.Product
        type_mapping = SPGTypeMapping(spg_type_name=product_type)
        type_mapping = type_mapping.add_field("fullname", product_type.id)
        type_mapping = type_mapping.add_field(
            "belongToIndustry", product_type.belongToIndustry
        )

        writer = KGWriter()
        return reader >> type_mapping >> writer
class ProductHasSupplyChain(BuilderJob):
    """Builder job that loads the ``hasSupplyChain`` field from ``Product.csv``.

    Reads the same CSV file and columns as the product job, but maps
    ``fullname`` to ``id`` and ``hasSupplyChain`` to ``hasSupplyChain`` on the
    ``"SupplyChain.Product"`` type, referring to the type and its fields by
    plain string names.
    """

    # Read by the job framework; presumably the worker parallelism for this
    # job -- confirm against BuilderJob.
    parallelism = 6

    def build(self):
        """Assemble and return the ``reader >> mapping >> writer`` chain."""
        reader_options = {
            "local_path": "./builder/job/data/Product.csv",
            "columns": ["fullname", "belongToIndustry", "hasSupplyChain"],
            # Presumably skips a header row -- confirm against CSVReader.
            "start_row": 2,
        }
        reader = CSVReader(**reader_options)

        # Only the identifier and the hasSupplyChain column are mapped here.
        link_mapping = SPGTypeMapping(spg_type_name="SupplyChain.Product")
        link_mapping = link_mapping.add_field("fullname", "id")
        link_mapping = link_mapping.add_field("hasSupplyChain", "hasSupplyChain")

        writer = KGWriter()
        return reader >> link_mapping >> writer