62 lines
1.8 KiB
Python
Raw Normal View History

# -*- coding: utf-8 -*-
# Copyright 2023 Ant Group CO., Ltd.
#
# Licensed under the Apache License, Version 2.0 (the "License"); you may not use this file except
# in compliance with the License. You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software distributed under the License
# is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express
# or implied.
2023-12-18 14:30:59 +08:00
from knext.client.model.builder_job import BuilderJob
from knext.api.component import (
CsvSourceReader,
KGSinkWriter,
SPGTypeMapping,
2023-11-21 15:17:02 +08:00
)
2023-10-26 10:34:08 +08:00
from schema.supplychain_schema_helper import SupplyChain
class Product(BuilderJob):
    """Builder job that maps rows of ``Product.csv`` onto ``SupplyChain.Product``.

    The CSV columns ``fullname`` and ``belongToIndustry`` are mapped to the
    ``id`` and ``belongToIndustry`` fields referenced through the
    ``SupplyChain`` schema helper. The ``hasSupplyChain`` column is read from
    the file but is not mapped by this job.
    """

    # NOTE(review): presumably the degree of parallelism the builder framework
    # uses when running this job -- confirm against BuilderJob.
    parallelism = 6

    def build(self):
        """Assemble the reader -> mapping -> writer chain for this job.

        Returns:
            The object produced by chaining the CSV reader, the type mapping
            and the KG sink writer with the ``>>`` operator.
        """
        # NOTE(review): start_row=2 presumably skips a header line -- confirm.
        csv_reader = CsvSourceReader(
            local_path="./builder/job/data/Product.csv",
            columns=["fullname", "belongToIndustry", "hasSupplyChain"],
            start_row=2,
        )

        # Build the mapping one step at a time; each add_field call feeds the next.
        product_mapping = SPGTypeMapping(spg_type_name=SupplyChain.Product)
        product_mapping = product_mapping.add_field(
            "fullname", SupplyChain.Product.id
        )
        product_mapping = product_mapping.add_field(
            "belongToIndustry", SupplyChain.Product.belongToIndustry
        )

        kg_writer = KGSinkWriter()

        return csv_reader >> product_mapping >> kg_writer
class ProductHasSupplyChain(BuilderJob):
    """Builder job that maps the ``hasSupplyChain`` column of ``Product.csv``.

    Rows are mapped onto the type named ``"SupplyChain.Product"``: the
    ``fullname`` column goes to ``id`` and the ``hasSupplyChain`` column goes
    to ``hasSupplyChain``. The ``belongToIndustry`` column is read from the
    file but is not mapped by this job.
    """

    # NOTE(review): presumably the degree of parallelism the builder framework
    # uses when running this job -- confirm against BuilderJob.
    parallelism = 6

    def build(self):
        """Assemble the reader -> mapping -> writer chain for this job.

        Returns:
            The object produced by chaining the CSV reader, the type mapping
            and the KG sink writer with the ``>>`` operator.
        """
        # NOTE(review): start_row=2 presumably skips a header line -- confirm.
        csv_reader = CsvSourceReader(
            local_path="./builder/job/data/Product.csv",
            columns=["fullname", "belongToIndustry", "hasSupplyChain"],
            start_row=2,
        )

        # Type and field names are given as plain strings in this job.
        supply_chain_mapping = SPGTypeMapping(spg_type_name="SupplyChain.Product")
        supply_chain_mapping = supply_chain_mapping.add_field("fullname", "id")
        supply_chain_mapping = supply_chain_mapping.add_field(
            "hasSupplyChain", "hasSupplyChain"
        )

        kg_writer = KGSinkWriter()

        return csv_reader >> supply_chain_mapping >> kg_writer