mirror of
https://github.com/microsoft/graphrag.git
synced 2025-07-16 13:30:58 +00:00

Correct links to verbs in comments Updated the links in comments to reflect new paths for 'derive' and 'aggregate' verbs. This improves documentation and ensures that references are up to date for future developers. Co-authored-by: Alonso Guevara <alonsog@microsoft.com>
23 lines
1.1 KiB
YAML
23 lines
1.1 KiB
YAML
# Two interdependent workflows: derive_workflow creates a new column from the
# input dataset, and aggregate_workflow consumes that workflow's output.
workflows:
  # Groups rows by "type" and sums the column produced by derive_workflow.
  - name: aggregate_workflow
    steps:
      # Verb implementation:
      # https://github.com/microsoft/datashaper/blob/main/python/datashaper/datashaper/verbs/aggregate.py
      - verb: "aggregate"
        args:
          groupby: "type"
          column: "col_multiplied"  # the column written by derive_workflow
          to: "aggregated_output"
          operation: "sum"
        input:
          # Reference derive_workflow, because this workflow requires that
          # one to run first.
          source: "workflow:derive_workflow"
          # Notice that the workflows are declared out of order; the indexing
          # engine will figure out the right order to run them in.

  # Multiplies two columns of the dataset into a new column.
  - name: derive_workflow
    steps:
      # Verb implementation:
      # https://github.com/microsoft/datashaper/blob/main/python/datashaper/datashaper/verbs/derive.py
      - verb: "derive"
        args:
          column1: "col1"  # column from the input dataset
          column2: "col2"  # column from the input dataset
          to: "col_multiplied"  # new column name
          operator: "*"  # multiply the two columns
        # Since this step acts on the dataset itself, there is no need to
        # explicitly specify an input. The dataset is the default input, so
        # the following can be omitted:
        # input:
        #   source: "source"