| workflows: | |
| - name: aggregate_workflow | |
| steps: | |
| - verb: "aggregate" # https://github.com/microsoft/datashaper/blob/main/python/datashaper/datashaper/engine/verbs/aggregate.py | |
| args: | |
| groupby: "type" | |
| column: "col_multiplied" | |
| to: "aggregated_output" | |
| operation: "sum" | |
| input: | |
| source: "workflow:derive_workflow" # reference the derive_workflow, cause this one requires that one to run first | |
| # Notice, these are out of order, the indexing engine will figure out the right order to run them in | |
| - name: derive_workflow | |
| steps: | |
| - verb: "derive" # https://github.com/microsoft/datashaper/blob/main/python/datashaper/datashaper/engine/verbs/derive.py | |
| args: | |
| column1: "col1" # from above | |
| column2: "col2" # from above | |
| to: "col_multiplied" # new column name | |
| operator: "*" # multiply the two columns, | |
| # Since we're trying to act on the dataset, we don't need explicitly to specify an input | |
| # "input": { "source": "source" } # use the dataset as the input to this verb. This is the default, so you can omit it. |