Schoolmeister
03/08/2022, 1:26 PM
`train_data` and `validation_data` outputs to create the subsequent pipelines with?
python
# Pipeline with a single node that runs nodes.cv_split on "data" using the
# "fold_config" parameters.
cv_split_pipe = Pipeline(
    [
        node(
            func=nodes.cv_split,
            inputs=["data", "params:fold_config"],
            # train_data and validation_data are lists, one index per fold
            outputs=["train_data", "validation_data"],
        )
    ]
)

# get the train_data and validation_data outputs somehow
# NOTE(review): these are empty placeholders. The node outputs above only
# exist at run time, while the loop below runs at pipeline-construction time;
# presumably these lists must hold per-fold dataset *names* -- confirm.
train_data = []
validation_data = []

# build modular pipeline: one namespaced copy of the inference pipeline per
# (train, validation) pair, each writing its prediction to "y_pred_<index>".
# enumerate() yields (index, (train, validation)), so the zipped pair has to
# be unpacked with nested parentheses; a flat three-name target raises
# ValueError on the first iteration.
pipelines = [
    pipeline(
        pipe=new_inference_pipeline(),
        inputs=[train_set, validation_set],
        outputs={"y_pred": f"y_pred_{i}"},
    )
    for i, (train_set, validation_set) in enumerate(
        zip(train_data, validation_data)
    )
]

# Start the sum from an empty Pipeline so the result is still a Pipeline
# (rather than the integer 0) when there are no folds.
final_pipeline = sum(pipelines, Pipeline([]))