Source code for WORC.WORC

#!/usr/bin/env python

# Copyright 2016-2023 Biomedical Imaging Group Rotterdam, Departments of
# Medical Informatics and Radiology, Erasmus MC, Rotterdam, The Netherlands
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

import os
import yaml
import fastr
import graphviz
import configparser
from pathlib import Path
from random import randint
import WORC.IOparser.file_io as io
from fastr.api import ResourceLimit
from WORC.tools.Slicer import Slicer
from WORC.tools.Elastix import Elastix
from WORC.tools.Evaluate import Evaluate
import WORC.addexceptions as WORCexceptions
import WORC.IOparser.config_WORC as config_io
from WORC.detectors.detectors import DebugDetector
from WORC.export.hyper_params_exporter import export_hyper_params_to_latex
from urllib.parse import urlparse
from urllib.request import url2pathname
from WORC.tools.fingerprinting import quantitative_modalities, qualitative_modalities, all_modalities


[docs]class WORC(object):
    """Workflow for Optimal Radiomics Classification.

    A Workflow for Optimal Radiomics Classification (WORC) object that
    serves as a pipeline spawner and manager for optimizating radiomics
    studies. Depending on the attributes set, the object will spawn an
    appropriate pipeline and manage it.

    Note that many attributes are lists and can therefore contain multiple
    instances. For example, when providing two sequences per patient,
    the "images" list contains two items. The type of items in the lists
    is described below.

    All objects that serve as source for your network, i.e. refer to
    actual files to be used, should be formatted as fastr sources suited for
    one of the fastr plugings, see also
    http://fastr.readthedocs.io/en/stable/fastr.reference.html#ioplugin-reference
    The objects should be lists of these fastr sources or dictionaries with the
    sample ID's, e.g.

    images_train = [{'Patient001': vfs://input/CT001.nii.gz,
                     'Patient002': vfs://input/CT002.nii.gz},
                    {'Patient001': vfs://input/MR001.nii.gz,
                     'Patient002': vfs://input/MR002.nii.gz}]

    Attributes
    ------------------
        name: String, default 'WORC'
            name of the network.

        configs: list, required
            Configuration parameters, either ConfigParser objects
            created through the defaultconfig function or paths of config .ini
            files. (list, required)

        labels: list, required
            Paths to files containing patient labels (.txt files).

        network: automatically generated
            The FASTR network generated through the "build" function.

        images: list, optional
            Paths refering to the images used for Radiomics computation. Images
            should be of the ITK Image type.

        segmentations: list, optional
            Paths refering to the segmentations used for Radiomics computation.
            Segmentations should be of the ITK Image type.

        semantics: semantic features per image type (list, optional)

        masks: state which pixels of images are valid (list, optional)

        features: input Radiomics features for classification (list, optional)

        metadata: DICOM headers belonging to images (list, optional)

        Elastix_Para: parameter files for Elastix (list, optional)

        fastr_plugin: plugin to use for FASTR execution

        fastr_tempdir: temporary directory to use for FASTR execution

        additions: additional inputs for your network (dict, optional)

        source_data: data to use as sources for FASTR (dict)

        sink_data: data to use as sinks for FASTR (dict)

        CopyMetadata: Boolean, default True
            when using elastix, copy metadata from image to segmentation or not

    """

[docs]    def __init__(self, name='test'):
        """Initialize WORC object.

        Set the initial variables all to None, except for some defaults.

        Arguments:
            name: name of the nework (string, optional)

        """
        self.name = 'WORC_' + name

        # Initialize several objects
        self.configs = list()
        self.fastrconfigs = list()

        self.images_train = list()
        self.segmentations_train = list()
        self.semantics_train = list()
        self.labels_train = list()
        self.masks_train = list()
        self.masks_normalize_train = list()
        self.features_train = list()
        self.metadata_train = list()

        self.images_test = list()
        self.segmentations_test = list()
        self.semantics_test = list()
        self.labels_test = list()
        self.masks_test = list()
        self.masks_normalize_test = list()
        self.features_test = list()
        self.metadata_test = list()
        
        self.trained_model = None

        self.Elastix_Para = list()
        self.label_names = 'Label1, Label2'

        self.fixedsplits = list()

        # Set some defaults, name
        self.fastr_plugin = 'LinearExecution'
        if name == '':
            name = [randint(0, 9) for p in range(0, 5)]
        self.fastr_tmpdir = os.path.join(fastr.config.mounts['tmp'], self.name)

        self.additions = dict()
        self.CopyMetadata = True
        self.segmode = []
        self._add_evaluation = False
        self.TrainTest = False
        self.OnlyTest = False

        # Memory settings for all fastr nodes
        self.fastr_memory_parameters = dict()
        self.fastr_memory_parameters['FeatureCalculator'] = '14G'
        self.fastr_memory_parameters['Classification'] = '6G'
        self.fastr_memory_parameters['WORCCastConvert'] = '4G'
        self.fastr_memory_parameters['Preprocessing'] = '4G'
        self.fastr_memory_parameters['Elastix'] = '4G'
        self.fastr_memory_parameters['Transformix'] = '4G'
        self.fastr_memory_parameters['Segmentix'] = '6G'
        self.fastr_memory_parameters['ComBat'] = '12G'
        self.fastr_memory_parameters['PlotEstimator'] = '12G'
        self.fastr_memory_parameters['Fingerprinter'] = '12G'

        if DebugDetector().do_detection():
            print(fastr.config)

[docs]    def defaultconfig(self):
        """Generate a configparser object holding all default configuration values.

        Returns:
            config: configparser configuration file

        """
        config = configparser.ConfigParser()
        config.optionxform = str

        # General configuration of WORC
        config['General'] = dict()
        config['General']['cross_validation'] = 'True'
        config['General']['Segmentix'] = 'True'
        config['General']['FeatureCalculators'] = '[predict/CalcFeatures:1.0, pyradiomics/Pyradiomics:1.0]'
        config['General']['Preprocessing'] = 'worc/PreProcess:1.0'
        config['General']['RegistrationNode'] = "elastix4.8/Elastix:4.8"
        config['General']['TransformationNode'] = "elastix4.8/Transformix:4.8"
        config['General']['Joblib_ncores'] = '1'
        config['General']['Joblib_backend'] = 'threading'
        config['General']['tempsave'] = 'True'
        config['General']['AssumeSameImageAndMaskMetadata'] = 'False'
        config['General']['ComBat'] = 'False'
        config['General']['Fingerprint'] = 'True'
        config['General']['DoTestNRSNEns'] = 'False'

        # Fingerprinting
        config['Fingerprinting'] = dict()
        config['Fingerprinting']['max_num_image'] = '100'

        # Options for the object/patient labels that are used
        config['Labels'] = dict()
        config['Labels']['label_names'] = 'Label1, Label2'
        config['Labels']['modus'] = 'singlelabel'
        config['Labels']['url'] = 'WIP'
        config['Labels']['projectID'] = 'WIP'

        # Preprocessing
        config['Preprocessing'] = dict()
        config['Preprocessing']['CheckSpacing'] = 'False'
        config['Preprocessing']['Clipping'] = 'False'
        config['Preprocessing']['Clipping_Range'] = '-1000.0, 3000.0'
        config['Preprocessing']['Normalize'] = 'True'
        config['Preprocessing']['Normalize_ROI'] = 'Full'
        config['Preprocessing']['Method'] = 'z_score'
        config['Preprocessing']['ROIDetermine'] = 'Provided'
        config['Preprocessing']['ROIdilate'] = 'False'
        config['Preprocessing']['ROIdilateradius'] = '10'
        config['Preprocessing']['Resampling'] = 'False'
        config['Preprocessing']['Resampling_spacing'] = '1, 1, 1'
        config['Preprocessing']['BiasCorrection'] = 'False'
        config['Preprocessing']['BiasCorrection_Mask'] = 'False'
        config['Preprocessing']['CheckOrientation'] = 'False'
        config['Preprocessing']['OrientationPrimaryAxis'] = 'axial'
        config['Preprocessing']['HistogramEqualization'] = 'False'
        config['Preprocessing']['HistogramEqualization_Alpha'] = '0.3'
        config['Preprocessing']['HistogramEqualization_Beta'] = '0.3'
        config['Preprocessing']['HistogramEqualization_Radius'] = '5'
        

        # Segmentix
        config['Segmentix'] = dict()
        config['Segmentix']['mask'] = 'None'
        config['Segmentix']['segtype'] = 'None'
        config['Segmentix']['segradius'] = '5'
        config['Segmentix']['N_blobs'] = '1'
        config['Segmentix']['fillholes'] = 'True'
        config['Segmentix']['remove_small_objects'] = 'False'
        config['Segmentix']['min_object_size'] = '2'

        # PREDICT - Feature calculation
        # Determine which features are calculated
        config['ImageFeatures'] = dict()
        config['ImageFeatures']['shape'] = 'True'
        config['ImageFeatures']['histogram'] = 'True'
        config['ImageFeatures']['orientation'] = 'True'
        config['ImageFeatures']['texture_Gabor'] = 'True'
        config['ImageFeatures']['texture_LBP'] = 'True'
        config['ImageFeatures']['texture_GLCM'] = 'True'
        config['ImageFeatures']['texture_GLCMMS'] = 'True'
        config['ImageFeatures']['texture_GLRLM'] = 'False'
        config['ImageFeatures']['texture_GLSZM'] = 'False'
        config['ImageFeatures']['texture_NGTDM'] = 'False'
        config['ImageFeatures']['coliage'] = 'False'
        config['ImageFeatures']['vessel'] = 'True'
        config['ImageFeatures']['log'] = 'True'
        config['ImageFeatures']['phase'] = 'True'

        # Parameter settings for PREDICT feature calculation
        # Defines only naming of modalities
        config['ImageFeatures']['image_type'] = ''

        # How to extract the features in different dimension
        config['ImageFeatures']['extraction_mode'] = '2.5D'

        # Define frequencies for gabor filter in pixels
        config['ImageFeatures']['gabor_frequencies'] = '0.05, 0.2, 0.5'

        # Gabor, GLCM angles in degrees and radians, respectively
        config['ImageFeatures']['gabor_angles'] = '0, 45, 90, 135'
        config['ImageFeatures']['GLCM_angles'] = '0, 0.79, 1.57, 2.36'

        # GLCM discretization levels, distances in pixels
        config['ImageFeatures']['GLCM_levels'] = '16'
        config['ImageFeatures']['GLCM_distances'] = '1, 3'

        # LBP radius, number of points in pixels
        config['ImageFeatures']['LBP_radius'] = '3, 8, 15'
        config['ImageFeatures']['LBP_npoints'] = '12, 24, 36'

        # Phase features minimal wavelength and number of scales
        config['ImageFeatures']['phase_minwavelength'] = '3'
        config['ImageFeatures']['phase_nscale'] = '5'

        # Log features sigma of Gaussian in pixels
        config['ImageFeatures']['log_sigma'] = '1, 5, 10'

        # Vessel features scale range, steps for the range
        config['ImageFeatures']['vessel_scale_range'] = '1, 10'
        config['ImageFeatures']['vessel_scale_step'] = '2'

        # Vessel features radius for erosion to determine boudnary
        config['ImageFeatures']['vessel_radius'] = '5'

        # Tags from which to extract features, and how to name them
        config['ImageFeatures']['dicom_feature_tags'] = '0010 1010, 0010 0040'
        config['ImageFeatures']['dicom_feature_labels'] = 'age, sex'

        # PyRadiomics - Feature calculation
        # Addition to the above, specifically for PyRadiomics
        # Mostly based on specific MR Settings: see https://github.com/Radiomics/pyradiomics/blob/master/examples/exampleSettings/exampleMR_NoResampling.yaml
        config['PyRadiomics'] = dict()
        config['PyRadiomics']['geometryTolerance'] = '0.0001'
        config['PyRadiomics']['normalize'] = 'False'
        config['PyRadiomics']['normalizeScale'] = '100'
        config['PyRadiomics']['resampledPixelSpacing'] = 'None'
        config['PyRadiomics']['interpolator'] = 'sitkBSpline'
        config['PyRadiomics']['preCrop'] = 'True'
        config['PyRadiomics']['binCount'] = config['ImageFeatures']['GLCM_levels'] # BinWidth to sensitive for normalization, thus use binCount
        config['PyRadiomics']['binWidth'] = 'None'
        config['PyRadiomics']['force2D'] = 'False'
        config['PyRadiomics']['force2Ddimension'] = '0'  # axial slices, for coronal slices, use dimension 1 and for sagittal, dimension 2.
        config['PyRadiomics']['voxelArrayShift'] = '300'
        config['PyRadiomics']['Original'] = 'True'
        config['PyRadiomics']['Wavelet'] = 'False'
        config['PyRadiomics']['LoG'] = 'False'

        if config['General']['Segmentix'] == 'True':
            config['PyRadiomics']['label'] = '1'
        else:
            config['PyRadiomics']['label'] = '255'

        # Enabled PyRadiomics features
        config['PyRadiomics']['extract_firstorder'] = 'False'
        config['PyRadiomics']['extract_shape'] = 'True'
        config['PyRadiomics']['texture_GLCM'] = 'False'
        config['PyRadiomics']['texture_GLRLM'] = 'True'
        config['PyRadiomics']['texture_GLSZM'] = 'True'
        config['PyRadiomics']['texture_GLDM'] = 'True'
        config['PyRadiomics']['texture_NGTDM'] = 'True'

        # ComBat Feature Harmonization
        config['ComBat'] = dict()
        config['ComBat']['language'] = 'python'
        config['ComBat']['batch'] = 'Hospital'
        config['ComBat']['mod'] = '[]'
        config['ComBat']['par'] = '1'
        config['ComBat']['eb'] = '1'
        config['ComBat']['per_feature'] = '0'
        config['ComBat']['excluded_features'] = 'sf_, of_, semf_, pf_'
        config['ComBat']['matlab'] = 'C:\\Program Files\\MATLAB\\R2015b\\bin\\matlab.exe'

        # Feature OneHotEncoding
        config['OneHotEncoding'] = dict()
        config['OneHotEncoding']['Use'] = 'False'
        config['OneHotEncoding']['feature_labels_tofit'] = ''

        # Feature imputation
        config['Imputation'] = dict()
        config['Imputation']['use'] = 'True'
        config['Imputation']['strategy'] = 'mean, median, most_frequent, constant, knn'
        config['Imputation']['n_neighbors'] = '5, 5'
        config['Imputation']['skipallNaN'] = 'True'

        # Feature scaling options
        config['FeatureScaling'] = dict()
        config['FeatureScaling']['scaling_method'] = 'robust_z_score'
        config['FeatureScaling']['skip_features'] = 'semf_, pf_'

        # Feature preprocessing before the whole HyperOptimization
        config['FeatPreProcess'] = dict()
        config['FeatPreProcess']['Use'] = 'False'
        config['FeatPreProcess']['Combine'] = 'False'
        config['FeatPreProcess']['Combine_method'] = 'mean'

        # Feature selection
        config['Featsel'] = dict()
        config['Featsel']['Variance'] = '1.0'
        config['Featsel']['GroupwiseSearch'] = 'True'
        config['Featsel']['SelectFromModel'] = '0.275'
        config['Featsel']['SelectFromModel_estimator'] = 'Lasso, LR, RF'
        config['Featsel']['SelectFromModel_lasso_alpha'] = '0.1, 1.4'
        config['Featsel']['SelectFromModel_n_trees'] = '10, 90'
        config['Featsel']['UsePCA'] = '0.275'
        config['Featsel']['PCAType'] = '95variance, 10, 50, 100'
        config['Featsel']['StatisticalTestUse'] = '0.275'
        config['Featsel']['StatisticalTestMetric'] = 'MannWhitneyU'
        config['Featsel']['StatisticalTestThreshold'] = '-3, 2.5'
        config['Featsel']['ReliefUse'] = '0.275'
        config['Featsel']['ReliefNN'] = '2, 4'
        config['Featsel']['ReliefSampleSize'] = '0.75, 0.2'
        config['Featsel']['ReliefDistanceP'] = '1, 3'
        config['Featsel']['ReliefNumFeatures'] = '10, 40'
        config['Featsel']['RFE'] = '0.0'
        config['Featsel']['RFE_estimator'] = config['Featsel']['SelectFromModel_estimator']
        config['Featsel']['RFE_lasso_alpha'] = config['Featsel']['SelectFromModel_lasso_alpha']
        config['Featsel']['RFE_n_trees'] = config['Featsel']['SelectFromModel_n_trees']
        config['Featsel']['RFE_n_features_to_select'] = '10, 90'
        config['Featsel']['RFE_step'] = '1, 9'

        # Groupwise Featureselection options
        config['SelectFeatGroup'] = dict()
        config['SelectFeatGroup']['shape_features'] = 'True, False'
        config['SelectFeatGroup']['histogram_features'] = 'True, False'
        config['SelectFeatGroup']['orientation_features'] = 'True, False'
        config['SelectFeatGroup']['texture_Gabor_features'] = 'True, False'
        config['SelectFeatGroup']['texture_GLCM_features'] = 'True, False'
        config['SelectFeatGroup']['texture_GLDM_features'] = 'True, False'
        config['SelectFeatGroup']['texture_GLCMMS_features'] = 'True, False'
        config['SelectFeatGroup']['texture_GLRLM_features'] = 'True, False'
        config['SelectFeatGroup']['texture_GLSZM_features'] = 'True, False'
        config['SelectFeatGroup']['texture_GLDZM_features'] = 'True, False'
        config['SelectFeatGroup']['texture_NGTDM_features'] = 'True, False'
        config['SelectFeatGroup']['texture_NGLDM_features'] = 'True, False'
        config['SelectFeatGroup']['texture_LBP_features'] = 'True, False'
        config['SelectFeatGroup']['dicom_features'] = 'False'
        config['SelectFeatGroup']['semantic_features'] = 'False'
        config['SelectFeatGroup']['coliage_features'] = 'False'
        config['SelectFeatGroup']['vessel_features'] = 'True, False'
        config['SelectFeatGroup']['phase_features'] = 'True, False'
        config['SelectFeatGroup']['fractal_features'] = 'True, False'
        config['SelectFeatGroup']['location_features'] = 'True, False'
        config['SelectFeatGroup']['rgrd_features'] = 'True, False'

        # Select features per toolbox, or simply all
        config['SelectFeatGroup']['toolbox'] = 'All, PREDICT, PyRadiomics'

        # Select original features, or after transformation of feature space
        config['SelectFeatGroup']['original_features'] = 'True'
        config['SelectFeatGroup']['wavelet_features'] = 'True, False'
        config['SelectFeatGroup']['log_features'] = 'True, False'

        # Resampling options
        config['Resampling'] = dict()
        config['Resampling']['Use'] = '0.20'
        config['Resampling']['Method'] =\
            'RandomUnderSampling, RandomOverSampling, NearMiss, ' +\
            'NeighbourhoodCleaningRule, ADASYN, BorderlineSMOTE, SMOTE, ' +\
            'SMOTEENN, SMOTETomek'
        config['Resampling']['sampling_strategy'] = 'auto, majority, minority, not minority, not majority, all'
        config['Resampling']['n_neighbors'] = '3, 12'
        config['Resampling']['k_neighbors'] = '5, 15'
        config['Resampling']['threshold_cleaning'] = '0.25, 0.5'

        # Classification
        config['Classification'] = dict()
        config['Classification']['fastr'] = 'True'
        config['Classification']['fastr_plugin'] = self.fastr_plugin
        config['Classification']['classifiers'] =\
            'SVM, RF, LR, LDA, QDA, GaussianNB, ' +\
            'AdaBoostClassifier, ' +\
            'XGBClassifier'
        config['Classification']['max_iter'] = '100000'
        config['Classification']['SVMKernel'] = 'linear, poly, rbf'
        config['Classification']['SVMC'] = '0, 6'
        config['Classification']['SVMdegree'] = '1, 6'
        config['Classification']['SVMcoef0'] = '0, 1'
        config['Classification']['SVMgamma'] = '-5, 5'
        config['Classification']['RFn_estimators'] = '10, 90'
        config['Classification']['RFmin_samples_split'] = '2, 3'
        config['Classification']['RFmax_depth'] = '5, 5'
        config['Classification']['LRpenalty'] = 'l1, l2, elasticnet'
        config['Classification']['LRC'] = '0.01, 0.99'
        config['Classification']['LR_solver'] = 'lbfgs, saga'
        config['Classification']['LR_l1_ratio'] = '0, 1'
        config['Classification']['LDA_solver'] = 'svd, lsqr, eigen'
        config['Classification']['LDA_shrinkage'] = '-5, 5'
        config['Classification']['QDA_reg_param'] = '-5, 5'
        config['Classification']['ElasticNet_alpha'] = '-5, 5'
        config['Classification']['ElasticNet_l1_ratio'] = '0, 1'
        config['Classification']['SGD_alpha'] = '-5, 5'
        config['Classification']['SGD_l1_ratio'] = '0, 1'
        config['Classification']['SGD_loss'] = 'squared_loss, huber, epsilon_insensitive, squared_epsilon_insensitive'
        config['Classification']['SGD_penalty'] = 'none, l2, l1'
        config['Classification']['CNB_alpha'] = '0, 1'
        config['Classification']['AdaBoost_n_estimators'] = config['Classification']['RFn_estimators']
        config['Classification']['AdaBoost_learning_rate'] = '0.01, 0.99'

        # Based on https://towardsdatascience.com/doing-xgboost-hyper-parameter-tuning-the-smart-way-part-1-of-2-f6d255a45dde
        # and https://www.analyticsvidhya.com/blog/2016/03/complete-guide-parameter-tuning-xgboost-with-codes-python/
        # and https://medium.com/data-design/xgboost-hi-im-gamma-what-can-i-do-for-you-and-the-tuning-of-regularization-a42ea17e6ab6
        config['Classification']['XGB_boosting_rounds'] = config['Classification']['RFn_estimators']
        config['Classification']['XGB_max_depth'] = '3, 12'
        config['Classification']['XGB_learning_rate'] = config['Classification']['AdaBoost_learning_rate']
        config['Classification']['XGB_gamma'] = '0.01, 9.99'
        config['Classification']['XGB_min_child_weight'] = '1, 6'
        config['Classification']['XGB_colsample_bytree'] = '0.3, 0.7'

        # https://lightgbm.readthedocs.io/en/latest/Parameters-Tuning.html. Mainly prevent overfitting
        config['Classification']['LightGBM_num_leaves'] = '5, 95'  # Default 31 so search around that
        config['Classification']['LightGBM_max_depth'] = config['Classification']['XGB_max_depth'] # Good to limit explicitly to decrease compuytation time and limit overfitting
        config['Classification']['LightGBM_min_child_samples'] = '5, 45'  # = min_data_in_leaf. Default 20
        config['Classification']['LightGBM_reg_alpha'] = config['Classification']['LRC']
        config['Classification']['LightGBM_reg_lambda'] = config['Classification']['LRC']
        config['Classification']['LightGBM_min_child_weight'] = '-7, 4' # Default 1e-3

        # CrossValidation
        config['CrossValidation'] = dict()
        config['CrossValidation']['Type'] = 'random_split'
        config['CrossValidation']['N_iterations'] = '100'
        config['CrossValidation']['test_size'] = '0.2'
        config['CrossValidation']['fixed_seed'] = 'False'

        # Hyperparameter optimization options
        config['HyperOptimization'] = dict()
        config['HyperOptimization']['scoring_method'] = 'f1_weighted'
        config['HyperOptimization']['test_size'] = '0.2'
        config['HyperOptimization']['n_splits'] = '5'
        config['HyperOptimization']['N_iterations'] = '1000' # represents either wallclock time limit or nr of evaluations when using SMAC
        config['HyperOptimization']['n_jobspercore'] = '200'  # only relevant when using fastr in classification
        config['HyperOptimization']['maxlen'] = '100'
        config['HyperOptimization']['ranking_score'] = 'test_score'
        config['HyperOptimization']['memory'] = '3G'
        config['HyperOptimization']['refit_training_workflows'] = 'False'
        config['HyperOptimization']['refit_validation_workflows'] = 'False'
        config['HyperOptimization']['fix_random_seed'] = 'False'

        # SMAC options
        config['SMAC'] = dict()
        config['SMAC']['use'] = 'False'
        config['SMAC']['n_smac_cores'] = '1'
        config['SMAC']['budget_type'] = 'evals' # ['evals', 'time']
        config['SMAC']['budget'] = '100' # Nr of evals or time in seconds
        config['SMAC']['init_method'] = 'random' # ['sobol', 'random']
        config['SMAC']['init_budget'] = '20' # Nr of evals

        # Ensemble options
        config['Ensemble'] = dict()
        config['Ensemble']['Method'] = 'top_N' # ['Single', 'top_N', 'FitNumber', 'ForwardSelection', 'Caruana', 'Bagging']
        config['Ensemble']['Size'] = '100' # Size of ensemble in top_N, or number of bags in Bagging
        config['Ensemble']['Metric'] = 'Default'

        # Evaluation options
        config['Evaluation'] = dict()
        config['Evaluation']['OverfitScaler'] = 'False'

        # Bootstrap options
        config['Bootstrap'] = dict()
        config['Bootstrap']['Use'] = 'False'
        config['Bootstrap']['N_iterations'] = '10000'

        return config

[docs]    def add_tools(self):
        """Add several tools to the WORC object."""
        self.Tools = Tools()

[docs]    def build(self, buildtype='training'):
        """Build the  network based on the given attributes.

        Parameters
        ----------
        buildtype: string, default 'training'
                Specify the WORC execution type.
                - inference: use if you have a trained classifier and want to
                           train it on some new images.
                - training: use if you want to train a classifier from a dataset.

        """
        if buildtype == 'training':
            self.build_training()
        elif buildtype == 'inference':
            raise WORCexceptions.WORCValueError("Inference workflow is still WIP and does not fully work yet.")
            self.TrainTest = True
            self.OnlyTest = True
            self.build_inference()       
             
[docs]    def build_training(self):
        """Build the training network based on the given attributes."""
        # We either need images or features for Radiomics
        if self.images_test or self.features_test:
            if not self.labels_test:
                m = "You provided images and/or features for a test set, but not ground truth labels. Please also provide labels for the test set."
                raise WORCexceptions.WORCValueError(m)
            self.TrainTest = True
            
        if self.images_train or self.features_train:
            print('Building training network...')
            # We currently require labels for supervised learning
            if self.labels_train:
                if not self.configs:
                    print("No configuration given, assuming default")
                    if self.images_train:
                        self.configs = [self.defaultconfig()] * len(self.images_train)
                    else:
                        self.configs = [self.defaultconfig()] * len(self.features_train)

                self.network = fastr.create_network(self.name)

                # NOTE: We currently use the first configuration as general config
                image_types = list()
                for c in range(len(self.configs)):
                    image_types.append(self.configs[c]['ImageFeatures']['image_type'])

                if self.configs[0]['General']['Fingerprint'] == 'True' and any(imt not in all_modalities for imt in image_types):
                    m = f'One of your image types {image_types} is not one of the valid image types {quantitative_modalities + qualitative_modalities}. This is mandatory to set when performing fingerprinting, see the WORC Documentation (https://worc.readthedocs.io/en/latest/static/configuration.html#imagefeatures).'
                    raise WORCexceptions.WORCValueError(m)

                # Create config source
                self.source_class_config = self.network.create_source('ParameterFile', id='config_classification_source', node_group='conf', step_id='general_sources')

                # Classification tool and label source
                self.source_patientclass_train = self.network.create_source('PatientInfoFile', id='patientclass_train', node_group='pctrain', step_id='train_sources')
                if self.labels_test:
                    self.source_patientclass_test = self.network.create_source('PatientInfoFile', id='patientclass_test', node_group='pctest', step_id='test_sources')

                # Add classification node
                memory = self.fastr_memory_parameters['Classification']
                self.classify = self.network.create_node('worc/TrainClassifier:1.0',
                                                         tool_version='1.0',
                                                         id='classify',
                                                         resources=ResourceLimit(memory=memory),
                                                         step_id='WorkflowOptimization')

                # Add fingerprinting
                if self.configs[0]['General']['Fingerprint'] == 'True':
                    self.node_fingerprinters = dict()
                    self.links_fingerprinting = dict()

                    self.add_fingerprinter(id='classification', type='classification', config_source=self.source_class_config.output)

                    # Link output of fingerprinter to classification node
                    self.link_class_1 = self.network.create_link(self.node_fingerprinters['classification'].outputs['config'], self.classify.inputs['config'])
                    # self.link_class_1.collapse = 'conf'
                else:
                    # Directly parse config to classify node
                    self.link_class_1 = self.network.create_link(self.source_class_config.output, self.classify.inputs['config'])
                    self.link_class_1.collapse = 'conf'

                if self.fixedsplits:
                    self.fixedsplits_node = self.network.create_source('CSVFile', id='fixedsplits_source', node_group='conf', step_id='general_sources')
                    self.classify.inputs['fixedsplits'] = self.fixedsplits_node.output

                self.source_ensemble_method =\
                    self.network.create_constant('String', [self.configs[0]['Ensemble']['Method']],
                                                 id='ensemble_method',
                                                 step_id='Evaluation')

                self.source_ensemble_size =\
                    self.network.create_constant('String', [self.configs[0]['Ensemble']['Size']],
                                                 id='ensemble_size',
                                                 step_id='Evaluation')

                self.source_LabelType =\
                    self.network.create_constant('String', [self.configs[0]['Labels']['label_names']],
                                                 id='LabelType',
                                                 step_id='Evaluation')

                memory = self.fastr_memory_parameters['PlotEstimator']
                self.plot_estimator =\
                    self.network.create_node('worc/PlotEstimator:1.0', tool_version='1.0',
                                             id='plot_Estimator',
                                             resources=ResourceLimit(memory=memory),
                                             step_id='Evaluation')

                # Outputs
                self.sink_classification = self.network.create_sink('HDF5', id='classification', step_id='general_sinks')
                self.sink_performance = self.network.create_sink('JsonFile', id='performance', step_id='general_sinks')
                self.sink_class_config = self.network.create_sink('ParameterFile', id='config_classification_sink', node_group='conf', step_id='general_sinks')

                # Links
                if self.configs[0]['General']['Fingerprint'] == 'True':
                    self.sink_class_config.input = self.node_fingerprinters['classification'].outputs['config']
                else:
                    self.sink_class_config.input = self.source_class_config.output

                self.link_class_2 = self.network.create_link(self.source_patientclass_train.output, self.classify.inputs['patientclass_train'])
                self.link_class_2.collapse = 'pctrain'

                self.plot_estimator.inputs['ensemble_method'] = self.source_ensemble_method.output
                self.plot_estimator.inputs['ensemble_size'] = self.source_ensemble_size.output
                self.plot_estimator.inputs['label_type'] = self.source_LabelType.output

                if self.labels_test:
                    pinfo = self.source_patientclass_test.output
                else:
                    pinfo = self.source_patientclass_train.output

                self.plot_estimator.inputs['prediction'] = self.classify.outputs['classification']
                self.plot_estimator.inputs['pinfo'] = pinfo

                # Optional SMAC output
                if self.configs[0]['SMAC']['use'] == 'True':
                    self.sink_smac_results = self.network.create_sink('JsonFile', id='smac_results',
                                                                      step_id='general_sinks')
                    self.sink_smac_results.input = self.classify.outputs['smac_results']

                if self.TrainTest:
                    # FIXME: the naming here is ugly
                    self.link_class_3 = self.network.create_link(self.source_patientclass_test.output, self.classify.inputs['patientclass_test'])
                    self.link_class_3.collapse = 'pctest'

                self.sink_classification.input = self.classify.outputs['classification']
                self.sink_performance.input = self.plot_estimator.outputs['output_json']

                if self.masks_normalize_train:
                    self.sources_masks_normalize_train = dict()

                if self.masks_normalize_test:
                    self.sources_masks_normalize_test = dict()

                # -----------------------------------------------------
                # Optionally, add ComBat Harmonization. Currently done
                # on full dataset, not in a cross-validation
                if self.configs[0]['General']['ComBat'] == 'True':
                    self.add_ComBat()

                if not self.features_train:
                    # Create nodes to compute features
                    # General
                    self.sources_parameters = dict()
                    self.source_config_pyradiomics = dict()
                    self.source_toolbox_name = dict()

                    # Training only
                    self.calcfeatures_train = dict()
                    self.featureconverter_train = dict()
                    self.preprocessing_train = dict()
                    self.sources_images_train = dict()
                    self.sinks_features_train = dict()
                    self.sinks_configs = dict()
                    self.converters_im_train = dict()
                    self.converters_seg_train = dict()
                    self.links_C1_train = dict()

                    self.featurecalculators = dict()

                    if self.TrainTest:
                        # A test set is supplied, for which nodes also need to be created
                        self.calcfeatures_test = dict()
                        self.featureconverter_test = dict()
                        self.preprocessing_test = dict()
                        self.sources_images_test = dict()
                        self.sinks_features_test = dict()
                        self.converters_im_test = dict()
                        self.converters_seg_test = dict()
                        self.links_C1_test = dict()

                    # Check which nodes are necessary
                    if not self.segmentations_train:
                        message = "No automatic segmentation method is yet implemented."
                        raise WORCexceptions.WORCNotImplementedError(message)

                    elif len(self.segmentations_train) == len(image_types):
                        # Segmentations provided
                        self.sources_segmentations_train = dict()
                        self.sources_segmentations_test = dict()
                        self.segmode = 'Provided'

                    elif len(self.segmentations_train) == 1:
                        # Assume segmentations need to be registered to other modalities
                        print('\t - Adding Elastix node for image registration.')
                        self.add_elastix_sourcesandsinks()
                        pass

                    else:
                        nseg = len(self.segmentations_train)
                        nim = len(image_types)
                        m = f'Length of segmentations for training is ' +\
                            f'{nseg}: should be equal to number of images' +\
                            f' ({nim}) or 1 when using registration.'
                        raise WORCexceptions.WORCValueError(m)

                    # BUG: We assume that first type defines if we use segmentix
                    if self.configs[0]['General']['Segmentix'] == 'True':
                        # Use the segmentix toolbox for segmentation processing
                        print('\t - Adding segmentix node for segmentation preprocessing.')
                        self.sinks_segmentations_segmentix_train = dict()
                        self.sources_masks_train = dict()
                        self.converters_masks_train = dict()
                        self.nodes_segmentix_train = dict()

                        if self.TrainTest:
                            # Also use segmentix on the tes set
                            self.sinks_segmentations_segmentix_test = dict()
                            self.sources_masks_test = dict()
                            self.converters_masks_test = dict()
                            self.nodes_segmentix_test = dict()

                    if self.semantics_train:
                        # Semantic features are supplied
                        self.sources_semantics_train = dict()

                    if self.metadata_train:
                        # Metadata to extract patient features from is supplied
                        self.sources_metadata_train = dict()

                    if self.semantics_test:
                        # Semantic features are supplied
                        self.sources_semantics_test = dict()

                    if self.metadata_test:
                        # Metadata to extract patient features from is supplied
                        self.sources_metadata_test = dict()

                    # Create a part of the pipeline for each modality
                    self.modlabels = list()
                    for nmod, mod in enumerate(image_types):
                        # Create label for each modality/image
                        num = 0
                        label = mod + '_' + str(num)
                        while label in self.calcfeatures_train.keys():
                            # if label already exists, add number to label
                            num += 1
                            label = mod + '_' + str(num)
                        self.modlabels.append(label)

                        # Create required sources and sinks
                        self.sources_parameters[label] = self.network.create_source('ParameterFile', id=f'config_{label}', step_id='general_sources')
                        self.sinks_configs[label] = self.network.create_sink('ParameterFile', id=f'config_{label}_sink', node_group='conf', step_id='general_sinks')

                        self.sources_images_train[label] = self.network.create_source('ITKImageFile', id='images_train_' + label, node_group='train', step_id='train_sources')
                        if self.TrainTest:
                            self.sources_images_test[label] = self.network.create_source('ITKImageFile', id='images_test_' + label, node_group='test', step_id='test_sources')

                        if self.metadata_train and len(self.metadata_train) >= nmod + 1:
                            self.sources_metadata_train[label] = self.network.create_source('DicomImageFile', id='metadata_train_' + label, node_group='train', step_id='train_sources')

                        if self.metadata_test and len(self.metadata_test) >= nmod + 1:
                            self.sources_metadata_test[label] = self.network.create_source('DicomImageFile', id='metadata_test_' + label, node_group='test', step_id='test_sources')

                        if self.masks_train and len(self.masks_train) >= nmod + 1:
                            # Create mask source and convert
                            self.sources_masks_train[label] = self.network.create_source('ITKImageFile', id='mask_train_' + label, node_group='train', step_id='train_sources')
                            memory = self.fastr_memory_parameters['WORCCastConvert']
                            self.converters_masks_train[label] =\
                                self.network.create_node('worc/WORCCastConvert:0.3.2',
                                                         tool_version='0.1',
                                                         id='convert_mask_train_' + label,
                                                         node_group='train',
                                                         resources=ResourceLimit(memory=memory),
                                                         step_id='FileConversion')

                            self.converters_masks_train[label].inputs['image'] = self.sources_masks_train[label].output

                        if self.masks_test and len(self.masks_test) >= nmod + 1:
                            # Create mask source and convert
                            self.sources_masks_test[label] = self.network.create_source('ITKImageFile', id='mask_test_' + label, node_group='test', step_id='test_sources')
                            memory = self.fastr_memory_parameters['WORCCastConvert']
                            self.converters_masks_test[label] =\
                                self.network.create_node('worc/WORCCastConvert:0.3.2',
                                                         tool_version='0.1',
                                                         id='convert_mask_test_' + label,
                                                         node_group='test',
                                                         resources=ResourceLimit(memory=memory),
                                                         step_id='FileConversion')

                            self.converters_masks_test[label].inputs['image'] = self.sources_masks_test[label].output

                        # First convert the images
                        if any(modality in mod for modality in all_modalities):
                            # Use WORC PXCastConvet for converting image formats
                            memory = self.fastr_memory_parameters['WORCCastConvert']
                            self.converters_im_train[label] =\
                                self.network.create_node('worc/WORCCastConvert:0.3.2',
                                                         tool_version='0.1',
                                                         id='convert_im_train_' + label,
                                                         resources=ResourceLimit(memory=memory),
                                                         step_id='FileConversion')
                            if self.TrainTest:
                                self.converters_im_test[label] =\
                                    self.network.create_node('worc/WORCCastConvert:0.3.2',
                                                             tool_version='0.1',
                                                             id='convert_im_test_' + label,
                                                             resources=ResourceLimit(memory=memory),
                                                             step_id='FileConversion')

                        else:
                            raise WORCexceptions.WORCTypeError(('No valid image type for modality {}: {} provided.').format(str(nmod), mod))

                        # Create required links
                        self.converters_im_train[label].inputs['image'] = self.sources_images_train[label].output
                        if self.TrainTest:
                            self.converters_im_test[label].inputs['image'] = self.sources_images_test[label].output

                        # -----------------------------------------------------
                        # Add fingerprinting
                        if self.configs[0]['General']['Fingerprint'] == 'True':
                            self.add_fingerprinter(id=label, type='images', config_source=self.sources_parameters[label].output)
                            self.links_fingerprinting[f'{label}_images'] = self.network.create_link(self.converters_im_train[label].outputs['image'], self.node_fingerprinters[label].inputs['images_train'])
                            self.links_fingerprinting[f'{label}_images'].collapse = 'train'

                            self.sinks_configs[label].input = self.node_fingerprinters[label].outputs['config']

                            if nmod == 0:
                                # Also add images from first modality for classification fingerprinter
                                self.links_fingerprinting['classification'] = self.network.create_link(self.converters_im_train[label].outputs['image'], self.node_fingerprinters['classification'].inputs['images_train'])
                                self.links_fingerprinting['classification'].collapse = 'train'

                        else:
                            self.sinks_configs[label].input = self.sources_parameters[label].output

                        # -----------------------------------------------------
                        # Preprocessing
                        preprocess_node = str(self.configs[nmod]['General']['Preprocessing'])
                        print('\t - Adding preprocessing node for image preprocessing.')
                        self.add_preprocessing(preprocess_node, label, nmod)

                        # -----------------------------------------------------
                        # Feature calculation
                        feature_calculators =\
                            self.configs[nmod]['General']['FeatureCalculators']
                        feature_calculators = feature_calculators.strip('][').split(', ')
                        self.featurecalculators[label] = [f.split('/')[0] for f in feature_calculators]

                        # Add lists for feature calculation and converter objects
                        self.calcfeatures_train[label] = list()
                        self.featureconverter_train[label] = list()
                        if self.TrainTest:
                            self.calcfeatures_test[label] = list()
                            self.featureconverter_test[label] = list()

                        for f in feature_calculators:
                            print(f'\t - Adding feature calculation node: {f}.')
                            self.add_feature_calculator(f, label, nmod)

                        # -----------------------------------------------------
                        # Create the neccesary nodes for the segmentation
                        if self.segmode == 'Provided':
                            # Segmentation ----------------------------------------------------
                            # Use the provided segmantions for each modality
                            memory = self.fastr_memory_parameters['WORCCastConvert']
                            self.sources_segmentations_train[label] =\
                                self.network.create_source('ITKImageFile',
                                                           id='segmentations_train_' + label,
                                                           node_group='train',
                                                           step_id='train_sources')

                            self.converters_seg_train[label] =\
                                self.network.create_node('worc/WORCCastConvert:0.3.2',
                                                         tool_version='0.1',
                                                         id='convert_seg_train_' + label,
                                                         resources=ResourceLimit(memory=memory),
                                                         step_id='FileConversion')

                            self.converters_seg_train[label].inputs['image'] =\
                                self.sources_segmentations_train[label].output

                            if self.TrainTest:
                                self.sources_segmentations_test[label] =\
                                    self.network.create_source('ITKImageFile',
                                                               id='segmentations_test_' + label,
                                                               node_group='test',
                                                               step_id='test_sources')

                                self.converters_seg_test[label] =\
                                    self.network.create_node('worc/WORCCastConvert:0.3.2',
                                                             tool_version='0.1',
                                                             id='convert_seg_test_' + label,
                                                             resources=ResourceLimit(memory=memory),
                                                             step_id='FileConversion')

                                self.converters_seg_test[label].inputs['image'] =\
                                    self.sources_segmentations_test[label].output

                            # Add to fingerprinting if required
                            if self.configs[0]['General']['Fingerprint'] == 'True':
                                self.links_fingerprinting[f'{label}_segmentations'] = self.network.create_link(self.converters_seg_train[label].outputs['image'], self.node_fingerprinters[label].inputs['segmentations_train'])
                                self.links_fingerprinting[f'{label}_segmentations'].collapse = 'train'

                        elif self.segmode == 'Register':
                            # ---------------------------------------------
                            # Registration nodes: Align segmentation of first
                            # modality to others using registration with Elastix
                            self.add_elastix(label, nmod)

                            # Add to fingerprinting if required
                            if self.configs[0]['General']['Fingerprint'] == 'True':
                                # Since there are no segmentations yet of this modality, just use those of the first, provided modality
                                self.links_fingerprinting[f'{label}_segmentations'] = self.network.create_link(self.converters_seg_train[self.modlabels[0]].outputs['image'], self.node_fingerprinters[label].inputs['segmentations_train'])
                                self.links_fingerprinting[f'{label}_segmentations'].collapse = 'train'

                        # -----------------------------------------------------
                        # Optionally, add segmentix, the in-house segmentation
                        # processor of WORC
                        if self.configs[nmod]['General']['Segmentix'] == 'True':
                            self.add_segmentix(label, nmod)
                        elif self.configs[nmod]['Preprocessing']['Resampling'] == 'True':
                            raise WORCexceptions.WORCValueError('If you use resampling, ' +
                                                 'have to use segmentix to ' +
                                                 ' make sure the mask is ' +
                                                 'also resampled. Please ' +
                                                 'set ' +
                                                 'config["General"]["Segmentix"]' +
                                                 'to "True".')

                        else:
                            # Provide source or elastix segmentations to
                            # feature calculator
                            for i_node in range(len(self.calcfeatures_train[label])):
                                if self.segmode == 'Provided':
                                    self.calcfeatures_train[label][i_node].inputs['segmentation'] =\
                                        self.converters_seg_train[label].outputs['image']
                                elif self.segmode == 'Register':
                                    if nmod > 0:
                                        self.calcfeatures_train[label][i_node].inputs['segmentation'] =\
                                            self.transformix_seg_nodes_train[label].outputs['image']
                                    else:
                                        self.calcfeatures_train[label][i_node].inputs['segmentation'] =\
                                            self.converters_seg_train[label].outputs['image']

                                if self.TrainTest:
                                    if self.segmode == 'Provided':
                                        self.calcfeatures_test[label][i_node].inputs['segmentation'] =\
                                            self.converters_seg_test[label].outputs['image']
                                    elif self.segmode == 'Register':
                                        if nmod > 0:
                                            self.calcfeatures_test[label][i_node].inputs['segmentation'] =\
                                                self.transformix_seg_nodes_test[label].outputs['image']
                                        else:
                                            self.calcfeatures_test[label][i_node].inputs['segmentation'] =\
                                                self.converters_seg_test[label].outputs['image']

                        # -----------------------------------------------------
                        # Optionally, add ComBat Harmonization
                        if self.configs[0]['General']['ComBat'] == 'True':
                            # Link features to ComBat
                            self.links_Combat1_train[label] = list()
                            for i_node, fname in enumerate(self.featurecalculators[label]):
                                self.links_Combat1_train[label].append(self.ComBat.inputs['features_train'][f'{label}_{self.featurecalculators[label][i_node]}'] << self.featureconverter_train[label][i_node].outputs['feat_out'])
                                self.links_Combat1_train[label][i_node].collapse = 'train'

                            if self.TrainTest:
                                self.links_Combat1_test[label] = list()
                                for i_node, fname in enumerate(self.featurecalculators[label]):
                                    self.links_Combat1_test[label].append(self.ComBat.inputs['features_test'][f'{label}_{self.featurecalculators[label][i_node]}'] << self.featureconverter_test[label][i_node].outputs['feat_out'])
                                    self.links_Combat1_test[label][i_node].collapse = 'test'

                        # -----------------------------------------------------
                        # Classification nodes
                        # Add the features from this modality to the classifier node input
                        self.links_C1_train[label] = list()
                        self.sinks_features_train[label] = list()
                        if self.TrainTest:
                            self.links_C1_test[label] = list()
                            self.sinks_features_test[label] = list()

                        for i_node, fname in enumerate(self.featurecalculators[label]):
                            # Create sink for feature outputs
                            self.sinks_features_train[label].append(self.network.create_sink('HDF5', id='features_train_' + label + '_' + fname, step_id='train_sinks'))

                            # Append features to the classification
                            if not self.configs[0]['General']['ComBat'] == 'True':
                                self.links_C1_train[label].append(self.classify.inputs['features_train'][f'{label}_{self.featurecalculators[label][i_node]}'] << self.featureconverter_train[label][i_node].outputs['feat_out'])
                                self.links_C1_train[label][i_node].collapse = 'train'

                            # Save output
                            self.sinks_features_train[label][i_node].input = self.featureconverter_train[label][i_node].outputs['feat_out']

                            # Similar for testing workflow
                            if self.TrainTest:
                                # Create sink for feature outputs
                                self.sinks_features_test[label].append(self.network.create_sink('HDF5', id='features_test_' + label + '_' + fname, step_id='test_sinks'))

                                # Append features to the classification
                                if not self.configs[0]['General']['ComBat'] == 'True':
                                    self.links_C1_test[label].append(self.classify.inputs['features_test'][f'{label}_{self.featurecalculators[label][i_node]}'] << self.featureconverter_test[label][i_node].outputs['feat_out'])
                                    self.links_C1_test[label][i_node].collapse = 'test'

                                # Save output
                                self.sinks_features_test[label][i_node].input = self.featureconverter_test[label][i_node].outputs['feat_out']

                else:
                    # Features already provided: hence we can skip numerous nodes
                    self.sources_features_train = dict()
                    self.links_C1_train = dict()

                    if self.features_test:
                        self.sources_features_test = dict()
                        self.links_C1_test = dict()

                    # Create label for each modality/image
                    self.modlabels = list()
                    for num, mod in enumerate(image_types):
                        num = 0
                        label = mod + str(num)
                        while label in self.sources_features_train.keys():
                            # if label exists, add number to label
                            num += 1
                            label = mod + str(num)
                        self.modlabels.append(label)

                        # Create a node for the feature computation
                        self.sources_features_train[label] = self.network.create_source('HDF5', id='features_train_' + label, node_group='train', step_id='train_sources')

                        # Add the features from this modality to the classifier node input
                        self.links_C1_train[label] = self.classify.inputs['features_train'][str(label)] << self.sources_features_train[label].output
                        self.links_C1_train[label].collapse = 'train'

                        if self.features_test:
                            # Create a node for the feature computation
                            self.sources_features_test[label] = self.network.create_source('HDF5', id='features_test_' + label, node_group='test', step_id='test_sources')

                            # Add the features from this modality to the classifier node input
                            self.links_C1_test[label] = self.classify.inputs['features_test'][str(label)] << self.sources_features_test[label].output
                            self.links_C1_test[label].collapse = 'test'

                        # Add input to fingerprinting for classification
                        if self.configs[0]['General']['Fingerprint'] == 'True':
                            if num == 0:
                                self.links_fingerprinting['classification'] = self.network.create_link(self.sources_features_train[label].output, self.node_fingerprinters['classification'].inputs['features_train'])
                                self.links_fingerprinting['classification'].collapse = 'train'

            else:
                raise WORCexceptions.WORCIOError("Please provide labels for training, i.e., WORC.labels_train or SimpleWORC.labels_from_this_file.")
        else:
            raise WORCexceptions.WORCIOError("Please provide either images or features.")

[docs]    def build_inference(self):
        """Build a network to test an already trained model on a test dataset based on the given attributes."""
        #FIXME WIP
        if self.images_test or self.features_test:
            if not self.labels_test:
                m = "You provided images and/or features for a test set, but not ground truth labels. Please also provide labels for the test set."
                raise WORCexceptions.WORCValueError(m)
        else:
            m = "Please provide either images and/or features for your test set."
            raise WORCexceptions.WORCValueError(m)
        
        if not self.configs:
            m = 'For a testing workflow, you need to provide a WORC config.ini file'
            raise WORCexceptions.WORCValueError(m)
        
        self.network = fastr.create_network(self.name)
        
        # Add trained model node
        memory = self.fastr_memory_parameters['Classification']
        self.source_trained_model = self.network.create_source('HDF5',
                                               id='trained_model',
                                               node_group='trained_model', step_id='general_sources')

        if self.images_test or self.features_test:
            print('Building testing network...')
            # We currently require labels for supervised learning
            if self.labels_test:
                self.network = fastr.create_network(self.name)

                # Extract some information from the configs
                image_types = list()
                for conf_it in range(len(self.configs)):
                    if type(self.configs[conf_it]) == str:
                        # Config is a .ini file, load
                        temp_conf = config_io.load_config(self.configs[conf_it])
                    else:
                        temp_conf = self.configs[conf_it]
                    
                    image_type = temp_conf['ImageFeatures']['image_type']   
                    image_types.append(image_type)
                    
                    # NOTE: We currently use the first configuration as general config
                    if conf_it == 0:
                        print(temp_conf)
                        ensemble_method = [temp_conf['Ensemble']['Method']]
                        ensemble_size = [temp_conf['Ensemble']['Size']]
                        label_names = [temp_conf['Labels']['label_names']]
                        use_ComBat = temp_conf['General']['ComBat']
                        use_segmentix = temp_conf['General']['Segmentix']

                # Create various input sources
                self.source_patientclass_test =\
                    self.network.create_source('PatientInfoFile',
                                               id='patientclass_test',
                                               node_group='pctest', step_id='test_sources')

                self.source_ensemble_method =\
                    self.network.create_constant('String', ensemble_method,
                                                 id='ensemble_method',
                                                 step_id='Evaluation')

                self.source_ensemble_size =\
                    self.network.create_constant('String', ensemble_size,
                                                 id='ensemble_size',
                                                 step_id='Evaluation')

                self.source_LabelType =\
                    self.network.create_constant('String', label_names,
                                                 id='LabelType',
                                                 step_id='Evaluation')

                memory = self.fastr_memory_parameters['PlotEstimator']
                self.plot_estimator =\
                    self.network.create_node('worc/PlotEstimator:1.0', tool_version='1.0',
                                             id='plot_Estimator',
                                             resources=ResourceLimit(memory=memory),
                                             step_id='Evaluation')
                    
                # Links to performance creator
                self.plot_estimator.inputs['ensemble_method'] = self.source_ensemble_method.output
                self.plot_estimator.inputs['ensemble_size'] = self.source_ensemble_size.output
                self.plot_estimator.inputs['label_type'] = self.source_LabelType.output
                pinfo = self.source_patientclass_test.output
                self.plot_estimator.inputs['prediction'] = self.source_trained_model.output
                self.plot_estimator.inputs['pinfo'] = pinfo
                
                # Performance output
                self.sink_performance = self.network.create_sink('JsonFile', id='performance', step_id='general_sinks')
                self.sink_performance.input = self.plot_estimator.outputs['output_json']

                if self.masks_normalize_test:
                    self.sources_masks_normalize_test = dict()

                # -----------------------------------------------------
                # Optionally, add ComBat Harmonization. Currently done
                # on full dataset, not in a cross-validation
                if use_ComBat == 'True':
                    message = '[ERROR] If you want to use ComBat, you need to provide training images or features as well.'
                    raise WORCexceptions.WORCNotImplementedError(message)

                if not self.features_test:
                    # Create nodes to compute features
                    # General
                    self.sources_parameters = dict()
                    self.source_config_pyradiomics = dict()
                    self.source_toolbox_name = dict()

                    # testing only
                    self.calcfeatures_test = dict()
                    self.featureconverter_test = dict()
                    self.preprocessing_test = dict()
                    self.sources_images_test = dict()
                    self.sinks_features_test = dict()
                    self.sinks_configs = dict()
                    self.converters_im_test = dict()
                    self.converters_seg_test = dict()
                    self.links_C1_test = dict()

                    self.featurecalculators = dict()

                    # Check which nodes are necessary
                    if not self.segmentations_test:
                        message = "No automatic segmentation method is yet implemented."
                        raise WORCexceptions.WORCNotImplementedError(message)

                    elif len(self.segmentations_test) == len(image_types):
                        # Segmentations provided
                        self.sources_segmentations_test = dict()
                        self.segmode = 'Provided'

                    elif len(self.segmentations_test) == 1:
                        # Assume segmentations need to be registered to other modalities
                        print('\t - Adding Elastix node for image registration.')
                        self.add_elastix_sourcesandsinks()
                        pass

                    else:
                        nseg = len(self.segmentations_test)
                        nim = len(image_types)
                        m = f'Length of segmentations for testing is ' +\
                            f'{nseg}: should be equal to number of images' +\
                            f' ({nim}) or 1 when using registration.'
                        raise WORCexceptions.WORCValueError(m)

                    if use_segmentix == 'True':
                        # Use the segmentix toolbox for segmentation processing
                        print('\t - Adding segmentix node for segmentation preprocessing.')
                        self.sinks_segmentations_segmentix_test = dict()
                        self.sources_masks_test = dict()
                        self.converters_masks_test = dict()
                        self.nodes_segmentix_test = dict()

                    if self.semantics_test:
                        # Semantic features are supplied
                        self.sources_semantics_test = dict()

                    if self.metadata_test:
                        # Metadata to extract patient features from is supplied
                        self.sources_metadata_test = dict()

                    # Create a part of the pipeline for each modality
                    self.modlabels = list()
                    for nmod, mod in enumerate(image_types):
                        # Extract some modality specific config info 
                        if type(self.configs[conf_it]) == str:
                            # Config is a .ini file, load
                            temp_conf = config_io.load_config(self.configs[nmod])
                        else:
                            temp_conf = self.configs[nmod]
                        
                        # Create label for each modality/image
                        num = 0
                        label = mod + '_' + str(num)
                        while label in self.calcfeatures_test.keys():
                            # if label already exists, add number to label
                            num += 1
                            label = mod + '_' + str(num)
                        self.modlabels.append(label)

                        # Create required sources and sinks
                        self.sources_parameters[label] = self.network.create_source('ParameterFile', id=f'config_{label}', step_id='general_sources')
                        self.sources_images_test[label] = self.network.create_source('ITKImageFile', id='images_test_' + label, node_group='test', step_id='test_sources')

                        if self.metadata_test and len(self.metadata_test) >= nmod + 1:
                            self.sources_metadata_test[label] = self.network.create_source('DicomImageFile', id='metadata_test_' + label, node_group='test', step_id='test_sources')
                            
                        if self.masks_test and len(self.masks_test) >= nmod + 1:
                            # Create mask source and convert
                            self.sources_masks_test[label] = self.network.create_source('ITKImageFile', id='mask_test_' + label, node_group='test', step_id='test_sources')
                            memory = self.fastr_memory_parameters['WORCCastConvert']
                            self.converters_masks_test[label] =\
                                self.network.create_node('worc/WORCCastConvert:0.3.2',
                                                         tool_version='0.1',
                                                         id='convert_mask_test_' + label,
                                                         node_group='test',
                                                         resources=ResourceLimit(memory=memory),
                                                         step_id='FileConversion')

                            self.converters_masks_test[label].inputs['image'] = self.sources_masks_test[label].output

                        # First convert the images
                        if any(modality in mod for modality in all_modalities):
                            # Use WORC PXCastConvet for converting image formats
                            memory = self.fastr_memory_parameters['WORCCastConvert']
                            self.converters_im_test[label] =\
                                self.network.create_node('worc/WORCCastConvert:0.3.2',
                                                            tool_version='0.1',
                                                            id='convert_im_test_' + label,
                                                            resources=ResourceLimit(memory=memory),
                                                            step_id='FileConversion')

                        else:
                            raise WORCexceptions.WORCTypeError(('No valid image type for modality {}: {} provided.').format(str(nmod), mod))

                        # Create required links
                        self.converters_im_test[label].inputs['image'] = self.sources_images_test[label].output

                        # -----------------------------------------------------
                        # Preprocessing
                        preprocess_node = str(temp_conf['General']['Preprocessing'])
                        print('\t - Adding preprocessing node for image preprocessing.')
                        self.add_preprocessing(preprocess_node, label, nmod)

                        # -----------------------------------------------------
                        # Feature calculation
                        feature_calculators =\
                            temp_conf['General']['FeatureCalculators']
                        if not isinstance(feature_calculators, list):
                            # Configparser object, need to split string
                            feature_calculators = feature_calculators.strip('][').split(', ')
                            self.featurecalculators[label] = [f.split('/')[0] for f in feature_calculators]
                        else:
                            self.featurecalculators[label] = feature_calculators
                        

                        # Add lists for feature calculation and converter objects
                        self.calcfeatures_test[label] = list()
                        self.featureconverter_test[label] = list()

                        for f in feature_calculators:
                            print(f'\t - Adding feature calculation node: {f}.')
                            self.add_feature_calculator(f, label, nmod)

                        # -----------------------------------------------------
                        # Create the neccesary nodes for the segmentation
                        if self.segmode == 'Provided':
                            # Segmentation ----------------------------------------------------
                            # Use the provided segmantions for each modality
                            memory = self.fastr_memory_parameters['WORCCastConvert']
                            self.sources_segmentations_test[label] =\
                                self.network.create_source('ITKImageFile',
                                                            id='segmentations_test_' + label,
                                                            node_group='test',
                                                            step_id='test_sources')

                            self.converters_seg_test[label] =\
                                self.network.create_node('worc/WORCCastConvert:0.3.2',
                                                            tool_version='0.1',
                                                            id='convert_seg_test_' + label,
                                                            resources=ResourceLimit(memory=memory),
                                                            step_id='FileConversion')

                            self.converters_seg_test[label].inputs['image'] =\
                                self.sources_segmentations_test[label].output

                        elif self.segmode == 'Register':
                            # ---------------------------------------------
                            # Registration nodes: Align segmentation of first
                            # modality to others using registration with Elastix
                            self.add_elastix(label, nmod)

                        # -----------------------------------------------------
                        # Optionally, add segmentix, the in-house segmentation
                        # processor of WORC
                        if temp_conf['General']['Segmentix'] == 'True':
                            self.add_segmentix(label, nmod)
                        elif temp_conf['Preprocessing']['Resampling'] == 'True':
                            raise WORCexceptions.WORCValueError('If you use resampling, ' +
                                                 'have to use segmentix to ' +
                                                 ' make sure the mask is ' +
                                                 'also resampled. Please ' +
                                                 'set ' +
                                                 'config["General"]["Segmentix"]' +
                                                 'to "True".')

                        else:
                            # Provide source or elastix segmentations to
                            # feature calculator
                            for i_node in range(len(self.calcfeatures_test[label])):
                                if self.segmode == 'Provided':
                                    self.calcfeatures_test[label][i_node].inputs['segmentation'] =\
                                        self.converters_seg_test[label].outputs['image']
                                elif self.segmode == 'Register':
                                    if nmod > 0:
                                        self.calcfeatures_test[label][i_node].inputs['segmentation'] =\
                                            self.transformix_seg_nodes_test[label].outputs['image']
                                    else:
                                        self.calcfeatures_test[label][i_node].inputs['segmentation'] =\
                                            self.converters_seg_test[label].outputs['image']

                        # -----------------------------------------------------
                        # Optionally, add ComBat Harmonization
                        if use_ComBat == 'True':
                            # Link features to ComBat
                            self.links_Combat1_test[label] = list()
                            for i_node, fname in enumerate(self.featurecalculators[label]):
                                self.links_Combat1_test[label].append(self.ComBat.inputs['features_test'][f'{label}_{self.featurecalculators[label][i_node]}'] << self.featureconverter_test[label][i_node].outputs['feat_out'])
                                self.links_Combat1_test[label][i_node].collapse = 'test'

                        # -----------------------------------------------------
                        # Output the features
                        # Add the features from this modality to the classifier node input
                        self.links_C1_test[label] = list()
                        self.sinks_features_test[label] = list()

                        for i_node, fname in enumerate(self.featurecalculators[label]):
                            # Create sink for feature outputs
                            node_id = 'features_test_' + label + '_' + fname
                            node_id = node_id.replace(':', '_').replace('.', '_').replace('/', '_')
                            self.sinks_features_test[label].append(self.network.create_sink('HDF5', id=node_id, step_id='test_sinks'))

                            # Save output
                            self.sinks_features_test[label][i_node].input = self.featureconverter_test[label][i_node].outputs['feat_out']

                else:
                    # Features already provided: hence we can skip numerous nodes
                    self.sources_features_train = dict()
                    self.links_C1_train = dict()

                    if self.features_test:
                        self.sources_features_test = dict()
                        self.links_C1_test = dict()

                    # Create label for each modality/image
                    self.modlabels = list()
                    for num, mod in enumerate(image_types):
                        num = 0
                        label = mod + str(num)
                        while label in self.sources_features_train.keys():
                            # if label exists, add number to label
                            num += 1
                            label = mod + str(num)
                        self.modlabels.append(label)

                        # Create a node for the features
                        self.sources_features_test[label] = self.network.create_source('HDF5', id='features_test_' + label, node_group='test', step_id='test_sources')

            else:
                raise WORCexceptions.WORCIOError("Please provide labels for training, i.e., WORC.labels_train or SimpleWORC.labels_from_this_file.")
        else:
            raise WORCexceptions.WORCIOError("Please provide either images or features.")
        
[docs]    def add_fingerprinter(self, id, type, config_source):
        """Add WORC Fingerprinter to the network.

        Note: applied per imaging sequence, or per feature file if no
        images are present.
        """
        # Add fingerprinting tool
        memory = self.fastr_memory_parameters['Fingerprinter']
        fingerprinter_node = self.network.create_node('worc/Fingerprinter:1.0',
                                                      tool_version='1.0',
                                                      id=f'fingerprinter_{id}',
                                                      resources=ResourceLimit(memory=memory),
                                                      step_id='FingerPrinting')

        # Add general sources to fingerprinting node
        fingerprinter_node.inputs['config'] = config_source
        fingerprinter_node.inputs['patientclass_train'] = self.source_patientclass_train.output

        # Add type input
        valid_types = ['classification', 'images']
        if type not in valid_types:
            raise WORCexceptions.WORCValueError(f'Type {type} is not valid for fingeprinting. Should be one of {valid_types}.')

        type_node = self.network.create_constant('String', type,
                                                 id=f'type_fingerprint_{id}',
                                                 node_group='train',
                                                 step_id='FingerPrinting')
        fingerprinter_node.inputs['type'] = type_node.output

        # Add to list of fingerprinting nodes
        self.node_fingerprinters[id] = fingerprinter_node

[docs]    def add_ComBat(self):
        """Add ComBat harmonization to the network.

        Note: applied on all objects, not in a train-test or cross-val setting.
        """
        memory = self.fastr_memory_parameters['ComBat']
        self.ComBat =\
            self.network.create_node('combat/ComBat:1.0',
                                     tool_version='1.0',
                                     id='ComBat',
                                     resources=ResourceLimit(memory=memory),
                                     step_id='ComBat')

        # Create sink for ComBat output
        self.sinks_features_train_ComBat = self.network.create_sink('HDF5', id='features_train_ComBat', step_id='ComBat')

        # Create links for inputs
        if self.configs[0]['General']['Fingerprint'] == 'True':
            self.link_combat_1 = self.network.create_link(self.node_fingerprinters['classification'].outputs['config'], self.ComBat.inputs['config'])
        else:
            self.link_combat_1 = self.network.create_link(self.source_class_config.output, self.ComBat.inputs['config'])

        self.link_combat_2 = self.network.create_link(self.source_patientclass_train.output, self.ComBat.inputs['patientclass_train'])
        self.link_combat_1.collapse = 'conf'
        self.link_combat_2.collapse = 'pctrain'
        self.links_Combat1_train = dict()
        self.links_Combat1_test = dict()

        # Link Combat output to both sink and classify node
        self.links_Combat_out_train = self.network.create_link(self.ComBat.outputs['features_train_out'], self.classify.inputs['features_train'])
        self.links_Combat_out_train.collapse = 'ComBat'
        self.sinks_features_train_ComBat.input = self.ComBat.outputs['features_train_out']

        if self.TrainTest or self.OnlyTest:
            # Create sink for ComBat output
            self.sinks_features_test_ComBat = self.network.create_sink('HDF5', id='features_test_ComBat', step_id='ComBat')

            # Create links for inputs
            self.link_combat_3 = self.network.create_link(self.source_patientclass_test.output, self.ComBat.inputs['patientclass_test'])
            self.link_combat_3.collapse = 'pctest'

            # Link Combat output to both sink and classify node
            self.links_Combat_out_test = self.network.create_link(self.ComBat.outputs['features_test_out'], self.classify.inputs['features_test'])
            self.links_Combat_out_test.collapse = 'ComBat'
            self.sinks_features_test_ComBat.input = self.ComBat.outputs['features_test_out']

[docs]    def add_preprocessing(self, preprocess_node, label, nmod):
        """Add nodes required for preprocessing of images."""
        
        # Extract some general information on the setup
        if type(self.configs[0]) == str:
            # Config is a .ini file, load
            temp_conf = config_io.load_config(self.configs[nmod])
        else:
            temp_conf = self.configs[nmod]
        
        memory = self.fastr_memory_parameters['Preprocessing']
        if not self.OnlyTest:
            self.preprocessing_train[label] = self.network.create_node(preprocess_node, tool_version='1.0', id='preprocessing_train_' + label, resources=ResourceLimit(memory=memory), step_id='Preprocessing')
        
        if self.TrainTest:
            self.preprocessing_test[label] = self.network.create_node(preprocess_node, tool_version='1.0', id='preprocessing_test_' + label, resources=ResourceLimit(memory=memory), step_id='Preprocessing')

        # Create required links
        if not self.OnlyTest:
            if temp_conf['General']['Fingerprint'] == 'True':
                self.preprocessing_train[label].inputs['parameters'] = self.node_fingerprinters[label].outputs['config']
            else:
                self.preprocessing_train[label].inputs['parameters'] = self.sources_parameters[label].output

            self.preprocessing_train[label].inputs['image'] = self.converters_im_train[label].outputs['image']

        if self.TrainTest:
            if temp_conf['General']['Fingerprint'] == 'True' and not self.OnlyTest:
                self.preprocessing_test[label].inputs['parameters'] = self.node_fingerprinters[label].outputs['config']
            else:
                self.preprocessing_test[label].inputs['parameters'] = self.sources_parameters[label].output

            self.preprocessing_test[label].inputs['image'] = self.converters_im_test[label].outputs['image']

        if self.metadata_train and len(self.metadata_train) >= nmod + 1:
            self.preprocessing_train[label].inputs['metadata'] = self.sources_metadata_train[label].output

        if self.metadata_test and len(self.metadata_test) >= nmod + 1:
            self.preprocessing_test[label].inputs['metadata'] = self.sources_metadata_test[label].output

        # If there are masks to use in normalization, add them here
        if self.masks_normalize_train:
            self.sources_masks_normalize_train[label] = self.network.create_source('ITKImageFile', id='masks_normalize_train_' + label, node_group='train', step_id='Preprocessing')
            self.preprocessing_train[label].inputs['mask'] = self.sources_masks_normalize_train[label].output

        if self.masks_normalize_test:
            self.sources_masks_normalize_test[label] = self.network.create_source('ITKImageFile', id='masks_normalize_test_' + label, node_group='test', step_id='Preprocessing')
            self.preprocessing_test[label].inputs['mask'] = self.sources_masks_normalize_test[label].output

[docs]    def add_feature_calculator(self, calcfeat_node, label, nmod):
        """Add a feature calculation node to the network."""
        # Name of fastr node has to exclude some specific symbols, which
        # are used in the node name
        node_ID = '_'.join([calcfeat_node.replace(':', '_').replace('.', '_').replace('/', '_'),
                            label])

        memory = self.fastr_memory_parameters['FeatureCalculator']
        if not self.OnlyTest:
            node_train =\
                self.network.create_node(calcfeat_node,
                                        tool_version='1.0',
                                        id='calcfeatures_train_' + node_ID,
                                        resources=ResourceLimit(memory=memory),
                                        step_id='Feature_Extraction')

        if self.TrainTest:
            node_test =\
                self.network.create_node(calcfeat_node,
                                         tool_version='1.0',
                                         id='calcfeatures_test_' + node_ID,
                                         resources=ResourceLimit(memory=memory),
                                         step_id='Feature_Extraction')

        # Check if we need to add pyradiomics specific sources
        if 'pyradiomics' in calcfeat_node.lower():
            if self.configs[0]['General']['Fingerprint'] != 'True':
                # Add a config source
                self.source_config_pyradiomics[label] =\
                    self.network.create_source('YamlFile',
                                               id='config_pyradiomics_' + label,
                                               node_group='train',
                                               step_id='Feature_Extraction')

            # Add a format source, which we are going to set to a constant
            # And attach to the tool node
            self.source_format_pyradiomics =\
                self.network.create_constant('String', 'csv',
                                             id='format_pyradiomics_' + label,
                                             node_group='train',
                                             step_id='Feature_Extraction')
            if not self.OnlyTest:
                node_train.inputs['format'] =\
                    self.source_format_pyradiomics.output

            if self.TrainTest:
                node_test.inputs['format'] =\
                    self.source_format_pyradiomics.output

        # Create required links
        # We can have a different config for different tools
        if not self.OnlyTest:
            if 'pyradiomics' in calcfeat_node.lower():
                if self.configs[0]['General']['Fingerprint'] != 'True':
                    node_train.inputs['parameters'] =\
                        self.source_config_pyradiomics[label].output
                else:
                    node_train.inputs['parameters'] =\
                        self.node_fingerprinters[label].outputs['config_pyradiomics']
            else:
                if self.configs[0]['General']['Fingerprint'] == 'True':
                    node_train.inputs['parameters'] =\
                        self.node_fingerprinters[label].outputs['config']
                else:
                    node_train.inputs['parameters'] =\
                        self.sources_parameters[label].output

            node_train.inputs['image'] =\
                self.preprocessing_train[label].outputs['image']

        if self.OnlyTest:
            if 'pyradiomics' in calcfeat_node.lower():
                node_test.inputs['parameters'] =\
                    self.source_config_pyradiomics[label].output
            else:
                node_test.inputs['parameters'] =\
                    self.sources_parameters[label].output

            node_test.inputs['image'] =\
                self.preprocessing_test[label].outputs['image']
                       
        elif self.TrainTest:
            if 'pyradiomics' in calcfeat_node.lower():
                if self.configs[0]['General']['Fingerprint'] != 'True':
                    node_test.inputs['parameters'] =\
                        self.source_config_pyradiomics[label].output
                else:
                    node_test.inputs['parameters'] =\
                        self.node_fingerprinters[label].outputs['config_pyradiomics']
            else:
                if self.configs[0]['General']['Fingerprint'] == 'True':
                    node_test.inputs['parameters'] =\
                        self.node_fingerprinters[label].outputs['config']
                else:
                    node_test.inputs['parameters'] =\
                        self.sources_parameters[label].output

            node_test.inputs['image'] =\
                self.preprocessing_test[label].outputs['image']

        # PREDICT can extract semantic and metadata features
        if 'predict' in calcfeat_node.lower():
            if self.metadata_train and len(self.metadata_train) >= nmod + 1:
                node_train.inputs['metadata'] =\
                    self.sources_metadata_train[label].output

            if self.metadata_test and len(self.metadata_test) >= nmod + 1:
                node_test.inputs['metadata'] =\
                    self.sources_metadata_test[label].output

            # If a semantics file is provided, connect to feature extraction tool
            if self.semantics_train and len(self.semantics_train) >= nmod + 1:
                self.sources_semantics_train[label] =\
                    self.network.create_source('CSVFile',
                                               id='semantics_train_' + label,
                                               step_id='train_sources')

                node_train.inputs['semantics'] =\
                    self.sources_semantics_train[label].output

            if self.semantics_test and len(self.semantics_test) >= nmod + 1:
                self.sources_semantics_test[label] =\
                    self.network.create_source('CSVFile',
                                               id='semantics_test_' + label,
                                               step_id='test_sources')
                node_test.inputs['semantics'] =\
                    self.sources_semantics_test[label].output

        # Add feature converter to make features WORC compatible
        if not self.OnlyTest:
            conv_train =\
                self.network.create_node('worc/FeatureConverter:1.0',
                                        tool_version='1.0',
                                        id='featureconverter_train_' + node_ID,
                                        resources=ResourceLimit(memory='4G'),
                                        step_id='Feature_Extraction')

            conv_train.inputs['feat_in'] = node_train.outputs['features']

        # Add source to tell converter which toolbox we use
        if 'pyradiomics' in calcfeat_node.lower():
            toolbox = 'PyRadiomics'
        elif 'predict' in calcfeat_node.lower():
            toolbox = 'PREDICT'
        else:
            message = f'Toolbox {calcfeat_node} not recognized!'
            raise WORCexceptions.WORCKeyError(message)

        self.source_toolbox_name[label] =\
            self.network.create_constant('String', toolbox,
                                         id=f'toolbox_name_{toolbox}_{label}',
                                         step_id='Feature_Extraction')

        if not self.OnlyTest:
            conv_train.inputs['toolbox'] = self.source_toolbox_name[label].output
            if self.configs[0]['General']['Fingerprint'] == 'True':
                conv_train.inputs['config'] =\
                    self.node_fingerprinters[label].outputs['config']
            else:
                conv_train.inputs['config'] = self.sources_parameters[label].output

        if self.TrainTest:
            conv_test =\
                self.network.create_node('worc/FeatureConverter:1.0',
                                         tool_version='1.0',
                                         id='featureconverter_test_' + node_ID,
                                         resources=ResourceLimit(memory='4G'),
                                         step_id='Feature_Extraction')

            conv_test.inputs['feat_in'] = node_test.outputs['features']
            conv_test.inputs['toolbox'] = self.source_toolbox_name[label].output
            if self.OnlyTest:
                conv_test.inputs['config'] =\
                    self.sources_parameters[label].output
            elif self.configs[0]['General']['Fingerprint'] == 'True':
                conv_test.inputs['config'] =\
                    self.node_fingerprinters[label].outputs['config']
            else:
                conv_test.inputs['config'] =\
                    self.sources_parameters[label].output

        # Append to nodes to list
        if not self.OnlyTest:
            self.calcfeatures_train[label].append(node_train)
            self.featureconverter_train[label].append(conv_train)
            
        if self.TrainTest:
            self.calcfeatures_test[label].append(node_test)
            self.featureconverter_test[label].append(conv_test)

[docs]    def add_elastix_sourcesandsinks(self):
        """Add sources and sinks required for image registration."""
        self.sources_segmentation = dict()
        self.segmode = 'Register'

        self.source_Elastix_Parameters = dict()
        
        if not self.OnlyTest:
            self.elastix_nodes_train = dict()
            self.transformix_seg_nodes_train = dict()
            self.sources_segmentations_train = dict()
            self.sinks_transformations_train = dict()
            self.sinks_segmentations_elastix_train = dict()
            self.sinks_images_elastix_train = dict()
            self.converters_seg_train = dict()
            self.edittransformfile_nodes_train = dict()
            self.transformix_im_nodes_train = dict()

        if self.TrainTest:
            self.elastix_nodes_test = dict()
            self.transformix_seg_nodes_test = dict()
            self.sources_segmentations_test = dict()
            self.sinks_transformations_test = dict()
            self.sinks_segmentations_elastix_test = dict()
            self.sinks_images_elastix_test = dict()
            self.converters_seg_test = dict()
            self.edittransformfile_nodes_test = dict()
            self.transformix_im_nodes_test = dict()

[docs]    def add_elastix(self, label, nmod):
        """ Add image registration through elastix to network."""
        # Create sources and converter for only for the given segmentation,
        # which should be on the first modality
        if nmod == 0:
            memory = self.fastr_memory_parameters['WORCCastConvert']
            if not self.OnlyTest:
                self.sources_segmentations_train[label] =\
                    self.network.create_source('ITKImageFile',
                                            id='segmentations_train_' + label,
                                            node_group='train',
                                            step_id='train_sources')

                self.converters_seg_train[label] =\
                    self.network.create_node('worc/WORCCastConvert:0.3.2',
                                            tool_version='0.1',
                                            id='convert_seg_train_' + label,
                                            resources=ResourceLimit(memory=memory),
                                            step_id='FileConversion')

                self.converters_seg_train[label].inputs['image'] =\
                    self.sources_segmentations_train[label].output

            if self.TrainTest:
                self.sources_segmentations_test[label] =\
                    self.network.create_source('ITKImageFile',
                                               id='segmentations_test_' + label,
                                               node_group='test',
                                               step_id='test_sources')

                self.converters_seg_test[label] =\
                    self.network.create_node('worc/WORCCastConvert:0.3.2',
                                             tool_version='0.1',
                                             id='convert_seg_test_' + label,
                                             resources=ResourceLimit(memory=memory),
                                             step_id='FileConversion')

                self.converters_seg_test[label].inputs['image'] =\
                    self.sources_segmentations_test[label].output

        # Assume provided segmentation is on first modality
        if nmod > 0:
            # Use elastix and transformix for registration
            # NOTE: Assume elastix node type is on first configuration
            elastix_node =\
                str(self.configs[0]['General']['RegistrationNode'])

            transformix_node =\
                str(self.configs[0]['General']['TransformationNode'])

            memory_elastix = self.fastr_memory_parameters['Elastix']
            if not self.OnlyTest:
                self.elastix_nodes_train[label] =\
                    self.network.create_node(elastix_node,
                                            tool_version='0.2',
                                            id='elastix_train_' + label,
                                            resources=ResourceLimit(memory=memory_elastix),
                                            step_id='Image_Registration')

                memory_transformix = self.fastr_memory_parameters['Elastix']
                self.transformix_seg_nodes_train[label] =\
                    self.network.create_node(transformix_node,
                                            tool_version='0.2',
                                            id='transformix_seg_train_' + label,
                                            resources=ResourceLimit(memory=memory_transformix),
                                            step_id='Image_Registration')

                self.transformix_im_nodes_train[label] =\
                    self.network.create_node(transformix_node,
                                            tool_version='0.2',
                                            id='transformix_im_train_' + label,
                                            resources=ResourceLimit(memory=memory_transformix),
                                            step_id='Image_Registration')

            if self.TrainTest:
                self.elastix_nodes_test[label] =\
                    self.network.create_node(elastix_node,
                                             tool_version='0.2',
                                             id='elastix_test_' + label,
                                             resources=ResourceLimit(memory=memory_elastix),
                                             step_id='Image_Registration')

                self.transformix_seg_nodes_test[label] =\
                    self.network.create_node(transformix_node,
                                             tool_version='0.2',
                                             id='transformix_seg_test_' + label,
                                             resources=ResourceLimit(memory=memory_transformix),
                                             step_id='Image_Registration')

                self.transformix_im_nodes_test[label] =\
                    self.network.create_node(transformix_node,
                                             tool_version='0.2',
                                             id='transformix_im_test_' + label,
                                             resources=ResourceLimit(memory=memory_transformix),
                                             step_id='Image_Registration')

            # Create sources_segmentation
            # M1 = moving, others = fixed
            if not self.OnlyTest:
                self.elastix_nodes_train[label].inputs['fixed_image'] =\
                    self.converters_im_train[label].outputs['image']

                self.elastix_nodes_train[label].inputs['moving_image'] =\
                    self.converters_im_train[self.modlabels[0]].outputs['image']

            # Add node that copies metadata from the image to the
            # segmentation if required
            if self.CopyMetadata and not self.OnlyTest:
                # Copy metadata from the image which was registered to
                # the segmentation, if it is not created yet
                if not hasattr(self, "copymetadata_nodes_train"):
                    # NOTE: Do this for first modality, as we assume
                    # the segmentation is on that one
                    self.copymetadata_nodes_train = dict()
                    self.copymetadata_nodes_train[self.modlabels[0]] =\
                        self.network.create_node('itktools/0.3.2/CopyMetadata:1.0',
                                                 tool_version='1.0',
                                                 id='CopyMetadata_train_' + self.modlabels[0],
                                                 step_id='Image_Registration')

                    self.copymetadata_nodes_train[self.modlabels[0]].inputs["source"] =\
                        self.converters_im_train[self.modlabels[0]].outputs['image']

                    self.copymetadata_nodes_train[self.modlabels[0]].inputs["destination"] =\
                        self.converters_seg_train[self.modlabels[0]].outputs['image']

                self.transformix_seg_nodes_train[label].inputs['image'] =\
                    self.copymetadata_nodes_train[self.modlabels[0]].outputs['output']
            else:
                self.transformix_seg_nodes_train[label].inputs['image'] =\
                    self.converters_seg_train[self.modlabels[0]].outputs['image']

            if self.TrainTest:
                self.elastix_nodes_test[label].inputs['fixed_image'] =\
                    self.converters_im_test[label].outputs['image']
                self.elastix_nodes_test[label].inputs['moving_image'] =\
                    self.converters_im_test[self.modlabels[0]].outputs['image']

                if self.CopyMetadata:
                    # Copy metadata from the image which was registered
                    # to the segmentation
                    if not hasattr(self, "copymetadata_nodes_test"):
                        # NOTE: Do this for first modality, as we assume
                        # the segmentation is on that one
                        self.copymetadata_nodes_test = dict()
                        self.copymetadata_nodes_test[self.modlabels[0]] =\
                            self.network.create_node('itktools/0.3.2/CopyMetadata:1.0',
                                                     tool_version='1.0',
                                                     id='CopyMetadata_test_' + self.modlabels[0],
                                                     step_id='Image_Registration')

                        self.copymetadata_nodes_test[self.modlabels[0]].inputs["source"] =\
                            self.converters_im_test[self.modlabels[0]].outputs['image']

                        self.copymetadata_nodes_test[self.modlabels[0]].inputs["destination"] =\
                            self.converters_seg_test[self.modlabels[0]].outputs['image']

                    self.transformix_seg_nodes_test[label].inputs['image'] =\
                        self.copymetadata_nodes_test[self.modlabels[0]].outputs['output']
                else:
                    self.transformix_seg_nodes_test[label].inputs['image'] =\
                        self.converters_seg_test[self.modlabels[0]].outputs['image']

            # Apply registration to input modalities
            self.source_Elastix_Parameters[label] =\
                self.network.create_source('ElastixParameterFile',
                                           id='Elastix_Para_' + label,
                                           node_group='elpara',
                                           step_id='Image_Registration')
            if not self.OnlyTest:
                self.link_elparam_train =\
                    self.network.create_link(self.source_Elastix_Parameters[label].output,
                                            self.elastix_nodes_train[label].inputs['parameters'])

                self.link_elparam_train.collapse = 'elpara'

            if self.TrainTest:
                self.link_elparam_test =\
                    self.network.create_link(self.source_Elastix_Parameters[label].output,
                                             self.elastix_nodes_test[label].inputs['parameters'])
                self.link_elparam_test.collapse = 'elpara'

            if self.masks_train:
                self.elastix_nodes_train[label].inputs['fixed_mask'] =\
                    self.converters_masks_train[label].outputs['image']

                self.elastix_nodes_train[label].inputs['moving_mask'] =\
                    self.converters_masks_train[self.modlabels[0]].outputs['image']

            if self.TrainTest:
                if self.masks_test:
                    self.elastix_nodes_test[label].inputs['fixed_mask'] =\
                        self.converters_masks_test[label].outputs['image']

                    self.elastix_nodes_test[label].inputs['moving_mask'] =\
                        self.converters_masks_test[self.modlabels[0]].outputs['image']

            # Change the FinalBSpline Interpolation order to 0 as required for binarie images: see https://github.com/SuperElastix/elastix/wiki/FAQ
            if not self.OnlyTest:
                self.edittransformfile_nodes_train[label] =\
                    self.network.create_node('elastixtools/EditElastixTransformFile:0.1',
                                            tool_version='0.1',
                                            id='EditElastixTransformFile_train_' + label,
                                            step_id='Image_Registration')

                self.edittransformfile_nodes_train[label].inputs['set'] =\
                    ["FinalBSplineInterpolationOrder=0"]

                self.edittransformfile_nodes_train[label].inputs['transform'] =\
                    self.elastix_nodes_train[label].outputs['transform'][-1]

            if self.TrainTest:
                self.edittransformfile_nodes_test[label] =\
                    self.network.create_node('elastixtools/EditElastixTransformFile:0.1',
                                             tool_version='0.1',
                                             id='EditElastixTransformFile_test_' + label,
                                             step_id='Image_Registration')

                self.edittransformfile_nodes_test[label].inputs['set'] =\
                    ["FinalBSplineInterpolationOrder=0"]

                self.edittransformfile_nodes_test[label].inputs['transform'] =\
                    self.elastix_nodes_test[label].outputs['transform'][-1]

            # Link data and transformation to transformix and source
            if not self.OnlyTest:
                self.transformix_seg_nodes_train[label].inputs['transform'] =\
                    self.edittransformfile_nodes_train[label].outputs['transform']

                self.transformix_im_nodes_train[label].inputs['transform'] =\
                    self.elastix_nodes_train[label].outputs['transform'][-1]

                self.transformix_im_nodes_train[label].inputs['image'] =\
                    self.converters_im_train[self.modlabels[0]].outputs['image']

            if self.TrainTest:
                self.transformix_seg_nodes_test[label].inputs['transform'] =\
                    self.edittransformfile_nodes_test[label].outputs['transform']

                self.transformix_im_nodes_test[label].inputs['transform'] =\
                    self.elastix_nodes_test[label].outputs['transform'][-1]

                self.transformix_im_nodes_test[label].inputs['image'] =\
                    self.converters_im_test[self.modlabels[0]].outputs['image']

            if self.configs[nmod]['General']['Segmentix'] != 'True':
                if not self.OnlyTest:
                    # These segmentations serve as input for the feature calculation
                    for i_node in range(len(self.calcfeatures_train[label])):
                        self.calcfeatures_train[label][i_node].inputs['segmentation'] =\
                            self.transformix_seg_nodes_train[label].outputs['image']
                        if self.TrainTest:
                            self.calcfeatures_test[label][i_node].inputs['segmentation'] =\
                                self.transformix_seg_nodes_test[label].outputs['image']
                else:
                    for i_node in range(len(self.calcfeatures_test[label])):
                        self.calcfeatures_test[label][i_node].inputs['segmentation'] =\
                            self.transformix_seg_nodes_test[label].outputs['image']

            # Save outputfor the training set
            if not self.OnlyTest:
                self.sinks_transformations_train[label] =\
                    self.network.create_sink('ElastixTransformFile',
                                            id='transformations_train_' + label,
                                            step_id='train_sinks')

                self.sinks_segmentations_elastix_train[label] =\
                    self.network.create_sink('ITKImageFile',
                                            id='segmentations_out_elastix_train_' + label,
                                            step_id='train_sinks')

                self.sinks_images_elastix_train[label] =\
                    self.network.create_sink('ITKImageFile',
                                            id='images_out_elastix_train_' + label,
                                            step_id='train_sinks')

                self.sinks_transformations_train[label].input =\
                    self.elastix_nodes_train[label].outputs['transform']

                self.sinks_segmentations_elastix_train[label].input =\
                    self.transformix_seg_nodes_train[label].outputs['image']

                self.sinks_images_elastix_train[label].input =\
                    self.transformix_im_nodes_train[label].outputs['image']

            # Save output for the test set
            if self.TrainTest:
                self.sinks_transformations_test[label] =\
                    self.network.create_sink('ElastixTransformFile',
                                             id='transformations_test_' + label,
                                             step_id='test_sinks')

                self.sinks_segmentations_elastix_test[label] =\
                    self.network.create_sink('ITKImageFile',
                                             id='segmentations_out_elastix_test_' + label,
                                             step_id='test_sinks')
                self.sinks_images_elastix_test[label] =\
                    self.network.create_sink('ITKImageFile',
                                             id='images_out_elastix_test_' + label,
                                             step_id='test_sinks')
                self.sinks_transformations_test[label].input =\
                    self.elastix_nodes_test[label].outputs['transform']
                self.sinks_segmentations_elastix_test[label].input =\
                    self.transformix_seg_nodes_test[label].outputs['image']
                self.sinks_images_elastix_test[label].input =\
                    self.transformix_im_nodes_test[label].outputs['image']

[docs]    def add_segmentix(self, label, nmod):
        """Add segmentix to the network."""
        # Segmentix nodes -------------------------------------------------
        # Use segmentix node to convert input segmentation into
        # correct contour
        if not self.OnlyTest:
            if label not in self.sinks_segmentations_segmentix_train:
                self.sinks_segmentations_segmentix_train[label] =\
                    self.network.create_sink('ITKImageFile',
                                            id='segmentations_out_segmentix_train_' + label,
                                            step_id='train_sinks')

            memory = self.fastr_memory_parameters['Segmentix']
            self.nodes_segmentix_train[label] =\
                self.network.create_node('segmentix/Segmentix:1.0',
                                        tool_version='1.0',
                                        id='segmentix_train_' + label,
                                        resources=ResourceLimit(memory=memory),
                                        step_id='Preprocessing')

            # Input the image
            self.nodes_segmentix_train[label].inputs['image'] =\
                self.converters_im_train[label].outputs['image']

        # Input the metadata
        if self.metadata_train and len(self.metadata_train) >= nmod + 1:
            self.nodes_segmentix_train[label].inputs['metadata'] = self.sources_metadata_train[label].output

        # Input the segmentation
        if not self.OnlyTest:
            if hasattr(self, 'transformix_seg_nodes_train'):
                if label in self.transformix_seg_nodes_train.keys():
                    # Use output of registration in segmentix
                    self.nodes_segmentix_train[label].inputs['segmentation_in'] =\
                        self.transformix_seg_nodes_train[label].outputs['image']
                else:
                    # Use original segmentation
                    self.nodes_segmentix_train[label].inputs['segmentation_in'] =\
                        self.converters_seg_train[label].outputs['image']
            else:
                # Use original segmentation
                self.nodes_segmentix_train[label].inputs['segmentation_in'] =\
                    self.converters_seg_train[label].outputs['image']

        # Input the parameters
        if not self.OnlyTest:
            if self.configs[0]['General']['Fingerprint'] == 'True':
                self.nodes_segmentix_train[label].inputs['parameters'] =\
                    self.node_fingerprinters[label].outputs['config']
            else:
                self.nodes_segmentix_train[label].inputs['parameters'] =\
                    self.sources_parameters[label].output

            self.sinks_segmentations_segmentix_train[label].input =\
                self.nodes_segmentix_train[label].outputs['segmentation_out']

        if self.TrainTest:
            self.sinks_segmentations_segmentix_test[label] =\
                self.network.create_sink('ITKImageFile',
                                         id='segmentations_out_segmentix_test_' + label,
                                         step_id='test_sinks')

            self.nodes_segmentix_test[label] =\
                self.network.create_node('segmentix/Segmentix:1.0',
                                         tool_version='1.0',
                                         id='segmentix_test_' + label,
                                         resources=ResourceLimit(memory=memory),
                                         step_id='Preprocessing')

            # Input the image
            self.nodes_segmentix_test[label].inputs['image'] =\
                self.converters_im_test[label].outputs['image']

            # Input the metadata
            if self.metadata_test and len(self.metadata_test) >= nmod + 1:
                self.nodes_segmentix_test[label].inputs['metadata'] = self.sources_metadata_test[label].output

            if hasattr(self, 'transformix_seg_nodes_test'):
                if label in self.transformix_seg_nodes_test.keys():
                    # Use output of registration in segmentix
                    self.nodes_segmentix_test[label].inputs['segmentation_in'] =\
                        self.transformix_seg_nodes_test[label].outputs['image']
                else:
                    # Use original segmentation
                    self.nodes_segmentix_test[label].inputs['segmentation_in'] =\
                        self.converters_seg_test[label].outputs['image']
            else:
                # Use original segmentation
                self.nodes_segmentix_test[label].inputs['segmentation_in'] =\
                    self.converters_seg_test[label].outputs['image']

            if self.configs[0]['General']['Fingerprint'] == 'True' and not self.OnlyTest:
                self.nodes_segmentix_test[label].inputs['parameters'] =\
                    self.node_fingerprinters[label].outputs['config']
            else:
                self.nodes_segmentix_test[label].inputs['parameters'] =\
                    self.sources_parameters[label].output

            self.sinks_segmentations_segmentix_test[label].input =\
                self.nodes_segmentix_test[label].outputs['segmentation_out']

        if not self.OnlyTest:
            for i_node in range(len(self.calcfeatures_train[label])):
                self.calcfeatures_train[label][i_node].inputs['segmentation'] =\
                    self.nodes_segmentix_train[label].outputs['segmentation_out']

                if self.TrainTest:
                    self.calcfeatures_test[label][i_node].inputs['segmentation'] =\
                        self.nodes_segmentix_test[label].outputs['segmentation_out']
        else:
            for i_node in range(len(self.calcfeatures_test[label])):
                self.calcfeatures_test[label][i_node].inputs['segmentation'] =\
                    self.nodes_segmentix_test[label].outputs['segmentation_out']
            
        if self.masks_train and len(self.masks_train) >= nmod + 1:
            # Use masks
            self.nodes_segmentix_train[label].inputs['mask'] =\
                self.converters_masks_train[label].outputs['image']

        if self.masks_test and len(self.masks_test) >= nmod + 1:
            # Use masks
            self.nodes_segmentix_test[label].inputs['mask'] =\
                self.converters_masks_test[label].outputs['image']

[docs]    def set(self):
        """Set the FASTR source and sink data based on the given attributes."""
        self.fastrconfigs = list()
        self.source_data = dict()
        self.sink_data = dict()

        # Save the configurations as files
        if not self.OnlyTest:
            self.save_config()
        else:
            self.fastrconfigs = self.configs

        # fixed splits
        if self.fixedsplits:
            self.source_data['fixedsplits_source'] = self.fixedsplits

        # Set source and sink data
        self.source_data['patientclass_train'] = self.labels_train
        self.source_data['patientclass_test'] = self.labels_test
        self.source_data['trained_model'] = self.trained_model

        self.sink_data['classification'] = ("vfs://output/{}/estimator_{{sample_id}}_{{cardinality}}{{ext}}").format(self.name)
        self.sink_data['performance'] = ("vfs://output/{}/performance_{{sample_id}}_{{cardinality}}{{ext}}").format(self.name)
        self.sink_data['smac_results'] = ("vfs://output/{}/smac_results_{{sample_id}}_{{cardinality}}{{ext}}").format(self.name)
        self.sink_data['config_classification_sink'] = ("vfs://output/{}/config_{{sample_id}}_{{cardinality}}{{ext}}").format(self.name)
        self.sink_data['features_train_ComBat'] = ("vfs://output/{}/ComBat/features_ComBat_{{sample_id}}_{{cardinality}}{{ext}}").format(self.name)
        self.sink_data['features_test_ComBat'] = ("vfs://output/{}/ComBat/features_ComBat_{{sample_id}}_{{cardinality}}{{ext}}").format(self.name)

        # Get info from the first config file
        if type(self.configs[0]) == str:
            # Config is a .ini file, load
            temp_conf = config_io.load_config(self.configs[0])
        else:
            temp_conf = self.configs[0]
                        
        # Set the source data from the WORC objects you created
        for num, label in enumerate(self.modlabels):
            self.source_data['config_' + label] = self.fastrconfigs[num]
            self.sink_data[f'config_{label}_sink'] = f"vfs://output/{self.name}/config_{label}_{{sample_id}}_{{cardinality}}{{ext}}"

            if 'pyradiomics' in temp_conf['General']['FeatureCalculators'] and temp_conf['General']['Fingerprint'] != 'True':
                self.source_data['config_pyradiomics_' + label] = self.pyradiomics_configs[num]

            # Add train data sources
            if self.images_train and len(self.images_train) - 1 >= num:
                self.source_data['images_train_' + label] = self.images_train[num]

            if self.masks_train and len(self.masks_train) - 1 >= num:
                self.source_data['mask_train_' + label] = self.masks_train[num]

            if self.masks_normalize_train and len(self.masks_normalize_train) - 1 >= num:
                self.source_data['masks_normalize_train_' + label] = self.masks_normalize_train[num]

            if self.metadata_train and len(self.metadata_train) - 1 >= num:
                self.source_data['metadata_train_' + label] = self.metadata_train[num]

            if self.segmentations_train and len(self.segmentations_train) - 1 >= num:
                self.source_data['segmentations_train_' + label] = self.segmentations_train[num]

            if self.semantics_train and len(self.semantics_train) - 1 >= num:
                self.source_data['semantics_train_' + label] = self.semantics_train[num]

            if self.features_train and len(self.features_train) - 1 >= num:
                self.source_data['features_train_' + label] = self.features_train[num]

            if self.Elastix_Para:
                # First modality does not need to be registered
                if num > 0:
                    if len(self.Elastix_Para) > 1:
                        # Each modality has its own registration parameters
                        self.source_data['Elastix_Para_' + label] = self.Elastix_Para[num]
                    else:
                        # Use one fileset for all modalities
                        self.source_data['Elastix_Para_' + label] = self.Elastix_Para[0]

            # Add test data sources
            if self.images_test and len(self.images_test) - 1 >= num:
                self.source_data['images_test_' + label] = self.images_test[num]

            if self.masks_test and len(self.masks_test) - 1 >= num:
                self.source_data['mask_test_' + label] = self.masks_test[num]

            if self.masks_normalize_test and len(self.masks_normalize_test) - 1 >= num:
                self.source_data['masks_normalize_test_' + label] = self.masks_normalize_test[num]

            if self.metadata_test and len(self.metadata_test) - 1 >= num:
                self.source_data['metadata_test_' + label] = self.metadata_test[num]

            if self.segmentations_test and len(self.segmentations_test) - 1 >= num:
                self.source_data['segmentations_test_' + label] = self.segmentations_test[num]

            if self.semantics_test and len(self.semantics_test) - 1 >= num:
                self.source_data['semantics_test_' + label] = self.semantics_test[num]

            if self.features_test and len(self.features_test) - 1  >= num:
                self.source_data['features_test_' + label] = self.features_test[num]

            self.sink_data['segmentations_out_segmentix_train_' + label] = ("vfs://output/{}/Segmentations/seg_{}_segmentix_{{sample_id}}_{{cardinality}}{{ext}}").format(self.name, label)
            self.sink_data['segmentations_out_elastix_train_' + label] = ("vfs://output/{}/Elastix/seg_{}_elastix_{{sample_id}}_{{cardinality}}{{ext}}").format(self.name, label)
            self.sink_data['images_out_elastix_train_' + label] = ("vfs://output/{}/Elastix/im_{}_elastix_{{sample_id}}_{{cardinality}}{{ext}}").format(self.name, label)
            if hasattr(self, 'featurecalculators'):
                for f in self.featurecalculators[label]:
                    self.sink_data['features_train_' + label + '_' + f] = ("vfs://output/{}/Features/features_{}_{}_{{sample_id}}_{{cardinality}}{{ext}}").format(self.name, f, label)

            if self.labels_test:
                self.sink_data['segmentations_out_segmentix_test_' + label] = ("vfs://output/{}/Segmentations/seg_{}_segmentix_{{sample_id}}_{{cardinality}}{{ext}}").format(self.name, label)
                self.sink_data['segmentations_out_elastix_test_' + label] = ("vfs://output/{}/Elastix/seg_{}_elastix_{{sample_id}}_{{cardinality}}{{ext}}").format(self.name, label)
                self.sink_data['images_out_elastix_test_' + label] = ("vfs://output/{}/Images/im_{}_elastix_{{sample_id}}_{{cardinality}}{{ext}}").format(self.name, label)
                if hasattr(self, 'featurecalculators'):
                    for f in self.featurecalculators[label]:
                        f = f.replace(':', '_').replace('.', '_').replace('/', '_')
                        self.sink_data['features_test_' + label + '_' + f] = ("vfs://output/{}/Features/features_{}_{}_{{sample_id}}_{{cardinality}}{{ext}}").format(self.name, f, label)

            # Add elastix sinks if used
            if self.segmode:
                # Segmode is only non-empty if segmentations are provided
                if self.segmode == 'Register':
                    self.sink_data['transformations_train_' + label] = ("vfs://output/{}/Elastix/transformation_{}_{{sample_id}}_{{cardinality}}{{ext}}").format(self.name, label)
                    if self.TrainTest:
                        self.sink_data['transformations_test_' + label] = ("vfs://output/{}/Elastix/transformation_{}_{{sample_id}}_{{cardinality}}{{ext}}").format(self.name, label)

        if self._add_evaluation:
            self.Evaluate.set()

        # Generate gridsearch parameter files if required
        self.source_data['config_classification_source'] = self.fastrconfigs[0]

        # Give configuration sources to WORC
        for num, label in enumerate(self.modlabels):
            self.source_data['config_' + label] = self.fastrconfigs[num]

[docs]    def execute(self):
        """Execute the network through the fastr.network.execute command."""
        # Draw and execute nwtwork
        try:
            self.network.draw(file_path=self.network.id + '.svg', draw_dimensions=True)
        except graphviz.backend.ExecutableNotFound:
            print('[WORC WARNING] Graphviz executable not found: not drawing network diagram. Make sure the Graphviz executables are on your systems PATH.')
        except graphviz.backend.CalledProcessError as e:
            print(f'[WORC WARNING] Graphviz executable gave an error: not drawing network diagram. Original error: {e}')

        # export hyper param. search space to LaTeX table. Only for training models.
        if not self.OnlyTest:
            for config in self.fastrconfigs:
                config_path = Path(url2pathname(urlparse(config).path))
                tex_path = f'{config_path.parent.absolute() / config_path.stem}_hyperparams_space.tex'
                export_hyper_params_to_latex(config_path, tex_path)

        if DebugDetector().do_detection():
            print("Source Data:")
            for k in self.source_data.keys():
                print(f"\t {k}: {self.source_data[k]}.")
            print("\n Sink Data:")
            for k in self.sink_data.keys():
                print(f"\t {k}: {self.sink_data[k]}.")

            # When debugging, set the tempdir to the default of fastr + name
            self.fastr_tmpdir = os.path.join(fastr.config.mounts['tmp'],
                                             self.name)

        self.network.execute(self.source_data, self.sink_data, execution_plugin=self.fastr_plugin, tmpdir=self.fastr_tmpdir)

[docs]    def add_evaluation(self, label_type, modus='binary_classification'):
        """Add branch for evaluation of performance to network.

        Note: should be done after build, before set:
        WORC.build()
        WORC.add_evaluation(label_type)
        WORC.set()
        WORC.execute()

        """
        self.Evaluate =\
            Evaluate(label_type=label_type, parent=self, modus=modus)
        self._add_evaluation = True

[docs]    def save_config(self):
        """Save the config files to physical files and add to network."""
        # If the configuration files are confiparse objects, write to file
        self.pyradiomics_configs = list()

        # Make sure we can dump blank values for PyRadiomics
        yaml.SafeDumper.add_representer(type(None),
                                        lambda dumper, value: dumper.represent_scalar(u'tag:yaml.org,2002:null', ''))

        for num, c in enumerate(self.configs):
            if type(c) != configparser.ConfigParser:
                # A filepath (not a fastr source) is provided. Hence we read
                # the config file and convert it to a configparser object
                config = configparser.ConfigParser()
                config.read(c)
                c = config

            cfile = os.path.join(self.fastr_tmpdir, f"config_{self.name}_{num}.ini")
            if not os.path.exists(os.path.dirname(cfile)):
                os.makedirs(os.path.dirname(cfile))

            with open(cfile, 'w') as configfile:
                c.write(configfile)

            # If PyRadiomics is used and there is no finterprinting, also write a config for PyRadiomics
            if 'pyradiomics' in c['General']['FeatureCalculators'] and self.configs[0]['General']['Fingerprint'] != 'True':
                cfile_pyradiomics = os.path.join(self.fastr_tmpdir, f"config_pyradiomics_{self.name}_{num}.yaml")
                config_pyradiomics = io.convert_config_pyradiomics(c)
                with open(cfile_pyradiomics, 'w') as file:
                    yaml.safe_dump(config_pyradiomics, file)
                cfile_pyradiomics = Path(self.fastr_tmpdir) / f"config_pyradiomics_{self.name}_{num}.yaml"
                self.pyradiomics_configs.append(cfile_pyradiomics.as_uri().replace('%20', ' '))

            # BUG: Make path with pathlib to create windows double slashes
            cfile = Path(self.fastr_tmpdir) / f"config_{self.name}_{num}.ini"
            self.fastrconfigs.append(cfile.as_uri().replace('%20', ' '))


[docs]class Tools(object):
    """
    Create other pipelines besides the default radiomics executions.

    Currently includes:
    1. Registration pipeline
    2. Evaluation pipeline
    3. Slicer pipeline, to create pngs of middle slice of images.
    """

[docs]    def __init__(self):
        """Initialize object with all pipelines."""
        self.Elastix = Elastix()
        self.Evaluate = Evaluate()
        self.Slicer = Slicer()