tabular_learner: tabular_learner.xml comparison

comparison tabular_learner.xml @ 4:11fdac5affb3 draft

planemo upload for repository https://github.com/goeckslab/gleam commit 8112548ac44b7a4769093d76c722c8fcdeaaef54

author	goeckslab
date	Fri, 25 Jul 2025 19:02:12 +0000
parents	f6a65e05d6ec
children	3d42f82b3c7f

comparison

equal deleted inserted replaced

-:f6a65e05d6ec
+:11fdac5affb3
 #if $model_type == "regression"
 #if $regression_models
 --models '$regression_models'
 #end if
 #end if
+#if $tune_model
+--tune_model
+#end if
 #if $customize_defaults == "true"
 #if $train_size
 --train_size '$train_size'
 #end if
 #if $normalize
 --normalize
 #end if
 #if $feature_selection
 --feature_selection
 #end if
 #if $enable_cross_validation == "true"
 --cross_validation
 #if $cross_validation_folds
 --cross_validation_folds '$cross_validation_folds'
 #end if
 #end if
 ]]>
 </command>
 <inputs>
 <param name="input_file" type="data" format="csv,tabular" label="Tabular Input Dataset" />
 <param name="test_file" type="data" format="csv,tabular" optional="true" label="Tabular Test Dataset"
 help="If a test dataset is not provided,
 the input dataset will be split into training, validation, and test sets.
 If a test set is provided, the input dataset will be split into training and validation sets.
 Cross-validation is applied by default during training." />
 <param name="target_feature" multiple="false" type="data_column" use_header_names="true" data_ref="input_file" label="Select the target column:" />
 <conditional name="model_selection">
 <param name="model_type" type="select" label="Task">
 <option value="classification">classification</option>
 <option value="lightgbm">Light Gradient Boosting Machine</option>
 <option value="catboost">CatBoost Regressor</option>
 </param>
 </when>
 </conditional>
+<param name="tune_model" type="boolean" truevalue="True" falsevalue="False" label="Tune hyperparameters" help="Hyperparameter tuning on the best model" />
 <param name="random_seed" type="integer" value="42" label="Random Seed" help="Random seed for reproducibility." />
 <conditional name="advanced_settings">
 <param name="customize_defaults" type="select" label="Customize Default Settings?" help="Select yes if you want to customize the default settings of the experiment.">
 <option value="false" selected="true">No</option>
 <option value="true">Yes</option>
 <param name="remove_outliers" value="true"/>
 <param name="remove_multicollinearity" value="true"/>
 <output name="model" file="expected_model_classification_customized.h5" compare="sim_size"/>
 <output name="comparison_result">
 <assert_contents>
-<has_text text="Validation Result Summary" />
+<has_text text="Validation Summary" />
-<has_text text="Test Results" />
+<has_text text="Test Summary" />
 <has_text text="Feature Importance" />
 </assert_contents>
 </output>
 <output name="best_model_csv" value="expected_best_model_classification_customized.csv" />
 </test>
 <param name="remove_outliers" value="true"/>
 <param name="remove_multicollinearity" value="true"/>
 <output name="model" file="expected_model_classification_customized_cross_off.h5" compare="sim_size"/>
 <output name="comparison_result">
 <assert_contents>
-<has_text text="Validation Result Summary" />
+<has_text text="Validation Summary" />
-<has_text text="Test Results" />
+<has_text text="Test Summary" />
 <has_text text="Feature Importance" />
 </assert_contents>
 </output>
 <output name="best_model_csv" value="expected_best_model_classification_customized_cross_off.csv" />
 </test>
 <test>
 <param name="input_file" value="pcr.tsv"/>
 <param name="target_feature" value="11"/>
 <param name="model_type" value="classification"/>
 <param name="random_seed" value="42"/>
+<param name="tune_model" value="true"/>
 <output name="model" file="expected_model_classification.h5" compare="sim_size"/>
 <output name="comparison_result">
 <assert_contents>
-<has_text text="Validation Result Summary" />
+<has_text text="Validation Summary" />
-<has_text text="Test Results" />
+<has_text text="Test Summary" />
+<has_text text="Feature Importance" />
+</assert_contents>
+</output>
+<output name="best_model_csv" value="expected_best_model_classification.csv" />
+</test>
+<test>
+<param name="input_file" value="pcr.tsv"/>
+<param name="target_feature" value="11"/>
+<param name="model_type" value="classification"/>
+<param name="random_seed" value="42"/>
+<output name="model" file="expected_model_classification.h5" compare="sim_size"/>
+<output name="comparison_result">
+<assert_contents>
+<has_text text="Validation Summary" />
+<has_text text="Test Summary" />
 <has_text text="Feature Importance" />
 </assert_contents>
 </output>
 <output name="best_model_csv" value="expected_best_model_classification.csv" />
 </test>
 <param name="model_type" value="regression"/>
 <param name="random_seed" value="42"/>
 <output name="model" file="expected_model_regression.h5" compare="sim_size" />
 <output name="comparison_result">
 <assert_contents>
-<has_text text="Validation Result Summary" />
+<has_text text="Validation Summary" />
-<has_text text="Test Results" />
+<has_text text="Test Summary" />
 <has_text text="Feature Importance" />
 </assert_contents>
 </output>
 <output name="best_model_csv" value="expected_best_model_regression.csv" />
 </test>

Mercurial > repos > goeckslab > tabular_learner

comparison tabular_learner.xml @ 4:11fdac5affb3 draft