comparison tabular_learner.xml @ 10:49f73a3c12f3 draft default tip

planemo upload for repository https://github.com/goeckslab/gleam commit 1ffd143e57fa952ee9dd84fc141771520aea0791
author goeckslab
date Wed, 26 Nov 2025 17:49:36 +0000
parents e7dd78077b72
children
comparison
equal deleted inserted replaced
9:e7dd78077b72 10:49f73a3c12f3
4 <import>pycaret_macros.xml</import> 4 <import>pycaret_macros.xml</import>
5 </macros> 5 </macros>
6 <expand macro="python_requirements" /> 6 <expand macro="python_requirements" />
7 <command> 7 <command>
8 <![CDATA[ 8 <![CDATA[
9 python $__tool_directory__/pycaret_train.py --input_file '$input_file' --target_col '$target_feature' --output_dir '.' --random_seed '$random_seed' 9 python $__tool_directory__/pycaret_train.py --input_file '$input_file' --target_col '$target_feature' --output_dir '.' --random_seed '$random_seed' --n-jobs \${GALAXY_SLOTS:-1}
10 #if $model_type == "classification" 10 #if $model_type == "classification"
11 #if $classification_models 11 #if $classification_models
12 --models '$classification_models' 12 --models '$classification_models'
13 #end if 13 #end if
14 #end if 14 #end if
197 </outputs> 197 </outputs>
198 <tests> 198 <tests>
199 <test> 199 <test>
200 <param name="input_file" value="pcr.tsv"/> 200 <param name="input_file" value="pcr.tsv"/>
201 <param name="target_feature" value="11"/> 201 <param name="target_feature" value="11"/>
202 <param name="model_type" value="classification"/> 202 <param name="model_selection|model_type" value="classification"/>
203 <param name="best_model_metric" value="F1"/> 203 <param name="model_selection|best_model_metric" value="F1"/>
204 <param name="random_seed" value="42"/> 204 <param name="random_seed" value="42"/>
205 <param name="customize_defaults" value="true"/> 205 <param name="advanced_settings|customize_defaults" value="true"/>
206 <param name="train_size" value="0.8"/> 206 <param name="advanced_settings|train_size" value="0.8"/>
207 <param name="normalize" value="true"/> 207 <param name="advanced_settings|normalize" value="true"/>
208 <param name="feature_selection" value="true"/> 208 <param name="advanced_settings|feature_selection" value="true"/>
209 <param name="enable_cross_validation" value="true"/> 209 <param name="advanced_settings|cross_validation|enable_cross_validation" value="true"/>
210 <param name="cross_validation_folds" value="5"/> 210 <param name="advanced_settings|cross_validation|cross_validation_folds" value="5"/>
211 <param name="remove_outliers" value="true"/> 211 <param name="advanced_settings|remove_outliers" value="true"/>
212 <param name="remove_multicollinearity" value="true"/> 212 <param name="advanced_settings|remove_multicollinearity" value="true"/>
213 <param name="probability_threshold" value="0.4" /> 213 <param name="advanced_settings|probability_threshold" value="0.4" />
214 <output name="model" file="expected_model_classification_customized.h5" compare="sim_size"/> 214 <output name="model" file="expected_model_classification_customized.h5" compare="sim_size"/>
215 <output name="comparison_result"> 215 <output name="comparison_result">
216 <assert_contents> 216 <assert_contents>
217 <has_text text="Validation Summary" /> 217 <has_text text="Validation Summary" />
218 <has_text text="Test Summary" /> 218 <has_text text="Test Summary" />
224 <output name="best_model_csv" value="expected_best_model_classification_customized.csv" /> 224 <output name="best_model_csv" value="expected_best_model_classification_customized.csv" />
225 </test> 225 </test>
226 <test> 226 <test>
227 <param name="input_file" value="pcr.tsv"/> 227 <param name="input_file" value="pcr.tsv"/>
228 <param name="target_feature" value="11"/> 228 <param name="target_feature" value="11"/>
229 <param name="model_type" value="classification"/> 229 <param name="model_selection|model_type" value="classification"/>
230 <param name="random_seed" value="42"/> 230 <param name="random_seed" value="42"/>
231 <param name="customize_defaults" value="true"/> 231 <param name="advanced_settings|customize_defaults" value="true"/>
232 <param name="train_size" value="0.8"/> 232 <param name="advanced_settings|train_size" value="0.8"/>
233 <param name="normalize" value="true"/> 233 <param name="advanced_settings|normalize" value="true"/>
234 <param name="feature_selection" value="true"/> 234 <param name="advanced_settings|feature_selection" value="true"/>
235 <param name="enable_cross_validation" value="false"/> 235 <param name="advanced_settings|cross_validation|enable_cross_validation" value="false"/>
236 <param name="remove_outliers" value="true"/> 236 <param name="advanced_settings|remove_outliers" value="true"/>
237 <param name="remove_multicollinearity" value="true"/> 237 <param name="advanced_settings|remove_multicollinearity" value="true"/>
238 <param name="probability_threshold" value="0.6" /> 238 <param name="advanced_settings|probability_threshold" value="0.6" />
239 <output name="model" file="expected_model_classification_customized_cross_off.h5" compare="sim_size"/> 239 <output name="model" file="expected_model_classification_customized_cross_off.h5" compare="sim_size"/>
240 <output name="comparison_result"> 240 <output name="comparison_result">
241 <assert_contents> 241 <assert_contents>
242 <has_text text="Validation Summary" /> 242 <has_text text="Validation Summary" />
243 <has_text text="Test Summary" /> 243 <has_text text="Test Summary" />
247 <output name="best_model_csv" value="expected_best_model_classification_customized_cross_off.csv" /> 247 <output name="best_model_csv" value="expected_best_model_classification_customized_cross_off.csv" />
248 </test> 248 </test>
249 <test> 249 <test>
250 <param name="input_file" value="pcr.tsv"/> 250 <param name="input_file" value="pcr.tsv"/>
251 <param name="target_feature" value="11"/> 251 <param name="target_feature" value="11"/>
252 <param name="model_type" value="classification"/> 252 <param name="model_selection|model_type" value="classification"/>
253 <param name="random_seed" value="42"/> 253 <param name="random_seed" value="42"/>
254 <param name="tune_model" value="true"/> 254 <param name="tune_model" value="true"/>
255 <output name="model" file="expected_model_classification.h5" compare="sim_size"/> 255 <output name="model" file="expected_model_classification.h5" compare="sim_size"/>
256 <output name="comparison_result"> 256 <output name="comparison_result">
257 <assert_contents> 257 <assert_contents>
258 <has_text text="Validation Summary" /> 258 <has_text text="Validation Summary" />
259 <has_text text="Test Summary" /> 259 <has_text text="Test Summary" />
260 <has_text text="Feature Importance" /> 260 <has_text text="Feature Importance" />
261 </assert_contents> 261 </assert_contents>
262 </output> 262 </output>
263 <output name="best_model_csv" value="expected_best_model_classification.csv" /> 263 <output name="best_model_csv">
264 <assert_contents>
265 <has_text text="n_estimators,100" />
266 <has_text text="num_leaves,31" />
267 <has_text text="learning_rate,0.1" />
268 </assert_contents>
269 </output>
264 </test> 270 </test>
265 <test> 271 <test>
266 <param name="input_file" value="pcr.tsv"/> 272 <param name="input_file" value="pcr.tsv"/>
267 <param name="target_feature" value="11"/> 273 <param name="target_feature" value="11"/>
268 <param name="model_type" value="classification"/> 274 <param name="model_selection|model_type" value="classification"/>
269 <param name="random_seed" value="42"/> 275 <param name="random_seed" value="42"/>
270 <output name="model" file="expected_model_classification.h5" compare="sim_size"/> 276 <output name="model" file="expected_model_classification.h5" compare="sim_size"/>
271 <output name="comparison_result"> 277 <output name="comparison_result">
272 <assert_contents> 278 <assert_contents>
273 <has_text text="Validation Summary" /> 279 <has_text text="Validation Summary" />
274 <has_text text="Test Summary" /> 280 <has_text text="Test Summary" />
275 <has_text text="Feature Importance" /> 281 <has_text text="Feature Importance" />
276 </assert_contents> 282 </assert_contents>
277 </output> 283 </output>
278 <output name="best_model_csv" value="expected_best_model_classification.csv" /> 284 <output name="best_model_csv">
285 <assert_contents>
286 <has_text text="n_estimators,100" />
287 <has_text text="num_leaves,31" />
288 <has_text text="learning_rate,0.1" />
289 </assert_contents>
290 </output>
279 </test> 291 </test>
280 <test> 292 <test>
281 <param name="input_file" value="auto-mpg.tsv"/> 293 <param name="input_file" value="auto-mpg.tsv"/>
282 <param name="target_feature" value="1"/> 294 <param name="target_feature" value="1"/>
283 <param name="model_type" value="regression"/> 295 <param name="model_selection|model_type" value="regression"/>
284 <param name="best_model_metric" value="RMSE"/> 296 <param name="model_selection|best_model_metric" value="RMSE"/>
285 <param name="random_seed" value="42"/> 297 <param name="random_seed" value="42"/>
286 <output name="model" file="expected_model_regression.h5" compare="sim_size" /> 298 <output name="model" file="expected_model_regression.h5" compare="sim_size" />
287 <output name="comparison_result"> 299 <output name="comparison_result">
288 <assert_contents> 300 <assert_contents>
289 <has_text text="Validation Summary" /> 301 <has_text text="Validation Summary" />