annotate ensemble.xml @ 19:4570575d060c draft

planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit d00173591e4a783a4c1cb2664e4bb192ab5414f7
author bgruening
date Fri, 17 Aug 2018 12:28:21 -0400
parents f02eeabab5d1
children 038cecaa9e7c
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
1 <tool id="sklearn_ensemble" name="Ensemble methods" version="@VERSION@">
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
2 <description>for classification and regression</description>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
3 <macros>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
4 <import>main_macros.xml</import>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
5 </macros>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
6 <expand macro="python_requirements"/>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
7 <expand macro="macro_stdio"/>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
8 <version_command>echo "@VERSION@"</version_command>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
<!-- Run the generated "ensemble_script" configfile with Python; its only argument is the "inputs" configfile, which the script parses as JSON. -->
<command><![CDATA[python "$ensemble_script" '$inputs']]></command>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
13 <configfiles>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
14 <inputs name="inputs"/>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
15 <configfile name="ensemble_script">
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
16 <![CDATA[
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
# Galaxy configfile script for the ensemble tool.
#
# Two modes, chosen by the "selected_task" tool parameter:
#   train   - build a sklearn.ensemble estimator from the chosen options,
#             fit it and pickle it to outfile_fit.
#   (other) - unpickle a fitted estimator, predict on a tabular file and
#             write the input columns plus a "predicted" column to
#             outfile_predict.
#
# This text is rendered by Cheetah before Python sees it, so comments in
# here must not contain template placeholders or directives.
import sys
import os
import json
import numpy as np
import sklearn.ensemble
import pandas
import pickle
from scipy.io import mmread

# Execute utils.py inside this namespace. get_X_y and N_JOBS, used below, are
# not defined in this script and are presumably provided by that file; the
# imports above are kept untouched because the helper code shares this
# namespace and may rely on them.
# execfile() only exists on Python 2; exec(compile(...)) runs on both 2 and 3.
utils_path = "$__tool_directory__/utils.py"
with open(utils_path) as utils_handler:
    exec(compile(utils_handler.read(), utils_path, "exec"), globals())

# Get inputs, outputs.
input_json_path = sys.argv[1]
with open(input_json_path, "r") as param_handler:
    params = json.load(param_handler)
# Echo the parsed parameters to stdout (kept from the original script).
print(params)

# Put all cheetah up here to avoid confusion.
#if $selected_tasks.selected_task == "train":
infile1 = "$selected_tasks.selected_algorithms.input_options.infile1"
infile2 = "$selected_tasks.selected_algorithms.input_options.infile2"
#else:
infile_model = "$selected_tasks.infile_model"
infile_data = "$selected_tasks.infile_data"
#end if
outfile_fit = "$outfile_fit"
outfile_predict = "$outfile_predict"

# All Python from here on out:

if params["selected_tasks"]["selected_task"] == "train":
    algorithm = params["selected_tasks"]["selected_algorithms"]["selected_algorithm"]
    options = params["selected_tasks"]["selected_algorithms"]["options"]

    # Only the random forest estimators are given n_jobs here.
    if algorithm in ['RandomForestClassifier', 'RandomForestRegressor']:
        options['n_jobs'] = N_JOBS

    # Flatten the "select_max_features" conditional into the plain
    # "max_features" keyword: either the selected keyword value or, for
    # "number_input", the number entered alongside it.
    if "select_max_features" in options:
        max_features_choice = options.pop("select_max_features")
        max_features = max_features_choice["max_features"]
        if max_features == "number_input":
            max_features = max_features_choice["num_max_features"]
        options["max_features"] = max_features

    # The form delivers presort as the strings "true"/"false"; turn them into
    # real booleans and leave any other value untouched.
    if "presort" in options:
        if options["presort"] == "true":
            options["presort"] = True
        elif options["presort"] == "false":
            options["presort"] = False

    # A float of exactly 1.0 is replaced by the integer 1, and a split value
    # above 1.0 is truncated to an integer, so they are passed as counts.
    if "min_samples_leaf" in options and options["min_samples_leaf"] == 1.0:
        options["min_samples_leaf"] = 1
    if "min_samples_split" in options and options["min_samples_split"] > 1.0:
        options["min_samples_split"] = int(options["min_samples_split"])

    X, y = get_X_y(params, infile1, infile2)

    # Look the estimator class up by name and fit it with the cleaned options.
    my_class = getattr(sklearn.ensemble, algorithm)
    estimator = my_class(**options)
    estimator.fit(X, y)
    with open(outfile_fit, 'wb') as out_handler:
        pickle.dump(estimator, out_handler, pickle.HIGHEST_PROTOCOL)

else:
    # NOTE(security): unpickling executes whatever code the file encodes.
    # The model file is a user-provided dataset, so only models from trusted
    # sources should be loaded here.
    with open(infile_model, 'rb') as model_handler:
        classifier_object = pickle.load(model_handler)

    header = 'infer' if params["selected_tasks"]["header"] else None
    # tupleize_cols=False used to be passed here; False was its default and
    # the keyword has been removed from pandas, so it is simply left out.
    data = pandas.read_csv(infile_data, sep='\t', header=header, index_col=None, parse_dates=True, encoding=None)

    # Append the predictions as an extra "predicted" column.
    prediction = classifier_object.predict(data)
    prediction_df = pandas.DataFrame(prediction, columns=["predicted"])
    res = pandas.concat([data, prediction_df], axis=1)
    res.to_csv(path_or_buf=outfile_predict, sep="\t", index=False)
0
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
85
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
86 ]]>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
87 </configfile>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
88 </configfiles>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
89 <inputs>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
90 <expand macro="sl_Conditional" model="zip">
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
91 <param name="selected_algorithm" type="select" label="Select an ensemble method:">
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
92 <option value="RandomForestClassifier" selected="true">Random forest classifier</option>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
93 <option value="AdaBoostClassifier">Ada boost classifier</option>
5
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
94 <option value="GradientBoostingClassifier">Gradient Boosting Classifier</option>
0
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
95 <option value="RandomForestRegressor">Random forest regressor</option>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
96 <option value="AdaBoostRegressor">Ada boost regressor</option>
5
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
97 <option value="GradientBoostingRegressor">Gradient Boosting Regressor</option>
0
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
98 </param>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
99 <when value="RandomForestClassifier">
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
100 <expand macro="sl_mixed_input"/>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
101 <section name="options" title="Advanced Options" expanded="False">
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
102 <expand macro="n_estimators"/>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
103 <expand macro="criterion"/>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
104 <expand macro="max_features"/>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
105 <expand macro="max_depth"/>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
106 <expand macro="min_samples_split"/>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
107 <expand macro="min_samples_leaf"/>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
108 <expand macro="min_weight_fraction_leaf"/>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
109 <expand macro="max_leaf_nodes"/>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
110 <expand macro="bootstrap"/>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
111 <expand macro="warm_start" checked="false"/>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
112 <expand macro="random_state"/>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
113 <expand macro="oob_score"/>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
114 <!--class_weight=None-->
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
115 </section>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
116 </when>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
117 <when value="AdaBoostClassifier">
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
118 <expand macro="sl_mixed_input"/>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
119 <section name="options" title="Advanced Options" expanded="False">
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
120 <!--base_estimator=None-->
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
121 <expand macro="n_estimators" default_value="50"/>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
122 <expand macro="learning_rate"/>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
123 <param argument="algorithm" type="select" label="Boosting algorithm" help=" ">
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
124 <option value="SAMME.R" selected="true">SAMME.R</option>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
125 <option value="SAMME">SAMME</option>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
126 </param>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
127 <expand macro="random_state"/>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
128 </section>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
129 </when>
5
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
130 <when value="GradientBoostingClassifier">
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
131 <expand macro="sl_mixed_input"/>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
132 <section name="options" title="Advanced Options" expanded="False">
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
133 <!--base_estimator=None-->
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
134 <param argument="loss" type="select" label="Loss function">
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
135 <option value="deviance" selected="true">deviance - logistic regression with probabilistic outputs</option>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
136 <option value="exponential">exponential - gradient boosting recovers the AdaBoost algorithm</option>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
137 </param>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
138 <expand macro="learning_rate" default_value='0.1'/>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
139 <expand macro="n_estimators" default_value="100" help="The number of boosting stages to perform"/>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
140 <expand macro="max_depth" default_value="3" help="maximum depth of the individual regression estimators"/>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
141 <expand macro="criterion2">
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
142 <option value="friedman_mse" selected="true">friedman_mse - mean squared error with improvement score by Friedman</option>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
143 </expand>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
144 <expand macro="min_samples_split" type="float"/>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
145 <expand macro="min_samples_leaf" type="float" label="The minimum number of samples required to be at a leaf node"/>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
146 <expand macro="min_weight_fraction_leaf"/>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
147 <expand macro="subsample"/>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
148 <expand macro="max_features"/>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
149 <expand macro="max_leaf_nodes"/>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
150 <expand macro="min_impurity_decrease"/>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
151 <expand macro="verbose"/>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
152 <expand macro="warm_start" checked="false"/>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
153 <expand macro="random_state"/>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
154 <expand macro="presort"/>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
155 </section>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
156 </when>
0
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
157 <when value="RandomForestRegressor">
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
158 <expand macro="sl_mixed_input"/>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
159 <section name="options" title="Advanced Options" expanded="False">
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
160 <expand macro="n_estimators"/>
5
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
161 <expand macro="criterion2"/>
0
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
162 <expand macro="max_features"/>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
163 <expand macro="max_depth"/>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
164 <expand macro="min_samples_split"/>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
165 <expand macro="min_samples_leaf"/>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
166 <expand macro="min_weight_fraction_leaf"/>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
167 <expand macro="max_leaf_nodes"/>
5
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
168 <expand macro="min_impurity_decrease"/>
0
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
169 <expand macro="bootstrap"/>
5
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
170 <expand macro="oob_score"/>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
171 <expand macro="random_state"/>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
172 <expand macro="verbose"/>
0
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
173 <expand macro="warm_start" checked="false"/>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
174 </section>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
175 </when>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
176 <when value="AdaBoostRegressor">
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
177 <expand macro="sl_mixed_input"/>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
178 <section name="options" title="Advanced Options" expanded="False">
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
179 <!--base_estimator=None-->
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
180 <expand macro="n_estimators" default_value="50"/>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
181 <expand macro="learning_rate"/>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
182 <param argument="loss" type="select" label="Loss function" optional="true" help="Used when updating the weights after each boosting iteration. ">
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
183 <option value="linear" selected="true">linear</option>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
184 <option value="square">square</option>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
185 <option value="exponential">exponential</option>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
186 </param>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
187 <expand macro="random_state"/>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
188 </section>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
189 </when>
5
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
190 <when value="GradientBoostingRegressor">
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
191 <expand macro="sl_mixed_input"/>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
192 <section name="options" title="Advanced Options" expanded="False">
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
193 <param argument="loss" type="select" label="Loss function">
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
194 <option value="ls" selected="true">ls - least squares regression</option>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
195 <option value="lad">lad - least absolute deviation</option>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
196 <option value="huber">huber - combination of least squares regression and least absolute deviation</option>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
197 <option value="quantile">quantile - use alpha to specify the quantile</option>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
198 </param>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
199 <expand macro="learning_rate" default_value="0.1"/>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
200 <expand macro="n_estimators" default_value="100" help="The number of boosting stages to perform"/>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
201 <expand macro="max_depth" default_value="3" help="maximum depth of the individual regression estimators"/>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
202 <expand macro="criterion2">
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
203 <option value="friedman_mse" selected="true">friedman_mse - mean squared error with improvement score by Friedman</option>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
204 </expand>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
205 <expand macro="min_samples_split" type="float"/>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
206 <expand macro="min_samples_leaf" type="float" label="The minimum number of samples required to be at a leaf node"/>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
207 <expand macro="min_weight_fraction_leaf"/>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
208 <expand macro="subsample"/>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
209 <expand macro="max_features"/>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
210 <expand macro="max_leaf_nodes"/>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
211 <expand macro="min_impurity_decrease"/>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
212 <param argument="alpha" type="float" value="0.9" min="0.0" max="1.0" label="alpha" help="The alpha-quantile of the huber loss function and the quantile loss function. Only used when loss is huber or quantile; must be strictly between 0 and 1." />
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
213 <!--init=None (GradientBoostingRegressor has no base_estimator argument; not exposed here)-->
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
214 <expand macro="verbose"/>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
215 <expand macro="warm_start" checked="false"/>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
216 <expand macro="random_state"/>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
217 <expand macro="presort"/>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
218 </section>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
219 </when>
0
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
220 </expand>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
221 </inputs>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
222
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
223 <expand macro="output"/>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
224
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
225 <tests>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
226 <test>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
227 <param name="infile1" value="train.tabular" ftype="tabular"/>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
228 <param name="infile2" value="train.tabular" ftype="tabular"/>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
229 <param name="col1" value="1,2,3,4"/>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
230 <param name="col2" value="5"/>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
231 <param name="selected_task" value="train"/>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
232 <param name="selected_algorithm" value="RandomForestClassifier"/>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
233 <param name="random_state" value="10"/>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
234 <output name="outfile_fit" file="rfc_model01" compare="sim_size" delta="500"/>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
235 </test>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
236 <test>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
237 <param name="infile_model" value="rfc_model01" ftype="zip"/>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
238 <param name="infile_data" value="test.tabular" ftype="tabular"/>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
239 <param name="selected_task" value="load"/>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
240 <output name="outfile_predict" file="rfc_result01" compare="sim_size" delta="500"/>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
241 </test>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
242 <test>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
243 <param name="infile1" value="regression_train.tabular" ftype="tabular"/>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
244 <param name="infile2" value="regression_train.tabular" ftype="tabular"/>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
245 <param name="col1" value="1,2,3,4,5"/>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
246 <param name="col2" value="6"/>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
247 <param name="selected_task" value="train"/>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
248 <param name="selected_algorithm" value="RandomForestRegressor"/>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
249 <param name="random_state" value="10"/>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
250 <output name="outfile_fit" file="rfr_model01" compare="sim_size" delta="500"/>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
251 </test>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
252 <test>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
253 <param name="infile_model" value="rfr_model01" ftype="zip"/>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
254 <param name="infile_data" value="regression_test.tabular" ftype="tabular"/>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
255 <param name="selected_task" value="load"/>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
256 <output name="outfile_predict" file="rfr_result01" compare="sim_size" delta="500"/>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
257 </test>
5
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
258 <test>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
259 <param name="infile1" value="regression_X.tabular" ftype="tabular"/>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
260 <param name="infile2" value="regression_y.tabular" ftype="tabular"/>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
261 <param name="header1" value="True"/>
10
cd595710f0c0 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 97c4f22cdcfa6cddeeffc7b102c418a7ff12a888
bgruening
parents: 5
diff changeset
262 <param name="selected_column_selector_option" value="all_columns"/>
5
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
263 <param name="header2" value="True"/>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
264 <param name="col2" value="1"/>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
265 <param name="selected_task" value="train"/>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
266 <param name="selected_algorithm" value="GradientBoostingRegressor"/>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
267 <param name="max_features" value="number_input"/>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
268 <param name="num_max_features" value=""/>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
269 <param name="random_state" value="42"/>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
270 <output name="outfile_fit" file="gbr_model01" compare="sim_size" delta="500"/>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
271 </test>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
272 <test>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
273 <param name="infile_model" value="gbr_model01" ftype="zip"/>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
274 <param name="infile_data" value="regression_test_X.tabular" ftype="tabular"/>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
275 <param name="selected_task" value="load"/>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
276 <param name="header" value="True"/>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
277 <output name="outfile_predict" file="gbr_prediction_result01.tabular" compare="sim_size" delta="500"/>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
278 </test>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
279 <test>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
280 <param name="infile1" value="train.tabular" ftype="tabular"/>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
281 <param name="infile2" value="train.tabular" ftype="tabular"/>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
282 <param name="col1" value="1,2,3,4"/>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
283 <param name="col2" value="5"/>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
284 <param name="selected_task" value="train"/>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
285 <param name="selected_algorithm" value="GradientBoostingClassifier"/>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
286 <output name="outfile_fit" file="gbc_model01" compare="sim_size" delta="500"/>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
287 </test>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
288 <test>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
289 <param name="infile_model" value="gbc_model01" ftype="zip"/>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
290 <param name="infile_data" value="test.tabular" ftype="tabular"/>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
291 <param name="selected_task" value="load"/>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
292 <output name="outfile_predict" file="gbc_result01" compare="sim_size" delta="500"/>
f1761288587e planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 4
diff changeset
293 </test>
0
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
294 </tests>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
295 <help><![CDATA[
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
296 ***What it does***
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
297 The goal of ensemble methods is to combine the predictions of several base estimators built with a given learning algorithm in order to improve generalizability / robustness over a single estimator. This tool offers several families of ensemble algorithms for classification and regression, including random forests, AdaBoost and gradient boosting, all of which are based on the sklearn.ensemble library from Scikit-learn. Here you can find out about the input, output and methods presented in this tool. For information about ensemble methods and parameter settings, please refer to `Scikit-learn ensemble`_.
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
298
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
299 .. _`Scikit-learn ensemble`: http://scikit-learn.org/stable/modules/ensemble.html
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
300
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
301 **1 - Methods**
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
302 There are two groups of operations available:
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
303
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
304 1 - Train a model : A training set containing samples and their respective labels (or target values) is provided as input. Based on the selected algorithm and options, an estimator object is fit to the data and is returned.
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
305
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
306 2 - Load a model and predict : An existing model predicts the class labels (or regression values) for a new dataset.
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
307
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
308 **2 - Training input**
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
309 When you choose to train a model, you need a features dataset X and a labels set y. This tool expects tabular or sparse data for X and a single column for y (tabular). You can select a subset of columns in a tabular dataset as your features dataset or labels column. Below you find some examples:
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
310
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
311 **Sample tabular features dataset**
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
312 The following training dataset contains 3 feature columns and a column containing class labels. You can simply select the first 3 columns as features and the last column as labels:
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
313
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
314 ::
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
315
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
316 4.01163365529 -6.10797684314 8.29829894763 1
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
317 10.0788438916 1.59539821454 10.0684278289 0
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
318 -5.17607775503 -0.878286135332 6.92941850665 2
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
319 4.00975406235 -7.11847496542 9.3802423585 1
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
320 4.61204065139 -5.71217537352 9.12509610964 1
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
321
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
322
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
323 **Sample sparse features dataset**
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
324 In this case you cannot specify a column range.
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
325
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
326 ::
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
327
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
328 4 1048577 8738
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
329 1 271 0.02083333333333341
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
330 1 1038 0.02461995616119806
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
331 2 829017 0.01629088031127686
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
332 2 829437 0.01209127083516686
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
333 2 830752 0.02535100632816968
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
334 3 1047487 0.01485722929945572
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
335 3 1047980 0.02640566620767753
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
336 3 1048475 0.01665869913262564
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
337 4 608 0.01662975263094352
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
338 4 1651 0.02519674277562741
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
339 4 4053 0.04223659971350601
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
340
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
341
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
342 **2 - Training output**
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
343 The trained model is generated and output in the form of a binary file.
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
344
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
345
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
346 **3 - Prediction input**
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
347
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
348 When you choose to load a model and do prediction, the tool expects an already trained estimator and a tabular dataset as input. The dataset contains new samples which you want to classify or predict regression values for.
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
349
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
350
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
351 .. class:: warningmark
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
352
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
353 The number of feature columns must be the same in training and prediction datasets!
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
354
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
355
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
356 **3 - Prediction output**
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
357 The tool predicts the class labels (or regression values) for new samples and adds them as the last column to the prediction dataset. The new dataset is then output as a tabular file. The prediction output format should look like the training dataset.
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
358
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
359 ]]></help>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
360 <expand macro="sklearn_citation"/>
569eefee7ed8 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents:
diff changeset
361 </tool>