comparison svm.xml @ 4:41d0edb7d1fc draft

planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 8cf3d813ec755166ee0bd517b4ecbbd4f84d4df1
author bgruening
date Thu, 23 Aug 2018 16:14:13 -0400
parents 297541cc26d0
children 1c5989b930e3
comparison
equal deleted inserted replaced
3:297541cc26d0 4:41d0edb7d1fc
17 <![CDATA[ 17 <![CDATA[
18 import sys 18 import sys
19 import json 19 import json
20 import sklearn.svm 20 import sklearn.svm
21 import pandas 21 import pandas
22 import pickle
23 22
24 execfile("$__tool_directory__/utils.py") 23 execfile("$__tool_directory__/sk_whitelist.py")
24 execfile("$__tool_directory__/utils.py", globals())
25 25
26 input_json_path = sys.argv[1] 26 input_json_path = sys.argv[1]
27 with open(input_json_path, "r") as param_handler: 27 with open(input_json_path, "r") as param_handler:
28 params = json.load(param_handler) 28 params = json.load(param_handler)
29 29
30 #if $selected_tasks.selected_task == "load": 30 #if $selected_tasks.selected_task == "load":
31 31
32 with open("$infile_model", 'rb') as model_handler: 32 with open("$infile_model", 'rb') as model_handler:
33 classifier_object = pickle.load(model_handler) 33 classifier_object = SafePickler.load(model_handler)
34 34
35 header = 'infer' if params["selected_tasks"]["header"] else None 35 header = 'infer' if params["selected_tasks"]["header"] else None
36 data = pandas.read_csv("$selected_tasks.infile_data", sep='\t', header=header, index_col=None, parse_dates=True, encoding=None, tupleize_cols=False) 36 data = pandas.read_csv("$selected_tasks.infile_data", sep='\t', header=header, index_col=None, parse_dates=True, encoding=None, tupleize_cols=False)
37 prediction = classifier_object.predict(data) 37 prediction = classifier_object.predict(data)
38 prediction_df = pandas.DataFrame(prediction) 38 prediction_df = pandas.DataFrame(prediction)
53 my_class = getattr(sklearn.svm, selected_algorithm) 53 my_class = getattr(sklearn.svm, selected_algorithm)
54 classifier_object = my_class(**options) 54 classifier_object = my_class(**options)
55 classifier_object.fit(X, y) 55 classifier_object.fit(X, y)
56 56
57 with open("$outfile_fit", 'wb') as out_handler: 57 with open("$outfile_fit", 'wb') as out_handler:
58 pickle.dump(classifier_object, out_handler) 58 pickle.dump(classifier_object, out_handler, pickle.HIGHEST_PROTOCOL)
59 59
60 #end if 60 #end if
61 61
62 ]]> 62 ]]>
63 </configfile> 63 </configfile>
120 <param name="col1" value="1,2,3,4"/> 120 <param name="col1" value="1,2,3,4"/>
121 <param name="col2" value="5"/> 121 <param name="col2" value="5"/>
122 <param name="selected_task" value="train"/> 122 <param name="selected_task" value="train"/>
123 <param name="selected_algorithm" value="SVC"/> 123 <param name="selected_algorithm" value="SVC"/>
124 <param name="random_state" value="5"/> 124 <param name="random_state" value="5"/>
125 <output name="outfile_fit" file="svc_model01.txt"/> 125 <output name="outfile_fit" file="svc_model01.txt" compare="sim_size" delta="1"/>
126 </test> 126 </test>
127 <test> 127 <test>
128 <param name="infile1" value="train_set.tabular" ftype="tabular"/> 128 <param name="infile1" value="train_set.tabular" ftype="tabular"/>
129 <param name="infile2" value="train_set.tabular" ftype="tabular"/> 129 <param name="infile2" value="train_set.tabular" ftype="tabular"/>
130 <param name="header1" value="True"/> 130 <param name="header1" value="True"/>
132 <param name="col1" value="1,2,3,4"/> 132 <param name="col1" value="1,2,3,4"/>
133 <param name="col2" value="5"/> 133 <param name="col2" value="5"/>
134 <param name="selected_task" value="train"/> 134 <param name="selected_task" value="train"/>
135 <param name="selected_algorithm" value="NuSVC"/> 135 <param name="selected_algorithm" value="NuSVC"/>
136 <param name="random_state" value="5"/> 136 <param name="random_state" value="5"/>
137 <output name="outfile_fit" file="svc_model02.txt"/> 137 <output name="outfile_fit" file="svc_model02.txt" compare="sim_size" delta="1"/>
138 </test> 138 </test>
139 <test> 139 <test>
140 <param name="infile1" value="train_set.tabular" ftype="tabular"/> 140 <param name="infile1" value="train_set.tabular" ftype="tabular"/>
141 <param name="infile2" value="train_set.tabular" ftype="tabular"/> 141 <param name="infile2" value="train_set.tabular" ftype="tabular"/>
142 <param name="header1" value="True"/> 142 <param name="header1" value="True"/>
144 <param name="col1" value="1,2,3,4"/> 144 <param name="col1" value="1,2,3,4"/>
145 <param name="col2" value="5"/> 145 <param name="col2" value="5"/>
146 <param name="selected_task" value="train"/> 146 <param name="selected_task" value="train"/>
147 <param name="selected_algorithm" value="LinearSVC"/> 147 <param name="selected_algorithm" value="LinearSVC"/>
148 <param name="random_state" value="5"/> 148 <param name="random_state" value="5"/>
149 <output name="outfile_fit" file="svc_model03.txt"/> 149 <output name="outfile_fit" file="svc_model03.txt" compare="sim_size" delta="1"/>
150 </test> 150 </test>
151 <test> 151 <test>
152 <param name="infile_model" value="svc_model01.txt" ftype="txt"/> 152 <param name="infile_model" value="svc_model01.txt" ftype="zip"/>
153 <param name="infile_data" value="test_set.tabular" ftype="tabular"/> 153 <param name="infile_data" value="test_set.tabular" ftype="tabular"/>
154 <param name="header" value="True"/> 154 <param name="header" value="True"/>
155 <param name="selected_task" value="load"/> 155 <param name="selected_task" value="load"/>
156 <output name="outfile_predict" file="svc_prediction_result01.tabular"/> 156 <output name="outfile_predict" file="svc_prediction_result01.tabular"/>
157 </test> 157 </test>
158 <test> 158 <test>
159 <param name="infile_model" value="svc_model02.txt" ftype="txt"/> 159 <param name="infile_model" value="svc_model02.txt" ftype="zip"/>
160 <param name="infile_data" value="test_set.tabular" ftype="tabular"/> 160 <param name="infile_data" value="test_set.tabular" ftype="tabular"/>
161 <param name="header" value="True"/> 161 <param name="header" value="True"/>
162 <param name="selected_task" value="load"/> 162 <param name="selected_task" value="load"/>
163 <output name="outfile_predict" file="svc_prediction_result02.tabular"/> 163 <output name="outfile_predict" file="svc_prediction_result02.tabular"/>
164 </test> 164 </test>
165 <test> 165 <test>
166 <param name="infile_model" value="svc_model03.txt" ftype="txt"/> 166 <param name="infile_model" value="svc_model03.txt" ftype="zip"/>
167 <param name="infile_data" value="test_set.tabular" ftype="tabular"/> 167 <param name="infile_data" value="test_set.tabular" ftype="tabular"/>
168 <param name="header" value="True"/> 168 <param name="header" value="True"/>
169 <param name="selected_task" value="load"/> 169 <param name="selected_task" value="load"/>
170 <output name="outfile_predict" file="svc_prediction_result03.tabular"/> 170 <output name="outfile_predict" file="svc_prediction_result03.tabular"/>
171 </test> 171 </test>