Mercurial > repos > anmoljh > feature_selection
annotate feature_selection.xml @ 1:f3aeeb15d4cc draft default tip
planemo upload commit 14622cfccfaec931b5937c5172d661de0ed69861-dirty
author | anmoljh |
---|---|
date | Tue, 05 Jun 2018 04:09:15 -0400 |
parents | b4d2524e79ab |
children |
rev | line source |
---|---|
0
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
1 <tool id="feature_selection" name="Feature Selector" version="1.0"> |
1
f3aeeb15d4cc
planemo upload commit 14622cfccfaec931b5937c5172d661de0ed69861-dirty
anmoljh
parents:
0
diff
changeset
|
2 |
f3aeeb15d4cc
planemo upload commit 14622cfccfaec931b5937c5172d661de0ed69861-dirty
anmoljh
parents:
0
diff
changeset
|
3 <description>selects best features subset</description> |
0
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
4 |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
5 <requirements> |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
6 <requirement type="package" version="3.2.1">R</requirement> |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
7 <requirement type="package" version="1.0">carettools</requirement> |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
8 </requirements> |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
9 |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
10 <stdio> |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
11 <exit_code range="1:" /> |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
12 </stdio> |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
13 |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
14 <command interpreter="Rscript">feature_selection.R $input $profile $finalset $function1 $resampling $repeat $number $corcutoff $SAMPLING \${GALAXY_SLOTS:-1} >/dev/null 2>&1 </command> |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
15 |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
16 <inputs> |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
17 <param name="input" type="data" format="rdata" label="Select input data file" help="input .RData file" /> |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
18 <param name="SAMPLING" type="select" label="Select Sampling Method for imbalanced data" help="Default is no sampling. You may choose downsample or upsample." > |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
19 <option value="garBage" selected="true">No Sampling</option> |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
20 <option value="downsampling">downsample</option> |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
21 <option value="upsampling">upsample</option> |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
22 </param> |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
23 <param name="function1" type="select" display="radio" label="Select appropriate function for algorithm" > |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
24 <option value="rfFuncs" selected="true">random forest based function </option> |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
25 <option value="lmFuncs">linear model based function</option> |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
26 <option value="treebagFuncs">treebag(CART) based function</option> |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
27 <option value="nbFuncs">naive Bayes based function</option> |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
28 </param> |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
29 |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
30 <param name="corcutoff" type="float" value= "0.8" min="0.0" max = "1.0" label="Select correlation cutoff" help="Values between 0 and 1. Fields with correlation above the cutoff value are removed from the data." /> |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
31 <param name="resampling" type="select" label="Select appropriate resampling method" > |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
32 <option value="repeatedcv" selected="true">repeatedcv </option> |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
33 <option value="boot">boot</option> |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
34 <option value="cv">cv</option> |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
35 <option value="boot632">boot632</option> |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
36 </param> |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
37 |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
38 <param name="repeat" type="select" label="Set Number of times to repeat" help="default is 3 "> |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
39 <option value="3" selected="true">3</option> |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
40 <option value="5">5</option> |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
41 <option value="7">7</option> |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
42 <option value="10">10</option> |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
43 </param> |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
44 <param name="number" type="select" label="Set Number of times Resample" help="default is 10"> |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
45 <option value="10" selected="true">10</option> |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
46 <option value="5">5</option> |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
47 <option value="15">15</option> |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
48 <option value="20">20</option> |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
49 <option value="25">25</option> |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
50 </param> |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
51 </inputs> |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
52 |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
53 <outputs> |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
54 <data format="data" name="profile" label="$function1-profile" /> |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
55 <data format="rdata" name="finalset" label="Selected_feature.RData "/> |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
56 </outputs> |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
57 |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
58 <tests> |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
59 <test> |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
60 <param name="input" value="testinput.RData"/> |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
61 <param name="function1" value="rfFuncs" /> |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
62 <param name="corcutoff" value="0.6" /> |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
63 <param name="resampling" value="repeatedcv" /> |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
64 <param name="repeat" value="1" /> |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
65 <param name="number" value="5" /> |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
66 <param name="SAMPLING" value="garb" /> |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
67 <param name="cores" value="1" /> |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
68 <output name="profile" file="rfprofile.RData" compare="sim_size" delta="2000000" /> |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
69 <output name="finalset" file="selected_fet.RData" compare="sim_size" delta="2000000"/> |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
70 </test> |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
71 </tests> |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
72 |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
73 <help> |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
74 |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
75 .. class:: infomark |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
76 |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
77 **RFE based feature selection for classification and regression** |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
78 |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
79 Input file must be an RData file obtained by converting a csv file into RData. |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
80 |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
81 The output "Selected_feature.RData" file is used for model building purposes, while the profile |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
82 |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
83 represents the feature selection model. |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
84 |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
85 A correlation cutoff value is desired for choosing independent variables. For example, |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
86 |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
87 Cutoff value = 0.8 removes all descriptors sharing equal or higher correlation values. |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
88 |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
89 User may choose various resampling methods in combination with repeats and times of resample. |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
90 |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
91 </help> |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
92 |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
93 |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
94 |
b4d2524e79ab
planemo upload commit a1f4dd8eb560c649391ada1a6bb9505893a35272
anmoljh
parents:
diff
changeset
|
95 </tool> |