annotate regionFitness.xml @ 0:4f8e15e25c79 draft

Uploaded
author antmarge
date Tue, 28 Mar 2017 10:45:08 -0400
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
1 <tool id="regionFitness" name="Region Fitness" version="0.1.0">
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
2
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
3 <!-- Margaret Antonio 17.01.08 -->
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
4
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
5 <requirements>
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
6 <!--<requirement type="set_environment">LINKYX_PATH</requirement>-->
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
7 <requirement type="package" version="5.18.1">perl</requirement>
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
8 <requirement type="package" version="0.25">perl_list_binarysearch</requirement>
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
9 <requirement type="package" version="0.12">perl_data_random</requirement>
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
10 </requirements>
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
11
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
12 <description>assess fitness effect of mutations in a region (sliding window or custom)</description>
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
13
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
14 <command interpreter="perl">
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
15 regionFitness.pl
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
16 -f $fasta
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
17 -r $ref_genome
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
18 -c $cutoff
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
19 -n $run
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
20 -m $max
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
21 #if $region.define == "c":
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
22 -u $region.custom
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
23 #end if
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
24 #if $region.define == "s":
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
25 -size $region.size
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
26 -step $region.step
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
27 #end if
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
28 #if $weight.algorithm == "yes":
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
29 -w
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
30 -wc $weight.ceiling
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
31 #end if
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
32
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
33 -f1 $allTAsites
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
34 -f2 $nullDist
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
35 -f3 $slidingWindows
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
36 -f4 $fitWindowscsv
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
37 -f5 $fitWindowswig
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
38 -f6 $fitWindowstxt
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
39
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
40 $input
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
41 #for $a in $additionalcsv
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
42 ${a.input2}
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
43 #end for
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
44
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
45 </command>
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
46
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
47 <inputs>
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
48 <param name="input" type="data" label="CSV Fitness File(s)"/>
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
49 <repeat name="additionalcsv" title="Additional csv fitness file(s)">
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
50 <param name="input2" type="data" label="Select" />
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
51 </repeat>
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
52 <param format="fasta" name="fasta" type="data" label="Fasta file"/>
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
53 <param name="ref_genome" type="data" label="GenBank reference genome"/>
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
54
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
55 <conditional name="region">
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
56 <param name="define" type="select" label="Define regions: custom or sliding?">
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
57 <option value="s">Sliding Windows</option>
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
58 <option value="c">Custom</option>
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
59 </param>
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
60 <when value="s">
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
61 <param name="size" type="integer" value="500" label="Sliding window size"/>
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
62 <param name="step" type="integer" value="10" label="Sliding window intervals"/>
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
63 </when>
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
64 <when value="c">
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
65 <param name="custom" type="data" label="File with custom regions" />
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
66 </when>
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
67 </conditional>
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
68
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
69 <conditional name="weight">
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
70 <param name="algorithm" type="select" label="Use weighted algorithms?">
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
71 <option value="yes">Yes</option>
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
72 <option value="no">No</option>
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
73 </param>
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
74 <when value = "yes">
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
75 <param name="ceiling" type="integer" value="50" label="Weight ceiling"/>
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
76 </when>
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
77 </conditional>
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
78
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
79 <param name="cutoff" type="integer" value="10" label="Cutoff"/>
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
80 <param name="max" type="integer" value="100" label="Highest # insertions in region"/>
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
81 <param name="run" type="text" value="run1" label="Name of run (will be appended to output files)"/>
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
82
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
83 </inputs>
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
84
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
85 <outputs>
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
86 <data format="txt" name="allTAsites" label="${run}_allTAsites" />
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
87 <data format="txt" name="unmatched" label="${run}_unmatched"/>
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
88 <data format="txt" name="nullDist" label="${run}_nullDist"/>
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
89 <data format="csv" name="slidingWindows" label="${run}_slidingWindows"/>
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
90 <data format="csv" name="fitWindowscsv" label="${run}_fitWindows_csv"/>
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
91 <data format="wig" name="fitWindowswig" label="${run}_fitWindows_wig"/>
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
92 <data format="txt" name="fitWindowstxt" label="${run}_fitWindows_txt"/>
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
93 </outputs>
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
94
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
95 <help>
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
96 **Tool Description**
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
97
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
98 This tool takes a non-gene-centric approach to assessing importance of regions (user defined or sliding windows) to organismal fitness.
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
99
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
100 **Options**
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
101
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
102 *The csv fitness file(s)*: These are the csv (comma separated values) files containing the fitness values that will be used in downstream analyses. Since they should have been produced by the "Calculate Fitness" tool, each line besides the header should represent the following information for an insertion location: position,strand,count_1,count_2,ratio,mt_freq_t1,mt_freq_t2,pop_freq_t1,pop_freq_t2,gene,D,W,nW
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
103
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
104 *Fasta file*: the fasta file for the genome of the organism
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
105
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
106 *GenBank reference genome*: the reference genome of the organism you are working with, which needs to be in standard GenBank format. For more on that format, see the GenBank website.
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
107
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
108 *Region definition*: Define the regions by a custom file or by sliding windows at a set size and step. If using the custom region option, provide a tab-delimited file with start and end coordinates of each region, one region per line. If choosing the sliding window option, specify the size of the window over which assessments will be made and the step, i.e. how far the sliding window advances between assessments.
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
109
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
110 *Max*: The maximum number of insertions expected in a window. This is used for creating a null distribution against which the significance of regional essentiality is assessed. An error will be produced if this value is lower than the actual maximum number of insertions in a window. Run the Data Overview tool to find the real maximum number of insertions in a window. This option will be removed in a later version, when the value will be determined from the data.
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
111
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
112 *Weight ceiling*: This value lets you set a weight ceiling for the weights of fitness values. It's only relevant if you're using weighted algorithms.
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
113
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
114 *Cutoff*: This value lets you ignore the fitness scores of any insertion locations whose average count (the sum of the counts from t1 and t2, divided by 2) is less than it.
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
115
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
116 *Run name*: The name of the run, to be appended to the end of every output file.
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
117
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
118
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
119 </help>
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
120
4f8e15e25c79 Uploaded
antmarge
parents:
diff changeset
121 </tool>