Mercurial > repos > iuc > stringtie
comparison stringtie.xml @ 10:c84d44519b2e draft
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/stringtie commit b78c073ab258852730fc9af1cd4862d571459103
author | iuc |
---|---|
date | Tue, 04 Apr 2017 12:58:27 -0400 |
parents | e3f369973054 |
children | 6e45b443ef1f |
comparison
equal
deleted
inserted
replaced
9:1f23fc7df25c | 10:c84d44519b2e |
---|---|
1 <tool id="stringtie" name="StringTie" version="1.2.3"> | 1 <tool id="stringtie" name="StringTie" version="1.3.3"> |
2 <description>transcript assembly and quantification</description> | 2 <description>transcript assembly and quantification</description> |
3 <macros> | 3 <macros> |
4 <import>macros.xml</import> | 4 <import>macros.xml</import> |
5 </macros> | 5 </macros> |
6 <expand macro="requirements" /> | 6 <expand macro="requirements" /> |
7 <expand macro="stdio" /> | 7 <expand macro="stdio" /> |
8 <expand macro="version_command" /> | 8 <expand macro="version_command" /> |
9 <command> | 9 <command> |
10 <![CDATA[ | 10 <![CDATA[ |
11 mkdir -p ./special_de_output/sample1/ && | |
12 #if str($guide.use_guide) == 'yes': | |
13 ln -s '$guide.guide_gff' ./special_de_output/sample1/guide.gtf && | |
14 #end if | |
15 | |
11 #if $input_bam.metadata.ftype == 'sam': | 16 #if $input_bam.metadata.ftype == 'sam': |
12 samtools sort -@ \${GALAXY_SLOTS:-1} "$input_bam" | stringtie | 17 samtools sort -@ \${GALAXY_SLOTS:-1} '$input_bam' | stringtie |
13 #else | 18 #else |
14 stringtie "$input_bam" | 19 stringtie '$input_bam' |
15 #end if | 20 #end if |
21 | |
16 -o "$output_gtf" | 22 -o "$output_gtf" |
17 -p "\${GALAXY_SLOTS:-1}" | 23 -p "\${GALAXY_SLOTS:-1}" |
18 #if str($guide.use_guide) == 'yes': | 24 #if str($guide.use_guide) == 'yes': |
19 -C "$coverage" -G "$guide.guide_gff" $guide.input_estimation | 25 -C '$coverage' |
20 #if $guide.output_ballgown: | 26 -G '$guide.guide_gff' |
21 -b . | 27 $guide.input_estimation |
28 #if $guide.special_outputs != 'no': | |
29 -b ./special_de_output/sample1/ | |
22 #end if | 30 #end if |
23 #end if | 31 #end if |
24 #if str($option_set.options) == 'advanced': | 32 #if str($option_set.options) == 'advanced': |
25 -l "$option_set.name_prefix" | 33 -l '$option_set.name_prefix' |
26 -f "$option_set.fraction" | 34 -f '$option_set.fraction' |
27 -m "$option_set.min_tlen" | 35 -m '$option_set.min_tlen' |
28 -a "$option_set.min_anchor_len" | 36 -a '$option_set.min_anchor_len' |
29 -j "$option_set.min_anchor_cov" | 37 -j '$option_set.min_anchor_cov' |
30 -c "$option_set.min_bundle_cov" | 38 -c '$option_set.min_bundle_cov' |
31 -g "$option_set.bdist" | 39 -g '$option_set.bdist' |
32 -M "$option_set.bundle_fraction" $option_set.sensitive $option_set.disable_trimming $option_set.multi_mapping | 40 -M '$option_set.bundle_fraction' $option_set.sensitive $option_set.disable_trimming $option_set.multi_mapping |
33 #if $option_set.abundance_estimation: | 41 #if $option_set.abundance_estimation: |
34 -A "$gene_abundance_estimation" | 42 -A "$gene_abundance_estimation" |
35 #end if | 43 #end if |
36 #if str($option_set.omit_sequences).strip() != "": | 44 #if str($option_set.omit_sequences).strip() != "": |
37 -x "$option_set.omit_sequences" | 45 -x "$option_set.omit_sequences" |
38 #end if | 46 #end if |
39 #end if | 47 #end if |
48 | |
49 #if str($guide.use_guide) == 'yes': | |
50 #if $guide.special_outputs.special_outputs_select == 'deseq2': | |
51 && | |
52 prepDE.py | |
53 -i ./special_de_output/ | |
54 -g gene_cout_matrix.tsv | |
55 -t transcripts_count_matrix.tsv | |
56 -l $guide.special_outputs.read_length | |
57 #if str($option_set.options) == 'advanced': | |
58 -s '$option_set.name_prefix' | |
59 #end if | |
60 #if $guide.special_outputs.clustering: | |
61 -c | |
62 --legend ./legend.tsv | |
63 | |
64 && | |
65 sed -i.bak 's/,/\t/g' ./legend.tsv | |
66 | |
67 #end if | |
68 && | |
69 sed -i.bak 's/,/\t/g' transcripts_count_matrix.tsv | |
70 && | |
71 sed -i.bak 's/,/\t/g' gene_cout_matrix.tsv | |
72 #end if | |
73 #end if | |
74 | |
40 ]]> | 75 ]]> |
41 </command> | 76 </command> |
42 <inputs> | 77 <inputs> |
43 <param format="sam,bam" label="Mapped reads to assemble transcripts from" name="input_bam" type="data" /> | 78 <param format="sam,bam" label="Mapped reads to assemble transcripts from" name="input_bam" type="data" /> |
44 <conditional name="guide"> | 79 <conditional name="guide"> |
45 <param label="Use GFF file to guide assembly" name="use_guide" type="select"> | 80 <param label="Use GFF file to guide assembly" name="use_guide" type="select"> |
46 <option value="yes">Use GFF</option> | 81 <option value="yes">Use GFF/GTF</option> |
47 <option selected="True" value="no">Do not use GFF</option> | 82 <option selected="True" value="no">Do not use GFF/GTF</option> |
48 </param> | 83 </param> |
49 <when value="no" /> | 84 <when value="no" /> |
50 <when value="yes"> | 85 <when value="yes"> |
51 <param argument="-G" format="gtf,gff3" help="" label="Reference annotation to use for guiding the assembly process" name="guide_gff" type="data" /> | 86 <param argument="-G" format="gtf,gff3" name="guide_gff" type="data" |
52 <param argument="-e" falsevalue="" help="" label="Perform abundance estimation only of input transcripts" name="input_estimation" truevalue="-e" type="boolean" /> | 87 help="" label="Reference annotation to use for guiding the assembly process" /> |
53 <param argument="-b" falsevalue="" help="" label="Output additional files for use in Ballgown" name="output_ballgown" truevalue="-b" type="boolean" /> | 88 <param argument="-e" name="input_estimation" truevalue="-e" type="boolean" falsevalue="" |
89 help="" label="Perform abundance estimation only of input transcripts" /> | |
90 <conditional name="special_outputs"> | |
91 <param label="Output additional files for use in..." name="special_outputs_select" type="select"> | |
92 <option value="ballgown">Ballgown</option> | |
93 <option selected="True" value="deseq2">DESeq2/EdgeR</option> | |
94 <option value="no">No addional output</option> | |
95 </param> | |
96 <when value="ballgown" /> | |
97 <when value="deseq2"> | |
98 <param label="Average read length" name="read_length" type="integer" value="75" help="" /> | |
99 <param label="Whether to cluster genes that overlap with different gene IDs" | |
100 name="clustering" | |
101 truevalue="--cluster" | |
102 type="boolean" help="ignoring ones with geneID pattern" falsevalue="" /> | |
103 </when> | |
104 </conditional> | |
54 </when> | 105 </when> |
55 </conditional> | 106 </conditional> |
56 <conditional name="option_set"> | 107 <conditional name="option_set"> |
57 <param help="" label="Options" name="options" type="select"> | 108 <param help="" label="Options" name="options" type="select"> |
58 <option selected="True" value="default">Use defaults</option> | 109 <option selected="True" value="default">Use defaults</option> |
59 <option value="advanced">Specify advanced options</option> | 110 <option value="advanced">Specify advanced options</option> |
60 </param> | 111 </param> |
61 <when value="default" /> | 112 <when value="default" /> |
62 <when value="advanced"> | 113 <when value="advanced"> |
63 <param argument="-t" falsevalue="" help="" label="Disable trimming of predicted transcripts based on coverage" name="disable_trimming" truevalue="-t" type="boolean" /> | 114 <param argument="-t" falsevalue="" name="disable_trimming" truevalue="-t" type="boolean" |
64 <param argument="-S" falsevalue="" help="" label="Increase sensitivity" name="sensitive" truevalue="-S" type="boolean" /> | 115 label="Disable trimming of predicted transcripts based on coverage" /> |
65 <param argument="-l" help="" label="Name prefix for output transcripts" name="name_prefix" type="text" value="STRG" /> | 116 <param argument="-S" falsevalue="" |
66 <param argument="-f" help="" label="Minimum isoform fraction" max="1.0" min="0.0" name="fraction" type="float" value="0.15" /> | 117 label="Increase sensitivity" name="sensitive" truevalue="-S" type="boolean" /> |
67 <param argument="-m" help="" label="Minimum assembled transcript length" name="min_tlen" type="integer" value="200" /> | 118 <param argument="-l" label="Name prefix for output transcripts" name="name_prefix" type="text" value="STRG" /> |
68 <param argument="-a" help="" label="Minimum anchor length for junctions" name="min_anchor_len" type="integer" value="10" /> | 119 <param argument="-f" label="Minimum isoform fraction" max="1.0" min="0.0" name="fraction" type="float" value="0.15" /> |
69 <param argument="-j" help="" label="Minimum junction coverage" name="min_anchor_cov" type="integer" value="1" /> | 120 <param argument="-m" label="Minimum assembled transcript length" name="min_tlen" type="integer" value="200" /> |
70 <param argument="-c" help="" label="Minimum bundle reads per bp coverage to consider for assembly" name="min_bundle_cov" type="integer" value="2" /> | 121 <param argument="-a" label="Minimum anchor length for junctions" name="min_anchor_len" type="integer" value="10" /> |
71 <param argument="-g" help="" label="Gap between read mappings triggering a new bundle" name="bdist" type="integer" value="50" /> | 122 <param argument="-j" label="Minimum junction coverage" name="min_anchor_cov" type="integer" value="1" /> |
72 <param argument="-M" help="" label="Fraction of bundle allowed to be covered by multi-hit reads" name="bundle_fraction" type="float" value="0.95" /> | 123 <param argument="-c" label="Minimum bundle reads per bp coverage to consider for assembly" name="min_bundle_cov" type="integer" value="2" /> |
73 <param argument="-x" help="e.g. chrM,chrX" label="Do not assemble any transcripts on these reference sequence(s)" name="omit_sequences" type="text" value="" /> | 124 <param argument="-g" label="Gap between read mappings triggering a new bundle" name="bdist" type="integer" value="50" /> |
74 <param argument="-A" falsevalue="" help="" label="Additional gene abundance estimation output file" name="abundance_estimation" truevalue="-A" type="boolean" /> | 125 <param argument="-M" label="Fraction of bundle allowed to be covered by multi-hit reads" name="bundle_fraction" type="float" value="0.95" /> |
75 <param argument="-u" falsevalue="" help="" label="Disable multi-mapping correction" name="multi_mapping" truevalue="-u" type="boolean" /> | 126 <param argument="-x" name="omit_sequences" type="text" value="" |
127 help="e.g. chrM,chrX" label="Do not assemble any transcripts on these reference sequence(s)" /> | |
128 <param argument="-A" falsevalue="" name="abundance_estimation" truevalue="-A" type="boolean" | |
129 label="Additional gene abundance estimation output file" /> | |
130 <param argument="-u" falsevalue="" truevalue="-u" type="boolean" | |
131 label="Disable multi-mapping correction" name="multi_mapping" /> | |
76 </when> | 132 </when> |
77 </conditional> | 133 </conditional> |
78 </inputs> | 134 </inputs> |
79 <outputs> | 135 <outputs> |
80 <data format="gtf" label="${tool.name} on ${on_string}: Assembled transcripts" name="output_gtf" /> | 136 <data format="gtf" label="${tool.name} on ${on_string}: Assembled transcripts" name="output_gtf" /> |
82 <filter>option_set['options'] == 'advanced' and option_set['abundance_estimation']</filter> | 138 <filter>option_set['options'] == 'advanced' and option_set['abundance_estimation']</filter> |
83 </data> | 139 </data> |
84 <data format="gff3" label="${tool.name} on ${on_string}: Coverage" name="coverage"> | 140 <data format="gff3" label="${tool.name} on ${on_string}: Coverage" name="coverage"> |
85 <filter>guide['use_guide'] == 'yes'</filter> | 141 <filter>guide['use_guide'] == 'yes'</filter> |
86 </data> | 142 </data> |
87 <data format="tabular" from_work_dir="e_data.ctab" label="${tool.name} on ${on_string}: exon-level expression measurements" name="exon_expression"> | 143 <data format="tabular" from_work_dir="special_de_output/sample1/e_data.ctab" |
88 <filter>guide['use_guide'] == 'yes' and guide['output_ballgown']</filter> | 144 label="${tool.name} on ${on_string}: exon-level expression measurements" name="exon_expression"> |
89 </data> | 145 <filter>guide['use_guide'] == 'yes' and guide['special_outputs']['special_outputs_select'] == 'ballgown'</filter> |
90 <data format="tabular" from_work_dir="i_data.ctab" label="${tool.name} on ${on_string}: intron-level expression measurements" name="intron_expression"> | 146 </data> |
91 <filter>guide['use_guide'] == 'yes' and guide['output_ballgown']</filter> | 147 <data format="tabular" from_work_dir="special_de_output/sample1/i_data.ctab" |
92 </data> | 148 label="${tool.name} on ${on_string}: intron-level expression measurements" name="intron_expression"> |
93 <data format="tabular" from_work_dir="t_data.ctab" label="${tool.name} on ${on_string}: transcript-level expression measurements" name="transcript_expression"> | 149 <filter>guide['use_guide'] == 'yes' and guide['special_outputs']['special_outputs_select'] == 'ballgown'</filter> |
94 <filter>guide['use_guide'] == 'yes' and guide['output_ballgown']</filter> | 150 </data> |
95 </data> | 151 <data format="tabular" from_work_dir="special_de_output/sample1/t_data.ctab" |
96 <data format="tabular" from_work_dir="e2t.ctab" label="${tool.name} on ${on_string}: exon to transcript mapping" name="exon_transcript_mapping"> | 152 label="${tool.name} on ${on_string}: transcript-level expression measurements" name="transcript_expression"> |
97 <filter>guide['use_guide'] == 'yes' and guide['output_ballgown']</filter> | 153 <filter>guide['use_guide'] == 'yes' and guide['special_outputs']['special_outputs_select'] == 'ballgown'</filter> |
98 </data> | 154 </data> |
99 <data format="tabular" from_work_dir="i2t.ctab" label="${tool.name} on ${on_string}: intron to transcript mapping" name="intron_transcript_mapping"> | 155 <data format="tabular" from_work_dir="special_de_output/sample1/e2t.ctab" |
100 <filter>guide['use_guide'] == 'yes' and guide['output_ballgown']</filter> | 156 label="${tool.name} on ${on_string}: exon to transcript mapping" name="exon_transcript_mapping"> |
157 <filter>guide['use_guide'] == 'yes' and guide['special_outputs']['special_outputs_select'] == 'ballgown'</filter> | |
158 </data> | |
159 <data format="tabular" from_work_dir="special_de_output/sample1/i2t.ctab" | |
160 label="${tool.name} on ${on_string}: intron to transcript mapping" name="intron_transcript_mapping"> | |
161 <filter>guide['use_guide'] == 'yes' and guide['special_outputs']['special_outputs_select'] == 'ballgown'</filter> | |
162 </data> | |
163 | |
164 <data format="tabular" from_work_dir="gene_cout_matrix.tsv" | |
165 label="${tool.name} on ${on_string}: Gene counts" name="gene_counts"> | |
166 <filter>guide['use_guide'] == 'yes' and guide['special_outputs']['special_outputs_select'] == 'deseq2'</filter> | |
167 </data> | |
168 <data format="tabular" from_work_dir="transcripts_count_matrix.tsv" | |
169 label="${tool.name} on ${on_string}: Transcript counts" name="transcript_counts"> | |
170 <filter>guide['use_guide'] == 'yes' and guide['special_outputs']['special_outputs_select'] == 'deseq2'</filter> | |
171 </data> | |
172 <data format="tabular" from_work_dir="legend.tsv" | |
173 label="${tool.name} on ${on_string}: legend" name="legend"> | |
174 <filter>guide['use_guide'] == 'yes' and guide['special_outputs']['special_outputs_select'] == 'deseq2' and guide['special_outputs']['clustering'] is True</filter> | |
101 </data> | 175 </data> |
102 </outputs> | 176 </outputs> |
103 <tests> | 177 <tests> |
104 <test> | 178 <test> |
105 <param ftype="bam" name="input_bam" value="stringtie_in1.bam" /> | 179 <param ftype="bam" name="input_bam" value="stringtie_in1.bam" /> |
115 <output file="stringtie_out2.gtf" ftype="gtf" lines_diff="2" name="output_gtf" /> | 189 <output file="stringtie_out2.gtf" ftype="gtf" lines_diff="2" name="output_gtf" /> |
116 </test> | 190 </test> |
117 <test> | 191 <test> |
118 <param ftype="bam" name="input_bam" value="stringtie_in1.bam" /> | 192 <param ftype="bam" name="input_bam" value="stringtie_in1.bam" /> |
119 <param name="use_guide" value="yes" /> | 193 <param name="use_guide" value="yes" /> |
194 <param name="special_outputs_select" value="no" /> | |
120 <param name="guide_gff" value="stringtie_in.gtf" /> | 195 <param name="guide_gff" value="stringtie_in.gtf" /> |
121 <param name="options" value="default" /> | 196 <param name="options" value="default" /> |
122 <output file="stringtie_out3.gtf" ftype="gtf" lines_diff="2" name="output_gtf" /> | 197 <output file="stringtie_out3.gtf" ftype="gtf" lines_diff="2" name="output_gtf" /> |
123 </test> | 198 </test> |
124 <test> | 199 <test> |
125 <param ftype="bam" name="input_bam" value="stringtie_in1.bam" /> | 200 <param ftype="bam" name="input_bam" value="stringtie_in1.bam" /> |
126 <param name="use_guide" value="yes" /> | 201 <param name="use_guide" value="yes" /> |
202 <param name="special_outputs_select" value="no" /> | |
127 <param name="guide_gff" value="stringtie_in.gtf" /> | 203 <param name="guide_gff" value="stringtie_in.gtf" /> |
128 <param name="options" value="advanced" /> | 204 <param name="options" value="advanced" /> |
129 <param name="fraction" value="0.17" /> | 205 <param name="fraction" value="0.17" /> |
130 <output file="stringtie_out4.gtf" ftype="gtf" lines_diff="2" name="output_gtf" /> | 206 <output file="stringtie_out4.gtf" ftype="gtf" lines_diff="2" name="output_gtf" /> |
131 </test> | 207 </test> |
132 <test> | 208 <test> |
133 <param ftype="bam" name="input_bam" value="stringtie_in1.bam" /> | 209 <param ftype="bam" name="input_bam" value="stringtie_in1.bam" /> |
134 <param name="use_guide" value="yes" /> | 210 <param name="use_guide" value="yes" /> |
135 <param name="output_ballgown" value="yes" /> | 211 <param name="special_outputs_select" value="ballgown" /> |
136 <param name="guide_gff" value="stringtie_in.gtf" /> | 212 <param name="guide_gff" value="stringtie_in.gtf" /> |
137 <param name="options" value="default" /> | 213 <param name="options" value="default" /> |
138 <output file="ballgown/e_data.ctab" ftype="tabular" name="exon_expression" /> | 214 <output file="./ballgown/e_data.ctab" ftype="tabular" name="exon_expression" /> |
139 <output file="ballgown/i_data.ctab" ftype="tabular" name="intron_expression" /> | 215 <output file="./ballgown/i_data.ctab" ftype="tabular" name="intron_expression" /> |
140 <output file="ballgown/t_data.ctab" ftype="tabular" name="transcript_expression" /> | 216 <output file="./ballgown/t_data.ctab" ftype="tabular" name="transcript_expression" /> |
141 <output file="ballgown/e2t.ctab" ftype="tabular" name="exon_transcript_mapping" /> | 217 <output file="./ballgown/e2t.ctab" ftype="tabular" name="exon_transcript_mapping" /> |
142 <output file="ballgown/i2t.ctab" ftype="tabular" name="intron_transcript_mapping" /> | 218 <output file="./ballgown/i2t.ctab" ftype="tabular" name="intron_transcript_mapping" /> |
143 <output file="stringtie_out5.gtf" ftype="gtf" lines_diff="2" name="output_gtf" /> | 219 <output file="stringtie_out5.gtf" ftype="gtf" lines_diff="2" name="output_gtf" /> |
220 <output file="stringtie_out_coverage.gtf" ftype="gff3" name="coverage" /> | |
221 </test> | |
222 <test> | |
223 <param ftype="bam" name="input_bam" value="stringtie_in1.bam" /> | |
224 <param name="use_guide" value="yes" /> | |
225 <param name="special_outputs_select" value="deseq2" /> | |
226 <param name="input_estimation" value="True" /> | |
227 <param name="guide_gff" value="stringtie_in.gtf" /> | |
228 <param name="options" value="default" /> | |
229 <param name="clustering" value="True" /> | |
230 <output file="./deseq2/gene_counts.tsv" ftype="tabular" lines_diff="2" name="gene_counts" /> | |
231 <output file="./deseq2/transcript_counts.tsv" ftype="tabular" name="transcript_counts" /> | |
232 <output file="./deseq2/legend.tsv" ftype="tabular" name="legend" /> | |
233 <output file="stringtie_out6.gtf" ftype="gtf" lines_diff="2" name="output_gtf" /> | |
144 <output file="stringtie_out_coverage.gtf" ftype="gff3" name="coverage" /> | 234 <output file="stringtie_out_coverage.gtf" ftype="gff3" name="coverage" /> |
145 </test> | 235 </test> |
146 <test> | 236 <test> |
147 <param ftype="bam" name="input_bam" value="stringtie_in1.bam" /> | 237 <param ftype="bam" name="input_bam" value="stringtie_in1.bam" /> |
148 <param name="use_guide" value="yes" /> | 238 <param name="use_guide" value="yes" /> |
149 <param name="guide_gff" value="stringtie_in.gtf" /> | 239 <param name="guide_gff" value="stringtie_in.gtf" /> |
150 <param name="options" value="advanced" /> | 240 <param name="options" value="advanced" /> |
151 <param name="fraction" value="0.17" /> | 241 <param name="fraction" value="0.17" /> |
152 <param name="abundance_estimation" value="True" /> | 242 <param name="abundance_estimation" value="True" /> |
153 <output file="stringtie_out4.gtf" ftype="gtf" lines_diff="2" name="output_gtf" /> | 243 <output file="stringtie_out4.gtf" ftype="gtf" lines_diff="2" name="output_gtf" /> |
154 <output file="stringtie_out6.gtf" ftype="gtf" lines_diff="2" name="gene_abundance_estimation" /> | 244 <output file="stringtie_out7.gtf" ftype="gtf" lines_diff="2" name="gene_abundance_estimation" /> |
155 </test> | 245 </test> |
156 <test> | 246 <test> |
157 <param ftype="bam" name="input_bam" value="stringtie_in1.bam" /> | 247 <param ftype="bam" name="input_bam" value="stringtie_in1.bam" /> |
158 <param name="use_guide" value="yes" /> | 248 <param name="use_guide" value="yes" /> |
249 <param name="special_outputs_select" value="no" /> | |
159 <param name="guide_gff" value="stringtie_in.gtf" /> | 250 <param name="guide_gff" value="stringtie_in.gtf" /> |
160 <param name="options" value="advanced" /> | 251 <param name="options" value="advanced" /> |
161 <param name="fraction" value="0.15" /> | 252 <param name="fraction" value="0.15" /> |
162 <param name="c" value="test_chromosome" /> | 253 <param name="c" value="test_chromosome" /> |
163 <output file="stringtie_out7.gtf" ftype="gtf" lines_diff="2" name="output_gtf" /> | 254 <output file="stringtie_out8.gtf" ftype="gtf" lines_diff="2" name="output_gtf" /> |
164 </test> | 255 </test> |
165 </tests> | 256 </tests> |
166 <help> | 257 <help> |
167 <![CDATA[ | 258 <![CDATA[ |
168 | 259 |