comparison mapper.xml @ 4:dbbe92348c7a draft default tip

planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/mirdeep2/mirdeep2_mapper commit 04c75332ac618b43ce5c3f307f7866e97147e865
author rnateam
date Thu, 05 Apr 2018 08:55:27 -0400
parents a8d24f4b6d95
children
comparison
equal deleted inserted replaced
3:a8d24f4b6d95 4:dbbe92348c7a
1 <tool id="rbc_mirdeep2_mapper" name="MiRDeep2 Mapper" version="2.0.0"> 1 <tool id="rbc_mirdeep2_mapper" name="MiRDeep2 Mapper" version="2.0.0.8.1">
2 <description>process and map reads to a reference genome</description> 2 <description>process and map reads to a reference genome</description>
3 <macros> 3 <macros>
4 <macro name="map_params"> 4 <macro name="map_params">
5 <conditional name="refGenomeSource"> 5 <conditional name="refGenomeSource">
6 <param name="genomeSource" type="select" label="Will you select a reference genome from your history or use a built-in index?" help="Map to genome. (-p)"> 6 <param name="genomeSource" type="select" label="Will you select a reference genome from your history or use a built-in index?" help="Map to genome. (-p)">
26 </macro> 26 </macro>
27 </macros> 27 </macros>
28 <requirements> 28 <requirements>
29 <requirement type="package" version="2.0.0.8">mirdeep2</requirement> 29 <requirement type="package" version="2.0.0.8">mirdeep2</requirement>
30 </requirements> 30 </requirements>
31 <stdio> 31 <command detect_errors="aggressive">
32 <!-- Anything other than zero is an error -->
33 <exit_code range="1:" />
34 <exit_code range=":-1" />
35 <!-- In case the return code has not been set propery check stderr too -->
36 <regex match="Error:" />
37 <regex match="Exception:" />
38 </stdio>
39 <command>
40 <![CDATA[ 32 <![CDATA[
41
42 #if $operation.collapse_map == "collapse_and_map" or $operation.collapse_map == "only_map" 33 #if $operation.collapse_map == "collapse_and_map" or $operation.collapse_map == "only_map"
43 #if $operation.refGenomeSource.genomeSource == "history" 34 #if $operation.refGenomeSource.genomeSource == "history"
44 bowtie-build '$operation.refGenomeSource.ownFile' custom_bowtie_indices && 35 bowtie-build '$operation.refGenomeSource.ownFile' custom_bowtie_indices &&
45 #end if 36 #end if
46 #end if 37 #end if
47 38
48 mapper.pl 39 mapper.pl
49 40
50 '$reads' 41 #if $input.type == "single":
51 42 '$input.reads'
52 #if $reads.extension.startswith("fasta") 43
53 -c 44 #if $input.reads.extension.startswith("fasta")
54 #else if $reads.extension.startswith("fastq") 45 -c
55 -e 46 #else if $input.reads.extension.startswith("fastq")
56 -h 47 -e
48 -h
49 #end if
50 #else:
51 '$samples' -d
52
53 #if $input.reads_list[0].reads.extension.startswith("fasta")
54 -c
55 #else if $input.reads_list[0].reads.extension.startswith("fastq")
56 -e
57 -h
58 #end if
57 #end if 59 #end if
58 60
59 $remove_non_canon 61 $remove_non_canon
60 62
61 $convert_rna_dna 63 $convert_rna_dna
62 64
63 #if $clip_adapter.clip == "true" 65 #if $clip_adapter.clip == "true"
64 -k $clip_adapter.adapter_seq 66 -k $clip_adapter.adapter_seq
65 #end if 67 #end if
67 -l $discard_short_reads 69 -l $discard_short_reads
68 70
69 #if $operation.collapse_map == "collapse_and_map" or $operation.collapse_map == "only_collapse" 71 #if $operation.collapse_map == "collapse_and_map" or $operation.collapse_map == "only_collapse"
70 -m -s '$output_reads_collapsed' 72 -m -s '$output_reads_collapsed'
71 #end if 73 #end if
72 74
73 #if $operation.collapse_map == "collapse_and_map" or $operation.collapse_map == "only_map" 75 #if $operation.collapse_map == "collapse_and_map" or $operation.collapse_map == "only_map"
74 -p 76 -p
75 77
76 #if $operation.refGenomeSource.genomeSource == "history" 78 #if $operation.refGenomeSource.genomeSource == "history"
77 custom_bowtie_indices 79 custom_bowtie_indices
78 #else 80 #else
79 '$operation.refGenomeSource.index.fields.path' 81 '$operation.refGenomeSource.index.fields.path'
80 #end if 82 #end if
81 $operation.map_mismatch 83 $operation.map_mismatch
82 -r $operation.map_threshold 84 -r $operation.map_threshold
83 85
84 -t '$output_mapping' 86 -t '$output_mapping'
85 #end if 87 #end if
86 88
87 -v -n 89 -v -n
88 ]]> 90 ]]>
89 </command> 91 </command>
92 <configfiles>
93 <configfile name="samples"><![CDATA[#if $input.type == "multiple":
94 #for $r in $input.reads_list:
95 $r.reads $r.sample_name
96 #end for
97 #end if]]></configfile>
98 </configfiles>
90 <inputs> 99 <inputs>
91 <param format="fastq, fasta" name="reads" type="data" optional="false" label="Deep sequencing reads" help="Reads in fastq or FASTA format"/> 100 <conditional name="input">
101 <param name="type" type="select" label="Pool multiple read sets">
102 <option value="single" selected="true">No</option>
103 <option value="multiple">Yes</option>
104 </param>
105 <when value="single">
106 <param format="fastq,fasta" name="reads" type="data" label="Deep sequencing reads" help="Reads in fastq or FASTA format"/>
107 </when>
108 <when value="multiple">
109 <repeat name="reads_list" title="Reads">
110 <param name="sample_name" value="" type="text" label="Sample name" help="Must be a 3 letters/digits code">
111 <validator type="expression" message="The sample name must be a 3 letters/digits code">len(value) == 3 and value.isalnum()</validator>
112 </param>
113 <param format="fastq,fasta" name="reads" type="data" optional="false" label="Deep sequencing reads" help="Reads in fastq or FASTA format"/>
114 </repeat>
115 </when>
116 </conditional>
92 <param name="remove_non_canon" type="boolean" truevalue="-j" falsevalue="" checked="false" label="Remove reads with non-standard nucleotides" help="Remove all entries that have a sequence that contains letters other than a,c,g,t,u,n,A,C,G,T,U,N. (-j)"/> 117 <param name="remove_non_canon" type="boolean" truevalue="-j" falsevalue="" checked="false" label="Remove reads with non-standard nucleotides" help="Remove all entries that have a sequence that contains letters other than a,c,g,t,u,n,A,C,G,T,U,N. (-j)"/>
93 <param name="convert_rna_dna" type="boolean" truevalue="-i" falsevalue="" checked="false" label="Convert RNA to DNA alphabet (to map against genome)" help="(-i)"/> 118 <param name="convert_rna_dna" type="boolean" truevalue="-i" falsevalue="" checked="false" label="Convert RNA to DNA alphabet (to map against genome)" help="(-i)"/>
94 119
95 <conditional name="clip_adapter"> 120 <conditional name="clip_adapter">
96 <param name="clip" type="select" label="Clip 3' Adapter Sequence" help="(-k)"> 121 <param name="clip" type="select" label="Clip 3' Adapter Sequence" help="(-k)">
102 <validator type="regex" message="Adapter can ONLY contain a,c,g,t,u,n,A,C,G,T,U,N">^[ACGTUacgtu]+$</validator> 127 <validator type="regex" message="Adapter can ONLY contain a,c,g,t,u,n,A,C,G,T,U,N">^[ACGTUacgtu]+$</validator>
103 </param> 128 </param>
104 </when> 129 </when>
105 <when value="false"/> 130 <when value="false"/>
106 </conditional> 131 </conditional>
107 132
108 <param name="discard_short_reads" value="18" type="integer" optional="false" label="Discard reads shorter than this length" help="Set to 0 to keep all reads. (-l)"> 133 <param name="discard_short_reads" value="18" type="integer" optional="false" label="Discard reads shorter than this length" help="Set to 0 to keep all reads. (-l)">
109 <validator type="in_range" min="0" message="Minimum value is 0"/> 134 <validator type="in_range" min="0" message="Minimum value is 0"/>
110 </param> 135 </param>
111 136
112 <conditional name="operation"> 137 <conditional name="operation">
113 <param name="collapse_map" type="select" label="Collapse reads and/or Map" help="(-m) and/or (-p)"> 138 <param name="collapse_map" type="select" label="Collapse reads and/or Map" help="(-m) and/or (-p)">
114 <option value="collapse_and_map">Collapse reads and Map</option> 139 <option value="collapse_and_map">Collapse reads and Map</option>
115 <option value="only_map">Map</option> 140 <option value="only_map">Map</option>
116 <option value="only_collapse">Collapse</option> 141 <option value="only_collapse">Collapse</option>
142 </filter> 167 </filter>
143 </data> 168 </data>
144 </outputs> 169 </outputs>
145 <tests> 170 <tests>
146 <test> 171 <test>
147 <param name="reads" value="reads.fa"/> 172 <conditional name="input">
173 <param name="type" value="single"/>
174 <param name="reads" value="reads.fa"/>
175 </conditional>
148 <param name="remove_non_canon" value="True"/> 176 <param name="remove_non_canon" value="True"/>
149 <param name="clip" value="true"/> 177 <param name="clip" value="true"/>
150 <param name="adapter_seq" value="TCGTATGCCGTCTTCTGCTTGT"/> 178 <param name="adapter_seq" value="TCGTATGCCGTCTTCTGCTTGT"/>
151 <param name="discard_short_reads" value="18"/> 179 <param name="discard_short_reads" value="18"/>
152 <param name="collapse_map" value="collapse_and_map"/> 180 <param name="collapse_map" value="collapse_and_map"/>
169 <has_line_matching expression="^.*22\t1\t22\ttcaccgggagaaaaactggtgt\tchrII:11534525-11540624\t22\t3382\t3403.*$"/> 197 <has_line_matching expression="^.*22\t1\t22\ttcaccgggagaaaaactggtgt\tchrII:11534525-11540624\t22\t3382\t3403.*$"/>
170 <has_line_matching expression="^.*25\t1\t25\ttcaccgggtggaaactagcagtggc\tchrII:11534525-11540624\t25\t3060\t3084.*$"/> 198 <has_line_matching expression="^.*25\t1\t25\ttcaccgggtggaaactagcagtggc\tchrII:11534525-11540624\t25\t3060\t3084.*$"/>
171 </assert_contents> 199 </assert_contents>
172 </output> 200 </output>
173 </test> 201 </test>
202 <test>
203 <conditional name="input">
204 <param name="type" value="multiple"/>
205 <repeat name="reads_list">
206 <param name="sample_name" value="sa1"/>
207 <param name="reads" value="reads_sample1.fa"/>
208 </repeat>
209 <repeat name="reads_list">
210 <param name="sample_name" value="sa2"/>
211 <param name="reads" value="reads_sample2.fa"/>
212 </repeat>
213 </conditional>
214 <param name="remove_non_canon" value="True"/>
215 <param name="clip" value="true"/>
216 <param name="adapter_seq" value="TCGTATGCCGTCTTCTGCTTGT"/>
217 <param name="discard_short_reads" value="18"/>
218 <param name="collapse_map" value="collapse_and_map"/>
219 <param name="genomeSource" value="history"/>
220 <param name="ownFile" value="cel_cluster.fa"/>
221 <output name="output_reads_collapsed">
222 <assert_contents>
223 <has_text text=">sa1_220_x1"/>
224 <has_text text="TCACCGGGTGTACATCAGC"/>
225 <has_text text=">sa2_0_x250"/>
226 <has_text text="AATGACACTGGTTATCTTTTCCATCG"/>
227 </assert_contents>
228 </output>
229 <output name="output_mapping">
230 <assert_contents>
231 <has_line_matching expression="^.*22\t1\t22\ttcaccgggtggaaactagcagt\tchrII:11534525-11540624\t22\t3060\t3081.*$"/>
232 <has_line_matching expression="^.*21\t1\t21\ttcaccgggtggaaactagcag\tchrII:11534525-11540624\t21\t3060\t3080.*$"/>
233 <has_line_matching expression="^.*22\t1\t22\ttcaccgggtgtacatcagctaa\tchrII:11534525-11540624\t22\t3631\t3652.*$"/>
234 </assert_contents>
235 </output>
236 </test>
174 </tests> 237 </tests>
175 <help> 238 <help>
176 <![CDATA[ 239 <![CDATA[
177 **What it does** 240 **What it does**
178 241
179 The MiRDeep2 Mapper module is designed as a tool to process deep sequencing reads and/or map them to the reference genome. 242 The MiRDeep2 Mapper module is designed as a tool to process deep sequencing reads and/or map them to the reference genome.
180 The module works in sequence space, and can process or map data that is in sequence FASTA format. 243 The module works in sequence space, and can process or map data that is in sequence FASTA format.
181 A number of the functions of the mapper module are implemented specifically with Solexa/Illumina data in mind. 244 A number of the functions of the mapper module are implemented specifically with Solexa/Illumina data in mind.
182 245
183 **Input** 246 **Input**
184 247
185 Default input is a file in FASTA format, seq.txt or qseq.txt format. More input can be given depending on the options used. 248 Default input is a file in FASTA format, seq.txt or qseq.txt format. More input can be given depending on the options used.
186 249
187 **Output** 250 **Output**
188 251
189 The output depends on the options used. Either a FASTA file with processed reads or an arf file with with mapped reads, or both, are output. 252 The output depends on the options used. Either a FASTA file with processed reads or an arf file with with mapped reads, or both, are output.
190 253
191 Arf format: 254 Arf format:
192 Is a proprietary file format generated and processed by miRDeep2. It contains information of reads mapped to a reference genome. Each line in such a file contains 13 columns: 255 Is a proprietary file format generated and processed by miRDeep2. It contains information of reads mapped to a reference genome. Each line in such a file contains 13 columns:
193 256
194 1. read identifier 257 1. read identifier