Mercurial > repos > bgruening > repeat_masker
comparison repeatmasker.xml @ 4:04f5c3d7448e draft
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/repeat_masker commit cbba6947f1380751e1db3fa5b043af630523fd86
author | iuc |
---|---|
date | Fri, 04 May 2018 07:59:50 -0400 |
parents | bdfc22c1c3e3 |
children | 8404aa79a631 |
comparison
equal
deleted
inserted
replaced
3:bdfc22c1c3e3 | 4:04f5c3d7448e |
---|---|
1 <tool id="repeatmasker_wrapper" name="RepeatMasker" version="4.0.7" profile="17.01"> | 1 <tool id="repeatmasker_wrapper" name="RepeatMasker" version="4.0.7+galaxy1" profile="17.01"> |
2 <description>RepeatMasker</description> | 2 <description>RepeatMasker</description> |
3 | 3 |
4 <requirements> | 4 <requirements> |
5 <requirement type="package" version="4.0.7">repeatmasker</requirement> | 5 <requirement type="package" version="4.0.7">repeatmasker</requirement> |
6 </requirements> | 6 </requirements> |
9 RM_LIB_PATH=\$(dirname \$(which RepeatMasker))/../share/RepeatMasker/Libraries && | 9 RM_LIB_PATH=\$(dirname \$(which RepeatMasker))/../share/RepeatMasker/Libraries && |
10 mkdir lib && | 10 mkdir lib && |
11 export REPEATMASKER_LIB_DIR=\$(pwd)/lib && | 11 export REPEATMASKER_LIB_DIR=\$(pwd)/lib && |
12 for file in \$(ls \$RM_LIB_PATH) ; do ln -s \$RM_LIB_PATH/\$file lib/\$file ; done && | 12 for file in \$(ls \$RM_LIB_PATH) ; do ln -s \$RM_LIB_PATH/\$file lib/\$file ; done && |
13 #if $repeat_source.source_type == "repbase": | 13 #if $repeat_source.source_type == "repbase": |
14 cp '${repeat_source.repbase_file}' lib/RMRBSeqs.embl && | 14 cp '${repeat_source.repbase_file}' 'lib/${repeat_source.repbase_file_name}' && |
15 #end if | 15 #end if |
16 ln -s '${input_fasta}' rm_input.fasta && | 16 ln -s '${input_fasta}' rm_input.fasta && |
17 RepeatMasker -dir \$(pwd) | 17 RepeatMasker -dir \$(pwd) |
18 #if $repeat_source.source_type == "library": | 18 #if $repeat_source.source_type == "library": |
19 -lib '${repeat_source.repeat_lib}' | 19 -lib '${repeat_source.repeat_lib}' |
24 #else | 24 #else |
25 -species '${repeat_source.species_source.species_name}' | 25 -species '${repeat_source.species_source.species_name}' |
26 #end if | 26 #end if |
27 #end if | 27 #end if |
28 -parallel \${GALAXY_SLOTS:-1} | 28 -parallel \${GALAXY_SLOTS:-1} |
29 '${gff}' | 29 ${gff} |
30 '${ignore_n_stretches}' | 30 ${excln} |
31 '${advanced.is_only}' | 31 ${advanced.is_only} |
32 '${advanced.is_clip}' | 32 ${advanced.is_clip} |
33 '${advanced.no_is}' | 33 ${advanced.no_is} |
34 '${advanced.rodspec}' | 34 ${advanced.rodspec} |
35 '${advanced.primspec}' | 35 ${advanced.primspec} |
36 '${advanced.nolow}' | 36 ${advanced.nolow} |
37 '${advanced.noint}' | 37 ${advanced.noint} |
38 '${advanced.norna}' | 38 ${advanced.norna} |
39 '${advanced.alu}' | 39 ${advanced.alu} |
40 '${advanced.div}' | 40 ${advanced.div} |
41 '${advanced.search_speed}' | 41 ${advanced.search_speed} |
42 '${advanced.frag}' | 42 -frag ${advanced.frag} |
43 '${advanced.maxsize}' | 43 ## -maxsize ${advanced.maxsize} |
44 #if $advanced.gc is not None: | 44 #if str($advanced.gc): |
45 '${advanced.gc}' | 45 -gc ${advanced.gc} |
46 #end if | 46 #end if |
47 '${advanced.gccalc}' | 47 ${advanced.gccalc} |
48 '${advanced.nocut}' | 48 ${advanced.nocut} |
49 '${advanced.keep_alignments}' | 49 ${advanced.keep_alignments} |
50 '${advanced.invert_alignments}' | 50 ${advanced.invert_alignments} |
51 '${advanced.xout}' | 51 ${advanced.xout} |
52 '${advanced.xsmall}' | 52 ${advanced.xsmall} |
53 '${advanced.poly}' | 53 ${advanced.poly} |
54 rm_input.fasta && | 54 rm_input.fasta && |
55 #if $advanced.is_only != '-is_only': | 55 #if $advanced.is_only != '-is_only': |
56 mv rm_input.fasta.masked '${output_masked_genome}' && | 56 mv rm_input.fasta.masked '${output_masked_genome}' && |
57 sed -r 's/^ *// ; s/ *$//; s/\+ //; s/ +/\t/g ; 1,2c SW score\t% div.\t% del.\t% ins.\tquery sequence\tpos in query: begin\tend\t(left)\trepeat\tclass/family\tpos in repeat: begin\tend\t(left)\tID' rm_input.fasta.out >'${output_log}' && | 57 sed -r 's/^ *// ; s/ *$//; s/\+ //; s/ +/\t/g ; 1,2c SW score\t% div.\t% del.\t% ins.\tquery sequence\tpos in query: begin\tend\t(left)\trepeat\tclass/family\tpos in repeat: begin\tend\t(left)\tID' rm_input.fasta.out >'${output_log}' && |
58 mv rm_input.fasta.tbl '${output_table}' && | 58 mv rm_input.fasta.tbl '${output_table}' && |
77 <option selected="true" value="repbase">RepBase</option> | 77 <option selected="true" value="repbase">RepBase</option> |
78 <option value="library">Custom library of repeats</option> | 78 <option value="library">Custom library of repeats</option> |
79 </param> | 79 </param> |
80 <when value="repbase"> | 80 <when value="repbase"> |
81 <param name="repbase_file" type="data" format="embl" label="RepBase (RMRBSeqs.embl) file" /> | 81 <param name="repbase_file" type="data" format="embl" label="RepBase (RMRBSeqs.embl) file" /> |
82 <param name="repbase_file_name" type="hidden" value="RMRBSeqs.embl"/> <!-- This is an ugly hack to allow testing with a fake repbase --> | |
82 <conditional name="species_source"> | 83 <conditional name="species_source"> |
83 <param label="Select species name from a list?" name="species_from_list" type="select"> | 84 <param label="Select species name from a list?" name="species_from_list" type="select"> |
84 <option value="yes" selected="true">Yes</option> | 85 <option value="yes" selected="true">Yes</option> |
85 <option value="no">No</option> | 86 <option value="no">No</option> |
86 </param> | 87 </param> |
124 <param name="repeat_lib" type="data" format="fasta" label="Custom library of repeats" /> | 125 <param name="repeat_lib" type="data" format="fasta" label="Custom library of repeats" /> |
125 <param name="cutoff" type="integer" argument="-cutoff" value="225" label="Cutoff score for masking repeats" /> | 126 <param name="cutoff" type="integer" argument="-cutoff" value="225" label="Cutoff score for masking repeats" /> |
126 </when> | 127 </when> |
127 </conditional> | 128 </conditional> |
128 <param type="boolean" argument="-gff" truevalue="-gff" falsevalue="" label="Output annotation of repeats in GFF format" checked="false" /> | 129 <param type="boolean" argument="-gff" truevalue="-gff" falsevalue="" label="Output annotation of repeats in GFF format" checked="false" /> |
129 <param name="ignore_n_stretches" type="boolean" argument="-excln" falsevalue="" label="Ignore stretches of Ns when computing statistics" checked="true" help="Scaffolds are sometimes joined with stretches of 25 or more Ns. This option ignores them when calculating repeat statistics" /> | 130 <param argument="-excln" type="boolean" truevalue="-excln" falsevalue="" label="Ignore stretches of Ns when computing statistics" checked="true" help="Scaffolds are sometimes joined with stretches of 25 or more Ns. This option ignores them when calculating repeat statistics" /> |
130 <section name="advanced" title="Advanced options" expanded="false"> | 131 <section name="advanced" title="Advanced options" expanded="false"> |
131 <param argument="-is_only" type="boolean" truevalue="-is_only" falsevalue="" checked="false" label="Only clip E coli insertion elements" /> | 132 <param argument="-is_only" type="boolean" truevalue="-is_only" falsevalue="" checked="false" label="Only clip E coli insertion elements" /> |
132 <param argument="-is_clip" type="boolean" truevalue="-is_clip" falsevalue="" checked="false" label="Clip IS elements before analysis" help="Normally RepeatMasker will report on IS element, with this option selected it will clip them before analysis" /> | 133 <param argument="-is_clip" type="boolean" truevalue="-is_clip" falsevalue="" checked="false" label="Clip IS elements before analysis" help="Normally RepeatMasker will report on IS element, with this option selected it will clip them before analysis" /> |
133 <param argument="-no_is" type="boolean" truevalue="-no_is" falsevalue="" checked="false" label="Skip bacterial insertion element check" /> | 134 <param argument="-no_is" type="boolean" truevalue="-no_is" falsevalue="" checked="false" label="Skip bacterial insertion element check" /> |
134 <param argument="-rodspec" type="boolean" truevalue="-rodspec" falsevalue="" checked="false" label="Only check for rodent specific repeats" help="If this option is select a check for rodent specific repeats is done instead of a full RepeatMasker run" /> | 135 <param argument="-rodspec" type="boolean" truevalue="-rodspec" falsevalue="" checked="false" label="Only check for rodent specific repeats" help="If this option is select a check for rodent specific repeats is done instead of a full RepeatMasker run" /> |
143 <option value="-q">Quick (5-10% less sensitive, 3-4 times speedup)</option> | 144 <option value="-q">Quick (5-10% less sensitive, 3-4 times speedup)</option> |
144 <option value="-qq">Rush (10% less sensitive)</option> | 145 <option value="-qq">Rush (10% less sensitive)</option> |
145 <option value="-s">Slow (0-5% more sensitive, 2.5 times slowdown)</option> | 146 <option value="-s">Slow (0-5% more sensitive, 2.5 times slowdown)</option> |
146 </param> | 147 </param> |
147 <param type="integer" argument="-frag" value="40000" label="Maximum contiguous sequence searched" help="Maximum length of sequencing that is search without fragmenting" /> | 148 <param type="integer" argument="-frag" value="40000" label="Maximum contiguous sequence searched" help="Maximum length of sequencing that is search without fragmenting" /> |
148 <param type="integer" argument="-maxsize" value="4000000" label="Maximum length for IS or repeat clipped sequences" /> | 149 <!-- -maxsize option is in the help, but not in the code of repeatmasker--> |
149 <param type="integer" argument="-gc" optional="True" label="Select matrices for this GC%" help="Valid values are a percentage or -1 to choose the default" /> | 150 <!--param type="integer" argument="-maxsize" value="4000000" label="Maximum length for IS or repeat clipped sequences" /--> |
151 <param type="integer" argument="-gc" optional="true" label="Select matrices for this GC%" help="Valid values are a percentage or -1 to choose the default" /> | |
150 <param type="boolean" argument="-gccalc" truevalue="-gcccalc" falsevalue="" checked="false" label="Calculate GC % for all sequences" help="By default RepeatMasker skips calculating GC % for small sequences" /> | 152 <param type="boolean" argument="-gccalc" truevalue="-gcccalc" falsevalue="" checked="false" label="Calculate GC % for all sequences" help="By default RepeatMasker skips calculating GC % for small sequences" /> |
151 <param type="boolean" argument="-nocut" truevalue="-nocut" falsevalue="" checked="false" label="Skips cutting of repeats" /> | 153 <param type="boolean" argument="-nocut" truevalue="-nocut" falsevalue="" checked="false" label="Skips cutting of repeats" /> |
152 <param name="xout" type="boolean" argument="-x" truevalue="-x" falsevalue="" checked="false" label="Mask with X instead of N characters" /> | 154 <param name="xout" type="boolean" argument="-x" truevalue="-x" falsevalue="" checked="false" label="Mask with X instead of N characters" /> |
153 <param name="keep_alignments" type="boolean" argument="-ali" truevalue="-ali" falsevalue="" checked="false" label="Output alignments file" /> | 155 <param name="keep_alignments" type="boolean" argument="-ali" truevalue="-ali" falsevalue="" checked="false" label="Output alignments file" /> |
154 <param name="invert_alignments" type="boolean" argument="-inv" truevalue="-inv" falsevalue="" checked="false" label="Invert alignments in alignment file" help="Show alignments in the orientation of the repeat sequence, not the query sequence" /> | 156 <param name="invert_alignments" type="boolean" argument="-inv" truevalue="-inv" falsevalue="" checked="false" label="Invert alignments in alignment file" help="Show alignments in the orientation of the repeat sequence, not the query sequence" /> |
201 <output name="output_log" file="small.fasta.log" /> | 203 <output name="output_log" file="small.fasta.log" /> |
202 <output name="output_alignment" file="small.fasta.align" /> | 204 <output name="output_alignment" file="small.fasta.align" /> |
203 <output name="output_polymorphic" file="small.fasta.poly" /> | 205 <output name="output_polymorphic" file="small.fasta.poly" /> |
204 <output name="output_gff" file="small.fasta.gff" lines_diff="4" /> | 206 <output name="output_gff" file="small.fasta.gff" lines_diff="4" /> |
205 </test> | 207 </test> |
208 <test expect_num_outputs="4"> | |
209 <param name="input_fasta" value="small.fasta" ftype="fasta" /> | |
210 <param name="source_type" value="repbase" /> | |
211 <param name="repbase_file" value="fake_repbase.embl" /> | |
212 <param name="repbase_file_name" value="fake.embl" /> | |
213 <param name="species_list" value="anopheles" /> | |
214 <output name="output_masked_genome" file="small.fasta.masked" /> | |
215 <output name="output_table" file="small_repbase.fasta.stats" lines_diff="2" /> | |
216 <output name="output_repeat_catalog" file="small.fasta.cat" /> | |
217 <output name="output_log" file="small_repbase.fasta.log" /> | |
218 </test> | |
206 </tests> | 219 </tests> |
207 <help><![CDATA[ | 220 <help><![CDATA[ |
208 RepeatMasker is a program that screens DNA for interspersed repeats and low | 221 RepeatMasker is a program that screens DNA for interspersed repeats and low |
209 complexity DNA sequences. The database of repeats to screen for can be | 222 complexity DNA sequences. The database of repeats to screen for can be |
210 provided as a FASTA file or downloaded from RepBase_. If the RepBase option is | 223 provided as a FASTA file or downloaded from RepBase_. If the RepBase option is |