Mercurial > repos > bgruening > repeat_masker
comparison repeatmasker.xml @ 10:bfc70c8cc5ca draft
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/repeat_masker commit 69abffb867af7c4329eaa513201bd6626ac39cbf"
author | iuc |
---|---|
date | Fri, 11 Dec 2020 22:26:02 +0000 |
parents | 438f65cb1d14 |
children | 72aade318318 |
comparison
equal
deleted
inserted
replaced
9:438f65cb1d14 | 10:bfc70c8cc5ca |
---|---|
1 <tool id="repeatmasker_wrapper" name="RepeatMasker" version="4.0.9" profile="17.01"> | 1 <tool id="repeatmasker_wrapper" name="RepeatMasker" version="4.1.1" profile="17.01"> |
2 <description>screen DNA sequences for interspersed repeats and low complexity regions</description> | 2 <description>screen DNA sequences for interspersed repeats and low complexity regions</description> |
3 | 3 |
4 <requirements> | 4 <requirements> |
5 <requirement type="package" version="4.0.9_p2">repeatmasker</requirement> | 5 <requirement type="package" version="4.1.1">repeatmasker</requirement> |
6 </requirements> | 6 </requirements> |
7 | 7 |
8 <command detect_errors="exit_code"><![CDATA[ | 8 <command detect_errors="exit_code"><![CDATA[ |
9 RM_PATH=\$(which RepeatMasker) && | 9 RM_PATH=\$(which RepeatMasker) && |
10 if [ -z "\$RM_PATH" ] ; then echo "Failed to find RepeatMasker in PATH (\$PATH)" >&2 ; exit 1 ; fi && | 10 if [ -z "\$RM_PATH" ] ; then echo "Failed to find RepeatMasker in PATH (\$PATH)" >&2 ; exit 1 ; fi && |
11 | |
11 RM_LIB_PATH=\$(dirname \$RM_PATH)/../share/RepeatMasker/Libraries && | 12 RM_LIB_PATH=\$(dirname \$RM_PATH)/../share/RepeatMasker/Libraries && |
12 mkdir lib && | 13 #if $repeat_source.source_type == "dfam_up": |
13 export REPEATMASKER_LIB_DIR=\$(pwd)/lib && | 14 mkdir lib/ && |
14 for file in \$(ls \$RM_LIB_PATH) ; do ln -s \$RM_LIB_PATH/\$file lib/\$file ; done && | 15 ln -s '${repeat_source.dfam_lib}' lib/RepeatMaskerLib.h5 && |
15 #if $repeat_source.source_type == "repbase": | 16 RM_LIB_PATH=\$(pwd)/lib && |
16 cp '${repeat_source.repbase_file}' 'lib/${repeat_source.repbase_file_name}' && | 17 #end if |
17 #end if | 18 |
18 ln -s '${input_fasta}' rm_input.fasta && | 19 ln -s '${input_fasta}' rm_input.fasta && |
20 | |
19 RepeatMasker -dir \$(pwd) | 21 RepeatMasker -dir \$(pwd) |
22 -libdir \$RM_LIB_PATH | |
20 #if $repeat_source.source_type == "library": | 23 #if $repeat_source.source_type == "library": |
21 -lib '${repeat_source.repeat_lib}' | 24 -lib '${repeat_source.repeat_lib}' |
22 -cutoff '${repeat_source.cutoff}' | 25 -cutoff '${repeat_source.cutoff}' |
23 #else if $repeat_source.source_type == "repbase": | 26 #else if $repeat_source.source_type == "dfam": |
24 #if $repeat_source.species_source.species_from_list == 'yes': | 27 #if $repeat_source.species_source.species_from_list == 'yes': |
25 $repeat_source.species_source.species_list | 28 -species $repeat_source.species_source.species_list |
26 #else | 29 #else |
27 -species '${repeat_source.species_source.species_name}' | 30 -species '${repeat_source.species_source.species_name}' |
28 #end if | 31 #end if |
32 #else if $repeat_source.source_type == "dfam_up": | |
33 -species '${repeat_source.species_name}' | |
29 #end if | 34 #end if |
30 -parallel \${GALAXY_SLOTS:-1} | 35 -parallel \${GALAXY_SLOTS:-1} |
31 ${gff} | 36 ${gff} |
32 ${excln} | 37 ${excln} |
33 ${advanced.is_only} | 38 ${advanced.is_only} |
77 </command> | 82 </command> |
78 | 83 |
79 <inputs> | 84 <inputs> |
80 <param name="input_fasta" type="data" format="fasta" label="Genomic DNA" /> | 85 <param name="input_fasta" type="data" format="fasta" label="Genomic DNA" /> |
81 <conditional name="repeat_source"> | 86 <conditional name="repeat_source"> |
82 <param label="Repeat library source" name="source_type" type="select"> | 87 <param label="Repeat library source" name="source_type" type="select" help="To use RepBase, choose 'Custom library of repeats' and select a fasta version of this non-free database."> |
83 <option selected="true" value="repbase">RepBase</option> | 88 <option selected="true" value="dfam">DFam (curated only, bundled with RepeatMasker)</option> |
89 <option value="dfam_up">DFam (full/specific version)</option> | |
84 <option value="library">Custom library of repeats</option> | 90 <option value="library">Custom library of repeats</option> |
85 </param> | 91 </param> |
86 <when value="repbase"> | 92 <when value="dfam"> |
87 <param name="repbase_file" type="data" format="embl" label="RepBase (RMRBSeqs.embl) file" /> | |
88 <param name="repbase_file_name" type="hidden" value="RMRBSeqs.embl"/> <!-- This is an ugly hack to allow testing with a fake repbase --> | |
89 <conditional name="species_source"> | 93 <conditional name="species_source"> |
90 <param label="Select species name from a list?" name="species_from_list" type="select"> | 94 <param label="Select species name from a list?" name="species_from_list" type="select"> |
91 <option value="yes" selected="true">Yes</option> | 95 <option value="yes" selected="true">Yes</option> |
92 <option value="no">No</option> | 96 <option value="no">No</option> |
93 </param> | 97 </param> |
94 <when value="yes"> | 98 <when value="yes"> |
95 <param name="species_list" type="select" label="Species"> | 99 <param name="species_list" type="select" label="Species"> |
96 <option value="-species anopheles" selected="true">anopheles</option> | 100 <option value="vertebrate">Vertebrate (other than below)</option> |
97 <option value="-species arabidopsis">arabidopsis</option> | 101 <option value="mammal">Mammal (other than below)</option> |
98 <option value="-species artiodactyl">artiodactyl</option> | 102 <option value="human" selected="true">Human</option> |
99 <option value="-species aspergillus">aspergillus</option> | 103 <option value="rodent">Rodent</option> |
100 <option value="-species carnivore">carnivore</option> | 104 <option value="mouse">Mouse</option> |
101 <option value="-species cat">cat</option> | 105 <option value="rat">Rat</option> |
102 <option value="-species chicken">chicken</option> | 106 <option value="danio">Danio (zebra fish)</option> |
103 <option value="-species 'ciona intestinalis'">ciona intestinalis</option> | 107 <option value="drosophila">Fruit fly (Drosophila melanogaster)</option> |
104 <option value="-species 'ciona savignyi'">ciona savignyi</option> | 108 <option value="elegans">Caenorhabditis elegans (nematode)</option> |
105 <option value="-species cow">cow</option> | |
106 <option value="-species danio">danio</option> | |
107 <option value="-species diatoaea">diatomea</option> | |
108 <option value="-species dog">dog</option> | |
109 <option value="-species drosophila">drosophila</option> | |
110 <option value="-species elegans">elegans</option> | |
111 <option value="-species fugu">fugu</option> | |
112 <option value="-species fungi" selected="true">fungi</option> | |
113 <option value="-species human">human</option> | |
114 <option value="-species maize">maize</option> | |
115 <option value="-species mammal">mammal</option> | |
116 <option value="-species mouse">mouse</option> | |
117 <option value="-species pig">pig</option> | |
118 <option value="-species rat">rat</option> | |
119 <option value="-species rice">rice</option> | |
120 <option value="-species rodentia">rodentia</option> | |
121 <option value="-species ruminantia">ruminantia</option> | |
122 <option value="-species wheat">wheat</option> | |
123 </param> | 109 </param> |
124 </when> | 110 </when> |
125 <when value="no"> | 111 <when value="no"> |
126 <param name="species_name" type="text" value="homo sapiens" label="Repeat source species" help="Source species (or clade name) used to select repeats from RepBase" /> | 112 <param name="species_name" type="text" value="human" label="Repeat source species" help="Source species (or clade name) used to select repeats from DFam" /> |
127 </when> | 113 </when> |
128 </conditional> | 114 </conditional> |
115 </when> | |
116 <when value="dfam_up"> | |
117 <param name="dfam_lib" type="data" format="h5" label="DFam library" help="The full DFam library can be downloaded from https://www.dfam.org/releases/current/families/Dfam.h5.gz" /> | |
118 <param name="species_name" type="text" value="human" label="Repeat source species" help="Source species (or clade name) used to select repeats from DFam" /> | |
129 </when> | 119 </when> |
130 <when value="library"> | 120 <when value="library"> |
131 <param name="repeat_lib" type="data" format="fasta" label="Custom library of repeats" /> | 121 <param name="repeat_lib" type="data" format="fasta" label="Custom library of repeats" /> |
132 <param name="cutoff" type="integer" argument="-cutoff" value="225" label="Cutoff score for masking repeats" /> | 122 <param name="cutoff" type="integer" argument="-cutoff" value="225" label="Cutoff score for masking repeats" /> |
133 </when> | 123 </when> |
197 </test> | 187 </test> |
198 <test expect_num_outputs="7"> | 188 <test expect_num_outputs="7"> |
199 <param name="input_fasta" value="small.fasta" ftype="fasta" /> | 189 <param name="input_fasta" value="small.fasta" ftype="fasta" /> |
200 <param name="source_type" value="library" /> | 190 <param name="source_type" value="library" /> |
201 <param name="gff" value="-gff" /> | 191 <param name="gff" value="-gff" /> |
202 <!-- <param name="show" value="yes" /> --> | |
203 <param name="keep_alignments" value="-ali" /> | 192 <param name="keep_alignments" value="-ali" /> |
204 <param name="poly" value="-poly" /> | 193 <param name="poly" value="-poly" /> |
205 <param name="repeat_lib" value="repeats.fasta" ftype="fasta" /> | 194 <param name="repeat_lib" value="repeats.fasta" ftype="fasta" /> |
206 <output name="output_masked_genome" file="small.fasta.masked" /> | 195 <output name="output_masked_genome" file="small.fasta.masked" /> |
207 <output name="output_table" file="small.fasta.stats" lines_diff="6" /> | 196 <output name="output_table" file="small.fasta.stats" lines_diff="6" /> |
211 <output name="output_polymorphic" file="small.fasta.poly" /> | 200 <output name="output_polymorphic" file="small.fasta.poly" /> |
212 <output name="output_gff" file="small.fasta.gff" lines_diff="4" /> | 201 <output name="output_gff" file="small.fasta.gff" lines_diff="4" /> |
213 </test> | 202 </test> |
214 <test expect_num_outputs="4"> | 203 <test expect_num_outputs="4"> |
215 <param name="input_fasta" value="small.fasta" ftype="fasta" /> | 204 <param name="input_fasta" value="small.fasta" ftype="fasta" /> |
216 <param name="source_type" value="repbase" /> | 205 <param name="source_type" value="dfam" /> |
217 <param name="repbase_file" value="fake_repbase.embl" /> | 206 <param name="species_list" value="human" /> |
218 <param name="repbase_file_name" value="fake.embl" /> | 207 <output name="output_masked_genome" file="small_dfam.fasta.masked" /> |
219 <param name="species_list" value="anopheles" /> | 208 <output name="output_table" file="small_dfam.fasta.stats" lines_diff="2" /> |
220 <output name="output_masked_genome" file="small.fasta.masked" /> | 209 <output name="output_repeat_catalog" file="small_dfam.fasta.cat" lines_diff="2" /> |
221 <output name="output_table" file="small_repbase.fasta.stats" lines_diff="2" /> | 210 <output name="output_log" file="small_dfam.fasta.log" lines_diff="2"/> |
222 <output name="output_repeat_catalog" file="small.fasta.cat" lines_diff="2" /> | 211 </test> |
223 <output name="output_log" file="small_repbase.fasta.log" lines_diff="2"/> | 212 <test expect_num_outputs="4"> |
213 <param name="input_fasta" value="small.fasta" ftype="fasta" /> | |
214 <param name="source_type" value="dfam_up" /> | |
215 <param name="dfam_lib" value="Dfam_partial_test.h5" ftype="h5" /> | |
216 <param name="species_name" value="rodent" /> | |
217 <output name="output_masked_genome" file="small_dfam_up.fasta.masked" /> | |
218 <output name="output_table" file="small_dfam_up.fasta.stats" lines_diff="2" /> | |
219 <output name="output_repeat_catalog" file="small_dfam_up.fasta.cat" lines_diff="2" /> | |
220 <output name="output_log" file="small_dfam_up.fasta.log" lines_diff="2"/> | |
224 </test> | 221 </test> |
225 </tests> | 222 </tests> |
226 <help><![CDATA[ | 223 <help><![CDATA[ |
227 RepeatMasker is a program that screens DNA for interspersed repeats and low | 224 RepeatMasker is a program that screens DNA for interspersed repeats and low |
228 complexity DNA sequences. The database of repeats to screen for can be | 225 complexity DNA sequences. The database of repeats to screen for can be |