comparison roary.xml @ 4:809e42326fc2 draft

"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/roary commit d2e1ee6304af1062175ca87aab59c4042ace3116"
author iuc
date Thu, 14 Nov 2019 03:51:08 -0500
parents 15ca041134a9
children dbe2b2204555
comparison
equal deleted inserted replaced
3:15ca041134a9 4:809e42326fc2
1 <tool id="roary" name="Roary" version="3.12.0+galaxy0"> 1 <tool id="roary" name="Roary" version="3.12.0+galaxy0">
2 <description>the pangenome pipeline - Quickly generate a core gene alignment from gff3 files</description> 2 <description>the pangenome pipeline - Quickly generate a core gene alignment from gff3 files</description>
3 3
4 <requirements> 4 <requirements>
5 <requirement type="package" version="3.12.0">roary</requirement> 5 <requirement type="package" version="3.12.0">roary</requirement>
6 </requirements> 6 </requirements>
7 7
8 <command detect_errors="exit_code"><![CDATA[ 8 <command detect_errors="exit_code"><![CDATA[
9 9 #set $filenames = list()
10 #for $gff in $gff_input.gffs 10 #for $gff in $gff_input.gffs
11 cp $gff '${gff.element_identifier}'.gff && 11 cp '$gff' '${gff.element_identifier}.gff' &&
12 #set $filename = str($gff.element_identifier) + '.gff'
13 $filenames.append(str($filename))
12 #end for 14 #end for
13 15
14 roary 16 roary
15 -f out 17 -f out
16 -p \${GALAXY_SLOTS:-1} 18 -p \${GALAXY_SLOTS:-1}
21 -g '$advanced.maxclust' 23 -g '$advanced.maxclust'
22 $advanced.split_para 24 $advanced.split_para
23 -t '$advanced.trans_tab' 25 -t '$advanced.trans_tab'
24 -iv '$advanced.mcl' 26 -iv '$advanced.mcl'
25 27
26 *.gff 28 #for $f in $filenames
27 29 '$f'
30 #end for
31
28 ]]></command> 32 ]]></command>
29 33
30 <inputs> 34 <inputs>
31 <conditional name="gff_input"> 35 <conditional name="gff_input">
32 <param name="gff_input_selector" type="select" label="Individual gff files or a dataset collection" help="Select between individual gff files or a collection of gff files"> 36 <param name="gff_input_selector" type="select" label="Individual gff files or a dataset collection" help="Select between individual gff files or a collection of gff files">
33 <option value="individual">Individual</option> 37 <option value="individual">Individual</option>
34 <option value="collection">Collection</option> 38 <option value="collection">Collection</option>
40 <param name="gffs" type="data_collection" collection_type="list" format="gff,gff3" label="Dataset collection to submit to Roary" help="A dataset list collection of gff3 files to send to Roary for analysis." /> 44 <param name="gffs" type="data_collection" collection_type="list" format="gff,gff3" label="Dataset collection to submit to Roary" help="A dataset list collection of gff3 files to send to Roary for analysis." />
41 </when> 45 </when>
42 </conditional> 46 </conditional>
43 <param name="percent_ident" type="integer" label="minimum percentage identity for blastp" help="Sets the minimum percentage identity for protein matches" value="95"/> 47 <param name="percent_ident" type="integer" label="minimum percentage identity for blastp" help="Sets the minimum percentage identity for protein matches" value="95"/>
44 <param name="core_diff" type="float" label="percentage of isolates a gene must be in to be core" help="The total percentage of the isolates that must have the gene for it to be considered a core gene." value="99.0"/> 48 <param name="core_diff" type="float" label="percentage of isolates a gene must be in to be core" help="The total percentage of the isolates that must have the gene for it to be considered a core gene." value="99.0"/>
45 49
46 <param name="outputs" type="select" multiple="true" display="checkboxes" label="Additional outputs" help="Summary statistics, core gene alignments and Gene Presence/Absence tables are always produced."> 50 <param name="outputs" type="select" multiple="true" display="checkboxes" label="Additional outputs" help="Summary statistics, core gene alignments and Gene Presence/Absence tables are always produced.">
47 <option value="abg_nw">Accessory binary genes in newick format</option> 51 <option value="abg_nw">Accessory binary genes in newick format</option>
48 <option value="abg_fa">Accessory binary genes in fasta format</option> 52 <option value="abg_fa">Accessory binary genes in fasta format</option>
49 <option value="accgraph">Accessory graph in dot format</option> 53 <option value="accgraph">Accessory graph in dot format</option>
50 <option value="acchead_embl">Accessory header file in embl format</option> 54 <option value="acchead_embl">Accessory header file in embl format</option>
58 <option value="numcons_rtab">Number of Conserved Genes in Rtab format</option> 62 <option value="numcons_rtab">Number of Conserved Genes in Rtab format</option>
59 <option value="numpangene_rtab">Number of Genes in Pan Genome in Rtab format</option> 63 <option value="numpangene_rtab">Number of Genes in Pan Genome in Rtab format</option>
60 <option value="numnew_rtab">Number of New Genes in Rtab format</option> 64 <option value="numnew_rtab">Number of New Genes in Rtab format</option>
61 <option value="numuniq_rtab">Number of Unique Genes in Rtab format</option> 65 <option value="numuniq_rtab">Number of Unique Genes in Rtab format</option>
62 </param> 66 </param>
63 67
64 <section name="advanced" title="Advanced options" expanded="false"> 68 <section name="advanced" title="Advanced options" expanded="false">
65 <param name="maxclust" type="integer" value="50000" label="Maximum number of clusters" help="The maximum number of clusters to assign proteins" /> 69 <param name="maxclust" type="integer" value="50000" label="Maximum number of clusters" help="The maximum number of clusters to assign proteins" />
66 <param name="split_para" type="boolean" checked="False" truevalue="-s" falsevalue="" label="Don't split paralogs" help="Click yes so that paralogs aren't split."/> 70 <param name="split_para" type="boolean" checked="False" truevalue="-s" falsevalue="" label="Don't split paralogs" help="Click yes so that paralogs aren't split."/>
67 <param name="trans_tab" type="integer" value="11" label="Translation table to use [1 or 4 or 11]" help="DNA -> RNA translation table to use. Roary is designed for prokaryotes and so tables 1, 4 or 11 will work, others could be problematic." /> 71 <param name="trans_tab" type="integer" value="11" label="Translation table to use [1 or 4 or 11]" help="DNA -> RNA translation table to use. Roary is designed for prokaryotes and so tables 1, 4 or 11 will work, others could be problematic." />
68 <param name="mcl" type="float" value="1.5" label="MCL inflation value" help="This is an advanced setting, change only if you know what you are doing and then at your own risk!" /> 72 <param name="mcl" type="float" value="1.5" label="MCL inflation value" help="This is an advanced setting, change only if you know what you are doing and then at your own risk!" />
69 </section> 73 </section>
70 74
71 </inputs> 75 </inputs>
72 76
73 <outputs> 77 <outputs>
74 <data format="tabular" name="sumstats" label="${tool.name} on ${on_string} Summary statistics" from_work_dir="out/summary_statistics.txt" /> 78 <data format="tabular" name="sumstats" label="${tool.name} on ${on_string} Summary statistics" from_work_dir="out/summary_statistics.txt" />
75 <data format="fasta" name="core_gene_aln" label="${tool.name} on ${on_string} Core Gene Alignment" from_work_dir="out/core_gene_alignment.aln" /> 79 <data format="fasta" name="core_gene_aln" label="${tool.name} on ${on_string} Core Gene Alignment" from_work_dir="out/core_gene_alignment.aln" />
76 <data format="csv" name="gene_p_a" label="${tool.name} on ${on_string} Gene Presence Absence" from_work_dir="out/gene_presence_absence.csv" /> 80 <data format="csv" name="gene_p_a" label="${tool.name} on ${on_string} Gene Presence Absence" from_work_dir="out/gene_presence_absence.csv" />
77 <data format="fasta" name="acc_bin" label="${tool.name} on ${on_string} Accessory Binary Genes" from_work_dir="out/accessory_binary_genes.fa" > 81 <data format="fasta" name="acc_bin" label="${tool.name} on ${on_string} Accessory Binary Genes" from_work_dir="out/accessory_binary_genes.fa" >
118 </data> 122 </data>
119 <data format="txt" name="num_uniq_rtab" label="${tool.name} on ${on_string} Number of Unique Genes" from_work_dir="out/number_of_unique_genes.Rtab" > 123 <data format="txt" name="num_uniq_rtab" label="${tool.name} on ${on_string} Number of Unique Genes" from_work_dir="out/number_of_unique_genes.Rtab" >
120 <filter>outputs and 'numuniq_rtab' in outputs</filter> 124 <filter>outputs and 'numuniq_rtab' in outputs</filter>
121 </data> 125 </data>
122 </outputs> 126 </outputs>
123 127
124 <tests> 128 <tests>
125 <test> 129 <test>
126 <param name="gff_input_selector" value="individual"/> 130 <param name="gff_input_selector" value="individual"/>
127 <param name="gffs" value="ex1.gff,ex2.gff" ftype="gff3"/> 131 <param name="gffs" value="ex1.gff,ex2.gff" ftype="gff3"/>
128 <output name="sumstats" file="out/summary_statistics.txt" ftype="tabular"/> 132 <output name="sumstats" file="out/summary_statistics.txt" ftype="tabular"/>
133 <param name="percent_ident" value="50"/> 137 <param name="percent_ident" value="50"/>
134 <param name="core_diff" value="50.0"/> 138 <param name="core_diff" value="50.0"/>
135 <output name="sumstats" file="test2/summary_statistics.txt" ftype="tabular"/> 139 <output name="sumstats" file="test2/summary_statistics.txt" ftype="tabular"/>
136 </test> 140 </test>
137 </tests> 141 </tests>
138 142
139 <help><![CDATA[ 143 <help><![CDATA[
140 **Roary** 144 **Roary**
141 145
142 Roary is a high speed stand alone pan genome pipeline, which takes annotated assemblies in GFF3 format (produced by Prokka) and calculates the pan genome. Using a standard desktop PC, it can analyse datasets with thousands of samples, something which is computationally infeasible with existing methods, without compromising the quality of the results. 128 samples can be analysed in under 1 hour using 1 GB of RAM and a single processor. To perform this analysis using existing methods would take weeks and hundreds of GB of RAM. 146 Roary is a high speed stand alone pan genome pipeline, which takes annotated assemblies in GFF3 format (produced by Prokka) and calculates the pan genome. Using a standard desktop PC, it can analyse datasets with thousands of samples, something which is computationally infeasible with existing methods, without compromising the quality of the results. 128 samples can be analysed in under 1 hour using 1 GB of RAM and a single processor. To perform this analysis using existing methods would take weeks and hundreds of GB of RAM.
143 147
144 To use Roary, select two or more gff3 files OR a collection of gff3 files 148 To use Roary, select two or more gff3 files OR a collection of gff3 files
145 149
146 **Options**: 150 **Options**:
147 151
148 152
149 - Minimum percentage identity for blastp - an integer, default is [95] 153 - Minimum percentage identity for blastp - an integer, default is [95]
150 154
151 155
152 - Percentage of isolates a gene must be in to be core - a float, default is [99.0] 156 - Percentage of isolates a gene must be in to be core - a float, default is [99.0]
153 157
154 158
155 **Advanced Options**: 159 **Advanced Options**:
156 160
157 - Maximum number of clusters - integer, default is [50000] 161 - Maximum number of clusters - integer, default is [50000]
158 162
159 163
160 - Don't split paralogs - check box 164 - Don't split paralogs - check box
161 165
162 166
163 - Translation table - which translation table to use, an integer, default is [11] 167 - Translation table - which translation table to use, an integer, default is [11]
164 168
165 169
166 - Change the MCL inflation value - a float, default is [1.5] 170 - Change the MCL inflation value - a float, default is [1.5]
167 171
168 172
169 For further info see: http://sanger-pathogens.github.io/Roary/ 173 For further info see: http://sanger-pathogens.github.io/Roary/
170 174
171 ]]></help> 175 ]]></help>
172 176
173 <citations> 177 <citations>
174 <citation type="doi">10.1093/bioinformatics/btv421</citation> 178 <citation type="doi">10.1093/bioinformatics/btv421</citation>
175 </citations> 179 </citations>
176 180
177 </tool> 181 </tool>