Mercurial > repos > bgruening > glimmer_knowledge_based
comparison glimmer_w_icm.xml @ 0:9b2e283dc3b5 draft
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/glimmer commit 37388949e348d221170659bbee547bf4ac67ef1a
author | bgruening |
---|---|
date | Tue, 28 Nov 2017 10:10:55 -0500 |
parents | |
children | ce89c473666d |
comparison
equal
deleted
inserted
replaced
-1:000000000000 | 0:9b2e283dc3b5 |
---|---|
1 <tool id="glimmer_knowledge_based" name="Glimmer3" version="@WRAPPER_VERSION@"> | |
2 <description>Predict ORFs in prokaryotic genomes (knowlegde-based)</description> | |
3 <macros> | |
4 <import>macros.xml</import> | |
5 </macros> | |
6 <expand macro="requirements"/> | |
7 <command detect_errors="aggressive"><![CDATA[ | |
8 glimmer3 | |
9 --max_olap $max_olap | |
10 --gene_len $gene_len | |
11 --threshold $threshold | |
12 #if float( str($gc_percent) ) > 0.0: | |
13 --gc_percent $gc_percent | |
14 #end if | |
15 | |
16 #if $stop_codon_opts.stop_codon_opts_selector == "gb": | |
17 --trans_table '${stop_codon_opts.genbank_gencode}' | |
18 #else: | |
19 --stop_codons '${stop_codon_opts.stop_codons}' | |
20 #end if | |
21 | |
22 --start_codons '$start_codons' | |
23 | |
24 $linear | |
25 $no_indep | |
26 $extend | |
27 '$seq_input' | |
28 '$icm_input' | |
29 glimmer_output | |
30 | |
31 && | |
32 | |
33 #if $report: | |
34 cp glimmer_output.predict '$report_output' && | |
35 #end if | |
36 #if $detailed_report: | |
37 cp glimmer_output.detail '$detailed_output' && | |
38 #end if | |
39 | |
40 ## convert prediction to FASTA sequences | |
41 python '$__tool_directory__/glimmer2seq.py' glimmer_output.predict '$seq_input' '$genes_output' | |
42 ]]></command> | |
43 <inputs> | |
44 <param name="seq_input" type="data" format="fasta" label="Genome Sequence" /> | |
45 <param name="icm_input" type="data" format="tar" label="Interpolated context model (ICM)" /> | |
46 | |
47 <param name="max_olap" type="integer" value="50" label="Set maximum overlap length" help="Overlaps this short or shorter are ignored." /> | |
48 <param name="gene_len" type="integer" value="90" label="Set the minimum gene length to n nucleotides" help="This does not include the bases in the stop codon."/> | |
49 <param name="threshold" type="integer" value="30" label="Set threshold score for calling as gene" help="If the in-frame score >= N, then the region is given a number and considered a potential gene." /> | |
50 <param name="gc_percent" type="float" value="0.0" label="Set the GC percentage of the independent model, i.e., the model of intergenic sequence" help="If 0.0 specified, the GC percentage will be counted from the input file." /> | |
51 | |
52 <param name="linear" type="boolean" truevalue="--linear" falsevalue="" checked="true" label="Assume linear rather than circular genome, i.e., no wraparound" /> | |
53 <param name="no_indep" type="boolean" truevalue="--no_indep" falsevalue="" checked="false" label="Don’t use the independent probability score column at all" help="Using this option will produce more short gene predictions." /> | |
54 <param name="extend" type="boolean" truevalue="--extend" falsevalue="" checked="false" label="Also score orfs that extend off the end of the sequence(s)" /> | |
55 <param name="start_codons" type="text" value="atg,gtg,ttg" label="Specify start codons as a comma-separated list" /> | |
56 | |
57 <conditional name="stop_codon_opts"> | |
58 <param name="stop_codon_opts_selector" type="select" label="Specify start codons as"> | |
59 <option value="gb" selected="True">Genbank translation table entry</option> | |
60 <option value="free_form">Comma-separated list</option> | |
61 </param> | |
62 <when value="gb"> | |
63 <param name="genbank_gencode" type="select" label="Use Genbank translation table to specify stop codons"> | |
64 <option value="1" selected="True">1. Standard</option> | |
65 <option value="2">2. Vertebrate Mitochondrial</option> | |
66 <option value="3">3. Yeast Mitochondrial</option> | |
67 <option value="4">4. Mold, Protozoan, and Coelenterate Mitochondrial Code and the Mycoplasma/Spiroplasma Code</option> | |
68 <option value="5">5. Invertebrate Mitochondrial</option> | |
69 <option value="6">6. Ciliate, Dasycladacean and Hexamita Nuclear Code</option> | |
70 <option value="9">9. Echinoderm Mitochondrial</option> | |
71 <option value="10">10. Euplotid Nuclear</option> | |
72 <option value="11">11. Bacteria and Archaea</option> | |
73 <option value="12">12. Alternative Yeast Nuclear</option> | |
74 <option value="13">13. Ascidian Mitochondrial</option> | |
75 <option value="14">14. Flatworm Mitochondrial</option> | |
76 <option value="15">15. Blepharisma Macronuclear</option> | |
77 <option value="16">16. Chlorophycean Mitochondrial</option> | |
78 <option value="21">21. Trematode Mitochondrial</option> | |
79 <option value="22">22. Scenedesmus obliquus mitochondrial</option> | |
80 <option value="23">23. Thraustochytrium Mitochondrial</option> | |
81 <option value="24">24. Pterobranchia mitochondrial</option> | |
82 </param> | |
83 </when> | |
84 <when value="free_form"> | |
85 <param name="stop_codons" type="text" value="tag,tga,taa" label="Specify stop codons as a comma-separated list" /> | |
86 </when> | |
87 </conditional> | |
88 | |
89 <param name="report" type="boolean" truevalue="" falsevalue="" checked="false" label="Report the classic glimmer table output"/> | |
90 <param name="detailed_report" type="boolean" truevalue="" falsevalue="" checked="false" label="Output a detailed gene prediction report as separate file"/> | |
91 </inputs> | |
92 <outputs> | |
93 <data name="genes_output" format="fasta" label="Glimmer3 on ${on_string} (Gene Prediction FASTA)" /> | |
94 <data name="report_output" format="txt" label="Glimmer3 on ${on_string} (Gene Prediction table)"> | |
95 <filter>report == True</filter> | |
96 </data> | |
97 <data name="detailed_output" format="txt" label="Glimmer3 on ${on_string} (detailed report)"> | |
98 <filter>detailed_report == True</filter> | |
99 </data> | |
100 </outputs> | |
101 <tests> | |
102 <test> | |
103 <param name="seq_input" value='streptomyces_Tue6071_plasmid_genomic.fasta' /> | |
104 <param name="icm_input" value='streptomyces_Tu6071_plasmid_genes.icm' ftype="tar" /> | |
105 <param name="max_olap" value="50" /> | |
106 <param name="gene_len" value="90" /> | |
107 <param name="threshold" value="30" /> | |
108 <param name="gc_percent" value="0.0" /> | |
109 <param name="linear" value="--linear" /> | |
110 <param name="no_indep" value="" /> | |
111 <param name="extend" value="" /> | |
112 <param name="start_codons" value="atg,gtg,ttg" /> | |
113 <param name="genbank_gencode" value="11" /> | |
114 <param name="detailed_report" value="true" /> | |
115 <param name="report" value="true" /> | |
116 <output name="genes_output" file='glimmer_w_icm_trans-table-11_genomic.fasta' ftype="fasta" /> | |
117 <output name="report_output" file='glimmer_w_icm_trans-table-11_genomic.out' ftype="txt" /> | |
118 <output name="detailed_output" file='glimmer_w_icm_trans-table-11_genomic.dout' ftype="txt" lines_diff="6" /> | |
119 </test> | |
120 </tests> | |
121 <help><![CDATA[ | |
122 **What it does** | |
123 | |
124 This is the main program that makes gene predictions based on an interpolated context model (ICM). | |
125 | |
126 The ICM can be generated with extracted CDS from related organisms (ICM builder). If you can't generate an ICM model you can use the non knowlegde-based Glimmer with a de novo prediction. | |
127 | |
128 | |
129 **Input** | |
130 | |
131 - Interpolated context model (ICM): Use the 'Glimmer ICM builder' tool to create one | |
132 - Genome Sequence in FASTA format | |
133 | |
134 | |
135 | |
136 **Output** | |
137 | |
138 - FASTA file with predicted proteins | |
139 - Glimmer prediction file (optional) | |
140 ]]></help> | |
141 <expand macro="citation" /> | |
142 </tool> |