comparison gaeval.xml @ 0:1dd7adc21b6d draft

"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/aegean commit e6c01517075cab35e620fe1bbdb5fd68e4d1359f"
author iuc
date Sun, 03 Jan 2021 14:59:26 +0000
parents
children 8dc7512c9dc9
comparison
equal deleted inserted replaced
-1:000000000000 0:1dd7adc21b6d
1 <tool id="aegean_gaeval" name="AEGeAn GAEVAL" version="@TOOL_VERSION@" profile="20.01">
2 <description> compute coverage and integrity scores for gene models using transcript alignments.</description>
3 <macros>
4 <import>macros.xml</import>
5 </macros>
6 <expand macro='xrefs'/>
7 <expand macro='edam_ontology'/>
8 <expand macro='requirements'/>
9 <version_command>gaeval --version</version_command>
10 <command detect_errors='exit_code'>
11 <![CDATA[
12 gaeval '$alignmentgff3' '$genesgff3'
13 -a $weights.alpha
14 -b $weights.beta
15 -g $weights.gamma
16 -e $weights.epsilon
17 -c $expected.expcds
18 -5 $expected.exp5putr
19 -3 $expected.exp3putr > '$output'
20 ]]>
21 </command>
22 <inputs>
23 <param name='alignmentgff3' type='data' format='gff3' label='Alignment GFF3 file' />
24 <param name='genesgff3' type='data' format='gff3' label='Genes GFF3 file'/>
25 <!-- Weight options -->
26 <section name='weights'
27 title='Weights for calculating integrity score'
28 expanded='False'>
29 <param argument='--alpha' type='float'
30 min='0' max='1' value='0.6'
31 label='Introns confirmed, or % expected CDS lenght for single-exon genes'
32 help='The percentage of introns confirmed by an alignment gap; for single-exon gene predictions lacking introns, it represents the ratio of the observed CDS length to the expected CDS length. '/>
33 <param argument='--beta' type='float'
34 min='0' max='1' value='0.3'
35 label='Exon coverage'
36 help='Overall percentage of individual exons spanned by at least one sequencing read.'/>
37 <param argument='--gamma' type='float'
38 min='0' max='1' value='0.05'
39 label='% expected 5’ UTR length'
40 help='The ratio of the observed 5’ UTR length to the expected 5’ UTR length.'/>
41 <param argument='--epsilon' type='float'
42 min='0' max='1' value='0.05'
43 label='% expected 3’ UTR lenght'
44 help='The ratio of the observed 3’ UTR length to the expected 3’ UTR length.'/>
45 </section>
46 <!-- Expected feature lenght options -->
47 <section name='expected'
48 title='Expected feature lenghts for calculating integrity score'
49 expanded='False'>
50 <param name='expcds' type='integer'
51 min='0' max='1000' value='400'
52 label='Expected CDs length (in bp) (-c)' />
53 <param name='exp5putr' type='integer'
54 min='0' max='1000' value='200'
55 label='Expected 5’ UTR length (-5)' />
56 <param name='exp3putr' type='integer'
57 min='0' max='1000' value='100'
58 label='Expected 3’ UTR length (-3)' />
59 </section>
60 </inputs>
61 <outputs>
62 <data name='output' format='tabular' />
63 </outputs>
64 <tests>
65 <test expect_num_outputs="1">
66 <param name='alignmentgff3' value='TAIR10_GFF3_alignment.gff'/>
67 <param name='genesgff3' value='TAIR10_GFF3_genes.gff'/>
68 <output name='output' file='gaeval_output_test1.txt'/>
69 </test>
70 <test expect_num_outputs="1">
71 <param name='alignmentgff3' value='TAIR10_GFF3_alignment.gff'/>
72 <param name='genesgff3' value='TAIR10_GFF3_genes.gff'/>
73 <section name='weights'>
74 <param name='alpha' value='0.5'/>
75 <param name='beta' value='0.4'/>
76 <param name='gamma' value='0.05'/>
77 <param name='epsion' value='0.05'/>
78 </section>
79 <output name='output' file='gaeval_output_test2.txt'/>
80 </test>
81 <test expect_num_outputs="1">
82 <param name='alignmentgff3' value='TAIR10_GFF3_alignment.gff'/>
83 <param name='genesgff3' value='TAIR10_GFF3_genes.gff'/>
84 <section name='expected'>
85 <param name='expcds' value='20'/>
86 <param name='exp5putr' value='150'/>
87 <param name='exp3putr' value='120'/>
88 </section>
89 <output name='output' file='gaeval_output_test3.txt' lines_diff='2'/>
90 </test>
91
92 </tests>
93 <help>
94 <![CDATA[
95 .. class:: infomark
96
97 **Purpose**
98
99 GAEVAL is a program for computing coverage and integrity scores for gene models using transcript alignments. The integrity score is a value between 0 and 1 that indicates the level of agreement between the gene model and any related transcript alignments, with 0 corresponding to no transcript support and 1 corresponding to complete transcript support.
100
101 -----
102
103 .. class:: infomark
104
105 **Input**
106
107 Input for GAEVAL is two GFF3 files, one containing gene predictions/annotations and one containing transcript alignments. Although the GFF3 Specification explicitly supports several similar encoding conventions for alignment features, only one is supported by GAEVAL, as shown below.
108
109
110 ctg123 . cDNA_match 1050 1500 5.8e-42 + . ID=match00001;Target=cdna0123 12 462
111 ctg123 . cDNA_match 5000 5500 8.1e-43 + . ID=match00001;Target=cdna0123 463 963
112 ctg123 . cDNA_match 7000 9000 1.4e-40 + . ID=match00001;Target=cdna0123 964 2964
113
114
115 GAEVAL will accept alignments with types cDNA_match, EST_match, and the generic nucleotide_match, depending on the source of the data.
116
117 The Target and Gap attributes are not disallowed by GAEVAL, but they are not interpreted by GAEVAL either. Gapped or spliced alignments must be encoded as multifeatures, with each segment of the alignment on its own distinct line and all segments of a single alignment sharing the same ID attribute.
118
119 -----
120
121 .. class:: infomark
122
123 **Output**
124
125 GAEVAL computes coverage and integrity scores for each mRNA feature in the gene prediction input. The output will be identical to the input, except that each mRNA feature will have two new attribtues: gaeval_coverage and gaeval_integrity.
126
127 ]]>
128 </help>
129 <expand macro='citations'/>
130 </tool>