Mercurial > repos > devteam > cuffcompare
annotate cuffcompare_wrapper.xml @ 11:ad5d061fbdf2 draft default tip
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tool_collections/cufflinks/cuffcompare commit 80b06e80066b32ad53ed418628992f056444256f
author | iuc |
---|---|
date | Sat, 05 Oct 2024 11:15:49 +0000 |
parents | f648e5180e40 |
children |
rev | line source |
---|---|
11
ad5d061fbdf2
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tool_collections/cufflinks/cuffcompare commit 80b06e80066b32ad53ed418628992f056444256f
iuc
parents:
10
diff
changeset
|
1 <tool id="cuffcompare" name="Cuffcompare" version="@TOOL_VERSION@.3" profile="@PROFILE@"> |
0 | 2 <description>compare assembled transcripts to a reference annotation and track Cufflinks transcripts across multiple experiments</description> |
6 | 3 <macros> |
4 <import>cuff_macros.xml</import> | |
5 </macros> | |
8
1322b73ffe44
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tool_collections/cufflinks/cuffcompare commit eb18f691975ef9539b5ebd4f118343c8ad967a1f
devteam
parents:
7
diff
changeset
|
6 <expand macro="requirements" /> |
10
f648e5180e40
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tool_collections/cufflinks/cuffcompare commit a0b0845a9d1b3e7ecdeacd1e606133617e3918bd"
iuc
parents:
9
diff
changeset
|
7 <version_command><![CDATA[ |
f648e5180e40
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tool_collections/cufflinks/cuffcompare commit a0b0845a9d1b3e7ecdeacd1e606133617e3918bd"
iuc
parents:
9
diff
changeset
|
8 cuffcompare 2>&1 | head -n 1 |
f648e5180e40
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tool_collections/cufflinks/cuffcompare commit a0b0845a9d1b3e7ecdeacd1e606133617e3918bd"
iuc
parents:
9
diff
changeset
|
9 ]]></version_command> |
9
e66b9b5b8580
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tool_collections/cufflinks/cuffcompare commit 82ee6fc860c52c531b7a57bbb346ab1a67a434a5
devteam
parents:
8
diff
changeset
|
10 <command detect_errors="aggressive"><![CDATA[ |
10
f648e5180e40
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tool_collections/cufflinks/cuffcompare commit a0b0845a9d1b3e7ecdeacd1e606133617e3918bd"
iuc
parents:
9
diff
changeset
|
11 @CUFFLINKS_LINK_GTF_INPUTS@ |
f648e5180e40
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tool_collections/cufflinks/cuffcompare commit a0b0845a9d1b3e7ecdeacd1e606133617e3918bd"
iuc
parents:
9
diff
changeset
|
12 cuffcompare |
f648e5180e40
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tool_collections/cufflinks/cuffcompare commit a0b0845a9d1b3e7ecdeacd1e606133617e3918bd"
iuc
parents:
9
diff
changeset
|
13 -o output |
0 | 14 ## Use annotation reference? |
15 #if $annotation.use_ref_annotation == "Yes": | |
10
f648e5180e40
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tool_collections/cufflinks/cuffcompare commit a0b0845a9d1b3e7ecdeacd1e606133617e3918bd"
iuc
parents:
9
diff
changeset
|
16 -r '$annotation.reference_annotation' |
0 | 17 #if $annotation.ignore_nonoverlapping_reference: |
18 -R | |
19 #end if | |
6 | 20 #if $annotation.ignore_nonoverlapping_transfrags: |
21 -Q | |
22 #end if | |
0 | 23 #end if |
9
e66b9b5b8580
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tool_collections/cufflinks/cuffcompare commit 82ee6fc860c52c531b7a57bbb346ab1a67a434a5
devteam
parents:
8
diff
changeset
|
24 |
0 | 25 ## Use sequence data? |
26 #if $seq_data.use_seq_data == "Yes": | |
2
8b22e9adae34
Update to the new data table specification.
Dave Bouvier <dave@bx.psu.edu>
parents:
0
diff
changeset
|
27 -s |
0 | 28 #if $seq_data.seq_source.index_source == "history": |
10
f648e5180e40
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tool_collections/cufflinks/cuffcompare commit a0b0845a9d1b3e7ecdeacd1e606133617e3918bd"
iuc
parents:
9
diff
changeset
|
29 '$seq_data.seq_source.ref_file' |
0 | 30 #else: |
10
f648e5180e40
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tool_collections/cufflinks/cuffcompare commit a0b0845a9d1b3e7ecdeacd1e606133617e3918bd"
iuc
parents:
9
diff
changeset
|
31 '${seq_data.seq_source.index.fields.path}' |
0 | 32 #end if |
33 #end if | |
9
e66b9b5b8580
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tool_collections/cufflinks/cuffcompare commit 82ee6fc860c52c531b7a57bbb346ab1a67a434a5
devteam
parents:
8
diff
changeset
|
34 |
6 | 35 $discard_single_exon |
36 | |
37 -e $max_dist_exon | |
38 -d $max_dist_group | |
39 | |
10
f648e5180e40
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tool_collections/cufflinks/cuffcompare commit a0b0845a9d1b3e7ecdeacd1e606133617e3918bd"
iuc
parents:
9
diff
changeset
|
40 $discard_intron_redundant_transfrags |
6 | 41 |
42 @CUFFLINKS_GTF_INPUTS@ | |
10
f648e5180e40
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tool_collections/cufflinks/cuffcompare commit a0b0845a9d1b3e7ecdeacd1e606133617e3918bd"
iuc
parents:
9
diff
changeset
|
43 ]]></command> |
0 | 44 <inputs> |
6 | 45 <expand macro="cufflinks_gtf_inputs" /> |
0 | 46 <conditional name="annotation"> |
47 <param name="use_ref_annotation" type="select" label="Use Reference Annotation"> | |
48 <option value="No">No</option> | |
49 <option value="Yes">Yes</option> | |
50 </param> | |
51 <when value="Yes"> | |
6 | 52 <param format="gff3,gtf" name="reference_annotation" type="data" label="Reference Annotation" help="Requires an annotation file in GFF3 or GTF format."/> |
53 <param name="ignore_nonoverlapping_reference" type="boolean" label="Ignore reference transcripts that are not overlapped by any input transfrags" help="consider only the reference transcripts that overlap any of the input transfrags (Sn correction)" /> | |
54 <param name="ignore_nonoverlapping_transfrags" type="boolean" label="Ignore input transcripts that are not overlapped by any reference transcripts" help="consider only the input transcripts that overlap any of the reference transcripts (Sp correction). Warning: this will discard all 'novel' loci!" /> | |
0 | 55 </when> |
56 <when value="No"> | |
57 </when> | |
58 </conditional> | |
59 <conditional name="seq_data"> | |
9
e66b9b5b8580
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tool_collections/cufflinks/cuffcompare commit 82ee6fc860c52c531b7a57bbb346ab1a67a434a5
devteam
parents:
8
diff
changeset
|
60 <param name="use_seq_data" type="select" label="Use Sequence Data" |
6 | 61 help="Use sequence data for some optional classification functions, including the addition of the p_id attribute required by Cuffdiff."> |
0 | 62 <option value="Yes">Yes</option> |
63 <option value="No">No</option> | |
64 </param> | |
65 <when value="No"></when> | |
66 <when value="Yes"> | |
67 <conditional name="seq_source"> | |
68 <param name="index_source" type="select" label="Choose the source for the reference list"> | |
69 <option value="cached">Locally cached</option> | |
70 <option value="history">History</option> | |
71 </param> | |
2
8b22e9adae34
Update to the new data table specification.
Dave Bouvier <dave@bx.psu.edu>
parents:
0
diff
changeset
|
72 <when value="cached"> |
8b22e9adae34
Update to the new data table specification.
Dave Bouvier <dave@bx.psu.edu>
parents:
0
diff
changeset
|
73 <param name="index" type="select" label="Using reference genome"> |
8b22e9adae34
Update to the new data table specification.
Dave Bouvier <dave@bx.psu.edu>
parents:
0
diff
changeset
|
74 <options from_data_table="fasta_indexes"> |
6 | 75 <filter type="data_meta" ref="inputs" key="dbkey" column="1" /> |
2
8b22e9adae34
Update to the new data table specification.
Dave Bouvier <dave@bx.psu.edu>
parents:
0
diff
changeset
|
76 <validator type="no_options" message="No reference genome is available for the build associated with the selected input dataset" /> |
8b22e9adae34
Update to the new data table specification.
Dave Bouvier <dave@bx.psu.edu>
parents:
0
diff
changeset
|
77 </options> |
8b22e9adae34
Update to the new data table specification.
Dave Bouvier <dave@bx.psu.edu>
parents:
0
diff
changeset
|
78 </param> |
8b22e9adae34
Update to the new data table specification.
Dave Bouvier <dave@bx.psu.edu>
parents:
0
diff
changeset
|
79 </when> |
0 | 80 <when value="history"> |
81 <param name="ref_file" type="data" format="fasta" label="Using reference file" /> | |
82 </when> | |
83 </conditional> | |
84 </when> | |
85 </conditional> | |
6 | 86 <param type="select" name="discard_single_exon" label="discard (ignore) single-exon transcripts"> |
10
f648e5180e40
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tool_collections/cufflinks/cuffcompare commit a0b0845a9d1b3e7ecdeacd1e606133617e3918bd"
iuc
parents:
9
diff
changeset
|
87 <option value="" selected="True">No</option> |
f648e5180e40
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tool_collections/cufflinks/cuffcompare commit a0b0845a9d1b3e7ecdeacd1e606133617e3918bd"
iuc
parents:
9
diff
changeset
|
88 <option value="-M">Discard single-exon transfrags and reference transcripts</option> |
f648e5180e40
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tool_collections/cufflinks/cuffcompare commit a0b0845a9d1b3e7ecdeacd1e606133617e3918bd"
iuc
parents:
9
diff
changeset
|
89 <option value="-N">Discard single-exon reference transcripts</option> |
6 | 90 </param> |
9
e66b9b5b8580
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tool_collections/cufflinks/cuffcompare commit 82ee6fc860c52c531b7a57bbb346ab1a67a434a5
devteam
parents:
8
diff
changeset
|
91 <param type="integer" name="max_dist_exon" value="100" label="Max. Distance for assessing exon accuracy" |
6 | 92 help="max. distance (range) allowed from free ends of terminal exons of reference transcripts when assessing exon accuracy. Default: 100" /> |
9
e66b9b5b8580
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tool_collections/cufflinks/cuffcompare commit 82ee6fc860c52c531b7a57bbb346ab1a67a434a5
devteam
parents:
8
diff
changeset
|
93 <param type="integer" name="max_dist_group" value="100" label="Max.Distance for transcript grouping" |
6 | 94 help="max. distance (range) for grouping transcript start sites. Default: 100" /> |
9
e66b9b5b8580
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tool_collections/cufflinks/cuffcompare commit 82ee6fc860c52c531b7a57bbb346ab1a67a434a5
devteam
parents:
8
diff
changeset
|
95 <param type="boolean" name="discard_intron_redundant_transfrags" label="discard intron-redundant transfrags sharing 5'" |
10
f648e5180e40
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tool_collections/cufflinks/cuffcompare commit a0b0845a9d1b3e7ecdeacd1e606133617e3918bd"
iuc
parents:
9
diff
changeset
|
96 value="false" truevalue="-F" falsevalue="" |
6 | 97 help="Discard intron-redundant transfrags if they share the 5' end (if they differ only at the 3' end)" /> |
0 | 98 </inputs> |
99 | |
100 <outputs> | |
9
e66b9b5b8580
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tool_collections/cufflinks/cuffcompare commit 82ee6fc860c52c531b7a57bbb346ab1a67a434a5
devteam
parents:
8
diff
changeset
|
101 <data format="txt" name="transcripts_accuracy" label="${tool.name} on ${on_string}: transcript accuracy" |
10
f648e5180e40
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tool_collections/cufflinks/cuffcompare commit a0b0845a9d1b3e7ecdeacd1e606133617e3918bd"
iuc
parents:
9
diff
changeset
|
102 from_work_dir="output.stats" /> |
6 | 103 <data format="tabular" name="input1_tmap" label="${tool.name} on ${on_string}: data ${inputs[0].hid} tmap file" |
10
f648e5180e40
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tool_collections/cufflinks/cuffcompare commit a0b0845a9d1b3e7ecdeacd1e606133617e3918bd"
iuc
parents:
9
diff
changeset
|
104 from_work_dir="output.input_0.tmap" /> |
9
e66b9b5b8580
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tool_collections/cufflinks/cuffcompare commit 82ee6fc860c52c531b7a57bbb346ab1a67a434a5
devteam
parents:
8
diff
changeset
|
105 <data format="tabular" name="input1_refmap" |
e66b9b5b8580
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tool_collections/cufflinks/cuffcompare commit 82ee6fc860c52c531b7a57bbb346ab1a67a434a5
devteam
parents:
8
diff
changeset
|
106 label="${tool.name} on ${on_string}: data ${inputs[0].hid} refmap file" |
10
f648e5180e40
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tool_collections/cufflinks/cuffcompare commit a0b0845a9d1b3e7ecdeacd1e606133617e3918bd"
iuc
parents:
9
diff
changeset
|
107 from_work_dir="output.input_0.refmap"> |
0 | 108 <filter>annotation['use_ref_annotation'] == 'Yes'</filter> |
109 </data> | |
10
f648e5180e40
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tool_collections/cufflinks/cuffcompare commit a0b0845a9d1b3e7ecdeacd1e606133617e3918bd"
iuc
parents:
9
diff
changeset
|
110 <data format="tabular" name="input2_tmap" label="${tool.name} on ${on_string}: data ${inputs[1].hid} tmap file" from_work_dir="output.input_1.tmap"> |
6 | 111 <filter>@HAS_MULTIPLE_INPUTS@</filter> |
0 | 112 </data> |
9
e66b9b5b8580
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tool_collections/cufflinks/cuffcompare commit 82ee6fc860c52c531b7a57bbb346ab1a67a434a5
devteam
parents:
8
diff
changeset
|
113 <data format="tabular" name="input2_refmap" |
e66b9b5b8580
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tool_collections/cufflinks/cuffcompare commit 82ee6fc860c52c531b7a57bbb346ab1a67a434a5
devteam
parents:
8
diff
changeset
|
114 label="${tool.name} on ${on_string}: data ${inputs[1].hid} refmap file" |
10
f648e5180e40
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tool_collections/cufflinks/cuffcompare commit a0b0845a9d1b3e7ecdeacd1e606133617e3918bd"
iuc
parents:
9
diff
changeset
|
115 from_work_dir="output.input_1.refmap"> |
6 | 116 <filter>annotation['use_ref_annotation'] == 'Yes' and @HAS_MULTIPLE_INPUTS@</filter> |
0 | 117 </data> |
10
f648e5180e40
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tool_collections/cufflinks/cuffcompare commit a0b0845a9d1b3e7ecdeacd1e606133617e3918bd"
iuc
parents:
9
diff
changeset
|
118 <data format="tabular" name="transcripts_tracking" label="${tool.name} on ${on_string}: transcript tracking" from_work_dir="output.tracking"> |
6 | 119 <filter>@HAS_MULTIPLE_INPUTS@</filter> |
0 | 120 </data> |
10
f648e5180e40
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tool_collections/cufflinks/cuffcompare commit a0b0845a9d1b3e7ecdeacd1e606133617e3918bd"
iuc
parents:
9
diff
changeset
|
121 <data format="gtf" name="transcripts_combined" label="${tool.name} on ${on_string}: combined transcripts" from_work_dir="output.combined.gtf"/> |
0 | 122 </outputs> |
123 | |
124 <tests> | |
9
e66b9b5b8580
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tool_collections/cufflinks/cuffcompare commit 82ee6fc860c52c531b7a57bbb346ab1a67a434a5
devteam
parents:
8
diff
changeset
|
125 <!-- |
0 | 126 cuffcompare -r cuffcompare_in3.gtf -R cuffcompare_in1.gtf cuffcompare_in2.gtf |
127 --> | |
10
f648e5180e40
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tool_collections/cufflinks/cuffcompare commit a0b0845a9d1b3e7ecdeacd1e606133617e3918bd"
iuc
parents:
9
diff
changeset
|
128 <test expect_num_outputs="7"> |
6 | 129 <param name="inputs" value="cuffcompare_in1.gtf,cuffcompare_in2.gtf" ftype="gtf"/> |
0 | 130 <param name="use_ref_annotation" value="Yes"/> |
131 <param name="reference_annotation" value="cuffcompare_in3.gtf" ftype="gtf"/> | |
132 <param name="ignore_nonoverlapping_reference" value="Yes"/> | |
6 | 133 <param name="ignore_nonoverlapping_transfrags" value="No"/> |
0 | 134 <param name="use_seq_data" value="No"/> |
6 | 135 <param name="discard_single_exon" value="" /> |
136 <param name="max_dist_exon" value="100" /> | |
137 <param name="max_dist_group" value="100" /> | |
10
f648e5180e40
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tool_collections/cufflinks/cuffcompare commit a0b0845a9d1b3e7ecdeacd1e606133617e3918bd"
iuc
parents:
9
diff
changeset
|
138 <param name="discard_intron_redundant_transfrags" value="false" /> |
0 | 139 <!-- Line diffs are the result of different locations for input files; this cannot be fixed as cuffcompare outputs |
140 full input path for each input. --> | |
10
f648e5180e40
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tool_collections/cufflinks/cuffcompare commit a0b0845a9d1b3e7ecdeacd1e606133617e3918bd"
iuc
parents:
9
diff
changeset
|
141 <output name="transcripts_accuracy" file="cuffcompare_out7.txt" lines_diff="6"/> |
0 | 142 <output name="input1_tmap" file="cuffcompare_out1.tmap"/> |
143 <output name="input1_refmap" file="cuffcompare_out2.refmap"/> | |
144 <output name="input2_tmap" file="cuffcompare_out3.tmap"/> | |
145 <output name="input2_refmap" file="cuffcompare_out4.refmap"/> | |
146 <output name="transcripts_tracking" file="cuffcompare_out6.tracking"/> | |
147 <output name="transcripts_combined" file="cuffcompare_out5.gtf"/> | |
148 </test> | |
149 </tests> | |
150 | |
151 <help> | |
152 **Cuffcompare Overview** | |
153 | |
154 Cuffcompare is part of Cufflinks_. Cuffcompare helps you: (a) compare your assembled transcripts to a reference annotation and (b) track Cufflinks transcripts across multiple experiments (e.g. across a time course). Please cite: Trapnell C, Williams BA, Pertea G, Mortazavi AM, Kwan G, van Baren MJ, Salzberg SL, Wold B, Pachter L. Transcript assembly and abundance estimation from RNA-Seq reveals thousands of new transcripts and switching among isoforms. Nature Biotechnology doi:10.1038/nbt.1621 | |
155 | |
6 | 156 .. _Cufflinks: http://cole-trapnell-lab.github.io/cufflinks/ |
157 | |
0 | 158 ------ |
159 | |
160 **Know what you are doing** | |
161 | |
162 .. class:: warningmark | |
163 | |
164 There is no such thing (yet) as an automated gearshift in expression analysis. It is all like stick-shift driving in San Francisco. In other words, running this tool with default parameters will probably not give you meaningful results. A way to deal with this is to **understand** the parameters by carefully reading the `documentation`__ and experimenting. Fortunately, Galaxy makes experimenting easy. | |
165 | |
6 | 166 .. __: http://cole-trapnell-lab.github.io/cufflinks/cuffcompare/ |
0 | 167 |
168 ------ | |
169 | |
170 **Input format** | |
171 | |
172 Cuffcompare takes Cufflinks' GTF output as input, and optionally can take a "reference" annotation (such as from Ensembl_) | |
173 | |
9
e66b9b5b8580
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tool_collections/cufflinks/cuffcompare commit 82ee6fc860c52c531b7a57bbb346ab1a67a434a5
devteam
parents:
8
diff
changeset
|
174 .. _Ensembl: http://www.ensembl.org |
0 | 175 |
176 ------ | |
177 | |
178 **Outputs** | |
179 | |
180 Cuffcompare produces the following output files: | |
181 | |
182 Transcripts Accuracy File: | |
183 | |
184 Cuffcompare reports various statistics related to the "accuracy" of the transcripts in each sample when compared to the reference annotation data. The typical gene finding measures of "sensitivity" and "specificity" (as defined in Burset, M., Guigó, R. : Evaluation of gene structure prediction programs (1996) Genomics, 34 (3), pp. 353-367. doi: 10.1006/geno.1996.0298) are calculated at various levels (nucleotide, exon, intron, transcript, gene) for each input file and reported in this file. The Sn and Sp columns show sensitivity and specificity values at each level, while the fSn and fSp columns are "fuzzy" variants of these same accuracy calculations, allowing for a very small variation in exon boundaries to still be counted as a "match". | |
185 | |
186 Transcripts Combined File: | |
187 | |
9
e66b9b5b8580
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tool_collections/cufflinks/cuffcompare commit 82ee6fc860c52c531b7a57bbb346ab1a67a434a5
devteam
parents:
8
diff
changeset
|
188 Cuffcompare reports a GTF file containing the "union" of all transfrags in each sample. If a transfrag is present in both samples, it is thus reported once in the combined gtf. |
0 | 189 |
190 Transcripts Tracking File: | |
191 | |
192 This file matches transcripts up between samples. Each row contains a transcript structure that is present in one or more input GTF files. Because the transcripts will generally have different IDs (unless you assembled your RNA-Seq reads against a reference transcriptome), cuffcompare examines the structure of each of the transcripts, matching transcripts that agree on the coordinates and order of all of their introns, as well as strand. Matching transcripts are allowed to differ on the length of the first and last exons, since these lengths will naturally vary from sample to sample due to the random nature of sequencing. | |
193 If you ran cuffcompare with the -r option, the first and second columns contain the closest matching reference transcript to the one described by each row. | |
194 | |
195 Here's an example of a line from the tracking file:: | |
196 | |
6 | 197 TCONS_00000045 XLOC_000023 Tcea|uc007afj.1 j \ |
0 | 198 q1:exp.115|exp.115.0|100|3.061355|0.350242|0.350207 \ |
199 q2:60hr.292|60hr.292.0|100|4.094084|0.000000|0.000000 | |
200 | |
201 In this example, a transcript present in the two input files, called exp.115.0 in the first and 60hr.292.0 in the second, doesn't match any reference transcript exactly, but shares exons with uc007afj.1, an isoform of the gene Tcea, as indicated by the class code j. The first five columns are as follows:: | |
202 | |
203 Column number Column name Example Description | |
204 ----------------------------------------------------------------------- | |
205 1 Cufflinks transfrag id TCONS_00000045 A unique internal id for the transfrag | |
206 2 Cufflinks locus id XLOC_000023 A unique internal id for the locus | |
207 3 Reference gene id Tcea The gene_name attribute of the reference GTF record for this transcript, or '-' if no reference transcript overlaps this Cufflinks transcript | |
208 4 Reference transcript id uc007afj.1 The transcript_id attribute of the reference GTF record for this transcript, or '-' if no reference transcript overlaps this Cufflinks transcript | |
209 5 Class code c The type of match between the Cufflinks transcripts in column 6 and the reference transcript. See class codes | |
9
e66b9b5b8580
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tool_collections/cufflinks/cuffcompare commit 82ee6fc860c52c531b7a57bbb346ab1a67a434a5
devteam
parents:
8
diff
changeset
|
210 |
0 | 211 Each of the columns after the fifth has the following format: |
212 qJ:gene_id|transcript_id|FMI|FPKM|conf_lo|conf_hi | |
213 | |
214 A transcript need not be present in all samples to be reported in the tracking file. A sample not containing a transcript will have a "-" in its entry in the row for that transcript. | |
215 | |
216 Class Codes | |
217 | |
218 If you ran cuffcompare with the -r option, tracking rows will contain the following values. If you did not use -r, the rows will all contain "-" in their class code column:: | |
219 | |
6 | 220 Priority Code Description |
0 | 221 --------------------------------- |
6 | 222 1 = Match |
9
e66b9b5b8580
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tool_collections/cufflinks/cuffcompare commit 82ee6fc860c52c531b7a57bbb346ab1a67a434a5
devteam
parents:
8
diff
changeset
|
223 2 c Contained |
e66b9b5b8580
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tool_collections/cufflinks/cuffcompare commit 82ee6fc860c52c531b7a57bbb346ab1a67a434a5
devteam
parents:
8
diff
changeset
|
224 3 j New isoform |
e66b9b5b8580
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tool_collections/cufflinks/cuffcompare commit 82ee6fc860c52c531b7a57bbb346ab1a67a434a5
devteam
parents:
8
diff
changeset
|
225 4 e A single exon transcript overlapping a reference exon and at least 10 bp of a reference intron, indicating a possible pre-mRNA fragment. |
7
b77178f66fc3
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tool_collections/cufflinks/cuffcompare commit a1517c9d22029095120643bbe2c8fa53754dd2b7
devteam
parents:
6
diff
changeset
|
226 5 i A single exon transcript falling entirely within a reference intron |
b77178f66fc3
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tool_collections/cufflinks/cuffcompare commit a1517c9d22029095120643bbe2c8fa53754dd2b7
devteam
parents:
6
diff
changeset
|
227 6 o Generic exonic overlap with a reference transcript |
9
e66b9b5b8580
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tool_collections/cufflinks/cuffcompare commit 82ee6fc860c52c531b7a57bbb346ab1a67a434a5
devteam
parents:
8
diff
changeset
|
228 7 p Possible polymerase run-on fragment |
e66b9b5b8580
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tool_collections/cufflinks/cuffcompare commit 82ee6fc860c52c531b7a57bbb346ab1a67a434a5
devteam
parents:
8
diff
changeset
|
229 8 r Repeat. Currently determined by looking at the soft-masked reference sequence and applied to transcripts where at least 50% of the bases are lower case |
7
b77178f66fc3
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tool_collections/cufflinks/cuffcompare commit a1517c9d22029095120643bbe2c8fa53754dd2b7
devteam
parents:
6
diff
changeset
|
230 9 u Unknown, intergenic transcript |
b77178f66fc3
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tool_collections/cufflinks/cuffcompare commit a1517c9d22029095120643bbe2c8fa53754dd2b7
devteam
parents:
6
diff
changeset
|
231 10 x Exonic overlap with reference on the opposite strand |
b77178f66fc3
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tool_collections/cufflinks/cuffcompare commit a1517c9d22029095120643bbe2c8fa53754dd2b7
devteam
parents:
6
diff
changeset
|
232 11 s An intron of the transfrag overlaps a reference intron on the opposite strand (likely due to read mapping errors) |
b77178f66fc3
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tool_collections/cufflinks/cuffcompare commit a1517c9d22029095120643bbe2c8fa53754dd2b7
devteam
parents:
6
diff
changeset
|
233 12 . (.tracking file only, indicates multiple classifications) |
9
e66b9b5b8580
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tool_collections/cufflinks/cuffcompare commit 82ee6fc860c52c531b7a57bbb346ab1a67a434a5
devteam
parents:
8
diff
changeset
|
234 |
0 | 235 ------- |
236 | |
237 **Settings** | |
238 | |
239 All of the options have a default value. You can change any of them. Most of the options in Cuffcompare have been implemented here. | |
240 | |
241 ------ | |
242 | |
243 **Cuffcompare parameter list** | |
244 | |
245 This is a list of implemented Cuffcompare options:: | |
246 | |
247 -r An optional "reference" annotation GTF. Each sample is matched against this file, and sample isoforms are tagged as overlapping, matching, or novel where appropriate. See the refmap and tmap output file descriptions below. | |
248 -R If -r was specified, this option causes cuffcompare to ignore reference transcripts that are not overlapped by any transcript in one of cuff1.gtf,...,cuffN.gtf. Useful for ignoring annotated transcripts that are not present in your RNA-Seq samples and thus adjusting the "sensitivity" calculation in the accuracy report written in the transcripts_accuracy file | |
249 </help> | |
10
f648e5180e40
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tool_collections/cufflinks/cuffcompare commit a0b0845a9d1b3e7ecdeacd1e606133617e3918bd"
iuc
parents:
9
diff
changeset
|
250 <expand macro="citations"/> |
0 | 251 </tool> |