comparison rna_quast.xml @ 3:bf3dc4cae5bf draft

Uploaded
author lehmanju
date Wed, 14 Oct 2020 07:03:06 +0000
parents 7e130d325fa7
children cc0366f0bdf7
comparison
equal deleted inserted replaced
2:7e130d325fa7 3:bf3dc4cae5bf
1 <tool id="rna_quast" name="rnaQUAST" version="@TOOL_VERSION@" python_template_version="3.7"> 1 <tool id="rna_quast" name="rnaQUAST" version="@TOOL_VERSION@">
2 <description>A Quality Assessment Tool for De Novo Transcriptome Assemblies</description> 2 <description>A Quality Assessment Tool for De Novo Transcriptome Assemblies</description>
3 <macros> 3 <macros>
4 <token name="@TOOL_VERSION@">2.1.0</token> 4 <token name="@TOOL_VERSION@">2.1.0</token>
5 <xml name="element_matching_line" token_name="" token_expression=""> <!-- Test macro: expands to an element (named by the NAME token) whose contents must contain a line matching the regular expression given by the EXPRESSION token. -->
6 <element name="@NAME@">
7 <assert_contents><has_line_matching expression="@EXPRESSION@"/></assert_contents>
8 </element>
9 </xml>
10 <xml name="element_has_text" token_name="" token_text=""> <!-- Test macro: expands to an element (named by the NAME token) whose contents must include the text given by the TEXT token. -->
11 <element name="@NAME@">
12 <assert_contents><has_text text="@TEXT@"/></assert_contents>
13 </element>
14 </xml>
5 </macros> 15 </macros>
6 <requirements> 16 <requirements>
7 <requirement type="package" version="@TOOL_VERSION@">rnaquast</requirement> 17 <requirement type="package" version="@TOOL_VERSION@">rnaquast</requirement>
8 </requirements> 18 </requirements>
9 <stdio> 19 <stdio>
80 <param name="use_gtf" type="select" label="Use file with gene coordinates in GTF/GFF format?" help="We recommend to use files downloaded from GENCODE or Ensembl."> 90 <param name="use_gtf" type="select" label="Use file with gene coordinates in GTF/GFF format?" help="We recommend to use files downloaded from GENCODE or Ensembl.">
81 <option value="true" selected="true">Yes</option> 91 <option value="true" selected="true">Yes</option>
82 <option value="false">No</option> 92 <option value="false">No</option>
83 </param> 93 </param>
84 <when value="true"> 94 <when value="true">
85 <param name="gtf" argument="--gtf" type="data" format="gtf, gff, gff3" multiple="true" label="GTF/GFF file"/> 95 <param name="gtf" argument="--gtf" type="data" format="gtf,gff,gff3" multiple="true" label="GTF/GFF file"/>
86 <param argument="--disable_infer_genes" type="boolean" truevalue="--disable_infer_genes" falsevalue="" checked="false" label=" GTF file contains genes records?"/> 96 <param argument="--disable_infer_genes" type="boolean" truevalue="--disable_infer_genes" falsevalue="" checked="false" label=" GTF file contains genes records?"/>
87 <param argument="--disable_infer_transcripts" type="boolean" truevalue="--disable_infer_transcripts" falsevalue="" checked="false" label="GTF file contains transcripts records?"/> 97 <param argument="--disable_infer_transcripts" type="boolean" truevalue="--disable_infer_transcripts" falsevalue="" checked="false" label="GTF file contains transcripts records?"/>
88 </when> 98 </when>
89 <when value="false"> 99 <when value="false">
90 </when> 100 </when>
126 </data> 136 </data>
127 <collection name="list_logs" type="list" label="${tool.name} on ${on_string}: logs" > 137 <collection name="list_logs" type="list" label="${tool.name} on ${on_string}: logs" >
128 <discover_datasets ext="txt" pattern="(?P&lt;name&gt;.+)\.log" directory="outputdir/logs/" visible="false" /> 138 <discover_datasets ext="txt" pattern="(?P&lt;name&gt;.+)\.log" directory="outputdir/logs/" visible="false" />
129 <filter>"logs" in out_add</filter> 139 <filter>"logs" in out_add</filter>
130 </collection> 140 </collection>
131 <collection name="list_comparison_png" type="list" label="${tool.name} on ${on_string}: comparison plots" > 141 <collection name="comparison_png" type="list" label="${tool.name} on ${on_string}: comparison plots" >
132 <discover_datasets ext="png" pattern="(?P&lt;name&gt;.+)\.png" directory="outputdir/comparison_output/" visible="false" recurse="true"/> 142 <discover_datasets ext="png" pattern="(?P&lt;name&gt;.+)\.png" directory="outputdir/comparison_output/" visible="false" recurse="true"/>
133 <filter> len(input)>1 and "plots" in out_add </filter> 143 <filter> len(input)>1 and "plots" in out_add</filter>
134 </collection> 144 </collection>
135 <collection name="list_comparison" type="list" label="${tool.name} on ${on_string}: comparison" > 145 <collection name="comparison" type="list" label="${tool.name} on ${on_string}: comparison" >
136 <discover_datasets ext="txt" pattern="(?P&lt;name&gt;.+)\.txt" directory="outputdir/comparison_output/" visible="false" recurse="true" /> 146 <discover_datasets ext="txt" pattern="(?P&lt;name&gt;.+)\.txt" directory="outputdir/comparison_output/" visible="false" recurse="true" />
137 <filter> len(input)>1 and "comparison" in out_add</filter> 147 <filter> len(input)>1 and "comparison" in out_add</filter>
138 </collection> 148 </collection>
139 <collection name="data_collection" type="list:list" label="${tool.name} on ${on_string}: detailed output"> 149 <collection name="details" type="list:list" label="${tool.name} on ${on_string}: detailed output">
140 <discover_datasets pattern="(?P&lt;identifier_0&gt;.+)_____(?P&lt;identifier_1&gt;.+)\.(?P&lt;ext&gt;txt)" directory="details/" visible="false"/> 150 <discover_datasets pattern="(?P&lt;identifier_0&gt;.+)_____(?P&lt;identifier_1&gt;.+)\.(?P&lt;ext&gt;txt)" directory="details/" visible="false"/>
141 <filter>"details" in out_add</filter> 151 <filter>"details" in out_add</filter>
142 </collection> 152 </collection>
143 <collection name="data_collection_png" type="list:list" label="${tool.name} on ${on_string}: detailed output plots"> 153 <collection name="details_png" type="list:list" label="${tool.name} on ${on_string}: detailed output plots">
144 <discover_datasets pattern="(?P&lt;identifier_0&gt;.+)_____(?P&lt;identifier_1&gt;.+)\.(?P&lt;ext&gt;png)" directory="details/" visible="false"/> 154 <discover_datasets pattern="(?P&lt;identifier_0&gt;.+)_____(?P&lt;identifier_1&gt;.+)\.(?P&lt;ext&gt;png)" directory="details/" visible="false"/>
145 <filter>"details_plots" in out_add</filter> 155 <filter>"details_plots" in out_add</filter>
146 </collection> 156 </collection>
147 </outputs> 157 </outputs>
148 <tests> 158 <tests>
171 <output name="short_report_tsv"> 181 <output name="short_report_tsv">
172 <assert_contents> 182 <assert_contents>
173 <has_line_matching expression="^METRICS/TRANSCRIPTS\tidba\tTrinity$"/> 183 <has_line_matching expression="^METRICS/TRANSCRIPTS\tidba\tTrinity$"/>
174 </assert_contents> 184 </assert_contents>
175 </output> 185 </output>
176 <output_collection name="list_comparison_png" type="list" count="15"/> 186 <output_collection name="comparison_png" type="list" count="15"/>
177 <output_collection name="list_comparison" type="list" count="19"/> 187 <output_collection name="comparison" type="list" count="19"/>
178 <output_collection name="list_logs" type="list" count="8"/> 188 <output_collection name="list_logs" type="list" count="8"/>
179 <output_collection name="data_collection" type="list:list" count="2"> 189 <output_collection name="details" type="list:list" count="2">
180 <element name="Trinity"> 190 <output_collection name="Trinity" type="list" count="21"/>
181 <element name="alignment_metrics"> 191 <output_collection name="idba" type="list" count="21"/>
182 <assert_contents><has_line_matching expression="^METRICS/TRANSCRIPTS\s+Trinity\s+$"/></assert_contents>
183 </element>
184 <element name="alignment_multiplicity"/>
185 <element name="alignments_per_isoform"/>
186 <element name="basic_metrics"/>
187 <element name="block_length"/>
188 <element name="blocks_per_alignment"/>
189 <element name="database_metrics"/>
190 <element name="misassemblies"/>
191 <element name="mismatch_rate"/>
192 <element name="sensitivity"/>
193 <element name="specificity"/>
194 <element name="transcript_length"/>
195 <element name="x-aligned"/>
196 <element name="x-assembled_exons"/>
197 <element name="x-assembled"/>
198 <element name="x-covered_exons"/>
199 <element name="x-covered"/>
200 <element name="x-matched_blocks"/>
201 <element name="x-matched"/>
202 </element>
203 <element name="idba">
204 <element name="alignment_metrics">
205 <assert_contents>
206 <has_line_matching expression="^METRICS/TRANSCRIPTS\s+idba\s+$"/>
207 </assert_contents>
208 </element>
209 </element>
210 </output_collection> 192 </output_collection>
211 </test> 193 </test>
212 <test expect_num_outputs="8"> 194 <test expect_num_outputs="8">
213 <param name="input" value="spades.311.fasta" ftype="fasta" /> 195 <param name="input" value="Trinity.fasta" ftype="fasta" />
214 <conditional name="gene_coordinates"> 196 <conditional name="gene_coordinates">
215 <param name="use_gtf" value="false" /> 197 <param name="use_gtf" value="false" />
216 </conditional> 198 </conditional>
217 <param name="min_alignment" value="30" /> 199 <param name="min_alignment" value="30" />
218 <param name="lower_threshold" value="45" /> 200 <param name="lower_threshold" value="45" />
219 <param name="upper_threshold" value="95"/> 201 <param name="upper_threshold" value="95"/>
220 <param name="out_sr" value="txt,tex,tsv,pdf" /> 202 <param name="out_sr" value="txt,tex,tsv,pdf" />
221 <param name="out_add" value="logs" /> 203 <param name="out_add" value="logs,details_plots" />
222 <output name="short_report_pdf" file="short_report.pdf" compare="sim_size"/> 204 <output name="short_report_pdf" file="short_report.pdf" compare="sim_size"/>
223 <output name="short_report_txt" file="short_report.txt" compare="sim_size"/> 205 <output name="short_report_txt" file="short_report.txt" compare="sim_size"/>
224 <output name="short_report_tex" file="short_report.tex" compare="sim_size"/> 206 <output name="short_report_tex" file="short_report.tex" compare="sim_size"/>
225 <output name="short_report_tsv" file="short_report.tsv" compare="sim_size"/> 207 <output name="short_report_tsv" file="short_report.tsv" compare="sim_size"/>
226 <output_collection name="list_logs" type="list"> 208 <output_collection name="list_logs" type="list">
227 <element name="rnaQUAST" file="rnaQUAST"/> 209 <element name="rnaQUAST" file="rnaQUAST"/>
228 <element name="spades.311.GeneMarkS_T.err" file="spades.311.GeneMarkS_T.err"/> 210 <element name="Trinity.GeneMarkS_T.err" file="spades.311.GeneMarkS_T.err"/>
229 </output_collection> 211 </output_collection>
230 <output_collection name="data_collection" type="list:list"> 212 <output_collection name="details_png" type="list:list" count="1">
231 <element name="spades.311"> 213 <output_collection name="Trinity" type="list" count="11"/>
232 <element name="alignment_metrics" file="spades.311/alignment_metrics.txt"/>
233 </element>
234 </output_collection> 214 </output_collection>
235 </test> 215 </test>
236 </tests> 216 </tests>
237 <help><![CDATA[ 217 <help><![CDATA[
238 **What it does** 218 **What is rnaQUAST**
239 rnaQUAST: a quality assessment tool for de novo transcriptome assemblies 219 - a quality assessment tool for de novo transcriptome assemblies
240 rnaQUAST—a tool for evaluating RNA-Seq assembly quality and benchmarking transcriptome assemblers using reference genome and gene database. rnaQUAST calculates various metrics that demonstrate completeness and correctness levels of the assembled transcripts, and outputs them in a user-friendly report. 220 - evaluating RNA-Seq assembly quality and benchmarking transcriptome assemblers using reference genome and gene database
221 - calculates various metrics that demonstrate completeness and correctness levels of the assembled transcripts
241 222
242 **Using rnaQuast without reference** you won't get: 223 **Using rnaQuast without reference** you won't get:
243 - x_assembled PNG & Txt 224
244 - x_assembled Exons PNG & Txt 225 - x-assembled (Exons)
245 - Alignments per Isoform PNG & Txt 226 - Alignments per Isoform
246 - x_covered PNG & Txt 227 - x-covered (Exons)
247 - x_covered Exons PNG & Txt 228 - x-matched (Blocks)
248 - x_matched PNG & Txt 229 - gmap build logs
249 - x_matched PNG & Txt
250 - x_matched Blocks PNG & Txt
251 - gmap build out log
252 - gmap build err log
253 230
254 **Using rnaQuast with reference** you will get: 231 **Using rnaQuast with reference** you will get:
255 - PDF report 232 - Reports
256 - TXT report 233 - Logs
257 - TSV report 234 - Alignment/Basic Metrics
258 - Log 235 - Misassemblies/ Specificity/ Sensitivity
259 - Alignment Metrics 236 - Alignment multiplicity
260 - Basic Metrics 237 - Block/ Transcript Length
261 - Misassemblies
262 - Specificity
263 - Sensitivity
264 - Alignment multiplicity
265 - Block length
266 - Blocks per alignment 238 - Blocks per alignment
267 - Mismatch rate 239 - Mismatch rate
268 - Transcript length 240 - x-aligned
269 - x_aligned 241 - Nx
270 - Transcript Length PNG 242 - Blocks per alignment
271 - Nx PNG 243 - gmap build logs
272 - Block length PNG
273 - Blocks per alignment PNG
274 - gmap build out log
275 - gmap build err log
276 244
277 **Using rnaQuast without gene coordinates** you won't get: 245 **Using rnaQuast without gene coordinates** you won't get:
278 - x_assembled PNG & Txt 246 - x-assembled (Exons)
279 - x_assembled Exons PNG & Txt 247 - Alignments per Isoform
280 - Alignments per Isoform PNG & Txt 248 - x-covered (Exons)
281 - x_covered PNG & Txt 249 - x-matched (Blocks)
282 - x_covered Exons PNG & Txt 250 - gmap build logs
283 - x_matched PNG & Txt
284 - x_matched PNG & Txt
285 - x_matched Blocks PNG & Txt
286 - gmap build out log
287 - gmap build err log
288 - Database Metrics 251 - Database Metrics
289 - Alignment multiplicity PNG 252 - Alignment multiplicity
290 - Mismatch rate PNG 253 - Mismatch rate
291 - NAx PNG 254 - NAx
292 - x_aligned PNG 255 - x-aligned
293 **Using rnaQuast with gene coordinates** you will get: 256 **Using rnaQuast with gene coordinates** you will get:
294 - PDF report 257 - Reports
295 - TXT report 258 - Logs
296 - TSV report 259 - Alignment/Basic Metrics
297 - Log 260 - Misassemblies/Specificity/Sensitivity
298 - Alignment Metrics 261 - Alignment multiplicity
299 - Basic Metrics 262 - Block/Transcript length
300 - Misassemblies
301 - Specificity
302 - Sensitivity
303 - Alignment multiplicity
304 - Block length
305 - Blocks per alignment 263 - Blocks per alignment
306 - Mismatch rate 264 - Mismatch rate
307 - Transcript length 265 - x-aligned
308 - x_aligned 266 - Nx/NAx
309 - Transcript Length PNG 267 - gmap build logs
310 - Nx PNG
311 - Block length PNG
312 - Blocks per alignment PNG
313 - gmap build out log
314 - gmap build err log
315 - Database Metrics 268 - Database Metrics
316 - Alignment multiplicity PNG 269 - Alignment multiplicity
317 - Mismatch rate PNG 270 For more information, see the citations.
318 - NAx PNG
319 - x_aligned PNG
320 **Using rnaQuast without drawing plots** you won't get any PNGs or txt files of these, nor the PDF report
321 *Output*
322 **Reports**
323 The following text files with reports are contained in comparison_output directory and include results for all input assemblies. In addition, these reports are contained in <assembly_label>_output directories for each assembly separately.
324 database_metrics.txt
325 Gene database metrics.
326 - Genes / Protein coding genes – number of genes / protein coding genes
327 - Isoforms / Protein coding isoforms – number of isoforms / protein coding isoforms
328 - Exons / Introns – total number of exons / introns
329 - Total / Average length of all isoforms, bp
330 - Average exon length, bp
331 - Average intron length, bp
332 - Average / Maximum number of exons per isoform
333 Database coverage – the total number of bases covered by reads (in all isoforms) divided by the total length of all isoforms.
334 x%-covered genes / isoforms / exons – number of genes / isoforms / exons from the database that have at least x% of bases covered by all reads, where x is specified with lower_threshold /upper_threshold options (50% / 95% by default).
335 basic_metrics.txt
336 Basic transcripts metrics are calculated without reference genome and gene database.
337 - Transcripts – total number of assembled transcripts.
338 - Transcripts > 500 bp
339 - Transcripts > 1000 bp
340 - Average length of assembled transcripts
341 - Longest transcript
342 - Total length
343 - Transcript N50 – a maximal number N, such that the total length of all transcripts longer than N bp is at least 50% of the total length of all transcripts.
344 alignment_metrics.txt
345 Alignment metrics are calculated with reference genome but without using gene database. To calculate the following metrics rnaQUAST filters all short partial alignments (see min_alignment option) and attempts to select the best hits for each transcript.
346 - Transcripts – total number of assembled transcripts.
347 - Aligned – the number of transcripts having at least 1 significant alignment.
348 - Uniquely aligned – the number of transcripts having a single significant alignment.
349 - Multiply aligned – the number of transcripts having 2 or more significant alignments. Multiply aligned transcripts are stored in <assembly_label>.paralogs.fasta file.
350 - Misassembly candidates reported by GMAP (or BLAT) – transcripts that have discordant best-scored alignment (partial alignments that are either mapped to different strands / different chromosomes / in reverse order / too far away).
351 - Unaligned – the number of transcripts without any significant alignments. Unaligned transcripts are stored in <assembly_label>.unaligned.fasta file.
352 Number of assembled transcripts = Unaligned + Aligned = Unaligned + (Uniquely aligned + Multiply aligned + Misassembly candidates reported by GMAP (or BLAT)).
353 Alignment metrics for non-misassembled transcripts
354 - Average aligned fraction. Aligned fraction for a single transcript is defined as total number of aligned bases in the transcript divided by the total transcript length.
355 - Average alignment length. Aligned length for a single transcript is defined as total number of aligned bases in the transcript.
356 - Average blocks per alignment. A block is defined as a continuous alignment fragment without indels.
357 - Average block length (see above).
358 - Average mismatches per transcript – average number of single nucleotide differences with reference genome per transcript.
359 - NA50 – N50 for alignments.
360 misassemblies.txt
361 - Transcripts – total number of assembled transcripts.
362 - Misassembly candidates reported by GMAP (or BLAT) – transcripts that have discordant best-scored alignment (partial alignments that are either mapped to different strands / different chromosomes / in reverse order / too far away).
363 - Misassembly candidates reported by BLASTN – transcripts are aligned to the isoform sequences extracted from the genome using gene database with BLASTN and then transcripts that have partial alignments to multiple isoforms are selected.
364 - Misassemblies – misassembly candidates confirmed by both methods described above. Using both methods simultaneously allows to avoid considering misalignments that can be caused, for example, by paralogous genes or genomic repeats. Misassembled transcripts are stored in <assembly_label>.misassembled.fasta file.
365 sensitivity.txt
366 Assembly completeness (sensitivity). For the following metrics (calculated with reference genome and gene database) rnaQUAST attempts to select best-matching database isoforms for every transcript. Note that a single transcript can contribute to multiple isoforms in the case of, for example, paralogous genes or genomic repeats. At the same time, an isoform can be covered by multiple transcripts in the case of fragmented assembly or duplicated transcripts in the assembly.
367 - Database coverage – the total number of bases covered by transcripts (in all isoforms) divided by the total length of all isoforms.
368 - Duplication ratio – total number of aligned bases in assembled transcripts divided by the total number of isoform covered bases. This metric counts neither paralogous genes nor shared exons, only real overlaps of the assembled sequences that are mapped to the same isoform.
369 - Average number of transcripts mapped to one isoform.
370 - x%-assembled genes / isoforms/ exons – number of genes / isoforms / exons from the database that have at least x% captured by a single assembled transcript, where x is specified with lower_threshold / upper_threshold options (50% / 95% by default). 95%-assembled isoforms are stored in <assembly_label>.95%assembled.fasta file.
371 - x%-covered genes / isoforms– number of genes / isoforms from the database that have at least x% of bases covered by all alignments, where x is specified with lower_threshold / upper_threshold options (50% / 95% by default).
372 - Mean isoform assembly – assembled fraction of a single isoform is calculated as the largest number of its bases captured by a single assembled transcript divided by its length; average value is computed for isoforms with > 0 bases covered.
373 - Mean isoform coverage – coverage of a single isoform is calculated as the number of its bases covered by all assembled transcripts divided by its length; average value is computed for isoforms with > 0 bases covered.
374 - Mean exon coverage – coverage of a single exon is calculated as the number of its bases covered by all assembled transcripts divided by its length; average value is computed for exons with > 0 bases covered.
375 - Average percentage of isoform x%-covered exons, where x is specified with lower_threshold / upper_threshold options (50% / 95% by default). For each isoform rnaQUAST calculates the number of x%-covered exons divided by the total number of exons. Afterwards it computes average value for all covered isoforms.
376 BUSCO metrics. The following metrics are calculated only when busco_lineage option is used (see options for details).
377 - Complete – percentage of completely recovered genes.
378 - Partial – percentage of partially recovered genes.
379 GeneMarkS-T metrics. The following metrics are calculated when reference and gene database are not provided or gene_mark option is used (see options for details).
380 - Genes – number of predicted genes in transcripts.
381 specificity.txt
382 Assembly specificity. To compute the following metrics we use only transcripts that have at least one significant alignment and are not misassembled.
383 - Unannotated – total number of transcripts that do not cover any isoform from the database. Unannotated transcripts are stored in <assembly_label>.unannotated.fasta file.
384 - x%-matched – total number of transcripts that have at least x% covering an isoform from the database, where x is specified with lower_threshold / upper_threshold options (50% / 95% by default).
385 - Mean fraction of transcript matched – matched fraction of a single transcript is calculated as the number of its bases covering an isoform divided by the transcript length; average value is computed for transcripts with > 0 bases matched.
386 - Mean fraction of block matched – matched fraction of a single block is calculated as the number of its bases covering an isoform divided by the block length; average value is computed for blocks with > 0 bases matched.
387 - x%-matched blocks – percentage of blocks that have at least x% covering an isoform from the database, where x is specified with lower_threshold / upper_threshold options (50% / 95% by default).
388 - Matched length – total number of transcript bases covering isoforms from the database.
389 - Unmatched length – total alignment length - Matched length.
390 relative_database_coverage.txt
391 Relative database coverage metrics are calculated only when raw reads (or read alignments) are provided. rnaQUAST uses read alignments to estimate the upper bound of the database coverage and the number of x-covered genes / isoforms / exons (see read coverage) and computes the following metrics:
392 - Relative database coverage – ratio between transcripts database coverage and reads database coverage.
393 - Relative x%-assembled genes / isoforms / exons – ratio between transcripts x%-assembled and reads x%-covered genes / isoforms / exons.
394 - Relative x%-covered genes / isoforms / exons – ratio between transcripts x%-covered and reads x%-covered genes / isoforms / exons.
395 **Detailed output**
396 These files are contained in <assembly_label>_output directories for each assembly separately.
397 - <assembly_label>.unaligned.fasta – transcripts without any significant alignments.
398 - <assembly_label>.paralogs.fasta – transcripts having 2 or more significant alignments.
399 - <assembly_label>.misassembled.fasta – misassembly candidates detected by methods described above. See misassemblies.txt description for details.
400 - <assembly_label>.correct.fasta – transcripts with exactly 1 significant alignment that do not contain misassemblies.
401 - <assembly_label>.x%-assembled.list – IDs of the isoforms from the database that have at least x% captured by a single assembled transcript, where x is specified by the user with an option upper_threshold (95% by default).
402 - <assembly_label>.unannotated.fasta – transcripts that do not cover any isoform from the database.
403 The following text file is contained in comparison_output directory and <assembly_label>_output directories for each assembly separately.
404 reads.x%-covered.list – IDs of the isoforms from the database that have at least x% bases covered by all reads, where x is specified with lower_threshold / upper_threshold options (50% / 95% by default).
405 **Plots**
406 The following plots are similarly contained in both comparison_output directory and <assembly_label>_output directories. Please note, that most of the plots represent cumulative distributions and some plots are given in logarithmic scale.
407 Basic
408 - transcript_length.png – assembled transcripts length distribution (+ database isoforms length distribution).
409 - block_length.png – alignment blocks length distribution (+ database exons length distribution).
410 - x-aligned.png – transcript aligned fraction distribution.
411 - blocks_per_alignment.png – distribution of number of blocks per alignment (+ distribution of number of database exons per isoform).
412 - alignment_multiplicity.png – distribution for the number of significant alignment for each multiply-aligned transcript.
413 - mismatch_rate.png – substitution errors per alignment distribution.
414 - Nx.png – Nx plot for transcripts. Nx is a maximal number N, such that the total length of all transcripts longer than N bp is at least x% of the total length of all transcripts.
415 - NAx.png – Nx plot for alignments.
416 **Sensitivity**
417 - x-assembled.png – a histogram in which each bar represents the number of isoforms from the database that have at least x% captured by a single assembled transcript.
418 - x-covered.png – a histogram in which each bar represents the number of isoforms from the database that have at least x% of bases covered by all alignments.
419 - x-assembled_exons.png – a histogram in which each bar represents the number of exons from the database that have at least x% captured by a single assembled transcript.
420 - x-covered_exons.png – a histogram in which each bar represents the number of exons from the database that have at least x% of bases covered by all alignments.
421 - alignments_per_isoform.png – plot showing number of transcript alignments per isoform
422 **Specificity**
423 - x-matched.png – a histogram in which each bar represents the number of transcripts that have at least x% matched to an isoform from the database.
424 - x-matched_blocks.png – a histogram in which each bar represents the number of all blocks from all transcript alignments that have at least x% matched to an isoform from the database.
425 ]]></help> 271 ]]></help>
426 <citations> 272 <citations>
427 <citation type="doi">10.1093/bioinformatics/btw218 </citation> 273 <citation type="doi">10.1093/bioinformatics/btw218 </citation>
428 </citations> 274 </citations>
429 </tool> 275 </tool>