comparison featurecounts.xml @ 10:46cccc52be5f draft

planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/featurecounts commit cf1ae941d02bff8848f05c4e4039457656e3a4e8
author iuc
date Sun, 14 Jan 2018 09:23:49 -0500
parents e6a2a912677a
children e803ca6407c0
comparison
equal deleted inserted replaced
9:e6a2a912677a 10:46cccc52be5f
1 <tool id="featurecounts" name="featureCounts" version="1.6.0.1" profile="16.04"> 1 <tool id="featurecounts" name="featureCounts" version="1.6.0.2" profile="16.04">
2 <description>Measure gene expression in RNA-Seq experiments from SAM or BAM files.</description> 2 <description>Measure gene expression in RNA-Seq experiments from SAM or BAM files.</description>
3 <requirements> 3 <requirements>
4 <requirement type="package" version="1.6.0">subread</requirement> 4 <requirement type="package" version="1.6.0">subread</requirement>
5 </requirements> 5 </requirements>
6 6
7 <version_command>featureCounts -v 2&gt;&amp;1 | grep .</version_command> 7 <version_command>featureCounts -v 2&gt;&amp;1 | grep .</version_command>
8 <command><![CDATA[ 8 <command detect_errors="exit_code"><![CDATA[
9 ## Export fc path for its built-in annotation
10 export FC_PATH=\$(command -v featureCounts | sed 's@/bin/featureCounts$@@') &&
11
9 ## Check whether all alignments are from the same type (bam || sam) 12 ## Check whether all alignments are from the same type (bam || sam)
10 featureCounts 13 featureCounts
11 #if $gtf_source.ref_source=="history": 14
12 -a '$gtf_source.reference_gene_sets' 15 #if $anno.anno_select=="gtf":
13 #else: 16 #if $anno.gtf_source.ref_source=="history":
14 -a '$gtf_source.reference_gene_sets_builtin.fields.path' 17 -a '$anno.gtf_source.reference_gene_sets'
18 #else:
19 -a '$anno.gtf_source.reference_gene_sets_builtin.fields.path'
20 #end if
21 -F "GTF"
22 #elif $anno.anno_select=="builtin":
23 -a \${FC_PATH}/annotation/${anno.genome}_RefSeq_exon.txt
24 -F "SAF"
15 #end if 25 #end if
16 26
17 -o "output" 27 -o "output"
18 -T \${GALAXY_SLOTS:-2} 28 -T \${GALAXY_SLOTS:-2}
19 29
22 $extended_parameters.summarization_level 32 $extended_parameters.summarization_level
23 $extended_parameters.contribute_to_multiple_features 33 $extended_parameters.contribute_to_multiple_features
24 -s $extended_parameters.strand_specificity 34 -s $extended_parameters.strand_specificity
25 $extended_parameters.multimapping_enabled.multimapping_counts 35 $extended_parameters.multimapping_enabled.multimapping_counts
26 36
27 #if str($extended_parameters.multimapping_enabled.multimapping_counts) == " -M" 37 #if str($extended_parameters.multimapping_enabled.multimapping_counts) == " -M":
28 $extended_parameters.multimapping_enabled.fraction 38 $extended_parameters.multimapping_enabled.fraction
29 #end if 39 #end if
30 40
31 $extended_parameters.exon_exon_junction_read_counting_enabled.count_exon_exon_junction_reads 41 $extended_parameters.exon_exon_junction_read_counting_enabled.count_exon_exon_junction_reads
32 #if str($extended_parameters.exon_exon_junction_read_counting_enabled.count_exon_exon_junction_reads) == "-J" 42 #if str($extended_parameters.exon_exon_junction_read_counting_enabled.count_exon_exon_junction_reads) == "-J":
33 #if $extended_parameters.exon_exon_junction_read_counting_enabled.genome 43 #if $extended_parameters.exon_exon_junction_read_counting_enabled.genome:
34 -G '$extended_parameters.exon_exon_junction_read_counting_enabled.genome' 44 -G '$extended_parameters.exon_exon_junction_read_counting_enabled.genome'
35 #end if 45 #end if
36 #end if 46 #end if
37 47
38 $extended_parameters.long_reads 48 $extended_parameters.long_reads
46 --fracOverlapFeature $extended_parameters.frac_overlap_feature 56 --fracOverlapFeature $extended_parameters.frac_overlap_feature
47 $extended_parameters.read_reduction 57 $extended_parameters.read_reduction
48 $extended_parameters.primary 58 $extended_parameters.primary
49 $extended_parameters.ignore_dup 59 $extended_parameters.ignore_dup
50 60
51 #if str($extended_parameters.read_extension_5p) != "0" 61 #if str($extended_parameters.read_extension_5p) != "0":
52 --readExtension5 $extended_parameters.read_extension_5p 62 --readExtension5 $extended_parameters.read_extension_5p
53 #end if 63 #end if
54 64
55 #if str($extended_parameters.read_extension_3p) != "0" 65 #if str($extended_parameters.read_extension_3p) != "0":
56 --readExtension3 $extended_parameters.read_extension_3p 66 --readExtension3 $extended_parameters.read_extension_3p
57 #end if 67 #end if
58 68
59 $pe_parameters.fragment_counting_enabled.fragment_counting 69 $pe_parameters.fragment_counting_enabled.fragment_counting
60 #if str($pe_parameters.fragment_counting_enabled.fragment_counting) == " -p" 70 #if str($pe_parameters.fragment_counting_enabled.fragment_counting) == " -p":
61 $pe_parameters.fragment_counting_enabled.check_distance_enabled.check_distance 71 $pe_parameters.fragment_counting_enabled.check_distance_enabled.check_distance
62 #if str($pe_parameters.fragment_counting_enabled.check_distance_enabled.check_distance) == " -P" 72 #if str($pe_parameters.fragment_counting_enabled.check_distance_enabled.check_distance) == " -P":
63 -d $pe_parameters.fragment_counting_enabled.check_distance_enabled.minimum_fragment_length 73 -d $pe_parameters.fragment_counting_enabled.check_distance_enabled.minimum_fragment_length
64 -D $pe_parameters.fragment_counting_enabled.check_distance_enabled.maximum_fragment_length 74 -D $pe_parameters.fragment_counting_enabled.check_distance_enabled.maximum_fragment_length
65 #end if 75 #end if
66 #end if 76 #end if
67 77
68 $pe_parameters.only_both_ends 78 $pe_parameters.only_both_ends
69 $pe_parameters.exclude_chimerics 79 $pe_parameters.exclude_chimerics
70 80
71 '${alignment}' 81 '${alignment}'
72 82
73 ## Removal of comment and column-header line 83 ## Removal of comment
74 && grep -v "^#" "output" | tail -n+2 > body.txt 84 && grep -v "^#" "output"
75 85
86 #if $format.value != "tabdel_short":
87 ## and remove column-header line
88 | tail -n+2
89 #else
90 ## update header
91 | sed --expression='s|${alignment}|${alignment.element_identifier}|g'
92 #end if
93 > body.txt
76 ## Set the right columns for the tabular formats 94 ## Set the right columns for the tabular formats
77 #if $format.value == "tabdel_medium" 95 #if $format.value == "tabdel_medium":
78 && cut -f 1,7 body.txt > expression_matrix.txt 96 && cut -f 1,7 body.txt > expression_matrix.txt
79 97
80 ## Paste doesn't allow a non ordered list of columns: -f 1,7,8,6 will only return columns 1,7 and 8 98 ## Paste doesn't allow a non ordered list of columns: -f 1,7,8,6 will only return columns 1,7 and 8
81 ## Thus the gene length column (last column) has to be added separately 99 ## Thus the gene length column (last column) has to be added separately
82 && cut -f 6 body.txt > gene_lengths.txt 100 && cut -f 6 body.txt > gene_lengths.txt
83 && paste expression_matrix.txt gene_lengths.txt > expression_matrix.txt.bak 101 && paste expression_matrix.txt gene_lengths.txt > expression_matrix.txt.bak
84 && mv -f expression_matrix.txt.bak '${output_medium}' 102 && mv -f expression_matrix.txt.bak '${output_medium}'
85 #elif $format.value == "tabdel_short" 103 #elif $format.value == "tabdel_short" or $format.value == "tabdel_short_noheader":
86 && cut -f 1,7 body.txt > '${output_short}' 104 && cut -f 1,7 body.txt > '${output_short}'
87 #else 105 #else:
88 && cp body.txt '${output_full}' 106 && cp body.txt '${output_full}'
89 #end if 107 #end if
90 108
91 109 #if str($include_feature_length_file) == "true":
92 #if str($include_feature_length_file) == "true"
93 && cut -f 1,6 body.txt > '${output_feature_lengths}' 110 && cut -f 1,6 body.txt > '${output_feature_lengths}'
94 #end if 111 #end if
95 112
96 #if str($extended_parameters.exon_exon_junction_read_counting_enabled.count_exon_exon_junction_reads) == "-J" 113 #if str($extended_parameters.exon_exon_junction_read_counting_enabled.count_exon_exon_junction_reads) == "-J":
97 && tail -n+2 'output.jcounts' > '${output_jcounts}' 114 #if $format.value != "tabdel_short":
115 && tail -n+2 'output.jcounts' > '${output_jcounts}'
116 #else:
117
118 && sed --expression='s|${alignment}|${alignment.element_identifier}|g' 'output.jcounts' > '${output_jcounts}'
119 #end if
98 #end if 120 #end if
99 121
100 && tail -n+2 'output.summary' > '${output_summary}' 122 #if $format.value != "tabdel_short":
101 123 && tail -n+2 'output.summary' > '${output_summary}'
124 #else:
125 && sed --expression='s|${alignment}|${alignment.element_identifier}|g' 'output.summary' > '${output_summary}'
126 #end if
102 ]]></command> 127 ]]></command>
103 <inputs> 128 <inputs>
104 <param name="alignment" 129 <param name="alignment"
105 type="data" 130 type="data"
106 multiple="false" 131 multiple="false"
107 format="bam,sam" 132 format="bam,sam"
108 label="Alignment file" 133 label="Alignment file"
109 help="The input alignment file(s) where the gene expression has to be counted. The file can have a SAM or BAM format; but ALL files must be in the same format" /> 134 help="The input alignment file(s) where the gene expression has to be counted. The file can have a SAM or BAM format; but ALL files must be in the same format" />
110 135 <conditional name="anno">
111 <conditional name="gtf_source"> 136 <param name="anno_select" type="select" label="Gene annotation file">
112 <param name="ref_source" type="select" label="Gene annotation file"> 137 <option value="builtin">featureCounts built-in</option>
113 <option value="cached">locally cached</option> 138 <option value="gtf">GTF file</option>
114 <option value="history">in your history</option>
115 </param> 139 </param>
116 <when value="cached"> 140 <when value="builtin">
117 <param name="reference_gene_sets_builtin" type="select" label="Using locally cached annotation" help="If the annotation file you require is not listed here, please contact the Galaxy administrator"> 141 <param name="genome" type="select" label="Select built-in genome" help="Built-in gene annotations for genomes hg38, hg19, mm10 and mm9 are included in featureCounts">
118 <options from_data_table="gene_sets"> 142 <option value="hg38">hg38</option>
119 <filter type="sort_by" column="1" /> 143 <option value="hg19">hg19</option>
120 <validator type="no_options" message="No annotations are available." /> 144 <option value="mm10">mm10</option>
121 </options> 145 <option value="mm9">mm9</option>
122 </param> 146 </param>
123 </when> 147 </when>
124 <when value="history"> 148 <when value="gtf">
125 <param name="reference_gene_sets" 149 <conditional name="gtf_source">
126 format="gff,gtf,gff3" 150 <param name="ref_source" type="select" label="Gene annotation file">
127 type="data" 151 <option value="cached">locally cached</option>
128 label="Gene annotation file" 152 <option value="history">in your history</option>
129 help="The program assumes that the provided annotation file is in GTF format. Make sure that the gene annotation file corresponds to the same reference genome as used for the alignment" /> 153 </param>
154 <when value="cached">
155 <param name="reference_gene_sets_builtin" type="select" label="Using locally cached annotation" help="If the annotation file you require is not listed here, please contact the Galaxy administrator">
156 <options from_data_table="gene_sets">
157 <filter type="sort_by" column="1" />
158 <validator type="no_options" message="No annotations are available." />
159 </options>
160 </param>
161 </when>
162 <when value="history">
163 <param name="reference_gene_sets"
164 format="gff,gtf,gff3"
165 type="data"
166 label="Gene annotation file"
167 help="The program assumes that the provided annotation file is in GTF format. Make sure that the gene annotation file corresponds to the same reference genome as used for the alignment" />
168 </when>
169 </conditional>
130 </when> 170 </when>
131 </conditional> 171 </conditional>
132 172
133 <param name="format" 173 <param name="format"
134 type="select" 174 type="select"
135 label="Output format" 175 label="Output format"
136 help="The output format will be tabular, select the preferred columns here"> 176 help="The output format will be tabular, select the preferred columns here">
137 <option value="tabdel_short" selected="true">Gene-ID "\t" read-count (DESeq2 IUC wrapper compatible)</option> 177 <option value="tabdel_short_noheader" selected="true">Gene-ID "\t" read-count (DESeq2 IUC wrapper compatible)</option>
178 <option value="tabdel_short">Gene-ID "\t" read-count (MultiQC/edgeR/limma-voom compatible, includes header in output)</option>
138 <option value="tabdel_medium">Gene-ID "\t" read-count "\t" gene-length</option> 179 <option value="tabdel_medium">Gene-ID "\t" read-count "\t" gene-length</option>
139 <option value="tabdel_full">featureCounts 1.4.0+ default (includes regions provided by the GTF file)</option> 180 <option value="tabdel_full">featureCounts 1.4.0+ default (includes regions provided by the GTF file)</option>
140 </param> 181 </param>
141 182
142 <param name="include_feature_length_file" 183 <param name="include_feature_length_file"
289 330
290 <param name="long_reads" argument="-L" type="boolean" truevalue="-L" falsevalue="" 331 <param name="long_reads" argument="-L" type="boolean" truevalue="-L" falsevalue=""
291 label="Long reads" 332 label="Long reads"
292 help="If specified, long reads such as Nanopore and PacBio reads will be counted. Long read counting can only run in one thread and only reads (not read-pairs) can be counted." /> 333 help="If specified, long reads such as Nanopore and PacBio reads will be counted. Long read counting can only run in one thread and only reads (not read-pairs) can be counted." />
293 334
294 <param name="by_read_group" argument="--byReadGroup" type="boolean" truevalue="--byReadGroup" falsevalue="" 335 <param name="by_read_group" argument="--byReadGroup" type="boolean" truevalue="--byReadGroup" falsevalue=""
295 label="Count reads by read group" 336 label="Count reads by read group"
296 help="If specified, reads are counted for each read group separately. The 'RG' tag must be present in the input BAM/SAM alignment files." /> 337 help="If specified, reads are counted for each read group separately. The 'RG' tag must be present in the input BAM/SAM alignment files." />
297 338
298 339
299 <param name="largest_overlap" 340 <param name="largest_overlap"
309 value="1" 350 value="1"
310 argument="--minOverlap" 351 argument="--minOverlap"
311 label="Minimum bases of overlap" 352 label="Minimum bases of overlap"
312 help="Specify the minimum required number of overlapping bases between a read (or a fragment) and a feature. 1 by default. If a negative value is provided, the read will be extended from both ends." /> 353 help="Specify the minimum required number of overlapping bases between a read (or a fragment) and a feature. 1 by default. If a negative value is provided, the read will be extended from both ends." />
313 354
314 <param name="frac_overlap" 355 <param name="frac_overlap"
315 type="integer" 356 type="integer"
316 value="0" 357 value="0"
317 min="0" 358 min="0"
318 max="1" 359 max="1"
319 argument="--fracOverlap" 360 argument="--fracOverlap"
320 label="Minimum fraction (of read) overlapping a feature" 361 label="Minimum fraction (of read) overlapping a feature"
321 help="Specify the minimum required fraction of overlapping bases between a read (or a fragment) and a feature. Value should be within range [0,1]. 0 by default. Number of overlapping bases is counted from both reads if paired end. Both this option and '--minOverlap' need to be satisfied for read assignment." /> 362 help="Specify the minimum required fraction of overlapping bases between a read (or a fragment) and a feature. Value should be within range [0,1]. 0 by default. Number of overlapping bases is counted from both reads if paired end. Both this option and '--minOverlap' need to be satisfied for read assignment." />
322 363
323 <param name="frac_overlap_feature" 364 <param name="frac_overlap_feature"
324 type="integer" 365 type="integer"
325 value="0" 366 value="0"
326 min="0" 367 min="0"
327 max="1" 368 max="1"
328 argument="--fracOverlapFeature" 369 argument="--fracOverlapFeature"
389 </data> 430 </data>
390 431
391 <data format="tabular" 432 <data format="tabular"
392 name="output_short" 433 name="output_short"
393 label="${tool.name} on ${on_string}"> 434 label="${tool.name} on ${on_string}">
394 <filter>format == "tabdel_short"</filter> 435 <filter>format == "tabdel_short_noheader" or format == "tabdel_short"</filter>
395 <actions> 436 <actions>
396 <action name="column_names" type="metadata" default="Geneid,${alignment.element_identifier}" /> 437 <action name="column_names" type="metadata" default="Geneid,${alignment.element_identifier}" />
397 </actions> 438 </actions>
398 </data> 439 </data>
399 440
406 </actions> 447 </actions>
407 </data> 448 </data>
408 449
409 <data format="tabular" 450 <data format="tabular"
410 name="output_summary" 451 name="output_summary"
411 hidden="true"
412 label="${tool.name} on ${on_string}: summary"> 452 label="${tool.name} on ${on_string}: summary">
413 <actions> 453 <actions>
414 <action name="column_names" type="metadata" default="Status,${alignment.element_identifier}" /> 454 <action name="column_names" type="metadata" default="Status,${alignment.element_identifier}" />
415 </actions> 455 </actions>
416 </data> 456 </data>
426 466
427 <data name="output_jcounts" format="tabular" 467 <data name="output_jcounts" format="tabular"
428 label="${tool.name} on ${on_string}: junction counts"> 468 label="${tool.name} on ${on_string}: junction counts">
429 <filter>extended_parameters['exon_exon_junction_read_counting_enabled']['count_exon_exon_junction_reads']</filter> 469 <filter>extended_parameters['exon_exon_junction_read_counting_enabled']['count_exon_exon_junction_reads']</filter>
430 <actions> 470 <actions>
431 <action name="column_names" type="metadata" default="PrimaryGene,SecondaryGene,Site1_chr,Site1_location,Site1_strand,Site2_chr,Site2_location,Site2_strand,${alignment.element_identifier}" /> 471 <action name="column_names" type="metadata"
472 default="PrimaryGene,SecondaryGene,Site1_chr,Site1_location,Site1_strand,Site2_chr,Site2_location,Site2_strand,${alignment.element_identifier}" />
432 </actions> 473 </actions>
433 </data> 474 </data>
434 </outputs> 475 </outputs>
435 <tests> 476 <tests>
436 <test expect_num_outputs="4"> 477 <test expect_num_outputs="4">
437 <param name="alignment" value="featureCounts_input1.bam" ftype="bam" /> 478 <param name="alignment" value="featureCounts_input1.bam" ftype="bam" />
479 <param name="anno_select" value="gtf"/>
438 <param name="reference_gene_sets" value="featureCounts_guide.gff" ftype="gff" /> 480 <param name="reference_gene_sets" value="featureCounts_guide.gff" ftype="gff" />
439 <param name="format" value="tabdel_short" /> 481 <param name="format" value="tabdel_short_noheader" />
440 <param name="include_feature_length_file" value="true"/> 482 <param name="include_feature_length_file" value="true"/>
441 <param name="ref_source" value="history" /> 483 <param name="ref_source" value="history" />
442 <param name="count_exon_exon_junction_reads" value="-J"/> 484 <param name="count_exon_exon_junction_reads" value="-J"/>
443 <output name="output_short" file="output_1_short.tab"> 485 <output name="output_short" file="output_1_short.tab">
444 <metadata name="column_names" value="Geneid,featureCounts_input1.bam"/> 486 <metadata name="column_names" value="Geneid,featureCounts_input1.bam"/>
450 <metadata name="column_names" value="PrimaryGene,SecondaryGene,Site1_chr,Site1_location,Site1_strand,Site2_chr,Site2_location,Site2_strand,featureCounts_input1.bam"/> 492 <metadata name="column_names" value="PrimaryGene,SecondaryGene,Site1_chr,Site1_location,Site1_strand,Site2_chr,Site2_location,Site2_strand,featureCounts_input1.bam"/>
451 </output> 493 </output>
452 </test> 494 </test>
453 <test expect_num_outputs="3"> 495 <test expect_num_outputs="3">
454 <param name="alignment" value="featureCounts_input1.bam" ftype="bam" /> 496 <param name="alignment" value="featureCounts_input1.bam" ftype="bam" />
497 <param name="anno_select" value="gtf"/>
455 <param name="reference_gene_sets" value="featureCounts_guide.gff" ftype="gff" /> 498 <param name="reference_gene_sets" value="featureCounts_guide.gff" ftype="gff" />
456 <param name="format" value="tabdel_medium" /> 499 <param name="format" value="tabdel_medium" />
457 <param name="include_feature_length_file" value="true"/> 500 <param name="include_feature_length_file" value="true"/>
458 <param name="ref_source" value="history" /> 501 <param name="ref_source" value="history" />
459 <output name="output_medium" file="output_1_medium.tab"> 502 <output name="output_medium" file="output_1_medium.tab">
463 <metadata name="column_names" value="Status,featureCounts_input1.bam"/> 506 <metadata name="column_names" value="Status,featureCounts_input1.bam"/>
464 </output> 507 </output>
465 </test> 508 </test>
466 <test expect_num_outputs="3"> 509 <test expect_num_outputs="3">
467 <param name="alignment" value="featureCounts_input1.bam" ftype="bam" /> 510 <param name="alignment" value="featureCounts_input1.bam" ftype="bam" />
511 <param name="anno_select" value="gtf"/>
468 <param name="reference_gene_sets" value="featureCounts_guide.gff" ftype="gff" /> 512 <param name="reference_gene_sets" value="featureCounts_guide.gff" ftype="gff" />
469 <param name="format" value="tabdel_full" /> 513 <param name="format" value="tabdel_full" />
470 <param name="include_feature_length_file" value="true"/> 514 <param name="include_feature_length_file" value="true"/>
471 <param name="ref_source" value="history" /> 515 <param name="ref_source" value="history" />
472 <output name="output_full" file="output_1_full.tab"> 516 <output name="output_full" file="output_1_full.tab">
477 </output> 521 </output>
478 <output name="output_feature_lengths" file="output_feature_lengths.tab"> 522 <output name="output_feature_lengths" file="output_feature_lengths.tab">
479 <metadata name="column_names" value="Feature,Length"/> 523 <metadata name="column_names" value="Feature,Length"/>
480 </output> 524 </output>
481 </test> 525 </test>
482 526 <test expect_num_outputs="4">
527 <param name="alignment" value="featureCounts_input1.bam" ftype="bam" />
528 <param name="anno_select" value="gtf"/>
529 <param name="reference_gene_sets" value="featureCounts_guide.gff" ftype="gff" />
530 <param name="format" value="tabdel_short" />
531 <param name="include_feature_length_file" value="true"/>
532 <param name="ref_source" value="history" />
533 <param name="count_exon_exon_junction_reads" value="-J"/>
534 <output name="output_short" file="output_1_short_with_header.tab">
535 <metadata name="column_names" value="Geneid,featureCounts_input1.bam"/>
536 </output>
537 <output name="output_summary" file="output_1_summary_with_header.tab">
538 <metadata name="column_names" value="Status,featureCounts_input1.bam"/>
539 </output>
540 <output name="output_jcounts" file="output_1_jcounts_with_header.tab">
541 <metadata name="column_names" value="PrimaryGene,SecondaryGene,Site1_chr,Site1_location,Site1_strand,Site2_chr,Site2_location,Site2_strand,featureCounts_input1.bam"/>
542 </output>
543 </test>
544 <!-- Ensure built-in annotation works -->
545 <test expect_num_outputs="2">
546 <param name="alignment" value="pairend_strandspecific_51mer_hg19_chr1_1-100000.bam" ftype="bam" />
547 <param name="anno_select" value="builtin"/>
548 <param name="format" value="tabdel_short" />
549 <param name="genome" value="hg19" />
550 <output name="output_short" file="output_builtin_hg19.tab">
551 <metadata name="column_names" value="Geneid,pairend_strandspecific_51mer_hg19_chr1_1-100000.bam"/>
552 </output>
553 <output name="output_summary" file="output_summary_builtin_hg19.tab"/>
554 </test>
483 </tests> 555 </tests>
484 556
485 <help><![CDATA[ 557 <help><![CDATA[
486 featureCounts 558 featureCounts
487 ############# 559 #############
488 560
489 Overview 561 Overview
490 -------- 562 --------
491 FeatureCounts is a light-weight read counting program written entirely in the C programming language. It can be used to count both gDNA-seq and RNA-seq reads for genomic features in in SAM/BAM files. 563 FeatureCounts is a light-weight read counting program written entirely in the C programming language. It can be used to count both gDNA-seq and RNA-seq reads for genomic features in in SAM/BAM files. FeatureCounts is part of the Subread_ package.
492 564
493 Input formats 565 Input formats
494 ------------- 566 -------------
495 Alignments should be provided in either: 567 Alignments should be provided in either:
496 568
497 - SAM format, http://samtools.sourceforge.net/samtools.shtml#5 569 - SAM format, http://samtools.sourceforge.net/samtools.shtml#5
498 - BAM format 570 - BAM format
499 571
500 Gene regions should be provided in the GFF/GTF format: 572 Annotations for gene regions should be provided in the GFF/GTF format:
501 573
502 - http://genome.ucsc.edu/FAQ/FAQformat.html#format3 574 - http://genome.ucsc.edu/FAQ/FAQformat.html#format3
503 - http://www.ensembl.org/info/website/upload/gff.html 575 - http://www.ensembl.org/info/website/upload/gff.html
576
577 Alternatively, the featureCounts built-in annotations for genomes hg38, hg19, mm10 and mm9 can be used through selecting the built-in option above. These annotations were downloaded from NCBI RefSeq database and then adapted by merging overlapping exons from the same gene to form a set of disjoint exons for each gene. Genes with the same Entrez gene identifiers were also merged into one gene. See the Subread_ User's Guide for more information.
504 578
505 Output format 579 Output format
506 ------------- 580 -------------
507 FeatureCounts produces a table containing counted reads, per gene, per row. Optionally the last column can be set to be the effective gene-length. These tables are compatible with the DESeq2 Galaxy wrapper by IUC. Column names are added as metadata object. 581 FeatureCounts produces a table containing counted reads, per gene, per row. Optionally the last column can be set to be the effective gene-length. These tables are compatible with the DESeq2 Galaxy wrapper by IUC. Column names are added as metadata object.
582
583 .. _Subread: http://bioinf.wehi.edu.au/subread-package/SubreadUsersGuide.pdf
508 ]]></help> 584 ]]></help>
509 <citations> 585 <citations>
510 <citation type="doi">10.1093/bioinformatics/btt656</citation> 586 <citation type="doi">10.1093/bioinformatics/btt656</citation>
511 </citations> 587 </citations>
512 </tool> 588 </tool>