Mercurial > repos > iuc > featurecounts
comparison featurecounts.xml @ 10:46cccc52be5f draft
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/featurecounts commit cf1ae941d02bff8848f05c4e4039457656e3a4e8
author | iuc |
---|---|
date | Sun, 14 Jan 2018 09:23:49 -0500 |
parents | e6a2a912677a |
children | e803ca6407c0 |
comparison
equal
deleted
inserted
replaced
9:e6a2a912677a | 10:46cccc52be5f |
---|---|
1 <tool id="featurecounts" name="featureCounts" version="1.6.0.1" profile="16.04"> | 1 <tool id="featurecounts" name="featureCounts" version="1.6.0.2" profile="16.04"> |
2 <description>Measure gene expression in RNA-Seq experiments from SAM or BAM files.</description> | 2 <description>Measure gene expression in RNA-Seq experiments from SAM or BAM files.</description> |
3 <requirements> | 3 <requirements> |
4 <requirement type="package" version="1.6.0">subread</requirement> | 4 <requirement type="package" version="1.6.0">subread</requirement> |
5 </requirements> | 5 </requirements> |
6 | 6 |
7 <version_command>featureCounts -v 2>&1 | grep .</version_command> | 7 <version_command>featureCounts -v 2>&1 | grep .</version_command> |
8 <command><![CDATA[ | 8 <command detect_errors="exit_code"><![CDATA[ |
9 ## Export fc path for its built-in annotation | |
10 export FC_PATH=\$(command -v featureCounts | sed 's@/bin/featureCounts$@@') && | |
11 | |
9 ## Check whether all alignments are from the same type (bam || sam) | 12 ## Check whether all alignments are from the same type (bam || sam) |
10 featureCounts | 13 featureCounts |
11 #if $gtf_source.ref_source=="history": | 14 |
12 -a '$gtf_source.reference_gene_sets' | 15 #if $anno.anno_select=="gtf": |
13 #else: | 16 #if $anno.gtf_source.ref_source=="history": |
14 -a '$gtf_source.reference_gene_sets_builtin.fields.path' | 17 -a '$anno.gtf_source.reference_gene_sets' |
18 #else: | |
19 -a '$anno.gtf_source.reference_gene_sets_builtin.fields.path' | |
20 #end if | |
21 -F "GTF" | |
22 #elif $anno.anno_select=="builtin": | |
23 -a \${FC_PATH}/annotation/${anno.genome}_RefSeq_exon.txt | |
24 -F "SAF" | |
15 #end if | 25 #end if |
16 | 26 |
17 -o "output" | 27 -o "output" |
18 -T \${GALAXY_SLOTS:-2} | 28 -T \${GALAXY_SLOTS:-2} |
19 | 29 |
22 $extended_parameters.summarization_level | 32 $extended_parameters.summarization_level |
23 $extended_parameters.contribute_to_multiple_features | 33 $extended_parameters.contribute_to_multiple_features |
24 -s $extended_parameters.strand_specificity | 34 -s $extended_parameters.strand_specificity |
25 $extended_parameters.multimapping_enabled.multimapping_counts | 35 $extended_parameters.multimapping_enabled.multimapping_counts |
26 | 36 |
27 #if str($extended_parameters.multimapping_enabled.multimapping_counts) == " -M" | 37 #if str($extended_parameters.multimapping_enabled.multimapping_counts) == " -M": |
28 $extended_parameters.multimapping_enabled.fraction | 38 $extended_parameters.multimapping_enabled.fraction |
29 #end if | 39 #end if |
30 | 40 |
31 $extended_parameters.exon_exon_junction_read_counting_enabled.count_exon_exon_junction_reads | 41 $extended_parameters.exon_exon_junction_read_counting_enabled.count_exon_exon_junction_reads |
32 #if str($extended_parameters.exon_exon_junction_read_counting_enabled.count_exon_exon_junction_reads) == "-J" | 42 #if str($extended_parameters.exon_exon_junction_read_counting_enabled.count_exon_exon_junction_reads) == "-J": |
33 #if $extended_parameters.exon_exon_junction_read_counting_enabled.genome | 43 #if $extended_parameters.exon_exon_junction_read_counting_enabled.genome: |
34 -G '$extended_parameters.exon_exon_junction_read_counting_enabled.genome' | 44 -G '$extended_parameters.exon_exon_junction_read_counting_enabled.genome' |
35 #end if | 45 #end if |
36 #end if | 46 #end if |
37 | 47 |
38 $extended_parameters.long_reads | 48 $extended_parameters.long_reads |
46 --fracOverlapFeature $extended_parameters.frac_overlap_feature | 56 --fracOverlapFeature $extended_parameters.frac_overlap_feature |
47 $extended_parameters.read_reduction | 57 $extended_parameters.read_reduction |
48 $extended_parameters.primary | 58 $extended_parameters.primary |
49 $extended_parameters.ignore_dup | 59 $extended_parameters.ignore_dup |
50 | 60 |
51 #if str($extended_parameters.read_extension_5p) != "0" | 61 #if str($extended_parameters.read_extension_5p) != "0": |
52 --readExtension5 $extended_parameters.read_extension_5p | 62 --readExtension5 $extended_parameters.read_extension_5p |
53 #end if | 63 #end if |
54 | 64 |
55 #if str($extended_parameters.read_extension_3p) != "0" | 65 #if str($extended_parameters.read_extension_3p) != "0": |
56 --readExtension3 $extended_parameters.read_extension_3p | 66 --readExtension3 $extended_parameters.read_extension_3p |
57 #end if | 67 #end if |
58 | 68 |
59 $pe_parameters.fragment_counting_enabled.fragment_counting | 69 $pe_parameters.fragment_counting_enabled.fragment_counting |
60 #if str($pe_parameters.fragment_counting_enabled.fragment_counting) == " -p" | 70 #if str($pe_parameters.fragment_counting_enabled.fragment_counting) == " -p": |
61 $pe_parameters.fragment_counting_enabled.check_distance_enabled.check_distance | 71 $pe_parameters.fragment_counting_enabled.check_distance_enabled.check_distance |
62 #if str($pe_parameters.fragment_counting_enabled.check_distance_enabled.check_distance) == " -P" | 72 #if str($pe_parameters.fragment_counting_enabled.check_distance_enabled.check_distance) == " -P": |
63 -d $pe_parameters.fragment_counting_enabled.check_distance_enabled.minimum_fragment_length | 73 -d $pe_parameters.fragment_counting_enabled.check_distance_enabled.minimum_fragment_length |
64 -D $pe_parameters.fragment_counting_enabled.check_distance_enabled.maximum_fragment_length | 74 -D $pe_parameters.fragment_counting_enabled.check_distance_enabled.maximum_fragment_length |
65 #end if | 75 #end if |
66 #end if | 76 #end if |
67 | 77 |
68 $pe_parameters.only_both_ends | 78 $pe_parameters.only_both_ends |
69 $pe_parameters.exclude_chimerics | 79 $pe_parameters.exclude_chimerics |
70 | 80 |
71 '${alignment}' | 81 '${alignment}' |
72 | 82 |
73 ## Removal of comment and column-header line | 83 ## Removal of comment |
74 && grep -v "^#" "output" | tail -n+2 > body.txt | 84 && grep -v "^#" "output" |
75 | 85 |
86 #if $format.value != "tabdel_short": | |
87 ## and remove column-header line | |
88 | tail -n+2 | |
89 #else | |
90 ## update header | |
91 | sed --expression='s|${alignment}|${alignment.element_identifier}|g' | |
92 #end if | |
93 > body.txt | |
76 ## Set the right columns for the tabular formats | 94 ## Set the right columns for the tabular formats |
77 #if $format.value == "tabdel_medium" | 95 #if $format.value == "tabdel_medium": |
78 && cut -f 1,7 body.txt > expression_matrix.txt | 96 && cut -f 1,7 body.txt > expression_matrix.txt |
79 | 97 |
80 ## Paste doesn't allow a non ordered list of columns: -f 1,7,8,6 will only return columns 1,7 and 8 | 98 ## Paste doesn't allow a non ordered list of columns: -f 1,7,8,6 will only return columns 1,7 and 8 |
81 ## Thus the gene length column (last column) has to be added separately | 99 ## Thus the gene length column (last column) has to be added separately |
82 && cut -f 6 body.txt > gene_lengths.txt | 100 && cut -f 6 body.txt > gene_lengths.txt |
83 && paste expression_matrix.txt gene_lengths.txt > expression_matrix.txt.bak | 101 && paste expression_matrix.txt gene_lengths.txt > expression_matrix.txt.bak |
84 && mv -f expression_matrix.txt.bak '${output_medium}' | 102 && mv -f expression_matrix.txt.bak '${output_medium}' |
85 #elif $format.value == "tabdel_short" | 103 #elif $format.value == "tabdel_short" or $format.value == "tabdel_short_noheader": |
86 && cut -f 1,7 body.txt > '${output_short}' | 104 && cut -f 1,7 body.txt > '${output_short}' |
87 #else | 105 #else: |
88 && cp body.txt '${output_full}' | 106 && cp body.txt '${output_full}' |
89 #end if | 107 #end if |
90 | 108 |
91 | 109 #if str($include_feature_length_file) == "true": |
92 #if str($include_feature_length_file) == "true" | |
93 && cut -f 1,6 body.txt > '${output_feature_lengths}' | 110 && cut -f 1,6 body.txt > '${output_feature_lengths}' |
94 #end if | 111 #end if |
95 | 112 |
96 #if str($extended_parameters.exon_exon_junction_read_counting_enabled.count_exon_exon_junction_reads) == "-J" | 113 #if str($extended_parameters.exon_exon_junction_read_counting_enabled.count_exon_exon_junction_reads) == "-J": |
97 && tail -n+2 'output.jcounts' > '${output_jcounts}' | 114 #if $format.value != "tabdel_short": |
115 && tail -n+2 'output.jcounts' > '${output_jcounts}' | |
116 #else: | |
117 | |
118 && sed --expression='s|${alignment}|${alignment.element_identifier}|g' 'output.jcounts' > '${output_jcounts}' | |
119 #end if | |
98 #end if | 120 #end if |
99 | 121 |
100 && tail -n+2 'output.summary' > '${output_summary}' | 122 #if $format.value != "tabdel_short": |
101 | 123 && tail -n+2 'output.summary' > '${output_summary}' |
124 #else: | |
125 && sed --expression='s|${alignment}|${alignment.element_identifier}|g' 'output.summary' > '${output_summary}' | |
126 #end if | |
102 ]]></command> | 127 ]]></command> |
103 <inputs> | 128 <inputs> |
104 <param name="alignment" | 129 <param name="alignment" |
105 type="data" | 130 type="data" |
106 multiple="false" | 131 multiple="false" |
107 format="bam,sam" | 132 format="bam,sam" |
108 label="Alignment file" | 133 label="Alignment file" |
109 help="The input alignment file(s) where the gene expression has to be counted. The file can have a SAM or BAM format; but ALL files must be in the same format" /> | 134 help="The input alignment file(s) where the gene expression has to be counted. The file can have a SAM or BAM format; but ALL files must be in the same format" /> |
110 | 135 <conditional name="anno"> |
111 <conditional name="gtf_source"> | 136 <param name="anno_select" type="select" label="Gene annotation file"> |
112 <param name="ref_source" type="select" label="Gene annotation file"> | 137 <option value="builtin">featureCounts built-in</option> |
113 <option value="cached">locally cached</option> | 138 <option value="gtf">GTF file</option> |
114 <option value="history">in your history</option> | |
115 </param> | 139 </param> |
116 <when value="cached"> | 140 <when value="builtin"> |
117 <param name="reference_gene_sets_builtin" type="select" label="Using locally cached annotation" help="If the annotation file you require is not listed here, please contact the Galaxy administrator"> | 141 <param name="genome" type="select" label="Select built-in genome" help="Built-in gene annotations for genomes hg38, hg19, mm10 and mm9 are included in featureCounts"> |
118 <options from_data_table="gene_sets"> | 142 <option value="hg38">hg38</option> |
119 <filter type="sort_by" column="1" /> | 143 <option value="hg19">hg19</option> |
120 <validator type="no_options" message="No annotations are available." /> | 144 <option value="mm10">mm10</option> |
121 </options> | 145 <option value="mm9">mm9</option> |
122 </param> | 146 </param> |
123 </when> | 147 </when> |
124 <when value="history"> | 148 <when value="gtf"> |
125 <param name="reference_gene_sets" | 149 <conditional name="gtf_source"> |
126 format="gff,gtf,gff3" | 150 <param name="ref_source" type="select" label="Gene annotation file"> |
127 type="data" | 151 <option value="cached">locally cached</option> |
128 label="Gene annotation file" | 152 <option value="history">in your history</option> |
129 help="The program assumes that the provided annotation file is in GTF format. Make sure that the gene annotation file corresponds to the same reference genome as used for the alignment" /> | 153 </param> |
154 <when value="cached"> | |
155 <param name="reference_gene_sets_builtin" type="select" label="Using locally cached annotation" help="If the annotation file you require is not listed here, please contact the Galaxy administrator"> | |
156 <options from_data_table="gene_sets"> | |
157 <filter type="sort_by" column="1" /> | |
158 <validator type="no_options" message="No annotations are available." /> | |
159 </options> | |
160 </param> | |
161 </when> | |
162 <when value="history"> | |
163 <param name="reference_gene_sets" | |
164 format="gff,gtf,gff3" | |
165 type="data" | |
166 label="Gene annotation file" | |
167 help="The program assumes that the provided annotation file is in GTF format. Make sure that the gene annotation file corresponds to the same reference genome as used for the alignment" /> | |
168 </when> | |
169 </conditional> | |
130 </when> | 170 </when> |
131 </conditional> | 171 </conditional> |
132 | 172 |
133 <param name="format" | 173 <param name="format" |
134 type="select" | 174 type="select" |
135 label="Output format" | 175 label="Output format" |
136 help="The output format will be tabular, select the preferred columns here"> | 176 help="The output format will be tabular, select the preferred columns here"> |
137 <option value="tabdel_short" selected="true">Gene-ID "\t" read-count (DESeq2 IUC wrapper compatible)</option> | 177 <option value="tabdel_short_noheader" selected="true">Gene-ID "\t" read-count (DESeq2 IUC wrapper compatible)</option> |
178 <option value="tabdel_short">Gene-ID "\t" read-count (MultiQC/edgeR/limma-voom compatible, includes header in output)</option> | |
138 <option value="tabdel_medium">Gene-ID "\t" read-count "\t" gene-length</option> | 179 <option value="tabdel_medium">Gene-ID "\t" read-count "\t" gene-length</option> |
139 <option value="tabdel_full">featureCounts 1.4.0+ default (includes regions provided by the GTF file)</option> | 180 <option value="tabdel_full">featureCounts 1.4.0+ default (includes regions provided by the GTF file)</option> |
140 </param> | 181 </param> |
141 | 182 |
142 <param name="include_feature_length_file" | 183 <param name="include_feature_length_file" |
289 | 330 |
290 <param name="long_reads" argument="-L" type="boolean" truevalue="-L" falsevalue="" | 331 <param name="long_reads" argument="-L" type="boolean" truevalue="-L" falsevalue="" |
291 label="Long reads" | 332 label="Long reads" |
292 help="If specified, long reads such as Nanopore and PacBio reads will be counted. Long read counting can only run in one thread and only reads (not read-pairs) can be counted." /> | 333 help="If specified, long reads such as Nanopore and PacBio reads will be counted. Long read counting can only run in one thread and only reads (not read-pairs) can be counted." /> |
293 | 334 |
294 <param name="by_read_group" argument="--byReadGroup" type="boolean" truevalue="--byReadGroup" falsevalue="" | 335 <param name="by_read_group" argument="--byReadGroup" type="boolean" truevalue="--byReadGroup" falsevalue="" |
295 label="Count reads by read group" | 336 label="Count reads by read group" |
296 help="If specified, reads are counted for each read group separately. The 'RG' tag must be present in the input BAM/SAM alignment files." /> | 337 help="If specified, reads are counted for each read group separately. The 'RG' tag must be present in the input BAM/SAM alignment files." /> |
297 | 338 |
298 | 339 |
299 <param name="largest_overlap" | 340 <param name="largest_overlap" |
309 value="1" | 350 value="1" |
310 argument="--minOverlap" | 351 argument="--minOverlap" |
311 label="Minimum bases of overlap" | 352 label="Minimum bases of overlap" |
312 help="Specify the minimum required number of overlapping bases between a read (or a fragment) and a feature. 1 by default. If a negative value is provided, the read will be extended from both ends." /> | 353 help="Specify the minimum required number of overlapping bases between a read (or a fragment) and a feature. 1 by default. If a negative value is provided, the read will be extended from both ends." /> |
313 | 354 |
314 <param name="frac_overlap" | 355 <param name="frac_overlap" |
315 type="integer" | 356 type="integer" |
316 value="0" | 357 value="0" |
317 min="0" | 358 min="0" |
318 max="1" | 359 max="1" |
319 argument="--fracOverlap" | 360 argument="--fracOverlap" |
320 label="Minimum fraction (of read) overlapping a feature" | 361 label="Minimum fraction (of read) overlapping a feature" |
321 help="Specify the minimum required fraction of overlapping bases between a read (or a fragment) and a feature. Value should be within range [0,1]. 0 by default. Number of overlapping bases is counted from both reads if paired end. Both this option and '--minOverlap' need to be satisfied for read assignment." /> | 362 help="Specify the minimum required fraction of overlapping bases between a read (or a fragment) and a feature. Value should be within range [0,1]. 0 by default. Number of overlapping bases is counted from both reads if paired end. Both this option and '--minOverlap' need to be satisfied for read assignment." /> |
322 | 363 |
323 <param name="frac_overlap_feature" | 364 <param name="frac_overlap_feature" |
324 type="integer" | 365 type="integer" |
325 value="0" | 366 value="0" |
326 min="0" | 367 min="0" |
327 max="1" | 368 max="1" |
328 argument="--fracOverlapFeature" | 369 argument="--fracOverlapFeature" |
389 </data> | 430 </data> |
390 | 431 |
391 <data format="tabular" | 432 <data format="tabular" |
392 name="output_short" | 433 name="output_short" |
393 label="${tool.name} on ${on_string}"> | 434 label="${tool.name} on ${on_string}"> |
394 <filter>format == "tabdel_short"</filter> | 435 <filter>format == "tabdel_short_noheader" or format == "tabdel_short"</filter> |
395 <actions> | 436 <actions> |
396 <action name="column_names" type="metadata" default="Geneid,${alignment.element_identifier}" /> | 437 <action name="column_names" type="metadata" default="Geneid,${alignment.element_identifier}" /> |
397 </actions> | 438 </actions> |
398 </data> | 439 </data> |
399 | 440 |
406 </actions> | 447 </actions> |
407 </data> | 448 </data> |
408 | 449 |
409 <data format="tabular" | 450 <data format="tabular" |
410 name="output_summary" | 451 name="output_summary" |
411 hidden="true" | |
412 label="${tool.name} on ${on_string}: summary"> | 452 label="${tool.name} on ${on_string}: summary"> |
413 <actions> | 453 <actions> |
414 <action name="column_names" type="metadata" default="Status,${alignment.element_identifier}" /> | 454 <action name="column_names" type="metadata" default="Status,${alignment.element_identifier}" /> |
415 </actions> | 455 </actions> |
416 </data> | 456 </data> |
426 | 466 |
427 <data name="output_jcounts" format="tabular" | 467 <data name="output_jcounts" format="tabular" |
428 label="${tool.name} on ${on_string}: junction counts"> | 468 label="${tool.name} on ${on_string}: junction counts"> |
429 <filter>extended_parameters['exon_exon_junction_read_counting_enabled']['count_exon_exon_junction_reads']</filter> | 469 <filter>extended_parameters['exon_exon_junction_read_counting_enabled']['count_exon_exon_junction_reads']</filter> |
430 <actions> | 470 <actions> |
431 <action name="column_names" type="metadata" default="PrimaryGene,SecondaryGene,Site1_chr,Site1_location,Site1_strand,Site2_chr,Site2_location,Site2_strand,${alignment.element_identifier}" /> | 471 <action name="column_names" type="metadata" |
472 default="PrimaryGene,SecondaryGene,Site1_chr,Site1_location,Site1_strand,Site2_chr,Site2_location,Site2_strand,${alignment.element_identifier}" /> | |
432 </actions> | 473 </actions> |
433 </data> | 474 </data> |
434 </outputs> | 475 </outputs> |
435 <tests> | 476 <tests> |
436 <test expect_num_outputs="4"> | 477 <test expect_num_outputs="4"> |
437 <param name="alignment" value="featureCounts_input1.bam" ftype="bam" /> | 478 <param name="alignment" value="featureCounts_input1.bam" ftype="bam" /> |
479 <param name="anno_select" value="gtf"/> | |
438 <param name="reference_gene_sets" value="featureCounts_guide.gff" ftype="gff" /> | 480 <param name="reference_gene_sets" value="featureCounts_guide.gff" ftype="gff" /> |
439 <param name="format" value="tabdel_short" /> | 481 <param name="format" value="tabdel_short_noheader" /> |
440 <param name="include_feature_length_file" value="true"/> | 482 <param name="include_feature_length_file" value="true"/> |
441 <param name="ref_source" value="history" /> | 483 <param name="ref_source" value="history" /> |
442 <param name="count_exon_exon_junction_reads" value="-J"/> | 484 <param name="count_exon_exon_junction_reads" value="-J"/> |
443 <output name="output_short" file="output_1_short.tab"> | 485 <output name="output_short" file="output_1_short.tab"> |
444 <metadata name="column_names" value="Geneid,featureCounts_input1.bam"/> | 486 <metadata name="column_names" value="Geneid,featureCounts_input1.bam"/> |
450 <metadata name="column_names" value="PrimaryGene,SecondaryGene,Site1_chr,Site1_location,Site1_strand,Site2_chr,Site2_location,Site2_strand,featureCounts_input1.bam"/> | 492 <metadata name="column_names" value="PrimaryGene,SecondaryGene,Site1_chr,Site1_location,Site1_strand,Site2_chr,Site2_location,Site2_strand,featureCounts_input1.bam"/> |
451 </output> | 493 </output> |
452 </test> | 494 </test> |
453 <test expect_num_outputs="3"> | 495 <test expect_num_outputs="3"> |
454 <param name="alignment" value="featureCounts_input1.bam" ftype="bam" /> | 496 <param name="alignment" value="featureCounts_input1.bam" ftype="bam" /> |
497 <param name="anno_select" value="gtf"/> | |
455 <param name="reference_gene_sets" value="featureCounts_guide.gff" ftype="gff" /> | 498 <param name="reference_gene_sets" value="featureCounts_guide.gff" ftype="gff" /> |
456 <param name="format" value="tabdel_medium" /> | 499 <param name="format" value="tabdel_medium" /> |
457 <param name="include_feature_length_file" value="true"/> | 500 <param name="include_feature_length_file" value="true"/> |
458 <param name="ref_source" value="history" /> | 501 <param name="ref_source" value="history" /> |
459 <output name="output_medium" file="output_1_medium.tab"> | 502 <output name="output_medium" file="output_1_medium.tab"> |
463 <metadata name="column_names" value="Status,featureCounts_input1.bam"/> | 506 <metadata name="column_names" value="Status,featureCounts_input1.bam"/> |
464 </output> | 507 </output> |
465 </test> | 508 </test> |
466 <test expect_num_outputs="3"> | 509 <test expect_num_outputs="3"> |
467 <param name="alignment" value="featureCounts_input1.bam" ftype="bam" /> | 510 <param name="alignment" value="featureCounts_input1.bam" ftype="bam" /> |
511 <param name="anno_select" value="gtf"/> | |
468 <param name="reference_gene_sets" value="featureCounts_guide.gff" ftype="gff" /> | 512 <param name="reference_gene_sets" value="featureCounts_guide.gff" ftype="gff" /> |
469 <param name="format" value="tabdel_full" /> | 513 <param name="format" value="tabdel_full" /> |
470 <param name="include_feature_length_file" value="true"/> | 514 <param name="include_feature_length_file" value="true"/> |
471 <param name="ref_source" value="history" /> | 515 <param name="ref_source" value="history" /> |
472 <output name="output_full" file="output_1_full.tab"> | 516 <output name="output_full" file="output_1_full.tab"> |
477 </output> | 521 </output> |
478 <output name="output_feature_lengths" file="output_feature_lengths.tab"> | 522 <output name="output_feature_lengths" file="output_feature_lengths.tab"> |
479 <metadata name="column_names" value="Feature,Length"/> | 523 <metadata name="column_names" value="Feature,Length"/> |
480 </output> | 524 </output> |
481 </test> | 525 </test> |
482 | 526 <test expect_num_outputs="4"> |
527 <param name="alignment" value="featureCounts_input1.bam" ftype="bam" /> | |
528 <param name="anno_select" value="gtf"/> | |
529 <param name="reference_gene_sets" value="featureCounts_guide.gff" ftype="gff" /> | |
530 <param name="format" value="tabdel_short" /> | |
531 <param name="include_feature_length_file" value="true"/> | |
532 <param name="ref_source" value="history" /> | |
533 <param name="count_exon_exon_junction_reads" value="-J"/> | |
534 <output name="output_short" file="output_1_short_with_header.tab"> | |
535 <metadata name="column_names" value="Geneid,featureCounts_input1.bam"/> | |
536 </output> | |
537 <output name="output_summary" file="output_1_summary_with_header.tab"> | |
538 <metadata name="column_names" value="Status,featureCounts_input1.bam"/> | |
539 </output> | |
540 <output name="output_jcounts" file="output_1_jcounts_with_header.tab"> | |
541 <metadata name="column_names" value="PrimaryGene,SecondaryGene,Site1_chr,Site1_location,Site1_strand,Site2_chr,Site2_location,Site2_strand,featureCounts_input1.bam"/> | |
542 </output> | |
543 </test> | |
544 <!-- Ensure built-in annotation works --> | |
545 <test expect_num_outputs="2"> | |
546 <param name="alignment" value="pairend_strandspecific_51mer_hg19_chr1_1-100000.bam" ftype="bam" /> | |
547 <param name="anno_select" value="builtin"/> | |
548 <param name="format" value="tabdel_short" /> | |
549 <param name="genome" value="hg19" /> | |
550 <output name="output_short" file="output_builtin_hg19.tab"> | |
551 <metadata name="column_names" value="Geneid,pairend_strandspecific_51mer_hg19_chr1_1-100000.bam"/> | |
552 </output> | |
553 <output name="output_summary" file="output_summary_builtin_hg19.tab"/> | |
554 </test> | |
483 </tests> | 555 </tests> |
484 | 556 |
485 <help><![CDATA[ | 557 <help><![CDATA[ |
486 featureCounts | 558 featureCounts |
487 ############# | 559 ############# |
488 | 560 |
489 Overview | 561 Overview |
490 -------- | 562 -------- |
491 FeatureCounts is a light-weight read counting program written entirely in the C programming language. It can be used to count both gDNA-seq and RNA-seq reads for genomic features in in SAM/BAM files. | 563 FeatureCounts is a light-weight read counting program written entirely in the C programming language. It can be used to count both gDNA-seq and RNA-seq reads for genomic features in in SAM/BAM files. FeatureCounts is part of the Subread_ package. |
492 | 564 |
493 Input formats | 565 Input formats |
494 ------------- | 566 ------------- |
495 Alignments should be provided in either: | 567 Alignments should be provided in either: |
496 | 568 |
497 - SAM format, http://samtools.sourceforge.net/samtools.shtml#5 | 569 - SAM format, http://samtools.sourceforge.net/samtools.shtml#5 |
498 - BAM format | 570 - BAM format |
499 | 571 |
500 Gene regions should be provided in the GFF/GTF format: | 572 Annotations for gene regions should be provided in the GFF/GTF format: |
501 | 573 |
502 - http://genome.ucsc.edu/FAQ/FAQformat.html#format3 | 574 - http://genome.ucsc.edu/FAQ/FAQformat.html#format3 |
503 - http://www.ensembl.org/info/website/upload/gff.html | 575 - http://www.ensembl.org/info/website/upload/gff.html |
576 | |
577 Alternatively, the featureCounts built-in annotations for genomes hg38, hg19, mm10 and mm9 can be used through selecting the built-in option above. These annotations were downloaded from NCBI RefSeq database and then adapted by merging overlapping exons from the same gene to form a set of disjoint exons for each gene. Genes with the same Entrez gene identifiers were also merged into one gene. See the Subread_ User's Guide for more information. | |
504 | 578 |
505 Output format | 579 Output format |
506 ------------- | 580 ------------- |
507 FeatureCounts produces a table containing counted reads, per gene, per row. Optionally the last column can be set to be the effective gene-length. These tables are compatible with the DESeq2 Galaxy wrapper by IUC. Column names are added as metadata object. | 581 FeatureCounts produces a table containing counted reads, per gene, per row. Optionally the last column can be set to be the effective gene-length. These tables are compatible with the DESeq2 Galaxy wrapper by IUC. Column names are added as metadata object. |
582 | |
583 .. _Subread: http://bioinf.wehi.edu.au/subread-package/SubreadUsersGuide.pdf | |
508 ]]></help> | 584 ]]></help> |
509 <citations> | 585 <citations> |
510 <citation type="doi">10.1093/bioinformatics/btt656</citation> | 586 <citation type="doi">10.1093/bioinformatics/btt656</citation> |
511 </citations> | 587 </citations> |
512 </tool> | 588 </tool> |