Mercurial > repos > ebi-gxa > gtf2gene_list
comparison gtf2featureAnnotation.xml @ 1:247b439a78f7 draft
planemo upload for repository https://github.com/ebi-gene-expression-group/container-galaxy-sc-tertiary/tree/develop/tools/util/.shed.yml commit 194d2e0af16624c9a3d1af92f7b3686d2e0ee552
author | ebi-gxa |
---|---|
date | Fri, 18 Oct 2019 10:10:54 -0400 |
parents | |
children | e255c0e5dfca |
comparison
equal
deleted
inserted
replaced
0:040d4b3a19d5 | 1:247b439a78f7 |
---|---|
1 <tool id="_ensembl_gtf2gene_list" name="GTF2GeneAnnotationTable" version="1.42.1+galaxy1"> | |
2 <description>extracts a complete annotation table or subsets thereof from an Ensembl GTF using rtracklayer</description> | |
3 <requirements> | |
4 <requirement type="package" version="1.42.1">bioconductor-rtracklayer</requirement> | |
5 <requirement type="package">bioconductor-biostrings</requirement> | |
6 <requirement type="package">r-optparse</requirement> | |
7 </requirements> | |
8 <command detect_errors="exit_code"><![CDATA[ | |
9 ln -s '$gtf_input' input.gtf; | |
10 $__tool_directory__/gtf2featureAnnotation.R --gtf-file input.gtf | |
11 #if $noheader | |
12 --no-header | |
13 #end if | |
14 #if $version_transcripts | |
15 --version-transcripts | |
16 #end if | |
17 #if $mito.mark_mito | |
18 --mito --mito-chr "${mito.mito_chr}" --mito-biotypes "${mito.mito_biotypes}" | |
19 #end if | |
20 #if $cdnas.filter_cdnas | |
21 --filter-cdnas "${cdnas.fasta_input}" --filter-cdnas-field "${cdnas.cdnas_field}" --filter-cdnas-output "${fasta_output}" | |
22 #end if | |
23 --feature-type "${feature_type}" --first-field "${first_field}" --output-file annotation.txt --fields "${fields}" | |
24 ]]></command> | |
25 | |
26 <inputs> | |
27 <param name="gtf_input" type="data" format="gff" label="Ensembl GTF file" /> | |
28 <param name="feature_type" type="text" optional='true' value="gene" label="Feature type for which to derive annotation"/> | |
29 <param name="first_field" type="text" optional='true' value="gene_id" label="Field to place first in output table"/> | |
30 <param name="noheader" type="boolean" checked="false" label="Suppress header line in output?"/> | |
31 <param name="fields" type="text" optional='true' value="" label="Comma-separated list of field names to extract from the GTF (default: use all fields)"/> | |
32 <param name="version_transcripts" type="boolean" checked="false" label="Append version to transcript identifiers?" help="For transcript feature type only: where the GTF contains transcript versions, should these be appended to transcript identifiers? Useful when generating transcript/gene mappings for use with transcriptomes"/> | |
33 <conditional name="mito"> | |
34 <param name="mark_mito" type="boolean" checked="true" label="Flag mitochondrial features?"/> | |
35 <when value="true"> | |
36 <param name="mito_chr" type="text" optional='true' value="mt,mitochondrion_genome,mito,m,chrM,chrMt" label="Comma-separated list of possible mitochondrial chromosome names (case insensitive)"/> | |
37 <param name="mito_biotypes" type="text" optional='true' value="mt_trna,mt_rrna,mt_trna_pseudogene" label="Comma-separated list of possible mitochondrial biotypes (case insensitive)"/> | |
38 </when> | |
39 <when value="false" /> | |
40 </conditional> | |
41 <conditional name="cdnas"> | |
42 <param name="filter_cdnas" type="boolean" checked="false" label="Filter a FASTA-format cDNA file to match annotations?" help="For some applications, e.g. transcriptome mappers, its useful to match a cDNAs file to an annotation list (e.g. transcript-to-gene mapping)"/> | |
43 <when value="true"> | |
44 <param name="fasta_input" type="data" format="fasta" label="FASTA-format cDNA/ transcript file" /> | |
45 <param name="cdnas_field" type="text" optional='true' value="transcript_id" label="Annotation field to match with sequences."/> | |
46 </when> | |
47 <when value="false" /> | |
48 </conditional> | |
49 </inputs> | |
50 | |
51 <outputs> | |
52 <data name="feature_annotation" format="tsv" from_work_dir="annotation.txt" label="${tool.name} on ${on_string}: annotation table"/> | |
53 <data name="fasta_output" format="fasta" from_work_dir="filtered.fa.gz" label="${tool.name} on ${on_string}: annotation-matched sequences"> | |
54 <filter>filter_cdnas</filter> | |
55 </data> | |
56 </outputs> | |
57 <tests> | |
58 <test> | |
59 <param name="gtf_input" ftype="gtf" value="test.gtf"/> | |
60 <output name="feature_annotation" file="annotation.txt"/> | |
61 </test> | |
62 </tests> | |
63 | |
64 | |
65 <help><![CDATA[ | |
66 .. class:: infomark | |
67 | |
68 **What it does** | |
69 | |
70 Given an Ensembl GTF file, it will extract all information on chromosomes, coordinates, and attributes provided at the specified feature level. Mitochondrial features can also be flagged. | |
71 | |
72 You can also supply a fasta-format file of sequences, which will be filtered by identifier to match annotation. This can be useful for tools such as Alevin which need a transcript-to-gene mapping and a transcriptome file without any missing entries (with respect to annotation). | |
73 | |
74 | |
75 **Inputs** | |
76 | |
77 * Ensembl GTF file | |
78 | |
79 ----- | |
80 | |
81 **Outputs** | |
82 | |
83 * Gene annotations in tsv. | |
84 ]]></help> | |
85 <citations> | |
86 <citation type="bibtex"> | |
87 @misc{github-hinxton-single-cell, | |
88 author = {Jonathan Manning, EBI Gene Expression Team}, | |
89 year = {2019}, | |
90 title = {Hinxton Single Cell Anlysis Environment}, | |
91 publisher = {GitHub}, | |
92 journal = {GitHub repository}, | |
93 url = {https://github.com/ebi-gene-expression-group/container-galaxy-sc-tertiary}, | |
94 }</citation> | |
95 </citations> | |
96 </tool> |