comparison gtf2featureAnnotation.xml @ 7:14b3f2a4523b draft default tip

"planemo upload for repository https://github.com/ebi-gene-expression-group/container-galaxy-sc-tertiary/tree/develop/tools/gtf-2-gene-list/.shed.yml commit 5a62f18c80ddd55cfcc9d64546fde4e20be3e070"
author ebi-gxa
date Mon, 19 Jul 2021 08:00:24 +0000
parents 1a642de6db01
children
comparison
equal deleted inserted replaced
6:1a642de6db01 7:14b3f2a4523b
1 <tool id="_ensembl_gtf2gene_list" name="GTF2GeneList" version="1.42.1+galaxy6" profile="18.01"> 1 <tool id="_ensembl_gtf2gene_list" name="GTF2GeneList" version="1.52.0+galaxy0" profile="18.01">
2 <description>extracts a complete annotation table or subsets thereof from an Ensembl GTF using rtracklayer</description> 2 <description>extracts a complete annotation table or subsets thereof from an Ensembl GTF using rtracklayer</description>
3 <requirements> 3 <requirements>
4 <requirement type="package" version="1.42.1">bioconductor-rtracklayer</requirement> 4 <requirement type="package" version="1.0.1">atlas-gene-annotation-manipulation</requirement>
5 <requirement type="package" version="2.50.2">bioconductor-biostrings</requirement>
6 <requirement type="package" version="1.6.4">r-optparse</requirement>
7 </requirements> 5 </requirements>
8 <command detect_errors="exit_code"><![CDATA[ 6 <command detect_errors="exit_code"><![CDATA[
9 ln -s '$gtf_input' input.gtf; 7 ln -s '$gtf_input' input.gtf;
10 $__tool_directory__/gtf2featureAnnotation.R --gtf-file input.gtf 8 gtf2featureAnnotation.R --gtf-file input.gtf
11 #if $noheader 9 #if $noheader
12 --no-header 10 --no-header
13 #end if 11 #end if
14 #if $version_transcripts 12 #if $version_transcripts
15 --version-transcripts 13 --version-transcripts
16 #end if 14 #end if
17 #if $mito.mark_mito 15 #if $mito.mark_mito
18 --mito --mito-chr "${mito.mito_chr}" --mito-biotypes "${mito.mito_biotypes}" 16 --mito --mito-chr "${mito.mito_chr}" --mito-biotypes "${mito.mito_biotypes}"
19 #end if 17 #end if
18 #if $cdnas.parse_cdnas
19 --parse-cdnas "${cdnas.fasta_input}" --parse-cdna-field "${cdnas.cdnas_field}"
20 #if $cdnas.filter_cdnas 20 #if $cdnas.filter_cdnas
21 --filter-cdnas "${cdnas.fasta_input}" --filter-cdnas-field "${cdnas.cdnas_field}" --filter-cdnas-output "${fasta_output}" 21 --filter-cdnas-output "${fasta_output}"
22 #end if
23 #if $cdnas.parse_cdna_names
24 --parse-cdna-names
25 #end if
26 #if $fill_empty
27 --fill-empty "${fill_empty}"
28 #end if
22 #end if 29 #end if
23 --feature-type "${feature_type}" --first-field "${first_field}" --output-file annotation.txt --fields "${fields}" 30 --feature-type "${feature_type}" --first-field "${first_field}" --output-file annotation.txt --fields "${fields}"
24 ]]></command> 31 ]]></command>
25 32
26 <inputs> 33 <inputs>
28 <param name="feature_type" type="text" optional='true' value="gene" label="Feature type for which to derive annotation"/> 35 <param name="feature_type" type="text" optional='true' value="gene" label="Feature type for which to derive annotation"/>
29 <param name="first_field" type="text" optional='true' value="gene_id" label="Field to place first in output table"/> 36 <param name="first_field" type="text" optional='true' value="gene_id" label="Field to place first in output table"/>
30 <param name="noheader" type="boolean" checked="false" label="Suppress header line in output?"/> 37 <param name="noheader" type="boolean" checked="false" label="Suppress header line in output?"/>
31 <param name="fields" type="text" optional='true' value="" label="Comma-separated list of field names to extract from the GTF (default: use all fields)"/> 38 <param name="fields" type="text" optional='true' value="" label="Comma-separated list of field names to extract from the GTF (default: use all fields)"/>
32 <param name="version_transcripts" type="boolean" checked="false" label="Append version to transcript identifiers?" help="For transcript feature type only: where the GTF contains transcript versions, should these be appended to transcript identifiers? Useful when generating transcript/gene mappings for use with transcriptomes"/> 39 <param name="version_transcripts" type="boolean" checked="false" label="Append version to transcript identifiers?" help="For transcript feature type only: where the GTF contains transcript versions, should these be appended to transcript identifiers? Useful when generating transcript/gene mappings for use with transcriptomes"/>
40 <param name="fill_empty" type="text" optional='true' value="" label="Column to be used to fill empty values in other fields" help="Only when output fields are defined, useful when you need to guarantee a value, for example a gene ID for a transcript/gene mapping."/>
33 <conditional name="mito"> 41 <conditional name="mito">
34 <param name="mark_mito" type="boolean" checked="true" label="Flag mitochondrial features?"/> 42 <param name="mark_mito" type="boolean" checked="true" label="Flag mitochondrial features?"/>
35 <when value="true"> 43 <when value="true">
36 <param name="mito_chr" type="text" optional='true' value="mt,mitochondrion_genome,mito,m,chrM,chrMt" label="Comma-separated list of possible mitochondrial chromosome names (case insensitive)"/> 44 <param name="mito_chr" type="text" optional='true' value="mt,mitochondrion_genome,mito,m,chrM,chrMt" label="Comma-separated list of possible mitochondrial chromosome names (case insensitive)"/>
37 <param name="mito_biotypes" type="text" optional='true' value="mt_trna,mt_rrna,mt_trna_pseudogene" label="Comma-separated list of possible mitochondrial biotypes (case insensitive)"/> 45 <param name="mito_biotypes" type="text" optional='true' value="mt_trna,mt_rrna,mt_trna_pseudogene" label="Comma-separated list of possible mitochondrial biotypes (case insensitive)"/>
38 </when> 46 </when>
39 <when value="false" /> 47 <when value="false" />
40 </conditional> 48 </conditional>
41 <conditional name="cdnas"> 49 <conditional name="cdnas">
42 <param name="filter_cdnas" type="boolean" checked="false" label="Filter a FASTA-format cDNA file to match annotations?" help="For some applications, e.g. transcriptome mappers, its useful to match a cDNAs file to an annotation list (e.g. transcript-to-gene mapping)"/> 50 <param name="parse_cdnas" type="boolean" checked="false" label="Provide a cDNA file for extracting annotations and/ or possible filtering?" help="For some applications, e.g. transcriptome mappers, its useful to match a cDNAs file to an annotation list (e.g. transcript-to-gene mapping)"/>
43 <when value="true"> 51 <when value="true">
44 <param name="fasta_input" type="data" format="fasta,fasta.gz" label="FASTA-format cDNA/ transcript file" /> 52 <param name="fasta_input" type="data" format="fasta,fasta.gz" label="FASTA-format cDNA/ transcript file" />
45 <param name="cdnas_field" type="text" optional='true' value="transcript_id" label="Annotation field to match with sequences."/> 53 <param name="cdnas_field" type="text" optional='true' value="transcript_id" label="Annotation field in GTF to match with sequences."/>
54 <param name="parse_cdna_names" type="boolean" checked="false" label="Parse the FASTA headers for annotation info?" help="e.g. to find gene IDs for transcripts not present in the GTF. May only work for Ensembl GTFs."/>
55 <param name="filter_cdnas" type="boolean" checked="false" label="Filter the cDNA file to match the annotations?" />
46 </when> 56 </when>
47 <when value="false" /> 57 <when value="false" />
48 </conditional> 58 </conditional>
49 </inputs> 59 </inputs>
50 60
65 <help><![CDATA[ 75 <help><![CDATA[
66 .. class:: infomark 76 .. class:: infomark
67 77
68 **What it does** 78 **What it does**
69 79
70 Given an Ensembl GTF file, it will extract all information on chromosomes, coordinates, and attributes provided at the specified feature level. Mitochondrial features can also be flagged. 80 Given an Ensembl GTF file, it will extract all information on chromosomes, coordinates, and attributes provided at the specified feature level. Mitochondrial features can also be flagged. See https://github.com/ebi-gene-expression-group/atlas-gene-annotation-manipulation.
71 81
72 You can also supply a fasta-format file of sequences, which will be filtered by identifier to match annotation. This can be useful for tools such as Alevin which need a transcript-to-gene mapping and a transcriptome file without any missing entries (with respect to annotation). 82 You can also supply a fasta-format file of sequences, which can be filtered by identifier to match annotation and/or used a source of information for transcripts un-annotated in the GTF. This can be useful for tools such as Alevin which need a transcript-to-gene mapping and a transcriptome file without any missing entries (with respect to annotation).
73 83
74 84
75 **Inputs** 85 **Inputs**
76 86
77 * Ensembl GTF file 87 * Ensembl GTF file
90 title = {Hinxton Single Cell Anlysis Environment}, 100 title = {Hinxton Single Cell Anlysis Environment},
91 publisher = {GitHub}, 101 publisher = {GitHub},
92 journal = {GitHub repository}, 102 journal = {GitHub repository},
93 url = {https://github.com/ebi-gene-expression-group/container-galaxy-sc-tertiary}, 103 url = {https://github.com/ebi-gene-expression-group/container-galaxy-sc-tertiary},
94 }</citation> 104 }</citation>
105 <citation type="doi">10.1101/2020.04.08.032698</citation>
95 </citations> 106 </citations>
96 </tool> 107 </tool>