Mercurial > repos > cpt > cpt_gff_extract_seq
view gff3_extract_sequence.xml @ 9:9264ac799feb draft
planemo upload commit e794f52198fcd387dbf44a2c13b552d557696323-dirty
author | cpt |
---|---|
date | Fri, 01 Dec 2023 04:26:28 +0000 |
parents | 759ba1430091 |
children | 3d9f283ff09d |
line wrap: on
line source
<tool id="edu.tamu.cpt.gff3.export_seq" name="GFF3 Feature Sequence Export" version="19.1.0.0"> <description>Export corresponding sequence in genome from GFF3</description> <macros> <import>macros.xml</import> </macros> <expand macro="requirements"/> <command detect_errors="aggressive"><![CDATA[ @GENOME_SELECTOR_PRE@ '$__tool_directory__/gff3_extract_sequence.py' @GENOME_SELECTOR@ @INPUT_GFF@ #if $feature_filter and $feature_filter is not None: --feature_filter '$feature_filter' #end if '$nodesc' > '$default']]></command> <inputs> <expand macro="genome_selector"/> <expand macro="gff3_input"/> <param label="Filter for specific feature types" name="feature_filter" type="text" help="Use 'nice_cds' if your features are coming from Apollo, however this will fail on non-Apollo data"/> <param label="Remove description (use if blasting)" name="nodesc" type="boolean" truevalue="--nodesc" falsevalue=""/> </inputs> <outputs> <data format="fasta" hidden="false" name="default"/> </outputs> <tests> <test> <param name="reference_genome_source" value="history"/> <param name="genome_fasta" value="T7_ExtSeqIn.fasta"/> <param name="gff3_data" value="T7_ExtSeqIn.gff3"/> <param name="nodesc" value=""/> <param name="feature_filter" value="CDS"/> <output name="output" file="T7_ExtSeqOut.fasta"/> </test> <test> <param name="reference_genome_source" value="history"/> <param name="genome_fasta" value="Miro_ExtSeqIn.fa"/> <param name="gff3_data" value="Miro_ExtSeqIn.gff3"/> <param name="nodesc" value=""/> <param name="feature_filter" value="CDS"/> <output name="output" file="Miro_ExtSeqOut1.fa"/> </test> <test> <param name="reference_genome_source" value="history"/> <param name="genome_fasta" value="Miro_ExtSeqIn.fa"/> <param name="gff3_data" value="Miro_ExtSeqIn.gff3"/> <param name="feature_filter" value="CDS"/> <param name="nodesc" value="--nodesc"/> <output name="output" file="Miro_ExtSeqOut2.fa"/> </test> </tests> <help><![CDATA[ **What it does** From the FASTA sequence for a genome, extracts the *nucleotide* sequences for all CDSs in an input GFF3 and outputs them as a multi-FASTA formatted file. The filter for specific feature types was designed for data retrieved from Apollo. Using ‘unique_cds’ extracts the sequence for all CDS. Using ‘nice_cds’ will extract the sequence only for CDS features with a start codon (recommended). If a gene from Apollo has multiple CDSs, the tool will append a "_##" to the end of subsequent genes. ]]></help> <expand macro="citations"/> </tool>