view align_and_estimate_abundance.xml @ 2:de0af39266ef draft

planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trinity commit 77385ec02b79f527348aff01bd83a019e30f5f45
author iuc
date Mon, 25 Apr 2016 10:02:37 -0400
parents
children c7555bc21812
line wrap: on
line source

<tool id="align_and_estimate_abundance" name="Align reads and estimate abundance" version="2.1.1">
    <description>on a de novo assembly of RNA-Seq data</description>
    <requirements>
        <requirement type="package" version="2.1.1">trinity</requirement>
        <requirement type="package" version="1.1.2">bowtie</requirement>
        <requirement type="package" version="2.2.6">bowtie2</requirement>
        <requirement type="package" version="1.2">samtools</requirement>
        <requirement type="package" version="1.2.28">rsem</requirement>
        <requirement type="package" version="1.5.1">express</requirement>
    </requirements>
    <stdio>
        <exit_code range="1:"/>
    </stdio>
    <command><![CDATA[
        ln -s $transcripts input.fa

        &&

        align_and_estimate_abundance.pl
       
        --transcripts input.fa

        --est_method $method.est_method
        #if $method.est_method == "RSEM" or $method.est_method == "eXpress":
            --aln_method $method.aln_method
        #end if

        #if $inputs.paired_or_single == "paired":
            --left $inputs.left_input --right $inputs.right_input
            
            #if $inputs.left_input.is_of_type('fasta'):
                --seqType fa
            #else:
                --seqType fq
            #end if
            
            #if $inputs.strand.is_strand_specific:
                --SS_lib_type $inputs.strand.library_type
            #end if

        #else:
            --single $inputs.input
            
            #if $inputs.input.is_of_type('fasta'):
                --seqType fa
            #else:
                --seqType fq
            #end if
            
            #if $inputs.strand.is_strand_specific:
                --SS_lib_type $inputs.strand.library_type
            #end if
        #end if
        
        --max_ins_size $inputs.paired_fragment_length

        ## Additional parameters.
        #if $additional_params.gene_map.has_gene_map == "yes":
            --gene_trans_map $additional_params.gene_map.gene_trans_map
        #else
            --trinity_mode
        #end if
        
        --prep_reference
        
        --output_dir .

        ## CPU
        --thread_count \${GALAXY_SLOTS:-4}
    ]]></command>
    <inputs>
        <param format="fasta" name="transcripts" type="data" label="Transcripts" help="de novo assembly of RNA-Seq data"/>
        <conditional name="inputs">
            <param name="paired_or_single" type="select" label="Paired or Single-end data?">
                <option value="paired">Paired</option>
                <option value="single">Single</option>
            </param>
            <when value="paired">
                <param format="fasta,fastqsanger" name="left_input" type="data" label="Left/Forward strand reads" help=""/>
                <param format="fasta,fastqsanger" name="right_input" type="data" label="Right/Reverse strand reads" help=""/>
                <conditional name="strand">
                    <param name="is_strand_specific" type="boolean" checked="false" label="Strand specific data"/>
                    <when value="false">
                    </when>
                    <when value="true">
                        <param name="library_type" type="select" label="Strand-specific Library Type">
                            <option value="FR">Forward-Reverse</option>
                            <option value="RF">Reverse-Forward</option>
                        </param>
                    </when>
                </conditional>
                <param name="paired_fragment_length" type="integer" value="800" min="1" label="Maximum insert size" help="bowtie -X parameter"/>
            </when>
            <when value="single">
                <param format="fasta,fastqsanger" name="input" type="data" label="Single-end reads" help=""/>
                <conditional name="strand">
                    <param name="is_strand_specific" type="boolean" checked="false" label="Strand specific data"/>
                    <when value="false">
                    </when>
                    <when value="true">
                        <param name="library_type" type="select" label="Strand-specific Library Type">
                            <option value="F">F</option>
                            <option value="R">R</option>
                        </param>
                    </when>
                </conditional>
            </when>
        </conditional>
        
        <conditional name="method">
            <param type="select" name="est_method" label="Abundance estimation method">
                <option value="RSEM">RSEM</option>
                <option value="eXpress">eXpress</option>
            </param>
            <when value="RSEM">
                <param type="select" name="aln_method" label="Alignment method">
                    <option value="bowtie">Bowtie</option>
                    <option value="bowtie2">Bowtie2</option>
                </param>
            </when>
            <when value="eXpress">
                <param type="select" name="aln_method" label="Alignment method">
                    <option value="bowtie">Bowtie</option>
                    <option value="bowtie2">Bowtie2</option>
                </param>
            </when>
        </conditional>

        <section name="additional_params" title="Additional Options" expanded="False">
            <conditional name="gene_map">
                <param name="has_gene_map" type="select" label="Trinity assembly?" help="If the transcripts were not assembled by trinity, additional information is needed">
                    <option value="no">No</option>
                    <option value="yes">Yes</option>
                </param>
                <when value="no">
                </when>
                <when value="yes">
                    <param format="tabular" name="gene_trans_map" type="data" label="Gene to transcript correspondence ('gene(tab)transcript' lines)" />
                </when>
            </conditional>
            
        </section>
    </inputs>
    <outputs>
        <data format="tabular" name="isoforms_counts_rsem" label="${tool.name} on ${on_string}: isoforms counts" from_work_dir="RSEM.isoforms.results">
            <filter>method['est_method'] == "RSEM"</filter>
        </data>
        <data format="tabular" name="genes_counts_rsem" label="${tool.name} on ${on_string}: genes counts" from_work_dir="RSEM.genes.results">
            <filter>method['est_method'] == "RSEM"</filter>
        </data>
        
        <data format="tabular" name="isoforms_counts_express" label="${tool.name} on ${on_string}: isoforms counts" from_work_dir="results.xprs">
            <filter>method['est_method'] == "eXpress"</filter>
        </data>
        <data format="tabular" name="genes_counts_express" label="${tool.name} on ${on_string}: genes counts" from_work_dir="results.xprs.genes">
            <filter>method['est_method'] == "eXpress"</filter>
        </data>
    </outputs>
    <tests>
        <test>
            <param name="paired_or_single" value="paired"/>
            <param name="left_input" value="reads.left.fq"/>
            <param name="right_input" value="reads.right.fq"/>
            <param name="transcripts" value="raw/Trinity.fasta"/>
            <param name="library_type" value="RF"/>
            <param name="est_method" value="RSEM"/>
            <param name="aln_method" value="bowtie"/>
            <param name="has_gene_map" value="no"/>
            <output name="isoforms_counts_rsem">
                <assert_contents>
                    <has_line_matching expression="TRINITY_DN0_c0_g1_i1&#009;.*" />
                    <has_n_columns n="8" />
                </assert_contents>
            </output>
            <output name="genes_counts_rsem">
                <assert_contents>
                    <has_line_matching expression="TRINITY_DN0_c0_g1&#009;.*" />
                    <has_n_columns n="7" />
                </assert_contents>
            </output>
        </test>
        <test>
            <param name="paired_or_single" value="paired"/>
            <param name="left_input" value="reads.left.fq"/>
            <param name="right_input" value="reads.right.fq"/>
            <param name="transcripts" value="raw/Trinity.fasta"/>
            <param name="library_type" value="RF"/>
            <param name="est_method" value="RSEM"/>
            <param name="aln_method" value="bowtie2"/>
            <param name="has_gene_map" value="no"/>
            <output name="isoforms_counts_rsem">
                <assert_contents>
                    <has_line_matching expression="TRINITY_DN0_c0_g1_i1&#009;.*" />
                    <has_n_columns n="8" />
                </assert_contents>
            </output>
            <output name="genes_counts_rsem">
                <assert_contents>
                    <has_line_matching expression="TRINITY_DN0_c0_g1&#009;.*" />
                    <has_n_columns n="7" />
                </assert_contents>
            </output>
        </test>
        <test>
            <param name="paired_or_single" value="paired"/>
            <param name="left_input" value="reads.left.fq"/>
            <param name="right_input" value="reads.right.fq"/>
            <param name="transcripts" value="raw/Trinity.fasta"/>
            <param name="library_type" value="RF"/>
            <param name="est_method" value="eXpress"/>
            <param name="aln_method" value="bowtie"/>
            <param name="has_gene_map" value="no"/>
            <output name="isoforms_counts_express">
                <assert_contents>
                    <has_line_matching expression=".*&#009;TRINITY_DN2_c3_g1_i1&#009;.*" />
                    <has_n_columns n="15" />
                </assert_contents>
            </output>
            <output name="genes_counts_express">
                <assert_contents>
                    <has_line_matching expression="NA&#009;TRINITY_DN3_c0_g1.*" />
                    <has_n_columns n="15" />
                </assert_contents>
            </output>
        </test>
    </tests>
    <help>
<![CDATA[
Trinity_ assembles transcript sequences from Illumina RNA-Seq data.
This tool estimates the abundance of isoforms and genes of a transcriptome assembled with Trinity, using FastQ of a specific sample.

**Inputs**

It takes as input a transcriptome assembled with Trinity and the reads from a RNASeq sample.
You have to choose between several counting methods.

If you dont align on a Trinity assembly, you need to provide a file of the following (tabular) format to map gene ids to transcript ids:

=========== ================
gene1       transcript1
----------- ----------------
gene2       transcript2
=========== ================

**Output**

This tool will produce 2 tabular files, with counts for isoforms and genes respectively. More details on this page:

.. _Trinity manual: https://github.com/trinityrnaseq/trinityrnaseq/wiki/Trinity-Transcript-Quantification


.. _Trinity: http://trinityrnaseq.github.io
]]>
    </help>
    
     <citations>
        <citation type="doi">doi:10.1038/nbt.1883</citation>
    </citations>
</tool>