diff align_and_estimate_abundance.xml @ 2:de0af39266ef draft

planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trinity commit 77385ec02b79f527348aff01bd83a019e30f5f45
author iuc
date Mon, 25 Apr 2016 10:02:37 -0400
parents
children c7555bc21812
line wrap: on
line diff
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/align_and_estimate_abundance.xml	Mon Apr 25 10:02:37 2016 -0400
@@ -0,0 +1,260 @@
+<tool id="align_and_estimate_abundance" name="Align reads and estimate abundance" version="2.1.1">
+    <description>on a de novo assembly of RNA-Seq data</description>
+    <requirements>
+        <requirement type="package" version="2.1.1">trinity</requirement>
+        <requirement type="package" version="1.1.2">bowtie</requirement>
+        <requirement type="package" version="2.2.6">bowtie2</requirement>
+        <requirement type="package" version="1.2">samtools</requirement>
+        <requirement type="package" version="1.2.28">rsem</requirement>
+        <requirement type="package" version="1.5.1">express</requirement>
+    </requirements>
+    <stdio>
+        <exit_code range="1:"/>
+    </stdio>
+    <command><![CDATA[
+        ln -s $transcripts input.fa
+
+        &&
+
+        align_and_estimate_abundance.pl
+       
+        --transcripts input.fa
+
+        --est_method $method.est_method
+        #if $method.est_method == "RSEM" or $method.est_method == "eXpress":
+            --aln_method $method.aln_method
+        #end if
+
+        #if $inputs.paired_or_single == "paired":
+            --left $inputs.left_input --right $inputs.right_input
+            
+            #if $inputs.left_input.is_of_type('fasta'):
+                --seqType fa
+            #else:
+                --seqType fq
+            #end if
+            
+            #if $inputs.strand.is_strand_specific:
+                --SS_lib_type $inputs.strand.library_type
+            #end if
+
+        #else:
+            --single $inputs.input
+            
+            #if $inputs.input.is_of_type('fasta'):
+                --seqType fa
+            #else:
+                --seqType fq
+            #end if
+            
+            #if $inputs.strand.is_strand_specific:
+                --SS_lib_type $inputs.strand.library_type
+            #end if
+        #end if
+        
+        --max_ins_size $inputs.paired_fragment_length
+
+        ## Additional parameters.
+        #if $additional_params.gene_map.has_gene_map == "yes":
+            --gene_trans_map $additional_params.gene_map.gene_trans_map
+        #else
+            --trinity_mode
+        #end if
+        
+        --prep_reference
+        
+        --output_dir .
+
+        ## CPU
+        --thread_count \${GALAXY_SLOTS:-4}
+    ]]></command>
+    <inputs>
+        <param format="fasta" name="transcripts" type="data" label="Transcripts" help="de novo assembly of RNA-Seq data"/>
+        <conditional name="inputs">
+            <param name="paired_or_single" type="select" label="Paired or Single-end data?">
+                <option value="paired">Paired</option>
+                <option value="single">Single</option>
+            </param>
+            <when value="paired">
+                <param format="fasta,fastqsanger" name="left_input" type="data" label="Left/Forward strand reads" help=""/>
+                <param format="fasta,fastqsanger" name="right_input" type="data" label="Right/Reverse strand reads" help=""/>
+                <conditional name="strand">
+                    <param name="is_strand_specific" type="boolean" checked="false" label="Strand specific data"/>
+                    <when value="false">
+                    </when>
+                    <when value="true">
+                        <param name="library_type" type="select" label="Strand-specific Library Type">
+                            <option value="FR">Forward-Reverse</option>
+                            <option value="RF">Reverse-Forward</option>
+                        </param>
+                    </when>
+                </conditional>
+                <param name="paired_fragment_length" type="integer" value="800" min="1" label="Maximum insert size" help="bowtie -X parameter"/>
+            </when>
+            <when value="single">
+                <param format="fasta,fastqsanger" name="input" type="data" label="Single-end reads" help=""/>
+                <conditional name="strand">
+                    <param name="is_strand_specific" type="boolean" checked="false" label="Strand specific data"/>
+                    <when value="false">
+                    </when>
+                    <when value="true">
+                        <param name="library_type" type="select" label="Strand-specific Library Type">
+                            <option value="F">F</option>
+                            <option value="R">R</option>
+                        </param>
+                    </when>
+                </conditional>
+            </when>
+        </conditional>
+        
+        <conditional name="method">
+            <param type="select" name="est_method" label="Abundance estimation method">
+                <option value="RSEM">RSEM</option>
+                <option value="eXpress">eXpress</option>
+            </param>
+            <when value="RSEM">
+                <param type="select" name="aln_method" label="Alignment method">
+                    <option value="bowtie">Bowtie</option>
+                    <option value="bowtie2">Bowtie2</option>
+                </param>
+            </when>
+            <when value="eXpress">
+                <param type="select" name="aln_method" label="Alignment method">
+                    <option value="bowtie">Bowtie</option>
+                    <option value="bowtie2">Bowtie2</option>
+                </param>
+            </when>
+        </conditional>
+
+        <section name="additional_params" title="Additional Options" expanded="False">
+            <conditional name="gene_map">
+                <param name="has_gene_map" type="select" label="Trinity assembly?" help="If the transcripts were not assembled by trinity, additional information is needed">
+                    <option value="no">No</option>
+                    <option value="yes">Yes</option>
+                </param>
+                <when value="no">
+                </when>
+                <when value="yes">
+                    <param format="tabular" name="gene_trans_map" type="data" label="Gene to transcript correspondence ('gene(tab)transcript' lines)" />
+                </when>
+            </conditional>
+            
+        </section>
+    </inputs>
+    <outputs>
+        <data format="tabular" name="isoforms_counts_rsem" label="${tool.name} on ${on_string}: isoforms counts" from_work_dir="RSEM.isoforms.results">
+            <filter>method['est_method'] == "RSEM"</filter>
+        </data>
+        <data format="tabular" name="genes_counts_rsem" label="${tool.name} on ${on_string}: genes counts" from_work_dir="RSEM.genes.results">
+            <filter>method['est_method'] == "RSEM"</filter>
+        </data>
+        
+        <data format="tabular" name="isoforms_counts_express" label="${tool.name} on ${on_string}: isoforms counts" from_work_dir="results.xprs">
+            <filter>method['est_method'] == "eXpress"</filter>
+        </data>
+        <data format="tabular" name="genes_counts_express" label="${tool.name} on ${on_string}: genes counts" from_work_dir="results.xprs.genes">
+            <filter>method['est_method'] == "eXpress"</filter>
+        </data>
+    </outputs>
+    <tests>
+        <test>
+            <param name="paired_or_single" value="paired"/>
+            <param name="left_input" value="reads.left.fq"/>
+            <param name="right_input" value="reads.right.fq"/>
+            <param name="transcripts" value="raw/Trinity.fasta"/>
+            <param name="library_type" value="RF"/>
+            <param name="est_method" value="RSEM"/>
+            <param name="aln_method" value="bowtie"/>
+            <param name="has_gene_map" value="no"/>
+            <output name="isoforms_counts_rsem">
+                <assert_contents>
+                    <has_line_matching expression="TRINITY_DN0_c0_g1_i1&#009;.*" />
+                    <has_n_columns n="8" />
+                </assert_contents>
+            </output>
+            <output name="genes_counts_rsem">
+                <assert_contents>
+                    <has_line_matching expression="TRINITY_DN0_c0_g1&#009;.*" />
+                    <has_n_columns n="7" />
+                </assert_contents>
+            </output>
+        </test>
+        <test>
+            <param name="paired_or_single" value="paired"/>
+            <param name="left_input" value="reads.left.fq"/>
+            <param name="right_input" value="reads.right.fq"/>
+            <param name="transcripts" value="raw/Trinity.fasta"/>
+            <param name="library_type" value="RF"/>
+            <param name="est_method" value="RSEM"/>
+            <param name="aln_method" value="bowtie2"/>
+            <param name="has_gene_map" value="no"/>
+            <output name="isoforms_counts_rsem">
+                <assert_contents>
+                    <has_line_matching expression="TRINITY_DN0_c0_g1_i1&#009;.*" />
+                    <has_n_columns n="8" />
+                </assert_contents>
+            </output>
+            <output name="genes_counts_rsem">
+                <assert_contents>
+                    <has_line_matching expression="TRINITY_DN0_c0_g1&#009;.*" />
+                    <has_n_columns n="7" />
+                </assert_contents>
+            </output>
+        </test>
+        <test>
+            <param name="paired_or_single" value="paired"/>
+            <param name="left_input" value="reads.left.fq"/>
+            <param name="right_input" value="reads.right.fq"/>
+            <param name="transcripts" value="raw/Trinity.fasta"/>
+            <param name="library_type" value="RF"/>
+            <param name="est_method" value="eXpress"/>
+            <param name="aln_method" value="bowtie"/>
+            <param name="has_gene_map" value="no"/>
+            <output name="isoforms_counts_express">
+                <assert_contents>
+                    <has_line_matching expression=".*&#009;TRINITY_DN2_c3_g1_i1&#009;.*" />
+                    <has_n_columns n="15" />
+                </assert_contents>
+            </output>
+            <output name="genes_counts_express">
+                <assert_contents>
+                    <has_line_matching expression="NA&#009;TRINITY_DN3_c0_g1.*" />
+                    <has_n_columns n="15" />
+                </assert_contents>
+            </output>
+        </test>
+    </tests>
+    <help>
+<![CDATA[
+Trinity_ assembles transcript sequences from Illumina RNA-Seq data.
+This tool estimates the abundance of isoforms and genes of a transcriptome assembled with Trinity, using FastQ of a specific sample.
+
+**Inputs**
+
+It takes as input a transcriptome assembled with Trinity and the reads from a RNASeq sample.
+You have to choose between several counting methods.
+
+If you dont align on a Trinity assembly, you need to provide a file of the following (tabular) format to map gene ids to transcript ids:
+
+=========== ================
+gene1       transcript1
+----------- ----------------
+gene2       transcript2
+=========== ================
+
+**Output**
+
+This tool will produce 2 tabular files, with counts for isoforms and genes respectively. More details on this page:
+
+.. _Trinity manual: https://github.com/trinityrnaseq/trinityrnaseq/wiki/Trinity-Transcript-Quantification
+
+
+.. _Trinity: http://trinityrnaseq.github.io
+]]>
+    </help>
+    
+     <citations>
+        <citation type="doi">doi:10.1038/nbt.1883</citation>
+    </citations>
+</tool>
+