Repository 'ngsap2'
hg clone https://toolshed.g2.bx.psu.edu/repos/mytest/ngsap2

Changeset 0:cc71440b759f (2015-09-22)
Commit message:
Uploaded
added:
NGSAP-Workflow-Denovo_workflow.ga
NGSAP-Workflow-Reference_based_workflow.ga
README.rst
abundance_estimates_to_matrix.xml
align_and_estimate_abundance.xml
all_de_steps.xml
blast_parser.xml
gtf2fasta.xml
insilico_read_normalization.xml
pfam_db.loc.sample
tool_dependencies.xml
transDecoder.xml
trinityStats.xml
trinityrnaseq.xml
trinityrnaseq.xml~
b
diff -r 000000000000 -r cc71440b759f NGSAP-Workflow-Denovo_workflow.ga
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/NGSAP-Workflow-Denovo_workflow.ga Tue Sep 22 01:58:00 2015 -0400
[
b'@@ -0,0 +1,792 @@\n+{\n+    "a_galaxy_workflow": "true", \n+    "annotation": "NGSAP workflow 1", \n+    "format-version": "0.1", \n+    "name": "Denovo_workflow", \n+    "steps": {\n+        "0": {\n+            "annotation": "", \n+            "id": 0, \n+            "input_connections": {}, \n+            "inputs": [\n+                {\n+                    "description": "", \n+                    "name": "R1_left"\n+                }\n+            ], \n+            "label": null, \n+            "name": "Input dataset", \n+            "outputs": [], \n+            "position": {\n+                "left": 191, \n+                "top": 195\n+            }, \n+            "tool_errors": null, \n+            "tool_id": null, \n+            "tool_state": "{\\"name\\": \\"R1_left\\"}", \n+            "tool_version": null, \n+            "type": "data_input", \n+            "user_outputs": [], \n+            "uuid": "1c908163-a494-4e00-8463-2f3611220745"\n+        }, \n+        "1": {\n+            "annotation": "", \n+            "id": 1, \n+            "input_connections": {}, \n+            "inputs": [\n+                {\n+                    "description": "", \n+                    "name": "R1_right"\n+                }\n+            ], \n+            "label": null, \n+            "name": "Input dataset", \n+            "outputs": [], \n+            "position": {\n+                "left": 200, \n+                "top": 285\n+            }, \n+            "tool_errors": null, \n+            "tool_id": null, \n+            "tool_state": "{\\"name\\": \\"R1_right\\"}", \n+            "tool_version": null, \n+            "type": "data_input", \n+            "user_outputs": [], \n+            "uuid": "f5d95ab6-b503-45a0-bbb4-c3c2980f4a04"\n+        }, \n+        "2": {\n+            "annotation": "", \n+            "id": 2, \n+            "input_connections": {}, \n+            "inputs": [\n+                {\n+                    "description": "", \n+                    "name": "R2_left"\n+                }\n+            ], \n+            "label": null, \n+            "name": "Input dataset", \n+            "outputs": [], \n+            "position": {\n+                "left": 200, \n+                "top": 370\n+            }, \n+            "tool_errors": null, \n+            "tool_id": null, \n+            "tool_state": "{\\"name\\": \\"R2_left\\"}", \n+            "tool_version": null, \n+            "type": "data_input", \n+            "user_outputs": [], \n+            "uuid": "a296680e-69bd-4e43-87f3-5a19a3dfb00a"\n+        }, \n+        "3": {\n+            "annotation": "", \n+            "id": 3, \n+            "input_connections": {}, \n+            "inputs": [\n+                {\n+                    "description": "", \n+                    "name": "R4_left"\n+                }\n+            ], \n+            "label": null, \n+            "name": "Input dataset", \n+            "outputs": [], \n+            "position": {\n+                "left": 200, \n+                "top": 709.9999694824219\n+            }, \n+            "tool_errors": null, \n+            "tool_id": null, \n+            "tool_state": "{\\"name\\": \\"R4_left\\"}", \n+            "tool_version": null, \n+            "type": "data_input", \n+            "user_outputs": [], \n+            "uuid": "da874053-bcaa-4a91-a4b6-43b722799b5a"\n+        }, \n+        "4": {\n+            "annotation": "", \n+            "id": 4, \n+            "input_connections": {}, \n+            "inputs": [\n+                {\n+                    "description": "", \n+                    "name": "R3_left"\n+                }\n+            ], \n+            "label": null, \n+            "name": "Input dataset", \n+            "outputs": [], \n+            "position": {\n+                "left": 200, \n+                "top": 539.9999694824219\n+            }, \n+            "tool_errors": null, \n+            "tool_id": null, \n+            "tool_state": "{\\"name\\": \\"R3_left\\"}", \n+            "tool_version": null, \n+            "type": "data_input", \n+            "user_outputs": [], \n+            "uu'..b': {\n+                    "id": 12, \n+                    "output_name": "rsem_isoforms"\n+                }, \n+                "isoform_sample_2|isoform_sample_matrix": {\n+                    "id": 14, \n+                    "output_name": "rsem_isoforms"\n+                }, \n+                "isoform_sample_3|isoform_sample_matrix": {\n+                    "id": 16, \n+                    "output_name": "rsem_isoforms"\n+                }, \n+                "isoform_sample_4|isoform_sample_matrix": {\n+                    "id": 17, \n+                    "output_name": "rsem_isoforms"\n+                }\n+            }, \n+            "inputs": [], \n+            "label": null, \n+            "name": "Differential Expression", \n+            "outputs": [\n+                {\n+                    "name": "de_output", \n+                    "type": "zip"\n+                }, \n+                {\n+                    "name": "output_log", \n+                    "type": "txt"\n+                }\n+            ], \n+            "position": {\n+                "left": 1589.0000305175781, \n+                "top": 313\n+            }, \n+            "post_job_actions": {}, \n+            "tool_errors": null, \n+            "tool_id": "toolshed.g2.bx.psu.edu/repos/mytest/ngsap1/differential_expression/1.0", \n+            "tool_state": "{\\"isoform_sample\\": \\"[{\\\\\\"__index__\\\\\\": 0, \\\\\\"isoform_sample_matrix\\\\\\": null, \\\\\\"sample_name\\\\\\": \\\\\\"Sample1\\\\\\"}, {\\\\\\"__index__\\\\\\": 2, \\\\\\"isoform_sample_matrix\\\\\\": null, \\\\\\"sample_name\\\\\\": \\\\\\"Sample2\\\\\\"}, {\\\\\\"__index__\\\\\\": 3, \\\\\\"isoform_sample_matrix\\\\\\": null, \\\\\\"sample_name\\\\\\": \\\\\\"Sample3\\\\\\"}, {\\\\\\"__index__\\\\\\": 4, \\\\\\"isoform_sample_matrix\\\\\\": null, \\\\\\"sample_name\\\\\\": \\\\\\"Sample4\\\\\\"}]\\", \\"__page__\\": 0, \\"est_method\\": \\"\\\\\\"RSEM\\\\\\"\\", \\"__rerun_remap_job_id__\\": null, \\"method\\": \\"\\\\\\"edgeR\\\\\\"\\"}", \n+            "tool_version": "1.0", \n+            "type": "tool", \n+            "user_outputs": [], \n+            "uuid": "ad56b1ff-e6d3-492e-b17b-72d68285ae17"\n+        }, \n+        "20": {\n+            "annotation": "", \n+            "id": 20, \n+            "input_connections": {\n+                "blastoutfile": {\n+                    "id": 18, \n+                    "output_name": "output1"\n+                }, \n+                "trinityassembledfile": {\n+                    "id": 15, \n+                    "output_name": "transdecoder_pep"\n+                }\n+            }, \n+            "inputs": [], \n+            "label": null, \n+            "name": "BLAST OUTPUT PARSER", \n+            "outputs": [\n+                {\n+                    "name": "parsed_blastfile_above_cutoff", \n+                    "type": "tabular"\n+                }, \n+                {\n+                    "name": "parsed_blastfile_below_cutoff", \n+                    "type": "tabular"\n+                }, \n+                {\n+                    "name": "oneline_file", \n+                    "type": "fasta"\n+                }, \n+                {\n+                    "name": "blastfile_below_cutoff", \n+                    "type": "fasta"\n+                }, \n+                {\n+                    "name": "blastfile_above_cutoff", \n+                    "type": "fasta"\n+                }\n+            ], \n+            "position": {\n+                "left": 1912.9999084472656, \n+                "top": 200\n+            }, \n+            "post_job_actions": {}, \n+            "tool_errors": null, \n+            "tool_id": "toolshed.g2.bx.psu.edu/repos/mytest/ngsap1/blast_parser_using_awk/0.0.1", \n+            "tool_state": "{\\"__page__\\": 0, \\"blastoutfile\\": \\"null\\", \\"evalue\\": \\"\\\\\\"1e-05\\\\\\"\\", \\"trinityassembledfile\\": \\"null\\", \\"qcovs\\": \\"\\\\\\"95\\\\\\"\\", \\"__rerun_remap_job_id__\\": null}", \n+            "tool_version": "0.0.1", \n+            "type": "tool", \n+            "user_outputs": [], \n+            "uuid": "a3e88afe-a154-43b3-8f7c-8baa37e529c0"\n+        }\n+    }, \n+    "uuid": "7bbee726-311d-420a-92f8-fed0c0d00e1a"\n+}\n'
b
diff -r 000000000000 -r cc71440b759f NGSAP-Workflow-Reference_based_workflow.ga
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/NGSAP-Workflow-Reference_based_workflow.ga Tue Sep 22 01:58:00 2015 -0400
[
b'@@ -0,0 +1,1364 @@\n+{\n+    "a_galaxy_workflow": "true", \n+    "annotation": "NGSAP workflow 2", \n+    "format-version": "0.1", \n+    "name": "Reference_based_workflow", \n+    "steps": {\n+        "0": {\n+            "annotation": "", \n+            "id": 0, \n+            "input_connections": {}, \n+            "inputs": [\n+                {\n+                    "description": "", \n+                    "name": "C1_R1"\n+                }\n+            ], \n+            "label": null, \n+            "name": "Input dataset", \n+            "outputs": [], \n+            "position": {\n+                "left": 150, \n+                "top": 440.58334350585938\n+            }, \n+            "tool_errors": null, \n+            "tool_id": null, \n+            "tool_state": "{\\"name\\": \\"C1_R1\\"}", \n+            "tool_version": null, \n+            "type": "data_input", \n+            "user_outputs": [], \n+            "uuid": "d466bcf1-44fd-48e5-b25b-24db8173941f"\n+        }, \n+        "1": {\n+            "annotation": "", \n+            "id": 1, \n+            "input_connections": {}, \n+            "inputs": [\n+                {\n+                    "description": "", \n+                    "name": "C1_R2"\n+                }\n+            ], \n+            "label": null, \n+            "name": "Input dataset", \n+            "outputs": [], \n+            "position": {\n+                "left": 169, \n+                "top": 508.58334350585938\n+            }, \n+            "tool_errors": null, \n+            "tool_id": null, \n+            "tool_state": "{\\"name\\": \\"C1_R2\\"}", \n+            "tool_version": null, \n+            "type": "data_input", \n+            "user_outputs": [], \n+            "uuid": "2a107ff8-0c09-40ec-bc7d-0b6f5b87fc8e"\n+        }, \n+        "2": {\n+            "annotation": "", \n+            "id": 2, \n+            "input_connections": {}, \n+            "inputs": [\n+                {\n+                    "description": "", \n+                    "name": "C2_R1"\n+                }\n+            ], \n+            "label": null, \n+            "name": "Input dataset", \n+            "outputs": [], \n+            "position": {\n+                "left": 127, \n+                "top": 588.58334350585938\n+            }, \n+            "tool_errors": null, \n+            "tool_id": null, \n+            "tool_state": "{\\"name\\": \\"C2_R1\\"}", \n+            "tool_version": null, \n+            "type": "data_input", \n+            "user_outputs": [], \n+            "uuid": "a030d9b3-55ed-4668-acb0-5cfffc4eabc4"\n+        }, \n+        "3": {\n+            "annotation": "", \n+            "id": 3, \n+            "input_connections": {}, \n+            "inputs": [\n+                {\n+                    "description": "", \n+                    "name": "C2_R2"\n+                }\n+            ], \n+            "label": null, \n+            "name": "Input dataset", \n+            "outputs": [], \n+            "position": {\n+                "left": 148, \n+                "top": 674.58334350585938\n+            }, \n+            "tool_errors": null, \n+            "tool_id": null, \n+            "tool_state": "{\\"name\\": \\"C2_R2\\"}", \n+            "tool_version": null, \n+            "type": "data_input", \n+            "user_outputs": [], \n+            "uuid": "ea00291e-3b19-4887-9e35-a7be6c141572"\n+        }, \n+        "4": {\n+            "annotation": "", \n+            "id": 4, \n+            "input_connections": {}, \n+            "inputs": [\n+                {\n+                    "description": "", \n+                    "name": "C3_R2"\n+                }\n+            ], \n+            "label": null, \n+            "name": "Input dataset", \n+            "outputs": [], \n+            "position": {\n+                "left": 202, \n+                "top": 836.58334350585938\n+            }, \n+            "tool_errors": null, \n+            "tool_id": null, \n+            "tool_state": "{\\"name\\": \\"C3_R2\\"}", \n+            "tool_version": null, \n+            "type": "data_input", \n+            "u'..b'n": "1.0", \n+            "type": "tool", \n+            "user_outputs": [], \n+            "uuid": "cd9576bd-5729-418d-808c-cba84fc4f597"\n+        }, \n+        "33": {\n+            "annotation": "", \n+            "id": 33, \n+            "input_connections": {\n+                "isoform_sample_0|isoform_sample_matrix": {\n+                    "id": 28, \n+                    "output_name": "rsem_isoforms"\n+                }, \n+                "isoform_sample_1|isoform_sample_matrix": {\n+                    "id": 29, \n+                    "output_name": "rsem_isoforms"\n+                }, \n+                "isoform_sample_2|isoform_sample_matrix": {\n+                    "id": 30, \n+                    "output_name": "rsem_isoforms"\n+                }, \n+                "isoform_sample_3|isoform_sample_matrix": {\n+                    "id": 31, \n+                    "output_name": "rsem_isoforms"\n+                }\n+            }, \n+            "inputs": [], \n+            "label": null, \n+            "name": "Differential Expression", \n+            "outputs": [\n+                {\n+                    "name": "de_output", \n+                    "type": "zip"\n+                }, \n+                {\n+                    "name": "output_log", \n+                    "type": "txt"\n+                }\n+            ], \n+            "position": {\n+                "left": 3247.3167419433594, \n+                "top": 1127.3999938964844\n+            }, \n+            "post_job_actions": {}, \n+            "tool_errors": null, \n+            "tool_id": "toolshed.g2.bx.psu.edu/repos/mytest/ngsap1/differential_expression/1.0", \n+            "tool_state": "{\\"isoform_sample\\": \\"[{\\\\\\"__index__\\\\\\": 0, \\\\\\"isoform_sample_matrix\\\\\\": null, \\\\\\"sample_name\\\\\\": \\\\\\"s1\\\\\\"}, {\\\\\\"__index__\\\\\\": 1, \\\\\\"isoform_sample_matrix\\\\\\": null, \\\\\\"sample_name\\\\\\": \\\\\\"s2\\\\\\"}, {\\\\\\"__index__\\\\\\": 2, \\\\\\"isoform_sample_matrix\\\\\\": null, \\\\\\"sample_name\\\\\\": \\\\\\"s3\\\\\\"}, {\\\\\\"__index__\\\\\\": 3, \\\\\\"isoform_sample_matrix\\\\\\": null, \\\\\\"sample_name\\\\\\": \\\\\\"s4\\\\\\"}]\\", \\"__page__\\": 0, \\"est_method\\": \\"\\\\\\"RSEM\\\\\\"\\", \\"__rerun_remap_job_id__\\": null, \\"method\\": \\"\\\\\\"edgeR\\\\\\"\\"}", \n+            "tool_version": "1.0", \n+            "type": "tool", \n+            "user_outputs": [], \n+            "uuid": "f050b6ce-635b-429c-91b0-0fdd7a367895"\n+        }, \n+        "34": {\n+            "annotation": "", \n+            "id": 34, \n+            "input_connections": {\n+                "query": {\n+                    "id": 32, \n+                    "output_name": "transdecoder_pep"\n+                }\n+            }, \n+            "inputs": [], \n+            "label": null, \n+            "name": "NCBI BLAST+ blastp", \n+            "outputs": [\n+                {\n+                    "name": "output1", \n+                    "type": "tabular"\n+                }\n+            ], \n+            "position": {\n+                "left": 3150.3167419433594, \n+                "top": 891.39999389648438\n+            }, \n+            "post_job_actions": {}, \n+            "tool_errors": null, \n+            "tool_id": "toolshed.g2.bx.psu.edu/repos/devteam/ncbi_blast_plus/ncbi_blastp_wrapper/0.1.01", \n+            "tool_state": "{\\"evalue_cutoff\\": \\"\\\\\\"0.001\\\\\\"\\", \\"__page__\\": 0, \\"adv_opts\\": \\"{\\\\\\"adv_opts_selector\\\\\\": \\\\\\"basic\\\\\\", \\\\\\"__current_case__\\\\\\": 0}\\", \\"__rerun_remap_job_id__\\": null, \\"blast_type\\": \\"\\\\\\"blastp\\\\\\"\\", \\"db_opts\\": \\"{\\\\\\"db_opts_selector\\\\\\": \\\\\\"db\\\\\\", \\\\\\"subject\\\\\\": \\\\\\"\\\\\\", \\\\\\"histdb\\\\\\": \\\\\\"\\\\\\", \\\\\\"__current_case__\\\\\\": 0, \\\\\\"database\\\\\\": {\\\\\\"__class__\\\\\\": \\\\\\"UnvalidatedValue\\\\\\", \\\\\\"value\\\\\\": null}}\\", \\"output\\": \\"{\\\\\\"out_format\\\\\\": \\\\\\"ext\\\\\\", \\\\\\"__current_case__\\\\\\": 1}\\", \\"query\\": \\"null\\"}", \n+            "tool_version": "0.1.01", \n+            "type": "tool", \n+            "user_outputs": [], \n+            "uuid": "66733833-c554-4f7f-bea2-5acbe7b0f039"\n+        }\n+    }, \n+    "uuid": "a38fab70-37ac-4d67-9952-68f25ea6194a"\n+}\n'
b
diff -r 000000000000 -r cc71440b759f README.rst
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/README.rst Tue Sep 22 01:58:00 2015 -0400
b
@@ -0,0 +1,18 @@
+Introduction
+============
+
+Next Generation Sequence Analysis Pipelines (NGSAP) is to provide a user friendly platform for NGS analysis to support researchers working on myriad aspects of life sciences with post processing of the next generation sequencing data. It has beed designed specifically for transcriptomics tools available through Galaxy for data analysis which can be translated into meaningful scientific publications. NGSAP is an initiative of NGSAP team working in School of Computational and Integrative Sciences at Jawaharlal Nehru University, Delhi
+
+NGSAP provides two worlflows
+
+
+Denovo Assembly and differential gene analysis workflow
+========================================================
+
+details of the workflow
+
+
+Reference based assembly and differential gene analysis workflow
+=================================================================
+details of the workflow
+
b
diff -r 000000000000 -r cc71440b759f abundance_estimates_to_matrix.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/abundance_estimates_to_matrix.xml Tue Sep 22 01:58:00 2015 -0400
b
@@ -0,0 +1,39 @@
+<tool id='abundance_estimates_to_matrix' name='abundance estimates to matrix' version='1.0'>
+<description> Generates combined Matrix for abundance estimates </description>
+<!--requirement></requirement-->
+<requirements>
+        <requirement type="package" version="2013_08_14">trinityrnaseq</requirement>
+        <requirement type="R-module">edgeR</requirement>
+        <requirement type="set_environment">TRINITY_HOME</requirement>
+
+</requirements>
+<command interpreter='perl'>\$TRINITY_HOME/util/abundance_estimates_to_matrix.pl 
+ --est_method $est_method  
+ #for $i in $isoform_sample:
+ $i.isoform_sample_matrix
+ #end for
+ &gt; $output_log 2&gt;&amp;1;
+</command>
+
+<inputs>
+ <!-- Required -->
+
+  <param name='est_method' type='select' display="radio"  label='Select est_method'>
+   <option value="RSEM" selected='true'>RSEM</option>
+   <option value="eXpress">eXpress</option>
+  </param>
+
+
+  <repeat name="isoform_sample" title="Isoform Sample" min="2">
+   <param name="isoform_sample_matrix" type="data" label="Isoform Sample Matrix"/>
+  </repeat>
+
+ <!-- Optional -->
+
+</inputs>
+<outputs>
+ <data name='matrix_count' format='tabular' label="${tool.name} on ${on_string}: matrix_count" from_work_dir="matrix.counts.matrix"/>
+ <data name='matrix_fpkm' format='tabular' label="${tool.name} on ${on_string} : matrix_fpkm" from_work_dir="matrix.TMM.fpkm.matrix"/>
+ <data name='output_log' format='txt' label="${tool.name} on ${on_string} : matrix_log"/>
+</outputs>
+</tool>
b
diff -r 000000000000 -r cc71440b759f align_and_estimate_abundance.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/align_and_estimate_abundance.xml Tue Sep 22 01:58:00 2015 -0400
[
@@ -0,0 +1,150 @@
+<tool id='id_align_and_estimate_abundance' name='align_and_estimate_abundance' version='1.0'>
+
+<description>align_and_estimate_abundance</description>
+
+<requirements>
+        <requirement type="package" version="2013_08_14">trinityrnaseq</requirement>
+        <requirement type="package" version="1.1.17">rsem</requirement>
+        <requirement type="package" version="1.5.1">eXpress</requirement>
+        <requirement type="package" version="2.1.0">bowtie2</requirement>
+        <requirement type="package" version="0.12.7">bowtie</requirement>
+        <requirement type="package" version="0.1.18">samtools</requirement>
+        <requirement type="set_environment">TRINITY_HOME</requirement>
+
+</requirements>
+<command >perl \$TRINITY_HOME/util/align_and_estimate_abundance.pl
+ --transcripts $transcripts
+ --est_method $est_method
+ --aln_method $aln_method
+ --prep_reference
+
+ ## Inputs.
+ #if str($reads.paired_or_single) == "paired":
+
+         --left $reads.left_input --right $reads.right_input
+
+         #if  $reads.left_input.ext == 'fa':
+         --seqType fa
+         #else:
+                 --seqType fq
+         #end if
+
+ ## Additional parameters.
+         #if str($reads.optional.use_options) == "yes":
+
+                 #if str($reads.optional.library_type) != "None":
+                --SS_lib_type $reads.optional.library_type
+                 #end if
+
+
+
+         #end if
+
+        #else:
+         --single $reads.input
+
+         #if  str($reads.input.ext) == 'fa':
+              --seqType fa
+         #else:
+             --seqType fq
+         #end if
+
+                ## Additional parameters.
+                #if str($reads.optional.use_option) == "yes":
+
+                        #if str($reads.additional_params.library_type) != "None":
+                         --SS_lib_type $reads.optional.library_type
+                        #end if
+
+                #end if
+ #end if
+
+## direct to output
+&gt; $align_and_estimate_abundance_log 2&gt;&amp;1;samtools sort bowtie.bam bowtie_sorted
+
+</command>
+
+<inputs>
+
+<!-- Required -->
+<param name="transcripts" type="data" format="fasta" label="Transcripts [ in fasta format ]" help="--transcripts &lt; string &gt; ; transcript fasta file"/>
+
+<param name="est_method" type="select" display="radio" label="Choose abundance estimation method" help="">
+ <option value="RSEM" selected="True">RSEM</option>
+ <option value="eXpress">eXpress</option>
+</param>
+
+<param name="aln_method" type="select" display="radio" label="Choose alignment method" help="">
+ <option value="bowtie" selected="True">bowtie</option>
+ <option value="bowtie2">bowtie2</option>
+</param>
+
+<conditional name="reads">
+ <param name="paired_or_single" type="select" label="Paired or Single-end reads?">
+ <option value="paired">Paired</option>
+ <option value="single">Single</option>
+ </param>
+
+
+ <when value="paired">
+ <param format="fastq" name="left_input" type="data" label="Left/Forward strand reads" help=""/>
+ <param format="fastq" name="right_input" type="data" label="Right/Reverse strand reads" help=""/>
+
+ <param name="seqtype" type="select" label="--seqType" help="">
+ <option value='fq' selected='true'>fastq</option>
+ <option value='fa'>fasta</option> 
+ </param>
+
+ <conditional name='optional'>
+ <param name='use_options' type='select' label='Use Optional parameters?'>
+ <option value='no'>NO</option>
+ <option value='yes'>YES</option>
+ </param>
+ <when value='no'/>
+ <when value='yes'>
+ <param name="library_type" type="select" label="Strand-specific Library Type">
+ <option value="None">None</option>
+ <option value="FR">FR</option>
+ <option value="RF">RF</option>
+ </param>
+
+
+
+ </when>
+ </conditional>
+ </when>
+
+ <when value="single">
+ <param format="fastq" name="input" type="data" label="Single-end reads" help=""/>
+ <param name="seqtype" type="select" label="--seqType" help="">
+ <option value='fq' selected='true'>fastq</option>
+ <option value='fa'>fasta</option> 
+ </param>
+
+ <conditional name='optional'>
+ <param name='use_options' type='select' label='Use Optional parameters?'>
+ <option value='no'>NO</option>
+ <option value='yes'>YES</option>
+ </param>
+ <when value='no'/>
+ <when value='yes'>
+ <param name="library_type" type="select" label="Strand-specific Library Type">
+ <option value="None">None</option>
+ <option value="F">F</option>
+ <option value="R">R</option>
+ </param>
+ </when>
+ </conditional>
+ </when>
+</conditional>
+
+</inputs>
+
+<outputs>
+ <data format="txt" name="align_and_estimate_abundance_log" label="${tool.name} on ${on_string}: log" />
+ <data format="bam" name="bowtie_bam" label="${tool.name} on ${on_string}: bam" from_work_dir="bowtie_sorted.bam" />
+ <data format="tabular"  name="rsem_isoforms"  label="${tool.name} on ${on_string}: isoforms" from_work_dir="RSEM.isoforms.results"/>
+ <data format="tabular"  name="rsem_genes" label="${tool.name} on ${on_string}: genes" from_work_dir="RSEM.genes.results"/>
+</outputs>
+</tool>
+
b
diff -r 000000000000 -r cc71440b759f all_de_steps.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/all_de_steps.xml Tue Sep 22 01:58:00 2015 -0400
b
@@ -0,0 +1,94 @@
+<tool id='differential_expression' name='Differential Expression' version='1.0'>
+<description>Generates results for DE </description>
+<!--requirement></requirement-->
+<requirements>
+        <requirement type="package" version="2013_08_14">trinityrnaseq</requirement>
+        <requirement type="set_environment">TRINITY_HOME</requirement>
+
+</requirements>
+<command>
+
+echo  -e "Differential Expression Log File" &gt; $output_log 2&gt;&amp;1;
+
+## Step 0: preprocess  input_file preparaton
+
+ #for $i in $isoform_sample:
+ cp -s $i.isoform_sample_matrix $i.sample_name;
+ #end for;
+
+
+## Step 1: abundance_estimates_to_matrix
+echo -e "" &gt;&gt;  $output_log  2&gt;&amp;1;
+echo -e "\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#" &gt;&gt;  $output_log  2&gt;&amp;1;
+echo -e "\#\# Step 1: abundance_estimates_to_matrix" &gt;&gt;  $output_log  2&gt;&amp;1;
+echo -e "" &gt;&gt;  $output_log  2&gt;&amp;1;
+
+
+perl \$TRINITY_HOME/util/abundance_estimates_to_matrix.pl 
+ --est_method $est_method  
+ #for $i in $isoform_sample:
+ $i.sample_name
+ #end for
+ &gt;&gt; $output_log 2&gt;&amp;1;
+
+
+## Step 2: run_DE_analysis 
+echo -e "" &gt;&gt;  $output_log  2&gt;&amp;1;
+echo -e "\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#" &gt;&gt;  $output_log  2&gt;&amp;1;
+echo -e "\#\# Step 2: run_DE_analysis" &gt;&gt;  $output_log  2&gt;&amp;1;
+echo -e "" &gt;&gt;  $output_log  2&gt;&amp;1;
+
+perl \$TRINITY_HOME/Analysis/DifferentialExpression/run_DE_analysis.pl
+        --matrix matrix.counts.matrix
+        --method $method
+        --output result_dir
+        &gt;&gt; $output_log 2&gt;&amp;1;
+
+## Step 3: analyze_diff_expr
+echo -e "" &gt;&gt;  $output_log  2&gt;&amp;1;
+echo -e "\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#\#" &gt;&gt;  $output_log  2&gt;&amp;1;
+echo -e "\#\# Step 3: analyze_diff_expr" &gt;&gt;  $output_log  2&gt;&amp;1;
+echo -e "" &gt;&gt;  $output_log  2&gt;&amp;1;
+
+cd result_dir &amp;&amp; perl \$TRINITY_HOME/Analysis/DifferentialExpression/analyze_diff_expr.pl
+
+ --matrix ../matrix.TMM.fpkm.matrix
+
+        &gt;&gt; $output_log 2&gt;&amp;1;
+
+pwd;
+cd .. &amp;&amp; zip -r results.zip result_dir;
+</command>
+
+<inputs>
+ <!-- Required -->
+
+  <param name='est_method' type='select' display="radio"  label='Select est_method'>
+   <option value="RSEM" selected='true'>RSEM</option>
+   <option value="eXpress">eXpress</option>
+  </param>
+
+
+  <repeat name="isoform_sample" title="Isoform Sample" min="2">
+         <param name="sample_name" type="text" label="Sample Name" help="Only alpha-numerical name without space."> 
+   <validator type="empty_field" message="don't leave the field empty!"/> 
+  </param>
+ <param format="tabular" name="isoform_sample_matrix" type="data" label="Isoform Sample Matrix"/>
+  </repeat>
+
+  <param name='method' type="select" label="Select Method" >
+         <option value="edgeR">edgeR</option>
+         <option value="DESeq">DESeq</option>
+         <option value="DESeq2">DESeq2</option>
+  </param>
+
+
+
+ <!-- Optional -->
+
+</inputs>
+<outputs>
+ <data name='de_output' format='zip' label="${tool.name} on ${on_string}: compressed_output" from_work_dir="results.zip"/>
+ <data name='output_log' format='txt' label="${tool.name} on ${on_string} : matrix_log"/>
+</outputs>
+</tool>
b
diff -r 000000000000 -r cc71440b759f blast_parser.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/blast_parser.xml Tue Sep 22 01:58:00 2015 -0400
[
@@ -0,0 +1,59 @@
+<?xml version="1.0"?>
+<tool id="blast_parser_using_awk" name="BLAST OUTPUT PARSER" version="0.0.1">
+
+<description>parses Blast Output File</description>
+
+<command>
+   /bin/awk 
+   'BEGIN {FS="\t"} {if($11 &lt;= $evalue &amp;&amp;  $13 &gt;= $qcovs) print $0 }'  
+   $blastoutfile  
+   &gt; $parsed_blastfile_above_cutoff;
+
+   /bin/awk 
+   '{FS="\t"} {if($11 &gt; $evalue ||  $13 &lt; $qcovs) print $0 }'  
+   $blastoutfile 
+   &gt; $parsed_blastfile_below_cutoff;
+
+   /bin/sed -e '/^&gt;/s/$/@@@@/' -e 's/^&gt;/#/' $trinityassembledfile 
+      |  tr -d '\n' 
+      |  tr "#" '\n' 
+      |  sed -e 's/^/&gt;/' -e 's/@@@@/\n/' 
+      |  sed -e  "1d"  
+      &gt; $oneline_file;
+
+   /bin/awk 
+   'BEGIN {FS="|"} {print "grep -w -A 1 \""$1"\" $oneline_file &gt;&gt; $blastfile_below_cutoff"}' 
+   $parsed_blastfile_below_cutoff  
+   &gt; pick_below_sh;
+
+   /bin/sh pick_below_sh;
+
+   /bin/awk 
+   'BEGIN {FS="|"} {print "grep -w -A 1 \""$1"\" $oneline_file &gt;&gt; $blastfile_above_cutoff"}' 
+   $parsed_blastfile_above_cutoff  
+   &gt; pick_above_sh;
+   
+   /bin/sh pick_above_sh;
+   
+</command>
+
+<inputs>
+ <param name="blastoutfile" type="data" format="tabular" label="blast output file"/>
+ <param name="trinityassembledfile" type="data" format="fasta" label="Trinity Assembled [fasta file]" /> 
+ <param name="evalue" type="float"  value='1e-05'  label="EVALUE" help="default (evalue &lt; = 1e-05)"/>
+ <param name="qcovs" type="integer"  value='95'  label="Query Coverage" help="default (qcovs &gt;  = 95)"/>
+</inputs>

+<outputs>
+ <data name="parsed_blastfile_above_cutoff" format="tabular" label="parsed_blastfile (Above Cutoff Value)" />
+ <data name="parsed_blastfile_below_cutoff" format="tabular" label="parsed_blastfile (Below cutoff Value)" />
+ <data name="oneline_file" format="fasta" label="parsed_trinity_assembled_file (oneline_file)" />
+ <data name="blastfile_below_cutoff" format="fasta" label="blast fasta file (Below cutoff Value)" />
+ <data name="blastfile_above_cutoff" format="fasta" label="blast fasta file (Above cutoff Value)" />
+</outputs>
+
+<tests/>
+<help>blast output parser tool</help>
+
+
+</tool>
b
diff -r 000000000000 -r cc71440b759f gtf2fasta.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/gtf2fasta.xml Tue Sep 22 01:58:00 2015 -0400
b
@@ -0,0 +1,30 @@
+<tool id='id_gtf2fasta' name='gtf2fasta' version='1.0'>
+
+<description>
+        Converts gtf  to fasta
+</description>
+ <requirements>
+ <requirement type="package" version="2.0.9">tophat2</requirement>
+ </requirements>
+
+<command >gtf_to_fasta $gtf $genome $fasta</command>
+
+<inputs>
+        <param name='gtf' type='data' format="gtf"  optional='false' label='gtf_file' help='input gtf file'/>
+        <param name='genome' type='data' format="fasta" optional='false' label='genome_file' help='input genome'/>
+</inputs>
+
+
+<outputs>
+        <data format='fasta' name='fasta' label='fasta file'/>
+</outputs>
+
+
+<help>
+**What it does**
+  Converts gtf file to fasta using reference genome
+
+</help>
+
+</tool>
+
b
diff -r 000000000000 -r cc71440b759f insilico_read_normalization.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/insilico_read_normalization.xml Tue Sep 22 01:58:00 2015 -0400
b
@@ -0,0 +1,152 @@
+<?xml version="1.0"?>
+<tool id="insilico_read_nomalization" name="Insilico Read Normalization" version="0.0.1">
+
+<description>Read Normalization</description>
+<requirements>
+        <requirement type="package" version="2013_08_14">trinityrnaseq</requirement>
+        <requirement type="set_environment">TRINITY_HOME</requirement>
+
+</requirements>
+<command interperter="perl"> \$TRINITY_HOME/util/insilico_read_normalization.pl
+--JM $JM
+--max_cov $maximum_coverage
+
+## Inputs.
+#if str($inputs.paired_or_single) == "paired":
+
+ --left $inputs.left_input --right $inputs.right_input
+
+ #if  $inputs.left_input.ext == 'fa':
+ --seqType fa
+ #else:
+ --seqType fq
+ #end if
+
+ ## Additional parameters.
+ #if str($inputs.additional_params.use_additional) == "yes":
+
+ #if str($inputs.additional_params.library_type) != "None":
+ --SS_lib_type $inputs.additional_params.library_type
+ #end if
+
+ $inputs.additional_params.pairs_together
+ --CPU $inputs.additional_params.CPU
+ $inputs.additional_params.PARALLEL_STATS
+ --KMER_SIZE $inputs.additional_params.KMER_SIZE
+ --max_pct_stdev $inputs.additional_params.max_pct_stdev
+
+ #end if
+
+
+#else:
+
+ --single $inputs.input
+
+ #if  str($inputs.input.ext) == 'fa':
+ --seqType fa
+ #else:
+ --seqType fq
+ #end if
+
+ ## Additional parameters.
+ #if str($inputs.additional_params.use_additional) == "yes":
+
+ #if str($inputs.additional_params.library_type) != "None":
+ --SS_lib_type $inputs.additional_params.library_type
+ #end if
+
+ ##$inputs.additional_params.pairs_together
+ --CPU $inputs.additional_params.CPU
+ ##$inputs.additional_params.PARALLEL_STATS
+ --KMER_SIZE $inputs.additional_params.KMER_SIZE
+ --max_pct_stdev $inputs.additional_params.max_pct_stdev
+
+ #end if
+
+#end if
+
+
+
+## direct to output
+&gt; $insilico_read_normalization_log 2&gt;&amp;1
+
+</command>
+
+<inputs>
+ <param name="JM" type="select" label="JM" help="--JM &lt; string &gt; ; Amount of memory to allocate to Jellyfish for Kmer catalog construction">
+ <option value="1G">1G</option>
+ <option value="10G">10G</option>
+ <option value="20G">20G</option>
+ <option value="50G">50G</option>
+ </param>
+
+ <param name="maximum_coverage" type="integer" value="25" label="Maximum Coverage" help="--max_cov &lt; int &gt; ; targeted maximum coverage for reads"/>
+
+ <conditional name="inputs">
+ <param name="paired_or_single" type="select" label="Paired or Single-end data?">
+ <option value="paired">Paired</option>
+ <option value="single">Single</option>
+ </param>
+
+ <when value="paired">
+ <param format="fasta,fastq" name="left_input" type="data" label="Left/Forward strand reads" help=""/>
+ <param format="fasta,fastq" name="right_input" type="data" label="Right/Reverse strand reads" help=""/>
+
+ <conditional name="additional_params">
+ <param name="use_additional" type="select" label="Use Additional Params?">
+ <option value="no">No</option>
+ <option value="yes">Yes</option>
+ </param>
+ <when value="no"/>
+ <when value="yes">
+ <param name="library_type" type="select" label="Strand-specific Library Type">
+ <option value="None">None</option>
+ <option value="FR">FR</option>
+ <option value="RF">RF</option>
+ </param>
+ <param name="pairs_together" type="boolean" label="--pairs_together" help="process paired reads by averaging stats between pairs and retaining linking info" truevalue="--pairs_together" falsevalue="" checked="true" />
+ <param name="CPU" type="integer" value="2" min="1" max="30" label="CPU" help="--CPU &lt; int &gt; ; Number of CPUs to use (Maximum limit is 30 core)" />
+ <param name="PARALLEL_STATS" type="boolean" label="--PARALLEL_STATS"  help="Generate read stats in parallel for paired reads" truevalue="--PARALLEL_STATS" falsevalue="" checked="true" />
+ <param name="KMER_SIZE" type="integer"  value="25" label="--KMER SIZE" help="Default is 25" />
+ <param name="max_pct_stdev" type="integer"  value="200" label="--max_pct_stdev" help="maximum pct of mean for stdev of kmer coverage across read"/>
+ </when>
+ </conditional>
+ </when>
+
+ <when value="single">
+ <param format="fasta,fastq" name="input" type="data" label="Single-end reads" help=""/>
+
+ <conditional name="additional_params">
+ <param name="use_additional" type="select" label="Use Additional Params?">
+ <option value="no">No</option>
+ <option value="yes">Yes</option>
+ </param>
+ <when value="no"/>
+ <when value="yes">
+ <param name="library_type" type="select" label="Strand-specific Library Type">
+ <option value="None">None</option>
+ <option value="F">F</option>
+ <option value="R">R</option>
+ </param>
+ <param name="CPU" type="integer" value="2" min="1" max="30" label="CPU" help="--CPU &lt; int &gt; ; Number of CPUs to use (Maximum limit is 30 core)" />
+ <param name="KMER_SIZE" type="integer"  value="25" label="--KMER SIZE" help="Default is 25" />
+ <param name="max_pct_stdev" type="integer"  value="200" label="--max_pct_stdev" help="maximum pct of mean for stdev of kmer coverage across read"/>
+ </when>
+ </conditional>
+ </when>
+ </conditional>
+
+
+</inputs>
+
+<outputs>
+<data format="txt" name="insilico_read_normalization_log" label="${tool.name} on ${on_string}: log" />
+<data format="fastq"  name="left_normalized_read"  label="${tool.name} on ${on_string}: Left  Read" from_work_dir="left.norm.fq"/>
+<data format="fastq"  name="right_normalized_read" label="${tool.name} on ${on_string}: Right Read" from_work_dir="right.norm.fq"/>
+</outputs>
+
+
+<tests/>
+<help>Insilico Read Normalization</help>
+
+</tool>
b
diff -r 000000000000 -r cc71440b759f pfam_db.loc.sample
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/pfam_db.loc.sample Tue Sep 22 01:58:00 2015 -0400
b
@@ -0,0 +1,3 @@
+
+###1_name       ###2_date       ###2_path_to_db
+pfam_db.hmm july 2014 /home/username/galaxy-dist/tool-data/pfam_db.hmm
b
diff -r 000000000000 -r cc71440b759f tool_dependencies.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/tool_dependencies.xml Tue Sep 22 01:58:00 2015 -0400
b
b'@@ -0,0 +1,336 @@\n+<?xml version="1.0"?>\n+<tool_dependency>\n+    <package name="trinityrnaseq" version="2013_08_14">\n+        <install version="1.0">\n+            <actions>\n+                <action type="download_by_url">http://ngsaptools.osdd.jnu.ac.in/ngsap/trinityrnaseq_r20140717.tar.gz</action>\n+                <action type="shell_command">make</action>\n+                <action type="move_directory_files">\n+                    <source_directory>.</source_directory>\n+                    <destination_directory>$INSTALL_DIR</destination_directory>\n+                </action>\n+                <action type="set_environment">\n+                    <environment_variable name="PATH" action="prepend_to">$INSTALL_DIR</environment_variable>\n+                </action>\n+                <action type="set_environment">\n+                    <environment_variable name="TRINITY_HOME" action="set_to">$INSTALL_DIR</environment_variable>\n+                </action>\n+            </actions>\n+        </install>\n+        <readme>\n+        </readme>\n+    </package>\n+ <package name="samtools" version="0.1.18">\n+        <install version="1.0">\n+            <actions_group>\n+                <actions os="linux" architecture="i386">\n+                    <action type="download_by_url" target_filename="samtools-0.1.18.tgz">http://depot.galaxyproject.org/package/linux/i386/samtools/samtools-0.1.18-linux-i386.tgz</action>\n+                    <action type="move_directory_files">\n+                        <source_directory>.</source_directory>\n+                        <destination_directory>$INSTALL_DIR</destination_directory>\n+                    </action>\n+                </actions>\n+                <actions os="linux" architecture="x86_64">\n+                    <action type="download_by_url" target_filename="samtools-0.1.18.tgz">http://depot.galaxyproject.org/package/linux/x86_64/samtools/samtools-0.1.18-linux-x86_64.tgz</action>\n+                    <action type="move_directory_files">\n+                        <source_directory>.</source_directory>\n+                        <destination_directory>$INSTALL_DIR</destination_directory>\n+                    </action>\n+                </actions>\n+                <actions os="darwin" architecture="i386">\n+                    <action type="download_by_url" target_filename="samtools-0.1.18.tgz">http://depot.galaxyproject.org/package/darwin/i386/samtools/samtools-0.1.18-Darwin-i386.tgz</action>\n+                    <action type="move_directory_files">\n+                        <source_directory>.</source_directory>\n+                        <destination_directory>$INSTALL_DIR</destination_directory>\n+                    </action>\n+                </actions>\n+                <actions os="darwin" architecture="x86_64">\n+                    <action type="download_by_url" target_filename="samtools-0.1.18.tgz">http://depot.galaxyproject.org/package/darwin/x86_64/samtools/samtools-0.1.18-Darwin-x86_64.tgz</action>\n+                    <action type="move_directory_files">\n+                        <source_directory>.</source_directory>\n+                        <destination_directory>$INSTALL_DIR</destination_directory>\n+                    </action>\n+                </actions>\n+                <actions>\n+                    <action type="download_by_url">http://depot.galaxyproject.org/package/source/samtools/samtools-0.1.18.tar.bz2</action>\n+                    <action type="shell_command">sed -i.bak \'s/-lcurses/-lncurses/\' Makefile</action>\n+                    <action type="shell_command">make</action>\n+                    <action type="move_file">\n+                        <source>samtools</source>\n+                        <destination>$INSTALL_DIR/bin</destination>\n+                    </action>\n+                    <action type="move_file">\n+                        <source>libbam.a</source>\n+                        <destination>$INSTALL_DIR/lib</destination>\n+                    </action>\n+                    <action type="'..b'                   <action type="move_directory_files">\n+                        <source_directory>.</source_directory>\n+                        <destination_directory>$INSTALL_DIR</destination_directory>\n+                    </action>\n+                </actions>\n+                <actions os="darwin" architecture="x86_64">\n+                    <action type="download_by_url">http://depot.galaxyproject.org/package/darwin/x86_64/bowtie2/bowtie2-2.1.0-macos-x86_64.tgz</action>\n+                    <action type="move_directory_files">\n+                        <source_directory>.</source_directory>\n+                        <destination_directory>$INSTALL_DIR</destination_directory>\n+                    </action>\n+                </actions>\n+                <actions os="linux" architecture="i386">\n+                    <action type="download_by_url">http://depot.galaxyproject.org/package/linux/i386/bowtie2/bowtie2-2.1.0-linux-i386.tgz</action>\n+                    <action type="move_directory_files">\n+                        <source_directory>.</source_directory>\n+                        <destination_directory>$INSTALL_DIR</destination_directory>\n+                    </action>\n+                </actions>\n+                <actions os="darwin" architecture="i386">\n+                    <action type="download_by_url">http://depot.galaxyproject.org/package/darwin/i386/bowtie2/bowtie2-2.1.0-macos-i386.tgz</action>\n+                    <action type="move_directory_files">\n+                        <source_directory>.</source_directory>\n+                        <destination_directory>$INSTALL_DIR</destination_directory>\n+                    </action>\n+                </actions>\n+                <actions>\n+                    <action type="download_by_url">http://downloads.sourceforge.net/project/bowtie-bio/bowtie2/2.1.0/bowtie2-2.1.0-source.zip</action>\n+                    <action type="shell_command">make</action>\n+                    <action type="move_file">\n+                        <source>bowtie2</source>\n+                        <destination>$INSTALL_DIR</destination>\n+                    </action>\n+                    <action type="move_file">\n+                        <source>bowtie2-align</source>\n+                        <destination>$INSTALL_DIR</destination>\n+                    </action>\n+                    <action type="move_file">\n+                        <source>bowtie2-build</source>\n+                        <destination>$INSTALL_DIR</destination>\n+                    </action>\n+                    <action type="move_file">\n+                        <source>bowtie2-inspect</source>\n+                        <destination>$INSTALL_DIR</destination>\n+                    </action>\n+                </actions>\n+                <action type="set_environment">\n+                    <environment_variable name="PATH" action="prepend_to">$INSTALL_DIR</environment_variable>\n+                </action>\n+            </actions_group>\n+        </install>\n+        <readme></readme>\n+    </package>\n+<package name="tophat2" version="2.0.9">\n+<repository toolshed="http://toolshed.g2.bx.psu.edu" name="tophat2" owner="devteam" changeset_revision="ae06af1118dc" />\n+</package>\n+<package name="fastq_groomer" version="1.0.0">\n+<repository toolshed="http://toolshed.g2.bx.psu.edu" name="fastq_groomer" owner="devteam" changeset_revision="1298445c852b" />\n+</package>\n+<package name="blast+" version="2.2.29">\n+        <repository toolshed="http://toolshed.g2.bx.psu.edu" name="ncbi_blast_plus" owner="devteam" changeset_revision="2fe07f50a41e" />\n+    </package>\n+<package name="cufflinks" version="2.1.1">\n+        <repository toolshed="http://toolshed.g2.bx.psu.edu" name="cufflinks" owner="devteam" changeset_revision="9aab29e159a7" />\n+    </package>\n+<package name="cufflinks" version="2.2.1">\n+        <repository toolshed="http://toolshed.g2.bx.psu.edu" name="cuffmerge" owner="devteam" changeset_revision="b6e3849293b1" />\n+    </package>\n+</tool_dependency>\n+\n'
b
diff -r 000000000000 -r cc71440b759f transDecoder.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/transDecoder.xml Tue Sep 22 01:58:00 2015 -0400
[
@@ -0,0 +1,120 @@
+<tool id='id_transDecoder' name='transDecoder' version='1.0'>
+<description> coding region </description>
+<!--requirement></requirement-->
+<requirements>
+        <requirement type="package" version="2013_08_14">trinityrnaseq</requirement>
+        <requirement type="set_environment">TRINITY_HOME</requirement>
+
+</requirements>
+<command>perl \$TRINITY_HOME/trinity-plugins/transdecoder/TransDecoder
+
+ -t $transcript
+
+ #if str($optional.parameters) == 'yes':
+ #if ($train):
+ --train $train
+ #end if
+
+ #if ($min_protein_length):
+ -m $min_protein_length
+ #end if
+
+ #if ($genetic_code):
+ -G $genetic_code
+ #end if
+
+ #if ($strand-specific):
+ $strand-specific
+ #end if
+
+ #if ($lottmn):
+ -T $lottmm
+ #end if
+
+ #if ($retain_long_orfs):
+ --retain_long_orfs $retain_long_orfs
+ #end if
+ #end if
+
+ #if str($pfam.options) == 'yes':
+ #if ($pfam_db):
+ --search_pfam $pfam_db
+ #end if
+
+ #if ($CPU):
+ --CPU $CPU
+ #end if
+ #end if
+
+ ##log file
+ &gt; $transdecoder_log 2&gt;&amp;1;
+
+
+ ## output renaming
+
+ cp -s dataset_*.dat.transdecoder.pep transcript.transdecoder.pep;
+ cp -s dataset_*.dat.transdecoder.cds transcript.transdecoder.cds;
+ cp -s dataset_*.dat.transdecoder.bed transcript.transdecoder.bed;
+ cp -s dataset_*.dat.transdecoder.gff3 transcript.transdecoder.gff3;
+ cp -s dataset_*.dat.transdecoder.mRNA transcript.transdecoder.mRNA;
+</command>
+
+<inputs>
+ <!-- Required -->
+
+  <param name='transcript' type='data' label='Transcripts [ in fasta format ]' help=' -t &lt; string &gt; ; Assembled reads in fasta file format'/>
+
+ <!-- Optional -->
+
+ <conditional name='optional'>
+  <param name='parameters' type='select' label='Use Optional Parameters'>
+  <option value='no'>NO</option>
+  <option value='yes'>YES</option>
+  </param>
+  <when value='no'/>
+ <when value='yes'>
+   <param name='train' type='data' optional='true' label='FASTA file with ORFs to train Markov Mod for protein identification' help='--train &lt; string &gt; ; FASTA file with ORFs to train Markov Mod for protein identification; otherwise longest non-redundant ORFs used' />
+ <param name='min_protein_length' type='integer' optional='true' value='100' label='Minimum Protein Length' help='-m &lt; int &gt; ;minimum protein length (default: 100)'/>
+ <param name='genetic_code' type='select' optional='true' label='Select Genetic Code' help=' -G &lt; string &gt; ; genetic code (default is "universal")'>
+ <option value='universal' selected='true'>Universal</option>
+ <option value='Euplotes'>Euplotes</option>
+ <option value='Tetrahymena'>Tetrahymena</option>
+ <option value='Candida'>Candida</option>
+ <option value='Acetabularia'>Acetabularia</option>
+   </param>
+   <param name='strand-specific' type='boolean' truevalue='-S' falsevalue='' optional='true' label='Strand-Specific [ -S ]' help='strand-specific (only analyzes top strand)'/> 
+   <param name='lottmm' type='integer' optional='true' value='500' label=' -T ; Needs a label ??? ' help='-T &lt; int &gt; ; If no --train, top longest ORFs to train Markov Model (hexamer stats) (default: 500)'/>
+   <param name='retain_long_orfs' type="integer" optional='true' value="900" label=' --retain_long_orfs ; Needs a label ??? ' help='--retain_long_orfs &lt; int &gt; ; Retain all ORFs found that are equal or longer than these many nucleotides even if no other evidence marks it as coding (default: 900 bp => 300aa)' />
+  </when>
+ </conditional>
+
+
+ <!-- Pfam Options -->
+
+ <conditional name='pfam'>
+ <param name='options' type='select' label='Use Pfam Options [ Optional ]'>
+ <option value='no'>NO</option>
+ <option value='yes'>YES</option>
+ </param>
+ <when value='no'/>
+ <when value='yes'>
+ <param name='pfam_db' type='select' label='Search pfam database' help=' --search_pfam  &lt; pfam_db.hmm &gt; ; /path/to/pfam_db.hmm to search using hmmscan'>
+     <options from_file="pfam_db.loc">
+ <column name="name" index="0"/>
+           <column name="value" index="2"/>
+ </options>
+ </param>
+ <param name='CPU' type='integer' value='2'  label='CPU' help='--CPU &lt; int &gt; Number of CPU for the job'/>
+ </when>
+  </conditional>
+
+</inputs>
+<outputs>
+ <data name='transdecoder_pep' format='fasta' label="${tool.name} on ${on_string}: pep" from_work_dir="transcript.transdecoder.pep"/>
+ <data name='transdecoder_cds' format='fasta' label="${tool.name} on ${on_string}: cds" from_work_dir="transcript.transdecoder.cds"/>
+ <data name='transdecoder_bed' format='bed' label="${tool.name} on ${on_string}: bed" from_work_dir="transcript.transdecoder.bed"/>
+ <data name='transdecoder_gff3' format='tabular' label="${tool.name} on ${on_string}: gff3" from_work_dir="transcript.transdecoder.gff3"/>
+ <data name='transdecoder_mRNA' format='fasta' label="${tool.name} on ${on_string}: mRNA" from_work_dir="transcript.transdecoder.mRNA"/>
+ <data name='transdecoder_log' format='txt' label="${tool.name} on ${on_string}: log" />
+</outputs>
+</tool>
b
diff -r 000000000000 -r cc71440b759f trinityStats.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/trinityStats.xml Tue Sep 22 01:58:00 2015 -0400
b
@@ -0,0 +1,25 @@
+<tool id='id_trinity_stats' name='Trinity Stats' version='1.0'>
+<description> check stats...  </description>
+
+<requirements>
+        <requirement type="package" version="2013_08_14">trinityrnaseq</requirement>
+        <requirement type="set_environment">TRINITY_HOME</requirement>
+
+</requirements>
+<command >perl \$TRINITY_HOME/util/TrinityStats.pl  $fastafile 
+&gt; $statsfile 2&gt;&amp;1;
+</command>
+
+<inputs>
+ <!-- Required -->
+
+  <param name='fastafile'  type="data" format="fasta"  label='fastafile' help='Assembled fasta file'>
+  </param>
+
+ <!-- Optional -->
+
+</inputs>
+<outputs>
+<data name='statsfile' format='text' label="${tool.name} on ${on_string}: "/>
+</outputs>
+</tool>
b
diff -r 000000000000 -r cc71440b759f trinityrnaseq.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/trinityrnaseq.xml Tue Sep 22 01:58:00 2015 -0400
b
@@ -0,0 +1,131 @@
+<tool id="trinityrnaseq" name="Trinity" version="0.0.1">
+
+    <!-- Written by Jeremy Goecks, now maintained here by bhaas -->
+    <description>De novo assembly of RNA-Seq data Using Trinity</description>
+ <requirements>
+        <requirement type="package" version="2013_08_14">trinityrnaseq</requirement>
+        <requirement type="package" version="0.1.18">samtools</requirement>
+        <requirement type="package" version="0.12.7">bowtie</requirement>
+        <requirement type="set_environment">TRINITY_HOME</requirement>
+
+</requirements>
+    <command>
+        \$TRINITY_HOME/Trinity --JM $JM --CPU $CPU
+        
+        ## Inputs.
+        #if str($inputs.paired_or_single) == "paired":
+            --left $inputs.left_input --right $inputs.right_input
+            #if  $inputs.left_input.ext == 'fa':
+                --seqType fa
+            #else:
+                --seqType fq
+            #end if
+            #if str($inputs.library_type) != "None":
+                --SS_lib_type $inputs.library_type
+            #end if
+ --group_pairs_distance $inputs.group_pairs_distance
+        #else:
+            --single $inputs.input
+            #if  str($inputs.input.ext) == 'fa':
+                --seqType fa
+            #else:
+                --seqType fq
+            #end if
+            #if str($inputs.library_type) != "None":
+                --SS_lib_type $inputs.library_type
+            #end if
+        #end if
+
+        ## Additional parameters.
+        #if str($additional_params.use_additional) == "yes":
+ --min_kmer_cov $inputs.min_kmer_cov --max_reads_per_graph $inputs.max_reads_per_graph --bflyHeapSpaceMax $input.bflyHeapSpaceMax
+ #if $inputs.bfly_opts != 'None':
+ --bfly_opts " $inputs.bfly_opts "
+ #end if
+        #end if
+
+                
+        ## direct to output
+        > $trinity_log 2>&amp;1

+    </command>
+    <inputs>
+       <param name="JM" type="select" label="JM" help="Amount of memory to allocate to Jellyfish for Kmer catalog construction">
+ <option value="1G">1G</option>
+ <option value="10G">10G</option>
+ <option value="50G">50G</option>
+ <option value="100G">100G</option>
+ <option value="200G">200G</option>
+ <option value="500G">500G</option>
+ </param>
+
+ <param name="CPU" type="integer" value="2" min="1" label="CPU" help="Number of CPUs to use by Trinity" />
+
+
+        <conditional name="inputs">
+     <param name="paired_or_single" type="select" label="Paired or Single-end data?">
+                <option value="paired">Paired</option>
+                <option value="single">Single</option>
+            </param>
+            <when value="paired">
+                <param format="fasta,fastq" name="left_input" type="data" label="Left/Forward strand reads" help=""/>
+                <param format="fasta,fastq" name="right_input" type="data" label="Right/Reverse strand reads" help=""/>
+                <param name="library_type" type="select" label="Strand-specific Library Type">
+                    <option value="None">None</option>
+                    <option value="FR">FR</option>
+                    <option value="RF">RF</option>
+                </param>
+                <param name="group_pairs_distance" type="integer" value="500" min="1" label="Group pairs distance" help="Maximum length expected between fragment pairs"/>
+         <param name="path_reinforcement_distance" type="integer" value="75" min="1" label="Path reinforcement distance" help="Minimum read overlap required for path extension in the graph" />    
+
+            </when>
+            <when value="single">
+                <param format="fasta,fastq" name="input" type="data" label="Single-end reads" help=""/>
+                <param name="library_type" type="select" label="Strand-specific Library Type">
+                    <option value="None">None</option>
+                    <option value="F">F</option>
+                    <option value="R">R</option>
+                </param>
+             <param name="path_reinforcement_distance" type="integer" value="40" min="1" label="Path reinforcement distance" help="Minimum read overlap required for path extension in the graph" />    
+            </when>
+        </conditional>
+    
+ <conditional name="additional_params">
+            <param name="use_additional" type="select" label="Use Additional Params?">
+                <option value="no">No</option>
+                <option value="yes">Yes</option>
+            </param>
+            <when value="no">
+            </when>
+            <when value="yes">            
+ <param name="min_kmer_cov" type="integer" value="1" min="1" label="inchworm_min_kmer_cov" help="Minimum kmer coverage required by Inchworm for initial contig construction" />
+ <param name="max_reads_per_graph" type="integer" value="20000000" min="10000" label="chrysalis_max_reads_per_graph" help="Maximum number of reads to be anchored within each transcript graph by Chrysalis" />
+
+
+ <param name="bfly_opts" type="text" value="None" label="bfly_opts" help="Options to pass on to Butterfly" />
+ <param name="bflyHeapSpaceMax" type="select" label="bflyHeapSpaceMax" help="Java heap space maximum value for Butterfly">
+ <option value="1G">1G</option>
+ <option value="2G">2G</option>
+ <option value="4G" selected="true">4G</option>
+ <option value="10G">10G</option>
+ <option value="20G">20G</option>
+ </param>
+
+               <param name="min_contig_length" type="integer" value="200" min="1" label="Minimum Contig Length" help=""/>
+            </when>
+        </conditional>
+    
+
+    </inputs>
+    <outputs>
+        <data format="txt" name="trinity_log" label="${tool.name} on ${on_string}: log" />
+        <data format="fasta" name="assembled_transcripts" label="${tool.name} on ${on_string}: Assembled Transcripts" from_work_dir="trinity_out_dir/Trinity.fasta"/>
+    </outputs>
+    <tests>
+    </tests>
+    <help>
+        Trinity is a de novo transcript assembler that uses RNA-seq data as input. This tool runs all Trinity_ commands--Inchworm, Chrysalis, and Butterfly--in a single pass.
+        
+        .. _Trinity: http://trinityrnaseq.sourceforge.net
+    </help>
+</tool>
b
diff -r 000000000000 -r cc71440b759f trinityrnaseq.xml~
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/trinityrnaseq.xml~ Tue Sep 22 01:58:00 2015 -0400
b
@@ -0,0 +1,131 @@
+<tool id="trinityrnaseq" name="Trinity" version="0.0.1">
+
+    <!-- Written by Jeremy Goecks, now maintained here by bhaas -->
+    <description>De novo assembly of RNA-Seq data Using Trinity</description>
+ <requirements>
+        <requirement type="package" version="2013_08_14">trinityrnaseq</requirement>
+        <requirement type="package" version="0.1.18">samtools</requirement>
+        <requirement type="package" version="0.12.7">bowtie</requirement>
+        <requirement type="set_environment">TRINITY_HOME</requirement>
+
+</requirements>
+    <command>
+        \$TRINITY_HOME/Trinity --JM $JM --CPU $CPU
+        
+        ## Inputs.
+        #if str($inputs.paired_or_single) == "paired":
+            --left $inputs.left_input --right $inputs.right_input
+            #if  $inputs.left_input.ext == 'fa':
+                --seqType fa
+            #else:
+                --seqType fq
+            #end if
+            #if str($inputs.library_type) != "None":
+                --SS_lib_type $inputs.library_type
+            #end if
+ --group_pairs_distance $inputs.group_pairs_distance
+        #else:
+            --single $inputs.input
+            #if  str($inputs.input.ext) == 'fa':
+                --seqType fa
+            #else:
+                --seqType fq
+            #end if
+            #if str($inputs.library_type) != "None":
+                --SS_lib_type $inputs.library_type
+            #end if
+        #end if
+
+        ## Additional parameters.
+        #if str($additional_params.use_additional) == "yes":
+ --min_kmer_cov $inputs.min_kmer_cov --max_reads_per_graph $inputs.max_reads_per_graph --bflyHeapSpaceMax $input.bflyHeapSpaceMax
+ #if $inputs.bfly_opts != 'None':
+ --bfly_opts " $inputs.bfly_opts "
+ #end if
+        #end if
+
+                
+        ## direct to output
+        > $trinity_log 2>&amp;1

+    </command>
+    <inputs>
+       <param name="JM" type="select" label="JM" help="Amount of memory to allocate to Jellyfish for Kmer catalog construction">
+ <option value="1G">1G</option>
+ <option value="10G">10G</option>
+ <option value="50G">50G</option>
+ <option value="100G">100G</option>
+ <option value="200G">200G</option>
+ <option value="500G">500G</option>
+ </param>
+
+ <param name="CPU" type="integer" value="2" min="1" label="CPU" help="Number of CPUs to use by Trinity" />
+
+
+        <conditional name="inputs">
+     <param name="paired_or_single" type="select" label="Paired or Single-end data?">
+                <option value="paired">Paired</option>
+                <option value="single">Single</option>
+            </param>
+            <when value="paired">
+                <param format="fasta,fastq" name="left_input" type="data" label="Left/Forward strand reads" help=""/>
+                <param format="fasta,fastq" name="right_input" type="data" label="Right/Reverse strand reads" help=""/>
+                <param name="library_type" type="select" label="Strand-specific Library Type">
+                    <option value="None">None</option>
+                    <option value="FR">FR</option>
+                    <option value="RF">RF</option>
+                </param>
+                <param name="group_pairs_distance" type="integer" value="500" min="1" label="Group pairs distance" help="Maximum length expected between fragment pairs"/>
+         <param name="path_reinforcement_distance" type="integer" value="75" min="1" label="Path reinforcement distance" help="Minimum read overlap required for path extension in the graph" />    
+
+            </when>
+            <when value="single">
+                <param format="fasta,fastq" name="input" type="data" label="Single-end reads" help=""/>
+                <param name="library_type" type="select" label="Strand-specific Library Type">
+                    <option value="None">None</option>
+                    <option value="F">F</option>
+                    <option value="R">R</option>
+                </param>
+             <param name="path_reinforcement_distance" type="integer" value="40" min="1" label="Path reinforcement distance" help="Minimum read overlap required for path extension in the graph" />    
+            </when>
+        </conditional>
+    
+ <conditional name="additional_params">
+            <param name="use_additional" type="select" label="Use Additional Params?">
+                <option value="no">No</option>
+                <option value="yes">Yes</option>
+            </param>
+            <when value="no">
+            </when>
+            <when value="yes">            
+ <param name="min_kmer_cov" type="integer" value="1" min="1" label="inchworm_min_kmer_cov" help="Minimum kmer coverage required by Inchworm for initial contig construction" />
+ <param name="max_reads_per_graph" type="integer" value="20000000" min="10000" label="chrysalis_max_reads_per_graph" help="Maximum number of reads to be anchored within each transcript graph by Chrysalis" />
+
+
+ <param name="bfly_opts" type="text" value="None" label="bfly_opts" help="Options to pass on to Butterfly" />
+ <param name="bflyHeapSpaceMax" type="select" label="bflyHeapSpaceMax" help="Java heap space maximum value for Butterfly">
+ <option value="1G">1G</option>
+ <option value="2G">2G</option>
+ <option value="4G" selected="true">4G</option>
+ <option value="10G">10G</option>
+ <option value="20G">20G</option>
+ </param>
+
+               <param name="min_contig_length" type="integer" value="200" min="1" label="Minimum Contig Length" help=""/>
+            </when>
+        </conditional>
+    
+
+    </inputs>
+    <outputs>
+        <data format="txt" name="trinity_log" label="${tool.name} on ${on_string}: log" />
+        <data format="fasta" name="assembled_transcripts" label="${tool.name} on ${on_string}: Assembled Transcripts" from_work_dir="trinity_out_dir/Trinity.fasta"/>
+    </outputs>
+    <tests>
+    </tests>
+    <help>
+        Trinity is a de novo transcript assembler that uses RNA-seq data as input. This tool runs all Trinity_ commands--Inchworm, Chrysalis, and Butterfly--in a single pass.
+        
+        .. _Trinity: http://trinityrnaseq.sourceforge.net
+    </help>
+</tool>