Repository 'proteomics_rnaseq_sap_db_workflow'
hg clone https://toolshed.g2.bx.psu.edu/repos/galaxyp/proteomics_rnaseq_sap_db_workflow

Changeset 0:3a11830963e3 (2014-03-17)
Commit message:
Initial upload
added:
README.rst
proteomics_rnaseq_human_splice_db_workflow.ga
proteomics_rnaseq_mouse_splice_db_workflow.ga
proteomics_rnaseq_splice_db_workflow.ga
repository_dependencies.xml
b
diff -r 000000000000 -r 3a11830963e3 README.rst
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/README.rst Mon Mar 17 15:59:57 2014 -0500
[
@@ -0,0 +1,60 @@
+This package contains a Galaxy workflow for the detection and incorporation of single amino acid polymorphism (SAP) into a custom proteomics search database.
+
+The workflow aligns RNA-Seq reads to the organism's genome using Tophat, call SNPs using SAMtools mpileup command, and annotates the SNPs that reside within protein-coding regions using SNPeff.
+Galaxy tool "SNPeff to Peptide Fasta" generates peptide sequences with the polymorhisms.
+
+See http://www.galaxyproject.org for information about the Galaxy Project.
+
+
+Availability
+============
+
+This workflow is available to download and/or install from the main
+Galaxy Tool Shed:
+
+http://toolshed.g2.bx.psu.edu/view/galaxyp/proteomics_rnaseq_sap_db_workflow
+
+
+Reference Data
+==============
+
+For Human RNAseq data this workflow was tested with a genome build named "GRCh37_canon" using reference data from:
+
+* ftp://ftp.ensembl.org/pub/release-73/fasta/homo_sapiens/dna/Homo_sapiens.GRCh37.73.dna.chromosome.[1-9XY]*.fa.gz
+* ftp://ftp.ensembl.org/pub/release-73/fasta/homo_sapiens/pep/Homo_sapiens.GRCh37.73.pep.all.fa.gz
+* ftp://ftp.ensembl.org/pub/release-73/gtf/homo_sapiens/Homo_sapiens.GRCh37.73.gtf.gz
+
+
+For Mouse RNAseq data this workflow was tested with a genome build named "GRCm38_canon" using reference data from:
+
+* ftp://ftp.ensembl.org/pub/release-73/fasta/mus_musculus/dna/Mus_musculus.GRCm38.73.dna.chromosome.[1-9XY]*.fa.gz
+* ftp://ftp.ensembl.org/pub/release-73/fasta/mus_musculus/pep/Mus_musculus.GRCm38.73.pep.all.fa.gz
+* ftp://ftp.ensembl.org/pub/release-73/gtf/mus_musculus/Mus_musculus.GRCm38.73.gtf.gz
+
+
+Genome builds "GRCh37_canon" and "GRCm38_canon" were built according to instructions in:  https://wiki.galaxyproject.org/Admin/NGS%20Local%20Setup
+The builds used only the standard chromosomesi sequences from the reference fasta; the other sequences were filtered out.
+The GTF was filtered to retain only those entries that referenced the standard chromosomes. 
+
+
+Dependencies
+============
+
+These dependencies should be resolved automatically via the Galaxy Tool Shed:
+
+* http://toolshed.g2.bx.psu.edu/view/devteam/tophat
+* http://toolshed.g2.bx.psu.edu/view/devteam/samtools_mpileup
+* http://toolshed.g2.bx.psu.edu/view/nilesh/bcftools
+* http://toolshed.g2.bx.psu.edu/view/iuc/snpeff
+* http://toolshed.g2.bx.psu.edu/view/jjohnson/snpeff_to_peptides
+
+History
+=======
+
+======= ======================================================================
+Version Changes
+------- ----------------------------------------------------------------------
+v0.0.1  - Initial release to Tool Shed (March, 2014)
+======= ======================================================================
+
+
b
diff -r 000000000000 -r 3a11830963e3 proteomics_rnaseq_human_splice_db_workflow.ga
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/proteomics_rnaseq_human_splice_db_workflow.ga Mon Mar 17 15:59:57 2014 -0500
[
b'@@ -0,0 +1,368 @@\n+{\n+    "a_galaxy_workflow": "true", \n+    "annotation": "The SAP Database Workflow creates a database of polypeptide sequences containing single amino acid polymorphisms (SAPs) detected in RNA-Seq data.", \n+    "format-version": "0.1", \n+    "name": "Proteomics SAP DB", \n+    "steps": {\n+        "0": {\n+            "annotation": "", \n+            "id": 0, \n+            "input_connections": {}, \n+            "inputs": [\n+                {\n+                    "description": "", \n+                    "name": "RNA-Seq Left mate pair fastq"\n+                }\n+            ], \n+            "name": "Input dataset", \n+            "outputs": [], \n+            "position": {\n+                "left": 257, \n+                "top": 163\n+            }, \n+            "tool_errors": null, \n+            "tool_id": null, \n+            "tool_state": "{\\"name\\": \\"RNA-Seq Left mate pair fastq\\"}", \n+            "tool_version": null, \n+            "type": "data_input", \n+            "user_outputs": []\n+        }, \n+        "1": {\n+            "annotation": "", \n+            "id": 1, \n+            "input_connections": {}, \n+            "inputs": [\n+                {\n+                    "description": "", \n+                    "name": "RNA-Seq right mate pair fastq"\n+                }\n+            ], \n+            "name": "Input dataset", \n+            "outputs": [], \n+            "position": {\n+                "left": 257, \n+                "top": 393\n+            }, \n+            "tool_errors": null, \n+            "tool_id": null, \n+            "tool_state": "{\\"name\\": \\"RNA-Seq right mate pair fastq\\"}", \n+            "tool_version": null, \n+            "type": "data_input", \n+            "user_outputs": []\n+        }, \n+        "2": {\n+            "annotation": "", \n+            "id": 2, \n+            "input_connections": {}, \n+            "inputs": [\n+                {\n+                    "description": "", \n+                    "name": "Ensembl GTF for the reference genome"\n+                }\n+            ], \n+            "name": "Input dataset", \n+            "outputs": [], \n+            "position": {\n+                "left": 500, \n+                "top": 526\n+            }, \n+            "tool_errors": null, \n+            "tool_id": null, \n+            "tool_state": "{\\"name\\": \\"Ensembl GTF for the reference genome\\"}", \n+            "tool_version": null, \n+            "type": "data_input", \n+            "user_outputs": []\n+        }, \n+        "3": {\n+            "annotation": "", \n+            "id": 3, \n+            "input_connections": {}, \n+            "inputs": [\n+                {\n+                    "description": "", \n+                    "name": "The Ensembl peptide sequences fasta"\n+                }\n+            ], \n+            "name": "Input dataset", \n+            "outputs": [], \n+            "position": {\n+                "left": 1551, \n+                "top": 552\n+            }, \n+            "tool_errors": null, \n+            "tool_id": null, \n+            "tool_state": "{\\"name\\": \\"The Ensembl peptide sequences fasta\\"}", \n+            "tool_version": null, \n+            "type": "data_input", \n+            "user_outputs": []\n+        }, \n+        "4": {\n+            "annotation": "", \n+            "id": 4, \n+            "input_connections": {\n+                "input": {\n+                    "id": 0, \n+                    "output_name": "output"\n+                }\n+            }, \n+            "inputs": [], \n+            "name": "Select first", \n+            "outputs": [\n+                {\n+                    "name": "out_file1", \n+                    "type": "input"\n+                }\n+            ], \n+            "position": {\n+                "left": 482, \n+                "top": 209\n+            }, \n+            "post_job_actions": {}, \n+            "tool_errors": null, \n+            "tool_id": "Show beginning1", \n+            "tool_state": "{\\"__page__\\": 0, \\"input\\": \\"null\\", \\"__rerun_rema'..b'ry\\\\\\": \\\\\\"false\\\\\\", \\\\\\"__current_case__\\\\\\": 1}\\", \\"G\\": \\"\\\\\\"false\\\\\\"\\", \\"F\\": \\"\\\\\\"false\\\\\\"\\", \\"i\\": \\"{\\\\\\"__current_case__\\\\\\": 1, \\\\\\"alt_indel_snp_ratio\\\\\\": \\\\\\"false\\\\\\"}\\", \\"__rerun_remap_job_id__\\": null, \\"N\\": \\"\\\\\\"false\\\\\\"\\", \\"p\\": \\"{\\\\\\"variant_filter\\\\\\": \\\\\\"false\\\\\\", \\\\\\"__current_case__\\\\\\": 1}\\", \\"S\\": \\"\\\\\\"false\\\\\\"\\", \\"g\\": \\"\\\\\\"false\\\\\\"\\", \\"t\\": \\"{\\\\\\"mutation_rate\\\\\\": \\\\\\"false\\\\\\", \\\\\\"__current_case__\\\\\\": 1}\\", \\"v\\": \\"\\\\\\"true\\\\\\"\\", \\"u\\": \\"\\\\\\"false\\\\\\"\\", \\"chromInfo\\": \\"\\\\\\"/website/galaxy.msi.umn.edu/PRODUCTION/tool-data/shared/ucsc/chrom/GRCh37_canon.len\\\\\\"\\", \\"input\\": \\"null\\"}", \n+            "tool_version": "1.0.0", \n+            "type": "tool", \n+            "user_outputs": []\n+        }, \n+        "10": {\n+            "annotation": "", \n+            "id": 10, \n+            "input_connections": {\n+                "input": {\n+                    "id": 9, \n+                    "output_name": "output"\n+                }\n+            }, \n+            "inputs": [], \n+            "name": "SnpEff", \n+            "outputs": [\n+                {\n+                    "name": "snpeff_output", \n+                    "type": "vcf"\n+                }, \n+                {\n+                    "name": "statsFile", \n+                    "type": "html"\n+                }\n+            ], \n+            "position": {\n+                "left": 1576, \n+                "top": 317\n+            }, \n+            "post_job_actions": {}, \n+            "tool_errors": null, \n+            "tool_id": "toolshed.g2.bx.psu.edu/repos/iuc/snpeff/snpEff/3.4", \n+            "tool_state": "{\\"spliceSiteSize\\": \\"\\\\\\"1\\\\\\"\\", \\"filterHomHet\\": \\"\\\\\\"no_filter\\\\\\"\\", \\"outputFormat\\": \\"\\\\\\"vcf\\\\\\"\\", \\"udLength\\": \\"\\\\\\"0\\\\\\"\\", \\"inputFormat\\": \\"\\\\\\"vcf\\\\\\"\\", \\"filterIn\\": \\"\\\\\\"-snp\\\\\\"\\", \\"__page__\\": 0, \\"__rerun_remap_job_id__\\": null, \\"filterOut\\": \\"[\\\\\\"-no-downstream\\\\\\", \\\\\\"-no-intergenic\\\\\\", \\\\\\"-no-intron\\\\\\", \\\\\\"-no-upstream\\\\\\", \\\\\\"-no-utr\\\\\\"]\\", \\"generate_stats\\": \\"\\\\\\"True\\\\\\"\\", \\"noLog\\": \\"\\\\\\"True\\\\\\"\\", \\"chr\\": \\"\\\\\\"\\\\\\"\\", \\"intervals\\": \\"null\\", \\"snpDb\\": \\"{\\\\\\"genome_version\\\\\\": \\\\\\"GRCh37.73\\\\\\", \\\\\\"genomeSrc\\\\\\": \\\\\\"named\\\\\\", \\\\\\"__current_case__\\\\\\": 2}\\", \\"offset\\": \\"\\\\\\"\\\\\\"\\", \\"input\\": \\"null\\", \\"transcripts\\": \\"null\\", \\"chromInfo\\": \\"\\\\\\"/website/galaxy.msi.umn.edu/PRODUCTION/tool-data/shared/ucsc/chrom/GRCh37_canon.len\\\\\\"\\", \\"annotations\\": \\"null\\"}", \n+            "tool_version": "3.4", \n+            "type": "tool", \n+            "user_outputs": []\n+        }, \n+        "11": {\n+            "annotation": "", \n+            "id": 11, \n+            "input_connections": {\n+                "all_pep_fasta": {\n+                    "id": 3, \n+                    "output_name": "output"\n+                }, \n+                "snpeff_vcf": {\n+                    "id": 10, \n+                    "output_name": "snpeff_output"\n+                }\n+            }, \n+            "inputs": [], \n+            "name": "SnpEff to Peptide fasta", \n+            "outputs": [\n+                {\n+                    "name": "peptide_variant_fasta", \n+                    "type": "fasta"\n+                }\n+            ], \n+            "position": {\n+                "left": 1885, \n+                "top": 455\n+            }, \n+            "post_job_actions": {}, \n+            "tool_errors": null, \n+            "tool_id": "toolshed.g2.bx.psu.edu/repos/jjohnson/snpeff_to_peptides/snpeff_to_peptides/0.0.1", \n+            "tool_state": "{\\"__page__\\": 0, \\"leading_aa_num\\": \\"\\\\\\"66\\\\\\"\\", \\"all_pep_fasta\\": \\"null\\", \\"__rerun_remap_job_id__\\": null, \\"trailing_aa_num\\": \\"\\\\\\"66\\\\\\"\\", \\"snpeff_vcf\\": \\"null\\", \\"chromInfo\\": \\"\\\\\\"/website/galaxy.msi.umn.edu/PRODUCTION/tool-data/shared/ucsc/chrom/GRCh37_canon.len\\\\\\"\\"}", \n+            "tool_version": "0.0.1", \n+            "type": "tool", \n+            "user_outputs": []\n+        }\n+    }\n+}\n\\ No newline at end of file\n'
b
diff -r 000000000000 -r 3a11830963e3 proteomics_rnaseq_mouse_splice_db_workflow.ga
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/proteomics_rnaseq_mouse_splice_db_workflow.ga Mon Mar 17 15:59:57 2014 -0500
[
b'@@ -0,0 +1,368 @@\n+{\n+    "a_galaxy_workflow": "true", \n+    "annotation": "The SAP Database Workflow creates a database of polypeptide sequences containing single amino acid polymorphisms (SAPs) detected in RNA-Seq data.", \n+    "format-version": "0.1", \n+    "name": "Mouse SAP DB", \n+    "steps": {\n+        "0": {\n+            "annotation": "", \n+            "id": 0, \n+            "input_connections": {}, \n+            "inputs": [\n+                {\n+                    "description": "", \n+                    "name": "RNA-Seq left mate pair fastq"\n+                }\n+            ], \n+            "name": "Input dataset", \n+            "outputs": [], \n+            "position": {\n+                "left": 257, \n+                "top": 163\n+            }, \n+            "tool_errors": null, \n+            "tool_id": null, \n+            "tool_state": "{\\"name\\": \\"RNA-Seq left mate pair fastq\\"}", \n+            "tool_version": null, \n+            "type": "data_input", \n+            "user_outputs": []\n+        }, \n+        "1": {\n+            "annotation": "", \n+            "id": 1, \n+            "input_connections": {}, \n+            "inputs": [\n+                {\n+                    "description": "", \n+                    "name": "RNA-Seq right mate pair fastq"\n+                }\n+            ], \n+            "name": "Input dataset", \n+            "outputs": [], \n+            "position": {\n+                "left": 257, \n+                "top": 393\n+            }, \n+            "tool_errors": null, \n+            "tool_id": null, \n+            "tool_state": "{\\"name\\": \\"RNA-Seq right mate pair fastq\\"}", \n+            "tool_version": null, \n+            "type": "data_input", \n+            "user_outputs": []\n+        }, \n+        "2": {\n+            "annotation": "", \n+            "id": 2, \n+            "input_connections": {}, \n+            "inputs": [\n+                {\n+                    "description": "", \n+                    "name": "Ensembl GTF file (gene models)"\n+                }\n+            ], \n+            "name": "Input dataset", \n+            "outputs": [], \n+            "position": {\n+                "left": 500, \n+                "top": 526\n+            }, \n+            "tool_errors": null, \n+            "tool_id": null, \n+            "tool_state": "{\\"name\\": \\"Ensembl GTF file (gene models)\\"}", \n+            "tool_version": null, \n+            "type": "data_input", \n+            "user_outputs": []\n+        }, \n+        "3": {\n+            "annotation": "", \n+            "id": 3, \n+            "input_connections": {}, \n+            "inputs": [\n+                {\n+                    "description": "", \n+                    "name": "The Ensembl protein FASTA file (reference proteome)"\n+                }\n+            ], \n+            "name": "Input dataset", \n+            "outputs": [], \n+            "position": {\n+                "left": 1551, \n+                "top": 552\n+            }, \n+            "tool_errors": null, \n+            "tool_id": null, \n+            "tool_state": "{\\"name\\": \\"The Ensembl protein FASTA file (reference proteome)\\"}", \n+            "tool_version": null, \n+            "type": "data_input", \n+            "user_outputs": []\n+        }, \n+        "4": {\n+            "annotation": "", \n+            "id": 4, \n+            "input_connections": {\n+                "input": {\n+                    "id": 0, \n+                    "output_name": "output"\n+                }\n+            }, \n+            "inputs": [], \n+            "name": "Select first", \n+            "outputs": [\n+                {\n+                    "name": "out_file1", \n+                    "type": "input"\n+                }\n+            ], \n+            "position": {\n+                "left": 482, \n+                "top": 209\n+            }, \n+            "post_job_actions": {}, \n+            "tool_errors": null, \n+            "tool_id": "Show beginning1", \n+            "tool_state": "{\\"__page__\\": 0, \\"input\\": \\"null\\",'..b'ry\\\\\\": \\\\\\"false\\\\\\", \\\\\\"__current_case__\\\\\\": 1}\\", \\"G\\": \\"\\\\\\"false\\\\\\"\\", \\"F\\": \\"\\\\\\"false\\\\\\"\\", \\"i\\": \\"{\\\\\\"__current_case__\\\\\\": 1, \\\\\\"alt_indel_snp_ratio\\\\\\": \\\\\\"false\\\\\\"}\\", \\"__rerun_remap_job_id__\\": null, \\"N\\": \\"\\\\\\"false\\\\\\"\\", \\"p\\": \\"{\\\\\\"variant_filter\\\\\\": \\\\\\"false\\\\\\", \\\\\\"__current_case__\\\\\\": 1}\\", \\"S\\": \\"\\\\\\"false\\\\\\"\\", \\"g\\": \\"\\\\\\"false\\\\\\"\\", \\"t\\": \\"{\\\\\\"mutation_rate\\\\\\": \\\\\\"false\\\\\\", \\\\\\"__current_case__\\\\\\": 1}\\", \\"v\\": \\"\\\\\\"true\\\\\\"\\", \\"u\\": \\"\\\\\\"false\\\\\\"\\", \\"chromInfo\\": \\"\\\\\\"/website/galaxy.msi.umn.edu/PRODUCTION/tool-data/shared/ucsc/chrom/GRCh37_canon.len\\\\\\"\\", \\"input\\": \\"null\\"}", \n+            "tool_version": "1.0.0", \n+            "type": "tool", \n+            "user_outputs": []\n+        }, \n+        "10": {\n+            "annotation": "", \n+            "id": 10, \n+            "input_connections": {\n+                "input": {\n+                    "id": 9, \n+                    "output_name": "output"\n+                }\n+            }, \n+            "inputs": [], \n+            "name": "SnpEff", \n+            "outputs": [\n+                {\n+                    "name": "snpeff_output", \n+                    "type": "vcf"\n+                }, \n+                {\n+                    "name": "statsFile", \n+                    "type": "html"\n+                }\n+            ], \n+            "position": {\n+                "left": 1576, \n+                "top": 317\n+            }, \n+            "post_job_actions": {}, \n+            "tool_errors": null, \n+            "tool_id": "toolshed.g2.bx.psu.edu/repos/iuc/snpeff/snpEff/3.4", \n+            "tool_state": "{\\"spliceSiteSize\\": \\"\\\\\\"1\\\\\\"\\", \\"filterHomHet\\": \\"\\\\\\"no_filter\\\\\\"\\", \\"outputFormat\\": \\"\\\\\\"vcf\\\\\\"\\", \\"udLength\\": \\"\\\\\\"0\\\\\\"\\", \\"inputFormat\\": \\"\\\\\\"vcf\\\\\\"\\", \\"filterIn\\": \\"\\\\\\"-snp\\\\\\"\\", \\"__page__\\": 0, \\"__rerun_remap_job_id__\\": null, \\"filterOut\\": \\"[\\\\\\"-no-downstream\\\\\\", \\\\\\"-no-intergenic\\\\\\", \\\\\\"-no-intron\\\\\\", \\\\\\"-no-upstream\\\\\\", \\\\\\"-no-utr\\\\\\"]\\", \\"generate_stats\\": \\"\\\\\\"True\\\\\\"\\", \\"noLog\\": \\"\\\\\\"True\\\\\\"\\", \\"chr\\": \\"\\\\\\"\\\\\\"\\", \\"intervals\\": \\"null\\", \\"snpDb\\": \\"{\\\\\\"genome_version\\\\\\": \\\\\\"GRCm38.73\\\\\\", \\\\\\"genomeSrc\\\\\\": \\\\\\"named\\\\\\", \\\\\\"__current_case__\\\\\\": 2}\\", \\"offset\\": \\"\\\\\\"\\\\\\"\\", \\"input\\": \\"null\\", \\"transcripts\\": \\"null\\", \\"chromInfo\\": \\"\\\\\\"/website/galaxy.msi.umn.edu/PRODUCTION/tool-data/shared/ucsc/chrom/GRCh37_canon.len\\\\\\"\\", \\"annotations\\": \\"null\\"}", \n+            "tool_version": "3.4", \n+            "type": "tool", \n+            "user_outputs": []\n+        }, \n+        "11": {\n+            "annotation": "", \n+            "id": 11, \n+            "input_connections": {\n+                "all_pep_fasta": {\n+                    "id": 3, \n+                    "output_name": "output"\n+                }, \n+                "snpeff_vcf": {\n+                    "id": 10, \n+                    "output_name": "snpeff_output"\n+                }\n+            }, \n+            "inputs": [], \n+            "name": "SnpEff to Peptide fasta", \n+            "outputs": [\n+                {\n+                    "name": "peptide_variant_fasta", \n+                    "type": "fasta"\n+                }\n+            ], \n+            "position": {\n+                "left": 1885, \n+                "top": 455\n+            }, \n+            "post_job_actions": {}, \n+            "tool_errors": null, \n+            "tool_id": "toolshed.g2.bx.psu.edu/repos/jjohnson/snpeff_to_peptides/snpeff_to_peptides/0.0.1", \n+            "tool_state": "{\\"__page__\\": 0, \\"leading_aa_num\\": \\"\\\\\\"66\\\\\\"\\", \\"all_pep_fasta\\": \\"null\\", \\"__rerun_remap_job_id__\\": null, \\"trailing_aa_num\\": \\"\\\\\\"66\\\\\\"\\", \\"snpeff_vcf\\": \\"null\\", \\"chromInfo\\": \\"\\\\\\"/website/galaxy.msi.umn.edu/PRODUCTION/tool-data/shared/ucsc/chrom/GRCh37_canon.len\\\\\\"\\"}", \n+            "tool_version": "0.0.1", \n+            "type": "tool", \n+            "user_outputs": []\n+        }\n+    }\n+}\n\\ No newline at end of file\n'
b
diff -r 000000000000 -r 3a11830963e3 proteomics_rnaseq_splice_db_workflow.ga
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/proteomics_rnaseq_splice_db_workflow.ga Mon Mar 17 15:59:57 2014 -0500
[
b'@@ -0,0 +1,387 @@\n+{\n+    "a_galaxy_workflow": "true", \n+    "annotation": "The SAP Database Workflow creates a database of polypeptide sequences containing single amino acid polymorphisms (SAPs) detected in RNA-Seq data.", \n+    "format-version": "0.1", \n+    "name": "Proteomics SAP DB", \n+    "steps": {\n+        "0": {\n+            "annotation": "", \n+            "id": 0, \n+            "input_connections": {}, \n+            "inputs": [\n+                {\n+                    "description": "", \n+                    "name": "RNA-Seq Left mate pair fastq"\n+                }\n+            ], \n+            "name": "Input dataset", \n+            "outputs": [], \n+            "position": {\n+                "left": 257, \n+                "top": 163\n+            }, \n+            "tool_errors": null, \n+            "tool_id": null, \n+            "tool_state": "{\\"name\\": \\"RNA-Seq Left mate pair fastq\\"}", \n+            "tool_version": null, \n+            "type": "data_input", \n+            "user_outputs": []\n+        }, \n+        "1": {\n+            "annotation": "", \n+            "id": 1, \n+            "input_connections": {}, \n+            "inputs": [\n+                {\n+                    "description": "", \n+                    "name": "RNA-Seq right mate pair fastq"\n+                }\n+            ], \n+            "name": "Input dataset", \n+            "outputs": [], \n+            "position": {\n+                "left": 257, \n+                "top": 393\n+            }, \n+            "tool_errors": null, \n+            "tool_id": null, \n+            "tool_state": "{\\"name\\": \\"RNA-Seq right mate pair fastq\\"}", \n+            "tool_version": null, \n+            "type": "data_input", \n+            "user_outputs": []\n+        }, \n+        "2": {\n+            "annotation": "", \n+            "id": 2, \n+            "input_connections": {}, \n+            "inputs": [\n+                {\n+                    "description": "", \n+                    "name": "Ensembl GTF for the reference genome"\n+                }\n+            ], \n+            "name": "Input dataset", \n+            "outputs": [], \n+            "position": {\n+                "left": 500, \n+                "top": 526\n+            }, \n+            "tool_errors": null, \n+            "tool_id": null, \n+            "tool_state": "{\\"name\\": \\"Ensembl GTF for the reference genome\\"}", \n+            "tool_version": null, \n+            "type": "data_input", \n+            "user_outputs": []\n+        }, \n+        "3": {\n+            "annotation": "", \n+            "id": 3, \n+            "input_connections": {}, \n+            "inputs": [\n+                {\n+                    "description": "", \n+                    "name": "The Ensembl peptide sequences fasta"\n+                }\n+            ], \n+            "name": "Input dataset", \n+            "outputs": [], \n+            "position": {\n+                "left": 1551, \n+                "top": 552\n+            }, \n+            "tool_errors": null, \n+            "tool_id": null, \n+            "tool_state": "{\\"name\\": \\"The Ensembl peptide sequences fasta\\"}", \n+            "tool_version": null, \n+            "type": "data_input", \n+            "user_outputs": []\n+        }, \n+        "4": {\n+            "annotation": "", \n+            "id": 4, \n+            "input_connections": {\n+                "input": {\n+                    "id": 0, \n+                    "output_name": "output"\n+                }\n+            }, \n+            "inputs": [], \n+            "name": "Select first", \n+            "outputs": [\n+                {\n+                    "name": "out_file1", \n+                    "type": "input"\n+                }\n+            ], \n+            "position": {\n+                "left": 482, \n+                "top": 209\n+            }, \n+            "post_job_actions": {}, \n+            "tool_errors": null, \n+            "tool_id": "Show beginning1", \n+            "tool_state": "{\\"__page__\\": 0, \\"input\\": \\"null\\", \\"__rerun_rema'..b'"}\\", \\"__rerun_remap_job_id__\\": null, \\"N\\": \\"\\\\\\"false\\\\\\"\\", \\"p\\": \\"{\\\\\\"variant_filter\\\\\\": \\\\\\"false\\\\\\", \\\\\\"__current_case__\\\\\\": 1}\\", \\"S\\": \\"\\\\\\"false\\\\\\"\\", \\"g\\": \\"\\\\\\"false\\\\\\"\\", \\"t\\": \\"{\\\\\\"mutation_rate\\\\\\": \\\\\\"false\\\\\\", \\\\\\"__current_case__\\\\\\": 1}\\", \\"v\\": \\"\\\\\\"true\\\\\\"\\", \\"u\\": \\"\\\\\\"false\\\\\\"\\", \\"chromInfo\\": \\"\\\\\\"/website/galaxy.msi.umn.edu/PRODUCTION/tool-data/shared/ucsc/chrom/GRCh37_canon.len\\\\\\"\\", \\"input\\": \\"null\\"}", \n+            "tool_version": "1.0.0", \n+            "type": "tool", \n+            "user_outputs": []\n+        }, \n+        "10": {\n+            "annotation": "", \n+            "id": 10, \n+            "input_connections": {\n+                "input": {\n+                    "id": 9, \n+                    "output_name": "output"\n+                }\n+            }, \n+            "inputs": [\n+                {\n+                    "description": "runtime parameter for tool SnpEff", \n+                    "name": "snpDb"\n+                }\n+            ], \n+            "name": "SnpEff", \n+            "outputs": [\n+                {\n+                    "name": "snpeff_output", \n+                    "type": "vcf"\n+                }, \n+                {\n+                    "name": "statsFile", \n+                    "type": "html"\n+                }\n+            ], \n+            "position": {\n+                "left": 1576, \n+                "top": 317\n+            }, \n+            "post_job_actions": {}, \n+            "tool_errors": null, \n+            "tool_id": "toolshed.g2.bx.psu.edu/repos/iuc/snpeff/snpEff/3.4", \n+            "tool_state": "{\\"spliceSiteSize\\": \\"\\\\\\"1\\\\\\"\\", \\"filterHomHet\\": \\"\\\\\\"no_filter\\\\\\"\\", \\"outputFormat\\": \\"\\\\\\"vcf\\\\\\"\\", \\"udLength\\": \\"\\\\\\"0\\\\\\"\\", \\"inputFormat\\": \\"\\\\\\"vcf\\\\\\"\\", \\"filterIn\\": \\"\\\\\\"-snp\\\\\\"\\", \\"__page__\\": 0, \\"__rerun_remap_job_id__\\": null, \\"filterOut\\": \\"[\\\\\\"-no-downstream\\\\\\", \\\\\\"-no-intergenic\\\\\\", \\\\\\"-no-intron\\\\\\", \\\\\\"-no-upstream\\\\\\", \\\\\\"-no-utr\\\\\\"]\\", \\"generate_stats\\": \\"\\\\\\"True\\\\\\"\\", \\"noLog\\": \\"\\\\\\"True\\\\\\"\\", \\"chr\\": \\"\\\\\\"\\\\\\"\\", \\"intervals\\": \\"null\\", \\"snpDb\\": \\"{\\\\\\"genome_version\\\\\\": {\\\\\\"__class__\\\\\\": \\\\\\"RuntimeValue\\\\\\"}, \\\\\\"genomeSrc\\\\\\": \\\\\\"named\\\\\\", \\\\\\"__current_case__\\\\\\": 2}\\", \\"offset\\": \\"\\\\\\"\\\\\\"\\", \\"input\\": \\"null\\", \\"transcripts\\": \\"null\\", \\"chromInfo\\": \\"\\\\\\"/website/galaxy.msi.umn.edu/PRODUCTION/tool-data/shared/ucsc/chrom/GRCh37_canon.len\\\\\\"\\", \\"annotations\\": \\"null\\"}", \n+            "tool_version": "3.4", \n+            "type": "tool", \n+            "user_outputs": []\n+        }, \n+        "11": {\n+            "annotation": "", \n+            "id": 11, \n+            "input_connections": {\n+                "all_pep_fasta": {\n+                    "id": 3, \n+                    "output_name": "output"\n+                }, \n+                "snpeff_vcf": {\n+                    "id": 10, \n+                    "output_name": "snpeff_output"\n+                }\n+            }, \n+            "inputs": [], \n+            "name": "SnpEff to Peptide fasta", \n+            "outputs": [\n+                {\n+                    "name": "peptide_variant_fasta", \n+                    "type": "fasta"\n+                }\n+            ], \n+            "position": {\n+                "left": 1885, \n+                "top": 455\n+            }, \n+            "post_job_actions": {}, \n+            "tool_errors": null, \n+            "tool_id": "toolshed.g2.bx.psu.edu/repos/jjohnson/snpeff_to_peptides/snpeff_to_peptides/0.0.1", \n+            "tool_state": "{\\"__page__\\": 0, \\"leading_aa_num\\": \\"\\\\\\"66\\\\\\"\\", \\"all_pep_fasta\\": \\"null\\", \\"__rerun_remap_job_id__\\": null, \\"trailing_aa_num\\": \\"\\\\\\"66\\\\\\"\\", \\"snpeff_vcf\\": \\"null\\", \\"chromInfo\\": \\"\\\\\\"/website/galaxy.msi.umn.edu/PRODUCTION/tool-data/shared/ucsc/chrom/GRCh37_canon.len\\\\\\"\\"}", \n+            "tool_version": "0.0.1", \n+            "type": "tool", \n+            "user_outputs": []\n+        }\n+    }\n+}\n\\ No newline at end of file\n'
b
diff -r 000000000000 -r 3a11830963e3 repository_dependencies.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/repository_dependencies.xml Mon Mar 17 15:59:57 2014 -0500
b
@@ -0,0 +1,8 @@
+<?xml version="1.0"?>
+<repositories description="Required tools for proteomics_rnaseq_splice_db_workflow">
+    <repository name="tophat" owner="devteam" toolshed="http://toolshed.g2.bx.psu.edu" changeset_revision="1030acbecce6" />
+    <repository name="samtools_mpileup" owner="devteam" toolshed="http://toolshed.g2.bx.psu.edu" changeset_revision="44a18a94d7a9" />
+    <repository name="bcftools" owner="nilesh" toolshed="http://toolshed.g2.bx.psu.edu" changeset_revision="3182c7fac413" />
+    <repository name="snpeff" owner="iuc" toolshed="http://toolshed.g2.bx.psu.edu" changeset_revision="e8adfc4c0a6b" />
+    <repository name="snpeff_to_peptides" owner="jjohnson" toolshed="http://toolshed.g2.bx.psu.edu" changeset_revision="fcb7188fa0d2" />
+</repositories>