Repository 'protein_properties'
hg clone https://toolshed.g2.bx.psu.edu/repos/bgruening/protein_properties

Changeset 0:cd211b8c2e51 (2017-11-20)
Commit message:
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/protein_properties commit 6767a5ffb02052c844e9d862c79912f998f39d8e
added:
protein_properties.py
protein_properties.xml
test-data/Q9LHB9.fasta
test-data/protein_properties_result1.tabular
tool_dependencies.xml
b
diff -r 000000000000 -r cd211b8c2e51 protein_properties.py
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/protein_properties.py Mon Nov 20 05:09:21 2017 -0500
b
@@ -0,0 +1,23 @@
+#!/usr/bin/env python
+
+import sys
+from Bio import SeqIO
+from Bio.SeqUtils.ProtParam import ProteinAnalysis
+
+sys.stdout.write("ID\tMW\tIP\tgravy\tlength\tinstability\tmonoisotpoic\tSequence\n")
+
+for record in SeqIO.parse(sys.stdin, "fasta"):
+    a = ProteinAnalysis(str(record.seq))
+
+    properties = list()
+    properties.append(record.id)
+    properties.append(a.molecular_weight())
+    properties.append(a.isoelectric_point())
+    properties.append(a.gravy())
+    properties.append(a.length)
+    properties.append(a.instability_index())
+    properties.append(a.aromaticity())
+    # always last column to make the output more readable
+    properties.append(a.sequence)
+    sys.stdout.write( '\t'.join(map(str, properties))+"\n" )
+
b
diff -r 000000000000 -r cd211b8c2e51 protein_properties.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/protein_properties.xml Mon Nov 20 05:09:21 2017 -0500
[
@@ -0,0 +1,43 @@
+<tool id="bg_protein_properties" name="Calculate protein properties" version="0.1.0">
+    <description></description>
+    <requirements>
+        <requirement type="package" version="1.65">biopython</requirement>
+    </requirements>
+    <command detect_errors="aggressive"><![CDATA[
+        '$__tool_directory__/protein_properties.py' < '$input' > '$output'
+    ]]></command>
+    <inputs>
+        <param format="fasta" name="input" type="data" label="Protein sequence"
+            help="This should be in FASTA format." />
+    </inputs>
+    <outputs>
+        <data format="tabular" name="output" />
+    </outputs>
+    <tests>
+        <test>
+            <param name="input" value="Q9LHB9.fasta" ftype="fasta"/>
+            <output name="output" file="protein_properties_result1.tabular" ftype="tabular"/>
+        </test>
+    </tests>
+    <help><![CDATA[
+
+**What it does**

+This tool will calculate several properties for each given input sequence. The result will contain the following columns:
+
+- ID of the sequence
+- Molecular weight
+- Isoelectric point
+- *gravy* according to Kyte and Doolittle
+- Length of the sequence
+- Instability index, according to Guruprasad, 1990. (Any value above 40 means the protein is unstable (has a short half life))
+- Aromaticity, according to Lobry, 1994. (It is simply the relative frequency of Phe+Trp+Tyr)
+- Sequence (as given in the input)
+
+For more information see the `BioPython ProteinAnalysis documentation <http://www.biopython.org/DIST/docs/api/Bio.SeqUtils.ProtParam.ProteinAnalysis-class.html>`_.
+
+    ]]></help>
+    <citations>
+        <citation type="doi">10.1093/bioinformatics/btp163</citation>
+    </citations>
+</tool>
b
diff -r 000000000000 -r cd211b8c2e51 test-data/Q9LHB9.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/Q9LHB9.fasta Mon Nov 20 05:09:21 2017 -0500
b
@@ -0,0 +1,9 @@
+>sp|Q9LHB9|PER32_ARATH Peroxidase 32 OS=Arabidopsis thaliana GN=PER32 PE=1 SV=3
+MNFSYSSLSTWTTLMTLGCLLLHSSISSAQLTPTFYDNTCPSVFTIVRDTIVNELRSDPR
+IAASILRLHFHDCFVNGCDASILLDNTTSFRTEKDAAPNANSARGFPVIDRMKAAVETAC
+PRTVSCADILTIAAQQAVNLAGGPSWRVPLGRRDSLQAFFALANTNLPAPFFTLPQLKAS
+FQNVGLDRPSDLVALSGGHTFGKNQCQFIMDRLYNFSNTGLPDPTLNTTYLQTLRGQCPR
+NGNQTVLVDFDLRTPTVFDNKYYVNLKELKGLIQTDQELFSSPNATDTIPLVREYADGTQ
+KFFNAFVEAMNRMGNITPLTGTQGQIRQNCRVVNSNSLLHDVVEIVDFVSSM
+>sp|Q9LHB9|PER32_ARATH short
+MNFSYSSLSTWTTLMTLGCLLLHSSISSAQLTPTFYDNTCPSVFTIVRDTIVNELRSDPR
b
diff -r 000000000000 -r cd211b8c2e51 test-data/protein_properties_result1.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/protein_properties_result1.tabular Mon Nov 20 05:09:21 2017 -0500
b
@@ -0,0 +1,3 @@
+ID MW IP gravy length instability monoisotpoic Sequence
+sp|Q9LHB9|PER32_ARATH 38846.6361 6.20635986328 -0.0943181818182 352 31.0301420455 0.0880681818182 MNFSYSSLSTWTTLMTLGCLLLHSSISSAQLTPTFYDNTCPSVFTIVRDTIVNELRSDPRIAASILRLHFHDCFVNGCDASILLDNTTSFRTEKDAAPNANSARGFPVIDRMKAAVETACPRTVSCADILTIAAQQAVNLAGGPSWRVPLGRRDSLQAFFALANTNLPAPFFTLPQLKASFQNVGLDRPSDLVALSGGHTFGKNQCQFIMDRLYNFSNTGLPDPTLNTTYLQTLRGQCPRNGNQTVLVDFDLRTPTVFDNKYYVNLKELKGLIQTDQELFSSPNATDTIPLVREYADGTQKFFNAFVEAMNRMGNITPLTGTQGQIRQNCRVVNSNSLLHDVVEIVDFVSSM
+sp|Q9LHB9|PER32_ARATH 6733.5899 5.41021728516 0.13 60 35.0618333333 0.1 MNFSYSSLSTWTTLMTLGCLLLHSSISSAQLTPTFYDNTCPSVFTIVRDTIVNELRSDPR
b
diff -r 000000000000 -r cd211b8c2e51 tool_dependencies.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/tool_dependencies.xml Mon Nov 20 05:09:21 2017 -0500
b
@@ -0,0 +1,6 @@
+<?xml version="1.0"?>
+<tool_dependency>
+    <package name="biopython" version="1.65">
+        <repository changeset_revision="d8185f5631ed" name="package_biopython_1_65" owner="biopython" toolshed="https://toolshed.g2.bx.psu.edu" />
+    </package>
+</tool_dependency>