annotate sappDocker/interproscan.xml @ 31:957156367442 draft

Uploaded
author jjkoehorst
date Wed, 29 Jun 2016 01:36:58 -0400
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
31
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
1 <tool id="DInterproscan" name="Interproscan" version="1.0.0">
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
2 <description>Interproscan annotation for SAPP</description>
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
3 <requirements>
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
4 <container type="docker">jjkoehorst/sappdocker:INTERPROSCAN</container>
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
5 </requirements>
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
6 <!-- Runs the interproscanRDF jar on the input TTL file. $disable renders as either -disableprecalc or an empty string (see the "disable" boolean param), so it is left unquoted to avoid passing an empty '' argument. --><command interpreter="docker">java -jar /interproscan/target/interproscanRDF-0.0.1-SNAPSHOT-jar-with-dependencies.jar
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
7 '-input' '$input' '-format' 'TURTLE'
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
8 '-applications' '$appl'
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
9 '-output'
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
10 '$outfile' -v '$version' $disable
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
11 </command>
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
12 <inputs>
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
13 <param format="ttl" label="genome rdf file with orf prediction" name="input" type="data"/>
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
14 <param display="checkboxes" help="Select the programs to run." label="Applications to run" multiple="True" name="appl" type="select">
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
15 <option selected="true" value="TIGRFAM">TIGRFAM: protein families
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
16 based on Hidden Markov Models or HMMs
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
17 </option>
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
18 <option selected="false" value="PIRSF">PIRSF: non-overlapping
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
19 clustering of UniProtKB sequences into a hierarchical order
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
20 (evolutionary relationships)
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
21 </option>
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
22 <option selected="true" value="ProDom">ProDom: set of protein domain
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
23 families generated from the UniProtKB
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
24 </option>
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
25 <option selected="true" value="SMART">SMART: identification and
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
26 analysis of domain architectures based on Hidden Markov Models or
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
27 HMMs
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
28 </option>
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
29 <option selected="false" value="PrositeProfiles">PROSITE Profiles:
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
30 protein domains, families and functional sites as well as associated
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
31 profiles to identify them
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
32 </option>
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
33 <option selected="true" value="PrositePatterns">PROSITE Patterns:
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
34 protein domains, families and functional sites as well as associated
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
35 patterns to identify them
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
36 </option>
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
37 <option selected="false" value="HAMAP">HAMAP: High-quality Automated
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
38 Annotation of Microbial Proteomes
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
39 </option>
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
40 <option selected="true" value="PfamA">PfamA: protein families, each
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
41 represented by multiple sequence alignments and hidden Markov models
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
42 </option>
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
43 <option selected="true" value="PRINTS">PRINTS: group of conserved
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
44 motifs (fingerprints) used to characterise a protein family
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
45 </option>
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
46 <option selected="true" value="SuperFamily">SUPERFAMILY: database of
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
47 structural and functional annotation
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
48 </option>
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
49 <option selected="true" value="Coils">Coils: Prediction of Coiled
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
50 Coil Regions in Proteins
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
51 </option>
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
52 <option selected="true" value="Gene3d">Gene3d: Structural assignment
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
53 for whole genes and genomes using the CATH domain structure database
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
54 </option>
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
55 </param>
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
56 <param label="Version selection" name="version" type="select">
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
57 <option value="interproscan-5.17-56.0">interproscan-5.17-56.0</option>
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
58 </param>
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
59 <param checked="false" falsevalue="-disableprecalc" help="You need to set up your own lookup server, as the EBI version can differ. See the InterProScan configuration file for more information." label="Perform lookup of InterPro at defined server address" name="disable" truevalue="" type="boolean"/>
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
60 </inputs>
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
61 <outputs>
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
62 <data format="ttl" label="IPR: ${input.name}" name="outfile"/>
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
63 </outputs>
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
64 <help>Interproscan annotation suite. Select your RDF genome with
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
65 protein annotation.
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
66 This can be either from a converted GenBank/EMBL
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
67 file or from a
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
68 Prodigal prediction.
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
69 The output will be an RDF file with
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
70 protein domain annotation from
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
71 InterPro.
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
72 </help>
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
73 <citations>
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
74 <citation type="bibtex">@article{Mitchell26112014,
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
75 author = {Mitchell,
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
76 Alex and Chang, Hsin-Yu and Daugherty, Louise and
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
77 Fraser, Matthew and
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
78 Hunter, Sarah and Lopez, Rodrigo and McAnulla,
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
79 Craig and McMenamin,
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
80 Conor and Nuka, Gift and Pesseat, Sebastien and
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
81 Sangrador-Vegas, Amaia
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
82 and Scheremetjew, Maxim and Rato, Claudia and
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
83 Yong, Siew-Yit and
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
84 Bateman, Alex and Punta, Marco and Attwood, Teresa
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
85 K. and Sigrist,
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
86 Christian J.A. and Redaschi, Nicole and Rivoire,
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
87 Catherine and
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
88 Xenarios, Ioannis and Kahn, Daniel and Guyot, Dominique
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
89 and Bork, Peer
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
90 and Letunic, Ivica and Gough, Julian and Oates, Matt
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
91 and Haft, Daniel
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
92 and Huang, Hongzhan and Natale, Darren A. and Wu,
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
93 Cathy H. and Orengo,
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
94 Christine and Sillitoe, Ian and Mi, Huaiyu and
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
95 Thomas, Paul D. and
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
96 Finn, Robert D.},
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
97 title = {The InterPro protein families database: the
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
98 classification
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
99 resource after 15 years},
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
100 year = {2014},
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
101 doi =
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
102 {10.1093/nar/gku1243},
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
103 abstract ={The InterPro database
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
104 (http://www.ebi.ac.uk/interpro/) is a freely
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
105 available resource that
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
106 can be used to classify sequences into
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
107 protein families and to predict
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
108 the presence of important domains and
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
109 sites. Central to the InterPro
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
110 database are predictive models, known
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
111 as signatures, from a range of
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
112 different protein family databases
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
113 that have different biological
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
114 focuses and use different
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
115 methodological approaches to classify
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
116 protein families and domains.
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
117 InterPro integrates these signatures,
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
118 capitalizing on the respective
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
119 strengths of the individual databases,
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
120 to produce a powerful protein
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
121 classification resource. Here, we report
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
122 on the status of InterPro as
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
123 it enters its 15th year of operation, and
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
124 give an overview of new
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
125 developments with the database and its
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
126 associated Web interfaces and
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
127 software. In particular, the new domain
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
128 architecture search tool is
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
129 described and the process of mapping of
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
130 Gene Ontology terms to
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
131 InterPro is outlined. We also discuss the
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
132 challenges faced by the
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
133 resource given the explosive growth in
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
134 sequence data in recent years.
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
135 InterPro (version 48.0) contains 36 766
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
136 member database signatures
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
137 integrated into 26 238 InterPro entries, an
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
138 increase of over 3993
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
139 entries (5081 signatures), since 2012.},
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
140 URL =
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
141 {http://nar.oxfordjournals.org/content/early/2014/11/26/nar.gku1243.abstract},
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
142 eprint =
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
143 {http://nar.oxfordjournals.org/content/early/2014/11/26/nar.gku1243.full.pdf+html},
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
144 journal = {Nucleic Acids Research}
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
145 }
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
146 </citation>
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
147 </citations>
957156367442 Uploaded
jjkoehorst
parents:
diff changeset
148 </tool>