annotate glassgo_wrapper.xml @ 25:2e27fdf82795 draft default tip

Uploaded
author computationaltranscriptomics
date Thu, 02 Apr 2020 12:07:52 -0400
parents 74d04a19fdd7
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
8
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
1 <tool id="glassgo" name="GLASSgo" version="@VERSION@">
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
2 <description>sRNA homolog finder</description>
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
3 <macros>
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
4 <import>glassgo_macros.xml</import>
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
5 </macros>
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
6 <expand macro="requirements"/>
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
7 <command detect_errors="aggressive">
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
8 <![CDATA[
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
9 GLASSgo.py
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
10 -t \${GALAXY_SLOTS:-1}
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
11 -i ${input_data.input}
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
12 -d ${input_data.database}
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
13 #if str($search.cond_param_setup.param_setup) == "manual":
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
14 -e ${search.cond_param_setup.evalue}
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
15 -p ${search.cond_param_setup.identity}
24
74d04a19fdd7 Uploaded
computationaltranscriptomics
parents: 13
diff changeset
16 #if str($search.cond_param_setup.cond_clust_setup.clust_setup) == "off":
74d04a19fdd7 Uploaded
computationaltranscriptomics
parents: 13
diff changeset
17 -l 0
74d04a19fdd7 Uploaded
computationaltranscriptomics
parents: 13
diff changeset
18 #else:
74d04a19fdd7 Uploaded
computationaltranscriptomics
parents: 13
diff changeset
19 -l 2
74d04a19fdd7 Uploaded
computationaltranscriptomics
parents: 13
diff changeset
20 #if str($search.cond_param_setup.cond_clust_setup.clustering.conditional_filtering_setup.filtering_setup) == "manual":
74d04a19fdd7 Uploaded
computationaltranscriptomics
parents: 13
diff changeset
21 -a ${search.cond_param_setup.cond_clust_setup.clustering.conditional_filtering_setup.filtering}
74d04a19fdd7 Uploaded
computationaltranscriptomics
parents: 13
diff changeset
22 #else:
74d04a19fdd7 Uploaded
computationaltranscriptomics
parents: 13
diff changeset
23 -a -1
74d04a19fdd7 Uploaded
computationaltranscriptomics
parents: 13
diff changeset
24 #end if
74d04a19fdd7 Uploaded
computationaltranscriptomics
parents: 13
diff changeset
25 #end if
8
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
26 #end if
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
27 -u ${additional_setting.upstream_region}
13
76b7a84ba942 Uploaded
computationaltranscriptomics
parents: 10
diff changeset
28 #if str($search.acclist) != "global":
76b7a84ba942 Uploaded
computationaltranscriptomics
parents: 10
diff changeset
29 -g ${search.acclist}
76b7a84ba942 Uploaded
computationaltranscriptomics
parents: 10
diff changeset
30 #end if
8
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
31 -n 500
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
32 -o $output
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
33 ]]>
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
34 </command>
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
35 <inputs>
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
36 <section name="input_data" title="Input" expanded="true">
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
37 <param name="input" type="data" format="fasta" label="Query sRNA in FASTA" />
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
38 <param name="database" type="select" display="radio" label="NCBI-nt database">
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
39 <options from_file="blastdb.loc">
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
40 <column name="name" index="1"/>
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
41 <column name="value" index="2"/>
25
2e27fdf82795 Uploaded
computationaltranscriptomics
parents: 24
diff changeset
42 <filter type="regexp" value="nt_.*" column="0" />
8
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
43 </options>
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
44 </param>
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
45 </section>
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
46 <section name="search" title="Search Parameters" expanded="true">
13
76b7a84ba942 Uploaded
computationaltranscriptomics
parents: 10
diff changeset
47 <param name="acclist" type="select" label="Choose taxon">
76b7a84ba942 Uploaded
computationaltranscriptomics
parents: 10
diff changeset
48 <options from_file="glassgo_accession_list.txt">
76b7a84ba942 Uploaded
computationaltranscriptomics
parents: 10
diff changeset
49 <column name="name" index="0"/>
76b7a84ba942 Uploaded
computationaltranscriptomics
parents: 10
diff changeset
50 <column name="value" index="1"/>
76b7a84ba942 Uploaded
computationaltranscriptomics
parents: 10
diff changeset
51 </options>
76b7a84ba942 Uploaded
computationaltranscriptomics
parents: 10
diff changeset
52 </param>
8
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
53 <conditional name="cond_param_setup">
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
54 <param name="param_setup" type="select" display="radio" label="Parameter Setup">
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
55 <option value="automatic">automatic</option>
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
56 <option value="manual">manual</option>
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
57 </param>
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
58 <when value="manual">
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
59 <param name="evalue" type="float" value="1.0" label="Maximum allowed E-Value" />
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
60 <param name="identity" type="integer" value="52" label="Minimum allowed identity [%]" />
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
61 <conditional name="cond_clust_setup">
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
62 <param name="clust_setup" type="select" display="radio" label="Structure-based clustering">
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
63 <option value="off">off</option>
24
74d04a19fdd7 Uploaded
computationaltranscriptomics
parents: 13
diff changeset
64 <option value="on" selected="true">on</option>
8
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
65 </param>
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
66 <when value="on">
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
67 <section name="clustering" title="Structure-based Clustering" expanded="true">
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
68 <conditional name="conditional_filtering_setup">
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
69 <param name="filtering_setup" type="select" display="radio" label="Structure-based filtering">
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
70 <option value="automatic">automatic</option>
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
71 <option value="manual">manual</option>
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
72 </param>
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
73 <when value="manual">
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
74 <param name="filtering" type="integer" value="2" label="manual value for filtering" />
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
75 </when>
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
76 </conditional>
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
77 </section>
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
78 </when>
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
79 </conditional>
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
80 </when>
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
81 </conditional>
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
82 </section>
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
83 <section name="additional_setting" title="Additional Settings" expanded="true">
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
84 <param name="upstream_region" type="integer" value="0" label="Include upstream region">
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
85 <validator type="in_range" min="0" message="Value must be non-negative" />
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
86 </param>
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
87 </section>
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
88 </inputs>
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
89 <outputs>
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
90 <data name="output" format_source="input" />
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
91 </outputs>
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
92 <tests>
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
93 <test>
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
94 <param name="input" value="NsiR4_Synechocystis_sp_PCC6803.fa" />
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
95 <param name="acclist" value="global" />
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
96 <param name="param_setup" value="automatic" />
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
97 <param name="upstream_region" value="0" />
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
98 <output name="output" file="glassgo_NsiR4_Synechocystis_sp_PCC6803.fa" />
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
99 </test>
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
100 </tests>
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
101 <help>
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
102 <![CDATA[
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
103 **Introduction**
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
104
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
105 GLASSgo (GLobal Automated sRNA Search go) combines iterative BLAST searches, pairwise identity filtering, and structure based clustering in an automated prediction pipeline to find sRNA homologs from scratch. The web server provides predefined parameter sets for a non-expert usage as well as enables a manual setup of the query parameters. The returned GLASSgo result is in FASTA format, whereby the first entry represents the input sequence.
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
106
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
107
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
108 **Input**
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
109
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
110 - **Query sRNA in FASTA**
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
111 The (single) sRNA sequence has to be provided in FASTA format. Input can be given either as direct text input or by uploading a file. A sequence in FASTA format begins with a single-line sequence
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
112 identifier that starts with a greater-than (">") symbol, followed by lines of sequence data. For readability, it is recommended that each line is at most 80 characters in length.
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
113
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
114 .. class:: warningmark
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
115
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
116 The parameter constraints are: The input has to be in valid FASTA format. The number of sequences has to be at least 1 and at most 1. Sequence lengths have to be in the range 20-800. The allowed sequence alphabet is 'ACGUTacgut'.
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
117
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
118 - **NCBI Nucleotide database**
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
119 The (latest) NCBI Nucleotide database.
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
120
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
121 **Search Parameters**
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
122
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
123 - **Taxon selection**
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
124 The GLASSgo search is by default based on the complete NCBI Nucleotide database. In general, sRNAs show a limited distribution among the phylogenetic tree, such that a targeted search in a specific taxonomic group is likely to perform better. For that, we provide accession lists for the taxonomic groups the search should
9
6b6453e9da44 Uploaded
computationaltranscriptomics
parents: 8
diff changeset
125 be limited to.
8
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
126
13
76b7a84ba942 Uploaded
computationaltranscriptomics
parents: 10
diff changeset
127
76b7a84ba942 Uploaded
computationaltranscriptomics
parents: 10
diff changeset
128
8
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
129 - **Parameter Setup**
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
130 You can run GLASSgo either in automated mode or you can manually set the advanced parameters.
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
131
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
132 - **Maximum allowed E-value**
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
133 The E-value mainly influences the sensitivity of GLASSgo. A relaxed E-value (>1.0) increases the chance to get more sequences, but also increases computation time.
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
134
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
135 .. class:: warningmark
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
136
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
137 The parameter constraints are: Input value has to be parsable as a Double. The value must be smaller than or equal to 50.
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
138
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
139 - **Minimum allowed identity[%]**
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
140 Each sRNA candidate is compared to the query sRNA on sequence level and should have a percent identity larger than the value of this parameter to be kept for further
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
141 analysis. Please note, that values lower than 65% increase the total number of hits, but also slightly increase the probability for false positives.
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
142
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
143 .. class:: warningmark
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
144
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
145 The parameter constraints are: Input value has to be parsable as a Double. The value must be greater than or equal to 10 and must be smaller than or equal to 75.
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
146
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
147 - **Structure-based clustering**
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
148 Defines whether or not structural clustering (via Londen) is to be applied.
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
149
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
150 .. class:: warningmark
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
151
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
152
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
153 **Structure-based clustering**
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
154
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
155 - **Structure-based filtering**
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
156 Structure-based filtering can either be done automatically or you can manually set a structure-based filtering value (see the corresponding parameter).
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
157
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
158 - **Manual value for filtering**
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
159 The structure-based filtering represents the third filtering step of GLASSgo and is applied to the candidate hits with medium percent identity (80% > %ID > min_identity).
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
160 Lowering the parameter value will result in a more strict analysis (less false positives) and vice versa.
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
161
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
162 .. class:: warningmark
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
163
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
164 The parameter constraints are: Input value has to be parsable as a Double. The value must be greater than or equal to 0 and must be smaller than or equal to 3.
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
165
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
166 **Additional Settings**
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
167
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
168 - **Include upstream region**
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
169 Setting the parameter 'Upstream Region' to 100 extracts 100 nucleotides upstream for each predicted GLASSgo hit. This additional sequence information is directly
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
170 concatenated with the corresponding GLASSgo hit and therefore an integral part of the returned GLASSgo results. Note: The upstream region is not considered while the
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
171 similarity value [%] is computed! In addition, the FASTA header (e.g. start position) for each GLASSgo hit will be updated (if upstream region is activated), whereas
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
172 the upstream region is additionally mentioned like -UTR-REGION-100nt:1002422-1002521-. You can find further information about the GLASSgo results in the output help
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
173 section. (0 == no consideration).
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
174
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
175
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
176 **Output Description**
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
177
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
178 The output of GLASSgo is a file in multi-FASTA format where the input sequence (query) is followed by the identified homologs. If no homologs could be found, only the input sequence is shown. In the following, the output format will be discussed using two examples. Both examples show a partial result of GLASSgo applying EcpR1. In the first example, the upstream region was turned off while the value for the upstream region was set to 100 nt for the second. For this very reason, the headers as well as the sequence sizes are unequal.
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
179
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
180 The following header shows the Accession number of the respective genome followed by the genomic coordinates of the proposed sRNA homolog (no upstream region included).
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
181
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
182 >CP013051.1:1422247-1422417 Sinorhizobium americanum CCGM7, complete genome-p.c.VAL:80.75%-taxID:1408224
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
183 AAAGGAAGTGAGACTTCCACGATCGATCGGTTACCCCATGATGCTCAGGTCCGCCGCATCTCCTGGGTCGTGGGGTCGGTCGGCTGGCTTCCGACATCCGCGGATTCCTCGTGCCGCAGTCGGAGCCAGCCGACCCCCTTTCAAAACGCCGCTTCAAAAGAGGCGGCGTTT
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
184
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
185 In contrast, the next header shows the genomic coordinates of the combined upstream region (100nt) and the proposed sRNA. The exact coordinates of the upstream region are given later in the header (UPSTREAM-REGION-100nt:1422147-1422246).
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
186
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
187 >CP013051.1:1422147-1422417 Sinorhizobium americanum CCGM7, complete genome-UPSTREAM-REGION-100nt:1422147-1422246-p.c.VAL:80.75%-taxID:1408224
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
188 ATTTGTCCGAATACGAGACAGAATTAACCAAACGCCGAGCAACCCGCTTCGGCGATTAAGAATTCGTTGATTTTTTTTTATTTTCAAGCAATGCTGATATAAAGGAAGTGAGACTTCCACGATCGATCGGTTACCCCATGATGCTCAGGTCCGCCGCATCTCCTGGGTCGTGGGGTCGGTCGGCTGGCTTCCGACATCCGCGGATTCCTCGTGCCGCAGTCGGAGCCAGCCGACCCCCTTTCAAAACGCCGCTTCAAAAGAGGCGGCGTTT
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
189
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
190 Both examples contain the name of the genome entry and a pairwise similarity value of p.c.VAL:80.75% (query vs. GLASSgo hit) as well as their corresponding taxonomic number taxID:1408224.
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
191
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
192 ]]>
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
193 </help>
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
194 <citations>
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
195 <citation type="bibtex">
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
196 @article{10.3389/fgene.2018.00124,
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
197 author={Lott, Steffen C. and Schäfer, Richard A. and Mann, Martin and Backofen, Rolf and Hess, Wolfgang R. and Voß, Björn and Georg, Jens},
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
198 title={GLASSgo – Automated and Reliable Detection of sRNA Homologs From a Single Input Sequence},
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
199 journal={Frontiers in Genetics},
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
200 volume={9},
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
201 pages={124},
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
202 year={2018},
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
203 url={https://www.frontiersin.org/article/10.3389/fgene.2018.00124},
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
204 doi={10.3389/fgene.2018.00124}
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
205 }
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
206 </citation>
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
207 <citation type="bibtex">
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
208 @article{Raden-2018-websrv,
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
209 author = {Raden, Martin and Ali, Syed M and Alkhnbashi, Omer S and Busch, Anke and Costa, Fabrizio and Davis, Jason A and Eggenhofer, Florian and Gelhausen,
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
210 Rick and Georg, Jens and Heyne, Steffen and Hiller, Michael and Kundu, Kousik and Kleinkauf, Robert and Lott, Steffen C and Mohamed, Mostafa M and Mattheis,
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
211 Alexander and Miladi, Milad and Richter, Andreas S and Will, Sebastian and Wolff, Joachim and Wright, Patrick R and Backofen, Rolf},
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
212 title = {{Freiburg} {RNA} {tools}: a central online resource for {RNA}-focused research and teaching},
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
213 journal = {Nucleic Acids Research},
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
214 volume = {46},
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
215 number = {W1},
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
216 pages = {W25-W29},
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
217 year = {2018},
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
218 doi = {10.1093/nar/gky329}
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
219 }
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
220 </citation>
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
221 </citations>
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
222
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
223
d8237aeeb694 Add missing zenodo link
computationaltranscriptomics
parents:
diff changeset
224 </tool>