comparison DimontWeb.xml @ 0:5130880b8e0a draft

Uploaded
author grau
date Tue, 12 Nov 2013 12:55:52 -0500
parents
children
comparison
equal deleted inserted replaced
-1:000000000000 0:5130880b8e0a
1 <tool id="Dimont" name="Dimont" version="0.1" force_history_refresh="true">
2 <description>- a universal tool for de-novo motif discovery.</description>
3 <command>java -Xms256M -Xmx2G -jar \$JAR_PATH/DimontWeb.jar --run $script_file $summary $summary.id $__new_file_path__ $summary.extra_files_path</command> <!-- Launches DimontWeb.jar from the directory named by the JAR_PATH environment variable (declared under requirements) with a 256 MB initial and 2 GB maximum Java heap. Arguments after the run flag: the generated script_file configfile, the summary output, the summary id, the new-file path and the extra-files path of summary. -->
4 <inputs> <!-- User-facing parameters. Dimont_jobname is only used for the output label; every Dimont_ps_* parameter is substituted into the script_file configfile. Numeric parameters carry an in_range validator whose bounds are repeated in its message. -->
5 <param type="text" size="40" name="Dimont_jobname" label="Job name" value="" optional="true" help="Please enter a name for your job that should be used in the history (optional)">
6 </param>
7 <param type="data" format="fasta" name="Dimont_ps_Input_sequences" label="&lt;hr /&gt;Input sequences" help="The input sequences for de-novo motif discovery (can be uploaded using &quot;GetData&quot; -&gt; &quot;Upload File&quot;), annotated FastA format. The required format is described in the help section." value="" optional="false">
8 </param>
9
10 <param type="text" size="40" name="Dimont_ps_Position_tag" label="Position tag" help="The tag for the position information in the FastA-annotation of the input file" value="" optional="false">
11 </param>
12
13 <param type="text" size="40" name="Dimont_ps_Value_tag" label="Value tag" help="The tag for the value information in the FastA-annotation of the input file" value="" optional="false">
14 </param>
15
16 <param type="float" name="Dimont_ps_Standard_deviation" label="Standard deviation" help="The standard deviation of the position distribution centered at the position specified by the position tag" value="75.0" optional="false">
17 <validator type="in_range" min="1.0" max="10000.0" message="Value is not in the specified range [1.0, 10000.0]."/></param>
18
19 <param type="text" size="40" name="Dimont_ps_Weighting_factor" label="Weighting factor" help="The value for weighting the data; either a value between 0 and 1, or a description relative to the standard deviation (e.g. +4sd)" value="0.2" optional="false">
20 </param>
21
22 <param type="integer" name="Dimont_ps_Starts" label="&lt;hr /&gt;Starts" help="The number of pre-optimization runs." value="20" optional="false">
23 <validator type="in_range" min="1" max="100" message="Value is not in the specified range [1, 100]."/></param>
24
25 <param type="integer" name="Dimont_ps_Initial_motif_width" label="&lt;hr /&gt;Initial motif width" help="The motif width that is used initially, may be adjusted during optimization." value="15" optional="false">
26 <validator type="in_range" min="1" max="50" message="Value is not in the specified range [1, 50]."/></param>
27
28 <param type="integer" name="Dimont_ps_Markov_order_of_motif_model" label="Markov order of motif model" help="The Markov order of the model for the motif." value="0" optional="false">
29 <validator type="in_range" min="0" max="3" message="Value is not in the specified range [0, 3]."/></param>
30
31 <param type="integer" name="Dimont_ps_Markov_order_of_background_model" label="Markov order of background model" help="The Markov order of the model for the background sequence, -1 defines uniform distribution." value="-1" optional="false">
32 <validator type="in_range" min="-1" max="5" message="Value is not in the specified range [-1, 5]."/></param>
33
34 <param type="float" name="Dimont_ps_Equivalent_sample_size" label="&lt;hr /&gt;Equivalent sample size" help="Reflects the strength of the prior on the model parameters." value="4.0" optional="false">
35 <validator type="in_range" min="0.0" max="Infinity" message="Value is not in the specified range [0.0, Infinity]."/></param>
36
37 <param type="boolean" name="Dimont_ps_Delete_BSs_from_profile" label="Delete BSs from profile" help="A switch for deleting binding site positions of discovered motifs from the profile before searching for further motifs." checked="True" optional="false">
38 </param>
39
40 </inputs>
41 <requirements> <!-- Runtime prerequisites: the JAR_PATH environment variable (referenced by the command line as \$JAR_PATH) and a java binary declared with version >=1.6. -->
42 <requirement type="set_environment">JAR_PATH</requirement>
43 <requirement type="binary" version=">=1.6">java</requirement>
44 </requirements>
45 <configfiles> <!-- Defines script_file, the parameter file handed to the command line as $script_file. Its content is a set of entity-escaped tags, one per Dimont_ps_* input, each wrapping the substituted parameter value; the input dataset additionally records its extension. -->
46 <configfile name="script_file">
47 &lt;Dimont_ps_Input_sequences&gt;
48 &lt;value&gt;
49 ${Dimont_ps_Input_sequences}&lt;/value&gt;
50 &lt;extension&gt;
51 ${Dimont_ps_Input_sequences.ext}&lt;/extension&gt;
52 &lt;/Dimont_ps_Input_sequences&gt;
53
54 &lt;Dimont_ps_Position_tag&gt;
55 ${Dimont_ps_Position_tag}&lt;/Dimont_ps_Position_tag&gt;
56
57 &lt;Dimont_ps_Value_tag&gt;
58 ${Dimont_ps_Value_tag}&lt;/Dimont_ps_Value_tag&gt;
59
60 &lt;Dimont_ps_Standard_deviation&gt;
61 ${Dimont_ps_Standard_deviation}&lt;/Dimont_ps_Standard_deviation&gt;
62
63 &lt;Dimont_ps_Weighting_factor&gt;
64 ${Dimont_ps_Weighting_factor}&lt;/Dimont_ps_Weighting_factor&gt;
65
66 &lt;Dimont_ps_Starts&gt;
67 ${Dimont_ps_Starts}&lt;/Dimont_ps_Starts&gt;
68
69 &lt;Dimont_ps_Initial_motif_width&gt;
70 ${Dimont_ps_Initial_motif_width}&lt;/Dimont_ps_Initial_motif_width&gt;
71
72 &lt;Dimont_ps_Markov_order_of_motif_model&gt;
73 ${Dimont_ps_Markov_order_of_motif_model}&lt;/Dimont_ps_Markov_order_of_motif_model&gt;
74
75 &lt;Dimont_ps_Markov_order_of_background_model&gt;
76 ${Dimont_ps_Markov_order_of_background_model}&lt;/Dimont_ps_Markov_order_of_background_model&gt;
77
78 &lt;Dimont_ps_Equivalent_sample_size&gt;
79 ${Dimont_ps_Equivalent_sample_size}&lt;/Dimont_ps_Equivalent_sample_size&gt;
80
81 &lt;Dimont_ps_Delete_BSs_from_profile&gt;
82 ${Dimont_ps_Delete_BSs_from_profile}&lt;/Dimont_ps_Delete_BSs_from_profile&gt;
83
84 </configfile>
85 </configfiles>
86 <outputs> <!-- Single HTML output named summary. Its history label is the Dimont_jobname value when one was entered, otherwise the tool name followed by ' on ' and $on_string. -->
87 <data format="html" name="summary" label="#if str($Dimont_jobname) == '' then $tool.name + ' on ' + $on_string else $Dimont_jobname#">
88 </data>
89 </outputs>
90 <tests> <!-- One functional test: runs on dimont_test.fasta with tags peakSummit and maxT, leaves every other parameter at the default declared under inputs, and compares the summary output against Test/Test_html.html. -->
91 <test>
92 <param name="Dimont_jobname" value="Test" />
93 <param name="Dimont_ps_Input_sequences" value="dimont_test.fasta" />
94 <param name="Dimont_ps_Position_tag" value="peakSummit" />
95 <param name="Dimont_ps_Value_tag" value="maxT" />
96 <param name="Dimont_ps_Standard_deviation" value="75.0" />
97 <param name="Dimont_ps_Weighting_factor" value="0.2" />
98 <param name="Dimont_ps_Starts" value="20" />
99 <param name="Dimont_ps_Initial_motif_width" value="15" />
100 <param name="Dimont_ps_Markov_order_of_motif_model" value="0" />
101 <param name="Dimont_ps_Markov_order_of_background_model" value="-1" />
102 <param name="Dimont_ps_Equivalent_sample_size" value="4.0" />
103 <param name="Dimont_ps_Delete_BSs_from_profile" value="True" />
104 <output name="summary" file="Test/Test_html.html" />
105 </test>
106 </tests>
107 <help>
108 **Dimont** is a universal tool for de-novo motif discovery. Dimont has successfully been applied to ChIP-seq, ChIP-exo and protein-binding microarray (PBM) data.
109
110 Input sequences must be supplied in an annotated FastA format as a file uploaded by the "Upload File" task in section "Get Data" of Galaxy or generated using the "Dimont Data Extractor" tool.
111 In the annotation of each sequence, you need to provide a value that reflects the confidence that this sequence is bound by the factor of interest.
112 Such confidences may be peak statistics (e.g., number of fragments under a peak) for ChIP data or signal intensities for PBM data. In addition, you need to provide an anchor position within the sequence.
113 In case of ChIP data, this anchor position could for instance be the peak summit.
114 For instance, an annotated FastA file for ChIP-exo data comprising sequences of length 100 centered around the peak summit could look like::
115
116 > peak: 50; signal: 515
117 ggccatgtgtatttttttaaatttccac...
118 > peak: 50; signal: 199
119 GGTCCCCTGGGAGGATGGGGACGTGCTG...
120 ...
121
122 where the anchor point is given as 50 for the first two sequences, and the confidence amounts to 515 and 199, respectively.
123 The FastA comment may contain additional annotations of the format ``key1 : value1; key2: value2;...``.
124 We also provide an example_ input file and a Perl script_ for preparing data in the format required by Dimont.
125
126 Accordingly, you would need to set the parameter "Position tag" to ``peak`` and the parameter "Value tag" to ``signal`` for the input file.
127
128 For the standard deviation of the position prior, the initial motif length and the number of pre-optimization runs, we provide default values that worked well in our studies on ChIP and PBM data.
129 However, you may want to adjust these parameters to meet your prior information.
130
131 The parameter "Markov order of the motif model" sets the order of the inhomogeneous Markov model used for modeling the motif. If this parameter is set to ``0``, you obtain a position weight matrix (PWM) model.
132 If it is set to ``1``, you obtain a weight array matrix (WAM) model. You can set the order of the motif model to at most ``3``.
133
134 The parameter "Markov order of the background model" sets the order of the homogeneous Markov model used for modeling positions not covered by a motif.
135 If this parameter is set to ``-1``, you obtain a uniform distribution, which worked well for ChIP data. For PBM data, orders of up to ``4`` resulted in an increased prediction performance in our case studies. The maximum allowed value is ``5``.
136
137 The parameter "Weighting factor" defines the proportion of sequences that you expect to be bound by the targeted factor with high confidence. For ChIP data, the default value of ``0.2`` typically works well.
138 For PBM data, containing a large number of unspecific probes, this parameter should be set to a lower value, e.g. ``0.01``.
139
140 The "Equivalent sample size" reflects the strength of the influence of the prior on the model parameters, where higher values smooth out the parameters to a greater extent.
141
142 The parameter "Delete BSs from profile" defines if BSs of already discovered motifs should be deleted, i.e., "blanked out", from the sequence before searching for further motifs.
143
144 You can also install this web-application within your local Galaxy server. Instructions can be found at the Dimont_ page of Jstacs.
145 There you can also download a command line version of Dimont.
146
147 If you experience problems using Dimont, please contact_ us.
148
149 .. _example: http://www.jstacs.de/downloads/dimont-example.fa
150 .. _script: http://www.jstacs.de/index.php/Dimont#Data_preparation
151 .. _Dimont: http://jstacs.de/index.php/Dimont
152 .. _contact: mailto:grau@informatik.uni-halle.de
153 </help>
154 </tool>
155