comparison meme_psp_gen.xml @ 0:a0fa4efeeee3 draft

planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/meme commit 3f116ddc83447056068573320c148a9bfca9aa2e
author iuc
date Wed, 23 Aug 2017 20:57:34 -0400
parents
children b48e673af4e8
comparison
equal deleted inserted replaced
-1:000000000000 0:a0fa4efeeee3
1 <tool id="meme_psp_gen" name="MEME psp-gen" version="@WRAPPER_VERSION@.0">
2 <description>- perform discriminative motif discovery</description>
3 <macros>
4 <import>macros.xml</import>
5 </macros>
6 <expand macro="requirements" />
7 <command detect_errors="exit_code"><![CDATA[
8 psp-gen
9 -pos '$primary_sequence'
10 -neg '$control_sequence'
11 -minw $adv.minw
12 -maxw $adv.maxw
13 $adv.alphabet
14 #if str($adv.triples_cond.triples) == 'yes':
15 -triples
16 $adv.triples_cond.fixedstart
17 #end if
18 $adv.equiv
19 $adv.revcomp
20 $adv.scalemin
21 $adv.scalemax
22 $adv.maxrange
23 $adv.raw
24 #if str($adv.report_scores_cond.report_scores) == 'yes':
25 -reportscores
26 $adv.report_scores_cond.verbose
27 2> '$output_tabular'
28 #end if
29 > '$output_psp'
30 ]]></command>
31 <inputs>
32 <param format="fasta" name="primary_sequence" type="data" label="Primary sequence file"/>
33 <param format="fasta" name="control_sequence" type="data" label="Control sequence file"/>
34 <section name="adv" title="Additional Options">
35 <param argument="-minw" type="integer" value="4" min="0" label="Minimum width to use for position specific priors"/>
36 <param argument="-maxw" type="integer" value="20" min="0" label="Maximum width to use for position specific priors"/>
37 <param name="alphabet" type="select" label="Alphabet">
38 <option value="-dna" selected="true">DNA</option>
39 <option value="-protein">protein</option>
40 <option value="-rna">RNA</option>
41 </param>
42 <conditional name="triples_cond">
43 <param name="triples" type="select" label="Use spaced triples instead of whole-word matches?" help="Recommended for protein">
44 <option value="no" selected="true">No</option>
45 <option value="yes">yes</option>
46 </param>
47 <when value="no"/>
48 <when value="yes">
49 <param argument="-fixedstart" type="boolean" truevalue="-fixedstart" falsevalue="" checked="False" label="Allow triples to start anywhere within a site?" help="Select 'No' to only consider triples starting at the start of the site"/>
50 </when>
51 </conditional>
52 <param argument="-equiv" type="boolean" truevalue="-equiv" falsevalue="" checked="False" label="Match as equal sequences of letters that appear together?"/>
53 <param argument="-revcomp" type="boolean" truevalue="-revcomp" falsevalue="" checked="False" label="Consider both strands when calculating position specific priors for alphabets?"/>
54 <param argument="-scalemin" type="boolean" truevalue="-scalemin" falsevalue="" checked="False" label="Set the lowest score value after scaling?"/>
55 <param argument="-scalemax" type="boolean" truevalue="-scalemax" falsevalue="" checked="False" label="Set the highest score value after scaling?"/>
56 <param argument="-maxrange" type="boolean" truevalue="-maxrange" falsevalue="" checked="False" label="Choose the width with the biggest difference between minimum and maximum scores before scaling?" help="Select 'No' to choose the width with the biggest maximum score (before scaling)"/>
57 <param argument="-raw" type="boolean" truevalue="-raw" falsevalue="" checked="False" label="Output scores instead of priors?"/>
58 <conditional name="report_scores_cond">
59 <param name="report_scores" type="select" label="Output primary and control file names, scores and widths?">
60 <option value="no" selected="true">No</option>
61 <option value="yes">yes</option>
62 </param>
63 <when value="no"/>
64 <when value="yes">
65 <param argument="-verbose" type="boolean" truevalue="-verbose" falsevalue="" checked="False" label="Report frequency of each score?"/>
66 </when>
67 </conditional>
68 </section>
69 <param name="non_commercial_use" label="I certify that I am not using this tool for commercial purposes." type="boolean" truevalue="NON_COMMERCIAL_USE" falsevalue="COMMERCIAL_USE" checked="False">
70 <validator type="expression" message="This tool is only available for non-commercial use.">value == True</validator>
71 </param>
72 </inputs>
73 <outputs>
74 <data format="memepsp" name="output_psp"/>
75 <data format="tabular" name="output_tabular" label="${tool.name} (report) on ${on_string}">
76 <filter>adv['report_scores_cond']['report_scores'] == 'yes'</filter>
77 </data>
78 </outputs>
79 <tests>
80 <test>
81 <param name="primary_sequence" value="meme_psp_protein_input.fasta" ftype="fasta"/>
82 <param name="control_sequence" value="meme_psp_protein_input.fasta" ftype="fasta"/>
83 <param name="alphabet" value="protein"/>
84 <param name="report_scores" value="yes"/>
85 <param name="verbose" value="-verbose"/>
86 <param name="non_commercial_use" value="NON_COMMERCIAL_USE"/>
87 <output name="output_psp" file="output.memepsp"/>
88 <output name="output_tabular" file="meme_psp_gen_reports_output.tabular" compare="contains"/>
89 </test>
90 </tests>
91 <help>
92
93 .. class:: warningmark
94
95 **WARNING: This tool is only available for non-commercial use. Use for educational, research and non-profit purposes is permitted.
96 Before using, be sure to review, agree, and comply with the license.**
97
98 psp-gen is used to allow MEME to perform discriminative motif discovery—to find motifs overrepresented in one set of sequences compared to in another set.
99 It takes two files as input—the sequence file to be input to MEME, (the "primary" file) and a "control" sequence file of sequences believed not to contain
100 the same motifs as in the "primary" file. psp-gen creates a file for use by MEME that encapsulates information about probable discriminative motifs. psp-gen
101 records its chosen motif width in the file, and MEME is able to adjust the data when it tries different motif widths.
102
103 .. class:: infomark
104
105 For detailed information on psp-gen, click here_, or view the license_.
106
107 .. _here: http://meme-suite.org/doc/psp-gen.html?man_type=web
108 .. _license: http://meme-suite.org/doc/copyright.html?man_type=web
109
110 -----
111
112 **Required options**
113
114 * **Primary sequence file** - a file containing FASTA formatted sequences which are to be used as the primary set in PSP calculation.
115 * **Control sequence file** - a file containing FASTA formatted sequences which are to be used as the control set in PSP calculation.
116
117 **Additional options**
118
119 * **Minimum width to use for position specific priors** - the minimum width to use with selecting the "best" width for PSPs.
120 * **Maximum width to use for position specific priors** - the maximum width to use with selecting the "best" width for PSPs.
121 * **Alphabet** - The alphabet to be used, one of DNA, protein or RNA.
122 * **Use spaced triples instead of whole-word matches** - use spaced triples instead of whole-word matches (recommended when using the protein alphabet).
123
124 * **Allow triples to start anywhere within a site** - when using the -triples option, select 'Yes' to only consider triples starting at the start of the site or 'No' to allow triples to start anywhere in a width 'w' site.
125
126 * **Match as equal sequences of letters that appear together** - select 'Yes' to match as equal any sequence of letter that appears together. Separate letter groups using "-" (e.g. -equiv "IVL-HKR") means treat all occurrences of I, V or L as the same, and all occurrences of H, K or R as the same.
127 * **Consider both strands when calculating position specific priors for alphabets** - select 'Yes' to consider both strands when calculating PSPs for complementable alphabets or 'No to consider only the given strand.
128 * **Set the lowest score value after scaling** - select 'Yes' to set the lowest score to 0.1 unless the the following "highest score" option is selected, in which case the lowest score is highest score - 1.
129 * **Set the highest score value after scaling** - select 'Yes' to set the highest score to 0.9 unless the previous "lowest score" option is selected, in which case the highest score is lowest score + 1.
130 * **Choose the width with the biggest difference between minimum and maximum scores before scaling** - select 'Yes' to choose the width with the biggest difference between minimum and maximum scores before scaling, or 'No' to choose the width with the biggest maximum score before scaling.
131 * **Output scores instead of priors** - select 'Yes' to output scores instead of position specific priors.
132 * **Output primary and control file names, scores and widths** - select 'Yes' to produce an additional tabular output consisting of control file names, lowest and highest scores and lowest and highest widths.
133
134 * **Report frequency of each score** - select 'Yes' to include the frequency of each score in the output.
135
136 </help>
137 <citations>
138 <citation type="doi">10.1186/1471-2105-11-179</citation>
139 </citations>
140 </tool>