annotate mdust.xml @ 2:79feb4eb7832 draft default tip

Uploaded
author urgi-team
date Wed, 18 Nov 2015 10:51:42 -0500
parents cc6db1ee2d48
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
1 <?xml version="1.0"?>
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
2 <tool id="mdust" name="mdust" version="1.0">
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
3 <description>fast and symmetric DUST implementation to mask low-complexity DNA sequences</description>
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
4 <requirements>
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
5 <requirement type="package" version="1.0">mdust</requirement>
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
6 </requirements>
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
7 <command interpreter="python">
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
8 mdust_wrapper.py -i ${input_file} -v ${cutoff} -w ${wsize} -m ${masking_letter.masking_letter_selector} -f ${output_type.output_type_selector}
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
9
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
10 #if str( $output_type.output_type_selector) == "default"
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
11 -o ${output_masked_fasta}
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
12 #end if
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
13
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
14 #if str( $output_type.output_type_selector) == "tab"
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
15 -o ${output_tab}
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
16 #end if
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
17
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
18 #if str( $output_type.output_type_selector) == "bed"
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
19 -o ${output_bed}
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
20 #end if
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
21 </command>
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
22 <inputs>
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
23 <param name="input_file" type="data" format="fasta" label="Input fasta file" help=""/>
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
24 <param name="cutoff" type="integer" value="28" label="cut-off" help="cut-off" />
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
25 <param name="wsize" type="integer" value="3" label="set maximum word size" help="word-size" />
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
26 <conditional name="masking_letter">
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
27 <param name="masking_letter_selector" type="select" label="Choose your masking type" help="Select the masking letter (N,X or lowercase)" >
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
28 <option value="N" selected="True">N (default)</option>
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
29 <option value="X">X</option>
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
30 <option value="L">lowercase</option>
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
31 </param>
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
32 </conditional>
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
33 <conditional name="output_type">
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
34 <param name="output_type_selector" type="select" label="Choose your output type" help="select your output">
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
35 <option value="default" selected="True">masked file (default)</option>
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
36 <option value="tab">output masking coordinates only (tab delimited)</option>
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
37 <option value="bed">output masking coordinates only (bed format)</option>
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
38 </param>
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
39 </conditional>
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
40 </inputs>
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
41 <outputs>
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
42 <data format="fasta" name="output_masked_fasta" label="masked.${input_file.name}">
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
43 <filter>( output_type['output_type_selector'] == 'default' )</filter>
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
44 </data>
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
45 <data format="tabular" name="output_tab" label="${input_file.name}.tab">
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
46 <filter>( output_type['output_type_selector'] == 'tab' )</filter>
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
47 </data>
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
48 <data format="bed" name="output_bed" label="${input_file.name}.bed">
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
49 <filter>( output_type['output_type_selector'] == 'bed' )</filter>
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
50 </data>
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
51 </outputs>
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
52 <tests>
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
53 <test>
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
54 <param name="input_file" value="seq-mdust.fsa" />
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
55 <output name="output_masked_fasta" file="masked-seq-mdust.fsa" ftype="fasta" />
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
56 </test>
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
57 </tests>
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
58 <help><![CDATA[
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
59 mdust is a new implementation of the DUST module that uses the same function to assign a complexity score to a sequence, but applies a different rule to decide which high-scoring sequences are masked.
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
60
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
61 -----
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
62
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
63 **Usage:** ::
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
64
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
65 mdust [<fasta-file>] [-w <wsize>] [-v <cut-off>] [-m N|X|L] [-c]
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
66 if no <fasta-file> is given, a multi-fasta stream is expected at stdin
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
67 -v default <cut-off> value is 28 (lower values might mask more,
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
68 but possibly still useful sequence; > 64 will rarely mask poly-triplets)
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
69 -w set maximum word size to <wsize> (default 3)
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
70 -m if fasta output is not disabled by -c, set the masking letter type:
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
71 N ('N', default), X ('X'), L (make lowercase)
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
72 -c output masking coordinates only:
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
73 seq_name, seqlength, mask_start, mask_end (tab delimited)
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
74
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
75 -----
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
76
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
77 **Reference:** ::
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
78
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
79 A fast and symmetric DUST implementation to mask low-complexity DNA sequences.
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
80 Morgulis A, Gertz EM, Schäffer AA, Agarwala R.
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
81 J Comput Biol. 2006 Jun;13(5):1028-40.
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
82 PMID:16796549
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
83
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
84
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
85 ]]>
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
86 </help>
cc6db1ee2d48 Uploaded
urgi-team
parents:
diff changeset
87 </tool>