Mercurial > repos > fubar > microsatbed
annotate microsatbed.xml @ 23:45f690db0eaf draft
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
author | fubar |
---|---|
date | Wed, 17 Jul 2024 23:19:12 +0000 |
parents | b5acf60b903d |
children | 26e9575c2c83 |
rev | line source |
---|---|
22
b5acf60b903d
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
21
diff
changeset
|
1 <tool name="STR to bed" id="microsatbed" version="1.3.2" profile="22.05"> |
11 | 2 <description>Short Tandem Repeats to bed features from fasta</description> |
3 <requirements> | |
4 <requirement version="3.12.3" type="package">python</requirement> | |
5 <requirement version="2.1.0" type="package">pyfastx</requirement> | |
21
8406413cb4aa
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
20
diff
changeset
|
6 <requirement version="1.3.2" type="package">pytrf</requirement> |
8406413cb4aa
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
20
diff
changeset
|
7 <requirement version="0.2.0" type="package">pybigtools</requirement> |
11 | 8 </requirements> |
9 <required_files> | |
10 <include path="find_str.py"/> | |
11 </required_files> | |
12 <version_command><![CDATA[python -c "import pytrf; from importlib.metadata import version; print(version('pytrf'))"]]></version_command> | |
13 <command><![CDATA[ | |
14 #if $mode_cond.mode == "NATIVE": | |
## NATIVE mode: run the pytrf findstr CLI directly. The output path is quoted like every other path on this command line.
15 #if $reference_genome.genome_type_select == "history": | |
17
264d79548d19
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
16
diff
changeset
|
16 pytrf findstr -f '$mode_cond.outformat' -o '$bed' -r $monomin $dimin $trimin $tetramin $pentamin $hexamin '${reference_genome.fasta}' |
11 | 17 #else: |
17
264d79548d19
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
16
diff
changeset
|
18 pytrf findstr -f '$mode_cond.outformat' -o '$bed' -r $monomin $dimin $trimin $tetramin $pentamin $hexamin '${reference_genome.fasta.fields.path}' |
11 | 19 #end if |
20 #else: | |
21 python '${__tool_directory__}/find_str.py' | |
22 #if $reference_genome.genome_type_select == "history": | |
23 --fasta '${reference_genome.fasta}' | |
24 #else: | |
25 --fasta '${reference_genome.fasta.fields.path}' | |
26 #end if | |
27 --bed '$bed' | |
28 #if $mode_cond.mode == "SPECIFIC": | |
29 --specific '$mode_cond.specific' | |
20
410144c7b2d6
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
19
diff
changeset
|
30 #elif $mode_cond.mode == "SPECIFICBW": |
410144c7b2d6
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
19
diff
changeset
|
31 --bigwig |
410144c7b2d6
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
19
diff
changeset
|
32 --winwidth '$mode_cond.winwidth' |
410144c7b2d6
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
19
diff
changeset
|
33 --specific '$mode_cond.specific' |
11 | 34 #else: |
35 #if "MONO" in $mode_cond.subset: | |
36 --mono | |
37 #end if | |
38 #if "DI" in $mode_cond.subset: | |
39 --di | |
40 #end if | |
41 #if "TRI" in $mode_cond.subset: | |
42 --tri | |
43 #end if | |
44 #if "TETRA" in $mode_cond.subset: | |
45 --tetra | |
46 #end if | |
47 #if "PENTA" in $mode_cond.subset: | |
48 --penta | |
49 #end if | |
50 #if "HEXA" in $mode_cond.subset: | |
51 --hexa | |
52 #end if | |
53 #end if | |
18
607620f93b4c
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
17
diff
changeset
|
54 --monomin '$monomin' |
607620f93b4c
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
17
diff
changeset
|
55 --dimin '$dimin' |
607620f93b4c
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
17
diff
changeset
|
56 --trimin '$trimin' |
607620f93b4c
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
17
diff
changeset
|
57 --tetramin '$tetramin' |
607620f93b4c
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
17
diff
changeset
|
58 --pentamin '$pentamin' |
607620f93b4c
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
17
diff
changeset
|
59 --hexamin '$hexamin' |
20
410144c7b2d6
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
19
diff
changeset
|
## SPECIFICBW already passes --bigwig/--winwidth in its own branch above; ALLBW goes through the
## by-length (#else) branch, so it must get the bigwig flags here to match its declared bigwig output.
60 #if $mode_cond.mode == "ALLBW": |
410144c7b2d6
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
19
diff
changeset
|
61 --bigwig |
410144c7b2d6
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
19
diff
changeset
|
62 --winwidth '$mode_cond.winwidth' |
410144c7b2d6
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
19
diff
changeset
|
63 #end if |
11 | 64 #end if |
65 ]]></command> | |
66 <inputs> | |
67 <conditional name="reference_genome"> | |
68 <param name="genome_type_select" type="select" label="Select a source for fasta sequences to be searched for STRs" help="Options are to choose a built-in genome, or choose any history fasta file"> | |
69 <option value="indexed">Use a Galaxy server built-in reference genome fasta</option> | |
70 <option value="history" selected="True">Use any fasta file from the current history</option> | |
71 </param> | |
72 <when value="indexed"> | |
73 <param name="fasta" type="select" multiple="false" label="Choose a built-in genome" | |
74 help="If the genome you need is not on the list, upload it and select it as a current history fasta"> | |
75 <options from_data_table="all_fasta"/> | |
76 </param> | |
77 </when> | |
78 <when value="history"> | |
79 <param name="fasta" type="data" format="fasta,fasta.gz" optional="false" multiple="false" label="Choose a fasta file from the current history"/> | |
80 </when> | |
81 </conditional> | |
82 <conditional name="mode_cond"> | |
83 <param name="mode" type="select" label="Select patterns by motif length; or provide a specific motif pattern to report?" help="Choose *By length:* or *By pattern:* to configure STR selection mode"> | |
84 <option selected="True" value="ALL">By length: Report all motifs of one or more specified lengths (1-6nt) as bed features</option> | |
20
410144c7b2d6
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
19
diff
changeset
|
85 <option value="ALLBW">By length as windowed bigwig: Report all motifs of one or more specified lengths (1-6nt) as windowed density</option> |
11 | 86 <option value="SPECIFIC">By motif: Report one or more specific motifs (such as TCA,GC) as bed features</option> |
20
410144c7b2d6
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
19
diff
changeset
|
87 <option value="SPECIFICBW">By motif as windowed bigwig: Report one or more specific motifs (such as TCA,GC) as windowed density</option> |
11 | 88 <option value="NATIVE">All exact STR: use the pytrf findstr native command to create a csv, tsv or gff output</option> |
89 </param> | |
90 <when value="ALL"> | |
91 <param name="subset" type="select" multiple="true" optional="false" label="Select at least 1 specific motif length to report" | |
92 help="Bed features will be output for every motif of the selected length(s) with the minimum required repeats or more"> | |
17
264d79548d19
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
16
diff
changeset
|
93 <option value="DI" selected="true">All dimers (AC,AG,AT,...)</option> |
20
410144c7b2d6
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
19
diff
changeset
|
94 <option value="TRI">All trimers (ACG,..)</option> |
23
45f690db0eaf
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
22
diff
changeset
|
95 <option value="TETRA">All tetramers (ACGT,..)</option> |
17
264d79548d19
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
16
diff
changeset
|
96 <option value="PENTA">All pentamers (ACGTC,..)</option> |
264d79548d19
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
16
diff
changeset
|
97 <option value="HEXA">All hexamers (ACGTCG,..)</option> |
264d79548d19
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
16
diff
changeset
|
98 <option value="MONO">All monomers (A,C...). Warning! Can produce overwhelming numbers of bed features</option> |
11 | 99 </param> |
100 </when> | |
20
410144c7b2d6
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
19
diff
changeset
|
101 <when value="ALLBW"> |
410144c7b2d6
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
19
diff
changeset
|
102 <param name="subset" type="select" multiple="true" optional="false" label="Select at least 1 specific motif length to report" |
410144c7b2d6
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
19
diff
changeset
|
103 help="Bed features will be output for every motif of the selected length(s) with the minimum required repeats or more"> |
410144c7b2d6
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
19
diff
changeset
|
104 <option value="DI" selected="true">All dimers (AC,AG,AT,...)</option> |
410144c7b2d6
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
19
diff
changeset
|
105 <option value="TRI">All trimers (ACG,..)</option> |
23
45f690db0eaf
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
22
diff
changeset
|
106 <option value="TETRA">All tetramers (ACGT,..)</option> |
20
410144c7b2d6
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
19
diff
changeset
|
107 <option value="PENTA">All pentamers (ACGTC,..)</option> |
410144c7b2d6
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
19
diff
changeset
|
108 <option value="HEXA">All hexamers (ACGTCG,..)</option> |
410144c7b2d6
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
19
diff
changeset
|
109 <option value="MONO">All monomers (A,C...). Warning! Can produce overwhelming numbers of bed features</option> |
410144c7b2d6
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
19
diff
changeset
|
110 </param> |
410144c7b2d6
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
19
diff
changeset
|
111 <param type="integer" min="5" name="winwidth" label="Window width for estimating STR bigwig density" value="128"/> |
410144c7b2d6
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
19
diff
changeset
|
112 </when> |
11 | 113 <when value="SPECIFIC"> |
114 <param name="specific" type="text" label="Supply a specific motif pattern. Separate multiple patterns with commas such as GA,GC" | |
115 help="Make bed features only for the nominated specific motifs." optional="false"/> | |
116 </when> | |
20
410144c7b2d6
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
19
diff
changeset
|
117 <when value="SPECIFICBW"> |
410144c7b2d6
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
19
diff
changeset
|
118 <param name="specific" type="text" label="Supply a specific motif pattern. Separate multiple patterns with commas such as GA,GC" |
410144c7b2d6
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
19
diff
changeset
|
119 help="Make bed features only for the nominated specific motifs." optional="false"/> |
410144c7b2d6
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
19
diff
changeset
|
120 <param type="integer" min="5" name="winwidth" label="Window width for estimating STR bigwig density" value="128"/> |
410144c7b2d6
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
19
diff
changeset
|
121 </when> |
11 | 122 <when value="NATIVE"> |
123 <param name="outformat" type="select" optional="false" label="Select the required output format" | |
124 help="Pytrf can create GFF, CSV or TSV output files. Documentation is linked in the help section below"> | |
125 <option value="gff" >GFF</option> | |
126 <option value="csv">Comma separated values</option> | |
127 <option value="tsv" selected="true">Tab separated values</option> | |
128 </param> | |
129 </when> | |
130 </conditional> | |
17
264d79548d19
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
16
diff
changeset
|
131 <param type="integer" min="2" name="monomin" value="10" label="Minimum number of repeats required to report a monomer motif"/> |
264d79548d19
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
16
diff
changeset
|
132 <param type="integer" min="1" name="dimin" value="3" label="Minimum number of repeats required to report a dimer motif"/> |
264d79548d19
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
16
diff
changeset
|
133 <param type="integer" min="2" name="trimin" value="2" label="Minimum number of repeats required to report a trimer motif"/> |
264d79548d19
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
16
diff
changeset
|
134 <param type="integer" min="2" name="tetramin" value="2" label="Minimum number of repeats required to report a tetramer motif"/> |
264d79548d19
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
16
diff
changeset
|
135 <param type="integer" min="2" name="pentamin" value="2" label="Minimum number of repeats required to report a pentamer motif"/> |
264d79548d19
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
16
diff
changeset
|
136 <param type="integer" min="2" name="hexamin" value="2" label="Minimum number of repeats required to report a hexamer motif"/> |
11 | 137 </inputs> |
138 <outputs> | |
139 <data name="bed" format="bed" label="STR from $fasta.element_identifier" hidden="false"> | |
140 <change_format> | |
141 <when input="mode_cond.outformat" value="gff" format="gff" /> | |
142 <when input="mode_cond.outformat" value="csv" format="csv" /> | |
143 <when input="mode_cond.outformat" value="tsv" format="tabular" /> | |
20
410144c7b2d6
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
19
diff
changeset
|
144 <when input="mode_cond.mode" value="ALLBW" format="bigwig" /> |
410144c7b2d6
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
19
diff
changeset
|
145 <when input="mode_cond.mode" value="SPECIFICBW" format="bigwig" /> |
11 | 146 </change_format> |
147 </data> | |
148 </outputs> | |
149 <tests> | |
150 <test expect_num_outputs="1"> | |
151 <conditional name="reference_genome"> | |
152 <param name="genome_type_select" value="history"/> | |
153 <param name="fasta" value="humsamp.fa"/> | |
154 </conditional> | |
155 <conditional name="mode_cond"> | |
156 <param name="mode" value="ALL"/> | |
157 <param name="subset" value="DI,TRI,TETRA,PENTA,HEXA"/> | |
158 </conditional> | |
17
264d79548d19
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
16
diff
changeset
|
159 <param name="monomin" value="20"/> |
19
db5523378e5c
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
18
diff
changeset
|
160 <param name="dimin" value="20"/> |
db5523378e5c
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
18
diff
changeset
|
161 <param name="trimin" value="5"/> |
db5523378e5c
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
18
diff
changeset
|
162 <param name="tetramin" value="5"/> |
db5523378e5c
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
18
diff
changeset
|
163 <param name="pentamin" value="3"/> |
17
264d79548d19
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
16
diff
changeset
|
164 <param name="hexamin" value="2"/> |
11 | 165 <output name="bed" value="bed_sample" compare="diff" lines_diff="0"/> |
166 </test> | |
167 <test expect_num_outputs="1"> | |
168 <conditional name="reference_genome"> | |
169 <param name="genome_type_select" value="history"/> | |
170 <param name="fasta" value="humsamp.fa"/> | |
171 </conditional> | |
172 <conditional name="mode_cond"> | |
173 <param name="mode" value="SPECIFIC"/> | |
174 <param name="specific" value="GC"/> | |
175 </conditional> | |
17
264d79548d19
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
16
diff
changeset
|
176 <param name="monomin" value="20"/> |
264d79548d19
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
16
diff
changeset
|
177 <param name="dimin" value="1"/> |
264d79548d19
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
16
diff
changeset
|
178 <param name="trimin" value="20"/> |
264d79548d19
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
16
diff
changeset
|
179 <param name="tetramin" value="20"/> |
264d79548d19
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
16
diff
changeset
|
180 <param name="pentamin" value="20"/> |
264d79548d19
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
16
diff
changeset
|
181 <param name="hexamin" value="20"/> |
11 | 182 <output name="bed" value="dibed_sample" compare="diff" lines_diff="0"/> |
183 </test> | |
184 <test expect_num_outputs="1"> | |
185 <conditional name="reference_genome"> | |
186 <param name="genome_type_select" value="history"/> | |
187 <param name="fasta" value="mouse.fa"/> | |
188 </conditional> | |
189 <conditional name="mode_cond"> | |
190 <param name="mode" value="NATIVE"/> | |
191 <param name="outformat" value="gff"/> | |
192 </conditional> | |
17
264d79548d19
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
16
diff
changeset
|
193 <param name="monomin" value="20"/> |
264d79548d19
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
16
diff
changeset
|
194 <param name="dimin" value="10"/> |
264d79548d19
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
16
diff
changeset
|
195 <param name="trimin" value="5"/> |
264d79548d19
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
16
diff
changeset
|
196 <param name="tetramin" value="4"/> |
264d79548d19
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
16
diff
changeset
|
197 <param name="pentamin" value="4"/> |
264d79548d19
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
16
diff
changeset
|
198 <param name="hexamin" value="2"/> |
11 | 199 <output name="bed" value="nativegff_sample" compare="diff" lines_diff="0"/> |
200 </test> | |
20
410144c7b2d6
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
19
diff
changeset
|
201 <test expect_num_outputs="1"> |
410144c7b2d6
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
19
diff
changeset
|
202 <conditional name="reference_genome"> |
410144c7b2d6
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
19
diff
changeset
|
203 <param name="genome_type_select" value="history"/> |
410144c7b2d6
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
19
diff
changeset
|
204 <param name="fasta" value="humsamp.fa"/> |
410144c7b2d6
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
19
diff
changeset
|
205 </conditional> |
410144c7b2d6
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
19
diff
changeset
|
206 <conditional name="mode_cond"> |
410144c7b2d6
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
19
diff
changeset
|
207 <param name="mode" value="SPECIFICBW"/> |
410144c7b2d6
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
19
diff
changeset
|
208 <param name="specific" value="GC"/> |
410144c7b2d6
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
19
diff
changeset
|
209 </conditional> |
410144c7b2d6
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
19
diff
changeset
|
210 <param name="monomin" value="20"/> |
410144c7b2d6
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
19
diff
changeset
|
211 <param name="dimin" value="1"/> |
410144c7b2d6
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
19
diff
changeset
|
212 <param name="trimin" value="20"/> |
410144c7b2d6
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
19
diff
changeset
|
213 <param name="tetramin" value="20"/> |
410144c7b2d6
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
19
diff
changeset
|
214 <param name="pentamin" value="20"/> |
410144c7b2d6
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
19
diff
changeset
|
215 <param name="hexamin" value="20"/> |
410144c7b2d6
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
19
diff
changeset
|
216 <output name="bed" value="dibed_wig_sample" compare="sim_size" delta="10"/> |
410144c7b2d6
planemo upload for repository https://github.com/fubar2/microsatbed commit d952bc313f408735456747c3d33e09a3170c8f59-dirty
fubar
parents:
19
diff
changeset
|
217 </test> |
11 | 218 </tests> |
219 <help><![CDATA[ | |
220 | |
221 **Convert short repetitive sequences to bed features** | |
222 | |
223 Microsatellites are usually defined as repeated short DNA patterns in an unbroken sequence. | |
224 A microsatellite pattern or *motif* can be any combination of nucleotides, typically from 1 to 6nt in length. | |
225 | |
226 This tool allows microsatellite and related features to be selected from a fasta sequence input file, and output into a single bed track, suitable for viewing in a genome browser such as JBrowse2. | |
227 | |
228 All motifs of selected lengths can be reported as individual features in the output bed file, or specific motifs can be provided and all | |
229 others will be ignored. In all cases, a minimum required number of repeats can be specified. For example, requiring 2 or more repeats of the trimer *ACG* will report | |
230 every sequence of *ACGACG* or *ACGACGACG* or *ACGACGACGACG* and so on, as individual bed features. Similarly, requiring 3 repeats of any trimer will | |
231 report every distinct 3 nucleotide pattern, including *ACGACGACG* as well as every other unique 3 nucleotide pattern with 3 or more sequential repeats, such as *CTCCTCCTC*. | |
232 | |
233 For other output formats, the pytrf native command line *findstr* can be used to produce a gff, csv or tsv output containing all exact short tandem repeats, as | |
234 described at the end of https://pytrf.readthedocs.io/en/latest | |
235 | |
236 A fasta file must be supplied for processing. A built in genome can be selected, or a fasta file of any kind can be selected from the current history. Note that all | |
237 symbols are treated as valid nucleotides by pytrf, so extraneous characters such as *-* or *N* in the input fasta may appear as unexpected bed features. Lower case fasta symbols will be converted | |
238 to uppercase, to prevent them being reported as distinct motifs. | |
239 | |
240 | |
241 **Select motifs by length** | |
242 | |
243 The default tool form setting is to select all dimer motif patterns. | |
244 | |
245 Additional motif lengths from 1 to 6nt can be selected in the multiple-select drop-down list. All features will be returned in a single bed file. For each selected motif length, | |
246 the minimum number of repeats required for reporting can be adjusted. **Tandem repeats** are defined as at least 2 of any pattern. This tool allows singleton motifs to be reported, | |
247 so is not restricted to short tandem repeats (STR). | |
248 | |
249 **Select motifs by pattern** | |
250 | |
251 This option allows a motif pattern to be specified as a text string such as *CG* or *ATC*. Multiple motifs can be specified as a comma separated string such as *CG,ATC*. | |
252 All features will be returned as a single bed file. | |
253 | |
254 The minimum number of repeats for all motifs can be set to match specific requirements. | |
255 | |
256 For example, technical sequencing read bias may be influenced by the density of specific dimers, whether they are repeated or not | |
257 such as in https://github.com/arangrhie/T2T-Polish/tree/master/pattern | |
258 | |
259 **Select all perfect STR using pytrf findstr in csv, tsv or gff output format** | |
260 | |
261 This selection runs the pytrf *findstr* option to create gff/csv/tsv outputs as described at the end of https://pytrf.readthedocs.io/en/latest/. | |
262 | |
263 Quoted here: | |
264 | |
265 *A Tandem repeat (TR) in genomic sequence is a set of adjacent short DNA sequence repeated consecutively. The core sequence or repeat unit is generally called motif. | |
266 According to the motif length, tandem repeats can be classified as microsatellites and minisatellites. Microsatellites are also known as simple sequence repeats (SSRs) | |
267 or short tandem repeats (STRs) with motif length of 1-6 bp. Minisatellites are also sometimes referred to as variable number of tandem repeats (VNTRs) has longer motif length than microsatellites. | |
268 Pytrf is a lightweight Python C extension for identification of tandem repeats. The pytrf enables to fastly identify both exact or perfect SSRs. | |
269 It also can find generic tandem repeats with any size of motif, such as with maximum motif length of 100 bp. Additionally, it has capability of finding approximate or imperfect tandem repeats* | |
270 | |
271 ]]></help> | |
272 <citations> | |
273 <citation type="bibtex">@misc{pytrf, | |
274 title = {{pytrf} Short tandem repeat finder, Accessed on July 10 2024}, | |
275 howpublished = {\url{https://github.com/lmdu/pytrf}}, | |
276 note = {Accessed on July 10 2024} | |
277 }</citation> | |
278 </citations> | |
279 </tool> | |
280 |