annotate TEdenovo.xml @ 0:baea09e6722b draft default tip

1st Uploaded
author vmarcon
date Mon, 06 Feb 2017 13:31:53 -0500
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
1 <tool id="tedenovo" name="REPET Lite - TEdenovo" version="2.2.0">
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
2
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
3 <!-- [REQUIRED] Tool description displayed after the tool name -->
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
4 <description> Compute a library of transposable element</description>
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
5
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
6 <!-- [OPTIONAL] 3rd party tools, binaries, modules... required for the tool to work -->
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
7 <requirements>
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
8 <requirement type="binary">python</requirement>
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
9 <requirement type="package" version="2.5">repet</requirement>
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
10 </requirements>
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
11
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
12 <!-- [STRONGLY RECOMMENDED] Exit code rules -->
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
13 <stdio>
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
14 <!-- Anything other than zero is an error -->
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
15 <exit_code range="1:" level="fatal"/>
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
16 <exit_code range=":-1" level="fatal"/>
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
17
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
18 </stdio>
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
19
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
20 <!-- [OPTIONAL] Command to be executed to get the tool's version string -->
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
21 <version_command>
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
22 TEdenovo.py --version
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
23 </version_command>
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
24
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
25 <!-- [REQUIRED] The command to execute. Every Galaxy variable is single-quoted so that a path or value containing spaces or shell metacharacters reaches TEdenovo.sh as exactly one argument. The seventh argument is the classification output path when classif is "yes", otherwise an empty string. -->
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
26 <command interpreter="bash">
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
27 TEdenovo.sh '$fasta' '$outputfasta' '$classif' '$outputlog' '$outputconfig' '$outputstats'
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
28 #if str( $classif ) == "yes":
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
29 '$outputclassif'
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
30 #else
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
31 ''
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
32 #end if
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
33 </command>
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
34
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
35 <!-- [REQUIRED] Input files and tool parameters -->
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
36 <inputs>
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
37 <param name="fasta" type="data" format="fasta" optional="false" label="Fasta alignment input" />
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
38 <param name="classif" type="select" label="Get classification informations" help="To add the informations at annotation file on next step." >
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
39 <option value="no" selected="true">No</option>
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
40 <option value="yes">Yes</option>
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
41 </param>
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
42 <param name="label" type="text" label="Output name" />
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
43 </inputs>
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
44
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
45 <!-- [REQUIRED] Output files -->
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
46 <outputs>
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
47 <data name="outputlog" type="data" format="txt" label="TEdenovo-#if str($label)=='' then $fasta.name else $label #.log" />
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
48 <data name="outputfasta" type="data" format="fasta" label="TEdenovo-#if str($label)=='' then $fasta.name else $label #.TElib.fa" />
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
49 <data name="outputstats" type="data" format="txt" label="TEdenovo-#if str($label)=='' then $fasta.name else $label #.classif_stats.txt" />
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
50 <data name="outputclassif" type="data" format="tabular" label="TEdenovo-#if str($label)=='' then $fasta.name else $label #.classif" >
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
51 <filter>(classif == 'yes')</filter>
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
52 </data>
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
53 <data name="outputconfig" type="data" format="txt" label="TEdenovo-#if str($label)=='' then $fasta.name else $label #.cfg" />
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
54 </outputs>
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
55
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
56
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
57 <!-- [OPTIONAL] Tests to be run manually by the Galaxy admin -->
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
58 <tests>
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
59 <!-- [HELP] Test files have to be in the ~/test-data directory -->
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
60 <test>
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
61 <param name="fasta" value="DmelChr4Chr3.fa" />
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
62 <output name="outputfasta">
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
63 <assert_contents>
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
64 <has_line_matching expression="^>\w+" />
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
65 <has_line_matching expression="[ACTG]{60}" />
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
66 </assert_contents>
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
67 </output>
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
68 <output name="outputlog">
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
69 <assert_contents>
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
70 <has_line_matching expression="^step 7 finished successfully" />
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
71 <has_line_matching expression="^END time: \d{4}-\d{2}-\d{2} \d{2}:\d{2}:\d{2}" />
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
72 <has_line_matching expression="^Writing fasta file" />
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
73 </assert_contents>
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
74 </output>
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
75 <output name="outputconfig">
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
76 <assert_contents>
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
77 <has_line_matching expression="^project_name: \d{8}" />
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
78 <has_line_matching expression="^repet_version: 2.5" />
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
79 <has_line_matching expression="^tmpDir:" />
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
80 <has_line_matching expression="^clean: yes" />
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
81 </assert_contents>
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
82 </output>
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
83 <output name="outputstats">
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
84 <assert_contents>
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
85 <has_line_matching expression="-------Summary---------" />
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
86 <has_line_matching expression="TOTAL: \d+ \(\d+\.\d+%\)" /> <!-- parentheses and decimal point are escaped so they match literally, e.g. "TOTAL: 10 (100.00%)" -->
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
87 <has_line_matching expression="------NOTES---------" />
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
88 </assert_contents>
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
89 </output>
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
90 </test>
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
91 <test>
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
92 <param name="fasta" value="DmelChr4Chr3.fa" />
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
93 <param name="classif" value="yes" />
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
94 <output name="outputfasta">
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
95 <assert_contents>
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
96 <has_line_matching expression="^>\w+" />
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
97 <has_line_matching expression="[ACTG]{60}" />
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
98 </assert_contents>
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
99 </output>
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
100 <output name="outputlog">
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
101 <assert_contents>
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
102 <has_line_matching expression="^step 7 finished successfully" />
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
103 <has_line_matching expression="^END time: \d{4}-\d{2}-\d{2} \d{2}:\d{2}:\d{2}" />
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
104 <has_line_matching expression="^Writing fasta file" />
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
105 </assert_contents>
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
106 </output>
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
107 <output name="outputconfig">
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
108 <assert_contents>
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
109 <has_line_matching expression="^project_name: \d{8}" />
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
110 <has_line_matching expression="^repet_version: 2.5" />
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
111 <has_line_matching expression="^tmpDir:" />
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
112 <has_line_matching expression="^clean: yes" />
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
113 </assert_contents>
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
114 </output>
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
115 <output name="outputstats">
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
116 <assert_contents>
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
117 <has_line_matching expression="-------Summary---------" />
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
118 <has_line_matching expression="TOTAL: \d+ \(\d+\.\d+%\)" /> <!-- parentheses and decimal point are escaped so they match literally, e.g. "TOTAL: 10 (100.00%)" -->
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
119 <has_line_matching expression="------NOTES---------" />
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
120 </assert_contents>
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
121 </output>
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
122 <output name="outputclassif">
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
123 <assert_contents>
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
124 <has_n_columns n="8" />
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
125 </assert_contents>
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
126 </output>
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
127 </test>
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
128 </tests>
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
129
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
130 <!-- [OPTIONAL] Help displayed in Galaxy -->
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
131 <help>
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
132 <![CDATA[
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
133 .. class:: infomark
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
134
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
135
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
136 **Authors**
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
137 Gwendoline Andres
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
138 Valentin Marcon
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
139 Veronique Jamilloux
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
140 Olivier Inizan
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
141
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
142 ---------------------------------------------------
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
143
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
144 .. class:: infomark
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
145
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
146 **Please cite** If you use this tool, please cite the publications listed in the citations of this tool.
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
147
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
148 ---------------------------------------------------
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
149
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
150 ==============
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
151 TEdenovo Lite
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
152 ==============
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
153
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
154 -----------
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
155 Description
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
156 -----------
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
157 REPET is for detection and annotation of transposable elements (TE). The light version available on Galaxy is specialised in transposable element masking.
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
158 TEdenovo is the first step to constitute a consensus library of TE.
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
159 For a detailed description of each parameter used, please consult the Galaxy page in "Shared Data > Published Pages"
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
160
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
161 -----------------
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
162 Workflow position
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
163 -----------------
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
164
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
165 **Downstream tools**
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
166
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
167 =========== ========================== =======
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
168 Name output file(s) format
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
169 =========== ========================== =======
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
170 TEannot GFF with TE masked gff
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
171 =========== ========================== =======
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
172
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
173
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
174 ----------
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
175 Input file
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
176 ----------
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
177
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
178 Fasta file
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
179 Genome file in FASTA format
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
180
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
181
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
182 ------------
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
183 Output files
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
184 ------------
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
185
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
186 Output_name.fa
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
187 TE library
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
188
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
189 Output_name.log
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
190 Log file showing the progress of each step
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
191
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
192 Output_name.cfg
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
193 File to show which params have been used
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
194
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
195 Output_name.classif_stats.txt
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
196 File with statistics you can visualize
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
197
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
198 Output_name.classif
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
199 If requested, the classification file to pass to the next step (TEannot)
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
200
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
201
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
202 ---------------
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
203 Working example
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
204 ---------------
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
205
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
206 Input files
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
207 ===========
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
208
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
209 Fasta file
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
210 -----------
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
211
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
212 ::
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
213
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
214 >dmel_chr4
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
215 GAATTCGCGTCCGCTTACCCATGTGCCTGTGGATGCCGAACAGGAGGCGCCGTTGACGGC
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
216 GAATGACTTACTCAAGGGAGTAGCCAATCTGTCGGATACGCCCGGATTGGAGCTGCCCAT
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
217 GGAGGGTTCTACAAGAAAGCGGTGGAGGATTGCTCGCATACTGCGAGACCGTTTCTGAAG
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
218 GAGATGGCTCATGGAGTACCTGCCTACGCTTGTGCGCCGCGAGAAGTGGTGAAGAAGAAC
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
219 GGAGCCCATACACCAGGGTGATATGGTCTTCGTCTGCGATCCCGCCTTGCCCCGGCGAGA
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
220 GTGGTGCAAGGGCATCATGGAGGAAGTCTCCAGCAGAGCAGATGGAGCAACGGCCTATAG
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
221 AGGACACTGATGCTACCCGTCTCTAAGCTTGCAGTTTTGGATTTAAGTGAATCGGTTATT
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
222 CACGGGGTCGGGGATGTCGCGGATCGAACGGTGCAATCGATAGGCGTAATCAGTATTTCC
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
223 AGATAGTGATAAGATTTGGTGGATAAATGTGTGCGGGCACACTAATGGCCGCCATCGTAA
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
224 GCCGCGAAAAGCTTAGCGTGCATTGTCGATCGAGAGTTTGGAGGGCAAACTGCGGTAAGA
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
225 TAAGATTAAATAATTTGTACTGAATAATCTTAAAGAATCCTGATGGAAAGCGCCATGCAG
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
226 TCACATATAATATGTGCAGAGCTCTCCTC
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
227
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
228
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
229 Output files
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
230 ============
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
231
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
232 output fasta : TE library
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
233 -------------------------
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
234
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
235 ::
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
236
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
237 >DTX-incomp_20150313101806-B-G1-Map3
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
238 ATACAGCTGCGGTTAAAATAATAGCACTACTGCAGGTGGAAAGTTGATTTCCTAAAAAAA
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
239 ATTATTAAATGTTTATATTTTTTTAAGTCAGATTGCATGAATAATAAGTACCATATGTTG
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
240 GCTCTCTGAGCAAGAAATTTTTAG
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
241 >RLX-incomp_20150313101806-B-R12-Map3_reversed
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
242 ATGATAAGTAGGCAAACTATAAAAATGTTCTATTTATGGGCTGCAATAAACATGTCACCG
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
243 GACAGCATAAGTGGCAACTACAG
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
244
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
245
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
246 output config : .cfg
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
247 --------------------
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
248
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
249 ::
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
250
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
251 [repet_env]
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
252 repet_version: 2.4
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
253 repet_host: ******
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
254 repet_user: ******
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
255
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
256
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
257 output stats : .classif_stats.txt
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
258 ---------------------------------
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
259
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
260 ::
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
261
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
262 LTR incomp: 1 (10.00%)
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
263 LTR total (RLX): 1 (10.00%)
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
264
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
265 ClassI + one order: 1 (10.00%)
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
266 ClassI total (RXX): 1 (10.00%)
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
267
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
268 -------------------------Summary--------------------------------
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
269
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
270 RXX: 1 (10.00%)
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
271 DXX: 9 (90.00%)
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
272 TOTAL: 10 (100.00%)
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
273
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
274 -----------------------------NOTES------------------------------
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
275
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
276
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
277 output classif : Classification file
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
278 ------------------------------------
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
279
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
280 ::
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
281
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
282 DTX-incomp_dataset_370.dat-B-G1-Map3 542 + ok II TIR incomplete CI=37; coding=(TE_BLRtx: TC1_DM:ClassII:TIR:Tc1-Mariner: 32.59%; TE_BLRx: Mariner-1_DAn_1p:ClassII:TIR:Tc1-Mariner: 18.43%); struct=(TElength: <700bps); other=(Other_profiles: PF13936.1_HTH_38_NA_OTHER_27.0: 77.27%(77.27%); SSRCoverage=0.03)
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
283 DTX-comp_dataset_370.dat-B-G8-Map20 1244 + ok II TIR complete CI=50; coding=(TE_BLRtx: PROTOP:ClassII:TIR:P: 12.03%, PROTOP_A:ClassII:TIR:P: 49.14%); struct=(TElength: >1000bps; TermRepeats: termTIR: 50); other=(SSRCoverage=0.25)
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
284
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
285 ]]>
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
286 </help>
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
287
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
288 <citations>
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
289 <citation type="bibtex"><![CDATA[@article{10.1371/journal.pone.0016526,
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
290 author = {Flutre, Timothée AND Duprat, Elodie AND Feuillet, Catherine AND Quesneville, Hadi},
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
291 journal = {PLoS ONE},
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
292 publisher = {Public Library of Science},
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
293 title = {Considering Transposable Element Diversification in <italic>De Novo</italic> Annotation Approaches},
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
294 year = {2011},
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
295 month = {01},
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
296 volume = {6},
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
297 url = {http://dx.doi.org/10.1371%2Fjournal.pone.0016526},
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
298 pages = {e16526},
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
299 abstract = {
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
300 <p>Transposable elements (TEs) are mobile, repetitive DNA sequences that are almost ubiquitous in prokaryotic and eukaryotic genomes. They have a large impact on genome structure, function and evolution. With the recent development of high-throughput sequencing methods, many genome sequences have become available, making possible comparative studies of TE dynamics at an unprecedented scale. Several methods have been proposed for the <italic>de novo</italic> identification of TEs in sequenced genomes. Most begin with the detection of genomic repeats, but the subsequent steps for defining TE families differ. High-quality TE annotations are available for the <italic>Drosophila melanogaster</italic> and <italic>Arabidopsis thaliana</italic> genome sequences, providing a solid basis for the benchmarking of such methods. We compared the performance of specific algorithms for the clustering of interspersed repeats and found that only a particular combination of algorithms detected TE families with good recovery of the reference sequences. We then applied a new procedure for reconciling the different clustering results and classifying TE sequences. The whole approach was implemented in a pipeline using the REPET package. Finally, we show that our combined approach highlights the dynamics of well defined TE families by making it possible to identify structural variations among their copies. This approach makes it possible to annotate TE families and to study their diversification in a single analysis, improving our understanding of TE dynamics at the whole-genome scale and for diverse species.</p>
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
301 },
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
302 number = {1},
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
303 doi = {10.1371/journal.pone.0016526}
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
304 }]]></citation>
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
305 <citation type="bibtex"><![CDATA[@article{10.1371/journal.pone.0094101,
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
306 author = {Maumus, Florian AND Quesneville, Hadi},
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
307 journal = {PLoS ONE},
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
308 publisher = {Public Library of Science},
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
309 title = {Deep Investigation of <italic>Arabidopsis thaliana</italic> Junk DNA Reveals a Continuum between Repetitive Elements and Genomic Dark Matter},
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
310 year = {2014},
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
311 month = {04},
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
312 volume = {9},
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
313 url = {http://dx.doi.org/10.1371%2Fjournal.pone.0094101},
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
314 pages = {e94101},
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
315 abstract = {<p>Eukaryotic genomes contain highly variable amounts of DNA with no apparent function. This so-called junk DNA is composed of two components: repeated and repeat-derived sequences (together referred to as the repeatome), and non-annotated sequences also known as genomic dark matter. Because of their high duplication rates as compared to other genomic features, transposable elements are predominant contributors to the repeatome and the products of their decay is thought to be a major source of genomic dark matter. Determining the origin and composition of junk DNA is thus important to help understanding genome evolution as well as host biology. In this study, we have used a combination of tools enabling to show that the repeatome from the small and reducing <italic>A. thaliana</italic> genome is significantly larger than previously thought. Furthermore, we present the concepts and results from a series of innovative approaches suggesting that a significant amount of the <italic>A. thaliana</italic> dark matter is of repetitive origin. As a tentative standard for the community, we propose a deep compendium annotation of the <italic>A. thaliana</italic> repeatome that may help addressing farther genome evolution as well as transcriptional and epigenetic regulation in this model plant.</p>},
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
316 number = {4},
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
317 doi = {10.1371/journal.pone.0094101}
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
318 }]]></citation>
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
319 </citations>
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
320
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
321
baea09e6722b 1st Uploaded
vmarcon
parents:
diff changeset
322 </tool>