Mercurial > repos > petr-novak > repeat_annotation_pipeline3
annotate format_repeat_library.xml @ 12:755a4d643184 draft default tip
planemo upload commit a61591d548f42ff417781e7fe7418dc2901ccc23
author | petr-novak |
---|---|
date | Tue, 26 Sep 2023 07:28:04 +0000 |
parents | 5366d5ea04bc |
children |
rev | line source |
---|---|
0 | 1 <tool id="annotate_contigs" name="Format Repeat Library" version="0.1.0" python_template_version="3.5"> |
<!-- Runtime dependency of the tool: the bioconductor-biostrings package, pinned to version 2.60.0. -->
2 <requirements> | |
3 <requirement type="package" version="2.60.0">bioconductor-biostrings</requirement> | |
4 </requirements> | |
11
5366d5ea04bc
planemo upload commit 9d1b19f98d8b7f0a0d1baf2da63a373d155626f8-dirty
petr-novak
parents:
0
diff
changeset
|
<!-- Declares annotate_contigs.R, the script the command section runs from the tool directory, as a file this tool needs. NOTE(review): presumably this lets Galaxy ship the script with the job; confirm against the Galaxy tool schema. -->
5 <required_files> |
5366d5ea04bc
planemo upload commit 9d1b19f98d8b7f0a0d1baf2da63a373d155626f8-dirty
petr-novak
parents:
0
diff
changeset
|
6 <include type="literal" path="annotate_contigs.R"/> |
5366d5ea04bc
planemo upload commit 9d1b19f98d8b7f0a0d1baf2da63a373d155626f8-dirty
petr-novak
parents:
0
diff
changeset
|
7 </required_files> |
<!-- Runs annotate_contigs.R with three positional arguments: contigs FASTA, CLUSTER_TABLE, and the output path. Every argument, including the script path built from the tool directory, is single-quoted so that paths containing spaces or shell metacharacters reach Rscript as one word. A non-zero exit code marks the job as failed. -->
0 | 8 <command detect_errors="exit_code"><![CDATA[ |
11
5366d5ea04bc
planemo upload commit 9d1b19f98d8b7f0a0d1baf2da63a373d155626f8-dirty
petr-novak
parents:
0
diff
changeset
|
9 Rscript '$__tool_directory__/annotate_contigs.R' '$contigs' '$cluster_table' '$annotated_contigs' |
0 | 10 ]]></command> |
<!-- Two input datasets: "contigs" (fasta) and "cluster_table" (txt). The command section passes them to annotate_contigs.R as its first and second arguments. -->
11 <inputs> | |
12 <param type="data" name="contigs" format="fasta" label="Contigs - Library of Repeats from TAREAN/RepeatExplorer pipeline" /> | |
13 <param type="data" name="cluster_table" format="txt" label="CLUSTER_TABLE from RepeatExplorer pipeline" help="CLUSTER_TABLE which contain annotation of clusters from RepeatExplorer pipeline"/> | |
14 </inputs> | |
<!-- Single fasta output, "annotated_contigs". Its path is the third argument given to annotate_contigs.R, and its history label cites the hid of both input datasets. -->
15 <outputs> | |
16 <data name="annotated_contigs" format="fasta" label="Annotated Repeat Library based on ${contigs.hid} and ${cluster_table.hid}" /> | |
17 </outputs> | |
18 <help><![CDATA[ | |
19 **What this tool does** | |
20 | |
21 Contigs from RepeatExplorer archive are annotated based on the classification of repeats from cluster_table. | |
22 | |
23 Preformatted CLUSTER_TABLE can be extracted from the RepeatExplorer archive and modified accordingly. By default, the "Final_annotation" column is used to append annotation to contigs in the repeat library (based on the cluster id). If the "Final_annotation" column is incomplete, the "Automatic_annotation" column is used instead. | |
24 | |
25 Example of tab delimited CLUSTER_TABLE:: | |
26 | |
27 | |
28 "Number_of_reads_in_clusters" 3886 | |
29 "Number_of_clusters" 822 | |
30 "Number_of_superclusters" 821 | |
31 "Number_of_singlets" 6114 | |
32 "Number_of_analyzed_reads" 10000 | |
33 | |
34 "Cluster" "Supercluster" "Size" "Size_adjusted" "Automatic_annotation" "TAREAN_annotation" "Final_annotation" | |
35 1 1 260 260 "All/repeat/satellite" "Putative satellites (low confidence)" "" | |
36 2 2 157 157 "All/repeat/satellite" "Putative satellites (low confidence)" "" | |
37 3 4 100 100 "All" "Other" "" | |
38 4 5 83 83 "All" "Other" "" | |
39 5 3 77 77 "All" "Other" "" | |
40 6 3 65 65 "All" "Other" "" | |
41 7 6 61 61 "All" "Other" "" | |
42 8 7 58 58 "All" "Other" "" | |
43 9 8 53 53 "All" "Other" "" | |
44 10 9 53 53 "All" "Other" "" | |
45 11 10 51 51 "All" "Other" "" | |
46 12 11 45 45 "All" "Other" "" | |
47 13 12 44 44 "All" "Other" "" | |
48 14 13 44 44 "All" "Other" "" | |
49 15 14 39 39 "All" "Other" "" | |
50 16 15 37 37 "All" "Other" "" | |
51 17 16 30 30 "All/repeat/satellite" "Putative satellites (low confidence)" "" | |
52 18 17 28 28 "All/repeat/satellite" "Putative satellites (low confidence)" "" | |
53 19 18 26 26 "All/repeat/satellite" "Putative satellites (high confidence)" "" | |
54 20 19 23 23 "All/repeat/../CRM" "Other" "" | |
55 21 20 21 21 "All" "Other" "" | |
56 22 21 21 21 "All" "Other" "" | |
57 23 22 21 21 "All" "Other" "" | |
58 24 23 21 21 "All" "Other" "" | |
59 25 24 20 20 "All/repeat/../Ogre" "Other" "" | |
60 | |
61 | |
62 Only the Cluster and Automatic_annotation/Final_annotation columns are mandatory. | |
63 | |
64 Clusters with a higher number than those listed in CLUSTER_TABLE are removed from the repeat library. | |
65 | |
11
5366d5ea04bc
planemo upload commit 9d1b19f98d8b7f0a0d1baf2da63a373d155626f8-dirty
petr-novak
parents:
0
diff
changeset
|
66 Contigs are provided in the following format:: |
0 | 67 |
68 | |
69 >CL25Contig1 | |
70 AGATCAAGATGGCGCCGGAGGACATGGAGAAAACGACGTTTATCACTCCCTGGGGAACATTTTGCTACAAGGTAATGCCT | |
71 TTCGGTCTGAAGAACGCAGGGGCCACTTACCAACGAGCAATGGTAACTT | |
72 >CL1Contig4#All/repeat/satellite | |
73 ACCCGAAGGCCGGCTCAACCCGAAGTTGAGAAGAACATCTGACCTCGCCGTCAGGCATCTGTTAAACAAACAGGCATCGA | |
74 A | |
75 >CL1Contig5 | |
76 TGAGAAGAACATCTGACCTCGCCGTCAGGCATCTGTTAAACAAACAGGCATCGAACCCGAAGGCCGGCTCAACCCGAAGT | |
77 TGATAAGAACATCTGACCTCGCCGTCAGGCATCTGTTAAACAAACAGGCATCGAACCCGAAGGCCGGCTCAACACGAAGT | |
78 TGAGAGGAACATCTGACCTCGCCGTCAGGCATCTGTTAAA | |
79 | |
80 | |
81 The resulting repeat library will have the following format:: | |
82 | |
83 >CL25Contig1#All/repeat/mobile_element/Class_I/LTR/Ty3_gypsy/non-chromovirus/OTA/Tat/Ogre | |
84 AGATCAAGATGGCGCCGGAGGACATGGAGAAAACGACGTTTATCACTCCCTGGGGAACATTTTGCTACAAGGTAATGCCT | |
85 TTCGGTCTGAAGAACGCAGGGGCCACTTACCAACGAGCAATGGTAACTT | |
86 >CL1Contig4#All/repeat/satellite | |
87 ACCCGAAGGCCGGCTCAACCCGAAGTTGAGAAGAACATCTGACCTCGCCGTCAGGCATCTGTTAAACAAACAGGCATCGA | |
88 A | |
89 >CL1Contig5#All/repeat/satellite | |
90 TGAGAAGAACATCTGACCTCGCCGTCAGGCATCTGTTAAACAAACAGGCATCGAACCCGAAGGCCGGCTCAACCCGAAGT | |
91 TGATAAGAACATCTGACCTCGCCGTCAGGCATCTGTTAAACAAACAGGCATCGAACCCGAAGGCCGGCTCAACACGAAGT | |
92 TGAGAGGAACATCTGACCTCGCCGTCAGGCATCTGTTAAA | |
93 | |
94 | |
95 | |
96 | |
97 ]]></help> | |
98 </tool> |