Mercurial > repos > csbl > repeatmodeler
comparison repeatmodeler.xml @ 0:4f0c878b36d4 draft
"planemo upload commit 5c6a5c0f9aacbc7def652b33cc35ee37aa543d05-dirty"
author | csbl |
---|---|
date | Tue, 24 Nov 2020 04:14:46 +0000 |
parents | |
children | dda44fd49bcd |
comparison
equal
deleted
inserted
replaced
-1:000000000000 | 0:4f0c878b36d4 |
---|---|
1 <tool id="repeatmodeler" name="RepeatModeler - Model repetitive DNA" version="0.1.0" python_template_version="3.5"> | |
2 <requirements> | |
3 <requirement type="package" version="2.0.1">repeatmodeler</requirement> | |
4 </requirements> | |
5 <command detect_errors="exit_code"><![CDATA[ | |
6 BuildDatabase -name '$name' '$input_file' && RepeatModeler -database '$name' -pa '$pa' && cp '$name'-families.fa '$output' | |
7 ]]></command> | |
8 <inputs> | |
9 <param type="data" name="input_file" format="fasta" label="Input genome fasta"/> | |
10 <param argument="-name" type="text" value="" label="Title for building database" /> | |
11 <param argument="-pa" type="text" value="" label="Numer of paralleled job: # of nodes" /> | |
12 </inputs> | |
13 <outputs> | |
14 <!-- <data format="fasta" name="RepeatModels" from_work_dir="*-families.fa" label="${tool.name} on ${on_string}: RepeatModels::FASTA" /> --> | |
15 <!-- <data format="txt" name="StockholmFormat" from_work_dir="*-families.stk" label="${tool.name} on ${on_string}: RepeatModels::StockholmFormat" /> --> | |
16 <data format="fasta" name="output" label="${tool.name} on ${on_string}: RepeatModels::FASTA" /> | |
17 </outputs> | |
18 <tests> | |
19 <test> | |
20 <param name="input_file" value="eco.fasta" ftype="fasta"/> | |
21 <param name="name" value="eco" /> | |
22 <param name="pa" value="4" /> | |
23 <output name="output" file="consensi.fa.classified" compare="sim_size" delta_frac="0.1" /> | |
24 </test> | |
25 </tests> | |
26 <help><![CDATA[ | |
27 RepeatModeler - 2.0.1 | |
28 | |
29 NAME | |
30 RepeatModeler - Model repetitive DNA | |
31 | |
32 SYNOPSIS | |
33 RepeatModeler [-options] -database <XDF Database> | |
34 | |
35 DESCRIPTION | |
36 The options are: | |
37 | |
38 -h(elp) | |
39 Detailed help | |
40 | |
41 -database <DBNAME> | |
42 The name of the sequence database to run an analysis on. This is the | |
43 name that was provided to the BuildDatabase script using the "-name" | |
44 option. | |
45 | |
46 -pa # | |
47 Specify the number of parallel search jobs to run. RMBlast jobs will | |
48 use 4 cores each and ABBlast jobs will use a single core each. i.e. | |
49 on a machine with 12 cores and running with RMBlast you would use | |
50 -pa 3 to fully utilize the machine. | |
51 | |
52 -recoverDir <Previous Output Directory> | |
53 If a run fails in the middle of processing, it may be possible | |
54 recover some results and continue where the previous run left off. | |
55 Simply supply the output directory where the results of the failed | |
56 run were saved and the program will attempt to recover and continue | |
57 the run. | |
58 | |
59 -srand # | |
60 Optionally set the seed of the random number generator to a known | |
61 value before the batches are randomly selected ( using Fisher Yates | |
62 Shuffling ). This is only useful if you need to reproduce the sample | |
63 choice between runs. This should be an integer number. | |
64 | |
65 -LTRStruct [optional] | |
66 Run the LTR structural discovery pipeline ( LTR_Harvest and | |
67 LTR_retreiver ) and combine results with the RepeatScout/RECON | |
68 pipeline. [optional] | |
69 | |
70 -genomeSampleSizeMax # | |
71 Optionally change the maximum bp of the genome to sample in all | |
72 rounds of RECON (default=243000000). | |
73 | |
74 CONFIGURATION OVERRIDES | |
75 -ltr_retriever_dir <string> | |
76 The path to the installation of the LTR_Retriever structural LTR | |
77 analysis package. | |
78 | |
79 -rmblast_dir <string> | |
80 The path to the installation of the RMBLAST sequence alignment | |
81 program. | |
82 | |
83 -repeatmasker_dir <string> | |
84 The path to the installation of RepeatMasker. | |
85 | |
86 -trf_prgm <string> | |
87 The full path including the name for the TRF program ( 4.0.9 or | |
88 higher ) | |
89 | |
90 -ninja_dir <string> | |
91 The path to the installation of the Ninja phylogenetic analysis | |
92 package. | |
93 | |
94 -recon_dir <string> | |
95 The path to the installation of the RECON de-novo repeatfinding | |
96 program. | |
97 | |
98 -genometools_dir <string> | |
99 The path to the installation of the GenomeTools package. | |
100 | |
101 -abblast_dir <string> | |
102 The path to the installation of the ABBLAST sequence alignment | |
103 program. | |
104 | |
105 -rscout_dir <string> | |
106 The path to the installation of the RepeatScout ( 1.0.6 or higher ) | |
107 de-novo repeatfinding program. | |
108 | |
109 -mafft_dir <string> | |
110 The path to the installation of the MAFFT multiple alignment | |
111 program. | |
112 | |
113 -cdhit_dir <string> | |
114 The path to the installation of the CD-Hit sequence clustering | |
115 package. | |
116 | |
117 SEE ALSO | |
118 RepeatMasker, RMBlast | |
119 | |
120 COPYRIGHT | |
121 Copyright 2005-2019 Institute for Systems Biology | |
122 | |
123 AUTHOR | |
124 RepeatModeler: | |
125 Robert Hubley <rhubley@systemsbiology.org> | |
126 Arian Smit <asmit@systemsbiology.org> | |
127 | |
128 LTR Pipeline Extensions: | |
129 Jullien Michelle Flynn <jmf422@cornell.edu> | |
130 ]]></help> | |
131 <citations> | |
132 <citation type="doi">10.1073/pnas.1921046117</citation> | |
133 <citation type="doi">10.1186/s13059-018-1577-z</citation> | |
134 </citations> | |
135 </tool> |