Mercurial > repos > iuc > genomescope
comparison genomescope.xml @ 0:b2f674562a18 draft
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/genomescope commit aa87b7b1713b749328c5a710f32631aab2acaa3a"
author | iuc |
---|---|
date | Fri, 30 Apr 2021 20:21:25 +0000 |
parents | |
children | 3169a38c2656 |
comparison
equal
deleted
inserted
replaced
-1:000000000000 | 0:b2f674562a18 |
---|---|
1 <tool id="genomescope" name="GenomeScope" version="@VERSION@" profile="20.01"> | |
2 <description>Analyze unassembled short reads</description> | |
3 <macros> | |
4 <token name="@VERSION@">2.0</token> | |
5 </macros> | |
6 <requirements> | |
7 <requirement type="package" version="@VERSION@">genomescope2</requirement> | |
8 </requirements> | |
9 <version_command>genomescope2 --version</version_command> | |
10 <command detect_errors="exit_code"><![CDATA[ | |
11 genomescope2 | |
12 --input '$input' | |
13 --output . | |
14 --kmer_length $kmer_length | |
15 $no_unique_sequence $testing $trace_flag | |
16 #if $ploidy: | |
17 --ploidy $ploidy | |
18 #end if | |
19 #if $lambda: | |
20 --lambda $lambda | |
21 #end if | |
22 #if $max_kmercov: | |
23 --max_kmercov $max_kmercov | |
24 #end if | |
25 #if $topology: | |
26 --topology $topology | |
27 #end if | |
28 #if $initial_repetitiveness: | |
29 --initial_repetitiveness $initial_repetitiveness | |
30 #end if | |
31 #if $initial_heterozygosities: | |
32 --initial_heterozygosities $initial_heterozygosities | |
33 #end if | |
34 #if $transform_exp: | |
35 --transform_exp $transform_exp | |
36 #end if | |
37 #if $true_params: | |
38 --true_params $true_params | |
39 #end if | |
40 #if $num_rounds: | |
41 --num_rounds $num_rounds | |
42 #end if | |
43 ]]> | |
44 </command> | |
45 <inputs> | |
46 <param argument="--input" type="data" format="tabular" label="Input histogram file" help="This file is a two column tabular file for example generated with the histo function of Jellyfish."/> | |
47 <param name="model_output" type="boolean" label="Add the model parameters to your history"/> | |
48 <param name="summary_output" type="boolean" label="Output a summary of the analysis"/> | |
49 <param name="progress_output" type="boolean" label="Additional information for each optimization round"/> | |
50 <param argument="--ploidy" type="integer" optional="true" label="Ploidy for model to use" help="Default: 2"/> | |
51 <param argument="--kmer_length" type="integer" value="21" optional="false" label="K-mer length used to calculate k-mer spectra"/> | |
52 <param argument="--lambda" type="integer" optional="true" label="Optional initial kmercov estimate for model to use"/> | |
53 <param argument="--max_kmercov" type="integer" optional="true" label="Optional maximum k-mer coverage threshold" help="K-mers with coverage greater than max_kmercov are ignored by the model"/> | |
54 <param argument="--no_unique_sequence" type="boolean" truevalue="--no_unique_sequence" falsevalue="" label="Turn off yellow unique sequence line in plots"/> | |
55 <param argument="--topology" type="integer" optional="true" label="Flag for topology for model to use"/> | |
56 <param argument="--initial_repetitiveness" type="integer" optional="true" label="Initial value for repetitiveness"/> | |
57 <param argument="--initial_heterozygosities" type="integer" optional="true" label="Initial values for nucleotide heterozygosity rates"/> | |
58 <param argument="--transform_exp" type="integer" optional="true" label="Parameter for the exponent when fitting a transformed (x**transform_exp*y vs. x) k-mer histogram" help="Default: 1"/> | |
59 <param argument="--testing" type="boolean" truevalue="--testing" falsevalue="" label="Create testing.tsv file with model parameters"/> | |
60 <param argument="--true_params" type="integer" optional="true" label="Flag to state true simulated parameters for testing mode"/> | |
61 <param argument="--trace_flag" type="boolean" truevalue="--trace_flag" falsevalue="" label="Turn on printing of iteration progress of nlsLM function"/> | |
62 <param argument="--num_rounds" type="integer" min="1" optional="true" label="Number of optimization rounds"/> | |
63 </inputs> | |
64 <outputs> | |
65 <data name="linear_plot" format="png" from_work_dir="linear_plot.png" label="${tool.name} on ${on_string} Linear plot"/> | |
66 <data name="log_plot" format="png" from_work_dir="log_plot.png" label="${tool.name} on ${on_string} Log plot"/> | |
67 <data name="transformed_linear_plot" format="png" from_work_dir="transformed_linear_plot.png" label="${tool.name} on ${on_string} Transformed linear plot"/> | |
68 <data name="transformed_log_plot" format="png" from_work_dir="transformed_log_plot.png" label="${tool.name} on ${on_string} Transformed log plot"/> | |
69 <data name="model" format="txt" from_work_dir="model.txt" label="${tool.name} on ${on_string} Model"> | |
70 <filter>model_output</filter> | |
71 </data> | |
72 <data name="summary" format="txt" from_work_dir="summary.txt" label="${tool.name} on ${on_string} Summary"> | |
73 <filter>summary_output</filter> | |
74 </data> | |
75 <data name="progress" format="txt" from_work_dir="progress.txt" label="${tool.name} on ${on_string} Progress"> | |
76 <filter>progress_output</filter> | |
77 </data> | |
78 <data name="model_params" format="tabular" from_work_dir="SIMULATED_testing.tsv" label="${tool.name} on ${on_string} Model parameters"> | |
79 <filter>testing</filter> | |
80 </data> | |
81 </outputs> | |
82 <tests> | |
83 <test expect_num_outputs="8"> | |
84 <param name="input" value="genomescope-in1.tab"/> | |
85 <param name="kmer_length" value="21"/> | |
86 <param name="testing" value="true"/> | |
87 <param name="model_output" value="true"/> | |
88 <param name="summary_output" value="true"/> | |
89 <param name="progress_output" value="true"/> | |
90 <output name="linear_plot" file="genomescope-out1-1.png" ftype="png"/> | |
91 <output name="log_plot" file="genomescope-out1-2.png" ftype="png"/> | |
92 <output name="transformed_linear_plot" file="genomescope-out1-3.png" ftype="png"/> | |
93 <output name="transformed_log_plot" file="genomescope-out1-4.png" ftype="png" compare="sim_size"/> | |
94 <output name="model" file="genomescope-out1-1.txt" ftype="txt" lines_diff="2"/> | |
95 <output name="summary" file="genomescope-out1-2.txt" ftype="txt" lines_diff="2"/> | |
96 <output name="progress" file="genomescope-out1-3.txt" ftype="txt" lines_diff="2"/> | |
97 <output name="testing" file="genomescope-out1-1.tab" ftype="tabular"/> | |
98 </test> | |
99 </tests> | |
100 <help><![CDATA[ | |
101 | |
102 GenomeScope 2.0: Reference-free profiling of polyploid genomes | |
103 ============================================================== | |
104 | |
105 GenomeScope 2.0 applies classical insights from combinatorial theory to establish | |
106 a detailed mathematical model of how k-mer frequencies will be distributed in | |
107 heterozygous and polyploid genomes. GenomeScope 2.0 employs a polyploid-aware | |
108 mixture model that, within seconds, accurately infers genome properties from | |
109 unassembled sequencing data. GenomeScope 2.0 uses the k-mer count distribution, | |
110 e.g. from KMC or Jellyfish, and produces a report and several informative plots | |
111 describing the genome properties. We validate the approach on simulated polyploid | |
112 data created using a generative model with parameters for genome size, heterozygosity, | |
113 repetitiveness, ploidy, and sequencing coverage, and find GenomeScope 2.0 retains | |
114 accuracy across a broad range of realistic and extreme parameter values. We also | |
115 validate GenomeScope 2.0 by analyzing genuine sequence data from 11 diverse | |
116 polyploid genomes with known genome characteristics. | |
117 | |
118 ]]></help> | |
119 <citations> | |
120 <citation type="doi">10.1093/bioinformatics/btx153</citation> | |
121 <citation type="doi">10.1038/s41467-020-14998-3</citation> | |
122 </citations> | |
123 </tool> |