comparison genomescope.xml @ 0:b2f674562a18 draft

"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/genomescope commit aa87b7b1713b749328c5a710f32631aab2acaa3a"
author iuc
date Fri, 30 Apr 2021 20:21:25 +0000
parents
children 3169a38c2656
comparison
equal deleted inserted replaced
-1:000000000000 0:b2f674562a18
1 <tool id="genomescope" name="GenomeScope" version="@VERSION@" profile="20.01">
2 <description>Analyze unassembled short reads</description>
3 <macros>
4 <token name="@VERSION@">2.0</token>
5 </macros>
6 <requirements>
7 <requirement type="package" version="@VERSION@">genomescope2</requirement>
8 </requirements>
9 <version_command>genomescope2 --version</version_command>
10 <command detect_errors="exit_code"><![CDATA[
11 genomescope2
12 --input '$input'
13 --output .
14 --kmer_length $kmer_length
15 $no_unique_sequence $testing $trace_flag
16 #if $ploidy:
17 --ploidy $ploidy
18 #end if
19 #if $lambda:
20 --lambda $lambda
21 #end if
22 #if $max_kmercov:
23 --max_kmercov $max_kmercov
24 #end if
25 #if $topology:
26 --topology $topology
27 #end if
28 #if $initial_repetitiveness:
29 --initial_repetitiveness $initial_repetitiveness
30 #end if
31 #if $initial_heterozygosities:
32 --initial_heterozygosities $initial_heterozygosities
33 #end if
34 #if $transform_exp:
35 --transform_exp $transform_exp
36 #end if
37 #if $true_params:
38 --true_params $true_params
39 #end if
40 #if $num_rounds:
41 --num_rounds $num_rounds
42 #end if
43 ]]>
44 </command>
45 <inputs>
46 <param argument="--input" type="data" format="tabular" label="Input histogram file" help="This file is a two column tabular file for example generated with the histo function of Jellyfish."/>
47 <param name="model_output" type="boolean" label="Add the model parameters to your history"/>
48 <param name="summary_output" type="boolean" label="Output a summary of the analysis"/>
49 <param name="progress_output" type="boolean" label="Additional information for each optimization round"/>
50 <param argument="--ploidy" type="integer" optional="true" label="Ploidy for model to use" help="Default: 2"/>
51 <param argument="--kmer_length" type="integer" value="21" optional="false" label="K-mer length used to calculate k-mer spectra"/>
52 <param argument="--lambda" type="integer" optional="true" label="Optional initial kmercov estimate for model to use"/>
53 <param argument="--max_kmercov" type="integer" optional="true" label="Optional maximum k-mer coverage threshold" help="K-mers with coverage greater than max_kmercov are ignored by the model"/>
54 <param argument="--no_unique_sequence" type="boolean" truevalue="--no_unique_sequence" falsevalue="" label="Turn off yellow unique sequence line in plots"/>
55 <param argument="--topology" type="integer" optional="true" label="Flag for topology for model to use"/>
56 <param argument="--initial_repetitiveness" type="integer" optional="true" label="Initial value for repetitiveness"/>
57 <param argument="--initial_heterozygosities" type="integer" optional="true" label="Initial values for nucleotide heterozygosity rates"/>
58 <param argument="--transform_exp" type="integer" optional="true" label="Parameter for the exponent when fitting a transformed (x**transform_exp*y vs. x) k-mer histogram" help="Default: 1"/>
59 <param argument="--testing" type="boolean" truevalue="--testing" falsevalue="" label="Create testing.tsv file with model parameters"/>
60 <param argument="--true_params" type="integer" optional="true" label="Flag to state true simulated parameters for testing mode"/>
61 <param argument="--trace_flag" type="boolean" truevalue="--trace_flag" falsevalue="" label="Turn on printing of iteration progress of nlsLM function"/>
62 <param argument="--num_rounds" type="integer" min="1" optional="true" label="Number of optimization rounds"/>
63 </inputs>
64 <outputs>
65 <data name="linear_plot" format="png" from_work_dir="linear_plot.png" label="${tool.name} on ${on_string} Linear plot"/>
66 <data name="log_plot" format="png" from_work_dir="log_plot.png" label="${tool.name} on ${on_string} Log plot"/>
67 <data name="transformed_linear_plot" format="png" from_work_dir="transformed_linear_plot.png" label="${tool.name} on ${on_string} Transformed linear plot"/>
68 <data name="transformed_log_plot" format="png" from_work_dir="transformed_log_plot.png" label="${tool.name} on ${on_string} Transformed log plot"/>
69 <data name="model" format="txt" from_work_dir="model.txt" label="${tool.name} on ${on_string} Model">
70 <filter>model_output</filter>
71 </data>
72 <data name="summary" format="txt" from_work_dir="summary.txt" label="${tool.name} on ${on_string} Summary">
73 <filter>summary_output</filter>
74 </data>
75 <data name="progress" format="txt" from_work_dir="progress.txt" label="${tool.name} on ${on_string} Progress">
76 <filter>progress_output</filter>
77 </data>
78 <data name="model_params" format="tabular" from_work_dir="SIMULATED_testing.tsv" label="${tool.name} on ${on_string} Model parameters">
79 <filter>testing</filter>
80 </data>
81 </outputs>
82 <tests>
83 <test expect_num_outputs="8">
84 <param name="input" value="genomescope-in1.tab"/>
85 <param name="kmer_length" value="21"/>
86 <param name="testing" value="true"/>
87 <param name="model_output" value="true"/>
88 <param name="summary_output" value="true"/>
89 <param name="progress_output" value="true"/>
90 <output name="linear_plot" file="genomescope-out1-1.png" ftype="png"/>
91 <output name="log_plot" file="genomescope-out1-2.png" ftype="png"/>
92 <output name="transformed_linear_plot" file="genomescope-out1-3.png" ftype="png"/>
93 <output name="transformed_log_plot" file="genomescope-out1-4.png" ftype="png" compare="sim_size"/>
94 <output name="model" file="genomescope-out1-1.txt" ftype="txt" lines_diff="2"/>
95 <output name="summary" file="genomescope-out1-2.txt" ftype="txt" lines_diff="2"/>
96 <output name="progress" file="genomescope-out1-3.txt" ftype="txt" lines_diff="2"/>
97 <output name="testing" file="genomescope-out1-1.tab" ftype="tabular"/>
98 </test>
99 </tests>
100 <help><![CDATA[
101
102 GenomeScope 2.0: Reference-free profiling of polyploid genomes
103 ==============================================================
104
105 GenomeScope 2.0 applies classical insights from combinatorial theory to establish
106 a detailed mathematical model of how k-mer frequencies will be distributed in
107 heterozygous and polyploid genomes. GenomeScope 2.0 employs a polyploid-aware
108 mixture model that, within seconds, accurately infers genome properties from
109 unassembled sequencing data. GenomeScope 2.0 uses the k-mer count distribution,
110 e.g. from KMC or Jellyfish, and produces a report and several informative plots
111 describing the genome properties. We validate the approach on simulated polyploid
112 data created using a generative model with parameters for genome size, heterozygosity,
113 repetitiveness, ploidy, and sequencing coverage, and find GenomeScope 2.0 retains
114 accuracy across a broad range of realistic and extreme parameter values. We also
115 validate GenomeScope 2.0 by analyzing genuine sequence data from 11 diverse
116 polyploid genomes with known genome characteristics.
117
118 ]]></help>
119 <citations>
120 <citation type="doi">10.1093/bioinformatics/btx153</citation>
121 <citation type="doi">10.1038/s41467-020-14998-3</citation>
122 </citations>
123 </tool>