comparison links.xml @ 0:7acd9ade2dd1 draft default tip

"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/links commit f15e5bb67b7a212ecd8c98e816c80e22d3b7a0cb"
author iuc
date Wed, 23 Feb 2022 08:25:55 +0000
parents
children
comparison
equal deleted inserted replaced
-1:000000000000 0:7acd9ade2dd1
1 <tool id="links" name="LINKS" version="@TOOL_VERSION@+galaxy+@VERSION_SUFFIX@" python_template_version="3.5" profile="20.09">
2 <description> - scaffold genome assemblies with long reads</description>
3 <xrefs>
4 <xref type="bio.tools">links</xref>
5 </xrefs>
6 <macros>
7 <token name="@TOOL_VERSION@">2.0.1</token>
8 <token name="@VERSION_SUFFIX@">1</token>
9 </macros>
10 <requirements>
11 <requirement type="package" version="@TOOL_VERSION@">links</requirement>
12 </requirements>
13 <version_command><![CDATA[
14 LINKS | grep "LINKS v" | cut -d' ' -f4
15 ]]></version_command>
16 <command detect_errors="exit_code"><![CDATA[
17
18 ## set up file paths
19
20 #set sequences_fn = 'sequences.' + $f.ext
21 ln -s '$f' '$sequences_fn'
22 &&
23 #for $n, $read in enumerate($reads):
24 #set read_fn = 'reads' + str($n) + '.' + $read.ext
25 ln -s '$read' '$read_fn'
26 &&
27 printf '%s\n' '$read_fn' >> reads.fof
28 &&
29 #end for
30
31 ## RUN LINKS
32
33 LINKS
34 -f '$sequences_fn'
35 -s reads.fof
36 -b links_output
37
38 #if str($scaffolding.k):
39 -k '$scaffolding.k'
40 #end if
41
42 #if str($scaffolding.d):
43 -d '$scaffolding.d'
44 #end if
45
46 #if str($scaffolding.t):
47 -t '$scaffolding.t'
48 #end if
49
50 #if str($advanced.a):
51 -a '$advanced.a'
52 #end if
53
54 #if str($advanced.e):
55 -e '$advanced.e'
56 #end if
57
58 #if str($advanced.o):
59 -o '$advanced.o'
60 #end if
61
62 #if str($advanced.l):
63 -l '$advanced.l'
64 #end if
65
66 #if str($advanced.z):
67 -z '$advanced.z'
68 #end if
69
70 #if str($advanced.p):
71 -p '$advanced.p'
72 #end if
73
74 ]]></command>
75 <inputs>
76 <param argument="-f" type="data" format="fasta,fasta.gz" label="Contigs" help="Sequences to scaffold" />
77 <param name="reads" type="data" format="fasta,fasta.gz,fastq,fastq.gz" label="Reads" help="Long sequence reads for scaffolding" multiple="true" />
78 <section name="scaffolding" title="Scaffolding options" expanded="False">
79 <param argument="-k" type="integer" value="15" optional="true" label="k-mer length" />
80 <param argument="-d" type="text" value="4000" optional="true" label="Distance" help="Distance between k-mer pairs. Multiple distances are separated by comma, e.g. 500,1000,2000,3000"/>
81 <param argument="-t" type="text" value="2" optional="true" label="Step" help="Step of sliding window when extracting k-mer pairs from long reads. Multiple steps are separated by comma, e.g. 10,5" />
82 </section>
83 <section name="advanced" title="Advanced options" expanded="False">
84 <param argument="-a" type="float" value="0.3" optional="true" label="Maximum link ratio" help="Maximum link ratio between two best contig pairs. Higher values lead to least accurate scaffolding" />
85 <param argument="-e" type="float" value="0.1" optional="true" label="Error" help="Error (%) allowed on -d distance"/>
86 <param argument="-l" type="integer" value="5" optional="true" label="Number of links" help="Minimum number of links (k-mer pairs) to compute
87 scaffold"/>
88 <param argument="-o" type="integer" value="0" optional="true" label="Offset" help="Offset position for extracting k-mer pairs"/>
89 <param argument="-p" type="float" value="0.001" optional="true" label="Bloom filter false positive rate" help="Increase to prevent memory allocation errors"/>
90 <param argument="-z" type="integer" value="500" optional="true" label="Minimum contig length" help="Minimum contig length to consider for scaffolding"/>
91 </section>
92 </inputs>
93 <outputs>
94 <data name="scaffolds" format="fasta" from_work_dir="links_output.scaffolds.fa" label="${tool.name} on ${on_string} (scaffolds)" />
95 <data name="correspondence" format="tabular" from_work_dir="links_output.assembly_correspondence.tsv" label="${tool.name} on ${on_string} (Correspondence file)" />
96 <data name="gv" format="graph_dot" from_work_dir="links_output.gv" label="${tool.name} on ${on_string} (Graph)" />
97 </outputs>
98 <tests>
99 <!-- Basic test -->
100 <test>
101 <param name="f" value="used_contigs.fasta.gz"/>
102 <param name="reads" value="reads.fasta.gz"/>
103 <output name="scaffolds" ftype="fasta" file="single_readfile.scaffolds.fa"/>
104 <output name="correspondence" ftype="tabular" file="single_readfile.assembly_correspondence.tsv"/>
105 <output name="gv">
106 <assert_contents>
107 <has_text text="node [shape = circle]" />
108 </assert_contents>
109 </output>
110 </test>
111 <!-- Test multiple readfile input -->
112 <test>
113 <param name="f" value="used_contigs.fasta.gz"/>
114 <param name="reads" value="reads1.fasta.gz,reads2.fasta.gz"/>
115 <output name="scaffolds" ftype="fasta" file="multi_readfile.scaffolds.fa"/>
116 <output name="correspondence" ftype="tabular" file="multi_readfile.assembly_correspondence.tsv"/>
117 </test>
118 <!-- Test scaffolding parameters -->
119 <test>
120 <param name="f" value="used_contigs.fasta.gz"/>
121 <param name="reads" value="reads.fasta.gz"/>
122 <param name="k" value="19" />
123 <param name="d" value="500,1000,2000,3000" />
124 <param name="t" value="10,5" />
125 <output name="scaffolds" ftype="fasta" file="scaffolding.scaffolds.fa"/>
126 <output name="correspondence" ftype="tabular" file="scaffolding.assembly_correspondence.tsv"/>
127 </test>
128 <!-- Test advanced parameters -->
129 <test>
130 <param name="f" value="used_contigs.fasta.gz"/>
131 <param name="reads" value="reads.fasta.gz"/>
132 <output name="scaffolds" ftype="fasta" file="advanced.scaffolds.fa"/>
133 <param name="a" value="0.2" />
134 <param name="e" value="0.05" />
135 <param name="l" value="10" />
136 <param name="o" value="1" />
137 <param name="z" value="600" />
138 <output name="scaffolds" ftype="fasta" file="advanced.scaffolds.fa"/>
139 <output name="correspondence" ftype="tabular" file="advanced.assembly_correspondence.tsv"/>
140 </test>
141 </tests>
142 <help><![CDATA[
143
144 .. figure:: https://github.com/warrenlr/links/raw/master/links-logo.png
145 :alt: links-logo
146 :width: 200px
147
148 `LINKS <https://github.com/bcgsc/LINKS>`__ is a genomics application for
149 scaffolding genome assemblies with long reads, such as those produced by
150 Oxford Nanopore Technologies Ltd. It can be used to scaffold
151 high-quality draft genome assemblies with any long sequences (eg. ONT
152 reads, PacBio reads, other draft genomes, etc).
153
154 **Input**:
155
156 **LINKS does not use quality information in the Reads, so it is
157 recommended to filter the long reads first**.
158
159 Provide a ``fasta`` or ``fasta.gz`` dataset containing the Contigs, and
160 a ``fastq``, ``fastq.gz``, ``fasta`` or ``fasta.gz`` dataset of Reads to
161 be used for scaffolding.
162
163 **Use cases**:
164
165 - *Use long reads to scaffold a draft assembly* by providing the draft
166 assembly to the Contigs parameter and the long reads to the Reads
167 parameter.
168 - *Use a reference assembly to scaffold a draft assembly* by providing
169 the reference assembly to the Reads parameter. For example, you could
170 use a species’s reference genome to scaffold a genome that was
171 assembled for another individual.
172
173 **How it works**:
174
175 LINKS uses *k*-mer pairs from the Reads to identify candidate pairs of
176 Contigs, then uses the number of spanning *k*-mer pairs and the mean
177 distance between them to build scaffolds.
178
179 You can control the distance between *k*-mer pairs, the length of the
180 *k*-mers and the minimum number of *k*-mer pairs between contigs. See
181 the `LINKS readme on
182 GitHub <https://github.com/bcgsc/LINKS#how-it-works>`__ for information
183 on setting advanced parameters.
184
185
186
187 ]]></help>
188 <citations>
189 <citation type="doi">10.1186/s13742-015-0076-3</citation>
190 </citations>
191 </tool>