annotate trycycler_cluster.xml @ 6:ed2425b9fd27 draft

planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e9abd8b86133e530d0395d85bca320a1af27a9b6
author iuc
date Tue, 02 Apr 2024 08:30:22 +0000
parents 189e837009c9
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
1
189e837009c9 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents: 0
diff changeset
1 <tool id='trycycler_cluster' name='Trycycler cluster' version='@TOOL_VERSION@' profile='20.01'>
0
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
2 <description>cluster the contigs of your input assemblies into per-replicon groups</description>
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
3 <macros>
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
4 <import>macros.xml</import>
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
5 </macros>
1
189e837009c9 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents: 0
diff changeset
6 <expand macro='edam_ontology' />
189e837009c9 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents: 0
diff changeset
7 <expand macro='requirements' />
0
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
8 <version_command>trycycler --version</version_command>
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
9 <command detect_errors='exit_code'><![CDATA[
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
10 #import re
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
11 mkdir -p initial_clusters assemblies &&
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
12 #for $input_file in $assemblies
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
13 #set $name = re.sub('[^\w\-\.]', '_', str($input_file.element_identifier))
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
14 ln -s '$input_file' 'assemblies/$name' &&
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
15 #end for
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
16 trycycler cluster --assemblies assemblies/*
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
17 --reads '$reads'
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
18 --min_contig_len $min_contig_len
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
19 --min_contig_depth $min_contig_depth
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
20 --distance $distance
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
21 --threads \${GALAXY_SLOTS:-2}
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
22 --out_dir 'initial_clusters' &&
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
23 mv initial_clusters/contigs.phylip '$output_phylip' &&
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
24 mv initial_clusters/contigs.newick '$output_newick' &&
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
25 python3 '$__tool_directory__/trycycler.py' 'cluster' 'initial_clusters'
1
189e837009c9 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents: 0
diff changeset
26 ]]> </command>
0
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
27 <inputs>
1
189e837009c9 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents: 0
diff changeset
28 <param name='assemblies' type='data' format='fasta,fasta.gz' multiple='true' label='Assembled sequences datasets' help='Input assemblies whose contigs will be clustered (multiple FASTA files)' />
189e837009c9 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents: 0
diff changeset
29 <param name='reads' type='data' format='fastq,fastq.gz' label='Long-read datasets' help='Long reads (FASTQ format) used to generate the assemblies' />
189e837009c9 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents: 0
diff changeset
30 <param argument='--min_contig_len' type='integer' min='100' max='5000' value='1000' label='Minimum contig length' help='Contigs shorter than this are thrown out on the assumption that they are either incomplete or spurious. The default value is 1000, as plasmids smaller than that are very rare.' />
189e837009c9 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents: 0
diff changeset
31 <param argument='--min_contig_depth' type='float' min='0.01' max='1' value='0.1' label='Minimum contig depth' help='This controls how Trycycler filters out contigs with a low read depth. It is a multiple of the mean read depth for the assembly. For example, if an assembly has a mean depth of 90x and this setting is 0.1 (the default), then any contig with depth lower than 9x will be removed.' />
189e837009c9 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents: 0
diff changeset
32 <param argument='--distance' type='float' min='0.001' max='0.1' value='0.01' label='Mash distance threshold' help='This is the Mash distance threshold used when defining clusters, and the default threshold is 0.01. Smaller thresholds (e.g. 0.005) can result in a larger number of tighter clusters. Larger thresholds (e.g. 0.02) can result in a smaller number of looser clusters.' />
0
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
33 </inputs>
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
34 <outputs>
1
189e837009c9 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents: 0
diff changeset
35 <data name='output_phylip' format='phylip' label='${tool.name} on ${on_string}: phylip' />
189e837009c9 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents: 0
diff changeset
36 <data name='output_newick' format='newick' label='${tool.name} on ${on_string}: newick' />
0
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
37 <collection name='initial_clusters' type='list' label='${tool.name} on ${on_string}'>
1
189e837009c9 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents: 0
diff changeset
38 <discover_datasets pattern='__designation_and_ext__' format='fasta' directory='initial_clusters' />
0
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
39 </collection>
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
40 </outputs>
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
41 <tests>
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
42 <test>
1
189e837009c9 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents: 0
diff changeset
43 <param name='assemblies' value='assembly_00.fasta.gz,assembly_01.fasta.gz,assembly_02.fasta.gz,assembly_03.fasta.gz' />
189e837009c9 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents: 0
diff changeset
44 <param name='reads' value='reads.fastq.gz' />
189e837009c9 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents: 0
diff changeset
45 <output name='output_phylip' file='contigs_01.phylip' />
189e837009c9 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents: 0
diff changeset
46 <output name='output_newick' file='contigs_01.newick' />
0
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
47 <output_collection name='initial_clusters' type='list' count='2'>
1
189e837009c9 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents: 0
diff changeset
48 <element name='cluster_01' file='cluster_01.fasta' ftype='fasta' lines_diff='20' />
0
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
49 </output_collection>
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
50 </test>
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
51 <test>
1
189e837009c9 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents: 0
diff changeset
52 <param name='assemblies' value='assembly_00.fasta.gz,assembly_01.fasta.gz,assembly_02.fasta.gz,assembly_03.fasta.gz' />
189e837009c9 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents: 0
diff changeset
53 <param name='reads' value='reads.fastq.gz' />
189e837009c9 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents: 0
diff changeset
54 <param name='min_contig_len' value='900' />
189e837009c9 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents: 0
diff changeset
55 <param name='min_contig_depth' value='0.05' />
189e837009c9 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents: 0
diff changeset
56 <param name='distance' value='0.05' />
189e837009c9 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents: 0
diff changeset
57 <output name='output_phylip' file='contigs_02.phylip' />
189e837009c9 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents: 0
diff changeset
58 <output name='output_newick' file='contigs_02.newick' />
0
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
59 <output_collection name='initial_clusters' type='list' count='2'>
1
189e837009c9 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents: 0
diff changeset
60 <element name='cluster_01' file='cluster_02.fasta' ftype='fasta' lines_diff='20' />
0
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
61 </output_collection>
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
62 </test>
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
63 <test>
1
189e837009c9 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents: 0
diff changeset
64 <param name='assemblies' value='assembly_00.fasta.gz,assembly_01.fasta.gz,assembly_02.fasta.gz,assembly_03.fasta.gz' />
189e837009c9 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents: 0
diff changeset
65 <param name='reads' value='reads.fastq.gz' />
189e837009c9 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents: 0
diff changeset
66 <param name='min_contig_len' value='850' />
189e837009c9 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents: 0
diff changeset
67 <param name='min_contig_depth' value='0.01' />
189e837009c9 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents: 0
diff changeset
68 <param name='distance' value='0.09' />
189e837009c9 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents: 0
diff changeset
69 <output name='output_phylip' file='contigs_03.phylip' />
189e837009c9 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents: 0
diff changeset
70 <output name='output_newick' file='contigs_03.newick' />
0
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
71 <output_collection name='initial_clusters' type='list' count='2'>
1
189e837009c9 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents: 0
diff changeset
72 <element name='cluster_01' file='cluster_03.fasta' ftype='fasta' lines_diff='20' />
0
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
73 </output_collection>
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
74 </test>
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
75 <test>
1
189e837009c9 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents: 0
diff changeset
76 <param name='assemblies' value='assembly_00.fasta.gz,assembly_01.fasta.gz,assembly_02.fasta.gz,assembly_03.fasta.gz' />
189e837009c9 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents: 0
diff changeset
77 <param name='reads' value='reads.fastq.gz' />
189e837009c9 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents: 0
diff changeset
78 <param name='min_contig_len' value='1100' />
189e837009c9 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents: 0
diff changeset
79 <param name='min_contig_depth' value='0.02' />
189e837009c9 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents: 0
diff changeset
80 <param name='distance' value='0.07' />
189e837009c9 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents: 0
diff changeset
81 <output name='output_phylip' file='contigs_04.phylip' />
189e837009c9 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents: 0
diff changeset
82 <output name='output_newick' file='contigs_04.newick' />
0
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
83 <output_collection name='initial_clusters' type='list' count='2'>
1
189e837009c9 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents: 0
diff changeset
84 <element name='cluster_01' file='cluster_04.fasta' ftype='fasta' lines_diff='20' />
0
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
85 </output_collection>
1
189e837009c9 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents: 0
diff changeset
86 </test>
0
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
87 </tests>
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
88 <help><![CDATA[
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
89 .. class:: infomark
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
90
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
91 **Purpose**
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
92
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
93 The *Trycycler cluster* tool carries out complete-linkage clustering of all contig sequences based on their `Mash distance <https://genomebiology.biomedcentral.com/articles/10.1186/s13059-016-0997-x/>`_, a fast sequence distance estimator that uses the MinHash algorithm. It also serves to exclude any spurious, incomplete or badly misassembled contigs.
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
94
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
95 If your contigs do not form clear clusters, that indicates that the input assemblies are inconsistent and unreliable. If you find yourself in this situation (struggling to identify which clusters are good and which are bad), then you probably need to get better long-read data (longer and/or deeper) and try again.
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
96
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
97 ----
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
98
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
99 .. class:: infomark
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
100
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
101 **Input**
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
102
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
103 This tool requires two different inputs: a set of multiple separate assemblies and a long-read set.
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
104
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
105 ----
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
106
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
107 .. class:: infomark
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
108
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
109 **Output**
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
110
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
111 **Trycycler cluster** generates three outputs:
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
112
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
113 \* A matrix of the Mash distances between contigs (phylip output).
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
114
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
115 \* A `FastME tree <https://academic.oup.com/mbe/article/32/10/2798/1212138>`_ of the contigs built from the distance matrix. It can be visualised in the **newick display** tool.
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
116
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
117 \* A collection list which contains the clusters.
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
118
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
119 \
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
120
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
121 **Choose your clusters**
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
122
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
123 After running **Trycycler cluster**, you need to extract the cluster datasets from the collection by using the **Extract Element from a collection based on a name** tool. It is up to you to choose which of the clusters are good and which are bad. This can be somewhat subjective, so there is not an exact procedure for you to follow.
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
124
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
125 Generally speaking, a good cluster contains many contigs (ideally one from each assembly) which are all very close to each other and have realistic read depths. A bad cluster contains a small number of contigs (maybe just one) which might have low read depths. The tree can be useful in making these decisions, though interpret it with a grain of salt, as the contig sequences are not necessarily related in a tree-like manner.
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
126
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
127 If you have prior knowledge about what your genome should look like, that information can be quite useful in deciding which clusters are good. E.g. if you happened to know that your genome contains a 150 kbp plasmid, then you can expect one of your good clusters to have contigs of about that size.
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
128
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
129 You might also decide at this point that the default value for --distance (0.01) was not quite right. E.g. if your tree contains two very close clusters that you think should actually be one cluster, you can run Trycycler cluster again with a larger distance threshold. Another thing to keep in mind: contamination can happen. This most often occurs through cross-barcode contamination, where a contig in one assembly actually belongs to a different genome from the same multiplexed sequencing run.
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
130
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
131
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
132 ----
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
133
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
134 .. class:: infomark
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
135
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
136 @PIPELINE@
1
189e837009c9 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents: 0
diff changeset
137 ]]> </help>
189e837009c9 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents: 0
diff changeset
138 <expand macro='citations' />
0
c767a45616d0 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff changeset
139 </tool>