Mercurial > repos > iuc > trycycler_cluster
annotate trycycler_cluster.xml @ 6:ed2425b9fd27 draft
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e9abd8b86133e530d0395d85bca320a1af27a9b6
author | iuc |
---|---|
date | Tue, 02 Apr 2024 08:30:22 +0000 |
parents | 189e837009c9 |
children |
rev | line source |
---|---|
1
189e837009c9
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents:
0
diff
changeset
|
1 <tool id='trycycler_cluster' name='Trycycler cluster' version='@TOOL_VERSION@' profile='20.01'> |
0
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
2 <description>cluster the contigs of your input assemblies into per-replicon groups</description> |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
3 <macros> |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
4 <import>macros.xml</import> |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
5 </macros> |
1
189e837009c9
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents:
0
diff
changeset
|
6 <expand macro='edam_ontology' /> |
189e837009c9
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents:
0
diff
changeset
|
7 <expand macro='requirements' /> |
0
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
8 <version_command>trycycler --version</version_command> |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
9 <command detect_errors='exit_code'><![CDATA[ |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
10 #import re |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
11 mkdir -p initial_clusters assemblies && |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
12 #for $input_file in $assemblies |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
13 #set $name = re.sub('[^\w\-\.]', '_', str($input_file.element_identifier)) |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
14 ln -s '$input_file' 'assemblies/$name' && |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
15 #end for |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
16 trycycler cluster --assemblies assemblies/* |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
17 --reads '$reads' |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
18 --min_contig_len $min_contig_len |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
19 --min_contig_depth $min_contig_depth |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
20 --distance $distance |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
21 --threads \${GALAXY_SLOTS:-2} |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
22 --out_dir 'initial_clusters' && |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
23 mv initial_clusters/contigs.phylip '$output_phylip' && |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
24 mv initial_clusters/contigs.newick '$output_newick' && |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
25 python3 '$__tool_directory__/trycycler.py' 'cluster' 'initial_clusters' |
1
189e837009c9
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents:
0
diff
changeset
|
26 ]]> </command> |
0
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
27 <inputs> |
1
189e837009c9
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents:
0
diff
changeset
|
28 <param name='assemblies' type='data' format='fasta,fasta.gz' multiple='true' label='Assembled sequences datasets' help='Input assemblies whose contigs will be clustered (multiple FASTA files)' /> |
189e837009c9
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents:
0
diff
changeset
|
29 <param name='reads' type='data' format='fastq,fastq.gz' label='Long-read datasets' help='Long reads (FASTQ format) used to generate the assemblies' /> |
189e837009c9
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents:
0
diff
changeset
|
30 <param argument='--min_contig_len' type='integer' min='100' max='5000' value='1000' label='Minimum contig length' help='Contigs shorter than this are thrown out on the assumption that they are either incomplete or spurious. The default value is 1000, as plasmids smaller than that are very rare.' /> |
189e837009c9
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents:
0
diff
changeset
|
31 <param argument='--min_contig_depth' type='float' min='0.01' max='1' value='0.1' label='Minimum contig depth' help='This controls how Trycycler filters out contigs with a low read depth. It is a multiple of the mean read depth for the assembly. For example, if an assembly has a mean depth of 90x and this setting is 0.1 (the default), then any contig with depth lower than 9x will be removed.' /> |
189e837009c9
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents:
0
diff
changeset
|
32 <param argument='--distance' type='float' min='0.001' max='0.1' value='0.01' label='Mash distance threshold' help='This is the Mash distance threshold used when defining clusters, and the default threshold is 0.01. Smaller thresholds (e.g. 0.005) can result in a larger number of tighter clusters. Larger thresholds (e.g. 0.02) can result in a smaller number of looser clusters.' /> |
0
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
33 </inputs> |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
34 <outputs> |
1
189e837009c9
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents:
0
diff
changeset
|
35 <data name='output_phylip' format='phylip' label='${tool.name} on ${on_string}: phylip' /> |
189e837009c9
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents:
0
diff
changeset
|
36 <data name='output_newick' format='newick' label='${tool.name} on ${on_string}: newick' /> |
0
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
37 <collection name='initial_clusters' type='list' label='${tool.name} on ${on_string}'> |
1
189e837009c9
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents:
0
diff
changeset
|
38 <discover_datasets pattern='__designation_and_ext__' format='fasta' directory='initial_clusters' /> |
0
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
39 </collection> |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
40 </outputs> |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
41 <tests> |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
42 <test> |
1
189e837009c9
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents:
0
diff
changeset
|
43 <param name='assemblies' value='assembly_00.fasta.gz,assembly_01.fasta.gz,assembly_02.fasta.gz,assembly_03.fasta.gz' /> |
189e837009c9
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents:
0
diff
changeset
|
44 <param name='reads' value='reads.fastq.gz' /> |
189e837009c9
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents:
0
diff
changeset
|
45 <output name='output_phylip' file='contigs_01.phylip' /> |
189e837009c9
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents:
0
diff
changeset
|
46 <output name='output_newick' file='contigs_01.newick' /> |
0
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
47 <output_collection name='initial_clusters' type='list' count='2'> |
1
189e837009c9
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents:
0
diff
changeset
|
48 <element name='cluster_01' file='cluster_01.fasta' ftype='fasta' lines_diff='20' /> |
0
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
49 </output_collection> |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
50 </test> |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
51 <test> |
1
189e837009c9
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents:
0
diff
changeset
|
52 <param name='assemblies' value='assembly_00.fasta.gz,assembly_01.fasta.gz,assembly_02.fasta.gz,assembly_03.fasta.gz' /> |
189e837009c9
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents:
0
diff
changeset
|
53 <param name='reads' value='reads.fastq.gz' /> |
189e837009c9
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents:
0
diff
changeset
|
54 <param name='min_contig_len' value='900' /> |
189e837009c9
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents:
0
diff
changeset
|
55 <param name='min_contig_depth' value='0.05' /> |
189e837009c9
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents:
0
diff
changeset
|
56 <param name='distance' value='0.05' /> |
189e837009c9
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents:
0
diff
changeset
|
57 <output name='output_phylip' file='contigs_02.phylip' /> |
189e837009c9
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents:
0
diff
changeset
|
58 <output name='output_newick' file='contigs_02.newick' /> |
0
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
59 <output_collection name='initial_clusters' type='list' count='2'> |
1
189e837009c9
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents:
0
diff
changeset
|
60 <element name='cluster_01' file='cluster_02.fasta' ftype='fasta' lines_diff='20' /> |
0
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
61 </output_collection> |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
62 </test> |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
63 <test> |
1
189e837009c9
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents:
0
diff
changeset
|
64 <param name='assemblies' value='assembly_00.fasta.gz,assembly_01.fasta.gz,assembly_02.fasta.gz,assembly_03.fasta.gz' /> |
189e837009c9
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents:
0
diff
changeset
|
65 <param name='reads' value='reads.fastq.gz' /> |
189e837009c9
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents:
0
diff
changeset
|
66 <param name='min_contig_len' value='850' /> |
189e837009c9
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents:
0
diff
changeset
|
67 <param name='min_contig_depth' value='0.01' /> |
189e837009c9
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents:
0
diff
changeset
|
68 <param name='distance' value='0.09' /> |
189e837009c9
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents:
0
diff
changeset
|
69 <output name='output_phylip' file='contigs_03.phylip' /> |
189e837009c9
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents:
0
diff
changeset
|
70 <output name='output_newick' file='contigs_03.newick' /> |
0
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
71 <output_collection name='initial_clusters' type='list' count='2'> |
1
189e837009c9
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents:
0
diff
changeset
|
72 <element name='cluster_01' file='cluster_03.fasta' ftype='fasta' lines_diff='20' /> |
0
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
73 </output_collection> |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
74 </test> |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
75 <test> |
1
189e837009c9
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents:
0
diff
changeset
|
76 <param name='assemblies' value='assembly_00.fasta.gz,assembly_01.fasta.gz,assembly_02.fasta.gz,assembly_03.fasta.gz' /> |
189e837009c9
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents:
0
diff
changeset
|
77 <param name='reads' value='reads.fastq.gz' /> |
189e837009c9
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents:
0
diff
changeset
|
78 <param name='min_contig_len' value='1100' /> |
189e837009c9
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents:
0
diff
changeset
|
79 <param name='min_contig_depth' value='0.02' /> |
189e837009c9
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents:
0
diff
changeset
|
80 <param name='distance' value='0.07' /> |
189e837009c9
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents:
0
diff
changeset
|
81 <output name='output_phylip' file='contigs_04.phylip' /> |
189e837009c9
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents:
0
diff
changeset
|
82 <output name='output_newick' file='contigs_04.newick' /> |
0
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
83 <output_collection name='initial_clusters' type='list' count='2'> |
1
189e837009c9
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents:
0
diff
changeset
|
84 <element name='cluster_01' file='cluster_04.fasta' ftype='fasta' lines_diff='20' /> |
0
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
85 </output_collection> |
1
189e837009c9
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents:
0
diff
changeset
|
86 </test> |
0
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
87 </tests> |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
88 <help><![CDATA[ |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
89 .. class:: infomark |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
90 |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
91 **Purpose** |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
92 |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
93 The *Trycycler cluster* tool carries out complete-linkage clustering of all contig sequences based on their `Mash distance <https://genomebiology.biomedcentral.com/articles/10.1186/s13059-016-0997-x/>`_, a fast sequence distance estimator that uses the MinHash algorithm. It also serves to exclude any spurious, incomplete or badly misassembled contigs. |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
94 |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
95 If your contigs do not form clear clusters, that indicates that the input assemblies are inconsistent and unreliable. If you find yourself in this situation (struggling to identify which clusters are good and which are bad), then you probably need to get better long-read data (longer and/or deeper) and try again. |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
96 |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
97 ---- |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
98 |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
99 .. class:: infomark |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
100 |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
101 **Input** |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
102 |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
103 This tool requires two different inputs: a set of multiple separate assemblies and a long-read set. |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
104 |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
105 ---- |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
106 |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
107 .. class:: infomark |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
108 |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
109 **Output** |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
110 |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
111 **Trycycler cluster** generates three outputs: |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
112 |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
113 \* A matrix of the Mash distances between contigs (phylip output). |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
114 |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
115 \* A `FastME tree <https://academic.oup.com/mbe/article/32/10/2798/1212138>`_ of the contigs built from the distance matrix. It can be visualised in the **newick display** tool. |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
116 |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
117 \* A collection list which contains the clusters. |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
118 |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
119 \ |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
120 |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
121 **Choose your clusters** |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
122 |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
123 After running **Trycycler cluster**, you need to extract the cluster datasets from the collection by using the **Extract Element from a collection based on a name** tool. It is up to you to choose which of the clusters are good and which are bad. This can be somewhat subjective, so there is not an exact procedure for you to follow. |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
124 |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
125 Generally speaking, a good cluster contains many contigs (ideally one from each assembly) which are all very close to each other and have realistic read depths. A bad cluster contains a small number of contigs (maybe just one) which might have low read depths. The tree can be useful in making these decisions, but take it with a grain of salt, as the contig sequences are not necessarily related in a tree-like manner. |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
126 |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
127 If you have prior knowledge about what your genome should look like, that information can be quite useful in deciding which clusters are good. For example, if you happen to know that your genome contains a 150 kbp plasmid, then you can expect one of your good clusters to have contigs of about that size. |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
128 |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
129 You might also decide at this point that the default value for --distance (0.01) was not quite right. E.g. if your tree contains two very close clusters that you think should actually be one cluster, you can run Trycycler cluster again with a larger distance threshold. Another thing to keep in mind: contamination can happen. This most often occurs as cross-barcode contamination, where a contig in one assembly actually belongs to a different genome from the same multiplexed sequencing run. |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
130 |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
131 |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
132 ---- |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
133 |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
134 .. class:: infomark |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
135 |
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
136 @PIPELINE@ |
1
189e837009c9
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents:
0
diff
changeset
|
137 ]]> </help> |
189e837009c9
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit e88166111fa3b6c57c870ea4cff6e012a1b1a912"
iuc
parents:
0
diff
changeset
|
138 <expand macro='citations' /> |
0
c767a45616d0
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/trycycler commit 9d7c4277b0f96aacd466f2d497e08edcca3fa238"
iuc
parents:
diff
changeset
|
139 </tool> |