0
|
1 <tool id="mapsembler2" name="Mapsembler2" version="2.2.3">
|
|
2 <description>is a targeted assembly software.</description>
|
|
3 <requirements>
|
|
4 <requirement type="package" version="2.2.3">mapsembler2</requirement>
|
|
5 </requirements>
|
|
6 <command interpreter="python">
|
|
7 mapsembler2.py
|
|
8 -s $input_starters
|
|
9 -r $data_files
|
2
|
10 -e $extension_format
|
0
|
11 -t $output_extension
|
|
12 -k $kmer
|
|
13 -c $coverage
|
|
14 -d $substitutions
|
|
15 -g $genome_size
|
|
16 -f $process_search
|
|
17 -x $max_length
|
|
18 -y $max_depth
|
|
19 --output $output
|
|
20 -i $index_files
|
|
21 </command>
|
|
22
|
|
23 <inputs>
|
|
24 <!-- Input data files -->
|
|
25 <param name="input_starters" type="data" format="fasta" label="Starters" help="set of input sequences" />
|
|
26 <param name="data_files" type="data" multiple="true" format="fasta,fastq" label="Read file" help="Data loaded in the script" />
|
2
|
27 <param name="extension_format" type="select" label="Input files">
|
|
28 <option value="fasta">fasta</option>
|
|
29 <option value="fastq">fastq</option>
|
|
30 </param>
|
0
|
31 <param name="output_extension" type="select" label="Select your output extension type">
|
|
32 <option value="1">a strict sequence</option>
|
|
33 <option value="2">a consensus sequence</option>
|
|
34 <option value="3">a strict graph</option>
|
|
35 <option value="4">a consensus graph</option>
|
|
36 </param>
|
|
37 <param name="kmer" type="integer" label="Size of kmers" value="31" help="Set the length of used kmers. Must fit the compiled value. Only uneven number" />
|
|
38 <param name="coverage" type="integer" label="Minimal coverage" value="5" help="set the minimal coverage: Used by Phaser (don't use kmers with lower coverage) "/>
|
|
39 <param name="substitutions" type="integer" label="Number of authorized substitutions" value="1" help="set the number of authorized substitutions used while mapping reads on finding SNPs"/>
|
|
40 <param name="genome_size" type="integer" label="Estimated genome size" value="10000000" help="Used only to control memory usage. e.g.3 billion (3000000000) uses 4Gb of RAM." />
|
|
41 <param name="process_search" type="select" label="Process of search" help="Set the process of search in the graph" >
|
|
42 <option value="1">Breadth</option>
|
|
43 <option value="2">Depth</option>
|
|
44 </param>
|
|
45 <param name="max_length" type="integer" label="Max length of nodes" value="40" help="set the maximal length of nodes"/>
|
|
46 <param name="max_depth" type="integer" label="Max depth of nodes" value="10000" help="set the maximal depth of the graph"/>
|
|
47 <param name="index_files" type="boolean" checked="false" default="false" label="Include index output files" />
|
|
48 </inputs>
|
|
49
|
|
50 <outputs>
|
|
51 <data format="txt" name="output" label="${tool.name} on ${on_string}: out.txt" >
|
|
52 <discover_datasets pattern="__designation_and_ext__" directory="job_outputs" visible="true" />
|
|
53 </data>
|
|
54
|
|
55 </outputs>
|
2
|
56 <stdio>
|
|
57 <exit_code range="1" level="fatal" description="Error in Stacks Denovo execution" />
|
|
58 </stdio>
|
0
|
59 <help>
|
|
60
|
|
61 **Description**
|
|
62
|
|
63 Mapsembler2 is a targeted assembly software. It takes as input a set of NGS raw reads (fasta or fastq, gzipped or not) and a set of input sequences (starters). It first determines if each starter is read-coherent, e.g. whether reads confirm the presence of each starter in the original sequence. Then for each read-coherent starter, Mapsembler2 outputs its sequence neighborhood as a linear sequence or as a graph, depending on the user choice.
|
|
64 Mapsembler2 may be used for (not limited to):
|
|
65
|
|
66 · Validate an assembled sequence (input as starter), e.g. from a de Bruijn graph assembly where read-coherence was not enforced.
|
|
67
|
|
68 · Checks if a gene (input as starter) has an homolog in a set of reads.
|
|
69
|
|
70 · Checks if a known enzyme is present in a metagenomic NGS read set.
|
|
71
|
|
72 · Enrich unmappable reads by extending them, possibly making them mappable.
|
|
73
|
|
74 · Checks what happens at the extremities of a contig.
|
|
75
|
|
76 · Remove contaminants or symbiont reads from a read set
|
|
77
|
|
78 -------
|
|
79
|
|
80 **Web site**
|
|
81
|
|
82 http://colibread.inria.fr/mapsembler2/
|
|
83
|
|
84 -------
|
|
85
|
|
86 **Integrated by**
|
|
87
|
|
88 Cyril Monjeaud
|
|
89
|
|
90 GenOuest Bio-informatics Core Facility
|
|
91
|
|
92 UMR 6074 IRISA INRIA-CNRS-UR1 Rennes (France)
|
|
93
|
|
94 support@genouest.org
|
|
95
|
|
96 If you use this tool in Galaxy, please cite :
|
|
97
|
|
98 `Y. Le Bras, A. Roult, C. Monjeaud, M. Bahin, O. Quenez, C. Heriveau, A. Bretaudeau, O. Sallou, O. Collin, Towards a Life Sciences Virtual Research Environment : an e-Science initiative in Western France. JOBIM 2013. <https://www.e-biogenouest.org/resources/128>`_
|
|
99
|
|
100 </help>
|
|
101 <citations>
|
|
102 <citation type="doi">10.1186/1471-2105-13-48</citation>
|
|
103 <citation type="bibtex">@INPROCEEDINGS{JOBIM2013,
|
|
104 author = {Le Bras, Y. and ROULT, A. and Monjeaud, C. and Bahin, M. and Quenez, O. and Heriveau, C. and Bretaudeau, A. and Sallou, O. and Collin, O.},
|
|
105 title = {Towards a Life Sciences Virtual Research Environment: An e-Science initiative in Western France},
|
|
106 booktitle = {JOBIM 2013 Proceedings},
|
|
107 year = {2013},
|
|
108 url = {https://www.e-biogenouest.org/resources/128},
|
|
109 pages = {97-106}
|
|
110 }
|
|
111 </citation>
|
|
112
|
|
113 </citations>
|
|
114
|
|
115 </tool>
|
|
116
|