0
|
1 <tool id="mapsembler2" name="Mapsembler2" version="2.2.3">
|
|
2 <description>is a targeted assembly software.</description>
|
|
3 <requirements>
|
|
4 <requirement type="package" version="2.2.3">mapsembler2</requirement>
|
|
5 </requirements>
|
|
6 <command interpreter="python">
|
|
7 mapsembler2.py
|
|
8 -s $input_starters
|
|
9 -r $data_files
|
|
10 -t $output_extension
|
|
11 -k $kmer
|
|
12 -c $coverage
|
|
13 -d $substitutions
|
|
14 -g $genome_size
|
|
15 -f $process_search
|
|
16 -x $max_length
|
|
17 -y $max_depth
|
|
18 --output $output
|
|
19 -i $index_files
|
|
20 </command>
|
|
21
|
|
22 <inputs>
|
|
23 <!-- Input data files -->
|
|
24 <param name="input_starters" type="data" format="fasta" label="Starters" help="set of input sequences" />
|
|
25 <param name="data_files" type="data" multiple="true" format="fasta,fastq" label="Read file" help="Data loaded in the script" />
|
|
26 <param name="output_extension" type="select" label="Select your output extension type">
|
|
27 <option value="1">a strict sequence</option>
|
|
28 <option value="2">a consensus sequence</option>
|
|
29 <option value="3">a strict graph</option>
|
|
30 <option value="4">a consensus graph</option>
|
|
31 </param>
|
|
32 <param name="kmer" type="integer" label="Size of kmers" value="31" help="Set the length of used kmers. Must fit the compiled value. Only uneven number" />
|
|
33 <param name="coverage" type="integer" label="Minimal coverage" value="5" help="set the minimal coverage: Used by Phaser (don't use kmers with lower coverage) "/>
|
|
34 <param name="substitutions" type="integer" label="Number of authorized substitutions" value="1" help="set the number of authorized substitutions used while mapping reads on finding SNPs"/>
|
|
35 <param name="genome_size" type="integer" label="Estimated genome size" value="10000000" help="Used only to control memory usage. e.g.3 billion (3000000000) uses 4Gb of RAM." />
|
|
36 <param name="process_search" type="select" label="Process of search" help="Set the process of search in the graph" >
|
|
37 <option value="1">Breadth</option>
|
|
38 <option value="2">Depth</option>
|
|
39 </param>
|
|
40 <param name="max_length" type="integer" label="Max length of nodes" value="40" help="set the maximal length of nodes"/>
|
|
41 <param name="max_depth" type="integer" label="Max depth of nodes" value="10000" help="set the maximal depth of the graph"/>
|
|
42 <param name="index_files" type="boolean" checked="false" default="false" label="Include index output files" />
|
|
43 </inputs>
|
|
44
|
|
45 <outputs>
|
|
46 <data format="txt" name="output" label="${tool.name} on ${on_string}: out.txt" >
|
|
47 <discover_datasets pattern="__designation_and_ext__" directory="job_outputs" visible="true" />
|
|
48 </data>
|
|
49
|
|
50 </outputs>
|
|
51 <help>
|
|
52
|
|
53 **Description**
|
|
54
|
|
55 Mapsembler2 is a targeted assembly software. It takes as input a set of NGS raw reads (fasta or fastq, gzipped or not) and a set of input sequences (starters). It first determines if each starter is read-coherent, e.g. whether reads confirm the presence of each starter in the original sequence. Then for each read-coherent starter, Mapsembler2 outputs its sequence neighborhood as a linear sequence or as a graph, depending on the user choice.
|
|
56 Mapsembler2 may be used for (not limited to):
|
|
57
|
|
58 · Validate an assembled sequence (input as starter), e.g. from a de Bruijn graph assembly where read-coherence was not enforced.
|
|
59
|
|
60 · Checks if a gene (input as starter) has an homolog in a set of reads.
|
|
61
|
|
62 · Checks if a known enzyme is present in a metagenomic NGS read set.
|
|
63
|
|
64 · Enrich unmappable reads by extending them, possibly making them mappable.
|
|
65
|
|
66 · Checks what happens at the extremities of a contig.
|
|
67
|
|
68 · Remove contaminants or symbiont reads from a read set
|
|
69
|
|
70 -------
|
|
71
|
|
72 **Web site**
|
|
73
|
|
74 http://colibread.inria.fr/mapsembler2/
|
|
75
|
|
76 -------
|
|
77
|
|
78 **Integrated by**
|
|
79
|
|
80 Cyril Monjeaud
|
|
81
|
|
82 GenOuest Bio-informatics Core Facility
|
|
83
|
|
84 UMR 6074 IRISA INRIA-CNRS-UR1 Rennes (France)
|
|
85
|
|
86 support@genouest.org
|
|
87
|
|
88 If you use this tool in Galaxy, please cite :
|
|
89
|
|
90 `Y. Le Bras, A. Roult, C. Monjeaud, M. Bahin, O. Quenez, C. Heriveau, A. Bretaudeau, O. Sallou, O. Collin, Towards a Life Sciences Virtual Research Environment : an e-Science initiative in Western France. JOBIM 2013. <https://www.e-biogenouest.org/resources/128>`_
|
|
91
|
|
92 </help>
|
|
93 <citations>
|
|
94 <citation type="doi">10.1186/1471-2105-13-48</citation>
|
|
95 <citation type="bibtex">@INPROCEEDINGS{JOBIM2013,
|
|
96 author = {Le Bras, Y. and ROULT, A. and Monjeaud, C. and Bahin, M. and Quenez, O. and Heriveau, C. and Bretaudeau, A. and Sallou, O. and Collin, O.},
|
|
97 title = {Towards a Life Sciences Virtual Research Environment: An e-Science initiative in Western France},
|
|
98 booktitle = {JOBIM 2013 Proceedings},
|
|
99 year = {2013},
|
|
100 url = {https://www.e-biogenouest.org/resources/128},
|
|
101 pages = {97-106}
|
|
102 }
|
|
103 </citation>
|
|
104
|
|
105 </citations>
|
|
106
|
|
107 </tool>
|
|
108
|