Mercurial > repos > stheil > metavelvet_wrapper
changeset 1:0591d844bd08 draft
Uploaded
author | stheil |
---|---|
date | Thu, 24 Sep 2015 10:41:51 -0400 |
parents | 3e0660c2fb2c |
children | 1bb80c25b379 |
files | meta_velvet.xml |
diffstat | 1 files changed, 419 insertions(+), 0 deletions(-) [+] |
line wrap: on
line diff
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/meta_velvet.xml Thu Sep 24 10:41:51 2015 -0400 @@ -0,0 +1,419 @@ +<tool id="velvet_test" name="velvet_test" version="3.0 (2013-4-30)"> + + <macros> + <import>velvet_macro.xml</import> + </macros> + <description>Run velvet or meta-velvetg assembly.</description> + + <command interpreter="perl">velvet.pl + + $meta + + #for $i, $library in enumerate( $shortPaired ) + + #set $libNumber = $i + 1 + + #if $libNumber == 1 + + #set $libNumber = '' + + #end if + + #if not $library.ins_length.value is None + + -ins_length$libNumber $library.ins_length + + #end if + + #if not $library.ins_length_sd.value is None + + -ins_length_sd$libNumber $library.ins_length_sd + + #end if + + -shortPaired$libNumber + + @PAIRED_FILES_OPTIONS@ + + #end for + + #for $i, $library in enumerate( $short ) + + #set $libNumber = $i + 1 + + #if $libNumber == 1 + + #set $libNumber = '' + + #end if + + -short$libNumber + + @UNPAIRED_FILES_OPTIONS@ + + #end for + + #for $i, $library in enumerate( $longPaired ) + + #if not $library.ins_length.value is None + + -ins_length_long $library.ins_length + + #end if + + #if not $library.ins_length_sd.value is None + + -ins_length_long_sd $library.ins_length_sd + + #end if + + -longPaired + + @PAIRED_FILES_OPTIONS@ + + #end for + + #for $i, $library in enumerate( $long ) + + -long + + @UNPAIRED_FILES_OPTIONS@ + + #end for + + #if not $hash_length.value == '' + + -hash_length $hash_length + + #end if + + $strand_specific + + #if not $cov_cutoff.value == '' + + -cov_cutoff $cov_cutoff + + #end if + + $read_trkg + + #if not $min_contig_lgth.value is None + + -min_contig_lgth $min_contig_lgth + + #end if + + $amos_file + + #if not $exp_cov.value == '' + + -exp_cov $exp_cov + + #end if + + #if not $long_cov_cutoff.value == '' + + -long_cov_cutoff $long_cov_cutoff + + #end if + + $scaffolding + + #if not $max_branch_length.value is None + + -max_branch_length $max_branch_length + + #end if + + #if not $max_divergence.value is None + + -max_divergence $max_divergence + + #end if + + #if not $max_gap_count.value is None + + -max_gap_count $max_gap_count + + #end if + + #if not $min_pair_count.value is None + + -min_pair_count $min_pair_count + + #end if + + #if not $max_coverage.value is None + + -max_coverage $max_coverage + + #end if + + #if not $coverage_mask.value is None + + -coverage_mask $coverage_mask + + #end if + + #if not $long_mult_cutoff.value is None + + -long_mult_cutoff $long_mult_cutoff + + #end if + + $unused_reads + + $alignments + + $exportFiltered + + #if not $paired_exp_fraction.value is None + + -paired_exp_fraction $paired_exp_fraction + + #end if + + $shortMatePaired + + $conserveLong + + $discard_chimera + + #if not $max_chimera_rate.value is None + + -max_chimera_rate $max_chimera_rate + + #end if + + #if not $repeat_cov_sd.value is None + + -repeat_cov_sd $repeat_cov_sd + + #end if + + #if not $min_split_length.value is None + + -min_split_length $min_split_length + + #end if + + #if not $valid_connections.value is None + + -valid_connections $valid_connections + + #end if + + #if not $noise_connections.value is None + + -noise_connections $noise_connections + + #end if + + $use_connections + + $report_split_detail + + $report_subgraph + + #if not $exp_covs.value == '' + + -exp_covs $exp_covs + + #end if + + #if not $min_peak_cov.value is None + + -min_peak_cov $min_peak_cov + + #end if + + #if not $max_peak_cov.value is None + + -max_peak_cov $max_peak_cov + + #end if + + #if not $histo_bin_width.value is None + + -histo_bin_width $histo_bin_width + + #end if + + #if not $histo_sn_ratio.value is None + + -histo_sn_ratio $histo_sn_ratio + + #end if + + </command> + + <inputs> + + <param name="hash_length" type="text" value="31" label="Hash length : integer <= 150 OR m,M,s with m (min kmer length) < M (max kmer length) <= 150 and s is a step number"/> + + <param name="meta" type="select" label="Perform a metagenomic assembly using meta-velvetg"> + <option value="">Yes</option> + <option value="-nometa">No</option> + </param> + + <repeat name="shortPaired" max="2" title="Short paired reads library"> + <expand macro="paired_library_options" /> + </repeat> + + <repeat name="short" max="2" title="Short unpaired reads library"> + <expand macro="unpaired_library_options" /> + </repeat> + + <repeat name="longPaired" max="1" title="Long paired reads library"> + <expand macro="paired_library_options" /> + </repeat> + + <repeat name="long" max="1" title="Long unpaired reads library"> + <expand macro="unpaired_library_options" /> + </repeat> + + <param name="reference" type="data" format="fasta" optional="true" label="VELVETH - Reference file (-reference)"/> + + <param name="strand_specific" type="select" label="VELVETH - Strand specific transcriptome sequencing data. Default: No (-strand_specific)"> + <option value="">No</option> + <option value="-strand_specific">Yes</option> + </param> + + <param name="cov_cutoff" type="text" optional="true" label="VELVETG - Coverage cutoff. Float or auto (-cov_cutoff)"/> + + <param name="read_trkg" type="select" label="VELVETG - Tracking of short read positions in assembly. Default: no tracking (-read_trkg)"> + <option value="">No</option> + <option value="-read_trkg yes">Yes</option> + </param> + + <param name="min_contig_lgth" type="integer" optional="true" label="VELVETG - Minimum contig length. Default: hash length * 2 (-min_contig_lgth)"/> + + <param name="amos_file" type="select" label="VELVETG - Export assembly to AMOS file. Default: no export (-amos_file)"> + <option value="">No</option> + <option value="-amos_file yes">Yes</option> + </param> + + <param name="exp_cov" type="text" optional="true" label="VELVETG - Expected coverage of unique regions (float or auto). In case of metagenomic analysis it will be set to auto (-exp_cov)"/> + <param name="long_cov_cutoff" type="text" optional="true" label="VELVETG - Cutoff for removal of nodes with low long-read coverage (-long_cov_cutoff)"/> + + <param name="scaffolding" type="select" label="VELVETG - Scaffolding of contigs used paired end information. Default: on (-scaffolding)"> + <option value="">Yes</option> + <option value="-scaffolding no">No</option> + </param> + + <param name="max_branch_length" type="integer" optional="true" label="VELVETG - Maximum length in base pair of bubble. Default: 100 (-max_branch_length)"/> + <param name="max_divergence" type="float" optional="true" label="VELVETG - Maximum divergence rate between two branches in a bubble. Default: 0.2 (-max_divergence)"/> + <param name="max_gap_count" type="integer" optional="true" label="VELVETG - Maximum number of gaps allowed in the alignment of the two branches of a bubble. Default: 3 (-max_gap_count)"/> + <param name="min_pair_count" type="integer" optional="true" label="VELVETG -Minimum number of paired end connections to justify the scaffolding of two long contigs. Default: 5 (-min_pair_count)"/> + + <param name="max_coverage" type="float" optional="true" label="VELVETG - Cutoff for removal of high coverage nodes AFTER tour bus. Default: no removal (-max_coverage)"/> + <param name="coverage_mask" type="integer" optional="true" label="VELVETG - Minimum coverage required for confident regions of contigs. Default: 1 (-coverage_mask)"/> + <param name="long_mult_cutoff" type="integer" optional="true" label="VELVETG -Minimum number of long reads required to merge contigs. Default: 2 (-long_mult_cutoff)"/> + + <param name="unused_reads" type="select" label="VELVETG - Export unused reads in UnusedReads.fa file. Default: no (-unused_reads)"> + <option value="">No</option> + <option value="-unused_reads yes">Yes</option> + </param> + + <param name="alignments" type="select" label="VELVETG - Export a summary of contig alignment to the reference sequences. Default: no (-alignments)"> + <option value="">No</option> + <option value="-alignments yes">Yes</option> + </param> + + <param name="exportFiltered" type="select" label="VELVETG - Export the long nodes which were eliminated by the coverage filters. Default: no (-exportFiltered)"> + <option value="">No</option> + <option value="-exportFiltered yes">Yes</option> + </param> + + <param name="paired_exp_fraction" type="float" optional="true" label="VELVETG -Remove all the paired end connections which less than the specified fraction of the expected count. Default: 0.1 (-paired_exp_fraction)"/> + + <param name="shortMatePaired" type="select" label="VELVETG - For mate-pair libraries, indicate that the library might be contaminated with paired-end reads. Default no (-shortMatePaired)"> + <option value="">No</option> + <option value="-shortMatePaired yes">Yes</option> + </param> + + <param name="conserveLong" type="select" label="VELVETG - Preserve sequences with long reads in them. Default no (-conserveLong)"> + <option value="">No</option> + <option value="-conserveLong yes">Yes</option> + </param> + + <param name="discard_chimera" type="select" label="META-VELVETG - Discard chimera sub-graph. Default: no (-discard_chimera)"> + <option value="">No</option> + <option value="-discard_chimera yes">Yes</option> + </param> + + <param name="max_chimera_rate" type="float" optional="true" label="META-VELVETG - Maximum allowable chimera rate. Default: 0.0 (-max_chimera_rate)"/> + <param name="repeat_cov_sd" type="float" optional="true" label="META-VELVETG - Standard deviation of repeat node coverages. Default: 0.1 (-repeat_cov_sd)"/> + <param name="min_split_length" type="integer" optional="true" label="META-VELVETG - Minimum node length required for repeat resolution. Default: 0 (-min_split_length)"/> + <param name="valid_connections" type="integer" optional="true" label="META-VELVETG - Minimum allowable number of consistent paired-end connections. Default: 1 (-valid_connections)"/> + <param name="noise_connections" type="integer" optional="true" label="META-VELVETG - Maximum allowable number of inconsistent paired-end connections. Default: 0 (-noise_connections)"/> + + <param name="use_connections" type="select" label="META-VELVETG - Use paired-end connections for graph splitting. Default: yes (-use_connections)"> + <option value="">Yes</option> + <option value="-use_connections no">No</option> + </param> + + <param name="report_split_detail" type="select" label="META-VELVETG - Report sequences around repeat nodes. Default: no (-report_split_detail)"> + <option value="">No</option> + <option value="-report_split_detail yes">Yes</option> + </param> + + <param name="report_subgraph" type="select" label="META-VELVETG - Report node sequences for each subgraph. Default: no (-report_subgraph)"> + <option value="">No</option> + <option value="-report_subgraph yes">Yes</option> + </param> + + <param name="exp_covs" type="text" optional="true" label="META-VELVETG - Expected coverages for each species in microbiome. Default: auto (-exp_covs)"/> + + <param name="min_peak_cov" type="float" optional="true" label="META-VELVETG - Minimum peak coverage. Default: 0 (-min_peak_cov)"/> + <param name="max_peak_cov" type="float" optional="true" label="META-VELVETG - Maximum peak coverage. Default: 500 (-max_peak_cov)"/> + <param name="histo_bin_width" type="float" optional="true" label="META-VELVETG - Bin width of peak coverage histogram. Default: 1 (-histo_bin_width)"/> + <param name="histo_sn_ratio" type="float" optional="true" label="META-VELVETG - Signal-noise ratio to remove peak noises. Default: 10 (-histo_sn_ratio)"/> + + </inputs> + + <outputs> + + <data format="fasta" name="meta_velvet_contigs" from_work_dir="meta-velvetg.contigs.fa" label="${tool.name} on ${on_string}: meta-velvetg.contigs.fasta"> + <filter>(meta == '')</filter> + </data> + + <data format="fasta" name="velvet_contigs" from_work_dir="contigs.fa" label="${tool.name} on ${on_string}: contigs.fasta"> + <filter>(meta == '-nometa')</filter> + </data> + + <data format="fasta" name="velvet_singlets" from_work_dir="Singlets.fasta" label="${tool.name} on ${on_string}: singlets.fasta"> + <filter>(unused_reads == '-unused_reads yes')</filter> + </data> + + <data format="txt" name="meta-velvetg.asm.afg" from_work_dir="meta-velvetg.asm.afg" label="${tool.name} on ${on_string}: meta-velvetg.asm.afg"> + <filter>((meta == '') and (amos_file == '-amos_file yes'))</filter> + </data> + + <data format="txt" name="velvet_asm.afg" from_work_dir="velvet_asm.afg" label="${tool.name} on ${on_string}: velvet_asm.afg"> + <filter>((meta == '-nometa') and (amos_file == '-amos_file yes'))</filter> + </data> + + <data format="tabular" name="stats.txt" from_work_dir="stats.txt" label="${tool.name} on ${on_string}: stats.txt"> + <filter>(meta == '-nometa')</filter> + </data> + + <data format="tabular" name="meta-velvetg.split-stats.txt" from_work_dir="meta-velvetg.split-stats.txt" label="${tool.name} on ${on_string}: meta-velvetg.split-stats.txt"> + <filter>(meta == '')</filter> + </data> + + <data format="txt" name="LastGraph" from_work_dir="LastGraph" label="${tool.name} on ${on_string}: LastGraph"> + <filter>(meta == '-nometa')</filter> + </data> + + <data format="txt" name="meta-velvetg.LastGraph" from_work_dir="meta-velvetg.LastGraph" label="${tool.name} on ${on_string}: meta-velvetg.LastGraph"> + <filter>(meta == '')</filter> + </data> + + <data format="tabular" name="meta-velvetg.Graph2-stats.txt" from_work_dir="meta-velvetg.Graph2-stats.txt" label="${tool.name} on ${on_string}: meta-velvetg.Graph2-stats.txt"> + <filter>(meta == '')</filter> + </data> + + </outputs> + +</tool>