comparison split_libraries.xml @ 0:e5c3175506b7 default tip

Initial tool configs for qiime, most need work.
author Jim Johnson <jj@umn.edu>
date Sun, 17 Jul 2011 10:30:11 -0500
parents
children
comparison
equal deleted inserted replaced
-1:000000000000 0:e5c3175506b7
1 <tool id="split_libraries" name="split_libraries" version="1.2.1">
2 <description>Split libraries according to barcodes specified in mapping file</description>
3 <requirements>
4 <requirement type="binary">split_libraries.py</requirement>
5 </requirements>
6 <command interpreter="python">
7 qiime_wrapper.py
8 --galaxy_tmpdir='$__new_file_path__'
9 --galaxy_datasets='^seqs.fna$:'$sequences,'histograms.txt:'$histograms,'split_library_log.txt:'$log
10 split_libraries.py
11 --map=$map
12 #set fnas = []
13 #for i in $inputs:
14 #set fnas = $fnas + [$i.fasta.__str__]
15 #end for
16 --fasta=#echo ','.join($fnas)
17 #set quals = []
18 #for i in $inputs:
19 #if $i.qual != None and $i.qual.__str__ != 'None':
20 #set quals = $quals + [$i.qual.__str__]
21 #end if
22 #end for
23 #if len($quals) > 0:
24 --qual=#echo ','.join($quals)
25 #end if
26 #if len($min_seq_length.__str__) > 0 and $min_seq_length > 0:
27 --min-seq-length=$min_seq_length
28 #end if
29 #if len($max_seq_length.__str__) > 0:
30 --max-seq-length=$max_seq_length
31 #end if
32 $trim_seq_length
33 #if len($min_qual_score.__str__) > 0:
34 --min-qual-score=$min_qual_score
35 #end if
36 $keep_primer
37 $keep_barcode
38 #if len($max_ambig.__str__) > 0:
39 --max-ambig=$max_ambig
40 #end if
41 #if len($max_homopolymer.__str__) > 0:
42 --max-homopolymer=$max_homopolymer
43 #end if
44 #if len($max_primer_mismatch.__str__) > 0:
45 --max-primer-mismatch=$max_primer_mismatch
46 #end if
47 --barcode-type=$barcode_type
48 ## --dir-prefix=$dir_prefix
49 #if $max_barcode_errors >= 0.:
50 --max-barcode-errors=$max_barcode_errors
51 #end if
52 #if len($start_numbering_at.__str__) > 0:
53 --start-numbering-at=$start_numbering_at
54 #end if
55 $remove_unassigned
56 $disable_bc_correction
57 #if len($qual_score_window.__str__) > 0:
58 --qual_score_window=$qual_score_window
59 #end if
60 $disable_primers
61 --reverse_primers=$reverse_primers
62 $record_qual_scores
63 $discard_bad_windows
64 </command>
65 <inputs>
66 <param name="map" type="data" format="tabular" label="map"
67 help="name of mapping file. NOTE: Must contain a header line indicating SampleID in the first column and BarcodeSequence in the second, LinkerPrimerSequence in the third. [REQUIRED]"/>
68 <repeat name="inputs" title="Input Sequences">
69 <param name="fasta" type="data" format="fasta" label="fasta"
70 help="names of fasta files, comma-delimited [REQUIRED]"/>
71 <param name="qual" type="data" format="qual" label="qual"
72 help="names of qual files, comma-delimited [default: ('NO', 'DEFAULT')]"/>
73 </repeat>
74 <param name="min_seq_length" type="integer" optional="true" value="200" label="min-seq-length"
75 help="minimum sequence length, in nucleotides [default: 200]"/>
76 <param name="max_seq_length" type="integer" optional="true" value="1000" label="max-seq-length"
77 help="maximum sequence length, in nucleotides [default: 1000]"/>
78 <param name="trim_seq_length" type="boolean" truevalue="--trim-seq-length" falsevalue="" checked="false" label="trim-seq-length"
79 help="calculate sequence lengths after trimming primers and barcodes [default: False]"/>
80 <param name="min_qual_score" type="integer" optional="true" value="25" label="min-qual-score"
81 help="min average qual score allowed in read [default: 25]"/>
82 <param name="keep_primer" type="boolean" truevalue="--keep-primer" falsevalue="" checked="false" label="keep-primer"
83 help="do not remove primer from sequences"/>
84 <param name="keep_barcode" type="boolean" truevalue="--keep-barcode" falsevalue="" checked="false" label="keep-barcode"
85 help="do not remove barcode from sequences"/>
86 <param name="max_ambig" type="integer" optional="true" value="0" label="max-ambig"
87 help="maximum number of ambiguous bases [default: 0]"/>
88 <param name="max_homopolymer" type="integer" optional="true" value="6" label="max-homopolymer"
89 help="maximum length of homopolymer run [default: 6]"/>
90 <param name="max_primer_mismatch" type="integer" optional="true" value="0" label="max-primer-mismatch"
91 help="maximum number of primer mismatches [default: 0]"/>
92 <param name="barcode_type" type="text" value="golay_12" label="barcode-type"
93 help="barcode type, hamming_8, golay_12, variable_length (will disable any barcode correction if variable_length set), or a number representing the length of the barcode, such as -b 4. [default: golay_12]"/>
94 <!-- Not needed in galaxy
95 <param name="dir_prefix" type="text" value="." label="dir-prefix"
96 help="directory prefix for output files [default: .]"/>
97 -->
98 <param name="max_barcode_errors" type="float" optional="true" value="1.5" label="max-barcode-errors"
99 help="maximum number of errors in barcode [default: 1.5]"/>
100 <param name="start_numbering_at" type="integer" optional="true" min="1" value="1" label="start-numbering-at"
101 help="seq id to use for the first sequence [default: 1]"/>
102 <param name="remove_unassigned" type="boolean" truevalue="--remove_unassigned" falsevalue="" checked="false" label="remove_unassigned"
103 help="remove sequences which are Unassigned from output [default: False]"/>
104 <param name="disable_bc_correction" type="boolean" truevalue="--disable_bc_correction" falsevalue="" checked="false" label="disable_bc_correction"
105 help="Disable attempts to find nearest corrected barcode. Can improve performance. [default: False]"/>
106 <param name="qual_score_window" type="integer" optional="true" value="0" label="qual_score_window"
107 help="Enable sliding window test of quality scores. If the average score of a continuous set of w nucleotides falls below the threshold (see -s for default), the sequence is discarded. A good value would be 50. 0 (zero) means no filtering. Must pass a .qual file (see -q parameter) if this functionality is enabled. [default: 0]"/>
108 <param name="discard_bad_windows" type="boolean" truevalue="--discard_bad_windows" falsevalue="" checked="false" label="discard_bad_windows"
109 help="If the qual_score_window option (-w) is enabled, this will override the default truncation behavior and discard any sequences where a bad window is found. [default: False]"/>
110 <param name="disable_primers" type="boolean" truevalue="--disable_primers" falsevalue="" checked="false" label="disable_primers"
111 help="Disable primer usage when demultiplexing. Should be enabled for unusual circumstances, such as analyzing Sanger sequence data generated with different primers. [default: False]"/>
112 <param name="reverse_primers" type="select" label="reverse_primers"
113 help="Enable removal of the reverse primer and any subsequence sequence from the end of each read. To enable this, there has to be a 'ReversePrimer' column in the mapping file. Primers a required to be in IUPAC format and written in the 5' to 3' direction. Valid options are 'disable', 'truncate_only', and 'truncate_remove'. 'truncate_only' will remove the primer and subsequence sequence data from the output read and will not alter output of sequences where the primer cannot be found. 'truncate_remove' will flag sequences where the primer cannot be found to not be written and will record the quantity of such failed sequences in the log file. [default: disable]">
114 <option value="disable" >disable</option>
115 <option value="truncate_only">truncate_only</option>
116 <option value="truncate_remove">truncate_remove</option>
117 </param>
118 <param name="record_qual_scores" type="boolean" truevalue="--record_qual_scores" falsevalue="" checked="false" label="record_qual_scores"
119 help="Enables recording of quality scores for all sequences that are recorded. If this option is enabled, a file named seqs_filtered.qual will be created in the output directory, and will contain the same sequence IDs in the seqs.fna file and sequence quality scores matching the bases present in the seqs.fna file. [default: False]"/>
120 </inputs>
121 <outputs>
122 <data format="txt" name="log" label="${tool.name} on ${on_string}: log" />
123 <data format="txt" name="histograms" label="${tool.name} on ${on_string}: histograms"/>
124 <data format="fasta" name="sequences" label="${tool.name} on ${on_string}: fasta"/>
125 </outputs>
126 <tests>
127 </tests>
128 <help>
129
130 </help>
131 </tool>
132