comparison barcode_splitter-bc23f6946bb8/fastx_barcode_splitter.xml @ 0:2b6d577dd1ab default tip

Uploaded
author bccarstens
date Mon, 16 Jan 2012 22:38:10 -0500
parents
children
comparison
equal deleted inserted replaced
-1:000000000000 0:2b6d577dd1ab
1 <tool id="cshl_fastx_barcode_splitter" name="Barcode Splitter" force_history_refresh="True">
2 <description></description>
3 <requirements><requirement type="package">fastx_toolkit</requirement></requirements>
4 <command interpreter="python">fastx_barcode_splitter_galaxy_wrapper.py
5 ## params for galaxy wrapper
6 $output
7 "$output.id"
8 "$input.ext"
9 "$__new_file_path__"
10 --barcodes='$barcodes'
11 $BARCODE $input "$input.name" "$output.extra_files_path"
12 ## params for fastx_barcode_splitter
13 --mismatches $mismatches --partial $partial $EOL
14 </command>
15
16 <inputs>
17 <param format="txt" name="BARCODE" type="data" label="Barcodes to use" />
18 <param format="fasta,fastqsanger,fastqsolexa,fastqillumina" name="input" type="data" label="Library to split" />
19
20 <param name="EOL" type="select" label="Barcodes found at">
21 <option value="--bol">Start of sequence (5' end)</option>
22 <option value="--eol">End of sequence (3' end)</option>
23 </param>
24
25 <param name="mismatches" type="integer" size="3" value="2" label="Number of allowed mismatches" />
26
27 <param name="partial" type="integer" size="3" value="0" label="Number of allowed barcodes nucleotide deletions" />
28
29 <param name="barcodes" type="select" multiple="true" label="Select barcodes to add as new datasets to history">
30 <options from_dataset="BARCODE">
31 <column name="name" index="0"/>
32 <column name="value" index="0"/>
33 <filter type="unique_value" name="unq_bc" column="0" />
34 <filter type="add_value" name="unmatched" value="unmatched"/>
35 </options>
36 </param>
37 </inputs>
38
39 <outputs>
40 <data format="html" name="output" />
41 </outputs>
42
43 <tests>
44 <test>
45 <!-- Split a FASTQ file -->
46 <param name="BARCODE" value="fastx_barcode_splitter1.txt" />
47 <param name="input" value="fastx_barcode_splitter1.fastq" ftype="fastqsolexa" />
48 <param name="EOL" value="Start of sequence (5' end)" />
49 <param name="mismatches" value="2" />
50 <param name="partial" value="0" />
51 <output name="output" file="fastx_barcode_splitter1.out" />
52 </test>
53 </tests>
54
55 <help>
56
57 **What it does**
58
59 This tool splits a Solexa library (FASTQ file) or a regular FASTA file into several files, using barcodes as the split criteria.
60
61 --------
62
63 **Barcode file Format**
64
65 Barcode files are simple text files.
66 Each line should contain an identifier (descriptive name for the barcode), and the barcode itself (A/C/G/T), separated by a TAB character.
67 Example::
68
69 #This line is a comment (starts with a 'number' sign)
70 BC1 GATCT
71 BC2 ATCGT
72 BC3 GTGAT
73 BC4 TGTCT
74
75 For each barcode, a new FASTQ file will be created (with the barcode's identifier as part of the file name).
76 Sequences matching the barcode will be stored in the appropriate file.
77
78 One additional FASTQ file will be created (the 'unmatched' file), where sequences not matching any barcode will be stored.
79
80 The output of this tool is an HTML file, displaying the split counts and the file locations.
81
82 **Output Example**
83
84 .. image:: ./static/fastx_icons/barcode_splitter_output_example.png
85
86 </help>
87 </tool>
88 <!-- FASTX-barcode-splitter is part of the FASTX-toolkit, by A.Gordon (gordon@cshl.edu) -->