annotate fastq-join.xml @ 0:e6f1c31279db draft

Initial version with fastq-join
author Lance Parsons <lparsons@princeton.edu>
date Thu, 20 Sep 2012 18:59:38 -0400
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
e6f1c31279db Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff changeset
1 <tool id="fastq_join" name="fastq-join" version="0.1">
e6f1c31279db Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff changeset
2 <description> - Joins two paired-end reads on the overlapping ends</description>
e6f1c31279db Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff changeset
3 <requirements>
e6f1c31279db Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff changeset
4 <requirement type="package" version="1.1.2-469">ea-utils</requirement>
e6f1c31279db Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff changeset
5 </requirements>
e6f1c31279db Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff changeset
6 <command>
e6f1c31279db Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff changeset
7 fastq-join
e6f1c31279db Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff changeset
8 -v '$splitChar'
e6f1c31279db Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff changeset
9 -p $pctMaxDiff
e6f1c31279db Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff changeset
10 -m $minOverlap
e6f1c31279db Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff changeset
11 #if $stitchLengthReport:
e6f1c31279db Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff changeset
12 -r $outputStitchLengthReport
e6f1c31279db Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff changeset
13 #end if
e6f1c31279db Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff changeset
14 $read1
e6f1c31279db Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff changeset
15 $read2
e6f1c31279db Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff changeset
16 -o $outputUnmatched1 -o $outputUnmatched2 -o $outputJoined
e6f1c31279db Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff changeset
17 </command>
e6f1c31279db Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff changeset
18 <inputs>
e6f1c31279db Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff changeset
19 <param format="fastq, fastqillumina, fastqsanger, fastqsolexa" name="read1" type="data" label="Read 1 Fastq" />
e6f1c31279db Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff changeset
20 <param format="fastq, fastqillumina, fastqsanger, fastqsolexa" name="read2" type="data" label="Read 2 Fastq" />
e6f1c31279db Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff changeset
21 <param name="splitChar" type="text" value=" " label="Split read ids on this character" help="Default is space ' ' for Illumina reads" />
e6f1c31279db Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff changeset
22 <param name="pctMaxDiff" type="float" value="8" min="0" max="100" label="Maximum percentage difference between matching segments" />
e6f1c31279db Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff changeset
23 <param name="minOverlap" type="integer" value="6" min="1" label="Minimum length of matching segments" /> <!-- passed to fastq-join as -m in the command template -->
e6f1c31279db Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff changeset
24 <param name="stitchLengthReport" type="boolean" value="False" label="Output verbose stitch length report" />
e6f1c31279db Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff changeset
25 </inputs>
e6f1c31279db Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff changeset
26
e6f1c31279db Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff changeset
27 <outputs>
e6f1c31279db Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff changeset
28 <data format="input" format_source="read1" name="outputJoined" label="${tool.name} on ${on_string} (joined)"/>
e6f1c31279db Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff changeset
29 <data format="input" format_source="read1" name="outputUnmatched1" label="${tool.name} on ${on_string} (unmatched1)"/>
e6f1c31279db Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff changeset
30 <data format="input" format_source="read2" name="outputUnmatched2" label="${tool.name} on ${on_string} (unmatched2)"/>
e6f1c31279db Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff changeset
31 <data format="tabular" name="outputStitchLengthReport" label="${tool.name} on ${on_string} (stitch length report)">
e6f1c31279db Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff changeset
32 <filter>stitchLengthReport</filter>
e6f1c31279db Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff changeset
33 </data>
e6f1c31279db Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff changeset
34 </outputs>
e6f1c31279db Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff changeset
35
e6f1c31279db Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff changeset
36 <stdio>
e6f1c31279db Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff changeset
37 <exit_code range="1:" level="fatal" description="Unknown error occurred" />
e6f1c31279db Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff changeset
38 </stdio>
e6f1c31279db Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff changeset
39
e6f1c31279db Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff changeset
40 <tests>
e6f1c31279db Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff changeset
41 <test>
e6f1c31279db Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff changeset
42 <param name="read1" value="test_read1.fastq" />
e6f1c31279db Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff changeset
43 <param name="read2" value="test_read3.fastq" />
e6f1c31279db Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff changeset
44 <output name="outputJoined" file="testout.join.fastq" />
e6f1c31279db Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff changeset
45 <output name="outputUnmatched1" file="testout.un1.fastq" />
e6f1c31279db Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff changeset
46 <output name="outputUnmatched2" file="testout.un2.fastq" />
e6f1c31279db Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff changeset
47 </test>
e6f1c31279db Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff changeset
48 </tests>
e6f1c31279db Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff changeset
49
e6f1c31279db Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff changeset
50 <help>
e6f1c31279db Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff changeset
51 Overview
e6f1c31279db Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff changeset
52 --------
e6f1c31279db Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff changeset
53 fastq-join joins two paired-end reads on the overlapping ends.
e6f1c31279db Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff changeset
54
e6f1c31279db Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff changeset
55 Split read ids character: verifies that the read ids in the two files match up to this character. Use ' ' for Illumina reads.
e6f1c31279db Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff changeset
56
e6f1c31279db Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff changeset
57 Maximum difference is the maximum allowed percentage of bases that differ in the matching region.
e6f1c31279db Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff changeset
58
e6f1c31279db Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff changeset
59 Minimum overlap is the minimum number of bases that must overlap (with no more than the maximum difference) for reads to be joined.
e6f1c31279db Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff changeset
60
e6f1c31279db Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff changeset
61 Verbose stitch length report is a report for each joined pair of reads showing how large the overlapping section was.
e6f1c31279db Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff changeset
62
e6f1c31279db Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff changeset
63 This tool scores anchored alignments using sqr(distance)/len, a good measure of anchored alignment quality, akin to squared-deviation for means. This tool uses the fastq-join program that is part of the ea-utils suite. See http://code.google.com/p/ea-utils/wiki/FastqJoin for details.
e6f1c31279db Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff changeset
64 </help>
e6f1c31279db Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff changeset
65 </tool>