Mercurial > repos > lparsons > ea_utils
annotate fastq-join.xml @ 0:e6f1c31279db draft
Initial version with fastq-join
author | Lance Parsons <lparsons@princeton.edu> |
---|---|
date | Thu, 20 Sep 2012 18:59:38 -0400 |
parents | |
children |
rev | line source |
---|---|
0
e6f1c31279db
Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff
changeset
|
1 <tool id="fastq_join" name="fastq-join" version="0.1"> |
e6f1c31279db
Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff
changeset
|
2 <description> - Joins two paired-end reads on the overlapping ends</description> |
e6f1c31279db
Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff
changeset
|
3 <requirements> |
e6f1c31279db
Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff
changeset
|
4 <requirement type="package" version="1.1.2-469">ea-utils</requirement> |
e6f1c31279db
Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff
changeset
|
5 </requirements> |
e6f1c31279db
Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff
changeset
|
6 <command> |
e6f1c31279db
Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff
changeset
|
7 fastq-join |
e6f1c31279db
Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff
changeset
|
8 -v '$splitChar' |
e6f1c31279db
Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff
changeset
|
9 -p $pctMaxDiff |
e6f1c31279db
Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff
changeset
|
10 -m $minOverlap |
e6f1c31279db
Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff
changeset
|
11 #if $stitchLengthReport: |
e6f1c31279db
Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff
changeset
|
12 -r $outputStitchLengthReport |
e6f1c31279db
Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff
changeset
|
13 #end if |
e6f1c31279db
Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff
changeset
|
14 $read1 |
e6f1c31279db
Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff
changeset
|
15 $read2 |
e6f1c31279db
Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff
changeset
|
16 -o $outputUnmatched1 -o $outputUnmatched2 -o $outputJoined |
e6f1c31279db
Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff
changeset
|
17 </command> |
e6f1c31279db
Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff
changeset
|
18 <inputs> |
e6f1c31279db
Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff
changeset
|
19 <param format="fastq, fastqillumina, fastqsanger, fastqsolexa" name="read1" type="data" label="Read 1 Fastq" /> |
e6f1c31279db
Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff
changeset
|
20 <param format="fastq, fastqillumina, fastqsanger, fastqsolexa" name="read2" type="data" label="Read 2 Fastq" /> |
e6f1c31279db
Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff
changeset
|
21 <param name="splitChar" type="text" value=" " label="Split read ids on this character" help="Default is space ' ' for Illumina reads" /> |
e6f1c31279db
Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff
changeset
|
22 <param name="pctMaxDiff" type="float" value="8" min="0" max="100" label="Maximum percentage difference between matching segments" /> |
e6f1c31279db
Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff
changeset
|
23 <param name="minOverlap" type="integer" value="6" min="1" label="Minimum length of matching segments" /> |
e6f1c31279db
Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff
changeset
|
24 <!-- Unchecked by default; when checked, the command adds -r and the stitch length report output is produced. --> <param name="stitchLengthReport" type="boolean" checked="false" label="Output verbose stitch length report" /> |
e6f1c31279db
Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff
changeset
|
25 </inputs> |
e6f1c31279db
Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff
changeset
|
26 |
e6f1c31279db
Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff
changeset
|
27 <outputs> |
e6f1c31279db
Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff
changeset
|
28 <data format="input" format_source="read1" name="outputJoined" label="${tool.name} on ${on_string} (joined)"/> |
e6f1c31279db
Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff
changeset
|
29 <data format="input" format_source="read1" name="outputUnmatched1" label="${tool.name} on ${on_string} (unmatched1)"/> |
e6f1c31279db
Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff
changeset
|
30 <data format="input" format_source="read2" name="outputUnmatched2" label="${tool.name} on ${on_string} (unmatched2)"/> |
e6f1c31279db
Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff
changeset
|
31 <data format="tabular" name="outputStitchLengthReport" label="${tool.name} on ${on_string} (stitch length report)"> |
e6f1c31279db
Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff
changeset
|
32 <filter>stitchLengthReport</filter> |
e6f1c31279db
Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff
changeset
|
33 </data> |
e6f1c31279db
Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff
changeset
|
34 </outputs> |
e6f1c31279db
Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff
changeset
|
35 |
e6f1c31279db
Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff
changeset
|
36 <stdio> |
e6f1c31279db
Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff
changeset
|
37 <exit_code range="1:" level="fatal" description="Unknown error occurred" /> |
e6f1c31279db
Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff
changeset
|
38 </stdio> |
e6f1c31279db
Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff
changeset
|
39 |
e6f1c31279db
Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff
changeset
|
40 <tests> |
e6f1c31279db
Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff
changeset
|
41 <test> |
e6f1c31279db
Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff
changeset
|
42 <param name="read1" value="test_read1.fastq" /> |
e6f1c31279db
Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff
changeset
|
43 <param name="read2" value="test_read3.fastq" /> |
e6f1c31279db
Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff
changeset
|
44 <output name="outputJoined" file="testout.join.fastq" /> |
e6f1c31279db
Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff
changeset
|
45 <output name="outputUnmatched1" file="testout.un1.fastq" /> |
e6f1c31279db
Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff
changeset
|
46 <output name="outputUnmatched2" file="testout.un2.fastq" /> |
e6f1c31279db
Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff
changeset
|
47 </test> |
e6f1c31279db
Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff
changeset
|
48 </tests> |
e6f1c31279db
Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff
changeset
|
49 |
e6f1c31279db
Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff
changeset
|
50 <help> |
e6f1c31279db
Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff
changeset
|
51 Overview |
e6f1c31279db
Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff
changeset
|
52 -------- |
e6f1c31279db
Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff
changeset
|
53 fastq-join joins two paired-end reads on the overlapping ends. |
e6f1c31279db
Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff
changeset
|
54 |
e6f1c31279db
Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff
changeset
|
55 Split read ids character: Verifies that the read ids in the 2 files match up to this character. Use ' ' for Illumina reads. |
e6f1c31279db
Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff
changeset
|
56 |
e6f1c31279db
Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff
changeset
|
57 Maximum difference is the maximum allowed percentage of bases that differ in the matching region. |
e6f1c31279db
Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff
changeset
|
58 |
e6f1c31279db
Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff
changeset
|
59 Minimum overlap is the minimum number of bases that must overlap (with no more than the maximum difference) for reads to be joined. |
e6f1c31279db
Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff
changeset
|
60 |
e6f1c31279db
Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff
changeset
|
61 Verbose stitch length report is a report for each joined pair of reads showing how large the overlapping section was. |
e6f1c31279db
Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff
changeset
|
62 |
e6f1c31279db
Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff
changeset
|
63 This tool uses sqr(distance)/len as its anchored alignment quality algorithm. It's a good measure of anchored alignment quality, akin to squared-deviation for means. This tool uses the fastq-join program that is part of the ea-utils suite. See http://code.google.com/p/ea-utils/wiki/FastqJoin for details. |
e6f1c31279db
Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff
changeset
|
64 </help> |
e6f1c31279db
Initial version with fastq-join
Lance Parsons <lparsons@princeton.edu>
parents:
diff
changeset
|
65 </tool> |