view fastq-join.xml @ 2:b007d9642911 draft

planemo upload for repository commit 1a3c419bc0ded7c40cb2bc3e7c87bfb01ddfeba2
author lparsons
date Thu, 16 Jul 2015 17:36:11 -0400
parents 593a729e5706
children 8ec3dfde378b
line wrap: on
line source

<tool id="fastq_join" name="fastq-join" version="1.1.2-806">
    <description> - Joins two paired-end reads on the overlapping ends</description>

        <requirement type="package" version="1.1.2-806">ea-utils</requirement>

        <exit_code range="1:" level="fatal" description="Unknown error occurred" />

        -v '$splitChar'
        -p $pctMaxDiff
        -m $minOverlap
        #if $stitchLengthReport:
        -r $outputStitchLengthReport
        #end if
        -o $outputUnmatched1 -o $outputUnmatched2 -o $outputJoined

        <param format="fastq, fastqillumina, fastqsanger, fastqsolexa" name="read1" type="data" label="Read 1 Fastq" />
        <param format="fastq, fastqillumina, fastqsanger, fastqsolexa" name="read2" type="data" label="Read 2 Fastq" />
        <param name="splitChar" type="text" value=" " label="Split read ids on this character" help="Default is space ' ' for Illumina reads" />
        <param name="pctMaxDiff" type="float" value="8" min="0" max="100" label="Maximum percentage difference between matching segments" />
        <param name="minOverlap" type="integer" value="6" min="1" label="Minimum length of matching segements" />
        <param name="stitchLengthReport" type="boolean" value="False" label="Output verbose stitch length report" />

        <data format_source="read1" name="outputJoined" label="${} on ${on_string} (joined)"/>
        <data format_source="read1" name="outputUnmatched1" label="${} on ${on_string} (unmatched1)"/>
        <data format_source="read2" name="outputUnmatched2" label="${} on ${on_string} (unmatched2)"/>
        <data format="tabular" name="outputStitchLengthReport" label="${} on ${on_string} (stitch length report)">

            <param name="read1" value="test_read1.fastq" />
            <param name="read2" value="test_read3.fastq" />
            <output name="outputJoined" file="testout.join.fastq" />
            <output name="outputUnmatched1" file="testout.un1.fastq" />
            <output name="outputUnmatched2" file="testout.un2.fastq" />

fastq-join joins two paired-end reads on the overlapping ends.

Split read ids character: Verifies that the 2 files probe id's match up to char C. Use ' ' for Illumina reads.

Maximum difference is the maximum allowed percentage of bases that differ in the matching region.

Minimum overlap is the minimum number of bases that must overlap (with no more than the maximum difference) for reads to be joined.

Verbose stitch length report is a report for each joined paired of reads showing how large the overlapping section was.

This tool uses sqr(distance)/len for anchored alignment quality algorithm. It's a good measure of anchored alignment quality, akin to squared-deviation for means.  This tool uses the fastq-join program that is part of the ea-utils suite. See for details.

        <citation type="bibtex">
                title = {Comparison of {Sequencing} {Utility} {Programs}},
                volume = {7},
                issn = {18750362},
                url = {},
                doi = {10.2174/1875036201307010001},
                language = {en},
                number = {1},
                urldate = {2015-07-10},
                journal = {The Open Bioinformatics Journal},
                author = {Aronesty, Erik},
                month = jan,
                year = {2013},
                pages = {1--8}