Mercurial > repos > iuc > artic_guppyplex

<tool id="artic_guppyplex" name="ARTIC guppyplex" version="@PACKAGE_VERSION@+galaxy2" profile="20.09">
    <description>Filter Nanopore reads by read length and (optionally) quality</description>
    <macros>
        <import>macros.xml</import>
    </macros>
    <requirements>
        <requirement type="package" version="@PACKAGE_VERSION@">artic</requirement>
    </requirements>
    <command detect_errors="exit_code">
    <![CDATA[
        ## Compression handling: guppyplex calls mimetypes.guess_type on each
        ## input file name to decide whether the file is compressed, so every
        ## link created in inputs/ has to carry the right suffix. Its output is
        ## always written uncompressed, even for compressed input, which is
        ## why compression of the result is handled as a separate step at the
        ## end of this command.

        ## Stage the inputs: prepare_inputs.sh symlinks each selected dataset
        ## into inputs/ under an appropriately suffixed name.
        mkdir inputs &&
        bash prepare_inputs.sh &&

        ## Pick the dataset whose datatype decides about output compression:
        ## the single input, or the first one when several were selected.
        #if str($input.structure) == 'one_to_one':
            #set $probe = $input.reads
        #else:
            #set $probe = next(iter($input.reads))
        #end if
        #set $compressed = $probe.is_of_type("fastq.gz", "fastqsanger.gz")

        artic guppyplex
            --min-length $min_length
            --max-length $max_length
        #if $min_quality == 0:
            ## a minimum quality of 0 switches the quality filter off
            --skip-quality-check
        #else:
            --quality $min_quality
        #end if
            --directory inputs/
            --output guppyplex_out.fastq
        #if $compressed:
            ## compressed input: compress the result as well
            && gzip guppyplex_out.fastq
        #end if
    ]]>
    </command>
    <configfiles>
        <!-- Shell script, run from the command section, that symlinks the
        selected datasets into inputs/. Each link name ends in the datatype
        extension of the dataset it points to. -->
        <configfile filename="prepare_inputs.sh"><![CDATA[
            #if str($input.structure) == 'one_to_one':
                ## a single dataset is linked under a fixed base name
ln -s '$input.reads' inputs/1.${input.reads.ext}
            #else:
                ## several datasets: links are numbered by position, and each
                ## link command is chained to the next one
                #for $idx, $dataset in enumerate($input.reads):
ln -s '$dataset' inputs/${idx}.${dataset.ext} &&
                #end for
                ## no-op command that terminates the chain built by the loop
:
            #end if
        ]]>
        </configfile>
    </configfiles>
    <inputs>
        <!-- How the selected datasets map to samples. Both branches expose
        the datasets under the same parameter name, reads, so the command and
        the output definition can refer to it regardless of the branch. -->
        <conditional name="input">
            <param name="structure" type="select"
            label="Structure of your input data"
            help="">
                <option value="one_to_one">One input dataset per sample</option>
                <option value="one_to_many">Multiple input datasets per sample</option>
            </param>
            <when value="one_to_one">
                <param name="reads" type="data" format="@FASTQ_FORMATS@"
                label="Sequencing dataset(s) - one per sample" />
            </when>
            <when value="one_to_many">
                <param name="reads" multiple="true" type="data" format="@FASTQ_FORMATS@"
                label="Partial sequencing datasets for your sample"
                help="Multiple datasets selected here will get combined into a single output for a single assumed sample. Select a nested list to have its inner lists interpreted as data from one sample each and to obtain one output per inner list." />
            </when>
        </conditional>
        <!-- Read length window, handed to guppyplex as its max-length and
        min-length options. A read length cannot be negative, so both bounds
        reject negative values, in line with min_quality below. -->
        <param name="max_length" type="integer" min="0" label="Remove reads longer than" value="700" help="remove reads greater than this number of base pairs" />
        <param name="min_length" type="integer" min="0" label="Remove reads shorter than" value="400" help="remove reads less than this number of base pairs" />
        <!-- A value of 0 makes the command skip the quality check entirely. -->
        <param name="min_quality" type="integer" min="0" value="7"
        label="Eliminate reads with a mean base quality score of less than"
        help="Set to 0 to skip the quality check." />
    </inputs>
    <outputs>
        <!-- The command writes guppyplex_out.fastq and, for compressed input,
        gzips it to guppyplex_out.fastq.gz; the trailing * lets one pattern
        cover both names. The datatype is taken over from the reads input. -->
        <data name="output"
              format_source="reads"
              from_work_dir="guppyplex_out.fastq*" />
    </outputs>
    <tests>
        <!-- one_to_one branch: a single uncompressed dataset, all filter
        settings left at their defaults -->
        <test>
            <conditional name="input">
                <param name="structure" value="one_to_one" />
                <param name="reads" value="test.fastq" />
            </conditional>
            <output name="output" file="gupplyplex_output.fastq" />
        </test>
        <!-- one_to_many branch: the same dataset is passed twice. guppyplex
        drops duplicate reads, so the expected output of the first test can
        be reused and no extra test file is needed for this branch. -->
        <test>
            <conditional name="input">
                <param name="structure" value="one_to_many" />
                <param name="reads" value="test.fastq,test.fastq" />
            </conditional>
            <output name="output" file="gupplyplex_output.fastq" />
        </test>
    </tests>
    <help><![CDATA[
        The ARTIC_ guppyplex tool filters reads by length and (optionally) quality.
        This filter is typically used as a pre-processing step in the processing
        of amplicon sequencing Nanopore reads, where a size-based filter can
        be used to remove possibly-chimeric reads.

        The default parameters of the tool (minimum length of 400 and maximum of 700)
        are based on the ARTIC amplicon scheme. If used with a different amplicon
        scheme they should be adjusted to use the minimum length of an amplicon as
        the minimum length and the maximum length of an amplicon plus 200 as the
        maximum length.

        The tool can also be used simultaneously to gather partial fastq
        datasets into single datasets per sample.

        .. _ARTIC: https://artic.readthedocs.io/en/latest/
    ]]></help>
    <expand macro="citations" />
</tool>
author	iuc
date	Mon, 31 Jan 2022 10:12:54 +0000
parents	5ceeb5a5d70f
children