view prophage_relatedness.xml @ 1:7ba8b1f0fdf0 draft default tip

planemo upload commit f8aa1f8dc7acaa1187d197da50a3eb21ad4b6dc9-dirty
author cpt
date Sun, 11 Aug 2024 22:26:57 +0000
parents 7a23dda2e932
children
line wrap: on
line source

<tool id="edu.tamu.cpt2.phage.relatedProphages" name="Related Prophages tool" version="21.1.0.0">
    <description/>
    <macros>
        <import>macros.xml</import>
    </macros>
    <requirements>
        <requirement type="package" version="3.7">python</requirement>
        <requirement type="package" version="1.77">biopython</requirement>
    </requirements>
    <command detect_errors="aggressive"><![CDATA[
    python $__tool_directory__/prophage_relatedness.py
    '${blastIn.blast}'
    --outFile '$output'
    --padding '$padding'
    --cutoff '$cutoff'
    --numReturn '$returns'
    #if '$blastIn.blastType' == "TSV":
    --isTSV
    #end if
]]></command>
    <inputs>
        <conditional name="blastIn">
            <param name="blastType" type="select" label="Blastn Input Type">
                <option value="XML" selected="true">Blast XML</option>
                <option value="TSV">Blast 25-Column Tabular</option>
            </param>
            <when value="XML">
                <param label="Blastn Results (Blast XML)" name="blast" type="data" format="blastxml"/>
            </when>
            <when value="TSV">
                <param label="Blastn Results (Blast 25-Column Tabular)" name="blast" type="data" format="tsv, tabular"/>
            </when>
        </conditional>
        <param label="Cluster Window" name="padding" type="text" value="2.0" help="Nucleotide window for HSPs to form a cluster (Multiplicative of length of query sequence)"/>
        <param label="Score cutoff" name="cutoff" type="text" value=".3"/>
        <param label="Number of Results to return" name="returns" type="integer" value="20"/>
    </inputs>
    <outputs>
        <data format="tabular" name="output" label="Top related prophages"/>
    </outputs>
    <tests/>
    <help><![CDATA[
**What it does**

Filters BLAST results for high-scoring clusters of HSPs.

The script first determines a window of X nucleotide bases, where X is the length of the query multiplied by the value supplied in the cluster window input. Then for each hit in the blast record, the high scoring pairs are sorted into sets based on the number of HSPs which would fall within that window.&ast; Finally, the total number of identities in the set is divided by the query length, and this score is used to return the top results. If a set would make it into the final results, any other HSP sets from that same hit will also be returned.

&ast; Sets are formed with a greedy method, where creating a set with the largest possible number of HSPs is the first action, then the next set is the largest possible number of HSPs that is also disjoint from the first, and so on until all HSPs are in a set.

      ]]></help>
    <expand macro="citations-2020-AJC-solo"/>
</tool>