view clean_dante_ltr.xml @ 7:c33d6583e548 draft

"planemo upload commit 50884f7f0269a0bbde078f24fe5020975693bcd9"
author petr-novak
date Fri, 24 Jun 2022 14:19:48 +0000
parents b91ca438a1cb
children 9de392f2fc02
line wrap: on
line source

<tool id="clean_dante_ltr" name="DANTE_LTR retrotransposons filtering" version="0.1.6" python_template_version="3.5">
    <requirements>

        <requirement type="package">r-optparse</requirement>
        <requirement type="package">blast</requirement>
        <requirement type="package">bioconductor-bsgenome</requirement>
        <requirement type="package">bioconductor-biostrings</requirement>
        <requirement type="package">bioconductor-rtracklayer</requirement>
    </requirements>
    <command detect_errors="exit_code"><![CDATA[
        Rscript ${__tool_directory__}/clean_ltr.R --gff3 '$dante_ltr' --reference_sequence '$reference' --output output --cpu 32
        &&
        mv output_clean.gff3 $dante_ltr_clean
        &&
        mv output_RM_lib_non_redundant.fasta $rm_lib
        &&
        mv output_RM_lib_full_TE.fasta $te_full
        &&
        mv output_RM_lib_5LTR.fasta $ltr5
        &&
        mv output_RM_lib_3LTR.fasta $ltr3
        &&
        mv output_summary.pdf $summary

    ]]></command>
    <inputs>
        <param type="data" name="dante_ltr" format="gff3"
               label="GFF3 output from DANTE_LTR retrotransposon identification pipeline"/>
        <param type="data" name="reference" format="fasta" label="Reference sequence matching input GFF3" />
    </inputs>
    <outputs>
        <data name="dante_ltr_clean" format="gff3"
              label="Validated LTR retrotransposons annotation (GFF3) based on annotation
               $dante_ltr.hid and reference $reference.hid"/>
        <data name="rm_lib" format="fasta" label="Non-redundant library of LTR retrotransposons (FASTA) based on annotation $dante_ltr.hid and reference $reference.hid"/>

        <data name="te_full" format="fasta" label="Library of full length LTR retrotransposons (FASTA) based on annotation $dante_ltr.hid and reference $reference.hid"/>

        <data name="ltr5" format="fasta" label="Library of 5'LTR of retrotransposons (FASTA) based on annotation $dante_ltr.hid and reference $reference.hid"/>

        <data name="ltr3" format="fasta" label="Library of 3'LTR of retrotransposons (FASTA) based on annotation $dante_ltr.hid and reference $reference.hid"/>

        <data name="summary" format="pdf" label="LTR retrotransposons lengths summary  based on $dante_ltr.hid and reference $reference.hid"/>

    </outputs>
    <help><![CDATA[
        This tool takes output from DANTE_LTR search identifies good quality retrotransposons.
         Good quality retrotransposons are considered those which does not have any cross-similarity between distinct lineages.
         Output from this tool is a annotation in GFF3 format and
         libraries of elements for custom RepeatMasker search.

    ]]></help>
</tool>