comparison dante_ltr_search.xml @ 7:c33d6583e548 draft

"planemo upload commit 50884f7f0269a0bbde078f24fe5020975693bcd9"
author petr-novak
date Fri, 24 Jun 2022 14:19:48 +0000
parents b91ca438a1cb
children 9de392f2fc02
comparison
equal deleted inserted replaced
6:b91ca438a1cb 7:c33d6583e548
1 <tool id="dante_ltr_search" name="DANTE_LTR retrotransposon identification" version="0.1.5" python_template_version="3.5"> 1 <tool id="dante_ltr_search" name="DANTE_LTR retrotransposon identification" version="0.1.6" python_template_version="3.5">
2 <requirements> 2 <requirements>
3 <requirement type="package">blast</requirement> 3 <requirement type="package">blast</requirement>
4 <requirement type="package">r-optparse</requirement> 4 <requirement type="package">r-optparse</requirement>
5 <requirement type="package">bioconductor-bsgenome</requirement> 5 <requirement type="package">bioconductor-bsgenome</requirement>
6 <requirement type="package">bioconductor-biostrings</requirement> 6 <requirement type="package">bioconductor-biostrings</requirement>
7 <requirement type="package">bioconductor-rtracklayer</requirement> 7 <requirement type="package">bioconductor-rtracklayer</requirement>
8 8
9 </requirements> 9 </requirements>
10 <command detect_errors="exit_code"><![CDATA[ 10 <command detect_errors="exit_code"><![CDATA[
11 Rscript ${__tool_directory__}/extract_putative_ltr.R --gff3 '$dante' --reference_sequence '$reference' --output output --cpu 32 11 Rscript ${__tool_directory__}/extract_putative_ltr.R --gff3 '$dante' --reference_sequence '$reference' -M $max_missing --output output --cpu 32
12 && 12 &&
13 mv output.gff3 $te_ltr_gff 13 mv output.gff3 $te_ltr_gff
14 &&
15 mv output_statistics.csv $statistics
14 ]]></command> 16 ]]></command>
15 <inputs> 17 <inputs>
16 <param type="data" name="dante" format="gff3" label="Filtered GFF3 output from DANTE pipeline"/> 18 <param type="data" name="dante" format="gff3" label="Filtered GFF3 output from DANTE pipeline"/>
17 <param type="data" name="reference" format="fasta" label="Reference sequence matching DANTE output" /> 19 <param type="data" name="reference" format="fasta" label="Reference sequence matching DANTE output" />
20 <param type="integer" name="max_missing" min="0" max="3" value="1" label="Maximum number of missing protein domains to tolerate in full length retrotransposon" />
18 </inputs> 21 </inputs>
19 <outputs> 22 <outputs>
20 <data name="te_ltr_gff" format="gff3" label="LTR retrotransposons annotation (GFF3) 23 <data name="te_ltr_gff" format="gff3" label="LTR retrotransposons annotation (GFF3)
21 based on DANTE annotation $dante.hid and reference $reference.hid" /> 24 based on DANTE annotation $dante.hid and reference $reference.hid" />
25 <data name="statistics" format="tabular" label="LTR retrotransposons detection
26 summary based on $dante.hid and reference $reference.hid" />
22 </outputs> 27 </outputs>
23 <help><![CDATA[ 28 <help><![CDATA[
24 This tool uses output from DANTE annotation pipeline to identify full length LTR 29 This tool uses output from DANTE annotation pipeline to identify full length LTR
25 transposable elements. Output is in the GFF3 format and include annotation of 30 transposable elements. Output is in the GFF3 format and include annotation of
26 5' and 3' Longe Terminal Repeats, Target Site Duplication (TSD) and primer binding site (PBS). 31 5' and 3' Long Terminal Repeats, Target Site Duplication (TSD) and primer binding site (PBS).
27 32
28 All identified elements contains complete set of protein domains as defined in 33 All identified elements contains set of protein domains as defined in
29 REXdb_. Based on the results detection structural feature, 34 REXdb_.Based on the results of detection of structural features,
30 elements falls into four categories: 35 elements falls into five categories:
31 36
32 - elements with domains, 5'LTR, 3'LTR, TSD and PBS 37 - elements with domains, 5'LTR, 3'LTR, TSD and PBS - rank DLTP
33 - elements with domains, 5'LTR, 3'LTR and PBS (TSD was not found) 38 - elements with domains, 5'LTR, 3'LTR and PBS (TSD was not found) rank DLP
34 - elements with domains, 5' LTR, 3'LTR, TSD (PBS was not found) 39 - elements with domains, 5' LTR, 3'LTR, TSD (PBS was not found) - rank DTL
35 - elements with protein domains, 5'LTR and 3'LTR (PBS and LDS were not found) 40 - elements with protein domains, 5'LTR and 3'LTR (PBS and LDS were not found) - rank DL
41 - elements as cluster of proteins domains with same classification, no LTRs - rank D
36 42
37 .. _REXdb: https://doi.org/10.1186/s13100-018-0144-1 43 .. _REXdb: https://doi.org/10.1186/s13100-018-0144-1
38 44
39 ]]></help> 45 ]]></help>
40 </tool> 46 </tool>