comparison TEfinder.xml @ 0:b81a83c743d3 draft default tip

Uploaded
author namhsuya
date Tue, 09 Aug 2022 06:58:49 +0000
parents
children
comparison
equal deleted inserted replaced
-1:000000000000 0:b81a83c743d3
1 <tool id="te_finder_1" name="TEfinder" version="1.0.1" profile="21.05">
2 <description>A bioinformatics tool for detecting novel transposable element insertions</description>
3 <!-- Packages this tool declares as dependencies, each pinned to an exact version. Presumably these are the external commands the bundled TEfinder script calls; confirm against the script before changing a pin. -->
4 <requirements>
5 <requirement type="package" version="1.15.1">samtools</requirement>
6 <requirement type="package" version="2.30.0">bedtools</requirement>
7 <requirement type="package" version="2.27.4">picard</requirement>
8 <requirement type="package" version="3.4">grep</requirement>
9 <requirement type="package" version="1.07.1">bc</requirement>
10 </requirements>
11 <!-- Cheetah command template: runs the TEfinder script shipped in the tool directory. Dataset paths are single-quoted for the shell. The GALAXY_SLOTS expression is double-quoted on purpose so the shell expands it to the allotted thread count (single quotes would pass the literal text through). The GTF flags are appended only when the GTF output format is selected. -->
12 <command>
13 <![CDATA[
14 '$__tool_directory__/TEfinder' -fa '$required_inputs.FastaFile'
15 -alignment '$required_inputs.alignmentFile'
16 -gtf '$required_inputs.TransposonsInGenome'
17 -te '$required_inputs.TransposonsToSearch'
18 -bamo '$discordantreads'
19 -bedo '$bteinsertion'
20 -threads "\${GALAXY_SLOTS:-1}"
21 -fis $advanced_options.FragmentInsertSize
22 -md $advanced_options.MaxDistanceForMerge
23 -k $advanced_options.MaxTSDLength
24 #if str($advanced_options.OutFormat) == "gtf":
25 -gtfo '$gteinsertion'
26 -out $advanced_options.OutFormat
27 #end if
28 ]]>
29 </command>
30 <!-- Tool form: four required datasets plus optional tuning parameters. Each advanced parameter names the TEfinder flag it feeds through its argument attribute. The TE name list uses the txt datatype, matching the ftype used by the tests. -->
31 <inputs>
32 <!-- <param format="fasta" name="input" type="data" label="Source file"/> -->
33 <section name="required_inputs" title="Required Inputs" expanded="True">
34 <param name="FastaFile" type="data" format="fasta" label="Select reference genome FASTA index (FA/FASTA file)" />
35 <param name="alignmentFile" type="data" format="bam" label="Select sample reads aligned to reference genome (BAM/SAM file)" />
36 <param name="TransposonsInGenome" type="data" format="gtf" label="Select reference genome TE annotation (GFF/GTF file)" />
37 <param name="TransposonsToSearch" type="data" format="txt" label="Select TE names (single column text file)" />
38 </section>
39 <!-- Advanced Options -->
40 <section name="advanced_options" title="Advanced Options" expanded="False">
41 <param name="FragmentInsertSize" argument="-fis" type="integer" min="0" value="400" label="Short-read sequencing fragment insert size [400]" />
42 <param name="MaxDistanceForMerge" argument="-md" type="integer" min="0" value="150" label="Maximum distance between reads for bedtools merge" />
43 <param name="MaxTSDLength" argument="-k" type="integer" min="0" value="20" label="Maximum TE target site duplication (TSD) length" />
44 <param name="OutFormat" argument="-out" type="select" display="radio" label="Select output format as GTF [BED]" help="See help below for more details">
45 <option value="gtf">Other available format is GTF (-out gtf)</option>
46 <option value="bed" selected="True">Default format is BED</option>
47 </param>
48 </section>
49 </inputs>
50 <!-- Datasets produced per run: the BED and BAM outputs are always created; the GTF output exists only when the GTF output format is chosen. -->
51 <outputs>
52 <data name="bteinsertion" format="bed" label="${tool.name} on ${on_string}: BED"/>
53 <data name="gteinsertion" format="gtf" label="${tool.name} on ${on_string}: GTF">
54 <filter>advanced_options['OutFormat'] == 'gtf'</filter>
55 </data>
56 <data name="discordantreads" format="bam"/>
57 </outputs>
58
59 <tests>
60 <!-- BED-only run (OutFormat=bed): the GTF output is filtered out, so only the BED and BAM datasets are expected -->
61 <test expect_num_outputs="2">
62 <!-- Equivalent TEfinder command: TEfinder -alignment sample.bam -fa reference.fa -gtf TEs.gtf -te List_of_TEs.txt -->
63 <param name="FastaFile" ftype="fasta" value="reference.fa"/>
64 <param name="alignmentFile" ftype="bam" value="sample.bam"/>
65 <param name="TransposonsInGenome" ftype="gtf" value="TEs.gtf"/>
66 <param name="TransposonsToSearch" ftype="txt" value="List_of_TEs.txt"/>
67 <param name="OutFormat" value="bed" />
68 <output name="bteinsertion" file="TEinsertions.bed" ftype="bed"/>
69 <output name="discordantreads" file="DiscordantReads.bam" ftype="bam"/>
70 </test>
71
72 <!-- GTF run (OutFormat=gtf): the GTF dataset is expected in addition to the BED and BAM datasets -->
73 <test expect_num_outputs="3">
74 <!-- Equivalent TEfinder command: TEfinder -alignment sample.bam -fa reference.fa -gtf TEs.gtf -te List_of_TEs.txt -out gtf -->
75 <param name="FastaFile" ftype="fasta" value="reference.fa"/>
76 <param name="alignmentFile" ftype="bam" value="sample.bam"/>
77 <param name="TransposonsInGenome" ftype="gtf" value="TEs.gtf"/>
78 <param name="TransposonsToSearch" ftype="txt" value="List_of_TEs.txt"/>
79 <param name="OutFormat" value="gtf" />
80 <output name="bteinsertion" file="TEinsertions.bed" ftype="bed"/>
81 <output name="gteinsertion" file="TEinsertions.gtf" ftype="gtf"/>
82 <output name="discordantreads" file="DiscordantReads.bam" ftype="bam"/>
83 </test>
84 </tests>
85
86 <help>
87 <![CDATA[
88 A bioinformatics tool for detecting novel transposable element insertions
89
90 Authors: Vista Sohrab & Dilay Hazal Ayhan
91
92 TEfinder uses discordant reads to detect novel transposable element insertion events in paired-end sample sequencing data.
93
94 **Output files**::
95
96 TEinsertions.bed contains the TE insertion events identified in the sample. In the final column, a FILTER attribute of "PASS" marks a high-confidence insertion event, while "in_repeat", "weak_evidence", "strand bias", or a combination of these three labels marks a less confident insertion event.
97
98 TEinsertions.gtf contains the same information as the BED file and is produced only when the output format is set to GTF (-out gtf).
99
100 DiscordantReads.bam contains all discordant reads that have been identified based on the TEs of interest that have been submitted to TEfinder
101
102 **Note**::
103
104 Modifying the maximum TSD length (-k) could be useful if there is an unexpected number of insertion events identified with the default parameter. The optimal maximum TSD length can vary across datasets.
105 Modifying the fragment insert size (-fis) based on the sequencing library preparation can be useful.
106
107 ]]>
108 </help>
109 <!-- Citation by DOI (a Zenodo identifier); presumably the archived TEfinder release. Confirm that the record matches the tool version declared on the tool element. -->
110 <citations>
111 <citation type="doi">10.5281/zenodo.4479946</citation>
112 </citations>
113
114 </tool>