comparison read2mut.xml @ 0:e5953c54cfb5 draft

planemo upload for repository https://github.com/gpovysil/VariantAnalyzerGalaxy/tree/master/tools/variant_analyzer commit ee4a8e6cf290e6c8a4d55f9cd2839d60ab3b11c8
author mheinzl
date Sun, 04 Oct 2020 17:19:39 +0000
parents
children 2a505d46f682
comparison
equal deleted inserted replaced
-1:000000000000 0:e5953c54cfb5
1 <?xml version="1.0" encoding="UTF-8"?>
2 <tool id="read2mut" name="Call specific mutations in reads:" version="1.0.2" profile="19.01">
3 <description>Looks for reads with mutation at known positions and calculates frequencies and stats.</description>
4 <macros>
5 <import>va_macros.xml</import>
6 </macros>
7 <expand macro="requirements">
8 <requirement type="package" version="1.1.0">xlsxwriter</requirement>
9 </expand>
10 <command><![CDATA[
11 ln -s '$file2' bam_input.bam &&
12 ln -s '${file2.metadata.bam_index}' bam_input.bam.bai &&
13 python '$__tool_directory__/read2mut.py'
14 --mutFile '$file1'
15 --bamFile bam_input.bam
16 --inputJson '$file3'
17 --sscsJson '$file4'
18 --thresh '$thresh'
19 --phred '$phred'
20 --trim '$trim'
21 $chimera_correction
22 --outputFile '$output_xlsx'
23 ]]>
24 </command>
25 <inputs>
26 <param name="file1" type="data" format="tabular" label="DCS Mutation File" optional="false" help="TABULAR file with DCS mutations. See Help section below for a detailed explanation."/>
27 <param name="file2" type="data" format="bam" label="BAM File of raw reads" optional="false" help="BAM file with aligned raw reads of selected tags."/>
28 <param name="file3" type="data" format="json" label="JSON File with DCS tag stats" optional="false" help="JSON file generated by DCS mutations to tags/reads"/>
29 <param name="file4" type="data" format="json" label="JSON File with SSCS tag stats" optional="false" help="JSON file generated by DCS mutations to SSCS stats."/>
30 <param name="thresh" type="integer" label="Tag count threshold" value="0" help="Integer threshold for displaying mutations. Only mutations occuring in DCS of less than thresh tags are displayed. Default of 0 displays all."/>
31 <param name="phred" type="integer" label="Phred quality score threshold" min="0" max="41" value="20" help="Integer threshold for Phred quality score. Only reads higher than this threshold are considered. Default = 20."/>
32 <param name="trim" type="integer" label="Trimming threshold" value="10" help="Integer threshold for assigning mutations at start and end of reads to lower tier. Default 10."/>
33 <param name="chimera_correction" type="boolean" label="Apply chimera correction?" truevalue="--chimera_correction" falsevalue="" checked="False" help="Add additional tier for chimeric variants and correct the variant frequencies."/>
34 </inputs>
35 <outputs>
36 <data name="output_xlsx" format="xlsx" label="${tool.name} on ${on_string}: XLSX"/>
37 </outputs>
38 <tests>
39 <test>
40 <param name="file1" value="DCS_Mutations_test_data_VA.tabular"/>
41 <param name="file2" value="Interesting_Reads_test_data_VA.trim.bam"/>
42 <param name="file3" value="tag_count_dict_test_data_VA.json"/>
43 <param name="file4" value="SSCS_counts_test_data_VA.json"/>
44 <param name="thresh" value="0"/>
45 <param name="phred" value="20"/>
46 <param name="trim" value="10"/>
47 <param name="chimera_correction" value="False"/>
48 <output name="output_xlsx" file="mutant_reads_summary_short_trim_test_data_VA.xlsx" decompress="true" lines_diff="10"/>
49 </test>
50 </tests>
51 <help> <![CDATA[
52 **What it does**
53
54 Takes a tabular file with mutations, a BAM file of aligned raw reads, and JSON files
55 created by the tools **DCS mutations to tags/reads** and **DCS mutations to SSCS stats**
56 as input and calculates frequencies and stats for DCS mutations based on information
57 from the raw reads.
58
59 **Input**
60
61 **Dataset 1:** Tabular file with duplex consesus sequence (DCS) mutations as
62 generated by the **Variant Annotator** tool.
63
64 **Dataset 2:** BAM file of aligned raw reads. This file can be obtained by the
65 tool `Map with BWA-MEM <https://arxiv.org/abs/1303.3997>`_.
66
67 **Dataset 3:** JSON file generated by the **DCS mutations to tags/reads** tool
68 containing dictonaries of the tags of reads containing mutations
69 in the DCS.
70
71 **Dataset 4:** JSON file generated by the **DCS mutations to SSCS stats** tool
72 stats of tags that carry a mutation in the SSCS at the same position a mutation
73 is called in the DCS.
74
75 **Output**
76
77 The output is an XLSX file containing frequencies stats for DCS mutations based
78 on information from the raw reads. In addition to that a tier based
79 classification is provided based on the amout of support for a true variant call.
80
81 ]]>
82 </help>
83 <expand macro="citation" />
84 </tool>