comparison vapor.xml @ 0:3fe0d1df3950 draft

planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/vapor commit 81874af500338d4ba72ca4d2bb11a628fb405525
author iuc
date Wed, 24 Aug 2022 09:51:46 +0000
parents
children 7bf891a13ace
comparison
equal deleted inserted replaced
-1:000000000000 0:3fe0d1df3950
1 <tool id="vapor" name="VAPOR" version="@TOOL_VERSION@+galaxy0" profile="21.05">
2 <description>
3 Classify Influenza samples from raw short read sequence data
4 </description>
5 <macros>
6 <token name="@TOOL_VERSION@">1.0.2</token>
7 </macros>
8 <xrefs>
9 <xref type="bio.tools">vapor</xref>
10 </xrefs>
11 <requirements>
12 <requirement type="package" version="@TOOL_VERSION@">vapor</requirement>
13 </requirements>
14 <command detect_errors="exit_code"><![CDATA[
15 vapor.py
16 --return_best_n $opt.return_best_n
17 #if $output_type == "fasta"
18 --return_seqs
19 #end if
20 -k '$opt.kmer_length'
21 -t '$opt.score_threshold'
22 -c '$opt.min_kmer_cov'
23 -m '$opt.min_kmer_prop'
24 -fa '$fasta_file'
25 -fq '$fastq_file'
26 -f '$opt.top_seed_frac'
27 -q
28 > out_file
29 ]]> </command>
30 <inputs>
31 <param name="fasta_file" format="fasta" type="data" label="FASTA file" help="Raw short read sequences (full length reference segment sequences)" />
32 <param name="fastq_file" format="fastq,fastq.gz" type="data" multiple="true" label="FASTQ file(s)" help="WGS reads" />
33 <param name="output_type" type="select" label="Output type">
34 <option value="scores" selected="true">Return scores only</option>
35 <option value="fasta">Return FASTA only</option>
36 </param>
37 <section name="opt" title="Optional arguments" expanded="true">
38 <param name="return_best_n" type="integer" min="1" value="1" label="Returns the highest scoring n queries" help="A list of the best n queries instead of only the highest scoring query" />
39 <param name="kmer_length" type="integer" min="5" max="30" value="21" label="Kmer Length" help="" />
40 <param name="score_threshold" type="float" min="0.0" max="1.0" value="0.2" label="Read kmer filtering threshold" help="" />
41 <param name="min_kmer_cov" type="integer" value="5" label="Min coverage kmer culling" help="Minimum coverage kmer culling" />
42 <param name="min_kmer_prop" type="float" value="0.1" label="Min kmer proportion" help="Minimum proportion of matched kmers allowed for queries" />
43 <param name="top_seed_frac" type="float" min="0.0" max="1.0" value="0.2" label="Fraction of best seeds to extend" help="" />
44 </section>
45 </inputs>
46 <outputs>
47 <data name="output_scores" from_work_dir="out_file" format="tabular" label="VAPOR: closest reference">
48 <filter>output_type == "scores"</filter>
49 <actions>
50 <action name="column_names" type="metadata" default="% of query bases in reads,Total score,Query length,Mean score,Reads after culling,Query description" />
51 </actions>
52 </data>
53 <data name="output_fasta" from_work_dir="out_file" format="fasta" label="VAPOR: closest reference (fasta)">
54 <filter>output_type == "fasta"</filter>
55 </data>
56 </outputs>
57 <tests>
58 <test expect_num_outputs="1">
59 <param name="fasta_file" value="HA_sample.fa" />
60 <param name="fastq_file" value="test_reads.fq" />
61 <output name="output_scores" file="output1.tab" />
62 </test>
63 <test expect_num_outputs="1">
64 <param name="fasta_file" value="HA_sample.fa" />
65 <param name="fastq_file" value="test_reads.fq" />
66 <section name="opt">
67 <param name="kmer_length" value="29" />
68 <param name="score_threshold" value="0.5" />
69 <param name="min_kmer_cov" value="7" />
70 <param name="min_kmer_prop" value="0.5" />
71 <param name="top_seed_frac" value="0.5" />
72 </section>
73 <output name="output_scores" file="output2.tab" />
74 </test>
75 <test expect_num_outputs="1">
76 <param name="fasta_file" value="HA_sample.fa" />
77 <param name="fastq_file" value="test_reads.fq" />
78 <param name="output_type" value="fasta" />
79 <section name="opt">
80 <param name="return_best_n" value="3" />
81 </section>
82 <output name="output_fasta" file="output3.fa" />
83 </test>
84 </tests>
85 <help><![CDATA[
86 **What it does**
87
88 VAPOR is a tool for classification of Influenza samples from raw short read sequence data for downstream bioinformatics analysis.
89 VAPOR is provided with a fasta file of full-length sequences (> 20,000) for a given segment, a set of reads, and attempts to retrieve a reference that is closest to the sample strain.
90
91 `sub_sample` is not an option here (compared to the tool on GitHub), since you can always build a workflow that preprocesses your reads to a (random) subsample. You can use this output as your reads file for VAPOR.
92 ]]> </help>
93 <citations>
94 <citation type="doi">10.1093/bioinformatics/btz814</citation>
95 </citations>
96 </tool>