Mercurial > repos > iuc > kraken2
comparison kraken2.xml @ 0:0968856c687c draft
planemo upload for repository https://github.com/galaxyproject/tools-iuc/blob/master/tool_collections/kraken2/kraken2/ commit 6ad48e582972ec27cdc0d401f877dfe172057231
author | iuc |
---|---|
date | Thu, 14 Mar 2019 05:16:48 -0400 |
parents | |
children | d4bb87ca916d |
comparison
equal
deleted
inserted
replaced
-1:000000000000 | 0:0968856c687c |
---|---|
1 <?xml version="1.0"?> | |
2 <tool id="kraken2" name="Kraken2" version="@TOOL_VERSION@+galaxy0"> | |
3 <description> | |
4 assign taxonomic labels to sequencing reads | |
5 </description> | |
6 <macros> | |
7 <import>macros.xml</import> | |
8 </macros> | |
9 <requirements> | |
10 <requirement type="package" version="@TOOL_VERSION@">kraken2</requirement> | |
11 </requirements> | |
12 <version_command>kraken2 --version</version_command> | |
13 <command detect_errors="exit_code"> | |
14 <![CDATA[ | |
15 kraken2 | |
16 --threads \${GALAXY_SLOTS:-1} | |
17 --db '${kraken2_database.fields.path}' | |
18 | |
19 #if $quick: | |
20 --quick | |
21 #end if | |
22 | |
23 #if $single_paired.single_paired_selector == 'yes' | |
24 --paired | |
25 '${single_paired.forward_input}' '${single_paired.reverse_input}' | |
26 #elif $single_paired.single_paired_selector == "collection": | |
27 '${single_paired.input_pair.forward}' '${single_paired.input_pair.reverse}' | |
28 #else: | |
29 '${single_paired.input_sequences}' | |
30 #end if | |
31 | |
32 #if $split_reads: | |
33 --classified-out '${classified_out}' --unclassified-out '${unclassified_out}' | |
34 #end if | |
35 | |
36 --confidence '${confidence}' | |
37 | |
38 --minimum-base-quality '${min_base_quality}' | |
39 | |
40 #if $use_names: | |
41 --use-names | |
42 #end if | |
43 | |
44 #if $report.create_report: | |
45 --report '${report_output}' | |
46 #if $report.use_mpa_style: | |
47 --use-mpa-style | |
48 #end if | |
49 #if $report.report_zero_counts: | |
50 --report-zero-counts | |
51 #end if | |
52 #end if | |
53 | |
54 > '${output}' | |
55 ]]></command> | |
56 <inputs> | |
57 <conditional name="single_paired"> | |
58 <param name="single_paired_selector" type="select" label="Single or paired reads" help="--paired"> | |
59 <option value="collection">Collection</option> | |
60 <option value="yes">Paired</option> | |
61 <option selected="True" value="no">Single</option> | |
62 </param> | |
63 <when value="collection"> | |
64 <param format="@INTYPES@" name="input_pair" type="data_collection" collection_type="paired" label="Collection of paired reads"/> | |
65 </when> | |
66 <when value="yes"> | |
67 <param format="@INTYPES@" name="forward_input" type="data" label="Forward strand"/> | |
68 <param format="@INTYPES@" name="reverse_input" type="data" label="Reverse strand"/> | |
69 </when> | |
70 <when value="no"> | |
71 <param format="@INTYPES@" label="Input sequences" name="input_sequences" type="data"/> | |
72 </when> | |
73 </conditional> | |
74 | |
75 <param name="use_names" type="boolean" label="Print scientific names instead of just taxids"/> | |
76 | |
77 <param name="confidence" type="float" label="Confidence" value="0.0" help="Confidence score threshold. Must be in [0, 1]"> | |
78 <validator type="in_range" min="0.0" max="1.0" message="Confidence score threshold should be between 0 and 1" /> | |
79 </param> | |
80 | |
81 <param name="min_base_quality" type="integer" label="Minimum Base Quality" value="0" help="Minimum base quality used in classification (only effective with FASTQ input)"/> | |
82 | |
83 <param name="quick" type="boolean" label="Enable quick operation" help="Quick operation (use first hit)"/> | |
84 | |
85 <param name="split_reads" type="boolean" label="Split classified and unclassified outputs?" help="Sets --unclassified-out and --classified-out"/> | |
86 | |
87 <section name="report" title="Create Report" expanded="false"> | |
88 <param name="create_report" type="boolean" label="Print a report with aggregrate counts/clade to file" help="--report" optional="true"/> | |
89 <param name="use_mpa_style" type="boolean" label="Format report output like Kraken 1's kraken-mpa-report" help="--use-mpa-style" optional="true"/> | |
90 <param name="report_zero_counts" type="boolean" label="Report counts for ALL taxa, even if counts are zero" help="--report-zero-counts" optional="true"/> | |
91 </section> | |
92 | |
93 <expand macro="input_database"/> | |
94 | |
95 </inputs> | |
96 <outputs> | |
97 <data name="classified_out" format_source="input_sequences" label="${tool.name} on ${on_string}: Classified reads"> | |
98 <filter>(split_reads)</filter> | |
99 </data> | |
100 <data name="unclassified_out" format_source="input_sequences" label="${tool.name} on ${on_string}: Unclassified reads"> | |
101 <filter>(split_reads)</filter> | |
102 </data> | |
103 <data name="report_output" format_source="text" label="Report: ${tool.name} on ${on_string}"> | |
104 <filter>(report['create_report'])</filter> | |
105 </data> | |
106 <data name="output" format="tabular" label="${tool.name} on ${on_string}: Classification"/> | |
107 <!--<data format="tabular" label="${tool.name} on ${on_string}: Translated classification" name="translated" />--> | |
108 </outputs> | |
109 | |
110 <tests> | |
111 <test> | |
112 <param name="single_paired_selector" value="no"/> | |
113 <param name="input_sequences" value="kraken_test1.fa" ftype="fasta"/> | |
114 <param name="split_reads" value="false"/> | |
115 <param name="quick" value="no"/> | |
116 <param name="confidence" value=".2"/> | |
117 <param name="only-classified-output" value="false"/> | |
118 <param name="kraken2_database" value="test_entry"/> | |
119 <output name="output" file="kraken_test1_output.tab" ftype="tabular"/> | |
120 </test> | |
121 </tests> | |
122 <help> | |
123 <![CDATA[ | |
124 **What it does** | |
125 | |
126 Kraken2 is a taxonomic sequence classifier that assigns taxonomic labels to short DNA reads. It does this by examining the k-mers within a read and querying a database with those k-mers. This database contains a mapping of every k-mer in Kraken's genomic library to the lowest common ancestor (LCA) in a taxonomic tree of all genomes that contain that k-mer. The set of LCA taxa that correspond to the k-mers in a read are then analyzed to create a single taxonomic label for the read; this label can be any of the nodes in the taxonomic tree. Kraken is designed to be rapid, sensitive, and highly precise. | |
127 | |
128 ----- | |
129 | |
130 **Output Format** | |
131 | |
132 Each sequence classified by Kraken results in a single line of output. Output lines contain five tab-delimited fields; from left to right, they are:: | |
133 | |
134 1. "C"/"U": a one letter code indicating that the sequence was either classified or unclassified. | |
135 2. The sequence ID, obtained from the FASTA/FASTQ header. | |
136 3. The taxonomy ID Kraken 2 used to label the sequence; this is 0 if the sequence is unclassified. | |
137 4. The length of the sequence in bp. | |
138 5. A space-delimited list indicating the LCA mapping of each k-mer in the sequence. For example, "562:13 561:4 A:31 0:1 562:3" would indicate that: | |
139 a) the first 13 k-mers mapped to taxonomy ID #562 | |
140 b) the next 4 k-mers mapped to taxonomy ID #561 | |
141 c) the next 31 k-mers contained an ambiguous nucleotide | |
142 d) the next k-mer was not in the database | |
143 e) the last 3 k-mers mapped to taxonomy ID #562 | |
144 ]]> | |
145 </help> | |
146 <expand macro="citations" /> | |
147 </tool> |