annotate kraken-filter.xml @ 4:3d6570bffdb1 draft

"planemo upload for repository https://github.com/galaxyproject/tools-iuc/blob/master/tool_collections/kraken/ commit 06345505a91f3dcfa8a37dceb6f25e95806dddc8"
author iuc
date Wed, 04 Dec 2019 06:51:27 -0500
parents 5bee9adae474
children 67236d921e83
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
3
5bee9adae474 planemo upload for repository https://github.com/galaxyproject/tools-iuc/blob/master/tool_collections/kraken/kraken_filter/ commit e8fc7c9dad5f583ad6763ecb9bd8c924832abacd
iuc
parents: 2
diff changeset
1 <tool id="kraken-filter" name="Kraken-filter" version="@WRAPPER_VERSION@">
5bee9adae474 planemo upload for repository https://github.com/galaxyproject/tools-iuc/blob/master/tool_collections/kraken/kraken_filter/ commit e8fc7c9dad5f583ad6763ecb9bd8c924832abacd
iuc
parents: 2
diff changeset
2 <description>filter classification by confidence score</description>
0
cbb802a726fd planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff changeset
3 <macros>
cbb802a726fd planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff changeset
4 <import>macros.xml</import>
cbb802a726fd planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff changeset
5 </macros>
1
7dfb0218e838 planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 3abfc7eb2999fa588862b84c453012c811fa8350
devteam
parents: 0
diff changeset
6 <expand macro="requirements" />
7dfb0218e838 planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 3abfc7eb2999fa588862b84c453012c811fa8350
devteam
parents: 0
diff changeset
7 <expand macro="version_command" />
3
5bee9adae474 planemo upload for repository https://github.com/galaxyproject/tools-iuc/blob/master/tool_collections/kraken/kraken_filter/ commit e8fc7c9dad5f583ad6763ecb9bd8c924832abacd
iuc
parents: 2
diff changeset
8 <command detect_errors="exit_code"><![CDATA[
0
cbb802a726fd planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff changeset
9 @SET_DATABASE_PATH@ &&
3
5bee9adae474 planemo upload for repository https://github.com/galaxyproject/tools-iuc/blob/master/tool_collections/kraken/kraken_filter/ commit e8fc7c9dad5f583ad6763ecb9bd8c924832abacd
iuc
parents: 2
diff changeset
10
5bee9adae474 planemo upload for repository https://github.com/galaxyproject/tools-iuc/blob/master/tool_collections/kraken/kraken_filter/ commit e8fc7c9dad5f583ad6763ecb9bd8c924832abacd
iuc
parents: 2
diff changeset
11 kraken-filter
5bee9adae474 planemo upload for repository https://github.com/galaxyproject/tools-iuc/blob/master/tool_collections/kraken/kraken_filter/ commit e8fc7c9dad5f583ad6763ecb9bd8c924832abacd
iuc
parents: 2
diff changeset
12 @INPUT_DATABASE@
5bee9adae474 planemo upload for repository https://github.com/galaxyproject/tools-iuc/blob/master/tool_collections/kraken/kraken_filter/ commit e8fc7c9dad5f583ad6763ecb9bd8c924832abacd
iuc
parents: 2
diff changeset
13 --threshold $threshold
5bee9adae474 planemo upload for repository https://github.com/galaxyproject/tools-iuc/blob/master/tool_collections/kraken/kraken_filter/ commit e8fc7c9dad5f583ad6763ecb9bd8c924832abacd
iuc
parents: 2
diff changeset
14 '${input}'
5bee9adae474 planemo upload for repository https://github.com/galaxyproject/tools-iuc/blob/master/tool_collections/kraken/kraken_filter/ commit e8fc7c9dad5f583ad6763ecb9bd8c924832abacd
iuc
parents: 2
diff changeset
15 > '$filtered_output'
5bee9adae474 planemo upload for repository https://github.com/galaxyproject/tools-iuc/blob/master/tool_collections/kraken/kraken_filter/ commit e8fc7c9dad5f583ad6763ecb9bd8c924832abacd
iuc
parents: 2
diff changeset
16 ]]></command>
0
cbb802a726fd planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff changeset
17 <inputs>
3
5bee9adae474 planemo upload for repository https://github.com/galaxyproject/tools-iuc/blob/master/tool_collections/kraken/kraken_filter/ commit e8fc7c9dad5f583ad6763ecb9bd8c924832abacd
iuc
parents: 2
diff changeset
18 <param name="input" type="data" format="tabular" label="Kraken output" help="Select taxonomy classification produced by kraken"/>
5bee9adae474 planemo upload for repository https://github.com/galaxyproject/tools-iuc/blob/master/tool_collections/kraken/kraken_filter/ commit e8fc7c9dad5f583ad6763ecb9bd8c924832abacd
iuc
parents: 2
diff changeset
19 <param argument="--threshold" type="float" value="0" min="0" max="1"
5bee9adae474 planemo upload for repository https://github.com/galaxyproject/tools-iuc/blob/master/tool_collections/kraken/kraken_filter/ commit e8fc7c9dad5f583ad6763ecb9bd8c924832abacd
iuc
parents: 2
diff changeset
20 label="Confidence threshold" help="A floating point number between 0 and 1; default=0"/>
5bee9adae474 planemo upload for repository https://github.com/galaxyproject/tools-iuc/blob/master/tool_collections/kraken/kraken_filter/ commit e8fc7c9dad5f583ad6763ecb9bd8c924832abacd
iuc
parents: 2
diff changeset
21
0
cbb802a726fd planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff changeset
22 <expand macro="input_database" />
cbb802a726fd planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff changeset
23 </inputs>
cbb802a726fd planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff changeset
24 <outputs>
cbb802a726fd planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff changeset
25 <data format="tabular" name="filtered_output" />
cbb802a726fd planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff changeset
26 </outputs>
1
7dfb0218e838 planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 3abfc7eb2999fa588862b84c453012c811fa8350
devteam
parents: 0
diff changeset
27 <tests>
7dfb0218e838 planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 3abfc7eb2999fa588862b84c453012c811fa8350
devteam
parents: 0
diff changeset
28 <test>
4
3d6570bffdb1 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/blob/master/tool_collections/kraken/ commit 06345505a91f3dcfa8a37dceb6f25e95806dddc8"
iuc
parents: 3
diff changeset
29 <param name="input" value="kraken-filter/kraken_filter_test1.tab"/>
1
7dfb0218e838 planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 3abfc7eb2999fa588862b84c453012c811fa8350
devteam
parents: 0
diff changeset
30 <param name="threshold" value="0"/>
4
3d6570bffdb1 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/blob/master/tool_collections/kraken/ commit 06345505a91f3dcfa8a37dceb6f25e95806dddc8"
iuc
parents: 3
diff changeset
31 <param name="kraken_database" value="new_style_test_entry"/>
3
5bee9adae474 planemo upload for repository https://github.com/galaxyproject/tools-iuc/blob/master/tool_collections/kraken/kraken_filter/ commit e8fc7c9dad5f583ad6763ecb9bd8c924832abacd
iuc
parents: 2
diff changeset
32
4
3d6570bffdb1 "planemo upload for repository https://github.com/galaxyproject/tools-iuc/blob/master/tool_collections/kraken/ commit 06345505a91f3dcfa8a37dceb6f25e95806dddc8"
iuc
parents: 3
diff changeset
33 <output name="filtered_output" file="kraken-filter/kraken_filter_test1_output.tab" ftype="tabular"/>
1
7dfb0218e838 planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 3abfc7eb2999fa588862b84c453012c811fa8350
devteam
parents: 0
diff changeset
34 </test>
7dfb0218e838 planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 3abfc7eb2999fa588862b84c453012c811fa8350
devteam
parents: 0
diff changeset
35 </tests>
7dfb0218e838 planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 3abfc7eb2999fa588862b84c453012c811fa8350
devteam
parents: 0
diff changeset
36
0
cbb802a726fd planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff changeset
37 <help>
cbb802a726fd planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff changeset
38 <![CDATA[
cbb802a726fd planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff changeset
39
cbb802a726fd planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff changeset
40 .. class:: warningmark
cbb802a726fd planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff changeset
41
cbb802a726fd planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff changeset
42 **Note**: the database used must be the same as the one used in the original Kraken run.
cbb802a726fd planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff changeset
43
cbb802a726fd planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff changeset
44 -----
cbb802a726fd planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff changeset
45
cbb802a726fd planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff changeset
46 **What it does**
cbb802a726fd planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff changeset
47
cbb802a726fd planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff changeset
48 At present, we have not yet developed a confidence score with a solid probabilistic interpretation for Kraken. However, we have developed a simple scoring scheme that has yielded good results for us, and we've made that available in the ``kraken-filter`` script. The approach we use allows a user to specify a threshold score in the [0,1] interval; the ``kraken-filter`` script will then adjust labels up the tree until the label's score (described below) meets or exceeds that threshold. If a label at the root of the taxonomic tree would not have a score meeting or exceeding the threshold, the sequence is called unclassified by ``kraken-filter``.
cbb802a726fd planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff changeset
49
cbb802a726fd planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff changeset
50 A sequence label's score is a fraction C/Q, where C is the number of k-mers mapped to LCA values in the clade rooted at the label, and Q is the number of k-mers in the sequence that lack an ambiguous nucleotide (i.e., they were queried against the database). Consider the example of the LCA mappings in Kraken's output::
cbb802a726fd planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff changeset
51
3
5bee9adae474 planemo upload for repository https://github.com/galaxyproject/tools-iuc/blob/master/tool_collections/kraken/kraken_filter/ commit e8fc7c9dad5f583ad6763ecb9bd8c924832abacd
iuc
parents: 2
diff changeset
52 562:13 561:4 A:31 0:1 562:3
0
cbb802a726fd planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff changeset
53
cbb802a726fd planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff changeset
54 would indicate that::
cbb802a726fd planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff changeset
55
cbb802a726fd planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff changeset
56 the first 13 k-mers mapped to taxonomy ID #562
cbb802a726fd planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff changeset
57 the next 4 k-mers mapped to taxonomy ID #561
cbb802a726fd planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff changeset
58 the next 31 k-mers contained an ambiguous nucleotide
cbb802a726fd planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff changeset
59 the next k-mer was not in the database
cbb802a726fd planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff changeset
60 the last 3 k-mers mapped to taxonomy ID #562
cbb802a726fd planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff changeset
61
cbb802a726fd planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff changeset
62 In this case, ID #561 is the parent node of #562. Here, a label of #562 for this sequence would have a score of C/Q = (13+3)/(13+4+1+3) = 16/21. A label of #561 would have a score of C/Q = (13+4+3)/(13+4+1+3) = 20/21. If a user specified a threshold over 16/21, ``kraken-filter`` would adjust the original label from #562 to #561; if the threshold was greater than 20/21, the sequence would become unclassified.
cbb802a726fd planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff changeset
63 ]]>
cbb802a726fd planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff changeset
64 </help>
cbb802a726fd planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff changeset
65 <expand macro="citations" />
cbb802a726fd planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff changeset
66 </tool>