Mercurial > repos > devteam > kraken_filter
annotate kraken-filter.xml @ 5:67236d921e83 draft default tip
planemo upload for repository https://github.com/galaxyproject/tools-iuc/blob/master/tool_collections/kraken/ commit 3a94fbf6a188ea81441ef2f654ba5a74bff56f22
author | iuc |
---|---|
date | Tue, 12 Mar 2024 16:10:31 +0000 |
parents | 3d6570bffdb1 |
children |
rev | line source |
---|---|
3
5bee9adae474
planemo upload for repository https://github.com/galaxyproject/tools-iuc/blob/master/tool_collections/kraken/kraken_filter/ commit e8fc7c9dad5f583ad6763ecb9bd8c924832abacd
iuc
parents:
2
diff
changeset
|
1 <tool id="kraken-filter" name="Kraken-filter" version="@WRAPPER_VERSION@"> |
5bee9adae474
planemo upload for repository https://github.com/galaxyproject/tools-iuc/blob/master/tool_collections/kraken/kraken_filter/ commit e8fc7c9dad5f583ad6763ecb9bd8c924832abacd
iuc
parents:
2
diff
changeset
|
2 <description>filter classification by confidence score</description> |
0
cbb802a726fd
planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff
changeset
|
3 <macros> |
cbb802a726fd
planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff
changeset
|
4 <import>macros.xml</import> |
cbb802a726fd
planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff
changeset
|
5 </macros> |
5
67236d921e83
planemo upload for repository https://github.com/galaxyproject/tools-iuc/blob/master/tool_collections/kraken/ commit 3a94fbf6a188ea81441ef2f654ba5a74bff56f22
iuc
parents:
4
diff
changeset
|
6 <expand macro="xrefs"/> |
1
7dfb0218e838
planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 3abfc7eb2999fa588862b84c453012c811fa8350
devteam
parents:
0
diff
changeset
|
7 <expand macro="requirements" /> |
7dfb0218e838
planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 3abfc7eb2999fa588862b84c453012c811fa8350
devteam
parents:
0
diff
changeset
|
8 <expand macro="version_command" /> |
3
5bee9adae474
planemo upload for repository https://github.com/galaxyproject/tools-iuc/blob/master/tool_collections/kraken/kraken_filter/ commit e8fc7c9dad5f583ad6763ecb9bd8c924832abacd
iuc
parents:
2
diff
changeset
|
9 <command detect_errors="exit_code"><![CDATA[ |
0
cbb802a726fd
planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff
changeset
|
10 @SET_DATABASE_PATH@ && |
3
5bee9adae474
planemo upload for repository https://github.com/galaxyproject/tools-iuc/blob/master/tool_collections/kraken/kraken_filter/ commit e8fc7c9dad5f583ad6763ecb9bd8c924832abacd
iuc
parents:
2
diff
changeset
|
11 |
5bee9adae474
planemo upload for repository https://github.com/galaxyproject/tools-iuc/blob/master/tool_collections/kraken/kraken_filter/ commit e8fc7c9dad5f583ad6763ecb9bd8c924832abacd
iuc
parents:
2
diff
changeset
|
12 kraken-filter |
5bee9adae474
planemo upload for repository https://github.com/galaxyproject/tools-iuc/blob/master/tool_collections/kraken/kraken_filter/ commit e8fc7c9dad5f583ad6763ecb9bd8c924832abacd
iuc
parents:
2
diff
changeset
|
13 @INPUT_DATABASE@ |
5bee9adae474
planemo upload for repository https://github.com/galaxyproject/tools-iuc/blob/master/tool_collections/kraken/kraken_filter/ commit e8fc7c9dad5f583ad6763ecb9bd8c924832abacd
iuc
parents:
2
diff
changeset
|
14 --threshold $threshold |
5bee9adae474
planemo upload for repository https://github.com/galaxyproject/tools-iuc/blob/master/tool_collections/kraken/kraken_filter/ commit e8fc7c9dad5f583ad6763ecb9bd8c924832abacd
iuc
parents:
2
diff
changeset
|
15 '${input}' |
5bee9adae474
planemo upload for repository https://github.com/galaxyproject/tools-iuc/blob/master/tool_collections/kraken/kraken_filter/ commit e8fc7c9dad5f583ad6763ecb9bd8c924832abacd
iuc
parents:
2
diff
changeset
|
16 > '$filtered_output' |
5bee9adae474
planemo upload for repository https://github.com/galaxyproject/tools-iuc/blob/master/tool_collections/kraken/kraken_filter/ commit e8fc7c9dad5f583ad6763ecb9bd8c924832abacd
iuc
parents:
2
diff
changeset
|
17 ]]></command> |
0
cbb802a726fd
planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff
changeset
|
18 <inputs> |
3
5bee9adae474
planemo upload for repository https://github.com/galaxyproject/tools-iuc/blob/master/tool_collections/kraken/kraken_filter/ commit e8fc7c9dad5f583ad6763ecb9bd8c924832abacd
iuc
parents:
2
diff
changeset
|
19 <param name="input" type="data" format="tabular" label="Kraken output" help="Select taxonomy classification produced by kraken"/> |
5bee9adae474
planemo upload for repository https://github.com/galaxyproject/tools-iuc/blob/master/tool_collections/kraken/kraken_filter/ commit e8fc7c9dad5f583ad6763ecb9bd8c924832abacd
iuc
parents:
2
diff
changeset
|
20 <param argument="--threshold" type="float" value="0" min="0" max="1" |
5bee9adae474
planemo upload for repository https://github.com/galaxyproject/tools-iuc/blob/master/tool_collections/kraken/kraken_filter/ commit e8fc7c9dad5f583ad6763ecb9bd8c924832abacd
iuc
parents:
2
diff
changeset
|
21 label="Confidence threshold" help="A floating point number between 0 and 1; default=0"/> |
5bee9adae474
planemo upload for repository https://github.com/galaxyproject/tools-iuc/blob/master/tool_collections/kraken/kraken_filter/ commit e8fc7c9dad5f583ad6763ecb9bd8c924832abacd
iuc
parents:
2
diff
changeset
|
22 |
0
cbb802a726fd
planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff
changeset
|
23 <expand macro="input_database" /> |
cbb802a726fd
planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff
changeset
|
24 </inputs> |
cbb802a726fd
planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff
changeset
|
25 <outputs> |
cbb802a726fd
planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff
changeset
|
26 <data format="tabular" name="filtered_output" /> |
cbb802a726fd
planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff
changeset
|
27 </outputs> |
1
7dfb0218e838
planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 3abfc7eb2999fa588862b84c453012c811fa8350
devteam
parents:
0
diff
changeset
|
28 <tests> |
7dfb0218e838
planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 3abfc7eb2999fa588862b84c453012c811fa8350
devteam
parents:
0
diff
changeset
|
29 <test> |
4
3d6570bffdb1
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/blob/master/tool_collections/kraken/ commit 06345505a91f3dcfa8a37dceb6f25e95806dddc8"
iuc
parents:
3
diff
changeset
|
30 <param name="input" value="kraken-filter/kraken_filter_test1.tab"/> |
1
7dfb0218e838
planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 3abfc7eb2999fa588862b84c453012c811fa8350
devteam
parents:
0
diff
changeset
|
31 <param name="threshold" value="0"/> |
4
3d6570bffdb1
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/blob/master/tool_collections/kraken/ commit 06345505a91f3dcfa8a37dceb6f25e95806dddc8"
iuc
parents:
3
diff
changeset
|
32 <param name="kraken_database" value="new_style_test_entry"/> |
3
5bee9adae474
planemo upload for repository https://github.com/galaxyproject/tools-iuc/blob/master/tool_collections/kraken/kraken_filter/ commit e8fc7c9dad5f583ad6763ecb9bd8c924832abacd
iuc
parents:
2
diff
changeset
|
33 |
4
3d6570bffdb1
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/blob/master/tool_collections/kraken/ commit 06345505a91f3dcfa8a37dceb6f25e95806dddc8"
iuc
parents:
3
diff
changeset
|
34 <output name="filtered_output" file="kraken-filter/kraken_filter_test1_output.tab" ftype="tabular"/> |
1
7dfb0218e838
planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 3abfc7eb2999fa588862b84c453012c811fa8350
devteam
parents:
0
diff
changeset
|
35 </test> |
7dfb0218e838
planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 3abfc7eb2999fa588862b84c453012c811fa8350
devteam
parents:
0
diff
changeset
|
36 </tests> |
7dfb0218e838
planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 3abfc7eb2999fa588862b84c453012c811fa8350
devteam
parents:
0
diff
changeset
|
37 |
0
cbb802a726fd
planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff
changeset
|
38 <help> |
cbb802a726fd
planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff
changeset
|
39 <![CDATA[ |
cbb802a726fd
planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff
changeset
|
40 |
cbb802a726fd
planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff
changeset
|
41 .. class:: warningmark |
cbb802a726fd
planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff
changeset
|
42 |
cbb802a726fd
planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff
changeset
|
43 **Note**: the database used must be the same as the one used in the original Kraken run |
cbb802a726fd
planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff
changeset
|
44 |
cbb802a726fd
planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff
changeset
|
45 ----- |
cbb802a726fd
planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff
changeset
|
46 |
cbb802a726fd
planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff
changeset
|
47 **What it does** |
cbb802a726fd
planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff
changeset
|
48 |
cbb802a726fd
planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff
changeset
|
49 At present, we have not yet developed a confidence score with a solid probabilistic interpretation for Kraken. However, we have developed a simple scoring scheme that has yielded good results for us, and we've made that available in the ``kraken-filter`` script. The approach we use allows a user to specify a threshold score in the [0,1] interval; the ``kraken-filter`` script will then adjust labels up the tree until the label's score (described below) meets or exceeds that threshold. If even a label at the root of the taxonomic tree would not have a score that meets or exceeds the threshold, the sequence is called unclassified by ``kraken-filter``. |
cbb802a726fd
planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff
changeset
|
50 |
cbb802a726fd
planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff
changeset
|
51 A sequence label's score is a fraction C/Q, where C is the number of k-mers mapped to LCA values in the clade rooted at the label, and Q is the number of k-mers in the sequence that lack an ambiguous nucleotide (i.e., they were queried against the database). For example, the following LCA mappings in Kraken's output:: |
cbb802a726fd
planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff
changeset
|
52 |
3
5bee9adae474
planemo upload for repository https://github.com/galaxyproject/tools-iuc/blob/master/tool_collections/kraken/kraken_filter/ commit e8fc7c9dad5f583ad6763ecb9bd8c924832abacd
iuc
parents:
2
diff
changeset
|
53 562:13 561:4 A:31 0:1 562:3 |
0
cbb802a726fd
planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff
changeset
|
54 |
cbb802a726fd
planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff
changeset
|
55 would indicate that:: |
cbb802a726fd
planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff
changeset
|
56 |
cbb802a726fd
planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff
changeset
|
57 the first 13 k-mers mapped to taxonomy ID #562 |
cbb802a726fd
planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff
changeset
|
58 the next 4 k-mers mapped to taxonomy ID #561 |
cbb802a726fd
planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff
changeset
|
59 the next 31 k-mers contained an ambiguous nucleotide |
cbb802a726fd
planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff
changeset
|
60 the next k-mer was not in the database |
cbb802a726fd
planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff
changeset
|
61 the last 3 k-mers mapped to taxonomy ID #562 |
cbb802a726fd
planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff
changeset
|
62 |
cbb802a726fd
planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff
changeset
|
63 In this case, ID #561 is the parent node of #562. Here, a label of #562 for this sequence would have a score of C/Q = (13+3)/(13+4+1+3) = 16/21. A label of #561 would have a score of C/Q = (13+4+3)/(13+4+1+3) = 20/21. If a user specified a threshold over 16/21, ``kraken-filter`` would adjust the original label from #562 to #561; if the threshold were greater than 20/21, the sequence would become unclassified. |
cbb802a726fd
planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff
changeset
|
64 ]]> |
cbb802a726fd
planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff
changeset
|
65 </help> |
cbb802a726fd
planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff
changeset
|
66 <expand macro="citations" /> |
cbb802a726fd
planemo upload for repository https://github.com/galaxyproject/tools-devteam/blob/master/tool_collections/kraken/kraken_filter/ commit 00a7926c285bc4a339bd7deebf40b28f39c7d947-dirty
devteam
parents:
diff
changeset
|
67 </tool> |