annotate tools/blastxml_to_top_descr/blastxml_to_top_descr.xml @ 13:8dc4ba7eba5d draft default tip

v0.1.2 with Python 3.9 declaration
author peterjc
date Sun, 17 Sep 2023 13:01:56 +0000
parents fe1ed74793c9
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
13
8dc4ba7eba5d v0.1.2 with Python 3.9 declaration
peterjc
parents: 12
diff changeset
1 <tool id="blastxml_to_top_descr" name="BLAST top hit descriptions" version="0.1.2" profile="16.10">
11
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
2 <description>Make a table from BLAST output</description>
13
8dc4ba7eba5d v0.1.2 with Python 3.9 declaration
peterjc
parents: 12
diff changeset
3 <requirements>
8dc4ba7eba5d v0.1.2 with Python 3.9 declaration
peterjc
parents: 12
diff changeset
4 <requirement type="package" version="3.9">python</requirement>
8dc4ba7eba5d v0.1.2 with Python 3.9 declaration
peterjc
parents: 12
diff changeset
5 </requirements>
8dc4ba7eba5d v0.1.2 with Python 3.9 declaration
peterjc
parents: 12
diff changeset
6 <version_command>
8dc4ba7eba5d v0.1.2 with Python 3.9 declaration
peterjc
parents: 12
diff changeset
7 python $__tool_directory__/blastxml_to_top_descr.py --version
8dc4ba7eba5d v0.1.2 with Python 3.9 declaration
peterjc
parents: 12
diff changeset
8 </version_command>
8dc4ba7eba5d v0.1.2 with Python 3.9 declaration
peterjc
parents: 12
diff changeset
9 <command detect_errors="aggressive">
8dc4ba7eba5d v0.1.2 with Python 3.9 declaration
peterjc
parents: 12
diff changeset
10 python $__tool_directory__/blastxml_to_top_descr.py
8dc4ba7eba5d v0.1.2 with Python 3.9 declaration
peterjc
parents: 12
diff changeset
11 -f '$input.in_format'
11
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
12 #if $input.in_format == "tabular":
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
13 --qseqid $input.qseqid
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
14 --sseqid $input.sseqid
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
15 --salltitles $input.salltitles
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
16 #end if
13
8dc4ba7eba5d v0.1.2 with Python 3.9 declaration
peterjc
parents: 12
diff changeset
17 -o '${tabular_file}'
11
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
18 -t ${topN}
13
8dc4ba7eba5d v0.1.2 with Python 3.9 declaration
peterjc
parents: 12
diff changeset
19 '${in_file}'
11
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
20 </command>
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
21 <inputs>
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
22 <conditional name="input">
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
23 <param name="in_format" type="select" label="Input format">
13
8dc4ba7eba5d v0.1.2 with Python 3.9 declaration
peterjc
parents: 12
diff changeset
24 <option value="blastxml" selected="true">BLAST XML</option>
11
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
25 <option value="tabular">Tabular</option>
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
26 </param>
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
27 <when value="blastxml">
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
28 <param name="in_file" type="data" format="blastxml" label="BLAST results as XML"/>
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
29 </when>
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
30 <when value="tabular">
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
31 <param name="in_file" type="data" format="tabular" label="BLAST results as tabular"/>
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
32 <param name="qseqid" type="data_column" data_ref="in_file"
13
8dc4ba7eba5d v0.1.2 with Python 3.9 declaration
peterjc
parents: 12
diff changeset
33 multiple="false" numerical="false" default_value="1" value="1"
8dc4ba7eba5d v0.1.2 with Python 3.9 declaration
peterjc
parents: 12
diff changeset
34 label="Column containing query ID (qseqid)"
8dc4ba7eba5d v0.1.2 with Python 3.9 declaration
peterjc
parents: 12
diff changeset
35 help="This is column 1 in standard BLAST tabular output" />
8dc4ba7eba5d v0.1.2 with Python 3.9 declaration
peterjc
parents: 12
diff changeset
36 <param name="sseqid" type="data_column" data_ref="in_file"
8dc4ba7eba5d v0.1.2 with Python 3.9 declaration
peterjc
parents: 12
diff changeset
37 multiple="false" numerical="false" default_value="2" value="2"
8dc4ba7eba5d v0.1.2 with Python 3.9 declaration
peterjc
parents: 12
diff changeset
38 label="Column containing match ID (sseqid)"
8dc4ba7eba5d v0.1.2 with Python 3.9 declaration
peterjc
parents: 12
diff changeset
39 help="This is column 2 in standard BLAST tabular output"/>
11
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
40 <param name="salltitles" type="data_column" data_ref="in_file"
13
8dc4ba7eba5d v0.1.2 with Python 3.9 declaration
peterjc
parents: 12
diff changeset
41 multiple="false" numerical="false" default_value="25" value="25"
11
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
42 label="Column containing containing descriptions (salltitles)"
13
8dc4ba7eba5d v0.1.2 with Python 3.9 declaration
peterjc
parents: 12
diff changeset
43 help="This is column 25 in the default extended BLAST tabular output"/>
11
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
44 </when>
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
45 </conditional>
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
46 <param name="topN" type="integer" min="1" max="100" optional="false" label="Number of descriptions" value="3"/>
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
47 </inputs>
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
48 <outputs>
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
49 <data name="tabular_file" format="tabular" label="Top $topN descriptions from $input.in_file.name" />
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
50 </outputs>
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
51 <tests>
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
52 <test>
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
53 <param name="in_format" value="blastxml" />
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
54 <param name="in_file" value="blastp_four_human_vs_rhodopsin.xml" ftype="blastxml" />
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
55 <param name="topN" value="3" />
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
56 <output name="tabular_file" file="blastp_four_human_vs_rhodopsin_top3.tabular" ftype="tabular" />
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
57 </test>
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
58 <test>
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
59 <param name="in_format" value="tabular" />
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
60 <param name="in_file" value="blastp_four_human_vs_rhodopsin_converted_ext.tabular" ftype="tabular" />
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
61 <param name="topN" value="3" />
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
62 <output name="tabular_file" file="blastp_four_human_vs_rhodopsin_top3_positive.tabular" ftype="tabular" />
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
63 </test>
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
64 </tests>
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
65 <help>
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
66
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
67 **What it does**
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
68
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
69 NCBI BLAST+ (and the older NCBI 'legacy' BLAST) can output in a range of
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
70 formats including text, tabular and a more detailed XML format. You can
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
71 do a lot of things with tabular files in Galaxy (sorting, filtering, joins,
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
72 etc), however until BLAST+ 2.2.28 the tabular output never included the
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
73 hit descriptions (titles) found in the other output formats.
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
74
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
75 This tool turns a BLAST XML file into a simple tabular file containing
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
76 one row per query sequence, containing the query identifier and then
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
77 the three (by default) top hit descriptions (i.e. the first three). If
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
78 a query doesn't have that many hits, then these entries are left blank.
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
79
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
80 This tool can also be used with the tabular output from BLAST+ instead,
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
81 provided the relevant columns are provided. The default settings will
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
82 work with the default 25 column extended output from the BLAST+ tools
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
83 wrapped in Galaxy. Note if a query has *no* hits, it does not appear in
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
84 the BLAST tabular output.
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
85
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
86 **Example Usage**
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
87
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
88 One simple usage would be to take a transcriptome assembly or set of
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
89 gene predictions, run a BLAST search against the NCBI NR database, and
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
90 then use this tool to make a table of the top three BLAST hits. This
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
91 can give you a 'quick and dirty' crude annotation, potentially enough
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
92 to spot some problems (e.g. bacterial contaimination could be very
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
93 obvious).
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
94
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
95 **References**
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
96
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
97 If you use this Galaxy tool in work leading to a scientific publication please
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
98 cite:
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
99
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
100 Peter J.A. Cock, Björn A. Grüning, Konrad Paszkiewicz and Leighton Pritchard (2013).
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
101 Galaxy tools and workflows for sequence analysis with applications
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
102 in molecular plant pathology. PeerJ 1:e167
13
8dc4ba7eba5d v0.1.2 with Python 3.9 declaration
peterjc
parents: 12
diff changeset
103 https://doi.org/10.7717/peerj.167
11
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
104
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
105 This wrapper is available to install into other Galaxy Instances via the Galaxy
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
106 Tool Shed at http://toolshed.g2.bx.psu.edu/view/peterjc/blastxml_to_top_descr
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
107
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
108 </help>
12
fe1ed74793c9 Uploaded v0.1.1, embed citation in tool XML
peterjc
parents: 11
diff changeset
109 <citations>
fe1ed74793c9 Uploaded v0.1.1, embed citation in tool XML
peterjc
parents: 11
diff changeset
110 <citation type="doi">10.7717/peerj.167</citation>
fe1ed74793c9 Uploaded v0.1.1, embed citation in tool XML
peterjc
parents: 11
diff changeset
111 </citations>
11
98f8431dab44 Uploaded v0.1.0, now also handles extended tabular BLAST output.
peterjc
parents:
diff changeset
112 </tool>