annotate tools/seq_select_by_id/seq_select_by_id.xml @ 6:91f55ee8fea5 draft

v0.0.11; more tests and assorting minor changes
author peterjc
date Wed, 13 May 2015 10:56:29 -0400
parents 6842c0c7bc70
children a5602454b0ad
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
6
91f55ee8fea5 v0.0.11; more tests and assorting minor changes
peterjc
parents: 4
diff changeset
1 <tool id="seq_select_by_id" name="Select sequences by ID" version="0.0.11">
4
6842c0c7bc70 Uploaded v0.0.7, depend on Biopython 1.62, tabs to spaces in XML
peterjc
parents:
diff changeset
2 <description>from a tabular file</description>
6842c0c7bc70 Uploaded v0.0.7, depend on Biopython 1.62, tabs to spaces in XML
peterjc
parents:
diff changeset
3 <requirements>
6842c0c7bc70 Uploaded v0.0.7, depend on Biopython 1.62, tabs to spaces in XML
peterjc
parents:
diff changeset
4 <requirement type="package" version="1.62">biopython</requirement>
6842c0c7bc70 Uploaded v0.0.7, depend on Biopython 1.62, tabs to spaces in XML
peterjc
parents:
diff changeset
5 <requirement type="python-module">Bio</requirement>
6842c0c7bc70 Uploaded v0.0.7, depend on Biopython 1.62, tabs to spaces in XML
peterjc
parents:
diff changeset
6 </requirements>
6842c0c7bc70 Uploaded v0.0.7, depend on Biopython 1.62, tabs to spaces in XML
peterjc
parents:
diff changeset
7 <stdio>
6842c0c7bc70 Uploaded v0.0.7, depend on Biopython 1.62, tabs to spaces in XML
peterjc
parents:
diff changeset
8 <!-- Anything other than zero is an error -->
6842c0c7bc70 Uploaded v0.0.7, depend on Biopython 1.62, tabs to spaces in XML
peterjc
parents:
diff changeset
9 <exit_code range="1:" />
6842c0c7bc70 Uploaded v0.0.7, depend on Biopython 1.62, tabs to spaces in XML
peterjc
parents:
diff changeset
10 <exit_code range=":-1" />
6842c0c7bc70 Uploaded v0.0.7, depend on Biopython 1.62, tabs to spaces in XML
peterjc
parents:
diff changeset
11 </stdio>
6
91f55ee8fea5 v0.0.11; more tests and assorting minor changes
peterjc
parents: 4
diff changeset
12 <version_command interpreter="python">seq_select_by_id.py --version</version_command>
91f55ee8fea5 v0.0.11; more tests and assorting minor changes
peterjc
parents: 4
diff changeset
13 <command interpreter="python">
91f55ee8fea5 v0.0.11; more tests and assorting minor changes
peterjc
parents: 4
diff changeset
14 seq_select_by_id.py "$input_tabular" "$column" "$input_file" "$input_file.ext" "$output_file"
91f55ee8fea5 v0.0.11; more tests and assorting minor changes
peterjc
parents: 4
diff changeset
15 </command>
4
6842c0c7bc70 Uploaded v0.0.7, depend on Biopython 1.62, tabs to spaces in XML
peterjc
parents:
diff changeset
16 <inputs>
6842c0c7bc70 Uploaded v0.0.7, depend on Biopython 1.62, tabs to spaces in XML
peterjc
parents:
diff changeset
17 <param name="input_file" type="data" format="fasta,qual,fastq,sff" label="Sequence file to select from" help="FASTA, QUAL, FASTQ, or SFF format." />
6842c0c7bc70 Uploaded v0.0.7, depend on Biopython 1.62, tabs to spaces in XML
peterjc
parents:
diff changeset
18 <param name="input_tabular" type="data" format="tabular" label="Tabular file containing sequence identifiers"/>
6842c0c7bc70 Uploaded v0.0.7, depend on Biopython 1.62, tabs to spaces in XML
peterjc
parents:
diff changeset
19 <param name="column" type="data_column" data_ref="input_tabular" multiple="False" numerical="False" label="Column containing sequence identifiers"/>
6842c0c7bc70 Uploaded v0.0.7, depend on Biopython 1.62, tabs to spaces in XML
peterjc
parents:
diff changeset
20 </inputs>
6842c0c7bc70 Uploaded v0.0.7, depend on Biopython 1.62, tabs to spaces in XML
peterjc
parents:
diff changeset
21 <outputs>
6
91f55ee8fea5 v0.0.11; more tests and assorting minor changes
peterjc
parents: 4
diff changeset
22 <data name="output_file" format_source="input_file" metadata_source="input_file" label="Selected sequences from $input_file.name"/>
4
6842c0c7bc70 Uploaded v0.0.7, depend on Biopython 1.62, tabs to spaces in XML
peterjc
parents:
diff changeset
23 </outputs>
6842c0c7bc70 Uploaded v0.0.7, depend on Biopython 1.62, tabs to spaces in XML
peterjc
parents:
diff changeset
24 <tests>
6842c0c7bc70 Uploaded v0.0.7, depend on Biopython 1.62, tabs to spaces in XML
peterjc
parents:
diff changeset
25 <test>
6842c0c7bc70 Uploaded v0.0.7, depend on Biopython 1.62, tabs to spaces in XML
peterjc
parents:
diff changeset
26 <param name="input_file" value="k12_ten_proteins.fasta" ftype="fasta" />
6842c0c7bc70 Uploaded v0.0.7, depend on Biopython 1.62, tabs to spaces in XML
peterjc
parents:
diff changeset
27 <param name="input_tabular" value="k12_hypothetical.tabular" ftype="tabular" />
6842c0c7bc70 Uploaded v0.0.7, depend on Biopython 1.62, tabs to spaces in XML
peterjc
parents:
diff changeset
28 <param name="column" value="1" />
6842c0c7bc70 Uploaded v0.0.7, depend on Biopython 1.62, tabs to spaces in XML
peterjc
parents:
diff changeset
29 <output name="output_file" file="k12_hypothetical.fasta" ftype="fasta" />
6
91f55ee8fea5 v0.0.11; more tests and assorting minor changes
peterjc
parents: 4
diff changeset
30 <assert_stdout>
91f55ee8fea5 v0.0.11; more tests and assorting minor changes
peterjc
parents: 4
diff changeset
31 <has_line line="Indexed 10 sequences" />
91f55ee8fea5 v0.0.11; more tests and assorting minor changes
peterjc
parents: 4
diff changeset
32 <has_line line="Selected 1 sequences by ID" />
91f55ee8fea5 v0.0.11; more tests and assorting minor changes
peterjc
parents: 4
diff changeset
33 </assert_stdout>
91f55ee8fea5 v0.0.11; more tests and assorting minor changes
peterjc
parents: 4
diff changeset
34 </test>
91f55ee8fea5 v0.0.11; more tests and assorting minor changes
peterjc
parents: 4
diff changeset
35 <!-- this version has white space in the identifier column (id and description) -->
91f55ee8fea5 v0.0.11; more tests and assorting minor changes
peterjc
parents: 4
diff changeset
36 <test>
91f55ee8fea5 v0.0.11; more tests and assorting minor changes
peterjc
parents: 4
diff changeset
37 <param name="input_file" value="k12_ten_proteins.fasta" ftype="fasta" />
91f55ee8fea5 v0.0.11; more tests and assorting minor changes
peterjc
parents: 4
diff changeset
38 <param name="input_tabular" value="k12_hypothetical_alt.tabular" ftype="tabular" />
91f55ee8fea5 v0.0.11; more tests and assorting minor changes
peterjc
parents: 4
diff changeset
39 <param name="column" value="1" />
91f55ee8fea5 v0.0.11; more tests and assorting minor changes
peterjc
parents: 4
diff changeset
40 <output name="output_file" file="k12_hypothetical.fasta" ftype="fasta" />
91f55ee8fea5 v0.0.11; more tests and assorting minor changes
peterjc
parents: 4
diff changeset
41 <assert_stdout>
91f55ee8fea5 v0.0.11; more tests and assorting minor changes
peterjc
parents: 4
diff changeset
42 <has_line line="Indexed 10 sequences" />
91f55ee8fea5 v0.0.11; more tests and assorting minor changes
peterjc
parents: 4
diff changeset
43 <has_line line="Selected 1 sequences by ID" />
91f55ee8fea5 v0.0.11; more tests and assorting minor changes
peterjc
parents: 4
diff changeset
44 </assert_stdout>
91f55ee8fea5 v0.0.11; more tests and assorting minor changes
peterjc
parents: 4
diff changeset
45 <assert_stderr>
91f55ee8fea5 v0.0.11; more tests and assorting minor changes
peterjc
parents: 4
diff changeset
46 <has_line line="WARNING: Some of your identifiers had white space in them, using first word only. e.g.:" />
91f55ee8fea5 v0.0.11; more tests and assorting minor changes
peterjc
parents: 4
diff changeset
47 </assert_stderr>
91f55ee8fea5 v0.0.11; more tests and assorting minor changes
peterjc
parents: 4
diff changeset
48 </test>
91f55ee8fea5 v0.0.11; more tests and assorting minor changes
peterjc
parents: 4
diff changeset
49 <test expect_failure="true" expect_exit_code="1">
91f55ee8fea5 v0.0.11; more tests and assorting minor changes
peterjc
parents: 4
diff changeset
50 <param name="input_file" value="empty.fasta" ftype="fasta" />
91f55ee8fea5 v0.0.11; more tests and assorting minor changes
peterjc
parents: 4
diff changeset
51 <param name="input_tabular" value="k12_hypothetical.tabular" ftype="tabular" />
91f55ee8fea5 v0.0.11; more tests and assorting minor changes
peterjc
parents: 4
diff changeset
52 <param name="column" value="1" />
91f55ee8fea5 v0.0.11; more tests and assorting minor changes
peterjc
parents: 4
diff changeset
53 <assert_stdout>
91f55ee8fea5 v0.0.11; more tests and assorting minor changes
peterjc
parents: 4
diff changeset
54 <has_line line="Indexed 0 sequences" />
91f55ee8fea5 v0.0.11; more tests and assorting minor changes
peterjc
parents: 4
diff changeset
55 </assert_stdout>
91f55ee8fea5 v0.0.11; more tests and assorting minor changes
peterjc
parents: 4
diff changeset
56 <assert_stderr>
91f55ee8fea5 v0.0.11; more tests and assorting minor changes
peterjc
parents: 4
diff changeset
57 <has_line line="Identifier 'gi|16127999|ref|NP_414546.1|' not found in sequence file" />
91f55ee8fea5 v0.0.11; more tests and assorting minor changes
peterjc
parents: 4
diff changeset
58 </assert_stderr>
4
6842c0c7bc70 Uploaded v0.0.7, depend on Biopython 1.62, tabs to spaces in XML
peterjc
parents:
diff changeset
59 </test>
6842c0c7bc70 Uploaded v0.0.7, depend on Biopython 1.62, tabs to spaces in XML
peterjc
parents:
diff changeset
60 </tests>
6842c0c7bc70 Uploaded v0.0.7, depend on Biopython 1.62, tabs to spaces in XML
peterjc
parents:
diff changeset
61 <help>
6842c0c7bc70 Uploaded v0.0.7, depend on Biopython 1.62, tabs to spaces in XML
peterjc
parents:
diff changeset
62 **What it does**
6842c0c7bc70 Uploaded v0.0.7, depend on Biopython 1.62, tabs to spaces in XML
peterjc
parents:
diff changeset
63
6842c0c7bc70 Uploaded v0.0.7, depend on Biopython 1.62, tabs to spaces in XML
peterjc
parents:
diff changeset
64 Takes a FASTA, QUAL, FASTQ or Standard Flowgram Format (SFF) file and produces a
6842c0c7bc70 Uploaded v0.0.7, depend on Biopython 1.62, tabs to spaces in XML
peterjc
parents:
diff changeset
65 new sequence file (of the same format) containing only the records with identifiers
6842c0c7bc70 Uploaded v0.0.7, depend on Biopython 1.62, tabs to spaces in XML
peterjc
parents:
diff changeset
66 in the tabular file (in the order from the tabular file).
6842c0c7bc70 Uploaded v0.0.7, depend on Biopython 1.62, tabs to spaces in XML
peterjc
parents:
diff changeset
67
6842c0c7bc70 Uploaded v0.0.7, depend on Biopython 1.62, tabs to spaces in XML
peterjc
parents:
diff changeset
68 WARNING: If you have any duplicates in the tabular file identifiers, you will get
6842c0c7bc70 Uploaded v0.0.7, depend on Biopython 1.62, tabs to spaces in XML
peterjc
parents:
diff changeset
69 duplicate sequences in the output.
6842c0c7bc70 Uploaded v0.0.7, depend on Biopython 1.62, tabs to spaces in XML
peterjc
parents:
diff changeset
70
6842c0c7bc70 Uploaded v0.0.7, depend on Biopython 1.62, tabs to spaces in XML
peterjc
parents:
diff changeset
71 **References**
6842c0c7bc70 Uploaded v0.0.7, depend on Biopython 1.62, tabs to spaces in XML
peterjc
parents:
diff changeset
72
6842c0c7bc70 Uploaded v0.0.7, depend on Biopython 1.62, tabs to spaces in XML
peterjc
parents:
diff changeset
73 If you use this Galaxy tool in work leading to a scientific publication, please
6842c0c7bc70 Uploaded v0.0.7, depend on Biopython 1.62, tabs to spaces in XML
peterjc
parents:
diff changeset
74 cite the following papers:
6842c0c7bc70 Uploaded v0.0.7, depend on Biopython 1.62, tabs to spaces in XML
peterjc
parents:
diff changeset
75
6842c0c7bc70 Uploaded v0.0.7, depend on Biopython 1.62, tabs to spaces in XML
peterjc
parents:
diff changeset
76 Peter J.A. Cock, Björn A. Grüning, Konrad Paszkiewicz and Leighton Pritchard (2013).
6842c0c7bc70 Uploaded v0.0.7, depend on Biopython 1.62, tabs to spaces in XML
peterjc
parents:
diff changeset
77 Galaxy tools and workflows for sequence analysis with applications
6842c0c7bc70 Uploaded v0.0.7, depend on Biopython 1.62, tabs to spaces in XML
peterjc
parents:
diff changeset
78 in molecular plant pathology. PeerJ 1:e167
6842c0c7bc70 Uploaded v0.0.7, depend on Biopython 1.62, tabs to spaces in XML
peterjc
parents:
diff changeset
79 https://doi.org/10.7717/peerj.167
6842c0c7bc70 Uploaded v0.0.7, depend on Biopython 1.62, tabs to spaces in XML
peterjc
parents:
diff changeset
80
6842c0c7bc70 Uploaded v0.0.7, depend on Biopython 1.62, tabs to spaces in XML
peterjc
parents:
diff changeset
81 This tool uses Biopython to read, write and index sequence files, so you may
6842c0c7bc70 Uploaded v0.0.7, depend on Biopython 1.62, tabs to spaces in XML
peterjc
parents:
diff changeset
82 also wish to cite the Biopython application note (and Galaxy too of course):
6842c0c7bc70 Uploaded v0.0.7, depend on Biopython 1.62, tabs to spaces in XML
peterjc
parents:
diff changeset
83
6842c0c7bc70 Uploaded v0.0.7, depend on Biopython 1.62, tabs to spaces in XML
peterjc
parents:
diff changeset
84 Cock et al. (2009). Biopython: freely available Python tools for computational
6842c0c7bc70 Uploaded v0.0.7, depend on Biopython 1.62, tabs to spaces in XML
peterjc
parents:
diff changeset
85 molecular biology and bioinformatics. Bioinformatics 25(11) 1422-3.
6842c0c7bc70 Uploaded v0.0.7, depend on Biopython 1.62, tabs to spaces in XML
peterjc
parents:
diff changeset
86 https://doi.org/10.1093/bioinformatics/btp163 pmid:19304878.
6842c0c7bc70 Uploaded v0.0.7, depend on Biopython 1.62, tabs to spaces in XML
peterjc
parents:
diff changeset
87
6842c0c7bc70 Uploaded v0.0.7, depend on Biopython 1.62, tabs to spaces in XML
peterjc
parents:
diff changeset
88 This tool is available to install into other Galaxy instances via the Galaxy
6842c0c7bc70 Uploaded v0.0.7, depend on Biopython 1.62, tabs to spaces in XML
peterjc
parents:
diff changeset
89 Tool Shed at http://toolshed.g2.bx.psu.edu/view/peterjc/seq_select_by_id
6842c0c7bc70 Uploaded v0.0.7, depend on Biopython 1.62, tabs to spaces in XML
peterjc
parents:
diff changeset
90 </help>
6
91f55ee8fea5 v0.0.11; more tests and assorting minor changes
peterjc
parents: 4
diff changeset
91 <citations>
91f55ee8fea5 v0.0.11; more tests and assorting minor changes
peterjc
parents: 4
diff changeset
92 <citation type="doi">10.7717/peerj.167</citation>
91f55ee8fea5 v0.0.11; more tests and assorting minor changes
peterjc
parents: 4
diff changeset
93 <citation type="doi">10.1093/bioinformatics/btp163</citation>
91f55ee8fea5 v0.0.11; more tests and assorting minor changes
peterjc
parents: 4
diff changeset
94 </citations>
4
6842c0c7bc70 Uploaded v0.0.7, depend on Biopython 1.62, tabs to spaces in XML
peterjc
parents:
diff changeset
95 </tool>