annotate tools/seq_filter_by_id/seq_filter_by_id.xml @ 6:03e134cae41a draft

v0.2.3, ignore blank lines in ID file (contributed by Gildas Le Corguille)
author peterjc
date Tue, 17 May 2016 05:59:24 -0400
parents 832c1fd57852
children fb1313d79396
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
6
03e134cae41a v0.2.3, ignore blank lines in ID file (contributed by Gildas Le Corguille)
peterjc
parents: 5
diff changeset
1 <tool id="seq_filter_by_id" name="Filter sequences by ID" version="0.2.3">
3
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
2 <description>from a tabular file</description>
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
3 <requirements>
5
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
4 <requirement type="package" version="1.64">biopython</requirement>
3
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
5 <requirement type="python-module">Bio</requirement>
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
6 </requirements>
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
7 <stdio>
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
8 <!-- Anything other than zero is an error -->
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
9 <exit_code range="1:" />
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
10 <exit_code range=":-1" />
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
11 </stdio>
5
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
12 <version_command interpreter="python">seq_filter_by_id.py --version</version_command>
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
13 <command interpreter="python">
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
14 seq_filter_by_id.py -i "$input_file" -f "$input_file.ext"
6
03e134cae41a v0.2.3, ignore blank lines in ID file (contributed by Gildas Le Corguille)
peterjc
parents: 5
diff changeset
15 #if str($output_choice_cond.output_choice)=="both"
03e134cae41a v0.2.3, ignore blank lines in ID file (contributed by Gildas Le Corguille)
peterjc
parents: 5
diff changeset
16 -p "$output_pos" -n "$output_neg"
03e134cae41a v0.2.3, ignore blank lines in ID file (contributed by Gildas Le Corguille)
peterjc
parents: 5
diff changeset
17 #elif str($output_choice_cond.output_choice)=="pos"
03e134cae41a v0.2.3, ignore blank lines in ID file (contributed by Gildas Le Corguille)
peterjc
parents: 5
diff changeset
18 -p "$output_pos"
03e134cae41a v0.2.3, ignore blank lines in ID file (contributed by Gildas Le Corguille)
peterjc
parents: 5
diff changeset
19 #elif str($output_choice_cond.output_choice)=="neg"
03e134cae41a v0.2.3, ignore blank lines in ID file (contributed by Gildas Le Corguille)
peterjc
parents: 5
diff changeset
20 -n "$output_neg"
5
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
21 #end if
6
03e134cae41a v0.2.3, ignore blank lines in ID file (contributed by Gildas Le Corguille)
peterjc
parents: 5
diff changeset
22 #if str($adv_opts.adv_opts_selector)=="advanced" and $adv_opts.strip_suffix
5
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
23 -s
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
24 #end if
6
03e134cae41a v0.2.3, ignore blank lines in ID file (contributed by Gildas Le Corguille)
peterjc
parents: 5
diff changeset
25 #if str($id_opts.id_opts_selector)=="tabular":
5
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
26 ## TODO - Decide on best way to expose multiple ID files via the XML wrapper.
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
27 ## Single tabular file, can call the Python script with either UNION or INTERSECTION
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
28 -l UNION "$id_opts.input_tabular" "$id_opts.columns"
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
29 #else
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
30 -t "$id_opts.id_list"
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
31 #end if
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
32 </command>
3
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
33 <inputs>
5
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
34 <param name="input_file" type="data" format="fasta,fastq,sff" label="Sequence file to be filtered" help="FASTA, FASTQ, or SFF format." />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
35 <conditional name="id_opts">
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
36 <param name="id_opts_selector" type="select" label="Filter using the ID list from">
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
37 <option value="tabular" selected="True">tabular file</option>
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
38 <option value="list">provided list</option>
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
39 <!-- add UNION or INTERSECTION of multiple tabular files here? -->
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
40 </param>
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
41 <when value="tabular">
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
42 <param name="input_tabular" type="data" format="tabular" label="Tabular file containing sequence identifiers"/>
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
43 <param name="columns" type="data_column" data_ref="input_tabular" multiple="True" numerical="False"
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
44 label="Column(s) containing sequence identifiers"
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
45 help="Multi-select list - hold the appropriate key while clicking to select multiple columns">
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
46 <validator type="no_options" message="Pick at least one column"/>
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
47 </param>
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
48 </when>
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
49 <when value="list">
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
50 <param name="id_list" type="text" size="20x80" area="True" format="tabular"
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
51 label="List of sequence identifiers (white space separated)"
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
52 help="You can use both spaces and new lines to separate your identifiers.">
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
53 <sanitizer>
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
54 <valid>
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
55 <!-- default includes underscore, hyphen, etc -->
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
56 <add value="%"/>
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
57 <add value="|"/>
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
58 </valid>
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
59 </sanitizer>
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
60 </param>
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
61 </when>
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
62 </conditional>
3
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
63 <conditional name="output_choice_cond">
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
64 <param name="output_choice" type="select" label="Output positive matches, negative matches, or both?">
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
65 <option value="both">Both positive matches (ID on list) and negative matches (ID not on list), as two files</option>
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
66 <option value="pos">Just positive matches (ID on list), as a single file</option>
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
67 <option value="neg">Just negative matches (ID not on list), as a single file</option>
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
68 </param>
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
69 <!-- It seems we need these dummy entries here; compare this to indels/indel_sam2interval.xml -->
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
70 <when value="both" />
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
71 <when value="pos" />
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
72 <when value="neg" />
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
73 </conditional>
5
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
74 <conditional name="adv_opts">
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
75 <param name="adv_opts_selector" type="select" label="Advanced Options">
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
76 <option value="basic" selected="True">Hide Advanced Options</option>
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
77 <option value="advanced">Show Advanced Options</option>
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
78 </param>
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
79 <when value="basic" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
80 <when value="advanced">
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
81 <param name="strip_suffix" type="boolean" value="false" label="Remove typical pair read name suffixes when matching identifiers?" help="Will remove suffixes including Illumina /1 and /2, Roche 454 .f and .r, and assorted Sanger names like .p* and .q*" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
82 </when>
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
83 </conditional>
3
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
84 </inputs>
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
85 <outputs>
5
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
86 <data name="output_pos" format_source="input_file" metadata_source="input_file" label="$input_file.name with matched ID">
3
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
87 <filter>output_choice_cond["output_choice"] != "neg"</filter>
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
88 </data>
5
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
89 <data name="output_neg" format_source="input_file" metadata_source="input_file" label="$input_file.name without matched ID">
3
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
90 <filter>output_choice_cond["output_choice"] != "pos"</filter>
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
91 </data>
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
92 </outputs>
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
93 <tests>
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
94 <test>
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
95 <param name="input_file" value="k12_ten_proteins.fasta" ftype="fasta" />
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
96 <param name="input_tabular" value="k12_hypothetical.tabular" ftype="tabular" />
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
97 <param name="columns" value="1" />
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
98 <param name="output_choice" value="pos" />
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
99 <output name="output_pos" file="k12_hypothetical.fasta" ftype="fasta" />
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
100 </test>
5
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
101 <test>
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
102 <param name="input_file" value="k12_ten_proteins.fasta" ftype="fasta" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
103 <param name="input_tabular" value="k12_hypothetical_alt.tabular" ftype="tabular" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
104 <param name="columns" value="1" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
105 <param name="output_choice" value="pos" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
106 <param name="adv_opts_selector" value="advanced" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
107 <param name="strip_suffix" value="true" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
108 <output name="output_pos" file="k12_hypothetical.fasta" ftype="fasta" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
109 </test>
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
110 <test>
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
111 <param name="input_file" value="k12_ten_proteins.fasta" ftype="fasta" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
112 <param name="id_opts_selector" value="list" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
113 <param name="id_list" value="gi|16127999|ref|NP_414546.1|" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
114 <param name="output_choice" value="pos" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
115 <output name="output_pos" file="k12_hypothetical.fasta" ftype="fasta" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
116 </test>
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
117 <test>
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
118 <param name="input_file" value="sanger-pairs-mixed.fastq" ftype="fastq" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
119 <param name="id_opts_selector" value="list" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
120 <param name="id_list" value="WTSI_1055_1a05 WTSI_1055_1g02" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
121 <param name="output_choice" value="pos" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
122 <param name="adv_opts_selector" value="advanced" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
123 <param name="strip_suffix" value="true" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
124 <output name="output_pos" file="sanger-sample.fastq" ftype="fastq" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
125 </test>
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
126 <test>
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
127 <param name="input_file" value="sanger-pairs-mixed.fastq" ftype="fastq" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
128 <param name="id_opts_selector" value="tabular" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
129 <param name="input_tabular" value="sanger-pairs-names.tabular" ftype="tabular" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
130 <param name="columns" value="1" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
131 <param name="output_choice" value="both" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
132 <param name="adv_opts_selector" value="advanced" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
133 <param name="strip_suffix" value="true" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
134 <output name="output_pos" file="sanger-pairs-mixed.fastq" ftype="fastq" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
135 <output name="output_neg" file="empty_file.dat" ftype="fastq" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
136 </test>
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
137 <test>
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
138 <param name="input_file" value="sanger-pairs-mixed.fastq" ftype="fastq" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
139 <param name="input_tabular" value="sanger-pairs-names.tabular" ftype="tabular" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
140 <param name="columns" value="1" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
141 <param name="output_choice" value="both" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
142 <param name="adv_opts_selector" value="advanced" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
143 <param name="strip_suffix" value="false" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
144 <output name="output_pos" file="empty_file.dat" ftype="fastq" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
145 <output name="output_neg" file="sanger-pairs-mixed.fastq" ftype="fastq" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
146 </test>
3
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
147 </tests>
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
148 <help>
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
149 **What it does**
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
150
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
151 By default it divides a FASTA, FASTQ or Standard Flowgram Format (SFF) file in
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
152 two, those sequences with or without an ID present in the tabular file column(s)
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
153 specified. You can opt to have a single output file of just the matching records,
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
154 or just the non-matching ones.
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
155
5
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
156 Instead of providing the identifiers in a tabular file, you can alternatively
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
157 provide them as a parameter (type or paste them into the text box). This is a
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
158 useful shortcut for extracting a few sequences of interest without first having
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
159 to prepare a tabular file.
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
160
3
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
161 Note that the order of sequences in the original sequence file is preserved, as
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
162 is any Roche XML Manifest in an SFF file. Also, if any sequences share an
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
163 identifier (which would be very unusual in SFF files), duplicates are not removed.
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
164
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
165 **Example Usage**
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
166
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
167 You may have performed some kind of contamination search, for example running
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
168 BLASTN against a database of cloning vectors or bacteria, giving you a tabular
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
169 file containing read identifiers. You could use this tool to extract only the
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
170 reads without BLAST matches (i.e. those which do not match your contaminant
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
171 database).
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
172
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
173 You may have a file of FASTA sequences which has been used with some analysis
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
174 tool giving tabular output, which has then been filtered on some criteria.
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
175 You can then use this tool to divide the original FASTA file into those entries
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
176 matching or not matching your criteria (those with or without their identifier
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
177 in the filtered tabular file).
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
178
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
179 **References**
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
180
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
181 If you use this Galaxy tool in work leading to a scientific publication please
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
182 cite the following papers:
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
183
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
184 Peter J.A. Cock, Björn A. Grüning, Konrad Paszkiewicz and Leighton Pritchard (2013).
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
185 Galaxy tools and workflows for sequence analysis with applications
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
186 in molecular plant pathology. PeerJ 1:e167
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
187 http://dx.doi.org/10.7717/peerj.167
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
188
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
189 This tool uses Biopython to read and write SFF files, so you may also wish to
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
190 cite the Biopython application note (and Galaxy too of course):
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
191
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
192 Cock et al. (2009). Biopython: freely available Python tools for computational
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
193 molecular biology and bioinformatics. Bioinformatics 25(11) 1422-3.
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
194 http://dx.doi.org/10.1093/bioinformatics/btp163 pmid:19304878.
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
195
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
196 This tool is available to install into other Galaxy Instances via the Galaxy
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
197 Tool Shed at http://toolshed.g2.bx.psu.edu/view/peterjc/seq_filter_by_id
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
198 </help>
5
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
199 <citations>
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
200 <citation type="doi">10.7717/peerj.167</citation>
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
201 <citation type="doi">10.1093/bioinformatics/btp163</citation>
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
202 </citations>
3
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
203 </tool>