annotate tools/seq_filter_by_id/seq_filter_by_id.xml @ 7:fb1313d79396 draft

Uploaded v0.2.5, ignore blank names in tabular files (based on contribution from Gildas Le Corguille)
author peterjc
date Fri, 04 Nov 2016 08:11:08 -0400
parents 03e134cae41a
children 2d4537dbf0bc
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
7
fb1313d79396 Uploaded v0.2.5, ignore blank names in tabular files (based on contribution from Gildas Le Corguille)
peterjc
parents: 6
diff changeset
1 <tool id="seq_filter_by_id" name="Filter sequences by ID" version="0.2.5">
3
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
2 <description>from a tabular file</description>
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
3 <requirements>
5
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
4 <requirement type="package" version="1.64">biopython</requirement>
3
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
5 </requirements>
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
6 <stdio>
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
7 <!-- Anything other than zero is an error -->
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
8 <exit_code range="1:" />
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
9 <exit_code range=":-1" />
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
10 </stdio>
5
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
11 <version_command interpreter="python">seq_filter_by_id.py --version</version_command>
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
12 <command interpreter="python">
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
13 seq_filter_by_id.py -i "$input_file" -f "$input_file.ext"
6
03e134cae41a v0.2.3, ignore blank lines in ID file (contributed by Gildas Le Corguille)
peterjc
parents: 5
diff changeset
14 #if str($output_choice_cond.output_choice)=="both"
03e134cae41a v0.2.3, ignore blank lines in ID file (contributed by Gildas Le Corguille)
peterjc
parents: 5
diff changeset
15 -p "$output_pos" -n "$output_neg"
03e134cae41a v0.2.3, ignore blank lines in ID file (contributed by Gildas Le Corguille)
peterjc
parents: 5
diff changeset
16 #elif str($output_choice_cond.output_choice)=="pos"
03e134cae41a v0.2.3, ignore blank lines in ID file (contributed by Gildas Le Corguille)
peterjc
parents: 5
diff changeset
17 -p "$output_pos"
03e134cae41a v0.2.3, ignore blank lines in ID file (contributed by Gildas Le Corguille)
peterjc
parents: 5
diff changeset
18 #elif str($output_choice_cond.output_choice)=="neg"
03e134cae41a v0.2.3, ignore blank lines in ID file (contributed by Gildas Le Corguille)
peterjc
parents: 5
diff changeset
19 -n "$output_neg"
5
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
20 #end if
6
03e134cae41a v0.2.3, ignore blank lines in ID file (contributed by Gildas Le Corguille)
peterjc
parents: 5
diff changeset
21 #if str($adv_opts.adv_opts_selector)=="advanced" and $adv_opts.strip_suffix
5
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
22 -s
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
23 #end if
6
03e134cae41a v0.2.3, ignore blank lines in ID file (contributed by Gildas Le Corguille)
peterjc
parents: 5
diff changeset
24 #if str($id_opts.id_opts_selector)=="tabular":
5
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
25 ## TODO - Decide on best way to expose multiple ID files via the XML wrapper.
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
26 ## Single tabular file, can call the Python script with either UNION or INTERSECTION
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
27 -l UNION "$id_opts.input_tabular" "$id_opts.columns"
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
28 #else
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
29 -t "$id_opts.id_list"
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
30 #end if
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
31 </command>
3
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
32 <inputs>
5
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
33 <param name="input_file" type="data" format="fasta,fastq,sff" label="Sequence file to be filtered" help="FASTA, FASTQ, or SFF format." />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
34 <conditional name="id_opts">
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
35 <param name="id_opts_selector" type="select" label="Filter using the ID list from">
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
36 <option value="tabular" selected="True">tabular file</option>
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
37 <option value="list">provided list</option>
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
38 <!-- add UNION or INTERSECTION of multiple tabular files here? -->
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
39 </param>
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
40 <when value="tabular">
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
41 <param name="input_tabular" type="data" format="tabular" label="Tabular file containing sequence identifiers"/>
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
42 <param name="columns" type="data_column" data_ref="input_tabular" multiple="True" numerical="False"
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
43 label="Column(s) containing sequence identifiers"
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
44 help="Multi-select list - hold the appropriate key while clicking to select multiple columns">
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
45 <validator type="no_options" message="Pick at least one column"/>
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
46 </param>
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
47 </when>
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
48 <when value="list">
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
49 <param name="id_list" type="text" size="20x80" area="True" format="tabular"
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
50 label="List of sequence identifiers (white space separated)"
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
51 help="You can use both spaces and new lines to separate your identifiers.">
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
52 <sanitizer>
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
53 <valid>
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
54 <!-- default includes underscore, hyphen, etc -->
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
55 <add value="%"/>
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
56 <add value="|"/>
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
57 </valid>
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
58 </sanitizer>
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
59 </param>
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
60 </when>
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
61 </conditional>
3
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
62 <conditional name="output_choice_cond">
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
63 <param name="output_choice" type="select" label="Output positive matches, negative matches, or both?">
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
64 <option value="both">Both positive matches (ID on list) and negative matches (ID not on list), as two files</option>
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
65 <option value="pos">Just positive matches (ID on list), as a single file</option>
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
66 <option value="neg">Just negative matches (ID not on list), as a single file</option>
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
67 </param>
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
68 <!-- Seems need these dummy entries here, compare this to indels/indel_sam2interval.xml -->
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
69 <when value="both" />
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
70 <when value="pos" />
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
71 <when value="neg" />
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
72 </conditional>
5
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
73 <conditional name="adv_opts">
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
74 <param name="adv_opts_selector" type="select" label="Advanced Options">
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
75 <option value="basic" selected="True">Hide Advanced Options</option>
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
76 <option value="advanced">Show Advanced Options</option>
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
77 </param>
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
78 <when value="basic" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
79 <when value="advanced">
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
80 <param name="strip_suffix" type="boolean" value="false" label="Remove typical pair read name suffices when matching identifiers?" help="Will remove suffices including Illumina /1 and /2, Roche 454 .f and .r, and assorted Sanger names like .p* and .q*" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
81 </when>
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
82 </conditional>
3
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
83 </inputs>
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
84 <outputs>
5
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
85 <data name="output_pos" format_source="input_file" metadata_source="input_file" label="$input_file.name with matched ID">
3
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
86 <filter>output_choice_cond["output_choice"] != "neg"</filter>
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
87 </data>
5
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
88 <data name="output_neg" format_source="input_file" metadata_source="input_file" label="$input_file.name without matched ID">
3
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
89 <filter>output_choice_cond["output_choice"] != "pos"</filter>
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
90 </data>
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
91 </outputs>
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
92 <tests>
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
93 <test>
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
94 <param name="input_file" value="k12_ten_proteins.fasta" ftype="fasta" />
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
95 <param name="input_tabular" value="k12_hypothetical.tabular" ftype="tabular" />
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
96 <param name="columns" value="1" />
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
97 <param name="output_choice" value="pos" />
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
98 <output name="output_pos" file="k12_hypothetical.fasta" ftype="fasta" />
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
99 </test>
5
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
100 <test>
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
101 <param name="input_file" value="k12_ten_proteins.fasta" ftype="fasta" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
102 <param name="input_tabular" value="k12_hypothetical_alt.tabular" ftype="tabular" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
103 <param name="columns" value="1" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
104 <param name="output_choice" value="pos" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
105 <param name="adv_opts_selector" value="advanced" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
106 <param name="strip_suffix" value="true" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
107 <output name="output_pos" file="k12_hypothetical.fasta" ftype="fasta" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
108 </test>
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
109 <test>
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
110 <param name="input_file" value="k12_ten_proteins.fasta" ftype="fasta" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
111 <param name="id_opts_selector" value="list" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
112 <param name="id_list" value="gi|16127999|ref|NP_414546.1|" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
113 <param name="output_choice" value="pos" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
114 <output name="output_pos" file="k12_hypothetical.fasta" ftype="fasta" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
115 </test>
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
116 <test>
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
117 <param name="input_file" value="sanger-pairs-mixed.fastq" ftype="fastq" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
118 <param name="id_opts_selector" value="list" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
119 <param name="id_list" value="WTSI_1055_1a05 WTSI_1055_1g02" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
120 <param name="output_choice" value="pos" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
121 <param name="adv_opts_selector" value="advanced" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
122 <param name="strip_suffix" value="true" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
123 <output name="output_pos" file="sanger-sample.fastq" ftype="fastq" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
124 </test>
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
125 <test>
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
126 <param name="input_file" value="sanger-pairs-mixed.fastq" ftype="fastq" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
127 <param name="id_opts_selector" value="tabular" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
128 <param name="input_tabular" value="sanger-pairs-names.tabular" ftype="tabular" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
129 <param name="columns" value="1" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
130 <param name="output_choice" value="both" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
131 <param name="adv_opts_selector" value="advanced" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
132 <param name="strip_suffix" value="true" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
133 <output name="output_pos" file="sanger-pairs-mixed.fastq" ftype="fastq" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
134 <output name="output_neg" file="empty_file.dat" ftype="fastq" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
135 </test>
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
136 <test>
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
137 <param name="input_file" value="sanger-pairs-mixed.fastq" ftype="fastq" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
138 <param name="input_tabular" value="sanger-pairs-names.tabular" ftype="tabular" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
139 <param name="columns" value="1" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
140 <param name="output_choice" value="both" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
141 <param name="adv_opts_selector" value="advanced" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
142 <param name="strip_suffix" value="false" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
143 <output name="output_pos" file="empty_file.dat" ftype="fastq" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
144 <output name="output_neg" file="sanger-pairs-mixed.fastq" ftype="fastq" />
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
145 </test>
3
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
146 </tests>
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
147 <help>
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
148 **What it does**
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
149
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
150 By default it divides a FASTA, FASTQ or Standard Flowgram Format (SFF) file in
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
151 two, those sequences with or without an ID present in the tabular file column(s)
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
152 specified. You can opt to have a single output file of just the matching records,
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
153 or just the non-matching ones.
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
154
5
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
155 Instead of providing the identifiers in a tabular file, you can alternatively
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
156 provide them as a parameter (type or paste them into the text box). This is a
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
157 useful shortcut for extracting a few sequences of interest without first having
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
158 to prepare a tabular file.
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
159
3
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
160 Note that the order of sequences in the original sequence file is preserved, as
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
161 is any Roche XML Manifest in an SFF file. Also, if any sequences share an
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
162 identifier (which would be very unusual in SFF files), duplicates are not removed.
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
163
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
164 **Example Usage**
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
165
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
166 You may have performed some kind of contamination search, for example running
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
167 BLASTN against a database of cloning vectors or bacteria, giving you a tabular
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
168 file containing read identifiers. You could use this tool to extract only the
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
169 reads without BLAST matches (i.e. those which do not match your contaminant
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
170 database).
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
171
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
172 You may have a file of FASTA sequences which has been used with some analysis
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
173 tool giving tabular output, which has then been filtered on some criteria.
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
174 You can then use this tool to divide the original FASTA file into those entries
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
175 matching or not matching your criteria (those with or without their identifier
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
176 in the filtered tabular file).
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
177
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
178 **References**
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
179
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
180 If you use this Galaxy tool in work leading to a scientific publication please
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
181 cite the following papers:
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
182
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
183 Peter J.A. Cock, Björn A. Grüning, Konrad Paszkiewicz and Leighton Pritchard (2013).
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
184 Galaxy tools and workflows for sequence analysis with applications
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
185 in molecular plant pathology. PeerJ 1:e167
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
186 http://dx.doi.org/10.7717/peerj.167
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
187
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
188 This tool uses Biopython to read and write SFF files, so you may also wish to
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
189 cite the Biopython application note (and Galaxy too of course):
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
190
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
191 Cock et al (2009). Biopython: freely available Python tools for computational
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
192 molecular biology and bioinformatics. Bioinformatics 25(11) 1422-3.
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
193 http://dx.doi.org/10.1093/bioinformatics/btp163 pmid:19304878.
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
194
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
195 This tool is available to install into other Galaxy Instances via the Galaxy
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
196 Tool Shed at http://toolshed.g2.bx.psu.edu/view/peterjc/seq_filter_by_id
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
197 </help>
5
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
198 <citations>
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
199 <citation type="doi">10.7717/peerj.167</citation>
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
200 <citation type="doi">10.1093/bioinformatics/btp163</citation>
832c1fd57852 v0.2.2; New options for IDs via text parameter, ignore paired read suffix; misc changes
peterjc
parents: 3
diff changeset
201 </citations>
3
44ab4c0f7683 Uploaded v0.0.6, automatic dependency on Biopython 1.62, new README file, citation information, MIT licence
peterjc
parents:
diff changeset
202 </tool>