annotate tools/primers/seq_primer_clip.xml @ 1:8c02a91a8680 draft

Uploaded v0.0.9, modifies tests to cope with current Tool Shed limitation.
author peterjc
date Tue, 30 Apr 2013 11:04:43 -0400
parents 945053d79e60
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
1
8c02a91a8680 Uploaded v0.0.9, modifies tests to cope with current Tool Shed limitation.
peterjc
parents: 0
diff changeset
1 <tool id="seq_primer_clip" name="Primer clip sequences" version="0.0.9">
0
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
2 <description>Trim off 5' or 3' primers</description>
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
3 <version_command interpreter="python">seq_primer_clip.py --version</version_command>
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
4 <command interpreter="python">
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
5 seq_primer_clip.py $input_file $input_file.ext $primer_fasta $primer_type $mm $min_len $keep_negatives $output_file
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
6 </command>
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
7 <stdio>
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
8 <!-- Anything other than zero is an error -->
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
9 <exit_code range="1:" />
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
10 <exit_code range=":-1" />
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
11 </stdio>
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
12 <inputs>
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
13 <param name="input_file" type="data" format="fasta,fastq,sff" label="Sequence file to clip" description="FASTA, FASTQ, or SFF format."/>
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
14 <param name="primer_fasta" type="data" format="fasta" label="FASTA file containing primer(s)"/>
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
15 <param name="primer_type" type="select" label="Type of primers">
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
16 <option value="Forward">Forward (5') primers</option>
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
17 <option value="Reverse">Reverse (3') primers (given with respect to the forward strand)</option>
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
18 <option value="Reverse-complement">Reverse (3') primers (given with respect to the reverse strand)</option>
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
19 </param>
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
20 <param name="mm" type="integer" value="0" label="How many mismatches to allow? (0, 1 or 2)">
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
21 <validator type="in_range" min="0" max="2" />
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
22 </param>
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
23 <param name="keep_negatives" type="boolean" value="false" label="Keep reads with no matched primer"/>
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
24 <param name="min_len" type="integer" label="Minimum length for (clipped) sequences " value="1"/>
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
25 </inputs>
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
26 <outputs>
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
27 <data name="output_file" format="data" label="$primer_type primer clipped">
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
28 <!-- TODO - Replace this with format="input:input_fastq" if/when that works -->
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
29 <change_format>
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
30 <when input_dataset="input_file" attribute="extension" value="sff" format="sff" />
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
31 <when input_dataset="input_file" attribute="extension" value="fasta" format="fasta" />
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
32 <when input_dataset="input_file" attribute="extension" value="fastq" format="fastq" />
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
33 <when input_dataset="input_file" attribute="extension" value="fastqsanger" format="fastqsanger" />
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
34 <when input_dataset="input_file" attribute="extension" value="fastqsolexa" format="fastqsolexa" />
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
35 <when input_dataset="input_file" attribute="extension" value="fastqillumina" format="fastqillumina" />
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
36 <when input_dataset="input_file" attribute="extension" value="fastqcssanger" format="fastqcssanger" />
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
37 </change_format>
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
38 </data>
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
39 </outputs>
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
40 <tests>
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
41 <test>
1
8c02a91a8680 Uploaded v0.0.9, modifies tests to cope with current Tool Shed limitation.
peterjc
parents: 0
diff changeset
42 <param name="input_file" value="MID4_GLZRM4E04_rnd30.fasta" ftype="fasta" />
8c02a91a8680 Uploaded v0.0.9, modifies tests to cope with current Tool Shed limitation.
peterjc
parents: 0
diff changeset
43 <param name="primer_fasta" value="dop_primers.fasta" />
0
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
44 <param name="primer_type" value="Forward" />
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
45 <param name="mm" value="2" />
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
46 <param name="keep_negatives" value="false" />
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
47 <param name="min_len" value="35" />
1
8c02a91a8680 Uploaded v0.0.9, modifies tests to cope with current Tool Shed limitation.
peterjc
parents: 0
diff changeset
48 <output name="output_file" file="MID4_GLZRM4E04_rnd30_fclip.fasta" ftype="fasta" />
0
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
49 </test>
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
50 <test>
1
8c02a91a8680 Uploaded v0.0.9, modifies tests to cope with current Tool Shed limitation.
peterjc
parents: 0
diff changeset
51 <param name="input_file" value="MID4_GLZRM4E04_rnd30.fastqsanger" ftype="fastqsanger" />
8c02a91a8680 Uploaded v0.0.9, modifies tests to cope with current Tool Shed limitation.
peterjc
parents: 0
diff changeset
52 <param name="primer_fasta" value="dop_primers.fasta" />
0
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
53 <param name="primer_type" value="Forward" />
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
54 <param name="mm" value="2" />
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
55 <param name="keep_negatives" value="false" />
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
56 <param name="min_len" value="35" />
1
8c02a91a8680 Uploaded v0.0.9, modifies tests to cope with current Tool Shed limitation.
peterjc
parents: 0
diff changeset
57 <output name="output_file" file="MID4_GLZRM4E04_rnd30_fclip.fastqsanger" ftype="fastqsanger" />
0
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
58 </test>
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
59 <test>
1
8c02a91a8680 Uploaded v0.0.9, modifies tests to cope with current Tool Shed limitation.
peterjc
parents: 0
diff changeset
60 <param name="input_file" value="MID4_GLZRM4E04_rnd30.sff" ftype="sff" />
8c02a91a8680 Uploaded v0.0.9, modifies tests to cope with current Tool Shed limitation.
peterjc
parents: 0
diff changeset
61 <param name="primer_fasta" value="dop_primers.fasta" />
0
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
62 <param name="primer_type" value="Forward" />
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
63 <param name="mm" value="2" />
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
64 <param name="keep_negatives" value="false" />
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
65 <param name="min_len" value="35" />
1
8c02a91a8680 Uploaded v0.0.9, modifies tests to cope with current Tool Shed limitation.
peterjc
parents: 0
diff changeset
66 <output name="output_file" file="MID4_GLZRM4E04_rnd30_fclip.sff" ftype="sff" />
0
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
67 </test>
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
68 <test>
1
8c02a91a8680 Uploaded v0.0.9, modifies tests to cope with current Tool Shed limitation.
peterjc
parents: 0
diff changeset
69 <param name="input_file" value="MID4_GLZRM4E04_rnd30_fclip.fasta" ftype="fasta" />
8c02a91a8680 Uploaded v0.0.9, modifies tests to cope with current Tool Shed limitation.
peterjc
parents: 0
diff changeset
70 <param name="primer_fasta" value="dop_primers.fasta" />
0
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
71 <param name="primer_type" value="Reverse" />
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
72 <param name="mm" value="2" />
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
73 <param name="keep_negatives" value="true" />
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
74 <param name="min_len" value="35" />
1
8c02a91a8680 Uploaded v0.0.9, modifies tests to cope with current Tool Shed limitation.
peterjc
parents: 0
diff changeset
75 <output name="output_file" file="MID4_GLZRM4E04_rnd30_frclip.fasta" ftype="fasta" />
0
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
76 </test>
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
77 <test>
1
8c02a91a8680 Uploaded v0.0.9, modifies tests to cope with current Tool Shed limitation.
peterjc
parents: 0
diff changeset
78 <param name="input_file" value="MID4_GLZRM4E04_rnd30_fclip.fastqsanger" ftype="fastqsanger" />
8c02a91a8680 Uploaded v0.0.9, modifies tests to cope with current Tool Shed limitation.
peterjc
parents: 0
diff changeset
79 <param name="primer_fasta" value="dop_primers.fasta" />
0
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
80 <param name="primer_type" value="Reverse" />
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
81 <param name="mm" value="2" />
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
82 <param name="keep_negatives" value="true" />
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
83 <param name="min_len" value="35" />
1
8c02a91a8680 Uploaded v0.0.9, modifies tests to cope with current Tool Shed limitation.
peterjc
parents: 0
diff changeset
84 <output name="output_file" file="MID4_GLZRM4E04_rnd30_frclip.fastqsanger" ftype="fastqsanger" />
0
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
85 </test>
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
86 <test>
1
8c02a91a8680 Uploaded v0.0.9, modifies tests to cope with current Tool Shed limitation.
peterjc
parents: 0
diff changeset
87 <param name="input_file" value="MID4_GLZRM4E04_rnd30_fclip.sff" ftype="sff" />
8c02a91a8680 Uploaded v0.0.9, modifies tests to cope with current Tool Shed limitation.
peterjc
parents: 0
diff changeset
88 <param name="primer_fasta" value="dop_primers.fasta" />
0
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
89 <param name="primer_type" value="Reverse" />
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
90 <param name="mm" value="2" />
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
91 <param name="keep_negatives" value="true" />
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
92 <param name="min_len" value="35" />
1
8c02a91a8680 Uploaded v0.0.9, modifies tests to cope with current Tool Shed limitation.
peterjc
parents: 0
diff changeset
93 <output name="output_file" file="MID4_GLZRM4E04_rnd30_frclip.sff" ftype="sff" />
0
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
94 </test>
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
95 </tests>
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
96 <requirements>
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
97 <requirement type="python-module">Bio</requirement>
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
98 </requirements>
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
99 <help>
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
100
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
101 **What it does**
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
102
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
103 Looks for the given primer sequences (within the existing clipped sequence) and
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
104 further clips the reads to remove the primers and any preceding/trailing sequence.
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
105
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
106 Reads containing a forward primer are reduced to just the sequence after (and
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
107 excluding) the forward primer.
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
108
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
109 Reads containing a reverse primer are reduced to just the sequence before (and
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
110 excluding) the reverse primer.
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
111
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
112 Degenerate primers can be specified using the standard IUPAC ambiguity codes,
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
113 thus a primer with an N would match A, C, T or G (or any of the IUPAC ambiguity
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
114 codes) and so on.
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
115
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
116 Note that for SFF files only the clip/trim positions are edited - you will still
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
117 be able to extract the original full read (with any adapter sequence and poor
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
118 quality sequence) if you need to.
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
119
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
120 .. class:: warningmark
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
121
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
122 **Note**. This tool was initially written for Roche 454 data, and should also
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
123 work fine on Sanger or Ion Torrent as well. However, it is probably too slow
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
124 for use on large Illumina datasets.
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
125
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
126
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
127 **Citation**
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
128
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
129 This tool uses Biopython. If you use this tool in scientific work leading to a
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
130 publication, please cite:
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
131
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
132 Cock et al 2009. Biopython: freely available Python tools for computational
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
133 molecular biology and bioinformatics. Bioinformatics 25(11) 1422-3.
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
134 http://dx.doi.org/10.1093/bioinformatics/btp163 pmid:19304878.
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
135
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
136 </help>
945053d79e60 Uploaded v0.0.8, first public release
peterjc
parents:
diff changeset
137 </tool>