annotate je-clip.xml @ 2:b61628ae2371 draft

planemo upload for repository https://git.embl.de/grp-gbcs/Je/tree/master/src/galaxy commit 62411561ae3bc65ea8762d27ec79a7d912503e5b
author gbcs-embl-heidelberg
date Wed, 07 Dec 2016 11:57:50 -0500
parents 101525093ba1
children 2cfed59e4d27
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
1 <tool id="je_clip" name="Je-Clip" version="1.0">
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
2 <description>clips Unique Molecular Identifiers (UMIs) from fastq files</description>
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
3 <macros>
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
4 <import>macros.xml</import>
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
5 </macros>
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
6 <stdio>
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
7 <exit_code range="1:" level="fatal" description="Tool exception" />
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
8 </stdio>
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
9 <version_command>echo '1.0'</version_command>
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
10 <command interpreter="bash">
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
11 <![CDATA[
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
12 je clip
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
13
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
14 ## Fastq inputs
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
15 @single_or_paired_cmd@
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
16 #if str( $library.type ) != "single":
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
17 BPOS=${library.BPOS}
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
18 #end if
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
19
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
20 @common_options_cmd@
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
21 @barcode_len_cmd@
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
22 ADD=${ADD}
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
23 #if str($ADD) == "false":
2
b61628ae2371 planemo upload for repository https://git.embl.de/grp-gbcs/Je/tree/master/src/galaxy commit 62411561ae3bc65ea8762d27ec79a7d912503e5b
gbcs-embl-heidelberg
parents: 0
diff changeset
24 BARCODE_RESULT_FILENAME=${BARCODE_RESULT_FILENAME}
0
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
25 #end if
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
26
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
27 OF1=${OF1}
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
28 #if str( $library.type ) != "single":
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
29 OF2=${OF2}
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
30 #end if
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
31
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
32 FORCE=true
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
33 ]]>
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
34 </command>
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
35 <inputs>
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
36 <!-- single/paired -->
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
37 <expand macro="single_or_paired_general">
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
38 <param name="BPOS" type="select" label="Barcode read position (BPOS)" help="where are the barcodes.">
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
39 <option value="READ_1" selected="true">READ_1 (beginning of read from the first fastq file)</option>
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
40 <option value="READ_2">READ_2 (beginning of read from the second fastq file)</option>
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
41 <option value="BOTH">BOTH (beginning of both reads)</option>
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
42 </param>
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
43 </expand>
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
44 <expand macro="barcode_len_option"/>
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
45 <param name="ADD" type="boolean"
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
46 label="Add matched barcode at the end of the read header (ADD)"
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
47 truevalue="true"
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
48 falsevalue="false"
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
49 checked="true"
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
50 />
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
51
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
52 <expand macro="common_options"/>
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
53
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
54
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
55 </inputs>
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
56 <outputs>
2
b61628ae2371 planemo upload for repository https://git.embl.de/grp-gbcs/Je/tree/master/src/galaxy commit 62411561ae3bc65ea8762d27ec79a7d912503e5b
gbcs-embl-heidelberg
parents: 0
diff changeset
57 <data name="BARCODE_RESULT_FILENAME" format="tabular" label="Je-Clipped Barcodes">
b61628ae2371 planemo upload for repository https://git.embl.de/grp-gbcs/Je/tree/master/src/galaxy commit 62411561ae3bc65ea8762d27ec79a7d912503e5b
gbcs-embl-heidelberg
parents: 0
diff changeset
58 <filter>!ADD</filter>
b61628ae2371 planemo upload for repository https://git.embl.de/grp-gbcs/Je/tree/master/src/galaxy commit 62411561ae3bc65ea8762d27ec79a7d912503e5b
gbcs-embl-heidelberg
parents: 0
diff changeset
59 </data>
b61628ae2371 planemo upload for repository https://git.embl.de/grp-gbcs/Je/tree/master/src/galaxy commit 62411561ae3bc65ea8762d27ec79a7d912503e5b
gbcs-embl-heidelberg
parents: 0
diff changeset
60 <data name="OF1" format_source="input_1" label="Je-Clip OF1: ${on_string}"/>
b61628ae2371 planemo upload for repository https://git.embl.de/grp-gbcs/Je/tree/master/src/galaxy commit 62411561ae3bc65ea8762d27ec79a7d912503e5b
gbcs-embl-heidelberg
parents: 0
diff changeset
61 <data name="OF2" format_source="input_2" label="Je-Clip OF2: ${on_string}">
b61628ae2371 planemo upload for repository https://git.embl.de/grp-gbcs/Je/tree/master/src/galaxy commit 62411561ae3bc65ea8762d27ec79a7d912503e5b
gbcs-embl-heidelberg
parents: 0
diff changeset
62 <filter>library["type"] != "single"</filter>
0
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
63 </data>
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
64 </outputs>
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
65
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
66 <tests>
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
67 <test>
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
68 <!-- simple test on single end data -->
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
69 <param name="type" value="single"/>
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
70 <param name="input_1" value="file_1_sequence.txt" ftype="fastqsanger"/>
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
71 <param name="LEN" value="6"/>
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
72 <param name="ADD" value="false"/>
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
73 <output name="BARCODE_RESULT_FILENAME" file="clip_barcode_result_file.txt"/>
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
74 <output name="OF1" file="clip_dataset1_SE.fastq"/>
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
75 </test>
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
76 <test>
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
77 <!-- more complex test on paired end data with different barcode for fwd/rev -->
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
78 <param name="type" value="paired"/>
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
79 <param name="input_1" value="file_1_sequence.txt" ftype="fastqsanger"/>
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
80 <param name="input_2" value="file_2_sequence.txt" ftype="fastqsanger"/>
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
81 <param name="LEN" value="6"/>
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
82 <param name="BPOS" value="BOTH"/>
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
83 <output name="OF1" file="clip_dataset1_PE.fastq"/>
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
84 <output name="OF2" file="clip_dataset2_PE.fastq"/>
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
85 </test>
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
86 </tests>
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
87
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
88
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
89 <help>
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
90 <![CDATA[
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
91 **What it does**
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
92
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
93 Je clip: Clips barcodes or Unique Molecular Identifiers (UMIs) from the input fastq files
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
94 Input files are fastq files, and can be in gzip compressed format.
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
95
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
96 Author: Charles Girardot (charles.girardot@embl.de).
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
97
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
98 Wrapper by: Jelle Scholtalbers (jelle.scholtalbers@embl.de).
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
99
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
100 ------
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
101
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
102 **Know what you are doing**
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
103
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
104 .. class:: warningmark
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
105
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
106 You will want to read the `documentation`__.
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
107
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
108 .. __: http://gbcs.embl.de/portal/Je
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
109
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
110 ------
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
111
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
112 **Parameter list**
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
113
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
114 This is an exhaustive list of options::
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
115
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
116 FASTQ_FILE1=File
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
117 F1=File
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
118
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
119 Input fastq file (optionally gzipped) for single end data, or first read in paired end data.
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
120 Required.
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
121
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
122 FASTQ_FILE2=File
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
123 F2=File
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
124
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
125 Input fastq file (optionally gzipped) for the second read of paired end data.
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
126 Default value: null.
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
127
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
128 BCLEN=String
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
129 LEN=String
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
130
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
131 Length of the barcode sequences. When BARCODE_READ_POS == BOTH, two distinct lengths can
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
132 be provided using the syntax LEN=X:Z where X and Z are 2 integers representing the
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
133 barcode length for read_1 and read_2 respectively.
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
134 Required.
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
135
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
136 BARCODE_READ_POS=BarcodePosition
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
137 BPOS=BarcodePosition
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
138
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
139 Reads containing the sequence (i.e. UMIs) to clip:
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
140 READ_1 (beginning of read from FASTQ_FILE_1),
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
141 READ_2 (beginning of read from FASTQ_FILE_2),
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
142 BOTH (beginning of both reads).
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
143
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
144 Automatically set to READ_1 in single end mode and BOTH in paired end mode. Actually not
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
145 relevant for single end data
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
146 Default value: BOTH. This option can be set to 'null' to clear the default value.
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
147 Possible values: {READ_1, READ_2, BOTH, NONE}
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
148
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
149 ADD_BARCODE_TO_HEADER=Boolean
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
150 ADD=Boolean
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
151
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
152 Should clipped UMIs be added to the read header (at the end); apply to both barcodes when
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
153 BPOS=BOTH.
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
154 If ADD=true, the string ':barcode' is added at the end of the read header with a ':'
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
155 added only if current read header does not end with ':'.
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
156 If both reads of the pair contains a UMI (i.e. BARCODE_READ_POS == BOTH), the UMI from
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
157 the second read is also added to the read header.
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
158 Else, the header of the read without UMI receives the UMI from the other read.
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
159 For example:
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
160 @D3FCO8P1:178:C1WLBACXX:7:1101:1836:1965 2:N:0:
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
161 becomes
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
162 @D3FCO8P1:178:C1WLBACXX:7:1101:1836:1965 2:N:0:BARCODE
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
163 Default value: true. This option can be set to 'null' to clear the default value.
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
164 Possible values: {true, false}
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
165
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
166 ENSURE_IDENTICAL_HEADER_NAMES=Boolean
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
167 SAME_HEADERS=Boolean
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
168
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
169 Makes sure headers of both reads of a pair are identical.
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
170 Read name (or headers) will follow the pattern (for both reads of a pair):
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
171 @D3FCO8P1:178:C1WLBACXX:7:1101:1836:1965 CLIPPED_SEQ_FROMREAD1:CLIPPED_SEQ_FROMREAD2
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
172 This option only makes sense in paired end mode and ADD=true.Some (if not all) mappers
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
173 will indeed complain when read headers of a read pair are not identical.
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
174 When SAME_HEADERS=FALSE and the RCHAR is used, read headers look like this:
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
175 HISEQ:44:C6KC0ANXX:5:1101:1491:1994:1:N:0:TGGAGTAG
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
176 HISEQ:44:C6KC0ANXX:5:1101:1491:1994:3:N:0:CGTTGTAT
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
177
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
178 SAME_HEADERS=true will instead generates the following identical header for both reads :
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
179 HISEQ:44:C6KC0ANXX:5:1101:1491:1994:TGGAGTAG:CGTTGTAT
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
180 Note that we also clipped the useless '1:N:0' amd '3:N:0' as they also result in
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
181 different headers
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
182 Important : this option will force RCHAR=: UNLESS you specify RCHAR=null ; in which case
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
183 a space will be preserved i.e.:
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
184 HISEQ:44:C6KC0ANXX:5:1101:1491:1994 TAGAACAC:TGGAGTAG:CGTTGTAT
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
185
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
186 Default value: true.
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
187 This option can be set to 'null' to clear the default value. Possible values: {true,
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
188 false}
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
189
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
190 READ_NAME_REPLACE_CHAR=String
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
191 RCHAR=String
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
192
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
193 Replace spaces in read name/header using provided character.
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
194 This is needed when you need to retain ADDed barcode in read name/header during mapping
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
195 as everything after space in read name is usually clipped in BAM files.
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
196 For example, with RCHAR=':':
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
197 @D3FCO8P1:178:C1WLBACXX:7:1101:1836:1965 1:N:0:
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
198 becomes
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
199 @D3FCO8P1:178:C1WLBACXX:7:1101:1836:1965:1:N:0:BARCODE
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
200
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
201 Default value: ':'. This option can be set to 'null' to clear the default value.
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
202
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
203 XTRIMLEN=String
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
204 XT=String
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
205
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
206 Optional extra number of base(s) to be trimmed right after the barcode. These extra bases
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
207 are not added to read headers.
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
208 When running paired-end, two distinct values can be given using the syntax XT=X:Z where X
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
209 and Z are 2 integers to use for read_1 and read_2 respectively. Note that even when
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
210 BPOS=READ_1 or BPOS=READ_2, a X:Y synthax can be given to trim the read w/o barcode to
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
211 end up with reads of identical length (note that this can also be operated using ZT). If
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
212 a unique value is given, e.g. XT=1, while running paired-end the following rule applies :
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
213 (1) BPOS=READ_1 or BPOS=READ_2, no trim is applied at the read w/o barcode
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
214 (2) BPOS=BOTH, the value is used for both reads.
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
215 Note that XT=null is like XT=0.
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
216 Default value: 0. This option can be set to 'null' to clear the default value.
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
217
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
218 ZTRIMLEN=String
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
219 ZT=String
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
220
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
221 Optional extra number of bases to be trimmed from the read end i.e. 3' end. These extra
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
222 bases are not added to read headers.
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
223 When running paired-end, two distinct values can be given here using the syntax ZT=X:Z
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
224 where X and Z are 2 integers to use for read_1 and read_2 respectively. Note that even
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
225 when BPOS=READ_1 or BPOS=READ_2, a X:Y synthax can be given to trim the read w/o barcode
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
226 as to end up with reads of the same length (note that this can also be operated using
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
227 XT). Note that if a single value is passed, the value always applies to both reads in
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
228 paired-end mode without further consideration.
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
229
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
230 Default value: 0. This option can be set to 'null' to clear the default value.
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
231
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
232 BARCODE_RESULT_FILENAME=String
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
233 BF=String
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
234
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
235 Optional file name where to write clipped barcodes, default name is clipped_barcodes.txt.
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
236 This file is automatically created if ADD=FALSE i.e. even if this option is not provided
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
237 by user (and always created if this option is given).
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
238 File format is tab delimited with:
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
239 ``read header (col 1) barcode from read_1 (col 2) barcode quality from read_1 (col 2)``
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
240 + barcode + quality from read_2 (col 4 and 5 respectively) when relevant.
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
241 Can either be a name (in which case the file will be created in the output dir) or a full path.
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
242 Default value: null.
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
243
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
244 ]]>
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
245 </help>
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
246
101525093ba1 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
247 </tool>