annotate umi-tools_extract.xml @ 14:9fa7803d1c51 draft

"planemo upload commit 59c614a9dda4b9f49bd3349fbde968ee5eca1db6"
author iuc
date Wed, 02 Jun 2021 18:27:33 +0000
parents d5ff68d2d5ff
children 27ac32a22ad2
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
14
9fa7803d1c51 "planemo upload commit 59c614a9dda4b9f49bd3349fbde968ee5eca1db6"
iuc
parents: 12
diff changeset
1 <tool id="umi_tools_extract" name="UMI-tools extract" version="@VERSION@.2">
0
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
2 <description>Extract UMI from fastq files</description>
1
79436b3019e9 planemo upload commit c8e46ecad0b1473097517e582ed6c43eb0635b36
iuc
parents: 0
diff changeset
3 <macros>
79436b3019e9 planemo upload commit c8e46ecad0b1473097517e582ed6c43eb0635b36
iuc
parents: 0
diff changeset
4 <import>macros.xml</import>
8
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
5 <macro name="out_conditional">
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
6 <actions>
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
7 <conditional name="input_type.type">
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
8 <when value="paired_collection" >
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
9 <action type="format">
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
10 <option type="from_param" name="input_type.input_readpair" param_attribute="forward.ext" />
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
11 </action>
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
12 </when>
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
13 <when value="paired" >
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
14 <action type="format">
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
15 <option type="from_param" name="input_type.input_read1" param_attribute="ext" />
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
16 </action>
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
17 </when>
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
18 </conditional>
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
19 </actions>
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
20 </macro>
1
79436b3019e9 planemo upload commit c8e46ecad0b1473097517e582ed6c43eb0635b36
iuc
parents: 0
diff changeset
21 </macros>
79436b3019e9 planemo upload commit c8e46ecad0b1473097517e582ed6c43eb0635b36
iuc
parents: 0
diff changeset
22 <expand macro="requirements" />
0
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
23 <command detect_errors="exit_code"><![CDATA[
4
e73a22ff585c planemo upload commit 76cbd559320d2a639e35ed10cb2d9522a5a77ae0
iuc
parents: 1
diff changeset
24 @COMMAND_LINK@
e73a22ff585c planemo upload commit 76cbd559320d2a639e35ed10cb2d9522a5a77ae0
iuc
parents: 1
diff changeset
25
e73a22ff585c planemo upload commit 76cbd559320d2a639e35ed10cb2d9522a5a77ae0
iuc
parents: 1
diff changeset
26 umi_tools extract
5
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
27 --extract-method='$extract_method.value'
0
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
28 --bc-pattern='$bc_pattern'
5
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
29
0
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
30 #if $input_type.type == 'single':
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
31 #if $gz:
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
32 --stdin=input_single.gz
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
33 --stdout out.gz
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
34 #else
5
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
35 --stdin=input_single.txt
0
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
36 --stdout '$out'
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
37 #end if
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
38 #else:
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
39 #if $gz:
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
40 --stdin=input_read1.gz
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
41 --read2-in=input_read2.gz
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
42 --stdout out1.gz
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
43 --read2-out=out2.gz
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
44 #else:
5
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
45 --stdin=input_read1.txt
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
46 --read2-in=input_read2.txt
0
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
47 --stdout '$out1'
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
48 --read2-out='$out2'
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
49 #end if
4
e73a22ff585c planemo upload commit 76cbd559320d2a639e35ed10cb2d9522a5a77ae0
iuc
parents: 1
diff changeset
50 #if $input_type.barcode.barcode_select == "both_reads":
0
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
51 --split-barcode
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
52 --bc-pattern2='$input_type.barcode.bc_pattern2'
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
53 #end if
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
54 #end if
5
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
55
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
56 #if $barcodes.use_barcodes.value == 'yes':
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
57 --filter-cell-barcode
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
58 --whitelist='$barcodes.filter_barcode_file'
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
59 '$barcodes.filter_correct.value'
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
60 #end if
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
61
0
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
62 #if not $prime3:
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
63 --3prime
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
64 #end if
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
65 #if $quality.quality_selector =='true':
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
66 --quality-filter-threshold '$quality.quality_filter_threshold'
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
67 --quality-encoding '$quality.quality_encoding'
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
68 #end if
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
69 #if $print_log == "1":
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
70 --log='$out_log'
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
71 #end if
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
72 #if $gz:
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
73 #if $input_type.type == 'single':
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
74 && mv out.gz '$out'
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
75 #else
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
76 && mv out1.gz '$out1'
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
77 && mv out2.gz '$out2'
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
78 #end if
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
79 #end if
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
80 ]]></command>
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
81 <inputs>
4
e73a22ff585c planemo upload commit 76cbd559320d2a639e35ed10cb2d9522a5a77ae0
iuc
parents: 1
diff changeset
82 <expand macro="input_types" />
5
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
83
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
84 <conditional name="barcodes" >
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
85 <param name="use_barcodes" argument="--filter-cell-barcode" type="select" label="Use Known Barcodes?" >
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
86 <option value="yes">Yes</option>
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
87 <option value="no" selected="true" >No</option>
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
88 </param>
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
89 <when value="no" />
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
90 <when value="yes" >
10
828dba98cdb4 planemo upload commit 04285134f1d28f273bed56976895072148c443c9
iuc
parents: 8
diff changeset
91 <param name="filter_barcode_file" type="data" format="tabular,tsv" label="Barcode File" />
5
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
92 <param name="filter_correct" argument="--error-correct-cell" type="boolean" truevalue="--error-correct-cell" falsevalue="" checked="false" label="Apply correction to cell barcodes?" help="This only applies if your barcode file has two columns output from the umi_tools whitelist command." />
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
93 </when>
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
94 </conditional>
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
95
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
96 <param name="extract_method" type="select" label="Method to extract barcodes" >
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
97 <option value="regex">Regular Expressions</option>
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
98 <option value="string" selected="true">String</option>
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
99 </param>
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
100
0
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
101 <param name="bc_pattern" argument="--bc-pattern" type="text" label="Barcode pattern for first read"
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
102 help="Use this option to specify the format of the UMI/barcode. Use Ns to
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
103 represent the random positions and Xs to indicate the bc positions.
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
104 Bases with Ns will be extracted and added to the read name. Remaining
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
105 bases, marked with an X will be reattached to the read.">
12
d5ff68d2d5ff "planemo upload commit 5d3fc4232e0e036ac1ed9e2c36adc41d6af4987f"
iuc
parents: 11
diff changeset
106 <expand macro="barcode_sanitizer" />
0
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
107 </param>
5
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
108
0
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
109 <param name="prime3" argument="--3prime" type="boolean" label="Is the barcode at the 5' end?"
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
110 truevalue="1" falsevalue="0" checked="true"
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
111 help="By default the barcode is assumed to be on the 5' end of the read, but
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
112 use this option to sepecify that it is on the 3' end instead." />
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
113 <param name="print_log" argument="-L" type="boolean" label="Output log?"
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
114 truevalue="1" falsevalue="0" checked="true"
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
115 help="Choose if you want to generate a text file containing logging information." />
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
116 <conditional name="quality">
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
117 <param name="quality_selector" type="select" label="Enable quality filter?" >
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
118 <option value="false">No</option>
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
119 <option value="true">Yes</option>
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
120 </param>
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
121 <when value="false">
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
122 </when>
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
123 <when value="true">
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
124 <param name="quality_filter_threshold" label="Phred score threshold"
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
125 type="integer" value="20" argument="--quality-filter-threshold"
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
126 help="Remove reads where any UMI base quality score falls below this threshold." />
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
127 <param name="quality_encoding" argument="--quality-encoding" type="select" label="Library type"
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
128 help="Quality score encoding. Choose from phred33 [33-77], phred64 [64-106] or solexa [59-106].">
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
129 <option value="phred33">phred33 [33-77]</option>
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
130 <option value="phred64">phred64 [64-106]</option>
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
131 <option value="solexa">solexa [59-106]</option>
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
132 </param>
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
133 </when>
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
134 </conditional>
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
135 </inputs>
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
136 <outputs>
8
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
137 <data name="out" format_source="input_single" label="Reads: ${tool.name} on ${on_string}" >
0
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
138 <filter>input_type['type'] == "single"</filter>
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
139 </data>
8
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
140 <data name="out1" format_source="input_read1" label="Reads1: ${tool.name} on ${on_string}" >
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
141 <filter>input_type['type'] != "single"</filter>
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
142 <expand macro="out_conditional" />
0
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
143 </data>
8
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
144 <data name="out2" format_source="input_read2" label="Reads2: ${tool.name} on ${on_string}" >
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
145 <filter>input_type['type'] != "single"</filter>
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
146 <expand macro="out_conditional" />
0
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
147 </data>
8
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
148
0
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
149 <data name="out_log" format="txt">
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
150 <filter>print_log == True</filter>
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
151 </data>
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
152 </outputs>
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
153 <tests>
14
9fa7803d1c51 "planemo upload commit 59c614a9dda4b9f49bd3349fbde968ee5eca1db6"
iuc
parents: 12
diff changeset
154 <test expect_num_outputs="2">
0
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
155 <param name="type" value="single" />
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
156 <param name="input_single" value="t_R1.fastq" ftype="fastq" />
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
157 <param name="bc_pattern" value="XXXNNN" />
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
158 <param name="prime3" value="0" />
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
159 <param name="quality_selector" value="true" />
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
160 <param name="quality_filter_threshold" value="10" />
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
161 <param name="quality_encoding" value="phred33" />
8
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
162 <output name="out" file="out_SE.fastq" ftype="fastq" />
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
163 <output name="out_log" >
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
164 <assert_contents>
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
165 <has_text text="Input Reads: 100" />
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
166 <has_text text="umi quality: 28" />
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
167 <has_text text="Reads output: 72" />
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
168 </assert_contents>
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
169 </output>
0
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
170 </test>
14
9fa7803d1c51 "planemo upload commit 59c614a9dda4b9f49bd3349fbde968ee5eca1db6"
iuc
parents: 12
diff changeset
171 <test expect_num_outputs="3">
0
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
172 <param name="type" value="paired" />
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
173 <param name="input_read1" value="t_R1.fastq.gz" ftype="fastq.gz" />
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
174 <param name="input_read2" value="t_R2.fastq.gz" ftype="fastq.gz" />
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
175 <param name="bc_pattern" value="NNNXXX" />
8
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
176 <output name="out1" file="out_R1.fastq.gz" decompress="true" lines_diff="2" ftype="fastq.gz" />
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
177 <output name="out2" file="out_R2.fastq.gz" decompress="true" lines_diff="2" ftype="fastq.gz" />
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
178 <output name="out_log" >
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
179 <assert_contents>
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
180 <has_text text="Input Reads: 100" />
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
181 <has_text text="Reads output: 100" />
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
182 </assert_contents>
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
183 </output>
0
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
184 </test>
14
9fa7803d1c51 "planemo upload commit 59c614a9dda4b9f49bd3349fbde968ee5eca1db6"
iuc
parents: 12
diff changeset
185 <test expect_num_outputs="3">
5
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
186 <param name="type" value="paired_collection" /> <!-- same as before, but uncompressed -->
8
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
187 <param name="paired_type" value="no" />
4
e73a22ff585c planemo upload commit 76cbd559320d2a639e35ed10cb2d9522a5a77ae0
iuc
parents: 1
diff changeset
188 <param name="input_readpair" >
8
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
189 <collection type="paired" >
5
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
190 <element name="forward" ftype="fastq" value="t_R1.fastq" />
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
191 <element name="reverse" ftype="fastq" value="t_R2.fastq" />
4
e73a22ff585c planemo upload commit 76cbd559320d2a639e35ed10cb2d9522a5a77ae0
iuc
parents: 1
diff changeset
192 </collection>
e73a22ff585c planemo upload commit 76cbd559320d2a639e35ed10cb2d9522a5a77ae0
iuc
parents: 1
diff changeset
193 </param>
e73a22ff585c planemo upload commit 76cbd559320d2a639e35ed10cb2d9522a5a77ae0
iuc
parents: 1
diff changeset
194 <param name="bc_pattern" value="NNNXXX" />
8
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
195 <output name="out1" file="out_R1.fastq" ftype="fastq" />
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
196 <output name="out2" file="out_R2.fastq" ftype="fastq" />
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
197 <output name="out_log" >
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
198 <assert_contents>
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
199 <has_text text="Input Reads: 100" />
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
200 <has_text text="Reads output: 100" />
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
201 </assert_contents>
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
202 </output>
5
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
203 </test>
14
9fa7803d1c51 "planemo upload commit 59c614a9dda4b9f49bd3349fbde968ee5eca1db6"
iuc
parents: 12
diff changeset
204 <test expect_num_outputs="3">
5
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
205 <param name="type" value="paired" />
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
206 <param name="input_read1" value="scrb_seq_fastq.1.gz" ftype="fastq.gz" />
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
207 <param name="input_read2" value="scrb_seq_fastq.2.gz" ftype="fastq.gz" />
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
208 <param name="extract_method" value="string" />
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
209 <param name="bc_pattern" value="CCCCCCNNNNNNNNNN" />
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
210 <param name="use_barcodes" value="yes" />
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
211 <param name="filter_barcode_file" value="scrb_seq_barcodes" />
8
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
212 <output name="out2" file="scrb_extract.fastq.gz" decompress="true" ftype="fastq.gz" />
5
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
213 </test>
14
9fa7803d1c51 "planemo upload commit 59c614a9dda4b9f49bd3349fbde968ee5eca1db6"
iuc
parents: 12
diff changeset
214 <test expect_num_outputs="3"><!-- same as above but with regex barcode-->
5
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
215 <param name="type" value="paired" />
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
216 <param name="input_read1" value="scrb_seq_fastq.1.gz" ftype="fastq.gz" />
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
217 <param name="input_read2" value="scrb_seq_fastq.2.gz" ftype="fastq.gz" />
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
218 <param name="extract_method" value="regex" />
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
219 <param name="bc_pattern" value="^(?P&lt;cell_1&gt;.{6})(?P&lt;umi_1&gt;.{10})" />
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
220 <param name="use_barcodes" value="yes" />
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
221 <param name="filter_barcode_file" value="scrb_seq_barcodes" />
8
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
222 <output name="out2" file="scrb_extract.fastq.gz" decompress="true" ftype="fastq.gz" />
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
223 </test>
14
9fa7803d1c51 "planemo upload commit 59c614a9dda4b9f49bd3349fbde968ee5eca1db6"
iuc
parents: 12
diff changeset
224 <test expect_num_outputs="2"><!-- CelSeq2 example -->
8
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
225 <param name="type" value="paired" />
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
226 <param name="input_read1" value="read_R1.200.gz" ftype="fastq.gz" />
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
227 <param name="input_read2" value="read_R2.200.gz" ftype="fastq.gz" />
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
228 <param name="extract_method" value="string" />
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
229 <param name="bc_pattern" value="NNNNNNCCCCCC" />
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
230 <output name="out1" file="read_R1.200_extracted.fastq.gz" ftype="fastq.gz" decompress="true" lines_diff="1" />
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
231 <output name="out2" file="read_R2.200_extracted.fastq.gz" ftype="fastq.gz" decompress="true" lines_diff="1" />
14
9fa7803d1c51 "planemo upload commit 59c614a9dda4b9f49bd3349fbde968ee5eca1db6"
iuc
parents: 12
diff changeset
232 <param name="print_log" value="false"/>
4
e73a22ff585c planemo upload commit 76cbd559320d2a639e35ed10cb2d9522a5a77ae0
iuc
parents: 1
diff changeset
233 </test>
0
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
234 </tests>
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
235 <help><![CDATA[
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
236
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
237
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
238 UMI-tools extract.py - Extract UMI from fastq
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
239 =============================================
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
240
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
241 Purpose
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
242 -------
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
243
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
244 Extract UMI barcode from a read and add it to the read name, leaving
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
245 any sample barcode in place. Can deal with paired end reads and UMIs
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
246 split across the paired ends
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
247
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
248 Options
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
249 -------
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
250
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
251 --split-barcode
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
252 By default the UMI is assumed to be on the first read. Use this
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
253 option if the UMI is contained on both reads and specify the
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
254 pattern of the barcode/UMI on the second read using the option
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
255 ``--bc-pattern2``
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
256
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
257 --bc-pattern
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
258 Use this option to specify the format of the UMI/barcode. Use Ns to
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
259 represent the random positions and Xs to indicate the bc positions.
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
260 Bases with Ns will be extracted and added to the read name. Remaining
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
261 bases, marked with an X will be reattached to the read.
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
262
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
263 E.g. If the pattern is NNXXNN,
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
264 Then the read:
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
265
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
266 @HISEQ:87:00000000 read1
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
267 AAGGTTGCTGATTGGATGGGCTAG
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
268 DA1AEBFGGCG01DFH00B1FF0B
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
269 +
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
270
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
271 will become:
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
272 @HISEQ:87:00000000_AATT read1
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
273 GGGCTGATTGGATGGGCTAG
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
274 1AFGGCG01DFH00B1FF0B
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
275 +
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
276
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
277 --bc-pattern2
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
278 Use this option to specify the format of the UMI/barcode for
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
279 the second read pair if required. If --bc-pattern2 is not
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
280 supplied, this defaults to the same pattern as --bc-pattern
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
281
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
282 --3prime
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
283 By default the barcode is assumed to be on the 5' end of the read, but
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
284 use this option to sepecify that it is on the 3' end instead
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
285
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
286 -L
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
287 Specify a log file to retain logging information and final statistics
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
288
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
289 --split-barcode
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
290 barcode is split across read pair
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
291
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
292 --quality-filter-threshold=QUALITY_FILTER_THRESHOLD
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
293 Remove reads where any UMI base quality score falls
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
294 below this threshold
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
295 --quality-encoding=QUALITY_ENCODING
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
296 Quality score encoding. Choose from phred33[33-77]
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
297 phred64 [64-106] or solexa [59-106]
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
298
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
299 Usage:
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
300 ------
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
301
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
302 For single ended reads:
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
303 umi_tools extract --bc-pattern=[PATTERN] -L extract.log [OPTIONS]
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
304
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
305 reads from stdin and outputs to stdout.
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
306
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
307 For paired end reads:
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
308 umi_tools extract --bc-pattern=[PATTERN] --read2-in=[FASTQIN] --read2-out=[FASTQOUT] -L extract.log [OPTIONS]
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
309
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
310 reads end one from stdin and end two from FASTQIN and outputs end one to stdin
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
311 and end two to FASTQOUT.
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
312
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
313 ]]></help>
1
79436b3019e9 planemo upload commit c8e46ecad0b1473097517e582ed6c43eb0635b36
iuc
parents: 0
diff changeset
314 <expand macro="citations" />
0
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
315 </tool>