annotate umi-tools_extract.xml @ 12:d5ff68d2d5ff draft

"planemo upload commit 5d3fc4232e0e036ac1ed9e2c36adc41d6af4987f"
author iuc
date Tue, 10 Sep 2019 14:28:00 -0400
parents a472e995d157
children 9fa7803d1c51
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
12
d5ff68d2d5ff "planemo upload commit 5d3fc4232e0e036ac1ed9e2c36adc41d6af4987f"
iuc
parents: 11
diff changeset
1 <tool id="umi_tools_extract" name="UMI-tools extract" version="@VERSION@.1">
0
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
2 <description>Extract UMI from fastq files</description>
1
79436b3019e9 planemo upload commit c8e46ecad0b1473097517e582ed6c43eb0635b36
iuc
parents: 0
diff changeset
3 <macros>
79436b3019e9 planemo upload commit c8e46ecad0b1473097517e582ed6c43eb0635b36
iuc
parents: 0
diff changeset
4 <import>macros.xml</import>
8
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
5 <macro name="out_conditional">
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
6 <actions>
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
7 <conditional name="input_type.type">
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
8 <when value="paired_collection" >
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
9 <action type="format">
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
10 <option type="from_param" name="input_type.input_readpair" param_attribute="forward.ext" />
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
11 </action>
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
12 </when>
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
13 <when value="paired" >
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
14 <action type="format">
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
15 <option type="from_param" name="input_type.input_read1" param_attribute="ext" />
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
16 </action>
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
17 </when>
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
18 </conditional>
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
19 </actions>
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
20 </macro>
1
79436b3019e9 planemo upload commit c8e46ecad0b1473097517e582ed6c43eb0635b36
iuc
parents: 0
diff changeset
21 </macros>
79436b3019e9 planemo upload commit c8e46ecad0b1473097517e582ed6c43eb0635b36
iuc
parents: 0
diff changeset
22 <expand macro="requirements" />
0
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
23 <command detect_errors="exit_code"><![CDATA[
4
e73a22ff585c planemo upload commit 76cbd559320d2a639e35ed10cb2d9522a5a77ae0
iuc
parents: 1
diff changeset
24 @COMMAND_LINK@
e73a22ff585c planemo upload commit 76cbd559320d2a639e35ed10cb2d9522a5a77ae0
iuc
parents: 1
diff changeset
25
e73a22ff585c planemo upload commit 76cbd559320d2a639e35ed10cb2d9522a5a77ae0
iuc
parents: 1
diff changeset
26 umi_tools extract
5
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
27 --extract-method='$extract_method.value'
0
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
28 --bc-pattern='$bc_pattern'
5
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
29
0
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
30 #if $input_type.type == 'single':
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
31 #if $gz:
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
32 --stdin=input_single.gz
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
33 --stdout out.gz
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
34 #else
5
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
35 --stdin=input_single.txt
0
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
36 --stdout '$out'
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
37 #end if
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
38 #else:
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
39 #if $gz:
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
40 --stdin=input_read1.gz
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
41 --read2-in=input_read2.gz
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
42 --stdout out1.gz
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
43 --read2-out=out2.gz
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
44 #else:
5
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
45 --stdin=input_read1.txt
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
46 --read2-in=input_read2.txt
0
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
47 --stdout '$out1'
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
48 --read2-out='$out2'
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
49 #end if
4
e73a22ff585c planemo upload commit 76cbd559320d2a639e35ed10cb2d9522a5a77ae0
iuc
parents: 1
diff changeset
50 #if $input_type.barcode.barcode_select == "both_reads":
0
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
51 --split-barcode
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
52 --bc-pattern2='$input_type.barcode.bc_pattern2'
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
53 #end if
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
54 #end if
5
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
55
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
56 #if $barcodes.use_barcodes.value == 'yes':
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
57 --filter-cell-barcode
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
58 --whitelist='$barcodes.filter_barcode_file'
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
59 '$barcodes.filter_correct.value'
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
60 #end if
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
61
0
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
62 #if not $prime3:
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
63 --3prime
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
64 #end if
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
65 #if $quality.quality_selector =='true':
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
66 --quality-filter-threshold '$quality.quality_filter_threshold'
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
67 --quality-encoding '$quality.quality_encoding'
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
68 #end if
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
69 #if $print_log == "1":
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
70 --log='$out_log'
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
71 #else
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
72 --supress-stats
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
73 #end if
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
74 #if $gz:
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
75 #if $input_type.type == 'single':
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
76 && mv out.gz '$out'
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
77 #else
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
78 && mv out1.gz '$out1'
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
79 && mv out2.gz '$out2'
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
80 #end if
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
81 #end if
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
82 ]]></command>
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
83 <inputs>
4
e73a22ff585c planemo upload commit 76cbd559320d2a639e35ed10cb2d9522a5a77ae0
iuc
parents: 1
diff changeset
84 <expand macro="input_types" />
5
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
85
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
86 <conditional name="barcodes" >
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
87 <param name="use_barcodes" argument="--filter-cell-barcode" type="select" label="Use Known Barcodes?" >
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
88 <option value="yes">Yes</option>
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
89 <option value="no" selected="true" >No</option>
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
90 </param>
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
91 <when value="no" />
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
92 <when value="yes" >
10
828dba98cdb4 planemo upload commit 04285134f1d28f273bed56976895072148c443c9
iuc
parents: 8
diff changeset
93 <param name="filter_barcode_file" type="data" format="tabular,tsv" label="Barcode File" />
5
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
94 <param name="filter_correct" argument="--error-correct-cell" type="boolean" truevalue="--error-correct-cell" falsevalue="" checked="false" label="Apply correction to cell barcodes?" help="This only applies if your barcode file has two columns output from the umi_tools whitelist command." />
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
95 </when>
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
96 </conditional>
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
97
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
98 <param name="extract_method" type="select" label="Method to extract barcodes" >
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
99 <option value="regex">Regular Expressions</option>
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
100 <option value="string" selected="true">String</option>
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
101 </param>
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
102
0
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
103 <param name="bc_pattern" argument="--bc-pattern" type="text" label="Barcode pattern for first read"
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
104 help="Use this option to specify the format of the UMI/barcode. Use Ns to
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
105 represent the random positions and Xs to indicate the bc positions.
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
106 Bases with Ns will be extracted and added to the read name. Remaining
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
107 bases, marked with an X, will be reattached to the read.">
12
d5ff68d2d5ff "planemo upload commit 5d3fc4232e0e036ac1ed9e2c36adc41d6af4987f"
iuc
parents: 11
diff changeset
108 <expand macro="barcode_sanitizer" />
0
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
109 </param>
5
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
110
0
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
111 <param name="prime3" argument="--3prime" type="boolean" label="Is the barcode at the 5' end?"
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
112 truevalue="1" falsevalue="0" checked="true"
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
113 help="By default the barcode is assumed to be on the 5' end of the read, but
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
114 use this option to specify that it is on the 3' end instead." />
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
115 <param name="print_log" argument="-L" type="boolean" label="Output log?"
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
116 truevalue="1" falsevalue="0" checked="true"
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
117 help="Choose if you want to generate a text file containing logging information." />
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
118 <conditional name="quality">
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
119 <param name="quality_selector" type="select" label="Enable quality filter?" >
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
120 <option value="false">No</option>
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
121 <option value="true">Yes</option>
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
122 </param>
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
123 <when value="false">
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
124 </when>
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
125 <when value="true">
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
126 <param name="quality_filter_threshold" label="Phred score threshold"
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
127 type="integer" value="20" argument="--quality-filter-threshold"
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
128 help="Remove reads where any UMI base quality score falls below this threshold." />
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
129 <param name="quality_encoding" argument="--quality-encoding" type="select" label="Library type"
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
130 help="Quality score encoding. Choose from phred33 [33-77], phred64 [64-106] or solexa [59-106].">
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
131 <option value="phred33">phred33 [33-77]</option>
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
132 <option value="phred64">phred64 [64-106]</option>
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
133 <option value="solexa">solexa [59-106]</option>
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
134 </param>
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
135 </when>
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
136 </conditional>
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
137 </inputs>
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
138 <outputs>
8
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
139 <data name="out" format_source="input_single" label="Reads: ${tool.name} on ${on_string}" >
0
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
140 <filter>input_type['type'] == "single"</filter>
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
141 </data>
8
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
142 <data name="out1" format_source="input_read1" label="Reads1: ${tool.name} on ${on_string}" >
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
143 <filter>input_type['type'] != "single"</filter>
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
144 <expand macro="out_conditional" />
0
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
145 </data>
8
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
146 <data name="out2" format_source="input_read2" label="Reads2: ${tool.name} on ${on_string}" >
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
147 <filter>input_type['type'] != "single"</filter>
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
148 <expand macro="out_conditional" />
0
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
149 </data>
8
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
150
0
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
151 <data name="out_log" format="txt">
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
152 <filter>print_log == True</filter>
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
153 </data>
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
154 </outputs>
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
155 <tests>
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
156 <test>
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
157 <param name="type" value="single" />
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
158 <param name="input_single" value="t_R1.fastq" ftype="fastq" />
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
159 <param name="bc_pattern" value="XXXNNN" />
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
160 <param name="prime3" value="0" />
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
161 <param name="quality_selector" value="true" />
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
162 <param name="quality_filter_threshold" value="10" />
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
163 <param name="quality_encoding" value="phred33" />
8
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
164 <output name="out" file="out_SE.fastq" ftype="fastq" />
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
165 <output name="out_log" >
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
166 <assert_contents>
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
167 <has_text text="Input Reads: 100" />
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
168 <has_text text="umi quality: 28" />
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
169 <has_text text="Reads output: 72" />
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
170 </assert_contents>
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
171 </output>
0
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
172 </test>
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
173 <test>
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
174 <param name="type" value="paired" />
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
175 <param name="input_read1" value="t_R1.fastq.gz" ftype="fastq.gz" />
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
176 <param name="input_read2" value="t_R2.fastq.gz" ftype="fastq.gz" />
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
177 <param name="bc_pattern" value="NNNXXX" />
8
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
178 <output name="out1" file="out_R1.fastq.gz" decompress="true" lines_diff="2" ftype="fastq.gz" />
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
179 <output name="out2" file="out_R2.fastq.gz" decompress="true" lines_diff="2" ftype="fastq.gz" />
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
180 <output name="out_log" >
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
181 <assert_contents>
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
182 <has_text text="Input Reads: 100" />
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
183 <has_text text="Reads output: 100" />
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
184 </assert_contents>
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
185 </output>
0
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
186 </test>
4
e73a22ff585c planemo upload commit 76cbd559320d2a639e35ed10cb2d9522a5a77ae0
iuc
parents: 1
diff changeset
187 <test>
5
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
188 <param name="type" value="paired_collection" /> <!-- same as before, but uncompressed -->
8
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
189 <param name="paired_type" value="no" />
4
e73a22ff585c planemo upload commit 76cbd559320d2a639e35ed10cb2d9522a5a77ae0
iuc
parents: 1
diff changeset
190 <param name="input_readpair" >
8
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
191 <collection type="paired" >
5
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
192 <element name="forward" ftype="fastq" value="t_R1.fastq" />
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
193 <element name="reverse" ftype="fastq" value="t_R2.fastq" />
4
e73a22ff585c planemo upload commit 76cbd559320d2a639e35ed10cb2d9522a5a77ae0
iuc
parents: 1
diff changeset
194 </collection>
e73a22ff585c planemo upload commit 76cbd559320d2a639e35ed10cb2d9522a5a77ae0
iuc
parents: 1
diff changeset
195 </param>
e73a22ff585c planemo upload commit 76cbd559320d2a639e35ed10cb2d9522a5a77ae0
iuc
parents: 1
diff changeset
196 <param name="bc_pattern" value="NNNXXX" />
8
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
197 <output name="out1" file="out_R1.fastq" ftype="fastq" />
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
198 <output name="out2" file="out_R2.fastq" ftype="fastq" />
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
199 <output name="out_log" >
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
200 <assert_contents>
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
201 <has_text text="Input Reads: 100" />
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
202 <has_text text="Reads output: 100" />
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
203 </assert_contents>
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
204 </output>
5
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
205 </test>
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
206 <test>
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
207 <param name="type" value="paired" />
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
208 <param name="input_read1" value="scrb_seq_fastq.1.gz" ftype="fastq.gz" />
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
209 <param name="input_read2" value="scrb_seq_fastq.2.gz" ftype="fastq.gz" />
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
210 <param name="extract_method" value="string" />
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
211 <param name="bc_pattern" value="CCCCCCNNNNNNNNNN" />
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
212 <param name="use_barcodes" value="yes" />
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
213 <param name="filter_barcode_file" value="scrb_seq_barcodes" />
8
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
214 <output name="out2" file="scrb_extract.fastq.gz" decompress="true" ftype="fastq.gz" />
5
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
215 </test>
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
216 <test><!-- same as above but with regex barcode-->
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
217 <param name="type" value="paired" />
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
218 <param name="input_read1" value="scrb_seq_fastq.1.gz" ftype="fastq.gz" />
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
219 <param name="input_read2" value="scrb_seq_fastq.2.gz" ftype="fastq.gz" />
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
220 <param name="extract_method" value="regex" />
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
221 <param name="bc_pattern" value="^(?P&lt;cell_1&gt;.{6})(?P&lt;umi_1&gt;.{10})" />
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
222 <param name="use_barcodes" value="yes" />
f77bc14eba31 planemo upload commit 57e3e460a740aa7aad217c8365527c49e88c9a30
iuc
parents: 4
diff changeset
223 <param name="filter_barcode_file" value="scrb_seq_barcodes" />
8
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
224 <output name="out2" file="scrb_extract.fastq.gz" decompress="true" ftype="fastq.gz" />
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
225 </test>
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
226 <test><!-- CelSeq2 example -->
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
227 <param name="type" value="paired" />
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
228 <param name="input_read1" value="read_R1.200.gz" ftype="fastq.gz" />
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
229 <param name="input_read2" value="read_R2.200.gz" ftype="fastq.gz" />
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
230 <param name="extract_method" value="string" />
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
231 <param name="bc_pattern" value="NNNNNNCCCCCC" />
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
232 <output name="out1" file="read_R1.200_extracted.fastq.gz" ftype="fastq.gz" decompress="true" lines_diff="1" />
3cfd8e1073d7 planemo upload commit f6178c9e071a2158a35b82a3607f6dc8a767675c
iuc
parents: 5
diff changeset
233 <output name="out2" file="read_R2.200_extracted.fastq.gz" ftype="fastq.gz" decompress="true" lines_diff="1" />
4
e73a22ff585c planemo upload commit 76cbd559320d2a639e35ed10cb2d9522a5a77ae0
iuc
parents: 1
diff changeset
234 </test>
0
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
235 </tests>
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
236 <help><![CDATA[
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
237
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
238
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
239 UMI-tools extract.py - Extract UMI from fastq
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
240 =============================================
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
241
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
242 Purpose
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
243 -------
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
244
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
245 Extract UMI barcode from a read and add it to the read name, leaving
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
246 any sample barcode in place. Can deal with paired end reads and UMIs
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
247 split across the paired ends.
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
248
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
249 Options
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
250 -------
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
251
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
252 --split-barcode
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
253 By default the UMI is assumed to be on the first read. Use this
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
254 option if the UMI is contained on both reads and specify the
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
255 pattern of the barcode/UMI on the second read using the option
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
256 ``--bc-pattern2``
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
257
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
258 --bc-pattern
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
259 Use this option to specify the format of the UMI/barcode. Use Ns to
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
260 represent the random positions and Xs to indicate the bc positions.
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
261 Bases with Ns will be extracted and added to the read name. Remaining
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
262 bases, marked with an X will be reattached to the read.
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
263
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
264 E.g. If the pattern is NNXXNN,
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
265 Then the read:
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
266
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
267 @HISEQ:87:00000000 read1
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
268 AAGGTTGCTGATTGGATGGGCTAG
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
269 +
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
270 DA1AEBFGGCG01DFH00B1FF0B
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
271
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
272 will become:
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
273 @HISEQ:87:00000000_AATT read1
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
274 GGGCTGATTGGATGGGCTAG
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
275 +
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
276 1AFGGCG01DFH00B1FF0B
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
277
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
278 --bc-pattern2
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
279 Use this option to specify the format of the UMI/barcode for
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
280 the second read pair if required. If --bc-pattern2 is not
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
281 supplied, this defaults to the same pattern as --bc-pattern
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
282
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
283 --3prime
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
284 By default the barcode is assumed to be on the 5' end of the read, but
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
285 use this option to specify that it is on the 3' end instead
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
286
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
287 -L
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
288 Specify a log file to retain logging information and final statistics
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
289
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
290 --split-barcode
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
291 barcode is split across read pair
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
292
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
293 --quality-filter-threshold=QUALITY_FILTER_THRESHOLD
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
294 Remove reads where any UMI base quality score falls
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
295 below this threshold
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
296 --quality-encoding=QUALITY_ENCODING
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
297 Quality score encoding. Choose from phred33 [33-77],
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
298 phred64 [64-106] or solexa [59-106]
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
299
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
300 Usage:
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
301 ------
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
302
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
303 For single ended reads:
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
304 umi_tools extract --bc-pattern=[PATTERN] -L extract.log [OPTIONS]
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
305
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
306 reads from stdin and outputs to stdout.
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
307
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
308 For paired end reads:
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
309 umi_tools extract --bc-pattern=[PATTERN] --read2-in=[FASTQIN] --read2-out=[FASTQOUT] -L extract.log [OPTIONS]
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
310
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
311 reads end one from stdin and end two from FASTQIN and outputs end one to stdout
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
312 and end two to FASTQOUT.
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
313
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
314 ]]></help>
1
79436b3019e9 planemo upload commit c8e46ecad0b1473097517e582ed6c43eb0635b36
iuc
parents: 0
diff changeset
315 <expand macro="citations" />
0
418b961e0576 planemo upload commit 453bb3b44d9f27908cbe2677378da88b9f77b5cf
iuc
parents:
diff changeset
316 </tool>