annotate umi-tools_whitelist.xml @ 3:853f74e08009 draft

planemo upload commit d8f6e961cc9f14c5b39762f87e11352c0aadefc9
author iuc
date Sat, 31 Mar 2018 17:36:28 -0400
parents c1743022a8cd
children 095c349b4343
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
2
c1743022a8cd planemo upload commit e274ffd67bede657f4f5a2c6524023ff57f0db87
iuc
parents: 1
diff changeset
1 <tool id="umi_tools_whitelist" name="UMI-tools whitelist" version="@VERSION@.1">
0
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
2 <description>Extract cell barcodes from FASTQ files</description>
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
3 <macros>
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
4 <import>macros.xml</import>
2
c1743022a8cd planemo upload commit e274ffd67bede657f4f5a2c6524023ff57f0db87
iuc
parents: 1
diff changeset
5 <macro name="barcode2_conditional" >
c1743022a8cd planemo upload commit e274ffd67bede657f4f5a2c6524023ff57f0db87
iuc
parents: 1
diff changeset
6 <conditional name="barcode">
c1743022a8cd planemo upload commit e274ffd67bede657f4f5a2c6524023ff57f0db87
iuc
parents: 1
diff changeset
7 <param name="barcode_select" argument="--split-barcode" type="select" label="Barcode on both reads?">
c1743022a8cd planemo upload commit e274ffd67bede657f4f5a2c6524023ff57f0db87
iuc
parents: 1
diff changeset
8 <option value="first_read_only">Barcode on first read only</option>
c1743022a8cd planemo upload commit e274ffd67bede657f4f5a2c6524023ff57f0db87
iuc
parents: 1
diff changeset
9 <option value="both_reads">Barcode on both reads</option>
c1743022a8cd planemo upload commit e274ffd67bede657f4f5a2c6524023ff57f0db87
iuc
parents: 1
diff changeset
10 </param>
c1743022a8cd planemo upload commit e274ffd67bede657f4f5a2c6524023ff57f0db87
iuc
parents: 1
diff changeset
11 <when value="first_read_only"/>
c1743022a8cd planemo upload commit e274ffd67bede657f4f5a2c6524023ff57f0db87
iuc
parents: 1
diff changeset
12 <when value="both_reads">
c1743022a8cd planemo upload commit e274ffd67bede657f4f5a2c6524023ff57f0db87
iuc
parents: 1
diff changeset
13 <param name="bc_pattern2" argument="--bc-pattern2" type="text" value="" label="Barcode pattern for second read"
c1743022a8cd planemo upload commit e274ffd67bede657f4f5a2c6524023ff57f0db87
iuc
parents: 1
diff changeset
14 help="Use this option to specify the format of the UMI/barcode for
c1743022a8cd planemo upload commit e274ffd67bede657f4f5a2c6524023ff57f0db87
iuc
parents: 1
diff changeset
15 the second read pair if required.">
c1743022a8cd planemo upload commit e274ffd67bede657f4f5a2c6524023ff57f0db87
iuc
parents: 1
diff changeset
16 </param>
c1743022a8cd planemo upload commit e274ffd67bede657f4f5a2c6524023ff57f0db87
iuc
parents: 1
diff changeset
17 </when>
c1743022a8cd planemo upload commit e274ffd67bede657f4f5a2c6524023ff57f0db87
iuc
parents: 1
diff changeset
18 </conditional>
c1743022a8cd planemo upload commit e274ffd67bede657f4f5a2c6524023ff57f0db87
iuc
parents: 1
diff changeset
19 </macro>
0
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
20 </macros>
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
21 <expand macro="requirements" />
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
22 <command detect_errors="exit_code"><![CDATA[
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
23 #set $gz = False
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
24 #if $input_type.type == 'single':
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
25 #if $input_type.input_single.is_of_type("fastq.gz", "fastqsanger.gz"):
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
26 ln -s '$input_type.input_single' input_single.gz &&
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
27 #set $gz = True
3
853f74e08009 planemo upload commit d8f6e961cc9f14c5b39762f87e11352c0aadefc9
iuc
parents: 2
diff changeset
28 #else
853f74e08009 planemo upload commit d8f6e961cc9f14c5b39762f87e11352c0aadefc9
iuc
parents: 2
diff changeset
29 ln -s '$input_type.input_single' input_single.txt &&
0
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
30 #end if
2
c1743022a8cd planemo upload commit e274ffd67bede657f4f5a2c6524023ff57f0db87
iuc
parents: 1
diff changeset
31 #elif $input_type.type == 'paired':
0
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
32 #if $input_type.input_read1.is_of_type("fastq.gz", "fastqsanger.gz"):
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
33 ln -s '$input_type.input_read1' input_read1.gz &&
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
34 ln -s '$input_type.input_read2' input_read2.gz &&
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
35 #set $gz = True
3
853f74e08009 planemo upload commit d8f6e961cc9f14c5b39762f87e11352c0aadefc9
iuc
parents: 2
diff changeset
36 #else
853f74e08009 planemo upload commit d8f6e961cc9f14c5b39762f87e11352c0aadefc9
iuc
parents: 2
diff changeset
37 ln -s '$input_type.input_read1' input_read1.txt &&
853f74e08009 planemo upload commit d8f6e961cc9f14c5b39762f87e11352c0aadefc9
iuc
parents: 2
diff changeset
38 ln -s '$input_type.input_read2' input_read2.txt &&
0
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
39 #end if
2
c1743022a8cd planemo upload commit e274ffd67bede657f4f5a2c6524023ff57f0db87
iuc
parents: 1
diff changeset
40 #else ## paired_collection
c1743022a8cd planemo upload commit e274ffd67bede657f4f5a2c6524023ff57f0db87
iuc
parents: 1
diff changeset
41 #if $input_type.input_readpair.forward.is_of_type("fastq.gz", "fastqsanger.gz"):
c1743022a8cd planemo upload commit e274ffd67bede657f4f5a2c6524023ff57f0db87
iuc
parents: 1
diff changeset
42 ln -s '$input_type.input_readpair.forward' input_read1.gz &&
c1743022a8cd planemo upload commit e274ffd67bede657f4f5a2c6524023ff57f0db87
iuc
parents: 1
diff changeset
43 ln -s '$input_type.input_readpair.reverse' input_read2.gz &&
c1743022a8cd planemo upload commit e274ffd67bede657f4f5a2c6524023ff57f0db87
iuc
parents: 1
diff changeset
44 #set $gz = True
3
853f74e08009 planemo upload commit d8f6e961cc9f14c5b39762f87e11352c0aadefc9
iuc
parents: 2
diff changeset
45 #else
853f74e08009 planemo upload commit d8f6e961cc9f14c5b39762f87e11352c0aadefc9
iuc
parents: 2
diff changeset
46 ln -s '$input_type.input_readpair.forward' input_read1.txt &&
853f74e08009 planemo upload commit d8f6e961cc9f14c5b39762f87e11352c0aadefc9
iuc
parents: 2
diff changeset
47 ln -s '$input_type.input_readpair.reverse' input_read2.txt &&
2
c1743022a8cd planemo upload commit e274ffd67bede657f4f5a2c6524023ff57f0db87
iuc
parents: 1
diff changeset
48 #end if
0
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
49 #end if
3
853f74e08009 planemo upload commit d8f6e961cc9f14c5b39762f87e11352c0aadefc9
iuc
parents: 2
diff changeset
50
0
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
51 umi_tools whitelist
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
52 --bc-pattern='$bc_pattern'
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
53 --subset-reads='$subset_reads'
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
54 #if $input_type.type == 'single':
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
55 #if $gz:
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
56 --stdin=input_single.gz
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
57 #else
3
853f74e08009 planemo upload commit d8f6e961cc9f14c5b39762f87e11352c0aadefc9
iuc
parents: 2
diff changeset
58 --stdin=input_single.txt
0
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
59 #end if
2
c1743022a8cd planemo upload commit e274ffd67bede657f4f5a2c6524023ff57f0db87
iuc
parents: 1
diff changeset
60 #else: ## equally valid for both 'paired' and 'paired_collection'
0
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
61 #if $gz:
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
62 --stdin=input_read1.gz
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
63 --read2-in=input_read2.gz
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
64 #else:
3
853f74e08009 planemo upload commit d8f6e961cc9f14c5b39762f87e11352c0aadefc9
iuc
parents: 2
diff changeset
65 --stdin=input_read1.txt
853f74e08009 planemo upload commit d8f6e961cc9f14c5b39762f87e11352c0aadefc9
iuc
parents: 2
diff changeset
66 --read2-in=input_read2.txt
0
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
67 #end if
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
68 #if $input_type.barcode.barcode_select == "both_reads": ## must match the 'both_reads' option value of the barcode_select param; only then is a second-read pattern supplied
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
69 --bc-pattern2='$input_type.barcode.bc_pattern2'
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
70 #end if
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
71 #end if
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
72 #if $celloptions.use_cell_opts == "advanced":
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
73 #if $celloptions.set_cell_number != "0":
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
74 --set-cell-number=$celloptions.set_cell_number
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
75 #end if
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
76 #if $celloptions.expect_cells != "0":
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
77 --expect-cells=$celloptions.expect_cells
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
78 #end if
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
79 --error-correct-threshold=$celloptions.error_correct_thresh
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
80 #end if
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
81 --method=$method
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
82 --plot-prefix=OUT
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
83
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
84 $prime3
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
85
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
86 #if $log:
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
87 --log='$out_log'
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
88 #end if
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
89
2
c1743022a8cd planemo upload commit e274ffd67bede657f4f5a2c6524023ff57f0db87
iuc
parents: 1
diff changeset
90 --log2stderr
1
dac4e7dc837d planemo upload commit c69e558f5186d40896ee40a49bdb2275949faf9e
iuc
parents: 0
diff changeset
91
0
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
92 > '$out_whitelist' &&
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
93
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
94 mkdir -p '${ out_html_report.files_path }' && ## -p: do not fail if the report's extra-files directory already exists
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
95 cp OUT_*.png '${ out_html_report.files_path }' &&
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
96
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
97 echo "<html>
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
98 <head></head><body>
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
99 <h1>Cell and Count Metrics</h1>
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
100 <img src=\"OUT_cell_barcode_count_density.png\" ><br />
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
101 <img src=\"OUT_cell_barcode_knee.png\" ><br />
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
102 <img src=\"OUT_cell_barcode_counts.png\" ><br />
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
103 </body></html>" > '$out_html_report'
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
104 &&
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
105 mv OUT_cell_thresholds.tsv '$out_thresh'
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
106 ]]></command>
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
107 <inputs>
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
108 <conditional name="input_type">
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
109 <param name="type" type="select" label="Library type">
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
110 <option value="single">Single-end</option>
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
111 <option value="paired">Paired-end</option>
2
c1743022a8cd planemo upload commit e274ffd67bede657f4f5a2c6524023ff57f0db87
iuc
parents: 1
diff changeset
112 <option value="paired_collection">Paired-end Dataset Collection</option>
0
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
113 </param>
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
114 <when value="single">
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
115 <param name="input_single" type="data" format="fastq,fastq.gz" label="Reads in FASTQ format" />
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
116 </when>
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
117 <when value="paired">
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
118 <param name="input_read1" type="data" format="fastq,fastq.gz" label="Reads in FASTQ format" />
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
119 <param name="input_read2" type="data" format="fastq,fastq.gz" label="Reads in FASTQ format" />
2
c1743022a8cd planemo upload commit e274ffd67bede657f4f5a2c6524023ff57f0db87
iuc
parents: 1
diff changeset
120 <expand macro="barcode2_conditional" />
c1743022a8cd planemo upload commit e274ffd67bede657f4f5a2c6524023ff57f0db87
iuc
parents: 1
diff changeset
121 </when>
c1743022a8cd planemo upload commit e274ffd67bede657f4f5a2c6524023ff57f0db87
iuc
parents: 1
diff changeset
122 <when value="paired_collection">
c1743022a8cd planemo upload commit e274ffd67bede657f4f5a2c6524023ff57f0db87
iuc
parents: 1
diff changeset
123 <param name="input_readpair" type="data_collection" collection_type="paired" format="fastq,fastq.gz" label="Reads in FASTQ format" />
c1743022a8cd planemo upload commit e274ffd67bede657f4f5a2c6524023ff57f0db87
iuc
parents: 1
diff changeset
124 <expand macro="barcode2_conditional" />
0
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
125 </when>
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
126 </conditional>
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
127 <param name="bc_pattern" argument="--bc-pattern" type="text" label="Barcode pattern for first read"
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
128 help="Use this option to specify the format of the UMI/barcode. Use Ns to
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
129 represent the random positions and Xs to indicate the bc positions.
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
130 Bases with Ns will be extracted and added to the read name. Remaining
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
131 bases, marked with an X will be reattached to the read.">
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
132 </param>
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
133 <param name="method" argument="--method" type="select" label="Count reads or UMIs"
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
134 help="Many published protocols rank CBs by the number of reads the CBs appear in. However, you could also use the number of unique UMIs a CB is associated with. Note that this is still an approximation to the number of transcripts captured because the same UMI could be associated with two different transcripts and be counted as independent." >
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
135 <option value="reads" selected="true" />
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
136 <option value="umis" />
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
137 </param>
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
138
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
139 <param argument="--3prime" name="prime3" type="boolean" label="Is barcode on 3' end of the read?"
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
140 truevalue="--3prime" falsevalue=""
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
141 help="By default the barcode is assumed to be on the 5' end of the read, but
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
142 use this option to specify that it is on the 3' end instead." />
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
143 <param name="subset_reads" argument="--subset-reads" type="integer" min="0" value="0" label="Use the first N reads to automatically identify the true cell barcodes." />
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
144 <conditional name="celloptions" >
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
145 <param name="use_cell_opts" type="select" label="Cell parameters" >
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
146 <option value="defaults" selected="True">Use Defaults</option>
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
147 <option value="advanced">Advanced Options</option>
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
148 </param>
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
149 <when value="defaults"/>
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
150 <when value="advanced">
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
151 <param name="set_cell_number" type="integer" min="0" value="0" label="Specify the number of cell barcodes to accept" />
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
152 <param name="expect_cells" type="integer" min="0" value="0" label="Prior expectation on the upper limit on the number of cells sequenced" />
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
153 <param name="error_correct_thresh" type="integer" min="0" value="0" label="Hamming distance for correction of barcodes to whitelist barcodes. Set to zero to generate no error correcting metrics." />
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
154 </when>
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
155 </conditional>
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
156 <param argument="--log" type="boolean" label="Output log?" truevalue="--log" falsevalue=""
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
157 help="Choose if you want to generate a text file containing logging information." />
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
158
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
159 </inputs>
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
160 <outputs>
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
161 <data name="out_whitelist" format="tabular" label="${tool.name} on ${on_string}: Whitelist"/>
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
162 <data name="out_log" format="txt" label="${tool.name} on ${on_string}: logfile" >
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
163 <filter>log</filter>
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
164 </data>
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
165 <data name="out_html_report" format="html" label="${tool.name} on ${on_string}: Webpage" />
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
166 <data name="out_thresh" format="tabular" label="${tool.name} on ${on_string}: TSV Cell Thresholds" />
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
167 </outputs>
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
168 <tests>
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
169 <test expect_num_outputs="3">
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
170 <param name="type" value="single" />
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
171 <param name="input_single" value="t_R2.fastq.gz" ftype="fastq" />
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
172 <param name="bc_pattern" value="CCCCCCCCNNNNNNNN" />
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
173 <param name="method" value="reads" />
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
174 <param name="prime3" value="true" />
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
175 <output name="out_whitelist" file="out_wl_single.txt" lines_diff="40" />
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
176 <output name="out_thresh" file="out_wl_single.tresh.tab" />
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
177 <output name="out_html_report" file="out_wl_single.html" />
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
178 </test>
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
179 <test expect_num_outputs="4">
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
180 <param name="type" value="paired" />
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
181 <param name="input_read1" value="t_R1.fastq.gz" ftype="fastq" />
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
182 <param name="input_read2" value="t_R2.fastq.gz" ftype="fastq" />
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
183 <param name="barcode_select" value="both_reads" />
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
184 <param name="bc_pattern" value="CCCNNNNNNNNXXXXX" />
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
185 <param name="bc_pattern2" value="CCCCCCCCNNNNNNNN" />
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
186 <param name="method" value="reads" />
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
187 <param name="prime3" value="false" />
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
188 <param name="use_cell_opts" value="advanced" />
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
189 <param name="expect_cells" value="5" />
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
190 <param name="error_correct_thresh" value="3" />
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
191 <param name="log" value="true" />
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
192 <output name="out_whitelist" file="out_wl_paired.txt" />
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
193 <output name="out_log" file="out_wl_paired.log" lines_diff="40" />
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
194 <output name="out_html_report" file="out_wl_paired.html" />
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
195 <output name="out_thresh" file="out_wl_paired.tresh.tab" />
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
196 </test>
2
c1743022a8cd planemo upload commit e274ffd67bede657f4f5a2c6524023ff57f0db87
iuc
parents: 1
diff changeset
197 <test expect_num_outputs="4"> <!-- As previous, identical outputs but paired collection input -->
c1743022a8cd planemo upload commit e274ffd67bede657f4f5a2c6524023ff57f0db87
iuc
parents: 1
diff changeset
198 <param name="type" value="paired_collection" />
c1743022a8cd planemo upload commit e274ffd67bede657f4f5a2c6524023ff57f0db87
iuc
parents: 1
diff changeset
199 <param name="input_readpair" >
c1743022a8cd planemo upload commit e274ffd67bede657f4f5a2c6524023ff57f0db87
iuc
parents: 1
diff changeset
200 <collection type="paired">
c1743022a8cd planemo upload commit e274ffd67bede657f4f5a2c6524023ff57f0db87
iuc
parents: 1
diff changeset
201 <element name="forward" ftype="fastq.gz" value="t_R1.fastq.gz" />
c1743022a8cd planemo upload commit e274ffd67bede657f4f5a2c6524023ff57f0db87
iuc
parents: 1
diff changeset
202 <element name="reverse" ftype="fastq.gz" value="t_R2.fastq.gz" />
c1743022a8cd planemo upload commit e274ffd67bede657f4f5a2c6524023ff57f0db87
iuc
parents: 1
diff changeset
203 </collection>
c1743022a8cd planemo upload commit e274ffd67bede657f4f5a2c6524023ff57f0db87
iuc
parents: 1
diff changeset
204 </param>
c1743022a8cd planemo upload commit e274ffd67bede657f4f5a2c6524023ff57f0db87
iuc
parents: 1
diff changeset
205 <param name="barcode_select" value="both_reads" />
c1743022a8cd planemo upload commit e274ffd67bede657f4f5a2c6524023ff57f0db87
iuc
parents: 1
diff changeset
206 <param name="bc_pattern" value="CCCNNNNNNNNXXXXX" />
c1743022a8cd planemo upload commit e274ffd67bede657f4f5a2c6524023ff57f0db87
iuc
parents: 1
diff changeset
207 <param name="bc_pattern2" value="CCCCCCCCNNNNNNNN" />
c1743022a8cd planemo upload commit e274ffd67bede657f4f5a2c6524023ff57f0db87
iuc
parents: 1
diff changeset
208 <param name="method" value="reads" />
c1743022a8cd planemo upload commit e274ffd67bede657f4f5a2c6524023ff57f0db87
iuc
parents: 1
diff changeset
209 <param name="prime3" value="false" />
c1743022a8cd planemo upload commit e274ffd67bede657f4f5a2c6524023ff57f0db87
iuc
parents: 1
diff changeset
210 <param name="use_cell_opts" value="advanced" />
c1743022a8cd planemo upload commit e274ffd67bede657f4f5a2c6524023ff57f0db87
iuc
parents: 1
diff changeset
211 <param name="expect_cells" value="5" />
c1743022a8cd planemo upload commit e274ffd67bede657f4f5a2c6524023ff57f0db87
iuc
parents: 1
diff changeset
212 <param name="error_correct_thresh" value="3" />
c1743022a8cd planemo upload commit e274ffd67bede657f4f5a2c6524023ff57f0db87
iuc
parents: 1
diff changeset
213 <param name="log" value="true" />
c1743022a8cd planemo upload commit e274ffd67bede657f4f5a2c6524023ff57f0db87
iuc
parents: 1
diff changeset
214 <output name="out_whitelist" file="out_wl_paired.txt" />
c1743022a8cd planemo upload commit e274ffd67bede657f4f5a2c6524023ff57f0db87
iuc
parents: 1
diff changeset
215 <output name="out_log" file="out_wl_paired.log" lines_diff="40" />
c1743022a8cd planemo upload commit e274ffd67bede657f4f5a2c6524023ff57f0db87
iuc
parents: 1
diff changeset
216 <output name="out_html_report" file="out_wl_paired.html" />
c1743022a8cd planemo upload commit e274ffd67bede657f4f5a2c6524023ff57f0db87
iuc
parents: 1
diff changeset
217 <output name="out_thresh" file="out_wl_paired.tresh.tab" />
c1743022a8cd planemo upload commit e274ffd67bede657f4f5a2c6524023ff57f0db87
iuc
parents: 1
diff changeset
218 </test>
0
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
219 </tests>
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
220 <help><![CDATA[
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
221
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
222
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
223 UMI-tools whitelist - Extract barcodes from fastq
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
224 ==================================================
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
225
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
226 Purpose
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
227 -------
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
228
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
229 Extract cell barcodes and identify the most likely true barcodes using
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
230 the 'knee' method.
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
231
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
232 Options
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
233 -------
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
234
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
235 --bc-pattern
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
236 This should be used where the barcodes are always in the same
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
237 place in the read.
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
238
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
239 - N = UMI position (required)
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
240 - C = cell barcode position (optional)
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
241 - X = sample position (optional)
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
242
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
243 Bases with Ns and Cs will be extracted and added to the read
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
244 name. The corresponding sequence qualities will be removed from
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
245 the read. Bases with an X will be reattached to the read.
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
246
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
247 E.g. If the pattern is NNNNCC,
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
248 Then the read:
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
249 @HISEQ:87:00000000 read1
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
250 AAGGTTGCTGATTGGATGGGCTAG
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
251 DA1AEBFGGCG01DFH00B1FF0B
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
252 +
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
253 will become:
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
254 @HISEQ:87:00000000_TT_AAGG read1
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
255 GCTGATTGGATGGGCTAG
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
256 FGGCG01DFH00B1FF0B
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
257 +
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
258
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
259 where 'TT' is the cell barcode and 'AAGG' is the UMI.
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
260
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
261
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
262 --set-cell-number
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
263 Use this option to explicitly set the number of cell barcodes
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
264 which should be accepted. Note that the exact number of cell
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
265 barcodes in the outputted whitelist may be slightly less than
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
266 this if there are multiple cells observed with the same
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
267 frequency at the threshold between accepted and rejected cell
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
268 barcodes.
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
269
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
270 --expect-cells=[EXPECTED_CELLS]
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
271 An upper limit estimate for the number of inputted cells. The knee
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
272 method will now select the first threshold (in ascending order)
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
273 which results in the number of cell barcodes accepted being <=
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
274 EXPECTED_CELLS and > EXPECTED_CELLS * 0.1.
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
275
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
276
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
277 --bc-pattern2
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
278 Use this option to specify the format of the UMI/barcode for
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
279 the second read pair if required. If --bc-pattern2 is not
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
280 supplied, this defaults to the same pattern as --bc-pattern.
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
281
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
282 --3prime
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
283 By default the barcode is assumed to be on the 5' end of the read, but
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
284 use this option to specify that it is on the 3' end instead.
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
285
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
286 Usage:
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
287 ------
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
288
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
289 For single ended reads:
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
290 umi_tools whitelist --bc-pattern=[PATTERN] -L extract.log
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
291 [OPTIONS]
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
292
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
293 reads from stdin and outputs to stdout.
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
294
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
295 For paired end reads where the cell barcode is split across the read pair:
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
296 umi_tools whitelist --bc-pattern=[PATTERN]
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
297 --bc-pattern2=[PATTERN] --read2-in=[FASTQIN] -L extract.log
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
298 [OPTIONS]
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
299
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
300 reads end one from stdin and end two from FASTQIN and outputs to stdout
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
301
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
302
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
303 Output:
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
304 -------
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
305
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
306 The whitelist is outputted as 4 tab-separated columns:
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
307
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
308 1. whitelisted cell barcode
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
309 2. Other cell barcode(s) (comma-separated) to correct to the
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
310 whitelisted barcode
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
311 3. Count for whitelisted cell barcodes
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
312 4. Count(s) for the other cell barcode(s) (comma-separated)
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
313
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
314 example output:
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
315
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
316 AAAAAA AGAAAA 146 1
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
317 AAAATC 22
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
318 AAACAT 21
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
319 AAACTA AAACTN,GAACTA 27 1,1
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
320 AAATAC 72
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
321 AAATCA GAATCA 37 3
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
322 AAATGT AAAGGT,CAATGT 41 1,1
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
323 AAATTG CAATTG 36 1
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
324 AACAAT 18
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
325 AACATA 24
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
326
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
327 If --error-correct-threshold is set to 0, columns 2 and 4 will be empty.
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
328
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
329
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
330 ]]></help>
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
331 <expand macro="citations" />
b911124762a8 planemo upload commit 8da5246c32d60a49e6b6b9027c9adc0a31d4bc5a
iuc
parents:
diff changeset
332 </tool>