Mercurial > repos > iuc > umi_tools_dedup
comparison umi-tools_dedup.xml @ 11:7fa28eb10fed draft
"planemo upload commit 2da1197aac6a18df9252e5da096645d2ecaece88"
author | iuc |
---|---|
date | Wed, 10 Feb 2021 19:30:35 +0000 |
parents | c6567483aa1e |
children | 4098ab380097 |
comparison
equal
deleted
inserted
replaced
10:c6567483aa1e | 11:7fa28eb10fed |
---|---|
1 <tool id="umi_tools_dedup" name="UMI-tools deduplicate" version="@VERSION@.0"> | 1 <tool id="umi_tools_dedup" name="UMI-tools deduplicate" version="@VERSION@+galaxy1"> |
2 <description>Extract UMI from fastq files</description> | 2 <description>Extract UMI from fastq files</description> |
3 <macros> | 3 <macros> |
4 <import>macros.xml</import> | 4 <import>macros.xml</import> |
5 </macros> | 5 </macros> |
6 <expand macro="requirements"> | 6 <expand macro="requirements"> |
14 ln -sf '$input.metadata.bam_index' 'input.bam.bai' && | 14 ln -sf '$input.metadata.bam_index' 'input.bam.bai' && |
15 #set $input_file = 'input.bam' | 15 #set $input_file = 'input.bam' |
16 #end if | 16 #end if |
17 | 17 |
18 umi_tools dedup | 18 umi_tools dedup |
19 '$output_stats_bool' | |
19 --random-seed 0 | 20 --random-seed 0 |
20 --extract-umi-method $extract_umi_method | 21 --extract-umi-method $extract_umi_method |
21 #if str($extract_umi_method) != 'read_id': | 22 #if str($extract_umi_method) != 'read_id': |
22 --umi-separator '$umi_separator' --umi-tag '$umi_tag' | 23 --umi-separator '$umi_separator' --umi-tag '$umi_tag' |
23 #end if | 24 #end if |
61 <param argument="--chrom" type="boolean" truevalue="--chrom" falsevalue="" label="Only consider a single chromosome" /> | 62 <param argument="--chrom" type="boolean" truevalue="--chrom" falsevalue="" label="Only consider a single chromosome" /> |
62 <param name="per_contig" argument="--per-contig" type="boolean" truevalue="--per-contig" falsevalue="" label="Deduplicate per contig" help="Field 3 in BAM; RNAME. All reads with the same contig will be considered to have the same alignment position. This is useful if your library prep generates PCR duplicates with non identical alignment positions such as CEL-Seq. In this case, you would align to a reference transcriptome with one transcript per gene" /> | 63 <param name="per_contig" argument="--per-contig" type="boolean" truevalue="--per-contig" falsevalue="" label="Deduplicate per contig" help="Field 3 in BAM; RNAME. All reads with the same contig will be considered to have the same alignment position. This is useful if your library prep generates PCR duplicates with non identical alignment positions such as CEL-Seq. In this case, you would align to a reference transcriptome with one transcript per gene" /> |
63 <param name="per_gene" argument="--per-gene" type="boolean" truevalue="--per-gene" falsevalue="" label="Deduplicate per gene" help="As above except with this option you can align to a reference transcriptome with more than one transcript per gene. You need to also provide a map of genes to transcripts. This will also add a metacontig ('MC') tag to the output BAM file." /> | 64 <param name="per_gene" argument="--per-gene" type="boolean" truevalue="--per-gene" falsevalue="" label="Deduplicate per gene" help="As above except with this option you can align to a reference transcriptome with more than one transcript per gene. You need to also provide a map of genes to transcripts. This will also add a metacontig ('MC') tag to the output BAM file." /> |
64 <param name="gene_transcript_map" argument="--gene-transcript-map" type="data" format="tabular" optional="True" label="Tabular file mapping genes to transripts" /> | 65 <param name="gene_transcript_map" argument="--gene-transcript-map" type="data" format="tabular" optional="True" label="Tabular file mapping genes to transripts" /> |
65 <param name="gene_tag" argument="--gene-tag" type="text" optional="True" label="Deduplicate by this gene tag" help="As --per-gene except here the gene information is encoded in the bam read tag specified so you do not need to supply the mapping file." /> | 66 <param name="gene_tag" argument="--gene-tag" type="text" optional="True" label="Deduplicate by this gene tag" help="As --per-gene except here the gene information is encoded in the bam read tag specified so you do not need to supply the mapping file." /> |
67 <param name="output_stats_bool" type="boolean" truevalue="--output-stats=stats_outputs" falsevalue="" checked="false" label="Output UMI related statistics files?"/> | |
66 </inputs> | 68 </inputs> |
67 <outputs> | 69 <outputs> |
68 <data format="bam" name="output" /> | 70 <data format="bam" name="output" /> |
71 <collection name="output_stats" type="list" label="UMI_tools dedup stats"> | |
72 <filter>output_stats_bool</filter> | |
73 <data name="edit_distance" format="tabular" from_work_dir="stats_outputs_edit_distance.tsv"/> | |
74 <data name="per_umi" format="tabular" from_work_dir="stats_outputs_per_umi.tsv"/> | |
75 <data name="per_umi_per_position" format="tabular" from_work_dir="stats_outputs_per_umi_per_position.tsv"/> | |
76 </collection> | |
69 </outputs> | 77 </outputs> |
70 <tests> | 78 <tests> |
71 <test> | 79 <test expect_num_outputs="1"> |
72 <param name="input" value="group_in1.sam" ftype="sam" /> | 80 <param name="input" value="group_in1.sam" ftype="sam" /> |
73 <param name="extract_umi_method" value="read_id" /> | 81 <param name="extract_umi_method" value="read_id" /> |
74 <param name="method" value="unique" /> | 82 <param name="method" value="unique" /> |
75 <output name="output" file="dedup_out1.bam" ftype="bam" sort="True"/> | 83 <output name="output" file="dedup_out1.bam" ftype="bam" sort="True"/> |
76 </test> | 84 </test> |
77 <test> | 85 <test expect_num_outputs="1"> |
78 <param name="input" value="group_in2.bam" ftype="bam" /> | 86 <param name="input" value="group_in2.bam" ftype="bam" /> |
79 <param name="extract_umi_method" value="read_id" /> | 87 <param name="extract_umi_method" value="read_id" /> |
80 <param name="paired" value="True" /> | 88 <param name="paired" value="True" /> |
81 <param name="method" value="unique" /> | 89 <param name="method" value="unique" /> |
82 <output name="output" file="dedup_out2.bam" ftype="bam" sort="True" /> | 90 <output name="output" file="dedup_out2.bam" ftype="bam" sort="True" /> |
83 </test> | 91 </test> |
84 <test> | 92 <test expect_num_outputs="1"> |
85 <param name="input" value="group_in3.bam" ftype="bam" /> | 93 <param name="input" value="group_in3.bam" ftype="bam" /> |
86 <param name="extract_umi_method" value="read_id" /> | 94 <param name="extract_umi_method" value="read_id" /> |
87 <param name="method" value="unique" /> | 95 <param name="method" value="unique" /> |
88 <output name="output" file="dedup_out3.bam" ftype="bam" sort="True" /> | 96 <output name="output" file="dedup_out3.bam" ftype="bam" sort="True" /> |
89 </test> | 97 </test> |
90 <test> | 98 <test expect_num_outputs="1"> |
91 <param name="input" value="group_in4.bam" ftype="bam" /> | 99 <param name="input" value="group_in4.bam" ftype="bam" /> |
92 <param name="extract_umi_method" value="tag" /> | 100 <param name="extract_umi_method" value="tag" /> |
93 <param name="umi_tag" value="BX" /> | 101 <param name="umi_tag" value="BX" /> |
94 <param name="method" value="unique" /> | 102 <param name="method" value="unique" /> |
95 <output name="output" file="dedup_out4.bam" ftype="bam" sort="True" /> | 103 <output name="output" file="dedup_out4.bam" ftype="bam" sort="True" /> |
96 </test> | 104 </test> |
97 <test> | 105 <test expect_num_outputs="1"> |
98 <param name="input" value="group_in5.bam" ftype="bam" /> | 106 <param name="input" value="group_in5.bam" ftype="bam" /> |
99 <param name="extract_umi_method" value="read_id" /> | 107 <param name="extract_umi_method" value="read_id" /> |
100 <param name="umi_tag" value="BX" /> | 108 <param name="umi_tag" value="BX" /> |
101 <param name="method" value="cluster" /> | 109 <param name="method" value="cluster" /> |
102 <output name="output" file="dedup_out5.bam" ftype="bam" sort="True" /> | 110 <output name="output" file="dedup_out5.bam" ftype="bam" sort="True" /> |
103 </test> | 111 </test> |
104 <test> | 112 <test expect_num_outputs="1"> |
105 <param name="input" value="group_in6.bam" ftype="bam" /> | 113 <param name="input" value="group_in6.bam" ftype="bam" /> |
106 <param name="extract_umi_method" value="read_id" /> | 114 <param name="extract_umi_method" value="read_id" /> |
107 <param name="umi_tag" value="BX" /> | 115 <param name="umi_tag" value="BX" /> |
108 <param name="method" value="directional" /> | 116 <param name="method" value="directional" /> |
109 <output name="output" file="dedup_out6.bam" ftype="bam" sort="True" /> | 117 <output name="output" file="dedup_out6.bam" ftype="bam" sort="True" /> |
118 </test> | |
119 <test expect_num_outputs="5"> | |
120 <param name="input" value="group_in6.bam" ftype="bam" /> | |
121 <param name="extract_umi_method" value="read_id" /> | |
122 <param name="umi_tag" value="BX" /> | |
123 <param name="method" value="directional" /> | |
124 <param name="output_stats_bool" value="true"/> | |
125 <output name="output" file="dedup_out6.bam" ftype="bam" sort="True" /> | |
126 <output_collection name="output_stats"> | |
127 <element name="edit_distance" file="stats_outputs_edit_distance.tsv" /> | |
128 <element name="per_umi" file="stats_outputs_per_umi.tsv" /> | |
129 <element name="per_umi_per_position" file="stats_outputs_per_umi_per_position.tsv" /> | |
130 </output_collection> | |
110 </test> | 131 </test> |
111 </tests> | 132 </tests> |
112 <help><![CDATA[ | 133 <help><![CDATA[ |
113 umi_tools dedup - Deduplicate reads based on their UMI | 134 umi_tools dedup - Deduplicate reads based on their UMI |
114 ====================================================== | 135 ====================================================== |