comparison umi-tools_dedup.xml @ 11:7fa28eb10fed draft

"planemo upload commit 2da1197aac6a18df9252e5da096645d2ecaece88"
author iuc
date Wed, 10 Feb 2021 19:30:35 +0000
parents c6567483aa1e
children 4098ab380097
comparison
equal deleted inserted replaced
10:c6567483aa1e 11:7fa28eb10fed
1 <tool id="umi_tools_dedup" name="UMI-tools deduplicate" version="@VERSION@.0"> 1 <tool id="umi_tools_dedup" name="UMI-tools deduplicate" version="@VERSION@+galaxy1">
2 <description>Extract UMI from fastq files</description> 2 <description>Extract UMI from fastq files</description>
3 <macros> 3 <macros>
4 <import>macros.xml</import> 4 <import>macros.xml</import>
5 </macros> 5 </macros>
6 <expand macro="requirements"> 6 <expand macro="requirements">
14 ln -sf '$input.metadata.bam_index' 'input.bam.bai' && 14 ln -sf '$input.metadata.bam_index' 'input.bam.bai' &&
15 #set $input_file = 'input.bam' 15 #set $input_file = 'input.bam'
16 #end if 16 #end if
17 17
18 umi_tools dedup 18 umi_tools dedup
19 '$output_stats_bool'
19 --random-seed 0 20 --random-seed 0
20 --extract-umi-method $extract_umi_method 21 --extract-umi-method $extract_umi_method
21 #if str($extract_umi_method) != 'read_id': 22 #if str($extract_umi_method) != 'read_id':
22 --umi-separator '$umi_separator' --umi-tag '$umi_tag' 23 --umi-separator '$umi_separator' --umi-tag '$umi_tag'
23 #end if 24 #end if
61 <param argument="--chrom" type="boolean" truevalue="--chrom" falsevalue="" label="Only consider a single chromosome" /> 62 <param argument="--chrom" type="boolean" truevalue="--chrom" falsevalue="" label="Only consider a single chromosome" />
62 <param name="per_contig" argument="--per-contig" type="boolean" truevalue="--per-contig" falsevalue="" label="Deduplicate per contig" help="Field 3 in BAM; RNAME. All reads with the same contig will be considered to have the same alignment position. This is useful if your library prep generates PCR duplicates with non identical alignment positions such as CEL-Seq. In this case, you would align to a reference transcriptome with one transcript per gene" /> 63 <param name="per_contig" argument="--per-contig" type="boolean" truevalue="--per-contig" falsevalue="" label="Deduplicate per contig" help="Field 3 in BAM; RNAME. All reads with the same contig will be considered to have the same alignment position. This is useful if your library prep generates PCR duplicates with non identical alignment positions such as CEL-Seq. In this case, you would align to a reference transcriptome with one transcript per gene" />
63 <param name="per_gene" argument="--per-gene" type="boolean" truevalue="--per-gene" falsevalue="" label="Deduplicate per gene" help="As above except with this option you can align to a reference transcriptome with more than one transcript per gene. You need to also provide a map of genes to transcripts. This will also add a metacontig ('MC') tag to the output BAM file." /> 64 <param name="per_gene" argument="--per-gene" type="boolean" truevalue="--per-gene" falsevalue="" label="Deduplicate per gene" help="As above except with this option you can align to a reference transcriptome with more than one transcript per gene. You need to also provide a map of genes to transcripts. This will also add a metacontig ('MC') tag to the output BAM file." />
64 <param name="gene_transcript_map" argument="--gene-transcript-map" type="data" format="tabular" optional="True" label="Tabular file mapping genes to transripts" /> 65 <param name="gene_transcript_map" argument="--gene-transcript-map" type="data" format="tabular" optional="True" label="Tabular file mapping genes to transripts" />
65 <param name="gene_tag" argument="--gene-tag" type="text" optional="True" label="Deduplicate by this gene tag" help="As --per-gene except here the gene information is encoded in the bam read tag specified so you do not need to supply the mapping file." /> 66 <param name="gene_tag" argument="--gene-tag" type="text" optional="True" label="Deduplicate by this gene tag" help="As --per-gene except here the gene information is encoded in the bam read tag specified so you do not need to supply the mapping file." />
67 <param name="output_stats_bool" type="boolean" truevalue="--output-stats=stats_outputs" falsevalue="" checked="false" label="Output UMI related statistics files?"/>
66 </inputs> 68 </inputs>
67 <outputs> 69 <outputs>
68 <data format="bam" name="output" /> 70 <data format="bam" name="output" />
71 <collection name="output_stats" type="list" label="UMI_tools dedup stats">
72 <filter>output_stats_bool</filter>
73 <data name="edit_distance" format="tabular" from_work_dir="stats_outputs_edit_distance.tsv"/>
74 <data name="per_umi" format="tabular" from_work_dir="stats_outputs_per_umi.tsv"/>
75 <data name="per_umi_per_position" format="tabular" from_work_dir="stats_outputs_per_umi_per_position.tsv"/>
76 </collection>
69 </outputs> 77 </outputs>
70 <tests> 78 <tests>
71 <test> 79 <test expect_num_outputs="1">
72 <param name="input" value="group_in1.sam" ftype="sam" /> 80 <param name="input" value="group_in1.sam" ftype="sam" />
73 <param name="extract_umi_method" value="read_id" /> 81 <param name="extract_umi_method" value="read_id" />
74 <param name="method" value="unique" /> 82 <param name="method" value="unique" />
75 <output name="output" file="dedup_out1.bam" ftype="bam" sort="True"/> 83 <output name="output" file="dedup_out1.bam" ftype="bam" sort="True"/>
76 </test> 84 </test>
77 <test> 85 <test expect_num_outputs="1">
78 <param name="input" value="group_in2.bam" ftype="bam" /> 86 <param name="input" value="group_in2.bam" ftype="bam" />
79 <param name="extract_umi_method" value="read_id" /> 87 <param name="extract_umi_method" value="read_id" />
80 <param name="paired" value="True" /> 88 <param name="paired" value="True" />
81 <param name="method" value="unique" /> 89 <param name="method" value="unique" />
82 <output name="output" file="dedup_out2.bam" ftype="bam" sort="True" /> 90 <output name="output" file="dedup_out2.bam" ftype="bam" sort="True" />
83 </test> 91 </test>
84 <test> 92 <test expect_num_outputs="1">
85 <param name="input" value="group_in3.bam" ftype="bam" /> 93 <param name="input" value="group_in3.bam" ftype="bam" />
86 <param name="extract_umi_method" value="read_id" /> 94 <param name="extract_umi_method" value="read_id" />
87 <param name="method" value="unique" /> 95 <param name="method" value="unique" />
88 <output name="output" file="dedup_out3.bam" ftype="bam" sort="True" /> 96 <output name="output" file="dedup_out3.bam" ftype="bam" sort="True" />
89 </test> 97 </test>
90 <test> 98 <test expect_num_outputs="1">
91 <param name="input" value="group_in4.bam" ftype="bam" /> 99 <param name="input" value="group_in4.bam" ftype="bam" />
92 <param name="extract_umi_method" value="tag" /> 100 <param name="extract_umi_method" value="tag" />
93 <param name="umi_tag" value="BX" /> 101 <param name="umi_tag" value="BX" />
94 <param name="method" value="unique" /> 102 <param name="method" value="unique" />
95 <output name="output" file="dedup_out4.bam" ftype="bam" sort="True" /> 103 <output name="output" file="dedup_out4.bam" ftype="bam" sort="True" />
96 </test> 104 </test>
97 <test> 105 <test expect_num_outputs="1">
98 <param name="input" value="group_in5.bam" ftype="bam" /> 106 <param name="input" value="group_in5.bam" ftype="bam" />
99 <param name="extract_umi_method" value="read_id" /> 107 <param name="extract_umi_method" value="read_id" />
100 <param name="umi_tag" value="BX" /> 108 <param name="umi_tag" value="BX" />
101 <param name="method" value="cluster" /> 109 <param name="method" value="cluster" />
102 <output name="output" file="dedup_out5.bam" ftype="bam" sort="True" /> 110 <output name="output" file="dedup_out5.bam" ftype="bam" sort="True" />
103 </test> 111 </test>
104 <test> 112 <test expect_num_outputs="1">
105 <param name="input" value="group_in6.bam" ftype="bam" /> 113 <param name="input" value="group_in6.bam" ftype="bam" />
106 <param name="extract_umi_method" value="read_id" /> 114 <param name="extract_umi_method" value="read_id" />
107 <param name="umi_tag" value="BX" /> 115 <param name="umi_tag" value="BX" />
108 <param name="method" value="directional" /> 116 <param name="method" value="directional" />
109 <output name="output" file="dedup_out6.bam" ftype="bam" sort="True" /> 117 <output name="output" file="dedup_out6.bam" ftype="bam" sort="True" />
118 </test>
119 <test expect_num_outputs="5">
120 <param name="input" value="group_in6.bam" ftype="bam" />
121 <param name="extract_umi_method" value="read_id" />
122 <param name="umi_tag" value="BX" />
123 <param name="method" value="directional" />
124 <param name="output_stats_bool" value="true"/>
125 <output name="output" file="dedup_out6.bam" ftype="bam" sort="True" />
126 <output_collection name="output_stats">
127 <element name="edit_distance" file="stats_outputs_edit_distance.tsv" />
128 <element name="per_umi" file="stats_outputs_per_umi.tsv" />
129 <element name="per_umi_per_position" file="stats_outputs_per_umi_per_position.tsv" />
130 </output_collection>
110 </test> 131 </test>
111 </tests> 132 </tests>
112 <help><![CDATA[ 133 <help><![CDATA[
113 umi_tools dedup - Deduplicate reads based on their UMI 134 umi_tools dedup - Deduplicate reads based on their UMI
114 ====================================================== 135 ======================================================