comparison cpm_tpm_rpk.xml @ 7:f00c1c34565e draft default tip

planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/main/tools/cpm_tpm_rpk commit 8cca5f05212cd25113955fb9c11801f4047c12b4
author artbio
date Wed, 03 Jul 2024 14:39:26 +0000
parents d2575928b824
children
comparison
equal deleted inserted replaced
6:d2575928b824 7:f00c1c34565e
1 <tool id="cpm_tpm_rpk" name="Generate CPM, TPM, RPK" version="0.5.2"> 1 <tool id="cpm_tpm_rpk" name="Generate CPM, TPM, RPKM" version="0.6.0">
2 <description>from raw counts expression values</description> 2 <description>from raw counts expression values</description>
3 <requirements> 3 <requirements>
4 <requirement type="package" version="1.7.1">r-optparse</requirement> 4 <requirement type="package" version="1.7.5">r-optparse</requirement>
5 <requirement type="package" version="0.16">r-rtsne</requirement> 5 <requirement type="package" version="0.17">r-rtsne</requirement>
6 <requirement type="package" version="3.3.6">r-ggplot2</requirement> 6 <requirement type="package" version="3.5.1">r-ggplot2</requirement>
7 <requirement type="package" version="0.4.14">r-ggfortify</requirement> 7 <requirement type="package" version="0.4.17">r-ggfortify</requirement>
8 <requirement type="package" version="1.4.4">r-reshape2</requirement> 8 <requirement type="package" version="1.4.4">r-reshape2</requirement>
9 </requirements> 9 </requirements>
10 <stdio> 10 <stdio>
11 <exit_code range="1:" level="fatal" description="Tool exception" /> 11 <exit_code range="1:" level="fatal" description="Tool exception" />
12 </stdio> 12 </stdio>
19 #if $option.type_transfo == "tpm": 19 #if $option.type_transfo == "tpm":
20 -f $option.gene_file 20 -f $option.gene_file
21 --gene_sep $option.gene_sep 21 --gene_sep $option.gene_sep
22 --gene_header $option.gene_header 22 --gene_header $option.gene_header
23 #end if 23 #end if
24 #if $option.type_transfo == "rpk": 24 #if $option.type_transfo == "rpkm":
25 -f $option.gene_file 25 -f $option.gene_file
26 --gene_sep $option.gene_sep 26 --gene_sep $option.gene_sep
27 --gene_header $option.gene_header 27 --gene_header $option.gene_header
28 #end if 28 #end if
29 -l $log 29 -l $log
62 </param> 62 </param>
63 <conditional name="option"> 63 <conditional name="option">
64 <param name="type_transfo" type="select" label="Type of transformation"> 64 <param name="type_transfo" type="select" label="Type of transformation">
65 <option value="cpm" selected="true">CPM</option> 65 <option value="cpm" selected="true">CPM</option>
66 <option value="tpm">TPM</option> 66 <option value="tpm">TPM</option>
67 <option value="rpk">RPK</option> 67 <option value="rpkm">RPKM</option>
68 <option value="none">NONE</option> 68 <option value="none">NONE</option>
69 </param> 69 </param>
70 <when value="tpm"> 70 <when value="tpm">
71 <param name="gene_file" type="data" format="txt" label="Gene length file"/> 71 <param name="gene_file" type="data" format="txt" label="Gene length file"/>
72 <param name="gene_sep" type="select" label="Gene length column separator"> 72 <param name="gene_sep" type="select" label="Gene length column separator">
80 <param name="gene_header" type="select" label="Consider first line of gene length file as header ?"> 80 <param name="gene_header" type="select" label="Consider first line of gene length file as header ?">
81 <option value="TRUE" selected="true">Yes</option> 81 <option value="TRUE" selected="true">Yes</option>
82 <option value="FALSE">No</option> 82 <option value="FALSE">No</option>
83 </param> 83 </param>
84 </when> 84 </when>
85 <when value="rpk"> 85 <when value="rpkm">
86 <param name="gene_file" type="data" format="txt" label="Gene length file"/> 86 <param name="gene_file" type="data" format="txt" label="Gene length file"/>
87 <param name="gene_sep" type="select" label="Gene length column separator"> 87 <param name="gene_sep" type="select" label="Gene length column separator">
88 <option value="tab" selected="true">Tabs</option> 88 <option value="tab" selected="true">Tabs</option>
89 <option value=",">Commas</option> 89 <option value=",">Commas</option>
90 <option value="\ ">Whitespaces</option> 90 <option value="\ ">Whitespaces</option>
206 <param name="log" value="TRUE"/> 206 <param name="log" value="TRUE"/>
207 <output name="output" file="logtpm.tab" ftype="tabular" /> 207 <output name="output" file="logtpm.tab" ftype="tabular" />
208 </test> 208 </test>
209 <test expect_num_outputs="1"> 209 <test expect_num_outputs="1">
210 <param name="input" value="counts.tab" ftype="tabular"/> 210 <param name="input" value="counts.tab" ftype="tabular"/>
211 <param name="type_transfo" value="rpk"/> 211 <param name="type_transfo" value="rpkm"/>
212 <param name="gene_file" value="gene_length.tab" ftype="tabular"/> 212 <param name="gene_file" value="gene_length.tab" ftype="tabular"/>
213 <param name="gene_header" value="TRUE"/> 213 <param name="gene_header" value="TRUE"/>
214 <output name="output" file="rpk.tab" ftype="tabular" /> 214 <output name="output" file="rpkm.tab" ftype="tabular" />
215 </test> 215 </test>
216 <test expect_num_outputs="1"> 216 <test expect_num_outputs="1">
217 <param name="input" value="counts.tab" ftype="tabular"/> 217 <param name="input" value="counts.tab" ftype="tabular"/>
218 <param name="type_transfo" value="rpk"/> 218 <param name="type_transfo" value="rpkm"/>
219 <param name="gene_file" value="gene_length.tab" ftype="tabular"/> 219 <param name="gene_file" value="gene_length.tab" ftype="tabular"/>
220 <param name="gene_header" value="TRUE"/> 220 <param name="gene_header" value="TRUE"/>
221 <param name="log" value="TRUE"/> 221 <param name="log" value="TRUE"/>
222 <output name="output" file="logrpk.tab" ftype="tabular" /> 222 <output name="output" file="logrpkm.tab" ftype="tabular" />
223 </test> 223 </test>
224 </tests> 224 </tests>
225 <help> 225 <help>
226 226
227 **What it does** 227 **What it does**
229 Takes a raw count expression matrix and returns a table of normalized expression values. 229 Takes a raw count expression matrix and returns a table of normalized expression values.
230 230
231 Normalization can be: 231 Normalization can be:
232 232
233 - CPM (Counts Per Million) are obtained by dividing counts by the library counts sum and multiplying the results by a million. 233 - CPM (Counts Per Million) are obtained by dividing counts by the library counts sum and multiplying the results by a million.
234 - RPK (Reads Per Kilobases) are obtained by dividing read counts by gene lengths (expressed in kilo-nucleotides). 234 - RPK (Reads Per Kilobase) are obtained by dividing read counts by gene lengths (expressed as kilo-nucleotides).
235 - RPKM (Reads Per Kilobase per Million of Counts) are obtained by dividing read counts by gene lengths (expressed in kilo-nucleotides) then by the sum of library counts (expressed as millions of reads)
235 - TPM (Transcripts Per Million) are obtained by dividing RPK values by the sum of all RPK values in a sample and multiplying the results by 1 million. 236 - TPM (Transcripts Per Million) are obtained by dividing RPK values by the sum of all RPK values in a sample and multiplying the results by 1 million.
236 237
237 RPK and TPM require a two-column correspondance table gene_name - gene length where the length is specified in nucleotide. Both these metrics are relevant only for sequencing of full length RNAs. 238 RPK and TPM require a two-column correspondance table gene_name - gene length where the length is specified in nucleotide. Both these metrics are relevant only for sequencing of full length RNAs.
238 239
239 Note: do not comment you header line if you have header line in you tabular input (ie do not start the header line with a '#' character) 240 Note: do not comment you header line if you have header line in you tabular input (ie do not start the header line with a '#' character)