Mercurial > repos > artbio > gsc_gene_expression_correlations
diff correlation_with_signature.xml @ 0:734ab9c5595a draft
planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/gsc_gene_expression_correlations commit 09dcd74dbc01f448518cf3db3e646afb0675a6fe
author | artbio |
---|---|
date | Mon, 24 Jun 2019 13:38:39 -0400 |
parents | |
children | 8ad272e0b640 |
line wrap: on
line diff
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/correlation_with_signature.xml Mon Jun 24 13:38:39 2019 -0400 @@ -0,0 +1,97 @@ +<tool id="single_cell_gene_expression_correlations" name="single-cell gene expression correlations" version="0.9.0"> + <description>between genes or with a signature of selected genes</description> + <requirements> + <requirement type="package" version="1.3.2=r3.3.2_0">r-optparse</requirement> + <requirement type="package" version="4.0_3=r3.3.2_0">r-hmisc</requirement> + </requirements> + <stdio> + <exit_code range="1:" level="fatal" description="Tool exception" /> + </stdio> + <command detect_errors="exit_code"><![CDATA[ + Rscript $__tool_directory__/correlation_with_signature.R + --expression_file '$expression_file' + --signatures_file '$signatures_file' + --sep + #if $sep == 'tab': + 'tab' + #elif $sep == 'comma': + 'comma' + #end if + --colnames '$colnames' + --sig_corr '$sig_corr' + --gene_corr '$gene_corr' + --gene_corr_pval '$gene_corr_pval' +]]></command> + <inputs> + <param name="expression_file" type="data" format="txt,tabular" label="Expression data" + help="a csv or tsv file that contains log2(CPM +1) expression values" /> + <param name="signatures_file" type="data" format="txt,tabular" label="signature values" + help="a csv or tsv file that contains cell signatures" /> + <param name="sep" type="select" label="Indicate column separator" + help="Note that all input files must have the same format"> + <option value="tab" selected="true">Tabs</option> + <option value="comma">Comma</option> + </param> + <param name="colnames" type="select" label="Firt row contains column names" + help="chose whether your files contain a header row (often a good idea)" > + <option value="TRUE" selected="true">True</option> + <option value="FALSE">False</option> + </param> + </inputs> + <outputs> + <data name="sig_corr" format="tabular" label="Genes-Signature correlations" /> + <data name="gene_corr" format="tabular" label="Correlations r (all)" /> + <data name="gene_corr_pval" format="tabular" label="Correlations p-values (all)" /> + </outputs> + <tests> + <test> + <param name="expression_file" value="gene_filtered_input.tsv" ftype="txt"/> + <param name="signatures_file" value="signature.tsv" ftype="txt"/> + <param name="sep" value='tab' /> + <param name="colnames" value="TRUE"/> + <output name="sig_corr" file="sig_corr.tsv" ftype="tabular"/> + <output name="gene_corr" file="gene_corr.tsv" ftype="tabular"/> + <output name="gene_corr_pval" file="gene_corr_pval.tsv" ftype="tabular"/> + </test> + </tests> + <help> + +**What it does** + +The tools computes a table of pairwise expression correlations between **selected genes** +in single-cell RNAseq data, as well as a table of correlation between the expression of +these selected genes and the value of a signature (must be a scalar for each library) +across the single-cell data + +**Inputs** + +- a table of expression values (e.E. log10(CPM+1), etc...) of **selected genes** from single-cell RNAseq sequencing libraries (columns) + These genes may be selected for their significant differential expression, because they + belong to a specific pathway, etc. +- a table of signature values for the single-cell RNAseq sequencing datasets + The table should have 2 columns (Cell-identifier and signature-value). The signature + values are scalars, one value per cell-identifier and are in the second column. + +**Outputs** + +- Correlation table between the signature score and selected gene expression. There is three columns: + - gene name + - Pearson_correlation : Pearson correlation value + - p_value : associated p-value +- Gene - Gene correlation table. It's a n x n matrix of correlation values where n is the number of selected genes. +- Gene - Gene correlation associated p-values table. It has the same dimensions as Gene-Gene correlation table but for p-values. + + </help> + <citations> + <citation type="bibtex"> + @Manual{, + title = {R: A Language and Environment for Statistical Computing}, + author = {{R Core Team}}, + organization = {R Foundation for Statistical Computing}, + address = {Vienna, Austria}, + year = {2014}, + url = {http://www.R-project.org/}, + } + </citation> + </citations> +</tool>