comparison pyscenic_aucell.xml @ 0:f408bd51bb59 draft

planemo upload for repository https://github.com/ebi-gene-expression-group/container-galaxy-sc-tertiary/ commit 4990a52ac6fd3d97434a24051e5828c86c8a802c
author ebi-gxa
date Tue, 20 Aug 2024 12:48:20 +0000
parents
children
comparison
equal deleted inserted replaced
-1:000000000000 0:f408bd51bb59
1 <tool id="pyscenic_aucell" name="PySCENIC AUCell" profile="21.09" version="@TOOL_VERSION@+galaxy0">
2 <description>calculates AUCell to find relevant regulons/gene sets</description>
3 <macros>
4 <import>macros.xml</import>
5 </macros>
6 <expand macro="requirements"/>
7 <command><![CDATA[
8 ln -s '${expression_mtx_fname}' expr_mat.loom &&
9 ln -s '${signatures_fname}' regulons.tsv &&
10
11 pyscenic aucell expr_mat.loom regulons.tsv
12 -o aucell.tsv
13 $transpose
14 $weights
15 --num_workers \${GALAXY_SLOTS:-1}
16 #if $seed
17 --seed '${seed}'
18 #end if
19 #if str($rank_threshold):
20 --rank_threshold '${rank_threshold}'
21 #end if
22 #if $auc_threshold
23 --auc_threshold '${auc_threshold}'
24 #end if
25 #if $nes_threshold
26 --nes_threshold '${nes_threshold}'
27 #end if
28 #if $cell_id_attribute
29 --cell_id_attribute '${cell_id_attribute}'
30 #end if
31 #if $gene_attribute
32 --gene_attribute '${gene_attribute}'
33 #end if
34 $sparse
35
36 && mv aucell.tsv '${output}'
37 ]]></command>
38 <inputs>
39 <param name="expression_mtx_fname" format="loom" type="data" label="Expression Matrix File" help="The file that contains the expression matrix for the single-cell experiment. Supported formats: csv (rows=cells x columns=genes) or loom (rows=genes x columns=cells)."/>
40 <param name="signatures_fname" type="data" format="csv,tabular" label="Gene Signatures/Regulons File" help="The file that contains the gene signatures (usually the precomputed regulons). Currently only csv/tsv supported, could be extended."/>
41 <param type="boolean" name="transpose" label="Transpose Expression Matrix" truevalue="-t" falsevalue="" help="Use this if the matrix is cell x genes instead of genes x cells as expected"/>
42 <param name="weights" type="boolean" label="Use Weights for Recovery Analysis" truevalue="-w" falsevalue="" help="Use weights associated with genes in recovery analysis. Relevant when gene signatures are supplied as json format."/>
43 <param name="seed" type="integer" label="Seed for Ranking" help="Seed for the expression matrix ranking step. The default is to use a random seed." optional="true"/>
44 <param name="rank_threshold" type="integer" label="Rank Threshold" help="The rank threshold used for deriving the target genes of an enriched motif (default: 5000)." optional="true"/>
45 <param name="auc_threshold" type="float" label="AUC Threshold" help="The threshold used for calculating the AUC of a feature as fraction of ranked genes (default: 0.05)." optional="true"/>
46 <param name="nes_threshold" type="float" label="NES Threshold" help="The Normalized Enrichment Score (NES) threshold for finding enriched features (default: 3.0)." optional="true"/>
47 <param name="cell_id_attribute" type="text" label="Cell ID Attribute" help="The name of the column attribute that specifies the identifiers of the cells in the loom file." optional="true"/>
48 <param name="gene_attribute" type="text" label="Gene Attribute" help="The name of the row attribute that specifies the gene symbols in the loom file." optional="true"/>
49 <param name="sparse" type="boolean" label="Sparse Matrix" truevalue="--sparse" falsevalue="" help="If set, load the expression data as a sparse matrix. Currently applies to the grn inference step only."/>
50 </inputs>
51 <outputs>
52 <data name="output" format="tabular" label="${tool.name} on ${on_string}: AUCell scores for regulons or gene sets."/>
53 </outputs>
54 <tests>
55 <test expect_num_outputs="1">
56 <param name="expression_mtx_fname" value="expr_mat.loom"/>
57 <param name="signatures_fname" value="regulons.tsv"/>
58 <output name="output">
59 <assert_contents>
60 <has_n_lines n="101"/>
61 <has_text text="CEBPB"/>
62 </assert_contents>
63 </output>
64 </test>
65 </tests>
66 <help>
67 <![CDATA[
68 Run PySCENIC aucell command to analyze single-cell gene expression data.
69
70 **Input Parameters:**
71
72 - **expression_mtx_fname**: The name of the file that contains the expression matrix for the single cell experiment. Two file formats are supported: csv (rows=cells x columns=genes) or loom (rows=genes x columns=cells).
73
74 - **signatures_fname**: The name of the file that contains the gene signatures. Three file formats are supported: gmt, yaml, or dat (pickle).
75
76 **Options:**
77
78 - **-o, --output**: Output file/stream, a matrix of AUC values. Two file formats are supported: csv or loom. If loom file is specified, it will contain the original expression matrix and the calculated AUC values as extra column attributes.
79
80 - **-t, --transpose**: Transpose the expression matrix if supplied as csv (rows=genes x columns=cells).
81
82 - **-w, --weights**: Use weights associated with genes in recovery analysis. Is only relevant when gene signatures are supplied as json format.
83
84 - **--seed**: Seed for the expression matrix ranking step. The default is to use a random seed.
85
86 **Motif Enrichment Arguments:**
87
88 - **--rank_threshold**: The rank threshold used for deriving the target genes of an enriched motif (default: 5000).
89
90 - **--auc_threshold**: The threshold used for calculating the AUC of a feature as fraction of ranked genes (default: 0.05).
91
92 - **--nes_threshold**: The Normalized Enrichment Score (NES) threshold for finding enriched features (default: 3.0).
93
94 **Loom File Arguments:**
95
96 - **--cell_id_attribute**: The name of the column attribute that specifies the identifiers of the cells in the loom file.
97
98 - **--gene_attribute**: The name of the row attribute that specifies the gene symbols in the loom file.
99
100 - **--sparse**: If set, load the expression data as a sparse matrix. Currently applies to the grn inference step only.
101 ]]>
102 </help>
103 <expand macro="citations"/>
104 </tool>