Mercurial > repos > ebi-gxa > pyscenic_ctx
comparison pyscenic_ctx.xml @ 0:931cd3661690 draft
planemo upload for repository https://github.com/ebi-gene-expression-group/container-galaxy-sc-tertiary/ commit 4990a52ac6fd3d97434a24051e5828c86c8a802c
author | ebi-gxa |
---|---|
date | Tue, 20 Aug 2024 12:48:31 +0000 |
parents | |
children |
comparison
equal
deleted
inserted
replaced
-1:000000000000 | 0:931cd3661690 |
---|---|
1 <tool id="pyscenic_ctx" name="PySCENIC CTX" profile="21.09" version="@TOOL_VERSION@+galaxy0"> | |
2 <description> | |
3 computes active regulons based on a gene regulatory network | |
4 </description> | |
5 <macros> | |
6 <import>macros.xml</import> | |
7 </macros> | |
8 <expand macro="requirements"/> | |
9 <command><![CDATA[ | |
10 #set PySCENIC_DB = "db.genes_vs_motifs.rankings.feather" | |
11 ln -s '${module_fname}' tf2targets.tsv && | |
12 ln -s '${expression_mtx}' expr_mat.loom && | |
13 ln -s '${database_fname}' ${PySCENIC_DB} && | |
14 | |
15 pyscenic ctx tf2targets.tsv ${PySCENIC_DB} | |
16 --expression_mtx_fname expr_mat.loom | |
17 --output regulons.tsv | |
18 $no_pruning | |
19 #if $chunk_size | |
20 --chunk_size '${chunk_size}' | |
21 #end if | |
22 --mode custom_multiprocessing | |
23 --num_workers \${GALAXY_SLOTS:-1} | |
24 $all_modules | |
25 $transpose | |
26 #if $rank_threshold | |
27 --rank_threshold '${rank_threshold}' | |
28 #end if | |
29 #if $auc_threshold | |
30 --auc_threshold '${auc_threshold}' | |
31 #end if | |
32 #if $nes_threshold | |
33 --nes_threshold '${nes_threshold}' | |
34 #end if | |
35 #if $min_orthologous_identity | |
36 --min_orthologous_identity '${min_orthologous_identity}' | |
37 #end if | |
38 #if $max_similarity_fdr | |
39 --max_similarity_fdr '${max_similarity_fdr}' | |
40 #end if | |
41 #if $annotations_fname | |
42 --annotations_fname '${annotations_fname}' | |
43 #end if | |
44 #if $thresholds | |
45 --thresholds '${thresholds}' | |
46 #end if | |
47 #if $top_n_targets | |
48 --top_n_targets '${top_n_targets}' | |
49 #end if | |
50 #if $top_n_regulators | |
51 --top_n_regulators '${top_n_regulators}' | |
52 #end if | |
53 #if $min_genes | |
54 --min_genes '${min_genes}' | |
55 #end if | |
56 $mask_dropouts | |
57 #if $cell_id_attribute | |
58 --cell_id_attribute '${cell_id_attribute}' | |
59 #end if | |
60 #if $gene_attribute | |
61 --gene_attribute '${gene_attribute}' | |
62 #end if | |
63 $sparse | |
64 | |
65 ]]></command> | |
66 <inputs> | |
67 <param type="data" name="module_fname" format="tabular" label="Module File" help="Signatures or the co-expression modules. Usually the output from pyscenic grn."/> | |
68 <param type="data" name="database_fname" label="Database File" help="Regulatory feature databases. Supported formats: feather"/> | |
69 <param type="data" name="annotations_fname" format="tabular" label="Annotations File" help="File that contains the motif annotations to use."/> | |
70 <param type="data" name="expression_mtx" format="loom" label="Expression Matrix" help="The expression matrix for the single cell experiment."/> | |
71 <param type="boolean" name="no_pruning" label="No Pruning" truevalue="--no_pruning" falsevalue="" help="Do not perform pruning, i.e. find enriched motifs."/> | |
72 <param type="integer" name="chunk_size" label="Chunk Size" optional="true" help="The size of the module chunks assigned to a node in the dask graph (default: 100)."/> | |
73 <param type="boolean" name="all_modules" label="All Modules" truevalue="--all_modules" falsevalue="" help="Include positive and negative regulons in the analysis (default: no, i.e. only positive)."/> | |
74 <param type="boolean" name="transpose" label="Transpose Expression Matrix" truevalue="-t" falsevalue="" help="Use this if the matrix is cell x genes instead of genes x cells as expected"/> | |
75 <param type="float" name="rank_threshold" label="Rank Threshold" optional="true" help="The rank threshold used for deriving the target genes of an enriched motif."/> | |
76 <param type="float" name="auc_threshold" label="AUC Threshold" optional="true" help="The threshold used for calculating the AUC of a feature as fraction of ranked genes."/> | |
77 <param type="float" name="nes_threshold" label="NES Threshold" optional="true" help="The Normalized Enrichment Score (NES) threshold for finding enriched features."/> | |
78 <param type="float" name="min_orthologous_identity" label="Minimum Orthologous Identity" optional="true" help="Minimum orthologous identity to use when annotating enriched motifs."/> | |
79 <param type="float" name="max_similarity_fdr" label="Maximum Similarity FDR" optional="true" help="Maximum FDR in motif similarity to use when annotating enriched motifs."/> | |
80 <param type="text" name="thresholds" label="Thresholds" optional="true" help="Thresholds to use for selecting the features (e.g., motifs)."/> | |
81 <param type="integer" name="top_n_targets" label="Top N Targets" optional="true" help="The number of top targets to retain for each feature."/> | |
82 <param type="integer" name="top_n_regulators" label="Top N Regulators" optional="true" help="The number of top regulators to retain for each feature."/> | |
83 <param type="integer" name="min_genes" label="Minimum Genes" optional="true" help="The minimum number of genes a module needs to have to be considered for regulatory network analysis."/> | |
84 <param type="boolean" name="mask_dropouts" label="Mask Dropouts" truevalue="--mask_dropouts" falsevalue="" help="Mask dropouts in the expression matrix."/> | |
85 <param type="text" name="cell_id_attribute" label="Cell ID Attribute" optional="true" help="The name of the attribute in the loom expression matrix that contains cell IDs."/> | |
86 <param type="text" name="gene_attribute" label="Gene Attribute" optional="true" help="The name of the attribute in the loom expression matrix that contains gene names."/> | |
87 <param name="sparse" type="boolean" label="Sparse Matrix" truevalue="--sparse" falsevalue="" help="If set, load the expression data as a sparse matrix. Currently applies to the grn inference step only."/> | |
88 </inputs> | |
89 <outputs> | |
90 <data name="output" format="tabular" from_work_dir="regulons.tsv" label="${tool.name} on ${on_string}: table of enriched motifs and target genes"/> | |
91 <!-- Define other output formats as needed --> | |
92 </outputs> | |
93 <tests> | |
94 <test expect_num_outputs="1"> | |
95 <param name="module_fname" value="tf2targets.tsv"/> | |
96 <param name="expression_mtx" value="expr_mat.loom"/> | |
97 <param name="database_fname" value="genome-ranking_v2.feather"/> | |
98 <param name="annotations_fname" value="motifs.tbl"/> | |
99 <output name="output" file="regulons.tsv" compare="sim_size" delta_frac="0.2"/> | |
100 </test> | |
101 </tests> | |
102 <help><![CDATA[ | |
103 .. class:: infomark | |
104 :name: warning | |
105 | |
106 **pySCENIC ctx: Contextualize GRN** | |
107 | |
108 This tool refines gene regulatory networks (GRNs) by pruning targets that do not have an enrichment for a corresponding motif of the transcription factor (TF). This process effectively separates direct from indirect targets based on the presence of cis-regulatory footprints. | |
109 | |
110 **Inputs:** | |
111 | |
112 - **Module File**: A file containing the signature or co-expression modules. Supported formats include CSV, TSV (adjacencies), YAML, GMT, and DAT (modules). | |
113 - **Database Files**: One or more regulatory feature databases. Supported formats include feather or db (legacy). | |
114 - **Annotations File**: A file containing the motif annotations to use. | |
115 | |
116 **Optional Parameters:** | |
117 | |
118 - **No Pruning**: Do not perform pruning, i.e., find enriched motifs. | |
119 - **Chunk Size**: The size of the module chunks assigned to a node in the dask graph (default: 100). | |
120 - **Mode**: The mode to be used for computing (default: custom_multiprocessing). | |
121 - **All Modules**: Include positive and negative regulons in the analysis (default: only positive). | |
122 - **Transpose**: Transpose the expression matrix (rows=genes x columns=cells). | |
123 - **Rank Threshold**: The rank threshold used for deriving the target genes of an enriched motif (default: 5000). | |
124 - **AUC Threshold**: The threshold used for calculating the AUC of a feature as a fraction of ranked genes (default: 0.05). | |
125 - **NES Threshold**: The Normalized Enrichment Score (NES) threshold for finding enriched features (default: 3.0). | |
126 - **Min Orthologous Identity**: Minimum orthologous identity to use when annotating enriched motifs (default: 0.0). | |
127 - **Max Similarity FDR**: Maximum FDR in motif similarity to use when annotating enriched motifs (default: 0.001). | |
128 - **Thresholds**: The first method to create the TF-modules based on the best targets for each transcription factor (default: 0.75 0.90). | |
129 - **Top N Targets**: The second method is to select the top targets for a given TF (default: 50). | |
130 - **Top N Regulators**: The alternative way to create the TF-modules is to select the best regulators for each gene (default: 5 10 50). | |
131 - **Min Genes**: The minimum number of genes in a module (default: 20). | |
132 - **Expression Matrix File**: The name of the file that contains the expression matrix for the single-cell experiment. Supported formats include csv (rows=cells x columns=genes) or loom (rows=genes x columns=cells). Required if modules need to be generated. | |
133 - **Mask Dropouts**: Controls whether cell dropouts (cells in which expression of either TF or target gene is 0) are masked when calculating the correlation between a TF-target pair. | |
134 - **Cell ID Attribute**: The name of the column attribute that specifies the identifiers of the cells in the loom file. | |
135 - **Gene Attribute**: The name of the row attribute that specifies the gene symbols in the loom file. | |
136 - **Sparse**: If set, load the expression data as a sparse matrix. Currently applies to the GRN inference step only. | |
137 ]]></help> | |
138 <expand macro="citations"/> | |
139 </tool> |