Mercurial > repos > iuc > genomic_super_signature
comparison genomic_super_signature.xml @ 0:d0cbe6cc1f04 draft default tip
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/genomic_super_signature commit 1aadd5dce3b254e7714c2fdd39413029fd4b9b7a"
author | iuc |
---|---|
date | Wed, 12 Jan 2022 19:07:45 +0000 |
parents | |
children |
comparison
equal
deleted
inserted
replaced
-1:000000000000 | 0:d0cbe6cc1f04 |
---|---|
1 <tool id="genomic_super_signature" name="GenomicSuperSignature" version="@TOOL_VERSION@+galaxy@GALAXY_VERSION@" profile="20.01"> | |
2 <description>interpretation of RNAseq experiments</description> | |
3 <macros> | |
4 <token name="@TOOL_VERSION@">1.2.0</token> | |
5 <token name="@GALAXY_VERSION@">0</token> | |
6 </macros> | |
7 <requirements> | |
8 <requirement type="package" version="@TOOL_VERSION@">bioconductor-genomicsupersignature</requirement> | |
9 <requirement type="package" version="1.7.1">r-optparse</requirement> | |
10 <requirement type="package" version="2.6">r-wordcloud</requirement> | |
11 <requirement type="package" version="2.22.0">bioconductor-biocstyle</requirement> | |
12 <requirement type="package" version="2.7.3">r-magick</requirement> | |
13 <requirement type="package" version="2021d">tzdata</requirement> | |
14 </requirements> | |
15 <command detect_errors="exit_code"><![CDATA[ | |
16 #set $model = $model.fields.path | |
17 mkdir out && | |
18 Rscript '$__tool_directory__/gss.R' --input '$input' --model '$model' --method '$method' --maxFrom '$maxFrom' --level '$level' --scale '$scale' --numOut $numOut --outDir out --toolDir '$__tool_directory__' --validate '$validate' --html '$html' | |
19 ]]></command> | |
20 <inputs> | |
21 <param argument="--input" type="data" format="tabular,tsv" label="Tabular count matrix"/> | |
22 <param argument="--model" type="select" label="Using RAVmodel" help="Select model from the list"> | |
23 <options from_data_table="genomic_super_signature_ravmodels"> | |
24 <filter type="data_meta" ref="input" key="dbkey" column="dbkey" /> | |
25 </options> | |
26 <validator type="no_options" message="A built-in RAVmodel is not available for the build associated with the selected input file"/> | |
27 </param> | |
28 <param argument="--method" type="select" label="Select a correlation coefficient"> | |
29 <option value="pearson">Pearson</option> | |
30 <option value="kendall">Kendall</option> | |
31 <option value="spearman">Spearman</option> | |
32 </param> | |
33 <param argument="--maxFrom" type="select" label="Select whether to display the maximum value from dataset's PCs or avgLoadings" help="With Principal Component (PC), the maximum correlation coefficient from top 8 PCs for each avgLoading will be selected as an output. If you choose Average Loading, the Average Loading with the maximum correlation coefficient with each Principal Component will be in the output."> | |
34 <option value="pc">Principal Components</option> | |
35 <option value="avgLoading">Average Loading</option> | |
36 </param> | |
37 <param argument="--level" type="select" label="Output format of validated result" help="max will output the matrix containing only the maximum coefficient. To get the coefficient of all 8 PCs, set this argument to all."> | |
38 <option value="max">Max</option> | |
39 <option value="all">All</option> | |
40 </param> | |
41 <param argument="--scale" type="boolean" truevalue="TRUE" falsevalue="FALSE" checked="false" label="Normalize rows of datasets?"/> | |
42 <param argument="--numOut" type="integer" min="1" value="3" label="The number of top validated RAVs to check"/> | |
43 </inputs> | |
44 <outputs> | |
45 <collection name="genesets" type="list" label="GenomicSuperSignature Genesets"> | |
46 <discover_datasets pattern=".*_genesets_(?P<name>.+)\.csv" format="csv" directory="out" /> | |
47 </collection> | |
48 <collection name="literatures" type="list" label="GenomicSuperSignature Literatures"> | |
49 <discover_datasets pattern=".*_literatures_(?P<name>.+)\.csv" format="csv" directory="out" /> | |
50 </collection> | |
51 <data name="validate" format="csv" label="GenomicSuperSignature validate.csv"> | |
52 </data> | |
53 <data name="html" format="html" label="GenomicSuperSignature report.html"> | |
54 </data> | |
55 </outputs> | |
56 <tests> | |
57 <test> | |
58 <param name="input" value="bcellViperExpr_10C.tsv.gz" dbkey="hg38" ftype="tabular"/> | |
59 <param name="model" value="microRAVmodel" dbkey="hg38"/> | |
60 <param name="method" value="Pearson"/> | |
61 <param name="maxFrom" value="Principal Components"/> | |
62 <param name="level" value="Max"/> | |
63 <param name="numOut" value="1"/> | |
64 <output name="html" ftype="html"> | |
65 <assert_contents> | |
66 <has_n_lines n="2843"/> | |
67 </assert_contents> | |
68 </output> | |
69 <output name="validate" ftype="csv"> | |
70 <assert_contents> | |
71 <has_line line='"","score","PC","sw","cl_size","cl_num"'/> | |
72 <has_text text='"RAV1076"'/> | |
73 <has_text text='"RAV725"'/> | |
74 <has_text text='"RAV884"'/> | |
75 <has_text text='"RAV1994"'/> | |
76 <has_n_lines n="5"/> | |
77 </assert_contents> | |
78 </output> | |
79 </test> | |
80 </tests> | |
81 <help><![CDATA[ | |
82 GenomicSuperSignature | |
83 ===================== | |
84 | |
85 What it does | |
86 ------------ | |
87 | |
88 Connect new gene expression profile with the relevant information from | |
89 the existing databases, such as previous publications, MeSH terms, and | |
90 gene sets. | |
91 | |
92 Inputs | |
93 ------ | |
94 | |
95 Count Files | |
96 ~~~~~~~~~~~ | |
97 | |
98 GenomicSuperSignature takes a count matrix as an input. Input file | |
99 should have row names in gene symbols and column names in sample ID. For | |
100 the best result, we recommend a data transformation (e.g. log2) for the | |
101 input to follow a normal distribution, while scaling is NOT recommended. | |
102 Currently for validation, inputs need at least eight samples. | |
103 | |
104 Example of input format: | |
105 | |
106 ===== ======== ========= ======== ========= | |
107 \ GSM44075 GSM44078 GSM44080 GSM44081 | |
108 ===== ======== ========= ======== ========= | |
109 ADA 9.571369 10.599436 8.740659 10.104469 | |
110 CDH2 6.175890 5.312704 5.651928 4.462205 | |
111 MED6 9.671113 8.773383 9.190276 9.526235 | |
112 NR2E3 9.847733 9.582061 9.628792 8.820422 | |
113 ===== ======== ========= ======== ========= | |
114 | |
115 RAVmodel | |
116 ~~~~~~~~ | |
117 | |
118 *R*\ eplicable *A*\ xes of *V*\ ariation (RAV) consists of principal | |
119 components repeatedly observed in an independent analysis of multiple | |
120 published datasets. RAVs connect different databases that are both | |
121 linked to the originated study or associated with the RAV itself through | |
122 the gene rankings of it. RAVmodel contains the collection of RAVs | |
123 (RAVindex), metadata from model building process and the additional | |
124 annotations. Currently, two RAVmodels are available based on the gene | |
125 sets used for annotation. | |
126 | |
127 1) C2 : RAVmodel annotated with Molecular Signatures Database (MSigDB) | |
128 curated gene sets (version 7.1) | |
129 2) PLIERpriors : RAVmodel annotated with the three gene sets provided in | |
130 the `PLIER package <https://github.com/wgmao/PLIER>`__ - | |
131 bloodCellMarkersIRISDMAP, svmMarkers, and canonicalPathways | |
132 | |
133 Outputs | |
134 ------- | |
135 | |
136 There are four categories of outputs from this tool, which is one html | |
137 file and three csv tabular files. The actual number of csv files will | |
138 vary depending on the parameter, *–numOut*, and the validated RAVs. | |
139 | |
140 validate.csv | |
141 ~~~~~~~~~~~~ | |
142 | |
143 +--------------------------+--------------------------------------------+ | |
144 | Column | Description | | |
145 +==========================+============================================+ | |
146 | score | the maximum pearson correlation | | |
147 | | coefficient between the top 8 PCs of the | | |
148 | | input and RAVs | | |
149 +--------------------------+--------------------------------------------+ | |
150 | PC | one of the top 8 PCs of the input, which | | |
151 | | gives the highest *score* | | |
152 +--------------------------+--------------------------------------------+ | |
153 | sw | the average silhouette width of the RAV | | |
154 +--------------------------+--------------------------------------------+ | |
155 | cl_size | the size of each RAV | | |
156 +--------------------------+--------------------------------------------+ | |
157 | cl_num | the RAV number | | |
158 +--------------------------+--------------------------------------------+ | |
159 | |
160 Genesets | |
161 ~~~~~~~~ | |
162 | |
163 This is the enriched gene sets for the target RAV, calculated from the | |
164 ranked gene list. Gene sets with the adjusted p-value < 0.05 are | |
165 included. | |
166 | |
167 =========== ================================ | |
168 Column Description | |
169 =========== ================================ | |
170 Description name of the gene sets | |
171 NES normalized enrichment score (ES) | |
172 pvalue statistical significance | |
173 qvalues p-value adjusted for the FDR | |
174 =========== ================================ | |
175 | |
176 Literatures | |
177 ~~~~~~~~~~~ | |
178 | |
179 ========= ====================== | |
180 Column Description | |
181 ========= ====================== | |
182 studyName study accession | |
183 title the title of the study | |
184 ========= ====================== | |
185 | |
186 report.html | |
187 ~~~~~~~~~~~ | |
188 | |
189 A html file with the summary of the main analyses by | |
190 GenomicSuperSignature. It includes MeSH terms in word cloud and an | |
191 interactive plot overviewing the validated RAVs, in addition to the | |
192 previews of the tabular output files. | |
193 | |
194 Citations | |
195 --------- | |
196 | |
197 Oh, S., Geistlinger, L., Ramos, M., Taroni, J.N., Carey, V.J., Greene, | |
198 C.S., Waldron, L., & Davis, S.R. (2021). GenomicSuperSignature: | |
199 interpretation of RNA-seq experiments through robust, efficient | |
200 comparison to public databases. bioRxiv. | |
201 | |
202 References | |
203 ---------- | |
204 | |
205 | GenomicSuperSignature package: | |
206 `webpage <https://shbrief.github.io/GenomicSuperSignature/>`__ | |
207 | GenomicSuperSignature usecases: | |
208 `webpage <https://shbrief.github.io/GenomicSuperSignaturePaper/>`__ | |
209 ]]></help> | |
210 <citations> | |
211 <citation type="doi">10.1101/2021.05.26.445900</citation> | |
212 </citations> | |
213 </tool> |