comparison checkformat_config.xml @ 3:80a38d36f946 draft

planemo upload for repository https://github.com/workflow4metabolomics/checkformat.git commit 5cf3f6eb62c1396ade1b068a3dd3cc2e3f827e15
author ethevenot
date Thu, 11 Jan 2018 10:24:56 -0500
parents b6a6b4cc932a
children 9590fac86f63
comparison
equal deleted inserted replaced
2:b6a6b4cc932a 3:80a38d36f946
1 <tool id="checkFormat" name="Check Format" version="2.0.4"> 1 <tool id="checkFormat" name="Check Format" version="3.0.0">
2 <description>Checks the formats of the dataMatrix, sampleMetadata, and variableMetadata files</description> 2 <description>Checking/formatting the sample and variable names of the dataMatrix, sampleMetadata, and variableMetadata files</description>
3 3
4 <requirements> 4 <requirements>
5 <requirement type="package">r-batch</requirement> 5 <requirement type="package">r-batch</requirement>
6 </requirements> 6 </requirements>
7 7
12 <command><![CDATA[ 12 <command><![CDATA[
13 Rscript $__tool_directory__/checkformat_wrapper.R 13 Rscript $__tool_directory__/checkformat_wrapper.R
14 dataMatrix_in "$dataMatrix_in" 14 dataMatrix_in "$dataMatrix_in"
15 sampleMetadata_in "$sampleMetadata_in" 15 sampleMetadata_in "$sampleMetadata_in"
16 variableMetadata_in "$variableMetadata_in" 16 variableMetadata_in "$variableMetadata_in"
17 17 makeNameL "$makeNameL"
18
19 dataMatrix_out "$dataMatrix_out"
20 sampleMetadata_out "$sampleMetadata_out"
21 variableMetadata_out "$variableMetadata_out"
18 information "$information" 22 information "$information"
19 ]]></command> 23 ]]></command>
20 24
21 <inputs> 25 <inputs>
22 <param name="dataMatrix_in" type="data" label="Data matrix file" help="" format="tabular" /> 26 <param name="dataMatrix_in" type="data" label="Data matrix file" help="" format="tabular" />
23 <param name="sampleMetadata_in" type="data" label="Sample metadata file" help="" format="tabular" /> 27 <param name="sampleMetadata_in" type="data" label="Sample metadata file" help="" format="tabular" />
24 <param name="variableMetadata_in" type="data" label="Variable metadata file" help="" format="tabular" /> 28 <param name="variableMetadata_in" type="data" label="Variable metadata file" help="" format="tabular" />
29 <param name="makeNameL" label="Make syntactically valid sample and variable names" type="select" help="">
30 <option value="TRUE">yes</option>
31 <option value="FALSE" selected="true">no</option>
32 </param>
25 </inputs> 33 </inputs>
26 34
27 <outputs> 35 <outputs>
36 <data name="dataMatrix_out" label="${tool.name}_${dataMatrix_in.name}" format="tabular" ></data>
37 <data name="sampleMetadata_out" label="${tool.name}_${sampleMetadata_in.name}" format="tabular" ></data>
38 <data name="variableMetadata_out" label="${tool.name}_${variableMetadata_in.name}" format="tabular" ></data>
28 <data name="information" label="${tool.name}_information.txt" format="txt"/> 39 <data name="information" label="${tool.name}_information.txt" format="txt"/>
29 </outputs> 40 </outputs>
30 41
31 <tests> 42 <tests>
32 <test> 43 <test>
33 <param name="dataMatrix_in" value="input-dataMatrix.tsv"/> 44 <param name="dataMatrix_in" value="input-dataMatrix.tsv"/>
34 <param name="sampleMetadata_in" value="input-sampleMetadata.tsv"/> 45 <param name="sampleMetadata_in" value="input-sampleMetadata.tsv"/>
35 <param name="variableMetadata_in" value="input-variableMetadata.tsv"/> 46 <param name="variableMetadata_in" value="input-variableMetadata.tsv"/>
36 <output name="information" file="output-information.txt" lines_diff="4"/> 47 <param name="makeNameL" value="TRUE"/>
48 <output name="information">
49 <assert_contents>
50 <has_text text="Message: Converting sample and variable names to the standard R format" />
51 <has_text text="Warning: The sample and/or variable names or orders from the input tables have been modified" />
52 </assert_contents>
53 </output>
37 </test> 54 </test>
38 </tests> 55 </tests>
39 56
40 <help> 57 <help><![CDATA[
41 58
42 .. class:: infomark 59 .. class:: infomark
43 60
44 **Author** Etienne Thevenot (W4M Core Development Team, MetaboHUB Paris, CEA) 61 **Author** Etienne Thevenot (W4M Core Development Team, MetaboHUB Paris, CEA)
45 62
51 68
52 See the **NEWS** section at the bottom of this page 69 See the **NEWS** section at the bottom of this page
53 70
54 --------------------------------------------------- 71 ---------------------------------------------------
55 72
56 ======================== 73 ============
57 Check Format 74 Check Format
58 ======================== 75 ============
59 76
60 ----------- 77 -----------
61 Description 78 Description
62 ----------- 79 -----------
63 80
64 | Checks the format (row and column names) of the dataMatrix, sampleMetadata and variableMetadata tables 81 | **Checks the format (row and column names)** of the dataMatrix, sampleMetadata and variableMetadata tables; in case of difference of orders of the samples and/or variables between (some of) the tables, the **orders from the dataMatrix are permuted** to match those of the sampleMetadata and/or the variableMetadata; sample and variables names can also be modified to be **syntactically valid** for R by selecting the corresponding argument (e.g. an 'X' is added to names starting with a digit, blanks will be converted to '.', etc.).
65 82
66 83
67 ----------------- 84 -----------------
68 Workflow position 85 Workflow position
69 ----------------- 86 -----------------
70 87
71 .. image:: ./static/images/checkFormat_workflowPositionImage.png 88 .. image:: ./static/images/checkFormat_workflowPositionImage.png
72 :width: 600 89
73
74
75 90
76 ----------- 91 -----------
77 Input files 92 Input files
78 ----------- 93 -----------
79 94
84 +----------------------------+---------+ 99 +----------------------------+---------+
85 | 2 : Sample metadata file | tabular | 100 | 2 : Sample metadata file | tabular |
86 +----------------------------+---------+ 101 +----------------------------+---------+
87 | 3 : Variable metadata file | tabular | 102 | 3 : Variable metadata file | tabular |
88 +----------------------------+---------+ 103 +----------------------------+---------+
89 104
90 | 105 | The **required formats** for the dataMatrix, sampleMetadata, and variableMetadata files are described in the **HowTo** entitled 'Format Data For Postprocessing' available on the main page of Workflow4Metabolomics.org (http://web11.sb-roscoff.fr/download/w4m/howto/w4m_HowToFormatDataForPostprocessing_v02.pdf)
91 | **Required formats for the dataMatrix, sampleMetadata, and variableMetadata files are** 106
92 | **described in the HowTo entitled 'Format Data For Postprocessing' available on the** 107
93 | **main page of Workflow4Metabolomics.org** 108 ----------
94 | 109 Parameters
95 110 ----------
111
112 Data matrix file
113 | variable x sample **dataMatrix** tabular separated file of the numeric data matrix, with . as decimal, and NA for missing values; the table must not contain metadata apart from row and column names; the row and column names must be identical to the rownames of the sample and variable metadata, respectively (see below)
114 |
115
116 Sample metadata file
117 | sample x metadata **sampleMetadata** tabular separated file of the numeric and/or character sample metadata, with . as decimal and NA for missing values
118 |
119
120 Variable metadata file
121 | variable x metadata **variableMetadata** tabular separated file of the numeric and/or character variable metadata, with . as decimal and NA for missing values
122 |
123
124 Make syntactically valid sample and variable names
125 | if set to 'yes', sample and variable names will converted to syntactically valid names with the 'make.names' R function when required (e.g. an 'X' is added to names starting with a digit, blanks will be converted to '.', etc.)
126 |
127
96 ------------ 128 ------------
97 Output files 129 Output files
98 ------------ 130 ------------
99 131
132 dataMatrix_out.tabular
133 | dataMatrix data file; may be identical to the input dataMatrix in case no renaming of sample/variable names nor re-ordering of samples/variables (see the 'information' file for the presence/absence of modifications)
134 |
135
136 sampleMetadata_out.tabular
137 | sampleMetadata data file; may be identical to the input sampleMetadata in case no renaming of sample names nor re-ordering of samples (see the 'information' file for the presence/absence of modifications)
138 |
139
140 variableMetadata_out.tabular
141 | variableMetadata data file; may be identical to the input variableMetadata in case no renaming of variable names nor re-ordering of variables (see the 'information' file for the presence/absence of modifications)
142 |
143
100 information.txt 144 information.txt
101 | Text file with all messages when error(s) in formats are detected 145 | Text file with all messages when error(s) in formats are detected
102 | 146 |
103 147
104 --------------------------------------------------- 148 ---------------------------------------------------
105 149
106 --------------- 150 ---------------
107 Working example 151 Working example
114 --------------------------------------------------- 158 ---------------------------------------------------
115 159
116 ---- 160 ----
117 NEWS 161 NEWS
118 ---- 162 ----
163
164 CHANGES IN VERSION 3.0.0
165 ========================
166
167 NEW FEATURES
168
169 Automated re-ordering (if necessary) of sample and/or variable names from dataMatrix based on sampleMetadata and variableMetadata
170
171 New argument to make sample and variable names syntactically valid
172
173 Output of dataMatrix, sampleMetadata, and variableMetadata files, whether they have been modified or not
119 174
120 CHANGES IN VERSION 2.0.4 175 CHANGES IN VERSION 2.0.4
121 ======================== 176 ========================
122 177
123 INTERNAL MODIFICATIONS 178 INTERNAL MODIFICATIONS
133 Planemo running validation 188 Planemo running validation
134 Planemo installing validation 189 Planemo installing validation
135 Travis automated testing 190 Travis automated testing
136 Toolshed export 191 Toolshed export
137 192
138 </help> 193 ]]></help>
139 194
140 <citations> 195 <citations>
141 <citation type="bibtex">@Article{Thevenot2015, 196 <citation type="doi">10.1021/acs.jproteome.5b00354</citation>
142 Title = {Analysis of the human adult urinary metabolome variations with age, body mass index and gender by implementing a comprehensive workflow for univariate and OPLS statistical analyses}, 197 <citation type="doi">10.1016/j.biocel.2017.07.002</citation>
143 Author = {Thévenot, Etienne A. and Roux, Aurélie and Xu, Ying and Ezan, Eric and Junot, Christophe},
144 Journal = {Journal of Proteome Research},
145 Year = {2015},
146 Note = {PMID: 26088811},
147 Number = {8},
148 Pages = {3322-3335},
149 Volume = {14},
150
151 Doi = {10.1021/acs.jproteome.5b00354},
152 Url = {http://pubs.acs.org/doi/full/10.1021/acs.jproteome.5b00354}
153 }</citation>
154 <citation type="doi">10.1093/bioinformatics/btu813</citation> 198 <citation type="doi">10.1093/bioinformatics/btu813</citation>
155 </citations> 199 </citations>
156 <!-- 200
157
158
159 Working example
160
161
162
163 Input files
164 ===========
165
166 | **To generate the "dataMatrix", "sampleMetadata" and "variableMetadata" files:**
167 | **1) copy/paste the values below in three distinct .txt files**
168 | **2) use the "Get Data" / "Upload File" in the "Tools" (left) panel from the Galaxy / ABiMS page by choosing:**
169 | **a) File Format: 'tabular'**
170 | **b) Convert spaces to tabs: 'Yes'**
171 |
172
173 **dataMatrix file**::
174
175 dataMatrix HU_017 HU_021 HU_027 HU_032 HU_041 HU_048 HU_049 HU_050 HU_052 HU_059 HU_060 HU_066 HU_072 HU_077 HU_090 HU_109 HU_110 HU_125 HU_126 HU_131 HU_134 HU_149 HU_150 HU_173 HU_179 HU_180 HU_182 HU_202 HU_204 HU_209
176 HMDB01032 2569204.92420381 6222035.77434915 17070707.9912636 1258838.24348419 13039543.0754619 1909391.77026598 3495.09386434063 2293521.90928998 128503.275117713 81872.5276382213 8103557.56578035 149574887.036181 1544036.41049333 7103429.53933206 14138796.50382 4970265.57952158 263054.73056162 1671332.30008058 88433.1944958815 23602331.2894815 18648126.5206986 1554657.98756878 34152.3646391152 209372.71275317 33187733.370626 202438.591636003 13581070.0886437 354170.810678102 9120781.48986975 43419175.4051586
177 HMDB03072 3628416.30251025 65626.9834353751 112170.118946651 3261804.34422417 42228.2787747563 343254.201250707 1958217.69317664 11983270.0435677 5932111.41638028 5511385.83359531 9154521.47755199 2632133.21209418 9500411.14556502 6551644.51726592 7204319.80891836 1273412.04795188 3260583.81592376 8932005.5351622 8340827.52597275 9256460.69197759 11217839.169041 5919262.81433556 11790077.0657915 9567977.80797097 73717.5811684739 9991787.29074293 4208098.14739633 623970.649925847 10904221.2642849 2171793.93621067
178 HMDB00792 429568.609438384 3887629.50527037 1330692.11658995 1367446.73023821 844197.447472453 2948090.71886592 1614157.90566884 3740009.19379795 3292251.66531919 2310688.79492013 4404239.59008605 3043289.12780863 825736.467181043 2523241.91730649 6030501.02648005 474901.604069803 2885792.42617652 2955990.64049134 1917716.3427982 1767962.67737699 5926203.40397675 1639065.69474684 346810.763557826 1054776.22313737 2390258.27543894 1831346.37315857 1026696.36904362 7079792.50047866 4368341.01359769 3495986.87280275
179
180
181 **sampleMetadata file**::
182
183 sampleMetadata age ageGrp
184 HU_017 41 experienced
185 HU_021 34 junior
186 HU_027 37 experienced
187 HU_032 38 experienced
188 HU_041 28 junior
189 HU_048 39 experienced
190 HU_049 50 senior
191 HU_050 30 junior
192 HU_052 51 senior
193 HU_059 81 senior
194 HU_060 55 senior
195 HU_066 25 junior
196 HU_072 47 experienced
197 HU_077 27 junior
198 HU_091 46 experienced
199 HU_109 32 junior
200 HU_110 50 senior
201 HU_125 58 senior
202 HU_126 45 experienced
203 HU_131 42 experienced
204 HU_134 48 experienced
205 HU_149 35 experienced
206 HU_150 49 experienced
207 HU_173 55 senior
208 HU_179 33 junior
209 HU_180 53 senior
210 HU_182 43 experienced
211 HU_202 42 experienced
212 HU_204 31 junior
213 HU_209 17.5 junior
214
215
216 **variableMetadata file**::
217
218 variableMetadata name
219 HMDB01032 Dehydroepiandrosterone sulfate
220 HMDB03072 Quinic acid
221 HMDB00792 Sebacic acid
222 -->
223 201
224 </tool> 202 </tool>