comparison id_converter.xml @ 0:f2d0b13d9615 draft

planemo upload commit 5774fd6a5a746f36f6bf4671a51a39ea2b978300-dirty
author proteore
date Fri, 16 Feb 2018 03:16:29 -0500
parents
children 3b654cb3f6ad
comparison
equal deleted inserted replaced
-1:000000000000 0:f2d0b13d9615
1 <tool id="IDconverter" name="ID Converter" version="0.1.0">
2 <description>convert public database identifiers (Homo sapiens only for now)
3 </description>
4 <requirements>
5 </requirements>
6 <stdio>
7 <exit_code range="1:" />
8 </stdio>
9 <command interpreter="Rscript">
10 id_converter_UniProt.R
11 "$idti.idtypein"
12 #if $input.ids == "text"
13 "$input.txt"
14 "list"
15 #else
16 "$input.file,$input.ncol,$input.header"
17 "file"
18 #end if
19 "$idto.idtypeout"
20 "$output"
21 $__tool_directory__/../../utils/human_id_mapping_file.txt
22
23 </command>
24 <inputs>
25 <conditional name="input" >
26 <param name="ids" type="select" label="Provide your identifiers" help="Copy/paste or ID list from a file (e.g. table)" >
27 <option value="text">Copy/paste your identifiers</option>
28 <option value="file">Input file containing your identifiers</option>
29 </param>
30 <when value="text" >
31 <param name="txt" type="text" label="Copy/paste your identifiers" help='IDs must be separated by spaces into the form field, for example: P31946 P62258' >
32 <sanitizer>
33 <valid initial="string.printable">
34 <remove value="&apos;"/>
35 </valid>
36 <mapping initial="none">
37 <add source="&apos;" target="__sq__"/>
38 </mapping>
39 </sanitizer>
40 </param>
41 </when>
42 <when value="file" >
43 <param name="file" type="data" format="txt,tabular" label="Choose a file that contains your list of IDs" help="" />
44 <param name="header" type="boolean" checked="true" truevalue="true" falsevalue="false" label="Does your input file contain header?" />
45 <param name="ncol" type="text" label="The column number of IDs to map" help='For example, fill in "c1" if it is the first column, "c2" if it is the second column and so on' />
46 </when>
47 </conditional>
48 <conditional name="idti" >
49 <param name="idtypein" type="select" label="Select type/source of identifier of your list" help="Please see example of IDs in help section" >
50 <option value="neXtProt_ID" >neXtProt ID (e.g. NX_P31946)</option>
51 <option value="UniProt.AC" selected="True" >Uniprot accession number (e.g. P31946)</option>
52 <option value="UniProt.ID" >Uniprot ID (e.g 1433B_HUMAN)</option>
53 <option value="GeneID" >Entrez gene ID (e.g. 7529)</option>
54 <option value="RefSeq" >RefSeq (NCBI) protein (e.g. NP_003395.1)</option>
55 <option value="GI" >GI (NCBI GI number) ID assigned to each sequence record processed by NCBI (e.g. 21328448)</option>
56 <option value="PDB" >Protein DataBank ID (e.g. 2BR9:A)</option>
57 <option value="GO" >GOterms (Gene Ontology) ID (e.g. GO:0070062)</option>
58 <option value="PIR" >Protein Information Resource ID (e.g. S34755)</option>
59 <option value="MIM" >OMIM (Online Mendelian Inheritance in Man database) ID (e.g: 601289)</option>
60 <option value="UniGene" >Unigene ID (e.g. Hs.643544)</option>
61 <option value="Ensembl" >Ensembl gene ID (e.g. ENSG00000166913)</option>
62 <option value="Ensembl_TRS" >Ensembl transcript ID (e.g. ENST00000353703)</option>
63 <option value="Ensembl_PRO" >Ensembl protein ID (e.g. ENSP00000300161)</option>
64 </param>
65 <when value="neXtProt_ID" >
66 </when>
67 <when value="UniProt.AC" >
68 </when>
69 <when value="UniProt.ID" >
70 </when>
71 <when value="GeneID" >
72 </when>
73 <when value="RefSeq" >
74 </when>
75 <when value="GI" >
76 </when>
77 <when value="PDB" >
78 </when>
79 <when value="GO" >
80 </when>
81 <when value="PIR" >
82 </when>
83 <when value="MIM" >
84 </when>
85 <when value="UniGene" >
86 </when>
87 <when value="Ensembl" >
88 </when>
89 <when value="Ensembl_TRS" >
90 </when>
91 <when value="Ensembl_PRO" >
92 </when>
93 </conditional>
94 <section name="idto" title="Target type of IDs" expanded="True" >
95 <param name="idtypeout" type="select" label="Target type of IDs you would like to map to" display="checkboxes" multiple="True" help="Please see example of IDs in help section" >
96 <option value="neXtProt_ID" >neXtProt ID (e.g. NX_P31946)</option>
97 <option value="UniProt.AC" >Uniprot accession number (e.g. P31946)</option>
98 <option value="UniProt.ID" >Uniprot ID (e.g 1433B_HUMAN)</option>
99 <option value="GeneID" >Entrez gene ID (e.g. 7529)</option>
100 <option value="RefSeq" >RefSeq (NCBI) protein (e.g. NP_003395.1)</option>
101 <option value="GI" >GI (NCBI GI number) ID assigned to each sequence record processed by NCBI (e.g. 21328448)</option>
102 <option value="PDB" >Protein DataBank ID (e.g. 2BR9:A)</option>
103 <option value="GO" >GOterms (Gene Ontology) ID (e.g. GO:0070062)</option>
104 <option value="PIR" >Protein Information Resource ID (e.g. S34755)</option>
105 <option value="MIM" >OMIM (Online Mendelian Inheritance in Man database) ID (e.g: 601289)</option>
106 <option value="UniGene" >Unigene ID (e.g. Hs.643544)</option>
107 <option value="Ensembl" >Ensembl gene ID (e.g. ENSG00000166913)</option>
108 <option value="Ensembl_TRS" >Ensembl transcript ID (e.g. ENST00000353703)</option>
109 <option value="Ensembl_PRO" >Ensembl protein ID (e.g. ENSP00000300161)</option>
110 </param>
111 </section>
112 </inputs>
113 <outputs>
114 <data name="output" format="tabular" />
115 </outputs>
116 <tests>
117 <test>
118 <conditional name="input">
119 <param name="ids" value="file" />
120 <param name="file" value="FKW_Lacombe_et_al_2017_OK.txt" />
121 <param name="header" value="True" />
122 <param name="ncol" value="c1" />
123 </conditional>
124 <conditional name="idti">
125 <param name="idtypein" value="UniProt.AC" />
126 </conditional>
127 <section name="idto">
128 <param name="idtypeout" value="neXtProt_ID,UniProt.ID,GeneID,MIM,Ensembl" />
129 </section>
130 <output name="output" file="ID_Converter_FKW_Lacombe_et_al_2017_OK.txt" />
131 </test>
132 </tests>
133 <help><![CDATA[
134 This tool converts a list of IDs to another identifier type, select the source and target type from the dropdown menus above (see below supported source and target types).
135
136 After choosing the type of input IDs, you can choose one or more types of IDs you would like to map to.
137
138 If your input is a list of IDs or a single-column file, the tool will return a file containing the mapped IDs. Please, note that a "NA" is returned when there is no corresponding ID.
139
140 If your input is a multiple-column file, the mapped IDs column(s) will be added at the end of the input file.
141
142 **Available databases**
143
144 * neXtProt ID (e.g. NX_P31946)
145
146 * Uniprot accession number (e.g. P31946)
147
148 * Uniprot ID (e.g 1433B_HUMAN)
149
150 * Entrez gene ID (e.g. 7529)
151
152 * RefSeq (NCBI) protein (e.g. NP_003395.1)
153
154 * GI (NCBI GI number) ID assigned to each sequence record processed by NCBI (e.g. 21328448)
155
156 * Protein DataBank ID (e.g. 2BR9:A)
157
158 * GOterms (Gene Ontology) ID (e.g. GO:0070062)
159
160 * Protein Information Resource ID (e.g. S34755)
161
162 * OMIM (Online Mendelian Inheritance in Man database) ID (e.g: 601289)
163
164 * Unigene ID (e.g. Hs.643544)
165
166 * Ensembl gene ID (e.g. ENSG00000166913)
167
168 * Ensembl transcript ID (e.g. ENST00000353703)
169
170 * Ensembl protein ID (e.g. ENSP00000300161)
171
172 -----
173
174 .. class:: infomark
175
176 This tool converts human IDs using the following source files:
177
178 * HUMAN_9606_idmapping_selected.tab
179 Tarball downloaded from ftp://ftp.uniprot.org/pub/databases/uniprot/current_release/knowledgebase/idmapping/by_organism/
180
181 * nextprot_ac_list_all.txt
182 Downloaded from ftp://ftp.nextprot.org/pub/current_release/ac_lists/
183
184 -----
185
186 .. class:: warningmark
187
188 Accession numbers with an hyphen ("-") that normally correspond to isoform are considered
189 (and will therefore be treated) as similar to its canonical form.
190
191 For example, "Q71U36-2" will be treated as "Q71U36".
192
193 -----
194
195 .. class:: infomark
196
197 **Authors**
198
199 T.P. Lien Nguyen, Florence Combes, Yves Vandenbrouck CEA, INSERM, CNRS, Grenoble-Alpes University, BIG Institute, FR
200
201 Sandra Dérozier, Olivier Rué, Christophe Caron, Valentin Loux INRA, Paris-Saclay University, MAIAGE Unit, Migale Bioinformatics platform
202
203 This work has been partially funded through the French National Agency for Research (ANR) IFB project.
204
205 Contact support@proteore.org for any questions or concerns about the Galaxy implementation of this tool.
206
207 ]]></help>
208 <citations>
209 </citations>
210 </tool>