Mercurial > repos > proteore > proteore_id_converter
comparison id_converter.xml @ 0:f2d0b13d9615 draft
planemo upload commit 5774fd6a5a746f36f6bf4671a51a39ea2b978300-dirty
author | proteore |
---|---|
date | Fri, 16 Feb 2018 03:16:29 -0500 |
parents | |
children | 3b654cb3f6ad |
comparison
equal
deleted
inserted
replaced
-1:000000000000 | 0:f2d0b13d9615 |
---|---|
1 <tool id="IDconverter" name="ID Converter" version="0.1.0"> | |
2 <description>convert public database identifiers (Homo sapiens only for now) | |
3 </description> | |
4 <requirements> | |
5 </requirements> | |
6 <stdio> | |
7 <exit_code range="1:" /> | |
8 </stdio> | |
9 <command interpreter="Rscript"> | |
10 id_converter_UniProt.R | |
11 "$idti.idtypein" | |
12 #if $input.ids == "text" | |
13 "$input.txt" | |
14 "list" | |
15 #else | |
16 "$input.file,$input.ncol,$input.header" | |
17 "file" | |
18 #end if | |
19 "$idto.idtypeout" | |
20 "$output" | |
21 $__tool_directory__/../../utils/human_id_mapping_file.txt | |
22 | |
23 </command> | |
24 <inputs> | |
25 <conditional name="input" > | |
26 <param name="ids" type="select" label="Provide your identifiers" help="Copy/paste or ID list from a file (e.g. table)" > | |
27 <option value="text">Copy/paste your identifiers</option> | |
28 <option value="file">Input file containing your identifiers</option> | |
29 </param> | |
30 <when value="text" > | |
31 <param name="txt" type="text" label="Copy/paste your identifiers" help='IDs must be separated by spaces into the form field, for example: P31946 P62258' > | |
32 <sanitizer> | |
33 <valid initial="string.printable"> | |
34 <remove value="'"/> | |
35 </valid> | |
36 <mapping initial="none"> | |
37 <add source="'" target="__sq__"/> | |
38 </mapping> | |
39 </sanitizer> | |
40 </param> | |
41 </when> | |
42 <when value="file" > | |
43 <param name="file" type="data" format="txt,tabular" label="Choose a file that contains your list of IDs" help="" /> | |
44 <param name="header" type="boolean" checked="true" truevalue="true" falsevalue="false" label="Does your input file contain header?" /> | |
45 <param name="ncol" type="text" label="The column number of IDs to map" help='For example, fill in "c1" if it is the first column, "c2" if it is the second column and so on' /> | |
46 </when> | |
47 </conditional> | |
48 <conditional name="idti" > | |
49 <param name="idtypein" type="select" label="Select type/source of identifier of your list" help="Please see example of IDs in help section" > | |
50 <option value="neXtProt_ID" >neXtProt ID (e.g. NX_P31946)</option> | |
51 <option value="UniProt.AC" selected="True" >Uniprot accession number (e.g. P31946)</option> | |
52 <option value="UniProt.ID" >Uniprot ID (e.g 1433B_HUMAN)</option> | |
53 <option value="GeneID" >Entrez gene ID (e.g. 7529)</option> | |
54 <option value="RefSeq" >RefSeq (NCBI) protein (e.g. NP_003395.1)</option> | |
55 <option value="GI" >GI (NCBI GI number) ID assigned to each sequence record processed by NCBI (e.g. 21328448)</option> | |
56 <option value="PDB" >Protein DataBank ID (e.g. 2BR9:A)</option> | |
57 <option value="GO" >GOterms (Gene Ontology) ID (e.g. GO:0070062)</option> | |
58 <option value="PIR" >Protein Information Resource ID (e.g. S34755)</option> | |
59 <option value="MIM" >OMIM (Online Mendelian Inheritance in Man database) ID (e.g: 601289)</option> | |
60 <option value="UniGene" >Unigene ID (e.g. Hs.643544)</option> | |
61 <option value="Ensembl" >Ensembl gene ID (e.g. ENSG00000166913)</option> | |
62 <option value="Ensembl_TRS" >Ensembl transcript ID (e.g. ENST00000353703)</option> | |
63 <option value="Ensembl_PRO" >Ensembl protein ID (e.g. ENSP00000300161)</option> | |
64 </param> | |
65 <when value="neXtProt_ID" > | |
66 </when> | |
67 <when value="UniProt.AC" > | |
68 </when> | |
69 <when value="UniProt.ID" > | |
70 </when> | |
71 <when value="GeneID" > | |
72 </when> | |
73 <when value="RefSeq" > | |
74 </when> | |
75 <when value="GI" > | |
76 </when> | |
77 <when value="PDB" > | |
78 </when> | |
79 <when value="GO" > | |
80 </when> | |
81 <when value="PIR" > | |
82 </when> | |
83 <when value="MIM" > | |
84 </when> | |
85 <when value="UniGene" > | |
86 </when> | |
87 <when value="Ensembl" > | |
88 </when> | |
89 <when value="Ensembl_TRS" > | |
90 </when> | |
91 <when value="Ensembl_PRO" > | |
92 </when> | |
93 </conditional> | |
94 <section name="idto" title="Target type of IDs" expanded="True" > | |
95 <param name="idtypeout" type="select" label="Target type of IDs you would like to map to" display="checkboxes" multiple="True" help="Please see example of IDs in help section" > | |
96 <option value="neXtProt_ID" >neXtProt ID (e.g. NX_P31946)</option> | |
97 <option value="UniProt.AC" >Uniprot accession number (e.g. P31946)</option> | |
98 <option value="UniProt.ID" >Uniprot ID (e.g 1433B_HUMAN)</option> | |
99 <option value="GeneID" >Entrez gene ID (e.g. 7529)</option> | |
100 <option value="RefSeq" >RefSeq (NCBI) protein (e.g. NP_003395.1)</option> | |
101 <option value="GI" >GI (NCBI GI number) ID assigned to each sequence record processed by NCBI (e.g. 21328448)</option> | |
102 <option value="PDB" >Protein DataBank ID (e.g. 2BR9:A)</option> | |
103 <option value="GO" >GOterms (Gene Ontology) ID (e.g. GO:0070062)</option> | |
104 <option value="PIR" >Protein Information Resource ID (e.g. S34755)</option> | |
105 <option value="MIM" >OMIM (Online Mendelian Inheritance in Man database) ID (e.g: 601289)</option> | |
106 <option value="UniGene" >Unigene ID (e.g. Hs.643544)</option> | |
107 <option value="Ensembl" >Ensembl gene ID (e.g. ENSG00000166913)</option> | |
108 <option value="Ensembl_TRS" >Ensembl transcript ID (e.g. ENST00000353703)</option> | |
109 <option value="Ensembl_PRO" >Ensembl protein ID (e.g. ENSP00000300161)</option> | |
110 </param> | |
111 </section> | |
112 </inputs> | |
113 <outputs> | |
114 <data name="output" format="tabular" /> | |
115 </outputs> | |
116 <tests> | |
117 <test> | |
118 <conditional name="input"> | |
119 <param name="ids" value="file" /> | |
120 <param name="file" value="FKW_Lacombe_et_al_2017_OK.txt" /> | |
121 <param name="header" value="True" /> | |
122 <param name="ncol" value="c1" /> | |
123 </conditional> | |
124 <conditional name="idti"> | |
125 <param name="idtypein" value="UniProt.AC" /> | |
126 </conditional> | |
127 <section name="idto"> | |
128 <param name="idtypeout" value="neXtProt_ID,UniProt.ID,GeneID,MIM,Ensembl" /> | |
129 </section> | |
130 <output name="output" file="ID_Converter_FKW_Lacombe_et_al_2017_OK.txt" /> | |
131 </test> | |
132 </tests> | |
133 <help><![CDATA[ | |
134 This tool converts a list of IDs to another identifier type, select the source and target type from the dropdown menus above (see below supported source and target types). | |
135 | |
136 After choosing the type of input IDs, you can choose one or more types of IDs you would like to map to. | |
137 | |
138 If your input is a list of IDs or a single-column file, the tool will return a file containing the mapped IDs. Please, note that a "NA" is returned when there is no corresponding ID. | |
139 | |
140 If your input is a multiple-column file, the mapped IDs column(s) will be added at the end of the input file. | |
141 | |
142 **Available databases** | |
143 | |
144 * neXtProt ID (e.g. NX_P31946) | |
145 | |
146 * Uniprot accession number (e.g. P31946) | |
147 | |
148 * Uniprot ID (e.g 1433B_HUMAN) | |
149 | |
150 * Entrez gene ID (e.g. 7529) | |
151 | |
152 * RefSeq (NCBI) protein (e.g. NP_003395.1) | |
153 | |
154 * GI (NCBI GI number) ID assigned to each sequence record processed by NCBI (e.g. 21328448) | |
155 | |
156 * Protein DataBank ID (e.g. 2BR9:A) | |
157 | |
158 * GOterms (Gene Ontology) ID (e.g. GO:0070062) | |
159 | |
160 * Protein Information Resource ID (e.g. S34755) | |
161 | |
162 * OMIM (Online Mendelian Inheritance in Man database) ID (e.g: 601289) | |
163 | |
164 * Unigene ID (e.g. Hs.643544) | |
165 | |
166 * Ensembl gene ID (e.g. ENSG00000166913) | |
167 | |
168 * Ensembl transcript ID (e.g. ENST00000353703) | |
169 | |
170 * Ensembl protein ID (e.g. ENSP00000300161) | |
171 | |
172 ----- | |
173 | |
174 .. class:: infomark | |
175 | |
176 This tool converts human IDs using the following source files: | |
177 | |
178 * HUMAN_9606_idmapping_selected.tab | |
179 Tarball downloaded from ftp://ftp.uniprot.org/pub/databases/uniprot/current_release/knowledgebase/idmapping/by_organism/ | |
180 | |
181 * nextprot_ac_list_all.txt | |
182 Downloaded from ftp://ftp.nextprot.org/pub/current_release/ac_lists/ | |
183 | |
184 ----- | |
185 | |
186 .. class:: warningmark | |
187 | |
188 Accession numbers with an hyphen ("-") that normally correspond to isoform are considered | |
189 (and will therefore be treated) as similar to its canonical form. | |
190 | |
191 For example, "Q71U36-2" will be treated as "Q71U36". | |
192 | |
193 ----- | |
194 | |
195 .. class:: infomark | |
196 | |
197 **Authors** | |
198 | |
199 T.P. Lien Nguyen, Florence Combes, Yves Vandenbrouck CEA, INSERM, CNRS, Grenoble-Alpes University, BIG Institute, FR | |
200 | |
201 Sandra Dérozier, Olivier Rué, Christophe Caron, Valentin Loux INRA, Paris-Saclay University, MAIAGE Unit, Migale Bioinformatics platform | |
202 | |
203 This work has been partially funded through the French National Agency for Research (ANR) IFB project. | |
204 | |
205 Contact support@proteore.org for any questions or concerns about the Galaxy implementation of this tool. | |
206 | |
207 ]]></help> | |
208 <citations> | |
209 </citations> | |
210 </tool> |