Mercurial > repos > proteore > proteore_id_converter
comparison id_converter.xml @ 15:b50d913ec067 draft
planemo upload commit bdd7e8a1f08c11db2a9f1b6db5535c6d32153b2b
author | proteore |
---|---|
date | Tue, 18 Dec 2018 09:57:21 -0500 |
parents | 659f1248f535 |
children | b6607b7e683f |
comparison
equal
deleted
inserted
replaced
14:659f1248f535 | 15:b50d913ec067 |
---|---|
1 <tool id="IDconverter" name="ID Converter" version="2018.09.18"> | 1 <tool id="IDconverter" name="ID Converter" version="2018.12.18"> |
2 <description>convert public database identifiers | 2 <description>(Human, Mouse, Rat) |
3 </description> | 3 </description> |
4 <requirements> | 4 <requirements> |
5 <requirement type="package" version="3.4.1">R</requirement> | 5 <requirement type="package" version="3.4.1">R</requirement> |
6 </requirements> | 6 </requirements> |
7 <stdio> | 7 <stdio> |
8 <exit_code range="1:" /> | 8 <exit_code range="1:" /> |
9 </stdio> | 9 </stdio> |
10 <command interpreter="Rscript"> | 10 <command interpreter="Rscript"> |
11 $__tool_directory__/id_converter_UniProt.R | 11 $__tool_directory__/id_converter.R |
12 --id_type="$species.idtypein" | 12 --id_type="$species.idtypein" |
13 #if $input.ids == "text" | 13 #if $input.ids == "text" |
14 --input="$input.txt" | 14 --input="$input.txt" |
15 --input_type="list" | 15 --input_type="list" |
16 #else | 16 #else |
19 --header="$input.header" | 19 --header="$input.header" |
20 --input_type="file" | 20 --input_type="file" |
21 #end if | 21 #end if |
22 --target_ids="$species.idto.idtypeout" | 22 --target_ids="$species.idto.idtypeout" |
23 --output="$output" | 23 --output="$output" |
24 --ref_file="$__tool_directory__/${ filter( lambda x: str( x[0] ) == str( $species.mapping_file ), $__app__.tool_data_tables['id_mapping_tab'].get_fields() )[0][-1] }" | 24 --ref_file="$__tool_directory__/${ filter( lambda x: str( x[0] ) == str( $species.mapping_file ), $__app__.tool_data_tables['proteore_id_mapping'].get_fields() )[0][-1] }" |
25 | 25 |
26 </command> | 26 </command> |
27 <inputs> | 27 <inputs> |
28 <conditional name="input" > | 28 <conditional name="input" > |
29 <param name="ids" type="select" label="Provide your identifiers" help="Copy/paste or ID list from a file (e.g. table)" > | 29 <param name="ids" type="select" label="Enter IDs" help="Copy/paste or from a file (e.g. table)" > |
30 <option value="text">Copy/paste your identifiers</option> | 30 <option value="text">Copy/paste your identifiers</option> |
31 <option value="file" selected="true">Input file containing your identifiers</option> | 31 <option value="file" selected="true">Input file containing IDs</option> |
32 </param> | 32 </param> |
33 <when value="text" > | 33 <when value="text" > |
34 <param name="txt" type="text" label="Copy/paste your identifiers" help='IDs must be separated by "," into the form field, for example: P31946,P62258' > | 34 <param name="txt" type="text" label="Copy/paste IDs" help='IDs must be separated by tab, space or carriage return into the form field, for example: P31946 P62258' > |
35 <sanitizer invalid_char=""> | 35 <sanitizer invalid_char=""> |
36 <valid initial="string.printable"> | 36 <valid initial="string.printable"> |
37 <remove value="'"/> | 37 <remove value="'"/> |
38 </valid> | 38 </valid> |
39 <mapping initial="none"> | 39 <mapping initial="none"> |
45 </mapping> | 45 </mapping> |
46 </sanitizer> | 46 </sanitizer> |
47 </param> | 47 </param> |
48 </when> | 48 </when> |
49 <when value="file" > | 49 <when value="file" > |
50 <param name="file" type="data" format="txt,tabular" label="Choose a file that contains your list of IDs" help="" /> | 50 <param name="file" type="data" format="txt,tabular" label="Select your file" help="" /> |
51 <param name="header" type="boolean" checked="true" truevalue="true" falsevalue="false" label="Does your input file contain header?" /> | 51 <param name="header" type="boolean" checked="true" truevalue="true" falsevalue="false" label="Does file contain header?" /> |
52 <param name="ncol" type="text" value="c1" label="The column number of IDs to map" help='For example, fill in "c1" if it is the first column, "c2" if it is the second column and so on' /> | 52 <param name="ncol" type="text" value="c1" label="Column number of IDs to map" help='For example, fill in "c1" if it is the first column, "c2" if it is the second column and so on' /> |
53 </when> | 53 </when> |
54 </conditional> | 54 </conditional> |
55 <conditional name="species"> | 55 <conditional name="species"> |
56 <param name="mapping_file" type="select" label="Select species for ID conversion" > | 56 <param name="mapping_file" type="select" label="Species" > |
57 <options from_data_table="id_mapping_tab"/> | 57 <options from_data_table="proteore_id_mapping"/> |
58 <option value="human_id_mapping"></option> | 58 <option value="human_id_mapping"></option> |
59 <option value="mouse_id_mapping"></option> | 59 <option value="mouse_id_mapping"></option> |
60 <option value="rat_id_mapping"></option> | |
60 </param> | 61 </param> |
61 <when value="human_id_mapping"> | 62 <when value="human_id_mapping"> |
62 <param name="idtypein" type="select" label="Select type/source of identifier of your list" help="Please see example of IDs in help section" > | 63 <param name="idtypein" type="select" label="Type/source of IDs" optional="false" > |
63 <option value="neXtProt" >neXtProt ID (e.g. NX_P31946)</option> | 64 <option value="neXtProt" >neXtProt ID (e.g. NX_P31946)</option> |
64 <option value="UniProt.AC" selected="True" >Uniprot accession number (e.g. P31946)</option> | 65 <option value="UniProt-AC" selected="True" >UniProt accession number (e.g. P31946)</option> |
65 <option value="UniProt.ID" >Uniprot ID (e.g 1433B_HUMAN)</option> | 66 <option value="UniProt-ID" >UniProt ID (e.g 1433B_HUMAN)</option> |
66 <option value="GeneID" >Entrez gene ID (e.g. 7529)</option> | 67 <option value="GeneID" >Entrez gene ID (e.g. 7529)</option> |
67 <option value="RefSeq" >RefSeq (NCBI) protein (e.g. NP_003395.1)</option> | 68 <option value="RefSeq" >RefSeq (NCBI) protein (e.g. NP_003395.1)</option> |
68 <option value="GI" >GI (NCBI GI number) ID assigned to each sequence record processed by NCBI (e.g. 21328448)</option> | 69 <option value="GI" >GI (NCBI GI number) (e.g. 21328448)</option> |
70 <option value="PDB" >Protein DataBank ID (e.g. 2BR9:A)</option> | |
71 <option value="GO" >GO terms (Gene Ontology) ID (e.g. GO:0070062)</option> | |
72 <option value="PIR" >Protein Information Resource ID (e.g. S34755)</option> | |
73 <option value="MIM" >OMIM (Online Mendelian Inheritance in Man database) ID (e.g: 601289)</option> | |
74 <option value="UniGene" >Unigene ID (e.g. Hs.643544)</option> | |
75 <option value="Ensembl_Gene" >Ensembl gene ID (e.g. ENSG00000166913)</option> | |
76 <option value="Ensembl_Transcript" >Ensembl transcript ID (e.g. ENST00000353703)</option> | |
77 <option value="Ensembl_Protein" >Ensembl protein ID (e.g. ENSP00000300161)</option> | |
78 <option value="BioGrid" >BioGrid (e.g. 113361)</option> | |
79 <option value="STRING" >STRING (e.g. 9606.ENSP00000300161)</option> | |
80 <option value="KEGG" >KEGG gene id (e.g. hsa:7529)</option> | |
81 </param> | |
82 <section name="idto" title="Target type" expanded="True" > | |
83 <param name="idtypeout" type="select" label="Target type of IDs you would like to map to" display="checkboxes" multiple="True" optional="false" > | |
84 <option value="neXtProt" >neXtProt ID (e.g. NX_P31946)</option> | |
85 <option value="UniProt-AC" >UniProt accession number (e.g. P31946)</option> | |
86 <option value="UniProt-ID" >UniProt ID (e.g 1433B_HUMAN)</option> | |
87 <option value="GeneID" >Entrez gene ID (e.g. 7529)</option> | |
88 <option value="RefSeq" >RefSeq (NCBI) protein (e.g. NP_003395.1)</option> | |
89 <option value="GI" >GI (NCBI GI number) (e.g. 21328448)</option> | |
90 <option value="PDB" >Protein DataBank ID (e.g. 2BR9:A)</option> | |
91 <option value="GO" >GOterms (Gene Ontology) ID (e.g. GO:0070062)</option> | |
92 <option value="PIR" >Protein Information Resource ID (e.g. S34755)</option> | |
93 <option value="MIM" >OMIM (Online Mendelian Inheritance in Man database) ID (e.g: 601289)</option> | |
94 <option value="UniGene" >Unigene ID (e.g. Hs.643544)</option> | |
95 <option value="Ensembl_Gene" >Ensembl gene ID (e.g. ENSG00000166913)</option> | |
96 <option value="Ensembl_Transcript" >Ensembl transcript ID (e.g. ENST00000353703)</option> | |
97 <option value="Ensembl_Protein" >Ensembl protein ID (e.g. ENSP00000300161)</option> | |
98 <option value="BioGrid" >BioGrid (e.g. 113361)</option> | |
99 <option value="STRING" >STRING (e.g. 9606.ENSP00000300161)</option> | |
100 <option value="KEGG" >KEGG gene id (e.g. hsa:7529)</option> | |
101 </param> | |
102 </section> | |
103 </when> | |
104 <when value="mouse_id_mapping"> | |
105 <param name="idtypein" type="select" label="Type/source of IDs" optional="false" > | |
106 <option value="UniProt-AC" selected="True" >UniProt accession number (e.g. P31946)</option> | |
107 <option value="UniProt-ID" >UniProt ID (e.g 1433B_HUMAN)</option> | |
108 <option value="GeneID" >Entrez gene ID (e.g. 7529)</option> | |
109 <option value="RefSeq" >RefSeq (NCBI) protein (e.g. NP_003395.1)</option> | |
110 <option value="GI" >GI (NCBI GI number) (e.g. 21328448)</option> | |
69 <option value="PDB" >Protein DataBank ID (e.g. 2BR9:A)</option> | 111 <option value="PDB" >Protein DataBank ID (e.g. 2BR9:A)</option> |
70 <option value="GO" >GOterms (Gene Ontology) ID (e.g. GO:0070062)</option> | 112 <option value="GO" >GOterms (Gene Ontology) ID (e.g. GO:0070062)</option> |
71 <option value="PIR" >Protein Information Resource ID (e.g. S34755)</option> | 113 <option value="PIR" >Protein Information Resource ID (e.g. S34755)</option> |
72 <option value="MIM" >OMIM (Online Mendelian Inheritance in Man database) ID (e.g: 601289)</option> | 114 <option value="MIM" >OMIM (Online Mendelian Inheritance in Man database) ID (e.g: 601289)</option> |
73 <option value="UniGene" >Unigene ID (e.g. Hs.643544)</option> | 115 <option value="UniGene" >Unigene ID (e.g. Hs.643544)</option> |
74 <option value="Ensembl_Gene" >Ensembl gene ID (e.g. ENSG00000166913)</option> | 116 <option value="Ensembl_Gene" >Ensembl gene ID (e.g. ENSG00000166913)</option> |
75 <option value="Ensembl_Transcript" >Ensembl transcript ID (e.g. ENST00000353703)</option> | 117 <option value="Ensembl_Transcript" >Ensembl transcript ID (e.g. ENST00000353703)</option> |
76 <option value="Ensembl_Protein" >Ensembl protein ID (e.g. ENSP00000300161)</option> | 118 <option value="Ensembl_Protein" >Ensembl protein ID (e.g. ENSP00000300161)</option> |
77 <option value="BioGrid" >BioGrid (e.g. 113361)</option> | 119 <option value="BioGrid" >BioGrid (e.g. 113361)</option> |
78 <option value="STRING" >STRING (e.g. 9606.ENSP00000300161)</option> | 120 <option value="STRING" >STRING (e.g. 9606.ENSP00000300161)</option> |
79 <option value="KEGG" >KEGG (e.g. hsa:7529)</option> | 121 <option value="KEGG" >KEGG gene id (e.g. hsa:7529)</option> |
80 </param> | 122 </param> |
81 <section name="idto" title="Target type of IDs" expanded="True" > | 123 <section name="idto" title="Target type of IDs" expanded="True" > |
82 <param name="idtypeout" type="select" label="Target type of IDs you would like to map to" display="checkboxes" multiple="True" help="Please see example of IDs in help section" > | 124 <param name="idtypeout" type="select" label="Target type of IDs you would like to map to" display="checkboxes" multiple="True" optional="false" > |
83 <option value="neXtProt" >neXtProt ID (e.g. NX_P31946)</option> | 125 <option value="UniProt-AC" >UniProt accession number (e.g. P31946)</option> |
84 <option value="UniProt.AC" >Uniprot accession number (e.g. P31946)</option> | 126 <option value="UniProt-ID" >UniProt ID (e.g 1433B_HUMAN)</option> |
85 <option value="UniProt.ID" >Uniprot ID (e.g 1433B_HUMAN)</option> | |
86 <option value="GeneID" >Entrez gene ID (e.g. 7529)</option> | 127 <option value="GeneID" >Entrez gene ID (e.g. 7529)</option> |
87 <option value="RefSeq" >RefSeq (NCBI) protein (e.g. NP_003395.1)</option> | 128 <option value="RefSeq" >RefSeq (NCBI) protein (e.g. NP_003395.1)</option> |
88 <option value="GI" >GI (NCBI GI number) ID assigned to each sequence record processed by NCBI (e.g. 21328448)</option> | 129 <option value="GI" >GI (NCBI GI number) (e.g. 21328448)</option> |
89 <option value="PDB" >Protein DataBank ID (e.g. 2BR9:A)</option> | 130 <option value="PDB" >Protein DataBank ID (e.g. 2BR9:A)</option> |
90 <option value="GO" >GOterms (Gene Ontology) ID (e.g. GO:0070062)</option> | 131 <option value="GO" >GOterms (Gene Ontology) ID (e.g. GO:0070062)</option> |
91 <option value="PIR" >Protein Information Resource ID (e.g. S34755)</option> | 132 <option value="PIR" >Protein Information Resource ID (e.g. S34755)</option> |
92 <option value="MIM" >OMIM (Online Mendelian Inheritance in Man database) ID (e.g: 601289)</option> | |
93 <option value="UniGene" >Unigene ID (e.g. Hs.643544)</option> | 133 <option value="UniGene" >Unigene ID (e.g. Hs.643544)</option> |
94 <option value="Ensembl_Gene" >Ensembl gene ID (e.g. ENSG00000166913)</option> | 134 <option value="Ensembl_Gene" >Ensembl gene ID (e.g. ENSG00000166913)</option> |
95 <option value="Ensembl_Transcript" >Ensembl transcript ID (e.g. ENST00000353703)</option> | 135 <option value="Ensembl_Transcript" >Ensembl transcript ID (e.g. ENST00000353703)</option> |
96 <option value="Ensembl_Protein" >Ensembl protein ID (e.g. ENSP00000300161)</option> | 136 <option value="Ensembl_Protein" >Ensembl protein ID (e.g. ENSP00000300161)</option> |
97 <option value="BioGrid" >BioGrid (e.g. 113361)</option> | 137 <option value="BioGrid" >BioGrid (e.g. 113361)</option> |
98 <option value="STRING" >STRING (e.g. 9606.ENSP00000300161)</option> | 138 <option value="STRING" >STRING (e.g. 9606.ENSP00000300161)</option> |
99 <option value="KEGG" >KEGG (e.g. hsa:7529)</option> | 139 <option value="KEGG" >KEGG gene id (e.g. hsa:7529)</option> |
100 </param> | 140 </param> |
101 </section> | 141 </section> |
102 </when> | 142 </when> |
103 <when value="mouse_id_mapping"> | 143 <when value="rat_id_mapping"> |
104 <param name="idtypein" type="select" label="Select type/source of identifier of your list" help="Please see example of IDs in help section" > | 144 <param name="idtypein" type="select" label="Select type/source of identifier of your list" optional="false" > |
105 <option value="UniProt.AC" selected="True" >Uniprot accession number (e.g. P31946)</option> | 145 <option value="UniProt-AC" selected="True" >UniProt accession number (e.g. P31946)</option> |
106 <option value="UniProt.ID" >Uniprot ID (e.g 1433B_HUMAN)</option> | 146 <option value="UniProt-ID" >UniProt ID (e.g 1433B_HUMAN)</option> |
107 <option value="GeneID" >Entrez gene ID (e.g. 7529)</option> | 147 <option value="GeneID" >Entrez gene ID (e.g. 7529)</option> |
108 <option value="RefSeq" >RefSeq (NCBI) protein (e.g. NP_003395.1)</option> | 148 <option value="RefSeq" >RefSeq (NCBI) protein (e.g. NP_003395.1)</option> |
109 <option value="GI" >GI (NCBI GI number) ID assigned to each sequence record processed by NCBI (e.g. 21328448)</option> | 149 <option value="GI" >GI (NCBI GI number) (e.g. 21328448)</option> |
110 <option value="PDB" >Protein DataBank ID (e.g. 2BR9:A)</option> | 150 <option value="PDB" >Protein DataBank ID (e.g. 2BR9:A)</option> |
111 <option value="GO" >GOterms (Gene Ontology) ID (e.g. GO:0070062)</option> | 151 <option value="GO" >GOterms (Gene Ontology) ID (e.g. GO:0070062)</option> |
112 <option value="PIR" >Protein Information Resource ID (e.g. S34755)</option> | 152 <option value="PIR" >Protein Information Resource ID (e.g. S34755)</option> |
113 <option value="MIM" >OMIM (Online Mendelian Inheritance in Man database) ID (e.g: 601289)</option> | 153 <option value="MIM" >OMIM (Online Mendelian Inheritance in Man database) ID (e.g: 601289)</option> |
114 <option value="UniGene" >Unigene ID (e.g. Hs.643544)</option> | 154 <option value="UniGene" >Unigene ID (e.g. Hs.643544)</option> |
115 <option value="Ensembl_Gene" >Ensembl gene ID (e.g. ENSG00000166913)</option> | 155 <option value="Ensembl_Gene" >Ensembl gene ID (e.g. ENSG00000166913)</option> |
116 <option value="Ensembl_Transcript" >Ensembl transcript ID (e.g. ENST00000353703)</option> | 156 <option value="Ensembl_Transcript" >Ensembl transcript ID (e.g. ENST00000353703)</option> |
117 <option value="Ensembl_Protein" >Ensembl protein ID (e.g. ENSP00000300161)</option> | 157 <option value="Ensembl_Protein" >Ensembl protein ID (e.g. ENSP00000300161)</option> |
118 <option value="BioGrid" >BioGrid (e.g. 113361)</option> | 158 <option value="BioGrid" >BioGrid (e.g. 113361)</option> |
119 <option value="STRING" >STRING (e.g. 9606.ENSP00000300161)</option> | 159 <option value="STRING" >STRING (e.g. 9606.ENSP00000300161)</option> |
120 <option value="KEGG" >KEGG (e.g. hsa:7529)</option> | 160 <option value="KEGG" >KEGG gene id (e.g. hsa:7529)</option> |
121 </param> | 161 </param> |
122 <section name="idto" title="Target type of IDs" expanded="True" > | 162 <section name="idto" title="Target type of IDs" expanded="True" > |
123 <param name="idtypeout" type="select" label="Target type of IDs you would like to map to" display="checkboxes" multiple="True" help="Please see example of IDs in help section" > | 163 <param name="idtypeout" type="select" label="Target type of IDs you would like to map to" display="checkboxes" multiple="True" optional="false" > |
124 <option value="UniProt.AC" >Uniprot accession number (e.g. P31946)</option> | 164 <option value="UniProt-AC" >UniProt accession number (e.g. P31946)</option> |
125 <option value="UniProt.ID" >Uniprot ID (e.g 1433B_HUMAN)</option> | 165 <option value="UniProt-ID" >UniProt ID (e.g 1433B_HUMAN)</option> |
126 <option value="GeneID" >Entrez gene ID (e.g. 7529)</option> | 166 <option value="GeneID" >Entrez gene ID (e.g. 7529)</option> |
127 <option value="RefSeq" >RefSeq (NCBI) protein (e.g. NP_003395.1)</option> | 167 <option value="RefSeq" >RefSeq (NCBI) protein (e.g. NP_003395.1)</option> |
128 <option value="GI" >GI (NCBI GI number) ID assigned to each sequence record processed by NCBI (e.g. 21328448)</option> | 168 <option value="GI" >GI (NCBI GI number) (e.g. 21328448)</option> |
129 <option value="PDB" >Protein DataBank ID (e.g. 2BR9:A)</option> | 169 <option value="PDB" >Protein DataBank ID (e.g. 2BR9:A)</option> |
130 <option value="GO" >GOterms (Gene Ontology) ID (e.g. GO:0070062)</option> | 170 <option value="GO" >GOterms (Gene Ontology) ID (e.g. GO:0070062)</option> |
131 <option value="PIR" >Protein Information Resource ID (e.g. S34755)</option> | 171 <option value="PIR" >Protein Information Resource ID (e.g. S34755)</option> |
132 <option value="MIM" >OMIM (Online Mendelian Inheritance in Man database) ID (e.g: 601289)</option> | |
133 <option value="UniGene" >Unigene ID (e.g. Hs.643544)</option> | 172 <option value="UniGene" >Unigene ID (e.g. Hs.643544)</option> |
134 <option value="Ensembl_Gene" >Ensembl gene ID (e.g. ENSG00000166913)</option> | 173 <option value="Ensembl_Gene" >Ensembl gene ID (e.g. ENSG00000166913)</option> |
135 <option value="Ensembl_Transcript" >Ensembl transcript ID (e.g. ENST00000353703)</option> | 174 <option value="Ensembl_Transcript" >Ensembl transcript ID (e.g. ENST00000353703)</option> |
136 <option value="Ensembl_Protein" >Ensembl protein ID (e.g. ENSP00000300161)</option> | 175 <option value="Ensembl_Protein" >Ensembl protein ID (e.g. ENSP00000300161)</option> |
137 <option value="BioGrid" >BioGrid (e.g. 113361)</option> | 176 <option value="BioGrid" >BioGrid (e.g. 113361)</option> |
138 <option value="STRING" >STRING (e.g. 9606.ENSP00000300161)</option> | 177 <option value="STRING" >STRING (e.g. 9606.ENSP00000300161)</option> |
139 <option value="KEGG" >KEGG (e.g. hsa:7529)</option> | 178 <option value="KEGG" >KEGG gene id (e.g. hsa:7529)</option> |
140 </param> | 179 </param> |
141 </section> | 180 </section> |
142 </when> | 181 </when> |
143 </conditional> | 182 </conditional> |
144 </inputs> | 183 </inputs> |
145 <outputs> | 184 <outputs> |
146 <data name="output" format="tabular" /> | 185 <data name="output" format="tsv" /> |
147 </outputs> | 186 </outputs> |
148 <tests> | 187 <tests> |
149 <test> | 188 <test> |
150 <conditional name="input" > | 189 <conditional name="input" > |
151 <param name="ids" value="file"/> | 190 <param name="ids" value="file"/> |
153 <param name="header" value="true" /> | 192 <param name="header" value="true" /> |
154 <param name="ncol" value="c1"/> | 193 <param name="ncol" value="c1"/> |
155 </conditional> | 194 </conditional> |
156 <conditional name="species"> | 195 <conditional name="species"> |
157 <param name="mapping_file" value="human_id_mapping"/> | 196 <param name="mapping_file" value="human_id_mapping"/> |
158 <param name="idtypein" value="UniProt.AC"/> | 197 <param name="idtypein" value="UniProt-AC"/> |
159 <section name="idto"> | 198 <section name="idto"> |
160 <param name="idtypeout" value="neXtProt,UniProt.ID,GeneID,MIM,Ensembl" /> | 199 <param name="idtypeout" value="neXtProt,UniProt-ID,GeneID,MIM,Ensembl" /> |
161 </section> | 200 </section> |
162 </conditional> | 201 </conditional> |
163 <output name="output" value="ID_Converted_FKW_Lacombe_et_al_2017_OK.txt" /> | 202 <output name="output" value="ID_Converted_FKW_Lacombe_et_al_2017_OK.txt" /> |
164 </test> | 203 </test> |
165 </tests> | 204 </tests> |
166 <help><![CDATA[ | 205 <help><![CDATA[ |
167 This tool converts a list of IDs to another identifier type, select the source and target type from the dropdown menus above (see below supported source and target types). | 206 **Description** |
168 | 207 This tool converts a list of identifiers (IDs) into another type of ID. Currently the conversion of IDs applies to the following three species: Human (homo sapiens, Mouse (Mus musculus), Rat (Rattus norvegicus). |
169 After choosing the type of input IDs, you can choose one or more types of IDs you would like to map to. | 208 Supported source and target type of IDs are listed below. After choosing the type of your input IDs, you can select one or more types of ID you may need. |
170 | 209 |
171 If your input is a list of IDs or a single-column file, the tool will return a file containing the mapped IDs. Please, note that a "NA" is returned when there is no corresponding ID. | 210 ----- |
172 | 211 |
212 **Input** | |
213 | |
214 A list of IDs (entered in a copy/paste mode) or a single-column file, the tool will then return a file containing the mapped IDs. | |
173 If your input is a multiple-column file, the mapped IDs column(s) will be added at the end of the input file. | 215 If your input is a multiple-column file, the mapped IDs column(s) will be added at the end of the input file. |
174 | 216 |
175 **Available databases** | 217 .. class:: warningmark |
218 | |
219 Accession numbers with an hyphen ("-") that normally correspond to isoform are considered as similar to its canonical form. | |
220 For example, "Q71U36-2" will be treated as "Q71U36". | |
221 | |
222 ----- | |
223 | |
224 **Parameters** | |
225 Target type of IDs currently supported: | |
176 | 226 |
177 * neXtProt ID (e.g. NX_P31946) | 227 * neXtProt ID (e.g. NX_P31946) |
178 | 228 |
179 * Uniprot accession number (e.g. P31946) | 229 * UniProt accession number (e.g. P31946) |
180 | 230 |
181 * Uniprot ID (e.g 1433B_HUMAN) | 231 * UniProt ID (e.g 1433B_HUMAN) |
182 | 232 |
183 * Entrez gene ID (e.g. 7529) | 233 * Entrez gene ID (e.g. 7529) |
184 | 234 |
185 * RefSeq (NCBI) protein (e.g. NP_003395.1) | 235 * RefSeq protein (NCBI) (e.g. NP_003395.1) |
186 | 236 |
187 * GI (NCBI GI number) ID assigned to each sequence record processed by NCBI (e.g. 21328448) | 237 * GI (NCBI GI number) (e.g. 21328448) |
188 | 238 |
189 * Protein DataBank ID (e.g. 2BR9:A) | 239 * Protein DataBank ID (e.g. 2BR9:A) |
190 | 240 |
191 * GOterms (Gene Ontology) ID (e.g. GO:0070062) | 241 * GOterms (Gene Ontology) ID (e.g. GO:0070062) |
192 | 242 |
200 | 250 |
201 * Ensembl transcript ID (e.g. ENST00000353703) | 251 * Ensembl transcript ID (e.g. ENST00000353703) |
202 | 252 |
203 * Ensembl protein ID (e.g. ENSP00000300161) | 253 * Ensembl protein ID (e.g. ENSP00000300161) |
204 | 254 |
255 * BioGrid (e.g. 113361) | |
256 | |
257 * STRING (e.g. 9606.ENSP00000300161) | |
258 | |
259 * KEGG gene id (e.g. hsa:7529) | |
260 | |
261 .. class:: warningmark | |
262 | |
263 Nextprot and OMIM only applicable to Human species. | |
264 | |
265 ----- | |
266 | |
267 **Output** | |
268 | |
269 A text file containing the selected type of IDs (in addition to the original column(s) provided) | |
270 Please, note that a "NA" is returned when there is no match between a source ID and the corresponding target ID. | |
271 | |
272 ----- | |
273 | |
274 **Data sources (release date)** | |
275 | |
276 This tool converts human IDs using the following source files: | |
277 | |
278 - **HUMAN_9606_idmapping_selected.tab (Uniprot 23/10/2018)**: ftp://ftp.uniprot.org/pub/databases/uniprot/current_release/knowledgebase/idmapping/by_organism/ | |
279 - **HUMAN_9606_idmapping.dat (Uniprot 23/10/18)**: ftp://ftp.uniprot.org/pub/databases/uniprot/current_release/knowledgebase/idmapping/by_organism/ | |
280 - **nextprot_ac_list_all.txt (Nextprot released on 10/10/2018)**: ftp://ftp.nextprot.org/pub/current_release/ac_lists/ | |
281 - **MOUSE_10090_idmapping_selected.tab (Uniprot 23/10/2018)**: ftp://ftp.uniprot.org/pub/databases/uniprot/current_release/knowledgebase/idmapping/by_organism/ | |
282 - **MOUSE_10090_idmapping.dat (Uniprot 23/10/18)**: ftp://ftp.uniprot.org/pub/databases/uniprot/current_release/knowledgebase/idmapping/by_organism/ | |
283 - **RAT_10116_idmapping.dat (Uniprot 23/10/18)**: ftp://ftp.uniprot.org/pub/databases/uniprot/current_release/knowledgebase/idmapping/by_organism/ | |
284 - **RAT_10116_idmapping_selected.tab (Uniprot 23/10/18)**: ftp://ftp.uniprot.org/pub/databases/uniprot/current_release/knowledgebase/idmapping/by_organism/ | |
285 | |
205 ----- | 286 ----- |
206 | 287 |
207 .. class:: infomark | 288 .. class:: infomark |
208 | 289 |
209 This tool converts human IDs using the following source files: | |
210 | |
211 * HUMAN_9606_idmapping_selected.tab (Uniprot 02/07/2018) | |
212 Tarball downloaded from ftp://ftp.uniprot.org/pub/databases/uniprot/current_release/knowledgebase/idmapping/by_organism/ | |
213 | |
214 * HUMAN_9606_idmapping.dat (Uniprot 02/07/18) | |
215 Tarball downloaded from ftp://ftp.uniprot.org/pub/databases/uniprot/current_release/knowledgebase/idmapping/by_organism/ | |
216 | |
217 * nextprot_ac_list_all.txt (Nextprot released on 17/01/2018) | |
218 Downloaded from ftp://ftp.nextprot.org/pub/current_release/ac_lists/ | |
219 | |
220 ----- | |
221 | |
222 .. class:: warningmark | |
223 | |
224 Accession numbers with an hyphen ("-") that normally correspond to isoform are considered | |
225 (and will therefore be treated) as similar to its canonical form. | |
226 | |
227 For example, "Q71U36-2" will be treated as "Q71U36". | |
228 | |
229 ----- | |
230 | |
231 .. class:: infomark | |
232 | |
233 **Authors** | 290 **Authors** |
234 | 291 |
235 T.P. Lien Nguyen, David Christiany, Florence Combes, Yves Vandenbrouck CEA, INSERM, CNRS, Grenoble-Alpes University, BIG Institute, FR | 292 David Christiany, T.P. Lien Nguyen, Florence Combes, Yves Vandenbrouck CEA, INSERM, CNRS, Grenoble-Alpes University, BIG Institute, FR |
236 | 293 |
237 Sandra Dérozier, Olivier Rué, Christophe Caron, Valentin Loux INRA, Paris-Saclay University, MAIAGE Unit, Migale Bioinformatics platform | 294 Sandra Dérozier, Olivier Rué, Christophe Caron, Valentin Loux INRA, Paris-Saclay University, MAIAGE Unit, Migale Bioinformatics platform, FR |
238 | 295 |
239 This work has been partially funded through the French National Agency for Research (ANR) IFB project. | 296 This work has been partially funded through the French National Agency for Research (ANR) IFB project. |
240 | 297 |
241 Contact support@proteore.org for any questions or concerns about the Galaxy implementation of this tool. | 298 Contact support@proteore.org for any questions or concerns about the Galaxy implementation of this tool. |
242 | 299 |