Previous changeset 6:054483e27a35 (2018-09-16) Next changeset 8:af5eccf83605 (2022-11-21) |
Commit message:
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/uniprot_rest_interface commit ddbed5f0b0879b4a001d2da6a521b0c9a39c1e7b" |
modified:
macros.xml test-data/id_uniprot.tab test-data/test1_map.tab test-data/test1_retrieve.fasta test-data/test2_map.tab test-data/test2_retrieve.gff uniprot.py uniprot.xml |
added:
test-data/test.tab |
b |
diff -r 054483e27a35 -r bfdc6a7ffd3a macros.xml --- a/macros.xml Sun Sep 16 13:41:08 2018 -0400 +++ b/macros.xml Thu Apr 22 17:32:16 2021 +0000 |
b |
@@ -46,7 +46,6 @@ <option value="ACC+ID">UniProtKB AC/ID</option> <option value="ACC">UniProtKB AC</option> <option value="ID">UniProtKB ID</option> - <option value="ACC">UniProtKB AC</option> <option value="UPARC">UniParc</option> <option value="NF50">UniRef50</option> <option value="NF90">UniRef90</option> @@ -59,7 +58,6 @@ help=""> <option value="ACC">UniProtKB AC</option> <option value="ID">UniProtKB ID</option> - <option value="ACC">UniProtKB AC</option> <option value="UPARC">UniParc</option> <option value="NF50">UniRef50</option> <option value="NF90">UniRef90</option> |
b |
diff -r 054483e27a35 -r bfdc6a7ffd3a test-data/id_uniprot.tab --- a/test-data/id_uniprot.tab Sun Sep 16 13:41:08 2018 -0400 +++ b/test-data/id_uniprot.tab Thu Apr 22 17:32:16 2021 +0000 |
b |
@@ -7,3 +7,4 @@ A0A077Z587 Q13685 O14639 +WRONGIDWHICHDOESNOTEXIST \ No newline at end of file |
b |
diff -r 054483e27a35 -r bfdc6a7ffd3a test-data/test.tab --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/test.tab Thu Apr 22 17:32:16 2021 +0000 |
b |
b'@@ -0,0 +1,2554 @@\n+Uniref_ID\tUniprot_ID\n+UniRef50_A0A009DJS4\tA0A009DJS4\n+UniRef50_A0A009EPD3\tA0A009EPD3\n+UniRef50_A0A010ZLH4\tA0A010ZLH4\n+UniRef50_A0A011A340\tA0A011A340\n+UniRef50_A0A011A588\tA0A011A588\n+UniRef50_A0A015P981\tA0A015P981\n+UniRef50_A0A015PAW5\tA0A015PAW5\n+UniRef50_A0A015PBQ8\tA0A015PBQ8\n+UniRef50_A0A015Q9A2\tA0A015Q9A2\n+UniRef50_A0A015TE87\tA0A015TE87\n+UniRef50_A0A016A5N0\tA0A016A5N0\n+UniRef50_A0A016KJM6\tA0A016KJM6\n+UniRef50_A0A016LGZ5\tA0A016LGZ5\n+UniRef50_A0A016LHE0\tA0A016LHE0\n+UniRef50_A0A017I4T8\tA0A017I4T8\n+UniRef50_A0A017IYW6\tA0A017IYW6\n+UniRef50_A0A017LCS6\tA0A017LCS6\n+UniRef50_A0A017M644\tA0A017M644\n+UniRef50_A0A017MMC4\tA0A017MMC4\n+UniRef50_A0A018RUS5\tA0A018RUS5\n+UniRef50_A0A018WYQ2\tA0A018WYQ2\n+UniRef50_A0A018Y1M8\tA0A018Y1M8\n+UniRef50_A0A018Z6E5\tA0A018Z6E5\n+UniRef50_A0A022HIF5\tA0A022HIF5\n+UniRef50_A0A022KGA3\tA0A022KGA3\n+UniRef50_A0A023BKX3\tA0A023BKX3\n+UniRef50_A0A023K2K8\tA0A023K2K8\n+UniRef50_A0A023K3H2\tA0A023K3H2\n+UniRef50_A0A023K7A9\tA0A023K7A9\n+UniRef50_A0A023K7S3\tA0A023K7S3\n+UniRef50_A0A023KE77\tA0A023KE77\n+UniRef50_A0A023KET7\tA0A023KET7\n+UniRef50_A0A023KEX3\tA0A023KEX3\n+UniRef50_A0A023KEX8\tA0A023KEX8\n+UniRef50_A0A023KLN1\tA0A023KLN1\n+UniRef50_A0A023KN88\tA0A023KN88\n+UniRef50_A0A023KNT6\tA0A023KNT6\n+UniRef50_A0A023KPW6\tA0A023KPW6\n+UniRef50_A0A023KQS7\tA0A023KQS7\n+UniRef50_A0A023KT22\tA0A023KT22\n+UniRef50_A0A023KU88\tA0A023KU88\n+UniRef50_A0A023KUE4\tA0A023KUE4\n+UniRef50_A0A023KWU4\tA0A023KWU4\n+UniRef50_A0A023KXV3\tA0A023KXV3\n+UniRef50_A0A023KYQ0\tA0A023KYQ0\n+UniRef50_A0A023KYY3\tA0A023KYY3\n+UniRef50_A0A023L0G2\tA0A023L0G2\n+UniRef50_A0A023L4E6\tA0A023L4E6\n+UniRef50_A0A023L5T1\tA0A023L5T1\n+UniRef50_A0A023L5T5\tA0A023L5T5\n+UniRef50_A0A023L5T6\tA0A023L5T6\n+UniRef50_A0A023LAK9\tA0A023LAK9\n+UniRef50_A0A023LC15\tA0A023LC15\n+UniRef50_A0A023LCW0\tA0A023LCW0\n+UniRef50_A0A023LDQ6\tA0A023LDQ6\n+UniRef50_A0A023LE00\tA0A023LE00\n+UniRef50_A0A023LEL1\tA0A023LEL1\n+UniRef50_A0A023LFU4\tA0A023LFU4\n+UniRef50_A0A023LFZ4\tA0A023LFZ4\n+UniRef50_A0A023LG84\tA0A023LG84\n+UniRef50_A0A023LGN2\tA0A023LGN2\n+UniRef50_A0A023LKA4\tA0A023LKA4\n+UniRef50_A0A023WHY5\tA0A023WHY5\n+UniRef50_A0A023Y025\tA0A023Y025\n+UniRef50_A0A023YCU8\tA0A023YCU8\n+UniRef50_A0A023YDI7\tA0A023YDI7\n+UniRef50_A0A023YGB7\tA0A023YGB7\n+UniRef50_A0A023YH78\tA0A023YH78\n+UniRef50_A0A023YIZ9\tA0A023YIZ9\n+UniRef50_A0A023YJW6\tA0A023YJW6\n+UniRef50_A0A023YK14\tA0A023YK14\n+UniRef50_A0A023YKD7\tA0A023YKD7\n+UniRef50_A0A023YKI9\tA0A023YKI9\n+UniRef50_A0A023YKS2\tA0A023YKS2\n+UniRef50_A0A023YLG4\tA0A023YLG4\n+UniRef50_A0A023YMZ2\tA0A023YMZ2\n+UniRef50_A0A023YN72\tA0A023YN72\n+UniRef50_A0A023YP31\tA0A023YP31\n+UniRef50_A0A023YQS4\tA0A023YQS4\n+UniRef50_A0A023YSE6\tA0A023YSE6\n+UniRef50_A0A023YVZ5\tA0A023YVZ5\n+UniRef50_A0A023YXD9\tA0A023YXD9\n+UniRef50_A0A023YY37\tA0A023YY37\n+UniRef50_A0A023YYP5\tA0A023YYP5\n+UniRef50_A0A023Z1J3\tA0A023Z1J3\n+UniRef50_A0A023Z249\tA0A023Z249\n+UniRef50_A0A023Z561\tA0A023Z561\n+UniRef50_A0A023Z6S6\tA0A023Z6S6\n+UniRef50_A0A024KZS2\tA0A024KZS2\n+UniRef50_A0A024L1D8\tA0A024L1D8\n+UniRef50_A0A024L3K6\tA0A024L3K6\n+UniRef50_A0A024L3Z4\tA0A024L3Z4\n+UniRef50_A0A024L4B0\tA0A024L4B0\n+UniRef50_A0A024L5T0\tA0A024L5T0\n+UniRef50_A0A024L6L4\tA0A024L6L4\n+UniRef50_A0A024L767\tA0A024L767\n+UniRef50_A0A024L7A3\tA0A024L7A3\n+UniRef50_A0A024L7Z6\tA0A024L7Z6\n+UniRef50_A0A024L874\tA0A024L874\n+UniRef50_A0A024LAF1\tA0A024LAF1\n+UniRef50_A0A024LAN1\tA0A024LAN1\n+UniRef50_A0A024LAU7\tA0A024LAU7\n+UniRef50_A0A024LBI2\tA0A024LBI2\n+UniRef50_A0A024LBQ1\tA0A024LBQ1\n+UniRef50_A0A024LC63\tA0A024LC63\n+UniRef50_A0A024LCB9\tA0A024LCB9\n+UniRef50_A0A024LKC0\tA0A024LKC0\n+UniRef50_A0A025BQD1\tA0A025BQD1\n+UniRef50_A0A025DCK3\tA0A025DCK3\n+UniRef50_A0A025E569\tA0A025E569\n+UniRef50_A0A025GLL8\tA0A025GLL8\n+UniRef50_A0A025SEL1\tA0A025SEL1\n+UniRef50_A0A025XI46\tA0A025XI46\n+UniRef50_A0A025XRP5\tA0A025XRP5\n+UniRef50_A0A025ZG79\tA0A025ZG79\n+UniRef50_A0A026FAT8\tA0A026FAT8\n+UniRef50_A0A026FX19\tA0A026FX19\n+UniRef50_A0A026RF42\tA0A026RF42\n+UniRef50_A0A026S5H6\tA0A026S5H6\n+UniRef50_A0A026TYJ6\tA0A026TYJ6\n+UniRef50_A0A026XYW8\tA0A026XYW8\n+UniRef50_A0A027G7Z7\tA0A027G7Z7\n+UniRef50_A0A027IZ46\tA0A027IZ46\n+UniRef50_A0A027RVP4\tA'..b'_W6FCT0\tW6FCT0\n+UniRef50_W6FDL4\tW6FDL4\n+UniRef50_W6FF32\tW6FF32\n+UniRef50_W6FHU2\tW6FHU2\n+UniRef50_W6P1M0\tW6P1M0\n+UniRef50_W6PQ03\tW6PQ03\n+UniRef50_W6RZA0\tW6RZA0\n+UniRef50_W6S4M9\tW6S4M9\n+UniRef50_W6S650\tW6S650\n+UniRef50_W6W5E1\tW6W5E1\n+UniRef50_W7NJD0\tW7NJD0\n+UniRef50_W8KLI9\tW8KLI9\n+UniRef50_W8SSM4\tW8SSM4\n+UniRef50_W8STB2\tW8STB2\n+UniRef50_W8SUL3\tW8SUL3\n+UniRef50_W8SW86\tW8SW86\n+UniRef50_W8SXN8\tW8SXN8\n+UniRef50_W8SXX6\tW8SXX6\n+UniRef50_W8SY51\tW8SY51\n+UniRef50_W8SYA0\tW8SYA0\n+UniRef50_W8SZC5\tW8SZC5\n+UniRef50_W8SZQ6\tW8SZQ6\n+UniRef50_W8T0J0\tW8T0J0\n+UniRef50_W8T0Q2\tW8T0Q2\n+UniRef50_W8T0R4\tW8T0R4\n+UniRef50_W8T104\tW8T104\n+UniRef50_W8T289\tW8T289\n+UniRef50_W8T2D1\tW8T2D1\n+UniRef50_W8T306\tW8T306\n+UniRef50_W8T335\tW8T335\n+UniRef50_W8T3J5\tW8T3J5\n+UniRef50_W8T426\tW8T426\n+UniRef50_W8T4A8\tW8T4A8\n+UniRef50_W8T550\tW8T550\n+UniRef50_W8T6Y6\tW8T6Y6\n+UniRef50_W8T781\tW8T781\n+UniRef50_W8T8I2\tW8T8I2\n+UniRef50_W8T8M9\tW8T8M9\n+UniRef50_W8T948\tW8T948\n+UniRef50_W8T950\tW8T950\n+UniRef50_W8T9K1\tW8T9K1\n+UniRef50_W8TAD5\tW8TAD5\n+UniRef50_W8TB18\tW8TB18\n+UniRef50_W8TC27\tW8TC27\n+UniRef50_W8TCM7\tW8TCM7\n+UniRef50_W8TF04\tW8TF04\n+UniRef50_W8TFZ0\tW8TFZ0\n+UniRef50_W8TGP5\tW8TGP5\n+UniRef50_W8TIX1\tW8TIX1\n+UniRef50_W8TQE0\tW8TQE0\n+UniRef50_W8TS58\tW8TS58\n+UniRef50_W8TSS1\tW8TSS1\n+UniRef50_W8TT27\tW8TT27\n+UniRef50_W8TUT7\tW8TUT7\n+UniRef50_W8TVH9\tW8TVH9\n+UniRef50_W8TVZ3\tW8TVZ3\n+UniRef50_W8TWM7\tW8TWM7\n+UniRef50_W8TXR8\tW8TXR8\n+UniRef50_W8TXZ4\tW8TXZ4\n+UniRef50_W8TZQ2\tW8TZQ2\n+UniRef50_W8U063\tW8U063\n+UniRef50_W8U1K9\tW8U1K9\n+UniRef50_W8U2M8\tW8U2M8\n+UniRef50_W8U2W4\tW8U2W4\n+UniRef50_W8UYM6\tW8UYM6\n+UniRef50_W8V6D6\tW8V6D6\n+UniRef50_W8V6S8\tW8V6S8\n+UniRef50_W8V764\tW8V764\n+UniRef50_W8XGI2\tW8XGI2\n+UniRef50_W8ZPQ9\tW8ZPQ9\n+UniRef50_W9A0W7\tW9A0W7\n+UniRef50_W9B0K7\tW9B0K7\n+UniRef50_W9B8I4\tW9B8I4\n+UniRef50_W9BBP6\tW9BBP6\n+UniRef50_W9BHI2\tW9BHI2\n+UniRef50_W9T9W7\tW9T9W7\n+UniRef50_W9UR67\tW9UR67\n+UniRef50_W9V347\tW9V347\n+UniRef50_X0R4J1\tX0R4J1\n+UniRef50_X0Z7Y9\tX0Z7Y9\n+UniRef50_X1G4F7\tX1G4F7\n+UniRef50_X1WW26\tX1WW26\n+UniRef50_X1XJA7\tX1XJA7\n+UniRef50_X1XK55\tX1XK55\n+UniRef50_X2LIK1\tX2LIK1\n+UniRef50_X2LK66\tX2LK66\n+UniRef50_X2LKW6\tX2LKW6\n+UniRef50_X2LR89\tX2LR89\n+UniRef50_X2LRE4\tX2LRE4\n+UniRef50_X2LS39\tX2LS39\n+UniRef50_X2LSX3\tX2LSX3\n+UniRef50_X2LU18\tX2LU18\n+UniRef50_X2LWW8\tX2LWW8\n+UniRef50_X2M0B0\tX2M0B0\n+UniRef50_X2M1Y3\tX2M1Y3\n+UniRef50_X2M254\tX2M254\n+UniRef50_X2M2B8\tX2M2B8\n+UniRef50_X2M2P8\tX2M2P8\n+UniRef50_X2MAR9\tX2MAR9\n+UniRef50_X2MBX8\tX2MBX8\n+UniRef50_X2MGB2\tX2MGB2\n+UniRef50_X2MHY7\tX2MHY7\n+UniRef50_X2MLT5\tX2MLT5\n+UniRef50_X2MMA8\tX2MMA8\n+UniRef50_X2MNB6\tX2MNB6\n+UniRef50_X2MQH7\tX2MQH7\n+UniRef50_X2MTF4\tX2MTF4\n+UniRef50_X2MTV9\tX2MTV9\n+UniRef50_X2MU03\tX2MU03\n+UniRef50_X2MU68\tX2MU68\n+UniRef50_X2MV43\tX2MV43\n+UniRef50_X2MVD0\tX2MVD0\n+UniRef50_X2MX97\tX2MX97\n+UniRef50_X2MZD5\tX2MZD5\n+UniRef50_X2N154\tX2N154\n+UniRef50_X2N1A9\tX2N1A9\n+UniRef50_X2N2G9\tX2N2G9\n+UniRef50_X2N374\tX2N374\n+UniRef50_X2N3P8\tX2N3P8\n+UniRef50_X2N485\tX2N485\n+UniRef50_X2N4K3\tX2N4K3\n+UniRef50_X2N4S2\tX2N4S2\n+UniRef50_X2N530\tX2N530\n+UniRef50_X2N7H7\tX2N7H7\n+UniRef50_X2N7K7\tX2N7K7\n+UniRef50_X2NAE3\tX2NAE3\n+UniRef50_X2NAF9\tX2NAF9\n+UniRef50_X2NAM5\tX2NAM5\n+UniRef50_X2NCR6\tX2NCR6\n+UniRef50_X2NDM5\tX2NDM5\n+UniRef50_X2NG16\tX2NG16\n+UniRef50_X2P110\tX2P110\n+UniRef50_X3E1V8\tX3E1V8\n+UniRef50_X3EEJ0\tX3EEJ0\n+UniRef50_X3EGM7\tX3EGM7\n+UniRef50_X3EKE6\tX3EKE6\n+UniRef50_X3ELX1\tX3ELX1\n+UniRef50_X3EN79\tX3EN79\n+UniRef50_X3ERM3\tX3ERM3\n+UniRef50_X3EY15\tX3EY15\n+UniRef50_X3EYH3\tX3EYH3\n+UniRef50_X3EZZ6\tX3EZZ6\n+UniRef50_X3JE73\tX3JE73\n+UniRef50_X3W1J0\tX3W1J0\n+UniRef50_X3W353\tX3W353\n+UniRef50_X3WS87\tX3WS87\n+UniRef50_X3XQD3\tX3XQD3\n+UniRef50_X3YW87\tX3YW87\n+UniRef50_X4FRC6\tX4FRC6\n+UniRef50_X4RGC4\tX4RGC4\n+UniRef50_X4WXD8\tX4WXD8\n+UniRef50_X4X4C7\tX4X4C7\n+UniRef50_X4XFI8\tX4XFI8\n+UniRef50_X4XHM9\tX4XHM9\n+UniRef50_X4ZJB4\tX4ZJB4\n+UniRef50_X4ZSZ9\tX4ZSZ9\n+UniRef50_X5AT19\tX5AT19\n+UniRef50_X5DW04\tX5DW04\n+UniRef50_X5G1M7\tX5G1M7\n+UniRef50_X5K4I4\tX5K4I4\n+UniRef50_X7LA43\tX7LA43\n+UniRef50_X7QK55\tX7QK55\n+UniRef50_X8K474\tX8K474\n+UniRef50_X8L2K3\tX8L2K3\n+UniRef50_Y1IXG9\tY1IXG9\n+UniRef50_Y1MEW7\tY1MEW7\n+UniRef50_Z2DBM9\tZ2DBM9\n' |
b |
diff -r 054483e27a35 -r bfdc6a7ffd3a test-data/test1_map.tab --- a/test-data/test1_map.tab Sun Sep 16 13:41:08 2018 -0400 +++ b/test-data/test1_map.tab Thu Apr 22 17:32:16 2021 +0000 |
b |
@@ -1,10 +1,10 @@ From To -Q0P8A9 fdhC +A0A077Z587 TTRE_0000309301 +A0A077ZFY8 TTRE_0000758701 A0A077ZHN8 TTRE_0000819801 -A0A077ZFY8 TTRE_0000758701 M5B8V9 CMN_01519 M5BAG7 cydC +O14639 ABLIM1 +Q0P8A9 fdhC +Q13685 AAMP S0DS17 apf8 -A0A077Z587 TTRE_0000309301 -Q13685 AAMP -O14639 ABLIM1 |
b |
diff -r 054483e27a35 -r bfdc6a7ffd3a test-data/test1_retrieve.fasta --- a/test-data/test1_retrieve.fasta Sun Sep 16 13:41:08 2018 -0400 +++ b/test-data/test1_retrieve.fasta Thu Apr 22 17:32:16 2021 +0000 |
b |
@@ -1,3 +1,23 @@ +>sp|Q13685|AAMP_HUMAN Angio-associated migratory cell protein OS=Homo sapiens OX=9606 GN=AAMP PE=1 SV=2 +MESESESGAAADTPPLETLSFHGDEEIIEVVELDPGPPDPDDLAQEMEDVDFEEEEEEEG +NEEGWVLEPQEGVVGSMEGPDDSEVTFALHSASVFCVSLDPKTNTLAVTGGEDDKAFVWR +LSDGELLFECAGHKDSVTCAGFSHDSTLVATGDMSGLLKVWQVDTKEEVWSFEAGDLEWM +EWHPRAPVLLAGTADGNTWMWKVPNGDCKTFQGPNCPATCGRVLPDGKRAVVGYEDGTIR +IWDLKQGSPIHVLKGTEGHQGPLTCVAANQDGSLILTGSVDCQAKLVSATTGKVVGVFRP +ETVASQPSLGEGEESESNSVESLGFCSVMPLAAVGYLDGTLAIYDLATQTLRHQCQHQSG +IVQLLWEAGTAVVYTCSLDGIVRLWDARTGRLLTDYRGHTAEILDFALSKDASLVVTTSG +DHKAKVFCVQRPDR +>tr|M5B8V9|M5B8V9_9MICO ABC transporter involved in the biosynthesis of cytochrom bd, fused permease/ATP-binding protein OS=Clavibacter michiganensis subsp. nebraskensis NCPPB 2581 OX=1097677 GN=CMN_01519 PE=4 SV=1 +MKPLDPRLLRHSASARTMLAVGAVVSVVQTAALVAFCWSLTQLVVRAIGGADQAALAPVL +ALAVGSAVVRGAAAWLLDVTGARGAARVTAELRRRALRAIADLGPAWTAARSRGRLATIV +GPGLDALDPYFARYVPQLILTALATPIVVAVLLLSDPLTGVTVLVTLPVIPVFMVLVGWA +TQEVQRRQWSRLTELASSFLEVVDGLSTLLVFRRARRQTARIRRVTEEYRVETMRVLRIS +FLSGFVLELAASLSVALVAVSVGVRLIGGQLDLEVGLFVLLLAPEAFLPIRQVGVQFHAA +AEGVAAADDVLGILEEERAARATRPVPGPATATPPAGDALVIRDLAVARGDRAVLSGVSA +RFPRGRVTAVTGPSGVGKSSLLGAMLGHLPAGGAAGWIDDDASSLRPPVPTEIAWAGQRP +GLVAGTVRENVALGVADPDDALVRRALALAAADGIDPDLVLGVGGQGLSGGQAQRVAVAR +AVHRALALDCPLVLLDEPSSALDAATEERLAAGIRALADQGRAVVVVTHRGALVRAADAE +LRLGGASGEDDAPAAVGSSVGAGRVAPARIAPEPAWRAQVAP >sp|S0DS17|APF8_GIBF5 Cytochrome P450 monooxygenase apf8 OS=Gibberella fujikuroi (strain CBS 195.34 / IMI 58289 / NRRL A-6831) OX=1279085 GN=apf8 PE=1 SV=1 MSYQSILLRQVNSLCDNLEEVARDENGGLIDMAMQSDYFTFDVMSEVIFGMAYNALKDTS YRFVTGALGSSNIRIGTLVQSPLPAMCRIDKYLFPESIQGRNKFLGFIGSLLRDRSKASF @@ -6,6 +26,17 @@ LTLPAGVDVGTGIYSLHHNAAYHPEPFKYLPERWLVGEGSSTSESVELARSAFAPFSRGP RSCVGKGFAYHELTLTIAHILHRFDFSATEEDFALRHGSEGPGGINEFLLHDHVTGARSG PLLQFSMRR +>tr|M5BAG7|M5BAG7_9MICO ABC transporter, fused permease/ABC transporter involved in the biosynthesis of cytochrom bd, fused permease/ATP-binding protein OS=Clavibacter michiganensis subsp. nebraskensis NCPPB 2581 OX=1097677 GN=cydC PE=4 SV=1 +MNRDGVLRLAQPPTRRTLPGLLAGLASAVGAVALLATSAWLITRASEQPPILFLGMAIVG +VRAFALGRAAFRYLERITSHDAAFRALATLRVGVFERLLPFAPAGLRDTRRGDLLARLVG +DVDRLQDLPLRVVQPLAVSVVVQAASVAVVGAVLPAAGIALAVVLGVALVVGIGATTALA +GRAETRIAPLRARLQDLVLDFVGGLDVLTSFGAVDDRLAAIDRAATELRRAELRSAAAAG +VTTGVVLAGTGAVAGWTVLQGVPGLASGTLDPAWLALAALVPLALVEQATAVPLAVQAWR +RVRTSAERVAGVVPETVPDEIPREPDDAADAQPVTADASPAGTTLEVRDLVTRWPGADED +ALAPVSLVVRPGETVVVRGPSGSGKSSLAAALARFLESRGAYELDGRDARSMPPSAVRRI +VGLCEQAPHLFDASIRQNLLFARDDATDDELVAVLARVGLADWTAGRGGLDARVGDRGGL +VSGGQAQRIALARALLADFPVLVLDEPTADVDAERARAVLRDVLTAARDRGPGVLLLTHT +DVPHDLVDRTVELRVAGDRVRTE >tr|A0A077Z587|A0A077Z587_TRITR Kelch 3 and Kelch 4 and Cytochrom B561 domain con taining protein OS=Trichuris trichiura OX=36087 GN=TTRE_0000309301 PE=4 SV=1 MGSQQAADETQKVVERIILNINVRKDKRSFGLGIKIKKGNVFVSSIRPGSIAEDHFKLYD VIKDVNGSRIDSRELCRDLIRTHKVLTVTVERELSKNIEQPGQGDRKSSTECPYLETAQP @@ -20,41 +51,7 @@ SASFALILPAGALWALYKSARVTKQKKSGGWTMTHTIAQTCGMVIVAAGAVCSIQAKRDN GKHFGSVHGVLGIIVIALLCVQVALGFSKSLIRTEAQRRTINRVHFWLAIVLLPLAFLNI ILGLQLIAVPVGLLLGFFVHIFCLLAALGLILPILRFRKANRSVAFPPPNDD ->sp|Q13685|AAMP_HUMAN Angio-associated migratory cell protein OS=Homo sapiens OX=9606 GN=AAMP PE=1 SV=2 -MESESESGAAADTPPLETLSFHGDEEIIEVVELDPGPPDPDDLAQEMEDVDFEEEEEEEG -NEEGWVLEPQEGVVGSMEGPDDSEVTFALHSASVFCVSLDPKTNTLAVTGGEDDKAFVWR -LSDGELLFECAGHKDSVTCAGFSHDSTLVATGDMSGLLKVWQVDTKEEVWSFEAGDLEWM -EWHPRAPVLLAGTADGNTWMWKVPNGDCKTFQGPNCPATCGRVLPDGKRAVVGYEDGTIR -IWDLKQGSPIHVLKGTEGHQGPLTCVAANQDGSLILTGSVDCQAKLVSATTGKVVGVFRP -ETVASQPSLGEGEESESNSVESLGFCSVMPLAAVGYLDGTLAIYDLATQTLRHQCQHQSG -IVQLLWEAGTAVVYTCSLDGIVRLWDARTGRLLTDYRGHTAEILDFALSKDASLVVTTSG -DHKAKVFCVQRPDR ->sp|O14639|ABLM1_HUMAN Actin-binding LIM protein 1 OS=Homo sapiens OX=9606 GN=ABLIM1 PE=1 SV=3 -MPAFLGLKCLGKLCSSEKSKVTSSERTSARGSNRKRLIVEDRRVSGTSFTAHRRATITHL -LYLCPKDYCPRGRVCNSVDPFVAHPQDPHHPSEKPVIHCHKCGEPCKGEVLRVQTKHFHI -KCFTCKVCGCDLAQGGFFIKNGEYLCTLDYQRMYGTRCHGCGEFVEGEVVTALGKTYHPN -CFACTICKRPFPPGDRVTFNGRDCLCQLCAQPMSSSPKETTFSSNCAGCGRDIKNGQALL -ALDKQWHLGCFKCKSCGKVLTGEYISKDGAPYCEKDYQGLFGVKCEACHQFITGKVLEAG -DKHYHPSCARCSRCNQMFTEGEEMYLQGSTVWHPDCKQSTKTEEKLRPTRTSSESIYSRP -GSSIPGSPGHTIYAKVDNEILDYKDLAAIPKVKAIYDIERPDLITYEPFYTSGYDDKQER -QSLGESPRTLSPTPSAEGYQDVRDRMIHRSTSQGSINSPVYSRHSYTPTTSRSPQHFHRP -GNEPSSGRNSPLPYRPDSRPLTPTYAQAPKHFHVPDQGINIYRKPPIYKQHAALAAQSKS -SEDIIKFSKFPAAQAPDPSETPKIETDHWPGPPSFAVVGPDMKRRSSGREEDDEELLRRR -QLQEEQLMKLNSGLGQLILKEEMEKESRERSSLLASRYDSPINSASHIPSSKTASLPGYG -RNGLHRPVSTDFAQYNSYGDVSGGVRDYQTLPDGHMPAMRMDRGVSMPNMLEPKIFPYEM -LMVTNRGRNKILREVDRTRLERHLAPEVFREIFGMSIQEFDRLPLWRRNDMKKKAKLF ->tr|M5B8V9|M5B8V9_9MICO ABC transporter involved in the biosynthesis of cytochrom bd, fused permease/ATP-binding protein OS=Clavibacter nebraskensis NCPPB 2581 OX=1097677 GN=CMN_01519 PE=4 SV=1 -MKPLDPRLLRHSASARTMLAVGAVVSVVQTAALVAFCWSLTQLVVRAIGGADQAALAPVL -ALAVGSAVVRGAAAWLLDVTGARGAARVTAELRRRALRAIADLGPAWTAARSRGRLATIV -GPGLDALDPYFARYVPQLILTALATPIVVAVLLLSDPLTGVTVLVTLPVIPVFMVLVGWA -TQEVQRRQWSRLTELASSFLEVVDGLSTLLVFRRARRQTARIRRVTEEYRVETMRVLRIS -FLSGFVLELAASLSVALVAVSVGVRLIGGQLDLEVGLFVLLLAPEAFLPIRQVGVQFHAA -AEGVAAADDVLGILEEERAARATRPVPGPATATPPAGDALVIRDLAVARGDRAVLSGVSA -RFPRGRVTAVTGPSGVGKSSLLGAMLGHLPAGGAAGWIDDDASSLRPPVPTEIAWAGQRP -GLVAGTVRENVALGVADPDDALVRRALALAAADGIDPDLVLGVGGQGLSGGQAQRVAVAR -AVHRALALDCPLVLLDEPSSALDAATEERLAAGIRALADQGRAVVVVTHRGALVRAADAE -LRLGGASGEDDAPAAVGSSVGAGRVAPARIAPEPAWRAQVAP ->tr|Q0P8A9|Q0P8A9_CAMJE Putative formate dehydrogenase, cytochrom B subunit OS=Campylobacter jejuni subsp. jejuni serotype O:2 (strain ATCC 700819 / NCTC 11168) OX=192222 GN=fdhC PE=4 SV=1 +>tr|Q0P8A9|Q0P8A9_CAMJE Putative formate dehydrogenase, cytochrom B subunit OS=Campylobacter jejuni subsp. jejuni serotype O:2 (strain ATCC 700819 / NCTC 11168) OX=192222 GN=fdhC PE=3 SV=1 MRKVFVTLLLSVVSLFAYGSERMGQDTQIWDFHRITNIPNYDTFGKLWTTLQGEYIATIA LIAVIAVLSAFALHYMVIGPKQFSHDGKKIYAFTLFERLFHFIAAISWVILVPTGFVMMF GEVFGGGVFVRVCKNLHAFATILFIISIIPMFLCWIKRMLPASYDIRWMMIVGGYLSKIK @@ -91,14 +88,17 @@ ENGEIQYPVSEITIAVSSLVFSSASFAADLEDNMETLNDNLKVVEKADNAAQVKDALTKM RAAALDAQKATPPKLEGKSPDSPEMKDFRHGFDILVGQIDDALKLANEGKVKEAQAAAEQ LKTTRNAYHQKYR ->tr|M5BAG7|M5BAG7_9MICO ABC transporter, fused permease/ABC transporter involved in the biosynthesis of cytochrom bd, fused permease/ATP-binding protein OS=Clavibacter nebraskensis NCPPB 2581 OX=1097677 GN=cydC PE=4 SV=1 -MNRDGVLRLAQPPTRRTLPGLLAGLASAVGAVALLATSAWLITRASEQPPILFLGMAIVG -VRAFALGRAAFRYLERITSHDAAFRALATLRVGVFERLLPFAPAGLRDTRRGDLLARLVG -DVDRLQDLPLRVVQPLAVSVVVQAASVAVVGAVLPAAGIALAVVLGVALVVGIGATTALA -GRAETRIAPLRARLQDLVLDFVGGLDVLTSFGAVDDRLAAIDRAATELRRAELRSAAAAG -VTTGVVLAGTGAVAGWTVLQGVPGLASGTLDPAWLALAALVPLALVEQATAVPLAVQAWR -RVRTSAERVAGVVPETVPDEIPREPDDAADAQPVTADASPAGTTLEVRDLVTRWPGADED -ALAPVSLVVRPGETVVVRGPSGSGKSSLAAALARFLESRGAYELDGRDARSMPPSAVRRI -VGLCEQAPHLFDASIRQNLLFARDDATDDELVAVLARVGLADWTAGRGGLDARVGDRGGL -VSGGQAQRIALARALLADFPVLVLDEPTADVDAERARAVLRDVLTAARDRGPGVLLLTHT -DVPHDLVDRTVELRVAGDRVRTE +>sp|O14639|ABLM1_HUMAN Actin-binding LIM protein 1 OS=Homo sapiens OX=9606 GN=ABLIM1 PE=1 SV=3 +MPAFLGLKCLGKLCSSEKSKVTSSERTSARGSNRKRLIVEDRRVSGTSFTAHRRATITHL +LYLCPKDYCPRGRVCNSVDPFVAHPQDPHHPSEKPVIHCHKCGEPCKGEVLRVQTKHFHI +KCFTCKVCGCDLAQGGFFIKNGEYLCTLDYQRMYGTRCHGCGEFVEGEVVTALGKTYHPN +CFACTICKRPFPPGDRVTFNGRDCLCQLCAQPMSSSPKETTFSSNCAGCGRDIKNGQALL +ALDKQWHLGCFKCKSCGKVLTGEYISKDGAPYCEKDYQGLFGVKCEACHQFITGKVLEAG +DKHYHPSCARCSRCNQMFTEGEEMYLQGSTVWHPDCKQSTKTEEKLRPTRTSSESIYSRP +GSSIPGSPGHTIYAKVDNEILDYKDLAAIPKVKAIYDIERPDLITYEPFYTSGYDDKQER +QSLGESPRTLSPTPSAEGYQDVRDRMIHRSTSQGSINSPVYSRHSYTPTTSRSPQHFHRP +GNEPSSGRNSPLPYRPDSRPLTPTYAQAPKHFHVPDQGINIYRKPPIYKQHAALAAQSKS +SEDIIKFSKFPAAQAPDPSETPKIETDHWPGPPSFAVVGPDMKRRSSGREEDDEELLRRR +QLQEEQLMKLNSGLGQLILKEEMEKESRERSSLLASRYDSPINSASHIPSSKTASLPGYG +RNGLHRPVSTDFAQYNSYGDVSGGVRDYQTLPDGHMPAMRMDRGVSMPNMLEPKIFPYEM +LMVTNRGRNKILREVDRTRLERHLAPEVFREIFGMSIQEFDRLPLWRRNDMKKKAKLF |
b |
diff -r 054483e27a35 -r bfdc6a7ffd3a test-data/test2_map.tab --- a/test-data/test2_map.tab Sun Sep 16 13:41:08 2018 -0400 +++ b/test-data/test2_map.tab Thu Apr 22 17:32:16 2021 +0000 |
b |
@@ -1,5 +1,4 @@ From To +NM_001087 AAMP_HUMAN NM_130786 A1BG_HUMAN NM_130786 V9HWD8_HUMAN -NM_001087 A0A024R410_HUMAN -NM_001087 AAMP_HUMAN |
b |
diff -r 054483e27a35 -r bfdc6a7ffd3a test-data/test2_retrieve.gff --- a/test-data/test2_retrieve.gff Sun Sep 16 13:41:08 2018 -0400 +++ b/test-data/test2_retrieve.gff Thu Apr 22 17:32:16 2021 +0000 |
b |
b'@@ -1,27 +1,4 @@\n ##gff-version 3\n-##sequence-region A0A077Z587 1 772\n-A0A077Z587\tUniProtKB\tTransmembrane\t593\t617\t.\t.\t.\tNote=Helical;Ontology_term=ECO:0000256;evidence=ECO:0000256|SAM:Phobius\t\n-A0A077Z587\tUniProtKB\tTransmembrane\t637\t656\t.\t.\t.\tNote=Helical;Ontology_term=ECO:0000256;evidence=ECO:0000256|SAM:Phobius\t\n-A0A077Z587\tUniProtKB\tTransmembrane\t668\t692\t.\t.\t.\tNote=Helical;Ontology_term=ECO:0000256;evidence=ECO:0000256|SAM:Phobius\t\n-A0A077Z587\tUniProtKB\tTransmembrane\t704\t727\t.\t.\t.\tNote=Helical;Ontology_term=ECO:0000256;evidence=ECO:0000256|SAM:Phobius\t\n-A0A077Z587\tUniProtKB\tTransmembrane\t733\t755\t.\t.\t.\tNote=Helical;Ontology_term=ECO:0000256;evidence=ECO:0000256|SAM:Phobius\t\n-A0A077Z587\tUniProtKB\tDomain\t20\t94\t.\t.\t.\tNote=PDZ;Ontology_term=ECO:0000259;evidence=ECO:0000259|PROSITE:PS50106\t\n-A0A077Z587\tUniProtKB\tDomain\t552\t761\t.\t.\t.\tNote=Cytochrome b561;Ontology_term=ECO:0000259;evidence=ECO:0000259|PROSITE:PS50939\t\n-##sequence-region A0A077ZHN8 1 634\n-A0A077ZHN8\tUniProtKB\tTransmembrane\t14\t36\t.\t.\t.\tNote=Helical;Ontology_term=ECO:0000256;evidence=ECO:0000256|SAM:Phobius\t\n-A0A077ZHN8\tUniProtKB\tTransmembrane\t56\t80\t.\t.\t.\tNote=Helical;Ontology_term=ECO:0000256;evidence=ECO:0000256|SAM:Phobius\t\n-A0A077ZHN8\tUniProtKB\tTransmembrane\t113\t132\t.\t.\t.\tNote=Helical;Ontology_term=ECO:0000256;evidence=ECO:0000256|SAM:Phobius\t\n-A0A077ZHN8\tUniProtKB\tTransmembrane\t290\t310\t.\t.\t.\tNote=Helical;Ontology_term=ECO:0000256;evidence=ECO:0000256|SAM:Phobius\t\n-A0A077ZHN8\tUniProtKB\tDomain\t312\t364\t.\t.\t.\tNote=HAMP;Ontology_term=ECO:0000259;evidence=ECO:0000259|PROSITE:PS50885\t\n-A0A077ZHN8\tUniProtKB\tDomain\t369\t598\t.\t.\t.\tNote=Methyl-accepting transducer;Ontology_term=ECO:0000259;evidence=ECO:0000259|PROSITE:PS50111\t\n-A0A077ZHN8\tUniProtKB\tCoiled coil\t170\t204\t.\t.\t.\tOntology_term=ECO:0000256;evidence=ECO:0000256|SAM:Coils\t\n-A0A077ZHN8\tUniProtKB\tCoiled coil\t569\t607\t.\t.\t.\tOntology_term=ECO:0000256;evidence=ECO:0000256|SAM:Coils\t\n-##sequence-region A0A077ZFY8 1 973\n-A0A077ZFY8\tUniProtKB\tDomain\t1\t89\t.\t.\t.\tNote=Mur_ligase;Ontology_term=ECO:0000259;evidence=ECO:0000259|Pfam:PF01225\t\n-A0A077ZFY8\tUniProtKB\tDomain\t96\t279\t.\t.\t.\tNote=Mur_ligase_M;Ontology_term=ECO:0000259;evidence=ECO:0000259|Pfam:PF08245\t\n-A0A077ZFY8\tUniProtKB\tDomain\t300\t349\t.\t.\t.\tNote=Mur_ligase_C;Ontology_term=ECO:0000259;evidence=ECO:0000259|Pfam:PF02875\t\n-A0A077ZFY8\tUniProtKB\tCoiled coil\t867\t887\t.\t.\t.\tOntology_term=ECO:0000256;evidence=ECO:0000256|SAM:Coils\t\n-A0A077ZFY8\tUniProtKB\tCoiled coil\t951\t971\t.\t.\t.\tOntology_term=ECO:0000256;evidence=ECO:0000256|SAM:Coils\t\n ##sequence-region M5BAG7 1 563\n M5BAG7\tUniProtKB\tTransmembrane\t21\t43\t.\t.\t.\tNote=Helical;Ontology_term=ECO:0000256;evidence=ECO:0000256|SAM:Phobius\t\n M5BAG7\tUniProtKB\tTransmembrane\t49\t71\t.\t.\t.\tNote=Helical;Ontology_term=ECO:0000256;evidence=ECO:0000256|SAM:Phobius\t\n@@ -32,6 +9,43 @@\n M5BAG7\tUniProtKB\tDomain\t20\t301\t.\t.\t.\tNote=ABC transmembrane type-1;Ontology_term=ECO:0000259;evidence=ECO:0000259|PROSITE:PS50929\t\n M5BAG7\tUniProtKB\tDomain\t345\t559\t.\t.\t.\tNote=ABC transporter;Ontology_term=ECO:0000259;evidence=ECO:0000259|PROSITE:PS50893\t\n M5BAG7\tUniProtKB\tNucleotide binding\t379\t386\t.\t.\t.\tNote=ATP;Ontology_term=ECO:0000256;evidence=ECO:0000256|PROSITE-ProRule:PRU00434\t\n+M5BAG7\tUniProtKB\tRegion\t317\t337\t.\t.\t.\tNote=Disordered;Ontology_term=ECO:0000256;evidence=ECO:0000256|SAM:MobiDB-lite\t\n+##sequence-region A0A077ZHN8 1 634\n+A0A077ZHN8\tUniProtKB\tTransmembrane\t14\t36\t.\t.\t.\tNote=Helical;Ontology_term=ECO:0000256;evidence=ECO:0000256|SAM:Phobius\t\n+A0A077ZHN8\tUniProtKB\tTransmembrane\t56\t80\t.\t.\t.\tNote=Helical;Ontology_term=ECO:0000256;evidence=ECO:0000256|SAM:Phobius\t\n+A0A077ZHN8\tUniProtKB\tTransmembrane\t113\t132\t.\t.\t.\tNote=Helical;Ontology_term=ECO:0000256;evidence=ECO:0000256|SAM:Phobius\t\n+A0A077ZHN8\tUniProtKB\tTransmembrane\t290\t310\t.\t.\t.\tNote=Helical;Ontology_term=ECO:0000256;evidence=ECO:0000256|SAM:Phobius\t\n+A0A077ZHN8\tUniProtKB\tDomain\t312\t364\t.\t.\t.\tNote=HAMP;Ontology_term=ECO:0000259;evidence=ECO:0000259|PROSITE:PS50885\t\n+A0A077ZHN8\tUniProtKB\tDomain\t369\t598\t.'..b'0P8A9\tUniProtKB\tTransmembrane\t99\t124\t.\t.\t.\tNote=Helical;Ontology_term=ECO:0000256;evidence=ECO:0000256|SAM:Phobius\t\n+Q0P8A9\tUniProtKB\tTransmembrane\t136\t156\t.\t.\t.\tNote=Helical;Ontology_term=ECO:0000256;evidence=ECO:0000256|SAM:Phobius\t\n+Q0P8A9\tUniProtKB\tTransmembrane\t195\t216\t.\t.\t.\tNote=Helical;Ontology_term=ECO:0000256;evidence=ECO:0000256|SAM:Phobius\t\n+Q0P8A9\tUniProtKB\tTransmembrane\t244\t264\t.\t.\t.\tNote=Helical;Ontology_term=ECO:0000256;evidence=ECO:0000256|SAM:Phobius\t\n+Q0P8A9\tUniProtKB\tDomain\t93\t274\t.\t.\t.\tNote=Ni_hydr_CYTB;Ontology_term=ECO:0000259;evidence=ECO:0000259|Pfam:PF01292\t\n ##sequence-region O14639 1 778\n O14639\tUniProtKB\tChain\t1\t778\t.\t.\t.\tID=PRO_0000075697;Note=Actin-binding LIM protein 1\t\n O14639\tUniProtKB\tDomain\t97\t156\t.\t.\t.\tNote=LIM zinc-binding 1;Ontology_term=ECO:0000255;evidence=ECO:0000255|PROSITE-ProRule:PRU00125\t\n@@ -72,25 +86,12 @@\n O14639\tUniProtKB\tSequence conflict\t532\t532\t.\t.\t.\tNote=A->R;Ontology_term=ECO:0000305;evidence=ECO:0000305\t\n O14639\tUniProtKB\tSequence conflict\t563\t563\t.\t.\t.\tNote=K->E;Ontology_term=ECO:0000305;evidence=ECO:0000305\t\n O14639\tUniProtKB\tSequence conflict\t578\t578\t.\t.\t.\tNote=V->I;Ontology_term=ECO:0000305;evidence=ECO:0000305\t\n-##sequence-region S0DS17 1 369\n-S0DS17\tUniProtKB\tChain\t1\t369\t.\t.\t.\tID=PRO_0000437163;Note=Cytochrome P450 monooxygenase apf8\t\n-S0DS17\tUniProtKB\tMetal binding\t303\t303\t.\t.\t.\tNote=Iron (heme axial ligand);Ontology_term=ECO:0000250;evidence=ECO:0000250|UniProtKB:P04798\t\n-##sequence-region Q0P8A9 1 310\n-Q0P8A9\tUniProtKB\tTransmembrane\t55\t78\t.\t.\t.\tNote=Helical;Ontology_term=ECO:0000256;evidence=ECO:0000256|SAM:Phobius\t\n-Q0P8A9\tUniProtKB\tTransmembrane\t99\t124\t.\t.\t.\tNote=Helical;Ontology_term=ECO:0000256;evidence=ECO:0000256|SAM:Phobius\t\n-Q0P8A9\tUniProtKB\tTransmembrane\t136\t156\t.\t.\t.\tNote=Helical;Ontology_term=ECO:0000256;evidence=ECO:0000256|SAM:Phobius\t\n-Q0P8A9\tUniProtKB\tTransmembrane\t195\t216\t.\t.\t.\tNote=Helical;Ontology_term=ECO:0000256;evidence=ECO:0000256|SAM:Phobius\t\n-Q0P8A9\tUniProtKB\tTransmembrane\t244\t264\t.\t.\t.\tNote=Helical;Ontology_term=ECO:0000256;evidence=ECO:0000256|SAM:Phobius\t\n-Q0P8A9\tUniProtKB\tDomain\t93\t274\t.\t.\t.\tNote=Ni_hydr_CYTB;Ontology_term=ECO:0000259;evidence=ECO:0000259|Pfam:PF01292\t\n-##sequence-region M5B8V9 1 582\n-M5B8V9\tUniProtKB\tTransmembrane\t20\t43\t.\t.\t.\tNote=Helical;Ontology_term=ECO:0000256;evidence=ECO:0000256|SAM:Phobius\t\n-M5B8V9\tUniProtKB\tTransmembrane\t55\t77\t.\t.\t.\tNote=Helical;Ontology_term=ECO:0000256;evidence=ECO:0000256|SAM:Phobius\t\n-M5B8V9\tUniProtKB\tTransmembrane\t134\t154\t.\t.\t.\tNote=Helical;Ontology_term=ECO:0000256;evidence=ECO:0000256|SAM:Phobius\t\n-M5B8V9\tUniProtKB\tTransmembrane\t161\t180\t.\t.\t.\tNote=Helical;Ontology_term=ECO:0000256;evidence=ECO:0000256|SAM:Phobius\t\n-M5B8V9\tUniProtKB\tTransmembrane\t236\t260\t.\t.\t.\tNote=Helical;Ontology_term=ECO:0000256;evidence=ECO:0000256|SAM:Phobius\t\n-M5B8V9\tUniProtKB\tDomain\t20\t302\t.\t.\t.\tNote=ABC transmembrane type-1;Ontology_term=ECO:0000259;evidence=ECO:0000259|PROSITE:PS50929\t\n-M5B8V9\tUniProtKB\tDomain\t340\t570\t.\t.\t.\tNote=ABC transporter;Ontology_term=ECO:0000259;evidence=ECO:0000259|PROSITE:PS50893\t\n-M5B8V9\tUniProtKB\tNucleotide binding\t372\t379\t.\t.\t.\tNote=ATP;Ontology_term=ECO:0000256;evidence=ECO:0000256|PROSITE-ProRule:PRU00434\t\n+##sequence-region A0A077ZFY8 1 973\n+A0A077ZFY8\tUniProtKB\tDomain\t1\t89\t.\t.\t.\tNote=Mur_ligase;Ontology_term=ECO:0000259;evidence=ECO:0000259|Pfam:PF01225\t\n+A0A077ZFY8\tUniProtKB\tDomain\t96\t279\t.\t.\t.\tNote=Mur_ligase_M;Ontology_term=ECO:0000259;evidence=ECO:0000259|Pfam:PF08245\t\n+A0A077ZFY8\tUniProtKB\tDomain\t300\t349\t.\t.\t.\tNote=Mur_ligase_C;Ontology_term=ECO:0000259;evidence=ECO:0000259|Pfam:PF02875\t\n+A0A077ZFY8\tUniProtKB\tCoiled coil\t867\t887\t.\t.\t.\tOntology_term=ECO:0000256;evidence=ECO:0000256|SAM:Coils\t\n+A0A077ZFY8\tUniProtKB\tCoiled coil\t951\t971\t.\t.\t.\tOntology_term=ECO:0000256;evidence=ECO:0000256|SAM:Coils\t\n ##sequence-region Q13685 1 434\n Q13685\tUniProtKB\tChain\t1\t434\t.\t.\t.\tID=PRO_0000050832;Note=Angio-associated migratory cell protein\t\n Q13685\tUniProtKB\tRepeat\t89\t129\t.\t.\t.\tNote=WD 1\t\n' |
b |
diff -r 054483e27a35 -r bfdc6a7ffd3a uniprot.py --- a/uniprot.py Sun Sep 16 13:41:08 2018 -0400 +++ b/uniprot.py Thu Apr 22 17:32:16 2021 +0000 |
[ |
@@ -7,47 +7,61 @@ available services: map retrieve + +rewitten using inspiration form: https://findwork.dev/blog/advanced-usage-python-requests-timeouts-retries-hooks/ """ import argparse import sys import requests +from requests.adapters import HTTPAdapter +from requests.packages.urllib3.util.retry import Retry -url = 'https://www.uniprot.org/' + +DEFAULT_TIMEOUT = 5 # seconds +URL = 'https://www.uniprot.org/' + +retry_strategy = Retry( + total=5, + backoff_factor=2, + status_forcelist=[429, 500, 502, 503, 504], + allowed_methods=["HEAD", "GET", "OPTIONS", "POST"] +) -def _retrieve(query, format='txt'): - """_retrieve is not meant for use with the python interface, use `retrieve` - instead""" - tool = 'uploadlists/' - - query = list(set(query.split('\n'))) - queries = [query[i:i+100] for i in range(0, len(query), 100)] +class TimeoutHTTPAdapter(HTTPAdapter): + def __init__(self, *args, **kwargs): + self.timeout = DEFAULT_TIMEOUT + if "timeout" in kwargs: + self.timeout = kwargs["timeout"] + del kwargs["timeout"] + super().__init__(*args, **kwargs) - data = { - 'format': format, - 'from': 'ACC+ID', - 'to': 'ACC' - } - - responses = [requests.post(url + tool, data=data, files={'file': ' '.join(_)}) for _ in queries] - page = ''.join(response.text for response in responses) - return page + def send(self, request, **kwargs): + timeout = kwargs.get("timeout") + if timeout is None: + kwargs["timeout"] = self.timeout + return super().send(request, **kwargs) -def _map(query, f, t, format='tab'): +def _map(query, f, t, format='tab', chunk_size=100): """ _map is not meant for use with the python interface, use `map` instead """ tool = 'uploadlists/' + data = {'format': format, 'from': f, 'to': t} - data = { - 'from': f, - 'to': t, - 'format': format, - 'query': query - } - response = requests.post(url + tool, data=data) + req = [] + for i in range(0, len(query), chunk_size): + q = query[i:i + chunk_size] + req.append(dict([("url", URL + tool), + ('data', data), + ("files", {'file': ' '.join(q)})])) + return req + response = requests.post(URL + tool, data=data) + response.raise_for_status() page = response.text + if "The service is temporarily unavailable" in page: + exit("The UNIPROT service is temporarily unavailable. Please try again later.") return page @@ -72,10 +86,23 @@ retrieve.add_argument('-f', '--format', help='specify output format', default='txt') args = parser.parse_args() - query = args.inp.read() + + # get the IDs from the file as sorted list + # (sorted is convenient for testing) + query = set() + for line in args.inp: + query.add(line.strip()) + query = sorted(query) if args.tool == 'map': - args.out.write(_map(query, args.f, args.t, args.format)) + pload = _map(query, args.f, args.t, chunk_size=100) + elif args.tool == 'retrieve': + pload = _map(query, 'ACC+ID', 'ACC', args.format, chunk_size=100) - elif args.tool == 'retrieve': - args.out.write(_retrieve(query, format=args.format)) + adapter = TimeoutHTTPAdapter(max_retries=retry_strategy) + http = requests.Session() + http.mount("https://", adapter) + for i, p in enumerate(pload): + response = http.post(**p) + args.out.write(response.text) + http.close() |
b |
diff -r 054483e27a35 -r bfdc6a7ffd3a uniprot.xml --- a/uniprot.xml Sun Sep 16 13:41:08 2018 -0400 +++ b/uniprot.xml Thu Apr 22 17:32:16 2021 +0000 |
[ |
@@ -1,10 +1,10 @@ -<tool id="uniprot" name="UniProt" version="0.2"> +<tool id="uniprot" name="UniProt" version="0.3"> <description>ID mapping and retrieval</description> <macros> <import>macros.xml</import> </macros> <requirements> - <requirement type="package" version="2.19.1">requests</requirement> + <requirement type="package" version="2.25.1">requests</requirement> </requirements> <version_command>echo "UniProt ID mapping for Galaxy in version 0.1"</version_command> <command detect_errors="aggressive"><![CDATA[ |