comparison PDAUG_Word_Vector_Descriptor/test-data/test.fasta @ 0:668434d3fc8a draft

"planemo upload for repository https://github.com/jaidevjoshi83/pdaug commit a9bd83f6a1afa6338cb6e4358b63ebff5bed155e"
author jay
date Wed, 28 Oct 2020 01:45:32 +0000
parents
children
comparison
equal deleted inserted replaced
-1:000000000000 0:668434d3fc8a
1 >ACP
2 GLWSKIKEVGKEAAKAAAKAAGKAALGAVSEAV
3 >ACP
4 GLFDIIKKIAESI
5 >ACP
6 GLLDIVKKVVGAFGSL
7 >ACP
8 GLFDIVKKVVGALGSL
9 >ACP
10 GLFDIVKKVVGTLAGL
11 >ACP
12 GLFDIAKKVIGVIGSL
13 >ACP
14 GLFDIVKKIAGHIAGSI
15 >ACP
16 GLFDIVKKIAGHIVSSI
17 >ACP
18 AACARFIDDFCDTLTPNIYRPRDNGQRCYAVNGHRCDFTVFNTNNGGNPIRASTPNCKTVLRTAANRCPTGGRGKINPNAPFLFAIDPNDGDCSTNF
19 >ACP
20 HGVSGHGQHGVHG
21 >ACP
22 FKCRRWQWRMKKLGAPSITCVRRAF
23 >ACP
24 KWKLFKKIKFLHSAKKF
25 >ACP
26 KSSAYSLQMGATAIKQVKKLFKKWGW
27 >ACP
28 GIGTKILGGVKTALKGALKELASTYAN
29 >ACP
30 GIGGKILSGLKTALKGAAKELASTYLH
31 >ACP
32 GIGGVLLSAGKAALKGLAKVLAEKYAN
33 >ACP
34 SIGAKILGGVKTFFKGALKELASTYLQ
35 >ACP
36 FLPLLAGLAANFLPTIICKISYKC
37 >ACP
38 FVQWFSKFLGRIL
39 >ACP
40 KWKIFKKIEKVGRNIRNGIIKAGPAVAVLGEAKAL
41 >ACP
42 GWLKKIGKKIERVGQHTRDATIQTIGVAQQAANVAATLK
43 >ACP
44 KWKLFKKIEKVGQNIRDGIIKAGPAVAVVGQATQIAK
45 >ACP
46 SQLGDLGSGAGQGGGGGGSIRAAGGAFGKLEAAREEEFFYKKQKEQLERLKNDQIHQAEFHHQQIKEHEEAIQRHKDFLNNLHK
47 >ACP
48 GIGKFLHSAKKFGKAFVGEIMNS
49 >ACP
50 GIGAVLKVLTTGLPALISWIKRKRQQ
51 >ACP
52 ALWKNMLKGIGKLAGQAALGAVKTLVGAE
53 >ACP
54 ACYCRIPACIAGERRYGTCIYQGRLWAFCC
55 >ACP
56 ECRRLCYKQRCVTYCRGR
57 >ACP
58 LKLKSIVSWAKKVL
59 >ACP
60 KWCFRVCYRGICYRRCR
61 >ACP
62 KSCCRNTWARNCYNVCRLPGTISREICAKKCDCKIISGTTCPSDYPK
63 >ACP
64 GLLSVLGSVAKHVLPHVVPVIAEHL
65 >ACP
66 GLLSVLGSVVKHVIPHVVPVIAEHL
67 >ACP
68 GLFKVLGSVAKHLLPHVAPVIAEK
69 >ACP
70 GLFGVLGSIAKHVLPHVVPVIAEK
71 >ACP
72 GLFVGVLAKVAAHVVPAIAEHF
73 >ACP
74 GLFVGLAKVAAHNNPAIAEHFQA
75 >ACP
76 GFVDFLKKVAGTIANVVT
77 >ACP
78 GLLQTIKEKLESLESLAKGIVSGIQA
79 >ACP
80 TRSSRAGLQFPVGRVHRLLRK
81 >ACP
82 FFGWLIKGAIHAGKAIHGLIHRRRH
83 >ACP
84 GLFDVIKKVASVIGGL
85 >ACP
86 GLFDIIKKVASVVGGL
87 >ACP
88 GRFKRFRKKFKKLFKKLSPVIPLLHLG
89 >ACP
90 GGLRSLGRKILRAWKKYGPIIVPIIRIG
91 >ACP
92 RRRPRPPYLPRPRPPPFFPPRLPPRIPPGFPPRFPPRFP
93 >ACP
94 GLLGPLLKIAAKVGSNLL
95 >ACP
96 GLICESCRKIIQKLEDMVGPQPNEDTVTQAASQVCDKLKILRGLCKKIMRSFLRRISWDILTGKKPQAICVDIKICKEKTGLI
97 >ACP
98 DHYNCVSSGGQCLYSACPIFTKIQGTCYRGKAKCCK
99 >ACP
100 FFHHIFRGIVHVGKTIHRLVTG
101 >ACP
102 KLAKLAKKLAKLAK
103 >ACP
104 KTCENLADTFRGPCFATSNC
105 >ACP
106 IDWKKLLDAAKQIL
107 >ACP
108 FLIGMTQGLICLITRKC
109 >ACP
110 ILPILSLIGGLLGK
111 >ACP
112 GLLGLLGSVVSHVVPAIVGHF
113 >ACP
114 GLLGLLGSVVSHVLPAITQHL
115 >ACP
116 GIKCRFCCGCCTPGICGVCCRF
117 >ACP
118 QSHLSLCRWCCNCCRSNKGC
119 >ACP
120 ILGPVISTIGGVLGGLLKNL
121 >ACP
122 FLPILASLAAKFGPKLFCLVTKKC
123 >ACP
124 GLWSKIKEAAKAAGKAALNAVTGLVNQGDQPS
125 >ACP
126 LLGMIPLAISAISALSKL
127 >ACP
128 GLPVCGETCVGGTCNTPGCSCSWPVCTRN
129 >ACP
130 GVPICGETCTLGTCYTAGCSCSWPVCTRN
131 >ACP
132 GIPCGESCVWIPCISSAIGCSCKSKVCYRN
133 >ACP
134 GIPCAESCVWIPCTVTALIGCGCSNKVCYN
135 >ACP
136 GTFPCGESCVFIPCLTSAIGCSCKSKVCYKN
137 >ACP
138 GLLPCAESCVYIPCLTTVIGCSCKSKVCYKN
139 >ACP
140 GRDYRTCLTIVQKLKKMVDKPTQRSVSNAATRVCRTGRSRWRDVCRNFMRRYQSRVTQGLVAGETAQQICEDLRLCIPSTGPL
141 >ACP
142 GETDPNTQLLNDLGNNMAWGAALGAPGGLGSAALGAAGGALQTVGQGLIDHGPVNVFIPVLIGPSWNGSGSGYNSATSSSGSGS
143 >ACP
144 GFKDLLKGAAKALVKTVLF
145 >ACP
146 KSCCPNTTGRNIYNACRLTGAPRPTCAKLSGCKIISGSTCPSDYPK
147 >ACP
148 KSCCPNTTGRNIYNTCRFGGGSREVCARISGCKIISASTCPSDYPK
149 >ACP
150 KSCCPNTTGRNIYNTCRLTGSSRETCAKLSGCKIISASTCPSNYPK
151 >ACP
152 MRKEFHNVLSSGQLLADKRPARDYNRK
153 >ACP
154 KSCCKNTTGRNIYNTCRFAGGSRERCAKLSGCKIISASTCPSDYPK
155 >ACP
156 FIFHIIKGLFHAGKMIHGLVTRRRH
157 >ACP
158 FLPAIVGAAAKFLPKIFCAISKKC
159 >ACP
160 FLPIIAGVAAKVLPKIFCAISKKC
161 >ACP
162 FLPIIAGIAAKFLPKIFCTISKKC
163 >ACP
164 FLPVIAGVAANFLPKLFCAISKKC
165 >ACP
166 FLPIIAGAAAKVVQKIFCAISKKC
167 >ACP
168 GLMDTIKGVAKTVAASWLDKLKCKITGC
169 >ACP
170 VNWKKVLGKIIKVAK
171 >ACP
172 VNWKKILGKIIKVAK
173 >ACP
174 FFSLLPSLIGGLVSAIK
175 >ACP
176 RFRLPFRRPPIRIHPPPFYPPFRRFL
177 >ACP
178 KWKLFKKIPKFLHLAKKF
179 >ACP
180 YKQCHKKGGHCFPKEKICLPPSSDFGKMDCRWRWKCCKKGSG
181 >ACP
182 GIPCGESCVFIPCITGAIGCSCKSKVCYRN
183 >ACP
184 GEFLKCGESCVQGECYTPGCSCDWPICKKN
185 >ACP
186 GLPTCGETCTLGTCYVPDCSCSWPICMKN
187 >ACP
188 GLPVCGETCFGGTCNTPGCTCDPWPVCTRN
189 >ACP
190 FVDLKKIANIINSIFGK
191 >ACP
192 GSIPCGESCVFIPCISSVIGCACKSKVCYKN
193 >ACP
194 GIPCGESCVFIPCISSVIGCSCSSKVCYRN
195 >ACP
196 GSIPCGESCVFIPCISAVIGCSCSNKVCYKN
197 >ACP
198 GSIPCEGSCVFIPCISAIIGCSCSNKVCYKN
199 >ACP
200 GIPCGESCVFIPCLTSAIDCSCKSKVCYRN
201 >ACP
202 GMWSKILGHLIR
203 >ACP
204 GKWMSLLKHILK
205 >ACP
206 GFGMALKLLKKVL
207 >ACP
208 GTGLPMSERRKIMLMMR
209 >ACP
210 GIACGESCVFLGCFIPGCSCKSKVCYFN
211 >ACP
212 GVIPCGESCVFIPCISSVLGCSCKNKVCYRD
213 >ACP
214 KLCGETCFKFKCYTPGCSCSYPFCK
215 >ACP
216 GDACGETCFTGICFTAGCSCNPWPTCTRN
217 >ACP
218 GIPCAESCVWIPPCTITALMGCSCKNNVCYNN
219 >ACP
220 IPCGESCVWIPCITAIAGCSCKNKVCYT
221 >ACP
222 AIPCGESCVWIPCISTVIGCSCSNKVCYR
223 >ACP
224 GEYCGESCYLIPCFTPGCYCVSRQCVNKN
225 >ACP
226 IPCGESCVWIPCISGMFGCSCKDKVCYS
227 >ACP
228 FLGWLFKWASK
229 >ACP
230 FLKWLFKWAKK
231 >ACP
232 KWKSFLKTFKSAKKTVLHTALKAISS
233 >ACP
234 KWKSFLKTFKSLKKTVLHTLLKAISS
235 >ACP
236 MPFLFCNVNDVCNFASRNDYSCNYYSNSYSFWLASLNPER
237 >ACP
238 KWKLFKKIGAVLKVL
239 >ACP
240 GACFSIAHECGA
241 >ACP
242 TCCATGACGTTCCTGACGTT
243 >ACP
244 KRFKQDGGASHASPASS
245 >ACP
246 KRAKAAGGWSHWSPWSSC
247 >ACP
248 LLGDFFRKSKEKIGKEFKRIVQRIKDFLRNLVPRTES
249 >ACP
250 FLGALFKVASKVLPSVKCAITKKC
251 >ACP
252 GIGKFLKKAKKFGKAFVKILKK
253 >ACP
254 GIGKFLKKAKKGIGAVLKVLTTGL
255 >ACP
256 VECYGPNRPQF
257 >ACP
258 KRFKQDGGWSHWSPWSSC
259 >ACP
260 RQVFQVAYIIIKA
261 >ACP
262 KAFDITYVRLKF
263 >ACP
264 DFKLFAVTIKYR
265 >ACP
266 DFKLFAVYIKYR
267 >ACP
268 WHSDMEWWYLLG
269 >ACP
270 HTMYYHHYQHHL
271 >ACP
272 RLVSYNGIIFFLK
273 >ACP
274 GRENYHGCTTHWGFTLC
275 >ACP
276 ASSSYPLIHWRPWAR
277 >non-ACP
278 MTISLIWGIAMVVCCCIWVIFDRRRRKAGEPPL
279 >non-ACP
280 MFATPLRQPTNASGARPAVSMDGQETPFQYEITD
281 >non-ACP
282 LLWRKVAGATVGPGPVPA
283 >non-ACP
284 DSPDPMNGASSNALIAKMNSAKLLYQHY
285 >non-ACP
286 NNQEVIDAISQAISQTPGCVL
287 >non-ACP
288 KKVVEKNADPETTLLVYLRRKLGLCGTKLGCGEG
289 >non-ACP
290 CSRLLPSLAQEEG
291 >non-ACP
292 KNDFAALQAKLDADAAEIEKWWSDSR
293 >non-ACP
294 VDREQLVQKARLAEQAERYDD
295 >non-ACP
296 RPLRRVVLFYQGKLCSMAGNFWQSSHYLQW
297 >non-ACP
298 GAAGERKLCLLSLLLIGA
299 >non-ACP
300 MFRKLLKMWILLRPTHWLILIALCAVTCAGYWLLWSE
301 >non-ACP
302 HLRGPADSGWMPQAAPCLSGAPQAS
303 >non-ACP
304 NNPNNSNSHLRPHAYNNSRRDDSD
305 >non-ACP
306 VVILASLSVMFLVSLWQQKIRERLPPGPTPLPFIGNY
307 >non-ACP
308 ICLSCLISFFLWNQNRAKGKLPPG
309 >non-ACP
310 VVMNSLRVILQAS
311 >non-ACP
312 ARPRLDLQLVQRFVRIQKVF
313 >non-ACP
314 MLAKGLSLRSVLAKGCQPFLSPTWQSSVLATGGGANIS
315 >non-ACP
316 AAGLPGAALPLRKRPLRAPSPEPAAPRGAAGLVV
317 >non-ACP
318 PPMPSAPPVHPPP
319 >non-ACP
320 SCPIDKRRPLIAFLRRLRD
321 >non-ACP
322 RLGLWASGLILILGFLKLLRLLLRRQRLARAMD
323 >non-ACP
324 FSPQRDRFQAEGS
325 >non-ACP
326 GTLWALVFLGILVGMVVPSPAGTRANNTLLDSRG
327 >non-ACP
328 MNRLLQKGTSLVPSWRTR
329 >non-ACP
330 MTTSLIWGIAIAACCCLWLILGIRRRQT
331 >non-ACP
332 ATLANGMSLQPPLEEVS
333 >non-ACP
334 PLTATNSGLAVNN
335 >non-ACP
336 VRACHKVCRCLLSGFGGRVDAGQPELLTER
337 >non-ACP
338 TAGILLLLLLGTLEGS
339 >non-ACP
340 MEPSILLLLALLVGFLLLLVRGH
341 >non-ACP
342 MKNCFQLLCNLKVPAAGFKNTVKS
343 >non-ACP
344 SVIHTQAHASGLQQVPQLVPAGPGGGGKAVAPSKQSK
345 >non-ACP
346 KPLGLLKPSSLMKVSGRFKAHQDA
347 >non-ACP
348 ARTLNNKLSLSKPKFSGFT
349 >non-ACP
350 LLLVIIWTLFGPSGLGEELLSLSLASLLPAPASPGPP
351 >non-ACP
352 WPGILVGGARVASCRYPALGPRLA
353 >non-ACP
354 RSVKGLVALITGGASGL
355 >non-ACP
356 AAAALRARILQVSSKVN
357 >non-ACP
358 TGCCIAGRLANLDDQNLTVAL
359 >non-ACP
360 GSILGFLQIATVLTVLLLLLK
361 >non-ACP
362 AARQIGSCLMRCRTLDTTSP
363 >non-ACP
364 WGCRGRRWAFARVDGGSCHRRGAPTGSTSNQIR
365 >non-ACP
366 YAKPGAVRSPAQILQWQVLPNTVPAKS
367 >non-ACP
368 RMAGPWLSLHEARLLGTRGAAAPKAV
369 >non-ACP
370 SISNRAAVPEHGVAPDAERL
371 >non-ACP
372 PNFSMETWLLLV
373 >non-ACP
374 PRPPSKTYRGAFQN
375 >non-ACP
376 SVLVKGCQPFLSAPRECPGHPRVGT
377 >non-ACP
378 LVTPPKALLKPLSIPNQ
379 >non-ACP
380 KMQGSRMDEQRCS
381 >non-ACP
382 VIADDLPPTCIRP
383 >non-ACP
384 LPGGLRVLVQTGH
385 >non-ACP
386 GWIWRWGWGRRCLGRPGLPGPGPGPATPLFLLLL
387 >non-ACP
388 RGIRGSSAARPSGRRRDPAGRTTETGFNIFTQHD
389 >non-ACP
390 QQEKEFLESYPQNCPPDALPGTPGNLD
391 >non-ACP
392 APARRVLQVKRVMQESSLSPAHL
393 >non-ACP
394 KVAPGGPTGYPGNLTAEQEQKLGELKMILL
395 >non-ACP
396 FLASYPQKCPAGSLPGTPGNTDE
397 >non-ACP
398 MDAKARNCLLQHREALEKDIKTSY
399 >non-ACP
400 ASRQLLVAPPEAL
401 >non-ACP
402 MISNGIGTVTTGKRSMCLFPLLLIGLWGC
403 >non-ACP
404 MTLRNFGMGKRSIEDRVQEEARCLVEELRKTNASPC
405 >non-ACP
406 AVFGLGGVGLSVIMGCKAAGASRIIAVDIN
407 >non-ACP
408 PNAKQSILQKNPDDVVIVAAYRTA
409 >non-ACP
410 AMELLLTATIFYLVLWVVKAFRLQVPKGLKSPPGP
411 >non-ACP
412 LLAAGFCPAVLCH
413 >non-ACP
414 AASVNDEQHQRIIKYGRALVLDIVEQ
415 >non-ACP
416 IARLREDGIQKRVIQEGRGELPDFQDG
417 >non-ACP
418 FIVVMNILALTLPFLAAEVQN
419 >non-ACP
420 CQNGRRANRTVRFARTA
421 >non-ACP
422 WVTVRSQQRGLFPAI
423 >non-ACP
424 LLRSCPLQGSPGRPRSV
425 >non-ACP
426 LNDGHFMPVLGFGTYAPPEVPRNRAVEV
427 >non-ACP
428 HLGRPSAPTIVAQPVSGLASPASFQPEQFQYTLDNNVLT
429 >non-ACP
430 RPEPGGCCCRRTVRANGC
431 >non-ACP
432 SWVEENRASFQPPVCNKLMHR
433 >non-ACP
434 VFHRVRWAPELGASLG
435 >non-ACP
436 RAKVLTLDGMNPRVRRVEYAVRGPIVQRALELEQELRQ
437 >non-ACP
438 LLQRARLAEQAERYDDMASAMKAVTELNEPLS
439 >non-ACP
440 ALIQKLNSDPQFVLAQNVGTTHDLLDICLKRATVQRA
441 >non-ACP
442 AALPMLWTGLVLLGLLGFPQTPAQGHDTVQPNFQQ
443 >non-ACP
444 QRRQNDSSVFLAIMVAAAVES
445 >non-ACP
446 CNAPGCGQRFTNEDHLAVHKHKHEMTLKFGPARTDS
447 >non-ACP
448 LVLLTVQNSALILTLNYSRIMPGYD
449 >non-ACP
450 TVLSPPQRFKRILQAMMLAVAVV
451 >non-ACP
452 ISRGLLLLAALCCLAPSFL
453 >non-ACP
454 VAGTESAQGPPGPAASLELWLNKATDPS
455 >non-ACP
456 QYLRIRTVQPEPDYGAAV
457 >non-ACP
458 ASPTQTPPTTSTIRVARRSRVALVAM
459 >non-ACP
460 TIWRNQHTYKMATSASANLSKIVKKNYMELPQDGKVQ
461 >non-ACP
462 LSITRGLLLLAALCCLAPIS
463 >non-ACP
464 ILLSIWRQSSGRGKLPPGPIPLPIIGNIFQ
465 >non-ACP
466 LLLLSWVALGPRSLEGADPGTPGEAEGPACP
467 >non-ACP
468 LRVKRAMQEASFMPPLLPPAAHQRFSTVPAVP
469 >non-ACP
470 GLLLLAGLCCLVFGIMAEDAQVAQGPSQQI
471 >non-ACP
472 RHVGLLCATGPQRWRF
473 >non-ACP
474 AAVALARPKPPLRHQEHLQNEPDS
475 >non-ACP
476 SRVNDQSQASRNGLKGKVLTLDTMNPCV
477 >non-ACP
478 AAALGPGVLQATRAFHTGQPRLAPLPPLPEYGGK
479 >non-ACP
480 LCTSGLWTAQASTNESSNSHRGLAPTNV
481 >non-ACP
482 PAIQPVLSGLSRIVNGEEA
483 >non-ACP
484 GCQASLSTAQERLGHPGVPTREGVR
485 >non-ACP
486 RKVLILTLVVAACGFVLWSSNGR
487 >non-ACP
488 GRVRSRCPGPALLLLLALAARPALAGPPAAALQ
489 >non-ACP
490 CRITKPALLVLNQETAKVVQT
491 >non-ACP
492 KAEVCMAVPWLSLQ
493 >non-ACP
494 SHLELNNGTKMPTLGLGT
495 >non-ACP
496 LLLPEAAAERDAREKLALWDRRPDTTAPL
497 >non-ACP
498 LLALSLVLLYRYATYSHGFFKKLGIPGPKPLPLFGNVLS
499 >non-ACP
500 LLSLWRQSSGRGKLPPGPTPLPVIGNILQIGIKD
501 >non-ACP
502 AFKSMEVANFYYEADCLAAAYGGKAAPAAPPADRPGPR
503 >non-ACP
504 SLFWAARPLQRCGQLVRMAIRAQH
505 >non-ACP
506 MRPPRTLTSTATMSALSTSMPMEIDDVMDEDAVNGQA
507 >non-ACP
508 LLSLIGFCWAQYDP
509 >non-ACP
510 LWARSKNDQLRISFPPGLCWG
511 >non-ACP
512 PQGFDVDRDAKKLNKACKGMGTNEAAIIEILSG
513 >non-ACP
514 IFCLILWVVKAWQPRLPKGLKSPPGPWGWPLLG
515 >non-ACP
516 LDAASPGPLALLGLLFAATLLLSALFLL
517 >non-ACP
518 VTLLFKLYCLA
519 >non-ACP
520 ATRAAAARLVGTAASRTPAAARH
521 >non-ACP
522 RNKLDLETLTDILEHQIR
523 >non-ACP
524 RRLVLQARTYAQAAASPAPAAGPGQMSFTFASPTQVFF
525 >non-ACP
526 PGRSRSAADDINPAPANM
527 >non-ACP
528 LLSALTLETWVLLAVILVLLYRLG
529 >non-ACP
530 VMGHGLCPQGARAKAAIPAALRDHEST
531 >non-ACP
532 FLVSIAGLLYALVQLGQPCDCLPPLRAAA
533 >non-ACP
534 VRSVRAAVGGLRAISAPSAPCLPRPWGLRAG
535 >non-ACP
536 RGGCWPRGLQQLLVPGG
537 >non-ACP
538 APATPPRPLKRKKLQFTDVTPESSP
539 >non-ACP
540 EQAERYDDMAAAMKAVTEQGHELSNEERNL
541 >non-ACP
542 MPNDPSDNQLK
543 >non-ACP
544 TELLLAITVFCLGFWVVRALRTQVP
545 >non-ACP
546 LTADLLGAPFFTLPKELQLALLERQTVFL
547 >non-ACP
548 GHGRLVEIQGRLGVRIER
549 >non-ACP
550 LPFKLLLFVLLDGWTRLTH
551 >non-ACP
552 QALWLVLVLSMPPVLVAAVVGTLVSLVQ