diff test-data/PUBLIC_Ectocarpus-sp7_proteins_head.fa @ 0:196795831b6a draft

planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/tapscan commit 2e1cd301fb38af8a1e9267fc60fcb5ca3c576aeb
author bgruening
date Wed, 14 Feb 2024 13:54:16 +0000
parents
children
line wrap: on
line diff
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/PUBLIC_Ectocarpus-sp7_proteins_head.fa	Wed Feb 14 13:54:16 2024 +0000
@@ -0,0 +1,32 @@
+>Ec-00_001160.1 Forkhead-associated (FHA) domain (809) ;mRNA; f:1452084-1459465
+MEPPPPVPAPIIVAGTRAKETGVDGNSSAATAGSTAAVSPPLDKAQQSALDPAKDGSASLPPPPPKTAGSLNGDGVKAVASGGYKPPSWGLTEAPGASGLSLTVLKGGVEVGSISLDNRTHVLLGRQQGVVDVLLEHPSISRKHAILQHGQNGALFLFDNGSTHGCSVNKKKIPPKEFHRLHVGDVIKFGESTRLYALEGPEELRPAEYESDNLRNLRLDAGRKQLAAKLAKIKAGGAGEGGGKGGGDSGEYGISWGFDEDAVAEEEDEDGDGAERDEDEVELPDYLKTEAQKRRRRDTKIGLTEDNVHKRDAKLFEKLQLKLTKIEEIEETIRSKNKARERGKEGGEGGSGGEEGGRKAGRGTEDGEEDDDYYDRTAPVVPTSSGTSKSDLASKKAEIKARRFGARDKTKKLSAVTPPADDTAAAERKRGVGPGQNEAAAQSLEALTRRGEAVVEDLERTQAGLAELEAEEAGEAALAEDGGVAADPLDMFMTENRRKERQQAIVRLTAKREALREEQALLKVMVEAARPSMPTLKKSPAPAAATASVAATKEETVPVPETTTRGSGSSSSDQAAEPDDRKDTRAAAVDREHMPGGGGYGEAMPGSTGSGSHEKYGDEVEKTAPSRAVLAPEAASTLGSMPSPVAPPCRSNAIPEARKSPAGTVASAGTRERGVEKGQAETRHPGVKEGKEASGTKKRGTPVGTSMLPPPPSKRQQRRAENSKAGLAGENDDDPVEPKAKRTVKGPAMPPPLGKPSKVGGGVSVPTAVARVGEKVAGKEALEGGDVDWVPPKDALEKMAALNRKFGY*
+>Ec-00_001310.1 SET domain protein (668) ;mRNA; r:1563326-1571582
+MAIPTSKDEDLLDDEQAPAVAAAQDQELVAGSDAGTVAPSKKKKKKKKKKKSPQQNNQLAQVQVYETIKDLDTFKVTEDSVSGRCVIASRDLKAGELVLREPPFVKVVRRDCASRQCAYCCQQVTERGKIEADVPFAVYCSRACQAREDALRAAEASALGKLAGISAARDVDIDLLRMLLRLLITRAKALGLREPSGDSDSVSRGVDEEGEDGTMGEGLFLRQQWENLYALMHHREAMAPDWISVVREAGEDLLQLLPEWVRFDVEEVVQLACRVNVNAHGLRDDSGANLVIGVGMFPLTAMINHACRPNCTFVYFGGNLEVRTLEPVSAGAELSVYYIDLLQSTAARRQELLTSKHFLCKCSRCENPSSMDDYLDGVCCTDCGERGCLTPTPPPSAEDILAAQLAQLGEGLADESAANGSGKGMGKKKGGGGGSTTSRRETSVNPSAALGAKDGSGNGSRAGGVRGGSESVVQKVYCSACGREYPGTAVEESVARAKALWDAAMAVVRAKSFSLARKSLEKWLQDYDAGAVLPPTATKKKSVKKDRLKLHPANVMVVQTLVPLSNCCTFEEDHAASARHLRRAVSAMEAVYPANFPELGDFHAALADANDALLQKRGQTLPKKSRSQAVSERKQALERAATIRSVCLGKDHPATREAARALDRVTG*
+>Ec-00_001360.1 aureochrome 2 (442) ;mRNA; r:1593684-1598236
+MPASVKPPVFTSMVHRKVQHHTSWQDADFQPDDLGLDLTDLSTMTGFLMNEVPDNTGHFYPPWANELSPLVKDEPSAFMMPDPAAPRQPQPRQQQQQQDQRLPAPEGLPAAPVADPALDVIMGGATGSSRPGSTTSSSSSGASSMLRAPKAAAAAGAAALGGVGSTFRKTPAGGVTRRRSSSKEEQAKKRRERNRVLARRTRLRKKFFFQSLQQQVARLQRENERLKGIVTTRCPDSVGEILMSCRSKMPSMVADCAGQATAVLDQSGFLLVKALQSSQPSFCVTDPQMPDNPIVYASDTFIELTGYDRAQVLGRNCRFLQGPDTDPDAVAKIRKGIEEGSDTSVYLRQYKADGTVFWNHVFVAALRNSEHKIINYVGIQHPLDKEPSPEVVACINNGKEQEIMSVQEEDRPAGWGGQWPEDVNGDLATLDHLMAGGWGTD*
+>Ec-00_001730.1 WD40 repeat (1089) ;mRNA; r:1948051-1960039
+MSGYSRAGVGVGGGGGGGGGGGGGGGGGGGGANSNRGASASRGPGGALQGAHMAGTVATVAAAGGQQSKSVAVFRSLELCDLLKLEIGNITSEMGQHLEEREEYEKKFRQQLAEMDRIQHSLKQLQEAHMVMKQQYEDEIVRLRHQLESSHPLKSDPDSRGGGAGSSVQGVSGGMSMGSTGPSQSHSSGPPHKGLGGMPVGGPHGLGSPRKQPGQLEPGAASLRGPMLTAPGAQLVGGGGMGAGSGVVLPGMAMRGRGHGEDDYGGGRGQGPNGQTLEPLSKRPRLADLQGPPGPLPPHVLHPPHGFSQSQHQQHPQQHQQHPPPHHKGGFFGGRPGAPPAAVAGGGGGGGGGGDNGGRRPGGPEGQYRWPGGSGPGGGGGGGDSGGAGGGGGAGVPAMGPGKQRQLGPGGGGAPPRELSSSTGKGGGAGGGGGGNGNGMVEIPDAIPAELSYQVRYEAEEGEGGRAAAAKDGLAVELAKSQDLRSVVCCVRFSTDGTKIAAGSHSCVKVFDVNSFKQLYVCRKQVQEEQGAPQTADGGDPYVRAVCFSPDGLSIVAGMEKNSAKVLVLEEEGGRQGAITLSGHESEVYSLDWVSDMIASGSGDGRIRLWDSVTGACKASLGDMGGPQDGVTSVVLRQDTTMVAAASIDRVVHVWSTQTHKILHRLDGHSESVYAITFSADGNRLVSGGLDKTIKVWDLGPGSEGRLSPQAKTLPGGHKDYVLSVCFSQDGKYIISGSKDRSVTMWDARLMKRVATITGFKNSVIGVSASPFNSMFATGSGDNLVCVWNYGDRDDYRRQSESAVAPASSGRSSSAEKPRPPSRSSRSASPPISNASSLRKDDRASSPSPPRASPGRGGRGGDGDGGSSRGRGGVGLVEKGRGGSAGAGAGATNGKGRTSPSSDEREGRTAAGSEERKRSGSKESSRTGPRGGGGGHDSDRKQQRHESKHRQGRAGSPSDGRRSSSNSKERSSGRGGGVEPMDEDDDTEEEKQGEEAEGGGGKRAGNTDETPLGRKRGSGGVGNGSGGRKALNRSSSSSSSSSGSGGGGGGGGGGGGGGGRGPSPEKRGKAALPPKKELQRRDSPSSAE*
+>Ec-00_010160.1 Phytochrome-like protein (978) ;mRNA; f:17223525-17226527
+MDPHTHTNERIHMRSSGGCDGDMRTASTHIQSCGCAFAIEETADDMYPSGLRILGVSQNAVEAPWAYASSVSDLLGKDLGHLLRVECVRTVRSLVTRYAQACKPSHEDDDHISPKANRITADACPSPRIRGELRPGAASGAEGDIASFTVTGSNPGVYLVDVERHGSDCARVEHTPGLLLLGDLLESIPVGSNPVESTAALCDALAKSMPAYDRVMVYRFAPDGSGQDDGSGEVVHESVRAGADIGSSYLNLRFPALDIPPIARKLFKLVGVRFIADTSAPAVPMITLHDQASSPLDLFRSALRAPAECHLRYLRNMGVKASLVVSIAVDGGTWGLFSFHSYTRTVHPSCEERLSVEMAASVVSSLISRYQREEIAATALSLSRTLGNLGNYTRVNDFLSADHHSLLGILDVDAVILCEHLRSVTLYGKKDITLSLEECQELRNGDGDESSEMAISFRTLGARGVAFFWVRSFFVAFLRGSIANSVKWAGNPDAPVNKDEVMTPRASFELFMRTSGARCKAWSPLTVDLLNMVRQGFSSQLYAEALPADLQETFARVSHELRTPFHGVMGALEILEAGNGIMGAEEQLDVIRSALRCGGSMMSTLNDILEIAKDRNNTEVVRGRFSASGPIVLAVAAMGLFAAAESVELTVEIGPPDDVLEVTGDMRRIKAIVQNLVNNAIKFTPSGGKVRISLVVFDSLQEVTDWWAKETGRFGAQTWMASSGGESAPGTGSSQAIKWHVYCVEDSGIGVLPADLPHLVEAYRQISHGASRSHAGTGLGLHICRTHMEAMCGSFGIASTFSEKDTSGGTLFAVVLPLDSEEPGAAVNTQEPLEAEVNLRLLDHKIRRFFKDNGADVEVMSATDGFIALEMHEAARRNQSHGSVLAGMFIDFHMPDLDGIECTKRIRLLEADNGWSRIMICGCTADPTQAIRRVFQNAGGDEVISKPWCPGQVESICNAMVANVLNAEQKSGGDGGA*
+>Ec-00_001700.1 NIN-like transcription factor (579) ;mRNA; r:1923852-1928158
+MHTPLLNSHHRDTGLLETLEKPDKEPSTSRQQDTVMSLSTHSGTRGRPPANRASCGNSTIPDITVRSPADGLPPRLAIPHEPPKVPRRTPSKGNKRETLADIAKRIPVGLMRHYFNYPLRAAAEAMDISVTTLKRLCRRHGVKRWPHRQICGINRTLNDLETQHDTAKGDEVDSVADQLRQLYRRRDVIIELAFESDDESISNGSDDAPPAGRKLSKRGSFTSSDGGGSSASSSSFPSPPSSPSPSRSSSFVSPPASPTPTDERTHTAAGVTWLNNGAPGTGLPSLAPVLSVTVSSGGGGGGGGSSSSRSSKCPAVRSRGSSRGAKISSGGVGSSGSSGSYGKTSSGSMRPHRPSGTSGSGRSKGPRKPRSSAMFGSIPGLGKVPPPVVTVATGAAVSTTLSLPERTSASTSTSTSPVRADASTETSSRVTIPVPSRPLSASIPANSSSTHDGGGTSTVARLSLIGSGASWISDNDAPSPSTTSVDILGLGPHGSQKMDDLAILGDLLFGPDDAAVAAAAAAGVRAQSSAATYPPPSSTTSPPSSSYERGFSAGLASASNWGGGLCWDANGLSHLGPL*
+>Ec-01_005970.1 Acetyltransferase (GNAT) domain protein (608) ;mRNA; f:5180258-5197307
+MERSVSLAKRRNLVIGWRKMARKKEIQVVLLAALISTLGIGPVAARIVVTDHLAFVASTVRTRTSSSSSPSTFQLQRDVRKTAAVPPRRYEQQQQTSRLRPRCGWGLERPSLSPDPVPDAFSAPLRRRRRRPRQQQQQHLVVAASSGLQEPLERVASIPVQEAAAGRGDRVSYGRGGTVVEAAAPEGVDAADGGGHERKTAGSVYGDEVGVLRGAVIWKGEENDADKDDGGGGGEDDDFEGDDIDIYLPGGMGAGLRPGAKPRRKRPKPPVMWSKPVRGSKRLAVVLAGREDLDEAGALCIKVFFGQPDSPWKAAQLRQLLHEQRQDLESRCSRRESVMFKAIDTRRKDGMVGFVEVSETSGSKYGMGAGITLADTRPVVSNLAVDPRVRRCGVGSALMEACEDLVKTWSFDEIILQVEEANEAALAFYGGKGFKKLFVDKAARRYDTSGFLLQNVRTSKLTMRKALGSSTKRSKSGDSLADHVSQLFGFLSKPFVVRPPPSKRLPARSTASVETLFGRPGAVGSGSGVRRPRSGGSGRRVTSSGGRVGSSSGGIGRSSGRSEAAAGGHDTSFSSSSSSSSSSSSSSSSAGEISTSRTRLPRTIRRR*
+>Ec-01_004960.2 Ankyrin repeat-containing domain (797) ;mRNA; f:4270310-4278760
+MPAEGRRANPIELNIYIEVVLYSSTTRLAAASFFFCFSFFSSKTTVSGEPTPRGGDFADPPPIFMIARSTASPSLIDITKLSSAMMLGNMSSSVLSQLDRLKESFLWAAAKGGRVEECESLLEMGTDINWVSPEGDTPLLAACRNGHLQTALCLLSHGASANQVDKDGRTALHVSCRYGKEAVAEALILRGADVSARDHGGATAFESQGPHVPDGMLQRLDTIAQRSGRRTHHHLGISTAAINTSTFTTSSGRSAQDGGGSMSSRRSNTVLDSDTLSARATGGGVPENNIGDGRSGWRWRSNTGRIEHHVPLTDDAHDGAAGVGPAAISTGDGGRDDAQREERGGVEGRTTFPSISRKAGSTSADSRPSSRVHSAGRAASSSGDGVRSSDDEHDSAAIAAAIASASAPAPATTVTAAGSTIYPMMASNTLASPAPGPTSLRSPRRPLHFHGTPTASWDGAGADGGAGHGITVSNSRDSGSGGNRWNGSGSASGSSSSSSSSSSSNSGRGGGGERQSRPAASATNANSPATATGTTATTTTVTPTCGLYGSLSTNAVAERINSRSITAHWLSPPAAAEVRGPLGDHAMHWGGRTNGDLVSGDAPYESIAPAGAGGRGVLGGGGHGGDPAQGDGGSSDHVGLIRALWLQEKESRLASEAKADAVRDQSARLWNELVRSEKQVLSLEEGAAALREERDKLKATLNGEGFKGRSLQELEHLEKDLRKALEGVCGERDRIVQQQLAKEEQRLCVVCQENERSVLLLPCRHLCVCRGCSERQELTLCPLCRDHITESLVVYS*
+>Ec-01_005360.1 Ferrochelatase-2, putative chloroplast precursor (583) ;mRNA; f:4601493-4607037
+MRREQKMRAAATLLCTLSVASAWFVAPPTSAASSHRHFDSTTSRASSPPFSSTAQRRRRNAAGGDAADASTTSGNIRGRRRAAAARTSHRMVASSRNWEWGRAKSSGDAPTPAAQAFGSDQELKLGVLLLNLGGPERPEDVQPFLFNLFADPDIIRLPKLVQWLQNPIAAVLAARRAPQSKSAYESIGGGSPIVSWTNAQAKGIASQLEAKGLSGTKCYVGMRYWHPFTEAALEAVEDDEINALVILPLYPQFSISTSGSSLRILNEEFTRRPEQWGHKNVVHTVVPSYHDRPGYVNAMASLIAREVAEYTPEQRMQGVQVLFSAHGVPKSYIDAGDPYKAQIESCVKLISEKVDGINAEGGPGAKPGSSGAAAGGVTYHLSYQSRVGPVEWLQPYTDAKIHELADNGCKNLVVVPVSFVSEHIETLEEIDMEYREVAEEAGITNWRRVPALNTDPAFIEDMADMVVEALALPTLTVSEAFTRNNCDRKEAEGFLEKALDGMYGMPKTGGKPPKSGKVGGAGAAGANASSGGGGGADGEGSGDKRKEAARVLSTLSGAAFAADGVGREIAGLFTATSDGIFF*
+>Ec-01_005370.1 Hypothetical protein (68) ;mRNA; r:4610968-4611171
+MAHGVLLSSTTGWWRNLQVWCPCCCIFQFEPVGFYLHAKRGPSRLQTISLVGQRIMIFADPKQLESA*
+>Ec-01_005380.1 Aminoalcohol phosphotransferase (396) ;mRNA; r:4612890-4621264
+MSDFRGGSVVTPRAVKYLRRYQYHGSDRSLLYKYVLSPLAETCLVFLPSWMAPNLVTTIGLGLTTASYLLLYLSMPGLVSNESTPWWVFPAAAAGLIVYQTLDNMDGKQARRTGSSSPLGLIFDHGCDAINCCFGVVFVSCILDAGSSLPLLAAIVLNQLVPFFFTTWEHYYTHELILPIVNGPSEGVVLGAVSACLRGVYGPEFFSAPREGLRGWPLGEVLMACSLLGVALTVFKQIVLVARARRLAGRGMVNPIRDASWFVVLMVLGGSWASVRPELFLTKPYTMVLLFGLLHVDMAVHLMVCHVCNMVCRSFRPILIPFMLVAANSFFPGGPLLGERTLVLGFTVLTFIYEALYLYLVVTETSLALDIYVFKLGKRSDATRNGGGTTTSKKD*
+>Ec-01_005390.1 WD40 repeat (407) ;mRNA; f:4621750-4629304
+MSESKDGGGSSGGGGRAPYLDVSEDKMYDSRLRGDYELHDYAHSPSNQRLKEQRESKGGGSIADRVLGARLHPGLTISENSAEVFVTRFAPEGNLLAAACGDGTIRIFHVSTGRLAYNLQSSSSQSLPTTSLRFRPAIAQSKTRNVLVSCNAGGEIQHWHITSGKCLSTIKEEDQFYALDYRKDGSVFAATGKNHTVHIYDETTKHEISLLQGGSGYGSSSAPGHSNRVFAVKFHPEDPEVLLTAGWDNTVQFWDMRVGHSVRSIFGPHISGDSLDICGNEILTGSWRPNDPLEIWDYGTAELKETIPWNRSSAQGVQPTLLYTAQFSNTADGGRYIAAGGSGANEAKIFDHTANNQLVGTVTGLPRGVFTVDFSPSPDAKKVAVAGGDASIRIIDIVEEKTADVY*
+>Ec-01_005400.1 hypothetical protein (1653) ;mRNA; r:4630582-4637601
+MSYVERLREELMGSLGFEVESQSCLSGNRGSAGERDQKARRRRSGGGAIAAVQVGVPYPHALRPRQIQQQQQQQQQQQGRRAADDSSCMVGGGCLRPQRADLSRVPRSRRRPASASSVRYLANKSNMNDGYSGANKDMDVLLKICRDQGRANSLNPADFDSSISAIANLPVKQFMTAAKDGWGPYFRNLHSNMRKETTARSTTTAKRMNRPPPERRRRSSQQQHPPLPLPRRASSGATKDEKKNNRRYSKVANDLHHMVRSADVASSDSNNRRRRRQSEDDNSDGLAASRARAAKRQAEEMVIRRMGVRLQALWQELKIPDPDRAYVTAAYLDAGGGGGGFSGQRARGGGGIEEPPVGSGGGGGGNSGPTSENVNRELTRQIRLLLEHRAATVKVLRCVNARESRLCEVEQALQAFQWHRGLDTDALGVVVSLAGLRDASLDVVRAVEEWRTNLWQPRAFCWRGVNYLEKMWQDTIFLRSPVGQSLLASVGLEAKDMTFVLYPSGNGGGAPSAIPGDSSTCGSELSDGERDTKGDVLRPPPAIVRLTPKAELVSAYRARYFEQSPVVGAGGRPGGESGDVGGERGRLKSTAAAATAAMEAVVVQEAALQRRVEAERVRLATKGCFVPLLRWLPGDSRNPAPKGKRRWSSSSPPSVPPAARNPPPGAESETHAAKDVVDSFAHNDGRSGVPAVRDVSVSAAIPPDPLTGGELPLQLQQQQQQQQQQQQPATVTNTSTSAGASLFRGSVRDSAQQERLTVSGEGDGHEEEDREDEDGDEGEDREQDEKGQASLLHTEGVRSQKQPERVEEGGHDQTQSQSEGPQAGQGSTAEVEGRSAFHENGVGEQTKMTNPLAPSFRLETSLHPPGAEEESRSETDIARRSACTVGAEARAGENGCLKVVATSECGVGSAGIPVGGVSSGDDGDGDTDKPSIVPGELRQEGIVDEERSVAPSVCYDDDFEEDAEGYSLSDSETSGEGGSADFGECLNGSISSDDAKDARRDQGVAHTTEEEGAAISCGEGRQNPVVGGNNVLTEHQRQQQLVEERETVAATAALRIQRSARAWLCRGGRLRNTKPDEKEAPQESAKEGKQEWLDAWRARRHSQVRQAQRPEEIPEEAAIRIQTTVRGGLASRQVEELRRELHARKMAATLKIQAFVRRRRARRNTTAINRREISENVDLRQQQEAEPDPELAGVGVCRGTARQGEEEILAVSSEFDSAEAATRSDRSARTIQKAVRRRLSSGNTTSKADGLPAMEIKGQPKTLEEEAQGQPDAGKRGDGPGAVLVNRCGSGDGSFIPSQQAPVVAAESSSPVVRAGDELDSPSSPAAVDGTPSSTPASGADGLDARLSDADGKNNRPDVAESAFVEAGLPSTSLPSEDSAESETADDAAGGDLSQTLQHPREGSNFQPEGASSWSPLPSPTTPRPEAAERGQQENDHQPRQVEGGGEAAVSLPPSSATACPPTLGPTVDVFVGLLPVDTDTSADAMMTTVGGTHAGGGAESLGFSAVGLSPVPERQALVAVAASASEYGSEDPDFDALSSSPGGSSRGGVSRGEEENAGVAARVATRSSVVTTGEKVEEPTESRGVERVAAPVAAAVAGAATEKNLAGDIEPVSLAAAEVATTKEVERGGTQCTEDGSDNSSIVSLSVSSGS*
+>Ec-01_005410.1 Hypothetical protein (154) ;mRNA; f:4637945-4638913
+MGSAWSRKQATIHSSFQAAPLAVASWDLQHVKILHDRFRDDGYEFGIDRVSLRDLISSALPLARGVTGDLWEIYVEHEQEMLYPLELFAAVALQCHGLSRCGVSTIYSCPVFLCKNCKNPSYFHAHFGPCRSEGRRLDWCISSKASPGIRVHF*
+>Ec-01_005410.2 Hypothetical protein (200) ;mRNA; f:4641160-4641759
+MATGDSKTEFSIPTPIPVNPCNGTCSLSSPVDASCKIVVTQHLYAVHAAIVLRGNSKQLKTRDLVRICARFDGKPVATLPPQSFHAHSSPAHCVVRLKKAGALHNRTAVPPSCRWPLATPLVYLFDQGSNHRHLRRQQHRSKRLLVCIAPTTIKPARPTTVVPSLRQPPPRLCPAPRPAPLVPATHHPRAIHQQRGRRC*
+>Ec-01_005410.3 Hypothetical protein (102) ;mRNA; f:4639028-4639623
+MRGALLKLGVYRWLSVQRKRENSTKTRPQPTDSVCAVEVYYRVGVSFRAPRLLRSQPTEKRRGLCSTCLTLKADKRFRTTSWPSASRPSWEHFRRSLDPAV*