diff test-data/glassgo_NsiR4_Synechocystis_sp_PCC6803.fa @ 13:76b7a84ba942 draft

Uploaded
author computationaltranscriptomics
date Tue, 14 Jan 2020 06:03:45 -0500
parents
children
line wrap: on
line diff
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/glassgo_NsiR4_Synechocystis_sp_PCC6803.fa	Tue Jan 14 06:03:45 2020 -0500
@@ -0,0 +1,144 @@
+>NsiR4_Synechocystis_sp_PCC6803
+AAGACATAAAGTCAATATCACCCTCCGATTGCTAGAGGTCGCCCATTGCTTCAGTGGCGGCTTTCTTTTT
+>CP017708.1:6970845-6970912 Moorea producens JHB sequence-p.c.VAL:60.47%-taxID:1454205
+ACCAAGTAACCTAGAGTTACCCTCCGATTGCTTAACCATGCCGCCCTATTGCTAGCGGCGGTTTTTTA
+>CP011304.1:c510694-510626 Microcystis aeruginosa NIES-2549, complete genome-p.c.VAL:61.63%-taxID:1641812
+AAGACATAAAGTCAATATCACCCTCCGATTGCAATGAGAAAATGTTTGGATCGCTTAATATTTAAGCCC
+>CP024785.1:c5901670-5901600 Nostoc flagelliforme CCNUN1 chromosome, complete genome-p.c.VAL:60.23%-taxID:2038116
+GCAGAGTAATCTGTAATTACCCTCCGATTGCTTAACCAAACCGCCCTATGATATTTAGTGGCGGTTTTTTT
+>AP017295.1:c5126310-5126244 Nostoc sp. NIES-3756 DNA, complete genome-p.c.VAL:61.18%-taxID:1751286
+CGAAGTAGGCTATAGATTACCCTCCGATTGCTTAACCAGACCGCCCTAACCTAGTGGCGGTTTTTTT
+>CP012375.1:c508130-508062 Microcystis aeruginosa NIES-2481, complete genome-p.c.VAL:61.63%-taxID:1698524
+AAGACATAAAGTCAATATCACCCTCCGATTGCAATGAGAAAATGTTTGGATCGCTTAATATTTAAGCCC
+>AP018248.1:c2285028-2284962 Tolypothrix tenuis PCC 7101 DNA, nearly complete genome-p.c.VAL:55.68%-taxID:231146
+GCAATTTAAGCTATAAATACCCTCCGATTGCTTAACCAAACCGCCCTAGATTAGCGGCGGTTTCCTC
+>CP003653.1:c4488913-4488847 Stanieria cyanosphaera PCC 7437, complete genome-p.c.VAL:61.18%-taxID:111780
+AAAGCTTAAGCTATTATTACCCTCCGATTGCTTATTCAGACCGCCCAAATCTAGAGGCGGTTTTTTA
+>AP012205.1:c1288143-1288074 Synechocystis sp. PCC 6803 DNA, complete genome, strain: GT-S-p.c.VAL:100.0%-taxID:1148
+AAGACATAAAGTCAATATCACCCTCCGATTGCTAGAGGTCGCCCATTGCTTCAGTGGCGGCTTTCTTTTT
+>AP012277.1:c1288386-1288317 Synechocystis sp. PCC 6803 substr. PCC-N DNA, complete genome-p.c.VAL:100.0%-taxID:1080229
+AAGACATAAAGTCAATATCACCCTCCGATTGCTAGAGGTCGCCCATTGCTTCAGTGGCGGCTTTCTTTTT
+>AP018174.1:1782280-1782351 Anabaenopsis circularis NIES-21 DNA, nearly complete genome-p.c.VAL:59.55%-taxID:1085406
+CCCAGAGTAATCTTTAATTACCCTCCGATTGCTTAACCAGACAACCGCCATAATTTAGTGGCGGTTTTTTAT
+>CP020771.1:c600281-600213 Microcystis aeruginosa PCC 7806SL chromosome, complete genome-p.c.VAL:63.53%-taxID:1903187
+AAGACATAAAGTCAATATCACCCTCCGATTGCAATGAGAAAATGTTTGAATCGCTTAATATTTGGGCTT
+>AP012278.1:c1288398-1288329 Synechocystis sp. PCC 6803 substr. PCC-P DNA, complete genome-p.c.VAL:100.0%-taxID:1080230
+AAGACATAAAGTCAATATCACCCTCCGATTGCTAGAGGTCGCCCATTGCTTCAGTGGCGGCTTTCTTTTT
+>CP007542.1:c257489-257420 Synechocystis sp. PCC 6714, complete genome-p.c.VAL:97.18%-taxID:1147
+AAGACATAAAGTCAATATCACCCTCCGATTGCTAGAGGTCGCCCGTTGCTTCAGTGGCGGCTTTCTTTTT
+>AP018207.1:4141752-4141819 Calothrix brevissima NIES-22 DNA, nearly complete genome-p.c.VAL:58.62%-taxID:1973478
+TCAAGAGTAATCTATATCTACCCTCCGATTGCTTAACTAAACCGCCCTCGTTTTGCGGCGGTTTTCTC
+>AP018318.1:c3470288-3470217 Nostoc sp. HK-01 DNA, complete genome-p.c.VAL:59.55%-taxID:196308
+CCCAGAGTAATCTTTAATTACCCTCCGATTGCTTAACCAGACAACCGCCATAATTTAGTGGCGGTTTTTTAT
+>AP018269.1:749499-749565 Cylindrospermum sp. NIES-4074 DNA, nearly complete genome-p.c.VAL:61.18%-taxID:2005457
+AGCATAGTAAGCTAAAACTACCCTCCGATTACTTAACCACACCGCCCTCATTTAGTGGCGGTTTTTT
+>CP011339.1:2880774-2880842 Microcystis panniformis FACHB-1757, complete genome-p.c.VAL:63.53%-taxID:1638788
+AAGACATAAAGTCAATATCACCCTCCGATTGCAATGAAAAAATGTTTGGATCGCTTAGTATTTAAGCCT
+>AP018172.1:7286537-7286603 Calothrix sp. NIES-2098 DNA, complete genome-p.c.VAL:57.47%-taxID:1954171
+GCAGAGTAAGCTATAACTACCCTCCGATTGCTTAACCAGACCGCCCTAGTTTAGCGGCGGTTTTCTC
+>BA000019.2:c4499343-4499277 Nostoc sp. PCC 7120 DNA, complete genome-p.c.VAL:63.1%-taxID:103690
+CAGAATAGGCTAGAGATTACCCTCCGATTGCTTAACCAGACCGCCCTAATCTAGTGGCGGTTTTTTT
+>AP019314.1:2189722-2189790 Microcystis viridis NIES-102 DNA, complete genome-p.c.VAL:61.63%-taxID:213615
+AAGACATAAAGTCAATATCACCCTCCGATTGCAATGAAAAAATGTTTGGATCGCTTAAGGTTTAAGCCT
+>AP018178.1:6725304-6725371 Calothrix sp. NIES-2100 DNA, nearly complete genome-p.c.VAL:62.35%-taxID:1954172
+TAAAGAGTAAGCTATATCTACCCTCCGATTGCTTAACTAGACCGCCCTTGTTTAGCGGCGGTTTTCTC
+>AP012276.1:c1288245-1288176 Synechocystis sp. PCC 6803 substr. GT-I DNA, complete genome-p.c.VAL:100.0%-taxID:1080228
+AAGACATAAAGTCAATATCACCCTCCGATTGCTAGAGGTCGCCCATTGCTTCAGTGGCGGCTTTCTTTTT
+>CP002198.1:c2006173-2006101 Cyanothece sp. PCC 7822, complete genome-p.c.VAL:76.54%-taxID:497965
+AAGACATAAAGTCAATATCACCCTCCGATTGCTTATCCAAGCCGCCCGTTGTCTAGGGGCGGTTTCTCTTTTT
+>CP019636.1:c552258-552192 Nostocales cyanobacterium HT-58-2, complete genome-p.c.VAL:61.18%-taxID:1940762
+CCAGAGTAAGCTTATAGTACCCTCCGATTGCTTAACCAGACCGCCCTAATTAAGTGGCGGTTTTTTT
+>CP001037.1:3179029-3179099 Nostoc punctiforme PCC 73102, complete genome-p.c.VAL:62.07%-taxID:63737
+GCAGAGTAATCTGTAATTACCCTCCGATTGCTTAACCAGACCGCCCTATTATATTTAGTGGCGGTTTTTTT
+>CP003630.1:5983203-5983270 Microcoleus sp. PCC 7113, complete genome-p.c.VAL:58.62%-taxID:1173027
+GCACCGTAAGCTTGTACTACCCTCCGATTGCTTAATCACGCCGCCCTATTTCTAGAGGCGGTTTTTTA
+>AP018233.1:c762274-762208 Fremyella diplosiphon NIES-3275 DNA, nearly complete genome-p.c.VAL:55.68%-taxID:1973485
+GCAAATTAAGCTATAAATACCCTCCGATTGCTTAACCAAACCGCCCTAGATTAGCGGCGGTTTCCTC
+>CP003590.1:4604043-4604111 Pleurocapsa sp. PCC 7327, complete genome-p.c.VAL:56.18%-taxID:118163
+AAGATATAGAGTCAATATCACCCTCCGATTGCTGGAAATTGACCTCCTTAATCTGTCGCAATGTAAAGA
+>AP012495.1:c2672591-2672522 Bacillus subtilis BEST7613 DNA, complete genome-p.c.VAL:100.0%-taxID:1204343
+AAGACATAAAGTCAATATCACCCTCCGATTGCTAGAGGTCGCCCATTGCTTCAGTGGCGGCTTTCTTTTT
+>AM778881.1:2250-2318 Microcystis aeruginosa PCC 7806 genome sequencing data, contig C251-p.c.VAL:63.53%-taxID:267872
+AAGACATAAAGTCAATATCACCCTCCGATTGCAATGAGAAAATGTTTGAATCGCTTAATATTTGGGCTT
+>AP018180.1:6949840-6949906 Nostoc carneum NIES-2107 DNA, nearly complete genome-p.c.VAL:55.68%-taxID:1973483
+GCAATTTAAGCTATAAATACCCTCCGATTGCTTAACCAAACCGCCCTAGATTAGCGGCGGTTTCCTC
+>CP017599.1:7196019-7196086 Moorea producens PAL-8-15-08-1, complete genome-p.c.VAL:60.47%-taxID:1458985
+ATCAAGTAACCTAGAGTTACCCTCCGATTGCTTAACCATCCCGCCCTATTGCTAGCGGCGGTTTTTTA
+>CP023278.1:4829822-4829885 Nostoc sp. CENA543 chromosome, complete genome-p.c.VAL:59.52%-taxID:1869241
+GGAGGTTAGTCTATAGATTACCCTCCGATTGCTTAACTAGACCGCCCTTTAGTGGCGGTTTTTT
+>CP016483.1:2220526-2220599 Synechococcus sp. PCC 8807, complete genome-p.c.VAL:56.52%-taxID:195248
+CCCGCGCTAGGTTAGCAATACCCTCCGATTGCTTATCAAGCTAGACCGTCCTCACCCAGTGGCGGTTTTTTATT
+>AP018216.1:c2608232-2608166 Anabaena variabilis NIES-23 DNA, nearly complete genome-p.c.VAL:63.1%-taxID:1973479
+CAGAATAGGCTAGAGATTACCCTCCGATTGCTTAACCAGACCGCCCTAATCTAGTGGCGGTTTTTTT
+>CP000951.1:2203752-2203825 Synechococcus sp. PCC 7002, complete genome-p.c.VAL:56.52%-taxID:32049
+CCCGCGCTAGGTTAGCAATACCCTCCGATTGCTTATCAAGCTAGACCGTCCTCACCCAGTGGCGGTTTTTTATT
+>CP001291.1:c4248692-4248623 Cyanothece sp. PCC 7424, complete genome-p.c.VAL:77.22%-taxID:65393
+AAGACATAAAGTCAATATCACCCTCCGATTGCTTATCCAGGCCGCCCATAGTCTAGGGGCGGTTTCTCTT
+>AP018268.1:6771484-6771550 Scytonema sp. NIES-4073 DNA, nearly complete genome-p.c.VAL:61.18%-taxID:2005464
+GCAGAGTAAGCTGTAAATACCCTCCGATTGCTTAACCAGACCGCCCTAATTAAGTGGCGGTTTTTTT
+>AP017375.1:c3231655-3231589 Stanieria sp. NIES-3757 DNA, complete genome-p.c.VAL:61.18%-taxID:1807358
+AAAGCCTAAGCTAGTATTACCCTCCGATTGCTTATTCAGACCGCCCAAATCTAGAGGCGGTTTTTTA
+>AM778951.1:90327-90395 Microcystis aeruginosa PCC 7806 genome sequencing data, contig C321-p.c.VAL:63.53%-taxID:267872
+AAGACATAAAGTCAATATCACCCTCCGATTGCAATGAGAAAATGTTTGAATCGCTTAATATTTGGGCTT
+>AP018298.1:882710-882779 Fischerella sp. NIES-4106 DNA, nearly complete genome-p.c.VAL:60.92%-taxID:2005456
+CCAGAGTAAGCTAAAAATACCCTCCGATTGCTTAACCAGACCGCCCTACTCTACTAGTGGCGGTTTTTTC
+>CP003548.1:5862130-5862199 Nostoc sp. PCC 7107, complete genome-p.c.VAL:59.09%-taxID:317936
+GCAGAGTAATCTTTAATTACCCTCCGATTGCTTAACCAGACAACCGCCATCATCTAGTGGCGGTTTTTTA
+>BA000022.2:c1289326-1289257 Synechocystis sp. PCC 6803 DNA, complete genome-p.c.VAL:100.0%-taxID:1148
+AAGACATAAAGTCAATATCACCCTCCGATTGCTAGAGGTCGCCCATTGCTTCAGTGGCGGCTTTCTTTTT
+>CP016474.1:2244707-2244779 Synechococcus sp. PCC 7003, complete genome-p.c.VAL:57.14%-taxID:374981
+CCCGCGCTAGGTTAGCAATACCCTCCGATTGCTTATCAAGCTAGACCGTCCCCCCCAGTGGCGGTTTTTTATT
+>AP018255.1:9040341-9040410 Calothrix sp. NIES-4071 DNA, complete genome-p.c.VAL:60.92%-taxID:2005469
+GCAGAGTAAGCTATTAATACCCTCCGATTGCTTAACCAGACCGCCCATTTAATTTTAGGGCGGTTTTTTT
+>CP020664.1:408158-408226 Microcystis sp. MC19 chromosome, complete genome-p.c.VAL:63.53%-taxID:1967666
+AAGACATAAAGTCAATATCACCCTCCGATTGCAATGAGAAAATGTTTGAATCGCTTAATATTTGGGCTT
+>AP018280.1:3400319-3400385 Calothrix sp. NIES-4101 DNA, complete genome-p.c.VAL:59.3%-taxID:2005461
+GCAGAGTAAGCTGTAAATACCCTCCGATTGCTTAACCAGACCGCCCTAAACTAGTGGCGGTTTTTCT
+>CP003265.1:c1287796-1287727 Synechocystis sp. PCC 6803, complete genome-p.c.VAL:100.0%-taxID:1148
+AAGACATAAAGTCAATATCACCCTCCGATTGCTAGAGGTCGCCCATTGCTTCAGTGGCGGCTTTCTTTTT
+>CP000806.1:666566-666637 Cyanothece sp. ATCC 51142 circular chromosome, complete sequence-p.c.VAL:77.5%-taxID:43989
+AAGACATAAAGTCAATTATCACCCTCCGATTGCTTATTGCAACCGCCCACACTTCAGTGGCGGTTTTTTATT
+>CP011382.1:c4400583-4400515 Calothrix sp. 336/3, complete genome-p.c.VAL:65.48%-taxID:1337936
+CCAGAGTAATCTGTAAATACCCTCCGATTGCTTAACCAGACCGCCCTACTTCTCAGTGGCGGTTTTTTT
+>AP018194.1:c3394929-3394863 Scytonema sp. HK-05 DNA, nearly complete genome-p.c.VAL:63.1%-taxID:1137095
+GCACAGTAAGCTATAAATACCCTCCGATTGCTTAACCAGACCGCCCTAATTAAGTGGCGGTTTTTTT
+>AP009552.1:4321642-4321710 Microcystis aeruginosa NIES-843 DNA, complete genome-p.c.VAL:61.63%-taxID:449447
+AAGACATAAAGTCAATATCACCCTCCGATTGCAATGAAAAAATGTTTGGATCGCTTAAGGTTTAAGCCT
+>CP026681.1:1035105-1035175 Nostoc sp. 'Peltigera membranacea cyanobiont' N6 chromosome, complete genome-p.c.VAL:63.95%-taxID:1261031
+GCAGAGTAATCTGTAATTACCCTCCGATTGCTTAACCAGACCGCCCTATTATACTTAGTGGCGGTTTTTTT
+>CP028094.1:c1288143-1288074 Synechocystis sp. IPPAS B-1465 chromosome, complete genome-p.c.VAL:100.0%-taxID:2116702
+AAGACATAAAGTCAATATCACCCTCCGATTGCTAGAGGTCGCCCATTGCTTCAGTGGCGGCTTTCTTTTT
+>CP040360.1:2869162-2869235 Synechococcus sp. PCC 11901 chromosome, complete genome-p.c.VAL:56.52%-taxID:2579791
+CCCGCGCTAGGTTAGCAATACCCTCCGATTGCTTATCAAGCTAGACCGTCCTCACCCAGTGGCGGTTTTTTATT
+>CP012832.1:c1288399-1288330 Synechocystis sp. PCC 6803 substrain GT-G, complete genome-p.c.VAL:100.0%-taxID:1148
+AAGACATAAAGTCAATATCACCCTCCGATTGCTAGAGGTCGCCCATTGCTTCAGTGGCGGCTTTCTTTTT
+>CP000117.1:4424793-4424859 Anabaena variabilis ATCC 29413, complete genome-p.c.VAL:65.06%-taxID:240292
+CAGAATAGGCTAGATATTACCCTCCGATTGCTTAACCAGACCGCCCTAATCTAGTGGCGGTTTTTTT
+>AP012549.1:5724-5792 Cyanobacterium endosymbiont of Epithemia turgida isolate EtSB Lake Yunoko DNA, complete genome-p.c.VAL:63.53%-taxID:1228987
+AATACATAAAGTCAATTATTAGCCTTCGATTGCTTAGGATGACTACTCACTCTTTAGTGGTATTTTTTC
+>AF381044.1:400-473 Synechococcus sp. PCC 7002 type II NADH dehydrogenase B (ndbB) gene, complete cds-p.c.VAL:56.52%-taxID:32049
+CCCGCGCTAGGTTAGCAATACCCTCCGATTGCTTATCAAGCTAGACCGTCCTCACCCAGTGGCGGTTTTTTATT
+>CP003620.1:3331800-3331870 Crinalium epipsammum PCC 9333, complete genome-p.c.VAL:67.86%-taxID:1173022
+AGCAACGTAAGGTATTGATACCCTCCGATTGCTTAAGACGACCGCCCTCTTTCTAGTGGCGGTTTTTTATT
+>CP003642.1:c4145251-4145185 Cylindrospermum stagnale PCC 7417, complete genome-p.c.VAL:59.3%-taxID:56107
+GCAAAGTAAACTGTAAGTACCCTCCGATTGCTTAACCAAACCGCCCTCATCTTGTGGCGGTTTTTTC
+>CP002059.1:2779593-2779658 'Nostoc azollae' 0708, complete genome-p.c.VAL:61.9%-taxID:551115
+AATTAAGTAAGGTGTAATTACCCTCCGATTGCTTAAGCATACCGCCCCCACTAGAGGCGGTTTTTT
+>AP018290.1:9037675-9037744 Calothrix sp. NIES-4105 DNA, nearly complete genome-p.c.VAL:60.92%-taxID:2005463
+GCAGAGTAAGCTATTAATACCCTCCGATTGCTTAACCAGACCGCCCATTTAATTTTAGGGCGGTTTTTTT
+>CP016477.1:2215408-2215481 Synechococcus sp. PCC 7117, complete genome-p.c.VAL:56.52%-taxID:195498
+CCCGCGCTAGGTTAGCAATACCCTCCGATTGCTTATCAAGCTAGACCGTCCTCACCCAGTGGCGGTTTTTTATT
+>CP003549.1:c1417649-1417583 Rivularia sp. PCC 7116, complete genome-p.c.VAL:65.06%-taxID:373994
+GCAGAGTAACCTATAAATACCCTCCGATTGCTTAACCAGACCGCCCTATTTTAGTGGCGGTTTTTTT
+>CP003610.1:c5163331-5163265 Calothrix sp. PCC 6303, complete genome-p.c.VAL:65.06%-taxID:1170562
+GTAGACTAAGCTAATCATACCCTCCGATTGCTTAACCAGACCGCCCTTATCTAGAGGCGGTTTTTTT
+>AP018227.1:c6677631-6677565 Calothrix parasitica NIES-267 DNA, nearly complete genome-p.c.VAL:63.1%-taxID:1973488
+AGCAGAGTAATGTGTAAATACCCTCCGATTGCTTAACCAAACCGCCCTATTTTAGTGGCGGTTTTTT
+>AP017305.1:c2087972-2087903 Fischerella sp. NIES-3754 DNA, complete genome-p.c.VAL:64.71%-taxID:1752063
+GCACAGTAAGCTGAAAATACCCTCCGATTGCTTAACCAGACCGCCCTACTCTACTAGTGGCGGTTTTTTT
+>AP018307.1:113675-113741 Aulosira laxa NIES-50 DNA, nearly complete genome-p.c.VAL:55.68%-taxID:1541988
+GCAATTTAAGCTATAAATACCCTCCGATTGCTTAACCAAACCGCCCTAGATTAGCGGCGGTTTCCTC
+>CP013998.1:2202505-2202578 Synechococcus sp. PCC 73109, complete genome-p.c.VAL:56.52%-taxID:374982
+CCCGCGCTAGGTTAGCAATACCCTCCGATTGCTTATCAAGCTAGACCGTCCTCACCCAGTGGCGGTTTTTTATT
+>AP018184.1:1339916-1339982 Nostoc sp. NIES-2111 DNA, nearly complete genome-p.c.VAL:61.18%-taxID:1973475
+CGAAGTAGGCTATAGATTACCCTCCGATTGCTTAACCAGACCGCCCTAACCTAGTGGCGGTTTTTTT