# HG changeset patch # User artbio # Date 1668299003 0 # Node ID 3c8c9911cf2afbf66120728f19a117cfe0f4eedb planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/embl2fa commit 6e5860cedc0ed0bc807ff64f752e62355c1b19d4 diff -r 000000000000 -r 3c8c9911cf2a embl2fa.xml --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/embl2fa.xml Sun Nov 13 00:23:23 2022 +0000 @@ -0,0 +1,35 @@ + + + + + + "$output" && + sed -i -E "s/^ID />/" "$output" && + sed -i -E "s/(>[^ ]+) .+/\1/g" "$output" && + sed -i -E "s/([GATCNgatcn]+) /\1/g" "$output" && + sed -i -E "s/^ +//g" "$output" && + sed -i -E "s/ +[0-9]+//g" "$output" + ]]> + + + + + + + + + + + + + + +.. class:: infomark + +**What it does** + +Converts file in EMBL flat format to fasta file + + + diff -r 000000000000 -r 3c8c9911cf2a test-data/transposon_sequence_set_v9.5.embl.txt --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/transposon_sequence_set_v9.5.embl.txt Sun Nov 13 00:23:23 2022 +0000 @@ -0,0 +1,6207 @@ + +ID DME9736 standard; DNA; INV; 7411 BP. +XX +AC AJ009736; +XX +DR FLYBASE; FBte0000104; Dmel\Idefix. +XX +FT source AJ009736:1..7411 +FT SO_feature five_prime_LTR ; SO:0000425:1..600 +FT SO_feature three_prime_LTR ; SO:0000426:6841..7411 +FT SO_feature CDS ; SO:0000316:<988..2031 +FT /name="Dmel\Idefix\gag" +FT /db_xref="FLYBASE:FBgn0027381" +FT /db_xref="SPTREMBL:O96739" +FT /db_xref="NCBI_PROTEIN:CAA08806.1" +FT /translation="ARKLKDIMAVPQLSETHLNQLLNQIKELNYYDGAPGKLSGFVNQV +FT EQLLSLYPTQEARQAHVIYGAVKRLLVDSALEVVTQERANTWLDMKKALAMAFKDHRPY +FT VTLIRQLEDISYPGSICKFIEKLETQYWIMFDKLELESDHVDKSNYTEMLNKTVKSVID +FT RKLPDRIYMSLARKDIDTIYKLKQASMELGLYDAIPENHRSNRTEMNKRRNRGNYNQNN +FT NQKYYNNRNHNYSNYYPSMNQNHNTQPPQNPTQPMTNQNQYSPRFIPNNQRGNYYAFRR +FT DLTQAQQNNPLNNTLNFQPSTSNNINRQGPVKRQRESQSDQSRMDVNFHQAASDTQMIE +FT KDIQVPM" +FT SO_feature CDS ; SO:0000316:<1950..5402 +FT /name="Dmel\Idefix\pol" +FT /db_xref="FLYBASE:FBgn0027380" +FT /db_xref="SPTREMBL:O96740" +FT /db_xref="NCBI_PROTEIN:CAA08807.1" +FT /translation="PKQDGCKFSSSCLGHSNDREGHTSPYVKIIHHNKNYKGMIDTGSS +FT INIIRENFENLEEKEENLIVYTIKGPITLKRSIIIKPTSVCPSAQKFYIHKFSDNYDFL +FT LGRKYLEDTKAKIDYANETVTLGSKVFKFLYEEKKGETASKCLDPQEKNDSALVDRTKP +FT KMQKVKTAPKCLKPKHQQQKKETALPKCLISNVVKDTVDNDVTHLDPMSVDNDIVNFAI +FT NNELRECNEYRLEHLNAEEVECLKKFLYEYRDIQYKEGENLTFTSTIKHVIQTQHEDPV +FT YRKPYKYPQSVDQEVNKQIKEMIEQGIVRKSKSPYCSPIWVVPKKADASGKQKFRLVVD +FT YRNLNEITVNDKFPIPRMDEILDKLGRCQYFTTIDLAKGFHQIQMDENSIAKTAFSTKH +FT GHYEYTRMPFGLKNAPATFQRCMNNLLEDLIYKDCLVYLDDIIVYSTPLEEHILSLKKV +FT FEKLRDANLKLQLDKCEFMKKETEFLGHIVTTNGIKPNPNKTKAITNFPLPKTPKQIKS +FT FLGLCGFYRKFIPNFAKIVKPMTLKLKKGAIIDTKCKEYIESFEKLKVLITSDPILIYP +FT DFSKPFSLTTDASNVAIGAVLSQNHKPVCYASRTLNEHEINYATIEKELLAIVWATKYF +FT RSYLFGRPFEVLSDHKPLVWLNNIKEPNMKLQRWKIKLNEFDYKIKYLPGKENHVADAL +FT SRTKIEVMVGEVANSADATIHSAIEDNLNYIPITERPINYFSRQIEIEKGDNDTTSVQH +FT LFQKLKIKIVYKEMTPELAKNLIKEYVCTKKSAIYFPNDEDFLIFQRAFTEIISPNNFT +FT KLLRCTTKLIDILTYAEFKDLILKKHKELLHPGIEKTINLFKEEYYYPDSQKLIQTIIN +FT ECQICYLAKTEHQTQMTYETTPEIFNTREKYMIDFYLTGNQIFLSCIDIYSKFASLVEL +FT KSRDWLEAKRAITKIFNDMGKPQEIKADKDSAFMCLALQNWLRSEGVQISISTSKNGIS +FT DIERFHKTVNEKLRIIGSQQNVEDRCTKFERILYIYNHKTKHNSTKRFPADIFLYAGSP +FT DFNVQQNKIDRIEYLNKNRHDFEVDIKYRQAPLVKSKITNPFKKTGRIGQVDDKHFEET +FT NRGRKIVHYKSKFKKQKKFNKSKYDNSRPTKEAQSTQHTSNNA" +FT SO_feature CDS ; SO:0000316:5248..6780 +FT /name="Dmel\Idefix\env" +FT /db_xref="FLYBASE:FBgn0027382" +FT /db_xref="SPTREMBL:O96741" +FT /db_xref="NCBI_PROTEIN:CAA08808.1" +FT /translation="MINISKKQIVAGRSFTISQNLRNRKSLIRANMIIPDQPKKHKVHN +FT ILLIMLSCILSLIITVKCNNIEVNPVNAKNGYLIFQTGTMEIPTSYEYHYLSINITKTM +FT LMFEDIVSEANNYPNVPQIQYLVDKLKREINGLRIISRSKRGLLNVVGKAYKYLFGTLD +FT EDDREELEEKINNMSEDSVKTHDLNTILDVINSGIDIINKLKVDKEQHQQIAVLIFNLE +FT QFTEYIEDIELGLQLTRLGIFNPRLLKHDYLKHVNSEKMLKIKTSTWLKTDTNEILIIS +FT HIPSEVTKVPIFQIVPYPDEHNYILTEQIFDKFYIFDNQVFHKDTNRDIFDKCIIGIIK +FT QEQTQCKYIKTHKNYQINYIEPNILLTWNIPETAVNQDCTHNKILISGNNIIKIKNCTI +FT QIDEFLISNNLADFTQTIYITNNVTRLEPINHLQTREMIETHVKHYNFFQIICITTFVI +FT MIISLTLYVAYKFKNIPKKIIVNIVSKKNTRTLKIMSMKIFNKEIILPYTQI" +XX +CC Derived from AJ009736 (e1371475) (Rel. 58, Last updated, Version 1). +CC Takis Benos and Michael Ashburner, 1-Feb-1999. +CC Any changes to original sequence record are annotated in an FT line. +XX +SQ Sequence 7411 BP; 3047 A; 1363 C; 1109 G; 1892 T; 0 other; + GTGACATATC CATAAGTCCC TAAGACTTAA GCATATGCCT ACATACTAAT ACACTTACAA 60 + CACATACACC CCAATACAAC ATACACTACT CCGGATGTAC CCAACAGATA CCAGATAAGA 120 + ATAAGATTGT TATATGATCC TCGAGAATGG AAAAAACCCC AATTCTAGAT AAGTCACCCA 180 + CTGGTAGACT AAACATCCGT CCCCTAATTT AAACAATTCC TTGCTTAAGC CTCACCCCAT 240 + CGTCACATTC CCACGTTCAA AGCTCGGAGC CGCAATCCCG AAAAACAAAA GTATCGATTT 300 + CAATAAACAA ATTATAAGAA TCTAAGAGCA CTTGTATCCA AGAGCAAATG CACTTGAATC 360 + CAAGAGAAAC GCAAAGCTTT TTCTCTTTAC GATCAGAATC CTAAAGTCTA AAGTCCATAT 420 + TAGAAAAGCT CGATACCGAG GCTTGAACGT CAACCAAATC AGAATAATTA TCAGAGTTCA 480 + GTTTGAGACC TAATTGTAAA AGGTTCGGTG TTCTTCTCAA ATAAAAAGAT TGTAATCATT 540 + TAGTGAAATA AAAATTATAT TTTTTTCACT TATAAATATT GCAAGTATTT AATTGGCGCA 600 + GTCGGTTAGG ATCCAATAAA ATAAAAGAGT CCTTTTAGTA CGGTACTGAT CAACTGAAGG 660 + ATATGCTATA CGACTAGCTA TCCAAGATCA GCGAATTAAA ATAGTGATTC AAAAATATTT 720 + TTTAATCCGC AAAAGAATCT ACGTGAAAGT AGTATTCAAA ATAAAATCCC GTGCGGTCGG 780 + AAACAAAAAT TAATTTAAAT TTTTTAATTC CGAAACTTAA AACCAAGTTT AAAGAAAACT 840 + TAAAATCAAG AAAACTTAAA ACCAAGTTTA AAGAAAACTT AAAATCAAGA AAACTTAAAA 900 + CCAAGTTTAA AGAAAACTTA AAATCAAGAA AACTTAAAAC CAAGTTTAAA GAAAACTCAA 960 + AATCAAGAAA ACTTAAAGCC AAAATAAGCT AGAAAACTAA AAGACATCAT GGCAGTCCCA 1020 + CAACTCTCAG AAACACACCT AAACCAACTG CTAAACCAAA TCAAAGAATT AAACTACTAC 1080 + GATGGCGCAC CTGGCAAATT ATCTGGATTC GTCAACCAAG TGGAACAACT GCTCAGTTTA 1140 + TACCCAACAC AGGAAGCAAG ACAGGCACAC GTCATATATG GAGCAGTGAA GCGGTTATTA 1200 + GTGGATTCAG CCTTAGAAGT CGTAACCCAG GAAAGAGCTA ACACATGGCT GGACATGAAG 1260 + AAAGCACTGG CAATGGCATT CAAAGACCAT AGACCTTATG TAACTCTCAT CAGACAATTA 1320 + GAAGACATAT CATACCCAGG AAGTATCTGT AAGTTTATAG AAAAATTAGA AACACAATAC 1380 + TGGATTATGT TCGATAAGTT AGAATTAGAA AGTGACCATG TTGATAAATC GAATTATACC 1440 + GAAATGTTAA ACAAAACTGT TAAATCAGTA ATAGATCGAA AACTGCCGGA TAGAATTTAT 1500 + ATGTCTTTGG CACGTAAAGA TATTGATACA ATTTATAAAT TAAAACAAGC ATCAATGGAA 1560 + TTAGGCCTTT ATGATGCTAT TCCAGAAAAT CACCGTTCTA ATAGAACAGA AATGAATAAA 1620 + CGTAGGAACA GGGGAAACTA TAATCAAAAT AATAATCAAA AATATTACAA TAATAGAAAT 1680 + CACAACTACA GTAATTATTA TCCTAGCATG AATCAGAATC ATAATACACA ACCACCTCAG 1740 + AATCCGACTC AACCTATGAC AAATCAAAAC CAATATTCAC CGCGTTTCAT ACCGAATAAT 1800 + CAAAGAGGGA ATTATTATGC ATTTAGACGA GACTTAACAC AAGCTCAGCA GAACAACCCA 1860 + CTTAATAACA CCCTTAACTT CCAACCTTCG ACATCGAATA ATATTAACAG ACAAGGGCCA 1920 + GTAAAAAGAC AACGCGAGAG TCAGAGTGAC CAAAGCAGGA TGGATGTAAA TTTTCATCAA 1980 + GCTGCCTCGG ACACTCAAAT GATAGAGAAG GACATACAAG TCCCTATGTA AAAATAATTC 2040 + ATCATAATAA AAATTATAAG GGAATGATCG ATACAGGATC ATCAATTAAC ATCATAAGAG 2100 + AAAATTTTGA GAACTTAGAA GAAAAGGAAG AAAACCTAAT AGTATACACT ATTAAAGGAC 2160 + CAATAACACT AAAGAGAAGT ATAATAATAA AACCTACTTC AGTATGTCCG TCTGCTCAAA 2220 + AATTCTACAT TCACAAATTT TCTGATAACT ATGATTTCTT GTTAGGTCGA AAGTATTTAG 2280 + AAGATACAAA AGCTAAAATA GATTATGCTA ACGAAACAGT AACACTAGGC TCAAAAGTAT 2340 + TTAAGTTTCT CTATGAAGAA AAGAAGGGCG AGACCGCATC CAAATGCCTT GACCCACAAG 2400 + AAAAGAATGA TTCCGCTCTA GTGGACAGAA CCAAACCAAA AATGCAAAAG GTTAAGACCG 2460 + CACCTAAGTG CCTTAAACCA AAGCATCAAC AGCAGAAGAA AGAGACCGCA TTACCCAAAT 2520 + GCCTCATTTC AAATGTTGTT AAAGACACAG TGGACAATGA TGTAACACAT CTCGATCCCA 2580 + TGTCCGTTGA CAACGATATA GTCAACTTCG CGATTAACAA TGAGTTACGC GAATGTAACG 2640 + AGTATAGACT CGAACACTTA AATGCAGAGG AAGTTGAATG TTTAAAGAAG TTCCTATACG 2700 + AATATAGAGA CATTCAGTAC AAAGAGGGCG AAAATTTGAC CTTCACCAGT ACTATTAAAC 2760 + ATGTCATCCA GACTCAACAC GAAGACCCAG TATACCGTAA ACCCTACAAG TACCCTCAAA 2820 + GCGTTGACCA AGAAGTTAAC AAACAAATTA AAGAAATGAT AGAACAAGGG ATTGTTCGCA 2880 + AATCGAAGTC CCCTTATTGT TCTCCTATTT GGGTGGTCCC CAAGAAGGCA GACGCCTCTG 2940 + GGAAACAAAA ATTCAGGTTG GTAGTCGATT ACAGGAACCT AAATGAGATA ACTGTTAACG 3000 + ACAAATTTCC CATTCCCCGA ATGGATGAGA TATTGGACAA ACTAGGTAGA TGCCAATACT 3060 + TTACCACTAT AGATCTAGCC AAGGGTTTTC ACCAAATCCA AATGGATGAA AATTCTATTG 3120 + CAAAAACAGC TTTTTCAACT AAGCATGGGC ATTATGAATA TACTCGTATG CCCTTTGGTT 3180 + TAAAAAACGC TCCAGCTACT TTTCAGAGAT GCATGAATAA TCTTCTGGAA GATTTAATCT 3240 + ACAAAGACTG TTTAGTCTAT TTAGACGATA TTATTGTTTA TTCCACTCCA TTGGAAGAAC 3300 + ACATTTTATC CCTAAAGAAA GTCTTTGAAA AACTGAGAGA CGCTAATTTA AAGTTGCAAC 3360 + TAGATAAATG TGAATTCATG AAGAAAGAAA CTGAATTCCT AGGACACATC GTCACAACAA 3420 + ATGGCATCAA ACCAAATCCA AATAAAACTA AAGCAATTAC AAATTTTCCA TTACCCAAGA 3480 + CACCTAAGCA AATAAAATCA TTTTTGGGAT TATGTGGATT CTATCGCAAG TTTATTCCTA 3540 + ACTTTGCCAA AATAGTTAAA CCCATGACCC TCAAATTAAA GAAAGGTGCT ATAATAGACA 3600 + CCAAATGTAA AGAATACATC GAATCATTTG AAAAATTAAA AGTTTTGATA ACTTCAGACC 3660 + CGATATTAAT CTATCCTGAT TTTTCAAAAC CTTTTTCTTT GACAACTGAT GCTAGCAACG 3720 + TAGCTATTGG TGCAGTGTTA TCACAAAATC ACAAGCCAGT TTGTTATGCC AGTAGAACGC 3780 + TAAACGAACA TGAAATCAAC TATGCTACGA TTGAAAAAGA ATTGTTAGCT ATAGTTTGGG 3840 + CTACAAAATA TTTCAGGTCA TACTTATTCG GCAGACCATT TGAAGTATTA AGTGATCACA 3900 + AGCCACTGGT ATGGCTCAAC AACATTAAAG AACCAAACAT GAAATTGCAA AGATGGAAAA 3960 + TAAAACTTAA TGAATTCGAT TATAAAATCA AATATCTTCC AGGCAAAGAA AACCATGTCG 4020 + CGGATGCTCT TTCCCGCACG AAAATAGAAG TTATGGTTGG CGAGGTCGCA AATAGCGCAG 4080 + ACGCAACTAT ACACAGTGCC ATTGAAGATA ATCTAAATTA CATACCCATA ACAGAAAGAC 4140 + CAATAAATTA CTTCTCTAGA CAAATAGAGA TAGAAAAAGG CGATAACGAT ACAACAAGTG 4200 + TACAACATTT GTTTCAAAAA TTAAAGATTA AGATAGTCTA TAAAGAAATG ACACCTGAAC 4260 + TCGCCAAAAA CCTCATTAAG GAATATGTGT GCACCAAAAA GAGTGCAATT TATTTCCCTA 4320 + ATGACGAAGA TTTTCTGATC TTCCAGAGAG CGTTTACCGA AATTATAAGC CCTAACAATT 4380 + TCACAAAACT CTTGAGATGT ACCACAAAGT TAATTGATAT ACTAACGTAT GCAGAATTCA 4440 + AAGATTTAAT CTTAAAGAAA CATAAGGAAC TTTTACATCC GGGTATAGAA AAAACAATCA 4500 + ATTTATTTAA AGAAGAATAT TACTATCCTG ATAGTCAAAA GCTTATTCAA ACCATTATCA 4560 + ATGAATGTCA AATTTGTTAT CTAGCAAAAA CGGAACATCA AACACAAATG ACATATGAGA 4620 + CTACACCAGA AATATTTAAC ACAAGAGAAA AATACATGAT AGATTTTTAT CTCACAGGAA 4680 + ACCAGATCTT CTTATCTTGC ATTGATATCT ATTCGAAATT TGCATCACTA GTTGAATTAA 4740 + AAAGTAGAGA TTGGCTAGAA GCAAAAAGAG CCATTACTAA AATATTCAAT GACATGGGAA 4800 + AACCGCAAGA AATTAAAGCA GACAAAGACT CAGCTTTTAT GTGTTTAGCC TTACAAAATT 4860 + GGTTAAGATC TGAAGGTGTA CAAATTTCTA TAAGCACTAG CAAAAATGGT ATATCTGATA 4920 + TAGAAAGATT CCACAAGACC GTAAACGAAA AGCTAAGAAT CATTGGTAGC CAACAAAATG 4980 + TTGAAGATAG GTGCACAAAA TTCGAAAGAA TTCTATACAT ATACAATCAC AAAACTAAAC 5040 + ATAATAGTAC TAAAAGATTT CCAGCAGACA TTTTCCTATA TGCAGGCAGT CCAGATTTTA 5100 + ATGTACAACA AAACAAAATC GATAGGATAG AATACCTCAA TAAGAATAGA CACGATTTTG 5160 + AAGTTGATAT AAAATATAGA CAAGCCCCAC TTGTAAAAAG TAAAATAACC AATCCATTTA 5220 + AAAAGACAGG AAGAATTGGA CAAGTAGATG ATAAACATTT CGAAGAACAA AATCGTGGCA 5280 + GGAAGATCGT TCACTATAAG TCAAAATTTA AGAAACAGAA AAAGTTTAAT AAGAGCAAAT 5340 + ATGATAATTC CAGACCAACC AAAGAAGCAC AAAGTACACA ACATACTTCT AATAATGCTT 5400 + AGTTGCATAC TATCACTTAT CATCACGGTC AAGTGCAACA ATATAGAAGT AAATCCAGTA 5460 + AACGCGAAAA ATGGATACCT TATATTCCAA ACAGGAACAA TGGAAATTCC AACCAGCTAT 5520 + GAATACCATT ATTTAAGCAT AAACATAACA AAGACAATGC TCATGTTCGA AGATATAGTA 5580 + AGTGAAGCAA ACAACTATCC TAATGTACCA CAAATACAAT ATTTAGTCGA CAAATTAAAA 5640 + CGAGAAATAA ATGGGTTAAG AATTATTAGT CGAAGTAAAA GAGGTCTTTT AAACGTAGTA 5700 + GGAAAAGCAT ACAAATACTT ATTCGGCACA TTAGATGAGG ATGACAGAGA AGAGTTAGAA 5760 + GAAAAAATAA ACAACATGTC AGAAGACTCT GTAAAAACCC ATGACCTAAA CACGATTCTA 5820 + GATGTAATCA ATAGTGGTAT AGATATAATT AATAAGCTCA AAGTAGATAA AGAACAACAC 5880 + CAACAAATTG CGGTACTAAT ATTTAACCTA GAGCAATTTA CAGAATATAT AGAAGACATA 5940 + GAATTGGGTC TGCAATTAAC CAGACTAGGA ATTTTCAATC CAAGATTACT AAAGCATGAC 6000 + TATTTAAAAC ATGTAAATTC AGAAAAAATG CTAAAGATAA AAACGTCAAC CTGGCTTAAA 6060 + ACAGACACGA ACGAAATTTT GATTATTTCC CATATTCCTA GCGAAGTTAC TAAAGTTCCA 6120 + ATATTCCAAA TTGTTCCGTA CCCAGATGAA CATAATTATA TTCTAACCGA GCAAATATTC 6180 + GATAAATTCT ACATATTTGA TAACCAAGTA TTCCATAAAG ATACCAATAG GGATATATTC 6240 + GACAAATGTA TTATTGGAAT CATCAAACAA GAGCAAACTC AATGCAAATA TATTAAAACA 6300 + CATAAAAATT ACCAAATAAA TTATATAGAA CCAAATATAC TATTAACATG GAATATTCCT 6360 + GAAACAGCTG TTAACCAAGA CTGTACACAC AATAAAATAT TAATTTCAGG AAACAACATC 6420 + ATTAAAATTA AAAATTGTAC CATACAAATA GATGAATTCT TAATCTCTAA TAATCTAGCA 6480 + GACTTTACAC AAACAATTTA TATCACCAAC AATGTAACAC GTCTAGAACC AATAAATCAC 6540 + TTACAAACGA GAGAAATGAT AGAAACCCAT GTAAAACACT ATAACTTTTT TCAAATTATA 6600 + TGCATTACAA CGTTCGTCAT AATGATAATT AGTTTGACTC TGTATGTAGC ATATAAGTTT 6660 + AAAAATATAC CTAAGAAAAT TATTGTCAAT ATCGTAAGCA AAAAGAACAC ACGCACCTTG 6720 + AAAATAATGT CAATGAAAAT ATTCAACAAG GAAATAATAT TACCTTATAC CCAAATTTAA 6780 + CGACCTGAGG ACAGGCCAAA TTCAAAGGTT GGGGGAGTGA CATATCCATA AGTCCCTAAG 6840 + ACTTAAGCAT ATGCCTACAT ACTAATACAC TTACAACACA TACACCCCAA TACAACATAC 6900 + ACTACTCCGG ATGTACCCAA CAGATACCAG ATAAGAATAA GATTGTTATA TGATCCTCGA 6960 + GAATGGAAAA AACCCCAATT CTAGATAAGT CACCCACTGG TAGACTAAAC ATCCGTTCCC 7020 + CTAATTTAAA CAATTCCTTG CTTAAGCCTC ACCCCATCGT CACATTCCCA CGTTCAAAGC 7080 + TCGGAGCCGC AATCCCGAAA AACAAAAGTA TCGATTTCAA TAAACAAATT ATAAGAATCT 7140 + AAGAGCACTT GTATCCAAGA GCAAATGCAC TTGAATCCAA GAGAAACGCA AAGCTTTTTC 7200 + TCTTTACGAT CAGAATCCTA AAGTCTAAAG TCCATATTAG AAAAGCTCGA TACCGAGGCT 7260 + TGAACGTCAA CCAAATCAGA ATAATTATCA GAGTTCAGTT TGAGACCTAA TTGTAAAAGG 7320 + TTCGGTGTTC TTCTCAAATA AAAAGATTGT AATCATTTAG TGAAATAAAA ATTATATTTT 7380 + TTTCACTTAT AAATATTGCA AGTATTTAAT T 7411 +// +ID DMIS176 standard; DNA; INV; 7439 BP. +XX +AC X01472; J01060; J01061; +XX +DR FLYBASE; FBte0000109; Dmel\17.6. +XX +FT source X01472:1..7439 +FT SO_feature five_prime_LTR ; SO:0000425:1..512 +FT SO_feature three_prime_LTR ; SO:0000426:6928..7439 +FT SO_feature TATA_box ; SO:0000174:372..377 +FT SO_feature TATA_box ; SO:0000174:7271..7277 +FT SO_feature primer_binding_site ; SO:0005850:511..529 +FT SO_feature polyA_signal_sequence ; SO:0000551:372..377 +FT SO_feature polyA_signal_sequence ; SO:0000551:7299.7304 +FT SO_feature RR_tract ; SO:0000435:6917..6927 +FT SO_feature CDS ; SO:0000316:1074..2393 +FT /name="Dmel\17.6\gag" +FT /db_xref="FLYBASE:FBgn0044339" +FT /db_xref="SWISS-PROT:P04282" +FT /db_xref="NCBI_PROTEIN:CAA25701.1" +FT /translation="MAQEPAIVPPLSDSNMTQVAYQIGNVEKFNGDPGSLYTFVSRIDY +FT ILALYATGDERQQQIIFGHIERSISGEVMRCIGAYDMYTWQQLRRQLVLNYKPQTPNHV +FT LLEEFRKTPFRGNVRAFLEEAESRRQTLTSKLELEQDLEEKTFYLKLIKSSIESLIEKL +FT PTHIYLRINNHNIPDLRSLINLLQEKGMYEQINHTSTHVQKQNFSDKPQKSFNQNTNQS +FT NNIRKYPTPFLHYNSPIPYQAPQIYQTPPTNNPLYRHPIPYHPNPNNVFQPSQQNNVFQ +FT PSQQNNAFQPNQRTNFTSRPIFNTNRNNAFDQNRFGQQPQYQNQQSTQNSSSYVPNRPI +FT KRLRPANSGQTGMSVDETLYQEDAFYQQCVPYDYFYYPTYDHSDYYPENQYQIDENNQN +FT LQRTQQLQQINTDETNNDNQEPNVEQAENFQPQALENPNI" +FT SO_feature CDS ; SO:0000316:2345..5518 +FT /name="Dmel\17.6\pol" +FT /db_xref="FLYBASE:FBgn0014453" +FT /db_xref="SWISS-PROT:P04323" +FT /db_xref="NCBI_PROTEIN:CAA25702.1" +FT /translation="TGRKFSATSLGKPQYITIKYKENNLKCLIDTGSTVNMTSKNIFDL +FT PIQNTSTFIHTSNGPLIVNKSIIIPSKILFPTTNEFLLHPFSENYDLLLGRKLLAEAKA +FT TISYRDQEVTLYNNKYKLIEGIATHEQSHFQNVNMIPDTMLRQPNKISPILESDLYRLE +FT HLNNEEKQRLCALLQKYHDIQYHEGDKLTFTNQTKHTINTKHNLPLYSKYSYPQAYEQE +FT VESQIQDMLNQGIIRTSNSPYNSPIWVVPKKQDASGKQKFRIVIDYRKLNEITVGDRHP +FT IPNMDEILGKLGRCNYFTTIDLAKGFHQIEMDPESVSKTAFSTKHGHYEYLRMPFGLKN +FT APATFQRCMNDILRPLLNKHCLVYLDDIIVFSTSLDEHLQSLGLVFEKLAKANLKLQLD +FT KCEFLKQETTFLGHVLTPDGIKPNPEKIEAIQKYPIPTKPKEIKAFLGLTGYYRKFIPN +FT FADIAKPMTKCLKKNMKIDTTNPEYDSAFKKLKYLISEDPILKVPDFTKKFTLTTDASD +FT VALGAVLSQDGHPLSYISRTLNEHEINYSTIEKELLAIVWATKTFRHYLLGRHFEISSD +FT HQPLSWLYRMKDPNSKLTRWRVKLSEFDFDIKYIKGKENCVADALSRIKLEETYLSEQT +FT QHSAEEDNSDLIFITERPLNTFNRQVIFSKGPPDIKVTKYFKKHITQIFYDIMTREKAE +FT QYLIDHFCGKKSALYIESDADFEVIQAAHKLAINTKYTKILRSTILLKNITTYAEFKEL +FT ILTAHEKLLHPGIQKTTKLFGETYYFPNSQLLIQNIINECSICNLAKTEHRNTDMPTKT +FT TPKPEHCREKFMIDIYSSEGKHYVSCIDIYSKFATLEEIKTKDWIECKNALMRIFNQLG +FT KPKLLKADRDGAFSSLALKRWLESEEVELQLNTTKTGVADIERLHKTINEKIRIIKTSD +FT DEETKLSKMETVLNIYNHKTKHDTTGQTPAHIFLYAGQPILDTQQNKENKINKINNDRV +FT EYEVDTRYRKGPLQKGKLENPFKPTKNVEQTDSDHYKITNRNRITHYYKTQFKKRKKNN +FT QLSISQAPGT" +FT SO_feature CDS ; SO:0000316:5488..6903 +FT /name="17.6\env" +FT /db_xref="FLYBASE:FBgn0027624" +FT /db_xref="SWISS-PROT:P04283" +FT /db_xref="NCBI_PROTEIN:CAA25703.1" +FT /translation="SALNFTGTWHLITLLLMLITTVHGQQIEINNIDTNHGYLLFSDKP +FT VQIPSSFEHHCLRINLTEIDTIADYFEQRLRTDYHAPQVKFLYNKMRRELAGIALRHRN +FT KRGLINIVGSVFKYLFGTLDENDRVDIQRKLETNAHNSVNLHELNDAIQLINDGMQKIQ +FT NYENNSNIINSLLYELMQFTEYIEDVEMGMQLSRLGLFNPKLLNYDKLENVNSQNILNI +FT KTSTWINYNDNQLLIISHIPINFSLINTVKIIPYPDSNGYQLEYTDTQSYFERENKVYN +FT NENKEINNECVTNIIKHLKPICNFESIHTDEIIKYIEPNTIVTWNLTQTSLKQNCQNSF +FT NNIKIKGNKMIKVTQCKIEINSIILSENLFKPEIDLTPLYTPLNITKIKTVKHNDINEM +FT ISQNNITLYIFMTTVIIILILLYLYLRYVSFNPFMMLYAKLKLRKNQNQNTAQQIEMED +FT VPLPLLYPSIPAQV" +XX +CC Derived from X01472 (g8142) (Rel. 36, Last updated, Version 2). +CC Takis Benos and Michael Ashburner, 20-Aug-1997. +CC Any changes to original sequence record are annotated in an FT line. +XX +SQ Sequence 7439 BP; 2985 A; 1512 C; 1048 G; 1894 T; 0 other; + AGTGACATAT TCACATACAA AACCACATAA CATAGAGTAA ACATATTGAA AAGCCGCATA 60 + CGTAAACAAT AAGTGACCAC CATGCTAATG TGGATCAAAT AACAAAAATA TCCACTCTGC 120 + ATTTTGACAC CCCCATACTG TATGCCATCT GCGCAGTATG CATTCTAATA AACAAATTCT 180 + TTGACAGCGG CACTTAGCCA TTCTTGTAAA CAAATCTTAA AGTCTGCCTG CTCTCTCTGA 240 + GGCTTCTCCT CCACTTAAGA ATCCAAGAGC AATGCTCTCC CAAAAACACT AACATATTCT 300 + TTAAGCAAGC ACAGAGGCTT CTCCTCATTT TCACTTTCAT TTGATTTTCA GTCTTAAGCT 360 + GAACGTTAAT CAATAAACAA CACAATCGAT ACCGAAATTT TGATTCGTTT TATTTTGGCA 420 + AAACTCAATT TTCAGCGTTG GTCTTAGTTC ATATTCGGAA CGGTCCATTT AATAGACTCA 480 + AAACTATTTA TTGCAACCAT TTATTTGCAA TTGGCGCAGT CGATGTGATC AGTGTTAAAG 540 + TTCCTTGATG CGGTAACCAG ATTTGCCAAT TCCTGTGTTC TTTTTGTTCT CTGACAAAAG 600 + TACCACGATA ACGGGCACCC ACGTGACGGT TAATATCGCT TTAAGTTTTT AATTAAACCT 660 + CGACAATAAA GTGAAACCGA AAAATCACAA TTTGCCTAAA CAAACCTGAA TTTATTATCA 720 + GGAAGACGCT ATTGAATTTG TGAGAGGCTG TAAATCCAAT TGGTTACCTC AAAGACCCAC 780 + GAAAAAGCTA TAGTGCAACC CTTGCGAAAA TCAAAACCTA TCTTAAAAAA AAAAAAAAAA 840 + TATAAATAAT AAATTAATAA GCGAAAATTA AAACGTATTA AAAGTAAGAA TAATAAATAA 900 + ATAAGTGAAA ATTCTATATG ATAAAAATTA AAAATAAGAA TAATAAATAA AAAGACAACA 960 + TTTTAAATTA AACAATATTA AAAAAATATA AAAATATTAA AAACTATATT AAAAAAAAAA 1020 + AAAAAACAAA AAAACAAAAA AAAAAAAATA AATAAATAAT CCAAAAATCA AAAATGGCTC 1080 + AAGAACCAGC AATTGTGCCA CCACTATCAG ACAGCAACAT GACCCAGGTT GCCTACCAGA 1140 + TTGGCAATGT GGAGAAATTC AACGGTGATC CAGGCTCACT ATACACCTTT GTGAGTCGAA 1200 + TTGATTACAT ACTGGCTCTT TATGCTACCG GAGATGAACG CCAACAGCAG ATCATATTTG 1260 + GGCATATTGA ACGCAGCATC AGCGGAGAAG TTATGCGCTG CATTGGAGCC TATGACATGT 1320 + ACACCTGGCA GCAGCTTAGA AGACAATTGG TACTCAACTA TAAACCCCAG ACCCCTAACC 1380 + ACGTTCTTTT AGAAGAGTTT CGAAAGACCC CATTTCGAGG CAATGTACGA GCATTCCTGG 1440 + AAGAAGCAGA AAGCCGCAGA CAAACACTTA CTAGTAAGCT TGAATTAGAG CAAGATCTTG 1500 + AAGAAAAGAC TTTTTATTTG AAATTAATAA AATCCAGTAT AGAATCACTA ATTGAAAAAT 1560 + TACCTACACA CATTTATTTA AGAATAAATA ACCACAACAT ACCAGATTTG CGATCACTTA 1620 + TAAACCTTTT ACAAGAGAAG GGCATGTACG AACAAATAAA TCATACAAGT ACACATGTCC 1680 + AAAAACAAAA TTTCTCTGAT AAGCCACAAA AGTCCTTTAA TCAAAATACT AATCAGTCTA 1740 + ACAATATCAG AAAATATCCA ACACCTTTCC TACATTATAA TTCACCAATA CCATATCAAG 1800 + CTCCACAAAT TTATCAAACA CCACCAACTA ATAACCCACT TTATCGTCAT CCAATACCCT 1860 + ACCACCCTAA TCCAAACAAT GTTTTTCAAC CAAGCCAACA AAACAATGTT TTCCAACCAA 1920 + GCCAACAAAA CAATGCTTTT CAACCAAATC AACGAACAAA CTTTACATCT CGACCAATTT 1980 + TTAACACCAA TCGAAACAAT GCATTCGATC AGAATAGGTT CGGACAACAA CCCCAATATC 2040 + AAAATCAACA ATCAACACAA AATTCAAGTT CCTATGTACC CAATCGACCA ATAAAACGAT 2100 + TAAGACCAGC TAATAGTGGA CAGACTGGGA TGAGTGTTGA CGAAACATTA TATCAAGAGG 2160 + ACGCTTTTTA TCAGCAGTGT GTTCCATATG ACTATTTTTA TTATCCAACT TACGACCATT 2220 + CAGACTATTA TCCAGAAAAT CAATATCAAA TTGACGAAAA CAACCAAAAT TTACAAAGAA 2280 + CACAACAGTT ACAGCAGATT AATACAGACG AGACAAACAA TGACAACCAA GAACCCAATG 2340 + TTGAACAGGC CGAAAATTTT CAGCCACAAG CCTTGGAAAA CCCCAATATA TAACAATTAA 2400 + ATACAAAGAA AATAATTTGA AATGCCTTAT TGATACCGGA TCAACAGTTA ACATGACATC 2460 + TAAAAATATA TTTGATTTAC CAATCCAGAA TACTAGTACT TTTATTCATA CCAGCAATGG 2520 + ACCGCTCATT GTCAACAAAA GTATAATCAT ACCTTCAAAG ATTTTGTTCC CAACAACAAA 2580 + TGAATTTTTA TTGCACCCTT TCTCTGAGAA TTACGATCTT TTATTAGGAA GAAAACTTTT 2640 + AGCAGAAGCA AAAGCAACAA TAAGTTACCG CGATCAAGAG GTAACTCTTT ACAACAACAA 2700 + ATACAAATTA ATAGAAGGAA TAGCAACACA TGAACAGAGT CATTTTCAAA ATGTAAATAT 2760 + GATACCTGAC ACCATGCTCA GACAGCCAAA TAAAATTTCA CCCATTTTAG AATCAGACCT 2820 + ATACAGATTG GAACATTTAA ATAACGAAGA AAAACAAAGA TTGTGCGCAC TCCTGCAGAA 2880 + ATACCATGAC ATACAGTACC ATGAAGGTGA TAAGTTGACA TTTACTAATC AAACCAAACA 2940 + TACTATCAAT ACAAAGCACA ATCTACCACT TTACTCTAAA TACAGTTACC CACAGGCTTA 3000 + TGAACAGGAG GTCGAAAGCC AAATACAAGA TATGCTAAAT CAAGGTATTA TACGTACCAG 3060 + TAATTCACCT TACAATAGCC CCATCTGGGT GGTTCCAAAG AAACAAGATG CATCAGGCAA 3120 + ACAGAAATTT AGAATTGTAA TAGACTACCG AAAATTAAAT GAAATAACAG TAGGAGACAG 3180 + ACACCCAATC CCAAACATGG ACGAAATCTT GGGAAAATTG GGCAGATGTA ATTACTTCAC 3240 + AACTATAGAC TTGGCAAAGG GTTTCCACCA GATCGAAATG GATCCAGAAT CAGTTTCAAA 3300 + GACAGCCTTT TCTACCAAGC ACGGTCATTA TGAATATTTG CGCATGCCAT TCGGATTAAA 3360 + AAACGCGCCA GCCACCTTTC AACGGTGCAT GAATGATATT TTAAGACCAC TCTTAAACAA 3420 + ACACTGTCTT GTGTATTTGG ACGACATAAT TGTATTCTCG ACATCCCTTG ATGAACACCT 3480 + GCAATCGCTC GGACTAGTTT TCGAAAAATT AGCAAAAGCC AACCTTAAAT TACAACTTGA 3540 + CAAATGTGAG TTTCTCAAGC AAGAAACCAC ATTTTTAGGA CATGTTCTAA CACCAGATGG 3600 + AATAAAACCA AACCCTGAAA AAATTGAAGC CATTCAAAAA TATCCAATTC CCACTAAACC 3660 + AAAAGAAATA AAAGCTTTTC TTGGACTGAC AGGATATTAT CGTAAATTTA TTCCAAACTT 3720 + TGCAGACATA GCCAAACCCA TGACTAAGTG TTTAAAAAAG AACATGAAAA TTGACACTAC 3780 + CAACCCAGAA TATGACTCTG CATTTAAAAA ATTAAAATAT CTAATATCAG AAGACCCAAT 3840 + TCTTAAAGTA CCCGACTTTA CAAAGAAATT CACTTTAACC ACAGACGCAA GTGATGTCGC 3900 + TTTGGGGGCA GTACTGTCAC AAGATGGACA CCCACTTAGC TACATTAGCC GAACACTTAA 3960 + TGAACACGAA ATAAATTACA GCACAATTGA AAAAGAACTC TTAGCAATTG TATGGGCGAC 4020 + AAAGACTTTT CGACACTACC TACTTGGAAG ACACTTTGAA ATATCCAGTG ACCATCAACC 4080 + ATTGAGCTGG TTGTACCGTA TGAAAGACCC AAATTCAAAA CTGACCCGAT GGAGAGTAAA 4140 + ATTATCCGAA TTCGATTTTG ATATAAAATA TATAAAAGGA AAAGAAAATT GCGTGGCGGA 4200 + TGCTCTGTCC AGAATAAAAC TTGAGGAGAC ATATTTGAGC GAACAAACCC AACATAGTGC 4260 + AGAAGAGGAC AATAGTGATT TAATTTTTAT TACAGAAAGA CCTCTAAATA CATTTAACAG 4320 + ACAAGTTATA TTTTCAAAAG GACCACCAGA CATTAAAGTT ACGAAATATT TCAAAAAACA 4380 + CATCACCCAA ATATTTTACG ACATTATGAC CAGGGAAAAA GCCGAACAAT ATTTGATAGA 4440 + CCATTTTTGT GGTAAGAAAA GTGCGTTGTA TATTGAGAGT GACGCTGATT TCGAAGTCAT 4500 + TCAAGCCGCA CATAAATTAG CCATAAACAC CAAATATACA AAAATCCTGC GTAGCACGAT 4560 + TTTGTTAAAA AACATAACCA CTTATGCGGA ATTTAAGGAA TTGATCTTGA CTGCTCATGA 4620 + AAAACTTCTA CACCCAGGCA TACAGAAAAC TACTAAACTT TTCGGAGAAA CTTACTATTT 4680 + CCCTAATAGC CAGCTACTTA TTCAGAATAT AATAAATGAG TGCAGTATTT GCAATCTGGC 4740 + AAAAACAGAG CACCGAAATA CAGACATGCC AACGAAAACC ACACCCAAAC CAGAACATTG 4800 + CCGCGAAAAA TTCATGATAG ACATTTACTC ATCCGAAGGC AAACATTACG TTAGTTGCAT 4860 + AGACATTTAT TCGAAATTTG CCACATTAGA AGAAATAAAA ACAAAAGACT GGATAGAATG 4920 + CAAAAACGCG CTTATGCGCA TATTCAACCA GCTTGGCAAG CCAAAGTTAC TAAAGGCGGA 4980 + CAGAGACGGC GCATTTTCCA GTTTAGCCCT CAAGAGATGG CTGGAGAGTG AGGAAGTCGA 5040 + ATTGCAGCTT AACACAACAA AAACTGGTGT GGCGGACATA GAAAGACTAC ATAAAACAAT 5100 + TAATGAAAAG ATTCGCATAA TCAAAACATC CGATGACGAA GAAACCAAAT TGAGCAAAAT 5160 + GGAAACAGTA CTTAACATAT ACAATCATAA AACCAAACAC GACACCACTG GACAGACCCC 5220 + TGCACACATA TTTCTCTACG CTGGACAACC AATATTAGAT ACCCAACAAA ACAAAGAAAA 5280 + CAAAATAAAC AAAATAAATA ATGACAGAGT GGAGTACGAA GTCGACACAA GATACAGAAA 5340 + AGGTCCACTA CAGAAAGGCA AATTAGAAAA TCCTTTTAAG CCAACAAAAA ATGTGGAGCA 5400 + GACTGACTCT GATCATTATA AAATTACTAA TAGAAATAGA ATTACTCACT ACTACAAAAC 5460 + ACAATTCAAA AAACGAAAGA AAAATAATCA GCTCTCAATT TCACAGGCAC CTGGCACTTG 5520 + ATAACATTGC TGCTGATGCT GATCACAACA GTTCATGGAC AACAAATTGA AATTAATAAT 5580 + ATTGACACAA ACCACGGATA TCTCCTTTTT TCTGATAAAC CAGTCCAGAT ACCATCATCC 5640 + TTTGAACATC ATTGCTTGAG AATCAATTTA ACTGAAATAG ACACCATAGC TGATTATTTT 5700 + GAGCAAAGAC TACGTACCGA CTACCATGCA CCCCAGGTCA AATTTTTATA CAACAAAATG 5760 + AGAAGAGAAC TAGCTGGAAT AGCCTTGCGA CATAGAAATA AACGGGGACT TATTAACATT 5820 + GTAGGTTCAG TTTTTAAATA CCTATTTGGC ACACTTGACG AAAATGATCG AGTGGATATA 5880 + CAGAGGAAAC TTGAAACAAA CGCCCATAAC TCGGTAAATT TACATGAACT CAATGACGCT 5940 + ATTCAATTAA TAAATGACGG AATGCAAAAG ATACAGAATT ATGAAAACAA CAGCAACATC 6000 + ATTAACAGTC TTTTATATGA ACTCATGCAG TTTACAGAAT ACATAGAAGA TGTGGAAATG 6060 + GGAATGCAGC TTTCCAGACT CGGTCTATTT AATCCCAAAC TACTAAACTA CGATAAACTT 6120 + GAGAATGTAA ACAGCCAAAA TATTTTAAAC ATTAAAACAT CCACTTGGAT TAATTACAAT 6180 + GATAACCAAT TATTAATCAT ATCTCACATA CCTATTAACT TTTCATTAAT AAATACAGTA 6240 + AAAATAATCC CTTACCCAGA CTCGAACGGC TATCAGCTAG AATACACAGA CACACAATCA 6300 + TATTTTGAAA GAGAAAATAA AGTTTACAAT AACGAAAATA AAGAAATAAA CAATGAGTGT 6360 + GTCACCAACA TTATTAAACA TTTAAAACCA ATTTGTAATT TTGAGTCAAT CCACACAGAT 6420 + GAAATAATAA AATACATAGA ACCAAACACA ATTGTAACCT GGAATTTAAC CCAAACAAGT 6480 + CTCAAACAAA ATTGTCAAAA TTCATTTAAT AATATAAAAA TAAAAGGAAA CAAAATGATA 6540 + AAAGTAACCC AATGTAAAAT AGAAATCAAT AGCATAATTC TAAGTGAAAA TCTCTTTAAA 6600 + CCAGAAATAG ATTTGACACC ATTATACACA CCACTTAACA TAACAAAAAT AAAAACTGTT 6660 + AAACACAACG ACATTAATGA AATGATTTCA CAAAACAATA TTACACTTTA CATATTTATG 6720 + ACTACTGTCA TCATTATACT TATTTTATTG TACTTATATT TAAGATACGT ATCATTTAAC 6780 + CCATTCATGA TGCTGTATGC AAAACTAAAA TTAAGAAAAA ATCAAAATCA AAACACAGCA 6840 + CAACAAATAG AAATGGAAGA CGTTCCATTA CCCCTACTAT ATCCATCAAT CCCAGCCCAA 6900 + GTATAGGCTT CTCTTTAAGG GAAGGGAAGT GACATATTCA CATACAAAAC CACATAACGT 6960 + AGAGTAAACA TATTGAAAAG CCGCATACGT CAACAATAAG TGACCACCAT GCTAATGTGG 7020 + ATCAAATAAC AAAAATATCC ACTCTGCATT TTGACACCCC CATACTGTAT GCCATCTGCG 7080 + CAGTATGCAT TCTAATAAAC AAATTCTTTG ACAGCGGCAC TTAGCCATTC TTGTAAACAA 7140 + ATCTTAAAGT CTGCCTGCTC TCTCTGAGGC TTCTCCTCCA CTTAAGAATC CAAGAGCAAT 7200 + GCTCTCCCAA AAACACTAAC ATATTCTTTA AGCAAGCACA GAGGCTTCTC CTCATTTTCA 7260 + CTTTCATTTG ATTTTCAGTC TTAAGCTGAA CGTTAATCAA TAAACAACAC AATCGATACC 7320 + GAAATTTTGA TTCGTTTTAT TTTGGCAAAA CTCAATTTTC AGCGTTGGTC TTAGTTCATA 7380 + TTCGGAACGG TCCATTTAAT AGACTCAAAA CTATTTATTG CAACCATTTA TTTGCAATT 7439 +// +ID DMTN1731 standard; DNA; INV; 4648 BP. +XX +AC X07656; +XX +DR FLYBASE; FBte0000003; Dmel\1731. +XX +FT source X07656:1..4648 +FT SO_feature five_prime_LTR ; SO:0000425:1..336 +FT SO_feature three_prime_LTR ; SO:0000426:4313..4648 +FT SO_feature TATA_box ; SO:0000174:110..116 +FT SO_feature primer_binding_site ; SO:0005850:342..352 +FT SO_feature CDS ; SO:0000316:431..1252 +FT /name="Dmel\1731\gag" +FT /db_xref="FLYBASE:FBgn0020768" +FT /db_xref="REMTREMBL:CAA30502" +FT /db_xref="NCBI_PROTEIN:CAA30502.1" +FT /translation="MSNLYQIDKLEDGSYETWSIQMRSVLVHACLWKVVSGESVKPEVD +FT TGGAWQSQDEKALATIILSVKSSQLGYVKGCLTAAEAWKVLQDVHQPKGPLRTVMLYKK +FT LLSKRLLEGQSISSHIKEFKEIFDALDAVEIGITEKLRSVVLLSSLPESFENFVVAIET +FT RDDVPLFDALCIKLIEEDTRRGGAEQQREKQTESAKAFTAVHKPQAPAREARPSAKKRK +FT DVVCYNCGERRHFKANCRREKVNKESATQEQCSLLNALDSGGFWQNTVVSR" +FT SO_feature CDS ; SO:0000316:1203..4151 +FT /name="Dmel\1731\RTase" +FT /db_xref="FLYBASE:FBgn0012032" +FT /db_xref="REMTREMBL:CAA30503" +FT /db_xref="NCBI_PROTEIN:CAA30503.1" +FT /translation="MRWIVVVFGKTQWCLDSGATSHMCCDRSVFTEFEEHTEKISLAGN +FT GFLLAKGIGTVKLKTDLCTLVLNNVLFVPDLNGNFMSVSRAAQYKCFVNFGPHYADVIQ +FT EGERILRVMRAGNLYMFQGKHNSCFAAVDADGSLWHKRNGHLNTSSLQEMVRKKMVYGV +FT EKVVFKPDAVCKTCMLAKIHVQPFPKTTRSRAEELLDMIHSDLCGPFSTPSLAGSKYFL +FT TFIDDKSRRIFVYFLRKKDEVFTKFVEFKKLVERQTGRKIKCIRSDNGGEFVNNVFDDY +FT LKAHGIARQLTIPHTPQQNGVAERANRTLVEMARCMLLQSELGEALWAEAINTAVYLRN +FT RSTSRALQSKTPMEEWTGKIPAVSHLRVFGAIAVALDKGVHKGKFESKGKEYRMIGYSI +FT AAKGYRLFDKEKRCVIEKQDVLFDESGSLVNHGNTIEFQFPATDDPEPQSDSNAREGDD +FT TEPVGSSDDYESAAEAEEAEVHVGPGRPKIVRTGRPGRPKKQYNVLGVLMASDVEIPKS +FT YEEAINSQYSAKWEEAMGLEYKALLANETWKLADLPRNRRCVACKWVYSLKRDVSGRIE +FT RFKARLVAKGCSQKFGVDYFETFSPVCRLESVRLILALAAEMQLYLHHMDVCTAYLNSE +FT LKDTVYMKQPQGFTDAANPDQVLLLRKAIYGLKQSGREWNSKLDGVLKDLGFKACNHEP +FT CLYQQSGQGNLMLILVYVDDLILACQSREDMEDLKAKISESFECTDKGPLHLFLGMEVQ +FT RDGDLGEITLGHSQYIKELLRDYGSENCRPATTPLDAGHQVLCAGEQCQKVDAGQYQST +FT IGELMWLGLTTRPDMLHSVAKLAQRNQDPHSEHMVAVKHILRYLASTVDVKLHYQKCGQ +FT AFTGFVDADWGGDRLDRKSYTGYVFFLSGGPVSWRSEKQQSVALSSTEAEYMALTTACK +FT EAIALRRLIVEIVCGDLKTPTVMHGDNLKCAAQLAKNPVHHSRTKHIDIRYH" +XX +CC Derived from X07656 (g8700) (Rel. 36, Last updated, Version 6). +CC Takis Benos and Michael Ashburner, 20-Aug-1997. +CC Any changes to original sequence record are annotated in an FT line. +XX +SQ Sequence 4648 BP; 1316 A; 880 C; 1268 G; 1184 T; 0 other; + TGTTGAATAT AGGCAATGCC CACATGTGTG TTGAATATAG GCAATTTCCA CATGTGCATA 60 + TGTAATTTTG TATGAGAACA TACATACATA CACATGAACT GTATGTATGT ATATATATTA 120 + GCAAATAAGC AGCCGCATGA AGGTGGCATT TTTATGTGTA TCAGTTTCAG TTTCAAATAA 180 + AACTTCTTCG TGTTCGGACA CGCGGCTCAA GACTTTTTAT TTCGCGTTTA CTCTTTCAGC 240 + CTTTGCTCTC AATTCGCTGA GTTTGGGTGA AGATTAGGAT CTTCCCATTA TGATTGTCAG 300 + TGTTCCACAC TTGGAGCACC TTTTCAATAA ACAACAGGTT AATGGGCCCA GCGCCCTAGG 360 + AGCTGCCTAA AGGAGAAACG TGTAGTGAAA CTCAGGAGTT AGATTTTGGA GTCTACTCAA 420 + GATTGCCGGA ATGAGTAACC TGTATCAGAT CGATAAGCTG GAGGATGGAT CCTATGAAAC 480 + GTGGAGCATC CAGATGCGTT CAGTGTTGGT GCACGCATGT TTGTGGAAGG TGGTTTCAGG 540 + AGAGTCCGTG AAACCTGAGG TTGATACTGG AGGTGCTTGG CAATCCCAAG ATGAAAAAGC 600 + ATTGGCCACG ATCATCTTGA GTGTGAAGTC TTCGCAACTT GGTTATGTAA AAGGGTGTCT 660 + CACTGCGGCT GAGGCATGGA AAGTTTTACA GGATGTCCAC CAGCCGAAAG GGCCGTTACG 720 + AACGGTCATG CTGTATAAGA AGTTGCTGAG CAAACGTCTG TTGGAAGGGC AGAGTATATC 780 + GTCACATATT AAAGAATTTA AGGAAATCTT TGATGCCCTT GATGCGGTGG AAATTGGTAT 840 + CACCGAGAAA TTGCGCAGTG TTGTTTTGCT GTCGAGCCTT CCAGAGAGTT TCGAGAATTT 900 + CGTTGTCGCC ATTGAGACGC GCGACGACGT GCCGCTTTTC GATGCTCTAT GTATAAAGCT 960 + GATCGAGGAA GACACGAGAA GGGGAGGAGC GGAGCAGCAG AGAGAAAAAC AAACGGAGAG 1020 + CGCAAAGGCA TTTACTGCAG TACATAAGCC ACAGGCGCCG GCGAGAGAAG CTCGGCCGAG 1080 + CGCAAAGAAG AGGAAAGACG TAGTTTGTTA TAACTGTGGA GAGCGTAGGC ATTTTAAAGC 1140 + GAACTGTCGT CGCGAGAAAG TAAACAAAGA GAGCGCGACA CAAGAACAAT GCAGTTTGTT 1200 + AAATGCGCTG GATAGTGGTG GTTTTTGGCA AAACACAGTG GTGTCTCGAT AGCGGGGCTA 1260 + CCAGTCACAT GTGCTGTGAC AGAAGTGTTT TTACTGAGTT TGAAGAGCAC ACTGAAAAAA 1320 + TTAGTCTTGC TGGAAATGGA TTCCTACTAG CAAAGGGCAT AGGAACAGTG AAGCTGAAGA 1380 + CTGATTTATG TACTCTGGTA TTGAATAACG TACTCTTCGT CCCAGATTTG AACGGCAACT 1440 + TTATGTCAGT CAGCCGTGCA GCTCAGTATA AATGTTTTGT CAATTTTGGA CCACATTACG 1500 + CTGACGTCAT TCAGGAAGGC GAGCGAATAC TGCGTGTAAT GAGAGCTGGT AATTTATATA 1560 + TGTTTCAAGG GAAACATAAC AGTTGTTTTG CGGCCGTTGA TGCTGATGGT TCACTATGGC 1620 + ATAAAAGGAA TGGCCATTTG AATACAAGCA GCCTACAGGA GATGGTGAGG AAGAAGATGG 1680 + TGTACGGTGT TGAAAAGGTC GTTTTCAAAC CAGACGCAGT ATGCAAGACG TGCATGCTGG 1740 + CAAAAATCCA TGTGCAACCA TTTCCGAAGA CAACGAGGAG CAGAGCTGAG GAGCTGTTGG 1800 + ATATGATCCA TTCAGACCTG TGCGGGCCAT TTAGCACACC GTCACTTGCT GGATCAAAGT 1860 + ACTTTCTCAC TTTCATAGAC GACAAGTCCA GGCGGATTTT TGTATATTTC TTGCGGAAGA 1920 + AGGACGAAGT CTTCACTAAG TTTGTCGAGT TTAAGAAACT GGTCGAGCGA CAAACAGGTA 1980 + GAAAGATAAA ATGTATCCGG AGCGATAATG GTGGTGAGTT CGTCAATAAT GTTTTTGATG 2040 + ACTATTTAAA GGCACATGGG ATCGCTAGAC AGCTGACTAT TCCACACACT CCCCAACAAA 2100 + ATGGAGTTGC AGAACGAGCC AACCGCACGC TAGTAGAAAT GGCTAGGTGC ATGTTGCTGC 2160 + AATCGGAGTT GGGTGAGGCT CTATGGGCTG AGGCGATAAA CACTGCGGTG TATCTGAGGA 2220 + ACCGATCAAC GAGCAGAGCA TTACAAAGCA AAACCCCTAT GGAAGAGTGG ACCGGAAAAA 2280 + TACCAGCAGT GAGCCACTTG AGGGTTTTTG GTGCCATAGC AGTGGCATTG GACAAAGGAG 2340 + TCCATAAAGG CAAATTCGAA TCCAAAGGAA AGGAATATCG TATGATTGGA TATTCAATAG 2400 + CTGCTAAGGG GTACCGTCTG TTTGACAAAG AGAAGCGGTG TGTGATCGAG AAGCAAGATG 2460 + TCCTTTTTGA TGAGTCTGGT AGTTTGGTAA ATCATGGAAA TACCATTGAG TTCCAGTTTC 2520 + CCGCAACTGA TGACCCGGAG CCGCAGAGTG ATTCGAATGC ACGGGAAGGT GACGATACAG 2580 + AACCCGTGGG CAGCAGCGAC GACTATGAGA GTGCAGCTGA GGCAGAAGAA GCTGAAGTAC 2640 + ATGTGGGGCC TGGACGGCCA AAGATTGTTC GGACGGGCAG ACCAGGGCGC CCGAAGAAGC 2700 + AATACAATGT ACTTGGCGTG TTGATGGCTA GCGACGTCGA AATTCCCAAG TCCTATGAGG 2760 + AGGCCATCAA TTCGCAGTAT TCTGCAAAGT GGGAAGAGGC AATGGGCCTG GAGTACAAGG 2820 + CGCTACTTGC AAATGAGACA TGGAAGCTGG CTGACTTACC AAGAAATCGC CGGTGTGTGG 2880 + CTTGCAAGTG GGTGTATTCC CTGAAACGAG ACGTCTCTGG TAGAATTGAG CGCTTCAAGG 2940 + CACGACTAGT AGCAAAGGGG TGTTCGCAGA AGTTCGGAGT GGACTACTTC GAGACTTTTT 3000 + CACCCGTGTG CAGGCTCGAG AGTGTGAGGC TCATTTTGGC ATTGGCAGCA GAGATGCAAT 3060 + TGTACTTGCA TCACATGGAC GTATGCACGG CGTACTTAAA TAGCGAGCTA AAGGATACTG 3120 + TGTACATGAA GCAGCCCCAA GGGTTCACAG ATGCTGCTAA TCCCGACCAG GTGTTATTGC 3180 + TGAGGAAGGC AATATACGGC TTGAAGCAGT CAGGCAGAGA GTGGAACTCC AAGCTCGACG 3240 + GTGTTCTAAA AGACTTGGGA TTTAAGGCCT GTAATCATGA ACCATGTCTT TATCAGCAAA 3300 + GTGGTCAAGG TAATCTGATG CTCATCTTAG TATATGTTGA TGATTTAATT CTAGCGTGCC 3360 + AGTCAAGAGA AGATATGGAG GATCTGAAAG CCAAGATTTC AGAGTCTTTC GAGTGCACGG 3420 + ACAAGGGTCC ACTGCATTTG TTCTTAGGCA TGGAGGTGCA ACGAGATGGC GACCTTGGAG 3480 + AAATCACTTT GGGCCATTCG CAATATATCA AGGAACTATT GCGGGATTAT GGCAGCGAGA 3540 + ACTGTAGACC AGCGACGACA CCTTTGGATG CAGGGCATCA AGTTTTGTGC GCGGGTGAGC 3600 + AGTGCCAGAA GGTCGACGCA GGGCAGTATC AGTCTACAAT TGGTGAGCTA ATGTGGCTTG 3660 + GGCTTACTAC CAGACCAGAC ATGCTACATT CGGTGGCGAA GTTGGCTCAG AGGAATCAGG 3720 + ACCCGCATTC TGAGCACATG GTGGCTGTGA AGCACATCCT CCGGTACTTG GCGTCAACTG 3780 + TGGACGTCAA GCTGCATTAT CAAAAGTGCG GTCAGGCATT TACCGGCTTT GTGGATGCAG 3840 + ATTGGGGAGG CGACCGTTTG GACCGAAAGT CATACACAGG GTATGTGTTT TTCCTGTCTG 3900 + GCGGACCAGT ATCATGGAGG TCCGAGAAGC AGCAGAGCGT GGCGTTGAGC AGTACTGAAG 3960 + CCGAGTATAT GGCTCTGACC ACGGCTTGCA AGGAAGCTAT AGCTTTACGA AGGCTAATAG 4020 + TGGAGATCGT ATGCGGTGAT CTGAAGACCC CGACGGTTAT GCATGGCGAC AACCTGAAGT 4080 + GCGCAGCACA GTTAGCGAAG AACCCGGTTC ATCACTCTAG GACGAAGCAC ATCGACATTC 4140 + GATATCATTA GAGAAGTCAT GAAAGAGGGT CACGTTGTGT TAGAGTACAC TTCTACGAAT 4200 + GAGATGATAG CAGACATTAT GACAAAGAAT CTTTCAAAGG GAAAGCATAA TGGGTTTATG 4260 + AAAATGTTAA ATTTGTTTTA ATTTTTGTAA ACATGTTGGC ATTGAGGAAG GCTGTTGAAT 4320 + ATAGGCAATG CCCACATGTG TGTTGAATAT AGGCAATTTC CACATGTGCA TATGTAATTT 4380 + TGTATGAGAA CATACATACA TACACATGAA CTATATGTAT GTATATATAT TAGTAAATAA 4440 + GCAGCCGCAT GAAGCTGGCA TTTTTATGTG TATCAGTTTC AGTTTCAAAT AAAACTTCTT 4500 + CGTGTTCGGA CGCTCGGCTC AAGACTTTTT ATTTCGCGTT TACTCATTCG GCCTTTGCTC 4560 + TCAATGCGCT GAGTTTGGGT GAAGATTAGG ATCTTCCCAT TATGGTTGTC AGTGTTCCAC 4620 + ACTGGGAGCA CCTTTTCAAC AAACCACA 4648 +// +ID DMIS297 standard; DNA; INV; 6995 BP. +XX +AC X03431; +XX +DR FLYBASE; FBte0000675; Dmel\297. +XX +FT source X03431:1..6995 +FT SO_feature five_prime_LTR ; SO:0000425:1..414 +FT SO_feature three_prime_LTR ; SO:0000426:6582..6995 +FT SO_feature TATA_box ; SO:0000174:276..282 +FT SO_feature TATA_box ; SO:0000174:6857..6863 +FT SO_feature polyA_signal_sequence ; SO:0000551:304..309 +FT SO_feature polyA_signal_sequence ; SO:0000551:6885..6890 +FT SO_feature primer_binding_site ; SO:0005850:414..431 +FT SO_feature RR_tract ; SO:0000435:6571..6581 +FT SO_feature CDS ; SO:0000316:803..2047 +FT SO_feature start_codon ; SO:0000318:1..3 +FT /name="Dmel\297\gag" +FT /db_xref="FLYBASE:FBgn0044338" +FT /db_xref="SWISS-PROT:P20828" +FT /db_xref="NCBI_PROTEIN:CAA27159.1" +FT /translation="MSQPIIALSDINLAEARRQLKDIMPFKGDPETLHTFISRVDYVIS +FT LYQTNDVRQQRILLGAIERNLDGQITRSLGLPNVEDWPTLKARLIAEFKIQTPNYKLLE +FT NFRETPYRGSLRAFCEEAERRRQLLISKLHLEGNQSDFLIYIQGIKESIKILIRKLPIQ +FT LFTILAHHDITDLRSLITIAQNEGIYEEHINFEFYEKPEYRNKNSNSNQNSKTQKFNTN +FT VQTQNRPSYSQYSQPFQPNFNQYIQPFRPSYTQQITNNPPMWHAPNYFRPNQYINPQPI +FT IQKNHFQQYPNKAQFPQTTHFRGNTYPRLQQPSTYKNTNFPITKRLRPSDSEQTKMSID +FT EIRFQDAHEFEQVQPNYYEQQYFNQNQYNPYQNHSFINEGQQQVQFVQINNKQNQNNSE +FT LNENFRLTVPENTNT" +FT SO_feature CDS ; SO:0000316:<1999..5178 +FT /name="Dmel\297\pol" +FT /db_xref="FLYBASE:FBgn0027622" +FT /db_xref="SWISS-PROT:P20825" +FT /db_xref="NCBI_PROTEIN:CAB57796.1" +FT /translation="TKRKFSVNSSGKYEYIKIVYKGRSYKCLLDTGSTINMINENIFCL +FT PIQNSRCEVLTSNGPITLNDLIMLPRNSIFKKTEPFYVHRFSNNYDMLIGRKLLKNAQS +FT VINYKNDTVTLFDQTYKLITSESERNQNLYIQRTPESIASSDQESIKKLDFSQFRLDHL +FT NQEETFKLKGLLNKFRNLEYKEGEKLTFTNTIKHVLNTTHNSPIYSKQYPLAQTHEIEV +FT ENQVQEMLNQGLIRESNSPYNSPTWVVPKKPDASGANKYRVVIDYRKLNEITIPDRYPI +FT PNMDEILGKLGKCQYFTTIDLAKGFHQIEMDEESISKTAFSTKSGHYEYLRMPFGLRNA +FT PATFQRCMNNILRPLLNKHCLVYLDDIIIFSTSLTEHLNSIQLVFTKLADANLKLQLDK +FT CEFLKKEANFLGHIVTPDGIKPNPIKVKAIVSYPIPTKDKEIRAFLGLTGYYRKFIPNY +FT ADIAKPMTSCLKKRTKIDTQKLEYIEAFEKLKALIIRDPILQLPDFEKKFVLTTDASNL +FT ALGAVLSQNGHPISFISRTLNDHELNYSAIEKELLAIVWATKTFRHYLLGRQFLIASDH +FT QPLRWLHNLKEPGAKLERWRVRLSEYQFKIDYIKGKENSVADALSRIKIEENHHSEATQ +FT HSAEEDNSNLIHLTEKPINYFKKQIIFIKSDKNKVEHSKIFGNSITTIQYDVMTLEKAK +FT QILLDHFIHRNITIYIESDVDFEIVQRAHIEIVNTTYTKVIRSLFLLKNVGSYAEFKEI +FT ILQSHEKLLHPGIQKMTKLFKENHFFPNSQLLIQNIINECNICNLAKTEHRNTKMPLKI +FT TPNPEHCREKFVVDIYSSEGKHYISCIDIYSKFATLEQIKTKDWIECRNALMRIFNQLG +FT KPKLLKADRDGAFSSLALKRWLEEEEVELQLNTAKNGVADVERLHKTINEKIRIINSSD +FT DEEVKLSKIETILYTYNQKIKHDTTGQRPAQIFLYAGHPILDTQKIKEKKIEKINEDRR +FT EFNIDTNYRKGPLQKGKLENPFKPTKNVEQTDPDHYKITNRNRVTHYYKTQFKKQKKNN +FT KLSISQAPGTR" +FT SO_feature CDS ; SO:0000316:5145..6560 +FT SO_feature start_codon ; SO:0000318:1..3 +FT /name="297\env" +FT /db_xref="FLYBASE:FBgn0027623" +FT /db_xref="SWISS-PROT:P20829" +FT /db_xref="NCBI_PROTEIN:CAB57797.1" +FT /translation="TLNFTGTWYPITLLFILITAVHGQQIQINNIDTNHGYLLFSDKPV +FT QIPSSFEHHSLKINLTEIDIVVDYFEQRLRTDYHAPQINFLYNKIKRELARITLKHRNK +FT RGFINIVGSGFKYLFGTLDENDRVEIQKKLEINVHNSVKLHELNDAIRLINDGMQKIQN +FT YENNHTIIDSLLFELMQFTEYIEDLEMAMQLSRLGLFNPKLLNYDKLENVNSQNILNIK +FT TSTWINYNDNQVLIISHIPIYLSLISTIKIIPYPDSNGYQLDYTDTQSYFEKENKVYNT +FT ENKEVKNECVTNIIKHLNPICNFKPVHTNEIIKYIEPNTIVTWNLTQTILNQNCQNSIN +FT KIKIEGNKMIRVTQCKIEINNINFSETLLEPEIDLTPLYTPLNITKIKIVKHNDIIEMI +FT SENNITLYIQMIIVIIALILLYSYLRYVSFKPFMMLYAKLKIRKNQNQNTPQQTEIEEI +FT PFPTLYPSIPAQV" +XX +CC Derived from X03431 (g8146) (Rel. 36, Last updated, Version 2). +CC Takis Benos and Michael Ashburner, 20-Aug-1997. +CC Any changes to original sequence record are annotated in an FT line. +XX +SQ Sequence 6995 BP; 2811 A; 1356 C; 972 G; 1856 T; 0 other; + AGTGACGTAT TTGGGTGGTC CAAACCAGCC ACTTCCATTA TTTCAAAGAA ATCAGTAATG 60 + CACTCTAGTA ATTTTCCATA ACTGTATCCC AGCTGCGCAG ACTCGTTTAT CTTTTGCAGC 120 + GCAGCGTTCT TTGTAAACAT CCTAAAGACC TGCCTAAGCA GATTTGACTG CCCTCTTTCA 180 + ACGCTACCTA ATCTTAAGAA CCCAAGAGCG AGGCTCTCCC GAAATACAAA TATTGTTCAA 240 + ATACTGAGGC TTCTCCTCAA TCCAATTTGC ATTTGATTTT TAGTCTTAAG CTGAGATCCA 300 + AAGAATAAAG TCGTGAAACT ATTTCTCCTA AAAACTATTT TTTATTTCTT GGCGTTGTCC 360 + TTAGTCAACT GACGGGACAT TAGTTCGACT CATAAATAAA ACAACAATTT TACTGGCGCA 420 + GTCGGTAGGA TACAAAAGTA TCCGAAAAAA AAGAACCTTC GAATGGAAAA TAAGTTAAAT 480 + TTTATAGTCC TGTGCTCGAA ACATCTCCCA AAATAAATTC GTGAAAACTC TTCAACTTCA 540 + ATTATAATTC CAATTCGGTT ATCCAATAAT AAGTGGAAGT GAAATACGAA ACAAAAATAT 600 + TAAGTCCAAA GGCAACTAAG TTTTAAAACC AACATATAAA AATAAAAAAT TAAAACAATA 660 + TAGAATTTTA ATAATACAAC ACAAAAATTT ACAAAACAAA AAAACAAACA AGTGAAACTA 720 + GAAAGCTTAA AAATAATAAT AACATTGAAT CCGAAACAAA ACAAAAAAAT AAAACACAAA 780 + AGTTAAAAAT TTTACAATAA AAATGTCACA ACCAATTATT GCGCTGAGCG ACATAAACCT 840 + TGCCGAAGCC CGTCGGCAGC TTAAAGACAT TATGCCATTC AAGGGTGATC CAGAAACCCT 900 + TCACACCTTT ATCAGCAGAG TGGATTACGT AATTTCGCTC TACCAAACAA ATGATGTCCG 960 + ACAACAGAGG ATTCTACTGG GAGCCATCGA AAGGAACTTG GACGGACAAA TTACACGATC 1020 + TTTGGGACTT CCGAACGTCG AAGATTGGCC TACCCTTAAA GCAAGACTCA TCGCGGAATT 1080 + TAAAATTCAA ACACCAAACT ACAAACTTCT GGAGAACTTC AGGGAGACAC CATACAGAGG 1140 + AAGCCTAAGA GCATTCTGCG AAGAAGCGGA GAGACGACGT CAATTACTAA TTTCGAAACT 1200 + ACACCTGGAA GGTAACCAAT CGGATTTTCT TATTTATATT CAGGGTATTA AAGAATCTAT 1260 + TAAGATACTG ATAAGGAAAC TACCAATACA ATTATTCACT ATTTTAGCCC ATCACGATAT 1320 + TACAGACTTA AGATCCTTAA TTACCATTGC ACAAAATGAG GGAATTTATG AAGAACACAT 1380 + TAATTTTGAA TTTTATGAAA AACCAGAATA TCGTAATAAA AATTCAAATT CTAACCAGAA 1440 + TTCGAAAACA CAAAAATTCA ATACAAATGT TCAAACTCAA AATCGACCAA GTTACTCACA 1500 + ATATTCCCAA CCCTTCCAAC CTAATTTTAA TCAATACATT CAACCATTTA GACCTAGCTA 1560 + TACACAGCAG ATAACTAACA ACCCACCCAT GTGGCACGCA CCTAATTATT TCAGACCCAA 1620 + CCAATACATA AACCCACAAC CCATTATTCA AAAAAATCAT TTCCAACAAT ATCCCAACAA 1680 + AGCCCAATTT CCCCAAACAA CGCATTTTAG AGGAAATACA TACCCTCGAC TACAACAACC 1740 + CTCTACATAT AAAAATACTA ACTTCCCGAT TACTAAACGA CTAAGACCAT CGGACAGTGA 1800 + ACAAACTAAA ATGTCTATTG ACGAAATTAG ATTCCAAGAC GCGCATGAAT TCGAACAAGT 1860 + CCAACCTAAT TATTACGAGC AACAGTATTT TAACCAAAAT CAATACAATC CGTATCAAAA 1920 + TCATAGCTTC ATTAATGAAG GGCAACAACA AGTTCAATTT GTACAAATTA ATAACAAACA 1980 + AAACCAAAAT AATTCTGAAC TAAACGAAAA TTTTCGGTTA ACAGTTCCGG AAAATACGAA 2040 + TACATAAAAA TAGTATACAA AGGGCGTTCA TACAAATGCC TTCTAGACAC AGGATCAACA 2100 + ATTAATATGA TCAATGAAAA TATATTTTGT CTTCCCATTC AAAATAGTAG ATGTGAAGTT 2160 + TTAACATCAA ATGGCCCTAT TACCTTGAAC GACTTGATTA TGTTACCCAG AAATAGTATT 2220 + TTCAAAAAAA CCGAACCATT TTATGTGCAC AGATTTTCTA ATAATTACGA TATGCTAATT 2280 + GGCAGAAAAT TGTTGAAAAA TGCTCAATCA GTTATTAATT ACAAAAATGA TACAGTTACC 2340 + CTTTTTGATC AAACATACAA ATTAATTACT TCAGAATCCG AAAGAAACCA AAATTTGTAT 2400 + ATCCAAAGGA CACCAGAATC AATTGCAAGC TCAGATCAGG AATCAATAAA AAAATTAGAT 2460 + TTTTCACAGT TTCGATTAGA TCACCTAAAT CAGGAGGAAA CTTTTAAGTT AAAAGGCTTG 2520 + TTAAATAAAT TTAGAAATCT TGAATATAAG GAGGGAGAGA AATTAACATT TACAAATACA 2580 + ATTAAACACG TACTAAATAC AACACATAAC TCCCCAATTT ATTCGAAACA ATACCCACTT 2640 + GCGCAAACAC ACGAAATCGA AGTAGAAAAC CAAGTACAGG AAATGCTGAA TCAGGGATTA 2700 + ATTAGGGAAA GTAATTCTCC ATACAATAGT CCTACTTGGG TCGTACCAAA GAAACCGGAT 2760 + GCTTCTGGTG CAAATAAGTA CAGGGTAGTA ATTGATTATA GAAAGCTAAA TGAAATAACC 2820 + ATACCTGACA GATATCCAAT TCCAAATATG GACGAAATTC TTGGCAAACT GGGTAAATGC 2880 + CAATATTTTA CAACGATCGA TCTGGCAAAG GGATTTCATC AAATAGAAAT GGACGAAGAA 2940 + TCAATTTCTA AAACTGCATT CTCCACAAAA AGCGGTCATT ACGAATACCT TCGAATGCCA 3000 + TTTGGCCTTA GGAATGCACC CGCTACTTTT CAAAGGTGCA TGAATAATAT CCTTCGACCG 3060 + TTGCTTAACA AACACTGTTT GGTGTATCTG GATGATATTA TAATTTTTTC AACATCCCTT 3120 + ACAGAACATT TAAATTCAAT ACAATTAGTT TTTACAAAGC TTGCAGATGC AAATTTAAAA 3180 + TTGCAACTAG ACAAATGTGA GTTCTTAAAA AAGGAAGCTA ACTTTCTTGG TCACATAGTT 3240 + ACCCCTGATG GTATTAAACC AAATCCTATT AAAGTTAAAG CCATAGTTTC ATACCCAATT 3300 + CCGACAAAAG ATAAAGAGAT AAGAGCTTTC CTTGGATTAA CAGGTTATTA TCGCAAATTT 3360 + ATTCCAAATT ACGCAGACAT AGCAAAACCC ATGACCAGCT GCTTAAAAAA AAGGACAAAG 3420 + ATAGATACAC AAAAACTTGA GTACATAGAG GCATTCGAAA AACTTAAGGC TTTGATAATT 3480 + CGTGACCCAA TTTTACAATT ACCTGATTTT GAAAAGAAAT TTGTTTTAAC CACAGATGCA 3540 + AGTAACTTGG CCCTCGGGGC TGTCCTTTCT CAAAACGGTC ATCCTATATC TTTTATTAGT 3600 + AGAACACTTA ACGATCACGA ATTAAATTAC AGTGCTATCG AAAAAGAATT ACTTGCCATA 3660 + GTTTGGGCCA CAAAAACTTT TCGACATTAT TTACTAGGAC GACAATTTCT CATTGCCAGT 3720 + GACCATCAAC CTCTTAGATG GCTTCATAAC TTAAAGGAAC CAGGTGCTAA GTTAGAAAGA 3780 + TGGAGAGTTA GATTAAGCGA ATACCAATTT AAAATAGATT ATATTAAAGG GAAAGAAAAT 3840 + TCAGTTGCCG ATGCATTATC AAGAATTAAA ATTGAAGAAA ATCATCATAG TGAAGCTACT 3900 + CAACATAGTG CAGAAGAGGA CAATAGCAAC CTTATTCATT TAACAGAAAA ACCAATAAAT 3960 + TATTTCAAAA AACAAATAAT CTTTATTAAA TCCGATAAAA ATAAAGTAGA GCATTCAAAA 4020 + ATATTCGGTA ACTCCATTAC CACAATTCAA TATGACGTAA TGACACTTGA AAAGGCCAAA 4080 + CAAATTTTAC TCGATCACTT TATCCATAGA AACATTACCA TTTATATTGA GAGCGATGTA 4140 + GATTTTGAAA TCGTTCAAAG AGCACACATA GAAATTGTTA ATACCACCTA CACAAAAGTA 4200 + ATTCGCAGTC TTTTCCTATT AAAGAACGTT GGTTCATACG CCGAATTCAA AGAAATCATA 4260 + CTTCAATCAC ATGAAAAACT TTTACACCCT GGTATACAGA AAATGACAAA ATTATTTAAA 4320 + GAAAATCACT TCTTTCCAAA TAGCCAACTA TTAATTCAGA ATATAATAAA CGAATGCAAC 4380 + ATATGCAATT TGGCCAAAAC AGAACATAGA AACACCAAAA TGCCTTTAAA AATCACACCC 4440 + AACCCGGAAC ATTGCCGAGA AAAATTTGTA GTAGATATTT ATTCATCTGA GGGAAAACAT 4500 + TACATCAGTT GCATTGATAT TTATTCTAAA TTCGCTACAC TTGAGCAAAT TAAAACTAAG 4560 + GATTGGATAG AATGCAGAAA CGCATTAATG CGCATTTTTA ATCAACTAGG AAAACCCAAA 4620 + TTATTAAAGG CAGACAGAGA CGGAGCTTTC TCCAGTTTAG CTTTAAAGCG ATGGCTTGAA 4680 + GAAGAAGAAG TCGAATTACA GCTCAATACA GCAAAAAACG GAGTAGCAGA CGTCGAAAGA 4740 + TTACACAAAA CAATAAATGA AAAAATTCGT ATAATCAATT CATCTGATGA TGAAGAAGTA 4800 + AAATTAAGCA AGATAGAAAC AATCCTCTAC ACATACAACC AAAAAATTAA ACATGACACT 4860 + ACTGGACAGA GACCTGCTCA AATTTTCTTA TACGCTGGGC ATCCCATATT AGACACTCAA 4920 + AAAATTAAAG AGAAGAAAAT AGAGAAAATA AATGAAGACA GACGGGAATT TAATATTGAC 4980 + ACTAATTACA GAAAAGGTCC ACTACAGAAA GGCAAATTAG AAAACCCATT TAAACCAACC 5040 + AAAAATGTAG AACAGACAGA CCCTGACCAT TACAAAATCA CTAATAGAAA TAGAGTTACG 5100 + CACTACTACA AAACACAATT CAAAAAACAA AAGAAAAATA ATAAACTCTC AATTTCACAG 5160 + GCACCTGGTA CCCGATAACA CTATTGTTTA TACTGATCAC AGCTGTTCAT GGACAACAAA 5220 + TTCAAATTAA TAATATTGAC ACCAACCACG GATATCTCCT TTTTTCTGAT AAGCCAGTAC 5280 + AGATACCATC CTCCTTTGAA CATCACTCCT TAAAAATCAA TTTAACTGAA ATAGACATCG 5340 + TGGTTGACTA TTTTGAGCAA AGACTACGAA CCGATTACCA TGCACCCCAG ATCAATTTTT 5400 + TATACAATAA AATAAAAAGA GAACTAGCCA GAATAACCCT GAAACATAGA AACAAACGGG 5460 + GTTTTATTAA CATTGTGGGT TCAGGTTTTA AATACCTATT TGGAACACTA GATGAAAATG 5520 + ATCGAGTCGA AATACAGAAA AAACTTGAAA TCAACGTCCA TAACTCAGTA AAATTACATG 5580 + AACTCAACGA CGCCATACGA TTGATAAATG ACGGAATGCA AAAAATACAG AATTATGAAA 5640 + ATAACCACAC CATCATTGAC AGTCTTTTGT TCGAACTAAT GCAGTTTACG GAATACATAG 5700 + AAGATTTGGA AATGGCTATG CAGCTTTCCA GACTTGGACT GTTTAACCCC AAATTACTAA 5760 + ACTACGACAA ACTTGAAAAT GTGAACAGCC AAAACATTTT GAACATTAAA ACATCCACTT 5820 + GGATTAACTA CAATGATAAC CAAGTATTAA TCATATCCCA CATACCCATT TACCTTTCAC 5880 + TAATAAGCAC AATTAAAATA ATTCCTTACC CAGACTCCAA CGGCTATCAG CTAGATTACA 5940 + CAGACACACA ATCATATTTT GAAAAAGAAA ATAAAGTTTA TAATACCGAA AATAAAGAAG 6000 + TAAAAAATGA ATGTGTCACC AATATTATTA AACACTTAAA TCCAATTTGT AATTTTAAGC 6060 + CAGTACACAC GAACGAAATA ATAAAATACA TAGAACCAAA CACAATTGTA ACTTGGAACT 6120 + TAACCCAAAC AATTCTTAAC CAAAATTGCC AAAATTCAAT TAATAAAATA AAAATAGAAG 6180 + GAAACAAAAT GATAAGAGTA ACGCAATGCA AAATAGAAAT CAATAATATA AATTTTAGTG 6240 + AAACTCTGTT AGAACCAGAA ATAGATTTGA CACCACTATA CACACCACTT AATATAACAA 6300 + AAATAAAAAT TGTAAAACAC AACGACATTA TTGAGATGAT TTCAGAGAAC AATATTACAC 6360 + TTTACATACA AATGATCATT GTAATAATCG CACTAATTTT GTTGTACTCA TATTTAAGAT 6420 + ATGTATCATT TAAACCATTT ATGATGTTGT ATGCAAAACT TAAAATAAGA AAAAATCAAA 6480 + ATCAAAACAC ACCACAACAA ACAGAAATAG AAGAAATTCC ATTTCCCACA CTATATCCAT 6540 + CAATCCCAGC CCAAGTATAG GCTTCTCTTT AAGGGAAGGG GAGTGACGTA TTTGGGTGGT 6600 + CCAAACCAGC CACTTCCATT ATTTCAAAGA AATCAGTAAT GCACTCTAGT AATTTTCCAT 6660 + AACTGTATCC CAGCTGCGCA GACTCGTTTA TCTTTTGCAG CGCAGCGTTC TTTGTAAACA 6720 + TCCTAAAGAC CTGCCTAAGC AGATTTGACT GCCCTCTTTC AACGCTACCT AATCTTAAGA 6780 + ACCCAAGAGC GAGGCTCTCC CGAAATACAA ATATTGTTCA AATACTGAGG CTTCTCCTCA 6840 + ATCCAATTTG CATTTGATTT TTAGTCTTAA GCTGAGATCC AAAGAATAAA GTCGTGAAAC 6900 + TATTTCTCCT AAAAACTATT TTTTATTTCT TGGCGTTGTC CTTAGTCAAC TGACGGGACA 6960 + TTAGTTCGAC TCATAAATAA AACAACAATT TTACT 6995 +// +ID DM23420 standard; DNA; INV; 6126 BP. +XX +AC U23420; +XX +DR FLYBASE; FBte0000266; Dmel\3S18. +XX +SY synonym: BEL +XX +FT source U23420:1..6126 +FT SO_feature five_prime_LTR ; SO:0000425:1..361 +FT SO_feature three_prime_LTR ; SO:0000426:5766..6126 +FT SO_feature CDS ; SO:0000316:919..5742 +FT SO_feature start_codon ; SO:0000318:1..3 +FT /name="Dmel\3S18\ORF" +FT /db_xref="FLYBASE:FBgn0044337" +FT /db_xref="REMTREMBL:AAB03640" +FT /db_xref="NCBI_PROTEIN:AAB03640.1" +FT /translation="MFIGSIASNSSLTDCQRFHYLKSYLAGDALALVKHIPVTNDNYRE +FT AWERLEQRYNKQSLIIRSFLNSFMSLPSAINSNIGTVRKIADGADEVIRGLRALNCEER +FT DPWLIFILLSKLDSDTRQAWAQCAESEEKGVTINRFLKFLTSRCDTLEAFELTRSTQAR +FT RAATTHHADTHPRREEPKCTSCQQNHQLFKCPQFIALDIASRRDFLKSRKLCFNCLSPA +FT HMVGNCTSRHTCRICRRKHHTLVHGSSQPIQNGNNIDTASVDSRDRPAVSHAGSTIGHN +FT QPLAREGHRLGSETPAENNFTHHTLENIPAAGSQTLLPTILADVIDAWGNTTTCRLLLD +FT TGSTITLASESFVQRIGVRRTHARISILGLAANSAGVTRGRAHIKLRSRHSGQTVELVS +FT FILTSLTSSLPAQVIDTSSSTWRQICELPLADPTFCTPGAIDVIVGSDQLWSLYTGDRK +FT HFGNDFPIALNTVFGWILAGSYSAFDDHPTSAVTHHADLDTMVRSFMEMDSIQPNQALL +FT DASDPTERHFAATHKRSTDGVYVVEYPFKEKAPPIDSTLPQAINRFFSLERKFRRYPEL +FT KQQYEAFLDDYLQRGHMEKLTSAQVEESPDTCFYLPHHAVIKLDSLTTKCRVVFDGSGK +FT DSSGVSLNDRLHIGPPIQRDLFGVCLRFRQHQYVLCADVEKMFRGIKVFKPHTNFQRIV +FT WRTTENEPLLHFRLLTVTYGLAPSPFLAVRVLKQLADDHGHEYPAAAHALLHDAYVDDI +FT PTGANTFEELMILKDELIALLDKGKFKLRKWSSNSWRLLKSLPEEDRCFEPIQLLNKSA +FT ADSPVKVLGIQWNPGKDVLYLNLKGCDATISPTKRELLSQLSRIYDPLGLVAPVTVLLK +FT LIFQESWTSVLQWDDPIPESLRTRWRALVEDLPALTQCQVPRYIASPFRDVQLHGFADA +FT SSHAYGAVVYARVAVGCSFQVTLVAAKTRVAPIKPVSIPRLELNAALLLSRLLSIVKTS +FT LTIPLFSTSCWTDSEIVLHWLSAPPRRWNTYVCNRTSEILSDFPRSCWNHVRTEDNPAD +FT CASRGLHPSKLLEHRLWWKGPSWLATPTSEWPPSTSKFSVSSSFDVNTEERAIKPTTLH +FT NFPDESIHELLIHKFSTWTRLIRVSSYCHRFIHTLRSHHRNSAPFLTSEELLDAQRRLI +FT RHVQQKSFAREYEQLENRRQLNAKSHLIRFSPFLDDYGVMRVGGRIEQSTLNYNAKHPI +FT LIPKDTPLAGLLVRHFHVSYLHTGVDATFTNLRQQYWILGARNLVRKAVFQCKSCFLQR +FT KGTSNQIMGELPIPRVQASRCFQHTGLDYAGPIAIKESKGRTPRIGKAWFSIFVCLTTK +FT ALHIEVVSELTTQAFIAAFQRFIARRAKPTDLYSDNGTTFHGGKKTLDDMRRLAIQQAK +FT DEELAGFFANEGISWHFIPPSAPHFGGMWEAGVRSIKLHMKRILGSKALTFEELSTVLT +FT QIEAILNSRPLCPTGDNSLDPLTPAHFLTGSPYTALPEPCRLDMQVNRLERWNQLQAMV +FT QGFWKRWHMEYLTSLHERTKWHLETENLKIDTLVVLKEPNLPPSKWILGRITAVHAGID +FT NKVRVVTVKTAHGLYKRPIAKIAVLPLC" +XX +CC Derived from U23420 (g733531) (Rel. 48, Last updated, Version 3). +CC Takis Benos and Michael Ashburner, 20-Aug-1997. +CC Any changes to original sequence record are annotated in an FT line. +XX +SQ Sequence 6126 BP; 1623 A; 1556 C; 1346 G; 1601 T; 0 other; + TGTTTGGGAA CGAGACACCC TGTATACGCG AACAAGTCAC CCTTTATCTT TATTTACATT 60 + CTTATTTGTC TGCAGCTTCA TCGGAGCTTA TCAGCGGAAT CAATGTAAGC ATCGCACCGC 120 + TGTAATTGTC CGCGAGCTTG CCCAGTACTT TTCCAAACTT CTAACTCCCT TCTAACTGTA 180 + ACTTGTTTAC GTCTTATGCT AGACTAATCG TATGGCGTGA TTACAGCCAA AGCTGAAGTC 240 + AGTCACAATT TTGATCTGCG AGAAAACGTA CGCATCGGTG TCGAAATAAT TAATATTAAG 300 + TGTCTGAACT TAACCAATAA ATGAAAATTA ACAGTAACAC TGGCGGTTTT ATTTATAAAC 360 + ATAAAAATTG GTCCTTCGAG CCGGATAACC GGAAGTGCGT TTCGTTCGGG CATTTGATTT 420 + TGATTATTGG CCTTTTGGCA AACGATAATC TATAGATTCC TACATCGTGT AGAATCGTTC 480 + CCTTCTTTCG ACCACCATGC GGAGTGTGAT TCAACAACGG GGCTTCTGCA AAAGCCAAAT 540 + TACTCGTGCG CATAATAATG CCTTAAAATT TGTTGATGAC ATTCACTCAG TGCAAACAAT 600 + AGTTGTCCGC CTGGCGCAAC TACAGGAAAA TTATTTGCGG TTCGTACGGC TCTCGGAAGA 660 + GCTGTATGCA TTTCAATCGG AAGCCGATTG GGAGAACCCT GACGAGGATT TTGACGCATA 720 + TGAGGACAAA CATTATGCTA CACACGCTAT TCTCAGCAAT ACTTTGGAGG AGTTGAGACG 780 + GGATGTCACC TCAAACAGTA TTGATGCCAC AGTTCAAGCG CAGGCACACC CCAGAGAAGT 840 + CATGTCGATT TTCAGTTCGA GAGAATTAAA CTTCCGACTT TTTCTGGAAA TTATGAGGAC 900 + TGGAAACATT TTTCGGACAT GTTTATTGGA TCGATTGCTT CCAATTCGAG CCTGACGGAT 960 + TGCCAACGAT TTCATTATTT AAAATCGTAC CTTGCCGGAG ACGCGCTTGC ATTAGTTAAA 1020 + CATATTCCAG TTACTAATGA CAACTATCGG GAAGCATGGG AGCGGCTGGA ACAGCGATAT 1080 + AACAAACAAT CGCTAATTAT TCGATCGTTC TTAAACAGTT TCATGAGCCT TCCGAGTGCT 1140 + ATAAATTCAA ATATCGGCAC AGTGCGGAAA ATTGCCGATG GTGCAGACGA AGTTATTCGT 1200 + GGTCTACGAG CTCTTAATTG CGAAGAGAGG GATCCCTGGC TAATTTTCAT TCTACTTTCA 1260 + AAATTAGATA GCGATACCCG CCAAGCCTGG GCTCAGTGCG CAGAATCCGA GGAAAAAGGT 1320 + GTGACCATCA ACCGATTCTT GAAATTTCTC ACATCACGCT GCGATACGTT GGAGGCTTTT 1380 + GAATTAACTC GATCAACCCA AGCTCGACGC GCAGCTACCA CGCACCACGC AGACACGCAT 1440 + CCAAGACGGG AAGAGCCGAA GTGCACATCG TGCCAGCAGA ATCACCAACT GTTTAAGTGT 1500 + CCTCAATTCA TCGCACTCGA CATTGCATCT CGCCGAGACT TCCTCAAATC AAGAAAGCTC 1560 + TGTTTCAATT GCCTCAGCCC GGCTCATATG GTGGGCAACT GTACATCGAG GCATACTTGT 1620 + CGGATCTGCC GCCGCAAGCA TCATACTTTG GTTCATGGCT CGTCGCAGCC AATTCAAAAT 1680 + GGCAACAACA TTGACACAGC AAGTGTTGAC AGCCGCGATC GACCAGCAGT CTCACATGCG 1740 + GGATCTACAA TTGGCCACAA TCAACCGCTA GCTCGAGAAG GTCATCGCTT GGGAAGCGAG 1800 + ACTCCCGCGG AAAACAACTT TACGCATCAT ACTCTGGAGA ATATTCCGGC GGCTGGTTCT 1860 + CAGACTCTGT TGCCAACCAT CCTTGCTGAC GTCATCGACG CCTGGGGAAA CACTACAACC 1920 + TGCAGGCTGC TCCTGGACAC TGGATCTACA ATAACCTTGG CATCGGAATC ATTTGTTCAG 1980 + CGAATAGGCG TGCGTCGAAC GCACGCACGG ATTTCTATTC TCGGTCTCGC CGCCAACAGC 2040 + GCGGGCGTTA CCCGAGGACG CGCACATATC AAGCTGCGCT CTCGTCATTC GGGCCAAACT 2100 + GTCGAATTGG TCTCGTTCAT TCTCACCTCG CTGACGTCAT CACTTCCTGC CCAAGTTATT 2160 + GACACCTCAT CCTCTACGTG GAGGCAAATC TGCGAGCTTC CTTTGGCAGA CCCAACGTTC 2220 + TGCACACCTG GAGCAATCGA TGTCATTGTT GGATCGGATC AACTTTGGTC TCTATACACA 2280 + GGAGATCGGA AACACTTTGG TAACGACTTT CCTATCGCTC TCAATACTGT ATTTGGTTGG 2340 + ATTCTTGCAG GCTCTTACTC TGCATTCGAT GATCACCCTA CTTCTGCGGT TACTCATCAC 2400 + GCGGACCTAG ACACGATGGT TCGTTCATTC ATGGAGATGG ACAGCATTCA GCCTAACCAG 2460 + GCTCTCCTGG ACGCCAGCGA TCCCACAGAG CGTCATTTTG CTGCCACACA CAAGCGCTCG 2520 + ACGGACGGGG TGTACGTCGT CGAGTATCCC TTCAAGGAAA AGGCACCGCC TATTGATTCG 2580 + ACCTTGCCAC AGGCCATCAA TCGCTTCTTC TCGCTGGAAC GCAAATTTCG TCGGTATCCA 2640 + GAATTGAAGC AGCAGTACGA AGCTTTCCTG GACGACTACT TGCAACGTGG ACATATGGAA 2700 + AAACTGACCT CGGCTCAGGT TGAAGAGTCC CCAGACACCT GCTTCTATTT GCCGCACCAC 2760 + GCTGTCATCA AACTGGACAG TCTGACTACC AAATGTCGTG TAGTTTTTGA TGGATCAGGA 2820 + AAAGACAGCT CTGGAGTATC GCTCAATGAC AGACTACATA TTGGTCCACC GATTCAACGC 2880 + GATCTTTTTG GCGTTTGTCT ACGCTTCCGG CAGCACCAAT ATGTTTTATG TGCAGATGTC 2940 + GAAAAGATGT TTCGAGGCAT TAAAGTCTTT AAGCCACACA CCAATTTTCA GCGCATTGTT 3000 + TGGCGCACGA CTGAGAATGA ACCTCTGCTT CATTTTCGCC TGCTGACGGT TACCTACGGA 3060 + TTGGCACCGT CACCATTTCT GGCTGTTCGA GTTCTAAAGC AACTTGCCGA CGATCATGGC 3120 + CATGAATACC CTGCAGCAGC TCACGCTCTT CTGCACGATG CCTATGTGGA CGATATCCCG 3180 + ACAGGCGCCA ACACATTCGA GGAGCTTATG ATTCTCAAGG ACGAGCTTAT AGCCCTCTTG 3240 + GATAAGGGAA AATTCAAGCT ACGCAAATGG AGTTCTAATA GTTGGCGTCT TCTGAAATCA 3300 + TTACCAGAGG AAGATAGATG TTTTGAACCT ATCCAGCTCC TCAACAAATC AGCTGCGGAT 3360 + TCACCTGTCA AAGTTCTTGG TATCCAATGG AACCCTGGGA AGGACGTCCT GTATCTCAAC 3420 + CTAAAGGGAT GCGATGCGAC CATTTCTCCG ACGAAAAGAG AACTCTTGTC TCAGCTATCA 3480 + AGAATTTATG ATCCGCTTGG ACTGGTAGCG CCGGTCACAG TTCTACTCAA GCTAATCTTC 3540 + CAAGAAAGCT GGACAAGTGT CCTGCAGTGG GACGACCCCA TACCTGAAAG TCTACGTACG 3600 + CGCTGGAGAG CCTTAGTAGA GGATTTGCCA GCACTTACGC AATGCCAAGT ACCACGGTAT 3660 + ATTGCGTCAC CATTTCGAGA TGTTCAACTA CACGGATTCG CCGACGCATC CTCGCACGCC 3720 + TACGGTGCGG TAGTTTACGC TCGAGTTGCA GTTGGATGCA GCTTTCAAGT AACTCTGGTT 3780 + GCCGCCAAAA CACGGGTGGC CCCGATCAAG CCCGTATCAA TTCCACGTTT GGAGCTAAAC 3840 + GCTGCGTTAC TTCTATCTCG ATTGCTTTCT ATTGTCAAAA CATCACTAAC AATTCCTCTT 3900 + TTCAGCACGA GCTGCTGGAC AGATTCAGAA ATTGTGCTAC ACTGGCTTTC AGCTCCCCCT 3960 + CGACGGTGGA ACACCTACGT CTGCAACCGA ACTTCTGAGA TATTGAGCGA CTTTCCCCGT 4020 + AGCTGCTGGA ACCATGTTCG CACGGAAGAC AATCCTGCAG ATTGTGCTTC CCGAGGACTT 4080 + CATCCGTCAA AGCTTCTGGA GCATCGACTG TGGTGGAAAG GTCCGTCTTG GCTGGCCACA 4140 + CCCACCTCTG AGTGGCCACC TTCTACAAGC AAGTTCAGCG TATCTTCAAG TTTCGATGTC 4200 + AACACCGAAG AACGAGCCAT AAAGCCCACG ACTCTACATA ACTTTCCTGA TGAAAGTATA 4260 + CACGAGTTAC TCATCCACAA ATTCTCAACC TGGACGCGTC TTATAAGGGT ATCTAGCTAC 4320 + TGTCATCGCT TTATTCACAC TCTTCGATCC CATCATAGGA ATTCGGCACC ATTCCTTACG 4380 + TCTGAAGAGT TGCTGGACGC ACAGCGCCGA CTTATTCGAC ATGTGCAACA AAAATCCTTT 4440 + GCCAGAGAAT ATGAGCAGCT AGAGAATCGA CGCCAGCTTA ACGCTAAATC GCATCTTATC 4500 + CGGTTTTCTC CGTTTCTGGA TGATTATGGA GTAATGCGAG TCGGTGGGAG AATCGAGCAA 4560 + TCTACACTCA ACTATAACGC CAAGCACCCG ATTCTGATAC CTAAAGATAC ACCACTAGCT 4620 + GGACTCCTGG TTCGACATTT TCATGTCTCC TATCTGCACA CTGGAGTTGA TGCAACGTTC 4680 + ACCAATCTTC GTCAGCAGTA CTGGATTCTG GGAGCCCGCA ATCTCGTCAG AAAGGCAGTC 4740 + TTCCAATGCA AATCCTGTTT TCTTCAACGA AAGGGCACAA GCAACCAGAT CATGGGAGAG 4800 + CTACCAATTC CTCGAGTTCA AGCTAGCCGC TGCTTTCAAC ACACAGGGCT GGACTACGCT 4860 + GGACCGATCG CAATCAAGGA ATCAAAGGGA AGAACTCCAC GCATCGGAAA GGCATGGTTT 4920 + TCTATTTTCG TGTGTCTCAC TACAAAGGCA CTTCACATCG AGGTTGTTAG TGAGCTAACT 4980 + ACACAGGCTT TCATCGCAGC CTTTCAACGA TTCATTGCCC GCCGAGCGAA GCCTACTGAC 5040 + CTGTATTCGG ATAATGGAAC AACATTTCAT GGAGGCAAGA AAACTTTGGA TGACATGAGA 5100 + CGTCTGGCCA TTCAACAAGC CAAAGATGAG GAACTAGCAG GATTCTTTGC CAATGAAGGG 5160 + ATTTCTTGGC ACTTTATACC CCCGTCTGCT CCACATTTTG GAGGGATGTG GGAAGCTGGA 5220 + GTTCGCTCAA TTAAACTCCA TATGAAACGA ATACTTGGAT CAAAGGCTTT AACGTTTGAG 5280 + GAGCTCTCTA CTGTCCTGAC CCAAATTGAA GCTATCCTGA ATTCACGCCC GCTGTGCCCA 5340 + ACTGGGGATA ATTCTTTGGA TCCACTGACG CCTGCTCATT TTTTGACTGG ATCTCCGTAT 5400 + ACTGCATTGC CTGAACCCTG TCGTCTGGAT ATGCAAGTCA ATCGATTGGA GAGGTGGAAT 5460 + CAGCTGCAAG CCATGGTTCA AGGCTTTTGG AAAAGGTGGC ATATGGAATA CCTGACATCT 5520 + CTTCATGAGC GGACAAAGTG GCATCTGGAA ACCGAGAATC TGAAGATCGA CACACTGGTA 5580 + GTACTCAAGG AGCCCAATCT ACCGCCCTCT AAATGGATTC TTGGCCGCAT CACAGCAGTG 5640 + CACGCAGGAA TCGACAACAA GGTCCGAGTC GTTACAGTGA AGACTGCTCA CGGATTATAC 5700 + AAACGCCCAA TTGCCAAAAT CGCTGTACTG CCTCTCTGCT GAACAACCGT TCAGGGGGGC 5760 + CGGTATGTTT GGGAACGAGA CACCCTGTAT ACGCGAACAA GTCACCCTTT ATCTTTATTT 5820 + ACATTCTTAT TTGTCTGCAG CTTCATCGGA GCTTATCAGC GGAATCAATG TAAGCATCGC 5880 + ACCGCTGTAA TTGTCCGCGA GCTTGCCCAG TACTTTTCCA AACTTCTAAC TCCCTTCTAA 5940 + CTGTAACTTG TTTACGTCTT ATGCTAGACT AATCGTATGG CGTGATTACA GCCAAAGCTG 6000 + AAGTCAGTCA CAATTTTGAT CTGCGAGAAA ACGTACGCAT CGGTGTCGAA ATAATTAATA 6060 + TTAAGTGTCT GAACTTAACC AATAAATGAA AATTAACAGT AACACTGGCG GTTTTATTTA 6120 + TAAACA 6126 +// +ID 412 standard; DNA; INV; 7567 BP. +XX +AC nnnnnnnn; +XX +DR FLYBASE; FBte0000007; Dmel\412. +XX +SY synonym: mdg2 +XX +FT source nnnnnnnn:1..7567 +FT SO_feature five_prime_LTR ; SO:0000425:1..514 +FT SO_feature three_prime_LTR ; SO:0000426:7054..7567 +FT SO_feature CDS ; SO:0000316:679..1044 +FT SO_feature CDS ; SO:0000316:1408..1722 +FT SO_feature CDS ; SO:0000316:1888..3243 +FT SO_feature CDS ; SO:0000316:3864..6866 +XX +CC Berkeley Drosophila Genome Project. +XX +SQ Sequence 7567 BP; 2982 A; 1367 C; 1323 G; 1895 T; 0 other; + TGTAGTATGT GCCTATGCAA TATTAAGAAC AATTAAATAA AATAGCATAT TAACTTATGG 60 + CAGCACTTTG TTGCTATGTT TATGTTTATG TTTATGCACG CAGTTAGGCC AGGGCGGATG 120 + TAACATGATC ACCCACTCGA AGGCCACAAA GTATAAGTGC ATTGCCCAAT CGAAGGCAAA 180 + AAGTATAAGT GCATGGTCAG CATTCACACG CCGACCAAAT ACATATTACA TACGTACATA 240 + CATATCTCGC TCTCCCGATA AGCCTAGATA TATAAGATAT ACATAAGAAC GCCGCTCCGC 300 + TGCTGGCGTA CCCGGCAGCG CAGCTACGCG GATTAGCCTA AGTCCAAATA TATAAAAAAC 360 + TGTAAAATCG GAGAGACTCT GTAGACGTTG AGCTGACAGA ACCATTTCTG CCTACTCTAA 420 + AATCAAAAGA AGAAATTGAA TAAATATATG TCAGCCCGAC GGCTGCCTTA AACTTAAAAC 480 + GGACTTGTGT TCTTAATTGG AGTTCATCAT TACATGGCGA CCGTGACAGT CGTCCAACGC 540 + TGGACGAATT GACCAAAGCT GGTGAAAACA AAGGAACAAA GGAACACTGG ACTGGAAGAA 600 + GACTGGACTA ATTAAATGGA ACTGCAAAAA CCAAGGAAAA ATCTGAGTGA GTAGAGTTCT 660 + ATTGAGTATG GGCAAACACC GTGGCGGTTT GAAAACTAAG CTGAATAAAC GTATAGCCCA 720 + CGTAAGGTGG CTAATATACG GTCAGCAAAC GCCACCGGTT TGGTCGAAAG CTCTAAAGCT 780 + ACATGCAGAG CTAGACCACT TGTTGCAATA TCAGCAAGAA TTAAAGACCC ATAAGCTCGA 840 + GAAAACTCAC TCAGATAATA TTAAAAATAT ACCCACAATT AATGAAGTTC CAAAATACCA 900 + GGCATGTCCA GCACCAGCAC CAGCATTAAC AAAACCAAAG AAGTCCTGCC CCCCTGGCTG 960 + CGAAGGAATC TGGAGTCCCC ACTGCCTGGG GACTTGTGAG CGACCATCGA CGTCTTCAGC 1020 + GGCGAAGAAA TAGACAGCAG CGAGGGAGTG TCAGCGTGCC ACCCCCGGCG ACGCCCAGCT 1080 + GACACCCAAC AAATAGACAG CAGCGAGGGA GTGTCAGCGT GCCACCCCCG GCGACGCCCA 1140 + GCTGACACCT GATGAGCATC ATCAACAGCA GAATATAATA ATAAATATAT ATAAATATAA 1200 + AGTAAATATA AAATATATAT AGATAAGAAA AATTGTAAGA AATATTGTAA AACGGAGCAT 1260 + ATACTATTAT GCCCTGTTAA CCCAATATGG CCCGTGAAGC CATAGCTAGA ATCAGGCAGG 1320 + CAACAATGTA AAATACAATT TTTTTTTACT CTTGCGAACA TTGAAAGATT TTATAAATAG 1380 + ATAATTCCAA ACATAAATGT CTATAGAGAC AAATGAAATA AGTAAAACTG AAAATAAAAG 1440 + TATATACAAA GGAAATTTTC TATTCTATTC TCCAAAATAT AAAATTAGTA TACCCAAAAT 1500 + GGGTCTAATA GACACTAAAA CTGTGGACTC TACAGCCAAT GTAATAAATA AAGTAGAAGT 1560 + CCAAAATGCA GACTTGTTCT GGATAACCAT AATACTAATT GTAATTGCAT TAATTATGGT 1620 + ATCCAATGCA TTAATAAAAA TATACAAACT GCATAACAAG TGTCTTAAGA AACGATACCG 1680 + TAGCACTGCT AACGGTATAG ATAATATTTA AGGAAGATCT TTAATAAAGT CAATTATGAA 1740 + TGAAAATATG AGAAAAATTA TATGAAAAAA AAAAATAATA AATAAAAAAA AAATATAAAA 1800 + CGTAATATTG AATTTATCTA CATTAAAAAA AAATATATAC AAATGAATAA ATTTGAAGTT 1860 + ATGAGTATAC CACAGCATGG ACTGGGAAAA GCTTGTTGAT CAGATAAAAG ATCAAAATGA 1920 + AAATTTCAGA AAATCCTATA AGTGCTTAAC GCAAAACAGA TCAACACAAG CTGTAACAAT 1980 + CAATAGGAAT GCCCAAGTCT TGGTAAATAG TTATAATGAA ATCAGAGAGT TGATCCAACA 2040 + AAATAGAAAG AATTTGGAAC GCAAACAGTG TGCTAAGGCT TTGAACCTAC TGGTGACATT 2100 + AAGAGAAAAA TTAATATTTA TAAAAAATAA ATTCAGTCTC CAGATAGAAA TTCCAACCAT 2160 + AGTAAACACC CCACTAAGAA TAAATTTGAA TGAAGACAGC ACTAACTCTG ACGAGGAAGA 2220 + TAGGACTATA GTCAAGGAAG ACATTAAAGA GGAAGATCTT CACGATCTAA CTATACCAGC 2280 + AAAATTAATG CTGAAGAACG ACGATAAAAC AAATAACGCA GCCGACTCCG AAAATAACTT 2340 + AACCATGGCA GAAGAAGCAG CTGCCATTAG GTCTTACATT AGGGAAGTCG CCTGCACAGT 2400 + GCCAGAATTT GATGGGCAAA AGATCCATTT ACAAAGATTC ATTAAGGCAA TCAAATTGGT 2460 + AGACCTAGCT AAGGGACCAT TTGAAGACAT TGCAGTTGAG GTCATTAAGT CAAAAATAGT 2520 + TGGCACAATT TTGAACTCAG TTGACAATGA AACGACAATT CCAGCAATTA TAAACAAATT 2580 + GCAGAAAGTA GTTGTCGGTG AGACATCCAG TAATGTCAAA GCAAAGCTAG CAACAGTTCA 2640 + GCAGAGAGGT AAAACTGCAA CGCAATTTAC CGCTGAAGTT GATAGCCTGA GAAAACTTTT 2700 + AGAAGCTTCC TATATCGATG AGGGTATACC TCTAGAACAT GCCACTGGTC TAAGCACCAA 2760 + AGAGGCAATT GAAACCATGA TACATCGTGC TGAGCACGAA AGTATCAAAA CAGTACTGGA 2820 + AGCAGGGACT TGCACCACTA TGGATGCAGC GATAAGCGCA TACATAAGAA CGAGTACAAG 2880 + AGTTACCGGT GACATCAATA AAGTGATGTA CTTTAGAGGT AACAGACCCA ATAGAGGATA 2940 + CGGAAATGCC AATAGAGGTA GTAACCGCGG TAGAGGCTTT AATAACAATA GTATTAGAGG 3000 + CAACTACCAT AACGGTTACC AAAATAACGG TTACCAAAAT AACGGTTACC AGAATAACGG 3060 + TTATCAAAAC CGCTATAATG GAAATAATAA CCGTTATAAT GGCTATAACA GAGGCCGTTA 3120 + TAATGGAAAC AGAGGCCGTA ACAACAGTCA GAACAACTAC AACAGAAACA ATGCCAATGT 3180 + ACGAGTAATC CAAGAACAGG GAAACTCGCA ACAGCCTTTA GGTACTCAGT AGAAGAAGAT 3240 + CGTAGAGTAT ACACCATCAA TTATAATCTC AACATATTTT CTACATTCAT TCATGCCAAA 3300 + ACAGGCGTAA AACTAGTTTT TCTACTTGAT ACAGGTGCAG ATATCTCTAT TCTCAAAGAG 3360 + AACTCTGACA AATTTTCTAA TATTCAAATA ACCAATAAAA TAAACATTCA AGGCATAGGC 3420 + CAACAGAAAA TTCAGTCTCG AGGACAGACT TTTATTGAGA TACAGACAGG TAAATACGTT 3480 + ATCCCACACG ATTTTCATTT AGTAGATAAA AACTTTCCAA TACCGTGTGA TGGAATAATC 3540 + GGAATAGATT TCATAAAAAA ATATAATTGC CAAATCGATT TAAACCAAGA AGAAGATTGG 3600 + TTTATAATTA GACCAAACAA TTTGAAATTT CCAATATATA TTCCCATAGC ATACAGCTCT 3660 + GGTATTAACA CAACGTTATT ACCAGCAAGA TCCCAAGTTG TCCGAAGATT AATAGTATCA 3720 + TCAAAAGATG ATAACATTTT AATTCCAAAC CAGGAAATTC AAACTGGTAT TTATGTTGCA 3780 + AATACAATCG CAACATCAAG TAATACATTT GTCCGAATTT TAAATACAAC CGATTCCGAC 3840 + CAATTAGTCA ATATGGACAC TCTAAAATAT GAGCCACTTT CGAACTACAA TGTAGTTCAG 3900 + GCAAATAGTG AACACAGAAA TAAAACTGTC TTATCTCAAT TAAAGAAAAA TTTCCCCGAA 3960 + TTGTTTAAAT CACAATTAGA AAATATATGC AGCGAATATA TAGATATATT TGCATTAGAA 4020 + TCAGAACCTA TAACAGTTAA TAATTTGTAT AAACAACAGT TGAGATTAAA AGATGATGAG 4080 + CCAGTATACA CGAAAAATTA TAGAAGTCCT CATAGTCAAG TGGAAGAAAT ACAAGCCCAA 4140 + GTTCAGAAAT TAATAAAAGA TAAAATAGTT GAACCATCAG TTTCACAGTA CAATAGCCCT 4200 + TTGCTATTAG TACCCAAAAA GTCAAGCCCG AATTCTGATA AAAAGAAATG GAGATTAGTA 4260 + ATAGACTATC GCCAAATTAA TAAGAAACTT TTAGCTGACA AATTTCCACT ACCGAGAATA 4320 + GATGATATTT TGGACCAACT TGGTCGAGCA AAATATTTCT CCTGCCTTGA TTTAATGTCA 4380 + GGTTTTCATC AAATCGAACT GGATGAAGGC TCGAGAGATA TAACATCTTT CTCAACCAGC 4440 + AATGGCTCAT ATCGTTTCAC GCGATTGCCA TTTGGCTTAA AAATAGCGCC TAATTCATTC 4500 + CAAAGAATGA TGACTATAGC ATTCTCCGGA ATAGAACCGT CTCAAGCATT CCTTTATATG 4560 + GATGACTTAA TAGTCATAGG TTGTTCCGAA AAACATATGC TTAAAAACCT CACTGAAGTT 4620 + TTTGGTAAAT GCAGGGAATA CAACCTAAAG TTACATCCTG AAAAATGTTC ATTTTTCATG 4680 + CATGAAGTCA CATTTTTGGG ACACAAATGC ACAGACAAAG GAATTTTGCC GGATGACAAA 4740 + AAATATGATG TCATTCAGAA CTACCCAGTT CCACATGATG CGGACAGCGC TAGACGTTTT 4800 + GTAGCATTTT GCAATTACTA CAGACGTTTT ATCAAAAATT TCGCCGACTA TTCGCGGCAC 4860 + ATAACAAGAT TATGTAAAAA GAATGTTCCA TTCGAGTGGA CAGATGAATG TCAAAAAGCA 4920 + TTCATACATT TAAAATCTCA GCTAATTAAC CCAACACTCT TGCAGTACCC AGACTTCAGC 4980 + AAAGAATTTT GCATAACAAC AGATGCAAGC AAGCAAGCGT GTGGCGCAGT TTTAACTCAA 5040 + AACCATAATG GCCACCAACT CCCAGTTGCT TATGCATCCA GAGCTTTTAC GAAAGGTGAA 5100 + AGCAATAAGA GTACAACAGA ACAAGAGTTA GCAGCAATTC ATTGGGCAAT AATACATTTC 5160 + AGACCATACA TTTACGGAAA ACATTTCACT GTGAAAACAG ACCATAGACC ATTGACATAT 5220 + TTATTCTCGA TGGTGAACCC CAGCTCTAAA TTAACTAGAA TAAGGCTTGA ACTAGAGGAA 5280 + TATAATTTTA CAGTAGAGTA TCTAAAGGGC AAGGACAATC ATGTAGCAGA TGCGTTATCA 5340 + AGAATAACCA TCAAAGAGCT AAAAGATATA ACTGGAAATA TATTAAAAGT CACTACAAGA 5400 + TTTCAAAGTA GACAAAAATC CTGCGCAGGA AAAGAACAAT TGGATTTGCA AAAGCAAACC 5460 + AAAGAAATAG CTTCAGAGCC CAACGTATAC GAAGTCATAA CAAATGACGA GGTACGAAAA 5520 + GTAGTGACAT TGCAATTGAA TGACTCGATA TGTTTATTTA AACATGGAAA GAAAATTATT 5580 + GCAAGATATG ATGTTGGTGA TCTTTATACT AATGGAATTC TTGATTTAGA TCAATTTCTC 5640 + CAAAGGCTTG AATTGCAGGC CGGTATATAT GATATCAGCC AAATCAAAAT GGCACCGTGG 5700 + AAAAAAATCT TTGAACACGT TTCAATAGAT AAATTTAAAA ATATGGGCAA TAAAATATTA 5760 + AAGAATTTAA AAGTAGCGCT ACTTAACCCG GTGACCCAAA TAAATAATGA AAAAGAAAAA 5820 + GAAGCTATAT TGTCTACATT ACATGATGAT CCAATACAAG GAGGGCATAC AGGCATTACA 5880 + AAAACCTTGG CCAAGGTCAA AAGACATTAT TACTGGAAAA ATATGAGTAA ATACATAAAA 5940 + GAGTACGTAA GAAAATGTCA AAAATGCCAA AAAGCAAAAA CAACAAAGCA CACAAAGACT 6000 + CCAATGACGA TAACTGAAAC ACCAGAACAT GCTTTCGATA GAGTTGTTGT GGACACAATT 6060 + GGTCCACTAC CCAAGTCAGA AAATGGTAAC GAGTACGCAG TCACTCTCAT ATGTGATTTA 6120 + ACCAAGTACT TAGTTGCCAT ACCAATAGCA AATAAAAGCG CAAAAACAGT CGCAAAAGCT 6180 + ATATTTGAAT CTTTTATTCT AAAGTACGGT CCAATGAAGA CGTTCATAAC GGACATGGGA 6240 + ACAGAGTATA AGAATTCAAT AATTACTGAC CTGTGTAAAT ATTTGAAAAT AAAAAATATA 6300 + ACATCAACAG CTCATCACCA CCAGACAGTT GGAGTAGTAG AAAGAAGTCA TAGAACCTTA 6360 + AACGAGTATA TACGATCCTA CATATCGACG GACAAAACCG ATTGGGACGT ATGGCTTCAA 6420 + TATTTCGTAT ACTGCTTCAA CACGACCCAA TCTATGGTAC ATAATTATTG TCCATATGAA 6480 + TTAGTTTTCG GTAGAACAAG TAATTTACCA AAACATTTTA ATAAACTACA TAGCATAGAA 6540 + CCAATATATA ACATAGATGA TTACGCTAAG GAGAGTAAAT ATAGGTTAGA GGTAGCATAT 6600 + GCTCGAGCAA GAAAACTTCT CGAAGCACAC AAAGAAAAAA ATAAAGAAAA TTATGACTTA 6660 + AAAATAAAAG ACATAGAATT AGAAGTAGGA GATAAAGTTT TACTAAGAAA TGAGGTAGGT 6720 + CATAAATTAG ACTTTAAATA TACGGGGCCC TATAAGATAG AAAGCATAGG AGATAATAAC 6780 + AATATTACGC TACTTACTAA TAAAAACAAA AAACAAATAG TTCATAAAGA TAGATTAAAG 6840 + AAATTTCATT CATGATTGAA TTTAAACTTA TATTTTCCTT AATCATTTAC ACAAATTTTC 6900 + CATACACTAC GTATATTTTT ATCTTTGCAT TATAAAATCA ACTATTGTTG TTCAAACAAA 6960 + AACACAAACA AAATAAAAAT AAAAATAAAA TAATTTGCAT TTAATAATCA AAATAACTTC 7020 + ACTAGGTTAC GTTATTTTTC AAAAGGAGGG AGATGTAGTA TGTGCCTATG CAATATTAAG 7080 + AACAATTAAA TAAAATAGCA TATTAACTTA TGGCAGCACT TTGTTGCTAT GTTTATGTTT 7140 + ATGTTTATGC ACGCAGTTAG GCCAGGGCGG ATGTAACATG ATCACCCACT CGAAGGCCAC 7200 + AAAGTATAAG TGCATTGCCC AATCGAAGGC AAAAAGTATA AGTGCATGGT CAGCATTCAC 7260 + ACGCCGACCA AATACATATT ACATACGTAC ATACATATCT CGCTCTCCCG ATAAGCCTAG 7320 + ATATATAAGA TATACATAAG AACGCCGCTC CGCTGCTGGC GTACCCGGCA GCGCAGCTAC 7380 + GCGGATTAGC CTAAGTCCAA ATATATAAAA AACTGTAAAA TCGGAGAGAC TCTGTAGACG 7440 + TTGAGCTGAC AGAACCATTT CTGCCTACTC TAAAATCAAA AGAAGAAATT GAATAAATAT 7500 + ATGTCAGCCC GACGGCTGCC TTAAACTTAA AACGGACTTG TGTTCTTAAT TGGAGTTCAT 7560 + CATTACA 7567 +// +ID DMAURA standard; DNA; INV; 4581 BP. +XX +AC nnnnnnnn; +XX +DR FLYBASE; FBte0000112; Dmel\aurora-element. +XX +FT source nnnnnnnn:1..4581 +FT SO_feature five_prime_LTR ; SO:0000425:1..324 +FT SO_feature three_prime_LTR ; SO:0000426:4258..4581 +FT SO_feature transcription_start_site ; SO:0000315:191..196 +FT SO_feature polyA_signal_sequence ; SO:0000551:4482..4487 +FT SO_feature primer_binding_site ; SO:0005850:331..346 +FT SO_feature RR_tract ; SO:0000435:4247..4256 +XX +CC Composite sequence derived from AB022762, X70361 and X70362 +CC Assembly based on strategy described in PMID: 10333568 +CC Defective element with incomplete ORFs +CC Casey Bergman, 21-June-2016. +XX +SQ Sequence 4581 BP; 1102 A; 1074 C; 1456 G; 949 T; 0 other; + TGTCGCGGAT CGAATATTGT TATCGATAGG CTCTAGTTAG TATTTTTGAG AAGTCCGAAT 60 + GTGGAAGGAT TTGTAAGCCC ATATGTGTCT GGGCACGTTG TTTTTGGCCA TTGTAAATTA 120 + CCGGGAAAAT TTAGCTTTTC ATTGTCGTGT AAGAGTTGGA GGACACACTG CGGTGAGCTA 180 + ATAAGTTAAG TTAGTTGCAA TTGTGAAACA TTGAATTCTT CAAGAATAAA ACGTGTTCTA 240 + CTACCACGGA TTAGTCTGCC CTTTCTTTCG GGAACCAATG TGTGGGGTAG CCGTTTAAGG 300 + CAACTCCCTG GACGCACGAC GACAACCTTT TATTCGCAGT CCTAGGGCGA CTGCAGGGGC 360 + AACTTGCGCT GGAATGACGG TTTAGACGGC CAGCTAGAGA GTTGCCGGAG CTGGAGTGAC 420 + GGTTTAGACG GCCAGCGAGG AGGATTTGTG TGAGCGCAGC CAGCGCTACG TACCGGCAGA 480 + GGAGTCGCAG TCAGCGACAT AGAGGGACGC AGCCAGCGTC GAACGCCGGT ACGAAAGGGT 540 + CGCAGCCAGC GACAAGGAGA CGCAAGAAGC GTCATTTGTG GAGACCGCAG CCAAGCATCC 600 + GTGGCCGCAG CCAGCGGCAC GAGGCGTCAG AGACGCCATT TCGGACGCGC AGAGGCGCCG 660 + CCATTTTTGG AGCTGGGAAA GATGCAGCAT TCCCCCAGGA AGAGTGCCCG GCTGAACGGA 720 + GGGGAAGTCA CCCCTATAAC AACAGTGAGT CAGCAGCCAG CCAGTAGTGG AGCAGGAACT 780 + CGGACGCGGG TGAACATCAC GGCGGCGTCG ATTCCTTGCC CGGCCACTAC GGTGACTACA 840 + GTAGCTTCCC AACCTAGAAG TACTGCTGTC ACAGCTGCGA GTTCAGTACC GGAGGTGAAC 900 + CAGCCCCTCG TGTTGGAACT CATGGAGAGG ATCGCAGCGT TGGAGAGGGA GCTGGAGAAG 960 + ACTAGATCCC TAGAAAGTGT GAGCACCGCC AATTGCGCGC CAATCGCAGT TGGCCCAAGC 1020 + GCAGTTGGCG CCAACAGTGG AGCGTCGGGG CGGCCGCCAT TTTGGAGCGG CCAGCTAATA 1080 + CCCACATCTA ACGGAGAGGC CTTACATAAC GGGGACTGGG CCAGGCATGC TGCAACGATT 1140 + GCGCCCTTTC CCACTGTAGT CCACTTCAGC GCGTGGCTAC AGGAGTACGC AAACGTGGTG 1200 + TGCACGGTTT TGGACGTCGA GGGAAAGGAG CCGAGGCGTC GACTTCTACA TGCAAGCGTC 1260 + GACCATAATG AATGCGATCA ACAGGATGAT CGGCATGGAG GTTGTCCCAT CTGTGGAGGA 1320 + CAGCATGAAA TATTGAACTG CAGAAAATTT ATTGGAGCTT CGCCACAGGA AAGGTGGAGC 1380 + AATGTGAAGA GGCATCGGCT CTGCTTCAAT TGCCTGCGAA GCGGGCACAC GGCTAGATCC 1440 + TGCTATACGC AAGGTGAGTG CCAGGTTAAT GGATGCCGAA GGGAGCATCA CCGTCTGCTA 1500 + CATGGTGCGG ACGGAGGAAC GAAGGCCGCT GCAGCGAGGT GGCTTCAGAC GCCACGAAGG 1560 + GAACCAGCAG CCAGCAGTTT CCAGACGCAG CCTAAAGGGG AGGCCTTCGC TACGAGATGG 1620 + TCACAGGGAC CAGGAGAGGA ACCGGCAGCC AGCCGTTCCA AGCAACAGTC TGGAGAGAGG 1680 + AGCTCCACGT GAAGCGGGAG CGCCCATGCA GAGGAATTTG AGCTGCGTTG ACGCCGAAGG 1740 + AGGCCGTCTA CTGTTCCGTA TACTGCCGGT TACGCTGTAC GGAGCGGGGC GAAAGGTGGA 1800 + TACATATGCG CTCCTAGATG AGGGATCCTC CGTCACGATG ATCGATGACG AACTACGAAG 1860 + GGATCTTGGA GTGCAAGGAG AGCGTCGGCA GCTAAATATC CAATGGTTTG GTGGTAAGGC 1920 + AACCAGAGAG CCTACCAACG TGGTGAGTCC GAAGATAAGT GGAGTTGGAA AGCCCACTCG 1980 + CCATGTATTG AGAAACGTTT ATGCCGTTTC GAGCTTGAGT TTGCCGATGC AGACATTGAG 2040 + CCGACGAGAT GTCCAGGGCG TGCACAGGGA TGCGCGTCTG CCCGATGAAG CCTTACAGCA 2100 + ACGTGGTGCC GAAGCTGCTC ATCGGTCTGG ATCACGGACA TCTGGGGTTG CCACTTAGGA 2160 + CGAGGCGGTT CGCTCGAGAG GGACCGTATG CGGCCGCAAC CGAGCTGGGC TGGGTTGTGT 2220 + TTGGGCCTGT AAGTGGGCAA CCGACCACGC CGTCACCGAG GTCCTGCCTA CTTGCCGTGT 2280 + CAGTGGATGA CGCGATGGAG AAGATGGTGG AGGACTATTT CGACATGGAG AACTTTGGAG 2340 + TGAAGACCGC GCCGCCGGTC GCAGCCAGCG ACGATGTCCG GGCCCAAAGG ATACTCGAAG 2400 + ACACCACGGT GAAAGTGGGG CGTCGCTACC AGACGGGATT ACTCTGGAAG GACGACCACG 2460 + TTGTGCTGCC ACCGAGATAT GAGGACGACG ACGTGCAAGT GAGCTTCGTG AGTGCGAGGA 2520 + CGAAGTGTGC CCCAATGAGA ACGATGACGA TCCCACGGCT GGAGCTGCAA GCAGCAGTTC 2580 + TTGGAACCAG GCTGATGAAC ACTGTCAAGG AGGAGCACAG TGTGGTCATC ACGGACCTGG 2640 + TGTTATGGAC GGACTCTAAG ACGGTGCTGA GATGGATCGG CAGCACCCAC CGCCGCTGAC 2700 + AATGCGGCTG ATGATGCGAC GCGGTCGCAG AAAAGGAGTC GACCTTAGCC AGGAATCAAG 2760 + GTGGCTAAGA GGACCTGCAT TTTTGATGCA GCCAGCAGCC AGCTGGCCGG GGTCTGAGGA 2820 + AGGAACTGAG CGTGTTCCAG ATGTCCCTGA TGAAGAAGAG ATGCCCAGTG AGTTTGCATT 2880 + AGTTGCGGTA GACGATTTTG TCATTCCGTT TCAGAGATTC TCGAGCTTCA GTCGCCTGGT 2940 + GAGGACCACA GCCTGGGTCC TACGGTTTGC GCGCTGGTGC CGCAAACAGC GAAACGATCT 3000 + CGAGGAATAC GGCCTTACCG CAGCCAGAAT GTAAGGCCGC CGGAACCGCA CTGTGCATCC 3060 + CGTACAGTGC GAGGAGGGCC GTATTACTGT CACACAGGCA CAGTCTGACG GAGCTGATTG 3120 + TGAGAGACTT CCACGCCAGG ATGAAGCATC AAAATGTGGA TGCTACGATC GCGGAGATCC 3180 + GGACAATGTT CTGGGTCACA AAGATGAGGC GTGTGATGCG GAGAGTCATC TCATCGTGCA 3240 + ACGAGTGCAA GTTGCAGCGA GCGCGGCCGA TGCCGCCGAT AATGGGACCC CATCCGGAAG 3300 + ACAAACTGGA TGCGGGTGGA TGGCCATTCA AATACACAGG ACTGGACTAC TTTGGGCCAC 3360 + TGCTGGTGAC TGTGTCCCGT CACAAGGAGA AGCTTGGGTC GCCTTGTTTA CGTGTTTGAC 3420 + GACAAGGGCG ATTCACCTGG AGCTGGCGCA TGACCTGTCG ACGGATTCCT GCATAATTGC 3480 + GATCAGGAAC TTCGTCTGCC GTAGAGGGCC AGTATATAGA CTGCGCAGCG ATAACGGCAA 3540 + GAACTTCGTG GGAGCTGACA GGGAAGCCAG GCGCTTTGGC GACGTATTCG AGATGGAGAA 3600 + GCTTCAGAGT GAGTTGACAA GCAGAAGCAT TGAATGGGTG TTTAATTGTC CAGCGAACCC 3660 + GTCTGAGGGC GGAGTTTGGG AGCGCATGGT GCAGTGCGTC AAGAGAGTAC TGCGTCATAC 3720 + CCAGAAGGAA GTTGCGCCGA GGGACCATGT ATTGGAGAGT TTCCTGATTG AGGCGGAGAA 3780 + TATTGTAAAC TCGCGTCCGC TCACCCACTT GCCTGTGGAT GTGGACCAGG AGGCGCCGTT 3840 + GACGCCAAAC GATCTTCTCA AGGGAGTAGC CAATCTGCCG GATACGCCTG GATTGGATGC 3900 + GGAGCTGCCC AAGGAAGGTA CTACGAGGAA GCAGTGGAGA ATTTCTCGCC TGCTACGAGA 3960 + CCGTTTCTGG AGGAAGTGGG TCATGGAGTA CCTGCCTACG CTTGTGCGCC GCGAGAAGTG 4020 + GTGCCGACGA ACGGAGCCCA TCCACCAGGG TGATGTGGTC TTCGTCTGCG ATCCTGCCTT 4080 + GGCCCGACGA GAGTGCCGCA AGGGTATCGT GGAGGAGATC TACAGCGGAG CTGATGGAGT 4140 + TGTCAGACGC GCTAAGGTGC GCGTGAACGA AAACGGCCTA TCTAGGACAA TGATGCGACC 4200 + CGTCTCTAAA CTTGCAGTTA TGGATTTGAG TGAAGCGGTT CTTCACGGGG TCGGGGATGT 4260 + CGCGGATCGA ATATTGTTAT CGATAGGCTC TAGTTAGTAT TTTTGAGAAG TCCGAATGTG 4320 + GAAGGATTTG TAAGCCCATA TGTGTCTGGG CACGTTGTTT TTGGCCATTG TAAATTACCG 4380 + GGAAAATTTA GCTTTTCATT GTCGTGTAAG AGTTGGAGGA CACACTGCGG TGAGCTAATA 4440 + AGTTAAGTTA GTTGCAATTG TGAAACATTG AATTCTTCCA GAATAAAACG TGTTCTACTA 4500 + CCACGGATTA GTCTGCCCTT TCTTTCGGGA ACCAATGTGT GGGGTAGCCG TTTAAGGCAA 4560 + CTCCCTGGAC GCACGACGAC A 4581 +// +ID DMBARI1 standard; DNA; INV; 1728 BP. +XX +AC X67681; S55767; +XX +DR FLYBASE; FBte0000034; Dmel\Bari1. +XX +FT source X67681:1..1728 +FT SO_feature terminal_inverted_repeat ; SO:0000481:1..28 +FT SO_feature terminal_inverted_repeat ; SO:0000481:1701..1728 +FT SO_feature CDS ; SO:0000316:379..1398 +FT /name="Dmel\Bari1\ORF" +FT /db_xref="FLYBASE:FBgn0043784" +FT /db_xref="SPTREMBL:Q24258" +FT /db_xref="NCBI_PROTEIN:CAA47913.1" +FT /translation="MPKTKELTVEARAGIVARFKAGTPAAKIAEIYQISRRTVYYLIKK +FT FDTVGTLKNKKRSGRKPVLDQRQCRQILGVVAKNPSASPVKIALESKNTIGKQVSSSTI +FT RRRLKEADFKTYVVRKTIEITPTNKTKRLRFALEYVKKPLDFWFNILWTDESAFQYQGS +FT YSKHFMHLKNNQKHLAAQPTNRFGGGTVMFWGCLSYYGFGDLVPIEGTLNQNGYLLILN +FT NHAFTSGNRLFPTTEWILQQDNAPCHKGRIPTKFLNDLNLAVLPWPPQSPDLNIIENVW +FT AFIKNQRTIDKNRKREGAIIEIAEIWSKLTLEFAQTLVRSIPKRLQAVIDAKGGVTKY" +XX +CC Derived from X67681 (g7640) (Rel. 36, Last updated, Version 6). +CC Takis Benos and Michael Ashburner, 20-Aug-1997. +CC Any changes to original sequence record are annotated in an FT line. +XX +SQ Sequence 1728 BP; 596 A; 291 C; 332 G; 509 T; 0 other; + ACAGTCATGG TCAAAATTAT TTTCACAAAG TGCATTTTTG TGCATGGGTC ACAAACAGTT 60 + GCTTGTGCAG CAAGTGGGGG GAGGTGAAAT GCAAAAAAAC TTTTGCTTTT GCAAATTCAA 120 + ACCTATGCAG AGTCAGATGA AAGAAGAATT GAAAAAATAA CTGTTCCTAT GCGCAAGGAA 180 + GAGGCAAATG AAGAGATCTT TATCAGTTGT CAGAAGTATT TGCACACGGT TTCGTCGCAT 240 + CACAATTATT TTCACAACGC AATTTCTTCT TCAGTGATTG GTTTAGAGTG ACAAGTGCCG 300 + GTTTGTTTGC TTAAATACAT TTAAATTATT GAATAAAAAT TAGATTTAAT CATTTTCCTA 360 + TTACAGTTAT TAAATAAAAT GCCCAAAACA AAAGAGTTAA CAGTTGAGGC CCGGGCTGGT 420 + ATTGTTGCTA GGTTTAAAGC CGGTACACCT GCGGCCAAAA TAGCTGAAAT ATATCAAATT 480 + TCGCGTAGAA CTGTCTACTA CTTAATAAAA AAGTTTGATA CAGTTGGCAC ATTAAAAAAT 540 + AAAAAAAGAT CAGGCCGAAA ACCTGTGCTG GACCAAAGGC AATGCAGGCA AATACTTGGA 600 + GTTGTGGCGA AGAATCCTAG TGCCAGTCCG GTAAAAATTG CCTTAGAATC AAAAAATACA 660 + ATTGGCAAAC AAGTTAGTAG TTCTACAATT CGTCGCAGGC TAAAAGAAGC TGATTTTAAG 720 + ACATACGTTG TTCGCAAAAC GATTGAGATC ACACCAACCA ACAAAACAAA ACGTCTTCGA 780 + TTTGCGTTGG AATATGTTAA GAAGCCTCTT GACTTTTGGT TTAATATTTT ATGGACTGAT 840 + GAGTCTGCAT TTCAGTACCA GGGGTCATAC AGCAAGCATT TTATGCATTT GAAAAATAAT 900 + CAAAAGCATT TGGCAGCCCA GCCAACCAAT AGATTTGGTG GGGGCACAGT CATGTTTTGG 960 + GGATGTCTTT CCTATTATGG ATTCGGAGAC TTGGTACCGA TAGAAGGAAC TTTAAATCAG 1020 + AACGGATACC TTCTTATCTT AAACAACCAT GCTTTTACGT CTGGAAATAG ACTTTTTCCA 1080 + ACTACTGAAT GGATTCTTCA GCAGGACAAT GCTCCATGCC ATAAGGGTAG GATACCAACA 1140 + AAATTTTTAA ACGACCTTAA TCTGGCGGTT CTTCCGTGGC CCCCCCAAAG CCCAGACCTT 1200 + AATATCATTG AAAACGTTTG GGCTTTTATT AAAAACCAAC GAACTATTGA TAAAAATAGA 1260 + AAACGAGAGG GAGCCATCAT TGAAATAGCG GAGATTTGGT CCAAATTGAC ATTAGAATTT 1320 + GCACAAACTT TGGTAAGGTC AATACCAAAA AGACTTCAAG CAGTTATTGA TGCCAAAGGT 1380 + GGTGTTACAA AATATTAGTA TTGTATTTAT ATAAAATAAA GAAATTCTTA TGTTGAAATT 1440 + AGATGTTAAG CTGAAATTTA CTAAATTAAG TTGAGTGAAA ATACTTTTGA AGCGCAATAA 1500 + ACATGTGAAA ATACTATTGA CAACTTGCAT GCATATTTTC TTTTGCTTTA AGCTTTGTAC 1560 + TATGAACCGT TATCTTTCGT ATTTCTTTTC GACTACCTTC TGCATAGATC AAGCTAAGCG 1620 + ATAAGAACTA TTTCAGGCAA ATCGGACAAC AACAAGAAGA AATATAACAA AAAGAAGTTG 1680 + AAGTTTGCAA ATATTGTGCG TTGTGAAAAT ACTTTTGACC ACCTCTGT 1728 +// +ID BS standard; DNA; INV; 5142 BP. +XX +AC nnnnnnnn; +XX +DR FLYBASE; FBte0000780; Dmel\BS. +XX +FT source nnnnnnnn:1..5142 +FT SO_feature CDS ; SO:0000316:341..2248 +FT SO_feature CDS ; SO:0000316:2245..2965 +XX +CC Sequence identified by REPBASE: +CC http://www.girinst.org/server/RepBase/RepBase6.6.embl/drorep.ref +CC Assembled and annotated by Josh Kaminker & Michael Ashburner. +CC REPBASE states this to be a consensus sequence. +CC This replaces that from complement(X77571:651..5776) in versions +CC previous to 4.8. +XX +SQ Sequence 5142 BP; 1652 A; 1222 C; 1075 G; 1193 T; 0 other; + AAATCTGCAT TCATAGAGAT CGGTTGTGTC GCGCGTATGC AAAAGTGATC TATTTTGCTT 60 + TATTGTTGCA ATTTCTTGGG TGCTTAAAAT AGCACTCACC AGTACATTCG GGCGCTGCTT 120 + CGTGCGGTGT CGGCATCTGG CCAACAACAA AAAGCGTTAA TCGAAGTGCG GTGTAGCTAC 180 + GATACCTGCC CTTCGGGCAA CTTATTCCCC TCACCCCGCG CAAAGCCGCT GAAGGGGGCA 240 + ATAAAATCTA TGCTTATCAG CAAAACTGAT CCGTATTTGA TCTGTTTTGT GGTCAGTTAA 300 + GCAAGCTATT TTGTAAATAT TAAGAATTAT TATTAAGACA ATGGATGAGA ACAATTCTGA 360 + TGACACCCAG CTTTTAAATA AGCAGAGTAA CCATAGAACA ATGTTCTCAA TAGCTGGCAA 420 + ATTACCTCAC GAGATTAGAA ACGAGTGCCG ATCAGCAATT CAACGCTTTA CAAGCAGCGT 480 + AACTCAAAGC AGTAGCGTCA CCACAACAAC GGTGACATTT ACTAGTGCCA ATAACAGCAC 540 + CATATATACA ATGGCAAATG CCGCAATAAG CAGCCCGTGC CTTGGAACAA GATCCACTCA 600 + CCAGGAAAGT TCCACATTGA TAAACTCCGG AATCGTAGAA GATAATCTCA GCGATGCTGC 660 + CAGAAGGTTA TTAAATGACC AAAATCAGAG AGCGGGTAAA AGGAAAAATG GAAAGCCCTT 720 + GTCCCCCATC TCCAACCCGA AAAGAGGGAG TAGCAGCCAA GTTTTACACT CGCCCCCTAC 780 + GACTAGCCTG AAGATAAGCT CTAATAATAG GTTTGCCATT CTGGACACGG ATATTTCTAC 840 + TAACGAAGAA AGCGTGGAAG GCATGATGAT AGAGGGTGCT GATATTGACA GTGCCCATAT 900 + GGATGATTCT CAACTCGATG GTTCCAATAC TGGTCGAAAC TTGCAGGAAA CACACAATAC 960 + AGCCAATCAA CTTAATGATC ACAAAAAACC ACCACAAATT GTTGTAAATA TCAGAAACTT 1020 + GAATGATCTG TTTGAGCTTA TAAAAGAAAA GACAAGCTTA GATAACGTTG TCGTTAAAGC 1080 + TAATCAAGGG GAAACGGTCA GAATATTTCC AAAAGACAGC GACACTTACA GGAAAATAGT 1140 + GAGCCATATG GATGACATTG GTATTCAGTT TCACACTTAC CAAATGCTGA CAGATAAGCC 1200 + ACACAGAATT GTAGTAAGGG ACTTACATCA CAGTACATCA AACAAAGACA TAACCGCCGA 1260 + TCTGAAATGT TTAGGCTACG AAGTGCTCCA CATTCACAAC CCTAGTTCTA GGACTAATAA 1320 + GGACGAAAAA CTAAACATCT TTTTCATTAA TATAAAGCCC TGTGCAAAAA TTAATGAAAT 1380 + TTACCATGTC AAGACCCTTT GCCGACAGAA AATACGGATT GAAAGGATGA GAAAGTCTTC 1440 + TGAAATTGCG CAATGTCGTC GTTGTCAGGA GTACGGCCAT ACAGCTAAAT ACTGCCGCAG 1500 + ACACCCAAAT TGTGCCAGAT GTGGCGAAAA TCACCAAACC ATGCAATGCA CCCGACCGAT 1560 + AGACGCACTG CCCACATGTT ACCATTGCTC TGAAAATCAT ACGGCTAGCT TCAAAGGTTG 1620 + CCTAAAGTAT CAGGAGCTTC TTCGCAGATC TATGGGGCCT GCAAGAAATG GAAACAGGTT 1680 + AAATAAGAAC ACCCATCATC ACTCTCCTAG AGACCGGCAA GAGCTTCCTG CCTTGCAGCC 1740 + CAATTACCGC AAGAACAACA CCCAATCAAC AGTACAGCAG TTATCGACAC AACCACAGCT 1800 + TAATTTTGCC CAAAGCCAAC CATCTATAGG CACTGGTGGA AACAGAGCAG TATCCTATGC 1860 + TACAGTAGTA AAAGGATACC CAAAAATAGC GCCCTCCAAG GACGGACCAG CCCAGCGTCA 1920 + ACGCTTAAAC AACCCACAAA CGAAACAAAT ACTGCAGCAA CACCGATCGA ATACACAGCA 1980 + GAATAACTCA TCTGATGTGC AAGTATTCTT ACAACAGCAA CAACAACAGT TTCTGGAATG 2040 + GCAACAGCAG ATCCAACAAC AACAACACCA ACAGTTTCTT ATGTGGTTGC AACAGCAGCA 2100 + GCAAGAACAA CTACAGTATA AAAGCCAAAC CAATCAACGA CTGGAAAAGC TTGAAAAAAT 2160 + GGTTCTTGAA CTAGCGAATA TGTTAAAAGA ATGGGCTGGG AGTGAACTTA AGCCCCAGCT 2220 + CTTTAACAAC GTCTCAGCCT CCCTATGAAT CCACTAAAGA TTCTTATTTG GAATGCTAAC 2280 + GGCATTTCAA GAAAAGCCAA AGATGTTGAG CTGTTCGCGC ACAACAAAAA GATAGACATC 2340 + CTTCTTGTGA CTGAACTAAG ACTCAAAAGA GGGGAAACTG TAAAGATATA TGGATATGCG 2400 + TACTATCCAG CATATAGGCC ATCCCTTAAT AATAATAGTG TTGGCGGAGT AGCGGTGTTC 2460 + GTGAGGACAA CTCTTCGCCA CTTTCCACAA AGGGTCATTG AGACACGCCA CATACAATTG 2520 + TCATCAGTAA AAGTAGCCAC AGGACTCGGG GACCTGCAGT TTAGCGCTAT TTACTGCTCC 2580 + CCAAGTACTA GAATCGAGGA AAGACATTTT ACTGACATAA TACGCGCCTG CGGCCAAAGG 2640 + TACTTGGTAG GTGGCGACTG GAATGCCCGC CACTGGCTTT GGGGCGACAC TTGCAATTCA 2700 + CCTCGCGGGC GGGAACTAGC AGAAGCCTTG TCCGTGACTG GAGCTAAGAT CCTCGCAACT 2760 + GGCTCTCCGA CAAGGTATCC GTATGTGCCC AGCCATACGC CCTCATGCAT AGATTTCGCA 2820 + GTGTATCATG GTATACCAGA CCACCTAGCA ACTATAACAC AAAGCTGGGA CTTGGATTCT 2880 + GATCACTTGC CTCTTATCAT TAGCATTGAG ACAGACAGTA TTCATGTCAA TCCAAGTCCC 2940 + AGGCTAGTCA CCAAACACAC TGACCTCCTT GCCTTTAGCC GACAATTGGA GAGCCTTATT 3000 + TCGCTGAACA CCACGCTTAA TTCTGGTGAG GAAATTGAAA TGGCTGTTGA CAACCTAACT 3060 + GAAAGCATAC ATAGGGCCGC GGCTGTCTCT ACTTCTCCCG TCCCTCGGAT AGGCACCACA 3120 + TATGGGATAG TCTTGACAAG AGAGGCTAGA GAGCTTCTGA CACAGAAAAG AAGACTCCGA 3180 + AGGCGAGCAA TCCGATCTCA AGACCCCTGG GACCGACTTT TATGGAACCG TGCTGCAAAG 3240 + CAACTACGAA ACGTCCTCAG AGAACTTCGA AGCAACTTTT TTGAGCAGAA ACTAGCTAGT 3300 + ATGGACTACA CAGTGGATGC TGGATACTCG CTATGGAAAT GCACCAAGTC CCTTAAAAGA 3360 + CAGCCGTTTA GACAGGTTCC TATAAGGTGT CCGGGAGGCG AACTTGCTAA AAATGAAGAG 3420 + GAGCAGGCTA ATTGTTTTGC AAATCATCTG GAGACAAGGT TCACCCACTT CCAATTCGCT 3480 + ACAACGGAGC AGTATCAAGA GACGCTTGAT AGCCTAGAGA CACCTCTGCA AATGTCACTA 3540 + CCCATTAAGC CCATCAGGGT TGAGGAAATT GTCGAAGCTA TCAAATCTCT TCCGTTAAAG 3600 + AAGTCTCCTG GCATCGACAA CGTTTGCAAT GCCACACTAA AAGCACTACC TGTTCGAGCA 3660 + ATTCTCTACT TGGCGCTGAT ATATAATGCC ATACTCAGGG TGCAGTTTTT CCCAAAGCAG 3720 + TGGAAAATGG CAGCAATCCT AATGATACAT AAGCCTGGTA AACCTGAAGA GAGCCCTGAA 3780 + TCGTACCGAC CCATAAGTCT TTTATCTTCG CTATCCAAGC TATGGGAACG ACTGATTGCC 3840 + AACAGATTAA ATGACATTAT GACCGAGCGT CGTATCCTGC CGGATCATCA GTTTGGCTTT 3900 + CGTCAGGGAC ACAGTACTGT GGAGCAGGTA CACAGACTGA CAAAACATAT CCTTCAGGCC 3960 + TTTGATGATA AGGAATACTG CAATGCTGTG TTCATTGACA TGCAACAGGC ATTCGATAGG 4020 + GTCTGGCATG ACGGCCTTAT CAGCAAAGTT AAAAAGTTAT TCCCAGCACC ATACTATGGA 4080 + GTCCTAAAAT CATACTTGGA AGATCGGAGA TTCATGGTCA GGGTCAGAAA CTCCTACTCG 4140 + ATTCCCCGCG TTATGAGAGC TGGAGTTCCG CAGGGCAGCG TACTGGGACC GTTGCTCTAC 4200 + TCAGTATTTA CTGCAGATCT GCCCTGCCCA AACGCCTATC ATATGGCAGA TCCCAGGAAG 4260 + GCCCTTCTTG CTACGTACGC TGACGATATT GCCCTGCTGT ACAGCTCTAA TTGTTGCAAC 4320 + GAGGCAGCAA GGGGTCTCCA AGAGTACCTC ACCACTCTGG CTGCATGGTG CAAAAGATGG 4380 + AATTTAAAGG TCAATCCGCA AAAGACCATC AATCCCTGCT TCACCTTGAA GACCTTAAGT 4440 + CCCGTCACCG CACCCATAGA GCTGGAAGGT GTAATCCTAG ATCAACCTTC ACAGGCTAAG 4500 + TACCTCGGGA TTACCCTTGA TAAACGGTTG ACTTTCGGCC CGCACCTGAA AGCTACGACT 4560 + CGGAGATGTT ATCAAAGGAT GCAACAACTT CGATGGCTGT TAAACAGAAA AAGCACCATG 4620 + ACACTGAGAG CCAAAAGAGC AGTCTACGTC CACTGCGTAG CCCCGATCTG GCTGTACGGA 4680 + ATACAGATCT GGGGTATCGC AGCAAAATCC AACTACAACC GCATTCAGGT ATTGCAAAAT 4740 + CGTGCCATGC GTGCAATTAC AGACTGCCCA TACTATGTAC GTGGCACTAC CCTTCACCGT 4800 + GATCTGAATC TTCATACAGT GGAAGAGCAG ATCTCCAGGC ACACCAGCAG ATATAGTGAT 4860 + AGACTAAGAC GACACCACAG TATACTTGCT AGACGCTTAC TCCCTGCTAG GCCTCTAAGG 4920 + AGATTAAAAA GGAAGGGTTT CGCCAAAACA CTTGGACAAC CCTAAAGACC CCCTCGAAAT 4980 + ATGAGACAAA GTTGTAAGTC CTCACATGAT TAGTGAGAGG TTTGGTTCTA TCTTTTATAT 5040 + GTTAATTGCG CTGTTATGTT ACTGTTATTG CATTGTATTG ATTCATCGCT TCTAAATAAA 5100 + TAATAAAAAA AAAAAAAAAA AAAAAAAAAA AAAAAAAAAA AA 5142 +// +ID DMU89994 standard; DNA; INV; 6411 BP. +XX +AC U89994; +XX +DR FLYBASE; FBte0000739; Dmel\Burdock. +XX +FT source U89994:1..6411 +FT SO_feature five_prime_LTR ; SO:0000425:1..275 +FT SO_feature three_prime_LTR ; SO:0000426:6136..6411 +FT SO_feature CDS ; SO:0000316:564..2057 +FT SO_feature start_codon ; SO:0000318:1..3 +FT /name="Dmel\Burdock\gag" +FT /db_xref="FLYBASE:FBgn0043782" +FT /db_xref="SPTREMBL:O01350" +FT /db_xref="NCBI_PROTEIN:AAB50147.1" +FT /translation="MSDSDNLLDNLVSSLNKWSAHQASRQNSAEKNNKSSDNWWSKTKT +FT TSEMEFEAQLKAIVESAVAGALAVQKQSFEKQLQEMNERIGKLTVNTPEVETYVDAEIR +FT PGVVCSEPLDILKSLPDFDGKSETYVSWRKAAHVAFKVFKDYEGSSTFYQALGIMRNKI +FT KGPANTVLASFNTPLHFKAMISRLDFTYSDKRPIYLIEQELSTLRQGDMTLTEFYDEVE +FT KKLTLLTNKTIMTFDSALAMSLNEKYRTDALRVFVTGAKKSLSDILFAKGPKDLPTALA +FT LAQEVESNHERYQFALIYSKNIGDRGQKIEQRHSDKDRNSIMPMQTKNPYFSKRQVHTY +FT DNQERQDPVQLTNPDVSMRSRRTGNFGQTPFPTQGNIWPSQQQNSWPSQQQYSWPSQQQ +FT NSFRTQNQFASQPQQQNTSQAQGHFGYAQASKRPTSGSARFTGPKQQRINYLPHEKGQC +FT EEDTDGYQKEAEAEVDDYEDELVNYDHVHFLATNPCYRT" +FT SO_feature CDS ; SO:0000316:<1994..5119 +FT SO_feature start_codon ; SO:0000318:1..3 +FT /name="Dmel\Burdock\pol" +FT /db_xref="FLYBASE:FBgn0043781" +FT /db_xref="SPTREMBL:O01351" +FT /db_xref="NCBI_PROTEIN:AAB50148.1" +FT /translation="GRTSELRSCSFFSHKSLLPYIEREIAGRTIKLLIDTGASKNYIQP +FT LPELKNIMPVQNKFTVKSLHGCNTVKQKCFIKLFNTSVQFFILPSLSSFDAIIGLDLLK +FT QGNATLDFKNKTLNINNEVESIQFLRCDSVNFANIENIVVPNQISNKFHTMLRNRLAVF +FT AEPEEALPYNTNIVATIRTEDDQPIYSKLYPYPMGVSDFVNKETHALLKDGIIRPSSSP +FT YNNPVWVVDKKGTDEEGNTKKRLVIDFRKLNLKTIDDKYPIPNVVWILSNLGKARFFTT +FT LDLKSAFHQILLAEKDRAKTAFSVGNGKYEFCRLPFGLKNAPSIFQRAIDDVVRDRIGK +FT SCYVYVDDVIIFSNGIEDHVNDVAWVLDRLSGANMRVSKEKSFFFKESVEYLGFMVSSG +FT GITTSPSKVEAIQKYNQPTNLFSVRSFLGLASYYRCFIKDFASIARPLTDILKGENGKV +FT SASQSKKIPISFDERQCSAFEKLKNVLVSENVMLLYPDYRKAFDLTTDASAFGLGAVLS +FT QDGKPVTMISRTLQDRELNFATNERELLAIVWALKSLRNYLYGVKNLNIFTDHQPLTYA +FT VSDRNPNAKIKRWKAFIDEHNAKIFYKPGKETYVADALSRQAIHVLEDEPQSDIATIHS +FT EISLTFTIETIDKPVNCFRNQIVIDEGTADSTRTFVIFGSKTRHLIQFLDKETLIGRIR +FT DVVKPDVVNAIHCELPVLAFIQNSLVNDFPATTFRHTMKMVSDIFNQTEQREIVSLEHN +FT RAHRAAQENVKQILQYYFFPKMSQIAATFVSNCLVCQKAKYDRHPQKQILGRTPIPSHV +FT GETLHIDIFSTGRNYFLTCIDKFSKFAIVQPIGSRTITDLEPAIMQLMNFFPHSKTIFC +FT DNEPSINSESIKSLLKNRFNVDIANAPPLHSTSNGQVERFHSTLLEIARCLKLDSGMND +FT TVNLILQATIEYNKTVHSVTNRRPIDIIHSTPPELANEIVEMVNEAQEKQLRRENVTRR +FT DRTFEVGETVMVKQNNRLGNKLTPRYREELIEADLGTTVLIKGRVVHKDNLR" +XX +CC Derived from U89994 (g1905850) (Rel. 51, Last updated, Version 1). +CC Takis Benos and Michael Ashburner, 20-Aug-1997. +CC Any changes to original sequence record are annotated in an FT line. +XX +SQ Sequence 6411 BP; 2219 A; 1259 C; 1204 G; 1729 T; 0 other; + AGTTAACACA ATCACAAAAC ACCCGAAATA TAGTCGTAAG CCTCAAGTGC TTTTCCCATC 60 + TATAGATCGA GCTTTACCTA TAAGAAACTG TAACTTGTTA AGCTTTAGAG ATAAGAACTC 120 + TTGCTATACT TAAGTCAGTC GATTTTGGAA GATTAGAAGC GTCGGTCATC GCCACGTACT 180 + TACTATTCGT CTCATTAAGT GCAGACCGCG CAAGCCTATT GTAATTAATA AACTTACGCT 240 + AATAAATATA TGGAAAATCT ACTAAAATGA TAATTGGCGC CCAAACGGAT ATAAAAACCT 300 + ACGATAACTG AATAATTATA AATAAATAAC AAAAGGAGGA TCCGGAGACA AAACCAGCGG 360 + CTTTGGCTAA TTAACTCTAA CCTAAGAAAT AAAAATTTGC TGATTACATA AAATATAATA 420 + TTAATTACTA AGACCATCTA CCTTAAAATT GTTTGTTAAT CACTATTATT ATATTGTAAG 480 + TATAACGCTT ATTGAACGAA TTAAAAATAT TATTATTATT ATTATATTAT AACCTATGCA 540 + AAGAGTATTG ATAATAAAAA TACATGAGTG ACAGTGATAA CCTTTTAGAC AACCTAGTGT 600 + CAAGCTTAAA TAAATGGTCA GCGCACCAGG CAAGTAGGCA AAACAGTGCA GAAAAAAATA 660 + ATAAGTCATC AGATAATTGG TGGTCAAAAA CAAAGACAAC TAGCGAAATG GAATTTGAAG 720 + CTCAGTTAAA AGCGATCGTA GAGAGTGCTG TTGCCGGTGC GCTCGCAGTC CAAAAACAAT 780 + CATTTGAAAA GCAATTGCAG GAGATGAATG AGCGAATCGG GAAATTAACA GTGAACACCC 840 + CAGAGGTGGA AACTTATGTA GATGCTGAAA TTAGACCAGG TGTTGTCTGT AGCGAGCCTC 900 + TAGATATACT TAAATCTCTG CCAGATTTTG ATGGCAAAAG TGAAACATAT GTGTCGTGGA 960 + GAAAAGCGGC TCATGTCGCT TTTAAAGTTT TCAAAGATTA CGAGGGAAGT TCAACATTTT 1020 + ACCAAGCTCT TGGTATTATG CGAAATAAAA TAAAAGGTCC AGCGAATACA GTATTGGCTT 1080 + CTTTTAATAC TCCGTTACAT TTCAAAGCAA TGATCAGCCG TCTTGATTTC ACATATTCTG 1140 + ACAAAAGGCC GATCTATCTA ATCGAACAAG AGCTATCAAC TTTGCGACAG GGAGACATGA 1200 + CTCTTACTGA ATTCTACGAT GAAGTCGAGA AAAAACTGAC CCTACTTACC AACAAGACAA 1260 + TAATGACATT TGATAGTGCC TTGGCGATGT CACTGAATGA AAAGTACAGG ACGGACGCGT 1320 + TACGTGTATT TGTAACCGGA GCTAAGAAAT CGTTGAGCGA CATTCTTTTT GCAAAAGGTC 1380 + CAAAAGATTT ACCAACTGCT CTCGCTTTAG CGCAAGAGGT CGAGTCGAAC CATGAGCGTT 1440 + ACCAATTCGC CCTTATTTAT TCTAAAAATA TTGGAGACAG GGGTCAGAAA ATCGAACAAA 1500 + GGCACAGCGA TAAGGATAGA AACTCAATCA TGCCCATGCA AACTAAAAAC CCATATTTTA 1560 + GCAAGCGTCA GGTGCATACT TATGATAACC AGGAAAGACA AGATCCAGTC CAGTTAACAA 1620 + ATCCTGATGT ATCCATGCGA TCTAGAAGAA CTGGAAATTT TGGACAAACT CCATTTCCGA 1680 + CTCAGGGAAA TATTTGGCCA TCCCAACAGC AAAATTCTTG GCCATCTCAA CAACAATATT 1740 + CTTGGCCATC CCAACAACAA AATTCATTTC GAACACAAAA TCAATTCGCA TCGCAACCCC 1800 + AACAGCAAAA CACAAGTCAG GCTCAGGGAC ATTTTGGGTA TGCGCAAGCA TCAAAAAGAC 1860 + CAACGAGTGG CAGTGCAAGG TTTACAGGGC CAAAACAGCA GAGGATCAAC TACTTACCTC 1920 + ATGAGAAAGG TCAATGTGAG GAAGATACAG ACGGTTATCA AAAGGAGGCA GAAGCGGAGG 1980 + TTGATGATTA TGAGGACGAA CTAGTGAATT ACGATCATGT TCATTTTTTA GCCACAAATC 2040 + CCTGCTACCG TACATAGAAA GAGAGATAGC AGGGAGAACC ATAAAACTTT TGATTGACAC 2100 + CGGGGCTTCG AAAAATTACA TACAGCCCCT CCCTGAATTA AAAAACATAA TGCCGGTACA 2160 + AAATAAATTC ACGGTAAAAT CGCTTCATGG TTGCAACACC GTCAAACAGA AATGCTTTAT 2220 + TAAGCTATTT AACACATCTG TTCAATTCTT TATTCTTCCA AGTCTCTCTA GTTTTGACGC 2280 + AATAATAGGA CTTGACCTTT TGAAACAGGG AAATGCAACG TTAGATTTTA AGAACAAAAC 2340 + GTTGAATATC AACAATGAAG TGGAATCTAT TCAGTTTTTG AGATGTGACA GCGTAAATTT 2400 + CGCCAACATA GAGAATATTG TGGTTCCAAA TCAGATATCT AATAAATTCC ATACAATGCT 2460 + TCGAAACCGA TTGGCCGTCT TTGCGGAACC GGAAGAAGCA CTGCCGTATA ATACCAACAT 2520 + TGTTGCCACA ATACGTACTG AGGACGACCA ACCCATTTAC TCAAAACTCT ATCCGTACCC 2580 + CATGGGCGTA TCGGATTTTG TGAATAAGGA GACACATGCT TTGTTAAAGG ACGGAATTAT 2640 + CAGGCCCTCG TCGTCACCTT ACAACAATCC GGTTTGGGTA GTCGATAAAA AAGGTACAGA 2700 + TGAAGAGGGA AATACTAAGA AAAGGTTGGT TATAGATTTT AGAAAACTAA ATTTAAAAAC 2760 + AATCGACGAC AAGTACCCTA TACCAAACGT AGTATGGATC TTGTCAAATT TGGGAAAAGC 2820 + CAGATTCTTT ACAACCCTTG ACCTTAAATC GGCGTTTCAC CAAATTCTGC TCGCAGAAAA 2880 + GGATAGAGCG AAAACTGCCT TTTCAGTAGG AAATGGAAAA TACGAGTTTT GCCGTTTGCC 2940 + GTTTGGCTTG AAAAATGCCC CAAGTATTTT TCAACGTGCT ATTGATGATG TTGTTAGGGA 3000 + CCGTATAGGA AAGTCATGTT ACGTTTACGT TGACGACGTA ATAATATTTT CAAACGGAAT 3060 + TGAGGACCAC GTAAACGACG TTGCTTGGGT ACTAGACAGA CTGTCTGGGG CAAACATGAG 3120 + GGTTTCTAAA GAGAAATCGT TTTTCTTCAA GGAAAGCGTC GAGTATCTCG GATTCATGGT 3180 + GTCAAGTGGA GGTATCACAA CCAGTCCTAG CAAAGTAGAG GCTATTCAGA AATATAATCA 3240 + ACCTACTAAT CTGTTTAGTG TTCGATCGTT TTTAGGGCTA GCAAGTTATT ACCGCTGCTT 3300 + TATTAAGGAC TTCGCCTCTA TTGCTAGACC ACTCACTGAC ATTCTGAAGG GTGAAAACGG 3360 + AAAGGTTTCC GCAAGCCAGT CTAAAAAGAT ACCAATTTCT TTCGATGAAA GACAATGTTC 3420 + TGCTTTTGAG AAGCTTAAAA ATGTTCTTGT CTCCGAAAAT GTAATGTTAT TGTATCCCGA 3480 + TTATAGAAAA GCCTTTGACT TAACAACAGA CGCTTCGGCT TTTGGCCTGG GGGCAGTCTT 3540 + ATCACAGGAT GGCAAGCCTG TTACAATGAT TTCGAGAACT TTACAGGATA GAGAACTTAA 3600 + TTTCGCAACA AATGAACGAG AACTTTTGGC CATCGTTTGG GCTTTAAAGT CTCTTAGGAA 3660 + CTATCTATAT GGTGTCAAAA ACTTAAACAT TTTTACAGAT CACCAGCCGT TAACATACGC 3720 + CGTGTCAGAT AGGAATCCAA ATGCAAAAAT CAAGAGATGG AAGGCGTTTA TAGACGAACA 3780 + TAATGCTAAA ATTTTCTATA AACCTGGCAA GGAGACCTAT GTTGCCGATG CACTATCCAG 3840 + GCAGGCTATT CATGTCCTAG AGGACGAACC CCAGTCAGAC ATTGCAACAA TACATAGCGA 3900 + AATTTCATTG ACTTTTACAA TCGAAACTAT CGACAAGCCG GTTAACTGTT TTAGAAACCA 3960 + AATTGTGATA GATGAGGGCA CCGCAGACTC AACTCGAACT TTTGTTATTT TCGGAAGCAA 4020 + GACAAGGCAT CTAATACAGT TTCTAGACAA AGAGACCTTA ATCGGAAGAA TTCGTGATGT 4080 + GGTTAAGCCG GATGTAGTGA ATGCGATACA CTGCGAATTA CCTGTACTAG CTTTCATTCA 4140 + AAACAGTCTT GTAAATGACT TTCCAGCAAC AACCTTCCGA CACACTATGA AAATGGTCAG 4200 + CGACATTTTT AATCAAACTG AGCAACGGGA AATAGTGTCT TTGGAGCACA ACAGAGCGCA 4260 + TAGGGCAGCA CAGGAGAATG TAAAACAAAT TCTTCAATAC TACTTTTTCC CTAAAATGTC 4320 + ACAAATAGCC GCTACCTTTG TTTCTAACTG CTTGGTTTGT CAAAAAGCCA AATACGACCG 4380 + CCATCCGCAA AAGCAAATCC TCGGGAGAAC ACCTATTCCG TCACATGTAG GCGAGACATT 4440 + GCATATTGAT ATATTTTCTA CGGGCAGGAA TTACTTTTTG ACATGTATTG ACAAATTTTC 4500 + CAAATTCGCT ATTGTGCAAC CAATCGGCTC TCGAACGATA ACTGATTTAG AACCTGCAAT 4560 + TATGCAACTA ATGAACTTTT TTCCCCATTC AAAGACAATA TTTTGTGACA ATGAACCGTC 4620 + CATAAATTCC GAGTCAATCA AGTCACTTTT GAAAAATCGT TTTAATGTTG ACATAGCGAA 4680 + CGCACCTCCA CTTCATAGTA CCTCAAACGG ACAGGTTGAA AGGTTTCACA GCACGCTTTT 4740 + AGAAATAGCT CGATGCCTGA AACTTGACAG TGGAATGAAT GATACAGTCA ACCTTATTCT 4800 + TCAGGCAACA ATAGAATACA ATAAGACGGT GCACTCAGTC ACCAATAGAA GACCGATCGA 4860 + CATTATTCAT TCAACTCCTC CCGAATTGGC TAACGAGATA GTAGAAATGG TTAACGAAGC 4920 + TCAGGAAAAA CAGCTAAGAA GAGAAAATGT AACAAGACGA GACAGAACCT TTGAGGTGGG 4980 + AGAAACCGTC ATGGTAAAAC AAAACAATCG CTTGGGAAAT AAACTAACCC CACGGTATAG 5040 + GGAAGAACTA ATCGAAGCAG ACCTCGGGAC AACGGTCCTC ATAAAAGGGA GGGTCGTTCA 5100 + TAAAGATAAT CTACGCTAGG TTTAGTATTT CTTTTCCTTT TGTGACCATC GCCAAGTTAG 5160 + CAAAATACAA ACGTGAAATC TGAACACTAG TAAAAGAGTT TGCAAACATT TTTCAATTAA 5220 + ATATTTGTCA AATCCTTCTT ATTTAATCTT TAAACATTTT GTATTATTTC CGCTTCATCC 5280 + TCTTTAGAAA ATTTTAAAGG TATGTGATGA AATGCTAGAC CCGAATGATT TGAAAACTTA 5340 + AAGTCCACGC AACCACAAAT ATTTCCTGAA ACTACCATAG AAAATAAATG CATTACCAAA 5400 + ACGGCATAAT AACAGTATAG CGCACTCACT CTAATTAGAT TTCAAATTCC CGATTAAAAA 5460 + AAAAATAAAA CACTAATGTT ATCAATACCC TTTCCTGATT CTGTTCAACT AAAATAGGAA 5520 + AATCAATACT TGCAATCAAT AAGCGTTTTA CTACATACTT TAATATCAAA ATATCTGAAT 5580 + GAACTTTATT ATAAAATTAT AATTGTTATA CTTAATTATT GTCAAAACTT TAGTATTAAA 5640 + ACTGTAACTA CCTCTTAAGT AGATGAGAAG AGTAGAAGAG GGAATTAAGA TCTATCAACG 5700 + TAGTATCTGC TAAAGACGTA AAGATGCGGC AACTATTTCT GCGCCTGGGT ACTGAAACGA 5760 + CGAACTGAAT AATATCTGCC ATCAGACGCC AACCAGAGTG CGTTCAACAC ATACGTTTTG 5820 + ATGGTCAACT AGTTCAACCA ACATCAGCAT CATCGTCGTC AACAAGTCGA CGGTTACAAT 5880 + AAAGATTTTT TCCAAGTTCG CTACGATCAT CTCCAGAACC TTGTTGCGAA CCCATGACAT 5940 + GGAGAATCAG CAGCATTTAC GAACTTCTCG GATCATCCAG ACACGCAGAG CTGCCTTCCC 6000 + TTCGATGGTT TAACGCAGTA CCAGGTTGGC AGTATGGGAA CTTAGTGCAC AACCAATGTT 6060 + ACCCGTAAGA TCCGCTTTCA AATAGATTTG CCAATTGTAA AAAGTCTGTG GACAGCCTTC 6120 + GTCTTAGAAG GGGAGGAGTT AACACAATCA CAAAACACCC GAAATATAGT CGTAAGCCTC 6180 + AAGTGCTTTT CCCATCTATA GATCGAGCTT TACCTATAAG AAACTGTAAC TTGTTAAGCT 6240 + TTAGAGATAA GAACTCTTGC TATACTTAAG TCAGTCGATT TTGGAAGATT AGAAGCGTCG 6300 + GTCATCGCCA CGTACTTACT ATTCGTCTCA TTAAGTGCAG ACCGCGCAAG CCTATTGTAA 6360 + TTAATAAACT TACGCTAATA AATATATGGA AAATCTACTA AAATGATAAT T 6411 +// +ID DMCOPIA standard; DNA; INV; 5143 BP. +XX +AC X02599; +XX +DR FLYBASE; FBte0000023; Dmel\copia. +XX +FT source X02599:21..5163 +FT SO_feature five_prime_LTR ; SO:0000425:1..276 +FT SO_feature three_prime_LTR ; SO:0000426:4867..5143 +FT SO_feature polyA_signal_sequence ; SO:0000551:1990..1999 +FT SO_feature polyA_signal_sequence ; SO:0000551:5063..5073 +FT SO_feature primer_binding_site ; SO:0005850:277..291 +FT /bound_moiety="tRNA:M-i-RB" +FT SO_feature CDS ; SO:0000316:432..4661 +FT /name="Dmel\copia\GIP" +FT /db_xref="FLYBASE:FBgn0013437" +FT /db_xref="SWISS-PROT:P04146" +FT /db_xref="NCBI_PROTEIN:CAA26444.1" +FT /translation="MDKAKRNIKPFDGEKYAIWKFRIRALLAEQDVLKVVDGLMPNEVD +FT DSWKKAERCAKSTIIEYLSDSFLNFATSDITARQILENLDAVYERKSLASQLALRKRLL +FT SLKLSSEMSLLSHFHIFDELISELLAAGAKIEEMDKISHLLITLPSCYDGIITAIETLS +FT EENLTLAFVKNRLLDQEIKIKNDHNDTSKKVMNAIVHNNNNTYKNNLFKNRVTKPKKIF +FT KGNSKYKVKCHHCGREGHIKKDCFHYKRILNNKNKENEKQVQTATSHGIAFMVKEVNNT +FT SVMDNCGFVLDSGASDHLINDESLYTDSVEVVPPLKIAVAKQGEFIYATKRGIVRLRND +FT HEITLEDVLFCKEAAGNLMSVKRLQEAGMSIEFDKSGVTISKNGLMVVKNSGMLNNVPV +FT INFQAYSINAKHKNNFRLWHERFGHISDGKLLEIKRKNMFSDQSLLNNLELSCEICEPC +FT LNGKQARLPFKQLKDKTHIKRPLFVVHSDVCGPITPVTLDDKNYFVIFVDQFTHYCVTY +FT LIKYKSDVFSMFQDFVAKSEAHFNLKVVYLYIDNGREYLSNEMRQFCVKKGISYHLTVP +FT HTPQLNGVSERMIRTITEKARTMVSGAKLDKSFWGEAVLTATYLINRIPSRALVDSSKT +FT PYEMWHNKKPYLKHLRVFGATVYVHIKNKQGKFDDKSFKSIFVGYEPNGFKLWDAVNEK +FT FIVARDVVVDETNMVNSRAVKFETVFLKDSKESENKNFPNDSRKIIQTEFPNESKECDN +FT IQFLKDSKESENKNFPNDSRKIIQTEFPNESKECDNIQFLKDSKESNKYFLNESKKRKR +FT DDHLNESKGSGNPNESRESETAEHLKEIGIDNPTKNDGIEIINRRSERLKTKPQISYNE +FT EDNSLNKVVLNAHTIFNDVPNSFDEIQYRDDKSSWEEAINTELNAHKINNTWTITKRPE +FT NKNIVDSRWVFSVKYNELGNPIRYKARLVARGFTQKYQIDYEETFAPVARISSFRFILS +FT LVIQYNLKVHQMDVKTAFLNGTLKEEIYMRLPQGISCNSDNVCKLNKAIYGLKQAARCW +FT FEVFEQALKECEFVNSSVDRCIYILDKGNINENIYVLLYVDDVVIATGDMTRMNNFKRY +FT LMEKFRMTDLNEIKHFIGIRIEMQEDKIYLSQSAYVKKILSKFNMENCNAVSTPLPSKI +FT NYELLNSDEDCNTPCRSLIGCLMYIMLCTRPDLTTAVNILSRYSSKNNSELWQNLKRVL +FT RYLKGTIDMKLIFKKNLAFENKIIGYVDSDWAGSEIDRKSTTGYLFKMFDFNLICWNTK +FT RQNSVAASSTEAEYMALFEAVREALWLKFLLTSINIKLENPIKIYEDNQGCISIANNPS +FT CHKRAKHIDIKYHFAREQVQNNVICLEYIPTENQLADIFTKPLPAARFVELRDKLGLLQ +FT DDQSNAE" +FT SO_feature CDS ; SO:0000316:join(432..1605,4555..4661) +FT /name="Dmel\copia\GIP-RB" +FT /db_xref="FLYBASE:FBgnXXXXXXX" +FT /db_xref="SWISS-PROT:P04146" +FT /db_xref="NCBI_PROTEIN:CAA26445.1" +FT /translation="MDKAKRNIKPFDGEKYAIWKFRIRALLAEQDVLKVVDGLMPNEVD +FT DSWKKAERCAKSTIIEYLSDSFLNFATSDITARQILENLDAVYERKSLASQLALRKRLL +FT SLKLSSEMSLLSHFHIFDELISELLAAGAKIEEMDKISHLLITLPSCYDGIITAIETLS +FT EENLTLAFVKNRLLDQEIKIKNDHNDTSKKVMNAIVHNNNNTYKNNLFKNRVTKPKKIF +FT KGNSKYKVKCHHCGREGHIKKDCFHYKRILNNKNKENEKQVQTATSHGIAFMVKEVNNT +FT SVMDNCGFVLDSGASDHLINDESLYTDSVEVVPPLKIAVAKQGEFIYATKRGIVRLRND +FT HEITLEDVLFCKEAAGNLMSVKRLQEAGMSIEFDKSGVTISKNGLMVVKNSENQLADIF +FT TKPLPAARFVELRDKLGLLQDDQSNAE" +XX +CC Derived from X02599 (g7740) (Rel. 49, Last updated, Version 4). +CC Takis Benos and Michael Ashburner, 20-Aug-1997. +CC Any changes to original sequence record are annotated in an FT line. +XX +SQ Sequence 5143 BP; 1874 A; 727 C; 971 G; 1571 T; 0 other; + TGTTGGAATA TACTATTCAA CCTACAAAAA TAACGTTAAA CAACACTACT TTATATTTGA 60 + TATGAATGGC CACACCTTTT ATGCCATAAA ACATATTGTA AGAGAATACC ACTCTTTTTA 120 + TTCCTTCTTT CCTTCTTGTA CGTTTTTTGC TGTGAGTAGG TCGTGGTGCT GGTGTTGCAG 180 + TTGAAATAAC TTAAAATATA AATCATAAAA CTCAAACATA AACTTGACTA TTTATTTATT 240 + TATTAAGAAA GGAAATATAA ATTATAAATT ACAACAGGTT ATGGGCCCAG TCCATGCCTA 300 + ATAAACAATT AAATTGTGAA TTAAAGATTG TGAAAATAAA TTGTGAAATA GCATTTTTTC 360 + ACATTCTTGT GAAATAGCTT TTTTTTTCAC ATTCTTGTGA AATTATTTCC TTCTCAGAAT 420 + TTGAGTGAAA AATGGACAAG GCTAAACGTA ATATTAAGCC GTTTGATGGC GAGAAGTACG 480 + CGATTTGGAA ATTTAGAATT AGGGCTCTTT TAGCCGAGCA AGATGTGCTT AAAGTAGTTG 540 + ATGGTTTAAT GCCTAACGAG GTAGATGACT CCTGGAAAAA GGCAGAGCGT TGTGCAAAAA 600 + GTACAATAAT AGAGTACCTA AGCGACTCGT TTTTAAATTT CGCAACAAGC GACATTACGG 660 + CGCGTCAGAT TCTTGAGAAT TTGGACGCCG TTTATGAACG AAAAAGTTTG GCGTCGCAAC 720 + TGGCGCTGCG AAAACGTTTG CTTTCTCTGA AGCTATCGAG TGAGATGTCA CTATTAAGCC 780 + ATTTTCATAT TTTTGACGAA CTTATAAGTG AATTGTTGGC AGCTGGTGCA AAAATAGAAG 840 + AGATGGATAA AATTTCTCAT CTACTGATCA CATTGCCTTC GTGTTACGAT GGAATTATTA 900 + CAGCGATAGA GACATTATCT GAAGAAAATT TGACATTGGC GTTTGTGAAA AATAGATTGC 960 + TGGATCAAGA AATTAAAATT AAAAATGACC ACAACGATAC AAGCAAGAAA GTTATGAACG 1020 + CGATCGTGCA CAACAATAAT AACACTTATA AAAATAATTT GTTTAAAAAT CGGGTAACTA 1080 + AACCAAAGAA AATATTCAAG GGAAATTCAA AGTATAAAGT CAAGTGTCAC CACTGTGGCA 1140 + GAGAAGGCCA CATTAAAAAA GATTGTTTCC ATTATAAAAG AATATTAAAT AATAAAAATA 1200 + AAGAAAATGA AAAACAAGTT CAAACTGCAA CATCACACGG CATTGCGTTT ATGGTAAAAG 1260 + AAGTGAATAA TACTTCAGTG ATGGACAACT GCGGGTTTGT CCTTGATTCT GGTGCTAGTG 1320 + ACCATCTTAT AAATGATGAG TCGCTGTATA CCGACAGTGT GGAGGTTGTG CCTCCACTTA 1380 + AGATTGCAGT GGCCAAGCAA GGCGAATTTA TTTATGCCAC TAAGCGTGGT ATTGTCCGAC 1440 + TACGGAATGA CCATGAGATT ACACTGGAGG ATGTACTCTT TTGTAAGGAA GCTGCTGGTA 1500 + ATTTGATGTC CGTAAAGCGT CTCCAAGAGG CAGGAATGTC GATCGAATTT GACAAAAGCG 1560 + GTGTAACCAT TTCGAAAAAT GGGTTAATGG TTGTCAAAAA TTCAGGTATG TTAAACAATG 1620 + TACCTGTGAT CAATTTTCAA GCATATTCTA TAAATGCTAA GCATAAAAAT AATTTTCGTT 1680 + TATGGCATGA GAGGTTTGGC CATATAAGCG ATGGCAAATT ATTAGAAATA AAACGAAAGA 1740 + ATATGTTTAG TGATCAAAGT CTTCTAAACA ACTTAGAGTT ATCATGTGAA ATTTGTGAAC 1800 + CCTGTTTAAA TGGTAAACAG GCAAGACTTC CTTTTAAACA ATTGAAAGAT AAGACCCATA 1860 + TTAAAAGACC ACTTTTTGTA GTACACTCAG ATGTCTGTGG GCCTATTACT CCAGTTACTT 1920 + TAGATGATAA AAATTATTTT GTGATCTTTG TTGATCAGTT TACACATTAT TGTGTAACTT 1980 + ATTTAATTAA ATATAAATCT GATGTGTTTA GCATGTTTCA AGATTTTGTA GCCAAGAGTG 2040 + AAGCTCATTT TAATTTAAAG GTTGTGTACT TATACATTGA CAATGGTAGA GAATACTTGT 2100 + CAAATGAGAT GAGACAATTT TGTGTTAAGA AAGGAATTTC TTATCACTTA ACAGTGCCAC 2160 + ATACACCTCA GTTAAATGGT GTTTCTGAGA GAATGATAAG AACCATTACG GAAAAAGCTC 2220 + GAACCATGGT TAGTGGTGCA AAGCTAGATA AAAGCTTTTG GGGCGAAGCA GTATTAACTG 2280 + CTACTTATTT AATCAACAGA ATTCCTAGTA GAGCACTTGT TGATAGTTCA AAGACCCCAT 2340 + ATGAGATGTG GCACAATAAG AAGCCATACT TAAAACATTT GAGAGTGTTT GGTGCAACTG 2400 + TTTATGTGCA TATTAAAAAC AAACAAGGAA AGTTTGATGA TAAATCATTT AAAAGTATTT 2460 + TTGTGGGCTA TGAACCCAAT GGTTTTAAGT TGTGGGATGC TGTAAATGAA AAATTTATTG 2520 + TCGCAAGAGA TGTTGTTGTC GATGAAACCA ATATGGTTAA TTCTAGAGCT GTTAAATTTG 2580 + AAACAGTGTT CCTGAAAGAT AGTAAGGAAA GTGAAAATAA AAATTTTCCG AATGACAGTA 2640 + GGAAAATAAT ACAAACAGAA TTCCCGAATG AGAGTAAGGA ATGCGACAAC ATACAATTCC 2700 + TGAAAGATAG TAAGGAAAGT GAAAATAAAA ATTTTCCGAA TGACAGTAGG AAAATAATAC 2760 + AAACAGAATT CCCGAATGAG AGTAAGGAAT GCGACAACAT ACAATTCCTG AAAGATAGTA 2820 + AGGAAAGTAA TAAATATTTT CTGAATGAGA GTAAGAAAAG AAAGCGAGAT GATCACCTGA 2880 + ATGAAAGTAA GGGATCAGGC AACCCGAATG AGAGTAGGGA AAGTGAAACA GCAGAGCACT 2940 + TAAAAGAAAT TGGAATTGAT AATCCAACTA AAAATGATGG CATAGAAATT ATTAATAGAA 3000 + GAAGTGAGAG ATTAAAGACT AAGCCTCAGA TATCCTATAA TGAAGAGGAT AATAGTCTAA 3060 + ATAAAGTTGT TCTAAATGCT CACACTATAT TTAACGATGT CCCAAATTCA TTTGATGAAA 3120 + TTCAATATAG GGATGATAAA TCTTCTTGGG AAGAAGCCAT CAATACAGAG TTAAATGCTC 3180 + ATAAAATTAA TAATACTTGG ACAATTACAA AAAGGCCTGA AAACAAAAAT ATTGTAGATA 3240 + GCAGATGGGT ATTTTCTGTT AAATATAATG AACTTGGAAA TCCAATTAGA TACAAAGCTA 3300 + GATTGGTTGC ACGAGGATTC ACTCAAAAAT ACCAAATAGA CTATGAAGAG ACATTTGCTC 3360 + CTGTAGCTAG AATTTCAAGT TTCCGATTTA TATTGTCATT AGTAATACAG TATAACTTGA 3420 + AAGTCCATCA AATGGATGTA AAAACAGCTT TCTTAAATGG CACGTTAAAA GAGGAAATTT 3480 + ATATGAGACT TCCTCAAGGT ATATCGTGTA ATAGTGACAA TGTGTGTAAA TTGAATAAGG 3540 + CAATTTACGG ACTCAAGCAA GCGGCTAGAT GCTGGTTTGA AGTATTTGAG CAAGCATTGA 3600 + AAGAGTGTGA GTTTGTAAAC TCTTCAGTTG ATCGCTGTAT ATATATTTTA GACAAAGGTA 3660 + ACATCAATGA AAACATATAT GTATTATTAT ATGTAGATGA TGTGGTTATA GCTACAGGAG 3720 + ATATGACAAG AATGAATAAC TTCAAAAGGT ATTTAATGGA AAAGTTTAGG ATGACTGACC 3780 + TAAATGAAAT AAAACATTTT ATTGGAATTA GGATAGAGAT GCAGGAAGAT AAAATCTATT 3840 + TAAGCCAATC TGCATATGTT AAAAAAATTT TAAGTAAATT TAACATGGAA AATTGTAATG 3900 + CAGTTAGTAC TCCTTTACCT AGTAAAATAA ATTATGAATT ACTTAATTCA GATGAAGACT 3960 + GCAATACCCC ATGCCGTAGC CTCATAGGAT GTTTAATGTA CATAATGCTT TGTACACGCC 4020 + CAGATTTAAC TACTGCAGTA AATATCTTGA GCAGATATAG TAGCAAAAAT AACTCCGAAT 4080 + TATGGCAGAA CTTAAAAAGA GTTCTTAGAT ATTTGAAGGG CACTATCGAT ATGAAATTGA 4140 + TTTTTAAAAA GAACTTGGCA TTTGAAAATA AAATTATTGG TTATGTGGAT TCTGATTGGG 4200 + CTGGTAGTGA AATTGATAGA AAAAGTACAA CAGGGTATTT ATTCAAAATG TTTGATTTTA 4260 + ATCTCATTTG TTGGAATACA AAGAGACAGA ACTCAGTAGC AGCCTCATCA ACTGAAGCTG 4320 + AGTATATGGC CCTATTTGAA GCCGTGAGAG AAGCTCTATG GCTTAAATTT TTATTAACTA 4380 + GTATTAACAT TAAACTAGAA AACCCCATTA AAATTTACGA AGACAATCAA GGCTGTATTA 4440 + GCATAGCAAA CAACCCCTCA TGTCATAAAC GAGCTAAACA TATTGATATT AAATATCATT 4500 + TTGCCAGAGA GCAAGTTCAG AATAATGTGA TTTGTCTTGA GTATATTCCT ACAGAGAATC 4560 + AACTGGCTGA CATATTTACA AAACCGTTGC CTGCTGCGAG ATTTGTGGAG TTACGAGACA 4620 + AATTGGGTTT GCTGCAAGAC GACCAATCGA ATGCTGAATG AAATTTTTAT ATATATTTTT 4680 + CAAATTTAAA TTCCTGTAAA CATATTTTGT TACAATGATC TGATCGGGTT TTTCTGGGTT 4740 + TTCCCCGTAT CCTCGCAGCA AATGCTGGAT CAGTTAACAC TTCCCAGAAT GCACACCACC 4800 + CACATTTGAT AGTTACTAAT GAATATTATT GTTATGTTTT TAATTATAGA CGTTATTTTT 4860 + GAGGGGGCGT GTTGGAATAT ACTATTCAAC CTACAAAAAT AACGTTAAAC AACACTACTT 4920 + TATATTTGAT ATGAATGGCC ACACCTTTTA TGCCATAAAA CATATTGTAA GAGAATACCA 4980 + CTCTTTTTAT TCCTTCTTTC CTTCTTGTAC GTTTTTTGCT GTGAGTAGGT CGTGGTGCTG 5040 + GTGTTGCAGT TGAAATAACT TAAAATATAA ATCATAAAAC TCAAACATAA ACTTGACTAT 5100 + TTATTTATTA TTAAGAAAGG AAAATAAATT ATAAATTACA ACA 5143 +// +ID DMW1DOC standard; DNA; INV; 4725 BP. +XX +AC X17551; +XX +DR FLYBASE; FBte0000341; Dmel\Doc. +XX +FT source X17551:1..4725 +FT SO_feature CDS ; SO:0000316:213..1910 +FT /name="Dmel\Doc\gag" +FT /db_xref="FLYBASE:FBgn0024789" +FT /db_xref="SPTREMBL:Q04134" +FT /db_xref="NCBI_PROTEIN:CAA35586.1" +FT /translation="MNQNDIRSQRQCEQDERRLSLQRNNAYFSFVSPQIGDRAPSPSTN +FT SKLLPSANDRPRSCSPSLPASAHKSWSEETASPTPLLSQRQTTVPGNCNTAITSAVTSL +FT ATATTSTSSAAQLIIAVPAVNNSAALTVCNNNNARKEESKQKQKSISTVQTGMDRYIQI +FT KRKLSPQNNKAGNQPKINRTNNGNENSAVNNSNRYAILADSATEQPNEKTVGEPKKTRP +FT PPIFIREQSTNALVNKLVALIGDSKFHIIPLKKGNIHEIKLQIQTEADHRIVTKYLNDA +FT GKNYYTYQLKSCKGLQVVLKGIEATVTPAEIIEALKAKNFSAKTAINILNKDKVPQPLF +FT KIELEPELQALKKNEVHPIYNLQYLLHRRITVEEPHKRINPVQCTNCQEYGHTKAYCTL +FT KSVCVVCSEPHTTANCPKNKDDKSVKKCSNCGEKHTANYRGCVVYKELKSRLNKRIATA +FT HTYNKVNFYSPQPIFQPPLTVPSTTPTISFASALKSGLEVPAPPTRTAHSEHTPTNIQQ +FT TQQSGIEAMMLSLQQSMKDFMTFMQNTLQELMKNQNILIQLLVSSKSP" +FT SO_feature CDS ; SO:0000316:1910..4576 +FT /name="Dmel\Doc\RTase" +FT /db_xref="FLYBASE:FBgn0024790" +FT /db_xref="SPTREMBL:Q04135" +FT /db_xref="NCBI_PROTEIN:CAA35587.1" +FT /translation="MASLRISLWNANGVSRHTQELTQFIYEKNIDVMLLSETHLTNKNN +FT FHIPGYLFYGTNHPDGKAHGGTGILIRNRIKHHHLNNFDKNYLQSTSIALQLNNGSTTL +FT AAVYCPPRFPISEDQFMEFFNTLGDRFIAAGDYNAKHTHWGSRLVSPKGKQLYNALTKP +FT ENKLDYVSPGKPTYWPADPRKIPDLIDFAITKHVPRNMVTAEALADLSSDHSPVFLNML +FT TRPHIVDPPYRLTNFRTNWPRYQKYVCSHIELTTALSTKEDIDKSTETLENILVSAAKA +FT STPPVTYAKPNYIKTNREIERLVLDKRRLRRDWQSNRSPITKHMLKIATRRLTNALKQE +FT EKNSQRSYIEQLSPTSTKYPLWRAHRNLKTPIAPIMPLRSPSGTWFRSDEERASAFADH +FT LQNVFRPNPSTNTFILPPLIAANLDPQEPFEFRPCELAKVIKEQLNPRKSPGYDLITPR +FT MLIELPKCAILHICLLFNAIAKLGYFPQKWKKSTIVMIPKPGKDKTQPSSYRPISLLTC +FT LSKLFEKMLLLRISPHLRINNTLPTHQFGFREKHGTIEQVNRITSEIRTAFEHREYCTA +FT IFLDVAQAFDRVWLDGLLFKIIKLLPQNTHKLLKSYLYNRVFAIRCDTSTSRDCAIEAG +FT VPQGSVLGPILYTLYTADFPIDYNLTTSTFADDTAILSRSKCPIKATALLSRHLTSVER +FT WLADWRISINVQKCKQVTFTLNKQTCPPLVLNNICIPQADEVTYLGVHLDRRLTWRKHI +FT EAKSKHLKLKARNLHWLINARSPLSLEFKALLYNSVLKPIWTYGSELWGNASRSNIDII +FT QRAQSRILRIITGAPWYLRNENIHRDLKIKLVIEVIAEKKTKYNEKLTTHTNPLARKLI +FT RVCSQSRLHRNDLPAQQ" +XX +CC Derived from X17551 (g8821) (Rel. 29, Last updated, Version 2). +CC Takis Benos and Michael Ashburner, 20-Aug-1997. +CC Any changes to original sequence record are annotated in an FT line. +XX +SQ Sequence 4725 BP; 1647 A; 1192 C; 822 G; 1064 T; 0 other; + GACATTCGGC ATTCCACAGT CTTCGGGTGG AGACGTGTTT CTTTCAAGCT ACGAATAGCA 60 + AGTTCTAAAA ACTACAACAG TATAGTGAAA GTTAAACACA AAGTGTAAAG TGCAGTTTGC 120 + ACAACTAACA ATTATTGACT ATAGTAATTA TTTACTAAAA TAAATAATTA TTCCATATTG 180 + TTCTGGTAAT TGTTATATGT GGACTTAGAA CAATGAATCA AAACGACATA CGTTCTCAGC 240 + GACAATGTGA ACAAGACGAG CGCCGGCTCT CTTTACAACG CAACAATGCA TACTTTTCTT 300 + TCGTCTCACC GCAAATCGGT GATCGAGCAC CCTCACCTTC AACTAACTCG AAACTTTTGC 360 + CCTCAGCGAA CGACAGACCG CGTTCTTGCT CTCCCTCTCT GCCTGCTTCG GCTCACAAGT 420 + CGTGGAGCGA AGAGACCGCC TCTCCTACCC CGCTCCTCTC GCAGCGCCAA ACGACCGTCC 480 + CGGGTAACTG TAACACTGCA ATAACGAGTG CAGTGACCTC ACTGGCAACT GCCACAACAT 540 + CAACTTCGTC AGCGGCCCAA CTAATTATCG CTGTGCCAGC TGTAAATAAT TCAGCAGCAC 600 + TGACCGTTTG CAACAACAAT AATGCACGTA AAGAAGAATC AAAACAAAAG CAGAAGTCGA 660 + TTTCGACTGT GCAGACTGGC ATGGATCGCT ACATCCAAAT CAAGAGAAAG CTCAGCCCTC 720 + AAAACAATAA GGCAGGTAAT CAACCCAAAA TCAATCGAAC CAACAACGGC AATGAAAACT 780 + CTGCAGTAAA TAATTCAAAC CGATATGCTA TCTTGGCTGA TTCTGCGACC GAACAACCCA 840 + ACGAAAAAAC GGTAGGGGAA CCAAAAAAGA CCAGGCCTCC ACCAATTTTC ATACGAGAAC 900 + AAAGTACAAA TGCACTTGTA AATAAACTCG TTGCTTTGAT TGGTGACAGC AAGTTCCACA 960 + TTATCCCACT TAAAAAAGGA AATATTCATG AAATAAAACT ACAGATCCAA ACAGAAGCAG 1020 + ACCACCGTAT AGTGACTAAA TACCTAAATG ATGCTGGTAA AAACTACTAC ACATACCAAT 1080 + TAAAAAGTTG CAAAGGGCTA CAGGTAGTAC TTAAGGGCAT TGAAGCAACA GTGACACCAG 1140 + CTGAGATAAT TGAGGCTCTG AAGGCCAAAA ACTTTTCTGC AAAGACAGCT ATTAATATTT 1200 + TAAACAAAGA CAAAGTTCCG CAGCCACTAT TCAAAATAGA ACTCGAACCA GAGCTCCAGG 1260 + CACTAAAGAA AAACGAAGTG CACCCAATAT ACAATTTACA GTACTTGCTA CATCGGAGGA 1320 + TCACCGTGGA GGAGCCGCAC AAACGTATCA ATCCAGTTCA ATGTACTAAT TGCCAAGAAT 1380 + ACGGCCACAC CAAGGCATAC TGCACCCTTA AGTCCGTATG TGTTGTCTGT AGCGAACCTC 1440 + ATACTACCGC AAACTGCCCC AAAAACAAGG ACGATAAGTC TGTGAAGAAA TGCAGTAACT 1500 + GCGGGGAAAA ACATACTGCA AACTACAGAG GCTGTGTGGT GTACAAAGAA TTGAAGAGCC 1560 + GCCTAAACAA ACGTATTGCC ACAGCACATA CATACAACAA AGTCAATTTC TACTCTCCGC 1620 + AACCGATTTT TCAACCACCC CTAACTGTCC CAAGCACTAC TCCAACAATT TCTTTCGCTA 1680 + GCGCCCTAAA ATCCGGACTA GAAGTGCCCG CCCCACCGAC AAGAACTGCT CATTCCGAAC 1740 + ATACACCGAC AAACATCCAA CAAACACAAC AAAGTGGCAT CGAAGCTATG ATGCTATCCC 1800 + TACAGCAAAG CATGAAAGAC TTCATGACGT TCATGCAAAA TACTTTGCAA GAGCTCATGA 1860 + AAAACCAAAA TATCCTGATT CAACTTCTTG TATCTTCAAA ATCCCCATAA TGGCTTCCCT 1920 + ACGGATATCT CTGTGGAACG CAAATGGCGT TTCACGGCAT ACACAAGAGC TCACACAGTT 1980 + CATTTACGAA AAAAACATCG ACGTAATGCT ACTATCAGAA ACGCACCTCA CAAATAAAAA 2040 + CAATTTTCAT ATACCAGGAT ACTTGTTCTA TGGTACAAAT CATCCAGATG GTAAAGCTCA 2100 + TGGAGGCACT GGAATACTCA TCAGAAATCG CATAAAACAC CACCACTTAA ACAATTTTGA 2160 + CAAAAACTAC TTACAATCTA CGTCCATAGC CTTACAACTC AACAATGGTT CAACGACTCT 2220 + AGCCGCAGTC TACTGCCCAC CGCGCTTTCC AATCTCTGAG GATCAATTCA TGGAATTCTT 2280 + TAACACACTA GGTGACAGGT TCATCGCAGC GGGTGACTAT AACGCCAAGC ACACCCATTG 2340 + GGGATCTCGA CTTGTGTCGC CAAAGGGTAA GCAATTGTAC AATGCGCTTA CGAAGCCAGA 2400 + AAACAAGCTA GACTATGTAT CCCCGGGTAA GCCTACATAC TGGCCAGCAG ACCCAAGAAA 2460 + AATCCCAGAC CTGATCGATT TTGCAATTAC TAAACATGTC CCCCGCAACA TGGTCACCGC 2520 + CGAAGCACTA GCAGATTTAT CATCAGATCA CTCACCTGTT TTTCTAAATA TGCTAACTCG 2580 + CCCCCACATC GTCGACCCAC CGTATAGACT CACAAATTTT AGAACAAACT GGCCAAGGTA 2640 + TCAAAAGTAT GTCTGTTCAC ACATAGAACT AACGACGGCA TTATCTACAA AGGAGGATAT 2700 + AGACAAGTCA ACGGAAACTC TTGAAAACAT TTTAGTTTCG GCTGCAAAGG CTTCAACCCC 2760 + GCCAGTGACG TATGCAAAAC CAAACTACAT CAAAACTAAT CGCGAAATCG AGCGGCTGGT 2820 + ATTAGATAAA CGACGCCTAC GAAGGGATTG GCAGTCTAAT AGATCACCAA TTACTAAGCA 2880 + CATGCTTAAG ATAGCCACAC GCAGGCTTAC CAATGCTCTC AAACAAGAGG AAAAAAACAG 2940 + CCAACGTTCA TATATCGAGC AACTCTCTCC CACCAGCACT AAGTACCCTC TTTGGAGAGC 3000 + TCACAGAAAC CTAAAGACTC CAATAGCGCC AATTATGCCA CTCCGAAGTC CCTCTGGCAC 3060 + CTGGTTTCGA AGTGATGAAG AAAGAGCCAG TGCTTTCGCT GACCATTTAC AAAATGTATT 3120 + CCGACCAAAT CCCTCTACCA ACACATTTAT TCTCCCTCCT TTAATAGCAG CCAATCTAGA 3180 + TCCTCAAGAA CCCTTTGAAT TCCGACCATG TGAACTAGCA AAGGTTATCA AAGAGCAACT 3240 + GAACCCAAGA AAATCGCCTG GCTACGACCT AATAACTCCA AGAATGCTCA TTGAACTCCC 3300 + AAAGTGTGCT ATTCTTCACA TCTGCCTGTT GTTCAACGCA ATCGCCAAGC TTGGATACTT 3360 + CCCTCAAAAA TGGAAAAAGT CGACCATAGT AATGATTCCA AAGCCAGGAA AAGATAAAAC 3420 + GCAGCCATCA TCATATAGAC CGATAAGCTT ACTAACATGT CTTTCAAAGC TGTTTGAAAA 3480 + AATGCTACTC CTTCGGATTA GCCCTCATCT TAGAATAAAC AACACACTTC CAACACATCA 3540 + ATTTGGCTTT AGAGAAAAAC ATGGAACCAT CGAACAGGTC AACCGAATCA CGTCAGAAAT 3600 + TCGTACTGCT TTTGAACATC GAGAATACTG CACAGCCATT TTTCTAGACG TCGCGCAGGC 3660 + ATTTGACAGA GTGTGGCTCG ATGGACTTTT GTTTAAAATA ATCAAGCTGT TGCCCCAAAA 3720 + CACACATAAG CTACTGAAGT CATACCTATA TAACAGAGTG TTTGCAATAA GATGCGATAC 3780 + AAGCACTTCA CGCGATTGCG CAATCGAAGC TGGAGTGCCG CAAGGCAGTG TACTGGGTCC 3840 + AATCTTATAC ACCCTGTATA CGGCGGATTT CCCCATAGAC TACAATCTAA CAACCTCCAC 3900 + GTTCGCTGAT GATACCGCGA TACTCAGTCG CTCGAAATGC CCAATAAAAG CCACGGCACT 3960 + CCTATCCCGA CACTTAACAT CTGTAGAACG ATGGCTTGCC GACTGGAGAA TTTCAATAAA 4020 + TGTTCAAAAA TGCAAGCAGG TTACCTTTAC CTTAAACAAA CAAACATGCC CACCACTGGT 4080 + CTTGAATAAC ATATGCATTC CACAAGCCGA CGAGGTAACA TATCTGGGAG TTCATCTGGA 4140 + CAGGCGGCTC ACTTGGCGCA AACATATAGA AGCCAAATCG AAACATCTTA AACTTAAAGC 4200 + AAGGAACCTC CACTGGCTCA TAAATGCTCG CTCTCCACTT AGTCTGGAGT TCAAAGCTCT 4260 + TCTATACAAC TCCGTCTTAA AACCTATCTG GACTTATGGC TCCGAGCTGT GGGGCAACGC 4320 + ATCCAGAAGT AACATAGACA TTATTCAGCG AGCACAGTCA AGAATTCTGA GAATTATCAC 4380 + TGGAGCGCCG TGGTACCTTC GAAACGAAAA CATACACAGA GACCTAAAAA TCAAATTAGT 4440 + AATCGAAGTA ATAGCTGAGA AAAAAACGAA GTATAACGAA AAGCTGACCA CCCATACAAA 4500 + TCCCCTCGCA AGAAAACTAA TCCGAGTATG CAGTCAAAGC CGGCTGCACC GCAACGACCT 4560 + CCCAGCCCAG CAATAAACTT ATTAGGGCAT TAATGAAAAA AAAAAACTAT CACTAAGTGA 4620 + AAGTTAATTA AGTTAGATTA AGATTTGAAC ACTTATTGTT AGTCTCTTAA CACAAAGGGA 4680 + AGATTCAATA AATAATAAAA ATTAAAAAAA AAAAAAAAAA AAAAA 4725 +// +ID F standard; DNA; INV; 4708 BP. +XX +AC AC005198; +XX +DR FLYBASE; FBte0000005; Dmel\F-element. +XX +SY synonym: Jiminy +XX +FT source AC005198:38639..43358 +FT SO_feature CDS ; SO:0000316:192..1880 +FT /name="Dmel\F-element\gag-r" +FT /db_xref="FLYBASE:FBgn0041632" +FT /db_xref="TREMBL:P91787" +FT /translation="MSQNDTRAQRQREHDERRLSIQRNNAYFSYVSPTIPNADIERSI +FT THSPGNLLLPTNQERARSCSPALLAPTEAPLPPTTTAGEGPAARSASSSAAPAHGLTK +FT SAKAKPLAINGTAALPAKQNENVNKKAGSTWQTGMDRYITIKRKLSPENSDLGNKPKN +FT TRDNSTLIKNVAPANTNRFALLVDTAEDVPLGSVDIEPKKTKPPPIYIREKSTSRLVN +FT TLIGLIGKDSFHIIPLVRGTINEIKLQTKTEDDYRKVTNYFTAQKIGFYTYQLKSSKG +FT LQVVLKGIESDVTPEEITEALKEKGFYAKNVFNIKNRNRQPQPLFKIELEPENKPPRK +FT NEVHPIYKLQLLLHRRITVEEPHKRNAPVQCTNCQEYGHTRSYCTLRPVCVVCGDLHD +FT SKQCQINKENACEKKCNNCGGNHTANYRGCPIYKELKIRLHKRMNTARAHQGSATLIP +FT SETNPEVIFSKAASFAPWPTFNTNKTTFANVLKSGMTPPTQNSRTPHEVHTKLDTQQN +FT YHPAAQQETKTEAMMQALQQSMMEFMTFMKTTIQDMMRNQNLLIQMLVAQQSNK" +FT SO_feature CDS ; SO:0000316:1880..4561 +FT /name="Dmel\F-element\RTase" +FT /db_xref="FLYBASE:FBgn0041633" +FT /db_xref="TREMBL:Q24335" +FT /translation="MATLRIATWNANGVSQRKLELAQFLHEKHIDVMLLSETHLTSKY +FT NFQIRDYHFYGTNHPDGKAHGGTAILIRNRMKHHFYKEFAENHLQATSINIQLDDNTL +FT LTLAAVYCPPRFTVLEAQFLDFFQALGPHFIAAGDYNAKHTHWGSRLVNPKGKQLYKT +FT IIKATNKLDHVSPGSPTYWPSDLNKLPDLIDFAVTKNISRSLVKAECLPDLSSDHSPV +FT LIHLRRYAENVKPPTRLTSSKTNWLRYKKYISSHIELSPKLNTESDIESCTCALQSIL +FT TAAALTATPKITNNTINSKKTNVQIEQLVHVKRRLRREWQSSRSPTAKQKLKVATRKL +FT ANALKQEEDDDQRRYIEQLTPTGTKQKSLWRAHSTLRPPTETVLPIKNSSGGWARSDE +FT DRANTFAAHLQNVFTPNQATSTFALPSYPVNRHQQHTPIVFRPKEITKIIKDNLSPKK +FT SPGYDLITPEMIIQLPHSAVRYITKLFNAITKLGYFPQRWKMMKIIMIPKPGKNHTVA +FT SSYRPISLLSCISKLFEKCLLIRLNQHQTYHNIIPAHQFGFRESHGTIEQVNRITTEI +FT RTAFEYREYCTAVFLDVSQAFDKVWLDGLMFKIKISLPESTHKLLKSYLYDRKFAVRC +FT NTATSTVHTIEAGVPQGSVLGPTLYLIYTADIPTNSRLTVSTFADDTAILSRSRSPIQ +FT ATAQLALYLIDIKKWLSDWRIKVNEQKCKHVTFTLNRQDCPPLLLNSIPLPKADEVTY +FT LGVHLDRRLTWRRHIEAKKTQLKLKANNLHWLINSGSPLSLDHKVLLYNSILKPIWTY +FT GSQLWGNASNSNIDIIQRAQSKILRTITGAPWYVRSENIQRDLNIPSVTNAITELKEK +FT YL" +XX +CC K. O'Hare, Personal communication to FlyBase, 1 May 2000. +CC CDS2 translation from M17214; AC005198 has a 1-bp deletion. +XX +SQ Sequence 4708 BP; 1618 A; 1242 C; 857 G; 991 T; 0 other; + AATCAATTAA TCAATTCGAT CGCCGACGTG TGAAGACGTT TTTATCGTGC TCCGCACAAA 60 + ATCGGTTGTT TTGAGTGAAG TGAACGCCAA ATAAAATAAA CTAAATAAAA AATCTGAAAG 120 + CGAAAGAGAC GCTCTATGCG ATGCAAGATC GCTTAAATAC ATAGTGAATT GTTATCTTAA 180 + ATAATAAAAC TATGAGTCAG AATGACACTC GCGCCCAGCG TCAGCGCGAG CATGACGAAC 240 + GCCGACTCTC AATTCAGCGC AACAACGCGT ACTTCTCCTA CGTCTCACCG ACAATCCCAA 300 + ACGCAGACAT CGAGCGGTCA ATAACCCATA GCCCAGGAAA CCTTCTTCTA CCAACAAATC 360 + AAGAAAGAGC GCGCTCCTGC TCTCCCGCTC TATTGGCTCC GACAGAAGCC CCGCTACCTC 420 + CAACAACAAC AGCTGGAGAG GGACCGGCAG CCCGCTCTGC CTCGTCATCG GCTGCACCCG 480 + CTCACGGTCT GACTAAGTCA GCGAAAGCAA AACCGCTAGC AATAAACGGT ACTGCTGCAC 540 + TGCCAGCAAA ACAAAACGAA AACGTAAACA AAAAAGCTGG GTCGACCTGG CAGACTGGAA 600 + TGGACCGCTA CATTACAATA AAGCGAAAGC TCAGCCCGGA AAATTCAGAT TTGGGAAACA 660 + AGCCGAAAAA TACACGCGAT AACTCTACCT TGATCAAAAA TGTAGCCCCT GCAAATACCA 720 + ACAGATTTGC CTTGCTGGTA GATACCGCTG AGGACGTGCC GCTGGGATCC GTTGATATCG 780 + AACCGAAGAA AACAAAGCCT CCGCCAATAT ACATCCGCGA GAAGAGCACA AGCCGTCTTG 840 + TAAATACTTT GATTGGCCTT ATTGGGAAAG ATAGCTTTCA TATAATTCCC CTCGTAAGAG 900 + GTACTATCAA CGAAATCAAA CTTCAGACGA AAACGGAGGA CGACTACAGA AAAGTCACAA 960 + ACTATTTTAC CGCACAAAAA ATAGGCTTCT ACACCTACCA GCTTAAAAGC AGCAAGGGCC 1020 + TGCAAGTAGT CCTGAAGGGC ATTGAGTCTG ATGTTACGCC CGAAGAGATA ACTGAGGCGC 1080 + TAAAGGAAAA GGGATTTTAC GCCAAAAACG TGTTCAATAT CAAAAACAGA AACAGGCAGC 1140 + CCCAACCACT CTTCAAGATT GAGCTTGAAC CAGAAAACAA GCCTCCTAGA AAAAACGAGG 1200 + TTCACCCAAT TTACAAACTC CAGCTCCTTT TGCACCGTAG GATCACGGTA GAAGAGCCGC 1260 + ACAAACGCAA CGCTCCTGTA CAATGTACAA ACTGCCAAGA GTATGGCCAC ACGAGGTCAT 1320 + ATTGTACACT TCGCCCGGTG TGCGTAGTCT GTGGAGATCT CCACGACTCC AAACAGTGTC 1380 + AAATTAACAA AGAAAATGCA TGCGAGAAAA AATGTAATAA CTGCGGGGGC AATCACACAG 1440 + CAAACTACAG AGGCTGTCCA ATCTACAAAG AGCTGAAAAT CCGTCTTCAC AAAAGAATGA 1500 + ACACGGCGCG GGCACACCAA GGATCAGCTA CCCTGATACC ATCAGAGACA AATCCTGAAG 1560 + TAATTTTCTC GAAAGCAGCT AGTTTCGCTC CCTGGCCTAC ATTCAACACT AACAAGACAA 1620 + CATTTGCTAA CGTTTTAAAA TCAGGTATGA CGCCTCCAAC CCAAAACTCC CGAACTCCAC 1680 + ATGAAGTGCA CACAAAATTA GACACACAAC AAAACTATCA CCCAGCTGCG CAGCAGGAAA 1740 + CAAAAACTGA AGCTATGATG CAAGCCTTAC AACAGAGCAT GATGGAATTT ATGACATTTA 1800 + TGAAGACCAC CATTCAAGAC ATGATGCGTA ATCAAAACCT TTTGATACAA ATGCTTGTAG 1860 + CCCAACAATC AAATAAATAA TGGCTACCTT ACGCATAGCT ACGTGGAACG CCAATGGCGT 1920 + CTCACAGCGC AAACTTGAGC TAGCTCAATT CCTACATGAG AAGCATATCG ACGTAATGCT 1980 + TCTTTCGGAA ACTCATCTCA CAAGCAAATA CAATTTTCAA ATAAGAGACT ACCATTTCTA 2040 + CGGTACAAAT CATCCCGACG GAAAAGCACA CGGTGGCACC GCCATACTCA TAAGGAACCG 2100 + TATGAAGCAC CACTTTTACA AAGAATTTGC GGAAAATCAT CTTCAGGCCA CATCTATCAA 2160 + CATTCAGCTG GATGACAACA CTCTCCTTAC ACTAGCGGCC GTATACTGCC CCCCCCGTTT 2220 + CACAGTATTA GAAGCTCAAT TCCTGGATTT CTTCCAAGCA CTAGGGCCAC ACTTCATTGC 2280 + AGCAGGCGAC TACAACGCTA AACATACTCA CTGGGGATCG CGACTTGTGA ACCCAAAAGG 2340 + AAAACAGCTT TATAAGACGA TAATAAAAGC CACTAATAAA CTTGACCATG TTTCCCCCGG 2400 + GAGTCCTACA TACTGGCCAT CAGACCTCAA TAAGCTGCCA GACCTGATCG ACTTCGCAGT 2460 + TACGAAAAAT ATTTCCCGCA GTTTGGTTAA AGCTGAATGT CTGCCGGATC TCTCATCTGA 2520 + TCACTCGCCT GTACTAATTC ACCTCCGCCG ATACGCAGAA AACGTGAAAC CACCAACCAG 2580 + ATTGACCTCT AGCAAAACAA ACTGGCTCAG GTATAAAAAA TATATAAGTT CACATATTGA 2640 + GCTAAGCCCA AAACTCAATA CTGAATCTGA TATAGAGAGC TGCACGTGTG CATTGCAATC 2700 + CATCCTTACT GCAGCAGCTC TTACTGCAAC ACCCAAAATA ACAAATAATA CAATTAATTC 2760 + AAAAAAGACC AACGTACAAA TCGAGCAACT CGTCCACGTA AAACGTCGCT TACGCAGAGA 2820 + ATGGCAATCT TCCAGATCCC CAACTGCAAA ACAAAAGCTA AAAGTAGCCA CACGGAAACT 2880 + GGCCAACGCT CTGAAACAAG AAGAGGACGA CGATCAGCGC CGATACATAG AGCAACTCAC 2940 + ACCAACAGGC ACAAAACAAA AGTCACTGTG GCGAGCCCAC TCAACTCTTC GCCCACCGAC 3000 + TGAAACCGTT TTGCCGATAA GGAATTCATC AGGTGGCTGG GCCCGTAGTG ATGAAGACAG 3060 + AGCCAACACA TTTGCCGCTC ACCTACAAAA TGTGTTCACG CCAAACCAGG CTACTAGCAC 3120 + ATTCGCGCTA CCGTCCTATC CCGTAAACCG CCATCAGCAA CACACCCCAA TTGTGTTTCG 3180 + TCCTAAAGAA ATAACTAAAA TAATCAAAGA CAATCTCAGC CCGAAAAAAT CCCCCGGCTA 3240 + CGACCTTATA ACACCGGAAA TGATCATCCA GCTGCCACAT TCTGCAGTTC GCTACATAAC 3300 + CAAGCTCTTT AATGCCATCA CCAAACTTGG TTACTTTCCA CAACGATGGA AGATGATGAA 3360 + GATCATAATG ATTCCAAAGC CTGGTAAGAA CCACACAGTC GCTTCATCTT ACAGACCAAT 3420 + AAGTCTACTC TCATGCATTT CGAAACTATT CGAAAAATGC CTGCTGATCC GACTTAATCA 3480 + ACATCTGATA TACCACAATA TAATCCCAGC CCACCAATTT GGATTTCGCG AAAGCCACGG 3540 + AACCATTGAA CAGGTGAATC GTATTACAAC GGAAATAAGA ACTGCATTTG AATATCGCGA 3600 + ATACTGTACA GCAGTATTTT TAGACGTATC CCAAGCATTC GACAAAGTCT GGCTCGACGG 3660 + CCTAATGTTT AAAATTAAAA CATCCCTACC CGAAAGCACA CACAAACTTC TAAAGTCTTA 3720 + CCTCTATGAC AGAAAGTTTG CAGTGCGGTG CAACACTGCC ACTTCCACTG TTCATACAAT 3780 + TGAGGCTGGA GTCCCCCAAG GCAGCGTTCT TGGGCCAACC TTATACCTCA TCTATACAGC 3840 + CGACATCCCT ACAAATAGTC GCTTAACGGT ATCCACATTT GCCGACGATA CAGCTATCCT 3900 + TAGCCGTTCA AGGTCCCCTA TCCAAGCTAC AGCACAGTTG GCACTGTACC TCATCGACAT 3960 + TGAGAAGTGG CTCTCTGACT GGCGAATAAA AGTAAACGAG CAAAAATGCA AGCACGTGAC 4020 + GTTTACGCTA AACAGACAAG ACTGTCCTCC GCTCTTGTTG AACAGCATAC CACTCCCGAA 4080 + AGCAGACGAG GTAACGTACC TAGGAGTACA CCTAGACAGA AGACTCACAT GGCGCAGGCA 4140 + CATTGAAGCC AAAAAAACCC AACTTAAACT CAAAGCCAAC AACTTACACT GGCTCATCAA 4200 + CTCTGGTTCT CCGCTCAGCC TAGATCACAA GGTCTTGCTC TACAATTCTA TATTGAAACC 4260 + AATCTGGACC TATGGCTCAC AGTTATGGGG CAATGCCAGC AACAGCAATA TTGACATCAT 4320 + TCAGCGAGCA CAATCAAAGA TTCTGAGAAC CATCACTGGG GCACCGTGGT ACGTTCGGAG 4380 + TGAAAACATC CAAAGAGACT TAAATATCCC ATCAGTTACC AACGCAATCA CGGAACTTAA 4440 + GGAAAAATAC CATAGCAAGC TTCACACGCA CCCCAACCAC CTAGCGCGAG GTCTAATCCA 4500 + GCTCAGCAGC CGTTCCCGTC TCCGGCGAAA GGACCTACCA ACCCAGCGAA TAAATTATTA 4560 + GGGCCGTTTA AACATAGAAC AGTTGGAAAA ATAATACAAC TGTTCAAAAA ATACTTGTTA 4620 + TAGTTAAGAT TTTTAAACTT ATTGTTAGTT CTTATACAAG AAGATTCAAT AAATAAAAGC 4680 + AAAGTAAAAT AAAAAAAAAA AAAAAAAA 4708 +// +ID FB standard; DNA; INV; 4347 BP. +XX +AC X51937; +AC X15469; +XX +DR FLYBASE; FBte0000466; Dmel\NOF. +XX +FT source join(X15469:94..1010,X51937:1..3430) +FT SO_feature CDS ; SO:0000316:797..3874 +FT /name="Dmel\NOF\ORF" +FT /db_xref="FLYBASE:FBgn0044029" +FT /db_xref="SWISS-PROT:P16320" +FT /db_xref="NCBI_PROTEIN:CAA36201.1" +FT /translation="IQQLDTSANLTLNSTFPDDDPEFQITEASKNGPLPILYFNLELDL +FT ELWRSIAPKKDQKTEKLQPNWTDTMAKLIYKKVPLPCAFNFRKAKLSDKVDNIWLRIEG +FT YCNDCSSILKGHCLVKPDEQCGIMISVSVPDTRGIPHNKKRRCTGSRRLEIGNELILKK +FT AALWRKEATDNMNDDDPEPSYIPNLPTLRKLREEATNRHLGITKDRDPVSSLYLKKYEG +FT ELAGCILDIGLDEFFCIYCTGTQVKTYASRIKTIRKISIDATGSVVLPIQKPNGDSSYV +FT FLYQIVMEGDDSIFPVFQMLSAKHDTASIQFWLSRFISKSGHFPLEVVSDFSLALLNGI +FT SLSFNECRIATYIKKCFHSLLMEERTDLPPCYIRLDIAHLIKMICRKNVFKSKLPNLKD +FT FYTRCIGLATTCETKDSFAELIKSVLIVALSQSSGEDEKGDILSSYRNEKYLLARIATF +FT TAPDHKETIEDNCIPEDQEEIDEDVTDFISNIKIAAEEEALNCNSVNCRPNPYFLPELM +FT PPLIKLCKYFVLWTNVMKEKFCSKYDVGSSALVEAYFKDLKNTDMSIFHRPVRADKFVV +FT QHIRCIEAVCKLERAAMKRKTVKTPSFIKENAPKKMCSKETKGFLEEILEESEVEYLLQ +FT EENWKVKNKTIKPTEGNDAEDNDTDDENKEMDLSEQPKEKPRGKYLKKCPNVELLYNRP +FT HRRKQDEILHNGGSMGPVWIGKQLLQFKNTCPFDSLVEILSTAYIDNFYYKSLLDDFYT +FT DNLTIELVKKYAVEGVSSSLYCDRGLVLKSFFDEKHQIIKCDANIGSFIEKALNGVPSA +FT SSHRTHIKNNHDCRNQKYIHHRLEVIDVEKVGHLDVQEVVIPFIDEFFARTDGECKICG +FT GQQILERQPGPHVILDIEFAMDAFHQIHHNGLPGTTTLLQVPEEILIQEKKYILSGAIE +FT YVPAMGGEIGHYIAYCRRVIGSWEVHNDMCRQWKKFSALNTKMTLHILIYTRKN" +XX +CC Derived from X15469 (g7962) (Rel. 36, Last updated, Version 3). +CC Derived from X51937 (g8297) (Rel. 44, Last updated, Version 6). +CC Takis Benos and Michael Ashburner, 25-Aug-1997. +CC Any changes to original sequence record are annotated in an FT line. +XX +SQ Sequence 4347 BP; 1461 A; 775 C; 885 G; 1226 T; 0 other; + TATATTCTAT TGCCCACCAT ATAAACACGT GCCACTTTCC TAGTTTTAGG ATCTGCCTAC 60 + ATAACACGTG CAGACGCACA GGTGTTTCTG GGTTTATATA GACCAAAAAT TGGTTCCGAT 120 + TGCCAATCTT GTAATTTACA GTTTACCAGG TAATTACATA ATTTTCAAAC CTCACTTTAT 180 + GATAGGGTCC AATTTTTTAC CTGTGACAAA GTGTTAAATT TTTTAAGAAT GGGTTTTTCA 240 + TGGCAGGTCA GAATCCTCTA TAAAATCTAA AACACTTGTC GGTATTTGAA AATCGCTCTC 300 + CTCCTTGATT CTCATATTAG GTGTAAAAGA TAAATCCGGA ACTCATAATT AAAATATTTT 360 + TTATGTGAAA AAGTTGTGCG CGATTTTAAC TACGCTTACC CAGTGCTGGA AAAGTTAAAG 420 + TTGTTTTGTT TTTCAAAGAA AGTGAAAGTT GCTAAGCACG AACTTAAGAA ATCTGAGTGA 480 + TTGTGTTAAA TTTATTTGAA TCCTTGTGAA TTTTGTTGAC AGTCTTTTTA AAGACTTGCA 540 + AAATTTTCAT ATTATTCGGT TCTTGCTTTT ATTTTTATAC AACGCGTTTT TCCTTTAGGC 600 + ATACCTTTAT ACATTTACAG TGTAAACAAC AGTGTAAAAC GTGTAAATCA GTGCAAAATA 660 + GTTTTTTTTA TTTACTCCAT AAAAAATAAG TGTTACTGTC AGGATGCCGG CCAAACCGCA 720 + AGTCGATGGT CACACCTTAG TGGATGCATT TTGCTGCGCG AATATTTTTA CGGAGACTGG 780 + AGCTCTTAAG CCAAGAAGCG ATAAAGTTTG GATGGATATA AGCAACCAAT TGAAAGGAGC 840 + GATCAGCGCG AAGACGCTTA ATTTCTACGC CAGAATCAAT AGGAATAACA TGATAACTGT 900 + GGTTAAAGAA CGATGTGGAA TTCAACAGCT GGATACTAGT GCCAATTTAA CTTTAAATAG 960 + CACATTTCCT GATGATGACC CGGAGTTCCA GATCACCGAA GCTTCAAAAA ATGGACCATT 1020 + GCCTATTTTG TACTTTAACC TGGAGTTGGA CCTGGAATTG TGGAGATCAA TTGCCCCCAA 1080 + AAAGGATCAA AAAACTGAAA AACTGCAACC TAACTGGACG GATACTATGG CAAAGTTGAT 1140 + ATACAAAAAA GTTCCTCTTC CGTGTGCATT TAATTTTAGA AAAGCTAAAC TTTCCGACAA 1200 + AGTGGATAAT ATTTGGCTAC GAATTGAAGG CTATTGCAAT GACTGCAGCT CAATTTTAAA 1260 + GGGACATTGC CTTGTGAAAC CCGATGAACA ATGCGGCATA ATGATATCTG TTTCAGTACC 1320 + GGACACACGA GGTATACCTC ATAATAAAAA ACGACGGTGC ACTGGATCGA GACGACTTGA 1380 + AATTGGGAAC GAGTTGATTT TAAAAAAAGC TGCATTGTGG AGGAAGGAAG CCACCGACAA 1440 + CATGAATGAT GACGACCCAG AACCGAGTTA CATACCAAAT TTACCAACCC TTCGGAAACT 1500 + TCGTGAAGAG GCAACTAACA GACACCTAGG AATTACCAAG GATCGGGATC CAGTTTCATC 1560 + ATTATACCTT AAAAAGTATG AGGGTGAATT GGCTGGATGC ATTCTTGACA TTGGATTGGA 1620 + TGAATTTTTC TGCATATACT GCACAGGAAC CCAAGTAAAA ACATATGCAT CAAGGATAAA 1680 + AACTATTAGA AAGATTTCTA TTGACGCAAC TGGAAGCGTG GTGTTACCCA TCCAAAAACC 1740 + AAACGGTGAC TCTAGTTATG TTTTTCTGTA CCAAATTGTA ATGGAGGGTG ACGACAGTAT 1800 + ATTTCCAGTT TTTCAGATGC TGTCGGCTAA ACATGACACA GCCAGCATAC AGTTTTGGTT 1860 + AAGCAGATTT ATATCAAAGT CGGGGCATTT TCCACTGGAG GTTGTATCTG ATTTTTCCTT 1920 + GGCATTGCTA AATGGAATAA GCTTAAGCTT TAATGAGTGT AGGATTGCGA CGTATATAAA 1980 + AAAATGTTTC CACAGCCTTT TGATGGAGGA ACGGACGGAT CTGCCACCCT GCTATATTCG 2040 + ACTTGACATC GCCCACCTAA TTAAAATGAT ATGCCGGAAG AACGTCTTCA AAAGTAAATT 2100 + ACCGAACCTC AAGGATTTTT ATACTAGATG TATTGGTCTT GCAACAACGT GTGAGACAAA 2160 + GGACAGTTTT GCGGAATTAA TTAAATCAGT ACTGATTGTC GCACTGAGCC AATCCTCAGG 2220 + GGAAGATGAA AAAGGAGACA TTCTTTCAAG TTACAGGAAT GAAAAGTATC TGCTCGCCAG 2280 + AATAGCTACA TTTACTGCCC CGGATCACAA GGAGACCATT GAGGACAACT GCATACCAGA 2340 + GGACCAGGAG GAAATTGACG AGGATGTTAC GGACTTTATC TCTAATATTA AAATCGCTGC 2400 + CGAAGAAGAA GCGTTAAATT GCAATTCGGT CAACTGTCGG CCAAATCCGT ATTTCCTACC 2460 + TGAGCTAATG CCACCATTAA TTAAGTTGTG CAAATATTTT GTTTTATGGA CAAACGTGAT 2520 + GAAGGAAAAG TTCTGTTCCA AATATGATGT CGGCTCTTCG GCTCTTGTGG AAGCCTATTT 2580 + CAAGGATTTA AAAAACACGG ACATGAGCAT ATTCCACCGA CCAGTGAGAG CGGATAAATT 2640 + CGTGGTGCAA CATATCCGAT GCATCGAAGC TGTTTGCAAG CTGGAACGAG CCGCGATGAA 2700 + ACGCAAGACC GTTAAAACTC CCAGCTTTAT AAAAGAAAAC GCTCCTAAGA AAATGTGCAG 2760 + TAAGGAAACC AAGGGATTTC TGGAGGAAAT ACTTGAAGAA AGCGAAGTGG AATACCTTTT 2820 + ACAAGAAGAA AACTGGAAGG TGAAGAATAA AACAATAAAG CCCACGGAAG GAAATGATGC 2880 + TGAAGACAAC GACACTGATG ATGAAAACAA GGAAATGGAT TTAAGTGAAC AGCCCAAAGA 2940 + AAAACCAAGG GGAAAATATC TCAAAAAATG CCCCAATGTG GAGTTATTAT ACAATCGACC 3000 + ACATCGAAGG AAACAGGACG AAATTTTGCA TAATGGTGGA TCAATGGGAC CCGTCTGGAT 3060 + TGGCAAACAA TTATTGCAAT TCAAAAATAC TTGTCCGTTT GACTCTCTAG TGGAAATATT 3120 + GTCGACCGCA TACATAGACA ATTTTTATTA CAAAAGCCTA TTGGATGATT TCTACACTGA 3180 + CAACTTGACG ATAGAATTGG TGAAAAAGTA TGCCGTCGAG GGAGTTTCGT CCAGTCTCTA 3240 + CTGCGACAGA GGTCTGGTCC TAAAAAGTTT TTTTGATGAA AAACACCAGA TTATAAAATG 3300 + CGACGCAAAT ATTGGGTCTT TTATTGAAAA AGCGCTGAAT GGAGTACCCA GTGCGTCAAG 3360 + TCATCGGACC CATATAAAAA ACAACCATGA TTGCAGGAAC CAAAAATATA TCCACCATCG 3420 + GCTGGAGGTT ATAGATGTCG AAAAAGTTGG CCACCTCGAC GTCCAGGAGG TAGTGATCCC 3480 + CTTTATTGAT GAGTTTTTTG CAAGAACTGA TGGAGAATGT AAAATATGCG GTGGACAACA 3540 + GATCCTTGAA AGGCAGCCAG GACCGCATGT CATACTTGAT ATAGAATTTG CAATGGATGC 3600 + TTTTCATCAA ATTCATCATA ACGGTTTACC AGGAACGACC ACTTTACTTC AAGTGCCGGA 3660 + GGAAATTTTA ATACAGGAAA AGAAATATAT TTTAAGTGGT GCCATCGAAT ATGTTCCTGC 3720 + GATGGGAGGG GAAATTGGAC ATTACATTGC ATATTGCCGC AGAGTCATTG GATCTTGGGA 3780 + AGTGCACAAC GATATGTGCA GGCAATGGAA AAAGTTCTCA GCTCTAAATA CCAAAATGAC 3840 + ACTCCACATT TTGATATACA CCCGGAAAAA TTAATGTTTA TTTTTAAGCC TTGTTTAAAA 3900 + GTGTAAAAAA TATTTGTTGT TAAAAATTAC AATCTTAAGT CCTTTGCAAA CGTTGTTTAA 3960 + AAATAAAATT AAATTAATTA TTTTACAAAA CTTAACCCTT TTTCACTTTT ATACCTAATA 4020 + TAAAGAGGTC CGTAAAGTAT CAAGGAGGAG AGCGATTTTC AAATACCGAC AAGTGTTTTA 4080 + GATTTTATAG AGGATTCTGA CCTGCCATGA AAAACCCATT CTTAAAAAAT TTAACACTTT 4140 + GTCACAGGTA AAAAATTGGA CCCTATCATA AAGTGAGGTT TGAAAATTAT GTAATTACCT 4200 + GGTAAACTGT AAATTACAAG ATTGGCAATC GGAACCAATT TTTGGTCTAT ATAAACCCAG 4260 + AAACACCTGT GCGTCTGCAC GTGTTATGTA GGCAGATCCT AAAACTAGGA AAGTGGCACG 4320 + TGTTTATATG GTGGGCAATA GAATTTA 4347 +// +ID DMTNFB standard; DNA; INV; 1106 BP. +XX +AC V00246; J01084; +XX +DR FLYBASE; FBte0000288; Dmel\FB. +XX +FT source V00246:1..1106 +XX +CC Derived from V00246 (g8708) (Rel. 36, Last updated, Version 3). +CC Josh Kaminker 2 Aug 2002. +CC Any changes to original sequence record are annotated in an FT line. +XX +SQ Sequence 1106 BP; 340 A; 228 C; 119 G; 419 T; 0 other; + AGCTCAAAGA AGCTGGGGTC GGAAAAATCG AATTTTTGAA ATTTGAAAGC TGGAATCGTT 60 + TGCCCATTTT TTGCCCATGT TTGCCCACCA ATTAGTTTTT TTTGCCCACG TCCAGTTTTT 120 + GAGATATGGA TTTTCGAAAA AGTTCGAAAA TGTTCGAAAA TCAAAAATTT CGCTTTTTTC 180 + AAATTTTTTT TTTTTTAAAT CGCAATAACA TCGTTTGCCC ACGTTTGCCC ACCCTTTAGA 240 + ATTTTGAAAA AATTTATACT TTAGAAAATA TAAGGCTTTT AAGTTTACCT CGGTCTAATC 300 + AGAGAGTAAA TCGTTTGCCC ATCTCTTAAA ACCAAATATT ATCAACAAAA AACGTTTGCC 360 + CAACCATTAT TATTAGTTTT TATCGTTTGC CCACCCTTTA AAAAACCTTT AACAAAATTT 420 + TTTTTTCGAT TGCCCACACT TGAAATACAA CCAATTTCGT TAGCCCACCT CTTCAAAATA 480 + AATATTTCCA ATAAAAAACG TTTTCCCACC ATTTAAAAAT AAATAATTTC GATTGCCCAT 540 + CCTTCAAAAT TCATTTTAAC GTTTGCCCAC CCTTTAAAAT TTGTTTTTTT CGTTTGCCCA 600 + CTCTTAAAAC TAAATAATTT CGATTGCCCA CCTTTTAAAA CTAAATAATT TCGTTTGCCC 660 + ATCCTTTAAA ATTCATTTTT AACGTTTGCC CACCCTTTAA AAATAAATTA TTTCGTTTGC 720 + CCACCCTTTA AAATTTGTTT TTTTCGTTTG CCCACTCTTA AAACTAAATA ATTTCGATTG 780 + CCCACCTTTT AAAACTAAAT AATTTCGTTT GCCCATCCTT TAAAATTCAT TTTAACGTTT 840 + GCCCACCCTT TAAAAATAAA TTATTTCGTT TGCCCACCCT TTAAAAGTTT TTTTTTTTCG 900 + TTTGCCCACT CTTAAAACTA AATAATTTCG ATTGCCCACC TTTTAAAACT AAATAATTTC 960 + GTTTGCCCAT CCTTTAAAAT TCATTTTTAA CGTTTGCCCA CCCTTTAAAA TTTGTTTTGT 1020 + AAGATGTGGC GCCAATTCAG ATATTTTAGG ATCGGCGGAT AGAAGCACTT ACTTATATGA 1080 + TGATGATGAA CATACATAGA CATAAT 1106 +// +ID DMREPG standard; DNA; INV; 4346 BP. +XX +AC X06950; +XX +DR FLYBASE; FBte0000657; Dmel\G-element. +XX +FT source X06950:1..4346 +FT SO_feature CDS ; SO:0000316:220..951 +FT /name="Dmel\G-element\ORF0" +FT /db_xref="FLYBASE:FBgnXXXXXXX" +FT SO_feature CDS ; SO:0000316:819..1539 +FT /name="Dmel\G-element\ORF1" +FT /db_xref="FLYBASE:FBgnXXXXXXX" +FT SO_feature CDS ; SO:0000316:join(1530..1858,1866..1973,1982..2719,2727..3008,3012..3800,3806..3991,4006..4095) +FT /name="Dmel\G-element\ORF2" +FT /db_xref="FLYBASE:FBgnXXXXXXX" +XX +CC Derived from X06950 (g8427) (Rel. 16, Last updated, Version 1). +CC Takis Benos and Michael Ashburner, 20-Aug-1997. +CC Any changes to original sequence record are annotated in an FT line. +XX +SQ Sequence 4346 BP; 1215 A; 1356 C; 959 G; 816 T; 0 other; + ACAGTCGCGA TCGAACACTC AACGAGTGCA GACGTGCCTA CGGACCGACG GCAAGTTATT 60 + TTCGTGCTCA AAGTCCCGCT ACTCTAAAAC CGCTACGTAG TGTCGCGAGA TTTCTTCGCG 120 + CACCGTGATT GGTTCAGCCG GCGAACCTTA CGGTATCGCT ACCACTACCA ACGCACTCGT 180 + GCGTGCGTGT TATCGGTATC AACAGTTACA TTCGGCTAAA GTTACTGCGA ACAACTCAGC 240 + AGCAGCCACG TGCTGAGGCT GGTACACCAA CAAACGGTTC CTACCGTGCC CTCCTCCCCT 300 + CCTTCCCTAC TCCGGGACAA CATGGACTGG CAAGCCCCCC CGCGACCCAC CAAGCTGACC 360 + AAAGTGCCTA GAAAGAAGGC GCTCAAAGAG GCGCCAGGAG AAGGTGAAAG CAGCTGCTCA 420 + AGCGATAGCA GCTCCTCGGA GTCAGAGCCT GGGGAAGTCA AGCGCAAAGC AGCGAGCAGA 480 + GACGCTAAGG AAGCCGCCGA CAACGTGCCC AACACCAGCG CAGCTCTGCG CAAGAAGCTG 540 + GAAAATAACT CCTTCGCCCT TCTGTCCAGC ACTGAGGACG AAGACGATGA CGACGACAAC 600 + ACCGACAACG AGCAGCAAAC CCCTGTTGGG GAATCTGCTC CAAAAACCAT GAAAAAACCC 660 + AACCCGACCC CGAAGACCAT CAAGCCACCC CCGATCTACA TCCCAGACGT GACCAACATC 720 + TCAGCCCTTG TCAGGATGAT TACGACTCTC GTCGGTGCCC ACAAGGAATT CTCGTACAAA 780 + ACTGAGAGAA ACAACAATGT ACGAGTAATG ATGCCTGACA AGGAATCCTA CTCAGCCTTT 840 + CGTCAGCAGC TTGTGACCCA GAACAAAAGG CACCGCACAT TTCAACTGTC AGGGACCTGC 900 + ACAACCCAAT TGGCAAAAAA TCAAAGGAAC CCCTGGGGAT CTTCTTTGTA AACCTGGAAC 960 + CTGCGAGCAA CAATACAGAC ATCTACAAAC TCAAGAGAAT CTGCAGGTCG GTCGTCACCG 1020 + TTGAGCCGCC TCTGAAATTC AACGATGTTC CGCAGTGCTT CAGATGTCAA GGGTTCGGAC 1080 + ACACCCAGCG CTACTGCTTT TTAGAGTTTC GCTGCGTCAA GTGTGGTGGC CTCCACGACT 1140 + CCAGGGCGTG TGAAAAAAAG GAAGACGAGA AAGCATGCTG CCTACACTGT CAAGCCGACC 1200 + ATCCAGCGTC GTTCAAAGGG TGCCCCGCGT ATAAGAAGGC AAAGGCTCAA CAAGCTCCTA 1260 + AACCCAAAGC AAGGAGCATG GAAAGCAACA ACAAGCCCTC CTTTGAGCTC CCAAATATTA 1320 + CAAACGGTAT GAGCTATAGA GACGCGCTAA GTGGCACACG CAAGTCCCAA GCAAGCACTC 1380 + CCCCACCGAC ACCCCCAACC CCACCTGAAG CCCCACAACC TAACCACATG GAGGCTATGT 1440 + TCACTCGATT TGAGAGCCTG GTCGAAAGAA TGATGGAGAA GATGTTTGCT CAGGTGACGC 1500 + AGCTTGTTGC TTCCATCCTC AACAGCAAGT CATGCAAATA AGTCTCAACA TAGTCTTCTG 1560 + GAACGCGAAC GGCTTGCAGA GAAGCAAAGC CGAAGTTGAG CACACCATCA AAACCGACAA 1620 + CATCGATATT TTATTGGTCT CAGAATCCCA TTTTTGCCCC AGATCCCACT TCATCATCTC 1680 + CGGTTACGAC CTCATCACAG CCAACCACCC ATCAGGTAGA GCTCGAGGAG GAGCGGCCAT 1740 + GCTCATCAAA AGCGGCATAC AGTTCACTGA ACTGCCTGCG ATACAGGAGG ATTGGGCACA 1800 + GTGTGCAGTG GCCAGAGTCA ATAGCCTACA GGGAGATATT ACGGTTGGAG CGGTTTACTT 1860 + CCACCCCCAG GCACGCGATT ACAGAGACTC ACCTGCATGA GTTCTTCGAG TCCCTCGGAA 1920 + CTCGCTTCAT TGCAGCCGGA GACTTCAATG CAAAGCACTC CTGGTGGGGG TCCGCACAAA 1980 + CAACCCCAAA GGCAAAACGC TCCACAAGTA CCTGATGCGC AAAAACTTGG ACTGCCACTC 2040 + TACTGGAGAG CCCACACACT GGCCCTCGGA CCCTTCTAAG CAGCCGGATC TGCTGGACAT 2100 + CGCGATCTGC AAAGGCATAG GTCGTGCCAA ACTCGTCTGC ACTACATACG ACAGGCTCGT 2160 + ATCGGACCAC AGCGCCGTCA ACCTGCTCCT CAACATCCCT GTCCTCAGGA AGACGCCGCT 2220 + CCGTAGACTC ACGGGGAATC GCACCAATGC CCCCAAGTTC ACGTTCTGGA TGCTCTCCTC 2280 + CCTAAACCCA GACCCAGACC TCTCCACTCC AGGCAATATA GGCGCGGCCA TCGAAAAACT 2340 + GAACAAGGAG ATGCACAACG CCGCTGAGTT TGCGAACCCT CCTCCTCCTA CAACCCCGAG 2400 + AACTCCCGCA AGAGACCTGC ATTTGTGGTC CCCAGAAATC GCCGCCCTCG TGGCCGAGAA 2460 + GAGACGCCTC AGACGAGTAT GGTTCCTCTC GCGTAACCCC AGGGACAAGA CAGCGCTCAA 2520 + TCGCGCCTCC AAGGAACTCA AGGACAAACT AACCACCCTA CGCCAAGACT CGTTTCAACG 2580 + ATTCCTTGAA GATCTGGAAC CTGGAGACCC GCAGCACAAC CTGTGGATCG TCACGCGGCA 2640 + CATCAAAAGA CCCGCCAAGA AAATGGTACC AGTGCGTACA GCAGACTGCT CCTGGTGTCG 2700 + GTCTGAGGCA GAAAGAGCCG AAGCTTGCTG ACCACCTTCG CTCTGCCTTC ACTCCGTTTG 2760 + ACCGATGCAC AGCTGCAGAG CAAGCTGACA CCATCAGAGC TGTTGAAAGC CCATGTGCTC 2820 + CAGGACCTGC AATTCAGCCC GTCGCACCAG AGGAGATCGC GCAGGAAATT GCCTCGCTCA 2880 + GAAACGGCAA GTCTCCCGGC CCTGATCGCA TCGACGCTAC TGCGTTAAAA ATGTTGCCCA 2940 + CATTCTGCTC ACAGCTGCTT GCCAACATTT TTAACAGCTG CTTCCGGCTA GGGTATTTCC 3000 + CAAAACAATA GAAACGCGCC GAAGTGATTA CCATCCCCAA GCCCGGCAAA CCTGAAGCCA 3060 + ATCTTGCCTC CTATCGTCCG ATAAGTCTGC TGGCAATCCT CTCCAAAATA CTCGAAAGAG 3120 + TATTTCTGCG CAGAGTGCTG CCAGTACTGG ATGAGGCTGG TTTGATCCCC GATCACCAGT 3180 + TTGGCTTCAG GCGCTCCCAC GGAACACCAG AGCAATGCCA CCGGCTTGTA GAGCAAATTT 3240 + TGGAGGCCTT CGAAAGGAAG CAATACTGCT GCGCCGTCAT GCTGGATGTG AAGCAGGCCT 3300 + TCGACAAAGT CTGGCACCCT GGACTCCACT ATAAAATCAA GACTCACCTT CCCGGATCCC 3360 + ACTTCGCCTT CCTCAAATCA TTCACTGAGG GTAGAGAGTT CCAAGTTTGC TGCGGAACAG 3420 + CGACCAGCAC GCCTAGGCCG ATAAGAGCCG GAGTACCCCA AGGCAGCGTC CTTGGACCAA 3480 + TACTGTACAC ACTCTACACA GCAGACCTTC CTATCACACC CTCCCGGAGC CTAACAGTGG 3540 + CCACATATGC CGATGACACC GCCTTCCTAG CCTCCGCCTC AGACCCCCAA GAAGCATCAA 3600 + CCATCATTCT AAGCCAGCTG GATGCCCTCG ACCCATGGTT GAAACGATGG ACCATTGCCG 3660 + TGAACGCAGA CAAATCCTCC CAAACCACTT TCTCCCTGCG CAGAGGAGAC TGCCCCCCAG 3720 + TCACGCTCAA CGGGGAAACT ATTCCAACCT CAAGTTCCCC GAAATACCTT GGATTGACTC 3780 + TAGACCGGAG GCTCACTTGG CACACCAGGC TGACCTGCGC CTCAAGCAAC TCCACTGGCT 3840 + CATCGGGAAA AGGTCCAAAC TTAGGGAAAA CCTTAAACTC CTCCTGTACA AGGCCATCCT 3900 + GAAGCCAATT TGGACTTATG GGATTCAGCT GTGGGGCACT GCCAGCATCT CAAACCGCAA 3960 + CCGCATACAG CGCTTCCAGA ACAAGTGCCT GAGTCAATCG CTGACGCTCA CCCATACCAT 4020 + GAAAACTCCG TTATCCACAA GGAGCTTGGA ATGCCATGGG TAGCAGAGGA GATCTCCCGC 4080 + TTCAGCGAGA GATACGCTAA ACGACTGGAC AACCACCCTA ACCATCTGGC TATTAACCTC 4140 + CTGGACAACA GTGAAACCAT CAGACGCCTC CAGAGGAAAC ACCCGCTTGA TCTCCACCAC 4200 + CTATAACCCA CAACAATGAA CCCCCGACCA ATCTACAACT TTGTAATCCC TTAAGTTAAT 4260 + GCCCCCCCCA CCCAAACATT TAATTATTGT CCACATGGAC AGATTTTAAA TTAATACATA 4320 + GATCGCTAAA AAAAAAAAAA AAAAAA 4346 +// +ID DMGYPF1A standard; DNA; INV; 7469 BP. +XX +AC M12927; +XX +DR FLYBASE; FBte0000021; Dmel\gypsy. +XX +SY synonym: mdg4 +XX +FT source M12927:1..7469 +FT SO_feature five_prime_LTR ; SO:0000425:1..482 +FT SO_feature three_prime_LTR ; SO:0000426:6841..7411 +FT SO_feature polyA_site ; SO:0000553:7277..7280 +FT SO_feature primer_binding_site ; SO:0005850:482..492 +FT /bound_moiety="tRNA:lys2" +FT SO_feature CDS ; SO:0000316:1080..2435 +FT SO_feature start_codon ; SO:0000318:1..3 +FT /name="Dmel\gypsy\gag" +FT /db_xref="FLYBASE:FBgn0014965" +FT /db_xref="SWISS-PROT:P10405" +FT /db_xref="NCBI_PROTEIN:AAA70218.1" +FT /translation="MSWAHNYRKVKVEYESEDSWEEEQVGQALGRPLDSATVDITMDPN +FT QIQALIDNAVRQALSQQQSQFQTQLNSLAARVQSLQVEAPQIKIYEKVSVNPDVRCDIP +FT LDIIKSVPEFSGTQDEYVAWRQSAIYAYELFKPYNGSSAHYQAVAILRNKIRGAAGALL +FT VSHNTVLNFDAILARLDCTYSDKTSLRLLRQGLEMVRQGDLPLMQYYDEVEKKLTLVTN +FT KIVMTHEQEGADLLNAEVRADALHAFISGLKKALRAVVFPAQPKDLPSALALAREAEAS +FT IERSMFANSYAKAVEERAHSGANGKSRFQGKPNKEEQGQDRNPHFTKRPKNNGQTNKDT +FT QAQAPQPMEVDSSSRFRQRTEHYQNHPNESNAFKRRNSSERSTGPRRQRLNNVVQEAPK +FT QKDPKEEYEKTAKAAVEEIDSENEYAPSDDSLNFLGGAPGCRSLNDGWLGEP" +FT SO_feature CDS ; SO:0000316:2438..5470 +FT SO_feature start_codon ; SO:0000318:1..3 +FT /name="Dmel\gypsy\pol" +FT /db_xref="FLYBASE:FBgn0014966" +FT /db_xref="SWISS-PROT:P10401" +FT /db_xref="NCBI_PROTEIN:AAA70219.1" +FT /translation="MLIDTDAAKNYIRPVKELKNVMPVASPFSVSSIHGSTEIKHKCLM +FT KVFKHISPFFLLDSLNAFDAIIGLDLLTQAGVKLNLAEDSLEYQGIAEKLHYFSCPSVN +FT FTDVNDIVVPDSVKKEFKDTIIRRKKAFSTTNEALPFNTAVTATIRTVDNEPVYSRAYP +FT TLMGVSDFVNNEVKQLLKDGIIRPSRSPYNSPTWVVDKKGTDAFGNPNKRLVIDFRKLN +FT EKTIPDRYPMPSIPMILANLGKAKFFTTLDLKSGYHQIYLAEHDREKTSFSVNGGKYEF +FT CRLPFGLRNASSIFQRALDDVLREQIGKICYVYVDDVIIFSENESDHVRHIDTVLKCLI +FT DANMRVSQEKTRFFKESVEYLGFIVSKDGTKSDPEKVKAIQEYPEPDCVYKVRSFLGLA +FT SYYRVFIKDFAAIARPITDILKGENGSVSKHMSKKIPVEFNETQRNAFQRLRNILASED +FT VILKYPDFKKPFDLTTDASASGIGAVLSQEGRPITMISRTLKQPEQNYATNERELLAIV +FT WALGKLQNFLYGSREINIFTDHQPLTFAVADRNTNAKIKRWKSYIDQHNAKVFYKPGKE +FT NFVADALSRQNLNALQNEPQSDAATIHSELSLTYTVETTDKPLNCFRNQIILEAARFPL +FT KRNLVLFRSKSRHLISFTDKSWLLKTLKEVVNPDVVNAIHCDLPTLASFQHDLIAHFPA +FT TQFRHCKNVVLDITDKNEQIEIVTAEHNRAHRAAQENIKQVLRDYYFPKMGSLAKEVVA +FT NCRVCTQAKYDRHPKKQELGETPIPSYTGEMVHIDIFSTDRKLFLTCIDKFSKYAIVQP +FT VVSRTIVDITAPLLQIINLFPNIKTVYCDNEPAFNSETVTSMLKNSFGIDIVNAPPLHS +FT SSNGQVERFHSTLAEIARCLKLDKKTNDTVELILRATIEYNKTVHSVTRERPIEVVHPG +FT AHERCLEIKARLVKAQQDSIGRNNPSRQNRVFEVGERVFVKNNKRLGNKLTPLCTEQKV +FT QADLGTSVLIKGRVVHKDNLK" +FT SO_feature CDS ; SO:0000316:join(567..568,5551..7000) +FT SO_feature start_codon ; SO:0000318:1..3 +FT /name="gypsy\env" +FT /db_xref="FLYBASE:FBgn0014964" +FT /translation=" +FT MFTLMMFIPLVVANARITDFSHANYIPVLDGDVLVFEQRDLLKHSSNLSE +FT YASMIDETQKLSESFPHSHMRKLLEVDTDHLRTLLSVLKVHHRIARSLDF +FT LGTALKVVAGTPDATDLFKIKITEAQLVESNSRQIAINSETQKQINKLTD +FT TINKVINARKGDLVDTPHLYEALLARNRMLSTEIQNLILTITLVKSNIIN +FT PTILDHADLKPLVEQDTPIVSLIEASKIRVLQSENSIHILIAYPRVKFSC +FT KKVAVYPVSHQHTILRLDEDTLAECEHDTFAVTGCTDTTHFTFCERSRRE +FT TCVRSLHAGNAAQCHTQPSHLREINPVDDGVVIINEAAAHVSTDGSPETL +FT IEGTYLVTFERTATINGSEFVNLRKTLSKQPGIVRSPLLNIVGHDPVLSI +FT PLLHRMSNENLHSIQNLMDDVESEGSPRLWFVAGVVLNFGLIGSLALYLA +FT LRRRRASREIQRTIDTFNMTEDGHKLEGGVVNN" +XX +CC Derived from M12927 (g157583) (Rel. 44, Last updated, Version 6). +CC Takis Benos and Michael Ashburner, 20-Aug-1997. +CC Any changes to original sequence record are annotated in an FT line. +CC [See also:AF033821; alignments in /alignments/gypsy] +XX +SQ Sequence 7469 BP; 2301 A; 1808 C; 1602 G; 1758 T; 0 other; + AGTTAACAAC TAACAATGTA TTGCTTCGTA GCAACTAAGT AGCTTTGTAT GAACAATGCT 60 + GACGCGCCAG AATTGGGTTC AACGCTCCAC GCGAAGAATG CCTGGCAGCG GAAAGCTGAC 120 + ACTTCCTACC GGGAGTGTTG CTTCACGCTG CAAGAAATGC TGAGTCGGCT TGCCGACTTG 180 + TGGCGGCGCG ATGCATTGCT CGAGGGTAAA CTTAGTTTTC AATATTGTCT TCTACTCAGT 240 + TCAAATCTTG TGTCGAAATA AACCACAGCT TGCTCCGGCT CATTGCCGTT AAACATCATT 300 + GTTCTTATTT ACAATCAAAT CGCTATCGCC ACAAGGCTAG TGATAATAAC TAAGGGGGCG 360 + AAGTCAAGCC CTCCAACCTA ATCTCCATAA ACAGTGTCTA AGACGAACCT CAGCGAAAGA 420 + AGGAAGATCT CTAGACCTAC TGGAAATAAC ATAACTCTGG ACCTATTGGA ACTTATATAA 480 + TTGGCGCCCA ACCAACAATC TGAACCCACC AATCTAATTT AACACACTTT GTCAGGCGAC 540 + AAACAGGGTA GTTAAGTTAG AAAAGCATGT AAGTTTTACA AGACACTTCT TTGACGCAAT 600 + CAAGAAATTT ACGAGTGAAA AAAAAAAAAA AAAAAAGTTG TGTATCTGGC CACGTAATAA 660 + GTGTGCGTTG AATTTATTCG CAAAAACATT GCATATTTTC GGCAAAGTAA AATTTTGTTG 720 + CATACCTTAT CAAAAAATAA GTGCTGCATA CTTTTTAGAG AAACCAAATA ATTTTTTATT 780 + GCATACCCGT TTTTAATAAA ATACATTGCA TACCCTCTTT TAATAAAAAA TATTGCATAC 840 + TTTGACGAAA CAAATTTTCG TTGCATACCC AATAAAAGAT TATTATATTG CATACCCGTT 900 + TTTAATAAAA TACATTGCAT ACCCTCTTTT AATAAAAAAT ATTGCATACG TTGACGAAAC 960 + AAATTTTCGT TGCATACCCA ATAAAAGATT ATTATATTGC ATACCTTTTC TTGCCATACC 1020 + ATTTAGCCGA TCAATTGTGC TCGGCAACAG TATATTTGTG GTGTGCCAAC CAACAACCAA 1080 + TGAGTTGGGC ACATAACTAC AGAAAGGTTA AGGTCGAATA CGAAAGCGAG GATAGCTGGG 1140 + AGGAGGAGCA AGTAGGCCAA GCATTAGGTC GGCCGTTAGA TAGTGCCACG GTAGATATTA 1200 + CCATGGACCC CAATCAGATT CAAGCTCTTA TCGACAATGC TGTCAGACAG GCATTGTCGC 1260 + AACAGCAATC CCAATTTCAG ACACAACTCA ATTCCCTAGC TGCGCGGGTA CAGAGTTTGC 1320 + AGGTGGAAGC ACCGCAAATC AAGATTTACG AAAAAGTCTC TGTTAACCCC GATGTTAGGT 1380 + GCGACATTCC CCTTGACATA ATAAAGTCTG TACCAGAGTT CTCCGGTACC CAAGACGAGT 1440 + ATGTGGCCTG GAGACAATCG GCCATATACG CCTACGAGCT CTTCAAACCA TACAATGGCA 1500 + GCAGTGCCCA TTATCAGGCT GTTGCCATAT TAAGGAATAA AATCCGTGGC GCAGCCGGGG 1560 + CTTTACTGGT CTCCCACAAT ACGGTATTGA ACTTCGATGC TATTTTGGCC AGACTAGACT 1620 + GCACGTACTC GGACAAAACA TCCTTACGCC TGTTGAGGCA AGGATTGGAA ATGGTTAGGC 1680 + AAGGAGACCT ACCACTAATG CAATACTACG ATGAAGTTGA AAAGAAGCTA ACGCTTGTCA 1740 + CTAACAAAAT CGTAATGACG CATGAACAAG AGGGTGCTGA CCTGCTTAAC GCTGAGGTCA 1800 + GAGCCGACGC CCTGCATGCT TTTATTTCGG GGCTCAAAAA GGCCCTCAGA GCTGTGGTCT 1860 + TCCCGGCCCA ACCAAAAGAC CTGCCATCTG CACTGGCTTT AGCTAGAGAA GCAGAGGCAA 1920 + GCATAGAGAG AAGCATGTTC GCTAACTCCT ACGCCAAGGC CGTAGAGGAG CGAGCGCATT 1980 + CGGGGGCAAA CGGCAAGAGC CGTTTCCAGG GGAAGCCAAA TAAAGAAGAA CAGGGACAGG 2040 + ACAGGAATCC CCACTTCACC AAACGCCCCA AAAATAACGG ACAAACCAAC AAGGACACTC 2100 + AGGCGCAAGC ACCCCAGCCA ATGGAGGTCG ATTCATCCTC CAGGTTTAGG CAGCGTACTG 2160 + AACATTATCA GAATCATCCT AACGAGTCGA ACGCGTTTAA GAGGAGAAAT TCCTCAGAAC 2220 + GCTCAACAGG ACCGAGACGA CAACGTCTGA ATAACGTTGT CCAAGAGGCC CCTAAACAAA 2280 + AGGACCCCAA AGAAGAGTAT GAAAAAACAG CAAAGGCTGC AGTCGAGGAA ATCGACAGCG 2340 + AAAATGAGTA CGCTCCCAGT GACGACTCGT TGAATTTTTT AGGGGGCGCT CCCGGTTGCC 2400 + GTTCATTGAA CGACGGCTGG CTGGGAGAAC CTTAAAGATG CTAATCGATA CCGACGCGGC 2460 + AAAAAACTAC ATTAGGCCCG TAAAGGAGCT GAAAAATGTA ATGCCGGTCG CCAGCCCTTT 2520 + CTCGGTGAGC TCAATACACG GCTCCACCGA AATCAAACAC AAATGCTTGA TGAAAGTCTT 2580 + CAAGCACATC TCCCCATTTT TTCTTTTGGA TTCTCTCAAT GCGTTCGACG CTATCATAGG 2640 + CTTGGACCTG TTAACACAGG CCGGGGTAAA ACTCAACCTT GCAGAGGACT CCTTAGAATA 2700 + CCAGGGCATC GCTGAAAAGC TTCATTATTT CAGCTGCCCC AGTGTAAATT TCACTGATGT 2760 + AAACGATATT GTTGTACCTG ACTCCGTTAA AAAGGAGTTC AAGGACACAA TAATAAGGAG 2820 + GAAGAAAGCT TTCTCCACAA CAAATGAAGC TCTTCCTTTT AACACCGCTG TCACTGCCAC 2880 + AATTCGGACA GTTGACAATG AACCGGTGTA CTCAAGAGCG TACCCAACTC TTATGGGTGT 2940 + CTCCGACTTT GTGAACAACG AGGTCAAACA ACTGCTGAAA GACGGCATTA TCAGGCCCTC 3000 + AAGGTCTCCC TATAACAGCC CGACCTGGGT TGTTGACAAA AAGGGGACCG ACGCCTTCGG 3060 + GAACCCAAAC AAGAGGTTGG TCATTGACTT CAGGAAGCTA AATGAGAAAA CTATTCCTGA 3120 + CCGGTACCCG ATGCCTAGCA TTCCCATGAT TCTAGCGAAT CTGGGCAAGG CAAAGTTCTT 3180 + CACTACCCTT GATCTTAAGT CAGGGTATCA TCAAATTTAC CTCGCGGAAC ACGACCGCGA 3240 + GAAGACATCG TTCTCGGTGA ATGGTGGTAA ATACGAGTTT TGCCGTCTAC CGTTCGGCTT 3300 + GAGAAATGCA AGCAGCATTT TTCAAAGAGC CCTAGACGAT GTGCTTAGAG AGCAAATCGG 3360 + GAAGATATGT TACGTCTATG TAGATGACGT CATAATTTTC TCTGAAAACG AGTCCGACCA 3420 + TGTCCGCCAC ATCGATACAG TACTAAAATG CCTGATCGAT GCCAACATGA GAGTAAGCCA 3480 + GGAGAAAACT AGATTCTTTA AAGAGAGTGT AGAATACCTC GGCTTTATTG TCAGTAAGGA 3540 + CGGAACTAAA TCCGATCCAG AGAAGGTGAA GGCCATTCAG GAGTACCCTG AACCAGACTG 3600 + CGTTTACAAG GTTAGGTCCT TCCTTGGTTT AGCCAGCTAC TACAGAGTCT TCATCAAAGA 3660 + CTTTGCTGCC ATAGCCCGCC CGATCACCGA TATCCTAAAA GGGGAAAATG GTTCGGTGAG 3720 + CAAACACATG TCTAAAAAAA TTCCTGTTGA GTTTAATGAA ACTCAACGCA ACGCGTTCCA 3780 + AAGACTGCGA AACATACTAG CATCCGAGGA TGTCATACTC AAATACCCCG ACTTTAAAAA 3840 + GCCTTTTGAC CTTACTACAG ATGCTTCGGC AAGTGGTATC GGTGCAGTCC TATCCCAGGA 3900 + GGGCAGGCCA ATCACCATGA TATCGCGTAC CCTTAAACAG CCCGAGCAGA ACTACGCCAC 3960 + AAACGAAAGG GAATTGCTGG CGATTGTATG GGCCCTAGGT AAGTTGCAGA ACTTCCTGTA 4020 + TGGCTCTAGG GAGATTAATA TATTTACCGA CCATCAACCC CTCACTTTCG CTGTTGCCGA 4080 + CAGGAACACG AATGCCAAGA TAAAGAGGTG GAAATCTTAC ATAGACCAGC ATAATGCCAA 4140 + GGTTTTCTAC AAACCTGGCA AAGAAAATTT CGTGGCAGAC GCCCTCTCTA GGCAGAATCT 4200 + GAATGCCTTA CAAAACGAAC CCCAATCAGA CGCTGCGACC ATTCACAGTG AGCTCTCCCT 4260 + GACCTACACG GTCGAGACAA CAGACAAACC GTTAAATTGC TTCAGGAACC AGATCATTCT 4320 + GGAGGCAGCA CGTTTTCCGC TCAAACGAAA CCTGGTGCTC TTTCGAAGCA AATCTCGCCA 4380 + CTTAATCAGC TTTACTGATA AAAGTTGGCT ATTAAAAACA CTTAAGGAGG TGGTAAACCC 4440 + TGACGTCGTG AACGCTATTC ACTGCGACCT GCCCACTCTG GCAAGCTTCC AACACGACCT 4500 + CATTGCCCAC TTTCCAGCCA CCCAATTTCG TCACTGTAAG AATGTCGTGT TAGACATAAC 4560 + CGACAAAAAC GAACAGATCG AAATCGTCAC TGCCGAGCAC AACCGCGCTC ACAGAGCCGC 4620 + ACAAGAAAAC ATTAAACAAG TCCTTCGGGA TTATTACTTT CCCAAAATGG GCAGTTTAGC 4680 + TAAAGAAGTA GTAGCTAATT GTAGGGTCTG CACCCAAGCA AAGTATGACA GGCACCCGAA 4740 + AAAGCAAGAG CTCGGGGAAA CGCCCATACC CAGCTATACA GGTGAGATGG TGCATATTGA 4800 + CATATTCTCA ACCGACAGGA AGCTATTCCT GACGTGTATT GACAAATTTT CTAAATATGC 4860 + AATAGTGCAA CCAGTGGTGT CTAGAACAAT AGTGGACATC ACAGCACCCC TGTTGCAGAT 4920 + CATTAACCTG TTCCCCAATA TCAAAACGGT CTATTGTGAC AATGAGCCCG CATTTAACTC 4980 + AGAAACTGTC ACCTCAATGC TCAAGAACAG CTTCGGCATT GACATAGTAA ATGCGCCCCC 5040 + ACTCCACAGC TCATCCAATG GCCAAGTTGA ACGGTTCCAC AGCACATTGG CAGAAATCGC 5100 + CAGGTGCCTG AAGTTGGACA AAAAAACGAA TGACACAGTA GAACTAATCT TGAGGGCGAC 5160 + GATAGAATAT AACAAAACCG TGCACTCAGT TACTCGTGAG AGACCAATTG AGGTGGTTCA 5220 + CCCAGGGGCC CACGAGCGCT GCCTAGAAAT CAAGGCAAGA TTAGTAAAGG CTCAGCAAGA 5280 + CAGCATCGGA AGAAACAACC CTTCCCGACA AAACCGCGTG TTTGAGGTGG GAGAACGCGT 5340 + GTTTGTAAAA AACAACAAGA GGTTAGGAAA TAAGCTAACT CCACTATGCA CCGAGCAAAA 5400 + AGTGCAGGCA GACTTGGGAA CGTCTGTTCT TATTAAGGGG AGGGTGGTCC ACAAGGACAA 5460 + CCTCAAGTAG ACATTCCCTC TACAGTTAGG TAGTAAGTTA TGTCAAGGAA AATCCGAGCA 5520 + CTGTAGTATC ACCTTGTCTT TAATTTCCAG GTTCACCCTC ATGATGTTCA TACCCTTGGT 5580 + AGTAGCGAAT GCTCGGATCA CCGACTTTTC GCATGCCAAC TACATTCCTG TGTTAGATGG 5640 + GGATGTGCTG GTGTTTGAAC AGCGTGACCT CTTGAAACAT TCGAGTAACC TTTCCGAGTA 5700 + CGCTAGTATG ATAGATGAAA CACAGAAACT GTCCGAGTCC TTTCCCCACT CACATATGCG 5760 + TAAGTTGCTA GAGGTCGATA CTGACCATCT TAGAACCTTG TTGTCCGTTC TCAAAGTCCA 5820 + CCATAGGATA GCTAGGAGTC TAGATTTCTT AGGTACAGCC TTAAAGGTTG TGGCGGGTAC 5880 + TCCCGATGCC ACGGACCTCT TTAAAATTAA GATCACAGAG GCCCAACTAG TAGAATCTAA 5940 + TTCCAGGCAG ATAGCTATAA ACTCCGAAAC CCAGAAACAG ATAAATAAGT TAACTGACAC 6000 + CATCAATAAG GTGATCAATG CCCGTAAAGG CGACTTGGTT GACACTCCAC ACTTATATGA 6060 + AGCACTACTA GCAAGAAATA GGATGCTGTC TACAGAAATT CAAAATTTAA TTCTCACTAT 6120 + TACTTTGGTC AAATCAAACA TTATAAATCC CACAATTCTT GATCATGCCG ACTTGAAGCC 6180 + TCTTGTAGAA CAGGATACCC CAATTGTCAG CTTAATAGAA GCATCTAAGA TCAGGGTCCT 6240 + CCAGTCCGAG AATAGCATTC ATATTTTAAT TGCCTATCCT AGAGTCAAGT TCAGTTGCAA 6300 + GAAAGTCGCC GTCTACCCTG TATCTCACCA ACACACCATC TTGCGCCTCG ACGAAGACAC 6360 + TTTGGCCGAA TGCGAACATG ACACCTTTGC GGTCACCGGA TGCACAGACA CCACACACTT 6420 + CACGTTCTGC GAGCGGTCTC GGCGCGAAAC TTGCGTGCGC TCACTCCATG CTGGAAACGC 6480 + TGCTCAATGC CACACTCAAC CCAGCCACTT GCGAGAAATA AACCCCGTAG ATGATGGCGT 6540 + TGTGATTATC AACGAAGCCG CAGCTCACGT TAGCACTGAT GGCAGCCCCG AAACACTGAT 6600 + AGAGGGAACC TACCTGGTAA CCTTCGAGCG AACGGCAACC ATCAACGGCT CTGAATTCGT 6660 + AAATCTAAGG AAAACACTAA GCAAGCAGCC AGGCATCGTG CGTTCACCAC TACTTAACAT 6720 + CGTCGGCCAC GACCCTGTGC TCAGTATACC TCTGCTACAC CGGATGAGTA ACGAAAACCT 6780 + ACATTCCATC CAAAACCTTA TGGATGACGT GGAATCTGAA GGCTCGCCCA GACTCTGGTT 6840 + CGTGGCTGGT GTGGTCCTAA ACTTCGGCTT GATTGGCTCT CTCGCCCTTT ATCTGGCATT 6900 + AAGGAGAAGA CGAGCCTCTA GGGAGATACA GCGCACCATC GATACTTTCA ACATGACCGA 6960 + GGACGGTCAT AAACTTGAGG GGGGAGTAGT TAACAACTAA CAATGTATTG CTTCGTAGCA 7020 + ACTAAGTAGC TTTGTATGAA CAATGCTGAC GCGCCAGAAT TGGGTTCAAC GCTCCACGCG 7080 + AAGAATGCCT GGCAGCGGAA AGCTGACACT TCCTACCGGG AGTGTTGCTT CACGCTGCAA 7140 + GAAATGCTGA GTCGGCTTGC CGACTTGTGG CGGCGCGATG CATTGCTCGA GGGTAAACTT 7200 + AGTTTTCAAT ATTGTCTTCT ACTCAGTTCA AATCTTGTGT CGAAATAAAC CACAGCTTGC 7260 + TCCGGCTCAT TGCCGTTAAA CATCATTGTT CTTATTTACA ATCAAATCGC TATCGCCACA 7320 + AGGCTAGTGA TAATAACTAA GGGGGCGAAG TCAAGCCCTC CAACCTAATC TCCATAAACA 7380 + GTGTCTAAGA CGAACCTCAG CGAAAGAAGG AAGATCTCTA GACCTACTGG AAATAACATA 7440 + ACTCTGGACC TATTGGAACT TATATAATT 7469 +// +ID DMHFL1 standard; DNA; INV; 2959 BP. +XX +AC M69216; +XX +DR FLYBASE; FBte0000154; Dmel\hobo. +XX +SY synonym: H-element +XX +XX +FT source M69216:1..2959 +FT SO_feature terminal_inverted_repeat ; SO:0000481:1..12 +FT SO_feature terminal_inverted_repeat ; SO:0000481:2948..2959 +FT SO_feature TATA_box ; SO:0000174:107..112 +FT SO_feature polyA_signal_sequence ; SO:0000551:2382..2394 +FT SO_feature CDS ; SO:0000316:316..2292 +FT SO_feature start_codon ; SO:0000318:1..3 +FT /name="Dmel\hobo\T" +FT /db_xref="FLYBASE:FBgn0014191" +FT /translation=" +FT MAPYIMIVEFLCLWSSVSAVNCPFFVFYDAITSLLGFSIIWKPKEKVTIM +FT AEAADFVKNKINNGTYSVANKHKGKSVIWSILCDILKEDETVLDGWLFCR +FT QCQKVLKFLHKNTSNLSRHKCCLTLRRPTELKIVSENDKKVAIEKCTQWV +FT VQDCRPFSAVTGAGFKNLVKFFLQIGAIYGEQVDVDDLLPDPTTLSRKAK +FT SDAEEKRSLISSEIKKAVDSGRASATVDMWTDQYVQRNFLGITFHYEKEF +FT KLCDMILGLKSMNFQKSTAENILMKIKGLFSEFNVENIDNVKFVTDRGAN +FT IKKALEGNTRLNCSSHLLSNVLEKSFNEANELKKIVKSCKKIVKYCKKSN +FT LQHTLETTLKSACPTRWNSNYKMMKSILDNWRSVDKILGEADIHVDFNKS +FT SLKVVVDILGDFERIFKKLQTSSSPSICFVLPSISKILELCEPNILDLSA +FT AALLKERILENIRKIWMANLSIWHKAAFFLYPPAAHLQEEDILEIKVFCI +FT SQIQVPISYTLSLESTETPRTPETPETPESLESPNLFPKKNKTISSENEF +FT FFPKLVTESNSNFNESPLDEIERYIRQRVPLSQNFEVIEWWKNNANLYPQ +FT LSKLALKLLSIPASSAAAERVFSLAGNIITEKRNRLCPKSVDSLLFLHSY +FT YKNLNNSQ" +XX +CC Derived from M69216 (g157606) (Rel. 41, Last updated, Version 3). +CC Takis Benos and Michael Ashburner, 20-Aug-1997. +CC Any changes to original sequence record are annotated in an FT line. +CC CDS annotation from Lynn Crosby's annotation 'H-element.v004'. +XX +SQ Sequence 2959 BP; 994 A; 541 C; 571 G; 853 T; 0 other; + CAGAGAACTG CAAGGGTGGC ACTTTTTTAC CACTCGACTC ACACCCTACA ATTTTGTGTG 60 + CGGGTGCTAC TCGCCACGCA CATCGCGGGT ACTTACAAAC ACACAGTATA AATCTGAACA 120 + TGCAGACAAG ACACCCCGTT GTGTGCGCAC CCGAATCAAT ACGGTGTTTT GCGTCGCGGG 180 + TGCCGCTCAC ACAGTGCCTA AAAAGGGATG AGTGAGAAAA ACACTTGTGG GTATACCGTT 240 + AAACACATGG GTGTTTCCAA AAATACTCGG GTGTTTCCAA AAATACTCGA GTGGTCTCGT 300 + AGGTAGTCGA GTCAAATGGC GCCATACATA ATGATTGTTG AGTTCTTGTG TCTTTGGTCC 360 + AGTGTCTCGG CTGTTAATTG CCCCTTTTTT GTTTTTTACG ATGCAATTAC TAGCTTGTTA 420 + GGATTCAGTA TTATTTGGAA GCCAAAGGAA AAGGTCACAA TAATGGCAGA AGCGGCTGAT 480 + TTCGTTAAAA ATAAAATTAA CAATGGAACA TACTCAGTTG CCAATAAACA TAAAGGAAAA 540 + AGTGTTATTT GGAGCATTTT ATGTGACATT TTAAAGGAAG ATGAAACTGT TCTGGACGGA 600 + TGGCTGTTCT GCAGGCAATG CCAGAAAGTG CTCAAATTTT TACACAAAAA CACCTCCAAT 660 + TTATCCCGCC ATAAATGTTG TCTAACATTA AGACGACCAA CGGAATTAAA AATTGTTTCG 720 + GAAAACGACA AGAAAGTAGC TATTGAAAAA TGCACCCAAT GGGTTGTCCA AGATTGTCGG 780 + CCGTTTTCTG CAGTAACCGG AGCCGGATTT AAAAATTTGG TGAAGTTTTT CCTACAAATC 840 + GGCGCTATCT ATGGGGAACA GGTAGACGTC GATGACTTAC TACCTGATCC AACAACATTA 900 + AGTCGGAAGG CCAAATCGGA TGCAGAAGAG AAGAGGAGTC TAATCTCGTC CGAGATAAAA 960 + AAAGCTGTGG ATAGCGGAAG AGCAAGTGCG ACCGTCGACA TGTGGACTGA CCAGTATGTC 1020 + CAAAGAAACT TTTTGGGCAT CACTTTCCAT TACGAAAAAG AATTTAAACT TTGTGACATG 1080 + ATTTTGGGAC TAAAATCGAT GAATTTTCAA AAATCGACTG CCGAAAACAT TTTAATGAAA 1140 + ATTAAAGGTT TATTTTCGGA ATTCAATGTT GAGAACATTG ATAATGTTAA GTTTGTGACT 1200 + GACAGGGGAG CAAATATAAA AAAGGCTTTA GAGGGCAATA CCCGTTTAAA TTGTAGCAGT 1260 + CACCTGTTGT CAAATGTTTT AGAAAAATCG TTTAACGAGG CCAATGAACT CAAAAAAATT 1320 + GTGAAATCAT GCAAAAAAAT CGTGAAGTAC TGCAAAAAAT CAAATTTGCA GCATACTCTA 1380 + GAAACCACTT TGAAAAGCGC CTGTCCGACT AGATGGAACT CCAACTACAA AATGATGAAG 1440 + TCCATTCTGG ATAACTGGCG TAGTGTGGAT AAAATATTAG GTGAAGCTGA TATCCATGTA 1500 + GATTTTAATA AATCATCTTT AAAAGTTGTG GTAGATATTC TAGGAGACTT TGAACGAATA 1560 + TTTAAGAAGT TGCAAACATC TAGCTCACCA TCTATATGCT TCGTATTGCC ATCCATCTCT 1620 + AAAATTTTAG AATTATGCGA GCCGAATATT TTAGACCTTT CTGCAGCAGC ATTGCTTAAG 1680 + GAAAGAATTT TGGAAAATAT TCGTAAGATT TGGATGGCAA ATCTAAGCAT ATGGCATAAG 1740 + GCGGCATTTT TTTTATATCC ACCCGCAGCA CATCTTCAGG AAGAAGATAT TCTTGAAATA 1800 + AAGGTGTTTT GCATTTCACA AATTCAAGTC CCAATTTCAT ACACATTAAG CTTAGAATCT 1860 + ACAGAAACTC CAAGAACTCC AGAAACTCCA GAAACTCCAG AAAGTCTAGA AAGTCCAAAC 1920 + TTATTTCCAA AAAAAAACAA AACAATATCT TCTGAAAACG AATTCTTCTT CCCAAAGTTA 1980 + GTAACTGAGT CTAATTCCAA CTTCAATGAA TCTCCATTAG ATGAAATTGA ACGATATATT 2040 + AGACAAAGAG TTCCATTGTC TCAAAATTTT GAAGTAATTG AGTGGTGGAA AAATAACGCA 2100 + AACTTATACC CTCAGTTGTC AAAGTTAGCA TTAAAACTTT TATCAATACC AGCCAGTAGC 2160 + GCAGCAGCTG AAAGAGTGTT TTCCCTAGCA GGTAATATAA TAACAGAAAA GCGAAATAGA 2220 + TTATGCCCAA AATCTGTAGA TAGCCTCCTT TTTTTGCATT CCTATTACAA AAACCTAAAC 2280 + AACTCGCAAT AGATATTCCT TCTTATAAGT ATATTTTATA TTATTAATTC TTATTATTTG 2340 + CTTAATTTTT GTATAAGTGT TAAGTATTAA GTATAAGTAT TAATTAATAA TATATAAGAT 2400 + TGTTATTTGT TAAGACATTA GATGCAAAAT CCTAAAAATG TGAAAGTAAT GAAGTTCCTT 2460 + ATATTTAATA GATACTTTTT AAGCCCACTA TGTTTTTATT ATTTAGATTG AGACATTAAA 2520 + AAACGTAAAA ATCAACAAAT GCCGTCTTTA ATTGCAATTA CTTTATGTGT TTGAAATGGG 2580 + AGGCACCCAT TGAGTCCATC AAAGAGCAAA GACATGAGCA CAAAAATTTT CTTGGGTATT 2640 + CCCTTTTACC CTTCATTTCT TATACCCGTC ACGCTTCCAC CCATACAAAT TTTAGGCGTA 2700 + CAAAAAATGA CCAGAGAACT GCAGCCCGCA TACAAAAAAT GACCTGCGGC CGATCGTTGA 2760 + CTGTGCGTCC ACTCACCCAT ACGGCTCTTG CGCAGCAGGC CTCGGGTGGT TTTTTTACTC 2820 + GTAACAAAAA CACAACGTCG GTAAAACACT CGAGTATTTT GTGTTGCCGC AAGTAGGGTG 2880 + TCAAAAAAAA CGGGGTGCCT AGAGTACCGA GTGTTTATCG GGTGGACGTA GAGTGCGAGT 2940 + GGCGGGCTGC AGTTCTCTG 2959 +// +ID DMTHB1 standard; DNA; INV; 1653 BP. +XX +AC X01748; +XX +DR FLYBASE; FBte0000414; Dmel\HB. +XX +FT source X01748:189..1841 +FT SO_feature terminal_inverted_repeat ; SO:0000481:1..31 +FT SO_feature terminal_inverted_repeat ; SO:0000481:1622..1653 +FT SO_feature CDS ; SO:0000316:387..534 +FT /name="Dmel\HB\T" +FT /db_xref="FLYBASE:FBgn0044055" +FT /db_xref="SPTREMBL:Q27293" +FT /db_xref="NCBI_PROTEIN:CAA25884.1" +FT /translation="MLILKLRKEGKTYKDIQKTLKCSAKMVSNAIKYKWKPENRGTKHK +FT TTDIEDRRIVSYSKVYRFASFRDIKSELNLGISDVTIRRRLLNQNFSARSPRKVPLPSP +FT RHIKARLSLAKTYLNWPVSKWRNILWTDGSKIMLFGGTGSLQYI" +XX +CC Derived from X01748 (g8693) (Rel. 49, Last updated, Version 3). +CC Takis Benos and Michael Ashburner, 20-Aug-1997. +CC Any changes to original sequence record are annotated in an FT line. +XX +SQ Sequence 1653 BP; 568 A; 288 C; 302 G; 495 T; 0 other; + ATGTACAGCT GTGTTCAGAA AAATAGCAGT GCGAAGGAAA CTAAGTAATA CAAAGGTATT 60 + TTTCCATGTC CCTTTTCGGA ATCGACTTTT TATTCCTCTT ATTTTTGTTA AATGGAATGT 120 + GTAGATAGGG AAAAAAAGAA AATCCGGTCA GTTTTTCTTG TTATCCTTTT TTTATTTACA 180 + TTCTTGAGCA AAATCACAAT TTTTAGGCTG TTCATAAGAA TAGCAGTGTC TGGTTCTGAC 240 + CAACGTAAAG TCCCGAAATG ATCAATATTT TCTAAAAAGT GAGTTTGGTT AAGTTAATTC 300 + GTATATTTAA AAGGACAATA AATTAAAAAA ATTAAAAAAA TTTTATTTTA GTGGGTAGAG 360 + GACAGCACTA CTCCCAGGGG AAAAGAATGT TAATTCTTAA GCTTAGAAAG GAAGGAAAAA 420 + CATATAAGGA CATTCAAAAA ACCCTTAAAT GTTCTGCCAA AATGGTATCC AATGCCATTA 480 + AATATAAATG GAAGCCCGAA AACCGTGGTA CCAAACATAA AACCACAGAT ATAGAGGATC 540 + GACGCATTGT TTCTTACAGC AAAGTCTATC GTTTTGCATC CTTTAGGGAC ATAAAGTCTG 600 + AGCTGAACTT GGGAATCAGC GACGTTACTA TTCGTAGACG ACTACTGAAT CAAAATTTCA 660 + GTGCGAGGAG TCCACGAAAG GTTCCCCTAC CTAGCCCAAG GCATATTAAG GCAAGGTTAA 720 + GCTTAGCTAA AACCTACCTA AACTGGCCAG TCTCCAAATG GCGTAATATC CTTTGGACTG 780 + ATGGGTCAAA AATCATGCTA TTTGGTGGAA CTGGTTCACT ACAGTATATC TGACGACCTC 840 + CAAACACGGA GTATCACCCA AAACACCCAG TGAAGACTTT CAATCACGGT GGACCTAAAA 900 + TCATGGTATG GGCTTGTTTT TTTTATAATG GTATGAGTCA TGCTATGGAT TATGATTTAT 960 + GGTATTATAG ACCAAAACGC ATATGTAAAT ATACTTAGTG ATGTCTTATT GTCATATTCT 1020 + GAATAAAATA TACCCTTAAA ATGGACATTC CAACAGGATA ATGATCAGAA ACGCAGATGT 1080 + AAATCGGCTA AGAATAGGTT CACCCAAAAT AGAATAGATG CAATGCCGTG GCAAGCACCA 1140 + CCTTCCCATT TAAACCCGAT TGAAAACCTG TATGGGGACA TTAAACAGTT TGTGTCGAAG 1200 + AAGTCCCCGA CGTCTAAGAC TCAGATTTGG CAAGTTGTGC AGGATACATG GGCAAAAATT 1260 + CCTCCCAAAC CTTGCTAGGA CTTGGTGGAC TTCATGCCGC GTGGGTGTAA GGCTGTGCTG 1320 + GCTAACAAAG GCTATCCAGC CAAGTATTAG GCCCGAATTA ACATATTAAA AAGAAAAACT 1380 + AAGTTCGTTC TAGGTCAAGT TAAATTTTGT TACTATTTTT TCATAGCACT GCTATTTTAT 1440 + TGAACACCAG AATTTCTGCC TATTTATTGT TTTAATCTAT ATTTTCGAAA CTATTGAAGA 1500 + AATAAAAGTG AAACATTTGT TAAATTGTTT GAAATGAAAT ACCTAATGAT ATTATTAAAA 1560 + AAAAATTCCC ATTAAAACTG TAAATCATAG GAATTTTTTA TCTTAAACTC TGAAGTCCAA 1620 + AGCACTGCTA TTATTCTGAA CACAGCTGTA CAT 1653 +// +ID DM06920 standard; DNA; INV; 6083 BP. +XX +AC U06920; +XX +DR FLYBASE; FBte0000143; Dmel\HeT-A. +XX +FT source U06920:1015..7097 +FT SO_feature five_prime_UTR ; SO:0000204:1..731 +FT SO_feature three_prime_UTR ; SO:0000205:3497..6083 +FT SO_feature polyA_sequence ; SO:0000610:6077..6083 +FT SO_feature CDS ; SO:0000316:732..3497 +FT SO_feature start_codon ; SO:0000318:1..3 +FT /name="Dmel\HeT-A\gag" +FT /db_xref="FLYBASE:FBgn0016662" +FT /db_xref="REMTREMBL:AAC17188" +FT /db_xref="NCBI_PROTEIN:AAC17188.3" +FT /translation="MSMSDNLFSDDEVLSISSSPEQRSSPFYLNISPMSHGSDNSQINT +FT VIINSKKLPSNQADISLKNSSGAAIKIVNSLSHKKKENTNVNNAQKDPLSLTNTTASTC +FT GAKSSISEGKLSSPPSTSHTYEGKLLTKLTHTHTDFRGAKTSDAMGSFPSLSHSDNSIE +FT KNLSSSTKIGPNASSPPSHAHTHTSKSTDISLESRSKHPALANTDARSIKANANDNGEI +FT FSSLIQIDERKQEERPCTTINAFWSIFKPKPDVTKLSLKRKPTNPTKNTGKKCISPHKK +FT SAYLCPSAQDDLNLNLNPKSSAKPTVVNLPAARILSRPAAKRDLFKSSSSRSPDEQPMS +FT FSEVVAGTGSIFAAPCVPAPLTKTPGKRTNDDLDCSNFKTPNKKLCATSNFVTPSIFPP +FT LITPVFKSKAAQSVYEESKARNGPPPPALACSINASARSAAAPPGIAPLPPHNTDAELP +FT PWKIVPQSRRAPPILVNDVKEIVPLLEKLNYTAGVSSYTTRAIEGNGVRIQAKDMTAYN +FT KIKEVLVANGLPLFTNQPKSERGFRVIIRHLHHSTPCSWIVEELLKLGFQARFVRNMTN +FT PATGGPMRMFEVEIVMAKDGSHDKILSLKQIGGQRVDIERKNRTREPVQCYRCQGFRHA +FT KNSCMRPPRCMKCAGEHLSSCCTKPRTTPATCVNCSGQHISAYKGCPAYKAEKQKLAAN +FT NVDINKIRTIKDATNNFYKRQGPPLRNNTPRLPHSSAILSKSIAEARQEAARKSMLNPF +FT RQNINDRRPRFSSHDTAIQKRLNKWRRNTNKIPKKGRIALKDNAKPRPAHRTSNPAQRH +FT LEDYQDMLRRERSEENDQESEKGTPNTKQVGNDSPPTTSRAARASFKPRIIDDTTPSPK +FT ICNPNSQKGLLDDPTTSLANRVDNLEKKIDILMALIIQGRNNNLDMDTSN" +XX +CC Derived from U06920.2 (Rel. 67, Last updated, Version 14). +CC Michael Ashburner, 26-Jan-2002. +CC Any changes to original sequence record are annotated in an FT line. +XX +SQ Sequence 6083 BP; 2199 A; 1545 C; 1033 G; 1306 T; 0 other; + TAAATAAATA AAATAAATTA AACAATTAAC TAAATAATTA AATAACTAAA ATTAATAATA 60 + TAATCCGTTC GCTTGCCAAA GACTCTCACG CGCATAACTA ATTAAAATCG ATTTTCAAGT 120 + TGACAAATAA ATGGTTTAAA ATTGTCCTCA GGCTGCAAAG AAAAGCCGCG GCAACAATAA 180 + ACATTTAGTG ACACGCGAAA AGCGAACATT TGATTAGTGT AATACTTGTG CAAACCGACA 240 + AGCTGCCGCC ATAACAAAAC GGAGACGAAG AATCATAAAG AACAAAAGCT AAATCCACCA 300 + GCATAGCAAA AATAAATTAA CAAATAAAAT AAAAGCAAAT TTAAATAACA TAATAAATTA 360 + AACTTATTTA ATAAACCAAT TAATTTTAAT TAATTCAATT AAACGCTAAA TCTACATAAT 420 + ACTCCACGCG CAAATTAATT GAAATCGTCT TTCTAGTTAA TAAATTAAAA GTTTAAAAAT 480 + TGTCTCCGGC CGCAAAATTT GAACCGCGAC GATAAAAACA TTTAATTGAC AAACAAAAAG 540 + CGAACAATTA TTCAGTGAAC TATTTGTGCA AAATTGACAA GCAGACGCCA TAATTAAAAG 600 + GAGAAGAAGC CAAAAGACGA AGAGAAGAAA GCAACCAGAA GAACTCAAAG AAGAAAAGGA 660 + GGAAAGCCCA ATTAAAGAAA GCCAGGGTAT TTATACCTTA CACTTATCGT TTAATATAAC 720 + AAAAACCCAA CATGTCCATG TCCGACAACC TTTTTTCTGA CGATGAGGTA CTTTCAATTT 780 + CCTCAAGCCC AGAACAGCGA TCTTCTCCGT TCTACCTCAA TATATCGCCC ATGTCCCACG 840 + GATCAGACAA TTCTCAGATT AATACAGTCA TCATTAATTC GAAGAAATTG CCCTCAAATC 900 + AAGCAGACAT AAGTTTAAAA AACTCTTCTG GGGCTGCTAT AAAAATTGTT AATTCCCTTT 960 + CACACAAGAA GAAAGAGAAC ACAAACGTTA ATAATGCCCA AAAAGACCCC CTCTCACTCA 1020 + CCAATACTAC TGCAAGCACT TGTGGCGCCA AAAGCAGCAT CTCAGAGGGG AAATTGTCTT 1080 + CTCCTCCGTC CACCTCACAC ACATATGAGG GGAAATTACT CACAAAACTT ACTCACACAC 1140 + ACACAGACTT TAGAGGCGCC AAAACGAGCG ATGCAATGGG AAGTTTCCCC TCTCTCTCGC 1200 + ACAGCGACAA TAGCATAGAG AAAAATCTGA GTTCTTCCAC CAAAATTGGA CCAAACGCTT 1260 + CTTCCCCTCC TTCTCATGCA CACACTCACA CTAGCAAATC CACTGATATA AGCTTAGAAA 1320 + GCCGCTCAAA ACATCCCGCG CTTGCCAATA CGGACGCACG CTCTATAAAA GCCAATGCTA 1380 + ATGACAATGG GGAAATTTTC TCCTCACTTA TACAAATTGA CGAACGCAAG CAAGAGGAAA 1440 + GGCCTTGCAC AACTATCAAC GCTTTTTGGT CTATTTTTAA ACCCAAGCCG GACGTTACTA 1500 + AACTAAGTCT AAAGAGGAAA CCCACCAATC CCACTAAAAA CACTGGGAAA AAATGCATCT 1560 + CCCCTCATAA AAAGAGCGCT TATTTATGCC CTTCCGCTCA GGATGATTTA AATTTAAATT 1620 + TAAACCCCAA ATCTAGCGCC AAGCCCACTG TGGTGAATTT ACCAGCTGCC CGCATCCTAA 1680 + GCCGGCCTGC AGCCAAGCGG GATTTATTTA AATCATCATC CTCCCGAAGC CCAGACGAGC 1740 + AGCCTATGAG TTTTTCGGAA GTGGTCGCTG GCACGGGTTC AATTTTTGCG GCACCCTGTG 1800 + TCCCGGCACC TTTAACGAAA ACTCCAGGCA AGCGGACAAA CGACGATCTG GACTGCTCCA 1860 + ACTTTAAGAC GCCCAATAAA AAATTATGCG CGACTTCCAA CTTTGTAACT CCCAGCATTT 1920 + TTCCGCCGCT CATCACTCCC GTTTTCAAGA GCAAGGCAGC TCAATCTGTT TACGAGGAAT 1980 + CCAAAGCCAG AAATGGACCC CCCCCGCCGG CCCTCGCCTG CAGCATCAAT GCCTCTGCTC 2040 + GCAGCGCAGC GGCGCCACCC GGGATCGCCC CCCTACCCCC TCATAATACA GATGCAGAGC 2100 + TGCCTCCATG GAAAATCGTG CCCCAGAGCC GTAGAGCACC TCCTATACTC GTCAATGATG 2160 + TAAAGGAAAT TGTACCTCTA CTGGAAAAGC TGAACTACAC AGCAGGAGTC TCCAGCTATA 2220 + CTACTAGGGC TATAGAAGGA AACGGGGTCA GGATACAGGC AAAGGACATG ACCGCCTATA 2280 + ACAAAATTAA AGAAGTCCTG GTGGCCAACG GACTTCCTTT ATTCACCAAC CAGCCCAAGT 2340 + CCGAGAGAGG CTTCCGAGTC ATCATCAGAC ATCTCCACCA CTCCACACCA TGCTCGTGGA 2400 + TAGTCGAGGA ACTGCTGAAG CTCGGATTCC AAGCGCGATT CGTCAGAAAT ATGACGAATC 2460 + CGGCTACAGG TGGCCCCATG CGAATGTTTG AAGTGGAGAT CGTCATGGCC AAAGACGGCA 2520 + GTCATGACAA AATACTCTCA CTCAAACAAA TCGGTGGGCA AAGGGTGGAC ATTGAAAGGA 2580 + AAAACAGGAC ACGGGAGCCA GTCCAGTGCT ACAGATGCCA AGGCTTCAGG CATGCCAAAA 2640 + ACTCTTGCAT GAGGCCGCCA AGATGCATGA AATGCGCTGG CGAACACCTG TCTTCCTGTT 2700 + GCACCAAACC AAGAACCACC CCCGCCACCT GCGTAAATTG CTCTGGGCAG CATATTAGCG 2760 + CGTACAAAGG ATGCCCTGCA TATAAGGCGG AAAAACAAAA GCTGGCGGCA AACAACGTTG 2820 + ACATAAACAA AATAAGAACA ATCAAAGACG CAACAAATAA CTTTTATAAA CGTCAAGGCC 2880 + CCCCTCTACG CAACAACACC CCTCGGCTAC CGCACAGCTC AGCAATCCTG AGCAAATCAA 2940 + TTGCCGAAGC TCGCCAGGAG GCAGCCAGAA AGTCGATGTT AAATCCATTC CGACAAAATA 3000 + TAAACGACAG AAGACCACGA TTCTCCTCCC ACGACACGGC CATTCAGAAG CGTCTGAATA 3060 + AATGGCGCCG AAACACCAAC AAAATACCCA AAAAGGGTAG GATAGCCTTA AAGGATAATG 3120 + CAAAGCCACG ACCGGCACAT AGGACAAGTA ACCCAGCGCA AAGACATCTG GAGGACTACC 3180 + AGGACATGCT CCGAAGGGAA AGGAGTGAAG AAAACGACCA GGAATCTGAG AAGGGCACCC 3240 + CCAATACCAA GCAGGTCGGC AATGACAGCC CTCCGACCAC GAGCAGAGCA GCCAGAGCCA 3300 + GCTTTAAGCC AAGAATCATT GACGATACCA CGCCATCGCC AAAAATCTGC AATCCCAACT 3360 + CACAAAAAGG CCTCTTGGAC GACCCCACAA CAAGCTTAGC TAATAGAGTC GACAATTTAG 3420 + AAAAGAAAAT TGACATTTTA ATGGCCTTAA TCATACAAGG AAGAAATAAC AATCTTGACA 3480 + TGGATACATC CAATTAATCT TACAACTACT TATATATTCT TTAATAAATA TATCCAATAG 3540 + AAAAGCGCAC GTCGGTCTGC TTTTAAAATC CTTCACCGTC ATCACCTTCC TCGACGGAGC 3600 + CTAATTTATT GGAAAAATAA ATCAATTATA TGTTGGCACA AAAATGTAAA CACACACTCA 3660 + CCTAAACGCA CCCGGACGAA CAAGCCTATG ACAACGCACT CCAGCTGATC TGTAAGAAAC 3720 + AAAAAATATG AATAGATAGA TCGATATGAA AAGGATATGT GCGGCAGAAA CATGATGAGC 3780 + AAAAGGCGAC TCGCTGCAGC AACTTATGCA CAACGTCACT TACCTGAAAT TTCTTGCCGT 3840 + ACGATCTCCT GTAGTATCCC TTATCACAGC TGCAATCTAC TTGCAATGCT GCACTGCAAT 3900 + AAACGTACTA CAAAAGCTGC ATACGTTTTG ATCAGGACAC CTCGTGCGGA CGTGCTAAAA 3960 + AAAATTTCCT TTCTGCTGCT CTTATTGACG CTAAAACCTT AAAACCTACA AACAAAACAA 4020 + TTAAATAATA ACAAATCAAA TAAGACAACC AAATAATACA CTTACCTCAT TGACTGCAGC 4080 + TAAATCGCTG ACCCACATTC AGTGCAGCCG ACAGCAGGAG ACGGGCCCGC AAAAGCAAAA 4140 + CAAAATCGCC AATTTTGCGA TTATAAACAC GAAAAATTGA CAATTTTGCG ATGCCGTCTC 4200 + CGCCTCCTGA TGCCACTGCA TTGACAAGCA TCACTAGCGA GGAGCTGACA CCACACCAAA 4260 + AAGCTGTAAA ATCCGTCCAC AAATTGTATA TTTTGCCTCA GTGTCGTATC TGCAATGTTT 4320 + TTCCGATAAC CTGTAAGGAA AGAAAAATTA ATAAGAAAAT TATACAAAAT TAATTAAGGA 4380 + CGACAGAAAA TAGCAAACCA GACAGGCAAA TTAACAGATA CAAATATGAG ACTCCATCCT 4440 + GCTGCCGACA CACAAGTAAA TCCTTCAACT CGACAACAGG AGACGGGCCT TGCAAAAGCA 4500 + AAACAAAATC GCCAACTTTT GCGATTATAA ATACAAAAAA TTGACAATTT TGCAACGCCG 4560 + TCTCCACCTC CTGTTGCCAC TGCATTAATA AGGATCACCA GCGCGGCGTG ACGCCACACT 4620 + AAAAGGCTGC AAAATCCGTC CACAAAATGT ATACTTTTCC TCAGTACAAT ACTTTCTAAT 4680 + GAACTTCCGC CAACCTGCAA TGAAAAGAAA AGAAATAGGT ATATAAAACA AAACAAACAA 4740 + AAGGACAACC TAAAATTAGC AAACCAGACA GGCATACTAG TAGATGCTAA TATGCAGCTC 4800 + CATCCTACTG ACGACAACCA CGCAACTCCT TTCTCCAAGA CCGCAAATAC TGAAACAAGG 4860 + AAGCACAAGC TAATACTGGG AATTATTTAT TTAAACAAAA ATACTTATCT AATTGCCAAT 4920 + TCGACGACTC CAAATCCGCG GCTAACCGGC GGCGATGGCC CATAAATAAA GGGCCTCCTA 4980 + ATTAATTACA AAATGTACCT GAAAAACATA AAATTAACGC AACTATAATT AACGCAATTA 5040 + ATAAATCAAA TAAATACAAG TATAATACTT ACCTCCAAGC AAACGTACCT GAAAAACAAA 5100 + ACCAAAAAAA AAATTAATGC AATAAATAAA TCAAATAAAT ACAAACATAA TACTTACCTC 5160 + CAATTTACCT CCCAGCCAAT CTACCTGAAA AACATAATCT AATACAATCT CAAAAACAAA 5220 + TAACAAATGT AATACTTACC AAATTTTAAT TTTGTATTCA TTTCCATGAC CCCAACGCTG 5280 + CAACTGTCCT CGGCAACAAT TCCTGTTCCG GCGGCTCCAT GCTGCCAATC CTGACGCACT 5340 + GGCCACAAGA CGCGGCGCTG CTGGCAATCT CTCGATGAAC AACCGATCTA CAATTTCCAT 5400 + GACGACTCCT CTGTCACGAT GAGACAGAAG ACACCACCAA CGCCAGCAGC TCCAAAACAA 5460 + TACAACAACG GCCGCGCGGA ACCCATCTTC AGAATTCCCT CTTCCTGACG ACCGGCGAAC 5520 + GAGTTCTGGA ATAAACAATG TATTAATTGC AAACATCTAC CGATGAGGGT AGAAGAGATA 5580 + CTCACCAAAC GACTGCGGCG CGGGAACAAA CTAACTGCAA CGCCGGCCGG ACCTATTTGT 5640 + TGCAAGTGGC GCGCATCCAG CGCCTGCAAC ATGCCCCAGC CCAAGTACAC AACTACTTAC 5700 + CTGCAACGTC GCCAGAGGCT CCCAGCGAAT CGGTGCTTCC GTCCTTCTGG CGGGGGTACC 5760 + TGAAAAGAAA CAAATTAAAC AATATTAATC CTAAATTTCA ATGTTTTTTG TAAAATAATT 5820 + TAAATTGTTA AATGTAAACA AGCCTTGCAA TATGTTAATG TTACCAGTCC ATGCTACTGT 5880 + CTAAAAGCCA AGAATACAAA AAATACTAAT TATAAACTAA CTCACCACGC CCAACCCCCA 5940 + AACTCACCCC ATGCAATGTT AAACCTATAA ATTCAAATAA TTGTACCTAT ATATTGCACA 6000 + TACTGTAATC AAAGGCAAAA TAAATCGTGG ATGCGGAACA GAATTTACTC TGTCTCCGTA 6060 + CCTCCACCAG CAAAGTTAAA AAA 6083 +// +ID DMIFACA standard; DNA; INV; 5371 BP. +XX +AC M14954; +XX +DR FLYBASE; FBte0000133; Dmel\I-element. +XX +FT source M14954:100..5470 +FT SO_feature CDS ; SO:0000316:187..1467 +FT SO_feature start_codon ; SO:0000318:1..3 +FT /name="Dmel\I-element\gag" +FT /db_xref="FLYBASE:FBgn0020417" +FT /db_xref="SPTREMBL:Q24362" +FT /db_xref="NCBI_PROTEIN:AAA70221.1" +FT /translation="MTDPPNIYKITSKTYQSQLGEPKFIIIKRNDNNSFERTSPFIIKK +FT SVDFACGGEVEGCKRTRDGNLLIKTKNELQARKLLKLTKIADEDVTASEHKTLNFSKGV +FT IYCNDLRHIDEDTILQELKPQKVSEVKKIMKRQNPNSNSDTNNITLVETGLIIITFESH +FT KLPEIVRIGYETVRVRDYIPLPLRCKKCLRFGHPTPICKSVETCINCSETKHTNDGEKC +FT TNEKNCLNCRNNPELDHQHSPIDRKCPTFIKNQELTAIKTTQKVDHKTAQHIYFERHGF +FT QTKNTYAKTLTNGTTQRTTNTPSPNIHTNTTQSQQQNPHHTPKSAAQNTSAKTPTTEPA +FT KTTLLSNQPHQHHHHHSYDKLEDMDTDYTPTRKPSTTYSSQLTEDLKIKIFPKDKSNNL +FT SINLKASKLKAKAHKNKHTNNSDSESI" +FT SO_feature CDS ; SO:0000316:1938..5195 +FT SO_feature start_codon ; SO:0000318:1..3 +FT /name="Dmel\I-element\RTase" +FT /db_xref="FLYBASE:FBgn0020418" +FT /db_xref="SPTREMBL:Q24363" +FT /db_xref="NCBI_PROTEIN:AAA70222.1" +FT /translation="MAPSWGSPTTNKRGKITHRFIDNMHLILLNDKSPTHFSTHNTYTH +FT IDLTLCSPILAPHAKWKILNDLHGSDHFPIITTLFPTTNPQKFYRPFFKLKEANWEQFN +FT ALTHQTNKKYPTSHNVNKEAALINRIILYSANLSIPQTSPNTHPYRVPWWNKHLDQLRK +FT EKQLAWKKLNRTITVDNILDYRRKNAIFRYELKKRKKEASSSFTSTIHPTTPSSKIWAN +FT IRRFCGLNPAKQIHAITNPVNNETTLASNEIANIFAQHFSDLSGDWNFSEEFRNNKYRN +FT NIHLYTPSPIAQTIEENITYLELSSALQTLKGCAPGLNRISYQMIKNSSHTTKNRITKL +FT FNEIFNSHIPQAYKTSLIIPILKPNTDKTKTSSYRPISLNCCIAKILDKIIAKRLWWLV +FT TYNNLINDKQFGFKKGKSTSDCLLYVDYLITKSKMHTSLVTLDFSRAFDRVGVHSIIQQ +FT LQEWKTGPKIIKYIKNFMSNRKITVRVGPHTSSPLPLFNGIPQGSPISVILFLIAFNKL +FT SNIISLHKEIKFNAYADDFFLIINFNKNTNTNFNLDNLFDDIENWCSYSGASLSLSKCQ +FT HLHICRKRHCTCKISCNNFQIPSVTSLKILGITLNNKYKWNTHINLLLPKLHNKLNIIK +FT CLSSLKFNCNTHTLLNVAKATIIAKLEYGLFLYGHAPKSILNKIKTPFNSAIRLALGAY +FT RSTPINNLLYESNTPPLEMKRDLQIAKLSQNLILSKNTPIHKFLKPKKANKKKTSTIDR +FT TIKLSLELNLPYKPIKLHKNKPPWTLPNLIDTSLRIHKKEQTSPDQYRKLYEHTKNNLK +FT THNFIFTDGSKINYTISFAITTETDVLKYGILPPYSSVLTSETIAILEAIELTKNRRGK +FT FIICSDSLSAVDSIQNTNNNSFYPSRIRSLITQHAPKIKIMWIPGHSGIKGNELADQAA +FT KSASSMPLILTPNINTTDIKKHLKADLATKQKEHIINCSPWYQSINTNTSHPCDYLKQS +FT HPNWTRLDQIKIIRLRLGHTNITHQHYLNPNSIPTCPFCQGDISLNHIFNSCPSLLQTK +FT QDIFNNTNPLDLLSKPNPDNIQKLILFLKKTKLYHKI" +XX +CC Derived from M14954 (g157749) (Rel. 44, Last updated, Version 2). +CC Takis Benos and Michael Ashburner, 20-Aug-1997. +CC Any changes to original sequence record are annotated in an FT line. +XX +SQ Sequence 5371 BP; 2176 A; 1446 C; 606 G; 1143 T; 0 other; + CATTACCACT TCAACCTCCG AAGAGATAAG TCGTGCCTCT CAGTCTAAAG CCTCGCTTCG 60 + CGTAAGCCCA AAACTCTTAT CAGCAAAATC TTGATAAACA AATATCAACC ACAAAGAGAA 120 + AATAAAAAAC TTAACAACAA AAACAACAAT ACCGCTAATC CGGGCTCAAG CCCTTAACCA 180 + ACAATCATGA CAGACCCACC AAACATTTAC AAAATCACTT CAAAAACATA CCAATCCCAA 240 + TTAGGCGAAC CTAAATTTAT AATTATTAAA AGAAATGACA ACAACTCTTT CGAAAGAACT 300 + TCACCATTCA TCATAAAAAA ATCGGTGGAC TTTGCCTGTG GAGGAGAAGT TGAGGGATGC 360 + AAACGTACAA GAGACGGCAA CCTGCTAATA AAAACCAAAA ATGAATTACA AGCCAGAAAA 420 + CTCCTAAAAC TAACAAAAAT TGCAGATGAG GATGTAACAG CAAGTGAACA TAAAACATTA 480 + AACTTCTCTA AGGGAGTTAT TTACTGTAAC GACCTTAGAC ACATCGACGA AGACACAATT 540 + CTACAAGAAC TAAAACCACA AAAAGTATCT GAAGTTAAAA AAATAATGAA ACGGCAAAAC 600 + CCCAACTCTA ACTCCGACAC CAACAACATC ACATTAGTTG AAACTGGACT CATAATTATA 660 + ACCTTTGAAT CGCATAAGCT CCCCGAGATA GTACGAATCG GGTACGAAAC AGTCCGAGTA 720 + CGAGACTATA TCCCACTCCC ACTTCGATGC AAAAAATGCC TCCGCTTCGG TCATCCAACA 780 + CCCATATGCA AAAGTGTAGA AACTTGCATC AATTGCTCTG AAACAAAACA CACAAACGAC 840 + GGAGAAAAAT GCACAAACGA AAAAAACTGC TTAAATTGCC GAAATAACCC AGAACTTGAC 900 + CATCAACACA GCCCAATTGA CCGCAAATGC CCTACGTTCA TAAAAAACCA GGAATTAACA 960 + GCAATTAAAA CCACACAAAA AGTTGACCAT AAAACGGCCC AACACATATA TTTCGAACGT 1020 + CACGGCTTCC AAACGAAAAA CACCTACGCC AAAACACTTA CAAACGGCAC AACCCAGAGG 1080 + ACAACAAACA CTCCATCACC TAATATTCAC ACAAACACAA CCCAATCACA ACAACAAAAT 1140 + CCGCACCACA CACCCAAATC AGCAGCACAA AACACTTCAG CTAAGACACC AACAACTGAA 1200 + CCAGCCAAAA CAACCTTACT ATCCAACCAA CCACACCAAC ACCACCACCA CCACAGCTAC 1260 + GACAAACTAG AAGACATGGA TACCGACTAC ACACCTACCA GAAAACCATC TACGACATAC 1320 + TCATCACAAC TCACAGAAGA CCTAAAAATA AAAATCTTCC CTAAAGATAA GTCCAATAAC 1380 + CTATCCATAA ACCTTAAAGC ATCAAAACTA AAGGCCAAAG CCCACAAAAA CAAGCACACT 1440 + AACAACAGCG ACAGCGAATC CATATAGAAC TCTACACAAA ACCCTAACCG TTAACACTAC 1500 + CTTTAAGTAA GTTATAAGCT TTAATTTTCT CACAAATGTC CCTAACTATA ATCCAATGGA 1560 + ATCTAAAAGG ATATCTAAAC AACTACAGCC ATCTCCTTAT TCTAATCAAA AAATACTCCC 1620 + CCCACATAAT TTCCCTCCAA GAAACCCATA TACAATACAC TAATAACATT CCAACCCCAA 1680 + TAAACTACAA ACTATTAACA AATATTGCCA CCAACAGATT TGGGGGGCGT ACGACTACTA 1740 + GTGCATAAGT CAATACAACA CACTGTCCTC AACATAACAA TCGATATAGA AGCAATAGCC 1800 + ATAAATATAG AATCTAAACT TAAATTAAAC ATATTTTCCA CATACATTTC TCCGACCAAA 1860 + AACATAACTA ACCAGACACT CCATAACACA TTTAACATAC AACAAACACC CTCTCTAATT 1920 + ACGGGAGATT TTAATGGATG GCACCATCCT GGGGCTCCCC AACAACAAAT AAACGAGGAA 1980 + AAATAACTCA TAGATTCATT GACAACATGC ACCTTATCCT GTTAAACGAC AAATCTCCCA 2040 + CACACTTTTC AACACACAAT ACATACACAC ACATAGACCT CACACTCTGC TCTCCAATCC 2100 + TAGCCCCCCA CGCCAAGTGG AAAATACTAA ACGATCTTCA CGGTAGCGAC CATTTCCCTA 2160 + TTATCACAAC ACTATTCCCA ACAACCAATC CACAAAAATT CTACAGACCC TTTTTTAAAC 2220 + TCAAAGAAGC CAACTGGGAA CAGTTCAACG CTCTTACCCA CCAAACCAAC AAGAAATACC 2280 + CCACCTCCCA CAACGTAAAC AAAGAAGCCG CTCTAATCAA TAGAATCATC CTTTATAGCG 2340 + CAAACCTCTC CATCCCACAA ACCTCACCTA ACACACATCC ATACAGGGTT CCATGGTGGA 2400 + ATAAACACCT CGACCAATTA CGTAAAGAAA AACAACTTGC CTGGAAAAAA TTAAACCGCA 2460 + CAATTACTGT TGACAACATT CTAGACTATA GACGCAAAAA CGCAATATTT AGATACGAAC 2520 + TAAAAAAGAG GAAAAAAGAA GCTTCCAGCT CTTTCACCTC AACCATCCAT CCCACTACTC 2580 + CCTCATCCAA AATATGGGCC AATATAAGAC GCTTCTGCGG ACTTAACCCA GCAAAACAAA 2640 + TTCATGCCAT CACAAACCCA GTAAATAACG AGACTACATT GGCTAGCAAC GAAATTGCTA 2700 + ACATATTCGC ACAACATTTC TCTGACCTCT CCGGCGACTG GAACTTCTCA GAGGAGTTCC 2760 + GGAACAATAA ATATAGAAAT AACATACATC TCTACACCCC CTCTCCAATA GCCCAAACCA 2820 + TAGAAGAGAA CATAACGTAT CTAGAACTTA GCTCAGCACT ACAAACATTA AAAGGATGTG 2880 + CTCCAGGACT AAATAGAATC TCGTATCAAA TGATCAAAAA TAGCTCCCAC ACAACAAAAA 2940 + ACCGAATAAC GAAACTATTT AATGAAATAT TCAATAGCCA CATACCTCAA GCCTACAAAA 3000 + CAAGCCTAAT CATCCCAATC CTTAAGCCAA ACACCGACAA AACGAAAACT TCCTCATACC 3060 + GACCCATCTC CCTCAACTGC TGTATAGCAA AGATACTTGA TAAAATAATT GCGAAAAGAC 3120 + TCTGGTGGCT AGTGACATAT AACAACCTAA TTAACGACAA ACAATTCGGG TTCAAAAAAG 3180 + GCAAATCGAC TTCGGACTGT CTACTCTATG TAGACTATCT CATAACGAAG TCAAAAATGC 3240 + ACACCTCCCT CGTCACTCTT GATTTTTCAA GAGCCTTCGA TCGAGTAGGT GTGCACTCCA 3300 + TAATCCAGCA ATTGCAGGAA TGGAAAACGG GTCCCAAAAT AATAAAATAC ATTAAAAACT 3360 + TCATGAGCAA CAGAAAAATA ACTGTCCGCG TCGGTCCGCA TACATCAAGC CCGTTACCCC 3420 + TATTCAACGG AATCCCCCAA GGTTCACCCA TATCCGTAAT ACTTTTCCTC ATAGCATTCA 3480 + ACAAATTATC CAACATCATA TCCCTACATA AAGAAATTAA ATTCAACGCA TATGCCGACG 3540 + ACTTCTTCCT TATAATAAAT TTCAACAAAA ACACAAATAC AAATTTCAAC TTAGACAATC 3600 + TATTCGACGA TATAGAAAAT TGGTGCTCCT ACTCAGGGGC ATCGCTTTCC CTATCCAAAT 3660 + GTCAACACCT CCACATATGC AGAAAACGTC ACTGCACATG CAAGATAAGC TGCAACAACT 3720 + TCCAAATTCC TAGCGTTACG TCCTTAAAAA TTCTAGGAAT AACCTTAAAC AACAAATACA 3780 + AATGGAACAC ACACATAAAC CTACTTCTAC CCAAACTACA CAACAAGCTA AATATAATAA 3840 + AATGCCTATC TAGTCTTAAA TTTAACTGCA ACACGCATAC ACTACTTAAT GTCGCAAAAG 3900 + CAACAATTAT AGCCAAACTA GAGTATGGTT TGTTTCTGTA CGGCCATGCT CCCAAAAGCA 3960 + TTTTAAACAA AATAAAAACA CCGTTTAACT CCGCTATCCG TCTAGCTCTC GGCGCATATC 4020 + GCTCTACCCC AATAAATAAC TTACTTTACG AATCGAATAC TCCCCCCTTA GAAATGAAAC 4080 + GAGACCTTCA AATAGCCAAA CTATCCCAAA ACCTAATCCT CTCCAAAAAC ACACCAATAC 4140 + ATAAGTTCTT AAAGCCTAAA AAAGCTAATA AGAAAAAAAC ATCAACAATA GACCGAACAA 4200 + TCAAACTTAG CCTAGAACTT AATCTACCCT ACAAACCAAT AAAACTCCAT AAAAACAAAC 4260 + CACCATGGAC CCTCCCCAAT CTAATAGACA CGTCACTTAG AATCCATAAG AAAGAACAAA 4320 + CATCTCCAGA CCAATACAGA AAATTATACG AACACACAAA GAATAACCTC AAAACACACA 4380 + ATTTCATATT CACTGACGGT TCAAAAATTA ATTACACAAT ATCATTCGCC ATTACAACGG 4440 + AGACAGACGT CTTGAAATAC GGCATACTGC CCCCATATTC ATCCGTCCTC ACCTCCGAAA 4500 + CAATCGCCAT CCTAGAAGCA ATAGAACTTA CTAAAAACCG AAGAGGCAAA TTTATTATCT 4560 + GCTCCGACTC CCTATCAGCA GTAGATTCAA TTCAAAACAC AAATAATAAC AGCTTTTACC 4620 + CAAGCAGAAT ACGATCGCTA ATAACGCAAC ACGCACCTAA AATTAAAATA ATGTGGATTC 4680 + CTGGCCATTC AGGAATAAAA GGAAATGAAT TAGCCGATCA AGCTGCAAAA TCAGCAAGCA 4740 + GTATGCCACT TATCCTCACC CCAAACATAA ATACCACAGA TATAAAAAAA CACCTTAAAG 4800 + CCGACCTTGC GACAAAACAG AAAGAACACA TAATAAACTG CAGTCCATGG TACCAATCTA 4860 + TTAACACGAA CACCTCACAC CCATGCGATT ACCTTAAACA ATCCCACCCA AATTGGACCA 4920 + GACTCGACCA AATAAAAATA ATACGACTTC GACTAGGACA CACAAACATA ACCCACCAAC 4980 + ACTACCTAAA TCCCAATTCA ATACCAACTT GCCCGTTTTG CCAAGGTGAT ATTTCTTTAA 5040 + ACCACATATT TAACTCATGC CCATCCCTCC TACAAACCAA GCAAGATATA TTTAACAACA 5100 + CCAACCCTCT AGACCTTCTT AGCAAACCCA ATCCAGATAA CATACAAAAA CTCATACTTT 5160 + TCCTCAAAAA AACTAAATTA TACCACAAAA TCTAAAAACA AAACAGGCAT TTGTACATAA 5220 + CAAGCCAGCA ATTAGTTACC AAATTAGATA TTAACTAAAT TAAGATATAA TAACATTGTA 5280 + AATAAATATA GCTGTAAGCC CCGTAGCTAA TGCTATACTA TCTAAGTTAG TCTAGTTTTG 5340 + TAAACTATTC TATCTATCAT AATAATAATA A 5371 +// +ID DMLINEJA standard; DNA; INV; 5020 BP. +XX +AC M22874; +XX +DR FLYBASE; FBte0000088; Dmel\jockey. +XX +SY synonym: wallaby +SY synonym: sancho +XX +FT source M22874:115..5134 +FT SO_feature CDS ; SO:0000316:300..2051 +FT SO_feature start_codon ; SO:0000318:1..3 +FT /name="Dmel\jockey\gag" +FT /db_xref="FLYBASE:FBgn0020297" +FT /db_xref="SWISS-PROT:P21330" +FT /db_xref="NCBI_PROTEIN:AAA28674.1" +FT /translation="ISIALYGISIKTIDIMENSFAQSRPSNGCDKFEKMRKVAGVEPGE +FT LRSQLRASCAVVSPNLEGMPTQSAVSSLMVTISSNTNASVTCTISNVQANMICTPTYTD +FT CTTVTTSICPTTPYDNGLPTPLSSLPNKPSKANCPFQAHDRTVNRKRKGVSQPPLPILT +FT PSPSRKTKRQATMPLNEEASTSTAAALNNNRFALLSAEAENMEQDVSDADSDIEDSAAR +FT DGGGQSAKYSKPPAICVPSVSDPVTLERALNLSTGSSNYYIRISRFGVSRIYTANPDAF +FT RTAVKELNKLNCQFWHHQLKEEKPYRVVLKGIHANVPSSQIEQAFSDHGYEVLNIYCPR +FT KSDWKNIQVNEDDNEATKNFKTRQNLFYINLKQGPNVKESLKITRLGRYRVTVERATRR +FT KELLQCQRCQIFGHSKNYCAQDPICGKCSGPHMTGFALCISDVCLCINCGGDHVSTDKS +FT CPVRAEKAKKLKPRSRLPMTNNIATLKPPQRSSSGYIPAEALRTNISYADIARRNTTQS +FT RARATVQAEVIPTSDNSLNNKFMTLDNSIRAINTRMDELFKLIHETVEANKAFRELVQV +FT LITRIPK" +FT SO_feature CDS ; SO:0000316:2048..4798 +FT SO_feature start_codon ; SO:0000318:1..3 +FT /name="Dmel\jockey\pol" +FT /db_xref="FLYBASE:FBgn0015952" +FT /db_xref="SWISS-PROT:P21328" +FT /db_xref="NCBI_PROTEIN:AAA28675.1" +FT /translation="MTQPTLKIGLWNARGLTRGSEELRIFLSDHDIDVMLTTETHMRVG +FT QRIYLPGYLMYHAHHPSGNSRGGSAVIIKSRLCHSPLTPISTNDRQIARVHLQTSVGTV +FT TVAAVYLPPAERWIVDDFKSMFAALGNKFIAGGDYNAKHAWWGNPRSCPRGKMLQEVIA +FT HGQYQVLATGEPTFYSYNPLLTPSALDFFITCGYGMGRLDVQTLQELSSDHLPILAVLH +FT ATPLKKPQRVRLLAHNADINIFKTHLEQLSEVNMQILEAVDIDNATSLFMSKLSEAAQL +FT AAPRNRHEVEAFRPLQLPSSILALLRLKRRVRKEYARTGDPRMQQIHSRLANCLHKALA +FT RRKQAQIDTFLDNLGADASTNYSLWRITKRFKAQPTPKSAIKNPSGGWCRTSLEKTEVF +FT ANNLEQRFTPYNYAPESLCRQVEEYLESPFQMSLPLSAVTLEEVKNLIAKLPLKKAPGE +FT DLLDNRTIRLLPDQALQFLALIFNSVLDVGYFPKAWKSASIIMIHKTGKTPTDVDSYRP +FT TSLLPSLGKIMERLILNRLLTCKDVTKAIPKFQFGFRLQHGTPEQLHRVVNFALEAMEN +FT KEYAVGAFLDIQQAFDRVWHPGLLYKAKRLFPPQLYLVVKSFLEERTFHVSVDGYKSSI +FT KPIAAGVPQGSVLGPTLYSVFASDMPTHTPVTEVDEEDVLIATYADDTAVLTKSKSILA +FT ATSGLQEYLDAFQQWAENWNVRINAEKCANVTFANRTGSCPGVSLNGRLIRHHQAYKYL +FT GITLDRKLTFSRHITNIQQAFRTKVARMSWLIAPRNKLSLGCKVNIYKSILAPCLFYGL +FT QVYGIAAKSHLNKIRILQAKTLRRISGAPWYMRTRDIERDLKVPKLGDKLQNIAQKYME +FT RLNVHPNSLARKLGTAAVVNADPRTRVKRRLKRHHPHDLPNLVLT" +XX +CC Derived from M22874 (g157823) (Rel. 47, Last updated, Version 5). +CC Takis Benos and Michael Ashburner, 20-Aug-1997. +CC Any changes to original sequence record are annotated in an FT line. +XX +SQ Sequence 5020 BP; 1527 A; 1198 C; 1055 G; 1240 T; 0 other; + AAAAATCATT CACATGGGAG ATGAGCAATC GAGTGGACGT GTTCACAGAA GTCGCGAGAT 60 + AAAACAAAAA CGTAATTGTG ATCCATCACA AACATCTGCG CAGATCGTGT GCTTATCTCA 120 + CAAACAAAAT CTATTTTTAG TCACTGCATA ACGGTGACGG CTTCGGTTCG CGAAACTTAT 180 + CAGCAACTAG CAATTTCTAA GCTGTGTTGT TTTTGCCCCT CGCCCTGCGC GCTGCGCAAG 240 + CGGGAGGTTG TTACAATTTA CCTTACAAGT AAACCGGTAA ATCTTATCGT GTTTAGTAAA 300 + TATCAATTGC ATTATACGGC ATAAGTATAA AGACAATTGA TATAATGGAG AATTCATTTG 360 + CTCAATCGCG ACCTAGCAAT GGGTGCGATA AATTTGAGAA AATGAGGAAA GTAGCAGGTG 420 + TTGAGCCAGG AGAATTACGC TCCCAACTCC GCGCCAGCTG TGCAGTTGTT TCCCCTAACC 480 + TGGAAGGTAT GCCAACTCAA TCTGCGGTCT CCAGCTTAAT GGTGACAATC AGCAGCAACA 540 + CCAATGCAAG TGTTACCTGC ACTATTTCTA ACGTACAGGC CAACATGATC TGTACTCCTA 600 + CATACACTGA TTGCACAACC GTGACCACTA GCATTTGCCC AACTACGCCT TATGACAATG 660 + GACTGCCGAC ACCTCTGTCA TCACTGCCCA ATAAGCCATC TAAAGCGAAT TGCCCCTTTC 720 + AAGCACATGA TCGTACTGTC AACAGGAAAC GAAAAGGCGT GTCTCAGCCC CCATTACCTA 780 + TCCTCACCCC TTCTCCAAGC CGTAAAACTA AAAGGCAGGC CACTATGCCA CTCAATGAGG 840 + AGGCCTCTAC CTCCACTGCA GCAGCATTAA ATAACAATCG CTTCGCGCTT TTGTCCGCTG 900 + AAGCGGAGAA TATGGAGCAA GACGTGTCGG ATGCTGATTC TGACATTGAA GACTCTGCTG 960 + CCCGAGATGG TGGTGGACAA TCCGCTAAAT ATAGCAAACC CCCAGCCATA TGCGTACCAA 1020 + GTGTAAGCGA TCCGGTCACC TTGGAACGGG CTCTCAATCT GAGCACCGGC TCCTCAAACT 1080 + ACTACATCCG CATTTCTAGA TTTGGTGTAT CCAGAATCTA TACAGCCAAC CCTGATGCTT 1140 + TCCGCACCGC TGTAAAAGAA CTAAATAAGT TAAATTGTCA ATTCTGGCAT CACCAACTTA 1200 + AAGAAGAAAA ACCCTACAGA GTAGTGCTTA AAGGAATCCA TGCTAATGTT CCTAGTTCGC 1260 + AGATAGAACA AGCATTTAGT GATCACGGCT ATGAGGTCCT TAATATCTAT TGCCCCAGAA 1320 + AGTCTGACTG GAAGAACATT CAGGTAAACG AAGATGATAA TGAAGCTACA AAAAACTTCA 1380 + AAACTAGACA AAATTTGTTT TATATTAATC TTAAACAAGG CCCGAATGTT AAAGAGTCTC 1440 + TTAAGATAAC TCGACTTGGC AGATACAGAG TCACTGTTGA GCGCGCTACA CGTAGAAAAG 1500 + AACTGCTACA ATGTCAAAGA TGCCAAATTT TTGGACACTC TAAGAACTAT TGCGCCCAGG 1560 + ATCCTATTTG TGGTAAATGT AGTGGTCCCC ATATGACCGG GTTCGCTTTG TGCATAAGTG 1620 + ACGTATGTCT GTGTATAAAT TGTGGTGGTG ATCATGTCTC GACAGACAAA AGCTGCCCTG 1680 + TCAGAGCAGA GAAAGCCAAG AAGCTAAAAC CAAGGTCCAG GCTACCGATG ACTAATAATA 1740 + TTGCCACACT CAAACCTCCA CAACGTTCTT CAAGCGGTTA CATACCAGCT GAGGCATTAA 1800 + GAACCAACAT CTCTTATGCT GATATTGCTC GACGCAACAC GACTCAATCT AGGGCTCGTG 1860 + CTACTGTGCA GGCTGAAGTT ATACCAACGT CGGACAATAG CCTTAACAAT AAATTTATGA 1920 + CGTTAGACAA CTCCATTCGG GCCATCAATA CGAGAATGGA CGAACTATTT AAGCTTATAC 1980 + ACGAAACTGT AGAGGCTAAT AAAGCTTTCA GAGAACTGGT TCAGGTTCTA ATTACACGTA 2040 + TTCCTAAATG ACTCAACCAA CCTTAAAAAT CGGATTGTGG AACGCTCGCG GATTAACAAG 2100 + GGGCTCTGAG GAGCTTCGGA TATTCCTCAG CGATCACGAT ATAGACGTAA TGCTTACCAC 2160 + GGAAACACAC ATGCGAGTTG GTCAGCGCAT CTATCTCCCA GGGTATCTTA TGTATCACGC 2220 + CCACCACCCC AGTGGTAACA GTAGAGGTGG CTCTGCAGTC ATCATAAAAT CTAGACTTTG 2280 + TCACAGCCCT CTGACACCTA TCTCTACTAA TGACAGGCAG ATAGCGAGAG TGCACCTGCA 2340 + AACATCGGTT GGGACCGTCA CTGTAGCTGC TGTTTATCTA CCTCCAGCAG AAAGATGGAT 2400 + AGTAGATGAC TTCAAATCCA TGTTTGCTGC GTTAGGCAAC AAATTTATTG CTGGTGGTGA 2460 + TTACAATGCC AAACATGCAT GGTGGGGGAA CCCAAGATCC TGTCCTAGAG GTAAAATGTT 2520 + GCAAGAAGTC ATTGCACATG GGCAATACCA AGTTCTGGCT ACGGGCGAAC CCACTTTCTA 2580 + CTCTTACAAC CCTTTGTTAA CACCATCAGC CCTTGATTTT TTTATAACCT GTGGGTACGG 2640 + CATGGGCAGG CTAGATGTAC AAACTCTCCA GGAACTCTCG TCGGACCATC TTCCTATTCT 2700 + GGCTGTATTG CACGCTACGC CGTTAAAGAA ACCACAACGC GTACGACTAC TTGCCCATAA 2760 + TGCTGACATA AACATATTCA AAACCCATCT TGAACAGCTG AGTGAGGTAA ATATGCAAAT 2820 + TCTGGAGGCG GTGGACATTG ATAATGCCAC AAGCCTTTTC ATGAGCAAAC TAAGTGAGGC 2880 + TGCTCAGCTT GCTGCACCGA GAAATCGGCA TGAAGTAGAG GCCTTCAGAC CACTTCAACT 2940 + TCCTTCCAGT ATATTGGCAC TGCTCAGGCT AAAACGAAGA GTTCGAAAAG AATATGCTAG 3000 + AACAGGTGAT CCCCGCATGC AACAGATCCA CAGTAGACTG GCCAACTGCC TGCATAAGGC 3060 + CCTTGCTCGA AGAAAGCAGG CCCAAATAGA TACCTTCTTG GATAACTTGG GTGCTGACGC 3120 + GAGCACAAAT TACTCACTGT GGCGTATCAC GAAACGGTTC AAAGCTCAGC CCACCCCAAA 3180 + ATCAGCAATC AAAAATCCGT CTGGTGGCTG GTGTCGCACT AGCTTGGAAA AAACTGAAGT 3240 + GTTCGCTAAC AACCTTGAGC AACGTTTTAC ACCCTATAAC TATGCACCGG AAAGTCTCTG 3300 + TCGTCAGGTT GAAGAATACT TGGAATCGCC CTTTCAAATG AGCCTGCCTC TGAGTGCTGT 3360 + CACACTGGAA GAAGTGAAGA ATTTAATAGC CAAGCTGCCA CTTAAGAAAG CTCCTGGAGA 3420 + AGATCTTCTT GATAATAGAA CCATTAGACT TCTCCCAGAT CAAGCATTGC AGTTCCTTGC 3480 + CTTAATATTC AACAGCGTTC TTGATGTTGG CTACTTTCCG AAAGCTTGGA AATCGGCGAG 3540 + CATAATTATG ATCCATAAGA CTGGAAAAAC ACCGACAGAC GTTGACTCGT ACAGGCCCAC 3600 + CAGCTTACTC CCATCTCTGG GTAAAATTAT GGAGAGGCTG ATCCTAAACA GGCTGCTCAC 3660 + ATGCAAGGAT GTTACCAAAG CGATTCCCAA ATTTCAGTTT GGCTTCCGGT TGCAGCACGG 3720 + TACTCCTGAG CAACTACATA GAGTAGTGAA CTTTGCTCTG GAAGCTATGG AAAACAAGGA 3780 + GTATGCAGTA GGTGCCTTTC TTGATATTCA ACAGGCATTT GACAGAGTCT GGCACCCTGG 3840 + GCTCCTGTAC AAAGCGAAGA GGCTGTTCCC GCCGCAGCTA TATTTGGTTG TTAAAAGTTT 3900 + CCTGGAAGAA CGCACATTCC ACGTCTCTGT TGATGGGTAC AAATCATCAA TCAAGCCAAT 3960 + TGCAGCTGGA GTTCCTCAAG GAAGCGTTCT TGGCCCAACC CTATACTCAG TTTTTGCTTC 4020 + GGACATGCCT ACTCACACAC CAGTCACAGA GGTAGACGAA GAAGATGTGC TCATAGCCAC 4080 + CTACGCTGAC GATACTGCTG TGCTCACGAA AAGTAAAAGT ATCCTGGCTG CCACTTCTGG 4140 + TCTACAGGAA TACCTGGATG CATTCCAGCA ATGGGCTGAG AACTGGAATG TGCGCATCAA 4200 + CGCTGAGAAG TGTGCCAATG TGACGTTCGC CAACCGAACA GGTAGCTGTC CGGGTGTCAG 4260 + TCTGAATGGA AGACTGATCA GACACCATCA GGCTTATAAA TACCTTGGTA TTACCCTCGA 4320 + TAGGAAGCTC ACCTTCAGCA GGCACATCAC AAATATTCAG CAAGCGTTCA GGACCAAGGT 4380 + TGCTCGGATG TCTTGGCTCA TTGCACCACG CAACAAACTG TCGCTTGGCT GCAAGGTCAA 4440 + TATTTACAAG TCCATATTGG CCCCCTGCCT GTTCTACGGC CTGCAGGTAT ACGGCATTGC 4500 + TGCGAAGAGT CACCTTAATA AGATCCGGAT TTTACAGGCG AAGACCTTAA GAAGAATTTC 4560 + GGGGGCTCCT TGGTATATGA GAACAAGAGA CATCGAACGC GACCTCAAGG TGCCCAAATT 4620 + AGGAGACAAG CTCCAGAACA TCGCCCAAAA ATATATGGAA AGGCTTAATG TACACCCCAA 4680 + CAGCCTAGCA AGGAAGCTAG GAACTGCAGC TGTGGTCAAT GCTGACCCTC GGACTAGAGT 4740 + CAAAAGAAGA CTCAAGCGAC ACCACCCTCA TGACCTCCCT AACCTGGTTT TGACCTAGAA 4800 + AGTCTTAGTT TTAAAATTCA TTAGAATAAT CAAATAAATA ATAATTACTA TGTTATATCA 4860 + ACTATTATAA TTCTCCCTAT CATTTTTAGA TTAAAAATCT GTTAGTCTTA AGTAACCAAG 4920 + ACACATTGTA AAATAAAATA ATTTAAGCAG ATCAAATTAA GTTGCCGCAT GGGTAACAGT 4980 + GCGTTGATCA AATAATAAAA ACATCATAAA AAAAAAAAAA 5020 +// +ID DMTRDNA standard; DNA; INV; 1435 BP. +XX +AC X80025; +XX +DR FLYBASE; FBte0000670; Dmel\hopper. +XX +SY synonym: M4 +XX +FT source X80025:1..1435 +FT SO_feature terminal_inverted_repeat ; SO:0000481:1..33 +FT SO_feature terminal_inverted_repeat ; SO:0000481:1403..1435 +XX +CC Derived from X80025 (g510507) (Rel. 44, Last updated, Version 11). +CC Takis Benos and Michael Ashburner, 20-Aug-1997. +CC Any changes to original sequence record are annotated in an FT line. +XX +SQ Sequence 1435 BP; 456 A; 265 C; 212 G; 502 T; 0 other; + CACTATGGGG CATTTGGCCT GTTTTTTTTA CAAAAATTAA TACCTCCTAA ACTATTGGAG 60 + ATATTTGGAT GAATTTTTTT TTATGCGTTA CACATGCCTC CAGGAATATT TTGGAAAAGT 120 + GGGCGTGCCC CAACTCCGCC CCATTTTTTT TTTTTTTTTT TTTTTTTTTT AATAATATAT 180 + TTTTAAAGTT TATTTTTAAT TTCAATAATG TATAATTCAT AACCGTCTTC CTCTTCACAA 240 + TCAGTAGAGT CTGAAGAATT TTTATCAGGT TCAAATTCGC AAGCTAACAT TTCAATGACT 300 + TCTGGTGGAA GAGATAGTCG CTTATGTTTT CGCCTCTTTA AATTTATTGA TGATATTATG 360 + GGATCCGAAG TATCCATTGC TCTGTAAAAG ACATCTGCGA AGCTACTAAT AGTTTTTGCC 420 + GTGGCTGGCT TCAACAAAAG AATTTTAAGT ATGGCTGCAA GATCCCGCAG GCAGCACTTC 480 + CGTGCAGCTT GAACCAAAAG ACGTTCGTTG TGTTTCTGCG CCCTTACGAG TTCATCTGCT 540 + TGCTGTCTTG GGCCACTCAA ATTTTTTAAA TAATATGACG TTTTCGGGAG TCCAACTAAT 600 + TTCCTTTCCT ATTTATTTTT CTCCTTTACC TTCAGGACTA GGTGTTCTTC TAACCAATTT 660 + GAAAAAAATT TTAAAAATTC ATATATTTTT CGATTGCATT TTCTCCAATT TCGTAAAAGA 720 + TTGACTGAAA TCATTCGTTA TTATTATTAT TAGTTAATCG TTTATTAAAG TCTAGCTTGC 780 + TATCAGAAAA ATGCCCACTG ATAAAAGTGC AAATAGAATT TTCCTTTTGA CGAACACCCT 840 + TTTGCGTGCG CCACACTTCC AGCAGGGCAG CATTGGAAAT CGAGATATTG CTCCCTAAAA 900 + AATGAAATTT CTCAAAAAAC CGCAAAAAAC GCACATAGAG ACTACCTGAT ATGAGTTAGG 960 + AATTGAACAC ACTACAACAT GGATATAAAC ACTTACTGAA CAAATTTGAA CAAATTGTTG 1020 + TAGCTCTATT CAAAGTTGAA AATTTTTTCA AACAACTACA TCTTGACACC ACTTGTTAAA 1080 + TGTACAAATT GTTAGAAATA GGCGCACACA ATAAACAATA TATTAATAAC AACACATAAT 1140 + AAGAACCTAA AGATTGATTA TCCATTTCAA ATTATACTCT CCTTCTTCTT CTTTTTAAAT 1200 + TTTAACACTT TGAAAGTTAA GCTAAATTTT GTGCGCAAAG CAGCCACGTG GTATATGCTC 1260 + GCAACAGCCG ACTTTAACAG CTGTTATTAT AACAGTGCAT TGTTAAATTA ACTTATGCGG 1320 + GCTATATCAT AACAGTTTAA CGTATTTCCA ATGTATTAAT ACTAAAATAC TTCAAATTTG 1380 + CATACTTGTG AAAAACACAT TATTGTAAAA AAAACAGGCC AAATGCCCCA TAGTG 1435 +// +ID DMRTMGD1 standard; DNA; INV; 7480 BP. +XX +AC X59545; +XX +DR FLYBASE; FBte0000015; Dmel\mdg1. +XX +FT source X59545:1..7480 +FT SO_feature five_prime_LTR ; SO:0000425:1..441 +FT SO_feature three_prime_LTR ; SO:0000426:7039..7480 +FT SO_feature CDS ; SO:0000316:548..923 +FT SO_feature CDS ; SO:0000316:1327..1557 +FT SO_feature CDS ; SO:0000316:1749..3062 +FT SO_feature CDS ; SO:0000316:2987..6673 +XX +CC Derived from X59545 (g8507) (Rel. 49, Last updated, Version 4). +CC Takis Benos and Michael Ashburner, 20-Aug-1997. +CC Any changes to original sequence record are annotated in an FT line. +XX +SQ Sequence 7480 BP; 3067 A; 1298 C; 1235 G; 1880 T; 0 other; + TGTAGTATAT ACGAATATAA TAACAATAAT AATAACAATA ATAATAATAA TATTAATAAT 60 + AATTATAATA TGAATCATAA TAATAAGTCA ACTAATAAGT AAACTTAGGA CCACCCTAAT 120 + TCCTTAGGGT CACCCTAGTA GATCTTTAGA TACACCCTAA TACTAAATAT GCGAATTCAG 180 + GATGTACGCC TTTAGGGGTC GGACTCGACT CCCATTGGTT ATCGAGTATG AACTTCATAC 240 + ATACATATTG CAGAATTTGC TAGTGTCAGC ACTTGGCTGT CACAAGAGAT CTCCCTGTAG 300 + ACCACACTAA GATCAGTTAT AAATCAGGAA TAGATCTGGA ATGTACACTC GCTTAATAAA 360 + AACCAAATAA AGATAAAATG ACCAACTGCG TTTTGAGACT TTATTAACTA CATCAGAAGT 420 + ATTAGAATTC AAATTAACTA CATGGCGACC GTGACAAAGG ATCGTTATAA GTTGTAGCAG 480 + AAGCTAAAGG AAACCGCTTG TGATAATTTT CAACTTCGAT GCTCATCCAC CAAGACGGCG 540 + GCAATTATGA AGAAAAAAGC GATCTGAGTG AGTAGAGTGT CAGTGTGATG GGAAAAAACA 600 + GGGGCGGAGT TCGACATAAT ATAAAAAAGA GAATAGCGCA CATAAAGTGG CTATTATATA 660 + CGAACACTCC ACCACCCCAA TGGTCGAAAG CTCAAAAACT ACAAGCTGAG CTAGACCACT 720 + GTGTCGAATA TCTCAAGAAA AAAATCCCCA CCACACGCGC TCACTCAGAA AATCAAATAA 780 + AATCGTTAAC AATTAACAAA ACTCCAACTC CCAATCCGAA AAGCCTGCCT GTTTTCAAGA 840 + AAAGATGCCC GAACGACTGC GAGGGACCAC TGTTCACACC GCATTGTGAA CATACGTGCA 900 + GACATTGCAG CTCCACCACA TAACCCCTAA ATGAGGAAAT CATCATCAAC GTGGTGAGCA 960 + GCCCGCTCAT TACGTCATCG AGGGAGTGTC AGCGTGCCAA CCCGGCGACG ACCAGATGAC 1020 + GCAGGAGGGT CAGAGTGAAG CAAATAGGAG CTGAAAAATA AAATATTTTT TTTGTTGCCC 1080 + TGCGTGGCAC ACCCTCGATG CACTGCGCTG CATATTAATA TTACACAAAA TATTGTAACA 1140 + TTGAGCGGAA CTTTTTCTGC CCGATGAGAA GAATGGCCCG TAAAGCCATA CACCAACTAG 1200 + GTAGGAAAAT GTAACTATAT TGAACAAAAA AAAAAAAAAT CAAAACAACA TATTTTTAAA 1260 + GTAAAATAAA CCAAAACCCA AAAATAAAAA AAAAAAAAAA AAAAAAAAAA ATAAAAATAT 1320 + ACAAAAATGG GTTGGTTTGG ATCTGACGAT AGTCAGACAA AAGATAATAC GGCCAATGTG 1380 + GTCAATAACT TAAAAATAGT CGACCATACA GATGACATTC AGTCACTGTG GTTACTCCTT 1440 + TTGATCATGA CGATCGTAAC AGTCGCTCAG TTTATATTAA CGCTATATGT TAAGCATAAC 1500 + AAGATAATAA AGAGGCGTTA TATAGGCAAA GCAGAGAATA GTTTGGATAA AATTTGAAAA 1560 + AAAAAAAAAA AAAAAAAAAA AAAAAAACAT CCGAGATGTA TTTTGAATTA AGATGATCTA 1620 + AAATTTTTAT TTTTAATATC AGAAAACTAG AATGAAAAAA AAAAAAAAAG ATTATTGAAG 1680 + AAACCTATTT GAGAGAGGCC AAAATTTATA AAGTTCGATT GCATAGATAA ATCCATAGTA 1740 + TTCTTTAAAT GGACTGGCAA GAAATACAAA ACGAGCTTAA AGAAATTAAA ACAACTTTTG 1800 + ACAAGTCTTA TAAATGCATG ACACCAAATA GAGAAGTGCA ACAAGACACT CTCAACAAGC 1860 + ATGCGCAGAT ATTGGTAAGA TGCTTTAATG GAGCACGCCA ATTAATTTAC AGAGAAAGGA 1920 + AAAGATTAAC AAAAAATCAT TTATCACAAG CAGTAAAATT TCTAAACAGG TTCCGTGAGA 1980 + ACTTGTTAAA CGTCAAGTAC AGACACAACT TAAATATTAC AATCCCAACG ATTTTAAGCA 2040 + CACCTATAGT GGCTGAGATC GGTGAGGATA TCGAAAGTGT AGGAGAATCA GAAATAGAAA 2100 + TAAAAGAAGA GGATCTCCAC GATCTTGCAA TTCCAGCGGT AATAACATTA CCCGAATTAC 2160 + TTGAAGAAGA ACTTTCAGAT TCAAATACAG GAATAAGAAT ACAGGAAACG GACAAAATGA 2220 + CAGACTCTGC CGCAACAGCA AGGGAATATG TGCGACAAAT TTCGTCCACA ATACCTGAGT 2280 + TTGACGGCAA AAAGTTAAAC TTGAATAGAT TCCTCACGGC TCTCCGGCTG ATAGATCTGA 2340 + CAAAAGGAGA TCAGGAGATG CTAGCGGTTG AGGTAATCAA GACAAAGATA CTTGGTCCAT 2400 + TATCACACAA AGTTGAAAAT GAAAAGACCA TTATCGGTAT AATAAATCTA TTAAAAGCAT 2460 + CAGTTAAAGG CGAATCGCCC GATGTCATCA AAGCAAAAAT GCTTAGTACA CAACAGCGCG 2520 + GCAAAACTGC AGCGCAATAT ACCACGGAGA TAGAAAACCT ACGTGGGTTG CTCGAAGCAG 2580 + CCTATATAGA TGATGGTTTA GATTCCAACA ATGCAGACAA ATTCGCTACA AAGGAAGCCA 2640 + TATCTGCAAT GACCAAGAAC TGTGGGCACG ATAAGCTCAA AACCATATTG GAAGCTGGAA 2700 + ATTTCAACAC GATGAATAGC GTGATTGAAA AATACATACA CTGCAGTACA GAAATGACCG 2760 + GCAATTCAAA TAGTGTATTA TTCTATAATA ATAGAGGACA CTATCGAGGT AATAATTACC 2820 + GAGGAAATTA CCAAAACAGA GGTAATGGCC GAGGAAATTA TAACTCCTAC AATAACAACT 2880 + ATAGAGGCAG AGGTGGTTAC CATGGTGGAA ACAGAGGACG AGGTGGTAAC CAAAATTATA 2940 + ATAGAGGTGG AGGTTACTCA AGAGGTAACC AAAACCATAA CTATAAAACA AGTCATGCCC 3000 + ACAATGTCCG AAACATACAA TCGGAAAACG AACATACCCC CTTGAGCGAC AATCTACAAT 3060 + AAAATTATAC AAAATTAATC TCAATTTAAG CATTTTTATA CGATTGAAGA ATATGAGTAC 3120 + CAATTCATGG GTAACTCTTT TAATAGATAC AGGTGCAGAA ATTTCCCTGC TTAAATGCAG 3180 + AAACAATAAT CTTAACGATT TAAATCCAAA AAATACAACA AATATATCAG GAATAGGGCA 3240 + AGGGACAATT CAGTCTCTAG GTACACTACA TTTAGAAATG TGTATTGCTA ATGCAGCAAT 3300 + ACCATATGAA TTCCATATCG TACCTAACAA TTTTCCTATA CCAGGGGATG GTATAATTGG 3360 + CTTGGATTTC ATTAAGAAAT ACAATTGTAT TTTGGAATTC CACGACCAAG AAGATTGGTT 3420 + CACTTTGAGG CCCAAAAATT TCAGGAACAT AAACATTCCT ATTATACATA CACTAGATAA 3480 + TGAAATAATT TTGCCAGCTA GATCAGAAGT GATTCGAAAG ATTCAACTAA CATCTACTGA 3540 + CACACATGTT CTCATTCCCA ACCAAGAATT ACAACCTAGC ATAATAATCG CAAGTGCACT 3600 + CGTAAACACT CAGAACGTTT TGATTCGAAT TATTAATACA ACTGAAAAAG ACGCTATAGT 3660 + TAGTAGCGCA AATATAAAAA GCGAATCATT GGATGATTAT GATGTATACA ACGCAAATAT 3720 + AGAAAATAGT GCACAAAGAA CTTCAGAAGT ATTAAAACTT CTTAAATTTC CATCGTTATT 3780 + CAAAAGCGAT TTAACAAAAT TATGCACCGA ATATAGCGAT ATTTTTGGTC TTGAAACAGA 3840 + AACCATATCA GCTAATAATT TTTACAAGCA AAAATTGAGA TTAAATGACA AAACTCCAGT 3900 + CTATATCAAA AACTATAGAA TGCCAGAAAG TCAAAAACCA GAAATTCAAA GGCAAGTTGA 3960 + CAAATTAATA AAAGATGGCA TTGTCGAACA ATCTATTTCA GAATATAATA GCCCTCTTCT 4020 + CTTGGTACCC AAGAAATCAC TGCCTAACTC GGAGGAAAAG AGATGGCGAT TAGTAGTCGA 4080 + TTATCGCCAA ATAAACAAGA AACTGCTAGC AGATAAATTC CCACTTCCAA GAATAGAAGA 4140 + CATTCTTGAT CAATTAGGCC GAGCAAAATA TTTCTCGTGC CTAGACCTGA TGTCAGGATT 4200 + TCATCAAATA GAATTAGACG AAAGGTCAAG AAATATAACA TCTTTCTCAA CTTCAACGGG 4260 + AGCATACCGC TACACGCGAT TACCATTTGG TTTAAAAATA GCCCCAAATT CTTTTCAAAG 4320 + AATGATGACC CTTGCATTTT CAGGTTTAAC GCCTTCGCAA GCATTTCTGT ATATGGATGA 4380 + TTTAGTAGTC ATAGGCTGTT CTGAAAAGCA CATGCTTAAA AATCTAACCG ACGTTTTCAA 4440 + ATTATGTAGG CAACATAATT TAAAATTACA TCCAGAAAAA TGCACTTTCT TTATGAAAGA 4500 + GGTTACTTAT TTAGGTCACA AGTGTACTGA CAAAGGTATA TTGCCAGATG ACTCTAAATA 4560 + TGAGGTAATA AAGAACTACC CCAAACCAGT AAACGCAGAC GAAGCTAGAC GCTTCGTGGC 4620 + ATTTTGCAAT TATTACAGAA GATTTATTAA GAACTTTTCT GAGAAATCAC GCCACTTAAC 4680 + GAGGCTTTGT AAAAAGAATG TTCCATTTGA ATGGACAAGC GAATGCAATG ATGTATTCGA 4740 + ATATCTCAAA AGGAAATTAA TGAAACCAAC ACTCCTTCAG TACCCAGATT TCAGCAAACA 4800 + ATTTTGCATA ACCACAGATG CTAGTAAACA AGCATGTGGA GCGGTACTAT CTCAAGACCA 4860 + TAACGGTCAA CAGCTACCAG TGGCATACGC TTCAAGAAGC TTTACAAAAG GCGAAAGTAA 4920 + TAAGTCCACT ACAGAGCAGG AGCTAGCAGC TATTCACTGG GCAATAAATC ACTTCAGACC 4980 + ATACGTATAT GGTAGACATT TCTTAGTACA AAGTGACCAT AGGCCACTAT CATATCTTTT 5040 + TTCAATGAGA AACCCCAGTT CAAAATTAAC CAGAATGAGA CTAGACTTGG AGGAGTTCGA 5100 + ATTCACAGTA GAATATCTCA AGGGGAAAGA TAATCATGTC GCAGACGCAT TGTTCCGAAT 5160 + AACAATCGGA GAACTTAAAG CAATAAATAG ACAGATACTA AAGGTAACAA CAAGATCAAC 5220 + AACAAGACAG AAAAATACCT GCGCAGGTGA AAAATTGCAT GAACCAAATG AGAAAGAAAA 5280 + TATAAAAATG CCCAATATCT ATCAGGTAAT CAATAACATT GATGCCAAAA AATATGTTAT 5340 + ACTCAAAATA GACAAGCATA AGTGTTTGTT GAAAAGAGGA AAACAAATTA TAACACGTTT 5400 + TGATATGACT AATTTTTATT CTAATGAAAT AATCGATTTA GATCAATTCT TTCAAAGGCT 5460 + TAATGAAGAA GCAAGAATAA ATAGCATCAT TCAAACACAA TTGTCACCAA GTGAACAAAT 5520 + CTTCGAATTT GTCACTATAA AGAACTTTAA AGAAAAGGGC AATAAAATAC TAAAAAATTT 5580 + AAAAATAGCG CTATTAAACA AGGTGACTAA GATAGATAAA AATGATAAGG TTCAAATAAA 5640 + AGCAATACTG TCTAAATATC ATGATGATCC ATCAGAAGGA GGCCATTCAG GAATTTCTAG 5700 + AACCCTGAGG AAAATGAAAA ACTGTTGTTG TTGGCCACGA ATGACGAAGG CGATAAGTGA 5760 + ATATGTTGAA ACATGTTTGA AATGTCAACA AGCCAAGACT ACGAAACATA CTAAAACACC 5820 + GTTGACAATA ACAGAAACGC CAGCAACAGC ATTTGATAAA GTTTTGATAG ATACCATTGG 5880 + TCCACTGCCA AGATCAGAAA ACGGAAATGA GTATGCTGTT ACTATCATTT GCGATTTAAC 5940 + AAAATATTTG GTAACGGTAC CAATTCCAAA TAAAAGTGCA AAATCAGTTG CTAAGGCTAT 6000 + ATTCGAAAAT TTTATTCTAA AGTACGGTCC AATGAAAACA ATCACAACGG ACATGGGAAC 6060 + GGAATATAAA AACCAAATTA TAGACGACCT ATGCAAATAT ATGAAGATAA AAAACATTAC 6120 + TTCAACAGCA CACCATCACC AGACATTAGG AACAGTAGAA CGAAGTCACA GAACTTTCAA 6180 + CGAGTATGTT CGCTCATATA TATCTGTTGA CAAAACCGAT TGGGATATAT GGATACAATA 6240 + TTTTACTTAT TGTTTCAACA CAACACCATC GGTAGTTCAT GAATATTGTC CATATGAATT 6300 + AGTATTTGGA AGATTACCAA GACAGTTCAT AGATTTTAAC AGGATAGACA GAATAGATCC 6360 + TATTTACAAC ATGGATGATT ATTCAAAAGA AGTTAAGCTA CGATTAGAAA TAGCATATAG 6420 + AAGAGCTAAA AATATGTTAG ACAAGGCAAA AGCCGATAGA AAGATAAAAT ATGATAGAAA 6480 + TATTAGTAAC TTTGAATTAA AGATAGGAGA TAAGATATTA CTTAAAAACG AAACGGGTCA 6540 + TAAACTTGAC AATAATTATT TAGGACCATA TTTAGTTTCA GAAATAGGAG ATAATGACAA 6600 + CATTACAATT ATAGGAAATA AAAATAAAAA ACAGATAGTC CATAAAGATA GGTTAAAAAT 6660 + TTTTAATTCA TAATACATTT TGTTTGGTTG GCCAACCACA AATAAAAAAC CACAAATAAA 6720 + AAACCACAAA TAAAAAACCA CAAATAAAAA ACCACAAATA AAAAACCACA AATAAAAAAC 6780 + CACAAATAAA AAACCACAAA TAAAAAACCA CAAATAAAAA ACCACAAATA AAAAAACCAC 6840 + AAATAAAATA AAAACCAATA AAAACATTAT AATACAAAAC TTTTACTTTG CAAAATATAA 6900 + TGAAAATATA TATATTTTTT TTAATATCTC TTTAATCATT CATTTCAAAT ATTAATGTAC 6960 + ATTTAAAAAA AAAAAAAAAA ATATTATATA CTTGAAAATA ACTTCATGTT ATTACGTTAT 7020 + TTTTCAAAAG GAGGGAGATG TAGTATATAC GAATATAATA ACAATAATAA TAACAATAAT 7080 + AATAATAATA TTAATAATAA TTATAATATG AATCATAATA ATAAGTCAAC TAATAAGTAA 7140 + ACTTAGGACC ACCCTAATTC CTTAGGGTCA CCCTAGTAGA TCTTTAGATA CACCCTAATA 7200 + CTAAATATGC GAATTCAGGA TGTACGCCTT TAGGGGTCGG ACTCGACTCC CATTGGTTAT 7260 + CGAGTATGAA CTTCATACAT ACATATTGCA GAATTTGCTA GTGTCAGCAC TTGGCTGTCA 7320 + CAAGAGATCT CCCTGTAGAC CACACTAAGA TCAGTTATAA ATCAGGAATA GATCTGGAAT 7380 + GTACACTCGC TTAATAAAAA CCAAATAAAG ATAAAATGAC CAACTGCGTT TTGAGACTTT 7440 + ATTAACTACA TCAGAAGTAT TAGAATTCAA ATTAACTACA 7480 +// +ID DMMDG3 standard; DNA; INV; 5519 BP. +XX +AC X95908; +XX +DR FLYBASE; FBte0000010; Dmel\mdg3. +XX +FT source X95908:1..5519 +FT SO_feature five_prime_LTR ; SO:0000425:1..267 +FT SO_feature three_prime_LTR ; SO:0000426:5253..5519 +FT SO_feature transcription_start_site ; SO:0000315:178 +FT SO_feature polyA_signal_sequence ; SO:0000551:5253..5519 +FT SO_feature CDS ; SO:0000316:296..4780 +FT /name="Dmel\mdg3\ORF" +FT /db_xref="FLYBASE:FBgn0043882" +FT /db_xref="SPTREMBL:Q94885" +FT /db_xref="NCBI_PROTEIN:CAA65152.1" +FT /translation="MDDKIILNDFSLTTLKDWLRILGQNTEGTKTELIARLQDIPTAVR +FT GDCPPEHPQKNAPPGNDIFSSLDFQNCEINTDHVSVNAMNRKESTETGSERETNMFELQ +FT QLRAELAEAKAMLNGTRSSLQFQEQQQPEQSKATVSSVIQTAQFTQAGATKENTTFHSP +FT QRSNERAESQRFPVDALALAKETITDYDGKTCARAWITVVKNIARTFNIDDNHLRILLI +FT TKLKGNAQVWLHAHPARLIEPIDNLLDQLSLTFGEQSSKAEIRRKFESRKWKTEENFCS +FT YYDEKMALSNGINIDDDELLDQMIEGIPLQNFRTQARIQCFSTPSEMLRAFSNIRLPAR +FT REPPVQPTDYKDAIRCANCNSRGHKADICKKPKREPGSCYACGQLGHLVAQCPTRKSVS +FT SNNYVRWFKINFFENAYKPIISECLIDSGSPISIIKKSLINETMKLALVNTCYFGLNNC +FT ILKTHGQTTCYVLKGSIKIYFRLIIVCDQSMRYNVILGRDFLTACNLNLDPYTLGMIAL +FT RKPMEINKISMFTENDSPEKSLENEIVSPKSLENEIVSSQSLENEIVSPKSLENEIVSP +FT KSFKNATISPKSLENKIVNQQHKETGPISLRDEIVNQQKNVSKSKLSEDEIVNTSKEIV +FT SFKLPKDKNVYEQLNHNFDKEVLRICHVTESELEYKIGENVSNRLQLEFDRLFRNFYIN +FT AKRPNEPTVRSEIQLCLKNPKPFSCSPRRLSYTEKDRLQKLLDEYLENGFIRPSDSEYA +FT SPIVLVKKKTGDLRMCVDFRKLNKMTMKDNYPLPLIDDLLDRMNEKTVFTKLDLKNGFF +FT HVHVKKESIKYTSFVTPLGQYEWLRMPFGLKNAPSVFQRFVNKIFADMIRENKVVVYMD +FT DILLATENINEHLETLKEIFKRLVENKLELRIDKCEFMQSSIKYLGFIINKDGIMPNDK +FT GIEAIKNFPIPNNVHTVQSFLGLCSYFRRFIKDFSRLAKPLHDILKKDKPFKFGSEEMI +FT CFNMLKDKLIQSPVLAIYNHKHETELHCDASSSGFGAVLMQKKEDQKWHPVSFFSKRTT +FT DIESKYHSFELETLAIVYSLRRFRVYLHWRTFKIVTDCNSLILTLSKKELNPRIARWAL +FT EFQGYDFEIVHRAGSRMQHVDALSRCTNIMVIQTNSFEDNLVICQGKDTKLKEIRQLLE +FT NTENKLYEMRNGIVYKKTNENRLLFYVPIEMEEQVLYKYHNELGHVGRDKMIEAIMKNY +FT WFPNLKQKCSTHISNCLKCISFSPKTGKTEGFLHNIPKGNKPFEIIHIDHYGPVDLARP +FT KKHILVIVDAFTKFVRLYATKTTNTKEVIQSLNDYFRAYSRPKCIISDRGACFTSGDFD +FT SFLKECNVKHIKIATGSPQANGQVERINRSLGPMISKLIEPDQGLHWDLVLEKVEYTLN +FT NTLHRSIKQYPSIMLFGLQQKGQIMDELKEKIEEIGETIEERDLESIRNKGEASQKIAQ +FT AYNKEYVDKKRKRSGVFTKGTTSWLKILTQQQA" +XX +CC Derived from X95908 (e990667) (Rel. 49, Last updated, Version 3). +CC Takis Benos and Michael Ashburner, 20-Aug-1997. +CC Any changes to original sequence record are annotated in an FT line. +XX +SQ Sequence 5519 BP; 2078 A; 1005 C; 1029 G; 1407 T; 0 other; + TGTAGTAGGC TGCACCTTCT ACCCTCTTCC TTTACTCTTA GTCATACATA CCTAATTATA 60 + CATAGCCAAT CTAGTCATAA GCTTATACAC TCATACACCC ATCCTTAACA TACAAATATT 120 + ATCGAGAAAC TTATCGACTA ATCGACTCGC CACTCTGCAG AGAGCGCGGC AGTCAGTCGC 180 + TGTTGAACCA AGCTAAAGGA CAGATCAAAA ATAAAAGAGA CACGTGAAAT TGTATTAGAA 240 + TATTAACTTC TGTAAACGGC GGCTAAAATC TCAGAAGTGG GATTAATAAT CCAAAATGGA 300 + CGATAAAATC ATCCTGAACG ACTTTTCGCT GACAACCCTA AAAGATTGGC TACGTATTCT 360 + GGGCCAAAAT ACGGAGGGCA CAAAAACCGA ATTAATCGCG AGGCTGCAAG ACATCCCAAC 420 + GGCAGTTCGG GGCGATTGTC CACCGGAGCA CCCCCAGAAA AACGCTCCAC CAGGAAACGA 480 + CATTTTTTCT TCACTGGATT TTCAGAATTG TGAAATTAAC ACCGATCACG TAAGTGTGAA 540 + TGCGATGAAC AGAAAAGAAT CAACCGAAAC TGGCAGTGAG AGGGAGACAA ACATGTTCGA 600 + GCTACAGCAA CTACGCGCAG AGCTAGCAGA AGCGAAGGCA ATGCTTAACG GAACACGATC 660 + GAGCTTGCAG TTCCAAGAAC AACAACAACC AGAGCAAAGC AAGGCTACAG TTAGTTCCGT 720 + TATCCAGACG GCGCAGTTTA CGCAGGCTGG CGCCACAAAA GAGAACACAA CATTTCACTC 780 + GCCGCAGCGA TCCAACGAGA GAGCGGAGAG CCAGCGTTTT CCAGTTGATG CTCTCGCTCT 840 + CGCCAAAGAG ACGATAACCG ATTACGATGG GAAAACTTGC GCGCGTGCCT GGATAACAGT 900 + GGTCAAAAAT ATCGCACGCA CTTTCAACAT CGATGACAAC CATTTACGCA TCTTACTCAT 960 + CACTAAACTT AAAGGAAACG CGCAAGTCTG GTTACATGCG CACCCTGCTC GATTGATCGA 1020 + ACCAATTGAC AATTTGCTTG ATCAATTGTC ATTGACTTTT GGCGAGCAAT CATCCAAGGC 1080 + TGAGATCCGG CGAAAATTCG AGAGTCGCAA GTGGAAAACC GAGGAGAATT TCTGCAGTTA 1140 + TTACGACGAG AAGATGGCTC TCTCAAACGG GATAAACATC GACGACGACG AACTACTGGA 1200 + CCAGATGATA GAGGGCATAC CGCTACAAAA TTTCCGTACC CAAGCACGGA TTCAATGCTT 1260 + CTCTACTCCA TCGGAGATGC TACGCGCATT TTCGAACATC CGTTTGCCAG CTCGGAGGGA 1320 + GCCACCTGTA CAGCCAACCG ACTACAAAGA TGCCATACGA TGCGCAAACT GTAATTCAAG 1380 + AGGACACAAA GCTGACATCT GCAAGAAGCC CAAACGTGAA CCAGGTTCGT GCTACGCCTG 1440 + TGGACAACTT GGACACCTGG TGGCACAATG TCCCACAAGG AAGAGCGTTT CATCTAATAA 1500 + TTATGTAAGA TGGTTTAAAA TTAATTTTTT TGAAAATGCT TATAAGCCCA TAATTTCAGA 1560 + ATGCCTCATA GACTCTGGCA GTCCTATATC TATCATTAAA AAGTCACTTA TTAACGAGAC 1620 + AATGAAGTTA GCCCTAGTTA ATACTTGCTA TTTTGGTTTA AACAACTGTA TTCTCAAAAC 1680 + ACATGGACAA ACCACATGTT ATGTTTTGAA AGGATCAATA AAAATATATT TTCGTTTAAT 1740 + CATTGTTTGC GACCAGTCTA TGAGGTATAA TGTTATTCTC GGCAGAGATT TTTTAACTGC 1800 + ATGCAATTTA AATTTAGACC CGTACACCTT GGGAATGATT GCGTTGAGAA AACCCATGGA 1860 + AATAAACAAA ATATCAATGT TTACTGAAAA TGATAGTCCT GAGAAATCTT TAGAAAATGA 1920 + AATTGTTAGT CCAAAATCGT TAGAGAATGA AATTGTTAGT TCACAATCGT TAGAAAATGA 1980 + AATTGTTAGC CCCAAATCGT TAGAGAATGA AATTGTTAGT CCAAAATCGT TTAAAAATGC 2040 + AACTATTAGT CCGAAATCGT TAGAAAATAA AATCGTTAAT CAACAGCATA AAGAAACTGG 2100 + TCCAATATCG TTAAGAGATG AAATAGTTAA TCAACAAAAG AATGTCAGTA AATCAAAATT 2160 + ATCAGAAGAT GAAATTGTTA ACACTTCAAA AGAAATCGTT AGTTTTAAAT TGCCAAAAGA 2220 + TAAAAACGTT TACGAACAAT TAAATCACAA CTTTGATAAG GAAGTACTAA GAATATGTCA 2280 + TGTAACTGAA AGTGAGTTAG AATACAAAAT AGGAGAAAAT GTTAGCAATA GGTTACAACT 2340 + AGAATTCGAT AGGTTGTTTA GAAATTTTTA TATAAATGCA AAAAGGCCAA ATGAACCGAC 2400 + AGTTAGAAGT GAAATACAAT TGTGTTTGAA AAACCCGAAA CCGTTTAGCT GTTCTCCTAG 2460 + GAGGCTTTCA TACACAGAAA AAGACAGGTT ACAAAAACTA TTAGACGAAT ATTTGGAAAA 2520 + CGGATTTATA CGACCAAGCG ACTCGGAATA TGCATCGCCT ATTGTTTTAG TGAAAAAGAA 2580 + AACTGGAGAC TTACGTATGT GCGTCGACTT TAGAAAACTT AATAAAATGA CAATGAAAGA 2640 + CAACTATCCT CTACCTCTTA TAGATGACTT GTTAGATAGA ATGAATGAGA AAACTGTTTT 2700 + CACCAAACTC GATCTTAAAA ACGGTTTTTT CCACGTGCAT GTTAAAAAAG AATCAATAAA 2760 + ATACACCTCT TTCGTTACAC CATTAGGCCA ATACGAGTGG CTGCGAATGC CATTTGGCCT 2820 + CAAAAACGCC CCGTCTGTGT TCCAAAGATT TGTTAACAAA ATTTTTGCGG ATATGATTAG 2880 + AGAAAACAAA GTAGTAGTAT ATATGGACGA CATTCTATTG GCAACCGAAA ATATAAACGA 2940 + ACACTTAGAA ACGTTGAAAG AAATTTTTAA AAGATTAGTT GAAAATAAAC TTGAATTAAG 3000 + AATAGACAAA TGTGAGTTTA TGCAATCAAG TATAAAATAT CTTGGGTTCA TAATAAATAA 3060 + AGACGGCATA ATGCCCAATG ACAAAGGAAT CGAGGCAATA AAAAATTTCC CAATACCTAA 3120 + TAATGTTCAT ACAGTACAAA GTTTTTTGGG ATTATGCTCA TATTTTCGAC GGTTTATAAA 3180 + AGATTTTTCT AGACTAGCTA AACCATTGCA TGACATTCTA AAAAAAGATA AACCGTTCAA 3240 + ATTTGGTAGT GAAGAAATGA TTTGTTTTAA TATGTTAAAA GATAAATTAA TACAGTCACC 3300 + GGTCTTAGCT ATATACAACC ATAAACACGA AACAGAATTG CATTGTGATG CAAGTTCTTC 3360 + TGGATTCGGT GCTGTACTTA TGCAAAAGAA GGAGGACCAG AAATGGCACC CAGTTTCATT 3420 + CTTTTCAAAA CGGACAACAG ATATTGAATC AAAATACCAC AGTTTCGAGT TAGAAACTTT 3480 + AGCCATTGTT TATTCGTTAC GTAGATTTAG AGTTTATCTT CATTGGAGGA CATTTAAAAT 3540 + AGTCACCGAC TGCAACTCAT TAATTTTGAC CCTAAGCAAA AAAGAGCTAA ACCCTAGGAT 3600 + AGCCAGGTGG GCTTTAGAAT TCCAAGGTTA TGATTTTGAA ATTGTGCATA GGGCAGGTAG 3660 + CCGCATGCAA CATGTTGACG CACTGAGTAG GTGTACAAAT ATTATGGTAA TACAAACAAA 3720 + CAGTTTCGAA GATAATCTAG TTATATGTCA AGGGAAAGAT ACAAAATTAA AAGAAATCAG 3780 + GCAATTGTTA GAAAACACAG AAAATAAATT GTATGAGATG AGAAATGGTA TAGTTTACAA 3840 + AAAGACAAAT GAAAATAGAT TGCTGTTCTA CGTTCCGATA GAAATGGAAG AACAAGTGTT 3900 + ATACAAATAT CACAACGAAC TTGGACACGT AGGAAGAGAC AAAATGATAG AAGCTATAAT 3960 + GAAAAACTAT TGGTTTCCAA ATTTAAAACA GAAGTGTAGC ACACATATCA GCAACTGTTT 4020 + AAAATGTATT TCATTCAGTC CCAAAACAGG AAAAACAGAA GGATTTCTAC ACAACATACC 4080 + TAAGGGAAAC AAACCTTTTG AAATAATCCA TATTGACCAT TATGGTCCAG TAGACTTGGC 4140 + TAGACCGAAG AAACATATTC TAGTGATAGT AGATGCATTC ACAAAGTTTG TCAGACTATA 4200 + CGCAACAAAA ACTACGAACA CAAAAGAAGT CATACAATCG TTAAATGACT ACTTCAGAGC 4260 + ATACAGTAGG CCTAAGTGTA TCATATCAGA TAGAGGAGCA TGTTTCACGT CTGGCGATTT 4320 + TGACTCATTT TTGAAAGAAT GCAATGTTAA ACACATAAAA ATTGCAACAG GATCGCCACA 4380 + AGCCAACGGT CAAGTTGAAC GTATAAACCG AAGTCTTGGT CCAATGATTA GCAAGTTAAT 4440 + TGAACCTGAT CAAGGTCTAC ACTGGGACTT AGTCTTAGAA AAGGTCGAAT ATACCCTGAA 4500 + CAATACACTA CACCGCAGCA TTAAACAGTA TCCTAGCATA ATGTTATTTG GGTTACAACA 4560 + AAAAGGACAA ATTATGGATG AGTTAAAAGA AAAAATTGAG GAAATTGGAG AAACGATTGA 4620 + AGAAAGAGAT TTAGAAAGTA TTAGAAATAA AGGCGAGGCA AGTCAGAAAA TAGCACAAGC 4680 + ATACAATAAA GAATATGTTG ACAAAAAACG AAAACGATCA GGAGTGTTCA CAAAAGGCAC 4740 + TACGTCATGG TTAAAAATTT TGACTCAACA ACAGGCATAG CTAAGAAGTT AATTCCAAAG 4800 + CATAAAGGAC CCTATGTCAT AAGCAAAGTT CTCAAAAATG ATCGCTTCCT TCTGGAAGAT 4860 + GTTGATGGAT TTCAAATTTC TCGCAATCCT TACCGGGGTG TATGGAGCAT ACAGAATATA 4920 + AAACACTGGC AAAGAAAAAT TAAGAGTCTA CAAAATAGAA AGTATAATTT GAGAAACTCT 4980 + GTACAAAATA GAAAGTATAA TTTGAGAAAC TCTGTACAAA ATAGAAAGTA TAATTTAAGA 5040 + AACTCTGTAC GAAATCGAAA GTATAATTTA AGAAGCAATT GTAAAACAAA GAAAACAAAC 5100 + AAGAAGAAAA GAAAACCAAA AAAATGTTTA AGACCGTTCA AAAGTATCTC CACTAAGAAG 5160 + AATAAAATAA GAAACAGGAC CCTTAGCTTT AAGAAACGTT AATTGTTATA AAATCCTACG 5220 + ATCGGGAGAT CTAGTTGTCA GGACGGCCGA GTTGTAGTAG GCTGCTCCTT CTACCCTCTT 5280 + CCTTTACTCT TAGTCATACA TACCTAATTA TACATAGCCA ATCTAGTCAT AAGCTTATAC 5340 + ACTCATACAC CCATCCTTAA CATACAAATA TTATCGAGAA ACTTATCGAC TAATCGACTC 5400 + GCCACTCTGC AGAGAGCGCG GCAGTCAGTC GCTGTTGAAC CAAGCTAAAG GACAGATCAA 5460 + AAATAAAAGA GACACGTGAA ATTGTATTAG AATATTAACT TCTGTAAACG GCGGCTAAA 5519 +// +ID DMDM11 standard; DNA; INV; 5461 BP. +XX +AC X14037; +AC X15066; +XX +DR FLYBASE; FBte0000042; Dmel\micropia. +XX +FT source join(X14037:5..3664,X15066:3534..3593,X14037:3721..5461) +FT SO_feature five_prime_LTR ; SO:0000425:1..476 +FT SO_feature three_prime_LTR ; SO:0000426:4957..5461 +FT SO_feature primer_binding_site ; SO:0005850:477..489 +FT /bound_moiety="tRNA-leu" +FT SO_feature primer_binding_site ; SO:0005850:4939..4956 +FT SO_feature CDS ; SO:0000316:540..4415 +FT /name="Dmel\micropia\polyprotein" +FT /db_xref="FLYBASE:FBgn0043876" +FT /translation=" +FT MQNRNLAELVKIMQKTPAREQQPSYDVKLPKFNPDAACVEAAKWCSTTDI +FT ILTEHPLKGSKLITALSNCMEGTASQWLTQISYQGMTWQEFQELFLQRFE +FT TEETPAATFLNLLNSRPTAAECYAVYASRLVTQLTTKWRNMEIEEIAVTT +FT VLAHMANIDSRLQRVLFTSNVRTRSKLQAELKAFTFDKKRHARDDNLGPD +FT QKNRKASPVVCHFCSKPGRRIAECRSKMRQDRRAKPQREKSNVTCYRCGQ +FT PGHFSNQCPKNGTAAKQDVTQQKTVNQCCVTEPKGSLHQRGEIYPICFDS +FT GAECSLIKDDISSKLSGKRINNTVMIKGIGGGSVCSTLQILSEVTINENI +FT MEILFHVVPNEEMRNDILIGREILKQGFYVILTSDNFKVVKSKTVNNCSV +FT TERSFTLSDIDTELVDNEKAQLIELLEKHSTSFTNGIPHTRVNTGEMKIR +FT LIDPTKTVQRRPYRLSPEEREVVRMQVSELIRCNIVRPSCSPFASPMLLV +FT KKKNGTDRLCVDFRELNSNTISDKYPLPLISDQIARLRGANYFTCLDMAS +FT GFHQIPIHPESVEYTAFVPDGLKNAPSVFQRTVINALGDLANSFVIVYMD +FT DIMVVSPTKELALERLKTVLNVLTKAGFTFNLAKCSFLKTTVQYLGYEVR +FT AGEIRPNVRKIASLSSLPPPQTVSGVRQFIGLASYFRKFVSGFSQLMKPL +FT YSLSSGSGKITWSAELEEIRLKVVTILTNEPALVIFDPQYPIELHTDASA +FT CGYGAILLHRIESKPHVIEYFSKTTTSVESRYHSYELETLAVVKAVKHFR +FT HYLIGREFVVYTDCNSLKASRTKIDLTPRVHRWWAYLQSFNFEIQYREGK +FT RMAHVDFLSRNPLSPEHILSINKIPEKRVNLSEISSTWLLAEQRLDLEII +FT EIVNKLESDELAENLAKTYDLRKGVLYRKVQRRGRTSYLPVVPRAFKWSV +FT INQVHESIMHLGWQKTLDKVYQYYWFAKMNKYVRKFVSNCITCRSVKSSS +FT GKVQAELHSIPKTSIPWHTIHIDITGKLSGKSDLKEYVIVQIDAYTKFVY +FT LYHTLKIDAESCVNAMKSSISLFGVPDRIIADQGRCFTSSKFSEFCVSQK +FT VELHLIATGMSRANGQVERVMETLKNLLSVVESSQRSWQDALGEVQLALN +FT CTISRATDASPLEMLIGKQARPLGLVPPCETECEIDLATVRAHATENMNS +FT LASYDKSRFDSSRAAVDKHHVGDYVLLRNEERHQTKLDPKFRGPFLVTEV +FT LEGDRYTLKSLTSNRSFKYCHESIKMPDAEIPNELNENVEQ" +XX +CC Sequence assembled by Lynn Crosby (FlyBase), 'micropia.v006'. +CC Any changes to original sequence record are annotated in an FT line. +XX +SQ Sequence 5461 BP; 1679 A; 1051 C; 1264 G; 1467 T; 0 other; + TGTCGTGGCG AAAATAATGA GTATGCGTGT AGTCGCTGTT TACTTCTTCT CCATGTTCCC 60 + TTTGCTATTA TGCGTGTTCC TATTTATGAA CACGTGGCGA AAATAATAAA TGCGTGTAGT 120 + CGCCGTTTAC TTCTTCTCCA TGTTCCCTTT GCTATTATGC GTGTTCCTAT TTATTGTCAA 180 + TGTGTGAGGA TGAATAGATG AATTATCTAT GAACGGGATT TTGCAAAAAC GACTTGCGCT 240 + GCTTGGTTAG AAAGGGAAAA CTATATAATG AAAAGGGAAT GCCAAAAATT GAGAAGAGAC 300 + AAAGCAGGCT GCACGAAGCT GGAGTGAGGG CATTAATCGT GGAGAAGCCA AAGCAGACGC 360 + AAGTGGACTC GTTGACTGCG CACAGCTGCA TAAAATTATA TAGTAAAAAG AGATTTGAGC 420 + GACGCTGATA TGGACGGACG GACGGACGCG AGGCCCCTGA TATTCTTAAC CCGACATCAG 480 + AAGTGGGATC TGTGCCACAC CCTGCATTTT CTGAGGATCA GTGGCGTGCA GTAGTGGAAA 540 + TGCAAAATCG GAATTTGGCT GAACTTGTAA AAATCATGCA AAAGACGCCG GCACGTGAGC 600 + AGCAACCTAG TTATGATGTT AAGCTACCCA AATTTAACCC TGATGCTGCA TGCGTAGAGG 660 + CAGCAAAGTG GTGTTCAACA ACCGATATAA TTCTAACTGA GCACCCCCTT AAAGGAAGTA 720 + AATTGATCAC GGCACTAAGT AACTGCATGG AGGGAACTGC ATCTCAGTGG CTAACACAAA 780 + TCTCGTACCA GGGTATGACT TGGCAAGAGT TCCAGGAATT ATTTCTGCAG CGCTTTGAAA 840 + CCGAAGAGAC GCCGGCCGCT ACGTTTTTAA ATTTACTCAA CAGCCGCCCG ACTGCCGCCG 900 + AATGTTACGC GGTGTATGCG AGTCGGCTGG TGACGCAGCT GACTACAAAG TGGCGGAATA 960 + TGGAAATAGA AGAAATTGCC GTTACAACTG TTCTTGCGCA TATGGCAAAC ATTGACAGTC 1020 + GTTTGCAGCG CGTCCTCTTC ACATCCAATG TGCGTACCAG AAGTAAGCTA CAGGCGGAGT 1080 + TAAAAGCGTT TACGTTCGAC AAGAAGCGAC ATGCTCGAGA TGACAACCTT GGACCTGACC 1140 + AGAAGAACCG TAAGGCATCG CCAGTTGTAT GCCACTTCTG TTCAAAGCCG GGACGTCGAA 1200 + TTGCTGAATG CCGAAGTAAA ATGCGACAAG ATAGACGGGC GAAACCGCAG CGTGAAAAAT 1260 + CAAATGTTAC GTGCTATCGG TGCGGCCAAC CGGGACATTT CTCCAACCAG TGCCCGAAAA 1320 + ACGGAACTGC AGCCAAACAA GATGTGACTC AACAGAAGAC TGTTAACCAA TGTTGTGTGA 1380 + CTGAGCCAAA GGGAAGCTTG CATCAACGAG GTGAGATCTA TCCAATTTGT TTCGATTCCG 1440 + GTGCAGAGTG CTCCCTTATT AAAGACGACA TTAGCAGTAA GTTATCTGGT AAACGTATAA 1500 + ACAATACTGT AATGATAAAA GGCATTGGTG GTGGCAGTGT GTGCAGTACA TTGCAAATCT 1560 + TGAGTGAAGT CACTATAAAC GAAAATATTA TGGAAATATT ATTTCATGTA GTCCCGAACG 1620 + AGGAAATGAG GAATGATATT CTGATAGGGC GAGAAATACT TAAACAAGGC TTTTATGTAA 1680 + TTTTGACATC CGATAATTTT AAAGTTGTAA AATCAAAAAC TGTTAATAAT TGTTCCGTTA 1740 + CTGAGCGATC GTTTACTTTG TCCGATATTG ACACCGAATT AGTCGACAAT GAGAAAGCTC 1800 + AATTAATTGA GTTACTTGAA AAGCACTCGA CTTCATTTAC CAACGGGATA CCTCATACTC 1860 + GAGTAAATAC AGGCGAAATG AAAATCCGTT TGATTGATCC AACTAAAACT GTTCAGCGCC 1920 + GACCTTACAG ACTTAGCCCC GAAGAGAGAG AAGTAGTGCG AATGCAGGTG AGCGAATTGA 1980 + TAAGATGTAA TATTGTTCGC CCAAGTTGCT CTCCCTTTGC TAGCCCCATG TTGCTCGTCA 2040 + AAAAGAAGAA CGGAACCGAC CGTCTATGTG TTGATTTTAG AGAGCTAAAC TCGAACACGA 2100 + TTTCGGATAA ATACCCCTTG CCGCTTATCA GCGATCAAAT TGCTAGACTT CGCGGAGCAA 2160 + ATTATTTCAC ATGCCTGGAT ATGGCAAGTG GTTTCCACCA AATCCCGATT CACCCTGAAT 2220 + CCGTGGAATA TACTGCATTT GTGCCCGACG GCCTCAAAAA TGCGCCATCT GTTTTCCAGC 2280 + GCACAGTCAT AAATGCACTT GGTGACCTTG CTAACTCTTT TGTAATCGTT TACATGGACG 2340 + ACATAATGGT AGTATCGCCA ACCAAGGAAT TGGCTTTGGA AAGGTTAAAA ACTGTTTTGA 2400 + ATGTTCTTAC AAAGGCTGGT TTTACCTTTA ACCTTGCTAA ATGCAGTTTT CTCAAAACAA 2460 + CGGTTCAGTA TTTAGGCTAT GAAGTGCGAG CGGGAGAAAT TCGTCCGAAT GTGCGAAAGA 2520 + TAGCTTCTTT AAGCTCCTTG CCTCCTCCTC AAACTGTCTC CGGCGTTAGA CAATTCATTG 2580 + GCTTGGCCTC TTACTTTCGC AAATTCGTGT CTGGATTCTC CCAACTTATG AAACCATTGT 2640 + ATTCACTTTC GTCTGGTAGC GGCAAGATTA CATGGAGCGC TGAGCTGGAA GAGATCAGAC 2700 + TTAAAGTTGT GACGATCCTC ACAAATGAGC CTGCTCTGGT AATCTTCGAC CCGCAATATC 2760 + CTATTGAGTT GCACACTGAT GCAAGTGCCT GTGGATATGG AGCGATACTT TTGCACCGTA 2820 + TAGAAAGTAA GCCCCATGTA ATCGAATACT TCAGCAAAAC AACTACCTCT GTTGAATCTA 2880 + GATATCACTC CTACGAGCTG GAAACCTTGG CAGTGGTAAA AGCCGTTAAA CATTTTCGCC 2940 + ATTACCTAAT TGGCCGTGAG TTCGTTGTCT ATACAGACTG CAATTCATTA AAAGCTTCTC 3000 + GCACAAAAAT AGATTTAACC CCCAGAGTTC ACCGCTGGTG GGCCTACTTA CAATCGTTTA 3060 + ATTTCGAAAT TCAGTATAGA GAGGGTAAGC GTATGGCTCA TGTGGATTTC CTATCAAGAA 3120 + ATCCTTTATC ACCCGAACAC ATTTTGTCAA TAAACAAGAT TCCCGAAAAA CGAGTAAATC 3180 + TGTCTGAAAT TTCAAGTACT TGGCTTCTTG CTGAGCAACG GTTAGACCTT GAGATAATAG 3240 + AAATTGTTAA CAAATTGGAG TCAGATGAAT TAGCCGAAAA CTTGGCCAAA ACGTATGATT 3300 + TGCGAAAAGG TGTATTATAT CGCAAGGTCC AAAGACGAGG TAGAACAAGT TATTTACCAG 3360 + TTGTACCCAG AGCTTTCAAA TGGTCAGTAA TTAACCAGGT ACACGAGTCG ATAATGCATT 3420 + TAGGGTGGCA AAAGACACTT GATAAAGTGT ACCAGTATTA TTGGTTCGCT AAAATGAACA 3480 + AGTATGTTCG AAAATTTGTT TCAAACTGCA TAACTTGTAG ATCAGTGAAA TCATCTTCCG 3540 + GGAAGGTTCA GGCGGAACTT CATTCCATTC CGAAGACAAG TATACCGTGG CACACCATCC 3600 + ACATAGATAT AACGGGGAAA TTAAGTGGCA AGAGCGATTT GAAGGAGTAT GTCATTGTTC 3660 + AGATCGATGC CTATACAAAG TTTGTTTATC TGTATCACAC CTTAAAGATA GATGCCGAAA 3720 + GCTGTGTTAA TGCTATGAAA TCTTCCATAT CCTTATTTGG AGTACCAGAT CGCATTATCG 3780 + CCGACCAGGG CAGATGTTTT ACTAGCTCTA AGTTTTCAGA GTTTTGCGTA TCGCAGAAAG 3840 + TTGAACTTCA CTTGATTGCT ACGGGAATGA GCCGTGCAAA TGGGCAAGTG GAACGGGTGA 3900 + TGGAAACACT GAAAAATTTG TTGTCAGTGG TAGAATCAAG TCAACGATCG TGGCAGGACG 3960 + CACTTGGCGA AGTCCAACTT GCACTGAATT GTACAATTTC TCGTGCCACT GATGCAAGTC 4020 + CGTTAGAAAT GTTAATTGGT AAACAGGCTC GACCCCTTGG ATTAGTTCCC CCATGTGAGA 4080 + CCGAATGTGA AATAGATTTG GCAACTGTTA GAGCTCATGC GACAGAAAAT ATGAATTCCT 4140 + TAGCGTCTTA CGACAAATCC CGATTTGATA GCAGTAGAGC AGCCGTTGAC AAACACCACG 4200 + TAGGTGACTA TGTGCTATTG AGGAATGAAG AAAGACACCA AACTAAGTTA GATCCGAAAT 4260 + TCAGAGGACC GTTTTTGGTA ACTGAAGTAT TAGAGGGTGA CAGGTATACA CTAAAGTCGT 4320 + TGACGAGTAA CCGATCGTTC AAGTATTGCC ATGAATCAAT CAAAATGCCG GATGCAGAAA 4380 + TCCCGAATGA GTTAAACGAG AATGTAGAGC AATAGCTGAA ATATAGAAAC AGTTGAATGA 4440 + AAAGAAAAGC CCGCCAATGA GTTCTTTTGT GAACGAGAGA TATCCGTCTA GGTGAGACGA 4500 + TGAATTGTGA GTTATCCGTC TAGGTGAGAC GATGAATTGT GAGTTATCCG TCTAGGTGAG 4560 + ACGATGAATT GTCAGTTATC CGTCAGGTGA GACGATGAAT TGTGAGTTAT CCGTCCAGGA 4620 + GAGACGATGA GTTTGGATTG AATTAATAAT CAAGTGTGTG TGAACTGGCG GAAGATCGAT 4680 + ATATAGAAAT CGATAAATGA TAATGTTAAG ATAAGTTGTG AGCTGATGTA TTACTGATCA 4740 + ATGGAACTGA ATATGAAAAT AGAATAAGTT ATCCCAGCAA CAGTGAAATA AGAGCTGTTT 4800 + TGTTTCTTCA CAGAATTAAG ATTTAAGAAA TACACCTGAT AAAGTCAAAC TAATGAAATT 4860 + AAATGTTATT GAATAGTGAT GAAAGTAGGT GATCTTGATA TCTTGGTATC TCGGTATCAA 4920 + AAGCTTACAC GAGGACGTGA AATGTCAGAA TGGCCGTGTC GTGGCGAAAA TAATGAGTAT 4980 + GCGTGTAGTC GCTGTTTACT TCTTCTCCAT GTTCCCTTTG CTATTATGCG TGTTCCTATT 5040 + TATGAACACG TGGCGAAAAT AATGAATGCG CGTAGTCCGG TTTACTTCTT CTCCATGTTC 5100 + CCTTTGCTAT TATGCGTGTT CCTATTTATT GTCAATGTGT GAGGATGAAT AGATGAATTA 5160 + TCTATGAACG GGATTTTGCA AAAACGAGAG CGATAGAGCT GTTGCTGAAC GTGGCCACTT 5220 + GCGCTGCTTG GTTAGAAAGG GAAAACTATA TAATGAAAAG GGAATGCCAA AAATTGAGAA 5280 + GAGACAAAGC AGGCTGCACG AAACTGGAGT GAGGGCATTA ATCGTGGAGA AGCCAAAGCA 5340 + GACGCAAGTG GACTCGTTGA CTGCGCACAG CTGCATAAAA TTATATAGTA AAAAGAGATT 5400 + TGAGCGACGC TGATATGGAC GGACGGACGG ACGCGAGGCC CCTGATATTC TTAACCCGAC 5460 + A 5461 +// +ID PPI251 standard; DNA; SYN; 2907 BP. +XX +AC X06779; V01520; X69493; +XX +DR FLYBASE; FBte0000037; Dmel\P-element. +XX +FT source X06779:996..3902 +FT SO_feature terminal_inverted_repeat ; SO:0000481:1..31 +FT SO_feature terminal_inverted_repeat ; SO:0000481:2877..2907 +FT SO_feature CDS ; SO:0000316:join(153..442,501..1168,1222..1947,2138..2709) +FT /name="Dmel\P\T" +FT /db_xref="FLYBASE:FBgn0013311" +FT /translation=" +FT MKYCKFCCKAVTGVKLIHVPKCAIKRKLWEQSLGCSLGENSQICDTHFND +FT SQWKAAPAKGQTFKRRRLNADAVPSKVIEPEPEKIKEGYTSGSTQTESCS +FT LFNENKSLREKIRTLEYEMRRLEQQLRESQQLEESLRKIFTDTQIRILKN +FT GGQRATFNSDDISTAICLHTAGPRAYNHLYKKGFPLPSRTTLYRWLSDVD +FT IKRGCLDVVIDLMDSDGVDDADKLCVLAFDEMKVAAAFEYDSSADIVYEP +FT SDYVQLAIVRGLKKSWKQPVFFDFNTRMDPDTLNNILRKLHRKGYLVVAI +FT VSDLGTGNQKLWTELGISESKTWFSHPADDHLKIFVFSDTPHLIKLVRNH +FT YVDSGLTINGKKLTKKTIQEALHLCNKSDLSILFKINENHINVRSLAKQK +FT VKLATQLFSNTTASSIRRCYSLGYDIENATETADFFKLMNDWFDIFNSKL +FT STSNCIECSQPYGKQLDIQNDILNRMSEIMRTGILDKPKRLPFQKGIIVN +FT NASLDGLYKYLQENFSMQYILTSRLNQDIVEHFFGSMRSRGGQFDHPTPL +FT QFKYRLRKYIIARNTEMLRNSGNIEEDNSESWLNLDFSSKENENKSKDDE +FT PVDDEPVDEMLSNIDFTEMDELTEDAMEYIAGYVIKKLRISDKVKENLTF +FT TYVDEVSHGGLIKPSEKFQEKLKELECIFLHYTNNNNFEITNNVKEKLIL +FT AARNVDVDKQVKSFYFKIRIYFRIKYFNKKIEIKNQKQKLIGNSKLLKIK +FT L" +FT SO_feature CDS ; SO:0000316:join(153..442,501..1168,1222..1994) +FT /db_xref="FLYBASE:FBgnXXXXXXX" +FT /translation=" +FT MKYCKFCCKAVTGVKLIHVPKCAIKRKLWEQSLGCSLGENSQICDTHFND +FT SQWKAAPAKGQTFKRRRLNADAVPSKVIEPEPEKIKEGYTSGSTQTESCS +FT LFNENKSLREKIRTLEYEMRRLEQQLRESQQLEESLRKIFTDTQIRILKN +FT GGQRATFNSDDISTAICLHTAGPRAYNHLYKKGFPLPSRTTLYRWLSDVD +FT IKRGCLDVVIDLMDSDGVDDADKLCVLAFDEMKVAAAFEYDSSADIVYEP +FT SDYVQLAIVRGLKKSWKQPVFFDFNTRMDPDTLNNILRKLHRKGYLVVAI +FT VSDLGTGNQKLWTELGISESKTWFSHPADDHLKIFVFSDTPHLIKLVRNH +FT YVDSGLTINGKKLTKKTIQEALHLCNKSDLSILFKINENHINVRSLAKQK +FT VKLATQLFSNTTASSIRRCYSLGYDIENATETADFFKLMNDWFDIFNSKL +FT STSNCIECSQPYGKQLDIQNDILNRMSEIMRTGILDKPKRLPFQKGIIVN +FT NASLDGLYKYLQENFSMQYILTSRLNQDIVEHFFGSMRSRGGQFDHPTPL +FT QFKYRLRKYIIGMTNLKECVNKNVIP" +FT SO_feature intron ; SO:0000188:443..500 +FT SO_feature intron ; SO:0000188:1169..1221 +FT SO_feature intron ; SO:0000188:1948..2137 +XX +CC Derived from X06779 (g58305) (Rel. 49, Last updated, Version 8). +CC Takis Benos and Michael Ashburner, 20-Aug-1997. +CC Any changes to original sequence record are annotated in an FT line. +CC CDS annotation from Lynn Crosby's annotation 'P-element.v010'. +XX +SQ Sequence 2907 BP; 989 A; 491 C; 582 G; 845 T; 0 other; + CATGATGAAA TAACATAAGG TGGTCCCGTC GAAAGCCGAA GCTTACCGAA GTATACACTT 60 + AAATTCAGTG CACGTTTGCT TGTTGAGAGG AAAGGTTGTG TGCGGACGAA TTTTTTTTTG 120 + AAAACATTAA CCCTTACGTG GAATAAAAAA AAATGAAATA TTGCAAATTT TGCTGCAAAG 180 + CTGTGACTGG AGTAAAATTA ATTCACGTGC CGAAGTGTGC TATTAAGAGA AAATTGTGGG 240 + AGCAGAGCCT TGGGTGCAGC CTTGGTGAAA ACTCCCAAAT TTGTGATACC CACTTTAATG 300 + ATTCGCAGTG GAAGGCTGCA CCTGCAAAAG GTCAGACATT TAAAAGGAGG CGACTCAACG 360 + CAGATGCCGT ACCTAGTAAA GTGATAGAGC CTGAACCAGA AAAGATAAAA GAAGGCTATA 420 + CCAGTGGGAG TACACAAACA GAGTAAGTTT GAATAGTAAA AAAAATCATT TATGTAAACA 480 + ATAACGTGAC TGTGCGTTAG GTCCTGTTCA TTGTTTAATG AAAATAAGAG CTTGAGGGAA 540 + AAAATTCGTA CTTTGGAGTA CGAAATGCGT CGTTTAGAGC AGCAGCTGAG GGAGTCTCAA 600 + CAGTTGGAGG AGTCTCTACG CAAAATCTTC ACGGACACGC AGATACGGAT ACTGAAGAAT 660 + GGTGGACAAA GAGCTACGTT CAATTCCGAC GACATTTCTA CAGCTATTTG TCTCCACACC 720 + GCAGGCCCTC GAGCGTATAA CCATCTGTAC AAAAAAGGAT TTCCTTTGCC CAGTCGTACG 780 + ACTTTGTACA GATGGTTATC AGATGTGGAC ATAAAAAGAG GATGTTTGGA TGTGGTCATA 840 + GACCTAATGG ACAGTGATGG AGTTGATGAC GCCGACAAGC TTTGCGTACT CGCTTTCGAC 900 + GAGATGAAGG TCGCTGCTGC CTTCGAGTAT GACAGCTCTG CTGATATTGT TTACGAGCCA 960 + AGCGACTATG TCCAACTGGC TATTGTTCGT GGTCTAAAAA AATCGTGGAA GCAGCCAGTT 1020 + TTTTTCGATT TTAATACCCG AATGGACCCG GATACTCTTA ACAATATATT AAGGAAACTG 1080 + CATAGGAAAG GATATTTAGT AGTTGCTATT GTATCCGATT TAGGTACCGG AAACCAAAAG 1140 + CTATGGACAG AGCTCGGTAT ATCAGAATGT AAGTTTCGTA TATTACAAAA ATCAGATAAT 1200 + CCTTGAAATT CCATTTTTTA GCAAAAACCT GGTTTAGCCA TCCTGCAGAT GACCATTTAA 1260 + AGATTTTCGT TTTTTCGGAT ACGCCACATT TAATTAAGTT AGTCCGTAAC CACTATGTGG 1320 + ATTCCGGATT AACAATAAAT GGGAAAAAAT TAACAAAAAA AACAATTCAG GAGGCACTTC 1380 + ATCTTTGCAA CAAGTCCGAT CTGTCTATCC TCTTTAAAAT TAATGAAAAT CACATTAATG 1440 + TTCGATCGCT CGCAAAACAG AAGGTTAAAT TGGCTACCCA GCTGTTTTCG AATACCACCG 1500 + CTAGCTCGAT CAGACGCTGC TATTCATTGG GGTATGACAT TGAAAATGCC ACCGAAACTG 1560 + CGGACTTCTT CAAATTGATG AATGATTGGT TCGACATTTT TAATTCTAAA TTGTCCACAT 1620 + CCAATTGCAT TGAGTGCTCG CAACCTTATG GCAAGCAGTT GGATATACAG AATGATATTT 1680 + TGAATCGAAT GTCGGAAATT ATGCGAACAG GAATTCTGGA TAAACCCAAA AGGCTCCCAT 1740 + TTCAAAAAGG TATCATTGTG AATAATGCTT CGCTTGATGG CTTGTATAAA TATTTGCAAG 1800 + AAAACTTCAG TATGCAATAC ATATTAACAA GCCGTCTCAA CCAAGACATT GTGGAGCATT 1860 + TTTTTGGCAG CATGCGATCG AGAGGTGGAC AATTCGACCA TCCCACTCCA CTGCAGTTTA 1920 + AGTATAGGTT AAGAAAATAT ATAATAGGTA TGACAAATTT AAAAGAATGC GTAAACAAAA 1980 + ATGTAATTCC ATGATTTATA ATTGTTTAAT GTTTAGCTAT ATGTTTCAGG AAAGTTTCAG 2040 + TTGAGAATGT AGGTAGTTAT GTGCTGTCTA TTGTGTTTTG TCTTTTATCT GTTTCTTTTC 2100 + ATTTTATTAT TTAATCATTA TCCTTTTGCT TATCCAGCCA GGAATACAGA AATGTTAAGA 2160 + AATTCGGGAA ATATCGAAGA GGACAACTCT GAAAGCTGGC TTAATTTAGA TTTCAGTTCT 2220 + AAAGAAAACG AAAATAAAAG TAAAGATGAT GAGCCTGTCG ATGATGAGCC TGTCGATGAG 2280 + ATGTTAAGCA ATATAGATTT CACCGAAATG GATGAGTTGA CGGAGGATGC GATGGAATAT 2340 + ATCGCGGGCT ATGTCATTAA AAAATTGAGA ATCAGTGACA AAGTAAAAGA AAATTTGACA 2400 + TTTACATACG TCGACGAGGT GTCTCACGGC GGACTTATTA AGCCGTCCGA AAAATTTCAA 2460 + GAGAAGTTAA AAGAGCTAGA ATGTATTTTT TTGCATTATA CAAATAATAA TAATTTTGAA 2520 + ATTACAAATA ATGTAAAGGA AAAATTAATA TTAGCAGCGC GAAACGTCGA TGTTGATAAA 2580 + CAAGTAAAAT CTTTTTATTT TAAAATTAGA ATATATTTTA GAATTAAGTA CTTCAACAAA 2640 + AAAATTGAAA TTAAAAATCA AAAACAAAAG TTAATTGGAA ACTCCAAATT ATTAAAAATA 2700 + AAACTTTAAA AATAATTTCG TCTAATTAAT ATTATGAGTT AATTCAAACC CCACGGACAT 2760 + GCTAAGGGTT AATCAACAAT CATATCGCTG TCTCACTCAG ACTCAATACG ACACTCAGAA 2820 + TACTATTCCT TTCACTCGCA CTTATTGCAA GCATACGTTA AGTGGATGTC TCTTGCCGAC 2880 + GGGACCACCT TATGTTATTT CATCATG 2907 +// +ID DMPOGOR11 standard; DNA; INV; 2121 BP. +XX +AC X59837; S90749; +XX +DR FLYBASE; FBte0000568; Dmel\pogo. +XX +FT source X59837:1..2121 +FT SO_feature terminal_inverted_repeat ; SO:0000481:1..21 +FT SO_feature terminal_inverted_repeat ; SO:0000481:2101..2121 +FT SO_feature intron ; SO:0000188:1438..1541 +XX +CC Derived from X59837 (g8354) (Rel. 45, Last updated, Version 10). +CC Takis Benos and Michael Ashburner, 20-Aug-1997. +CC Any changes to original sequence record are annotated in an FT line. +CC K. O'Hare, Personal communication to FlyBase, 1 May 2000. +CC This is probably complete element. +XX +SQ Sequence 2121 BP; 724 A; 353 C; 399 G; 645 T; 0 other; + CAGTATAATT CGCTTAGCTG CATCGATAGT TAGCTGCATC GGCAAGATAT CTGCATTATT 60 + TTTCCATTTT TTTGTGTGAA TAGAAAATTT GTACGAAAAT TCATACGTTT GCTGCATCGC 120 + AGATAACAGC CTTTTTAACT TAAGTGCATC ATATCAGCTG TTTTTTTTGC CAATTTCAAT 180 + GAATATCATC AAAGTTAGCT GCGCCATCTA TGAATCATTT TTGCATATCT AAAAGATGCA 240 + AGAATGCCAA CTCGTTTCAG TATCTGCGCA TGTCCGTTTT TGTTTTTGCT TTGATCGTGA 300 + TTTTTGTGTT TTTGTTTCTT ATGGCACAAA GTTATTAAAA TGGGTAAAAC AAAGCGTGTC 360 + GTTGGACTAA CACTAAAGGA AAAGCTTCAA ATAATCGAGT TAGTGACCAA CAAAGTGGAC 420 + AAAAAGGAAA TTTGTGCCAA GTTCAAATGC GACAGATCCA CAGTCAACCG CATTTTACAA 480 + AAAACAAATG AAATTCATGA AGCTGTGGCC GCGTCAGGTT TAAAAAGAAA GCGTCAAAGA 540 + AAAGGAGCGC ACGACTTAGT AGAAGAAGCC TTATACATTT GGTTCGGACA GCAGGAATCA 600 + AAGAACGTAA TTCTTGACCG GCACGTCATA TTAGCAAAAG CGAAAGAATT TTGCCAAAAA 660 + TTTAACGACG CCTTTGAACC TGACGCCAGC TGGCTTTGGC GCTGGCGCAA GCGCCACAAT 720 + ATAAAGTATG GCAAAATACA CGGCGAAACT GCTACAAATG ATTCCGTATC AGCAAATGAG 780 + TACAAAAATG ATATTTTGCC AGGATTGCTT AAAGGTTATA ACCCAGAAGA CATTTTTAAC 840 + GCTGACGAAA CTGCACTCTT TTATAAAGCA ATGCCGAATG CGACATTTTT TACTTGTGGA 900 + AAGCAATTAA ATGGCCAGAA ATCTCAGAGA GTGAGACTTA CTTTGCTGTT TATATGCAAT 960 + GCAACTGGGA CATACAAAAA AACTTTTGTA ATCGGCAGAT CTAAATCGCC ACGATGCTTC 1020 + AAGAATGCTA ATGTGCCCAT TCCGTACTAT GCAAATAAGA AGGCCTGGAT GACTAAGGAT 1080 + CTCTGGCGAA AAATAATGAC AGGATTTGAC GAAGAAATGA AAAAGCAAAA TCGAAAGATT 1140 + TTACTCTTCA TCGACAATGC AACTAGTCAC ACGACTGTCA AGGACTTCGA AAACATAAAA 1200 + TTGTGCTTCA TGCCACCAAA CGCAACGGCT CTACTTCAAC CTCTGGACCA AGGTATTATC 1260 + CACTCATTCA AATTAGAGTA TAGGCGTATT TTGGTCAAAC AGCAGCTCAT TGCTGTTAAT 1320 + TGTGGTAAAT CTACTGTGGA ATTTTTAAAA TCATTATCGT TATTGGATGC TCTATATTTT 1380 + GTCAACCAAG GATGGAAGAA TGTTAAAATG TTAACTATTC AGAATTGTTT TAAAAAGGTA 1440 + AGATGGGATT ATTATTGATA TGTATCTCAA ATAACGAATT TATTATTTTC AGGCTGGATT 1500 + TAAGTTCAGT TTTGAAAATG AAGACACCAT TGCTGAAAAA GACAAACAAT GCGTAGAAGT 1560 + TGACATTGTA TCGAATATTA ATTGGAATGA ATATGCCAAT GTTGATGCAG ATGAGGCTTG 1620 + CCATGGTCAA TTAGATGATG ATGAAATCGT GCGCTCTTTA GTTCAAGATG CAAAAACCAG 1680 + CGATAACGAA GAAAGCCATA GTGATGAAGA TGTGGACGAT ACTGAGCGTC CTACTTTTAA 1740 + GGATGGGTTT GCAGCAATTA AGGCTTTAAA GTCCATTTTT ATGCGAAACA ATAATGATGA 1800 + GTTTTTGCAA AACTTGAATT CTATGGAAGA CAAGCTGTTT AATTTACATA TAAACTCAGC 1860 + TGTATTGCAA AAAAAAATTA CTGACTATTT TTAAGTTAGT TTTAAAAAGT GTTTTAATCA 1920 + ATTCACCATC ACTTAAATTT ATATGTCGAT CTTACTTATC ATTAAGAATG AAATTATCAG 1980 + TTCCTTTTAT GTTTAACATT GTTATAAAGA AATAAATTCT TTATTTTTCC TTAAAAAAAA 2040 + AAATTAAGTT AGCTGCATTT TTAAGTTACC TGCATCGAGG CATTGTGCAA AGTACTCGAG 2100 + GCAGCTAAGC GAATTATACT G 2121 +// +ID DMRER1DM standard; DNA; INV; 5356 BP. +XX +AC X51968; +XX +DR FLYBASE; FBte0000118; Dmel\R1A1-element. +XX +FT source X51968:1..5356 +FT SO_feature CDS ; SO:0000316:319..1731 +FT /name="Dmel\R1A1-element\ORF1" +FT /db_xref="FLYBASE:FBgn0044825" +FT /db_xref="SWISS-PROT:P16424" +FT /db_xref="NCBI_PROTEIN:CAA36226.1" +FT /translation="PVSASIRLLDSSKGGATIGATPMESDSSVSALSGSSASKVSRRGR +FT RRSHLASKSSAPTQAKLVALASNGVPEPVGVLEEAFSSLEDARAATSNAANDAAPPAAA +FT PAVDHTVAPDVSTAAKIAATTATAATAAARAGQAAMMAELSATQRMVRNSFRSLGGVDT +FT EELSCAISRYDELVMALMLRCGELETRLAMPPPPPPPSKANTTAANAPQMPQVAPIAAP +FT RTTKVRETWSAVVKCDDPALSGKAIAEKVRTMVAPSLGVRVHEVRELPSRWWCDHSYSS +FT VGELQKVMASKRFAELGLNVARNAAEKPKVIVYDVDTAIGPEEFMQELHENNFDSEMTL +FT AQFKKSVHLVTKAWSATDGATVNVTLEVDDRAMAKLDVGRVYIKWFSFRCRSQVRTYAC +FT HRCVGFDHKVSECRQKESVCRQCGQQGHTAAKCQNPVDCRNCRHRGQPSGHYMLSNACP +FT IYGALLARVQARH" +FT SO_feature CDS ; SO:0000316:1728..4790 +FT /name="Dmel\R1A1-element\ORF2" +FT /db_xref="FLYBASE:FBgn0044824" +FT /db_xref="SWISS-PROT:P16425" +FT /db_xref="NCBI_PROTEIN:CAA36227.1" +FT /translation="TLMFSFIQANCGRGRAATIELGVRLRRSESMFALVQEPYLGGDEM +FT DVLPEGMRVFTDRRGKAAILVDHQEAICMPVETLTTDYGVCLVVKGSFGSIFLCAAYCQ +FT FDAPLEPYLRYMDAVLLQASRTPAILGLDANAVSPMWLSKLSRHAEGQANYRRGELLSE +FT WMLEARVAALNQSTEVYTFDNHRATSDIDVTIVNEAASMWATYEWRVDEWELSDHNIIT +FT VVAEPTTARSVESIAPVPSWNFSNARWRLFKEEMVSRIAELPENFSESPLDQQVSTLRS +FT IVHSVCDTALGRKLTRSPSRRARWWTADLCAARREVRRLRRLLQDGRRRDDDAAVELVV +FT VELRRASAYYKKLIGRAKMDDWKRFVGDHADDPWGRVYKICRGRRKCTEIGCLRVNGEL +FT ITDWGDCARVLLRNFFPVAESEAPTAIAEEVPPALEVFEVDTCVARLKSRRSPGLDGIN +FT GTICKAVWRAIPEHLASLFSRCIRLGYFPAEWKCPRVVSLLKGPDKDKCEPSSYRGICL +FT LPVFGKVLEAIMVNRVREVLPEGCRWQFGFRQGRCVEDAWRHVKSSVGASAAQYVLGTF +FT VDFKGAFDNVEWSAALSRLADLGCREMGLWQSFFSGRRAVIRSSSGTVEVPVTRGCPQG +FT SISGPFIWDILMDVLLQRLQPYCQLSAYADDLLLLVEGNSRAVLEEKGAQLMSIVETWG +FT AEVGDCLSTSKTVIMLLKGALRRAPTVRFAGRNLPYVRSCRYLGITVSEGMKFLTHIAS +FT LRQRMTGVVGALARVLRADWGFSPRARRTIYDGLMAPCVLFGAPVWYDTAEQVAAQRRL +FT ASCQRLILLGCLSVCRTVSTVALQVLGGAPPLDLAAKLLAIKYKLKRGFPLEENDWLYG +FT EDIACLSWEQRKTRLEECLIQSWQNRWDDDSEPGRVTHRFIPYVTLAYRDPSFGFSMRT +FT SFLLTGHGSFNAFLHGRALSDTTACACGDPYEDWMHILCACPLYADLRDLDGLGVQRLG +FT ENWIFEGILDDQEKTQRLAMFAEEVFLRRRAL" +XX +CC Derived from X51968 (g8429) (Rel. 23, Last updated, Version 1). +CC Takis Benos and Michael Ashburner, 20-Aug-1997. +CC Any changes to original sequence record are annotated in an FT line. +XX +SQ Sequence 5356 BP; 1213 A; 1340 C; 1634 G; 1169 T; 0 other; + CGGACGTGTT TTCGTTGCGC TCGTGGACAT AGTGCGAAGA ACTTTGTTTT CCGTATTTGG 60 + AAGTATACGG AATAAATAAT TTAGTGTTCC GTGGAAGTGG TGCGCAAATT TTCGCGAATT 120 + AAAAACAAGC GGTTTGGAAG TAATTGACAA TAAATTATTG GAAATTTTCC ACTCCGCACG 180 + TGTTGAGCGG CGGAGCTTGC GGGTGAGCTT TTCGAACAGC TGAGAGAAGC TTATTGGTGG 240 + TAGTCACCGC TAAGGATTGT GTCTTGGGAC AGCTTAGTGC ACTCTACCAA TAGGTGGAGC 300 + TATCACCATA GCAACTAGCC CGTGTCAGCG AGCATACGAT TGCTGGACTC GTCAAAAGGA 360 + GGAGCCACCA TCGGAGCAAC GCCGATGGAG AGCGACAGCA GTGTGAGTGC CTTGAGCGGA 420 + AGCAGTGCCT CAAAGGTGTC AAGACGAGGC AGGCGTAGGA GCCATCTGGC CTCCAAGAGC 480 + TCGGCGCCAA CGCAGGCGAA ACTGGTTGCC CTGGCCTCGA ATGGAGTGCC GGAACCCGTT 540 + GGTGTGCTGG AGGAGGCGTT TTCGTCGCTG GAGGATGCCC GGGCGGCTAC GTCAAACGCT 600 + GCCAACGATG CTGCCCCCCC CGCTGCTGCC CCCGCTGTTG ATCACACTGT TGCCCCTGAT 660 + GTTTCCACTG CTGCTAAAAT CGCTGCCACC ACTGCCACCG CTGCCACCGC TGCCGCCCGT 720 + GCTGGGCAAG CAGCCATGAT GGCAGAGCTG TCGGCCACCC AGCGCATGGT GCGAAACAGT 780 + TTCCGCAGCC TAGGAGGCGT AGACACGGAA GAGCTCTCGT GTGCCATCAG CCGCTATGAT 840 + GAGCTGGTGA TGGCATTAAT GCTCCGGTGT GGAGAACTGG AGACGCGGCT CGCTATGCCA 900 + CCACCGCCGC CGCCGCCGTC CAAGGCGAAC ACTACTGCCG CCAATGCTCC CCAGATGCCT 960 + CAGGTTGCAC CCATCGCTGC CCCGCGGACA ACCAAGGTTC GTGAGACGTG GTCAGCGGTG 1020 + GTGAAGTGCG ACGACCCTGC GCTATCGGGG AAAGCCATAG CCGAAAAGGT GCGGACGATG 1080 + GTTGCACCCT CCCTCGGAGT CAGAGTACAC GAGGTACGTG AGCTGCCGTC GAGGTGGTGG 1140 + TGCGATCATT CGTACTCTTC GGTTGGAGAG CTGCAGAAGG TGATGGCATC GAAAAGATTC 1200 + GCAGAACTTG GACTGAATGT GGCACGGAAC GCGGCCGAGA AGCCGAAGGT CATAGTCTAT 1260 + GACGTCGACA CAGCCATCGG CCCAGAAGAG TTCATGCAGG AGCTTCACGA GAACAACTTC 1320 + GACAGTGAAA TGACTCTGGC CCAGTTCAAA AAGTCGGTGC ACCTGGTGAC CAAGGCGTGG 1380 + TCGGCTACTG ACGGTGCCAC CGTAAACGTG ACGCTAGAGG TAGACGACCG GGCGATGGCG 1440 + AAACTTGATG TAGGACGTGT CTACATTAAG TGGTTTTCGT TCCGATGCCG ATCGCAAGTC 1500 + CGCACCTATG CCTGCCACAG ATGTGTGGGT TTCGACCACA AGGTTAGTGA ATGCAGGCAG 1560 + AAGGAGAGTG TTTGCCGCCA GTGCGGGCAA CAAGGCCACA CCGCGGCAAA GTGCCAAAAC 1620 + CCGGTGGACT GCCGGAACTG CCGTCACAGA GGGCAACCTT CGGGGCATTA TATGCTCTCG 1680 + AATGCTTGCC CGATATACGG AGCGTTGTTA GCGAGGGTGC AAGCTAGACA CTAATGTTTA 1740 + GCTTCATCCA AGCGAACTGT GGCCGAGGCA GAGCTGCGAC CATCGAGCTC GGAGTCCGAC 1800 + TCAGGAGATC GGAGTCAATG TTTGCTCTGG TGCAGGAGCC GTATCTTGGC GGGGATGAAA 1860 + TGGATGTGCT GCCTGAAGGA ATGAGGGTTT TCACCGACCG GCGAGGGAAG GCAGCCATCC 1920 + TAGTGGATCA TCAGGAAGCC ATCTGCATGC CAGTGGAAAC TCTCACCACA GATTATGGCG 1980 + TATGTCTGGT CGTTAAAGGG AGTTTTGGCT CAATCTTCCT TTGCGCCGCA TACTGCCAGT 2040 + TCGATGCACC TCTGGAACCG TACCTCCGGT ACATGGATGC GGTCCTGCTG CAGGCCAGCA 2100 + GAACCCCCGC AATCCTGGGC CTCGACGCGA ATGCAGTGTC CCCCATGTGG CTTAGCAAAC 2160 + TCTCTCGTCA TGCCGAGGGG CAAGCTAACT ACAGACGGGG TGAGCTGCTG TCTGAGTGGA 2220 + TGCTGGAGGC AAGAGTCGCC GCCCTAAACC AGTCAACAGA GGTGTACACG TTCGATAATC 2280 + ACAGAGCGAC TAGTGATATC GACGTGACAA TCGTCAATGA AGCAGCATCT ATGTGGGCCA 2340 + CATATGAGTG GAGAGTGGAC GAGTGGGAAT TGAGTGACCA CAACATCATT ACTGTTGTGG 2400 + CCGAACCAAC TACCGCGCGC TCAGTTGAGA GCATAGCTCC TGTGCCGTCC TGGAACTTCT 2460 + CCAATGCACG TTGGCGATTG TTCAAGGAGG AAATGGTGAG TAGAATAGCC GAACTTCCGG 2520 + AAAACTTTTC AGAGTCGCCG TTGGACCAGC AAGTTTCGAC CCTGCGCAGT ATAGTACATA 2580 + GTGTATGTGA TACTGCGCTA GGAAGGAAGT TGACTCGATC GCCCAGCAGG AGAGCACGTT 2640 + GGTGGACTGC CGACCTCTGC GCTGCAAGGC GCGAAGTCCG AAGACTTCGT CGCCTGCTCC 2700 + AAGATGGAAG GCGTCGAGAT GACGATGCCG CTGTAGAGCT TGTAGTGGTC GAGCTGAGGC 2760 + GTGCCTCAGC CTACTACAAG AAGCTCATTG GAAGGGCGAA GATGGATGAC TGGAAACGCT 2820 + TCGTGGGAGA TCATGCCGAC GACCCATGGG GGCGCGTCTA CAAGATTTGC CGAGGTCGCA 2880 + GGAAGTGCAC GGAGATTGGG TGCCTCCGCG TGAATGGCGA GCTGATCACT GATTGGGGTG 2940 + ACTGCGCACG AGTGCTCCTC CGCAATTTTT TCCCAGTTGC GGAGTCCGAA GCACCGACTG 3000 + CCATCGCGGA GGAAGTCCCA CCGGCCCTCG AAGTATTCGA GGTTGATACA TGTGTTGCCC 3060 + GGCTGAAGAG CAGGCGCTCT CCCGGGTTGG ACGGCATCAA TGGCACTATC TGCAAGGCAG 3120 + TCTGGCGCGC CATACCCGAG CACCTAGCAT CATTGTTTTC CCGATGCATC CGATTGGGAT 3180 + ACTTTCCAGC CGAGTGGAAG TGCCCACGAG TTGTCTCGTT GCTCAAAGGG CCAGATAAGG 3240 + ACAAGTGTGA GCCCTCCTCA TACAGAGGAA TATGCTTGCT ACCAGTCTTT GGAAAGGTGC 3300 + TCGAGGCCAT CATGGTGAAT CGTGTGAGAG AAGTTCTTCC GGAAGGCTGC AGATGGCAAT 3360 + TCGGATTTCG CCAAGGACGA TGTGTGGAGG ATGCTTGGAG GCACGTGAAG AGCAGTGTTG 3420 + GCGCCAGCGC GGCGCAATAC GTGCTCGGCA CATTCGTGGA CTTCAAAGGA GCATTCGACA 3480 + ACGTCGAATG GAGTGCTGCA CTCAGCCGAC TAGCCGACTT GGGATGCCGG GAAATGGGCT 3540 + TGTGGCAGAG CTTTTTCTCC GGCCGAAGAG CAGTGATCCG AAGCAGTTCC GGTACTGTGG 3600 + AGGTACCGGT AACTAGAGGC TGCCCGCAGG GATCAATCAG CGGCCCATTT ATCTGGGACA 3660 + TACTGATGGA TGTACTGCTT CAGCGTCTCC AGCCGTATTG CCAGCTGAGT GCATACGCGG 3720 + ATGACTTGCT GCTTCTCGTC GAGGGAAATT CCCGAGCTGT GCTAGAGGAA AAAGGAGCGC 3780 + AACTAATGTC CATCGTAGAA ACGTGGGGAG CGGAAGTTGG CGATTGCCTC TCGACCAGCA 3840 + AGACGGTAAT CATGCTGCTG AAAGGTGCCT TGAGACGTGC GCCTACGGTG AGGTTTGCTG 3900 + GACGGAACCT TCCGTATGTG CGTAGCTGTC GGTACCTTGG CATCACGGTC AGTGAAGGAA 3960 + TGAAATTCCT CACGCACATA GCTTCGCTTC GCCAGCGGAT GACAGGAGTC GTTGGAGCAT 4020 + TGGCGCGTGT GCTTCGAGCC GACTGGGGCT TCAGTCCTCG AGCCAGGCGG ACCATATATG 4080 + ACGGACTCAT GGCACCTTGT GTGCTGTTTG GTGCCCCGGT ATGGTATGAC ACCGCGGAAC 4140 + AAGTAGCTGC CCAGAGGCGA CTAGCCTCCT GCCAGAGGCT AATCCTGCTT GGATGCCTTT 4200 + CGGTATGCCG AACAGTATCC ACAGTGGCAC TGCAGGTACT TGGTGGAGCT CCCCCGCTTG 4260 + ATCTGGCTGC TAAGTTATTA GCGATCAAAT ACAAGCTAAA ACGTGGATTC CCGCTGGAGG 4320 + AGAACGACTG GCTTTACGGC GAGGACATTG CGTGTCTTAG CTGGGAGCAG AGGAAGACTC 4380 + GCCTAGAGGA GTGTTTAATC CAGAGTTGGC AGAACAGATG GGACGATGAC AGCGAACCAG 4440 + GACGGGTGAC GCATAGGTTT ATCCCATACG TCACTCTTGC CTATCGGGAT CCAAGTTTTG 4500 + GATTCTCGAT GAGGACGTCT TTCCTGCTTA CAGGGCACGG GTCGTTCAAT GCATTTTTGC 4560 + ACGGGAGAGC CCTCAGCGAT ACCACTGCTT GCGCATGTGG AGATCCATAT GAGGACTGGA 4620 + TGCATATCTT GTGCGCTTGC CCCCTATATG CAGATCTGCG GGACCTAGAT GGACTTGGAG 4680 + TGCAGCGCCT TGGCGAAAAC TGGATCTTCG AGGGAATCCT GGATGATCAA GAGAAGACTC 4740 + AACGGCTGGC AATGTTTGCG GAAGAAGTGT TCCTGAGGAG GAGGGCCCTT TAGCTCAACA 4800 + TCTCTGCCGT GTGGTTAGCG GGCGAGAATA CTACCACAGT CCGCTGTTGC TTGTCGTAAG 4860 + AGACGACTAA TACAGCGATA GGATTCCTCT AACCCTGCTT GTCGGAGCAA AAGGGGGAGG 4920 + CCCACCGAGC CTCTTTTCGG TACCACGGGT TGAGCAGCTA TCCAAGACTG CTCATTGAGG 4980 + TAGGCCCCCT GGTGGGAGTA TCGTGGTGGC TGTGGTTGGT ACCCATATCG CGGGTAGAGC 5040 + CTTCATGCTC GACGTTTGAG TTACGGTGCT AGTTGCGCAA AACTCGGGTG CTGTGACCCA 5100 + GAGATCAGTA GAGATTTTAG GTAGATCTCG CTCCTCAGCA AGGGGGAGTG CTTGCCCGGC 5160 + AAGCAAGTAC TCGAATTGCT ACCGGGGTGG TCGCTATGTA CATAGCTATA GCTTCTAGTC 5220 + CGGGACGCTT GTCTGGCGTA TCCAGACACA TGCACCATAT GCTCACTTGT GGGCGTATAG 5280 + GGTGCCGTGG TTGTAATCCC TTCAGTGTGG AACACGCCAC GTAAAATAAG TTCGGAGGGA 5340 + TCCGAAAAGC ATACAT 5356 +// +ID DMRER2DM standard; DNA; INV; 3607 BP. +XX +AC X51967; +XX +DR FLYBASE; FBte0000030; Dmel\R2-element. +XX +FT source X51967:1..3607 +FT SO_feature CDS ; SO:0000316:181..3351 +FT /name="Dmel\R2-element\ORF" +FT /db_xref="FLYBASE:FBgn0016699" +FT /db_xref="SWISS-PROT:P16423" +FT /db_xref="NCBI_PROTEIN:CAA36225.1" +FT /translation="FERKNFSDGLVPQRKFIHIGTTSTNNEPRIPLHNLMTTRPSVDIF +FT PEDQYEPNAAATLSRVPCTVCGRSFNSKRGLGVHMRSRHPDELDEERRRVDIKARWSDE +FT EKWMMARKEVELTANGCKHINKQLAVYFANRSVEAIKKLRQRGDYKEKIEQIRGQSALA +FT PEVANLTIRRRPSRSEQDHQVTTSETTPITPFEQSNREILRTLRGYSPVECHSKWRAQE +FT LQTIIDRAHLEGKETTLQCLSLYLLGIFPAQGVRHTLTRPPRRPRNRRESRRQQYAVVQ +FT RNWDKHKGRCIKSLLNGTDESVMPSQEIMVPYWREVMTQPSPSSCSGEVIQMDHSLERV +FT WSAITEQDLRASRVSLSSSPGPDGITPKSAREVPSGIMLRIMNLILWCGNLPHSIRLAR +FT TVFIPKTVTAKRPQDFRPISVPSVLVRQLNAILATRLNSSINWDPRQRGFLPTDGCADN +FT ATIVDLVLRHSHKHFRSCYIANLDVSKAFDSLSHASIYDTLRAYGAPKGFVDYVQNTYE +FT GGGTSLNGDGWSSEEFVPARGVKQGDPLSPILFNLVMDRLLRTLPSEIGAKVGNAITNA +FT AAFADDLVLFAETRMGLQVLLDKTLDFLSIVGLKLNADKCFTVGIKGQPKQKCTVLEAQ +FT SFYVGSSEIPSLKRTDEWKYLGINFTATGRVRCNPAEDIGPKLQRLTKAPLKPQQRLFA +FT LRTVLIPQLYHKLALGSVAIGVLRKTDKLIRYYVRRWLNLPLDVPIAFVHAPPKSGGLG +FT IPSLRWVAPMLRLRRLSNIKWPHLTQNEVASSFLEAEKQRARDRLLAEQNELLSRPAIE +FT KYWANKLYLSVDGSGLREGGHYGPQHGWVSQPTRLLTGKEYMDGIRLRINALPTKSRTT +FT RGRHELERQCRAGCDAPETTNHIMQKCYRSHGRRVARHNCVVNRIKRGLEERGCVVIVE +FT PSLQCESGLNKPDLVALRQNHIDVIDTQIVTDGHSMDDAHQRKINRYDRPDIRTELRRR +FT FEAAGDIEFHSATLNWRGIWSGQSVKRLIAKGLLSKYDSHIISVQVMRGSLGCFKQFMY +FT LSGFSRDWT" +XX +CC Derived from X51967 (g8432) (Rel. 24, Last updated, Version 1). +CC Takis Benos and Michael Ashburner, 20-Aug-1997. +CC Any changes to original sequence record are annotated in an FT line. +XX +SQ Sequence 3607 BP; 1064 A; 818 C; 900 G; 825 T; 0 other; + TTGGGGATCA TGGGGTATTT GAGAGCAGAG GGGGAGTATT CTTCTGTAAT TCGTAAGTCA 60 + TATCATATGA TGTGCGGAAG GGGAATTTTA CTCTGTAACT CACAAGTCTC TCCTTTACTC 120 + AAGTCGACTC AAAACCTCCT CGTGGTGGTC CCGGTAATGC TAAACTCGTT TAGCAGCTAA 180 + TTTGAGCGGA AAAACTTTTC CGATGGGCTG GTTCCCCAGA GGAAATTTAT TCATATTGGA 240 + ACTACAAGCA CAAATAACGA GCCTCGGATA CCTTTACACA ATCTGATGAC GACCCGACCC 300 + TCCGTGGATA TCTTCCCGGA GGACCAATAT GAACCAAACG CAGCGGCTAC TCTATCTAGG 360 + GTTCCCTGCA CAGTATGTGG CCGGTCCTTT AACAGCAAGA GAGGACTCGG TGTTCACATG 420 + CGATCTCGGC ACCCAGACGA ACTTGATGAA GAACGTCGAC GTGTCGATAT AAAGGCAAGA 480 + TGGAGTGATG AAGAGAAGTG GATGATGGCG AGAAAGGAGG TTGAGCTCAC AGCAAATGGA 540 + TGTAAACACA TAAACAAGCA ACTAGCGGTG TATTTTGCAA ACCGCAGCGT CGAAGCCATC 600 + AAAAAGCTAA GACAGAGGGG CGATTATAAG GAGAAAATAG AGCAGATAAG AGGGCAATCA 660 + GCTCTCGCCC CGGAAGTTGC TAATCTAACC ATAAGGCGCC GCCCTAGTAG AAGTGAGCAA 720 + GACCACCAAG TAACAACATC GGAAACAACT CCAATCACTC CCTTCGAACA GTCGAACAGG 780 + GAAATTTTGC GGACACTACG CGGGTATAGC CCCGTAGAAT GCCATTCCAA ATGGAGAGCC 840 + CAAGAGTTGC AAACTATCAT TGATAGGGCA CATCTCGAGG GAAAGGAAAC CACTCTCCAA 900 + TGCTTATCGC TATATCTCCT GGGAATTTTT CCGGCACAGG GTGTACGACA CACACTGACG 960 + AGACCTCCTC GGAGACCTCG GAACAGGAGA GAAAGCAGAA GGCAGCAGTA CGCTGTCGTC 1020 + CAGCGTAACT GGGATAAGCA TAAAGGAAGA TGCATCAAGT CCTTGCTAAA TGGAACTGAT 1080 + GAGTCGGTAA TGCCAAGCCA AGAAATAATG GTTCCCTACT GGAGAGAAGT AATGACTCAG 1140 + CCTAGCCCAA GCTCTTGCAG TGGAGAAGTG ATACAAATGG ATCACTCGCT TGAGAGGGTA 1200 + TGGTCTGCTA TTACAGAGCA GGACCTTCGG GCGTCAAGAG TCTCATTATC CTCGTCTCCG 1260 + GGGCCTGACG GGATAACTCC AAAATCTGCC AGGGAGGTGC CGTCAGGTAT TATGCTGCGC 1320 + ATAATGAACC TAATTCTATG GTGCGGTAAT CTACCACACT CCATACGACT GGCCAGAACC 1380 + GTCTTCATCC CGAAGACGGT GACGGCGAAG CGACCGCAAG ACTTTCGTCC AATATCAGTG 1440 + CCTTCAGTCC TGGTAAGACA GCTAAATGCA ATATTGGCAA CCCGGTTGAA CTCATCAATC 1500 + AATTGGGACC CGCGCCAGCG GGGCTTCTTA CCAACCGACG GATGCGCCGA TAATGCGACG 1560 + ATAGTCGACT TAGTCTTGAG GCATAGCCAT AAGCACTTTA GATCTTGCTA CATCGCAAAT 1620 + TTAGATGTAA GCAAGGCATT TGATTCTCTA TCACATGCAT CTATATACGA CACCTTACGT 1680 + GCTTATGGTG CGCCAAAGGG CTTCGTTGAC TACGTACAGA ACACGTACGA GGGCGGTGGT 1740 + ACCAGTCTCA ATGGGGACGG TTGGAGTTCA GAGGAATTCG TCCCTGCTAG AGGAGTGAAG 1800 + CAGGGTGACC CTTTGTCTCC TATTCTATTT AACTTGGTAA TGGACAGGTT ACTTAGAACC 1860 + TTACCCAGCG AAATTGGTGC CAAAGTCGGA AATGCCATTA CTAACGCGGC CGCGTTTGCA 1920 + GATGATTTGG TACTATTTGC GGAAACTCGG ATGGGGCTTC AAGTATTGTT GGACAAGACG 1980 + TTGGATTTTC TATCTATCGT CGGCCTCAAA CTTAATGCCG ACAAATGTTT TACCGTTGGC 2040 + ATTAAGGGCC AGCCGAAACA GAAGTGTACC GTGTTAGAGG CACAGAGCTT CTACGTAGGC 2100 + TCGAGTGAGA TTCCATCACT GAAGCGCACG GACGAGTGGA AGTACTTAGG CATCAACTTC 2160 + ACTGCAACCG GGAGGGTTCG ATGCAATCCG GCCGAGGACA TTGGTCCAAA GCTACAAAGA 2220 + TTGACAAAGG CCCCCCTCAA ACCACAACAG AGGTTGTTCG CCCTTCGGAC TGTCCTTATC 2280 + CCACAGCTCT ACCACAAGTT AGCCCTTGGG AGTGTGGCGA TAGGCGTCCT AAGAAAAACT 2340 + GATAAACTTA TAAGATATTA TGTGCGAAGA TGGCTAAATC TTCCGCTGGA TGTGCCGATA 2400 + GCATTTGTTC ATGCACCCCC AAAAAGTGGA GGTCTCGGAA TTCCATCACT AAGATGGGTA 2460 + GCTCCAATGT TAAGGCTAAG ACGCTTGAGT AACATTAAAT GGCCTCACCT CACGCAAAAC 2520 + GAGGTAGCCA GCTCTTTCCT CGAAGCCGAA AAACAACGGG CCCGAGATAG ATTATTAGCT 2580 + GAACAAAATG AACTGTTATC GCGTCCGGCA ATAGAAAAAT ATTGGGCGAA CAAGTTGTAC 2640 + CTCTCAGTTG ATGGTAGCGG ACTCCGTGAA GGCGGCCATT ATGGCCCGCA ACACGGGTGG 2700 + GTTAGTCAAC CCACGCGTTT ATTAACAGGA AAGGAATATA TGGACGGTAT TCGTCTGCGG 2760 + ATAAATGCCC TACCCACAAA GTCTCGTACT ACAAGGGGAA GGCACGAATT GGAACGACAG 2820 + TGTCGTGCAG GATGTGATGC TCCCGAAACA ACAAACCACA TAATGCAAAA ATGCTACCGC 2880 + TCGCATGGGA GGCGGGTAGC TAGACACAAC TGCGTAGTAA ATCGAATCAA GCGGGGACTT 2940 + GAGGAGAGAG GCTGCGTGGT CATTGTTGAA CCAAGTCTGC AGTGCGAATC CGGCCTTAAT 3000 + AAACCAGACC TGGTGGCACT ACGACAAAAT CACATTGATG TGATCGACAC ACAAATTGTG 3060 + ACAGACGGAC ACTCTATGGA TGATGCGCAC CAGCGCAAAA TCAATAGATA CGACAGACCG 3120 + GACATACGAA CTGAATTGCG TCGCAGATTC GAAGCCGCAG GTGACATTGA ATTCCATTCT 3180 + GCCACCCTGA ACTGGAGGGG GATCTGGAGT GGTCAATCCG TTAAAAGATT GATAGCAAAG 3240 + GGTCTCCTCA GCAAATATGA TAGTCATATC ATTAGCGTCC AGGTTATGAG AGGCAGTCTC 3300 + GGTTGTTTTA AACAGTTCAT GTACCTGAGC GGGTTTTCCC GAGATTGGAC TTAGCTAAAT 3360 + CGTTTGGTTC AAAACATTTG CTTGCTGTCT TGGCATAACA TCAATAAAGG CATAAACATC 3420 + GCAAAATAAT GGTTATAATT AAATGGCTAT GAGGATGGTT TTAGTACGTA GGCGTTGCGG 3480 + AACTTCGGTT CATATAGAGC AATGAATCGT GCATGCTAGG AAAACTGACC ACACACAGTG 3540 + TTGGCAGACC TAGTATCTTT CGAAGATTTC CATACCTCCG CGATCAAAAA AAAAAAAAAA 3600 + AAAAAAA 3607 +// +ID DM33463 standard; DNA; INV; 1736 BP. +XX +AC U33463; +XX +DR FLYBASE; FBte0001005; Dmel\S-element. +XX +FT source U33463:37..1772 +FT SO_feature terminal_inverted_repeat ; SO:0000481:1..234 +FT SO_feature terminal_inverted_repeat ; SO:0000481:1503..1736 +FT SO_feature CDS ; SO:0000316:404..1441 +FT SO_feature start_codon ; SO:0000318:1..3 +FT /name="Dmel\S-element\T" +FT /db_xref="FLYBASE:FBgn0044019" +FT /db_xref="REMTREMBL:AAC47095" +FT /db_xref="NCBI_PROTEIN:AAC47095.1" +FT /translation="MPGKRLAFEVTQLIYYNHQLGKSIPELVEIFSVSRKTVYNILNRX +FT XKEGRLEPKSGGGCKTKINKRVDRLIMRKAIANPRISVRSLAQDIREECHLTVSHETVR +FT QVILRHRYSSRVARKKPLLSEINIEKRHSFAVSMMDHAEEYWDDVIFCDETKMMLFYND +FT GPSRVWRKPLSALETQNIIPTIKFGKLSVMIWGCISSHGVGKLAFIESTMNAVQYLDIL +FT KTNLKASAEKFGLFSNNKPNFKFYQDNDPKHKEYNVRNWLLYNCGKVIDTPPQSPDLNP +FT IENLWAYLKKKVAKRGPKTRQQLMAAIIEEWEKIPLEYDLKKLIHSMKKRLQLVAKANG +FT GHTKY" +XX +CC Derived from U33463 (g1006788) (Rel. 47, Last updated, Version 5). +CC Takis Benos and Michael Ashburner, 20-Aug-1997. +CC Any changes to original sequence record are annotated in an FT line. +XX +SQ Sequence 1736 BP; 600 A; 287 C; 300 G; 545 T; 4 other; + CAGTTTGTCA AGAAACTGTT TACACACCGC AAAATAAGTA GAATTTTTGA CTTTAAAGGC 60 + CAAAATTAAG GGTTTTTTGC TTAATTAAAC GCAATTTTTT TATGAAATAT AATTAAACAA 120 + TATTTATTTT ACTTATAAAT TAAAAAACAA ATTCAATATA TCAAATATAC AAGAAAATAA 180 + ACAACAAATT TCTTGTTTAC ACACTTTTGA GAGTGCCAAG AAACTCTTTA CACAGTTTTG 240 + GGTTCCTACT TTGTTTTGCT CTTTTTCTTA GAAACAATCT CATTTTTCCG TTATTTTTGT 300 + CTTATGCATT CCTTTTTACA ACGCTTCTAT TGCAATTTTT TCACTTTGCT TGTGAAATTT 360 + TGTTGATCTA ACGTGCTTAA AGCGAATTAT TAAATTTAAT GAAATGCCTG GAAAGAGATT 420 + GGCTTTTGAA GTGACCCAGC TAATATACTA TAACCACCAG TTGGGAAAAT CTATTCCTGA 480 + ATTAGTAGAA ATATTTTCCG TATCCCGTAA AACCGTCTAT AATATTTTAA ATCGTNNNNA 540 + AAAAGAGGGC AGGCTTGAAC CTAAGAGTGG TGGTGGGTGT AAAACGAAAA TTAACAAGCG 600 + AGTAGACCGC CTTATTATGC GAAAAGCGAT TGCGAACCCC CGAATCTCGG TCAGATCACT 660 + TGCTCAGGAT ATCAGGGAAG AATGTCACCT AACTGTATCA CACGAAACTG TGCGCCAAGT 720 + CATCCTACGC CATAGGTACT CTTCAAGAGT TGCAAGAAAA AAGCCTTTGC TATCAGAGAT 780 + CAATATTGAA AAGCGTCATT CATTCGCTGT GAGCATGATG GATCATGCGG AAGAGTACTG 840 + GGATGACGTC ATATTTTGTG ACGAAACAAA AATGATGCTC TTTTATAACG ATGGGCCAAG 900 + CAGAGTATGG CGCAAACCGT TGAGTGCGCT AGAAACACAA AATATAATTC CAACAATCAA 960 + ATTTGGAAAA TTGTCAGTGA TGATTTGGGG CTGTATTTCC AGCCATGGAG TGGGCAAACT 1020 + AGCCTTTATT GAAAGCACTA TGAATGCCGT GCAATATCTA GATATTTTAA AAACAAATTT 1080 + GAAGGCCAGT GCAGAAAAAT TTGGTTTGTT TAGCAACAAC AAGCCAAATT TTAAGTTTTA 1140 + TCAGGACAAT GATCCCAAAC ATAAAGAGTA CAATGTACGC AACTGGCTAC TCTATAACTG 1200 + TGGCAAGGTG ATCGATACGC CCCCTCAGAG TCCTGATCTA AACCCCATTG AAAATTTGTG 1260 + GGCCTACTTA AAGAAGAAGG TTGCAAAAAG GGGCCCCAAA ACTCGACAAC AACTCATGGC 1320 + TGCGATAATC GAAGAGTGGG AAAAGATCCC GCTTGAATAT GACCTAAAAA AACTCATACA 1380 + TTCCATGAAA AAAAGGCTTC AACTTGTAGC CAAAGCCAAT GGGGGTCATA CTAAATACTA 1440 + AAACTTTTCA AATATTATCA AAATAATTAA AAAATTTAGG ATTAAACTTA GGTTTAGTGT 1500 + TTTGTGTAAA GAGTTTCTTG ACACTCTCAA AAGTGTGTAA ACTTGAAATT TGTTGTTTAT 1560 + TTTCTTGTAT ATTTGATATA TTGAATTTGT TTTTTAATTT ATAAGTAAAA TAAATATTGT 1620 + TTAATTATAT TTCATAAAAA AATTGCGTTT AATTAAGCGA AAAACCCTTA ATTTTGACCT 1680 + TTAAAGTCAA AAATTCTACT TATTTTACGG TGTGTAAACA GTTTCTTGAC AAACTG 1736 +// +ID SPRINGER standard; DNA; INV; 7546 BP. +XX +AC AF364549; +XX +DR FLYBASE; FBte0000333; Dmel\springer. +XX +FT source AF364549:1..7546 +FT SO_feature five_prime_LTR ; SO:0000425:1..403 +FT SO_feature three_prime_LTR ; SO:0000426:7143..7546 +FT SO_feature CDS ; SO:0000316:1058..2422 +FT SO_feature start_codon ; SO:0000318:1..3 +FT /name="Dmel\springer\gag" +FT /db_xref="FLYBASE:FBgn0044343" +FT /db_xref="SPTREMBL:Q967T6" +FT /db_xref="NCBI_PROTEIN:AAK52057.1" +FT /translation="MSESFRQYRNSKKCASDSESESDDSTENSVRKNTPTNAFTAYKMS +FT LETEQIKALIRALQEQALESQRREADLRKTIQDLAGQVAAIQIAPARAEAPPIKVYRPV +FT EITGLVPCGETLDAVKCLPDFMGTQETYVSWRQAANAAYHMFRKYEDSSRHYQAVVIIR +FT SKVKGPADAVLSSFGTILNFDAIISRLDFTYSDKRPIHVIEQELGTLRQGSLTLLQYYD +FT EVEKKLTLLTNKATMSYEASAATVLCEKFRDDALRVFVSGLRRNLTDVLFAAKPKDMPS +FT ALALAQEVESNHERYTFATSFARSQEDRDHKQYPKVQERQRAPPQAGSQGSAGKNPHFT +FT KQHRAQVHSAPRSDRMARENMPEPMDVDPSLSRMQPSHAPAYPKSKPAASGRSVPPKRQ +FT RVNHVAQASDDLDKVYNTAASSAAVKVDDDSILEYDSDTINFLGESPCYPSSDEE" +FT SO_feature CDS ; SO:0000316:2434..5475 +FT SO_feature start_codon ; SO:0000318:1..3 +FT /name="Dmel\springer\pol" +FT /db_xref="FLYBASE:FBgn0044342" +FT /db_xref="SPTREMBL:Q967T5" +FT /db_xref="NCBI_PROTEIN:AAK52055.1" +FT /translation="MKLLIDTGAAKNFIRPFKGLKGVRPVQSPFTIHSIHGVTTITKKC +FT FVSIFNLKATFFLLPDLTSFDAIVGLDLLKQAGASLCLASGKLKWGSGAEQIDFHTCPD +FT VNFTKVDCSDAPPLIKDAFLKMLGNRKKAFADPNEALPYNTSVVATIRTVDEEPIYAKL +FT YPYPMGAADFVNGEIQELLKNGIIQKSKSPYNNPIWVVDKKGTDDAGNKKMRLVLDFRK +FT LNERTVPDRYPMPNISMILGNLGKAKYFTTLDLKSGYHQITLAERDREKTAFAVNGGKY +FT EFRRLPFGLRNAASIFQRTIDDILREQIGKFCYVYVDDVIIFSEDENDHVKHVDWVLKS +FT LYDANMRISAEKSRFFKKSVSFLGFIVTNNGAATDPEKVKAIKEFPEPKNVFEVRSFLG +FT LASYYRCFIKDFASIARPISDILKGENGSVSRHRSRSIQVEFSEAQQRAFEKLRNILAS +FT EDVILRYPDYKKAFDLTTDASAYGIGAVLSQEGRPITMISRTLSDREVNYATNERELLA +FT IVWALAKLRHYLYAVKEINIFTDHQPLTFAVSESNPNAKIKRWKARIDESGARIFYKPG +FT RNNLVADALSRQQLNVVEEQEPESCAATIHSELSLTHTIESTDKPVNCFQNQIILEEAR +FT SHWKRTFILFGNKRRHSINFSCKQALLEELANIIIPNGVNAFHCDLHTLALIQDDVVRQ +FT FPATKFWHCKNRVTDIFAMQERKEILTVEHNRAHRSAQENVKQVLSEYYFPKMTKLASE +FT IAANCKTCAKAKYDRHPKKQELGETPVPTHVGEILHIDIFSTDKKYFLTCVDKFSKFAM +FT VQPILSRTIEDLKAPLLQLMNVFPKAKTIYCDNEPSLKSQTIVAMLENHFGVSISNAPP +FT LHSVSNGQVERFHSTLIELARCLKIDKGISDTVELVLLATARYNMSIHSVINKKPAEVM +FT RADPDDPHTDVQEKIKNAQILTRKRENASRQNRVFQVGDKVLVKSNRRLGNKLTPLCEE +FT KTIEADLGTTVLIKGRVVHKDNLK" +FT SO_feature CDS ; SO:0000316:5870..7147 +FT SO_feature start_codon ; SO:0000318:1..3 +FT /name="Dmel\springer\env" +FT /db_xref="FLYBASE:FBgn0044344" +FT /db_xref="SPTREMBL:Q967T4" +FT /db_xref="NCBI_PROTEIN:AAK52056.1" +FT /translation="MLDMFPQSHMKKLLSVDIAHLRDMLDSLSIHHRVARSLDFLGTAL +FT KVVAGTPDAEDFEKVKFTEARLVDAHNSQIEINTKTQVRINELTDTINKLLKISKSAQI +FT DTGHLYETLSTRNRIIVMELQNLMLTITLAKINVVSPNFLDHADLESIWGEEPTNTPIR +FT EILSVASVKVLQSLNILHFIIKFPKIIMACNKVTILPVVHHDTVLRLKDNVVAECNREI +FT RTVKNCSITPGATFCQLSSVSSCAQELHAGVVAHCDAQQSDLHPITYVDEGIIVINDRP +FT ALVRVDNGTAIHIRGTHLITFIESAMVNETVFFNHDMVQNRAPGVANSPVLNISMKHEV +FT LSLPYLHRLSEKNLEQIRNFEKDVDGYRLSQIALVAGAIFCALICIGLTWQRTTRAKKS +FT TAQLKEVLAQIGSAEGGLNLEEGIVN" +XX +CC Derived from BACR06P08 by Sue Celniker, 29 March 2001. +CC Michael Ashburner, 9-Apr-2001. +CC Any changes to original sequence record are annotated in an FT line. +XX +SQ Sequence 7546 BP; 2131 A; 1909 C; 1712 G; 1794 T; 0 other; + AGTTAACTAA GTTAACCGGA CTGATCGTCC GCACACCAGC ACCGGTCAAA CTGCTGACCA 60 + AGCATTTGGC CGGAAGCTCA TGCATAGCCG GCAGAAGCTC TGCGCATTGG CAGAGGCCGC 120 + TATGATGTTT TTCCCTTTGT TAGCTTATAG TCAGTTTGAT TTTGTATTCA ATAAAGAGCG 180 + CATCGCGCCT TCAATCAACT CCAGCTACTG CTGTTATCAT TGAATTGGTT GGCTAGCCTT 240 + AAGGGCAGTC AACAACGGAG AGACGTTCTC CCACCATATC TCCCAATCTA GGAGAAGAGG 300 + TCTGCGGCAA CCGCCCTGCC TCCCAGTGAC AGAAGAACCC CCCGTTACCT GCAACCTACG 360 + CCGGAGACCG CGGCGAGGGA CCTGCACCTT ATATTTAATT AATTGGCACC CAACTCCAGG 420 + AACCCACACC ACTACCCTGA ATCATGTAAG TGGGATTCTC AACTTAAACA CTACTCCAAA 480 + CTGCGTCTAG AATTTTAAAA TATTTGGGAT GTTTGTGCGA GTTACATAAA TAAATTAAGA 540 + AAATCGGCAT TTCCACTACA ATAAACGTTT ATATGTGTTG CGAATTAAGA TTATGTTACT 600 + GTTATGAAGT TTAAATATCG AATTTTGATT TGTGGTTGAC TTTGCAATCC ATATTGTGTG 660 + CATTTCATTC CGCCTTCGCA CATCCGCGGG ACACTGTCGT TTCATTCGAA ATTTAATTCG 720 + CTACATTGGC TTCACAGCCC TTTCAAGCTT TGTTGTTTTT GACCCACTCC ACTTCGCTAC 780 + CCGATACTGG CGCATGCATT GCTGTGACAA TTTTGTGCCT TTTATTTATC TCTTTGTCTT 840 + TGCTGTGGCA ATTTTTGTCT TTGGATATTT GTTTGCCTTA TTGGAGACCC GCTCCCCGCA 900 + GGCCCTTCAC CTTATCGTTA CTTAGCTGGA CAGTGGCTCT GCTCGTTGAG TCTTCGTCCA 960 + ATGCCTTCAA AGCGGCGACT CAGCCCCCGC GACCCCCTTG CCGTACTGTT TGGCCCCACG 1020 + GGCACAACGG CCTGAGTATT CACATACATA GCTACCCATG AGCGAGTCAT TCCGACAATA 1080 + TAGGAATTCT AAAAAGTGCG CTAGCGACTC AGAGTCCGAA AGCGACGATT CGACAGAAAA 1140 + CTCTGTACGT AAAAACACCC CAACTAACGC ATTCACTGCA TATAAAATGT CCCTCGAAAC 1200 + GGAACAAATT AAAGCTCTCA TAAGGGCATT ACAAGAGCAA GCCTTAGAGA GTCAACGCAG 1260 + GGAGGCTGAC TTGCGTAAAA CAATTCAAGA TCTGGCCGGC CAGGTCGCGG CCATACAGAT 1320 + TGCCCCTGCC CGGGCAGAAG CTCCCCCAAT CAAAGTTTAC AGACCAGTAG AAATCACCGG 1380 + ACTGGTCCCT TGTGGGGAAA CATTGGATGC CGTTAAATGT CTTCCAGACT TTATGGGGAC 1440 + ACAGGAGACA TACGTCTCCT GGCGGCAAGC GGCAAATGCC GCTTACCATA TGTTCAGGAA 1500 + ATATGAGGAT AGTTCGCGGC ACTATCAAGC TGTGGTCATC ATCAGGAGCA AAGTTAAAGG 1560 + CCCTGCTGAT GCAGTTCTGT CGTCCTTTGG GACTATACTG AATTTCGATG CGATCATAAG 1620 + TCGCCTCGAT TTCACGTATA GTGACAAACG CCCGATACAC GTTATCGAGC AGGAGCTAGG 1680 + CACCCTCAGA CAGGGAAGCC TGACGCTCCT CCAGTATTAT GATGAGGTCG AGAAAAAACT 1740 + CACCTTACTC ACCAATAAGG CGACTATGTC TTATGAAGCG TCGGCAGCAA CGGTGCTGTG 1800 + TGAGAAGTTC CGAGATGATG CTTTGAGAGT TTTTGTCTCG GGGCTCAGGC GCAACCTCAC 1860 + AGACGTGCTA TTCGCGGCAA AGCCTAAGGA CATGCCGTCA GCGCTCGCCC TGGCGCAAGA 1920 + AGTAGAGTCC AATCATGAGC GGTACACTTT TGCAACTTCA TTTGCACGAA GCCAAGAGGA 1980 + TAGGGACCAC AAGCAATATC CCAAAGTGCA GGAGCGCCAA CGGGCCCCCC CACAAGCCGG 2040 + CTCGCAGGGA AGTGCTGGGA AGAACCCGCA CTTTACTAAG CAGCATAGAG CACAGGTGCA 2100 + CTCCGCTCCA CGTAGCGACC GAATGGCCCG AGAAAACATG CCAGAACCCA TGGACGTTGA 2160 + CCCGTCGTTG TCCAGGATGC AGCCATCTCA CGCCCCGGCT TACCCGAAAT CGAAGCCGGC 2220 + CGCGTCTGGC CGTTCGGTCC CACCAAAAAG GCAAAGGGTC AACCATGTTG CCCAGGCCTC 2280 + TGATGATTTG GACAAGGTTT ATAACACCGC AGCCTCCAGT GCAGCAGTTA AAGTCGACGA 2340 + CGATTCCATC CTAGAGTACG ACTCGGATAC CATTAATTTT TTAGGGGAAA GTCCCTGCTA 2400 + CCCGTCATCA GACGAAGAGT AGCGGGGATC GACATGAAAC TACTGATTGA TACGGGCGCG 2460 + GCAAAAAATT TTATCCGACC ATTTAAGGGG TTGAAAGGCG TCCGCCCGGT GCAGTCCCCA 2520 + TTTACAATCC ATTCGATTCA TGGTGTGACT ACAATAACTA AGAAATGTTT CGTGTCCATT 2580 + TTTAATCTTA AAGCTACCTT TTTTTTATTA CCAGACTTGA CCTCCTTTGA CGCGATCGTT 2640 + GGCCTAGACC TGTTAAAACA GGCCGGCGCG TCACTTTGCC TAGCTTCCGG CAAGCTCAAA 2700 + TGGGGCTCCG GAGCAGAGCA AATTGACTTT CATACTTGCC CCGATGTCAA TTTCACCAAA 2760 + GTAGATTGCT CGGACGCACC GCCCTTAATT AAGGATGCTT TTTTAAAAAT GCTCGGGAAT 2820 + AGGAAAAAAG CTTTTGCTGA TCCTAATGAG GCTCTTCCTT ACAATACGTC GGTGGTAGCC 2880 + ACCATCCGGA CGGTTGATGA GGAGCCCATT TATGCCAAGT TATACCCATA TCCCATGGGA 2940 + GCAGCTGACT TCGTCAACGG CGAAATTCAG GAACTGCTTA AAAATGGCAT AATCCAAAAG 3000 + TCAAAGTCCC CCTACAATAA CCCAATATGG GTCGTAGACA AAAAGGGCAC TGACGATGCG 3060 + GGCAATAAAA AAATGCGCTT GGTGCTGGAC TTTCGAAAAC TTAACGAAAG GACGGTACCA 3120 + GACAGATACC CCATGCCAAA TATCTCTATG ATATTGGGGA ATCTCGGCAA GGCCAAATAC 3180 + TTCACGACCC TCGATCTGAA GTCTGGCTAC CACCAAATCA CGCTCGCAGA ACGCGACCGT 3240 + GAAAAGACAG CGTTCGCAGT AAACGGAGGG AAGTATGAGT TCCGAAGGCT GCCATTCGGA 3300 + CTCAGGAATG CTGCAAGCAT CTTCCAAAGA ACAATTGACG ATATTCTGCG AGAGCAGATC 3360 + GGAAAGTTCT GCTACGTTTA CGTCGATGAC GTCATCATCT TTTCGGAAGA TGAAAACGAC 3420 + CATGTCAAGC ATGTAGATTG GGTTCTGAAG AGCCTGTACG ACGCTAACAT GAGAATATCG 3480 + GCAGAAAAGT CACGTTTTTT TAAGAAAAGC GTGAGCTTCC TGGGGTTCAT CGTCACCAAC 3540 + AATGGGGCGG CGACTGACCC AGAAAAGGTT AAGGCCATAA AGGAATTTCC GGAACCCAAA 3600 + AACGTATTTG AGGTAAGGTC ATTCTTGGGC TTAGCCAGCT ATTATCGTTG CTTTATCAAA 3660 + GACTTCGCAT CAATAGCTAG GCCCATTTCA GACATATTGA AGGGCGAGAA CGGTAGTGTT 3720 + AGCCGACACA GGTCCAGGAG TATCCAGGTA GAATTTTCCG AAGCGCAACA ACGTGCCTTC 3780 + GAAAAGCTAC GCAATATCCT GGCGTCTGAG GACGTCATCC TGAGATACCC TGATTACAAA 3840 + AAAGCGTTTG ATCTAACGAC AGACGCTTCG GCCTACGGCA TTGGCGCAGT GCTGTCCCAG 3900 + GAGGGACGTC CCATTACAAT GATCTCAAGG ACATTGTCTG ACAGAGAGGT TAACTATGCT 3960 + ACCAACGAAA GGGAGCTGTT AGCCATAGTC TGGGCACTGG CTAAGTTGCG GCACTACCTG 4020 + TATGCGGTTA AAGAGATAAA CATCTTTACC GATCACCAAC CTCTGACGTT CGCGGTATCG 4080 + GAGTCCAATC CGAACGCCAA AATTAAGAGA TGGAAAGCAC GCATCGACGA GTCCGGCGCA 4140 + CGAATTTTTT ACAAGCCTGG GAGAAACAAC CTCGTTGCAG ATGCCCTCTC GAGACAACAA 4200 + CTCAACGTTG TTGAAGAGCA AGAACCGGAG TCGTGCGCGG CCACGATTCA CAGCGAACTT 4260 + TCGCTTACGC ACACGATCGA GTCCACGGAC AAACCCGTGA ATTGCTTCCA GAACCAGATA 4320 + ATTTTGGAAG AGGCGCGCTC CCATTGGAAA CGCACTTTTA TATTATTTGG GAATAAGAGG 4380 + CGGCACTCGA TCAATTTCTC GTGCAAACAA GCTTTGCTGG AGGAACTCGC CAACATCATT 4440 + ATCCCTAATG GTGTAAACGC CTTCCACTGT GATCTTCACA CGCTGGCGCT AATCCAGGAC 4500 + GACGTAGTTC GACAGTTTCC AGCCACGAAA TTCTGGCATT GTAAGAATAG GGTCACCGAC 4560 + ATCTTCGCGA TGCAGGAGAG AAAAGAAATC CTCACCGTCG AGCACAACAG AGCTCACAGG 4620 + TCGGCCCAAG AAAACGTGAA ACAAGTACTC TCCGAGTACT ACTTCCCGAA AATGACCAAA 4680 + TTGGCGAGCG AAATAGCAGC CAATTGCAAA ACTTGCGCAA AGGCGAAGTA TGACAGACAT 4740 + CCGAAGAAGC AGGAGCTCGG TGAGACACCA GTCCCGACCC ACGTAGGAGA AATATTGCAC 4800 + ATCGATATTT TCTCAACGGA TAAAAAATAC TTTCTCACCT GTGTTGACAA GTTTTCTAAA 4860 + TTCGCCATGG TACAGCCGAT TCTGTCTAGA ACCATAGAAG ATTTGAAAGC ACCCCTTTTA 4920 + CAACTTATGA ATGTTTTCCC CAAAGCCAAA ACCATCTACT GCGACAATGA ACCATCATTG 4980 + AAATCGCAGA CAATAGTGGC TATGCTGGAA AACCATTTTG GCGTCAGCAT TTCGAATGCA 5040 + CCGCCCCTAC ATAGCGTCTC AAACGGACAG GTGGAACGAT TCCACAGCAC GTTAATTGAG 5100 + CTCGCCAGAT GCCTAAAAAT CGACAAAGGC ATAAGTGACA CAGTGGAATT GGTCTTGCTG 5160 + GCCACAGCCA GATATAACAT GTCCATCCAC TCCGTCATCA ATAAAAAACC GGCCGAAGTC 5220 + ATGCGGGCAG ATCCGGACGA TCCACATACC GATGTCCAAG AAAAAATCAA AAACGCCCAG 5280 + ATTTTGACAA GAAAACGAGA GAACGCTTCT CGGCAGAACA GAGTGTTCCA GGTCGGCGAC 5340 + AAAGTCCTAG TAAAGTCAAA CAGACGATTA GGCAACAAAC TTACTCCTTT ATGTGAGGAG 5400 + AAGACCATCG AGGCAGACTT GGGGACCACA GTCCTTATTA AAGGGAGGGT GGTCCATAAA 5460 + GACAACCTCA AGTGACCCAA GCAGAGCCTA GCCGCGGCTC CCTCGGAGGC ACACTTTTAT 5520 + TCCTCCAATT TGTAGCCACT CGGCATAAGT TTTTTCATTG TTTTTATAGC CGCTTGGCAT 5580 + AAGTTTTTTA TTTTTTAGCC ACTTGGCATA TTTTTTATAT ATTTTCGCTA TTATTGGTGG 5640 + TGGGCAACTC CATTCCGAAC AAGTAATAAT TTATCACACA CGTTACAGGT CGCTCCCAAC 5700 + CCTTCTTCTT TGTTTCCTGG CCACGACATC GGCCCACATT ACTGACTATT CCCGAGCGAA 5760 + TTACATTCCC GTCATTGACG GTAAAGTCTT AGTCTGGGAG GAATTCGCCT ATGTCAGACA 5820 + CTCGGCTAAC CTCTCCGAGT ATAGGCGGGT AATTGACGAA ACCGACAGCA TGCTCGATAT 5880 + GTTCCCCCAG TCCCATATGA AGAAGCTCCT GAGCGTTGAT ATCGCTCACC TCCGTGACAT 5940 + GCTTGATTCT TTGAGCATCC ATCACAGAGT GGCAAGGAGC CTAGACTTCT TGGGAACTGC 6000 + GTTAAAGGTT GTCGCAGGGA CACCTGACGC GGAAGACTTC GAGAAAGTCA AGTTCACTGA 6060 + AGCGCGGCTT GTTGATGCAC ACAATAGCCA AATCGAAATA AACACCAAAA CACAAGTTCG 6120 + AATTAACGAA CTCACTGATA CCATAAATAA ACTTTTAAAA ATTTCCAAAA GCGCTCAGAT 6180 + TGATACAGGT CACCTGTATG AAACGCTTTC TACTCGCAAC AGAATCATTG TAATGGAATT 6240 + GCAAAACTTA ATGCTCACTA TAACCCTCGC TAAAATTAAC GTAGTGAGTC CAAACTTCTT 6300 + GGACCACGCA GATCTGGAGA GTATTTGGGG CGAGGAGCCC ACCAACACCC CCATAAGGGA 6360 + GATTTTGTCC GTTGCGTCTG TAAAAGTCCT ACAATCCCTT AACATCTTAC ACTTTATTAT 6420 + TAAATTCCCC AAGATTATCA TGGCGTGCAA CAAAGTCACT ATCCTTCCAG TGGTACACCA 6480 + CGATACGGTG TTAAGGTTGA AAGATAATGT GGTAGCAGAG TGCAACAGAG AAATACGCAC 6540 + AGTAAAGAAT TGCTCCATAA CACCAGGGGC AACATTTTGC CAGTTATCTT CAGTGAGCTC 6600 + GTGTGCGCAG GAGCTCCACG CTGGGGTCGT AGCACATTGC GACGCACAGC AGAGTGATCT 6660 + ACATCCGATC ACCTACGTCG ACGAAGGAAT AATCGTCATC AATGACAGAC CAGCACTCGT 6720 + GCGTGTGGAC AATGGAACGG CCATCCACAT TAGAGGCACG CACCTCATAA CATTCATTGA 6780 + GAGTGCCATG GTCAACGAGA CCGTCTTCTT TAATCATGAC ATGGTCCAGA ATAGGGCGCC 6840 + GGGAGTGGCT AATTCCCCAG TCCTTAATAT CTCGATGAAA CACGAGGTCC TGAGCCTCCC 6900 + ATACCTTCAC CGTTTAAGTG AAAAGAACTT GGAGCAAATC AGGAACTTCG AGAAGGACGT 6960 + CGACGGATAC CGACTAAGTC AGATAGCGTT AGTTGCGGGA GCAATTTTCT GCGCTCTTAT 7020 + CTGCATCGGT TTAACCTGGC AGCGAACCAC TAGGGCCAAG AAATCTACAG CCCAACTGAA 7080 + GGAAGTTCTC GCCCAAATAG GGTCAGCCGA GGGCGGCCTT AATCTTGAGG AGGGAATAGT 7140 + TAACTAAGTT AACCGGACTG ATCGTCCGCA CACCAGCACC GGTCAAACTG CTGACCAAGC 7200 + ATTTGGCCGG AAGCTCATGC ATAGCCGGCA GAAGCTCTGC GCATTGGCAG AGGCCGCTAT 7260 + GATGTTTTTC CCTTTGTTAG CTTATAGTCA GTTTGATTTT GTATTCAATA AAGAGCGCAT 7320 + CGCGCCTTCA ATCAACTCCA GCTACTGCTG TTATCATTGA ATTGGTTGGC TAGCCTTAAG 7380 + GGCAGTCAAC AACGGAGAGA CGTTCTCCCA CCATATCTCC CAATCTAGGA GAAGAGGTCT 7440 + GCGGCAACCG CCCTGCCTCC CAGTGACAGA AGAACCCCCC GTTACCTGCA ACCTACGCCG 7500 + GAGACCGCGG CGAGGGACCT GCACCTTATA TTTAATTAAT TTAACT 7546 +// +ID TARTC standard; DNA; INV; 11124 BP. +XX +AC AY600955; +XX +DR FLYBASE; FBte0001208; Dmel\TART-C. +XX +FT source AY600955:1..11124 +FT SO_feature non_LTR_retrotransposon ; SO:0000189 +CC telomeric retrotransposon +FT SO_feature direct_repeat ; SO:0000314:1..331 +FT SO_feature direct_repeat ; SO:0000314:10383..10713 +FT SO_feature five_prime_UTR ; SO:0000204:1..205 +FT SO_feature three_prime_UTR ; SO:0000205:6629..11102 +FT SO_feature non_LTR_retrotransposon_polymeric_tract ; SO:0000433:11103..11124 +CC derived from polyA tail of RNA transposition intermediate +FT SO_feature CDS ; SO:0000316:206..3349 +FT SO_feature start_codon ; SO:0000318:1..3 +FT /name="Dmel\TART-element\gag" +FT /db_xref="FLYBASE:FBgn0014071" +FT /db_xref="NCBI_PROTEIN:AAT12844.1" +FT /db_xref="SPTREMBL:Q6J4U8" +FT /translation="MDGHNGDINEGWATVLSISSDDSNQLSSPPSIIVSSLDTTPTSN +FT ETTIVRRSLHNPKADMKSYRFENIVLNENKNTILPDPLFVDKCGNTANTTEANEKKPA +FT NSPFPISIIKNLSTSSPLTHVDTPTQEDDASAFNTLKAAKTARIIFPTHTQIKPAKPS +FT PPSKELSTNSAPKTLSYTDKITVTQKNLPDKTHVDRPTQDDDINATKASKTAKIISTQ +FT LHLRETKPTQPAKDPSPRTQKPIANKAAETLTHTDKLIASQNLVPAKTHINSPTQYND +FT TNATNALKTAKINFSSHSHQSEIKPTQSAKNISPLTQKQFTSESAGTHTHTDKHKNTA +FT SQNLFSAKTHINSPTQHNDTSAATASKTAKLILSPHSHLSETKPTQPALSPSPLSQKQ +FT ITSIAAKTLTHTNKHTASQNFIPAKTHINIPTQYNDTNATKALKTAKAASPSHTYSRQ +FT TKPIKPAINALHAAQDTNPSPAISAVTYTDKPTATQNIFPVKTFAELIRENAKRSPTP +FT IENPPQAKHDSAALGRPPTAARKNLNKTLISPKTPGKRRGDCLDEGLLQTSNKKVRIR +FT DDFSDDDLGVTNLLSETPLFKSKAAIKIRQDSRRESLQKSAEMDTAPAISPSNAAADP +FT DLPPWKTVPASRKPPSIFLSNIQQIIPLIEKLNYKAGVNSFTTKSELGNNIRIQAKTM +FT DAYNAIQNVLLEANIPLHSHQPKSAKGFQIVIRHLHQSTPTKWIESQLQDIGIATKFI +FT RAMQFRDTRNPMRIHEVEVVPKADGSHLKVLLIKSLGGQTVKVERKRVSKDPTQCHRC +FT QCFGHTKNYCRNPFKCMKCGQLHASVSCTKPKNLPATCANCNGSHVSSYKGCPVFQEA +FT KQRLSINKIQSLHSQPTHLQTPRNKHPYPKPTHIQTPLNKQPYTHPLPRTLVNNTKLP +FT AKRIQGKKISQRNLSINKRLNRIRTLDRKPRNETSPPTTSKKVLASLEESRKNPNSAL +FT NPANTHLTHFRPPPLAQNIPNDESKELSGEQYLLNRIEGMEKKLNNLLEIVTRLLSQG +FT KDCPKSPKNPFRDPIFV" +FT SO_feature CDS ; SO:0000316:3350..6628 +FT SO_feature start_codon ; SO:0000318:1..3 +FT /name="Dmel\TART-element\pol" +FT /db_xref="FLYBASE:FBgn0014072" +FT /db_xref="NCBI_PROTEIN:AAT12845.1" +FT /db_xref="SPTREMBL:Q6J4U7" +FT /translation="MLFLVTSEVTFPMTRECNRDILKIAFWNAGGINNKIDELKLFIL +FT NIDAHIIIVTETRLDNNSTKLELPGYFTYLAQNPASSKRGGVATIVNSSLRHMALEPI +FT EKECIQSAPIVLLPENNRRSEMIVIASVYCPPSLSWSPHHFTDVLNFAEKTMGGQTKL +FT ILCGDWNAKHRQWGCIRACQRGAALYDAIQADSMAEIVATGSATHFPHDTRKSPSAID +FT FSICKRLGRYEKRISSSAHLSSDHLPILLEINLDIKTISLQKQNNNILKKTTNIELFK +FT NVLERKILLNTEIRVAEDINDAINIFIKNIKDSAAESTPSPRIPDNHRRRYGQANRNS +FT HTLTLDENTSRLLEEKRIQSRIFKATRTNEDKTKLKAAENRLKKVIKILREKRINEQI +FT EGIDTNNPDRMRKIWRLLSEGKKMNQPNFPLKLETKKGPKWTKTIKETTEAFVSHLEG +FT RFKPNKIVPDYHIDKVNTGLRIIKESMLTERHNLNKNPHNQPITLNELNEEIKNLKNS +FT KAPGKDLITNQLIKTLPTKATLYLILIYNSILRLGYYPEAWKHAQVKMILKPGKSSNE +FT PKSYRPISLLSGLSKMFERLLLKRLFRVDLFKKAIPLHQFGFRKEHGTEQQIARVTQF +FT ILEAFERKEYCSAVFLDISEAFDRVWHEGLLLKLAKILPYNLYIILESYLTNRTFEVK +FT DQAGETSRTGQIGAGVPQGSNLGPLLYSIFSSDMPLPYIYRPSPTQRIMLSTYADDTI +FT VLSSDTLATAATRNNENYLKTFSDWADKWGISVNAAKTGHVIFTLKNDLPTNSMNVKI +FT KGQTIKKESKQSYLGVTLDSKLTLSSHVTKLLGKYSTAYRKLTWILNGRSKLPTKTKI +FT LILKSVLSPIWQYAIAAWGPLVTDAQIRRVQVEENRKIRDICRAGRYTRNQTIRDLFG +FT VKTVEEFYQQAMHRFSETIKSHPNIAVRRILSRHYIPNRLERSRQRYFKMTNDHITQK +FT QTGLALSPKLLKIPDIDDCRTVKKRSEREKIRQMHLTELPTLLRLEEEEEELKRIKKQ +FT EEREKRERENQKWPPDRWCELEINRYNKQYRKGDLTRQEVIEKFRGQPLNVQRIILPD +FT YEGD" +XX +CC A PNTR (Perfect Non-Terminal Repeat) is a perfect direct repeat partially +CC overlapping the UTRs (annotated as "direct_repeat ; SO:0000314"). +CC Distinguishing characteristics of PNTR’s are that the 3’ repeat terminates +CC upstream of the 3’ end of the element and that the 5’ PNTR extends a short +CC distance into ORF-1. The 5’ ends of TART-C elements are variable and the +CC minimal size for functionality has not been determined. Thus, this +CC canonical sequence, AY600955, may be 5’ truncated within the 5’ PNTR (M-L +CC Pardue, 2009). +XX +CC Derived from AY600955, Michael Ashburner, 6-Apr-2004; updated Jan-2009 as +CC per Mary-Lou Pardue and Greg DeBaryshe. +CC Any changes to original sequence record are annotated in an FT line. +XX +SQ Sequence 11124 BP; 3774 A; 2893 C; 2173 G; 2284 T; 0 other; + AAGCTTCGCG GGATATCGAT AACAATCAGG TGGTTAAAAA TACTATAACA TCGAGTACCA 60 + GCCGTGTTTT TCCTGTCGAT TTATCGAAGT CCAACAGCCC GCCTTCGCTC CGAACACAAA 120 + TCGGCAAGTC AGTAGCTTTT TTAACCCGGC AGTGGCGCCT GTGCAGCAGC TATTTAAAGT 180 + GAAAAACACG AAACGCAACA ACAAAATGGA CGGCCATAAT GGAGACATAA ATGAAGGATG 240 + GGCAACAGTA CTATCTATCT CGTCGGATGA TAGTAACCAA CTTTCGTCGC CGCCGTCAAT 300 + TATAGTCTCA TCGCTGGACA CCACGCCAAC GTCAAACGAA ACCACCATAG TAAGAAGAAG 360 + CCTACACAAC CCAAAAGCTG ACATGAAATC TTACAGATTT GAAAATATTG TATTAAATGA 420 + AAATAAAAAT ACCATATTGC CAGATCCTTT ATTTGTTGAT AAATGCGGAA ATACTGCTAA 480 + TACCACAGAA GCCAATGAAA AAAAGCCTGC CAATAGCCCC TTCCCCATTT CCATTATCAA 540 + GAATCTTAGC ACTTCCTCGC CACTAACACA TGTAGACACG CCTACACAAG AAGATGACGC 600 + CAGTGCATTC AATACATTGA AAGCAGCCAA AACAGCTAGA ATAATTTTTC CCACACACAC 660 + ACAGATAAAG CCCGCCAAAC CCTCGCCCCC TTCCAAAGAA TTAAGCACAA ACTCAGCACC 720 + CAAAACTCTT AGCTACACAG ACAAAATTAC AGTAACACAG AAAAATCTAC CCGACAAAAC 780 + ACATGTAGAC AGACCTACAC AAGATGACGA CATTAATGCA ACCAAAGCAT CAAAAACCGC 840 + CAAAATAATT TCTACACAGT TACACCTACG TGAAACCAAG CCAACACAGC CCGCCAAAGA 900 + CCCCTCACCC CGCACCCAAA AGCCTATTGC AAACAAAGCA GCCGAGACAC TCACCCACAC 960 + AGACAAACTC ATAGCATCAC AAAACCTAGT TCCCGCCAAA ACACATATAA ACTCCCCCAC 1020 + ACAATATAAC GACACTAATG CAACCAATGC ATTAAAAACC GCTAAAATAA ATTTCTCTTC 1080 + ACACTCACAC CAAAGTGAAA TCAAGCCAAC ACAGTCCGCC AAAAACATTT CACCCCTCAC 1140 + ACAAAAGCAA TTCACAAGCG AATCAGCCGG GACACACACC CATACAGACA AACACAAAAA 1200 + CACAGCATCA CAAAATCTCT TTTCCGCCAA AACACACATT AACTCACCCA CACAACATAA 1260 + CGACACTAGT GCAGCCACAG CATCAAAAAC CGCTAAATTA ATTCTCTCCC CACACTCACA 1320 + CCTAAGTGAA ACCAAGCCCA CACAGCCCGC TTTAAGCCCC TCGCCCCTCT CCCAGAAGCA 1380 + AATAACAAGC ATAGCAGCCA AGACACTCAC CCACACAAAC AAACACACAG CATCACAAAA 1440 + CTTTATTCCC GCCAAAACAC ATATAAACAT ACCCACACAA TATAACGACA CCAATGCAAC 1500 + CAAAGCATTA AAAACCGCAA AAGCAGCTTC TCCCTCCCAC ACATACTCAC GTCAGACAAA 1560 + ACCAATAAAG CCCGCCATAA ACGCATTGCA TGCCGCCCAA GACACAAACC CAAGCCCAGC 1620 + AATCAGTGCT GTCACTTACA CAGACAAACC CACAGCTACT CAGAATATTT TTCCTGTCAA 1680 + AACTTTTGCA GAGCTGATTA GAGAAAATGC AAAACGCTCA CCAACTCCAA TCGAAAATCC 1740 + CCCTCAAGCA AAACATGACT CTGCCGCCCT CGGACGCCCT CCGACTGCAG CTAGAAAAAA 1800 + TCTAAATAAA ACACTGATTT CTCCTAAAAC TCCTGGGAAG CGCCGTGGGG ACTGTCTTGA 1860 + TGAAGGCCTA CTTCAAACCT CTAACAAAAA GGTTAGAATA CGCGACGACT TCTCTGATGA 1920 + TGATCTGGGG GTCACAAACC TACTCTCTGA AACACCCTTA TTCAAAAGCA AAGCAGCTAT 1980 + TAAGATTCGG CAAGACTCGA GAAGAGAATC CCTGCAGAAG TCAGCTGAAA TGGACACAGC 2040 + TCCAGCAATA AGTCCCTCAA ACGCAGCAGC CGATCCCGAC CTACCGCCCT GGAAAACTGT 2100 + TCCAGCTAGC AGAAAACCAC CATCAATCTT CCTGTCCAAT ATACAGCAGA TTATCCCGCT 2160 + AATAGAAAAA CTAAACTATA AAGCCGGGGT AAATAGCTTT ACTACCAAGT CTGAACTTGG 2220 + CAACAATATT AGAATCCAGG CTAAAACGAT GGACGCCTAC AATGCAATTC AGAATGTCCT 2280 + CCTTGAAGCA AACATTCCCC TACACTCTCA CCAGCCAAAG AGTGCAAAGG GCTTCCAAAT 2340 + TGTAATTAGG CACCTCCACC AGTCAACCCC GACCAAATGG ATTGAAAGCC AACTTCAAGA 2400 + CATCGGTATA GCTACAAAAT TTATCAGGGC AATGCAGTTT AGGGACACGA GAAATCCTAT 2460 + GCGCATCCAT GAGGTTGAGG TTGTACCCAA GGCTGACGGC AGCCATCTTA AGGTCCTGCT 2520 + AATAAAATCC CTTGGAGGAC AAACGGTCAA GGTCGAAAGG AAACGGGTAT CGAAGGATCC 2580 + TACACAATGC CACCGCTGCC AATGCTTTGG ACACACAAAA AATTATTGCA GAAACCCGTT 2640 + TAAATGTATG AAATGTGGCC AGCTGCACGC CTCGGTCTCA TGCACCAAAC CCAAAAACCT 2700 + TCCGGCTACT TGTGCAAACT GCAATGGAAG CCACGTTAGC AGCTATAAAG GATGTCCTGT 2760 + TTTCCAAGAA GCAAAGCAAA GACTATCTAT CAACAAAATT CAATCCCTTC ACTCACAACC 2820 + CACCCACCTT CAGACCCCCC GCAATAAACA TCCCTACCCA AAACCCACCC ACATTCAGAC 2880 + GCCCCTCAAT AAGCAGCCCT ACACACACCC CCTCCCTCGC ACATTAGTAA ACAACACAAA 2940 + ACTACCTGCC AAAAGAATCC AAGGAAAGAA GATATCGCAA AGGAATCTAT CTATAAATAA 3000 + ACGCTTAAAC AGAATCAGGA CATTGGACAG AAAACCGAGG AATGAGACAA GCCCGCCGAC 3060 + AACTAGCAAA AAGGTCTTGG CCTCTCTAGA AGAAAGCAGA AAAAACCCAA ATAGCGCCCT 3120 + AAACCCGGCC AACACCCATC TCACTCATTT CCGCCCACCA CCATTAGCAC AAAATATTCC 3180 + TAATGACGAA TCTAAGGAGC TGAGTGGGGA GCAATACCTT TTAAATCGCA TTGAAGGGAT 3240 + GGAAAAGAAG CTCAACAACC TTCTTGAAAT CGTCACCCGC CTACTAAGCC AAGGAAAAGA 3300 + CTGTCCAAAG TCTCCAAAAA ATCCTTTCCG AGATCCAATC TTCGTTTAAA TGCTCTTTCT 3360 + AGTAACATCA GAAGTGACGT TTCCTATGAC TCGGGAGTGC AACAGGGACA TCCTTAAAAT 3420 + CGCTTTCTGG AATGCTGGTG GGATCAACAA TAAAATAGAT GAGCTTAAGC TGTTCATTCT 3480 + AAATATTGAT GCCCACATAA TCATAGTCAC CGAAACTAGA CTAGACAACA ATTCTACCAA 3540 + ACTAGAGCTG CCAGGATATT TCACATACTT AGCCCAAAAT CCTGCCTCTA GCAAGAGAGG 3600 + AGGAGTCGCC ACGATAGTAA ACAGTAGTCT CCGCCACATG GCCTTAGAAC CGATTGAAAA 3660 + GGAATGCATA CAGAGTGCCC CAATAGTATT ACTGCCTGAA AACAACAGAC GCAGCGAAAT 3720 + GATTGTAATA GCATCTGTCT ACTGTCCGCC TTCGCTAAGC TGGTCGCCCC ACCATTTTAC 3780 + TGACGTTCTC AATTTTGCTG AGAAAACTAT GGGAGGGCAG ACTAAGCTCA TTCTATGTGG 3840 + CGACTGGAAC GCAAAACATA GACAATGGGG TTGTATACGC GCCTGCCAAC GTGGCGCCGC 3900 + ACTCTACGAT GCAATTCAAG CAGACTCCAT GGCTGAAATC GTCGCGACTG GCAGCGCTAC 3960 + ACATTTCCCG CACGATACAA GGAAAAGCCC GTCAGCAATA GACTTCTCGA TATGTAAACG 4020 + GCTTGGCAGG TATGAAAAAA GAATCTCCTC AAGTGCACAC CTATCCTCAG ACCATCTTCC 4080 + CATATTACTT GAGATAAACC TAGATATAAA AACCATCTCC CTGCAAAAAC AAAACAACAA 4140 + TATCCTCAAG AAAACAACGA ACATTGAGCT CTTTAAGAAC GTTCTAGAAA GGAAGATACT 4200 + TCTAAACACT GAGATAAGGG TAGCAGAAGA CATAAATGAC GCCATAAACA TCTTTATTAA 4260 + AAACATCAAG GACTCGGCTG CTGAATCAAC TCCCTCCCCA AGAATTCCTG ATAACCACAG 4320 + AAGAAGATAT GGGCAAGCTA ACAGAAATAG TCATACGCTC ACACTAGACG AAAACACAAG 4380 + CAGATTGCTG GAAGAAAAAC GTATACAAAG TAGAATTTTT AAAGCTACTA GAACGAACGA 4440 + GGACAAAACT AAACTAAAAG CAGCTGAAAA TCGACTTAAA AAAGTAATCA AAATCTTAAG 4500 + AGAAAAGAGA ATCAATGAGC AAATTGAAGG AATTGACACA AATAACCCGG ACAGAATGAG 4560 + GAAAATTTGG AGGCTGCTGA GTGAAGGGAA AAAAATGAAT CAACCCAACT TTCCCCTCAA 4620 + ATTAGAAACC AAAAAAGGCC CTAAATGGAC TAAAACAATT AAGGAGACAA CAGAAGCGTT 4680 + TGTCTCCCAC CTGGAAGGAA GATTCAAGCC AAATAAAATT GTACCTGATT ACCACATAGA 4740 + TAAGGTTAAC ACCGGACTAA GAATAATTAA GGAAAGCATG CTAACAGAAC GACATAATCT 4800 + AAACAAAAAC CCCCATAACC AACCCATTAC GCTAAACGAA TTAAATGAAG AAATAAAAAA 4860 + CTTAAAGAAT AGCAAAGCAC CTGGTAAAGA CCTTATAACA AACCAGCTCA TAAAAACCCT 4920 + ACCGACTAAA GCTACCCTGT ACCTTATCCT AATCTATAAC TCCATACTTA GATTAGGATA 4980 + CTACCCTGAA GCCTGGAAAC ATGCACAGGT AAAAATGATC CTGAAGCCAG GGAAAAGCTC 5040 + AAACGAGCCG AAGTCATACA GGCCGATTAG TCTACTCTCG GGACTCTCTA AAATGTTTGA 5100 + AAGACTACTC CTAAAAAGAC TTTTTAGGGT AGATCTATTC AAAAAAGCCA TACCACTGCA 5160 + CCAATTTGGC TTCAGAAAAG AGCACGGAAC TGAGCAGCAA ATAGCCAGGG TCACCCAGTT 5220 + CATCCTCGAG GCCTTCGAGC GGAAGGAATA CTGCTCAGCG GTTTTCCTTG ACATCTCTGA 5280 + GGCCTTTGAT AGGGTATGGC ACGAAGGCCT TTTACTTAAA TTAGCTAAGA TCCTACCTTA 5340 + CAACCTATAC ATTATACTGG AGAGCTACCT TACAAATAGA ACGTTCGAAG TTAAAGACCA 5400 + AGCAGGAGAG ACTTCGAGAA CAGGACAAAT AGGCGCAGGA GTGCCTCAAG GAAGCAATCT 5460 + CGGACCACTA CTTTACTCTA TCTTCTCCTC TGACATGCCC CTCCCATATA TCTACCGCCC 5520 + TTCACCAACA CAAAGAATTA TGCTCTCAAC ATACGCAGAC GACACTATAG TCCTCAGCTC 5580 + AGACACACTA GCAACTGCCG CCACAAGAAA CAACGAAAAC TACCTCAAGA CATTTTCGGA 5640 + CTGGGCGGAC AAATGGGGTA TCTCAGTAAA CGCTGCTAAA ACCGGACATG TCATTTTTAC 5700 + ATTAAAAAAC GACTTACCTA CAAACTCAAT GAATGTGAAG ATCAAGGGTC AAACAATAAA 5760 + GAAGGAAAGC AAGCAATCAT ACCTTGGGGT AACCCTTGAT AGCAAGCTAA CCCTTAGCTC 5820 + TCACGTCACA AAGCTATTGG GTAAATACTC TACAGCCTAC AGAAAATTGA CATGGATCCT 5880 + AAACGGAAGA AGTAAACTCC CTACTAAAAC TAAGATACTG ATCCTTAAAT CAGTTTTATC 5940 + ACCAATATGG CAGTATGCCA TAGCAGCTTG GGGTCCCCTT GTGACAGATG CACAGATAAG 6000 + GAGGGTCCAG GTTGAGGAAA ACAGAAAAAT AAGAGACATA TGTAGAGCGG GAAGATATAC 6060 + GAGAAACCAA ACTATAAGGG ACCTTTTTGG CGTCAAAACA GTAGAAGAAT TCTATCAACA 6120 + GGCTATGCAC AGGTTCTCAG AAACTATAAA ATCGCACCCA AATATAGCTG TTCGCAGGAT 6180 + TCTCTCTAGG CACTATATCC CGAACAGACT AGAAAGAAGC AGGCAGAGGT ACTTTAAAAT 6240 + GACAAATGAT CATATCACGC AAAAGCAGAC TGGACTTGCC CTCTCACCTA AACTCTTAAA 6300 + AATCCCTGAT ATAGATGACT GCAGAACCGT AAAAAAGCGT AGCGAGAGAG AGAAAATAAG 6360 + ACAAATGCAT CTAACTGAAC TCCCCACCTT GCTGAGACTA GAGGAAGAGG AGGAAGAGCT 6420 + CAAAAGAATA AAAAAACAGG AAGAAAGGGA AAAAAGAGAA AGGGAAAACC AAAAGTGGCC 6480 + TCCAGATAGA TGGTGCGAAT TGGAAATAAA CCGATATAAT AAACAATATA GAAAGGGCGA 6540 + CCTAACCAGG CAGGAAGTTA TAGAAAAATT CAGAGGGCAA CCATTAAATG TACAACGAAT 6600 + AATCCTACCC GACTATGAAG GGGACTAAAA TTAAATCAAA ACAAACCAGG ACAGGAGCAG 6660 + AAGGCAGAAA TAATCAAAAC TGGCGGAAGG GGTGGCAAAA TATTGAAAAG AGAGGAAAGA 6720 + AATATAAAAA GGCTAAAGGC TAAGTTACAG GTTACATAAA AAGGGAAATC TGCTTATAGA 6780 + TATTATGGTA AAATTAACTT AACTAAACAC CTACTGGTTA ACAAAATAAT TATGCCTGCA 6840 + TGGCACAAGC TGCGTACTCA AATCATTTCT CCTGACGCTA TTGAAAATCC ATCTTTACTT 6900 + TCCAACCGAG GGACTTGCGA CTGCGGTCTT TCCGCCTTAT TGGCTCCTTA TGGATCCATC 6960 + TGCTGCCGTA TTGGGCGACA CACCAGCGCT CCAACCTAAA AGAGAGATAA CATGTTTTAA 7020 + TTCACTTTCC TTTTCTTATA ACTAAATCAC AACAACAGCA ACAGCGCATC GGGCGACTGA 7080 + CAAAAGCATT AGCTCACCAA GTCAGCAACA ACAGCAGCAG CAAGACCAGA ATCAGTTGAG 7140 + GAGGAGGCCT GGTGGTGTGC TGAACATTTC GCCGCCCACA CCCACCATTT CTGTAGGCCT 7200 + GTATGACCCT GAGCCCAACG CCGGCATGGC AAATCCGGTC TTCCTGAGGA GGCGGGGCTC 7260 + TAGTGTTAGG CGCGCTTTTG CCCCAAAAGC AACAACGACA GCGGCAGTAG GGTCGGCGCC 7320 + CCCTGCGTGA CCGAGTCCAT CTTAGCAATC GGTCCTTTTG GCGGTGTTAT GCCGACGCGG 7380 + CGGTCGCGCT TATGAGGACT GCCTGCAATG CTTGGCCATG AGACGGCGTC ATCGACAACA 7440 + TTTCAATCAC GCTCAGCTGG TTGACCGGGG GCAACATGCT TGCCATGCAG CAACAATGGT 7500 + GCATGCAGTC CAGCATGCAG CAACAACAAC AATATTGGCA GCAGCAGACT AATGTTTCGC 7560 + AGCAGATTCC ATCTGGCAAC TTCCGACGAC CAGACTCCTC GCTTGGCCCC TGGAGACTCG 7620 + CTCTGGAAAA AAAAAGAAAG AAGCATGGAT TAGTTTTTTT TTTTCCCTTT AGCTATTGGA 7680 + TTAAATTTCT TTCCTGGACA ACCGGCGCCT TCATGCAGAT GACGCTGGAC TGCGGCGATT 7740 + CTTTCCCTCC AGCCACAGAT GGGAAGCTCA CATCATGGCA TATATGCGGC ATCGTGCTAA 7800 + TCAGCTCCCC ATGCTGAGCG AGATCTTGAT GCGGCGATGC ACTCACTAGC GAGCAGCGGG 7860 + AACAGCATAC AGCGTCAGCA ACAGCAGGAA GAGACTTTGT AGCAGAAGCC TTTCGGCATT 7920 + CTCCGACGAC CCGACTCCTC GATCGGGGTC AGGCAAATTC TCCTGGACCG ACAAATTTTC 7980 + CCGGCGTTTC GTCCTGGAAT AAGGAAGGAA GCACGGATTA ATTTCTCCCC TTCAGCTTAC 8040 + GACCCTTCTC ACCAACAGCA GCAACTACAA CAACATCGGC AGCAGACGAC TTGCAGCTGC 8100 + TTGGCTCACC TAATGCGACA GCAATAATCC CGGCAAGGCC AGAAACGGCA CCGAGCAGAA 8160 + GCACGACAGG GTGAAGAACA ACATGCCGCC CACGTCCACC AATCCGGAAG CCCTGCATTA 8220 + GGGGTCTGAA GCGCCATTAA CTGGAGGATC CGGCAGCGTA TGCCTACGCA GAAGCGGGGC 8280 + GTCGTAAATC CGGTGGCCGG AATAGCGCCT TGAACAGCAT GCTGTGTATG TTTGCCCCAA 8340 + AAGCAGAAAC TGCCGCAGCA AAGGAACCGC AAGCAGGATC ATCACTCGTG GCAAACTGGC 8400 + GTATTCCTGT TGAAGACGCG GGACTGCGGC GCATTCTTCC TTTCCAACCG GGGGCTTTAG 8460 + CGCTGCGGTA TTTCTGCTTT CACGGCTCCA TTTGCTGCTG CATCTGACGC CTCATCAGCG 8520 + CTCCTCCCTG AAAGAAAGAG AATATGTATT AGTTTTCTTT CCATTCCTTA CAATCTCTCT 8580 + CACCAAACCT CCACGACACA ACAACAGCAG CAGAAACAGG TCTAGCCCAC AATGGCAGCA 8640 + GCTACAGCAA TCAGCAGAAG CAAGGCCGGC AAAAGCAACA ACAAAAGCCC TCTCTGAAAG 8700 + CCCGGATGTG GAGACTGAAG CGCCGGAAAC TTGAGGATCC GCCCCCGATG CACGCCCACC 8760 + AACAATAAGC TGGAGGAGAA GTTACTGAAG CATGGGAAGC AGCACCAGGG GTCGCATACG 8820 + CAGCGTCAGG GCTTTGCGAA CCAGATGAAT GAGGAGAGAC TGGAACAGCA TAACATCAGC 8880 + GGCAGCAACA ACAGCGCCAC GAGGGTCAGC GGCGTCTGCA TGGCTGTGTC CAAAACAACT 8940 + CCAATTCAAC TGCTGTATGA TGCAGCGCAC CAGCGGCTTT CACAGGGACC GTCTGAAACG 9000 + CTTGGCAGGA GCCGGCTGAA GGCCTGGGCG AAGACACTGG AGACACCAAT GCGGCTCCTT 9060 + TCGGCCGACG GCAACAGGCT TGCCATGCAA TAAGAACAGT AAATCCTGAA ATAACAGCAG 9120 + AAGATACAGA CGTCCAAATT GCGAACACTG ACGCCAGCCC TCACCTGAAC GACTCACTGT 9180 + GCAGCAGCAG CAACATCAGC ACCGATGCCC TCAGCATCGG CAGCAGAGGG TGTTTTTGGC 9240 + CTTTGACAAT TCCCTGCGAC TTGACTTCTT CTTGGCATCT GGTCAATCAT CACGTGCCAG 9300 + CAAACAGTGG CTTGTCACCC TGGAAGAAAG AAGACTGGAT TAGCTTCTCC CCTTCTAATA 9360 + CATTTTGTGT GTTGAAATGC ATCAGGCGGC GACACACTCA CCAGCAACAG CAGCAACAAC 9420 + ACCAGCGGCA CCGGTAGCAG GAAATGGATC CTCAGCAAAA ACCATCGGCA CTTTCAGACG 9480 + TCCCGTACTC CTCGCCTGGC CCTGGCCGGT AACAGGGGCT TGTTAGATGG AGAAGACGAC 9540 + GGTCATCCGA CGGACAGCAG CCTGAAGATG GAAGCAGGCC TACGCTGCCC ACCTCTCCGA 9600 + TGCCTGCAGC AGCAACGGCA GCGGCTCATA AATGCAAACT GGCGCCAGCC CTCGGCTCTT 9660 + CGGGCTCATG TAGGCGGTGA CACACTCACT AGCAGCTAAA ACAGCAACGG CGGAATTAGT 9720 + AGAAGCAATG TTTTGCCGCA GCTGCCAGAT GGCATACTCC TAGCTTGGCC CCTGCCCAAA 9780 + CCGTATTGGA CCGGCAAATG ATTCGACAAT CCGATCTGGA AAAAATAAGT ATTGATTAAT 9840 + TTTTCCCCCA CAGATTGGTA TAAAATTGCA TTTACGGCCA ACCGGCTTCT TCCTGTTGAT 9900 + GACGTCACGC TGCGCCGCAT GCTTTTCGCC AGCCACAGTT GGAATGCATG CATTGGGGTT 9960 + GACGGTCCGG ATGGGCCGTT GCCTGTTATA TGCTGGCATC TCCGCAGCGG CGTTGTGAGC 10020 + AACGACACTG AAAGCAACAA TAATATTGTT AATTACTGCT CAAAACTATA ACACATTTAA 10080 + TCACTTACAC AATTTACACA CGCTTCCTGC CTAGGAGTTG TGGGACCAGC TACCGATAAT 10140 + GCCAACAATA CCGGGAAACG CGTCGCGGGA CATCGATAAC AATTTGGCGG TTAAAATGCT 10200 + AGAACATCGA GTACCAGACA TGTTTTTCCT GCCGATATAT CGAAGCCCAA TAGCCGCCAA 10260 + CGCTCAAAAC ATAAATCGGA GTGTGAGACC AGATACTGAA GCCGTTAAAA GCTTTTACCG 10320 + GCATCGGTAG CTGGTCTCAC ACTCCGATTT AAATTTGGAG CGTTGGCGGG CTGTTTGACG 10380 + CGAAGCTTCG CGGGATATCG ATAACAATCA GGTGGTTAAA AATACTATAA CATCGAGTAC 10440 + CAGCCGTGTT TTTCCTGTCG ATTTATCGAA GTCCAACAGC CCGCCTTCGC TCCGAACACA 10500 + AATCGGCAAG TCAGTAGCTT TTTTAACCCG GCAGTGGCGC CTGTGCAGCA GCTATTTAAA 10560 + GTGAAAAACA CGAAACGCAA CAACAAAATG GACGGCCATA ATGGAGACAT AAATGAAGGA 10620 + TGGGCAACAG TACTATCTAT CTCGTCGGAT GATAGTAACC AACTTTCGTC GCCGCCGTCA 10680 + ATTATAGTCT CATCGCTGGA CACCACGCCA ACGCCTGTCT AATGCAAATC AACTTACATA 10740 + TTACTCTAAA ATCTACTTAT AACTGTCCCC TCTAATGATA AGCAATTTTT ATGTTTACTT 10800 + TAAACTTAAA CCGATACCTT AAACTATGGC GCGCAAAATG ACTACCAAGA AATCTAAAAC 10860 + TGTAAATTGT TGCAAACTAT TTCTCCTAGT AATGTTAAAT TTAAATGCGC GCATAACCGC 10920 + AGCCAAGTTA ACCAAAAATG TCACTCGTAA ATGTAATTCC TAAATTAACA CTTGTAACTA 10980 + AGCGCGTATA AATACCGCAA ATCCAAAAAT GTAAATATGC CATAAATTGT TACTATATAT 11040 + TTTTAAAAAA GAAAAATCAG AGTACAATAA AAATGCCAGC GTCTATTAGG CGTTGAAAAT 11100 + TTAAAAAAAA AAAAAAAAAA AAAA 11124 +// +ID AY561850 standard; DNA; INV; 13424 BP. +XX +AC AY561850; +XX +DR FLYBASE; FBte0001206; Dmel\TART-A. +XX +FT source AY561850:1..13424 +FT SO_feature non_LTR_retrotransposon ; SO:0000189 +CC telomeric retrotransposon +FT SO_feature direct_repeat ; SO:0000314:1..1850 +FT SO_feature direct_repeat ; SO:0000314:11179..13028 +FT SO_feature five_prime_UTR ; SO:0000204:1..1759 +FT SO_feature three_prime_UTR ; SO:0000205:7953..13411 +FT SO_feature non_LTR_retrotransposon_polymeric_tract ; SO:0000433:13412..13424 +CC derived from polyA tail of RNA transposition intermediate +FT SO_feature CDS ; SO:0000316:1760..4672 +FT SO_feature start_codon ; SO:0000318:1..3 +FT /db_xref="FLYBASE:FBgnXXXXXXX" +FT /db_xref="GI:45594384" +FT /db_xref="NCBI_PROTEIN:AAS68533.1" +FT /translation="MDGQNVNQSGGWASVLSISSDDGNCSSSPPSAIVSSLDTTPTSN +FT ETTIVRRSLYQTNADMKSYDFENIVLNENKNTILPDPLFVDKCGSTANTTEANEKQPA +FT DSPFPISISKNFSTSSPLTHVDTPTQEDDASAFNTLKAAKTARIIFPTHTQIEPAKPS +FT PPSKELSSNSAPKTLSYTDKITATQKNFPTKTHVDTPTQDDDTNATKASKTAQIDSSH +FT SQLHETKPTQPAKNPSPLTQKLTTNKTAKTHTHTDKPTASQNLFPTKTHINSPTQYND +FT TNASTASKDGKINLSSHSHLRETKPTQPAKNPSPLSQKQITSIAANTLTHTNKHTASQ +FT NFIPAKTHINIPTQYNDTNATKALKTAKPASPSHTYSRQTKPIKPAINALHPAQDTNP +FT SPAISAVTYTDKPTATQNIFPAKTFAELVRENAKRSQTAMQNPPHAKHDSAALGRLPS +FT AARKNLTKTLSSPKTPGKRRGDCLDEGLLQTSNKKVRIRDDFSDDDLGVTNLLSETPI +FT FKSKVAIKIRQDSRRESLQKSVEMDTAPAISPSNTAAEPDLPPWKTVPASRKPPSIFL +FT SNIQQIIPLIEKLNYKAGVNSFTTKSELGNNIRIQAKTMDAYKAIQNVLLGANIPLHS +FT HQPKSAKGFQIVIRHLHQSTPTKWIESQLQDIGIATKFIRAMQFRDTRNPMRIHEVEV +FT VPKADGSHLKVLLLKSLGGQTVKVERKRVSKDPTQCHRCQCFGHTKNYCRNPFKCMKC +FT GQLHATVSCTKPKNLPATCANCNGSHVSSYKGCPAFQEAKQRLSINKIQSLHSQPTHL +FT QTPRNKHPYPKPTHFQTPRNKQSYTHPPPRTTVNNTKLPAKRIQGKKLSQRNISINKR +FT LNRIRAFDKKPRKETSPPTTSKKVLASLEESSKNPNSVLNPANTHLTHFCPPPITQDI +FT PNDEPTEPSQEQYLLNRIEGMEKKLNNLLEIVTRLLNQGRECPKSPKNPFRDPILI" +FT SO_feature CDS ; SO:0000316:4710..7952 +FT SO_feature start_codon ; SO:0000318:1..3 +FT /db_xref="FLYBASE:FBgnXXXXXXX" +FT /db_xref="GI:45594385" +FT /db_xref="NCBI_PROTEIN:AAS68534.1" +FT /translation="MTRACNRDILKIAFWNAGGINNKIDELKLFILNIDAHIVIVTET +FT RLDNKSTKLELPGYFTYLAQNPVSSKRGGVATIVNSSIRHMALEPIEKECIQSAPIVL +FT LPENNRRSEMIVIASVYCPPSLSWSPHHFTDVLNFAEKTLGGQTKFILCGDWNAKHRQ +FT WGCTRACQRGTALYEAVQADPMAEIIATGCATHFPHDTRKNPSAIDFSICKGLGRLEK +FT RISSSADLSSDHLPILLEINLDTSTLFLQKQNNNILKKTTNIELFKTVLERKILLNTE +FT IRVAEDINDAINIFIKNIKDSADESTPSPRIPDNLRRMHGQANRNSHTLTLDENTSRL +FT LEEKRILSRIFKATRTDEDKAKLKAAENRLKKAVKILREKRINKQIEGIDTKNPDRMR +FT KMWRLLDEGKKTNQPNFPLKLETKRGPKWTKTIKETTEAFVSHLEGRFKPNNNVPDYH +FT INTVNSGLRTIKESMLTERYDVNKNPCNQPITLKELNDEIKNLKNSKAPGKDLITNQL +FT IKTLPTKATLYLILIYNSILRIGYYPDAWKHAQVKMILKPGKSVNDPKSYRPISLLSG +FT LSKMFERLLLKRLFRVDLFKKAIPLHQFGFRKEHGTEQQIARVTQFILEAFERKEYCS +FT AVFLDISEAFDRVWHEGLLLKLAKILPYNLYIILESYLTNRTFEVKDQAGETSRAGQI +FT GAGVPQGSNLGPILYSIFSSDMPLPHIYHPSPTERIMLSTYADDTIVLSSDILATAAT +FT RNNENYLKTFSDWADKWGISVNAAKTGHVIYTLKNDIPTNLKTMKIKGQAIKKESKQS +FT YLGVILDSKLTLSPHVTKVVGKYLTAYRKMSWILNERSKLPTNTKMLILKSVLSPIWQ +FT YAIAAWGPLVTDAQIRRIQVEENRKMRDICRAGRYTKNQTIRDRYCVKTVEEFYQQAV +FT HRFSETTKSHPNVAVRRIFSRHYIPNRLERSRQRYLKMTMDHITQKQTGLTLSPKLLK +FT IPDLDDCRTLKKRSEREKIRQTHLTELPTLLRLEEEEAELKRIKKQEERERRERENQK +FT WPPDRWCELEINRYNKKYRNGDLTRQEIIEKFRGQPLNVQRIILPDYEGD" +XX +CC A PNTR (Perfect Non-Terminal Repeat) is a perfect direct repeat partially +CC overlapping the UTRs (annotated as "direct_repeat ; SO:0000314"). +CC Distinguishing characteristics of PNTR’s are that the 3’ repeat terminates +CC upstream of the 3’ end of the element and that the 5’ PNTR extends a short +CC distance into ORF-1. The 5’ ends of TART-A elements are variable and the +CC minimal size for functionality has not been determined. Thus, this +CC canonical sequence, AY561850, may be 5’ truncated within the 5’ PNTR (M-L +CC Pardue, 2009). +XX +CC Derived from AY561850, Michael Ashburner, 6-Apr-2004; updated Jan-2009 as +CC per Mary-Lou Pardue and Greg DeBaryshe. +CC Any changes to original sequence record are annotated in an FT line. +XX +SQ Sequence 13424 BP; 4373 A; 3415 C; 2870 G; 2766 T; 0 other; + CACGCTTTTT GGCCCCTGGC CGATCTTCAT ATATCTCAAA TCGACGGCTG CTTTTACCCT 60 + GGAAAAAAAA AAAGGAGCTT GGGTTATATT GAACTACACT AGGCGGCGAC ACACTCACCA 120 + GCAGCAGCCA GAACAACAAC AGCGGCAGAA GTAGCAGGAA ATTATCTCAC TGCAAAATCC 180 + AATTGGCACT TTCCGAAGTC CGTATTTCTC GCCTGGCCCC TGGCCAGTAA CAGGGGCCTG 240 + TGCGACGGAG ATGACGACGA TGATCTGCCC TGTGGACGGC CTCAAGAAGG AATCGGCCCT 300 + GTACTGCCCA CCTGACCTGT GCCAGGATAG CAGCAATGTC AGCGGACCAT GGATGGAAGA 360 + GGCGGCACTG GCGACGGTCC TCAGTTTTGC GGTTTCCGCG GGGCGTAGGC GCAGTAATCG 420 + GCGGCAGCAA CAGTGGCGGC AGCAGAAGGG AATGTGTATC TGCAGTCGCC GAATGGCAAT 480 + TTCCTGCCCA GCTGTAATGG ACCGCCAAAT GTTTTTTGGC ATGTCGACCT GTAAGAAAGA 540 + AGCAAGGATA AGTTTTTTCT TTACAAGATT GTATATGAAT TTGTATTTAC GGACAACTGG 600 + CTTGTTTCCT GTCGACGATA AATGGCGCTT CATGTTTTCA CTCTGCCAAA ATCTGAGTGC 660 + AAGCATCGGG GCTGACGGGC CGAATTTGCT GATGCCTTGT ACATGCTAGC ATCTTTATGC 720 + CGCCGTGTAA TTTTGCGACA GCAAAACACA TGATGGAGAA GACGAAGGTG ATCGATGGCG 780 + CCCGGATGAC GGATGCAGGC CCGTGCTACC CACTGGTCCG TTGCCAGGAC AGCAGCGTTT 840 + CAATTATGCG AACAGAGGCA CTGGAGCCAC TTCTCAGGCG ATAGGGATCA TGAGGCGACG 900 + ACAACTCGCC AGCAGCAGTA ACAACAACAG CGGCAGCAGC GATCTCGGAC TTGCTGAACA 960 + TTGCGGCTTT TTCCCAGCCT GGACCGTCAT CACAAACGCT CTCAAAGATC GGTGCGCCTG 1020 + CAGCCTACGG AAGCGTACAA CTGCCCAAAG TCGTGCTATT GCATAATGTT AGGTGTCCTG 1080 + GCTGCTCCGG CGGATGAGCT CCACCCGATT GAGAGAGGTA AGAAGGCCCA GCAAGTCGCC 1140 + CTTAAATAAA AGAAACAAGC ATTAGACTCG GCTGAAATTG TAACATCAGT CAGACTGTAC 1200 + TCACGCATGC ACTTAGACAA ACCGAAGCCT ATTCTATTGA CGACGCGGAC TCCAACACAT 1260 + GTTTTCCTCC ACAAAAGGCT GTGAGTGCAC CAAAGTTGAC GGGCCACGCC GGCCGATGCT 1320 + TGCTGCATAC CGGCATCTCC GCAGCAGCGA CGTTACAAGC ACCACTAAAA TTAGAAAGAG 1380 + GCTTACTATA GGCAAAGCGC AGAAAAACAA ATATTACAAT AAGAAATAGC ACGCGATTTT 1440 + TCTGCTTCGT TTCCGCTTGG TACAAGTGAG ACCATTCTCC CTATATGCCA TTCTAGTATA 1500 + TTTGCCCGAT AAGCGATATG CTGGCGGCAA AAAAAAAAGA TAATAGCCGA TAAGCCCGCC 1560 + AAAAAAAAAG CGCGAAATAT CGATAACGAG CTGGCACGAA AATTGCTGGC ATATCGATCA 1620 + ACCGCTGTGT CTTTGAGCTA TCGAAAAAGC CCGCCTACGC GCCTAGCCCA AATTTGCAAG 1680 + TCAGTTGAGA TTATAAAACC GACAGAGGCG CGCGCGCAAC AGTAGCTAAA AGTGAAGCCA 1740 + GCAGCAACAA CAACAACTAA TGGACGGCCA GAACGTGAAC CAAAGCGGAG GATGGGCATC 1800 + GGTTTTATCC ATCTCATCGG ACGATGGTAA CTGCTCATCC TCGCCGCCAT CAGCTATAGT 1860 + CTCATCGCTG GATACCACGC CAACGTCAAA TGAAACCACC ATAGTAAGAA GAAGCCTATA 1920 + TCAAACAAAT GCCGACATGA AATCTTACGA TTTTGAAAAT ATTGTATTAA ATGAAAATAA 1980 + AAATACCATA TTGCCAGACC CTTTATTTGT TGATAAATGC GGGAGTACTG CTAATACCAC 2040 + AGAAGCCAAT GAAAAACAGC CTGCCGATAG CCCCTTCCCC ATTTCCATAA GCAAAAATTT 2100 + TAGCACTTCC TCGCCACTAA CACATGTAGA CACGCCTACA CAAGAAGATG ACGCCAGTGC 2160 + ATTTAATACA TTGAAAGCAG CCAAAACAGC TAGAATAATT TTTCCCACAC ACACACAGAT 2220 + AGAGCCCGCC AAACCCTCGC CCCCCTCCAA AGAATTAAGC TCAAACTCAG CACCCAAAAC 2280 + TCTTAGCTAC ACAGACAAAA TTACAGCAAC ACAGAAAAAT TTCCCCACTA AAACACATGT 2340 + AGACACACCT ACACAAGACG ATGACACTAA TGCAACCAAA GCATCAAAAA CCGCCCAAAT 2400 + AGATTCATCA CACTCACAAC TACATGAAAC CAAGCCAACA CAGCCCGCCA AAAACCCTTC 2460 + ACCCCTCACC CAAAAGCTAA CCACAAACAA AACAGCCAAG ACACACACAC ACACAGACAA 2520 + ACCGACAGCG TCACAAAATC TTTTTCCCAC CAAAACACAT ATAAACTCAC CCACACAATA 2580 + TAACGACACT AATGCAAGCA CAGCATCAAA AGACGGTAAA ATAAACCTCT CTTCACACTC 2640 + ACACTTACGT GAAACCAAGC CAACACAGCC CGCCAAAAAC CCCTCACCCC TCTCCCAGAA 2700 + GCAAATAACA AGCATAGCAG CCAATACACT CACCCACACA AACAAACACA CAGCATCACA 2760 + AAACTTTATT CCCGCCAAAA CACATATAAA CATACCCACA CAATATAACG ACACCAATGC 2820 + AACCAAAGCA TTAAAAACCG CAAAACCAGC TTCTCCCTCC CACACATACT CACGCCAGAC 2880 + AAAACCAATA AAGCCCGCCA TAAACGCATT GCATCCCGCC CAAGACACAA ACCCAAGTCC 2940 + AGCAATCAGT GCTGTCACTT ACACAGACAA ACCCACAGCT ACTCAGAATA TTTTTCCTGC 3000 + CAAAACTTTT GCAGAGCTGG TGAGAGAAAA TGCTAAACGC TCACAAACTG CAATGCAAAA 3060 + TCCCCCTCAT GCAAAACATG ACTCTGCCGC CCTCGGACGC TTACCGAGTG CAGCTAGAAA 3120 + AAACCTAACT AAAACACTGA GTTCTCCTAA AACTCCTGGG AAGCGCCGCG GGGACTGTTT 3180 + GGATGAGGGC TTACTTCAAA CCTCTAACAA AAAGGTTAGA ATACGCGACG ACTTCTCTGA 3240 + TGATGATCTG GGGGTCACAA ATCTACTCTC CGAAACACCC ATATTCAAAA GCAAAGTAGC 3300 + TATTAAAATT CGGCAAGACT CAAGAAGAGA ATCCCTGCAG AAGTCAGTTG AAATGGACAC 3360 + AGCACCAGCA ATTAGTCCCT CAAACACAGC AGCTGAGCCC GACCTACCGC CCTGGAAAAC 3420 + TGTTCCAGCT AGCAGAAAAC CACCATCAAT CTTCTTGTCC AATATTCAGC AGATTATCCC 3480 + GCTAATAGAA AAACTAAACT ATAAAGCCGG GGTAAATAGC TTTACTACCA AATCTGAACT 3540 + TGGCAACAAT ATTAGAATCC AGGCTAAAAC GATGGATGCC TATAAAGCAA TTCAGAATGT 3600 + CCTCCTTGGG GCAAACATTC CCCTACACTC TCACCAGCCA AAGAGCGCAA AGGGCTTCCA 3660 + AATTGTAATT AGGCACCTCC ACCAGTCAAC CCCGACCAAA TGGATTGAAA GCCAACTTCA 3720 + AGACATCGGT ATAGCTACAA AATTCATCAG GGCAATGCAG TTTAGGGACA CGAGAAATCC 3780 + TATGCGCATT CATGAGGTTG AGGTTGTACC CAAGGCTGAC GGCAGCCATC TCAAGGTCCT 3840 + GCTACTAAAA TCCCTTGGAG GTCAAACGGT CAAGGTTGAA AGGAAACGGG TATCGAAGGA 3900 + TCCCACACAA TGTCATCGCT GCCAATGTTT TGGGCATACA AAAAATTATT GTAGAAACCC 3960 + GTTTAAATGT ATGAAATGTG GCCAGCTGCA CGCCACGGTT TCTTGCACTA AACCCAAAAA 4020 + CCTTCCGGCT ACTTGTGCAA ACTGCAATGG AAGCCACGTA AGCAGCTATA AAGGATGTCC 4080 + TGCTTTCCAA GAAGCAAAGC AAAGACTATC TATCAACAAA ATTCAATCCC TACACTCACA 4140 + ACCCACGCAC CTTCAGACCC CCCGCAATAA ACATCCCTAC CCAAAACCCA CCCACTTTCA 4200 + GACGCCCCGC AATAAGCAGT CCTACACACA CCCCCCTCCT CGAACAACAG TAAACAACAC 4260 + AAAATTACCT GCCAAAAGAA TCCAAGGAAA AAAGTTATCG CAAAGGAACA TATCTATAAA 4320 + TAAACGCTTA AATAGAATTA GGGCTTTTGA CAAGAAACCG AGAAAGGAGA CAAGCCCGCC 4380 + GACAACTAGC AAAAAGGTAC TGGCCTCCCT AGAAGAAAGC AGCAAAAACC CAAACAGCGT 4440 + CCTAAACCCA GCCAACACCC ATCTCACTCA TTTCTGTCCA CCCCCAATAA CACAAGATAT 4500 + CCCTAATGAC GAACCCACGG AGCCGAGTCA GGAGCAATAC CTTCTAAATC GTATTGAAGG 4560 + GATGGAAAAG AAGCTCAACA ATCTCCTGGA AATCGTCACC CGCCTACTAA ACCAAGGAAG 4620 + AGAGTGTCCA AAATCTCCAA AAAATCCTTT CCGAGATCCA ATCCTCATTT AAACGCTCTT 4680 + GCTAGTAGCA TCAGAAAGTG ACGTATCTTA TGACTCGGGC GTGCAACAGG GATATCCTTA 4740 + AAATTGCTTT CTGGAACGCT GGTGGGATCA ATAATAAAAT AGACGAGCTC AAACTGTTCA 4800 + TTCTAAATAT TGATGCCCAC ATAGTCATAG TCACTGAAAC CAGACTTGAC AACAAATCGA 4860 + CCAAACTAGA ACTTCCAGGA TATTTCACAT ACTTAGCCCA AAATCCTGTT TCTAGCAAGA 4920 + GAGGAGGAGT CGCCACTATA GTAAACAGCA GTATCCGACA CATGGCCTTA GAACCGATTG 4980 + AAAAAGAATG CATACAGAGC GCCCCAATAG TCTTGCTGCC TGAAAACAAC AGACGCAGCG 5040 + AAATGATAGT AATAGCATCT GTCTACTGTC CGCCTTCGCT AAGCTGGTCG CCCCACCACT 5100 + TTACTGACGT TCTCAATTTT GCCGAGAAAA CTCTGGGAGG GCAGACAAAG TTCATTCTAT 5160 + GTGGCGACTG GAATGCAAAA CACAGGCAAT GGGGTTGTAC CCGCGCCTGT CAACGCGGCA 5220 + CCGCACTCTA CGAAGCAGTT CAAGCAGATC CCATGGCTGA GATTATTGCT ACCGGCTGTG 5280 + CGACACATTT CCCGCACGAC ACACGGAAAA ACCCGTCAGC AATAGATTTC TCCATATGCA 5340 + AAGGACTGGG CAGGCTCGAA AAGAGAATTT CCTCAAGTGC GGACTTATCT TCAGACCACC 5400 + TTCCCATCCT GCTTGAGATC AACTTAGATA CAAGCACCCT CTTTCTGCAA AAGCAAAACA 5460 + ATAACATCCT CAAGAAAACT ACGAACATTG AGCTCTTTAA GACTGTTCTT GAAAGAAAGA 5520 + TACTTCTTAA TACGGAGATA AGAGTAGCAG AAGACATAAA TGACGCCATA AATATCTTTA 5580 + TCAAAAACAT CAAGGACTCG GCTGATGAAT CAACTCCCTC CCCAAGAATC CCTGACAACC 5640 + TCAGAAGAAT GCATGGACAA GCTAACAGAA ATAGTCACAC CCTCACACTA GACGAAAACA 5700 + CAAGCAGATT GTTGGAAGAA AAACGGATAC TAAGTAGAAT TTTTAAAGCT ACTAGAACGG 5760 + ACGAGGACAA AGCTAAACTA AAAGCAGCTG AAAATCGACT AAAAAAAGCG GTAAAGATCT 5820 + TGAGAGAAAA GAGAATTAAT AAACAAATTG AAGGAATAGA CACGAAAAAC CCGGACAGAA 5880 + TGAGGAAAAT GTGGAGACTG CTAGATGAAG GAAAAAAGAC AAACCAACCG AACTTTCCCC 5940 + TCAAACTGGA AACCAAAAGA GGCCCCAAAT GGACAAAAAC GATAAAGGAG ACAACAGAAG 6000 + CATTTGTTTC CCACTTAGAA GGAAGATTTA AGCCAAATAA CAACGTACCT GATTACCACA 6060 + TAAATACAGT TAACTCTGGA CTAAGAACAA TTAAAGAAAG CATGTTAACA GAAAGATATG 6120 + ATGTAAACAA GAATCCCTGT AACCAACCTA TCACACTAAA GGAATTAAAT GACGAAATAA 6180 + AAAACTTAAA GAATAGTAAA GCACCGGGAA AAGACCTTAT AACAAACCAA CTTATAAAAA 6240 + CCCTACCGAC TAAAGCTACA CTGTACCTTA TCCTAATCTA TAACTCTATA CTTAGAATTG 6300 + GATACTACCC AGACGCCTGG AAACATGCCC AAGTGAAAAT GATCTTAAAA CCAGGGAAAA 6360 + GTGTGAACGA CCCGAAGTCA TATAGGCCGA TCAGTCTACT CTCGGGACTC TCTAAAATGT 6420 + TTGAAAGACT ACTTCTAAAA AGACTTTTTA GGGTAGATCT ATTCAAAAAA GCCATACCAC 6480 + TGCACCAATT TGGCTTCAGA AAAGAGCACG GAACTGAGCA GCAAATAGCC AGGGTCACCC 6540 + AGTTCATCCT CGAGGCCTTT GAGCGAAAGG AATACTGCTC AGCGGTTTTC CTTGACATCT 6600 + CTGAGGCTTT CGATAGGGTC TGGCACGAAG GCCTTTTACT TAAACTAGCT AAAATATTAC 6660 + CATACAACCT ATACATTATT CTCGAAAGCT ACCTTACAAA CAGAACATTT GAAGTTAAAG 6720 + ACCAAGCTGG AGAGACTTCG AGAGCAGGAC AAATAGGCGC AGGGGTGCCC CAAGGAAGCA 6780 + ACCTTGGACC CATACTGTAC TCTATCTTCT CCTCAGACAT GCCACTCCCA CACATATACC 6840 + ACCCCTCCCC AACAGAAAGA ATTATGCTCT CAACATACGC AGACGACACT ATAGTACTCA 6900 + GCTCAGACAT ACTAGCAACT GCTGCCACAA GAAACAACGA AAACTACCTC AAGACATTTT 6960 + CGGACTGGGC AGACAAATGG GGTATCTCAG TAAATGCTGC TAAAACAGGA CATGTCATTT 7020 + ATACATTAAA AAACGACATA CCTACAAATC TAAAGACCAT GAAGATTAAG GGTCAAGCAA 7080 + TAAAAAAGGA AAGCAAGCAA TCATACCTTG GCGTAATCCT TGATAGCAAG CTAACACTTA 7140 + GTCCTCACGT CACGAAGGTA GTAGGTAAAT ACTTGACAGC CTATAGAAAA ATGTCATGGA 7200 + TCTTAAATGA AAGAAGCAAA CTCCCTACTA ATACTAAGAT GCTGATCCTC AAATCAGTTC 7260 + TATCGCCAAT ATGGCAGTAT GCCATAGCAG CCTGGGGTCC CCTTGTGACA GATGCACAGA 7320 + TAAGACGGAT ACAAGTTGAG GAAAACAGAA AAATGAGAGA CATATGCAGA GCGGGAAGAT 7380 + ACACGAAAAA CCAAACTATA AGGGACCGCT ACTGTGTCAA AACAGTAGAA GAGTTCTATC 7440 + AACAGGCTGT CCACAGGTTC TCAGAAACTA CAAAATCGCA CCCTAATGTA GCTGTTCGCA 7500 + GGATATTCTC TAGGCACTAT ATCCCGAACA GACTAGAAAG AAGCAGGCAG AGGTACTTGA 7560 + AAATGACAAT GGACCATATC ACGCAAAAAC AGACTGGACT GACCCTCTCA CCTAAACTCT 7620 + TAAAAATCCC TGATCTAGAT GACTGCAGAA CCTTAAAAAA GCGAAGCGAG AGAGAGAAAA 7680 + TAAGACAAAC GCATCTAACT GAACTCCCCA CCCTGCTGAG ACTAGAGGAA GAGGAGGCAG 7740 + AGCTCAAAAG AATAAAAAAA CAGGAAGAGA GGGAAAGAAG GGAAAGGGAA AACCAAAAGT 7800 + GGCCTCCAGA TAGGTGGTGT GAACTGGAAA TAAACCGATA TAATAAAAAA TATAGAAATG 7860 + GCGATCTAAC CAGGCAGGAA ATTATAGAAA AATTCCGAGG GCAACCATTA AATGTACAAC 7920 + GAATAATCCT ACCCGACTAC GAAGGTGACT AAAAGTAAAT CAAAACAAAC TAGGGTCGGA 7980 + GCATAAAGCA GAAATAATTA ACCTGGCGGA AGGGGCGGCA AAAATATTTA AAAGAAAGGA 8040 + AATAAATACA AAAAGGCTAA AGGCTAAGTT ACAGGTTACA TAAAAAGGGA AATGTGCTTA 8100 + TAGATATAAT GGTAAAATTA ACTTAACTAA ACACCTACTG GAAAACAAAA CCATGATGGC 8160 + TGCGTACTTA AAACGTTTCT CCTGGCGCGA TTGAAAATCC ATCTTTCCTA TCCAACCGAG 8220 + GGATCTGCGA CTGCGGCCTT CTGCCGTTCG GCTCCTGATG GATCCATCTG CTGCTGGAAT 8280 + GGGTGCCACA CCGGCGCTCC AACCTAAAAG AAAGATAATA TGTCTTAGTT TTCTTTCCCT 8340 + TTTTCTCATA AAAAACAAAA GCTCATCTGG AGTCTGATAA TAGCTTTAGC TCACCAAGAC 8400 + AGCAAAAACA ACAGCATCAA GGCCAGCAAC AGTGGAGGCA GAGACCAAGC GGTTTGCTGA 8460 + ACATTTCGCT GCCCACACCC ACCATTCCTG GAGGCTCTGA ATGAGGGAGC TGAAGCCTCT 8520 + GAAAATTGAA GATCCTACTC CAATGTGACA CTTTCGGCTC CGAGCTCAAC GCCGGCGCTG 8580 + CAAATCCGGC GTTATAAGGA AAGGGTGCTC CAGCTTGTGG AGTGGTCTTT CCCCAGAGGC 8640 + AGCAGCAGCA GCAACGCCAG CGGCAATTGG CGACCTCTGC GTAGCCGAGT CAATCCCGTT 8700 + ATCGGTCCGT CTGGCGATGC GTTTCCGACG CGGCGGTATG CGTCCATAGG GACCGCCTAG 8760 + AATGCTTGGC CAGGAGACAG CAGTAGACCT GGGCGTGGGC GTCACCAGCA ACATGGTAGC 8820 + CATGCGCAGT CAATTGGCCG GTGGCAACAA TCTTGCCATG CAGCAATAGC GGCGCATGCT 8880 + ACCCTTGGAG CGACGTCAAC AGCTACATAT TTTTCAACAG TGTAGCGCGA CCTTTAGGCG 8940 + CCTACACCTA CACCAGCAGC AGCGATATTG GCAGTAGCAG CATTTAATGT CTTGCAGCAG 9000 + TTTCCATTTG ACAACTTCCG ACGACCAGAC TCCTCGCTTG GCCCCTGGCG ATTCGCCCTG 9060 + GAAGAAAGAA AGAAGCATGG ATTAGTCAAA TATCAAAGCA CAACAAGCAT GCACGAAATC 9120 + TTCGCAACAA GGACTATTCC AAGGCAAGCG ATGGTGTGTT CTTTGGCTCT ACATATATCG 9180 + TTGAAATCCG TCTCCAACTG CCGCGAGTCA CCCACGACTT CCACTCCCTG CAGACGGACG 9240 + TAATGCACTA CGATGTGTAA ATTTTCCGGA TCCAAGTGAA CGCCAGGCGG AAGAGGATTC 9300 + CCTGGATGTG AAGGATCACA AACTGCTGCT TTTTCAAGAG TCCCCATTTA ACAACTTCCG 9360 + ACGACCAGAC TCCTCGCTTG GCCCCTGGCG ATTCGCCCTG AAAGAAAGAA AGAAGCATGG 9420 + ATTAGTCAAA TACCAAAGCA CAACAAGCAT GCACGAAATC TGCGCAACAA GGACTATTCC 9480 + AAGGCAAGCG ATGACGGACG GAATGCACTA CTATGTGTAA ATTTTCCGGA TCCAAGTGAA 9540 + CGCCAGGCGG AAGAGGATTC CCTGGATGTG AAGGATCACA AACTGCTGCT TCTTCAAGAG 9600 + GTAACCGGCC TCATTTCCAC TTGGGTCACA TCGATTGTGG AGGAAGCCGA TTGGGACTTT 9660 + GAGCGAGCCC TAAAATTGTT CATTCAGAAG AACGCTGATC ACGAAATCCC AGATCTAGCA 9720 + TTCGCCTAGA ATATGTGATC TCGTTGGACT GCGTGCTGGA CTGCGGCGCA TGCTTTCCCT 9780 + CCCGCCAGAG ACGGGATGCG CGCATCAGGA TCGACGGGAC AGACCGGCCG ACGCCTGGCT 9840 + TCACGTCGGC ATCTATGCGA CGACGTGATA ATCAGCTTCA CAGTACCTGC GGATGAGGGC 9900 + ACAGGCGCCA GTCCTCTGCC TAGCGACACA TACACCAACA GCAACATCTA AAACAGTCGC 9960 + AGTAGATGCA GGGAATTTTC TTGCTGCATT CTCCAACTGG AAAAATCCGA CGGCCCAACT 10020 + CCTAGCTTAG CCCGGCCAAT CTTCTTGGAC TGGCAAACGA TGTGATGAAT CGTCCTGGAA 10080 + GAAAGAAGCA TGGATTATTT CTTCATACAC AGCTTGTCTA CTAAAATGCA TTTCCCGGCA 10140 + AACTGGCACT GGGGCGTTGA AAATACGACA CTACTCACCA AACAGCAGCA AAAACAACAG 10200 + CATCGGCAGC AGGCGACCAG CAGCTGCTTT GGCTCACCCA ATGCGACAGC AATATCTGCG 10260 + CATGGCCAGC AACATGCAGC AAGCAAAAGA CCGGCATGGT GGTGAACAAC ATATCGCTCA 10320 + CGCCCAACGA TCTGGAAGCC CTGAGCTAGG GAACTGAGTA TCCGCCAGCG GATACTTATG 10380 + CAGCGGCGAG GCGTCGGAAA TCCGATAGCC GGAAGAGAGG CCGGAGCAGC ATGTTGGGCA 10440 + TTTTCGCCCC AGTAGCAGCT GCTGGGGCAG CAAGGGCAGA GGTAGCAGTG TCAGCGCTCC 10500 + TGGTAAACCG GCCTTTTCTG TTGAAGACGC GGGACTGCGG CGCAATTGTT CCTGCCAACC 10560 + GGGAGTTCTC TGCGCCTGAG GTCCTGTTGT GCTTCAGCGG CTCCATCTGC TGTTGCATCT 10620 + GGCGCTTCTC CAACTTTCCT CCCTGAAAGA AGAGAATATT AGTAGGAGCA TGAGACCAAC 10680 + AACAGCCCTA GCTTACCACG TCAGCGGAAA CAGCAACTGC AGAAGCCCGG TAACTTTCTG 10740 + ATAATATGCA GCAATAAGAG CGGCTGGATC AGCATGTTGT GTAGCTTGGC CCCAGAAGCA 10800 + GCAGCTGCGG TACCAAAGGC AGCGGAAGCA GGGTCAACAT AGTCTGCTAT GCTGTGTCCA 10860 + TACTAGCATA GTCAAGTCAG CGGTGGTGAC GTTGCCGCAG CAGCTGATCC ACAGGGTACG 10920 + GCCTGGAATG TTTTGTCAGA GACGGCAGTG GCCTGGGCGT ATTAGTCAGA TACGCCAACA 10980 + ACATGATACC CATGCGCAAC CATTCTTCCG GTGGCGGCAT GCTCGTAAAG TAGCGGCGGC 11040 + GCATGCATCT CTCGAAGCAG CAGCAGCAAC AGAGGCGTCT CATAAGTGCA TGCGCAGCAG 11100 + CGGTAGCAGC GGTGGTGGCA GCAGCAGGGA GATTTCATTG CTGCAGTCGC CAAATTACAT 11160 + GCATCCTACG ACTCGACTCA CGCTTTTTGG CCCCTGGCCG ATCTTCATAT ATCTCAAATC 11220 + GACGGCTGCT TTTACCCTGG AAAAAAAAAA AGGAGCTTGG GTTATATTGA ACTACACTAG 11280 + GCGGCGACAC ACTCACCAGC AGCAGCCAGA ACAACAACAG CGGCAGAAGT AGCAGGAAAT 11340 + TATCTCACTG CAAAATCCAA TTGGCACTTT CCGAAGTCCG TATTTCTCGC CTGGCCCCTG 11400 + GCCAGTAACA GGGGCCTGTG CGACGGAGAT GACGACGATG ATCTGCCCTG TGGACGGCCT 11460 + CAAGAAGGAA TCGGCCCTGT ACTGCCCACC TGACCTGTGC CAGGATAGCA GCAATGTCAG 11520 + CGGACCATGG ATGGAAGAGG CGGCACTGGC GACGGTCCTC AGTTTTGCGG TTTCCGCGGG 11580 + GCGTAGGCGC AGTAATCGGC GGCAGCAACA GTGGCGGCAG CAGAAGGGAA TGTGTATCTG 11640 + CAGTCGCCGA ATGGCAATTT CCTGCCCAGC TGTAATGGAC CGACAAATGT TTTTTGGCAT 11700 + GTCGACCTGT AAGAAAGAAG CAAGGATAAG TTTTTTCTTT ACAAGATTGT ATATGAATTT 11760 + GTATTTACGG ACAACTGGCT TGTTTCCTGT CGACGATAAA TGGCGCTTCA TGTTTTCACT 11820 + CTGCCAAAAT CTGAGTGCAA GCATCGGGGC TGACGGGCCG AATTTGCTGA TGCCTTGTAC 11880 + ATGCTAGCAT CTTTATGCCG CCGTGTAATT TTGCGACAGC AAAACACATG ATGGAGAAGA 11940 + CGAAGGTGAT CGATGGCGCC CGGATGACGG ATGCAGGCCC GTGCTACCCA CTGGTCCGTT 12000 + GCCAGGACAG CAGCGTTTCA ATTATGCGAA CAGAGGCACT GGAGCCACTT CTCAGGCGAT 12060 + AGGGATCATG AGGCGACGAC AACTCGCCAG CAGCAGTAAC AACAACAGCG GCAGCAGCGA 12120 + TCTCGGACTT GCTGAACATT GCGGCTTTTT CCCAGCCTGG ACCGTCATCA CAAACGCTCT 12180 + CAAAGATCGG TGCGCCTGCA GCCTACGGAA GCGTACAACT GCCCAAAGTC GTGCTATTGC 12240 + ATAATGTTAG GTGTCCTGGC TGCTCCGGCG GATGAGCTCC ACCCGATTGA GAGAGGTAAG 12300 + AAGGCCCAGC AAGTCGCCCT TAAATAAAAG AAACAAGCAT TAGACTCGGC TGAAATTGTA 12360 + ACATCAGTCA GACTGTACTC ACGCATGCAC TTAGACAAAC CGAAGCCTAT TCTATTGACG 12420 + ACGCGGACTC CAACACATGT TTTCCTCCAC AAAAGGCTGT GAGTGCACCA AAGTTGACGG 12480 + GCCACGCCGG CCGATGCTTG CTGCATACCG GCATCTCCGC AGCAGCGACG TTACAAGCAC 12540 + CACTAAAATT AGAAAGAGGC TTACTATAGG CAAAGCGCAG AAAAACAAAT ATTACAATAA 12600 + GAAATAGCAC GCGATTTTTC TGCTTCGTTT CCGCTTGGTA CAAGTGAGAC CATTCTCCCT 12660 + ATATGCCATT CTAGTATATT TGCCCGATAA GCGATATGCT GGCGGCAAAA AAAAAAGATA 12720 + ATAGCCGATA AGCCCGCCAA AAAAAAAGCG CGAAATATCG ATAACGAGCT GGCACGAAAA 12780 + TTGCTGGCAT ATCGATCAAC CGCTGTGTCT TTGAGCTATC GAAAAAGCCC GCCTACGCGC 12840 + CTAGCCCAAA TTTGCAAGTC AGTTGAGATT ATAAAACCGA CAGAGGCGCG CGCCGAACAG 12900 + TAGCTAAAAG TGAAGCCAGC AGCAACAACA ACAACTAATG GACGGCCAGA ACGTGAACCA 12960 + AAGCGGAGGA TGGGCATTGG TCTTATCCAT CTCATCGGAC GATGGTAACT GCTCATCCTT 13020 + GCCGCCATAG TCTCATCGCT GGATATCAAG TCATCGCTCA ACTATACCTT AAAATTACTC 13080 + ACCAAAACTC TTTTCTCCTT TTCCATAAGA TAAAGTAAAG TAAAGTAATG TAAAGTAAAG 13140 + TAAAGTAAAT TAAAGTAAAG TAAAGTAACG TAAAGTAACA TAATATTTAA ATTTAAATTC 13200 + TACACTTGAA CAATGGCGCG CAAAACTGCC GCAATGTAAT TCAAAAATGT CTCCCGCAAA 13260 + TTTAAAACAT AGATTAATAC TTGTAAGTAT GGCGCGCATA TCTGCGGCCA AGAAATCCGA 13320 + AAATGTAATT TGCCACAAAT TGTCACTATA TATTTTTAAG CAAAAATCAG AGGACAATAA 13380 + ATGCCAACGT CATTAGACGT TGAAAATATT CAAAAAAAAA AAAA 13424 +// +ID DM14101 standard; DNA; INV; 10654 BP. +XX +AC U14101; +XX +DR FLYBASE; FBte0001207; Dmel\TART-B. +XX +FT source U14101:1..10654 +FT SO_feature non_LTR_retrotransposon ; SO:0000189 +CC telomeric retrotransposon +FT SO_feature direct_repeat ; SO:0000314:1..1046 +FT SO_feature direct_repeat ; SO:0000314:9031..10076 +FT SO_feature five_prime_UTR ; SO:0000204:1..961 +FT SO_feature three_prime_UTR ; SO:0000205:7386..10637 +FT SO_feature polyA_signal_sequence ; SO:0000551:10479..10484 +FT SO_feature polyA_signal_sequence ; SO:0000551:10600..10605 +FT SO_feature non_LTR_retrotransposon_polymeric_tract ; SO:0000433:10638..10654 +CC derived from polyA tail of RNA transposition intermediate +FT SO_feature CDS ; SO:0000316:962..4093 +FT SO_feature start_codon ; SO:0000318:1..3 +FT /name="Dmel\TART-element\gag" +FT /db_xref="FLYBASE:FBgn0014071" +FT /db_xref="SPTREMBL:Q23999" +FT /db_xref="GI:603663" +FT /db_xref="NCBI_PROTEIN:AAC46493.1" +FT /translation="MDGHNGDQSEGWATVLSISSDDSNSLSSPPSIIVSSLDTTPTSHE +FT TTIVRRSLYQTNADMKSYDFENIVLNENKNTILPDPLFVDKCGSTANTTEANEKKPANS +FT PFPISISKNFSTSSPLTHVDTPTQEDDASAFNTLKAAKTARIIFPTHTHIKPTKPSPPS +FT KELSTNSALKTLSYTDKITGTQKNLPDKTHVDTPTQDDDINATKASKTAKIISTQTHLG +FT ETKPIQPAKDPSPRTQKPIAHKADETLTHTDKLTASQNLVPAKTHINTPTQYNDTNATN +FT ALKTAKINFSSHSHQSEIKPTQSAKNISPLTQKQFTSESAGTHTHTDKHKNTASQNLFS +FT AKTHINSPTQHNYTSAATASKTAKLILSPHSHLSETKPTQPALSPSPLSQKQITSIAAK +FT TLTHTNKHTASQNFIPAKTHINIPTQYNDTNATKALKTAKAASPSHTYSRQTKPIKSAI +FT NALHPAQDTNPSPAISAVTYTDKPTATQNIFPVKTFAELVRENAKRLPTPMQNSHQAKN +FT DSAALGRPPTAARKNLNKTLISPKTPGKRRGDCLDEGLLQTSNKKVRIRDDFSDDDLGV +FT TNLLSETPLFKSKAAIKIRQDSRRDSLQKSAEMDTAPAISPSNTAADSDLPPWKTVPAS +FT RKPPSIFLSNIQQIIPLIEKLNYKAGVNSFTTKSELGNNIRIQAKTMDAHNAIQNVLLE +FT ANIPLHSHQPKSAKGFQIVIRHLHQSTPTKWIESQLQDIGIATKFIRAMQFRDTRNPMR +FT IHEVEVVPKADGSHLKVLLLKSLGGQTVKVERKRVSKDPTQCHRCQCFGHTKNYCRNPF +FT KCMKCGQLHATVSCTKPKNLPATCANCNGSHVSSYKGCPAFQEAKQRLSINKIQSLHSQ +FT PTHLQTPRNKHPYPKPTHLQTPRNKQPYTHPLPRTSVNNTKLPAKRIQGKKISQRNLSI +FT NKRLHRMKKPRKETSPPTTSKKVLASLEESRKNPNSVLNPANTHLTHFRPPPLAQNIPN +FT DEPKELSGEQYLLNRIEGMEKKINNLLEIVTRLLRQGKDCPKSPKNPFRDPIFV" +FT SO_feature CDS ; SO:0000316:4131..7385 +FT SO_feature start_codon ; SO:0000318:1..3 +FT /name="Dmel\TART-element\pol" +FT /db_xref="FLYBASE:FBgn0014072" +FT /db_xref="REMTREMBL:AAC46494" +FT /db_xref="GI:603664" +FT /db_xref="NCBI_PROTEIN:AAC46494.1" +FT /translation="MTRADNRDILKIAFWNAGGINNKIDELKLFILNIDAHIIIVTETR +FT LDNNSTKLELPGYFTYLAQNPVSSKRGGVATIVNSSIRHMALKPIEKECIQSAPIVLLP +FT ENNRRSEMIVIASVYCPPSLRWLPHHFTDVLNFAEKTLGGQTKFILCGDWNAKHRQWGC +FT TRACQRGTALYEAVQADSTAEIIATGCATHFPHDTRKNPSAIDFSICKGLGRFEKRISS +FT GADLSSDHLPILLEINLDTNTLFLQKQNNNILKKNTNIELFKKVLERKILLNTEIRVAE +FT DINDAISTFMKNIKDSAAESTPSPRIRDNPRRRHRQANRNSHTLALDENTSRLLEEKRI +FT LSRVFKATKNYEDKAKLKAAENRLKKAIKILRENRINEQVEGIDTSNPDRMRKMWKLLD +FT EGKRTNQPNFPLKLETQKGPKWTKTIKETTETFVSHLEGRFKPNNNVPDYHIDRVNTGL +FT RIIKESMLTERHNLNKNPHNQPITLKELNDEIKNLKNSKAPGKDLITNQLIKTLPTKAT +FT LYLILIYNSILRLGYYPEAWKHAQVKMILKPGKSANEPRSYRPISLLSGLSKIFERLLL +FT KRLFKVDLFKKAIPLHQFGFRKEHGSEQQIARVTQFILEAFERKEYCSAVFLDISEAFD +FT RVWHEGLLLKLAKILPYNLYIILESYLTNRTFEVKDQAGETSRTGQIGAGVPQGSNLGP +FT LLYSIFSSDMPLPYIYRPSPTERIMLSTYADDTIVLSSDTLATAATRNNENYLKSFSDW +FT ADKWGISVNAAKTGHVIFTLKNDLPTSLRTMKIKGQVIKIESKQSYLGVILDSKLTLSS +FT HVTKLMGKYTTAYRKMTWILNRRSKLPTKTKMLILKSVLSPIWQYAIAAWGPLVTDAQI +FT RRIQVEENRKMRDICRAGRYTSNQTIRDRYGIKTVEEFYQQALHRFSETIKSHPNIAVR +FT RIFTRHYIPNRLERSRQRYLKMTNEHITQKQTGQTLSPKLLKIPDLNDCRTLKKRNERD +FT KIRQTHLIELPTLLRLEEEEEELRRIKKQEERERREKETQKWPPDRWCELEINLYNKQY +FT RRGDLTRQEIIQKFRGQPLNVQRIILPDYKGDQEHN" +XX +CC A PNTR (Perfect Non-Terminal Repeat) is a perfect direct repeat partially +CC overlapping the UTRs (annotated as "direct_repeat ; SO:0000314"). +CC Distinguishing characteristics of PNTR’s are that the 3’ repeat terminates +CC upstream of the 3’ end of the element and that the 5’ PNTR extends a short +CC distance into ORF-1. The 5’ ends of TART-B elements are variable and the +CC minimal size for functionality has not been determined. Thus, this +CC canonical sequence, U14101, may be 5’ truncated within the 5’ PNTR (M-L +CC Pardue, 2009). +XX +CC Derived from U14101 (g603662) (Rel. 42, Last updated, Version 1). +CC Takis Benos and Michael Ashburner, 20-Aug-1997; updated Jan-2009 as per +CC Mary-Lou Pardue and Greg DeBaryshe. +CC Any changes to original sequence record are annotated in an FT line. +XX +SQ Sequence 10654 BP; 3669 A; 2717 C; 2036 G; 2232 T; 0 other; + GATCCGGCCG GATGGCAGCT CGACGACGGT AGCAGGCCAC CATGCCCGCC AGCCCGCAGC 60 + TAGGATAGCA GCAACATCAG CGTCTTATTA ACGCGAACGG CGGCACTGGC CCTTAGCTGA 120 + CCAGCTGCAA CAACATCAGC GACGCAGTCT CCACCAGCAG CAACAACAGC AGCGGCGCTT 180 + GCGACAGCAG CAGCAGGGAA TGGTTCTGCC GCAGTCGCCT ATTGCTGCCT ATAAAGAGCA 240 + TTCCTTGCCA ATTGGCTTTC TGTACGACGA CGATGATCCT GCGGACAAAT CCACCTTTCC 300 + GGACGCCTGA GTATTATGGC GAGCCTGCTG ATCATTGTTT CTCCGACTCC TTACTTGACC 360 + ACTGGACAAT CATACAATCA CCGGCTTTTC ACATCTGGAA GAAAGAAACC TGGATTAGTA 420 + TTTGCCCTTC AGATTTGTAT GAAACTGCAT TTCTGGCCAA CCGGAGTGTT TCCTGCAGAC 480 + GACGCTGGAC TGCGACGCAC TTTTTTCTAC CAACACAGAT GGGACGCTTG CATCAGATCT 540 + GACGGGCCAG ACTGGCCGAT GCCTGGTACA CGATGGCATC TCCGCGGCGG CGAGATGTGC 600 + AGCGACGCTG AAAGCAATAA TAATTCTTTT ACTTTGCAGT ATCAAAAATG AGAAGCCACA 660 + TCACAATTTA CATCAGCAAA AATTACACGT GATATCTTTT TCTTTTGCCT AGGAGTAGTG 720 + AGACCTGCTA CCAAAATGAC CAGTAATACC GGCTAACGGA AGCGAGATAT CGATAATCAT 780 + TCTGGCGGTA AAATAGCCAG AACATCGATA ACCAGCTGTG CATTTTCCCT TCGATTTATC 840 + GAAGTCAAAT AGCCCGCCTA GGCTATCGGA CCGGATCGGC AAGTCAGTAG TGATTAAAAA 900 + TCCGGCAGAG GCGCCTGTGC AGCAGCTACC CAAAGTGAAC ACGACGAAAC GCAACAACAA 960 + AATGGACGGA CATAATGGAG ATCAAAGTGA AGGATGGGCA ACAGTGCTAT CTATCTCCTC 1020 + GGATGATAGT AACTCCTTGT CGTCGCCGCC GTCTATAATA GTTTCATCGC TGGACACCAC 1080 + GCCAACTTCG CACGAAACCA CCATAGTAAG AAGAAGCCTA TATCAAACAA ATGCTGACAT 1140 + GAAATCTTAC GATTTTGAAA ATATTGTATT AAATGAGAAT AAAAATACCA TATTGCCAGA 1200 + CCCTTTATTT GTTGATAAAT GCGGGAGTAC TGCTAATACC ACAGAAGCCA ATGAAAAAAA 1260 + GCCTGCCAAT AGCCCCTTCC CCATTTCCAT TAGCAAGAAT TTTAGCACTT CCTCGCCACT 1320 + AACACATGTA GACACGCCTA CACAAGAAGA TGACGCCAGT GCGTTCAATA CATTGAAAGC 1380 + AGCTAAAACA GCTAGAATAA TTTTTCCCAC ACACACACAT ATAAAGCCCA CCAAACCCTC 1440 + GCCCCCCTCC AAAGAATTAA GCACAAACTC AGCACTAAAA ACTCTCAGCT ACACAGACAA 1500 + AATAACAGGA ACACAGAAAA ATCTACCCGA CAAAACACAT GTAGACACAC CTACACAAGA 1560 + TGACGACATT AATGCAACCA AAGCATCAAA AACCGCTAAA ATAATTTCTA CACAGACACA 1620 + CCTAGGTGAA ACCAAGCCAA TACAGCCCGC CAAAGACCCC TCACCCCGCA CCCAAAAGCC 1680 + TATTGCACAC AAAGCTGACG AGACACTTAC CCACACAGAC AAACTCACAG CATCACAAAA 1740 + CCTCGTTCCC GCCAAAACAC ATATAAACAC ACCCACACAA TATAACGACA CTAATGCAAC 1800 + CAATGCATTA AAAACCGCTA AAATAAATTT CTCTTCACAC TCACACCAAA GTGAAATCAA 1860 + GCCAACACAG TCCGCCAAAA ACATTTCACC CCTCACACAA AAGCAATTCA CAAGCGAATC 1920 + AGCCGGGACA CACACCCATA CAGACAAACA CAAAAACACA GCATCACAAA ATCTCTTTTC 1980 + CGCCAAAACA CACATTAACT CACCCACACA ACATAACTAC ACTAGTGCAG CCACAGCATC 2040 + AAAAACCGCT AAATTAATTC TCTCCCCACA CTCACACCTA AGTGAAACCA AGCCAACACA 2100 + GCCCGCTTTA AGCCCCTCGC CCCTCTCCCA GAAGCAAATA ACAAGCATAG CAGCCAAGAC 2160 + ACTCACCCAC ACAAACAAAC ACACAGCATC ACAAAACTTT ATTCCCGCCA AAACACATAT 2220 + AAACATACCC ACACAATATA ACGACACCAA TGCAACCAAA GCATTAAAAA CCGCAAAAGC 2280 + AGCTTCTCCC TCCCACACAT ACTCACGTCA GACAAAACCA ATAAAGTCCG CCATAAACGC 2340 + ATTGCATCCC GCCCAAGACA CAAACCCAAG CCCAGCAATC AGTGCTGTCA CTTACACAGA 2400 + CAAACCCACA GCTACTCAGA ATATTTTTCC TGTCAAAACT TTTGCAGAGC TGGTTAGGGA 2460 + AAATGCAAAA CGCTTACCAA CTCCAATGCA GAATTCCCAT CAAGCTAAAA ATGACTCTGC 2520 + CGCTCTCGGA CGCCCCCCGA CTGCAGCTAG AAAAAATCTA AATAAAACAC TGATTTCTCC 2580 + TAAAACTCCT GGGAAGCGCC GTGGGGACTG TCTTGATGAA GGCCTACTAC AAACCTCTAA 2640 + CAAAAAGGTT AGAATACGCG ATGACTTCTC TGACGATGAT CTTGGGGTCA CAAATCTACT 2700 + CTCTGAAACA CCCTTATTCA AAAGCAAAGC AGCTATCAAG ATCCGGCAAG ACTCGAGAAG 2760 + AGATTCCCTG CAGAAGTCAG CCGAAATGGA CACAGCTCCA GCAATTAGTC CCTCAAACAC 2820 + AGCAGCCGAT TCCGACCTAC CGCCCTGGAA AACTGTTCCA GCTAGCAGAA AACCACCATC 2880 + AATCTTCTTG TCCAATATAC AGCAGATTAT CCCGCTAATA GAAAAACTAA ACTATAAAGC 2940 + CGGGGTAAAT AGCTTTACCA CCAAATCTGA ACTTGGCAAC AATATTAGAA TCCAGGCTAA 3000 + AACGATGGAC GCCCACAATG CAATTCAGAA TGTTCTCCTT GAGGCAAATA TTCCCCTACA 3060 + CTCCCACCAG CCAAAGAGTG CAAAGGGCTT CCAAATTGTA ATTAGGCACC TCCACCAGTC 3120 + AACCCCGACC AAATGGATTG AAAGCCAACT TCAAGACATC GGTATAGCTA CAAAATTTAT 3180 + CAGGGCAATG CAGTTTAGGG ACACGAGAAA TCCTATGCGC ATTCATGAGG TTGAAGTTGT 3240 + ACCCAAGGCT GACGGCAGCC ATCTCAAGGT CCTGCTACTA AAATCCCTTG GAGGTCAAAC 3300 + GGTCAAGGTT GAAAGGAAAC GGGTATCGAA GGATCCCACA CAATGTCATC GCTGCCAATG 3360 + TTTTGGGCAC ACAAAAAATT ATTGTAGAAA CCCGTTTAAA TGTATGAAAT GTGGCCAGCT 3420 + GCACGCCACG GTTTCATGCA CTAAACCCAA AAACCTTCCG GCTACTTGTG CAAACTGCAA 3480 + TGGAAGCCAC GTAAGCAGCT ATAAAGGATG TCCCGCTTTC CAAGAAGCAA AGCAAAGACT 3540 + ATCTATCAAC AAAATTCAAT CCCTACACTC ACAACCCACG CACCTTCAGA CCCCCCGCAA 3600 + TAAACATCCC TACCCAAAAC CCACCCACCT TCAGACGCCC CGCAATAAGC AGCCCTACAC 3660 + ACACCCCCTC CCTCGCACAT CAGTAAACAA CACAAAACTA CCTGCCAAAA GAATCCAAGG 3720 + AAAGAAGATA TCGCAAAGGA ATCTATCTAT AAACAAACGC TTACACAGAA TGAAAAAACC 3780 + GAGGAAGGAG ACAAGCCCGC CGACAACTAG CAAAAAGGTC TTGGCCTCTC TAGAAGAAAG 3840 + CAGAAAAAAC CCAAATAGCG TCCTAAACCC GGCCAACACC CATCTCACTC ATTTCCGCCC 3900 + ACCCCCTTTA GCACAAAATA TTCCTAATGA CGAACCTAAG GAGCTGAGTG GGGAGCAATA 3960 + CCTTCTAAAT CGCATTGAAG GGATGGAAAA GAAGATCAAC AACCTTCTTG AAATCGTCAC 4020 + CCGCCTACTA AGACAAGGAA AAGACTGTCC AAAGTCTCCA AAAAATCCTT TCCGAGATCC 4080 + AATCTTCGTG TAAATGCTCT TTCTAGTAAC ATCAGAAAGT GACGTTTCCT ATGACTCGGG 4140 + CTGACAACAG GGACATCCTT AAAATCGCTT TCTGGAATGC TGGTGGGATT AACAATAAAA 4200 + TAGATGAGCT TAAGCTGTTC ATTCTAAATA TTGATGCCCA CATAATCATA GTCACCGAAA 4260 + CTAGACTAGA CAACAATTCT ACCAAACTAG AGCTGCCAGG ATATTTCACA TACTTAGCCC 4320 + AAAATCCTGT CTCTAGCAAG AGAGGAGGGG TCGCTACTAT AGTAAACAGC AGTATCCGAC 4380 + ACATGGCCCT AAAACCGATC GAAAAAGAAT GCATACAAAG CGCCCCAATA GTCCTGCTGC 4440 + CTGAAAACAA CAGACGCAGC GAAATGATAG TAATAGCATC TGTCTACTGT CCGCCCTCGC 4500 + TAAGGTGGTT GCCCCACCAC TTTACTGACG TTCTCAATTT TGCAGAGAAA ACTTTAGGAG 4560 + GGCAGACCAA GTTTATCCTA TGTGGCGACT GGAATGCAAA ACATAGACAA TGGGGTTGTA 4620 + CACGCGCCTG CCAACGTGGC ACCGCACTCT ACGAAGCAGT CCAAGCCGAC TCCACTGCAG 4680 + AGATCATTGC CACTGGCTGT GCTACACATT TCCCACATGA CACAAGAAAA AACCCGTCAG 4740 + CAATAGATTT CTCCATTTGC AAAGGGCTTG GCAGGTTTGA AAAAAGAATT TCTTCAGGGG 4800 + CGGATCTATC CTCAGACCAT CTTCCCATCT TGTTAGAGAT AAACCTAGAC ACAAACACCC 4860 + TCTTCTTGCA AAAACAAAAC AACAATATAC TCAAGAAAAA TACAAACATC GAGCTGTTTA 4920 + AGAAAGTTCT AGAAAGAAAG ATACTATTAA ACACTGAGAT AAGGGTAGCA GAAGATATAA 4980 + ATGACGCCAT AAGCACCTTT ATGAAAAACA TCAAGGACTC GGCTGCGGAA TCAACTCCCT 5040 + CCCCAAGAAT ACGTGACAAC CCCAGAAGAA GACATAGGCA AGCCAACAGA AACAGTCATA 5100 + CCCTCGCACT AGACGAAAAC ACAAGCAGAC TGCTTGAGGA AAAACGCATA TTAAGTAGAG 5160 + TTTTCAAAGC TACCAAAAAT TACGAGGACA AAGCTAAACT AAAGGCAGCT GAAAACCGAC 5220 + TAAAAAAAGC GATAAAAATA TTGAGAGAAA ACAGAATCAA TGAGCAAGTT GAAGGAATAG 5280 + ATACAAGTAA CCCGGACAGA ATGAGAAAAA TGTGGAAACT GCTAGATGAA GGGAAAAGGA 5340 + CAAATCAGCC TAATTTTCCC CTCAAATTAG AAACCCAAAA AGGACCCAAA TGGACAAAAA 5400 + CGATTAAGGA GACAACAGAA ACATTTGTCT CCCACTTGGA AGGAAGATTT AAGCCAAACA 5460 + ATAATGTACC TGATTACCAC ATAGATAGAG TCAATACTGG ACTAAGAATA ATTAAGGAAA 5520 + GCATGCTAAC TGAACGACAT AATCTGAACA AAAACCCCCA TAACCAACCT ATTACTCTAA 5580 + AGGAATTAAA TGACGAAATA AAAAACTTAA AGAATAGTAA AGCACCGGGA AAAGACCTTA 5640 + TAACAAACCA GCTAATAAAA ACCCTACCGA CTAAAGCTAC CCTTTACCTT ATCCTAATCT 5700 + ATAACTCCAT ACTTAGACTA GGATACTACC CAGAAGCCTG GAAACATGCG CAGGTAAAAA 5760 + TGATTCTCAA GCCAGGGAAA AGTGCAAACG AGCCAAGGTC ATATAGGCCG ATTAGCCTAC 5820 + TCTCGGGACT CTCAAAAATC TTTGAAAGAC TACTCTTAAA AAGACTTTTT AAGGTAGATT 5880 + TATTCAAAAA AGCTATTCCT CTGCACCAAT TTGGCTTTAG AAAAGAACAC GGATCGGAGC 5940 + AGCAAATAGC CAGGGTCACC CAGTTCATTC TTGAGGCCTT CGAGAGAAAG GAATACTGCT 6000 + CCGCGGTCTT CCTTGACATC TCTGAGGCTT TCGACAGGGT ATGGCACGAA GGCCTTTTAC 6060 + TTAAATTAGC TAAGATCCTA CCTTACAACT TGTACATTAT ACTGGAGAGC TACCTAACAA 6120 + ATAGAACGTT CGAAGTTAAA GACCAAGCTG GAGAGACTTC GAGAACAGGA CAAATTGGTG 6180 + CTGGTGTGCC TCAAGGAAGC AATCTTGGAC CACTACTCTA CTCTATCTTC TCCTCAGACA 6240 + TGCCCCTTCC ATATATCTAC CGCCCCTCAC CAACAGAAAG AATCATGCTC TCAACATACG 6300 + CAGACGACAC TATAGTCCTC AGCTCAGACA CACTAGCAAC TGCCGCTACA AGAAACAACG 6360 + AAAACTACCT CAAGTCATTC TCGGACTGGG CGGACAAATG GGGTATATCA GTAAACGCTG 6420 + CTAAAACCGG ACATGTCATT TTTACATTAA AAAACGACTT ACCTACAAGT CTAAGGACTA 6480 + TGAAGATCAA GGGTCAAGTA ATAAAGATTG AAAGCAAACA ATCATACCTT GGCGTAATCC 6540 + TTGACAGCAA GCTAACCCTC AGCTCCCACG TCACAAAGCT GATGGGCAAA TACACTACAG 6600 + CCTACAGAAA AATGACATGG ATTCTAAACA GAAGAAGCAA ACTCCCTACC AAGACTAAAA 6660 + TGCTGATCCT TAAGTCAGTC CTTTCACCAA TATGGCAGTA TGCCATAGCA GCTTGGGGTC 6720 + CCCTTGTGAC GGATGCACAG ATAAGACGGA TCCAAGTCGA GGAAAATAGG AAAATGAGAG 6780 + ACATATGCAG AGCGGGTAGA TACACGAGCA ACCAAACTAT AAGGGACCGC TATGGAATCA 6840 + AAACAGTAGA AGAATTCTAT CAACAGGCAC TCCACAGGTT CTCAGAAACA ATAAAATCTC 6900 + ACCCAAATAT AGCTGTACGC AGGATATTCA CAAGGCACTA TATCCCGAAC AGACTAGAAA 6960 + GAAGCAGGCA GAGGTACTTG AAAATGACAA ATGAACACAT CACGCAAAAA CAGACTGGAC 7020 + AAACACTCTC ACCTAAACTC CTAAAAATCC CTGATCTAAA TGACTGCAGA ACCCTTAAAA 7080 + AGCGGAATGA AAGAGATAAA ATAAGGCAAA CCCATCTAAT TGAACTCCCC ACCCTGCTGA 7140 + GACTAGAGGA AGAAGAGGAA GAGCTTAGAA GAATAAAAAA ACAGGAAGAG AGGGAAAGAA 7200 + GGGAAAAGGA AACCCAAAAG TGGCCTCCAG ACAGATGGTG TGAATTAGAA ATTAACCTAT 7260 + ATAATAAGCA ATATAGAAGG GGCGATCTAA CCAGGCAGGA AATCATACAA AAATTTAGAG 7320 + GACAACCACT AAATGTACAG AGGATAATTT TACCCGACTA TAAAGGAGAC CAGGAACACA 7380 + ATTAAAAGTA AATCATGGGA AAGCAGGGGA AAAAAAACAG AAGTAACAAA ATGGCGGAAG 7440 + GGGTGGCAAA ATATATATAA AAATAAGAAA AGATAGAAAT AAAAAGGCTA AAGGCTCACT 7500 + TACAGGTTAA TTCAAAAGGG AAACGTGCTT ACATATCTAA TGGTAAAAAC TAACTTATAA 7560 + CACCTACTGG ATGACATAGT GAGGATGCCA CAGGTTGCGC ACTTGAATCA CGCTTTCCTG 7620 + GCGAGATTGT TAAGGCATCA CCGGGATCCC GTCTCTCTTT CCTAACTGGA GGACTCATGC 7680 + CTGAAATCTT TTCCGCTTCA CCGGCACCTG ATGGCCATAT CTGCTACTGC GCCTTGCGTC 7740 + CACGGACGCT CCTTCCTGAA AGAAAGAGAA TTTGTTTTAG TTTTCCTTTC TCTTCTTAAA 7800 + AATATAACAA AAACAGCAGC AGTAGCCGAC CAACAACATA CTTAGCTTAC CAAGGCAGCA 7860 + GCAATGATAC CAACAGAAGC CCTACAGTGT GCTGAACAAT ATGCCGCCCA CGCCCACCAC 7920 + TTCTGGAACT CAGGAATGGG GGGTACGGAA TGCCGGAAAC TGGAGGATTC GCCTCAAATG 7980 + TTACGCTTAC ATCTTTGAGC AAATCGCCTG CCTCCTCGTC TAACGGCCCG GCGTCTTGGT 8040 + ACGCCCAGAA GTAGCAGCGG TAGCAGGATT AGCAGCCTCC ACAGAGATAT GTTCATCCCA 8100 + GCATCAGTCC AGTTGGCATT GTGATGCCGC CGTAGCGTAC GCCCTCAGAG ACCCGACTGG 8160 + AATCCCAGGA CAAGAGACGG CAGCACGCCT GGGCTTAGGC GCGGGACAAC ATGCAGAGAT 8220 + TCGTCAATGA GAATGGCGGC ACTGGAATCA CCTTTCAGCT GAGCGGGATA ATGAGTCGGC 8280 + AACGCACCGC ACTATCAGCA GCAATAACAA CATCGGCAGA TGACCTGGAA GAAAGGAAAA 8340 + AACATGTATC AGTCTTTTCT TTTCTTTTTT TTTCCCATTA GCATGCGTTT TTAAATTCCA 8400 + TTCCTGAAAA CCGGCGTTTT CCTGTAAAAG ACACTGGACG GCGGCGTTTG TTTTAAATGC 8460 + AAAGATTGGA TGCTTGCATC AGGGCTGACG TCCTTGAATA GCCGATGCCT TGTAATTGCC 8520 + TGCATAGCCG CGGAGGTCCT GATGACGGAT GCTGGCCTGT ATTTGGCCAC CACTCCGATG 8580 + CCATGACAGC AGCAACAGCA GCGGTTTTTG CAAATGAGAG GGATCAGGAG GCGGCAACAC 8640 + ATTCACCCGT AGCAGCAACA ACAAGCAGTG GTAGCATCAG CAGGGAGTCT TCTCGCCACA 8700 + ATAGCCATTT GGAAATTTCT CGACGACCCG ACTTCCTGCT TGGCCCATGG TCAATCACAC 8760 + TGGACCAGTT AACAGCGGCG TTTTACCCTG GAAGAAAGAA AACTTGTATT ATTCATTCCC 8820 + TTTTCTCTCA CAGTTGGGTA TTTAAGTGCA TTCCTGGCCA ACCTAGCGTG TCTCCTGGCA 8880 + ATGACGTCGG ACTCAACGCA TGCTTCCCTT CCGACACAGT AAGGATGTTC GCATCTGGGC 8940 + TGACGGGCCA GGCCGGTCCG TTGCCATACA TGCTAGCGTT TCCGCGGCGG CGTAGTGAAC 9000 + ATCAAACCGT ATAATGGCGA AGACGACGAT GATCCGGCCG GATGGCAGCT CGACGACGGT 9060 + AGCAGGCCAC CATGCCCGCC AGCCCGCAGC TAGGATAGCA GCAACATCAG CGTCTTATTA 9120 + ACGCGAACGG CGGCACTGGC CCTTAGCTGA CCAGCTGCAA CAACATCAGC GACGCAGTCT 9180 + CCACCAGCAG CAACAACAGC AGCGGCGCTT GCGACAGCAG CAGCAGGGAA TGGTTCTGCC 9240 + GCAGTCGCCT ATTGCTGCCT ATAAAGAGCA TTCCTTGCCA ATTGGCTTTC TGTACGACGA 9300 + CGATGATCCT GCGGACAAAT CCACCTTTCC GGACGCCTGA GTATTATGGC GAGCCTGCTG 9360 + ATCATTGTTT CTCCGACTCC TTACTTGACC ACTGGACAAT CATACAATCA CCGGCTTTTC 9420 + ACATCTGGAA GAAAGAAACC TGGATTAGTA TTTGCCCTTC AGATTTGTAT GAAACTGCAT 9480 + TTCTGGCCAA CCGGAGTGTT TCCTGCAGAC GACGCTGGAC TGCGACGCAC TTTTTTCTAC 9540 + CAACACAGAT GGGACGCTTG CATCAGATCT GACGGGCCAG ACTGGCCGAT GCCTGGTACA 9600 + CGATGGCATC TCCGCGGCGG CGAGATGTGC AGCGACGCTG AAAGCAATAA TAATTCTTTT 9660 + ACTTTGCAGT ATCAAAAATG AGAAGCCACA TCACAATTTA CATCAGCAAA AATTACACGT 9720 + GATATCTTTT TCTTTTGCCT AGGAGTAGTG AGACCTGCTA CCAAAATGAC CAGTAATACC 9780 + GGCTAACGGA AGCGAGATAT CGATAATCAT TCTGGCGGTA AAATAGCCAG AACATCGATA 9840 + ACCAGCTGTG CATTTTCCCT TCGATTTATC GAAGTCAAAT AGCCCGCCTA GGCTATCGGA 9900 + CCGGATCGGC AAGTCAGTAG TGATTAAAAA TCCGGCAGAG GCGCCTGTGC AGCAGCTACC 9960 + CAAAGTGAAC ACGACGAAAC GCAACAACAA AATGGACGGA CATAATGGAG ATCAAAGTGA 10020 + AGGATGGGCA ACAGTGCTAT CTATCTCCTC GGATGATAGT AACTCCTTGT CGTCGCTGCA 10080 + TATATAAAAT AATAAATTTC TTAAAATAAT TTCATCGCTG GATTCCTGCG CCACCATAAA 10140 + TTACTTATAG AATACACTTA ACACTGTACC CACTAATGCT AAAAATTTTC TTATACAATT 10200 + TTACTTTAAA GCTAAAACTA CTTAAACTAT GGCGCGTAAA ACGGCCGTCA AAAATATCCA 10260 + AAAATTGTAC TTGCCATAAA CAAATTCTAA CATAATGTAA ATCCTAAATC GTAAAATCAT 10320 + GGCGAACATA ACCGCCGCCA AGCAAATCAA AAAATGTTCC TAGAAATTGT AAATCTTAAA 10380 + CCTACTTCTC TAACTAAAGC GCGCACAACT GCCGCTGATC CGAAATTGTA AAATGCCATA 10440 + AATTGTAACT ATATATTTTA TAAAAAAAAT CAGAGTACAA TAAAATGACA GCGCCGAAAG 10500 + GCACTGAAAA TATTTAAAAA AAAAAAAAAC TGCCGCTGAT CCGAAATTGT AAAATGCCAT 10560 + AAATTGTAAC TATATATTTT ATAAAAAAAA TCAGAGTACA ATAAAATGAC AGCGCCGAAA 10620 + GGCACTGAAA ATATTTAAAA AAAAAAAAAA AAAA 10654 +// +ID TIRANT standard; DNA; INV; 8526 BP. +XX +AC nnnnnnnn; +XX +DR FLYBASE; FBte0000179; Dmel\Tirant. +XX +SY synonym: prygun +XX +FT source X93507:1..2484 +FT SO_feature five_prime_LTR ; SO:0000425:1..417 +FT SO_feature three_prime_LTR ; SO:0000426:8109..8526 +FT SO_feature CDS ; SO:0000316:1866..2999 +FT SO_feature CDS ; SO:0000316:3239..6505 +FT SO_feature CDS ; SO:0000316:6683..8146 +XX +CC Sequence identified by REPBASE: +CC http://www.girinst.org/server/RepBase/RepBase6.6.embl/drorep.ref +CC Assembled and annotated by Josh Kaminker & Michael Ashburner. +CC REPBASE states this to be a consensus sequence. +CC This replaces that from X93507 in versions previous to 4.8. +XX +SQ Sequence 8526 BP; 2961 A; 2097 C; 1384 G; 2084 T; 0 other; + GGAGTTACCA CCCCACCCCC TAAACCCCCA CGCCTCTAAA CAAATCATCG GACACTCAAC 60 + CGGGAAGACG GCAACTGGAA CACCGCATCC GGCCGAATGC TGACATTCCG GCCGAATGCT 120 + GACATTACAC AAAAGTCGCA CTGCAACATT GTCCCCAGCT AGCCAGCCAC ATGCCGAGTC 180 + GGCATGTTCA TTATGCTTAC AATTAAGAAC CTATGTACTT ATGTATAAGA CGAAAACGGA 240 + GGACTCGAGT AGCCACTCTC TGACAATAAA CTTGATACTG ATTTTGAACT TCAAGAAAGT 300 + CAGTCGTATT CTTTATTGGA AATCTTCACA CTACAACTAT CTGCTGAAAC TTAAAAACCT 360 + TCATACATTT ACACATCATA TCTTCACAAA AGGCTCCACC CTCGATCACG GACTTAACTG 420 + GCGCAGCCGG TAGGATGTCC TACCTATTAA TAATTACCTA CCTGTAAGTA AACATGTAAG 480 + AAACGAAACA AACTATATGC AAGATGTCGA CTGAAAGTGA CTAGGAACAA ATTTTTATAA 540 + AACAAAATTG AAGTTGTGAA GTACCAAATG AAACTCAAAC ATATATTCAA ACACAGGAAA 600 + AAAAAAGAGA GAGGAAAAAT GTAAAATAAA TAAATATACA AAAAAAAGTG CAAGTGTACC 660 + GTACTGCCGC GCTGACGTGG AATCTATCGC TGATCATCAC GCCATCGGTA TGTCCATACT 720 + CTGCCGAACG TCATAATTTT TTTAAAAAAG TGCAAGTGTA CCGTACTGCC GCACTGACGT 780 + GGAATCTATC GCTGATCATC ACGCCATCGG TATGTCCATA CTCTGCCGAA CGTCATAATT 840 + TTTATAAAAA AGTGCAAGTG TACCGTACTG CCGCGCTGAC GTGGAATCTA TCGCTGATCA 900 + TCACGCCATC GGTATGTCCA TACTCTGCCA AACGTCATAA TTTTTATAAA AAAGTGCAAG 960 + TGTACCGTAC TGCCGCGCTG ACGTGGAATC TATCGCTGAT CATCACGCCA TCGGTATGTC 1020 + CATACTCTGC CAAACGTCAT AATTTTTATA AAAAAAGTGC AAGTGTACCG TACTGCTGCG 1080 + CTGACGTGGA ATCTATCGCT GATCACCACG CCATCGGTAT GTCCATACTC TGCCAAACGT 1140 + CATAAGTTTT TATAAAAAAA AAGAGTGCAA GTGTACCGTA CTGCCGCGCT GACGTGGAAT 1200 + CTATCGCTGA TCATCACGTC ATCGGCACTT ACATACGCTG GCCAACGCAT CGCCAAAGCC 1260 + TCTATATACA CTTATATATG TGAGCATACA ATATCAACTA CAATCCAATA CATCCACGTA 1320 + CTGTACCGCC TCGTTGGCAT GGAATCAAAC GCTGATCACC ATGCCACCGT GGTAAACAAA 1380 + CAAAGCACCA AAGCCTCTCT AATACATTGT ACACTCAAAA CGCACACTGC CATACGTCGG 1440 + CGAAAAATCA AAACATAAGC AAAAATCATT TCAAACCAAG CGAGGCTCAT TCTGCGTACC 1500 + ACAACGACAA CGACACTGCA TGTGTAGTGG CGCACCCATG TCTGGGTAGC CGAGGTAAGG 1560 + GGAAAACGCT TGAGTATCGT CAAGTGTTCT TGCCTTTCAC TCTTCTACAA TGGGTTGCTA 1620 + CGCTCATGTA TTGCACATTC AAAATAACCA AAACAAATGT ACTAAAGAAG TCGACATATA 1680 + CAGATATATT TTGTTTCCTT TCATTGTGTA ATTTTGTATA TCAAACAAAT ACTAATACCA 1740 + ATCACATTGC AGAATATAAA AGGGAAAATA TAAAGCCAAA GACAGACACC CATACACTCT 1800 + AGTAAACAAG AAATTTGTTC ATTATTTTTC AATCATACAT AATATACTAA GTAACCTCAA 1860 + ATTTAATGTC AAAAAAGTTC GTTTACAACC TTAGGAAAAC TACACGTTCA GTTGTTGGAG 1920 + TTCCACCAAA CACTAATAGG CCCCCACATC CCGTTAGACG TCCTGACTCC CTTCTCCCGA 1980 + TTTCGGAAGA ACCCAAATCA ATATCTTCCC AAACCCCCAA TATGGACTCG GGAAACGATT 2040 + CTGCCCGCCC CACTCCATCC CCTCTGGCGC CCACTGTCAG TGGTATTAGC TCCTTAATTT 2100 + CAACTACGTT CAAGCCTAAA GATATCATGG CATTTGTTGA GCATTTGCCA ACCTTTGATG 2160 + GTACACCTCG TCTATTGGAC AGGTTTATCA CTAGCGTAGA AGAAATCCTG ATGCTCATCA 2220 + GGGGAGCTGA CCAAACACCG TATGGCCTGC TTACTCTGAG GACCATCAGG AACAAAATCA 2280 + TTGATAGGGC CGACGAAGCC TTGGAACTGG CAAATACCCC CTTGGTTTGG GATGAGATTA 2340 + AAAGCAATCT CATCCGCCTC TACTCGAGCA AGAAAAGCGA GGCCAACTTG TTAAGCGAGC 2400 + TTAACACATT TTCGGACAAC CTGACCTTGG GCCAACTGTT CTTTGGTATA TCAAAGGTGA 2460 + GAAGCCAACT CTTCTCCATA CTCAAAAACA GCGAACACAA CAACACTGTT GTAGATGCAA 2520 + AAAAGGTTGT CTACAACGAG GTTTGTCTCA ATGCTTTTAT GACTGGTTTG AAGGAACCTC 2580 + TCAAGACTTT CGTCAGGATA AAGTCCCCTT CTACACTTGA ACAGGCGTAC GAGCAATGCC 2640 + AAATAGAGCA GACCTTATAT AGGGCACAAA ACAAGCGAAC CAACAGACCA GAGCAGGGAC 2700 + CCAATGGATC AGACAATAAA ACCTACCGAA ATAGCTACGA CAGCAATTAC CGCAGCGGAC 2760 + GTAACGACCG AAATGACCGT AGGGGACCCT ACTCTAACTC TAACTCTAAC TCTAACTCTG 2820 + GCCAAAATAG ACCATTTAAT TCACACAATC GCACACCCCA ATCCGGCACC AAGGACAACC 2880 + GGGCCAATAC ATCAAACCCC TTTCGAGCAC CTTCACATAG TTTGAATAAT ATAGAGGAGA 2940 + ACCCTCAACC TGATTCGAAT TTTCAGCAAA CGGCCTCGGG AAACCAACAG GGTACATAAG 3000 + CCCAGCCACG CACAACCCCT CGCTTCCTTT TATAAAAATC AAACTATCCC AGACAAACCC 3060 + CCTGAAGTTT TTAATTGACA CAGGCTCTAC ACACTCCTTC ATCGACCCAA AATATGTCGA 3120 + CCCTAGGAAC TGTGTGACCT TAGATACGCC CATAACACTC AAAACAGCCC TGAACAGTTT 3180 + TAAAATATAT CAAAACGTCT CTATACCATT TCCACCGGAA TTCCAAATCA CGGGCAAAAT 3240 + GACCCTTCTA CCTTTCAAGT TCCACTCTTA TTTTGACGGA TTGATAGGAA TGGACTTATT 3300 + ATCTTACCTA AAAACAGAAA TAGATTTACT TAACCTAAAT CTAAAAACCC CAAGTACCAT 3360 + TATACCCTTA TGGACCCACA GTAACTCAAC TTCAAACGTA TTTAATATCT CTGGACATAC 3420 + GAAAACTATT TTGCCACTAC CAGTGGAAAC CAAACAGGGC GACTTCTACA TCGATTCAAT 3480 + TACAATCAAT GATGACTTAA TAATATCAGA CGGGATTTAT AATGCCCAAA ACAATATTGC 3540 + TAATTTCGTT ATCACAAACT ATAGCGAGAG GGATCAGTTA TTGTACCTCG AGAGCCCGAT 3600 + AAAAGGCATG CCATACTCCA CGGCCAACAA TGTTGAACTT TTCAGTATCA CTTCAGACAC 3660 + CCCACAGCCC CAAAACTCCG CAGCGTCGTT ACAAGCCCTT GGCGTCGATC ACCTCTCCTC 3720 + TGAAGAGAAA CAAAGCCTAC TTTCACTTTG CAAAAGTTAT CTAGATATCT TCTACAATGA 3780 + AGACAAATCA TTGACCTTCA CCAACAAGAT TACACACACG ATTAAAACCA CGGACGACAC 3840 + CCCCATTCAT ACAAAATCTT ATAGATATCC TTACATTCAT AAAGAGGAGG TCAAAAAACA 3900 + AATAGAGGCA ATGTTAAATC AGGACATTAT CAAATCCAGT TATTCCCCGT GGAGCGCCCC 3960 + CGTCTGGGTC GTCCCAAAGA AAATCACTCC TACGGGAGAG CAAAAATGGC GTCTAGTTAT 4020 + CGATTATAGA AAACTCAACG AGAAGACTAT ATCCGATAGA TATCCAATAC CTAACATCGC 4080 + GGATATCTTA GACAGATTGG GCAAAGCCAA ATATTTCTCC ACACTTGATC TGGCAAGTGG 4140 + ATTCCATCAG ATAGAAATGA ATCCCGACGA CACACCCAAA ACTGCATTTA CAGTAGAGGG 4200 + GGGCCACTAC GAGTTCATTA GAATGCCGTT TGGCCTCAAA AATGCCCCAG CCACATTCCA 4260 + AAGGGTGATG GACAATATTT TTGGAGACCT TATCGGAACT ATCTGCCTAG TTTACCTAGA 4320 + TGATATAATA ATTTTCTCAA CCTCCTTACA AGAACACTTC ATACACTTGA AAACTATTTT 4380 + TGGAAGACTC AGATCTGCCA ACTTTAAAGT CCAACTCACA AAATCCTACT TCCTCAGGCG 4440 + GGAGACAGAA TTCCTTGGCC ACATCGTTTC ACAAGAAGGT GTTAGGCCAA ATCCCAATAA 4500 + GATCGAAGCT ATAAAAAACT TTCCATGTCC CCACAGTAAA AAGTCAATTA AGTCTTTCCT 4560 + AGGCTTGTTG GGATATTACA GAAAATTTAT CAGAGATTTT GCGAGACTTA CCCAACCCAT 4620 + GACACAAAAA TTAAGGGGAA ACAATAAATC GATCATAATA GATGATGAAT TCAAAAAGGC 4680 + CTTTGAATAT TGCAAAACCT TACTGTCTAA CGACCCAATC CTCCAATACC CGGACTTTAC 4740 + AAAACCTTTC ACACTAACCA CGGACGCAAG TAATTTCGCA ATAGGAGCTG TCCTATCCCA 4800 + AGGTCCGGTG CATAGTGATA GGCCCGTATG TTTTGCTAGT AGAACCTTGT CGGCTGCGGA 4860 + AACAAATTAT TCCACAATTG AGAAGGAAAT GCTGGCCATT ATATGGGCGG TCCAATACTT 4920 + CAGACCCTAC CTCTTTGGCA GGAGATTCAC TATAATCACC GATCACAAAC CACTAACTTG 4980 + GTTAATGAAT TTCAAACAAC CAAATTCTAA AATAGTTAGG TGGAGACTCC AGCTTCAGGA 5040 + GTACGATTTC GAAGTCGTCT ACAAGAAAGG CTCTCAAAAT GTAATTGCTG ATGCTCTCAG 5100 + TAGACCAGAG GCCTCTGTCA ACCATAACGA AGCCCTATCA ATTCCTCAAA ATGTTTGCCC 5160 + CATCTCAGAG AAACCCCTTA ATGATTTTAA TATTCAGCTC CTGTTCAAAA TAACCCCAGA 5220 + TACAAATAAC GCCACACTGA CCCCGTTTAA ACACAAACTT AGGAGGGAAT TCTGTAAACC 5280 + CAATTTTCAG TATGACGACG TAGTTTGCAT TCTTAGGCAG TCGTTAAAAC CAAACAAGAC 5340 + ATGCGCGGTA TTTGCCCCCG ACCACATTTT TCAAATGGTG GAACAAGCCT ACCAAACCTA 5400 + CTTCTCAGCC CACAGTCAAT TTAAACTCAT TAGATGTTTG ATCTTCCTCC CCGAAATTAC 5460 + TGATAGTACG GAGATCGAAA AAATTATAAC CGACTATCAC TATAATAGTA ACCATCGAGG 5520 + GATCGATGAA ACATATTTAC ACATAAAACG ACAACAGTTC TTCCCACATA TGAAGGAGAG 5580 + AATAACTCAG TTAATTCGAA AATGTGAAAC ATGTTTAAAA TTAAAATACG ACAGACAACC 5640 + TCAAAAGATC ACTTACCAAA TATCCGAACT ACCTTCAAAA CCGTTGGACA TCTTACATAT 5700 + AGACATTTAT ACTATTAACA AAAATTATAA CCTTACTATT ATCGATAAAT TTTCTAAATT 5760 + TGCGGCTGCC TACCCTATAA CTAATAGGAA TTGCATTAAC GTAGTTAAAG CCTTAAAACA 5820 + TTTCATTTCC CAATTTGGTA TTCCCAAAAA GCTGATCTAT GATCAGGGAG CAGAATTCGC 5880 + TAGCGATATG TTCAATAAGT TCTGCACTCA ATTTAACATT GACCTACACG TTACGTCCTT 5940 + TCAACAATCC TCTAGTAACT CTCCCGTTGA ACGGCTTCAC TCGACACTAA CTGAGATTTA 6000 + CAGAATAATA CTTGACGTCA GGAAACAACA GAAACTCAGT AGCGAGCATG ACGAGATAAT 6060 + GTCCGAAACC CTAATCACAT ATAATAACGC TATTCATTCT GCAACTAAAC ATACCCCCTT 6120 + TGAACTATTT AACGGACGTA CTCATATATT CAACCAAACA ATCCAGTTCA ATAACGAACA 6180 + CGACTACTTA ACGAAATTAA ATGAATTTCG CGAGAAGTTG TACCCCCTCA TCACGGACAA 6240 + ACTTTCAAAT GACGTAGTTA GGAGAACCCT AAAATTAAAT GAAACCCGAA CAGACCCCGT 6300 + AGACCTACAA CCAGACACTT TAGTCCTTAG GAAGGAAAAC AGACGTAATA AGATTACACC 6360 + CAGGTTTTCG ATTCACAAAG TCAAACACGA CAAAGGTCAT ACATTGATAA CTGCTAGGAA 6420 + TCAAAAACTA CACAAATCAA AAATTCGAAA AACAGTTTTG AAAAAAGACA AAAGCAACAA 6480 + CGTACCCAAC ACTGATAATA ACTGACCCCA CTACCTCTTA ACTTACCATT TCAGGTTCAC 6540 + CCTTGTGCCA ACTCAGGCTA TCCATGTCCA TTATTTAAAT GATAACGCCC CTATAGCCAA 6600 + GATAGAACTA GGGAAAGCCT TACTAATTGA GAGGTACAAA ATAATTAGTC ATGTAATCAA 6660 + CCTACAAGAC TACAGCAGAT GTATGGAACA ATTCCATCTG ACCATTAATA AATTTAACCC 6720 + CGATTCCACG TTGACGGACT CCGTCACAAT TTTAAAAACC AAATTAACCC AAGCCCAAGT 6780 + AAAGCTCAAA GCCCTTACAC CTTCATATAG AAACAAACGG GGTTTGATTA ACGGATTGGG 6840 + GAGTCTAGTA AAGGTGGTTA CCGGCAACAT GGATGCCAAC GACAATAAAG AAATACATGA 6900 + AGAACTTGAC AATATAAAGA AAAATTCCGA AGTCAGTAAC GACAATCTCC AAAAACAAGT 6960 + AATGTTTAAC AACGAAATAC TTATCCGGTT CGAAAATATC ACGGACCATA TAAATAATGA 7020 + ACAAATTTTG ATAAGTAAAT TCTTTGATAC CTCACAAAAC AAAATATACA AACACTTAAA 7080 + CTTACAAGAT ACCCTTCTGG AAGAAATACA ATATTTAAAT AGGATTAATT ATAACATAGA 7140 + ATTATTCATT AACCACCTAA ACGACATAAC AGAAAGTATG CTATTGGCGA AAATAAATAT 7200 + AATTCCCAAG TTCATCCTAA ATGAACAAGA AATGGATAAA ATAAAAACAA TACTGGAAAA 7260 + ACAAAATATC ACAGTCAAAA ATGAACAAAG TATATACAAT TTCCTACAAA TGAATACACT 7320 + AAATTACGAA CAAAAGATTA TTTTTAATAT CAAAGTCCCA ATTTTTAAAC AACCTTTTCA 7380 + TACCCTCGCC AGACTAGTTC CATTACCAAT AAATAACACA TATTTTGTAA TAACCCCAAA 7440 + TTACCTAGCT TATAATATTA ATAATAAGAA ATTTCATATG ACCCGTAAAT GCCCCAAACT 7500 + GGATAATACA TTCTTGTGCG ACGAGAACTT CTACGTTGAT ACACCACAGA ACAACACATG 7560 + CCTGGAACAC CTTTTGAACG GAGAAAACAG TTCCTGCGAT GTACGGGAAA CCGGCCCCAT 7620 + CACCGACGTG TTCGAGGCAG AGAGAGGTTA CATCTTCGCA TTCAACGTGA ACAAACTGAA 7680 + GGTATCCCTA ACAAACGGCT CCGAGCTCTC AATAATGGGG TCAGCCATCA TCAGATACAT 7740 + TAACGAAACA ATACAGATTA ACGGTATCGA TTACGACGGC ACGGTTGACA CGTTCCCTGA 7800 + ACAGACGGAT TTTGATCTTC CCCCCATGCG AAAAGTAACT AGGAATACCA CTATTACGGT 7860 + ACTAAGCCTA GAAAAACTGC ACCTCGAAGC CACCCAAACA ATGGATAAAA TCCTGGCCGT 7920 + CCATCACAAT ACTATACAGC ACACCTGGAC ACTCTACACT CTGCTCGGAT TGGTAACGTT 7980 + CCTAGCAGTC ATCTTATGGC TGCACCGACG AACGAAACAC ATCGTCCACA TCCACGAGGA 8040 + TCATCACGTA CCAATCTACG CGTCATCCAT ACCTTCGCTA TGGCCGTCAC TTCGAACTGG 8100 + GGGGGGAGGA GTTACCACCC CACCCCCTAA ACCCCCACGC CTCTAAACAA ATCATCGGAC 8160 + ACTCAACCGG GAAGACGGCA ACTGGAACAC CGCATCCGGC CGAATGCTGA CATTCCGGCC 8220 + GAATGCTGAC ATTACACAAA AGTCGCACTG CAACATTGTC CCCAGCTAGC CAGCCACATG 8280 + CCGAGTCGGC ATGTTCATTA TGCTTACAAT TAAGAACCTA TGTACTTATG TATAAGACGA 8340 + AAACGGAGGA CTCGAGTAGC CACTCTCTGA CAATAAACTT GATACTGATT TTGAACTTCA 8400 + AGAAAGTCAG TCGTATTCTT TATTGGAAAT CTTCACACTA CAACTATCTG CTGAAACTTA 8460 + AAAACCTTCA TACATTTACA CATCATATCT TCACAAAAGG CTCCACCCTC GATCACGGAC 8520 + TTAACT 8526 +// +ID DMBLPP standard; DNA; INV; 5034 BP. +XX +AC Z27119; +XX +DR FLYBASE; FBte0000660; Dmel\flea. +XX +SY synonym: blastopia +SY synonym: Kermit +XX +FT source Z27119:372..5405 +FT SO_feature five_prime_LTR ; SO:0000425:1..275 +FT SO_feature three_prime_LTR ; SO:0000426:4757..5034 +FT SO_feature polyA_site ; SO:0000553:5006..5011 +FT SO_feature polyA_site ; SO:0000553:5019..5024 +FT SO_feature CDS ; SO:0000316:760..4761 +FT /name="Dmel\flea\polyprotein" +FT /db_xref="FLYBASE:FBgn0043491" +FT /db_xref="SPTREMBL:Q24262" +FT /db_xref="NCBI_PROTEIN:CAA81643.1" +FT /translation="MFTRTPPTNKKLNTDQIQAILENESEDESRKEKMNEEDQKLAPVG +FT EAEAKKQNKDASAKVEEKFEQMMNTLTQSMLAKSKQEGQVIIAAEKFEKVVSDCDGKSI +FT PIKKWFEIFEKNAEAYELSEKQKYVQARSKMIGSAELFLESECVSGYTELKELLIEEFS +FT GSYNSAVIHKKLQDRKKKREETLHDYLLQMKKIAALGEVETVALITHIVNGLDIKKEYK +FT GAMLRCKTLKELKQEFEIYESLNIVDKPNIQPKPKQITQGVKADHCFNCGSREHKRKDC +FT TLPTKCFSCNQEGHISSKCPEKVNSMRIHVDSARTKPVIINGIIINCLVDTGSDVTIIK +FT EAIFKKMKDVDLNRTATVLRGLGNASTQPIGCFRALIKTDQVEASHNVLVVHDSKFSCD +FT GIVGHDFISKFRLICSAEGYTFLDLEADKKQAVEYSQMFNICEESSFTVAPQYREDVER +FT MIERTYETPPKQIKQCPVELKIIPDGVIKPFRHGHTRLSEEEAIAVKKQVEEWVEQSIV +FT RKSTSNVASRIVVVRKKDGTLRVCVDYRKLNTMVLMDCFPVPIMEEVLEKLQSAKWFTT +FT MDLQNGFFHVAVEEASKPYTAFVTREGLFEFNKAPFGFKNSPAAFIRFVQFIFQELINS +FT NIMQLYMDDIIVYAATPEECMEKTEMVLKRAAEFGLKIKWKKCNFMQRRIHFLGHIIEG +FT GQICPGKEKTSAVNSFGTPQNVKAVQGFLGLTGFFRKFIPGYAQIARPLTDLLKKDAIF +FT NIGPVEQQSVNKLKEILVNEPVLRIYSREAETELHTDASKDGLGAVLLQKFEGSFHPVC +FT FWSRKTTKAESNRHSYYLEVKAAYLALKKFRHYLLGVPFKLVTDCVAFKQTTKKADVPR +FT EVGPWILYMQDFNFQPEHRAGERMRHVDFLSRHPQACMMITSELTARIKKSQQNDDSIR +FT AILEILKDRLFQPYKLKGGLLYSMVNGNELLVVPALMEREVIQSAHEVGHLSLQKTMHS +FT IQQQFFYFLIWEYKVKKLISNCIKCIIHSKKLGKQEGYLNCIDKGDAPLHTLHIDHLGP +FT MDSSAKQYKYILATVDAFSKFVWLFPTKSTGQEEVVKRLTDWSNIFGFPKRIVSDKGTA +FT FTSGAFEQFMSSHNVEHVCTTTGVARGNGQIERVNRLILAIISKLSSDEPSKWYKYVPE +FT VQKAINCHVHSSLKLSPFEVMFGTKMYTRVEDRLLELLQEEVVCQFNEDRYEMRQLVKR +FT NIEQAQKDYKRNYDKKRRAEYKYKAGDLVAIKRTQFVAGRKMASGYLGPYEVTGVKDNG +FT RYDVKKAANVEGPNVTSTSCDNMKLWKYIAENADLLSSGSDDDDQEGRM" +XX +CC Derived from Z27119 (g415797) (Rel. 50, Last updated, Version 6). +CC Takis Benos and Michael Ashburner, 20-Aug-1997. +CC Any changes to original sequence record are annotated in an FT line. +XX +SQ Sequence 5034 BP; 1719 A; 938 C; 1145 G; 1232 T; 0 other; + TGTAACATGA GTAAGGCTGA AGGCTGGCAA CAACCCGGTT GGCAGCGCTG TTGAGCAGCA 60 + ACATGATTGT CGGAAATCCA AGTTATCGAC AATCAGTCAT CGAAGGACGA TCGCAGGCAG 120 + CAGTAGAGGC GAGTGGAAGT CAGCGTTGCA GTCAGTCGAG TTCTCAGCAG CAGTCGTTCG 180 + GTCCACAAAC TAAGAAATAC TTTATATAAT TACCGCATTT AGAATTAAAC TAATAATTAA 240 + ATTAATAATA AACAATAATA ATAAACAATC TTACATGGGG GCTCGTCCAG TCCTAAATCG 300 + GTTATATGAA GGTGCAGTTG TTTAAAGAAA AAAGACATTG TTGTGTGCGT GGGTATAGTC 360 + TTTAAAACGT TGTAAAGTTG TGGCTATATC TATTGCATTT AAAGTTGGAA AAATCAGTTG 420 + TACAGATTTT GTTTGAACAC AAGTCGGTAA AAGTCGGGAA AGCTGCTAGA GAGAACTGAT 480 + AAAGTTGAAA TTGTCGTGTG CGTGGATTTA GTCTTTAAAG TTGTAAAGTT ATGGCTACGT 540 + CTACTGCATT GAAAGTTGAA AAAATCGATT GAACTCATAC AGACTCAAGT CGTTTTGCTG 600 + TTGTGGAATT TAAAACAATT AAATTGCAAA GGTGGTGAAA TTCGTTTCTA ACGAAAATCA 660 + AAATTTGTCT TTTAACCGGT GGCGCCGTCT GCAAAATCGA CTACCGTCGC GCCGTTAGAA 720 + CATTGTCGTT GTTTGCTGGT GTTAGTGCCT TGTCGCGGAA TGTTCACACG TACACCACCT 780 + ACAAATAAAA AACTTAACAC CGACCAAATA CAAGCAATTC TAGAGAACGA AAGCGAGGAC 840 + GAAAGCAGAA AAGAAAAAAT GAACGAAGAA GATCAAAAGT TGGCGCCTGT AGGAGAAGCA 900 + GAGGCAAAGA AGCAGAATAA AGACGCTAGT GCTAAAGTCG AAGAGAAATT TGAACAAATG 960 + ATGAATACTC TAACCCAGAG CATGTTGGCA AAATCTAAAC AAGAGGGGCA AGTAATTATC 1020 + GCTGCAGAAA AATTTGAAAA AGTTGTAAGT GACTGTGATG GCAAATCAAT TCCTATTAAA 1080 + AAATGGTTTG AAATTTTTGA GAAAAATGCC GAGGCATATG AACTTTCGGA GAAACAAAAA 1140 + TATGTTCAAG CCAGAAGTAA GATGATTGGA TCAGCAGAAC TTTTCTTAGA ATCTGAATGT 1200 + GTCAGTGGAT ACACTGAACT CAAAGAGTTA CTAATTGAAG AATTTTCAGG CAGCTATAAT 1260 + AGCGCCGTTA TTCACAAAAA GTTGCAAGAC AGGAAGAAGA AGAGGGAGGA AACTCTACAC 1320 + GACTATTTGT TACAAATGAA GAAAATAGCA GCCTTAGGTG AAGTTGAAAC AGTTGCTTTG 1380 + ATAACTCATA TCGTAAACGG CCTCGACATT AAAAAGGAGT ATAAGGGTGC TATGCTCCGT 1440 + TGTAAAACTC TTAAGGAATT AAAGCAAGAA TTCGAAATCT ACGAGAGTCT GAATATTGTT 1500 + GACAAGCCGA ATATTCAACC AAAACCAAAG CAAATTACAC AAGGTGTAAA AGCAGATCAC 1560 + TGCTTCAACT GTGGTTCGAG GGAACACAAA CGAAAGGATT GTACACTTCC TACCAAATGT 1620 + TTCAGCTGTA ATCAAGAGGG CCATATCTCA AGCAAGTGTC CGGAAAAAGT AAACAGCATG 1680 + CGCATTCACG TTGATAGTGC ACGAACAAAG CCAGTAATCA TAAATGGGAT TATCATCAAC 1740 + TGTCTGGTGG ACACAGGATC AGATGTGACC ATAATTAAAG AAGCTATATT CAAGAAGATG 1800 + AAAGATGTTG ATTTAAACCG CACTGCAACA GTATTGCGAG GTTTGGGAAA TGCCTCAACA 1860 + CAGCCGATTG GATGCTTCAG AGCATTAATC AAGACCGACC AGGTGGAAGC AAGCCACAAC 1920 + GTTTTAGTCG TCCACGATTC TAAATTCAGT TGCGATGGAA TAGTGGGACA CGATTTTATC 1980 + AGCAAGTTTC GTCTTATCTG TAGTGCAGAA GGCTATACTT TTCTTGACCT GGAAGCAGAT 2040 + AAAAAACAAG CGGTTGAGTA TTCCCAAATG TTTAATATTT GTGAAGAATC TTCTTTTACA 2100 + GTTGCACCAC AATACCGAGA AGACGTTGAA CGCATGATAG AGAGAACATA CGAAACACCA 2160 + CCCAAGCAGA TAAAGCAATG TCCAGTCGAA CTCAAAATTA TTCCTGATGG CGTGATTAAA 2220 + CCCTTTCGCC ATGGACACAC CCGACTATCT GAAGAAGAAG CTATAGCTGT AAAGAAGCAG 2280 + GTAGAGGAAT GGGTCGAGCA GTCAATCGTC CGTAAATCTA CATCAAATGT TGCCAGTCGC 2340 + ATAGTCGTTG TCAGGAAAAA GGATGGTACC CTACGCGTTT GCGTGGACTA TAGAAAATTG 2400 + AACACCATGG TTCTGATGGA TTGTTTTCCG GTACCCATAA TGGAGGAGGT GCTTGAAAAA 2460 + CTGCAGAGTG CCAAATGGTT TACAACCATG GACTTACAGA ACGGATTTTT TCATGTGGCC 2520 + GTAGAAGAAG CCAGCAAGCC GTACACAGCA TTTGTTACCC GAGAAGGCTT ATTCGAGTTT 2580 + AACAAAGCGC CCTTTGGTTT TAAGAATTCC CCAGCAGCGT TTATACGGTT CGTTCAATTT 2640 + ATTTTTCAAG AACTAATCAA TTCCAATATA ATGCAGCTAT ATATGGATGA CATAATTGTA 2700 + TATGCCGCTA CCCCAGAAGA ATGCATGGAA AAGACGGAAA TGGTACTTAA GAGAGCTGCA 2760 + GAATTTGGTC TAAAAATAAA ATGGAAGAAG TGCAACTTTA TGCAGAGGCG AATTCATTTC 2820 + CTGGGACATA TTATCGAAGG TGGACAAATA TGCCCTGGAA AAGAGAAAAC ATCAGCAGTG 2880 + AATTCCTTTG GAACACCTCA GAATGTAAAA GCCGTTCAAG GATTTCTGGG TCTCACAGGA 2940 + TTCTTCAGAA AATTCATACC TGGATACGCC CAAATTGCGA GACCACTGAC GGACCTATTA 3000 + AAAAAAGATG CCATTTTCAA CATTGGACCA GTAGAGCAGC AGTCGGTGAA TAAGCTGAAA 3060 + GAGATTCTGG TAAACGAACC AGTATTGAGG ATCTACTCAC GAGAAGCAGA AACCGAACTT 3120 + CATACAGATG CCTCTAAGGA CGGGTTAGGA GCCGTTTTAT TGCAGAAGTT CGAAGGCAGT 3180 + TTTCACCCAG TCTGCTTTTG GAGCAGAAAA ACTACAAAAG CCGAATCAAA TCGTCATAGT 3240 + TATTACCTTG AAGTAAAAGC CGCATACTTA GCTCTGAAAA AGTTCAGACA CTATTTATTG 3300 + GGAGTCCCTT TCAAGCTCGT CACGGACTGT GTCGCATTTA AACAGACAAC AAAAAAAGCA 3360 + GATGTCCCAA GAGAAGTTGG CCCATGGATT CTCTATATGC AGGATTTTAA TTTTCAACCC 3420 + GAACATCGTG CAGGAGAAAG AATGAGACAC GTTGATTTTT TAAGCCGCCA TCCCCAAGCA 3480 + TGCATGATGA TAACATCCGA GTTGACAGCA CGTATTAAAA AGTCGCAGCA GAACGATGAT 3540 + TCAATTAGAG CAATCCTGGA AATTCTAAAA GATCGTCTAT TCCAACCCTA CAAGCTAAAA 3600 + GGTGGCCTGT TGTATAGTAT GGTCAATGGC AATGAACTAC TGGTTGTCCC TGCACTAATG 3660 + GAGAGGGAGG TGATTCAAAG CGCACATGAA GTTGGCCATT TGTCGTTGCA AAAGACGATG 3720 + CATAGCATAC AGCAGCAATT TTTTTATTTC CTCATTTGGG AATACAAGGT AAAAAAGCTA 3780 + ATTTCTAACT GTATAAAATG TATCATCCAC AGCAAAAAGT TGGGAAAGCA GGAGGGATAT 3840 + CTAAATTGCA TAGATAAAGG AGACGCACCG TTGCACACAC TACACATCGA TCATTTGGGG 3900 + CCAATGGATT CATCGGCCAA ACAGTATAAA TACATTCTGG CAACAGTCGA TGCGTTTTCA 3960 + AAGTTTGTCT GGTTATTCCC AACCAAATCA ACCGGACAGG AAGAAGTGGT CAAGAGGCTG 4020 + ACCGACTGGT CAAACATTTT TGGTTTCCCT AAGCGAATTG TTAGCGACAA AGGAACGGCC 4080 + TTTACGAGTG GTGCGTTCGA ACAATTTATG AGCAGCCATA ACGTGGAACA CGTCTGCACA 4140 + ACTACTGGAG TGGCCAGAGG CAACGGCCAG ATAGAACGAG TAAATCGTTT AATTTTGGCA 4200 + ATAATATCAA AGCTGTCTTC AGACGAACCG TCGAAGTGGT ACAAATATGT GCCTGAGGTA 4260 + CAAAAGGCGA TCAACTGTCA CGTGCATTCA TCACTGAAGC TGTCACCATT TGAGGTCATG 4320 + TTTGGCACCA AGATGTACAC CCGAGTTGAG GATCGGTTAC TGGAACTGCT CCAAGAAGAA 4380 + GTGGTCTGTC AATTCAACGA GGACCGCTAT GAGATGAGAC AGCTGGTAAA ACGCAACATC 4440 + GAGCAGGCGC AGAAGGACTA CAAGCGCAAT TACGACAAAA AGCGCCGAGC TGAATACAAA 4500 + TACAAAGCAG GTGATCTGGT TGCAATTAAA AGGACCCAAT TTGTAGCTGG CCGCAAGATG 4560 + GCAAGCGGGT ATTTAGGTCC ATACGAAGTC ACAGGGGTCA AAGACAATGG CAGATATGAC 4620 + GTTAAAAAAG CAGCAAACGT CGAAGGACCC AATGTCACAT CCACCAGCTG TGACAACATG 4680 + AAGTTGTGGA AGTACATAGC CGAAAATGCA GACCTATTGT CATCCGGGTC GGATGATGAT 4740 + GATCAGGAGG GCCGAATGTA ACATGGAGTA AGGCTGAAGG CTGGCAACAA CCCGGTTGGC 4800 + AGCGCTGTTG AGCAGCAACA TGATTGTCGG AAATCGAAGT TATCGACAAT CAGTCATCGA 4860 + AGGAACGATC GCAAGGCAGC AGTGGAGTAG GAGTGGAAGT CAGCGTTGCA GTCAGTCGTG 4920 + TTCTCAGCAG CAGTTCGTTC GGTCACAAAC TAAGAATACT TTATATAATT ACCGCATTTA 4980 + GAATTAAACT AATAATTAAA TTAATAATAA ACAATAATAA TAAACAATCT TACA 5034 +// +ID OPUS standard; DNA; INV; 7521 BP. +XX +AC AY180918; +XX +DR FLYBASE; FBte0000918; Dmel\opus. +XX +SY synonym: nomad +SY synonym: yoyo +XX +FT source AY180918:1..7521 +FT SO_feature five_prime_LTR ; SO:0000425:1..518 +FT SO_feature three_prime_LTR ; SO:0000426:7004..7521 +FT SO_feature CDS ; SO:0000316:1578..2831 +FT /name="Dmel\opus\gag" +FT /db_xref="FLYBASE:FBgn0025876" +FT /db_xref="SPTREMBL:Q8I7Q0" +FT /db_xref="NCBI_PROTEIN:AAN87270.1" +FT /translation="MEETLRALSESLNALTNVVTGIKEDIKKNNDRLAILEQERGNAD +FT PTVDQPQPLVRARTEYELREISVLPDCVKELQAFEGRQEAYLSWINRAQSILTEYDLI +FT KTRPLYRAIVLHIRQKIRGHADMALAAYGVQDDDWDDIKRVLALHYADKRDLRTLEHE +FT LGAMCQGSRPLDRFYMDVNGHLSLILNNLKARNHPREVVNALIETYRDKALDVFIRGV +FT GRDCSKHLLVRSPKNLPEAYSFCMGLQNVMSRNFTAQNYQPSGAPRFAGPYQHQARPP +FT FRTPFSPGSGRFSQNSYRTQGPRQAIKMESNRSGQSYQSGYSGRQEEGSGIKRMSEGN +FT NPFQKAQRLYHMELAPPPLAPAASGDNQGRSHEGYYDDESQAVERSNNYPPQKNVEGV +FT TDAPHNLETEGGANFMTNASPVYRT" +FT SO_feature CDS ; SO:0000316:2972..5983 +FT /name="Dmel\opus\pol" +FT /db_xref="FLYBASE:FBgn0025875" +FT /db_xref="SPTREMBL:Q8I7P9" +FT /db_xref="NCBI_PROTEIN:AAN87271.1" +FT /translation="MITHRLVGKFFKPLGNDSDITFFVLPNLHSFDGIIGDDTLKDLK +FT AIVDRKNNCLIITPGIKIPLLARASINVNPLLAAEHPDGTQEILNSLLGEFPRIFEPP +FT LSGMSVETAVKAEIRTNTQDPIYAKSYPYPVNMRGEVERQIDELLQDGIIRPSNSPYN +FT SPIWIVPKKPKPNGEKQYRMVVDFKRLNTVTIPDTYPIPDINATLASLGNAKYFTTLD +FT LTSGFHQIHMKESDIPKTAFSTLNGKYEFLRLPFGLKNAPAIFQRMIDDILREHIGKV +FT CYVYIDDIIVFSEDYDTHWKNLRLVLASLSKANLQVNLEKSHFLDTQVEFLGYIVTAD +FT GIKADPKKVRAISEMPPPTSVKELKRFLGMTSYYRKFIQDYAKVAKPLTNLTRGLYAN +FT IKSSQSSKVPITLDETALQSFNDLKSILCSSEILAFPCFTKPFHLTTDASNWAIGAVL +FT SQDDQGRDRPIAYISRSLNKTEENYATIEKEMLAIIWSLDNLRAYLYGAGTIKVYTDH +FT QPLTFALGNRNFNAKLKRWKARIEEYNCELIYKPGKSNVVADALSRIPPQLNQLSTDL +FT DANPEDDMQSLATAHSALHDSSRLIPHVESPINVFKNQLIFDTTRSKYLCEHPFPGYT +FT RHLIPLKDGSLADLTNSLQSCLRPVIINGVKIPEAHLQRFQSICLANFLLYKIRITQR +FT LVADVSGAEEICEIIEKEHRRAHRGPTEIRLQLLEKYYFPRMSSTIRLQTSSCQCCKL +FT YKYERHPNKPNLQPTPIPNYPCEILHIDIFALEKRLYLSCIDKFSKFAKLFHLQSKAS +FT VHLRETLVEALHYFTAPKVLVSDNERGLLCPTVLNYLRSLDIDLYYAPTQKSEVNGQV +FT ERFHSTFLEIYRCLKDELPTFKPVELVHIAVDRYNTSVHSVTNRKPADVFFDRSSRVN +FT YQGLTDFRRQTLEDIKGLIEYKQIRGNMARNKNRDEPKSYGPGDEVFVANKQIKTKEK +FT ARFRCEKVQEDNKITVKTRSGKIFHKSDLRN" +XX +CC Sequence from P1 DS01219.2:861..8381 provided by Guochon Liao +CC Berkeley Drosophila Genome Project. +XX +SQ Sequence 7521 BP; 2322 A; 1740 C; 1677 G; 1782 T; 0 other; + AGTTAAGAAC CCTCTTCTTG CGCTCTTCGT CAGGACTCAC CAGCGCTCGG CTCTCGTGTT 60 + TTCGGGCCCC GTCAGCAGGC GACTCGGGGC CTGTCTAGTA ACATGTTCGT GTAAGTTACG 120 + AACCCTCTTC TTGCGATCTT CGTCAGGACT CACCAGCGCT CGGCTCTCGT GTTTTCGGGC 180 + CCCGTCAGCA GGCGACTCGG GGCCTGTCTA GGAACATGTT TGTGTATGTG TGCATTCGGA 240 + ACAAGTGCCG TTGGTCGCAC TCAGGGTGAG GGGTCAACGG GGGAAGCGGA TATAAAAGCA 300 + GCGGGGCGGG AGAAGAGGTC CCAGTCTCGA ACGGACACAT AACGGAACCG CTAGCAGATC 360 + GCGAACTGAA TCTTAAAATA AAGCTAATCG TAAACTCGAA CCCTCTTAAC TATCTTGACT 420 + ATTATTTGGA GAACCACAGC ATGTTGGTTG TCATATCAAG GTGAGGTATG CGGCAGCGAG 480 + TGCCGAGAAC CCTGATGCAA GTGGAACTTG CGTTAACTGG CGCCCGAACA GGGACCGGCA 540 + ATGTCCGGCC GATAAAAGTG ATACGAAAAA ATTGTGGAAA TTTGTGCGTA AAAATAGTGG 600 + TGGTGTGCAT AAGTCAGATT AAGATCTGAA ATCCATAAAT GAAAAAGAAG TGCTGCGTGA 660 + GCTGTGTATA AAATGATAAA ATAGCAATTA CCCGCTGCCG GGGGGAACTA CGCCCATCCC 720 + GGGGCGCAAC AAATATTGCA TAATTCAATA AAAGGTGTAA AATTTCTAAA ATAAAAATGT 780 + AAACCTATGT TGCGCCAAGA CCTAATTTAA ATTAATAAAA CAACGACCCG CTACCGGAGG 840 + ACGCCACGTC GCCCATGCCG AGCGCAAAAG TTGTACGATA CCTATAACAT AATTAAAACA 900 + CGATCAACCC ACTGCGGCGG TACGGCTTGT GGGAAAATTT TTTTTTTTTT CTCTCCTTGC 960 + CAATTCGCGA GTGCAAAAGA TTGTGTATAA TAAACCAATA ATTAACCATT GCAGCAGTTT 1020 + ACCTGCGGCA GTACGAGTAA TATGAGCGCC CAGAGTGATA AGGTGGTGTG TGGCAGCTTG 1080 + TTGGATACGT TAAGTGGTGT GGAATGCACC CAAAAAAAAC CGCCCAACAA GTTGTGTGGC 1140 + GGCCGTACCT TAGTAGGCAA CCAGCCAAAA GGGATACTAC GGAACCACCG TGCCCAGTGC 1200 + CGAAATAAAT TAGAGGTCAT CAATAAAAAA CTGTAACAGC ACGCACGCAA GGAAAAAATA 1260 + TTGCAAAATG GAATAGCGCA CAAAAATTGT ATAAACACAT GCACAACACC ACAATTCAAA 1320 + GGAAAACAAA ATATTCATGC TGTAGGGGTA CAACCTAAAC GACGAAAACT AATAAAGAGC 1380 + ATACAAGGGT GAGTGAAATA TTTCATTAAA CTTTATTGCC ATATTTGCTA AATTTAGAGA 1440 + AATAAAGAAA AAGCAAAGAA GAACAGATAT TCTTTTTTAT CGGGTTAAAA CCGTTGTCTC 1500 + ACATTTCCGT AAAGTAATAA CGAATTCTGT TGCCTTGAAA GCTTCCTGCA TCTTTCCAAC 1560 + GCAAACTAAA AATCAAAATG GAAGAGACCC TGCGTGCTCT TAGCGAGTCC CTCAATGCCC 1620 + TGACCAACGT GGTGACAGGC ATTAAGGAAG ATATTAAGAA AAATAATGAT AGGTTGGCTA 1680 + TTTTAGAACA GGAGCGCGGG AACGCTGACC CTACGGTCGA CCAACCGCAA CCCCTGGTGC 1740 + GCGCACGCAC CGAGTATGAG CTGAGAGAGA TATCGGTCCT CCCTGACTGC GTCAAAGAAC 1800 + TGCAGGCGTT CGAAGGACGG CAGGAGGCTT ACCTGTCTTG GATAAACAGG GCACAGTCAA 1860 + TACTGACCGA ATATGACTTG ATTAAAACCA GACCCCTGTA TAGGGCAATT GTCTTGCATA 1920 + TTAGACAGAA AATAAGGGGA CACGCCGACA TGGCCTTGGC GGCCTATGGC GTCCAAGACG 1980 + ACGATTGGGA CGACATAAAA CGAGTCTTGG CGCTGCATTA CGCAGACAAA CGAGACTTAC 2040 + GTACGCTTGA GCATGAGCTT GGCGCTATGT GCCAAGGTTC TAGACCACTA GATAGGTTCT 2100 + ATATGGACGT TAATGGCCAT CTCTCGTTGA TCTTAAATAA CTTGAAGGCC AGAAACCACC 2160 + CTCGTGAAGT AGTCAACGCT TTGATAGAAA CCTATAGAGA CAAGGCTTTG GATGTTTTTA 2220 + TCCGAGGAGT GGGGAGAGAT TGTTCCAAAC ACTTACTTGT CCGCAGCCCG AAGAATCTAC 2280 + CAGAGGCTTA CTCTTTTTGT ATGGGATTGC AGAATGTAAT GTCAAGAAAT TTCACAGCTC 2340 + AGAACTATCA ACCGTCAGGT GCCCCAAGAT TCGCAGGCCC ATATCAACAT CAGGCCAGGC 2400 + CACCGTTCCG AACCCCTTTT TCTCCTGGTT CAGGCAGATT TTCGCAAAAC TCCTACAGAA 2460 + CTCAGGGTCC TAGACAGGCC ATAAAAATGG AATCCAATCG GTCGGGTCAA TCTTACCAAT 2520 + CAGGATACAG TGGTCGCCAG GAAGAAGGCT CCGGTATTAA GAGAATGTCC GAAGGAAACA 2580 + ACCCATTCCA AAAGGCACAA AGATTGTACC ACATGGAATT GGCACCACCC CCGCTAGCCC 2640 + CGGCGGCTAG TGGAGATAAC CAAGGACGTT CACACGAGGG TTACTATGAT GACGAGTCTC 2700 + AAGCTGTCGA GAGAAGCAAC AATTATCCTC CGCAGAAAAA CGTGGAAGGA GTTACAGATG 2760 + CTCCACATAA CCTTGAGACT GAGGGAGGGG CAAATTTTAT GACCAACGCC TCTCCAGTGT 2820 + ACCGTACTTA GAGTATGCTA CGGAGAGGGG AGAAAGGCTG AAGTTTTTGA TCGACACGGG 2880 + GGCGAACAAA AACTTTATTA GCCGAAGACT TGCAGCCGGG TGTACCACAG TCCGTAAACC 2940 + CTTCTCCGTA CTGTCCGCTG CGGGTAACAT CATGATAACG CACCGCCTAG TTGGTAAATT 3000 + CTTCAAACCA CTAGGGAACG ACTCGGATAT TACCTTTTTC GTACTACCGA ATTTACATTC 3060 + CTTTGATGGT ATCATTGGCG ACGATACTCT CAAAGACTTA AAAGCCATAG TGGATAGGAA 3120 + AAACAATTGT TTGATAATAA CCCCAGGAAT TAAAATCCCT CTTTTGGCGA GAGCTTCAAT 3180 + AAACGTTAAC CCGCTACTCG CCGCCGAACA CCCAGATGGT ACACAAGAAA TTTTGAATTC 3240 + CCTTCTCGGG GAATTTCCCC GCATCTTCGA GCCCCCCTTA TCTGGAATGT CCGTGGAGAC 3300 + GGCCGTCAAG GCTGAAATCC GGACAAACAC ACAAGACCCG ATCTATGCTA AAAGTTATCC 3360 + TTACCCAGTC AACATGCGCG GAGAAGTCGA ACGTCAAATC GATGAACTGC TGCAGGACGG 3420 + TATAATTCGA CCCTCTAATA GCCCTTACAA TTCCCCTATC TGGATAGTCC CGAAGAAACC 3480 + TAAACCAAAC GGAGAAAAAC AATATCGCAT GGTAGTCGAT TTCAAGCGGT TAAATACCGT 3540 + CACCATACCC GACACTTACC CCATCCCAGA TATAAACGCT ACGCTAGCCA GCCTTGGCAA 3600 + TGCCAAATAC TTTACCACCC TAGATTTGAC TTCTGGATTC CATCAAATCC ACATGAAGGA 3660 + AAGCGACATT CCAAAGACAG CTTTCTCTAC TCTAAATGGA AAGTACGAGT TCCTCCGTCT 3720 + ACCATTCGGT TTGAAGAATG CACCTGCAAT CTTCCAAAGA ATGATCGATG ATATTTTGCG 3780 + CGAGCATATT GGCAAGGTCT GCTACGTTTA TATTGACGAT ATCATCGTCT TCAGTGAAGA 3840 + TTATGACACA CACTGGAAAA ATCTCCGATT GGTATTAGCG AGTTTATCAA AAGCTAACCT 3900 + CCAAGTGAAC CTTGAGAAGT CGCATTTTTT AGACACGCAG GTAGAATTTT TAGGATATAT 3960 + CGTCACGGCC GATGGCATTA AGGCAGATCC GAAAAAGGTC AGAGCGATTA GCGAAATGCC 4020 + TCCTCCGACC TCTGTTAAGG AGTTAAAAAG ATTTCTAGGC ATGACCTCGT ACTACAGGAA 4080 + GTTCATTCAG GACTATGCGA AGGTAGCAAA GCCCCTTACA AACTTGACGC GTGGATTGTA 4140 + CGCTAATATA AAGTCTTCAC AATCAAGCAA AGTGCCAATT ACATTAGACG AGACGGCCCT 4200 + ACAGTCTTTT AATGATTTAA AATCAATTCT CTGTTCTTCT GAAATACTGG CGTTCCCATG 4260 + TTTCACTAAA CCTTTCCATC TAACCACGGA CGCTTCTAAC TGGGCCATCG GAGCTGTCCT 4320 + CTCACAGGAC GACCAGGGTA GAGATAGGCC GATAGCGTAC ATTTCCCGTT CATTAAATAA 4380 + GACGGAGGAA AACTACGCTA CTATCGAAAA GGAAATGCTC GCGATAATTT GGTCATTGGA 4440 + CAATCTTCGG GCTTACTTAT ATGGCGCTGG TACTATTAAA GTATATACTG ACCATCAACC 4500 + TCTAACGTTT GCCCTAGGCA ACAGAAATTT CAATGCGAAG CTAAAACGCT GGAAGGCTCG 4560 + TATAGAGGAA TACAACTGCG AACTCATCTA CAAGCCTGGG AAATCTAATG TGGTGGCTGA 4620 + CGCGCTTTCA CGCATTCCGC CTCAGCTTAA CCAGTTGAGC ACCGATTTAG ATGCTAATCC 4680 + CGAGGATGAC ATGCAGTCTT TGGCTACTGC CCATAGCGCT TTACATGACA GTTCACGATT 4740 + GATTCCCCAC GTTGAATCTC CAATCAACGT TTTCAAGAAT CAACTCATTT TTGACACAAC 4800 + CAGGTCAAAA TACTTATGCG AGCACCCGTT CCCAGGTTAT ACTCGCCATC TGATTCCTCT 4860 + CAAAGACGGA TCACTTGCCG ATTTAACCAA CTCGTTACAA TCGTGTCTAC GACCTGTAAT 4920 + AATTAACGGC GTCAAAATCC CGGAAGCACA TTTGCAACGC TTTCAGTCCA TCTGCTTAGC 4980 + GAATTTTCTT TTATACAAAA TTCGGATAAC GCAGCGCCTA GTGGCGGACG TGTCTGGCGC 5040 + AGAGGAAATT TGTGAAATAA TTGAAAAAGA ACACCGTAGA GCACATAGGG GCCCTACGGA 5100 + GATTCGTCTC CAACTTTTAG AAAAATATTA TTTCCCGCGA ATGTCCAGTA CGATCCGTCT 5160 + GCAAACTTCC TCATGTCAGT GTTGCAAACT CTACAAGTAC GAGAGACACC CTAACAAACC 5220 + AAACCTACAA CCTACGCCAA TTCCTAACTA CCCATGTGAA ATACTTCACA TCGACATTTT 5280 + TGCGCTCGAA AAAAGGTTAT ACCTAAGTTG TATTGACAAA TTTAGCAAGT TTGCCAAACT 5340 + TTTCCATCTG CAGTCAAAAG CATCTGTGCA TTTGCGAGAA ACTTTGGTGG AGGCCCTACA 5400 + TTACTTCACC GCCCCTAAGG TCTTGGTTTC GGATAACGAG CGAGGGTTGT TATGCCCCAC 5460 + AGTGCTCAAC TATCTTCGGT CTCTAGATAT CGATCTGTAT TATGCTCCAA CCCAGAAGAG 5520 + CGAAGTAAAT GGTCAAGTCG AGAGATTCCA CTCTACGTTC CTAGAAATTT ATCGTTGCCT 5580 + TAAAGATGAG CTCCCTACCT TCAAACCCGT TGAGCTGGTA CACATAGCAG TGGACCGCTA 5640 + CAACACTTCC GTTCACTCGG TAACGAATCG AAAACCAGCA GACGTTTTTT TCGACCGCTC 5700 + GTCAAGGGTA AACTATCAGG GTCTGACAGA TTTCCGGCGG CAGACTTTAG AGGACATCAA 5760 + GGGCTTAATT GAGTATAAGC AAATTAGAGG TAATATGGCT CGGAATAAAA ATAGGGACGA 5820 + GCCAAAGTCT TATGGGCCGG GAGATGAAGT TTTTGTTGCA AATAAGCAAA TAAAAACAAA 5880 + GGAAAAAGCG AGGTTCAGAT GCGAAAAGGT ACAGGAAGAC AACAAGATAA CAGTTAAAAC 5940 + CAGATCAGGA AAAATTTTCC ACAAATCTGA TCTAAGAAAT TGAGACGTGG CTTTCACATT 6000 + TAAAAAAGAA ACGCGAAAAA GAATAACGAA AGTAATAAAA GTACGTTGTG GCAGCTAATG 6060 + AAATATTCCA CCCATGCATA CCCTATATAA AAAAAACATT AATAAAAAAA AAAAAAAAAA 6120 + AAAAAAAAAA AAAAAAAAAT GAGTTAAGAA ATACAAAAAG AAATACAAAA AAAACTATAA 6180 + AAAAAATAAT ATAAAAAAAT ACAGATTATA AGAAATAAGA AATAAGAAAT ATAAAAAAAT 6240 + AAAAATATAA GTACACAAAA TGTACCGTAC CCCCACACAC TACGTAGTCT TAGAACAACT 6300 + TAGACGACCA GATATTTACG AATTGTCTTT TTGTAAGCGC GATTTCTGCA TGCGGCGCAA 6360 + ATCCCGCTCA CTGGACTGGC TGGGGTCGGC TTGGAAATGG GTAGCTGGAT CTCCAGATGC 6420 + TGCTGATTGG AACGCCGTCT TGGCCGCGCA AGCGACGGCT TCGAGGAACT GCAAAAACTG 6480 + GAGGAGGCTA GCTGTATCCC TCGGCTACTG AAGTAACCAA CGAGTGGTTA AGCAAGTCGA 6540 + CGATGGAATG CTCCTCCTGA CCAACTTCAA CGGAACTCTA AGAACGGCTG CAGAGAACTA 6600 + CGACCTGATC GGCTCCTTTA TCATCCAATT CGACAATGAG ACGATAATGG TCAACGGTCA 6660 + AAACTATTCC AGTTACTCGG TCAGTCATCT AATGGCGATG CCGGCCGTGT TGAGCCACAT 6720 + AACGGCCAGC AACTTTCAAC TTTCTCTGGA ATACGTCCAC GACGTGAGCA TGAAGAATTT 6780 + GGAAAAGATG TCCAACATGG CGAGTGAGCT ACTAGCCTCT CTTCTCACCG AGGCGGCACT 6840 + CGCAATCTGC ATATTCCTAG GCTTTTATTT CCTATGGAAG AAGCTGATGT CCACCAAAGG 6900 + CATGCCCGAT GTCCGCGAGA TTGCCGCAAA CTTAGAAGCA TTGGGCCAAA CCGAGCTGAA 6960 + CAAGGCTCAC TAATCTGCGG GACGCAGATC TTGAGGGGGG AGGAGTTAAG AACCCTCTTC 7020 + TTGCGCTCTT CGTCAGGACT CACCAGCGCT CGGCTCTCGT GTTTTCGGGC CCCGTCAGCA 7080 + GGCGACTCGG GGCCTGTCTA GTAACATGTT CGTGTAAGTT ACGAACCCTC TTCTTGCGAT 7140 + CTTCGTCAGG ACTCACCAGC GCTCGGCTCT CGTGTTTTCG GGCCCCGTCA GCAGGCGACT 7200 + CGGGGCCTGT CTAGGAACAT GTTTGTGTAT GTGTGCATTC GGAACAAGTG CCGTTGGTCG 7260 + CACTCAGGGT GAGGGGTCAA CGGGGGAAGC GGATATAAAA GCAGCGGGGC GGGAGAAGAG 7320 + GTCCCAGTCT CGAACGGACA CATAACGGAA CCGCTAGCAG ATCGCGAACT GAATCTTAAA 7380 + ATAAAGCTAA TCGTAAACTC GAACCCTCTT AACTATCTTG ACTATTATTT GGAGAACCAC 7440 + AGCATGTTGG TTGTCATATC AAGGTGAGGT ATGCGGCAGC GAGTGCCGAG AACCCTGATG 7500 + CAAGTGGAAC TTGCGTTAAC T 7521 +// +ID DM_ROO standard; DNA; INV; 9092 BP. +XX +AC AY180917; +XX +DR FLYBASE; FBte0000100; Dmel\roo. +XX +SY synonym: B104 +XX +FT source AY180917:1..9092 +FT SO_feature five_prime_LTR ; SO:0000425:1..429 +FT SO_feature three_prime_LTR ; SO:0000426:8665..9092 +FT SO_feature CDS ; SO:0000316:1275..8357 +FT /name="Dmel\roo\ORF" +FT /db_xref="FLYBASE:FBgn0043856" +FT /db_xref="NCBI_PROTEIN:AAN87269.1" +FT /translation="MMSEKTIQFLKKQSEIILEIRKLEVKPTLTDVEILKLNELQKCF +FT IANHSNLLKIGVVDHEYFNAKQYDLIMMVLEKIKNKNEKIKGESVENTFPKSNTVPKS +FT NPPPTLNLEMRGHPEKEGIAQNNALKVEQAFRNNVGQFRVYLEDTSKLIDSSPDFLKI +FT RKNKIEFLWHKIDNLIEQVNSRFESSLFEEEISELEFDKQNILTAINSRLSGTINKAE +FT MSTVVKAEELPTLPKIQIPTFFGDSKEWDLFNELFTELIHVREDLSPSLKFNYLKSAL +FT KGEARNVVTHLLLGSGENYEATWEFLTKRYENKRNIFSDHMNRLMDMPNLNLESNKQI +FT KTFIDTINESIYIIKLKAQLPEDVDAIFAHIILRKFNKESLNLYESHVKKTKEIQALS +FT DVMDFLEQRLNSISSFSQEVKPVKKMINNNKNKNYSDNCAYCKLPGHYLIQCHKFKIM +FT NPAERSDWVRKNGICLRCLRHPFGKKCISEQLCSTCRKPHHTLLHFAGHNPEKVNTCR +FT TTGQALLATALIQVKSRYGGFEQLRALIDSGSQSTIISEESAQILKLKKFRSHTEISG +FT VSSTGTCISKHKAVISIRNSPKNLEIEAIILPKLMKALPVNTINVDQKKWKNFKLADP +FT DFNKPGRIDLIIGADVYTHILQNGVIKIDGLLGQKTDFGWIVSGCKKSKGKETIVATT +FT IEIKELDRYWEVEEEEKDDIESEICENKFIKTTKKDSDGRYIVSIPFKEDVTLGDSKK +FT QAIARYMNLEKKLKRNEKLKVDYTKFMNEYMDLGHMIEVSDEGKYFLPHQAVIRDSSL +FT TTKLRVVFDASAKTTNNKSLNDIMWVGPRVQKDIFDIIIKWRKWEFVVSADIEKMYRQ +FT IKIDNNDQKYQYILWRNSPKEKIKTYKLTTVTYGTASAPYLATRVLVDIADKCKNQVI +FT SAIIRNDFYMDDLMTGADSVEEANKLITLIPHELQKVGFNLRKWISNNSKILTTVEDT +FT GDNKVLNIIENECVKTLGLKWEPQKDLFKFSVNCNDESKNINKRVVLSTLAKIFDPLG +FT WLAPVTVSGKLFIQKLWINKSEWDQELSIEDKNYWEKYKENLLLLENIRIPRWINSNS +FT SSVIQIHGFADASEKAYAAVVYAKVGPHVNIIASKSRVNPIKNRKTIPKLELCAAHLL +FT SELIQRLKGSIDNIMEIYAWSDSTITLAWINSGQSKIKFIKRRTDDIRKLKNTEWNHV +FT KSEDNPADLASRGVDSNQLINCDFWWKGPKWLADPKELWPRQQSVEEPVLINTVLNDK +FT IDDPIYELIERYSSIEKLIRIIAYINRFVQMKTRNKAYSSIISVKEIRIAETVVIKKQ +FT QEYQFRQEIKCLKIKKEIKTNNKILSLNPFLDKGGVLRVGGRLQNSNAEFNVKHPIIL +FT EKCHLTSLLIKNAHKETLHGGINLMRNYIQRKYWIFGLKNSLKKYLRECVTCARYKQN +FT TAQQIMGNLPKYRVTMTFPFLNTGIDYAGPYYVKCSKNRGQKTFKGYVAVFVCMATKA +FT IHLEMVSDLTSDAFLAALRRFIARRGKCSNIYSDNGTNFVGAARKLDQELFNAIQENI +FT TIAAQLEKDRIDWHFIPPAGPHFGGIWEAGVKSMKYHLKRIIGDTIFTYEEMSTLLCQ +FT IEACLNSRPLYTIVSEKDQQEVLTPGHFLIGRPPLEIVEPMEDEKIGNLDRWRLIQKI +FT KKDFWVKWKSEYLHTLQQRNKWKKEIPNIEEGQIVLLKDENCHPARWPLGKVEKVHKG +FT NDDKVRVAKVKMQEGYITRPITKICPLEGIKSVDKNEADQEPKRRTRATSGMSKIGII +FT MAMLLFVLSCQVSSALPKDIAPRYSIDKINKTSAIYLDPLGDVEIVSTSWNLVIYYKM +FT DPYFKMLTKGNALIQSMRKVCERLHSFEEQCSLVLDNMQSQLSELEENNKLFMMQSRS +FT RSKRAPFEFMGSLYHILFGIMDEDDREQLEENMKNLLDNQNNLDKLIQKQTSVVDSTS +FT NLLKRTTEDVNSNFRSMQIRIENMTEVLKENYYVYKESIKFFMITKQLHSLIEEGEKI +FT QAGIISLLIDINHGRLNTNILRPNQLKKEIAKIQQSLSENLVIPGKRSGTELKEVYTL +FT LTARGLFIDDKLIISAKVPLFSRHPSKLFRLIPVPIRNEDRIIMVHTTSEYLIYNFEI +FT DSYHIMTEATLNQCQKWQLNKRICKGSWPWNSANDNACEIQPLKPDKAANCIYKTVVD +FT SKSYWVELEKKSSWLFKVPANSKVRLQCTGSQIELFDLPQQGVLSIAPYCTARTDDKI +FT LVAHHNIQSESEELLSTPYIGEVSGVPKIIWDPLKLSILNHTEEFERLNNEIKFMKEN +FT HQKLKDLHFHHISGHAGLIIALILMIVLIIYFIRKCAVQQRMQAITFAGPLPVLXX" +XX +CC Sequence from P1 sequence DS00941:20448..29535 provided by +CC Guochun Liao, Berkeley Drosophila Genome Project. +XX +SQ Sequence 9092 BP; 3468 A; 1442 C; 1710 G; 2472 T; 0 other; + TGTTCACACA TGAACACGAA TATATTTAAA GACTTACAAT TTTGGGCTCC GTTCATATCT 60 + TATGTAAATG AATCGAGAGC GATAAATTAT ATTTAGGATT TTGTTATCTA AGGCGACATG 120 + GGTGCATTGC TCAAAAACAT GTAATTTAAG TGCACACTAC ATGAGTCAGT CACTTGAGAT 180 + CGTTCCCCGC CTCCTAAAAT AGTCCCTTAG TGGGAGACCA CAGATAAGGT CCTCGCCGCT 240 + CAAGATAGGC AGATGTGCCC GAGCGTGGGA CCTCGATAAG GCGGGGACTA TTTACGTAGG 300 + CCTCTGCGTA GGCCATTTAC TTTAAGATGC GATTCTCATG TCACCTATTT AAACCGAAGA 360 + TATTTCCAAA TAAAATCAGT TTTTTTACAA AAACTCAACG AGTAAAGTCT TCTTATTTGG 420 + GATTTTACAT TTGGTCAATC GAGCCTTTAA TCGACTCTGC AGTTTCCCCC TACCAAAGGT 480 + AAGGAACTCA GAGAAAGGCC AGCTCCTTTA AGCATCTTAC AGCTAAAGGT AGCAAAAATA 540 + AGTGACTCTT GTTTCCCCCT ACCAAAGGTA AGGAACAGAG TATAAATATA AAAAGCAAAA 600 + GATACAAAAG AATCTTTTAT GTTTTAAAAC AAGCACCTTA TAGTCTATAG CTAAAGGTTG 660 + CTTTGTGTAC CATTATAAAT TGTGGTAAGG CGTGCTTGAG GCCATACATC AGCAATTGTG 720 + AAATTAAAAA GTGCATAACA AAAGTGCCTT ATAAATGCTC TAATAGCATT AAATCAGCTC 780 + ATAAATAGAG TGCAGTGTAT ATGCCATAAG AGCATAAATT AAATAAAAAG TGCCTGAAAA 840 + CAGTGCCTTA TAAATGCTCT AATAGCATTA AATCAGCTCA TAAATAGAGT GCAGTGTATA 900 + TGCCAAAAGA GCATAAATGC CGAAATAAAT GGCTAAAAAA CAAAAAATCT GACTGGACTA 960 + CAAAAATAAT AAAACGTGCC AAAAAAAAAA AAAAAATCAT CTTTAAACAT CGACGGAGCC 1020 + TTAAAGAAGA GAAGGAAGTC AAATTCAAAG GAGCCTCTAC CAGCAGCAGA AGCAGCAACA 1080 + ACAGCAGCAG CAGAAGCAGC AACAGCAGTA GCAACAGCAG CAACAACAGC AGCAACAGCA 1140 + GCAGCAACAA CAACGACATC AGCTAAGTCA AAACAAGAAT TTTCTGTTTA TCCAAACACA 1200 + CATATATATA TAAATACATA TAAAATACAT ATACACGTAC TATATATATT AAGAAATTAC 1260 + AAAAAATTTT CAAAATGATG TCAGAAAAGA CTATTCAATT CCTTAAGAAG CAGTCCGAAA 1320 + TTATTTTGGA AATTAGAAAG TTGGAAGTAA AACCAACATT AACAGATGTA GAAATTCTAA 1380 + AATTAAATGA GCTTCAAAAA TGTTTCATTG CTAATCATAG CAATTTGTTA AAGATCGGCG 1440 + TTGTCGATCA TGAATATTTT AACGCGAAGC AGTATGATTT AATAATGATG GTGTTAGAAA 1500 + AAATTAAAAA TAAAAATGAA AAAATTAAGG GCGAGTCGGT AGAAAACACT TTCCCTAAAT 1560 + CAAACACTGT CCCTAAATCA AACCCTCCCC CTACATTAAA CCTTGAAATG CGTGGTCACC 1620 + CTGAAAAAGA GGGTATAGCA CAAAACAACG CTTTAAAAGT AGAGCAGGCA TTTCGTAATA 1680 + ATGTTGGCCA ATTTCGAGTA TATCTAGAAG ATACGTCTAA ACTAATAGAC AGTAGTCCAG 1740 + ATTTCCTTAA AATAAGGAAA AATAAAATTG AATTTTTATG GCATAAAATA GATAACCTGA 1800 + TTGAACAGGT GAATAGTCGT TTTGAGAGTT CGCTATTCGA AGAAGAAATT AGCGAACTTG 1860 + AATTTGACAA ACAAAATATT CTTACAGCCA TTAATAGTCG ACTCAGTGGC ACAATAAATA 1920 + AAGCTGAAAT GTCGACGGTT GTTAAGGCGG AGGAGTTACC AACCCTGCCT AAAATACAGA 1980 + TTCCCACCTT CTTTGGTGAT TCCAAAGAAT GGGATCTTTT TAATGAACTC TTTACAGAGC 2040 + TCATACATGT GAGAGAGGAT CTCAGTCCTT CTCTCAAATT TAATTATCTA AAGTCAGCAT 2100 + TAAAAGGAGA AGCCAGAAAT GTGGTTACTC ATTTACTGCT CGGCTCTGGA GAAAATTATG 2160 + AAGCCACTTG GGAGTTTTTG ACCAAGCGAT ATGAGAATAA AAGAAACATA TTCTCAGATC 2220 + ATATGAATAG GCTTATGGAT ATGCCAAATT TAAATTTAGA ATCCAATAAG CAAATAAAGA 2280 + CATTTATTGA CACGATTAAC GAGTCAATTT ATATTATAAA ATTAAAGGCA CAATTACCAG 2340 + AAGATGTGGA TGCAATTTTC GCTCACATAA TTCTTCGGAA ATTCAATAAA GAATCACTCA 2400 + ATTTATATGA AAGCCATGTT AAAAAGACAA AAGAAATACA GGCACTTTCT GATGTCATGG 2460 + ACTTTTTAGA GCAAAGGCTC AATTCTATAT CATCATTCTC ACAGGAAGTA AAACCTGTAA 2520 + AGAAAATGAT TAATAATAAC AAGAATAAAA ATTATAGTGA CAATTGTGCA TATTGCAAAC 2580 + TACCAGGGCA TTATTTAATT CAATGCCATA AATTTAAAAT AATGAATCCA GCAGAACGGT 2640 + CTGACTGGGT AAGAAAAAAT GGGATTTGCC TAAGATGTCT GAGGCATCCG TTTGGTAAAA 2700 + AATGTATAAG CGAGCAGCTT TGTTCGACTT GTCGTAAACC TCACCACACG TTACTTCACT 2760 + TTGCAGGTCA TAATCCAGAA AAAGTGAATA CGTGTAGAAC AACAGGTCAA GCCTTGTTGG 2820 + CCACGGCCTT GATTCAAGTA AAGTCGAGGT ATGGAGGCTT TGAACAATTA AGAGCATTGA 2880 + TTGATAGTGG CTCTCAAAGC ACAATTATTT CAGAAGAGTC TGCACAGATT CTAAAATTGA 2940 + AAAAATTTCG GTCTCATACT GAAATAAGTG GAGTATCTTC CACAGGAACG TGCATCTCCA 3000 + AGCACAAAGC GGTTATTTCG ATAAGAAATT CTCCGAAAAA TTTAGAAATT GAAGCAATTA 3060 + TTCTCCCAAA ACTTATGAAG GCACTTCCAG TCAACACGAT TAATGTTGAT CAGAAAAAAT 3120 + GGAAGAACTT TAAATTAGCC GACCCCGATT TTAATAAACC GGGTCGCATT GATTTAATCA 3180 + TTGGAGCAGA CGTATATACT CACATTCTGC AAAATGGAGT TATAAAAATA GACGGTCTCC 3240 + TTGGGCAAAA AACTGATTTC GGGTGGATAG TTTCTGGATG TAAAAAATCC AAAGGAAAAG 3300 + AAACCATTGT AGCCACAACA ATAGAAATAA AAGAGTTAGA TCGCTACTGG GAAGTGGAAG 3360 + AAGAAGAAAA AGATGATATC GAGTCTGAAA TCTGTGAAAA TAAATTTATC AAAACGACAA 3420 + AAAAAGATTC AGATGGGCGA TACATTGTGT CAATTCCATT CAAGGAGGAT GTCACCTTAG 3480 + GAGATTCAAA GAAACAAGCG ATAGCTCGTT ACATGAATCT GGAGAAAAAA CTAAAAAGAA 3540 + ATGAAAAACT TAAGGTTGAC TACACTAAAT TCATGAATGA ATACATGGAT TTAGGACACA 3600 + TGATTGAAGT GAGTGATGAA GGCAAATATT TTTTACCGCA CCAGGCAGTG ATTAGAGATT 3660 + CAAGCCTTAC GACCAAATTG AGAGTAGTTT TTGATGCTTC AGCAAAAACT ACGAATAACA 3720 + AAAGTTTGAA CGACATAATG TGGGTTGGGC CACGAGTTCA AAAAGATATT TTTGACATTA 3780 + TTATTAAATG GAGAAAATGG GAATTTGTTG TTTCGGCAGA CATTGAAAAG ATGTACCGAC 3840 + AAATTAAAAT AGATAATAAT GATCAAAAAT ATCAATATAT TTTATGGAGA AATTCTCCAA 3900 + AAGAAAAAAT TAAAACATAT AAATTAACCA CAGTCACTTA CGGAACTGCA TCTGCACCAT 3960 + ATTTGGCTAC CAGGGTTCTG GTAGATATTG CAGATAAATG TAAAAACCAA GTTATTAGTG 4020 + CAATAATTAG GAATGATTTC TATATGGATG ACCTAATGAC TGGAGCTGAT TCGGTAGAAG 4080 + AAGCTAATAA ATTAATAACA TTAATTCCCC ATGAATTGCA GAAAGTTGGA TTCAACTTAA 4140 + GGAAATGGAT TTCCAACAAT TCCAAAATAT TAACCACTGT GGAGGACACA GGGGACAATA 4200 + AGGTTCTCAA TATTATCGAA AATGAATGTG TTAAAACTTT AGGACTAAAA TGGGAACCTC 4260 + AAAAGGATTT ATTTAAGTTC AGCGTAAATT GTAATGATGA ATCAAAAAAT ATAAATAAGC 4320 + GCGTTGTGTT ATCAACGCTA GCAAAAATAT TTGATCCGTT AGGATGGTTG GCACCAGTCA 4380 + CGGTTTCAGG AAAACTTTTT ATTCAAAAAC TTTGGATAAA TAAAAGTGAA TGGGATCAGG 4440 + AATTATCCAT AGAAGATAAA AATTATTGGG AAAAATATAA AGAAAATTTA TTATTGTTAG 4500 + AGAATATTCG AATCCCAAGG TGGATTAATT CAAACAGTTC TTCAGTCATT CAGATTCACG 4560 + GATTTGCGGA CGCCTCCGAA AAAGCATATG CTGCAGTAGT CTATGCTAAA GTAGGACCTC 4620 + ATGTTAATAT AATAGCTAGC AAAAGTAGAG TCAACCCTAT AAAAAATAGG AAGACAATTC 4680 + CCAAACTCGA GCTGTGTGCA GCTCACCTGC TTAGTGAATT AATCCAAAGA CTAAAAGGAT 4740 + CAATTGACAA TATAATGGAG ATCTATGCTT GGAGTGATTC CACGATTACC TTAGCATGGA 4800 + TTAACAGTGG TCAAAGTAAG ATCAAATTTA TAAAAAGAAG AACGGATGAC ATTCGGAAAT 4860 + TAAAAAATAC TGAATGGAAT CATGTTAAGT CAGAGGATAA TCCAGCAGAT TTAGCATCCA 4920 + GGGGAGTGGA TTCTAACCAG TTGATCAACT GTGATTTTTG GTGGAAAGGT CCGAAATGGC 4980 + TAGCAGACCC AAAAGAACTT TGGCCTCGGC AGCAGTCTGT AGAAGAACCT GTCTTAATAA 5040 + ATACGGTATT AAATGACAAA ATAGATGATC CTATTTACGA ATTAATAGAA AGGTATTCCA 5100 + GTATAGAAAA ACTTATACGT ATAATAGCAT ACATAAATAG ATTCGTGCAG ATGAAAACAA 5160 + GAAATAAAGC CTATTCATCA ATTATTTCAG TAAAGGAGAT AAGAATAGCG GAAACAGTTG 5220 + TTATTAAGAA ACAACAAGAA TACCAGTTTA GGCAAGAGAT AAAGTGCCTT AAAATCAAAA 5280 + AGGAAATCAA GACAAATAAT AAAATATTGT CATTGAATCC ATTTTTGGAC AAGGGTGGGG 5340 + TTCTAAGAGT TGGAGGAAGA TTGCAAAATT CCAATGCAGA ATTTAATGTT AAACATCCAA 5400 + TCATTTTAGA AAAATGCCAC CTAACAAGCT TATTAATAAA AAATGCTCAT AAGGAAACAT 5460 + TGCATGGAGG GATAAACCTA ATGCGAAACT ATATCCAAAG AAAGTATTGG ATTTTCGGGT 5520 + TGAAAAATTC GTTGAAAAAG TATTTAAGAG AATGTGTAAC GTGTGCAAGG TATAAACAAA 5580 + ATACAGCTCA GCAAATAATG GGTAACTTGC CAAAATATAG AGTGACGATG ACATTCCCGT 5640 + TTCTTAATAC TGGAATAGAT TACGCAGGTC CTTATTATGT TAAATGTTCA AAAAATCGTG 5700 + GCCAAAAAAC ATTTAAAGGA TACGTTGCTG TATTCGTTTG CATGGCCACC AAAGCCATAC 5760 + ACTTAGAAAT GGTAAGCGAT CTAACTTCAG ACGCATTTTT AGCAGCACTC AGAAGATTTA 5820 + TTGCTAGACG GGGAAAATGT TCCAATATCT ATTCAGACAA CGGAACAAAT TTTGTAGGAG 5880 + CTGCAAGAAA ATTAGATCAA GAGTTATTTA ATGCAATACA AGAAAATATA ACGATTGCAG 5940 + CGCAACTTGA AAAGGACAGG ATTGATTGGC ATTTTATTCC CCCGGCAGGA CCTCACTTCG 6000 + GAGGTATTTG GGAAGCTGGA GTTAAGTCAA TGAAATACCA TTTAAAGCGT ATAATCGGCG 6060 + ACACTATTTT TACTTATGAA GAAATGTCAA CTCTTTTATG TCAAATAGAA GCATGCTTAA 6120 + ATTCAAGGCC ATTATACACT ATAGTTAGTG AGAAGGACCA ACAAGAAGTT TTAACACCAG 6180 + GTCATTTTTT AATTGGAAGA CCACCTTTAG AAATAGTCGA ACCAATGGAA GATGAAAAAA 6240 + TCGGAAATTT GGATAGGTGG AGACTTATCC AAAAAATAAA GAAAGATTTC TGGGTTAAGT 6300 + GGAAAAGTGA ATATTTGCAT ACGCTCCAGC AAAGGAATAA ATGGAAAAAG GAAATTCCTA 6360 + ATATAGAAGA AGGGCAAATA GTTTTATTAA AGGATGAGAA TTGTCATCCT GCAAGATGGC 6420 + CTTTAGGAAA GGTGGAAAAG GTGCATAAGG GGAATGATGA TAAGGTCCGA GTGGCTAAAG 6480 + TAAAGATGCA GGAAGGATAT ATCACTAGAC CCATTACTAA AATTTGTCCC TTGGAAGGAA 6540 + TAAAGTCTGT TGACAAAAAT GAGGCTGACC AAGAGCCAAA AAGACGAACT AGAGCGACAT 6600 + CGGGAATGTC CAAGATCGGA ATCATTATGG CAATGTTGTT GTTTGTGTTA AGTTGTCAAG 6660 + TTTCTAGCGC ATTACCTAAA GATATAGCAC CAAGATATTC TATAGACAAA ATAAATAAAA 6720 + CCTCAGCAAT ATATCTAGAC CCGCTAGGAG ATGTTGAGAT TGTGAGTACT TCTTGGAATT 6780 + TGGTTATCTA TTATAAAATG GATCCATATT TTAAAATGTT AACAAAGGGT AATGCGCTTA 6840 + TACAAAGTAT GAGGAAAGTT TGCGAAAGAC TTCATAGCTT TGAAGAGCAA TGTAGTCTAG 6900 + TCTTAGATAA TATGCAAAGT CAGTTATCGG AACTTGAAGA AAACAATAAA TTGTTTATGA 6960 + TGCAGTCTAG ATCTAGAAGC AAGCGTGCTC CTTTCGAATT TATGGGTTCC TTGTATCATA 7020 + TTTTATTTGG TATAATGGAT GAAGATGATA GAGAGCAATT AGAAGAAAAT ATGAAGAATT 7080 + TGTTAGATAA CCAGAACAAC CTTGATAAAC TAATTCAAAA ACAAACATCT GTGGTTGATT 7140 + CAACTTCTAA TCTATTAAAG AGAACAACAG AAGATGTTAA CTCCAATTTT AGAAGTATGC 7200 + AAATAAGAAT TGAGAACATG ACAGAAGTTC TTAAAGAAAA TTATTATGTT TATAAGGAAT 7260 + CAATAAAATT CTTTATGATT ACGAAACAGC TACACTCATT GATTGAAGAA GGCGAAAAAA 7320 + TTCAAGCAGG CATTATAAGC CTGTTGATTG ATATTAATCA CGGTAGGCTA AATACAAATA 7380 + TTCTCAGGCC AAATCAGCTT AAAAAAGAAA TTGCCAAAAT TCAGCAGAGT CTTTCAGAGA 7440 + ACCTAGTAAT TCCAGGAAAA CGGTCAGGTA CGGAACTTAA GGAGGTGTAT ACACTGTTAA 7500 + CAGCCAGGGG TTTATTCATC GACGATAAAT TGATCATTAG TGCAAAAGTG CCTCTGTTTA 7560 + GCAGGCATCC ATCCAAATTG TTCAGGCTTA TTCCGGTGCC AATTCGAAAT GAAGATCGGA 7620 + TAATAATGGT GCATACAACG TCCGAATATT TAATTTATAA TTTTGAGATA GATTCCTATC 7680 + ACATAATGAC GGAAGCCACA TTAAATCAAT GTCAGAAATG GCAACTAAAT AAGAGAATAT 7740 + GCAAAGGAAG TTGGCCCTGG AATTCAGCGA ATGATAATGC ATGTGAGATT CAGCCTCTAA 7800 + AGCCAGATAA AGCGGCGAAC TGCATCTATA AAACAGTAGT CGACTCTAAA AGTTACTGGG 7860 + TAGAGTTAGA AAAGAAAAGT AGTTGGTTGT TTAAGGTTCC TGCGAATTCA AAAGTCCGTC 7920 + TGCAATGTAC TGGCTCTCAA ATTGAATTGT TTGATTTGCC TCAGCAAGGA GTTTTAAGCA 7980 + TTGCGCCATA TTGTACGGCA AGAACCGACG ATAAAATTCT AGTTGCCCAC CATAACATTC 8040 + AGTCCGAAAG TGAAGAATTA TTATCAACAC CTTATATAGG AGAAGTTAGT GGAGTGCCGA 8100 + AGATTATTTG GGATCCGCTG AAACTATCAA TATTAAATCA TACTGAGGAA TTTGAACGAT 8160 + TGAATAATGA AATTAAATTT ATGAAAGAGA ACCATCAAAA ATTGAAAGAT TTACATTTCC 8220 + ATCATATTTC CGGACATGCT GGATTAATTA TTGCTTTAAT ACTAATGATA GTATTAATAA 8280 + TATATTTCAT ACGGAAATGT GCTGTGCAAC AAAGAATGCA AGCAATAACC TTTGCAGGTC 8340 + CGTTGCCAGT ACTATAAATA TCAATAGTAA ATAAACAATA AAATAATATA ACAAATAAAA 8400 + ATATACAGTC CACTAATAGA AAATGTACTT CTACATAGAA AAAGCAAAAT GTTTAAAATA 8460 + AGTTAATTAA GTACAAATTG TTGAATTAAA AATAATATAA ACCATAATTG TAATCCAATA 8520 + AAATTAAAAG CCAGAAAAAC TAGGCCCATT GAAATCTTAG TTGCAAAATA AATGAACATA 8580 + TATCAAATAA ATACAGTCCA CTACTGTTAT AAATGCAACT AATATACTAA TGTACATCTC 8640 + AGCTTTGCTG GCCCTTTGGC AGAATGTTCA CACATGAACA CGAATATATT TAAAGACTTA 8700 + CAATTTTGGG CTCCGTTCAT ATCTTATGTA AATGAATCGA GAGCGATAAA TTATATTTAG 8760 + GATTTTGTTA TCTAAGGCGA CATGGGTGCA TTGCTCAAAA ACATGTAATT TAAGTGCACA 8820 + CTACATGAGT CAGTCACTTG AGATCGTTCC CCGCCTCCTA AAATAGTCCC TTAGTGGGAG 8880 + ACCACAGATA AGGTCCTCGC CGCTCAAGAT AGGCAGATGT GCCCGAGCGT GGGACCTCGA 8940 + TAAGGCGGGG ACTATTTACG TAGGCCTCTG CGTAGGCCAT TTACTTTAAG ATGCGATTCT 9000 + CATGTCACCT ATTTAAACCG AAGATATTTC CAAATAAAAT CAGTTTCTTA CAAAAACTCA 9060 + ACGAGTAAAG TCTTCTCATT TGGGATTTTA CA 9092 +// +ID BLOOD standard; DNA; INV; 7410 BP. +XX +AC AY180916; +XX +DR FLYBASE; FBte0000279; Dmel\blood. +XX +FT source AY180916:1..7410 +FT SO_feature five_prime_LTR ; SO:0000425:1..398 +FT SO_feature three_prime_LTR ; SO:0000426:7011..7410 +FT SO_feature CDS ; SO:0000316:966..1271 +FT /name="Dmel\blood\sORF" +FT /db_xref="FLYBASE:FBgn0045863" +FT /db_xref="NCBI_PROTEIN:AAN87266.1" +FT /translation="MSTKQTFEHPAPVEQRDLPSIKEVIEVDPSAGPKPLTIQEYKAR +FT TAAREQPPKKKRGGRRIKLLSARRLNIELLKTATNEEDRQRYKERLAAINQQLRGAK" +FT SO_feature CDS ; SO:0000316:1863..3116 +FT /name="Dmel\blood\ORF1" +FT /db_xref="FLYBASE:FBgn0045865" +FT /db_xref="NCBI_PROTEIN:AAN87267.1" +FT /translation="MEWLNLTISINNIRDAFDKSYKCINKTALIKTQTLIFHIKVLIT +FT QYNTLQNLIVTNKSKLTEEHKVQCFKVLSSFGKRLHNTSVRHSIIIEVPTELTKIAEF +FT DESQLRDLDESQPLEDLDIESDIESIEELKFNTVQPNTRNMANALEAQRAYVKQVSAT +FT VPDFDGKKLHLNRFVTALKLTDLTKGDQETLAVEVIKTKIIGPLNYKVEHATTIQAII +FT TILQANVKGESPDVIKAKLINAQQRGKTASQYVTEIDSMRKQLEAAYIDGGLDADNAD +FT KFATKESISAMTKNCANEALKMILTAGTFSTFNDAMEKYLHCSTEITGNSNTVLFYNG +FT NNRRGNYNAYYRGRGRNNYNHNYNQNYNQGYNNNNRGRGGYRGHGNNRDGGNRRGNQS +FT QNNNNNRNVRNVQSENSQTPLSDQQ" +FT SO_feature CDS ; SO:0000316:3749..6733 +FT /name="Dmel\blood\ORF2" +FT /db_xref="FLYBASE:FBgn0045864" +FT /db_xref="NCBI_PROTEIN:AAN87268.1" +FT /translation="MKDYDIFTTPVEKENRTEEILKQLRFPKQFNNELTKLCTEFSDI +FT FGLETEPISANNFYKQKLRLGEKTPVYIKNYRMADSQKPEIARQVKKLIDDGIVEPSM +FT SEYNSPLLLVPKKPLPNSTEKRWRLAVDYRQINKKLLSDKFPLPRIEDILDQLGRAKY +FT FSCLDLMSGFHQIELEKRYRDITSFSTANGSYRFTRLPYGLKVAPNSFQRRMTLAFSG +FT LEPSQAFLYMDDLVVIGCSEKHMLKNLTNVFELCRRHNLKLHPGKCSFFMKEVTYLGH +FT KCTDKGILPDDTKYEVIEKYPIPTDADSARRFVAFCNYYRRFIKNFSDHSRHLTRLCK +FT KNVQFEWTAECNDAFEYLKTELMKPTLLQYPDFGKEFCITTDASKQACGAVLTQDHNG +FT QQLPVAYASRMFTQGESNKSTTEQELTAIHWAINHFRPYIYGKHFMVKSDHRPLSYLF +FT SMKNPSSKLTRMRLDLEEYDFTVEYLKGKDNHIADALSRITIKDLKTINREILKVTTR +FT SKAKQENSCKDEAIVKIQEEKEQTIEKPKVYEVVNNNDTKKYVLIKIDKHKCLLKRGK +FT TIVSRFDVDDLYSNETFDLNQFFQRLISKAGMHKITKMRISPSEQMFQFVSLNEFKIK +FT GNRVLEKVELAILQKVIIIDKNDEAQIKEILTKFHDDPIEGGHTGISRTQSKIKRFYY +FT WPQMTKTISKYVKTCLKCQQAKITTHTKTPLTLMPTPATAFDTVLIDTIGPLPKSEDG +FT NEYAVTIICDLTKFLVTIPTPNKSAKTVAKAIFELFVLKYGPMKTFITDQGTEYKNSL +FT MNELCKYMHIENLTSSAHHHQTLGTIERSHRTFNEYIRSYISVNKSDWDIWLPYFTYC +FT FNTTPSIVHDYCPYELVFGRLPRQFKDFSKINKIDPIYNLDDYSKELKCRLELSYNRA +FT RRMLEKAKADRKLRYDRNTNNFELKIGDKVLLRKETGHKLDKRYEGPYDVVDIGINDN +FT ITIKTGSKKQQIVHKDRLKKHK" +XX +CC Sequence from P1 (complement)DS03023:69372..76782 provided by Guochon Liao, +CC Berkeley Drosophila Genome Project. +XX +SQ Sequence 7410 BP; 2840 A; 1403 C; 1328 G; 1839 T; 0 other; + TGTAGTATGT GCATATATCG AGGGTACACT GTACCTATAA GTACACAGCA ACACTTAGTT 60 + GCATTGCATA AATAAATGTC TCAAGTGAGC GTGATATAAG ATCACCCATT TATGCTTTAA 120 + GCTAAGTCAG CATCCCCACG CTGGCCGCTG GCCATATATG CGCATAAGCT CTCTCTCTCT 180 + CTCTCTTATA CATATATATA TACGCTGCTC TTCTGCCGCT GTCGACGGCG GCGCAGTCGC 240 + AGTATTTAGG TAAGATTAGA CACTCTGTAG AGGTTAAGCG GGCAGAACCG TTTCTGCTAC 300 + TCGAAGAGAT AAGAAGAAAT AAAAAGGTGC CTGACGGCTG CACCCAACTG CAAGGAAAAC 360 + ACGTGTTCTC AATTGGTGGC ATATATTGGT TTATTACATG GCGACCGTGA GGCAGGAGCC 420 + TGCGATCTGA GGACTACTGA GGAAATGCTG CTAATATTGC CGATTTGATT TGGGAATTCT 480 + AAACAGCGAC AACAGGTGTG AGAAGCAGGC CGCCCCTTAC ACCAGTGCGG GAGACCTAGA 540 + GACGGGACAC TGATGAAAAA AAAAGAAACA AAAATACTGA GTGAGTAGAG TGTGGTAATG 600 + GGCAAACGCG GATGTCAGGA AATCAAAAAT AAAGGTATAG CACATATTAA GTGGCTATGA 660 + TATACAAATA AAACACCGCC CCCATGGGCA ACGGCACAGA AATTAACTGC CGAATTAGAC 720 + TTTCTGAAAG AAAACCTCCA GCAAAGAAAG CCGAATACCA CAACTCACTC AGCAAAAATA 780 + GAAATAATCA ATGAAGAAAT AACTGAAAAT TCAACATCAC CCAAGCCGAA AAGACCCGAC 840 + GTCTGCATGA AAGACTGCCC TCGACCATTG TAAGCCGCAA CAGCAATTAG CACGGCATCC 900 + TGCGAGGGTA GGATTAGGAT AAAGGATAAA GGATTCCACC GGCGCGCCGC ACATGACAAC 960 + AGCGAATGTC TACCAAGCAG ACGTTCGAAC ACCCTGCTCC TGTCGAGCAA AGGGATCTGC 1020 + CAAGTATCAA AGAGGTAATA GAGGTAGATC CGTCCGCGGG ACCAAAGCCC TTGACCATAC 1080 + AAGAGTACAA GGCACGGACT GCAGCGAGGG AGCAGCCACC TAAAAAGAAG AGGGGTGGCC 1140 + GCCGGATTAA GTTGCTCAGC GCCCGGAGGC TCAACATCGA ACTACTGAAG ACGGCAACTA 1200 + ATGAGGAAGA CCGGCAGCGC TACAAAGAGC GCCTTGCAGC CATCAATCAA CAACTTCGTG 1260 + GTGCGAAGTA AAGCGGCGGG CTGCGTTATA CGCCATAGCC TCAACCGCCC AAATATTATA 1320 + TTAATGTTGT CGATGCGGTT TCCGCTGCAA CAAAATTACT AACTTATCAG GGACCCATTT 1380 + CATAACTAAC ACATTATACT CAGTCCTAAA CTTAAAATAA GTAATAATAT TGTAAAATTG 1440 + CAAATTGCAA CCGATGTAAA CTGAGTATAA TGAATTCATC TATCAAGTAA AAATATGTTT 1500 + AACAACAGTT TAGACCTATT AAAATTTCGA GCTATATTTA TATCTGATCG AGATAACAAT 1560 + AATTGACCAA TTCTCAAAGT TAAAATTCTA TTTGTACTTT TGATATACAA ATAAAGACTA 1620 + ATTTTCCCCA TATCAAAATG GGACATAAGT CGTGGATACA ACCCCACAGT TAAATTCAAT 1680 + GTACTTACTA TTTTTGATTT TAGTTATCCT ATCAGCCTTT TTACCTTGGC CTTAAAACTT 1740 + TATCAGTTTC ACACAAGATC GTTGAAAAGA CTTACATGAG TCGAGCCAAT GATTTAGACA 1800 + AAATCTAATA GAAACTACAC CAAAAAGGTA CAAGGTCGAT TACATCGCTA AAAGGTACAT 1860 + ACATGGAATG GCTAAACTTA ACCATATCCA TAAACAATAT TAGAGATGCT TTTGATAAAT 1920 + CCTATAAATG TATTAATAAA ACCGCGCTGA TCAAAACTCA GACGCTTATT TTTCACATAA 1980 + AGGTATTGAT AACACAATAC AACACATTAC AAAACCTAAT AGTAACAAAC AAAAGCAAAC 2040 + TCACTGAAGA ACATAAAGTC CAATGCTTCA AAGTTCTCAG TTCATTTGGT AAAAGACTAC 2100 + ATAATACCAG CGTTAGACAC AGTATTATAA TAGAAGTCCC AACAGAACTA ACCAAAATAG 2160 + CAGAATTCGA CGAAAGCCAG TTAAGAGACT TGGACGAGTC GCAGCCGTTA GAAGATTTAG 2220 + ATATCGAAAG CGATATCGAA TCAATAGAAG AATTAAAATT TAATACCGTA CAACCAAATA 2280 + CAAGAAACAT GGCCAACGCA TTAGAAGCTC AGAGAGCATA CGTTAAACAG GTATCTGCCA 2340 + CAGTACCTGA TTTCGATGGT AAGAAACTCC ATTTAAACAG GTTTGTGACA GCACTTAAGT 2400 + TGACGGATCT AACTAAAGGA GATCAAGAAA CTTTAGCAGT AGAGGTCATA AAGACCAAAA 2460 + TTATTGGCCC ATTAAACTAT AAAGTAGAAC ATGCGACAAC GATACAGGCA ATAATTACCA 2520 + TATTGCAGGC AAACGTAAAA GGCGAATCGC CTGACGTTAT AAAGGCCAAA TTAATAAATG 2580 + CCCAACAAAG AGGCAAGACC GCGTCTCAGT ATGTTACAGA AATAGACAGT ATGCGTAAGC 2640 + AGCTCGAGGC AGCTTACATA GACGGCGGAT TAGACGCCGA TAATGCTGAC AAATTCGCGA 2700 + CTAAAGAGTC GATATCAGCA ATGACCAAAA ACTGTGCCAA CGAGGCACTT AAAATGATCT 2760 + TAACTGCAGG TACATTTAGT ACATTCAACG ACGCAATGGA AAAATACCTA CATTGCAGTA 2820 + CAGAAATAAC CGGCAATTCA AATACAGTCT TATTCTATAA TGGGAATAAT AGACGTGGTA 2880 + ATTATAATGC CTACTATCGT GGTAGAGGCA GAAATAATTA TAACCATAAT TATAACCAGA 2940 + ATTATAACCA AGGTTATAAT AATAACAACA GAGGTCGCGG AGGCTACCGC GGCCACGGTA 3000 + ATAACAGAGA CGGAGGTAAC CGAAGGGGTA ACCAAAGTCA GAATAATAAT AACAACCGAA 3060 + ATGTGCGTAA CGTACAATCG GAAAACAGCC AGACCCCCTT AAGCGATCAA CAGTAAAAGT 3120 + GTTTAAAGTA AACCTAAATC TGAGTATTTT CATTAAGACA AAAAACCATG AAACAAACAC 3180 + AGTTCTTACA TTACTAATAG ACACAGGTGC AGAAATTTCA TTGCTAAAAG CCAAAGCAAA 3240 + GGAATATAAT AATATAAATT TCAGTAATAT ATCAAATATT ACAGGTATTG GGCAAGGAAC 3300 + CATACAGTCT ATAGGTACAG TAGATCTTGA CATACGCATT CAGGATGTTC TAGTGCCACA 3360 + TGAATTTCAT GTAGTACCTG AGAATTTTCC GATACCATGC GATGGCATAA TCGGAATAGA 3420 + TTTTATCAAG AAATACAATT GCGTATTAGA GTTTCAAAAT AACAAAGACT GGTTCACAAT 3480 + AAGACCCAAT AACTTCAGTA GACAGATTAG TGTACCAATT ACACATAACT TAGACTCCAA 3540 + CACACTCTTA TTGCCAGCTA GATGCGAAGT AATCAGACAA GTCAAATTAC TCACTAACGA 3600 + AAAAACGGTG GTAGTACCAA ATCAGGAGCT GCAACCAGGT ATAATAGTAG CAAGCACCAT 3660 + TGCCGATAGC AAAAACGCAT TGATTCGCAT TATAAATACA AATAATAAAG ACGCCATAAT 3720 + AGATAGCGCG AAGATCAAAT GCGAATCAAT GAAAGACTAT GACATTTTTA CAACACCAGT 3780 + AGAAAAGGAA AATAGAACTG AAGAAATTTT AAAACAATTA AGATTCCCTA AACAATTCAA 3840 + TAATGAACTA ACTAAGTTAT GCACCGAGTT TAGCGATATT TTTGGTCTAG AAACAGAACC 3900 + AATATCGGCT AACAATTTCT ACAAACAAAA ACTCAGATTA GGGGAAAAAA CACCGGTCTA 3960 + TATAAAAAAC TATCGCATGG CAGATAGCCA AAAACCAGAA ATCGCCAGAC AGGTAAAAAA 4020 + ATTAATAGAT GATGGAATAG TTGAACCATC AATGTCTGAA TATAATAGTC CATTACTTTT 4080 + GGTTCCAAAG AAACCACTTC CGAATTCCAC GGAAAAAAGA TGGCGATTAG CAGTTGACTA 4140 + TCGTCAAATA AATAAGAAAC TATTATCAGA CAAATTTCCA CTTCCAAGAA TAGAAGATAT 4200 + TCTTGATCAA TTAGGAAGAG CAAAGTATTT TTCATGTCTC GACCTAATGT CTGGATTCCA 4260 + CCAGATAGAA CTAGAAAAAA GGTATAGAGA TATAACGTCA TTTTCAACAG CCAATGGCTC 4320 + ATATCGCTTC ACGCGATTAC CATACGGACT GAAAGTAGCA CCAAACTCCT TCCAACGTAG 4380 + GATGACACTT GCATTTTCTG GTCTTGAACC ATCGCAAGCA TTTCTATATA TGGATGACTT 4440 + AGTAGTAATA GGTTGTTCAG AAAAACATAT GCTCAAAAAT TTGACTAACG TATTCGAGCT 4500 + ATGTAGACGA CATAATTTGA AACTACATCC AGGGAAATGT TCTTTCTTTA TGAAAGAAGT 4560 + AACATATTTG GGTCACAAAT GTACCGATAA AGGTATACTC CCAGATGACA CCAAATATGA 4620 + AGTTATAGAA AAATATCCTA TACCAACAGA TGCCGACAGT GCTAGGCGTT TCGTAGCCTT 4680 + CTGTAATTAT TACAGACGTT TCATTAAAAA TTTTTCTGAT CATTCACGCC ACTTAACGAG 4740 + GCTTTGTAAA AAGAATGTTC AATTCGAATG GACAGCAGAA TGCAATGATG CATTCGAATA 4800 + CCTTAAAACA GAATTAATGA AACCAACATT ACTACAGTAC CCAGATTTCG GTAAAGAATT 4860 + TTGCATAACA ACCGATGCTA GTAAACAGGC ATGCGGAGCG GTACTTACAC AAGATCACAA 4920 + TGGTCAACAA CTTCCAGTGG CATACGCTTC AAGAATGTTC ACTCAAGGTG AAAGTAATAA 4980 + GTCCACTACA GAACAAGAAT TAACGGCCAT TCATTGGGCC ATAAATCATT TTCGACCATA 5040 + CATATATGGC AAGCATTTCA TGGTAAAAAG CGATCATAGA CCATTGTCAT ACCTATTCTC 5100 + TATGAAAAAT CCAAGTTCAA AACTCACTCG TATGAGGCTG GATTTAGAAG AGTATGACTT 5160 + TACTGTAGAA TATCTTAAGG GGAAAGATAA CCATATTGCG GACGCCTTGT CTCGCATAAC 5220 + AATAAAAGAT CTGAAAACAA TCAACAGAGA AATATTAAAA GTTACCACCA GATCAAAAGC 5280 + TAAACAGGAA AATTCCTGTA AGGACGAAGC AATAGTCAAA ATACAAGAGG AAAAAGAGCA 5340 + AACAATAGAA AAGCCCAAAG TCTATGAAGT TGTCAATAAT AATGACACAA AGAAATATGT 5400 + TTTAATCAAA ATAGATAAAC ACAAGTGTTT ATTAAAACGA GGAAAAACAA TTGTTTCACG 5460 + CTTTGATGTT GATGACTTGT ATTCTAATGA AACATTTGAT CTAAATCAAT TCTTTCAAAG 5520 + GCTTATTTCA AAAGCCGGAA TGCATAAAAT AACAAAAATG CGAATATCAC CAAGCGAACA 5580 + GATGTTCCAA TTTGTATCAC TAAATGAATT TAAAATAAAG GGCAACCGAG TACTCGAAAA 5640 + AGTAGAACTA GCTATTCTAC AAAAGGTGAT AATTATAGAC AAAAATGACG AAGCTCAGAT 5700 + TAAAGAAATT TTGACAAAAT TCCATGATGA TCCTATAGAA GGAGGCCACA CTGGTATTTC 5760 + GCGAACCCAG TCAAAAATCA AAAGATTTTA TTATTGGCCC CAGATGACCA AGACAATCTC 5820 + AAAGTATGTA AAGACTTGTT TGAAATGTCA ACAAGCCAAA ATTACAACAC ATACGAAAAC 5880 + TCCATTAACA TTGATGCCAA CGCCAGCAAC AGCATTTGAT ACTGTTTTAA TTGATACCAT 5940 + TGGTCCACTA CCGAAATCGG AAGACGGAAA TGAGTATGCA GTTACAATCA TATGCGATCT 6000 + AACCAAGTTT TTAGTAACTA TTCCAACACC AAATAAAAGT GCTAAAACAG TTGCAAAGGC 6060 + TATATTTGAA TTATTTGTAC TGAAGTACGG TCCAATGAAG ACGTTCATTA CAGATCAAGG 6120 + TACGGAATAC AAAAATTCAC TTATGAATGA ATTATGCAAA TATATGCATA TAGAAAATCT 6180 + AACATCTAGC GCTCACCATC ATCAAACTTT AGGAACAATA GAAAGAAGCC ACCGAACTTT 6240 + TAATGAATAT ATACGTTCAT ACATATCGGT TAACAAAAGT GATTGGGACA TTTGGTTACC 6300 + ATATTTCACT TATTGCTTCA ATACAACACC CTCAATAGTC CATGACTATT GCCCATACGA 6360 + ACTAGTATTT GGCAGACTAC CCAGACAATT CAAAGATTTC AGTAAGATAA ACAAAATAGA 6420 + CCCAATATAC AACTTAGACG ACTACTCTAA AGAGCTTAAA TGCAGACTAG AATTGTCGTA 6480 + CAACAGAGCA AGAAGAATGT TAGAAAAAGC AAAAGCGGAT AGAAAATTAA GATATGATAG 6540 + GAATACAAAT AATTTCGAAT TAAAAATAGG AGATAAAGTA TTACTTAGAA AAGAAACAGG 6600 + TCATAAGTTA GATAAAAGAT ATGAAGGTCC TTATGACGTA GTAGATATAG GAATAAATGA 6660 + CAATATAACC ATTAAAACAG GAAGTAAGAA ACAACAAATA GTACATAAAG ATAGGCTAAA 6720 + AAAGCACAAA TAGAATGAAA AAAAAAAAGG GCAATCAATG CCAAACCTTT CATAATAAAA 6780 + CTTAAATAAC GGCCTGATCA GCCAAAACAA TATAACAAAG ACATAGACAT AATCGAATTT 6840 + TTATTAATTC AAAATACATA CATATTTTTT CTTTATTCAT TTAAAAATTC TATATCATAA 6900 + ATAATGTTAA TTCATTAAAA ATAATATTTA AGTAATTTTT ATTTTATAAT GGTAATATAG 6960 + TTGATAGAAA ATAACTTCAT TTCTTTACGT TATTTTAAAA AAGAGGGGAG GTGTAGTATG 7020 + TGCATATATC GAGGGTACAC TGTACCTATA AGTACACAGC AACACTTAGT TGCATTGCAT 7080 + AAATAAATGT CTCAAGTGAG CGTGATATAA GATCACCCAT TTATGCTTTA AGCTAAGTCA 7140 + GCATCCCCAC GCTGGCCGCT GGCCATATAT GCGCATAAGC TCTCTCTCTC TCTCTCTTAT 7200 + ACATATATAT ATACGCTGCT CTTCTGCCGC TGTCGACGGC GGCGCAGTCG CAGTATTTAG 7260 + GTAAGATTAG ACACTCTGTA GAGGTTAAGC GGGCAGAACC GTTTCTGCTA CTCGAAGAGA 7320 + TAAGAAGAAA TAAAAAGGTG GCCTGACGGC TGCACCCAAC TGCAAGGAAA ACACGTGTTC 7380 + TCAATTGGTG GCATATATTG GTTTATTACA 7410 +// +ID DMZAM standard; DNA; INV; 8435 BP. +XX +AC AJ000387; +XX +DR FLYBASE; FBte0000217; Dmel\ZAM. +XX +FT source AJ000387:1..8435 +FT SO_feature five_prime_LTR ; SO:0000425:1..473 +FT SO_feature three_prime_LTR ; SO:0000426:7963..8435 +FT SO_feature CDS ; SO:0000316:join(494..531,6387..8004) +FT SO_feature start_codon ; SO:0000318:1..3 +FT /name="Dmel\ZAM\env" +FT /db_xref="FLYBASE:FBgn0024272" +FT /db_xref="SPTREMBL:O46113" +FT /db_xref="NCBI_PROTEIN:CAA04048.1" +FT /translation="MENTLLNLLLVLLSCHGAYQSIFIHNFNSTNLLAKVPVGKTLVIG +FT NYKKISHIIDLSEYTNCIEKLYHTIDTLRQDETLTDSISILNAKLAQTQSKIDALTPFS +FT RHKRGLINGLGSLVKVVTGNMDANDAKNIETEINHLKSQSTTISDNFEIQNSFNDEVQL +FT RFKNLTRHINNEQNLIKNFFENTQNTIYTKIYNNEEEIKKLQYINRLNYNIDLLVSHLS +FT DIIESTLLAKINVIPKLILDKTEITKIKQIFKTQNYTIKSEQHIYNLLKMNALNYQNKI +FT IFSIKIPIFLSCNYEMARLIPLPINSTQFVIAPKYLIYNNKSNSMFSTMYKCPVIEEQF +FT VCEIDSINNLKNNTCLGHLIQNKTSYCDIKETGLTTDVFEPEKGFILVFNGNNLPIISS +FT NQTITSINGSAIIKYNNCTLKINEINYDNRAVSTEEHPDFFLPPMRKLIKNATINILTL +FT ERLHLDTLTTSNKLLVVAAGNSRHSTTLYILFTVSLVAVILTWTLRRDTHIFHTGPDHI +FT LPIVAPPIPPSMAFAPNWGGRSYRPIGTIHHPSL" +FT SO_feature CDS ; SO:0000316:1789..2820 +FT SO_feature start_codon ; SO:0000318:1..3 +FT /name="Dmel\ZAM\gag" +FT /db_xref="FLYBASE:FBgn0024271" +FT /db_xref="SPTREMBL:O46114" +FT /db_xref="NCBI_PROTEIN:CAA04049.1" +FT /translation="MSKKLTQTIKQTTRSVLESHTFPKRVTRSVSKTNTLPVIRESTPL +FT PPLQPINMDSGNASVGNSAPVTPTVSGFSSIATALSATDILAFVKELPTFDGTPGQLDK +FT YITSVEEIIMLIRGTDQTPYGLLTLRAIRNKIVGRADEALNLANTKLIWDDIKSNLLRL +FT YSSKKSEATLLGELQSLPDNLTLGQLFFGLSRIRSQLISITSNSGQSATIIEAKKTLYD +FT EVCLNAFISRIREPLKTVIRLKDPKTIETAYELCQGERARYQNRNPYPPTQNNTERRTN +FT NYNNNNNNNHRDNNNRNNVTRLTPKTTQTITQTPIPNIVNQTTATELVTRLKIIKQIMG +FT YTT" +FT SO_feature CDS ; SO:0000316:<2795..6448 +FT SO_feature start_codon ; SO:0000318:1..3 +FT /name="Dmel\ZAM\pol" +FT /db_xref="FLYBASE:FBgn0024270" +FT /db_xref="SPTREMBL:O46115" +FT /db_xref="NCBI_PROTEIN:CAA04050.1" +FT /translation="NKLWATQHRRRKTHPTLPYQLKFSGTRLRNPTGYINPTTHATSLP +FT YITLNLQQKFPLSFLIDTGSNNSFIDPESANQLECTILPTSTSITTALNSFKIEEKAIF +FT PMPPEFKTEGQITLLKFKFHSYFNGLIGMDLLSHLEAKVDLVNLQLVTSKSTLPIFLYT +FT NQASKIFNIPAYSKVILPLPVKTNHGEFYCCTTQLNNELSLSEGLYKSNNNIANVEISN +FT QSDSDKLLYLEYPLETIPYNKNDHIELFNISATPLNNDTPQAPLHILTEHLNPEEKTAL +FT TTLCKQFRDIFYNPETPLTFTNKITHSIPTIDNTPIHTKSYRYPFVHKTEVKKQIESML +FT DQQIIRSSHSPWSAPVWVVPKKLDGTGNRKWRLVIDYRKLNDKTISDRYPIPNINDILD +FT SIGKAKYFSTLDLTSGFHQIEMNPKDIAKTAFTVEGGHYEFTRMPFGLKNAPATFQRVM +FT DSVLGDLNGTICLFYLDDIIIFSPSLQKHLLDIKMVFEKLRAANFKLQPSKSEFLRKEI +FT EFLGHIVTQDGVKPNPNKISAIKKFPCPTNRRAIKSFLGLLGYYRKFIRDFARITKPMT +FT KQLKGKRQVTTDKDFVDAFEQCKTLLSNDPILIHPDFEKPFILTTDASNFALGAVLSQG +FT SLQNDRPVCFASRTLSDTEVNYSTIEKEMLAIIWAVKYFRPYIYGVKFTIVTDHKPLIW +FT LMNFKEPNSKIIRWRLQLMEYNFEIIHKKGSQNVIADALSRADPNLNYNETLTVKPCPT +FT SEKPINEFNTQLILEIDTNTSYQTTTPFKQKIRKKYSQPCFDFDNIVKILKGTLKPNRI +FT CAFLADDNNSALIEKAFSTYFAHKKHFKIIRCKSLLHEIVGNPEQNKFIQEYHTNSNHR +FT GIDETFLHLKRETYFPNMKNKISELIRNCETCLKLKYDRQPQNIVFETPETPSKPLDII +FT HIDIYTINNNFNLTIIDKFSKFAAVYPIPNRNGINCIKAIKNFFSQFGLPKKLIHDQGV +FT EFCNDIFRKFCSQYNILLHVTSFQQSSSNSPVERLHSSLTEIYRIILDTRKKHKLPTDH +FT EEIMSETVITYNNAIHSTTKHTPFELFNGRTHLFEKTIIPNNEHDYLNKLNTFQDKLYS +FT EIKEKLSTNTQQRIEKLNTSRVEPTTVQPNSTIFRKENRRNKLTPRFSLHRTAKDKGKT +FT LVTTRNQKIHKSKIRKISKPPNDLSLSTCIPDLAMGHTNLSSSTTSIAPTS" +XX +CC Derived from AJ000387 (e1237231) ((Rel. 54, Last updated, Version 1). +CC Takis Benos and Michael Ashburner, 19-Jan-1998. +CC Any changes to original sequence record are annotated in an FT line. +XX +SQ Sequence 8435 BP; 3286 A; 2055 C; 1151 G; 1943 T; 0 other; + AGTTACCGAC CCATCGGTAC CATACACCAC CCCTCCCTCT AAGCCACCAC GCCTACACAA 60 + GTAGAAGACA TCGAACCGGG AAGCTTTGCG ATACAAAGTT GCAGCATAAA CATCAACAAC 120 + GGGTCAGACG CCGACATCCG CCCAAAATGC TGACACCACA TCCTTTTCGC TCAGACAGAA 180 + CAACGCATAC AATTCCATAT ACATACGTAT AAACATACTC ATACTTTCTG CTGTGTCAGA 240 + TACTTTATTT CTAAGAACTT TAACATTGTA ATACATACAC ACATATTCAC TGTTAGCCCA 300 + TTTAAGACGA AGAATAAAGA CGACCACAGT CGAGTGCAAG CAGCAAACAC TTGTAGACGT 360 + ACATAATCTC CGATCAAAAT TCTCCCAAGA CGACCGTGGC TACGTTCTGG ACCCGCATAA 420 + CTCCTCTATC TTTCTGAGTG ATAATACCTC CGCAAGACTC CCCGGAGGTA ACTGGCGCAG 480 + CCGGAAAACT GGAATGGAAA ATACTTTATT AAACCTTCTA TTAGTTCTAT TGTAAGTAGT 540 + TGTGGAAAAA GAGTGAGAAT GAAGTGCAGA AATGTCTAAA AGTGATTACA ACAAAAATCC 600 + TAATACAATA CATAAACCGC CTTAACAAAC ATACAAAACA CGCATATAAA AAAAAAAAAA 660 + AAAAAAAAAA GAAAAAAAAA AACCCAAAAC TTAAAAATGC CGTAACCGCG AAACATGATA 720 + TGCGTTGTAC TTGTGTGAAA TCAATCGCTG ATAGTCACTG CCGAAGTTTA TTAAGGCCAA 780 + GTACCATATC ATTACTTTCA TGTTTACATA CATATATATG CCCCACAATT AAAACAACAT 840 + ACACACACAC AAATATTTCA AATGCAAAAA AAAAAAAAAG AATGTAGTGT ACCTGCGTGG 900 + CATCAATCGC TGATAAACCA CTGCCGAAAT ATTAAAGGCC CGGTACTACA TCACAAAACA 960 + CGTATATATG CAACAAAAAT ATACACAACA AAACCATATA TACAAACGTG TATGAGTGAC 1020 + GTGTAATGTA CTTGTGTGAA ATCAATCGCT GATAATCACT GCCGAAGCTT AGTAAGGCCA 1080 + AGTACCACAT CATTACTAAC ATGTGTACAT ATATATATAT GCAAAACAAT TAAAACAACA 1140 + TACACACACA CAAATATTTC AAATGCAAAA AAAAAAAAAA AAGAGGAAAT GTTGTGTACC 1200 + TGCGTGGCAT CAATCGCTGA TAAACCACTG CCGAAATATT AAAGGCCCGG TACTACATCA 1260 + CAAAACACGT ATATATGCAA CAAAAATATA CACAACAAAA CCATATATAC AAACGTGTAT 1320 + GAGTGACGTG TAATGTACTT GTGTGAAATC AATCGCTGAT AATCACTGCC GAAGCTTAGT 1380 + AAGGCCAAGT ACCACATCAT TACTAACATG TGTACATATA TATATGCAAA CCACCAAAAC 1440 + AAATACATAT ACACATACAA ACACTCCAAA AAAAAAAACA AATAATACTA TATGAACGGC 1500 + GAAGCGTATG TTTTCTAAGG CTGGATACAA AACCACAAAA CCAAATATAA ATTGCACACC 1560 + TTAATAAAGA AAAGAACAAA AATGATAATA AACAAAAGAA ATTTTTTTTG GAACATGCAC 1620 + CCATACTCTC ACTCTTTCAA CACAAATAAA GTATTCAAAT TATACATACA TACAATAATA 1680 + CCACTATATT ACAGAAATTA ACGCACAAGA AAACACACAC ACTATCCAAC AACAAACAAG 1740 + TAATTAAGAG TTATTAAGTA CATTGTAAAC TACATATTTT TATCTTAAAT GTCAAAGAAA 1800 + TTAACACAAA CTATTAAACA AACAACTCGC TCCGTGTTAG AATCACACAC ATTTCCCAAA 1860 + AGAGTTACAC GATCAGTTTC GAAAACAAAC ACCCTCCCCG TAATAAGAGA AAGCACCCCC 1920 + TTACCGCCCC TTCAACCTAT AAATATGGAT TCGGGCAACG CCTCCGTAGG TAATTCCGCC 1980 + CCCGTAACAC CTACTGTCAG TGGCTTTAGC AGTATTGCTA CGGCACTTAG TGCCACCGAT 2040 + ATTTTAGCCT TCGTTAAAGA ACTTCCGACC TTCGATGGTA CTCCAGGCCA ACTCGACAAA 2100 + TATATAACTA GCGTTGAGGA AATAATCATG CTCATTAGGG GTACCGACCA AACTCCGTAC 2160 + GGACTTCTGA CACTCAGGGC AATTAGGAAT AAAATAGTTG GAAGAGCAGA CGAAGCTCTA 2220 + AACCTAGCCA ACACCAAACT TATATGGGAC GATATCAAAA GTAACCTACT ACGTTTATAC 2280 + TCTAGCAAGA AAAGCGAAGC TACCCTCTTA GGCGAGCTCC AATCTCTCCC AGATAACCTA 2340 + ACCCTAGGGC AATTGTTCTT CGGCTTATCG AGGATTAGGA GCCAACTTAT ATCCATTACT 2400 + TCCAATAGTG GACAGTCGGC CACAATCATC GAAGCCAAGA AAACACTATA TGACGAAGTC 2460 + TGTTTAAACG CCTTCATCTC AAGAATTAGA GAACCACTTA AAACAGTCAT CAGATTGAAA 2520 + GACCCCAAGA CTATCGAAAC AGCTTACGAG CTATGTCAAG GAGAAAGGGC TCGTTACCAG 2580 + AACAGAAACC CATATCCCCC AACACAAAAC AACACCGAAC GACGAACTAA CAACTACAAT 2640 + AACAATAACA ACAACAATCA CAGAGACAAC AACAACCGCA ACAACGTAAC TCGTCTTACA 2700 + CCCAAAACCA CTCAAACCAT TACTCAAACC CCAATTCCCA ATATCGTCAA TCAAACAACG 2760 + GCAACAGAAC TAGTAACCCG TTTAAAGATA ATAAAACAAA TTATGGGCTA CACAACATAG 2820 + AAGAAGAAAA ACTCACCCAA CACTGCCTTA CCAACTTAAA TTTTCAGGCA CCCGCCTCAG 2880 + GAACCCAACA GGATACATAA ATCCTACCAC ACATGCAACA TCCCTTCCAT ACATAACTCT 2940 + AAACCTCCAA CAAAAATTCC CTTTATCATT TCTTATCGAT ACAGGATCCA ATAACTCCTT 3000 + CATTGACCCA GAATCTGCAA ACCAACTAGA GTGCACAATT CTACCAACAT CCACTTCAAT 3060 + TACAACAGCA TTAAATAGTT TCAAAATTGA AGAAAAGGCA ATATTCCCAA TGCCACCCGA 3120 + GTTCAAAACC GAAGGTCAAA TTACCCTACT TAAATTCAAA TTTCACTCTT ATTTCAATGG 3180 + CCTCATAGGA ATGGACCTAT TATCACACCT AGAAGCAAAA GTAGACCTAG TAAACTTACA 3240 + ACTAGTAACT TCAAAGTCTA CACTCCCAAT ATTCTTATAC ACTAACCAGG CTTCAAAAAT 3300 + TTTTAACATC CCCGCCTACA GTAAAGTTAT CTTACCACTA CCAGTAAAGA CTAATCATGG 3360 + GGAATTCTAT TGTTGTACTA CACAACTAAA TAATGAGTTA TCGTTGTCAG AAGGACTATA 3420 + TAAATCAAAC AATAATATTG CCAATGTCGA AATCTCTAAC CAATCCGACT CAGATAAACT 3480 + ATTATACCTA GAATACCCCC TAGAAACCAT TCCATACAAT AAAAACGACC ATATAGAGCT 3540 + CTTTAATATA TCAGCTACAC CTCTTAATAA CGATACCCCT CAAGCCCCAT TACATATCCT 3600 + CACAGAACAC CTCAATCCAG AGGAAAAAAC AGCCTTAACA ACCCTATGTA AACAATTTCG 3660 + CGACATATTC TACAACCCAG AAACACCATT AACTTTTACC AACAAAATCA CACACTCCAT 3720 + CCCAACCATA GATAACACTC CTATCCACAC AAAATCCTAC AGATACCCTT TTGTCCATAA 3780 + AACAGAAGTC AAAAAACAAA TCGAATCCAT GTTAGACCAA CAAATTATTA GATCTAGCCA 3840 + CTCCCCTTGG AGCGCCCCGG TGTGGGTGGT CCCAAAAAAA CTAGACGGGA CAGGGAACAG 3900 + GAAATGGCGA CTTGTAATAG ACTACCGGAA ACTCAACGAC AAAACCATTT CGGACAGATA 3960 + CCCCATCCCA AACATAAATG ACATATTAGA TAGCATAGGC AAAGCAAAAT ATTTCTCAAC 4020 + GCTCGACCTA ACTAGCGGTT TTCATCAAAT CGAGATGAAT CCAAAAGATA TCGCCAAAAC 4080 + AGCCTTTACA GTCGAAGGGG GTCACTACGA ATTCACACGG ATGCCCTTCG GCTTAAAAAA 4140 + CGCACCGGCT ACCTTTCAAC GGGTTATGGA CAGCGTTCTT GGCGATCTCA ACGGCACCAT 4200 + TTGCCTATTC TATCTTGACG ATATTATAAT TTTCTCGCCT TCCCTACAAA AACACCTGTT 4260 + GGACATAAAA ATGGTATTCG AAAAACTCAG AGCGGCAAAC TTTAAACTAC AACCTTCAAA 4320 + ATCAGAATTC CTAAGGAAAG AGATAGAATT TCTAGGCCAC ATAGTCACAC AAGACGGAGT 4380 + TAAACCAAAC CCGAACAAAA TAAGTGCGAT CAAAAAATTT CCTTGCCCCA CCAACAGAAG 4440 + AGCTATCAAA TCTTTTCTCG GGTTACTGGG TTATTATAGG AAGTTTATAA GAGACTTTGC 4500 + ACGAATAACG AAGCCCATGA CTAAACAATT GAAAGGGAAA AGACAAGTTA CTACAGACAA 4560 + AGACTTTGTA GACGCATTCG AACAGTGCAA AACTCTTCTG TCCAATGACC CAATACTCAT 4620 + ACACCCAGAC TTCGAAAAAC CATTCATTCT TACTACGGAT GCTAGTAACT TCGCGTTAGG 4680 + AGCCGTACTA TCTCAAGGCT CCTTACAAAA CGATAGACCT GTATGTTTTG CCAGCAGGAC 4740 + CCTCTCCGAC ACCGAAGTCA ACTATTCAAC CATAGAAAAA GAAATGTTGG CAATAATATG 4800 + GGCAGTAAAA TACTTCAGAC CATATATTTA TGGCGTAAAA TTTACTATTG TTACAGATCA 4860 + CAAGCCACTA ATATGGCTTA TGAATTTCAA AGAACCCAAC TCAAAAATAA TTCGTTGGAG 4920 + ACTCCAACTC ATGGAATACA ATTTTGAAAT AATTCACAAG AAAGGTTCAC AAAATGTAAT 4980 + TGCAGACGCC TTAAGTAGAG CGGACCCAAA TTTAAACTAC AACGAAACAC TGACTGTTAA 5040 + GCCTTGCCCC ACATCCGAAA AACCTATTAA CGAATTTAAC ACGCAACTCA TACTAGAAAT 5100 + AGATACAAAT ACGTCTTACC AAACTACAAC ACCATTTAAA CAAAAGATTA GGAAAAAATA 5160 + TTCACAGCCT TGCTTCGATT TCGATAATAT TGTTAAAATC TTGAAAGGAA CCCTAAAACC 5220 + TAACAGGATT TGCGCATTCT TGGCGGACGA TAATAATTCC GCATTAATCG AAAAAGCATT 5280 + CTCAACGTAT TTTGCACATA AAAAACACTT TAAAATTATC AGATGCAAAT CACTTCTCCA 5340 + CGAAATCGTA GGAAACCCCG AACAAAACAA ATTCATTCAG GAATATCACA CTAACAGCAA 5400 + CCACAGAGGC ATAGACGAAA CATTCCTTCA CCTCAAACGA GAAACCTACT TCCCCAATAT 5460 + GAAAAACAAA ATCTCTGAAT TAATTAGGAA TTGCGAAACC TGTCTAAAAC TCAAATACGA 5520 + CAGGCAACCA CAAAATATAG TATTTGAAAC CCCAGAAACC CCATCGAAAC CCCTCGACAT 5580 + AATACACATA GACATCTATA CTATTAACAA TAATTTTAAC CTGACAATCA TAGACAAATT 5640 + CTCAAAATTC GCAGCTGTCT ACCCCATCCC AAATAGAAAC GGCATCAATT GCATCAAAGC 5700 + AATCAAAAAT TTTTTCAGTC AATTCGGACT ACCCAAAAAA CTAATACACG ACCAAGGAGT 5760 + AGAATTTTGC AACGACATAT TTCGAAAGTT TTGCTCTCAA TATAATATAC TTCTCCATGT 5820 + CACATCCTTC CAGCAATCTT CAAGTAATTC TCCAGTAGAA CGTTTACACT CCTCTTTGAC 5880 + AGAGATTTAC AGAATAATAC TAGACACACG GAAAAAACAC AAATTACCTA CAGACCACGA 5940 + AGAAATAATG TCAGAAACTG TAATAACATA TAACAACGCA ATCCACTCCA CCACCAAACA 6000 + CACCCCTTTT GAACTTTTTA ATGGTAGGAC CCATTTATTC GAGAAAACAA TAATACCCAA 6060 + TAATGAGCAT GACTATTTAA ATAAACTAAA TACGTTCCAA GACAAACTAT ACTCCGAAAT 6120 + AAAAGAAAAA TTGTCCACAA ACACCCAACA AAGGATAGAA AAGCTAAACA CAAGCAGAGT 6180 + AGAACCAACA ACAGTACAAC CTAACAGCAC AATTTTCAGA AAAGAAAACA GGAGAAATAA 6240 + ATTAACACCA CGGTTTTCCT TACACAGAAC AGCAAAAGAC AAAGGAAAAA CTCTAGTAAC 6300 + CACAAGAAAT CAAAAAATCC ACAAATCAAA AATTAGGAAA ATATCCAAAC CTCCAAATGA 6360 + CTTAAGCCTT TCCACCTGCA TTCCAGATCT TGCCATGGGG CATACCAATC TATCTTCATC 6420 + CACAACTTCA ATAGCACCAA CCTCCTAGCA AAAGTGCCGG TAGGGAAAAC ACTCGTGATA 6480 + GGAAACTATA AAAAAATTAG CCACATAATC GATCTGTCCG AATACACCAA CTGTATTGAA 6540 + AAATTATACC ACACCATCGA TACCCTAAGA CAAGATGAAA CACTCACCGA TTCTATATCA 6600 + ATACTAAATG CTAAACTGGC CCAAACTCAA AGTAAAATAG ACGCACTAAC ACCCTTTTCA 6660 + CGCCACAAAA GAGGTCTTAT TAACGGGTTA GGTAGTTTAG TCAAAGTCGT CACCGGCAAC 6720 + ATGGACGCCA ATGATGCAAA GAATATAGAA ACAGAAATTA ACCACTTAAA AAGCCAGTCC 6780 + ACCACTATCT CAGATAACTT CGAAATACAG AACTCGTTCA ATGATGAAGT TCAACTACGG 6840 + TTCAAAAACT TAACAAGACA CATTAACAAT GAACAGAATT TGATTAAAAA CTTCTTCGAA 6900 + AACACTCAAA ATACAATTTA CACAAAAATA TACAACAACG AAGAAGAAAT AAAGAAACTA 6960 + CAATATATAA ATAGGCTTAA CTACAATATA GATTTATTAG TTAGCCACCT AAGCGACATT 7020 + ATAGAAAGTA CACTGCTTGC CAAAATTAAT GTTATCCCAA AACTCATCTT AGACAAGACA 7080 + GAAATAACCA AAATCAAACA AATTTTTAAA ACACAAAACT ACACAATAAA ATCCGAGCAA 7140 + CACATTTATA ACCTCTTAAA AATGAACGCA CTCAATTACC AAAACAAAAT AATTTTTAGT 7200 + ATCAAAATTC CTATTTTTTT AAGTTGTAAC TACGAAATGG CAAGATTAAT TCCACTTCCA 7260 + ATAAATTCCA CACAATTTGT AATAGCACCT AAGTACTTAA TATATAATAA CAAAAGTAAC 7320 + AGCATGTTTT CAACTATGTA TAAATGTCCT GTAATAGAAG AACAATTCGT CTGCGAAATC 7380 + GACTCCATCA ATAATCTTAA AAATAATACT TGCCTGGGAC ACCTTATCCA AAATAAGACC 7440 + AGCTACTGCG ACATAAAGGA AACGGGACTC ACGACTGATG TGTTCGAACC GGAAAAAGGC 7500 + TTCATACTTG TATTTAACGG GAACAACCTC CCAATCATCT CCTCCAACCA GACCATAACT 7560 + AGTATCAATG GATCAGCTAT AATAAAGTAT AACAATTGCA CATTAAAAAT CAATGAAATA 7620 + AACTACGACA ACAGGGCGGT ATCAACAGAA GAGCACCCCG ACTTCTTCCT ACCACCAATG 7680 + CGGAAACTAA TAAAAAATGC CACTATCAAC ATACTCACCT TGGAAAGACT TCACCTGGAT 7740 + ACACTCACAA CATCCAATAA GCTACTGGTC GTCGCCGCAG GAAACTCTCG ACACTCGACA 7800 + ACCTTGTATA TCCTCTTCAC CGTATCCCTA GTCGCCGTAA TACTCACCTG GACACTTCGA 7860 + AGGGACACCC ACATCTTCCA TACCGGGCCC GACCACATTC TTCCAATCGT CGCTCCACCA 7920 + ATTCCTCCGT CTATGGCCTT CGCTCCAAAC TGGGGGGGGA GGAGTTACCG ACCCATCGGT 7980 + ACCATACACC ACCCCTCCCT CTAAGCCACC ACGCCTACAC AAGTAGAAGA CATCGAACCG 8040 + GGAAGCTTTG CGATACAAAG TTGCAGCATA AACATCAACA ACGGGTCAGA CGCCGACATC 8100 + CGCCCAAAAT GCTGACACCA CATCCTTTTC GCTCAGACAG AACAACGCAT ACAATTCCAT 8160 + ATACATACGT ATAAACATAC TCATACTTTC TGCTGTGTCA GATACTTTAT TTCTAAGAAC 8220 + TTTAACATTG TAATACATAC ACACATATTC ACTGTTAGCC TATTTAAGAC GAAGAATAAA 8280 + GACGACCACA GTCGAGTGCA AGCAGCAAAC ACTTGTAGAC GTACATAATC TCCGATCAAA 8340 + ATTCTCCCAA GACGACCGTG GCTACGTTCT GGACCCGCAT AACTCCTCTA TCTTTCTGAG 8400 + TGATAATACC TCCGCAAGAC TCCCCGGAGG TAACT 8435 +// +ID DME010298 standard; DNA; INV; 8507 BP. +XX +AC AJ010298; +XX +DR FLYBASE; FBte0000359; Dmel\GATE. +XX +SY synonym: Batumi +XX +FT source AJ010298:1..8507 +FT SO_feature five_prime_LTR ; SO:0000425:1..272 +FT SO_feature three_prime_LTR ; SO:0000426:8236..8507 +FT SO_feature polyA_signal_sequence ; SO:0000551:158..163 +FT SO_feature polyA_signal_sequence ; SO:0000551:8383..8398 +FT SO_feature primer_binding_site ; SO:0005850:276..293 +FT SO_feature RR_tract ; SO:0000435:8236..8507 +FT SO_feature CDS ; SO:0000316:1741..6456 +FT /name="Dmel\GATE\polyprotein" +FT /db_xref="FLYBASE:FBgn0044067" +FT /db_xref="SPTREMBL:O76925" +FT /db_xref="NCBI_PROTEIN:CAA09069.1" +FT /translation="MPIGDDKKKLSADKPRSIFSPQGPKSPRIPSISVKTPAQISDDCA +FT TPSKATVQRTAKNMAASDLALAKFISVSDAQANLRLRSTLRNPQLQPSRCLASVATKSE +FT AYGTRLKRIRPLLRVPCVSRRAAASGMPILRASYSYCYSVYERCVAQLVDKIEQGHFSV +FT HPKRTLRPRPTFPLAVGCLHAIQEFSQVTIFAGRFPDLLHAIYINNPRLTPFEKLFHLN +FT AKTSGDAHAIVSISPLTKRGFSSAWENLIERFENKRLLVNSQLKILFNVQSIPQESGAA +FT LKVMQSTVQGCLTALELSGINTENWDCLLEYLCSSKLPKITLSLWEQSLHKKADIPTWG +FT ELNTFLTERHRTLEAIDDVRPSVPSQSHSKAMNSSGPSRDGKLASDLCNKENHPVRVCR +FT VFSKWSVDDRSAYIKRKQLCLNYFAKGHQLRECKDRQSFTWWPASHVVAPKQPLFQQFK +FT PFKSCKPNFRYSGQFRSKRASRCSKLFCHGSRAILLGSAIINSSHLGTNFKARALIDSG +FT SEATFITEPLFNLIRLPFQVVQAQVSGLNQTVAAQFKNAAVSPSDLRLGRVAVGDDGLC +FT PPSTSRKSAFLPNSAKFLRDLPDFPLADPKFYESAPIDVLIRSPHPASVLLSGAKTNIC +FT GSLLGQETIFRWVLTGPVSASAQSRIPLFRHRSPTRTIIHWTNSSQNLGRWRIYQQSCK +FT RIRFHVRERVGKCLRRHQCGKYVVTLPFRDPEHIGCGLGHSRSWALAQFLKNEQRLKKD +FT EALKARYDSVIQEYLDLKHMRQVLPTHDCNAYYMPHHAVLKPESVTTKLRVVFNASSPS +FT SNGTSLNDILHAGPVLQSDLTVQILKWRDFRYVFSADIQKMYRQIWVDPKHTPFQRILF +FT RNNRGEIRDFELKTVTFGVNCAPLLAIRVLQQLAADEELSHPKASNVIRNFMYVDDVLA +FT GADSTEEAQLMVHELRDALNSSSSRQRWLSKRPLQRQVLSQIAKLFDPAGWLAPFIVRA +FT KIFMQEIWLQELGWDENVPNDLFQRWLNFLQSYSVFEQIRIPRWLSFHPDFKVEHHGFC +FT DASQKAYGAAIYVRGEVGSAIMVQLLTAKTRVAPVKTVSLPRLELCGALLLSEMAAAII +FT PQMPTINSKLYCWTDSTIVLAWLSKPACQWTTFVANRETKIAQATKTENWSHVQSEHNP +FT ADLASRGVSLQDLADSQLWWHGPTWLQNPRNQWPTQVNAPVTDLEKRALKVHLAKAPSE +FT ELLARFSKLEKALRVLAYVYRFIQRCRKQTSPSDVHLLATEIAAAERFLISNTQRREFP +FT VEYHCLSEKRPVPSSSAILSMNPFLDPQGLIRACGRVAASESPQYNERHPVILPYNCLL +FT SRLLAKFTHRTTLHGGNQLMVRLIRSKYWIPRIKNLMKAVVNSCKVCVIHKRRLQSQLM +FT GVLPKERASFSRPFTVSAWITPVRDIKNYTGRACVITKGYVLVFVCFSTKAIHLEPTSD +FT LTTEKFLAAFSRFVSRRGCPRQVQSDNGKTFVGAATLLSRDFLQAVKESVTNAYIHQEM +FT QWQLFSGGTQYGRPLGSRRKKLQDAILQMHGHTKIHVRRTLHALGKNRSVP" +XX +CC Derived from AJ010298 (e1315889) (Rel. 56, Last updated, Version 1). +CC Takis Benos and Michael Ashburner, 08-Sept-1998. +CC Any changes to original sequence record are annotated in an FT line. +XX +SQ Sequence 8507 BP; 2245 A; 2251 C; 1836 G; 2175 T; 0 other; + TGTTCAAGTT ACGCTCACCC GCTGTCACCC GCTGTCACCC GCTCTCCGCT CCCTCTTACG 60 + CTCTCCCGCT CTTCACCTCA GAGTCTCCAA GGAGTCCTCG GGCTTGGGAT AGCCTAACTA 120 + ATTAGAATAA GCATCAGTGT AAAAACTAAC CACGCTGAAT AAACATACGC CCGGTCGCCG 180 + CGCAATTACG AAAAGTCTAG TGTTTGCTTT CCTTCGAGTG TTTCTTTTCA GCATATTTGA 240 + ATTCAGGACA GCCATCCCCC TACATCCCAA CATTTTGGTC CTTCGAGCCG GATCACCTGG 300 + ATTTTCAAGT TTGTCCACCA GCGAACAAAT TATAAGATAA GTACGAAATT TCCATTCCTT 360 + TTAATTGCCG GTCTGCAGCA AAAGGTTCGA AAATCCAATT TCGTTCAATT TGCTGTAAGA 420 + TTTATTGTCA AATCTAACGG ATTTCTCCGA CAAAAGGCAA TTAAAGAAAA GTACTTATCC 480 + AATCTCACGG GCGCCGCATA TTACTCGCCG TTCTCCGTTC TCCTTTCACC CTCATTCGTG 540 + AAAATTTCTA AAGTCCAAAT GGGCGAATAT ATTTAAATAT TAATCCAGTG CGATAATGCA 600 + AAATTCCAAA TGTGAAAAAG TGAATAATTT GTGCCAAGTT CAGTGAAACT TTCTAAGTCC 660 + AAAGCTCTGC CAAAATTGGC AAAAATTCTG TTCTCGTTTC ACTGTGTCAA AGCGAAGCCA 720 + AACTTCTTTT CGCAACACAT TTTTGCTTTA ACTCCGCAGT CCACTTAATA CCATTTGCTT 780 + TGCTATCGAA GAATACCACA ACGAAACAAA CAACACCATA CCCTCTGGCC ATTCAAATAA 840 + CATATTAATT AACATTTCCG CAGTTCCATA TCTCTTACAT CAACATATAC CTACTCCATA 900 + CTCTTGCATA TATTCACATC TTACACAATA TATCCTCACC ATATATTACA TATATTACAT 960 + CAACATATAA TATCCACATA TATTACCGAC ATACATTGCG CATATTATCA GCATTCCTTT 1020 + AACGTATACC AAAGTTTAAA TTCGATCCCG TCGGCAAATC CAACCACAAA TAAAATTTAT 1080 + TCCAAGTGCC GACGCGGAAA GGCGTTTTCT TTTCCATCAA TTTTTTCCGT AAATTTCCAA 1140 + ATTAATTTCC GAGCAATAAA TTAAAAGCGG TTTTTTCTTT TTTTTTAACA AATAACTTAT 1200 + TGTTGAAAAC ATTTATTAAA TTATTAAAAA TTATATAAAT AATACGACCG CCAAATACAA 1260 + GTCGTTCACC CGACAAATAT TTTTTCCTGT ATTGCTTGGA TATTAATTTG TGTTTGTTTT 1320 + AGAAGTACTT ACAACGCGGA GAAAAGACTC CAAATCCACC ATTCCATTTT CTCCGTTTCC 1380 + AGTTATAAAC AAAAAAATAA ATAAAATTTT CTTCCTTCTA ATAAACATTT TATTTTACCG 1440 + TGTTCACATT CCAAGTGTTC CAACCGTAAA TAAGGTGGAC CTAATTACCA TAAATCACAG 1500 + GTCATTTATA CAATTCGCTG TTCACTCCGA GTCACCTGTC CAATTAGTCT AAACTACGGC 1560 + GTTTCCACTT CGCAAATTCA ACACCACTTT CTCACCCATT ACATCCTATA CGGTCCTTTT 1620 + CCGCTGCTTT ATACCGTTCA CGGCAGGAAG CTTAAATTTA TTAAGTGGAA TCTGTCTACT 1680 + TTTTCAAAAG TGTGACCGGG CTCCAAAAAC GCTTCCCTTC CATTTCGTAT TTCTTCGATT 1740 + ATGCCCATCG GGGACGATAA GAAGAAATTG TCCGCTGACA AACCCAGGTC TATTTTTTCA 1800 + CCACAAGGGC CCAAGAGTCC AAGAATCCCA AGCATTTCGG TGAAAACGCC TGCGCAGATT 1860 + TCCGACGACT GTGCCACTCC ATCCAAAGCC ACAGTACAGC GCACAGCTAA AAATATGGCT 1920 + GCTTCCGATC TAGCGCTAGC CAAATTCATT TCGGTTTCTG ACGCTCAAGC GAATTTGAGG 1980 + CTCAGATCAA CACTCCGGAA TCCGCAGCTC CAACCGTCAC GATGCTTAGC GTCCGTCGCG 2040 + ACCAAGTCCG AAGCCTATGG GACAAGGTTG AAAAGAATTC GACCTCTGCT CAGAGTGCCT 2100 + TGTGTCAGCA GGCGAGCGGC AGCAAGCGGC ATGCCTATTC TCAGGGCTAG TTACAGTTAT 2160 + TGCTATTCAG TCTATGAAAG GTGTGTTGCC CAGCTCGTTG ATAAAATCGA GCAGGGGCAC 2220 + TTCTCAGTCC ATCCCAAGCG AACGCTGCGG CCCAGGCCTA CATTTCCTCT GGCTGTCGGT 2280 + TGCCTCCATG CGATACAGGA GTTTTCGCAG GTGACTATCT TCGCTGGCCG CTTTCCGGAT 2340 + CTTTTACACG CCATTTATAT TAATAATCCA CGGCTGACTC CGTTCGAAAA GTTATTCCAC 2400 + TTAAATGCCA AAACAAGTGG CGACGCGCAT GCCATAGTTT CGATTTCGCC TCTCACCAAA 2460 + CGAGGGTTTT CCTCTGCGTG GGAAAACCTA ATAGAGCGTT TCGAAAATAA ACGATTGTTG 2520 + GTAAACAGTC AATTGAAAAT ACTGTTTAAT GTGCAGTCGA TACCACAGGA ATCTGGGGCG 2580 + GCCTTGAAGG TAATGCAAAG TACTGTTCAA GGTTGCTTGA CTGCCTTAGA ACTGTCAGGC 2640 + ATCAACACTG AGAACTGGGA CTGCCTGCTG GAATATCTGT GTTCATCCAA GCTCCCGAAG 2700 + ATAACTCTCT CCTTATGGGA GCAGTCTCTA CATAAGAAAG CCGACATCCC GACATGGGGA 2760 + GAACTGAACA CCTTCCTCAC AGAACGTCAT CGAACCCTAG AGGCCATCGA TGATGTGAGA 2820 + CCGTCCGTAC CAAGTCAGTC GCACTCCAAA GCGATGAACT CAAGTGGGCC CTCTAGAGAT 2880 + GGCAAGCTGG CGTCCGACTT GTGCAACAAG GAAAACCATC CTGTCCGTGT ATGTCGCGTT 2940 + TTCTCCAAAT GGTCGGTTGA CGACCGGTCA GCCTACATTA AACGGAAGCA GTTATGCTTA 3000 + AACTACTTTG CAAAGGGACA TCAGCTTCGT GAGTGCAAAG ATCGACAAAG TTTTACTTGG 3060 + TGGCCGGCAT CACACGTTGT TGCACCGAAA CAACCTCTTT TCCAGCAATT CAAGCCCTTC 3120 + AAATCCTGCA AGCCCAATTT CCGCTACTCA GGCCAATTTC GTTCCAAACG AGCAAGCCGG 3180 + TGTTCAAAAT TATTTTGCCA CGGCTCAAGA GCTATCCTTC TTGGCAGTGC CATAATCAAT 3240 + AGTTCCCATC TTGGCACTAA CTTTAAGGCA CGCGCCCTGA TCGACTCCGG ATCAGAGGCG 3300 + ACATTCATAA CCGAGCCACT GTTCAATCTA ATTAGATTGC CATTCCAGGT GGTTCAAGCC 3360 + CAAGTCTCGG GCTTAAACCA AACAGTAGCT GCTCAGTTCA AGAACGCTGC AGTTTCACCA 3420 + TCCGATCTCC GACTAGGCCG CGTTGCAGTT GGAGACGACG GCCTATGTCC TCCCTCAACT 3480 + AGCCGGAAAT CTGCCTTCCT ACCCAATTCC GCAAAATTTC TTCGGGATCT TCCCGATTTT 3540 + CCACTGGCGG ATCCAAAATT CTATGAGAGC GCCCCAATAG ATGTACTTAT CCGGAGCCCA 3600 + CATCCTGCTT CGGTGCTTCT GAGTGGAGCA AAAACCAACA TCTGTGGCTC TCTCTTGGGG 3660 + CAAGAGACCA TTTTCCGCTG GGTACTAACT GGGCCAGTGT CAGCCTCAGC CCAAAGCAGG 3720 + ATTCCTCTTT TTCGACACAG ATCTCCCACG CGTACGATAA TTCACTGGAC AAACTCCTCA 3780 + CAAAATTTGG GGAGGTGGAG GATATACCAA CAAAGTTGCA AAAGAATCCG ATTCCATGTG 3840 + CGAGAACGGG TTGGTAAATG CTTACGACGA CACCAGTGCG GCAAATATGT CGTTACTCTG 3900 + CCTTTTCGCG ACCCAGAACA TATCGGTTGC GGGCTAGGGC ATTCTAGGTC TTGGGCGTTG 3960 + GCTCAGTTCT TGAAGAATGA GCAGCGTCTA AAAAAAGATG AGGCCTTGAA AGCGAGATAC 4020 + GATTCGGTGA TCCAGGAATA TCTCGACTTA AAGCACATGC GACAAGTTCT GCCTACCCAT 4080 + GATTGCAACG CCTATTATAT GCCACATCAC GCCGTCTTAA AACCGGAGAG TGTAACTACT 4140 + AAACTCCGTG TAGTATTCAA TGCCTCCAGC CCTTCATCGA ATGGTACCAG TTTAAATGAT 4200 + ATCCTTCATG CTGGCCCTGT CTTGCAGTCC GACTTGACAG TGCAAATTCT GAAGTGGCGC 4260 + GATTTCCGAT ACGTGTTCAG TGCCGATATT CAAAAAATGT ATCGGCAGAT CTGGGTAGAT 4320 + CCGAAACACA CTCCATTCCA GCGAATACTT TTCCGTAACA ATAGAGGGGA AATCAGAGAT 4380 + TTCGAATTGA AAACAGTAAC CTTTGGAGTC AATTGCGCGC CCTTGCTGGC GATCCGAGTA 4440 + CTGCAGCAGC TAGCAGCTGA CGAAGAACTC AGCCATCCAA AAGCTAGCAA TGTCATTCGA 4500 + AATTTCATGT ATGTGGATGA TGTTTTAGCC GGAGCGGACT CTACGGAAGA AGCTCAGCTC 4560 + ATGGTGCACG AGCTCCGAGA CGCTCTGAAT TCTTCTTCGT CCCGCCAGAG ATGGCTATCG 4620 + AAACGTCCTT TACAACGCCA AGTCCTGTCC CAAATTGCCA AATTGTTCGA CCCTGCAGGC 4680 + TGGTTAGCAC CGTTTATCGT TCGAGCTAAA ATTTTCATGC AGGAGATTTG GCTACAGGAG 4740 + CTTGGGTGGG ACGAAAACGT TCCAAATGAC CTTTTTCAGC GATGGCTTAA TTTTCTCCAA 4800 + AGTTATTCGG TTTTCGAGCA GATACGCATT CCACGCTGGC TATCGTTTCA TCCAGATTTC 4860 + AAGGTCGAGC ATCATGGCTT TTGCGATGCA TCGCAAAAGG CTTATGGCGC CGCAATATAT 4920 + GTCCGCGGAG AAGTGGGCAG CGCCATTATG GTGCAACTCC TAACCGCCAA AACCCGGGTA 4980 + GCACCAGTCA AAACGGTTTC GCTCCCAAGA CTCGAGCTCT GCGGAGCGTT ATTGCTTTCC 5040 + GAAATGGCTG CAGCCATCAT TCCGCAGATG CCTACGATTA ACTCCAAACT TTACTGTTGG 5100 + ACGGACTCCA CCATAGTGCT TGCATGGTTA AGCAAGCCAG CATGCCAGTG GACCACATTT 5160 + GTAGCCAATA GGGAGACGAA GATCGCCCAG GCCACAAAAA CAGAGAATTG GTCTCATGTT 5220 + CAATCTGAGC ATAATCCAGC AGACCTGGCA AGTAGAGGAG TTTCCCTCCA AGATCTAGCC 5280 + GATAGCCAGT TATGGTGGCA CGGACCGACT TGGTTGCAAA ATCCACGCAA CCAATGGCCT 5340 + ACTCAGGTCA ACGCTCCGGT GACCGACCTG GAGAAGCGTG CTCTAAAAGT CCATCTCGCG 5400 + AAAGCTCCTT CTGAAGAGTT GTTGGCACGT TTCTCCAAGC TAGAGAAAGC TCTACGAGTC 5460 + CTTGCCTATG TTTATCGCTT CATTCAGCGG TGCAGGAAGC AGACATCTCC ATCTGATGTT 5520 + CATCTACTGG CCACTGAAAT CGCCGCCGCC GAGCGGTTCC TAATTTCGAA CACTCAACGC 5580 + AGAGAATTCC CTGTGGAATA TCACTGCCTA AGTGAAAAGC GTCCAGTGCC AAGTTCAAGT 5640 + GCCATCCTAA GCATGAACCC GTTTCTAGAT CCGCAAGGAC TGATCAGGGC ATGCGGCCGT 5700 + GTGGCGGCTT CCGAAAGCCC TCAATACAAT GAACGCCATC CAGTGATTCT TCCGTATAAC 5760 + TGCCTGCTTT CTCGCCTCCT TGCGAAGTTC ACGCATCGCA CAACTCTCCA TGGTGGTAAC 5820 + CAGTTAATGG TGCGCCTCAT CCGGTCGAAA TACTGGATTC CGAGAATCAA GAACCTGATG 5880 + AAAGCAGTGG TAAATTCGTG CAAAGTATGT GTGATCCACA AAAGGCGGTT GCAAAGCCAA 5940 + CTGATGGGTG TCCTGCCCAA AGAAAGAGCA TCGTTCTCCC GACCATTCAC GGTATCGGCA 6000 + TGGATTACGC CGGTCCGCGA TATAAAGAAC TATACGGGAA GAGCATGTGT TATTACAAAG 6060 + GGGTATGTGT TAGTTTTTGT TTGTTTCTCC ACCAAGGCCA TCCACTTAGA GCCTACATCT 6120 + GACTTAACGA CCGAGAAGTT TCTTGCCGCT TTCTCTCGTT TTGTATCCAG GAGAGGGTGT 6180 + CCACGTCAAG TCCAGTCAGA CAATGGCAAA ACCTTTGTTG GCGCTGCCAC CCTGCTTTCC 6240 + CGCGATTTCC TTCAAGCCGT AAAAGAGTCG GTGACGAATG CCTATATTCA TCAAGAGATG 6300 + CAATGGCAAT TATTCTCCGG GGGCACCCAA TATGGGAGGC CTTTGGGAAG CAGGCGTAAA 6360 + AAGCTTCAAG ACGCTATTTT ACAAATGCAC GGCCACACGA AAATACACGT TCGAAGAACT 6420 + CTCCACGCTC TTGGCAAAAA TAGAAGCGTG CCTTAACTCC AGGCCGCTCT CTCCTATGTC 6480 + TGAAGATCCG ACAGACTTGC TGGCTCTGAC GCCAGGGCAT TTCCTTGTCG GGGGACCCCT 6540 + TATGTCCACG GTGGAACCCG AAGTAAAGGG GGAAACGAAA TCCCTTCTTA ATCGGTGGCA 6600 + GCATTTGAAG GCTCTCCATC AGCAGTTCCG TGTGCGATGG AAAGAAGAGT ACCTCAAAGA 6660 + ACTCCACAAG CGTTCTAAAT GGCAGGTCCC GTGAACTTCG AGCTAAAATA CTCGTGCATG 6720 + TGGAGCAGCG TGTGGTGGGA TCGGTCGCAC TTCTTGCAAC GATCACCGCT TCGGCAGTCT 6780 + CCCGTGGAAT GCTCGTGAGC GAGGCAATTG GCGCTAGTAT GTTGGTAATG AGGACTGCTC 6840 + GCAAACGCTT TTCAGCGCTG AGCTTTAGGA ACCTCGCGCA CGTCCGAAGA GGATGGATTA 6900 + CCGCGGCAGA CTCGGCATCG GTAGGATTTA ATACCTCGGG TACGTCTGCT CTCCACGGCA 6960 + CGACCTGCGT GCGTTTTGTT GACGAGGAGC CATGTGCGCG TAGTCGAATG TCGAAAGGAG 7020 + ATCGAAAACG AAATGAAAAA TAACGGATGA TTAGTGATAG TGAACTACAA CTAAGGACGA 7080 + GAGGAGAGAC CTATTATTGT GGAGATTCGG AACTCCGTCG GCAAAAGCAC CTTTTTTGCC 7140 + ACTGGACGTT TAATAACTCC ACGTGCAGTA CGGATGTTTA CTACACGACG TTGCCGTCAG 7200 + CTCCTGGGAA AACAGACTCA ATTCTGCCGA GCCGCCACTC ATTAGAGGGC AAGTTGTCGT 7260 + CCTTGATGAC GACTGTTGAG TTACGGGGTT TGGACTGTCA CCGTCTCCGC TCCCTCTTAC 7320 + GTTCTCCACT CCCTCTTACG CTCTCCCGCT CTTCACCACA GAGTCTCCGA GGAGTCTCTG 7380 + GCGCTTGGGA GAACCCAACG CATTAGAATA AGTTTTAGTG TAAAACTAAC CACGATCAAT 7440 + AAAACATACG CCCGGTGCCC GCGCTAATTC TACAAGTCTT CGAGTGTTTT TTCGAGTGGT 7500 + CTTTTTTTCA GCAAACTAGG AACTTTCCAG GACCAGCACC CCCCATCACC CCAACAACGA 7560 + CCATGTCATC GATGGCGTCG CCAACCGGCG CCAACCCTGC AAGCAGCTTC GGCCTCGTCC 7620 + CAACGTTCCC GCCGGCACAA TCCGCCAACT CAGCGTAGGA GTTCACCGCC ACGACGACCG 7680 + GAATCGACGA CGCCAGGCCC ATCACTCTCG TCGCCGCTGC AACGCCACAG CGTGAACATC 7740 + CTTCCCACAG CGCTGGTCAA GATGGAGACC GGGACGAAGA CCTTCAGACC GCAGCACTCA 7800 + TCGATCCGTG CAGCCCCATG AGCTGCATCG ACGCTTCGTT GGCGTCAGCC TTTAAGCTTT 7860 + CGATGACCAA TGTTGGCGAC GAGAAGGTCT GCACGACGAC GATTCGCTCC AGGATCGACG 7920 + CGAACACGAA GCTCGAGGTC GTGCTCAAGA TCGAGCCCAG GGTGCGGATC CGTACACCTG 7980 + TCCGGGCATT GAGCGACACC GTAGTGTCCA AGTACAGGGA CATCATGCTG GCGGATGACG 8040 + GGTTCCATCG GCCTGCTACC GTATCCATGG TCTTAGGAGC AGACATTTAT CCTAAGGTTA 8100 + TCCAATCCGG ATTCCTGACC TTCGACGAGG GAATGCCGGT CGCTCAAAAG ACCGTGTTTG 8160 + GGTGGATCGT GTCCGGTGCC TGCAGCTTGC CTAGATGGCT ATGTTGCAAC CCCAGTGATT 8220 + GCAAGGGGGG CGGAATGTTC AAGTTACGCT CACCCGCTGT CACCCGCTGT CACCCGCTCT 8280 + CCGCTCCCTC TTACGCTCTC CCGCTCTTCA CCTCAGAGTC TCCAAGGAGT CCTCGGGCTT 8340 + GGGATAGCCT AACTAATTAG AATAAGCATC AGTGTAAAAA CTAACCACGC TGAATAAACA 8400 + TACGCCCGGT CGCCGCGCAA TTACGAAAAG TCTAGTGTTT GCTTTCCTTC GAGTGTTTCT 8460 + TTTCAGCATA TTTGAATTCA GGACAGCCAT CCCCCTACAT CCCAACA 8507 +// +ID ROXELEMENT standard; DNA; INV; 4740 BP. +XX +AC AF237761; +XX +XX +DR FLYBASE; FBte0001160; Dmel\X-element. +XX +SY synonym: BS2 +XX +FT source AF237761:1..4740 +FT SO_feature CDS ; SO:0000316:322..1827 +FT SO_feature start_codon ; SO:0000318:1..3 +FT /name="Dmel\X-element\ORF1" +FT /db_xref="FLYBASE:FBgn0041613" +FT /db_xref="SPTREMBL:Q9NBX5" +FT /db_xref="NCBI_PROTEIN:AAF81410.1" +FT /translation="MNTLNETAAADESLDTAFLSSPQCAAPQRFQKIKRKSRASPETER +FT KKPKSTIGKQGENPSATEPRYGGNSNRFGLLAHLTADKQVGNEIGDLYDQPSTSHQAAI +FT AAAKRDAASAGTTSSAKRAQSKPPPIVMEGVDDVYLMMQSIENIVDLEKIEARASMSGV +FT LRLYAADANTFRTIVNWLEIEEYEFHCYQLKEDRPYRVCVKGLHHSTLHHQIKDELEKI +FT GHKVLDIHTPLRRNEPGTSKASPVNMFFLNIAAAANNKEILAVKALCHMRVVIEPLRKR +FT NAIVQCHRCQQIGHTAKYCRKAHICVKCAGEHPAKDCTRPRIELCTCYNCGGQHPANYK +FT GCSKLQAFLQRSRPRSGVAGRTEVSDRPTPRGLAGGKEIPSSRGGISYADVARGSIHHK +FT QPMSLTHQQQKQKQQPYDGSPSRQRSRSRTRASRGTLQRSTDASSSIEAILQTLNENIN +FT SLRSIQEKQMELMMMMMKQQQQQSHQQGQIINLLTALQARQAP" +FT SO_feature CDS ; SO:0000316:1827..4553 +FT SO_feature start_codon ; SO:0000318:1..3 +FT /name="Dmel\X-element\ORF2" +FT /db_xref="FLYBASE:FBgn0041612" +FT /db_xref="SPTREMBL:Q9NBX4" +FT /db_xref="NCBI_PROTEIN:AAF81411.1" +FT /translation="MMPLRILVWNADGVSTKLPEVECFVRRHEIDVLLLSETHCKGAET +FT PKLFGFVAYTANDPSGGNAKGGAAILIKNSLAHFPLTPIATAKVQLAPAVIETALGPIS +FT FGAVYCPPRFAWTTDEFKDILEEFQTKFIVAGDWNASHWLWGAGRSNQRGIALANLVLN +FT SEVDSLATGGPTRYPYGCRGSPGYIDFALTKGVLGIHANISAVVELSSDHLPLVITLDA +FT GAISYPKMERLITRRTNLEVFQSQLESTLPLNTAINSGQDVDDAIELLTNNIKSAARLA +FT TRSISRQPAADRIPIPREILLLIAEKRRLRTRWMRSRHPSDKTEWNRALSRLRCALVLH +FT KAAWFDERLANTGVESEATHSLWKATRAIKRRCTRKAPLVDSNGTWCRTDLGQAEVFAA +FT HLAERFQPFKLASLQQVEETQDQLNQALQMDMPITPFEPCEVAEVIVRQSNNKAPGHDV +FT ICNATLKALPRQAILYITLVFNAIVRLQYFPYQWKLGIISMIHKPGKPEREPASYRPIS +FT LLPSISKVFERLIAVRIVSIMEAQGITPEHQFGFRAGHCTVEQLHRVVEQILTAYDSKE +FT YCNSLFLDIREAFDRVWHIGLQLKIKQTLPAPYFGLLKSYLEGRRFAVRFHSAISTEHN +FT VAAGVPQGSVLGPLLYCLYSHDMPQPDVSLYGKSMLATFADDVCVTYRSRCEHDAADGI +FT QDFAYRFSEWARRWNIGINSSKSNNVCFTLKRRTPPPVYIEEVPVPQPNAAKYLGVLLD +FT RRLTFSKHVTDIRTRLRAKVAKHYWLLSSRSKLSLSNKLTIYKQILAPNWKYGCQIWGL +FT ACDSHIKRIQAIQNKVARLITGCEWFVRNTTLHRDLKLATVFDEINKHSSRYHDRLERH +FT RNRLASALNRSRPPRRLNRRQPRDLITRSPLTRVRRS" +XX +SQ Sequence 4740 BP; 1336 A; 1215 C; 1183 G; 1006 T; 0 other; + AATGTTAAAT AAAGGTTCGT GTCTAACAAT ACGCACCTGA CAAAGTGGAT TAAGTGAAAT 60 + TAGTTTTCGC GGTAATAAAC TTATGGACAA GACCAGAATA CTGGCACACA TAGCAAATAG 120 + TGACCCCCCA AGTCACTAAC AGTGAAATAA TAGTGAAACG AAAACATTTT CATTCAAAAA 180 + TACAAAGTTA AGTTTCTCGA ACTGGGGCTC CGCTGCCCAG CTGCCACGCG ATCGCACAAA 240 + CAGCTGTTTG CGAGCTTAAA GCTTTCTATC CCAGGGTTCA AGTTTTGGCT AGAACCCTGG 300 + TGATTTGGTG CACACTTCAA TATGAACACT TTAAATGAAA CCGCTGCGGC TGATGAATCG 360 + TTGGATACTG CGTTTCTCTC GAGCCCCCAA TGTGCTGCCC CGCAGCGCTT TCAAAAAATA 420 + AAGCGAAAGT CTCGTGCTTC TCCGGAGACT GAAAGGAAAA AACCCAAATC AACCATCGGC 480 + AAACAAGGGG AAAACCCTTC GGCTACAGAA CCTAGATATG GCGGCAATTC AAACCGATTT 540 + GGTTTACTTG CGCATCTCAC AGCTGACAAA CAAGTAGGCA ATGAAATTGG CGATCTGTAT 600 + GACCAGCCCA GTACCAGTCA TCAAGCTGCA ATTGCTGCCG CTAAGCGGGA TGCAGCCTCC 660 + GCTGGTACCA CTAGCTCAGC CAAAAGAGCG CAGTCCAAAC CACCTCCTAT AGTAATGGAG 720 + GGAGTGGACG ACGTATACCT GATGATGCAG AGCATCGAAA ATATAGTGGA CCTAGAAAAG 780 + ATTGAGGCTA GGGCGTCAAT GAGCGGTGTC CTAAGGCTTT ACGCGGCTGA CGCTAATACA 840 + TTTCGCACCA TAGTGAACTG GCTCGAGATC GAAGAGTATG AGTTCCACTG CTACCAGCTT 900 + AAAGAGGACA GGCCTTACAG GGTATGCGTG AAAGGCCTGC ACCACAGTAC GCTACATCAC 960 + CAAATCAAGG ATGAGCTGGA AAAGATCGGG CACAAGGTTC TCGATATTCA CACACCGCTT 1020 + AGGCGAAACG AACCGGGTAC CTCAAAAGCG TCGCCAGTCA ATATGTTCTT CCTAAATATT 1080 + GCTGCTGCGG CAAACAATAA GGAGATCCTG GCGGTAAAGG CACTATGCCA TATGAGAGTA 1140 + GTTATTGAGC CTCTCCGCAA GCGTAACGCT ATTGTCCAGT GCCATCGTTG TCAGCAGATT 1200 + GGCCACACAG CCAAATACTG CCGTAAGGCC CACATTTGTG TGAAATGTGC CGGCGAACAC 1260 + CCAGCCAAGG ACTGTACCAG GCCACGCATC GAGCTGTGCA CTTGCTACAA CTGTGGCGGC 1320 + CAGCATCCTG CAAACTATAA AGGTTGCAGC AAGCTACAAG CGTTCCTGCA GCGATCCAGA 1380 + CCCAGAAGTG GAGTGGCTGG AAGAACAGAA GTAAGCGATC GACCAACTCC ACGGGGCTTA 1440 + GCTGGAGGTA AGGAGATCCC CTCTTCTCGA GGCGGAATAT CTTATGCAGA TGTGGCTAGA 1500 + GGGTCCATTC ACCACAAGCA ACCAATGAGC CTGACGCACC AGCAACAGAA GCAAAAGCAA 1560 + CAGCCCTATG ATGGAAGCCC CAGTCGTCAA AGGAGCCGCA GCCGGACAAG GGCGTCTAGG 1620 + GGTACACTCC AGCGCTCGAC GGATGCTAGC AGCAGCATTG AAGCCATCCT GCAGACGCTT 1680 + AATGAGAACA TTAATTCTTT GCGCTCGATT CAAGAGAAGC AAATGGAATT AATGATGATG 1740 + ATGATGAAGC AACAGCAACA ACAGTCACAT CAGCAGGGGC AGATTATCAA TCTGCTCACT 1800 + GCTCTCCAAG CGCGTCAAGC GCCATAATGA TGCCGCTGCG CATCCTAGTG TGGAACGCCG 1860 + ACGGCGTATC CACGAAGTTG CCTGAAGTAG AGTGCTTCGT GCGACGTCAC GAAATCGATG 1920 + TATTACTGCT CAGCGAGACA CACTGCAAGG GGGCAGAGAC GCCTAAGCTA TTCGGATTTG 1980 + TAGCCTACAC TGCCAATGAT CCGAGTGGTG GCAACGCCAA AGGCGGAGCA GCTATCTTAA 2040 + TCAAAAATAG CCTTGCCCAC TTTCCGCTAA CACCAATAGC CACTGCCAAG GTGCAACTTG 2100 + CGCCGGCGGT TATTGAAACG GCACTTGGTC CTATAAGCTT TGGAGCGGTC TACTGCCCAC 2160 + CGAGATTTGC ATGGACTACG GACGAGTTTA AGGACATTTT GGAAGAGTTC CAGACGAAGT 2220 + TCATTGTTGC AGGCGATTGG AACGCGTCCC ACTGGCTCTG GGGTGCGGGA AGGAGCAACC 2280 + AAAGAGGCAT TGCATTAGCG AATCTCGTCC TAAATTCGGA GGTGGACTCG CTAGCAACAG 2340 + GAGGACCAAC AAGATACCCG TACGGCTGTA GAGGCTCACC AGGGTACATC GATTTTGCAC 2400 + TGACAAAGGG TGTGCTGGGC ATCCACGCTA ACATAAGTGC GGTTGTTGAG CTTAGCTCCG 2460 + ACCACCTGCC TCTGGTAATT ACGCTGGATG CGGGGGCAAT ATCCTACCCT AAGATGGAGC 2520 + GGCTTATCAC TAGGCGTACT AACCTGGAGG TATTCCAATC GCAACTGGAG TCCACACTGC 2580 + CCCTCAACAC TGCCATAAAC TCTGGACAGG ACGTTGATGA TGCTATCGAA CTGCTCACCA 2640 + ACAATATCAA GTCAGCAGCT AGATTGGCAA CTCGCAGCAT ATCTCGGCAG CCCGCGGCAG 2700 + ATCGAATCCC AATACCCAGG GAGATCCTGC TGCTTATAGC TGAGAAGAGG CGCTTACGCA 2760 + CTAGGTGGAT GAGGTCTCGG CACCCGTCGG ACAAAACGGA ATGGAACCGA GCTCTGAGTA 2820 + GGCTCCGATG CGCGTTGGTG CTGCACAAAG CCGCATGGTT CGACGAAAGG CTTGCCAATA 2880 + CCGGAGTCGA AAGCGAAGCG ACGCATTCGC TGTGGAAGGC CACGCGCGCA ATCAAAAGGC 2940 + GTTGCACGAG GAAGGCGCCT CTAGTCGATA GCAACGGGAC ATGGTGTCGG ACCGACTTGG 3000 + GACAAGCGGA GGTATTCGCT GCGCACCTCG CCGAGCGATT TCAACCATTC AAGCTTGCCA 3060 + GCCTGCAACA GGTTGAAGAA ACTCAGGACC AGCTGAACCA AGCGCTTCAA ATGGATATGC 3120 + CAATCACGCC GTTTGAACCC TGCGAGGTAG CCGAAGTCAT TGTGCGCCAG AGTAACAACA 3180 + AAGCACCTGG ACATGACGTC ATCTGCAACG CCACATTGAA GGCCCTGCCC AGACAAGCGA 3240 + TCCTCTACAT AACGTTGGTT TTCAACGCTA TTGTGAGGTT GCAATACTTC CCTTATCAGT 3300 + GGAAGCTCGG GATAATCTCC ATGATCCACA AACCTGGCAA GCCGGAAAGG GAGCCCGCCT 3360 + CCTACCGGCC GATCAGTCTC CTCCCTTCAA TTTCGAAGGT GTTTGAGAGA CTGATTGCTG 3420 + TCCGGATTGT AAGCATTATG GAAGCCCAGG GGATTACCCC TGAGCACCAG TTCGGTTTCC 3480 + GTGCTGGCCA CTGTACTGTC GAGCAGCTCC ATCGAGTCGT CGAGCAAATT CTGACTGCCT 3540 + ACGACAGTAA GGAATATTGT AACAGCCTCT TCTTGGACAT TCGAGAAGCG TTTGATCGAG 3600 + TGTGGCACAT TGGACTCCAA CTGAAAATCA AGCAGACGCT GCCTGCCCCA TATTTTGGGT 3660 + TGCTGAAATC GTACCTGGAA GGAAGGAGGT TCGCTGTGCG CTTTCATTCA GCAATTTCCA 3720 + CCGAGCACAA CGTGGCAGCT GGTGTTCCAC AAGGTAGTGT CCTCGGCCCC CTGCTCTACT 3780 + GCCTGTATAG CCACGACATG CCGCAGCCAG ATGTAAGCCT TTACGGGAAA TCTATGTTGG 3840 + CCACATTTGC CGATGACGTG TGCGTCACCT ACAGGTCCCG ATGCGAGCAC GACGCAGCCG 3900 + ATGGTATCCA GGACTTTGCA TACCGGTTCT CGGAATGGGC AAGACGATGG AATATTGGCA 3960 + TCAATAGCAG TAAATCCAAC AACGTCTGCT TCACTTTAAA GCGGAGAACG CCACCGCCCG 4020 + TCTACATCGA GGAAGTCCCC GTACCACAGC CGAACGCAGC AAAGTACCTT GGAGTGCTTC 4080 + TGGATCGCAG ACTCACATTT TCCAAGCATG TGACCGACAT CAGAACGCGC CTACGTGCTA 4140 + AGGTGGCGAA GCACTACTGG CTACTTTCTT CGCGCAGTAA ATTGTCGCTA TCCAACAAGC 4200 + TGACAATTTA CAAACAGATC CTAGCACCAA ACTGGAAGTA TGGGTGCCAA ATCTGGGGCT 4260 + TAGCCTGCGA CAGCCACATC AAAAGGATCC AGGCTATTCA AAATAAGGTA GCAAGACTCA 4320 + TCACCGGCTG CGAGTGGTTT GTTCGAAACA CCACCCTGCA CAGAGACCTG AAACTCGCAA 4380 + CGGTATTTGA CGAAATAAAC AAGCACTCGA GCAGATACCA TGACAGGCTG GAGCGCCACA 4440 + GAAATCGGCT GGCCAGCGCT TTAAACAGAT CTCGCCCACC AAGGAGGCTC AATAGAAGGC 4500 + AACCGAGGGA TCTCATTACC CGATCTCCTT TGACAAGGGT CCGCAGAAGC TGACGCTTAT 4560 + CTTAAATCCT ATTTGTTATA TGTGATTGTT ATGTAATTGT AGTTAAATTA CTGTAAATTT 4620 + GAAAAAGCTA ACTATAGTTA GCCGGCGAGC CCAAATGGGC TGAATTAATA GATAAGAAGG 4680 + ACACAAAGGG GCTTCAAGAC TTCCCCGTAT GCCTTAATAA ATAAATTAAA TAAAAAAAAA 4740 +// diff -r 000000000000 -r 3c8c9911cf2a test-data/transposon_sequence_set_v9.5.fa --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/transposon_sequence_set_v9.5.fa Sun Nov 13 00:23:23 2022 +0000 @@ -0,0 +1,4206 @@ +>DME9736 +GTGACATATCCATAAGTCCCTAAGACTTAAGCATATGCCTACATACTAATACACTTACAA +CACATACACCCCAATACAACATACACTACTCCGGATGTACCCAACAGATACCAGATAAGA +ATAAGATTGTTATATGATCCTCGAGAATGGAAAAAACCCCAATTCTAGATAAGTCACCCA +CTGGTAGACTAAACATCCGTCCCCTAATTTAAACAATTCCTTGCTTAAGCCTCACCCCAT +CGTCACATTCCCACGTTCAAAGCTCGGAGCCGCAATCCCGAAAAACAAAAGTATCGATTT +CAATAAACAAATTATAAGAATCTAAGAGCACTTGTATCCAAGAGCAAATGCACTTGAATC +CAAGAGAAACGCAAAGCTTTTTCTCTTTACGATCAGAATCCTAAAGTCTAAAGTCCATAT +TAGAAAAGCTCGATACCGAGGCTTGAACGTCAACCAAATCAGAATAATTATCAGAGTTCA +GTTTGAGACCTAATTGTAAAAGGTTCGGTGTTCTTCTCAAATAAAAAGATTGTAATCATT +TAGTGAAATAAAAATTATATTTTTTTCACTTATAAATATTGCAAGTATTTAATTGGCGCA +GTCGGTTAGGATCCAATAAAATAAAAGAGTCCTTTTAGTACGGTACTGATCAACTGAAGG +ATATGCTATACGACTAGCTATCCAAGATCAGCGAATTAAAATAGTGATTCAAAAATATTT +TTTAATCCGCAAAAGAATCTACGTGAAAGTAGTATTCAAAATAAAATCCCGTGCGGTCGG +AAACAAAAATTAATTTAAATTTTTTAATTCCGAAACTTAAAACCAAGTTTAAAGAAAACT +TAAAATCAAGAAAACTTAAAACCAAGTTTAAAGAAAACTTAAAATCAAGAAAACTTAAAA +CCAAGTTTAAAGAAAACTTAAAATCAAGAAAACTTAAAACCAAGTTTAAAGAAAACTCAA +AATCAAGAAAACTTAAAGCCAAAATAAGCTAGAAAACTAAAAGACATCATGGCAGTCCCA +CAACTCTCAGAAACACACCTAAACCAACTGCTAAACCAAATCAAAGAATTAAACTACTAC +GATGGCGCACCTGGCAAATTATCTGGATTCGTCAACCAAGTGGAACAACTGCTCAGTTTA +TACCCAACACAGGAAGCAAGACAGGCACACGTCATATATGGAGCAGTGAAGCGGTTATTA +GTGGATTCAGCCTTAGAAGTCGTAACCCAGGAAAGAGCTAACACATGGCTGGACATGAAG +AAAGCACTGGCAATGGCATTCAAAGACCATAGACCTTATGTAACTCTCATCAGACAATTA +GAAGACATATCATACCCAGGAAGTATCTGTAAGTTTATAGAAAAATTAGAAACACAATAC +TGGATTATGTTCGATAAGTTAGAATTAGAAAGTGACCATGTTGATAAATCGAATTATACC +GAAATGTTAAACAAAACTGTTAAATCAGTAATAGATCGAAAACTGCCGGATAGAATTTAT +ATGTCTTTGGCACGTAAAGATATTGATACAATTTATAAATTAAAACAAGCATCAATGGAA +TTAGGCCTTTATGATGCTATTCCAGAAAATCACCGTTCTAATAGAACAGAAATGAATAAA +CGTAGGAACAGGGGAAACTATAATCAAAATAATAATCAAAAATATTACAATAATAGAAAT +CACAACTACAGTAATTATTATCCTAGCATGAATCAGAATCATAATACACAACCACCTCAG +AATCCGACTCAACCTATGACAAATCAAAACCAATATTCACCGCGTTTCATACCGAATAAT +CAAAGAGGGAATTATTATGCATTTAGACGAGACTTAACACAAGCTCAGCAGAACAACCCA +CTTAATAACACCCTTAACTTCCAACCTTCGACATCGAATAATATTAACAGACAAGGGCCA +GTAAAAAGACAACGCGAGAGTCAGAGTGACCAAAGCAGGATGGATGTAAATTTTCATCAA +GCTGCCTCGGACACTCAAATGATAGAGAAGGACATACAAGTCCCTATGTAAAAATAATTC +ATCATAATAAAAATTATAAGGGAATGATCGATACAGGATCATCAATTAACATCATAAGAG +AAAATTTTGAGAACTTAGAAGAAAAGGAAGAAAACCTAATAGTATACACTATTAAAGGAC +CAATAACACTAAAGAGAAGTATAATAATAAAACCTACTTCAGTATGTCCGTCTGCTCAAA +AATTCTACATTCACAAATTTTCTGATAACTATGATTTCTTGTTAGGTCGAAAGTATTTAG +AAGATACAAAAGCTAAAATAGATTATGCTAACGAAACAGTAACACTAGGCTCAAAAGTAT +TTAAGTTTCTCTATGAAGAAAAGAAGGGCGAGACCGCATCCAAATGCCTTGACCCACAAG +AAAAGAATGATTCCGCTCTAGTGGACAGAACCAAACCAAAAATGCAAAAGGTTAAGACCG +CACCTAAGTGCCTTAAACCAAAGCATCAACAGCAGAAGAAAGAGACCGCATTACCCAAAT +GCCTCATTTCAAATGTTGTTAAAGACACAGTGGACAATGATGTAACACATCTCGATCCCA +TGTCCGTTGACAACGATATAGTCAACTTCGCGATTAACAATGAGTTACGCGAATGTAACG +AGTATAGACTCGAACACTTAAATGCAGAGGAAGTTGAATGTTTAAAGAAGTTCCTATACG +AATATAGAGACATTCAGTACAAAGAGGGCGAAAATTTGACCTTCACCAGTACTATTAAAC +ATGTCATCCAGACTCAACACGAAGACCCAGTATACCGTAAACCCTACAAGTACCCTCAAA +GCGTTGACCAAGAAGTTAACAAACAAATTAAAGAAATGATAGAACAAGGGATTGTTCGCA +AATCGAAGTCCCCTTATTGTTCTCCTATTTGGGTGGTCCCCAAGAAGGCAGACGCCTCTG +GGAAACAAAAATTCAGGTTGGTAGTCGATTACAGGAACCTAAATGAGATAACTGTTAACG +ACAAATTTCCCATTCCCCGAATGGATGAGATATTGGACAAACTAGGTAGATGCCAATACT +TTACCACTATAGATCTAGCCAAGGGTTTTCACCAAATCCAAATGGATGAAAATTCTATTG +CAAAAACAGCTTTTTCAACTAAGCATGGGCATTATGAATATACTCGTATGCCCTTTGGTT +TAAAAAACGCTCCAGCTACTTTTCAGAGATGCATGAATAATCTTCTGGAAGATTTAATCT +ACAAAGACTGTTTAGTCTATTTAGACGATATTATTGTTTATTCCACTCCATTGGAAGAAC +ACATTTTATCCCTAAAGAAAGTCTTTGAAAAACTGAGAGACGCTAATTTAAAGTTGCAAC +TAGATAAATGTGAATTCATGAAGAAAGAAACTGAATTCCTAGGACACATCGTCACAACAA +ATGGCATCAAACCAAATCCAAATAAAACTAAAGCAATTACAAATTTTCCATTACCCAAGA +CACCTAAGCAAATAAAATCATTTTTGGGATTATGTGGATTCTATCGCAAGTTTATTCCTA +ACTTTGCCAAAATAGTTAAACCCATGACCCTCAAATTAAAGAAAGGTGCTATAATAGACA +CCAAATGTAAAGAATACATCGAATCATTTGAAAAATTAAAAGTTTTGATAACTTCAGACC +CGATATTAATCTATCCTGATTTTTCAAAACCTTTTTCTTTGACAACTGATGCTAGCAACG +TAGCTATTGGTGCAGTGTTATCACAAAATCACAAGCCAGTTTGTTATGCCAGTAGAACGC +TAAACGAACATGAAATCAACTATGCTACGATTGAAAAAGAATTGTTAGCTATAGTTTGGG +CTACAAAATATTTCAGGTCATACTTATTCGGCAGACCATTTGAAGTATTAAGTGATCACA +AGCCACTGGTATGGCTCAACAACATTAAAGAACCAAACATGAAATTGCAAAGATGGAAAA +TAAAACTTAATGAATTCGATTATAAAATCAAATATCTTCCAGGCAAAGAAAACCATGTCG +CGGATGCTCTTTCCCGCACGAAAATAGAAGTTATGGTTGGCGAGGTCGCAAATAGCGCAG +ACGCAACTATACACAGTGCCATTGAAGATAATCTAAATTACATACCCATAACAGAAAGAC +CAATAAATTACTTCTCTAGACAAATAGAGATAGAAAAAGGCGATAACGATACAACAAGTG +TACAACATTTGTTTCAAAAATTAAAGATTAAGATAGTCTATAAAGAAATGACACCTGAAC +TCGCCAAAAACCTCATTAAGGAATATGTGTGCACCAAAAAGAGTGCAATTTATTTCCCTA +ATGACGAAGATTTTCTGATCTTCCAGAGAGCGTTTACCGAAATTATAAGCCCTAACAATT +TCACAAAACTCTTGAGATGTACCACAAAGTTAATTGATATACTAACGTATGCAGAATTCA +AAGATTTAATCTTAAAGAAACATAAGGAACTTTTACATCCGGGTATAGAAAAAACAATCA +ATTTATTTAAAGAAGAATATTACTATCCTGATAGTCAAAAGCTTATTCAAACCATTATCA +ATGAATGTCAAATTTGTTATCTAGCAAAAACGGAACATCAAACACAAATGACATATGAGA +CTACACCAGAAATATTTAACACAAGAGAAAAATACATGATAGATTTTTATCTCACAGGAA +ACCAGATCTTCTTATCTTGCATTGATATCTATTCGAAATTTGCATCACTAGTTGAATTAA +AAAGTAGAGATTGGCTAGAAGCAAAAAGAGCCATTACTAAAATATTCAATGACATGGGAA +AACCGCAAGAAATTAAAGCAGACAAAGACTCAGCTTTTATGTGTTTAGCCTTACAAAATT +GGTTAAGATCTGAAGGTGTACAAATTTCTATAAGCACTAGCAAAAATGGTATATCTGATA +TAGAAAGATTCCACAAGACCGTAAACGAAAAGCTAAGAATCATTGGTAGCCAACAAAATG +TTGAAGATAGGTGCACAAAATTCGAAAGAATTCTATACATATACAATCACAAAACTAAAC +ATAATAGTACTAAAAGATTTCCAGCAGACATTTTCCTATATGCAGGCAGTCCAGATTTTA +ATGTACAACAAAACAAAATCGATAGGATAGAATACCTCAATAAGAATAGACACGATTTTG +AAGTTGATATAAAATATAGACAAGCCCCACTTGTAAAAAGTAAAATAACCAATCCATTTA +AAAAGACAGGAAGAATTGGACAAGTAGATGATAAACATTTCGAAGAACAAAATCGTGGCA +GGAAGATCGTTCACTATAAGTCAAAATTTAAGAAACAGAAAAAGTTTAATAAGAGCAAAT +ATGATAATTCCAGACCAACCAAAGAAGCACAAAGTACACAACATACTTCTAATAATGCTT +AGTTGCATACTATCACTTATCATCACGGTCAAGTGCAACAATATAGAAGTAAATCCAGTA +AACGCGAAAAATGGATACCTTATATTCCAAACAGGAACAATGGAAATTCCAACCAGCTAT +GAATACCATTATTTAAGCATAAACATAACAAAGACAATGCTCATGTTCGAAGATATAGTA +AGTGAAGCAAACAACTATCCTAATGTACCACAAATACAATATTTAGTCGACAAATTAAAA +CGAGAAATAAATGGGTTAAGAATTATTAGTCGAAGTAAAAGAGGTCTTTTAAACGTAGTA +GGAAAAGCATACAAATACTTATTCGGCACATTAGATGAGGATGACAGAGAAGAGTTAGAA +GAAAAAATAAACAACATGTCAGAAGACTCTGTAAAAACCCATGACCTAAACACGATTCTA +GATGTAATCAATAGTGGTATAGATATAATTAATAAGCTCAAAGTAGATAAAGAACAACAC +CAACAAATTGCGGTACTAATATTTAACCTAGAGCAATTTACAGAATATATAGAAGACATA +GAATTGGGTCTGCAATTAACCAGACTAGGAATTTTCAATCCAAGATTACTAAAGCATGAC +TATTTAAAACATGTAAATTCAGAAAAAATGCTAAAGATAAAAACGTCAACCTGGCTTAAA +ACAGACACGAACGAAATTTTGATTATTTCCCATATTCCTAGCGAAGTTACTAAAGTTCCA +ATATTCCAAATTGTTCCGTACCCAGATGAACATAATTATATTCTAACCGAGCAAATATTC +GATAAATTCTACATATTTGATAACCAAGTATTCCATAAAGATACCAATAGGGATATATTC +GACAAATGTATTATTGGAATCATCAAACAAGAGCAAACTCAATGCAAATATATTAAAACA +CATAAAAATTACCAAATAAATTATATAGAACCAAATATACTATTAACATGGAATATTCCT +GAAACAGCTGTTAACCAAGACTGTACACACAATAAAATATTAATTTCAGGAAACAACATC +ATTAAAATTAAAAATTGTACCATACAAATAGATGAATTCTTAATCTCTAATAATCTAGCA +GACTTTACACAAACAATTTATATCACCAACAATGTAACACGTCTAGAACCAATAAATCAC +TTACAAACGAGAGAAATGATAGAAACCCATGTAAAACACTATAACTTTTTTCAAATTATA +TGCATTACAACGTTCGTCATAATGATAATTAGTTTGACTCTGTATGTAGCATATAAGTTT +AAAAATATACCTAAGAAAATTATTGTCAATATCGTAAGCAAAAAGAACACACGCACCTTG +AAAATAATGTCAATGAAAATATTCAACAAGGAAATAATATTACCTTATACCCAAATTTAA +CGACCTGAGGACAGGCCAAATTCAAAGGTTGGGGGAGTGACATATCCATAAGTCCCTAAG +ACTTAAGCATATGCCTACATACTAATACACTTACAACACATACACCCCAATACAACATAC +ACTACTCCGGATGTACCCAACAGATACCAGATAAGAATAAGATTGTTATATGATCCTCGA +GAATGGAAAAAACCCCAATTCTAGATAAGTCACCCACTGGTAGACTAAACATCCGTTCCC +CTAATTTAAACAATTCCTTGCTTAAGCCTCACCCCATCGTCACATTCCCACGTTCAAAGC +TCGGAGCCGCAATCCCGAAAAACAAAAGTATCGATTTCAATAAACAAATTATAAGAATCT +AAGAGCACTTGTATCCAAGAGCAAATGCACTTGAATCCAAGAGAAACGCAAAGCTTTTTC +TCTTTACGATCAGAATCCTAAAGTCTAAAGTCCATATTAGAAAAGCTCGATACCGAGGCT +TGAACGTCAACCAAATCAGAATAATTATCAGAGTTCAGTTTGAGACCTAATTGTAAAAGG +TTCGGTGTTCTTCTCAAATAAAAAGATTGTAATCATTTAGTGAAATAAAAATTATATTTT +TTTCACTTATAAATATTGCAAGTATTTAATT +>DMIS176 +AGTGACATATTCACATACAAAACCACATAACATAGAGTAAACATATTGAAAAGCCGCATA +CGTAAACAATAAGTGACCACCATGCTAATGTGGATCAAATAACAAAAATATCCACTCTGC +ATTTTGACACCCCCATACTGTATGCCATCTGCGCAGTATGCATTCTAATAAACAAATTCT +TTGACAGCGGCACTTAGCCATTCTTGTAAACAAATCTTAAAGTCTGCCTGCTCTCTCTGA +GGCTTCTCCTCCACTTAAGAATCCAAGAGCAATGCTCTCCCAAAAACACTAACATATTCT +TTAAGCAAGCACAGAGGCTTCTCCTCATTTTCACTTTCATTTGATTTTCAGTCTTAAGCT +GAACGTTAATCAATAAACAACACAATCGATACCGAAATTTTGATTCGTTTTATTTTGGCA +AAACTCAATTTTCAGCGTTGGTCTTAGTTCATATTCGGAACGGTCCATTTAATAGACTCA +AAACTATTTATTGCAACCATTTATTTGCAATTGGCGCAGTCGATGTGATCAGTGTTAAAG +TTCCTTGATGCGGTAACCAGATTTGCCAATTCCTGTGTTCTTTTTGTTCTCTGACAAAAG +TACCACGATAACGGGCACCCACGTGACGGTTAATATCGCTTTAAGTTTTTAATTAAACCT +CGACAATAAAGTGAAACCGAAAAATCACAATTTGCCTAAACAAACCTGAATTTATTATCA +GGAAGACGCTATTGAATTTGTGAGAGGCTGTAAATCCAATTGGTTACCTCAAAGACCCAC +GAAAAAGCTATAGTGCAACCCTTGCGAAAATCAAAACCTATCTTAAAAAAAAAAAAAAAA +TATAAATAATAAATTAATAAGCGAAAATTAAAACGTATTAAAAGTAAGAATAATAAATAA +ATAAGTGAAAATTCTATATGATAAAAATTAAAAATAAGAATAATAAATAAAAAGACAACA +TTTTAAATTAAACAATATTAAAAAAATATAAAAATATTAAAAACTATATTAAAAAAAAAA +AAAAAACAAAAAAACAAAAAAAAAAAAATAAATAAATAATCCAAAAATCAAAAATGGCTC +AAGAACCAGCAATTGTGCCACCACTATCAGACAGCAACATGACCCAGGTTGCCTACCAGA +TTGGCAATGTGGAGAAATTCAACGGTGATCCAGGCTCACTATACACCTTTGTGAGTCGAA +TTGATTACATACTGGCTCTTTATGCTACCGGAGATGAACGCCAACAGCAGATCATATTTG +GGCATATTGAACGCAGCATCAGCGGAGAAGTTATGCGCTGCATTGGAGCCTATGACATGT +ACACCTGGCAGCAGCTTAGAAGACAATTGGTACTCAACTATAAACCCCAGACCCCTAACC +ACGTTCTTTTAGAAGAGTTTCGAAAGACCCCATTTCGAGGCAATGTACGAGCATTCCTGG +AAGAAGCAGAAAGCCGCAGACAAACACTTACTAGTAAGCTTGAATTAGAGCAAGATCTTG +AAGAAAAGACTTTTTATTTGAAATTAATAAAATCCAGTATAGAATCACTAATTGAAAAAT +TACCTACACACATTTATTTAAGAATAAATAACCACAACATACCAGATTTGCGATCACTTA +TAAACCTTTTACAAGAGAAGGGCATGTACGAACAAATAAATCATACAAGTACACATGTCC +AAAAACAAAATTTCTCTGATAAGCCACAAAAGTCCTTTAATCAAAATACTAATCAGTCTA +ACAATATCAGAAAATATCCAACACCTTTCCTACATTATAATTCACCAATACCATATCAAG +CTCCACAAATTTATCAAACACCACCAACTAATAACCCACTTTATCGTCATCCAATACCCT +ACCACCCTAATCCAAACAATGTTTTTCAACCAAGCCAACAAAACAATGTTTTCCAACCAA +GCCAACAAAACAATGCTTTTCAACCAAATCAACGAACAAACTTTACATCTCGACCAATTT +TTAACACCAATCGAAACAATGCATTCGATCAGAATAGGTTCGGACAACAACCCCAATATC +AAAATCAACAATCAACACAAAATTCAAGTTCCTATGTACCCAATCGACCAATAAAACGAT +TAAGACCAGCTAATAGTGGACAGACTGGGATGAGTGTTGACGAAACATTATATCAAGAGG +ACGCTTTTTATCAGCAGTGTGTTCCATATGACTATTTTTATTATCCAACTTACGACCATT +CAGACTATTATCCAGAAAATCAATATCAAATTGACGAAAACAACCAAAATTTACAAAGAA +CACAACAGTTACAGCAGATTAATACAGACGAGACAAACAATGACAACCAAGAACCCAATG +TTGAACAGGCCGAAAATTTTCAGCCACAAGCCTTGGAAAACCCCAATATATAACAATTAA +ATACAAAGAAAATAATTTGAAATGCCTTATTGATACCGGATCAACAGTTAACATGACATC +TAAAAATATATTTGATTTACCAATCCAGAATACTAGTACTTTTATTCATACCAGCAATGG +ACCGCTCATTGTCAACAAAAGTATAATCATACCTTCAAAGATTTTGTTCCCAACAACAAA +TGAATTTTTATTGCACCCTTTCTCTGAGAATTACGATCTTTTATTAGGAAGAAAACTTTT +AGCAGAAGCAAAAGCAACAATAAGTTACCGCGATCAAGAGGTAACTCTTTACAACAACAA +ATACAAATTAATAGAAGGAATAGCAACACATGAACAGAGTCATTTTCAAAATGTAAATAT +GATACCTGACACCATGCTCAGACAGCCAAATAAAATTTCACCCATTTTAGAATCAGACCT +ATACAGATTGGAACATTTAAATAACGAAGAAAAACAAAGATTGTGCGCACTCCTGCAGAA +ATACCATGACATACAGTACCATGAAGGTGATAAGTTGACATTTACTAATCAAACCAAACA +TACTATCAATACAAAGCACAATCTACCACTTTACTCTAAATACAGTTACCCACAGGCTTA +TGAACAGGAGGTCGAAAGCCAAATACAAGATATGCTAAATCAAGGTATTATACGTACCAG +TAATTCACCTTACAATAGCCCCATCTGGGTGGTTCCAAAGAAACAAGATGCATCAGGCAA +ACAGAAATTTAGAATTGTAATAGACTACCGAAAATTAAATGAAATAACAGTAGGAGACAG +ACACCCAATCCCAAACATGGACGAAATCTTGGGAAAATTGGGCAGATGTAATTACTTCAC +AACTATAGACTTGGCAAAGGGTTTCCACCAGATCGAAATGGATCCAGAATCAGTTTCAAA +GACAGCCTTTTCTACCAAGCACGGTCATTATGAATATTTGCGCATGCCATTCGGATTAAA +AAACGCGCCAGCCACCTTTCAACGGTGCATGAATGATATTTTAAGACCACTCTTAAACAA +ACACTGTCTTGTGTATTTGGACGACATAATTGTATTCTCGACATCCCTTGATGAACACCT +GCAATCGCTCGGACTAGTTTTCGAAAAATTAGCAAAAGCCAACCTTAAATTACAACTTGA +CAAATGTGAGTTTCTCAAGCAAGAAACCACATTTTTAGGACATGTTCTAACACCAGATGG +AATAAAACCAAACCCTGAAAAAATTGAAGCCATTCAAAAATATCCAATTCCCACTAAACC +AAAAGAAATAAAAGCTTTTCTTGGACTGACAGGATATTATCGTAAATTTATTCCAAACTT +TGCAGACATAGCCAAACCCATGACTAAGTGTTTAAAAAAGAACATGAAAATTGACACTAC +CAACCCAGAATATGACTCTGCATTTAAAAAATTAAAATATCTAATATCAGAAGACCCAAT +TCTTAAAGTACCCGACTTTACAAAGAAATTCACTTTAACCACAGACGCAAGTGATGTCGC +TTTGGGGGCAGTACTGTCACAAGATGGACACCCACTTAGCTACATTAGCCGAACACTTAA +TGAACACGAAATAAATTACAGCACAATTGAAAAAGAACTCTTAGCAATTGTATGGGCGAC +AAAGACTTTTCGACACTACCTACTTGGAAGACACTTTGAAATATCCAGTGACCATCAACC +ATTGAGCTGGTTGTACCGTATGAAAGACCCAAATTCAAAACTGACCCGATGGAGAGTAAA +ATTATCCGAATTCGATTTTGATATAAAATATATAAAAGGAAAAGAAAATTGCGTGGCGGA +TGCTCTGTCCAGAATAAAACTTGAGGAGACATATTTGAGCGAACAAACCCAACATAGTGC +AGAAGAGGACAATAGTGATTTAATTTTTATTACAGAAAGACCTCTAAATACATTTAACAG +ACAAGTTATATTTTCAAAAGGACCACCAGACATTAAAGTTACGAAATATTTCAAAAAACA +CATCACCCAAATATTTTACGACATTATGACCAGGGAAAAAGCCGAACAATATTTGATAGA +CCATTTTTGTGGTAAGAAAAGTGCGTTGTATATTGAGAGTGACGCTGATTTCGAAGTCAT +TCAAGCCGCACATAAATTAGCCATAAACACCAAATATACAAAAATCCTGCGTAGCACGAT +TTTGTTAAAAAACATAACCACTTATGCGGAATTTAAGGAATTGATCTTGACTGCTCATGA +AAAACTTCTACACCCAGGCATACAGAAAACTACTAAACTTTTCGGAGAAACTTACTATTT +CCCTAATAGCCAGCTACTTATTCAGAATATAATAAATGAGTGCAGTATTTGCAATCTGGC +AAAAACAGAGCACCGAAATACAGACATGCCAACGAAAACCACACCCAAACCAGAACATTG +CCGCGAAAAATTCATGATAGACATTTACTCATCCGAAGGCAAACATTACGTTAGTTGCAT +AGACATTTATTCGAAATTTGCCACATTAGAAGAAATAAAAACAAAAGACTGGATAGAATG +CAAAAACGCGCTTATGCGCATATTCAACCAGCTTGGCAAGCCAAAGTTACTAAAGGCGGA +CAGAGACGGCGCATTTTCCAGTTTAGCCCTCAAGAGATGGCTGGAGAGTGAGGAAGTCGA +ATTGCAGCTTAACACAACAAAAACTGGTGTGGCGGACATAGAAAGACTACATAAAACAAT +TAATGAAAAGATTCGCATAATCAAAACATCCGATGACGAAGAAACCAAATTGAGCAAAAT +GGAAACAGTACTTAACATATACAATCATAAAACCAAACACGACACCACTGGACAGACCCC +TGCACACATATTTCTCTACGCTGGACAACCAATATTAGATACCCAACAAAACAAAGAAAA +CAAAATAAACAAAATAAATAATGACAGAGTGGAGTACGAAGTCGACACAAGATACAGAAA +AGGTCCACTACAGAAAGGCAAATTAGAAAATCCTTTTAAGCCAACAAAAAATGTGGAGCA +GACTGACTCTGATCATTATAAAATTACTAATAGAAATAGAATTACTCACTACTACAAAAC +ACAATTCAAAAAACGAAAGAAAAATAATCAGCTCTCAATTTCACAGGCACCTGGCACTTG +ATAACATTGCTGCTGATGCTGATCACAACAGTTCATGGACAACAAATTGAAATTAATAAT +ATTGACACAAACCACGGATATCTCCTTTTTTCTGATAAACCAGTCCAGATACCATCATCC +TTTGAACATCATTGCTTGAGAATCAATTTAACTGAAATAGACACCATAGCTGATTATTTT +GAGCAAAGACTACGTACCGACTACCATGCACCCCAGGTCAAATTTTTATACAACAAAATG +AGAAGAGAACTAGCTGGAATAGCCTTGCGACATAGAAATAAACGGGGACTTATTAACATT +GTAGGTTCAGTTTTTAAATACCTATTTGGCACACTTGACGAAAATGATCGAGTGGATATA +CAGAGGAAACTTGAAACAAACGCCCATAACTCGGTAAATTTACATGAACTCAATGACGCT +ATTCAATTAATAAATGACGGAATGCAAAAGATACAGAATTATGAAAACAACAGCAACATC +ATTAACAGTCTTTTATATGAACTCATGCAGTTTACAGAATACATAGAAGATGTGGAAATG +GGAATGCAGCTTTCCAGACTCGGTCTATTTAATCCCAAACTACTAAACTACGATAAACTT +GAGAATGTAAACAGCCAAAATATTTTAAACATTAAAACATCCACTTGGATTAATTACAAT +GATAACCAATTATTAATCATATCTCACATACCTATTAACTTTTCATTAATAAATACAGTA +AAAATAATCCCTTACCCAGACTCGAACGGCTATCAGCTAGAATACACAGACACACAATCA +TATTTTGAAAGAGAAAATAAAGTTTACAATAACGAAAATAAAGAAATAAACAATGAGTGT +GTCACCAACATTATTAAACATTTAAAACCAATTTGTAATTTTGAGTCAATCCACACAGAT +GAAATAATAAAATACATAGAACCAAACACAATTGTAACCTGGAATTTAACCCAAACAAGT +CTCAAACAAAATTGTCAAAATTCATTTAATAATATAAAAATAAAAGGAAACAAAATGATA +AAAGTAACCCAATGTAAAATAGAAATCAATAGCATAATTCTAAGTGAAAATCTCTTTAAA +CCAGAAATAGATTTGACACCATTATACACACCACTTAACATAACAAAAATAAAAACTGTT +AAACACAACGACATTAATGAAATGATTTCACAAAACAATATTACACTTTACATATTTATG +ACTACTGTCATCATTATACTTATTTTATTGTACTTATATTTAAGATACGTATCATTTAAC +CCATTCATGATGCTGTATGCAAAACTAAAATTAAGAAAAAATCAAAATCAAAACACAGCA +CAACAAATAGAAATGGAAGACGTTCCATTACCCCTACTATATCCATCAATCCCAGCCCAA +GTATAGGCTTCTCTTTAAGGGAAGGGAAGTGACATATTCACATACAAAACCACATAACGT +AGAGTAAACATATTGAAAAGCCGCATACGTCAACAATAAGTGACCACCATGCTAATGTGG +ATCAAATAACAAAAATATCCACTCTGCATTTTGACACCCCCATACTGTATGCCATCTGCG +CAGTATGCATTCTAATAAACAAATTCTTTGACAGCGGCACTTAGCCATTCTTGTAAACAA +ATCTTAAAGTCTGCCTGCTCTCTCTGAGGCTTCTCCTCCACTTAAGAATCCAAGAGCAAT +GCTCTCCCAAAAACACTAACATATTCTTTAAGCAAGCACAGAGGCTTCTCCTCATTTTCA +CTTTCATTTGATTTTCAGTCTTAAGCTGAACGTTAATCAATAAACAACACAATCGATACC +GAAATTTTGATTCGTTTTATTTTGGCAAAACTCAATTTTCAGCGTTGGTCTTAGTTCATA +TTCGGAACGGTCCATTTAATAGACTCAAAACTATTTATTGCAACCATTTATTTGCAATT +>DMTN1731 +TGTTGAATATAGGCAATGCCCACATGTGTGTTGAATATAGGCAATTTCCACATGTGCATA +TGTAATTTTGTATGAGAACATACATACATACACATGAACTGTATGTATGTATATATATTA +GCAAATAAGCAGCCGCATGAAGGTGGCATTTTTATGTGTATCAGTTTCAGTTTCAAATAA +AACTTCTTCGTGTTCGGACACGCGGCTCAAGACTTTTTATTTCGCGTTTACTCTTTCAGC +CTTTGCTCTCAATTCGCTGAGTTTGGGTGAAGATTAGGATCTTCCCATTATGATTGTCAG +TGTTCCACACTTGGAGCACCTTTTCAATAAACAACAGGTTAATGGGCCCAGCGCCCTAGG +AGCTGCCTAAAGGAGAAACGTGTAGTGAAACTCAGGAGTTAGATTTTGGAGTCTACTCAA +GATTGCCGGAATGAGTAACCTGTATCAGATCGATAAGCTGGAGGATGGATCCTATGAAAC +GTGGAGCATCCAGATGCGTTCAGTGTTGGTGCACGCATGTTTGTGGAAGGTGGTTTCAGG +AGAGTCCGTGAAACCTGAGGTTGATACTGGAGGTGCTTGGCAATCCCAAGATGAAAAAGC +ATTGGCCACGATCATCTTGAGTGTGAAGTCTTCGCAACTTGGTTATGTAAAAGGGTGTCT +CACTGCGGCTGAGGCATGGAAAGTTTTACAGGATGTCCACCAGCCGAAAGGGCCGTTACG +AACGGTCATGCTGTATAAGAAGTTGCTGAGCAAACGTCTGTTGGAAGGGCAGAGTATATC +GTCACATATTAAAGAATTTAAGGAAATCTTTGATGCCCTTGATGCGGTGGAAATTGGTAT +CACCGAGAAATTGCGCAGTGTTGTTTTGCTGTCGAGCCTTCCAGAGAGTTTCGAGAATTT +CGTTGTCGCCATTGAGACGCGCGACGACGTGCCGCTTTTCGATGCTCTATGTATAAAGCT +GATCGAGGAAGACACGAGAAGGGGAGGAGCGGAGCAGCAGAGAGAAAAACAAACGGAGAG +CGCAAAGGCATTTACTGCAGTACATAAGCCACAGGCGCCGGCGAGAGAAGCTCGGCCGAG +CGCAAAGAAGAGGAAAGACGTAGTTTGTTATAACTGTGGAGAGCGTAGGCATTTTAAAGC +GAACTGTCGTCGCGAGAAAGTAAACAAAGAGAGCGCGACACAAGAACAATGCAGTTTGTT +AAATGCGCTGGATAGTGGTGGTTTTTGGCAAAACACAGTGGTGTCTCGATAGCGGGGCTA +CCAGTCACATGTGCTGTGACAGAAGTGTTTTTACTGAGTTTGAAGAGCACACTGAAAAAA +TTAGTCTTGCTGGAAATGGATTCCTACTAGCAAAGGGCATAGGAACAGTGAAGCTGAAGA +CTGATTTATGTACTCTGGTATTGAATAACGTACTCTTCGTCCCAGATTTGAACGGCAACT +TTATGTCAGTCAGCCGTGCAGCTCAGTATAAATGTTTTGTCAATTTTGGACCACATTACG +CTGACGTCATTCAGGAAGGCGAGCGAATACTGCGTGTAATGAGAGCTGGTAATTTATATA +TGTTTCAAGGGAAACATAACAGTTGTTTTGCGGCCGTTGATGCTGATGGTTCACTATGGC +ATAAAAGGAATGGCCATTTGAATACAAGCAGCCTACAGGAGATGGTGAGGAAGAAGATGG +TGTACGGTGTTGAAAAGGTCGTTTTCAAACCAGACGCAGTATGCAAGACGTGCATGCTGG +CAAAAATCCATGTGCAACCATTTCCGAAGACAACGAGGAGCAGAGCTGAGGAGCTGTTGG +ATATGATCCATTCAGACCTGTGCGGGCCATTTAGCACACCGTCACTTGCTGGATCAAAGT +ACTTTCTCACTTTCATAGACGACAAGTCCAGGCGGATTTTTGTATATTTCTTGCGGAAGA +AGGACGAAGTCTTCACTAAGTTTGTCGAGTTTAAGAAACTGGTCGAGCGACAAACAGGTA +GAAAGATAAAATGTATCCGGAGCGATAATGGTGGTGAGTTCGTCAATAATGTTTTTGATG +ACTATTTAAAGGCACATGGGATCGCTAGACAGCTGACTATTCCACACACTCCCCAACAAA +ATGGAGTTGCAGAACGAGCCAACCGCACGCTAGTAGAAATGGCTAGGTGCATGTTGCTGC +AATCGGAGTTGGGTGAGGCTCTATGGGCTGAGGCGATAAACACTGCGGTGTATCTGAGGA +ACCGATCAACGAGCAGAGCATTACAAAGCAAAACCCCTATGGAAGAGTGGACCGGAAAAA +TACCAGCAGTGAGCCACTTGAGGGTTTTTGGTGCCATAGCAGTGGCATTGGACAAAGGAG +TCCATAAAGGCAAATTCGAATCCAAAGGAAAGGAATATCGTATGATTGGATATTCAATAG +CTGCTAAGGGGTACCGTCTGTTTGACAAAGAGAAGCGGTGTGTGATCGAGAAGCAAGATG +TCCTTTTTGATGAGTCTGGTAGTTTGGTAAATCATGGAAATACCATTGAGTTCCAGTTTC +CCGCAACTGATGACCCGGAGCCGCAGAGTGATTCGAATGCACGGGAAGGTGACGATACAG +AACCCGTGGGCAGCAGCGACGACTATGAGAGTGCAGCTGAGGCAGAAGAAGCTGAAGTAC +ATGTGGGGCCTGGACGGCCAAAGATTGTTCGGACGGGCAGACCAGGGCGCCCGAAGAAGC +AATACAATGTACTTGGCGTGTTGATGGCTAGCGACGTCGAAATTCCCAAGTCCTATGAGG +AGGCCATCAATTCGCAGTATTCTGCAAAGTGGGAAGAGGCAATGGGCCTGGAGTACAAGG +CGCTACTTGCAAATGAGACATGGAAGCTGGCTGACTTACCAAGAAATCGCCGGTGTGTGG +CTTGCAAGTGGGTGTATTCCCTGAAACGAGACGTCTCTGGTAGAATTGAGCGCTTCAAGG +CACGACTAGTAGCAAAGGGGTGTTCGCAGAAGTTCGGAGTGGACTACTTCGAGACTTTTT +CACCCGTGTGCAGGCTCGAGAGTGTGAGGCTCATTTTGGCATTGGCAGCAGAGATGCAAT +TGTACTTGCATCACATGGACGTATGCACGGCGTACTTAAATAGCGAGCTAAAGGATACTG +TGTACATGAAGCAGCCCCAAGGGTTCACAGATGCTGCTAATCCCGACCAGGTGTTATTGC +TGAGGAAGGCAATATACGGCTTGAAGCAGTCAGGCAGAGAGTGGAACTCCAAGCTCGACG +GTGTTCTAAAAGACTTGGGATTTAAGGCCTGTAATCATGAACCATGTCTTTATCAGCAAA +GTGGTCAAGGTAATCTGATGCTCATCTTAGTATATGTTGATGATTTAATTCTAGCGTGCC +AGTCAAGAGAAGATATGGAGGATCTGAAAGCCAAGATTTCAGAGTCTTTCGAGTGCACGG +ACAAGGGTCCACTGCATTTGTTCTTAGGCATGGAGGTGCAACGAGATGGCGACCTTGGAG +AAATCACTTTGGGCCATTCGCAATATATCAAGGAACTATTGCGGGATTATGGCAGCGAGA +ACTGTAGACCAGCGACGACACCTTTGGATGCAGGGCATCAAGTTTTGTGCGCGGGTGAGC +AGTGCCAGAAGGTCGACGCAGGGCAGTATCAGTCTACAATTGGTGAGCTAATGTGGCTTG +GGCTTACTACCAGACCAGACATGCTACATTCGGTGGCGAAGTTGGCTCAGAGGAATCAGG +ACCCGCATTCTGAGCACATGGTGGCTGTGAAGCACATCCTCCGGTACTTGGCGTCAACTG +TGGACGTCAAGCTGCATTATCAAAAGTGCGGTCAGGCATTTACCGGCTTTGTGGATGCAG +ATTGGGGAGGCGACCGTTTGGACCGAAAGTCATACACAGGGTATGTGTTTTTCCTGTCTG +GCGGACCAGTATCATGGAGGTCCGAGAAGCAGCAGAGCGTGGCGTTGAGCAGTACTGAAG +CCGAGTATATGGCTCTGACCACGGCTTGCAAGGAAGCTATAGCTTTACGAAGGCTAATAG +TGGAGATCGTATGCGGTGATCTGAAGACCCCGACGGTTATGCATGGCGACAACCTGAAGT +GCGCAGCACAGTTAGCGAAGAACCCGGTTCATCACTCTAGGACGAAGCACATCGACATTC +GATATCATTAGAGAAGTCATGAAAGAGGGTCACGTTGTGTTAGAGTACACTTCTACGAAT +GAGATGATAGCAGACATTATGACAAAGAATCTTTCAAAGGGAAAGCATAATGGGTTTATG +AAAATGTTAAATTTGTTTTAATTTTTGTAAACATGTTGGCATTGAGGAAGGCTGTTGAAT +ATAGGCAATGCCCACATGTGTGTTGAATATAGGCAATTTCCACATGTGCATATGTAATTT +TGTATGAGAACATACATACATACACATGAACTATATGTATGTATATATATTAGTAAATAA +GCAGCCGCATGAAGCTGGCATTTTTATGTGTATCAGTTTCAGTTTCAAATAAAACTTCTT +CGTGTTCGGACGCTCGGCTCAAGACTTTTTATTTCGCGTTTACTCATTCGGCCTTTGCTC +TCAATGCGCTGAGTTTGGGTGAAGATTAGGATCTTCCCATTATGGTTGTCAGTGTTCCAC +ACTGGGAGCACCTTTTCAACAAACCACA +>DMIS297 +AGTGACGTATTTGGGTGGTCCAAACCAGCCACTTCCATTATTTCAAAGAAATCAGTAATG +CACTCTAGTAATTTTCCATAACTGTATCCCAGCTGCGCAGACTCGTTTATCTTTTGCAGC +GCAGCGTTCTTTGTAAACATCCTAAAGACCTGCCTAAGCAGATTTGACTGCCCTCTTTCA +ACGCTACCTAATCTTAAGAACCCAAGAGCGAGGCTCTCCCGAAATACAAATATTGTTCAA +ATACTGAGGCTTCTCCTCAATCCAATTTGCATTTGATTTTTAGTCTTAAGCTGAGATCCA +AAGAATAAAGTCGTGAAACTATTTCTCCTAAAAACTATTTTTTATTTCTTGGCGTTGTCC +TTAGTCAACTGACGGGACATTAGTTCGACTCATAAATAAAACAACAATTTTACTGGCGCA +GTCGGTAGGATACAAAAGTATCCGAAAAAAAAGAACCTTCGAATGGAAAATAAGTTAAAT +TTTATAGTCCTGTGCTCGAAACATCTCCCAAAATAAATTCGTGAAAACTCTTCAACTTCA +ATTATAATTCCAATTCGGTTATCCAATAATAAGTGGAAGTGAAATACGAAACAAAAATAT +TAAGTCCAAAGGCAACTAAGTTTTAAAACCAACATATAAAAATAAAAAATTAAAACAATA +TAGAATTTTAATAATACAACACAAAAATTTACAAAACAAAAAAACAAACAAGTGAAACTA +GAAAGCTTAAAAATAATAATAACATTGAATCCGAAACAAAACAAAAAAATAAAACACAAA +AGTTAAAAATTTTACAATAAAAATGTCACAACCAATTATTGCGCTGAGCGACATAAACCT +TGCCGAAGCCCGTCGGCAGCTTAAAGACATTATGCCATTCAAGGGTGATCCAGAAACCCT +TCACACCTTTATCAGCAGAGTGGATTACGTAATTTCGCTCTACCAAACAAATGATGTCCG +ACAACAGAGGATTCTACTGGGAGCCATCGAAAGGAACTTGGACGGACAAATTACACGATC +TTTGGGACTTCCGAACGTCGAAGATTGGCCTACCCTTAAAGCAAGACTCATCGCGGAATT +TAAAATTCAAACACCAAACTACAAACTTCTGGAGAACTTCAGGGAGACACCATACAGAGG +AAGCCTAAGAGCATTCTGCGAAGAAGCGGAGAGACGACGTCAATTACTAATTTCGAAACT +ACACCTGGAAGGTAACCAATCGGATTTTCTTATTTATATTCAGGGTATTAAAGAATCTAT +TAAGATACTGATAAGGAAACTACCAATACAATTATTCACTATTTTAGCCCATCACGATAT +TACAGACTTAAGATCCTTAATTACCATTGCACAAAATGAGGGAATTTATGAAGAACACAT +TAATTTTGAATTTTATGAAAAACCAGAATATCGTAATAAAAATTCAAATTCTAACCAGAA +TTCGAAAACACAAAAATTCAATACAAATGTTCAAACTCAAAATCGACCAAGTTACTCACA +ATATTCCCAACCCTTCCAACCTAATTTTAATCAATACATTCAACCATTTAGACCTAGCTA +TACACAGCAGATAACTAACAACCCACCCATGTGGCACGCACCTAATTATTTCAGACCCAA +CCAATACATAAACCCACAACCCATTATTCAAAAAAATCATTTCCAACAATATCCCAACAA +AGCCCAATTTCCCCAAACAACGCATTTTAGAGGAAATACATACCCTCGACTACAACAACC +CTCTACATATAAAAATACTAACTTCCCGATTACTAAACGACTAAGACCATCGGACAGTGA +ACAAACTAAAATGTCTATTGACGAAATTAGATTCCAAGACGCGCATGAATTCGAACAAGT +CCAACCTAATTATTACGAGCAACAGTATTTTAACCAAAATCAATACAATCCGTATCAAAA +TCATAGCTTCATTAATGAAGGGCAACAACAAGTTCAATTTGTACAAATTAATAACAAACA +AAACCAAAATAATTCTGAACTAAACGAAAATTTTCGGTTAACAGTTCCGGAAAATACGAA +TACATAAAAATAGTATACAAAGGGCGTTCATACAAATGCCTTCTAGACACAGGATCAACA +ATTAATATGATCAATGAAAATATATTTTGTCTTCCCATTCAAAATAGTAGATGTGAAGTT +TTAACATCAAATGGCCCTATTACCTTGAACGACTTGATTATGTTACCCAGAAATAGTATT +TTCAAAAAAACCGAACCATTTTATGTGCACAGATTTTCTAATAATTACGATATGCTAATT +GGCAGAAAATTGTTGAAAAATGCTCAATCAGTTATTAATTACAAAAATGATACAGTTACC +CTTTTTGATCAAACATACAAATTAATTACTTCAGAATCCGAAAGAAACCAAAATTTGTAT +ATCCAAAGGACACCAGAATCAATTGCAAGCTCAGATCAGGAATCAATAAAAAAATTAGAT +TTTTCACAGTTTCGATTAGATCACCTAAATCAGGAGGAAACTTTTAAGTTAAAAGGCTTG +TTAAATAAATTTAGAAATCTTGAATATAAGGAGGGAGAGAAATTAACATTTACAAATACA +ATTAAACACGTACTAAATACAACACATAACTCCCCAATTTATTCGAAACAATACCCACTT +GCGCAAACACACGAAATCGAAGTAGAAAACCAAGTACAGGAAATGCTGAATCAGGGATTA +ATTAGGGAAAGTAATTCTCCATACAATAGTCCTACTTGGGTCGTACCAAAGAAACCGGAT +GCTTCTGGTGCAAATAAGTACAGGGTAGTAATTGATTATAGAAAGCTAAATGAAATAACC +ATACCTGACAGATATCCAATTCCAAATATGGACGAAATTCTTGGCAAACTGGGTAAATGC +CAATATTTTACAACGATCGATCTGGCAAAGGGATTTCATCAAATAGAAATGGACGAAGAA +TCAATTTCTAAAACTGCATTCTCCACAAAAAGCGGTCATTACGAATACCTTCGAATGCCA +TTTGGCCTTAGGAATGCACCCGCTACTTTTCAAAGGTGCATGAATAATATCCTTCGACCG +TTGCTTAACAAACACTGTTTGGTGTATCTGGATGATATTATAATTTTTTCAACATCCCTT +ACAGAACATTTAAATTCAATACAATTAGTTTTTACAAAGCTTGCAGATGCAAATTTAAAA +TTGCAACTAGACAAATGTGAGTTCTTAAAAAAGGAAGCTAACTTTCTTGGTCACATAGTT +ACCCCTGATGGTATTAAACCAAATCCTATTAAAGTTAAAGCCATAGTTTCATACCCAATT +CCGACAAAAGATAAAGAGATAAGAGCTTTCCTTGGATTAACAGGTTATTATCGCAAATTT +ATTCCAAATTACGCAGACATAGCAAAACCCATGACCAGCTGCTTAAAAAAAAGGACAAAG +ATAGATACACAAAAACTTGAGTACATAGAGGCATTCGAAAAACTTAAGGCTTTGATAATT +CGTGACCCAATTTTACAATTACCTGATTTTGAAAAGAAATTTGTTTTAACCACAGATGCA +AGTAACTTGGCCCTCGGGGCTGTCCTTTCTCAAAACGGTCATCCTATATCTTTTATTAGT +AGAACACTTAACGATCACGAATTAAATTACAGTGCTATCGAAAAAGAATTACTTGCCATA +GTTTGGGCCACAAAAACTTTTCGACATTATTTACTAGGACGACAATTTCTCATTGCCAGT +GACCATCAACCTCTTAGATGGCTTCATAACTTAAAGGAACCAGGTGCTAAGTTAGAAAGA +TGGAGAGTTAGATTAAGCGAATACCAATTTAAAATAGATTATATTAAAGGGAAAGAAAAT +TCAGTTGCCGATGCATTATCAAGAATTAAAATTGAAGAAAATCATCATAGTGAAGCTACT +CAACATAGTGCAGAAGAGGACAATAGCAACCTTATTCATTTAACAGAAAAACCAATAAAT +TATTTCAAAAAACAAATAATCTTTATTAAATCCGATAAAAATAAAGTAGAGCATTCAAAA +ATATTCGGTAACTCCATTACCACAATTCAATATGACGTAATGACACTTGAAAAGGCCAAA +CAAATTTTACTCGATCACTTTATCCATAGAAACATTACCATTTATATTGAGAGCGATGTA +GATTTTGAAATCGTTCAAAGAGCACACATAGAAATTGTTAATACCACCTACACAAAAGTA +ATTCGCAGTCTTTTCCTATTAAAGAACGTTGGTTCATACGCCGAATTCAAAGAAATCATA +CTTCAATCACATGAAAAACTTTTACACCCTGGTATACAGAAAATGACAAAATTATTTAAA +GAAAATCACTTCTTTCCAAATAGCCAACTATTAATTCAGAATATAATAAACGAATGCAAC +ATATGCAATTTGGCCAAAACAGAACATAGAAACACCAAAATGCCTTTAAAAATCACACCC +AACCCGGAACATTGCCGAGAAAAATTTGTAGTAGATATTTATTCATCTGAGGGAAAACAT +TACATCAGTTGCATTGATATTTATTCTAAATTCGCTACACTTGAGCAAATTAAAACTAAG +GATTGGATAGAATGCAGAAACGCATTAATGCGCATTTTTAATCAACTAGGAAAACCCAAA +TTATTAAAGGCAGACAGAGACGGAGCTTTCTCCAGTTTAGCTTTAAAGCGATGGCTTGAA +GAAGAAGAAGTCGAATTACAGCTCAATACAGCAAAAAACGGAGTAGCAGACGTCGAAAGA +TTACACAAAACAATAAATGAAAAAATTCGTATAATCAATTCATCTGATGATGAAGAAGTA +AAATTAAGCAAGATAGAAACAATCCTCTACACATACAACCAAAAAATTAAACATGACACT +ACTGGACAGAGACCTGCTCAAATTTTCTTATACGCTGGGCATCCCATATTAGACACTCAA +AAAATTAAAGAGAAGAAAATAGAGAAAATAAATGAAGACAGACGGGAATTTAATATTGAC +ACTAATTACAGAAAAGGTCCACTACAGAAAGGCAAATTAGAAAACCCATTTAAACCAACC +AAAAATGTAGAACAGACAGACCCTGACCATTACAAAATCACTAATAGAAATAGAGTTACG +CACTACTACAAAACACAATTCAAAAAACAAAAGAAAAATAATAAACTCTCAATTTCACAG +GCACCTGGTACCCGATAACACTATTGTTTATACTGATCACAGCTGTTCATGGACAACAAA +TTCAAATTAATAATATTGACACCAACCACGGATATCTCCTTTTTTCTGATAAGCCAGTAC +AGATACCATCCTCCTTTGAACATCACTCCTTAAAAATCAATTTAACTGAAATAGACATCG +TGGTTGACTATTTTGAGCAAAGACTACGAACCGATTACCATGCACCCCAGATCAATTTTT +TATACAATAAAATAAAAAGAGAACTAGCCAGAATAACCCTGAAACATAGAAACAAACGGG +GTTTTATTAACATTGTGGGTTCAGGTTTTAAATACCTATTTGGAACACTAGATGAAAATG +ATCGAGTCGAAATACAGAAAAAACTTGAAATCAACGTCCATAACTCAGTAAAATTACATG +AACTCAACGACGCCATACGATTGATAAATGACGGAATGCAAAAAATACAGAATTATGAAA +ATAACCACACCATCATTGACAGTCTTTTGTTCGAACTAATGCAGTTTACGGAATACATAG +AAGATTTGGAAATGGCTATGCAGCTTTCCAGACTTGGACTGTTTAACCCCAAATTACTAA +ACTACGACAAACTTGAAAATGTGAACAGCCAAAACATTTTGAACATTAAAACATCCACTT +GGATTAACTACAATGATAACCAAGTATTAATCATATCCCACATACCCATTTACCTTTCAC +TAATAAGCACAATTAAAATAATTCCTTACCCAGACTCCAACGGCTATCAGCTAGATTACA +CAGACACACAATCATATTTTGAAAAAGAAAATAAAGTTTATAATACCGAAAATAAAGAAG +TAAAAAATGAATGTGTCACCAATATTATTAAACACTTAAATCCAATTTGTAATTTTAAGC +CAGTACACACGAACGAAATAATAAAATACATAGAACCAAACACAATTGTAACTTGGAACT +TAACCCAAACAATTCTTAACCAAAATTGCCAAAATTCAATTAATAAAATAAAAATAGAAG +GAAACAAAATGATAAGAGTAACGCAATGCAAAATAGAAATCAATAATATAAATTTTAGTG +AAACTCTGTTAGAACCAGAAATAGATTTGACACCACTATACACACCACTTAATATAACAA +AAATAAAAATTGTAAAACACAACGACATTATTGAGATGATTTCAGAGAACAATATTACAC +TTTACATACAAATGATCATTGTAATAATCGCACTAATTTTGTTGTACTCATATTTAAGAT +ATGTATCATTTAAACCATTTATGATGTTGTATGCAAAACTTAAAATAAGAAAAAATCAAA +ATCAAAACACACCACAACAAACAGAAATAGAAGAAATTCCATTTCCCACACTATATCCAT +CAATCCCAGCCCAAGTATAGGCTTCTCTTTAAGGGAAGGGGAGTGACGTATTTGGGTGGT +CCAAACCAGCCACTTCCATTATTTCAAAGAAATCAGTAATGCACTCTAGTAATTTTCCAT +AACTGTATCCCAGCTGCGCAGACTCGTTTATCTTTTGCAGCGCAGCGTTCTTTGTAAACA +TCCTAAAGACCTGCCTAAGCAGATTTGACTGCCCTCTTTCAACGCTACCTAATCTTAAGA +ACCCAAGAGCGAGGCTCTCCCGAAATACAAATATTGTTCAAATACTGAGGCTTCTCCTCA +ATCCAATTTGCATTTGATTTTTAGTCTTAAGCTGAGATCCAAAGAATAAAGTCGTGAAAC +TATTTCTCCTAAAAACTATTTTTTATTTCTTGGCGTTGTCCTTAGTCAACTGACGGGACA +TTAGTTCGACTCATAAATAAAACAACAATTTTACT +>DM23420 +TGTTTGGGAACGAGACACCCTGTATACGCGAACAAGTCACCCTTTATCTTTATTTACATT +CTTATTTGTCTGCAGCTTCATCGGAGCTTATCAGCGGAATCAATGTAAGCATCGCACCGC +TGTAATTGTCCGCGAGCTTGCCCAGTACTTTTCCAAACTTCTAACTCCCTTCTAACTGTA +ACTTGTTTACGTCTTATGCTAGACTAATCGTATGGCGTGATTACAGCCAAAGCTGAAGTC +AGTCACAATTTTGATCTGCGAGAAAACGTACGCATCGGTGTCGAAATAATTAATATTAAG +TGTCTGAACTTAACCAATAAATGAAAATTAACAGTAACACTGGCGGTTTTATTTATAAAC +ATAAAAATTGGTCCTTCGAGCCGGATAACCGGAAGTGCGTTTCGTTCGGGCATTTGATTT +TGATTATTGGCCTTTTGGCAAACGATAATCTATAGATTCCTACATCGTGTAGAATCGTTC +CCTTCTTTCGACCACCATGCGGAGTGTGATTCAACAACGGGGCTTCTGCAAAAGCCAAAT +TACTCGTGCGCATAATAATGCCTTAAAATTTGTTGATGACATTCACTCAGTGCAAACAAT +AGTTGTCCGCCTGGCGCAACTACAGGAAAATTATTTGCGGTTCGTACGGCTCTCGGAAGA +GCTGTATGCATTTCAATCGGAAGCCGATTGGGAGAACCCTGACGAGGATTTTGACGCATA +TGAGGACAAACATTATGCTACACACGCTATTCTCAGCAATACTTTGGAGGAGTTGAGACG +GGATGTCACCTCAAACAGTATTGATGCCACAGTTCAAGCGCAGGCACACCCCAGAGAAGT +CATGTCGATTTTCAGTTCGAGAGAATTAAACTTCCGACTTTTTCTGGAAATTATGAGGAC +TGGAAACATTTTTCGGACATGTTTATTGGATCGATTGCTTCCAATTCGAGCCTGACGGAT +TGCCAACGATTTCATTATTTAAAATCGTACCTTGCCGGAGACGCGCTTGCATTAGTTAAA +CATATTCCAGTTACTAATGACAACTATCGGGAAGCATGGGAGCGGCTGGAACAGCGATAT +AACAAACAATCGCTAATTATTCGATCGTTCTTAAACAGTTTCATGAGCCTTCCGAGTGCT +ATAAATTCAAATATCGGCACAGTGCGGAAAATTGCCGATGGTGCAGACGAAGTTATTCGT +GGTCTACGAGCTCTTAATTGCGAAGAGAGGGATCCCTGGCTAATTTTCATTCTACTTTCA +AAATTAGATAGCGATACCCGCCAAGCCTGGGCTCAGTGCGCAGAATCCGAGGAAAAAGGT +GTGACCATCAACCGATTCTTGAAATTTCTCACATCACGCTGCGATACGTTGGAGGCTTTT +GAATTAACTCGATCAACCCAAGCTCGACGCGCAGCTACCACGCACCACGCAGACACGCAT +CCAAGACGGGAAGAGCCGAAGTGCACATCGTGCCAGCAGAATCACCAACTGTTTAAGTGT +CCTCAATTCATCGCACTCGACATTGCATCTCGCCGAGACTTCCTCAAATCAAGAAAGCTC +TGTTTCAATTGCCTCAGCCCGGCTCATATGGTGGGCAACTGTACATCGAGGCATACTTGT +CGGATCTGCCGCCGCAAGCATCATACTTTGGTTCATGGCTCGTCGCAGCCAATTCAAAAT +GGCAACAACATTGACACAGCAAGTGTTGACAGCCGCGATCGACCAGCAGTCTCACATGCG +GGATCTACAATTGGCCACAATCAACCGCTAGCTCGAGAAGGTCATCGCTTGGGAAGCGAG +ACTCCCGCGGAAAACAACTTTACGCATCATACTCTGGAGAATATTCCGGCGGCTGGTTCT +CAGACTCTGTTGCCAACCATCCTTGCTGACGTCATCGACGCCTGGGGAAACACTACAACC +TGCAGGCTGCTCCTGGACACTGGATCTACAATAACCTTGGCATCGGAATCATTTGTTCAG +CGAATAGGCGTGCGTCGAACGCACGCACGGATTTCTATTCTCGGTCTCGCCGCCAACAGC +GCGGGCGTTACCCGAGGACGCGCACATATCAAGCTGCGCTCTCGTCATTCGGGCCAAACT +GTCGAATTGGTCTCGTTCATTCTCACCTCGCTGACGTCATCACTTCCTGCCCAAGTTATT +GACACCTCATCCTCTACGTGGAGGCAAATCTGCGAGCTTCCTTTGGCAGACCCAACGTTC +TGCACACCTGGAGCAATCGATGTCATTGTTGGATCGGATCAACTTTGGTCTCTATACACA +GGAGATCGGAAACACTTTGGTAACGACTTTCCTATCGCTCTCAATACTGTATTTGGTTGG +ATTCTTGCAGGCTCTTACTCTGCATTCGATGATCACCCTACTTCTGCGGTTACTCATCAC +GCGGACCTAGACACGATGGTTCGTTCATTCATGGAGATGGACAGCATTCAGCCTAACCAG +GCTCTCCTGGACGCCAGCGATCCCACAGAGCGTCATTTTGCTGCCACACACAAGCGCTCG +ACGGACGGGGTGTACGTCGTCGAGTATCCCTTCAAGGAAAAGGCACCGCCTATTGATTCG +ACCTTGCCACAGGCCATCAATCGCTTCTTCTCGCTGGAACGCAAATTTCGTCGGTATCCA +GAATTGAAGCAGCAGTACGAAGCTTTCCTGGACGACTACTTGCAACGTGGACATATGGAA +AAACTGACCTCGGCTCAGGTTGAAGAGTCCCCAGACACCTGCTTCTATTTGCCGCACCAC +GCTGTCATCAAACTGGACAGTCTGACTACCAAATGTCGTGTAGTTTTTGATGGATCAGGA +AAAGACAGCTCTGGAGTATCGCTCAATGACAGACTACATATTGGTCCACCGATTCAACGC +GATCTTTTTGGCGTTTGTCTACGCTTCCGGCAGCACCAATATGTTTTATGTGCAGATGTC +GAAAAGATGTTTCGAGGCATTAAAGTCTTTAAGCCACACACCAATTTTCAGCGCATTGTT +TGGCGCACGACTGAGAATGAACCTCTGCTTCATTTTCGCCTGCTGACGGTTACCTACGGA +TTGGCACCGTCACCATTTCTGGCTGTTCGAGTTCTAAAGCAACTTGCCGACGATCATGGC +CATGAATACCCTGCAGCAGCTCACGCTCTTCTGCACGATGCCTATGTGGACGATATCCCG +ACAGGCGCCAACACATTCGAGGAGCTTATGATTCTCAAGGACGAGCTTATAGCCCTCTTG +GATAAGGGAAAATTCAAGCTACGCAAATGGAGTTCTAATAGTTGGCGTCTTCTGAAATCA +TTACCAGAGGAAGATAGATGTTTTGAACCTATCCAGCTCCTCAACAAATCAGCTGCGGAT +TCACCTGTCAAAGTTCTTGGTATCCAATGGAACCCTGGGAAGGACGTCCTGTATCTCAAC +CTAAAGGGATGCGATGCGACCATTTCTCCGACGAAAAGAGAACTCTTGTCTCAGCTATCA +AGAATTTATGATCCGCTTGGACTGGTAGCGCCGGTCACAGTTCTACTCAAGCTAATCTTC +CAAGAAAGCTGGACAAGTGTCCTGCAGTGGGACGACCCCATACCTGAAAGTCTACGTACG +CGCTGGAGAGCCTTAGTAGAGGATTTGCCAGCACTTACGCAATGCCAAGTACCACGGTAT +ATTGCGTCACCATTTCGAGATGTTCAACTACACGGATTCGCCGACGCATCCTCGCACGCC +TACGGTGCGGTAGTTTACGCTCGAGTTGCAGTTGGATGCAGCTTTCAAGTAACTCTGGTT +GCCGCCAAAACACGGGTGGCCCCGATCAAGCCCGTATCAATTCCACGTTTGGAGCTAAAC +GCTGCGTTACTTCTATCTCGATTGCTTTCTATTGTCAAAACATCACTAACAATTCCTCTT +TTCAGCACGAGCTGCTGGACAGATTCAGAAATTGTGCTACACTGGCTTTCAGCTCCCCCT +CGACGGTGGAACACCTACGTCTGCAACCGAACTTCTGAGATATTGAGCGACTTTCCCCGT +AGCTGCTGGAACCATGTTCGCACGGAAGACAATCCTGCAGATTGTGCTTCCCGAGGACTT +CATCCGTCAAAGCTTCTGGAGCATCGACTGTGGTGGAAAGGTCCGTCTTGGCTGGCCACA +CCCACCTCTGAGTGGCCACCTTCTACAAGCAAGTTCAGCGTATCTTCAAGTTTCGATGTC +AACACCGAAGAACGAGCCATAAAGCCCACGACTCTACATAACTTTCCTGATGAAAGTATA +CACGAGTTACTCATCCACAAATTCTCAACCTGGACGCGTCTTATAAGGGTATCTAGCTAC +TGTCATCGCTTTATTCACACTCTTCGATCCCATCATAGGAATTCGGCACCATTCCTTACG +TCTGAAGAGTTGCTGGACGCACAGCGCCGACTTATTCGACATGTGCAACAAAAATCCTTT +GCCAGAGAATATGAGCAGCTAGAGAATCGACGCCAGCTTAACGCTAAATCGCATCTTATC +CGGTTTTCTCCGTTTCTGGATGATTATGGAGTAATGCGAGTCGGTGGGAGAATCGAGCAA +TCTACACTCAACTATAACGCCAAGCACCCGATTCTGATACCTAAAGATACACCACTAGCT +GGACTCCTGGTTCGACATTTTCATGTCTCCTATCTGCACACTGGAGTTGATGCAACGTTC +ACCAATCTTCGTCAGCAGTACTGGATTCTGGGAGCCCGCAATCTCGTCAGAAAGGCAGTC +TTCCAATGCAAATCCTGTTTTCTTCAACGAAAGGGCACAAGCAACCAGATCATGGGAGAG +CTACCAATTCCTCGAGTTCAAGCTAGCCGCTGCTTTCAACACACAGGGCTGGACTACGCT +GGACCGATCGCAATCAAGGAATCAAAGGGAAGAACTCCACGCATCGGAAAGGCATGGTTT +TCTATTTTCGTGTGTCTCACTACAAAGGCACTTCACATCGAGGTTGTTAGTGAGCTAACT +ACACAGGCTTTCATCGCAGCCTTTCAACGATTCATTGCCCGCCGAGCGAAGCCTACTGAC +CTGTATTCGGATAATGGAACAACATTTCATGGAGGCAAGAAAACTTTGGATGACATGAGA +CGTCTGGCCATTCAACAAGCCAAAGATGAGGAACTAGCAGGATTCTTTGCCAATGAAGGG +ATTTCTTGGCACTTTATACCCCCGTCTGCTCCACATTTTGGAGGGATGTGGGAAGCTGGA +GTTCGCTCAATTAAACTCCATATGAAACGAATACTTGGATCAAAGGCTTTAACGTTTGAG +GAGCTCTCTACTGTCCTGACCCAAATTGAAGCTATCCTGAATTCACGCCCGCTGTGCCCA +ACTGGGGATAATTCTTTGGATCCACTGACGCCTGCTCATTTTTTGACTGGATCTCCGTAT +ACTGCATTGCCTGAACCCTGTCGTCTGGATATGCAAGTCAATCGATTGGAGAGGTGGAAT +CAGCTGCAAGCCATGGTTCAAGGCTTTTGGAAAAGGTGGCATATGGAATACCTGACATCT +CTTCATGAGCGGACAAAGTGGCATCTGGAAACCGAGAATCTGAAGATCGACACACTGGTA +GTACTCAAGGAGCCCAATCTACCGCCCTCTAAATGGATTCTTGGCCGCATCACAGCAGTG +CACGCAGGAATCGACAACAAGGTCCGAGTCGTTACAGTGAAGACTGCTCACGGATTATAC +AAACGCCCAATTGCCAAAATCGCTGTACTGCCTCTCTGCTGAACAACCGTTCAGGGGGGC +CGGTATGTTTGGGAACGAGACACCCTGTATACGCGAACAAGTCACCCTTTATCTTTATTT +ACATTCTTATTTGTCTGCAGCTTCATCGGAGCTTATCAGCGGAATCAATGTAAGCATCGC +ACCGCTGTAATTGTCCGCGAGCTTGCCCAGTACTTTTCCAAACTTCTAACTCCCTTCTAA +CTGTAACTTGTTTACGTCTTATGCTAGACTAATCGTATGGCGTGATTACAGCCAAAGCTG +AAGTCAGTCACAATTTTGATCTGCGAGAAAACGTACGCATCGGTGTCGAAATAATTAATA +TTAAGTGTCTGAACTTAACCAATAAATGAAAATTAACAGTAACACTGGCGGTTTTATTTA +TAAACA +>412 +TGTAGTATGTGCCTATGCAATATTAAGAACAATTAAATAAAATAGCATATTAACTTATGG +CAGCACTTTGTTGCTATGTTTATGTTTATGTTTATGCACGCAGTTAGGCCAGGGCGGATG +TAACATGATCACCCACTCGAAGGCCACAAAGTATAAGTGCATTGCCCAATCGAAGGCAAA +AAGTATAAGTGCATGGTCAGCATTCACACGCCGACCAAATACATATTACATACGTACATA +CATATCTCGCTCTCCCGATAAGCCTAGATATATAAGATATACATAAGAACGCCGCTCCGC +TGCTGGCGTACCCGGCAGCGCAGCTACGCGGATTAGCCTAAGTCCAAATATATAAAAAAC +TGTAAAATCGGAGAGACTCTGTAGACGTTGAGCTGACAGAACCATTTCTGCCTACTCTAA +AATCAAAAGAAGAAATTGAATAAATATATGTCAGCCCGACGGCTGCCTTAAACTTAAAAC +GGACTTGTGTTCTTAATTGGAGTTCATCATTACATGGCGACCGTGACAGTCGTCCAACGC +TGGACGAATTGACCAAAGCTGGTGAAAACAAAGGAACAAAGGAACACTGGACTGGAAGAA +GACTGGACTAATTAAATGGAACTGCAAAAACCAAGGAAAAATCTGAGTGAGTAGAGTTCT +ATTGAGTATGGGCAAACACCGTGGCGGTTTGAAAACTAAGCTGAATAAACGTATAGCCCA +CGTAAGGTGGCTAATATACGGTCAGCAAACGCCACCGGTTTGGTCGAAAGCTCTAAAGCT +ACATGCAGAGCTAGACCACTTGTTGCAATATCAGCAAGAATTAAAGACCCATAAGCTCGA +GAAAACTCACTCAGATAATATTAAAAATATACCCACAATTAATGAAGTTCCAAAATACCA +GGCATGTCCAGCACCAGCACCAGCATTAACAAAACCAAAGAAGTCCTGCCCCCCTGGCTG +CGAAGGAATCTGGAGTCCCCACTGCCTGGGGACTTGTGAGCGACCATCGACGTCTTCAGC +GGCGAAGAAATAGACAGCAGCGAGGGAGTGTCAGCGTGCCACCCCCGGCGACGCCCAGCT +GACACCCAACAAATAGACAGCAGCGAGGGAGTGTCAGCGTGCCACCCCCGGCGACGCCCA +GCTGACACCTGATGAGCATCATCAACAGCAGAATATAATAATAAATATATATAAATATAA +AGTAAATATAAAATATATATAGATAAGAAAAATTGTAAGAAATATTGTAAAACGGAGCAT +ATACTATTATGCCCTGTTAACCCAATATGGCCCGTGAAGCCATAGCTAGAATCAGGCAGG +CAACAATGTAAAATACAATTTTTTTTTACTCTTGCGAACATTGAAAGATTTTATAAATAG +ATAATTCCAAACATAAATGTCTATAGAGACAAATGAAATAAGTAAAACTGAAAATAAAAG +TATATACAAAGGAAATTTTCTATTCTATTCTCCAAAATATAAAATTAGTATACCCAAAAT +GGGTCTAATAGACACTAAAACTGTGGACTCTACAGCCAATGTAATAAATAAAGTAGAAGT +CCAAAATGCAGACTTGTTCTGGATAACCATAATACTAATTGTAATTGCATTAATTATGGT +ATCCAATGCATTAATAAAAATATACAAACTGCATAACAAGTGTCTTAAGAAACGATACCG +TAGCACTGCTAACGGTATAGATAATATTTAAGGAAGATCTTTAATAAAGTCAATTATGAA +TGAAAATATGAGAAAAATTATATGAAAAAAAAAAATAATAAATAAAAAAAAAATATAAAA +CGTAATATTGAATTTATCTACATTAAAAAAAAATATATACAAATGAATAAATTTGAAGTT +ATGAGTATACCACAGCATGGACTGGGAAAAGCTTGTTGATCAGATAAAAGATCAAAATGA +AAATTTCAGAAAATCCTATAAGTGCTTAACGCAAAACAGATCAACACAAGCTGTAACAAT +CAATAGGAATGCCCAAGTCTTGGTAAATAGTTATAATGAAATCAGAGAGTTGATCCAACA +AAATAGAAAGAATTTGGAACGCAAACAGTGTGCTAAGGCTTTGAACCTACTGGTGACATT +AAGAGAAAAATTAATATTTATAAAAAATAAATTCAGTCTCCAGATAGAAATTCCAACCAT +AGTAAACACCCCACTAAGAATAAATTTGAATGAAGACAGCACTAACTCTGACGAGGAAGA +TAGGACTATAGTCAAGGAAGACATTAAAGAGGAAGATCTTCACGATCTAACTATACCAGC +AAAATTAATGCTGAAGAACGACGATAAAACAAATAACGCAGCCGACTCCGAAAATAACTT +AACCATGGCAGAAGAAGCAGCTGCCATTAGGTCTTACATTAGGGAAGTCGCCTGCACAGT +GCCAGAATTTGATGGGCAAAAGATCCATTTACAAAGATTCATTAAGGCAATCAAATTGGT +AGACCTAGCTAAGGGACCATTTGAAGACATTGCAGTTGAGGTCATTAAGTCAAAAATAGT +TGGCACAATTTTGAACTCAGTTGACAATGAAACGACAATTCCAGCAATTATAAACAAATT +GCAGAAAGTAGTTGTCGGTGAGACATCCAGTAATGTCAAAGCAAAGCTAGCAACAGTTCA +GCAGAGAGGTAAAACTGCAACGCAATTTACCGCTGAAGTTGATAGCCTGAGAAAACTTTT +AGAAGCTTCCTATATCGATGAGGGTATACCTCTAGAACATGCCACTGGTCTAAGCACCAA +AGAGGCAATTGAAACCATGATACATCGTGCTGAGCACGAAAGTATCAAAACAGTACTGGA +AGCAGGGACTTGCACCACTATGGATGCAGCGATAAGCGCATACATAAGAACGAGTACAAG +AGTTACCGGTGACATCAATAAAGTGATGTACTTTAGAGGTAACAGACCCAATAGAGGATA +CGGAAATGCCAATAGAGGTAGTAACCGCGGTAGAGGCTTTAATAACAATAGTATTAGAGG +CAACTACCATAACGGTTACCAAAATAACGGTTACCAAAATAACGGTTACCAGAATAACGG +TTATCAAAACCGCTATAATGGAAATAATAACCGTTATAATGGCTATAACAGAGGCCGTTA +TAATGGAAACAGAGGCCGTAACAACAGTCAGAACAACTACAACAGAAACAATGCCAATGT +ACGAGTAATCCAAGAACAGGGAAACTCGCAACAGCCTTTAGGTACTCAGTAGAAGAAGAT +CGTAGAGTATACACCATCAATTATAATCTCAACATATTTTCTACATTCATTCATGCCAAA +ACAGGCGTAAAACTAGTTTTTCTACTTGATACAGGTGCAGATATCTCTATTCTCAAAGAG +AACTCTGACAAATTTTCTAATATTCAAATAACCAATAAAATAAACATTCAAGGCATAGGC +CAACAGAAAATTCAGTCTCGAGGACAGACTTTTATTGAGATACAGACAGGTAAATACGTT +ATCCCACACGATTTTCATTTAGTAGATAAAAACTTTCCAATACCGTGTGATGGAATAATC +GGAATAGATTTCATAAAAAAATATAATTGCCAAATCGATTTAAACCAAGAAGAAGATTGG +TTTATAATTAGACCAAACAATTTGAAATTTCCAATATATATTCCCATAGCATACAGCTCT +GGTATTAACACAACGTTATTACCAGCAAGATCCCAAGTTGTCCGAAGATTAATAGTATCA +TCAAAAGATGATAACATTTTAATTCCAAACCAGGAAATTCAAACTGGTATTTATGTTGCA +AATACAATCGCAACATCAAGTAATACATTTGTCCGAATTTTAAATACAACCGATTCCGAC +CAATTAGTCAATATGGACACTCTAAAATATGAGCCACTTTCGAACTACAATGTAGTTCAG +GCAAATAGTGAACACAGAAATAAAACTGTCTTATCTCAATTAAAGAAAAATTTCCCCGAA +TTGTTTAAATCACAATTAGAAAATATATGCAGCGAATATATAGATATATTTGCATTAGAA +TCAGAACCTATAACAGTTAATAATTTGTATAAACAACAGTTGAGATTAAAAGATGATGAG +CCAGTATACACGAAAAATTATAGAAGTCCTCATAGTCAAGTGGAAGAAATACAAGCCCAA +GTTCAGAAATTAATAAAAGATAAAATAGTTGAACCATCAGTTTCACAGTACAATAGCCCT +TTGCTATTAGTACCCAAAAAGTCAAGCCCGAATTCTGATAAAAAGAAATGGAGATTAGTA +ATAGACTATCGCCAAATTAATAAGAAACTTTTAGCTGACAAATTTCCACTACCGAGAATA +GATGATATTTTGGACCAACTTGGTCGAGCAAAATATTTCTCCTGCCTTGATTTAATGTCA +GGTTTTCATCAAATCGAACTGGATGAAGGCTCGAGAGATATAACATCTTTCTCAACCAGC +AATGGCTCATATCGTTTCACGCGATTGCCATTTGGCTTAAAAATAGCGCCTAATTCATTC +CAAAGAATGATGACTATAGCATTCTCCGGAATAGAACCGTCTCAAGCATTCCTTTATATG +GATGACTTAATAGTCATAGGTTGTTCCGAAAAACATATGCTTAAAAACCTCACTGAAGTT +TTTGGTAAATGCAGGGAATACAACCTAAAGTTACATCCTGAAAAATGTTCATTTTTCATG +CATGAAGTCACATTTTTGGGACACAAATGCACAGACAAAGGAATTTTGCCGGATGACAAA +AAATATGATGTCATTCAGAACTACCCAGTTCCACATGATGCGGACAGCGCTAGACGTTTT +GTAGCATTTTGCAATTACTACAGACGTTTTATCAAAAATTTCGCCGACTATTCGCGGCAC +ATAACAAGATTATGTAAAAAGAATGTTCCATTCGAGTGGACAGATGAATGTCAAAAAGCA +TTCATACATTTAAAATCTCAGCTAATTAACCCAACACTCTTGCAGTACCCAGACTTCAGC +AAAGAATTTTGCATAACAACAGATGCAAGCAAGCAAGCGTGTGGCGCAGTTTTAACTCAA +AACCATAATGGCCACCAACTCCCAGTTGCTTATGCATCCAGAGCTTTTACGAAAGGTGAA +AGCAATAAGAGTACAACAGAACAAGAGTTAGCAGCAATTCATTGGGCAATAATACATTTC +AGACCATACATTTACGGAAAACATTTCACTGTGAAAACAGACCATAGACCATTGACATAT +TTATTCTCGATGGTGAACCCCAGCTCTAAATTAACTAGAATAAGGCTTGAACTAGAGGAA +TATAATTTTACAGTAGAGTATCTAAAGGGCAAGGACAATCATGTAGCAGATGCGTTATCA +AGAATAACCATCAAAGAGCTAAAAGATATAACTGGAAATATATTAAAAGTCACTACAAGA +TTTCAAAGTAGACAAAAATCCTGCGCAGGAAAAGAACAATTGGATTTGCAAAAGCAAACC +AAAGAAATAGCTTCAGAGCCCAACGTATACGAAGTCATAACAAATGACGAGGTACGAAAA +GTAGTGACATTGCAATTGAATGACTCGATATGTTTATTTAAACATGGAAAGAAAATTATT +GCAAGATATGATGTTGGTGATCTTTATACTAATGGAATTCTTGATTTAGATCAATTTCTC +CAAAGGCTTGAATTGCAGGCCGGTATATATGATATCAGCCAAATCAAAATGGCACCGTGG +AAAAAAATCTTTGAACACGTTTCAATAGATAAATTTAAAAATATGGGCAATAAAATATTA +AAGAATTTAAAAGTAGCGCTACTTAACCCGGTGACCCAAATAAATAATGAAAAAGAAAAA +GAAGCTATATTGTCTACATTACATGATGATCCAATACAAGGAGGGCATACAGGCATTACA +AAAACCTTGGCCAAGGTCAAAAGACATTATTACTGGAAAAATATGAGTAAATACATAAAA +GAGTACGTAAGAAAATGTCAAAAATGCCAAAAAGCAAAAACAACAAAGCACACAAAGACT +CCAATGACGATAACTGAAACACCAGAACATGCTTTCGATAGAGTTGTTGTGGACACAATT +GGTCCACTACCCAAGTCAGAAAATGGTAACGAGTACGCAGTCACTCTCATATGTGATTTA +ACCAAGTACTTAGTTGCCATACCAATAGCAAATAAAAGCGCAAAAACAGTCGCAAAAGCT +ATATTTGAATCTTTTATTCTAAAGTACGGTCCAATGAAGACGTTCATAACGGACATGGGA +ACAGAGTATAAGAATTCAATAATTACTGACCTGTGTAAATATTTGAAAATAAAAAATATA +ACATCAACAGCTCATCACCACCAGACAGTTGGAGTAGTAGAAAGAAGTCATAGAACCTTA +AACGAGTATATACGATCCTACATATCGACGGACAAAACCGATTGGGACGTATGGCTTCAA +TATTTCGTATACTGCTTCAACACGACCCAATCTATGGTACATAATTATTGTCCATATGAA +TTAGTTTTCGGTAGAACAAGTAATTTACCAAAACATTTTAATAAACTACATAGCATAGAA +CCAATATATAACATAGATGATTACGCTAAGGAGAGTAAATATAGGTTAGAGGTAGCATAT +GCTCGAGCAAGAAAACTTCTCGAAGCACACAAAGAAAAAAATAAAGAAAATTATGACTTA +AAAATAAAAGACATAGAATTAGAAGTAGGAGATAAAGTTTTACTAAGAAATGAGGTAGGT +CATAAATTAGACTTTAAATATACGGGGCCCTATAAGATAGAAAGCATAGGAGATAATAAC +AATATTACGCTACTTACTAATAAAAACAAAAAACAAATAGTTCATAAAGATAGATTAAAG +AAATTTCATTCATGATTGAATTTAAACTTATATTTTCCTTAATCATTTACACAAATTTTC +CATACACTACGTATATTTTTATCTTTGCATTATAAAATCAACTATTGTTGTTCAAACAAA +AACACAAACAAAATAAAAATAAAAATAAAATAATTTGCATTTAATAATCAAAATAACTTC +ACTAGGTTACGTTATTTTTCAAAAGGAGGGAGATGTAGTATGTGCCTATGCAATATTAAG +AACAATTAAATAAAATAGCATATTAACTTATGGCAGCACTTTGTTGCTATGTTTATGTTT +ATGTTTATGCACGCAGTTAGGCCAGGGCGGATGTAACATGATCACCCACTCGAAGGCCAC +AAAGTATAAGTGCATTGCCCAATCGAAGGCAAAAAGTATAAGTGCATGGTCAGCATTCAC +ACGCCGACCAAATACATATTACATACGTACATACATATCTCGCTCTCCCGATAAGCCTAG +ATATATAAGATATACATAAGAACGCCGCTCCGCTGCTGGCGTACCCGGCAGCGCAGCTAC +GCGGATTAGCCTAAGTCCAAATATATAAAAAACTGTAAAATCGGAGAGACTCTGTAGACG +TTGAGCTGACAGAACCATTTCTGCCTACTCTAAAATCAAAAGAAGAAATTGAATAAATAT +ATGTCAGCCCGACGGCTGCCTTAAACTTAAAACGGACTTGTGTTCTTAATTGGAGTTCAT +CATTACA +>DMAURA +TGTCGCGGATCGAATATTGTTATCGATAGGCTCTAGTTAGTATTTTTGAGAAGTCCGAAT +GTGGAAGGATTTGTAAGCCCATATGTGTCTGGGCACGTTGTTTTTGGCCATTGTAAATTA +CCGGGAAAATTTAGCTTTTCATTGTCGTGTAAGAGTTGGAGGACACACTGCGGTGAGCTA +ATAAGTTAAGTTAGTTGCAATTGTGAAACATTGAATTCTTCAAGAATAAAACGTGTTCTA +CTACCACGGATTAGTCTGCCCTTTCTTTCGGGAACCAATGTGTGGGGTAGCCGTTTAAGG +CAACTCCCTGGACGCACGACGACAACCTTTTATTCGCAGTCCTAGGGCGACTGCAGGGGC +AACTTGCGCTGGAATGACGGTTTAGACGGCCAGCTAGAGAGTTGCCGGAGCTGGAGTGAC +GGTTTAGACGGCCAGCGAGGAGGATTTGTGTGAGCGCAGCCAGCGCTACGTACCGGCAGA +GGAGTCGCAGTCAGCGACATAGAGGGACGCAGCCAGCGTCGAACGCCGGTACGAAAGGGT +CGCAGCCAGCGACAAGGAGACGCAAGAAGCGTCATTTGTGGAGACCGCAGCCAAGCATCC +GTGGCCGCAGCCAGCGGCACGAGGCGTCAGAGACGCCATTTCGGACGCGCAGAGGCGCCG +CCATTTTTGGAGCTGGGAAAGATGCAGCATTCCCCCAGGAAGAGTGCCCGGCTGAACGGA +GGGGAAGTCACCCCTATAACAACAGTGAGTCAGCAGCCAGCCAGTAGTGGAGCAGGAACT +CGGACGCGGGTGAACATCACGGCGGCGTCGATTCCTTGCCCGGCCACTACGGTGACTACA +GTAGCTTCCCAACCTAGAAGTACTGCTGTCACAGCTGCGAGTTCAGTACCGGAGGTGAAC +CAGCCCCTCGTGTTGGAACTCATGGAGAGGATCGCAGCGTTGGAGAGGGAGCTGGAGAAG +ACTAGATCCCTAGAAAGTGTGAGCACCGCCAATTGCGCGCCAATCGCAGTTGGCCCAAGC +GCAGTTGGCGCCAACAGTGGAGCGTCGGGGCGGCCGCCATTTTGGAGCGGCCAGCTAATA +CCCACATCTAACGGAGAGGCCTTACATAACGGGGACTGGGCCAGGCATGCTGCAACGATT +GCGCCCTTTCCCACTGTAGTCCACTTCAGCGCGTGGCTACAGGAGTACGCAAACGTGGTG +TGCACGGTTTTGGACGTCGAGGGAAAGGAGCCGAGGCGTCGACTTCTACATGCAAGCGTC +GACCATAATGAATGCGATCAACAGGATGATCGGCATGGAGGTTGTCCCATCTGTGGAGGA +CAGCATGAAATATTGAACTGCAGAAAATTTATTGGAGCTTCGCCACAGGAAAGGTGGAGC +AATGTGAAGAGGCATCGGCTCTGCTTCAATTGCCTGCGAAGCGGGCACACGGCTAGATCC +TGCTATACGCAAGGTGAGTGCCAGGTTAATGGATGCCGAAGGGAGCATCACCGTCTGCTA +CATGGTGCGGACGGAGGAACGAAGGCCGCTGCAGCGAGGTGGCTTCAGACGCCACGAAGG +GAACCAGCAGCCAGCAGTTTCCAGACGCAGCCTAAAGGGGAGGCCTTCGCTACGAGATGG +TCACAGGGACCAGGAGAGGAACCGGCAGCCAGCCGTTCCAAGCAACAGTCTGGAGAGAGG +AGCTCCACGTGAAGCGGGAGCGCCCATGCAGAGGAATTTGAGCTGCGTTGACGCCGAAGG +AGGCCGTCTACTGTTCCGTATACTGCCGGTTACGCTGTACGGAGCGGGGCGAAAGGTGGA +TACATATGCGCTCCTAGATGAGGGATCCTCCGTCACGATGATCGATGACGAACTACGAAG +GGATCTTGGAGTGCAAGGAGAGCGTCGGCAGCTAAATATCCAATGGTTTGGTGGTAAGGC +AACCAGAGAGCCTACCAACGTGGTGAGTCCGAAGATAAGTGGAGTTGGAAAGCCCACTCG +CCATGTATTGAGAAACGTTTATGCCGTTTCGAGCTTGAGTTTGCCGATGCAGACATTGAG +CCGACGAGATGTCCAGGGCGTGCACAGGGATGCGCGTCTGCCCGATGAAGCCTTACAGCA +ACGTGGTGCCGAAGCTGCTCATCGGTCTGGATCACGGACATCTGGGGTTGCCACTTAGGA +CGAGGCGGTTCGCTCGAGAGGGACCGTATGCGGCCGCAACCGAGCTGGGCTGGGTTGTGT +TTGGGCCTGTAAGTGGGCAACCGACCACGCCGTCACCGAGGTCCTGCCTACTTGCCGTGT +CAGTGGATGACGCGATGGAGAAGATGGTGGAGGACTATTTCGACATGGAGAACTTTGGAG +TGAAGACCGCGCCGCCGGTCGCAGCCAGCGACGATGTCCGGGCCCAAAGGATACTCGAAG +ACACCACGGTGAAAGTGGGGCGTCGCTACCAGACGGGATTACTCTGGAAGGACGACCACG +TTGTGCTGCCACCGAGATATGAGGACGACGACGTGCAAGTGAGCTTCGTGAGTGCGAGGA +CGAAGTGTGCCCCAATGAGAACGATGACGATCCCACGGCTGGAGCTGCAAGCAGCAGTTC +TTGGAACCAGGCTGATGAACACTGTCAAGGAGGAGCACAGTGTGGTCATCACGGACCTGG +TGTTATGGACGGACTCTAAGACGGTGCTGAGATGGATCGGCAGCACCCACCGCCGCTGAC +AATGCGGCTGATGATGCGACGCGGTCGCAGAAAAGGAGTCGACCTTAGCCAGGAATCAAG +GTGGCTAAGAGGACCTGCATTTTTGATGCAGCCAGCAGCCAGCTGGCCGGGGTCTGAGGA +AGGAACTGAGCGTGTTCCAGATGTCCCTGATGAAGAAGAGATGCCCAGTGAGTTTGCATT +AGTTGCGGTAGACGATTTTGTCATTCCGTTTCAGAGATTCTCGAGCTTCAGTCGCCTGGT +GAGGACCACAGCCTGGGTCCTACGGTTTGCGCGCTGGTGCCGCAAACAGCGAAACGATCT +CGAGGAATACGGCCTTACCGCAGCCAGAATGTAAGGCCGCCGGAACCGCACTGTGCATCC +CGTACAGTGCGAGGAGGGCCGTATTACTGTCACACAGGCACAGTCTGACGGAGCTGATTG +TGAGAGACTTCCACGCCAGGATGAAGCATCAAAATGTGGATGCTACGATCGCGGAGATCC +GGACAATGTTCTGGGTCACAAAGATGAGGCGTGTGATGCGGAGAGTCATCTCATCGTGCA +ACGAGTGCAAGTTGCAGCGAGCGCGGCCGATGCCGCCGATAATGGGACCCCATCCGGAAG +ACAAACTGGATGCGGGTGGATGGCCATTCAAATACACAGGACTGGACTACTTTGGGCCAC +TGCTGGTGACTGTGTCCCGTCACAAGGAGAAGCTTGGGTCGCCTTGTTTACGTGTTTGAC +GACAAGGGCGATTCACCTGGAGCTGGCGCATGACCTGTCGACGGATTCCTGCATAATTGC +GATCAGGAACTTCGTCTGCCGTAGAGGGCCAGTATATAGACTGCGCAGCGATAACGGCAA +GAACTTCGTGGGAGCTGACAGGGAAGCCAGGCGCTTTGGCGACGTATTCGAGATGGAGAA +GCTTCAGAGTGAGTTGACAAGCAGAAGCATTGAATGGGTGTTTAATTGTCCAGCGAACCC +GTCTGAGGGCGGAGTTTGGGAGCGCATGGTGCAGTGCGTCAAGAGAGTACTGCGTCATAC +CCAGAAGGAAGTTGCGCCGAGGGACCATGTATTGGAGAGTTTCCTGATTGAGGCGGAGAA +TATTGTAAACTCGCGTCCGCTCACCCACTTGCCTGTGGATGTGGACCAGGAGGCGCCGTT +GACGCCAAACGATCTTCTCAAGGGAGTAGCCAATCTGCCGGATACGCCTGGATTGGATGC +GGAGCTGCCCAAGGAAGGTACTACGAGGAAGCAGTGGAGAATTTCTCGCCTGCTACGAGA +CCGTTTCTGGAGGAAGTGGGTCATGGAGTACCTGCCTACGCTTGTGCGCCGCGAGAAGTG +GTGCCGACGAACGGAGCCCATCCACCAGGGTGATGTGGTCTTCGTCTGCGATCCTGCCTT +GGCCCGACGAGAGTGCCGCAAGGGTATCGTGGAGGAGATCTACAGCGGAGCTGATGGAGT +TGTCAGACGCGCTAAGGTGCGCGTGAACGAAAACGGCCTATCTAGGACAATGATGCGACC +CGTCTCTAAACTTGCAGTTATGGATTTGAGTGAAGCGGTTCTTCACGGGGTCGGGGATGT +CGCGGATCGAATATTGTTATCGATAGGCTCTAGTTAGTATTTTTGAGAAGTCCGAATGTG +GAAGGATTTGTAAGCCCATATGTGTCTGGGCACGTTGTTTTTGGCCATTGTAAATTACCG +GGAAAATTTAGCTTTTCATTGTCGTGTAAGAGTTGGAGGACACACTGCGGTGAGCTAATA +AGTTAAGTTAGTTGCAATTGTGAAACATTGAATTCTTCCAGAATAAAACGTGTTCTACTA +CCACGGATTAGTCTGCCCTTTCTTTCGGGAACCAATGTGTGGGGTAGCCGTTTAAGGCAA +CTCCCTGGACGCACGACGACA +>DMBARI1 +ACAGTCATGGTCAAAATTATTTTCACAAAGTGCATTTTTGTGCATGGGTCACAAACAGTT +GCTTGTGCAGCAAGTGGGGGGAGGTGAAATGCAAAAAAACTTTTGCTTTTGCAAATTCAA +ACCTATGCAGAGTCAGATGAAAGAAGAATTGAAAAAATAACTGTTCCTATGCGCAAGGAA +GAGGCAAATGAAGAGATCTTTATCAGTTGTCAGAAGTATTTGCACACGGTTTCGTCGCAT +CACAATTATTTTCACAACGCAATTTCTTCTTCAGTGATTGGTTTAGAGTGACAAGTGCCG +GTTTGTTTGCTTAAATACATTTAAATTATTGAATAAAAATTAGATTTAATCATTTTCCTA +TTACAGTTATTAAATAAAATGCCCAAAACAAAAGAGTTAACAGTTGAGGCCCGGGCTGGT +ATTGTTGCTAGGTTTAAAGCCGGTACACCTGCGGCCAAAATAGCTGAAATATATCAAATT +TCGCGTAGAACTGTCTACTACTTAATAAAAAAGTTTGATACAGTTGGCACATTAAAAAAT +AAAAAAAGATCAGGCCGAAAACCTGTGCTGGACCAAAGGCAATGCAGGCAAATACTTGGA +GTTGTGGCGAAGAATCCTAGTGCCAGTCCGGTAAAAATTGCCTTAGAATCAAAAAATACA +ATTGGCAAACAAGTTAGTAGTTCTACAATTCGTCGCAGGCTAAAAGAAGCTGATTTTAAG +ACATACGTTGTTCGCAAAACGATTGAGATCACACCAACCAACAAAACAAAACGTCTTCGA +TTTGCGTTGGAATATGTTAAGAAGCCTCTTGACTTTTGGTTTAATATTTTATGGACTGAT +GAGTCTGCATTTCAGTACCAGGGGTCATACAGCAAGCATTTTATGCATTTGAAAAATAAT +CAAAAGCATTTGGCAGCCCAGCCAACCAATAGATTTGGTGGGGGCACAGTCATGTTTTGG +GGATGTCTTTCCTATTATGGATTCGGAGACTTGGTACCGATAGAAGGAACTTTAAATCAG +AACGGATACCTTCTTATCTTAAACAACCATGCTTTTACGTCTGGAAATAGACTTTTTCCA +ACTACTGAATGGATTCTTCAGCAGGACAATGCTCCATGCCATAAGGGTAGGATACCAACA +AAATTTTTAAACGACCTTAATCTGGCGGTTCTTCCGTGGCCCCCCCAAAGCCCAGACCTT +AATATCATTGAAAACGTTTGGGCTTTTATTAAAAACCAACGAACTATTGATAAAAATAGA +AAACGAGAGGGAGCCATCATTGAAATAGCGGAGATTTGGTCCAAATTGACATTAGAATTT +GCACAAACTTTGGTAAGGTCAATACCAAAAAGACTTCAAGCAGTTATTGATGCCAAAGGT +GGTGTTACAAAATATTAGTATTGTATTTATATAAAATAAAGAAATTCTTATGTTGAAATT +AGATGTTAAGCTGAAATTTACTAAATTAAGTTGAGTGAAAATACTTTTGAAGCGCAATAA +ACATGTGAAAATACTATTGACAACTTGCATGCATATTTTCTTTTGCTTTAAGCTTTGTAC +TATGAACCGTTATCTTTCGTATTTCTTTTCGACTACCTTCTGCATAGATCAAGCTAAGCG +ATAAGAACTATTTCAGGCAAATCGGACAACAACAAGAAGAAATATAACAAAAAGAAGTTG +AAGTTTGCAAATATTGTGCGTTGTGAAAATACTTTTGACCACCTCTGT +>BS +AAATCTGCATTCATAGAGATCGGTTGTGTCGCGCGTATGCAAAAGTGATCTATTTTGCTT +TATTGTTGCAATTTCTTGGGTGCTTAAAATAGCACTCACCAGTACATTCGGGCGCTGCTT +CGTGCGGTGTCGGCATCTGGCCAACAACAAAAAGCGTTAATCGAAGTGCGGTGTAGCTAC +GATACCTGCCCTTCGGGCAACTTATTCCCCTCACCCCGCGCAAAGCCGCTGAAGGGGGCA +ATAAAATCTATGCTTATCAGCAAAACTGATCCGTATTTGATCTGTTTTGTGGTCAGTTAA +GCAAGCTATTTTGTAAATATTAAGAATTATTATTAAGACAATGGATGAGAACAATTCTGA +TGACACCCAGCTTTTAAATAAGCAGAGTAACCATAGAACAATGTTCTCAATAGCTGGCAA +ATTACCTCACGAGATTAGAAACGAGTGCCGATCAGCAATTCAACGCTTTACAAGCAGCGT +AACTCAAAGCAGTAGCGTCACCACAACAACGGTGACATTTACTAGTGCCAATAACAGCAC +CATATATACAATGGCAAATGCCGCAATAAGCAGCCCGTGCCTTGGAACAAGATCCACTCA +CCAGGAAAGTTCCACATTGATAAACTCCGGAATCGTAGAAGATAATCTCAGCGATGCTGC +CAGAAGGTTATTAAATGACCAAAATCAGAGAGCGGGTAAAAGGAAAAATGGAAAGCCCTT +GTCCCCCATCTCCAACCCGAAAAGAGGGAGTAGCAGCCAAGTTTTACACTCGCCCCCTAC +GACTAGCCTGAAGATAAGCTCTAATAATAGGTTTGCCATTCTGGACACGGATATTTCTAC +TAACGAAGAAAGCGTGGAAGGCATGATGATAGAGGGTGCTGATATTGACAGTGCCCATAT +GGATGATTCTCAACTCGATGGTTCCAATACTGGTCGAAACTTGCAGGAAACACACAATAC +AGCCAATCAACTTAATGATCACAAAAAACCACCACAAATTGTTGTAAATATCAGAAACTT +GAATGATCTGTTTGAGCTTATAAAAGAAAAGACAAGCTTAGATAACGTTGTCGTTAAAGC +TAATCAAGGGGAAACGGTCAGAATATTTCCAAAAGACAGCGACACTTACAGGAAAATAGT +GAGCCATATGGATGACATTGGTATTCAGTTTCACACTTACCAAATGCTGACAGATAAGCC +ACACAGAATTGTAGTAAGGGACTTACATCACAGTACATCAAACAAAGACATAACCGCCGA +TCTGAAATGTTTAGGCTACGAAGTGCTCCACATTCACAACCCTAGTTCTAGGACTAATAA +GGACGAAAAACTAAACATCTTTTTCATTAATATAAAGCCCTGTGCAAAAATTAATGAAAT +TTACCATGTCAAGACCCTTTGCCGACAGAAAATACGGATTGAAAGGATGAGAAAGTCTTC +TGAAATTGCGCAATGTCGTCGTTGTCAGGAGTACGGCCATACAGCTAAATACTGCCGCAG +ACACCCAAATTGTGCCAGATGTGGCGAAAATCACCAAACCATGCAATGCACCCGACCGAT +AGACGCACTGCCCACATGTTACCATTGCTCTGAAAATCATACGGCTAGCTTCAAAGGTTG +CCTAAAGTATCAGGAGCTTCTTCGCAGATCTATGGGGCCTGCAAGAAATGGAAACAGGTT +AAATAAGAACACCCATCATCACTCTCCTAGAGACCGGCAAGAGCTTCCTGCCTTGCAGCC +CAATTACCGCAAGAACAACACCCAATCAACAGTACAGCAGTTATCGACACAACCACAGCT +TAATTTTGCCCAAAGCCAACCATCTATAGGCACTGGTGGAAACAGAGCAGTATCCTATGC +TACAGTAGTAAAAGGATACCCAAAAATAGCGCCCTCCAAGGACGGACCAGCCCAGCGTCA +ACGCTTAAACAACCCACAAACGAAACAAATACTGCAGCAACACCGATCGAATACACAGCA +GAATAACTCATCTGATGTGCAAGTATTCTTACAACAGCAACAACAACAGTTTCTGGAATG +GCAACAGCAGATCCAACAACAACAACACCAACAGTTTCTTATGTGGTTGCAACAGCAGCA +GCAAGAACAACTACAGTATAAAAGCCAAACCAATCAACGACTGGAAAAGCTTGAAAAAAT +GGTTCTTGAACTAGCGAATATGTTAAAAGAATGGGCTGGGAGTGAACTTAAGCCCCAGCT +CTTTAACAACGTCTCAGCCTCCCTATGAATCCACTAAAGATTCTTATTTGGAATGCTAAC +GGCATTTCAAGAAAAGCCAAAGATGTTGAGCTGTTCGCGCACAACAAAAAGATAGACATC +CTTCTTGTGACTGAACTAAGACTCAAAAGAGGGGAAACTGTAAAGATATATGGATATGCG +TACTATCCAGCATATAGGCCATCCCTTAATAATAATAGTGTTGGCGGAGTAGCGGTGTTC +GTGAGGACAACTCTTCGCCACTTTCCACAAAGGGTCATTGAGACACGCCACATACAATTG +TCATCAGTAAAAGTAGCCACAGGACTCGGGGACCTGCAGTTTAGCGCTATTTACTGCTCC +CCAAGTACTAGAATCGAGGAAAGACATTTTACTGACATAATACGCGCCTGCGGCCAAAGG +TACTTGGTAGGTGGCGACTGGAATGCCCGCCACTGGCTTTGGGGCGACACTTGCAATTCA +CCTCGCGGGCGGGAACTAGCAGAAGCCTTGTCCGTGACTGGAGCTAAGATCCTCGCAACT +GGCTCTCCGACAAGGTATCCGTATGTGCCCAGCCATACGCCCTCATGCATAGATTTCGCA +GTGTATCATGGTATACCAGACCACCTAGCAACTATAACACAAAGCTGGGACTTGGATTCT +GATCACTTGCCTCTTATCATTAGCATTGAGACAGACAGTATTCATGTCAATCCAAGTCCC +AGGCTAGTCACCAAACACACTGACCTCCTTGCCTTTAGCCGACAATTGGAGAGCCTTATT +TCGCTGAACACCACGCTTAATTCTGGTGAGGAAATTGAAATGGCTGTTGACAACCTAACT +GAAAGCATACATAGGGCCGCGGCTGTCTCTACTTCTCCCGTCCCTCGGATAGGCACCACA +TATGGGATAGTCTTGACAAGAGAGGCTAGAGAGCTTCTGACACAGAAAAGAAGACTCCGA +AGGCGAGCAATCCGATCTCAAGACCCCTGGGACCGACTTTTATGGAACCGTGCTGCAAAG +CAACTACGAAACGTCCTCAGAGAACTTCGAAGCAACTTTTTTGAGCAGAAACTAGCTAGT +ATGGACTACACAGTGGATGCTGGATACTCGCTATGGAAATGCACCAAGTCCCTTAAAAGA +CAGCCGTTTAGACAGGTTCCTATAAGGTGTCCGGGAGGCGAACTTGCTAAAAATGAAGAG +GAGCAGGCTAATTGTTTTGCAAATCATCTGGAGACAAGGTTCACCCACTTCCAATTCGCT +ACAACGGAGCAGTATCAAGAGACGCTTGATAGCCTAGAGACACCTCTGCAAATGTCACTA +CCCATTAAGCCCATCAGGGTTGAGGAAATTGTCGAAGCTATCAAATCTCTTCCGTTAAAG +AAGTCTCCTGGCATCGACAACGTTTGCAATGCCACACTAAAAGCACTACCTGTTCGAGCA +ATTCTCTACTTGGCGCTGATATATAATGCCATACTCAGGGTGCAGTTTTTCCCAAAGCAG +TGGAAAATGGCAGCAATCCTAATGATACATAAGCCTGGTAAACCTGAAGAGAGCCCTGAA +TCGTACCGACCCATAAGTCTTTTATCTTCGCTATCCAAGCTATGGGAACGACTGATTGCC +AACAGATTAAATGACATTATGACCGAGCGTCGTATCCTGCCGGATCATCAGTTTGGCTTT +CGTCAGGGACACAGTACTGTGGAGCAGGTACACAGACTGACAAAACATATCCTTCAGGCC +TTTGATGATAAGGAATACTGCAATGCTGTGTTCATTGACATGCAACAGGCATTCGATAGG +GTCTGGCATGACGGCCTTATCAGCAAAGTTAAAAAGTTATTCCCAGCACCATACTATGGA +GTCCTAAAATCATACTTGGAAGATCGGAGATTCATGGTCAGGGTCAGAAACTCCTACTCG +ATTCCCCGCGTTATGAGAGCTGGAGTTCCGCAGGGCAGCGTACTGGGACCGTTGCTCTAC +TCAGTATTTACTGCAGATCTGCCCTGCCCAAACGCCTATCATATGGCAGATCCCAGGAAG +GCCCTTCTTGCTACGTACGCTGACGATATTGCCCTGCTGTACAGCTCTAATTGTTGCAAC +GAGGCAGCAAGGGGTCTCCAAGAGTACCTCACCACTCTGGCTGCATGGTGCAAAAGATGG +AATTTAAAGGTCAATCCGCAAAAGACCATCAATCCCTGCTTCACCTTGAAGACCTTAAGT +CCCGTCACCGCACCCATAGAGCTGGAAGGTGTAATCCTAGATCAACCTTCACAGGCTAAG +TACCTCGGGATTACCCTTGATAAACGGTTGACTTTCGGCCCGCACCTGAAAGCTACGACT +CGGAGATGTTATCAAAGGATGCAACAACTTCGATGGCTGTTAAACAGAAAAAGCACCATG +ACACTGAGAGCCAAAAGAGCAGTCTACGTCCACTGCGTAGCCCCGATCTGGCTGTACGGA +ATACAGATCTGGGGTATCGCAGCAAAATCCAACTACAACCGCATTCAGGTATTGCAAAAT +CGTGCCATGCGTGCAATTACAGACTGCCCATACTATGTACGTGGCACTACCCTTCACCGT +GATCTGAATCTTCATACAGTGGAAGAGCAGATCTCCAGGCACACCAGCAGATATAGTGAT +AGACTAAGACGACACCACAGTATACTTGCTAGACGCTTACTCCCTGCTAGGCCTCTAAGG +AGATTAAAAAGGAAGGGTTTCGCCAAAACACTTGGACAACCCTAAAGACCCCCTCGAAAT +ATGAGACAAAGTTGTAAGTCCTCACATGATTAGTGAGAGGTTTGGTTCTATCTTTTATAT +GTTAATTGCGCTGTTATGTTACTGTTATTGCATTGTATTGATTCATCGCTTCTAAATAAA +TAATAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA +>DMU89994 +AGTTAACACAATCACAAAACACCCGAAATATAGTCGTAAGCCTCAAGTGCTTTTCCCATC +TATAGATCGAGCTTTACCTATAAGAAACTGTAACTTGTTAAGCTTTAGAGATAAGAACTC +TTGCTATACTTAAGTCAGTCGATTTTGGAAGATTAGAAGCGTCGGTCATCGCCACGTACT +TACTATTCGTCTCATTAAGTGCAGACCGCGCAAGCCTATTGTAATTAATAAACTTACGCT +AATAAATATATGGAAAATCTACTAAAATGATAATTGGCGCCCAAACGGATATAAAAACCT +ACGATAACTGAATAATTATAAATAAATAACAAAAGGAGGATCCGGAGACAAAACCAGCGG +CTTTGGCTAATTAACTCTAACCTAAGAAATAAAAATTTGCTGATTACATAAAATATAATA +TTAATTACTAAGACCATCTACCTTAAAATTGTTTGTTAATCACTATTATTATATTGTAAG +TATAACGCTTATTGAACGAATTAAAAATATTATTATTATTATTATATTATAACCTATGCA +AAGAGTATTGATAATAAAAATACATGAGTGACAGTGATAACCTTTTAGACAACCTAGTGT +CAAGCTTAAATAAATGGTCAGCGCACCAGGCAAGTAGGCAAAACAGTGCAGAAAAAAATA +ATAAGTCATCAGATAATTGGTGGTCAAAAACAAAGACAACTAGCGAAATGGAATTTGAAG +CTCAGTTAAAAGCGATCGTAGAGAGTGCTGTTGCCGGTGCGCTCGCAGTCCAAAAACAAT +CATTTGAAAAGCAATTGCAGGAGATGAATGAGCGAATCGGGAAATTAACAGTGAACACCC +CAGAGGTGGAAACTTATGTAGATGCTGAAATTAGACCAGGTGTTGTCTGTAGCGAGCCTC +TAGATATACTTAAATCTCTGCCAGATTTTGATGGCAAAAGTGAAACATATGTGTCGTGGA +GAAAAGCGGCTCATGTCGCTTTTAAAGTTTTCAAAGATTACGAGGGAAGTTCAACATTTT +ACCAAGCTCTTGGTATTATGCGAAATAAAATAAAAGGTCCAGCGAATACAGTATTGGCTT +CTTTTAATACTCCGTTACATTTCAAAGCAATGATCAGCCGTCTTGATTTCACATATTCTG +ACAAAAGGCCGATCTATCTAATCGAACAAGAGCTATCAACTTTGCGACAGGGAGACATGA +CTCTTACTGAATTCTACGATGAAGTCGAGAAAAAACTGACCCTACTTACCAACAAGACAA +TAATGACATTTGATAGTGCCTTGGCGATGTCACTGAATGAAAAGTACAGGACGGACGCGT +TACGTGTATTTGTAACCGGAGCTAAGAAATCGTTGAGCGACATTCTTTTTGCAAAAGGTC +CAAAAGATTTACCAACTGCTCTCGCTTTAGCGCAAGAGGTCGAGTCGAACCATGAGCGTT +ACCAATTCGCCCTTATTTATTCTAAAAATATTGGAGACAGGGGTCAGAAAATCGAACAAA +GGCACAGCGATAAGGATAGAAACTCAATCATGCCCATGCAAACTAAAAACCCATATTTTA +GCAAGCGTCAGGTGCATACTTATGATAACCAGGAAAGACAAGATCCAGTCCAGTTAACAA +ATCCTGATGTATCCATGCGATCTAGAAGAACTGGAAATTTTGGACAAACTCCATTTCCGA +CTCAGGGAAATATTTGGCCATCCCAACAGCAAAATTCTTGGCCATCTCAACAACAATATT +CTTGGCCATCCCAACAACAAAATTCATTTCGAACACAAAATCAATTCGCATCGCAACCCC +AACAGCAAAACACAAGTCAGGCTCAGGGACATTTTGGGTATGCGCAAGCATCAAAAAGAC +CAACGAGTGGCAGTGCAAGGTTTACAGGGCCAAAACAGCAGAGGATCAACTACTTACCTC +ATGAGAAAGGTCAATGTGAGGAAGATACAGACGGTTATCAAAAGGAGGCAGAAGCGGAGG +TTGATGATTATGAGGACGAACTAGTGAATTACGATCATGTTCATTTTTTAGCCACAAATC +CCTGCTACCGTACATAGAAAGAGAGATAGCAGGGAGAACCATAAAACTTTTGATTGACAC +CGGGGCTTCGAAAAATTACATACAGCCCCTCCCTGAATTAAAAAACATAATGCCGGTACA +AAATAAATTCACGGTAAAATCGCTTCATGGTTGCAACACCGTCAAACAGAAATGCTTTAT +TAAGCTATTTAACACATCTGTTCAATTCTTTATTCTTCCAAGTCTCTCTAGTTTTGACGC +AATAATAGGACTTGACCTTTTGAAACAGGGAAATGCAACGTTAGATTTTAAGAACAAAAC +GTTGAATATCAACAATGAAGTGGAATCTATTCAGTTTTTGAGATGTGACAGCGTAAATTT +CGCCAACATAGAGAATATTGTGGTTCCAAATCAGATATCTAATAAATTCCATACAATGCT +TCGAAACCGATTGGCCGTCTTTGCGGAACCGGAAGAAGCACTGCCGTATAATACCAACAT +TGTTGCCACAATACGTACTGAGGACGACCAACCCATTTACTCAAAACTCTATCCGTACCC +CATGGGCGTATCGGATTTTGTGAATAAGGAGACACATGCTTTGTTAAAGGACGGAATTAT +CAGGCCCTCGTCGTCACCTTACAACAATCCGGTTTGGGTAGTCGATAAAAAAGGTACAGA +TGAAGAGGGAAATACTAAGAAAAGGTTGGTTATAGATTTTAGAAAACTAAATTTAAAAAC +AATCGACGACAAGTACCCTATACCAAACGTAGTATGGATCTTGTCAAATTTGGGAAAAGC +CAGATTCTTTACAACCCTTGACCTTAAATCGGCGTTTCACCAAATTCTGCTCGCAGAAAA +GGATAGAGCGAAAACTGCCTTTTCAGTAGGAAATGGAAAATACGAGTTTTGCCGTTTGCC +GTTTGGCTTGAAAAATGCCCCAAGTATTTTTCAACGTGCTATTGATGATGTTGTTAGGGA +CCGTATAGGAAAGTCATGTTACGTTTACGTTGACGACGTAATAATATTTTCAAACGGAAT +TGAGGACCACGTAAACGACGTTGCTTGGGTACTAGACAGACTGTCTGGGGCAAACATGAG +GGTTTCTAAAGAGAAATCGTTTTTCTTCAAGGAAAGCGTCGAGTATCTCGGATTCATGGT +GTCAAGTGGAGGTATCACAACCAGTCCTAGCAAAGTAGAGGCTATTCAGAAATATAATCA +ACCTACTAATCTGTTTAGTGTTCGATCGTTTTTAGGGCTAGCAAGTTATTACCGCTGCTT +TATTAAGGACTTCGCCTCTATTGCTAGACCACTCACTGACATTCTGAAGGGTGAAAACGG +AAAGGTTTCCGCAAGCCAGTCTAAAAAGATACCAATTTCTTTCGATGAAAGACAATGTTC +TGCTTTTGAGAAGCTTAAAAATGTTCTTGTCTCCGAAAATGTAATGTTATTGTATCCCGA +TTATAGAAAAGCCTTTGACTTAACAACAGACGCTTCGGCTTTTGGCCTGGGGGCAGTCTT +ATCACAGGATGGCAAGCCTGTTACAATGATTTCGAGAACTTTACAGGATAGAGAACTTAA +TTTCGCAACAAATGAACGAGAACTTTTGGCCATCGTTTGGGCTTTAAAGTCTCTTAGGAA +CTATCTATATGGTGTCAAAAACTTAAACATTTTTACAGATCACCAGCCGTTAACATACGC +CGTGTCAGATAGGAATCCAAATGCAAAAATCAAGAGATGGAAGGCGTTTATAGACGAACA +TAATGCTAAAATTTTCTATAAACCTGGCAAGGAGACCTATGTTGCCGATGCACTATCCAG +GCAGGCTATTCATGTCCTAGAGGACGAACCCCAGTCAGACATTGCAACAATACATAGCGA +AATTTCATTGACTTTTACAATCGAAACTATCGACAAGCCGGTTAACTGTTTTAGAAACCA +AATTGTGATAGATGAGGGCACCGCAGACTCAACTCGAACTTTTGTTATTTTCGGAAGCAA +GACAAGGCATCTAATACAGTTTCTAGACAAAGAGACCTTAATCGGAAGAATTCGTGATGT +GGTTAAGCCGGATGTAGTGAATGCGATACACTGCGAATTACCTGTACTAGCTTTCATTCA +AAACAGTCTTGTAAATGACTTTCCAGCAACAACCTTCCGACACACTATGAAAATGGTCAG +CGACATTTTTAATCAAACTGAGCAACGGGAAATAGTGTCTTTGGAGCACAACAGAGCGCA +TAGGGCAGCACAGGAGAATGTAAAACAAATTCTTCAATACTACTTTTTCCCTAAAATGTC +ACAAATAGCCGCTACCTTTGTTTCTAACTGCTTGGTTTGTCAAAAAGCCAAATACGACCG +CCATCCGCAAAAGCAAATCCTCGGGAGAACACCTATTCCGTCACATGTAGGCGAGACATT +GCATATTGATATATTTTCTACGGGCAGGAATTACTTTTTGACATGTATTGACAAATTTTC +CAAATTCGCTATTGTGCAACCAATCGGCTCTCGAACGATAACTGATTTAGAACCTGCAAT +TATGCAACTAATGAACTTTTTTCCCCATTCAAAGACAATATTTTGTGACAATGAACCGTC +CATAAATTCCGAGTCAATCAAGTCACTTTTGAAAAATCGTTTTAATGTTGACATAGCGAA +CGCACCTCCACTTCATAGTACCTCAAACGGACAGGTTGAAAGGTTTCACAGCACGCTTTT +AGAAATAGCTCGATGCCTGAAACTTGACAGTGGAATGAATGATACAGTCAACCTTATTCT +TCAGGCAACAATAGAATACAATAAGACGGTGCACTCAGTCACCAATAGAAGACCGATCGA +CATTATTCATTCAACTCCTCCCGAATTGGCTAACGAGATAGTAGAAATGGTTAACGAAGC +TCAGGAAAAACAGCTAAGAAGAGAAAATGTAACAAGACGAGACAGAACCTTTGAGGTGGG +AGAAACCGTCATGGTAAAACAAAACAATCGCTTGGGAAATAAACTAACCCCACGGTATAG +GGAAGAACTAATCGAAGCAGACCTCGGGACAACGGTCCTCATAAAAGGGAGGGTCGTTCA +TAAAGATAATCTACGCTAGGTTTAGTATTTCTTTTCCTTTTGTGACCATCGCCAAGTTAG +CAAAATACAAACGTGAAATCTGAACACTAGTAAAAGAGTTTGCAAACATTTTTCAATTAA +ATATTTGTCAAATCCTTCTTATTTAATCTTTAAACATTTTGTATTATTTCCGCTTCATCC +TCTTTAGAAAATTTTAAAGGTATGTGATGAAATGCTAGACCCGAATGATTTGAAAACTTA +AAGTCCACGCAACCACAAATATTTCCTGAAACTACCATAGAAAATAAATGCATTACCAAA +ACGGCATAATAACAGTATAGCGCACTCACTCTAATTAGATTTCAAATTCCCGATTAAAAA +AAAAATAAAACACTAATGTTATCAATACCCTTTCCTGATTCTGTTCAACTAAAATAGGAA +AATCAATACTTGCAATCAATAAGCGTTTTACTACATACTTTAATATCAAAATATCTGAAT +GAACTTTATTATAAAATTATAATTGTTATACTTAATTATTGTCAAAACTTTAGTATTAAA +ACTGTAACTACCTCTTAAGTAGATGAGAAGAGTAGAAGAGGGAATTAAGATCTATCAACG +TAGTATCTGCTAAAGACGTAAAGATGCGGCAACTATTTCTGCGCCTGGGTACTGAAACGA +CGAACTGAATAATATCTGCCATCAGACGCCAACCAGAGTGCGTTCAACACATACGTTTTG +ATGGTCAACTAGTTCAACCAACATCAGCATCATCGTCGTCAACAAGTCGACGGTTACAAT +AAAGATTTTTTCCAAGTTCGCTACGATCATCTCCAGAACCTTGTTGCGAACCCATGACAT +GGAGAATCAGCAGCATTTACGAACTTCTCGGATCATCCAGACACGCAGAGCTGCCTTCCC +TTCGATGGTTTAACGCAGTACCAGGTTGGCAGTATGGGAACTTAGTGCACAACCAATGTT +ACCCGTAAGATCCGCTTTCAAATAGATTTGCCAATTGTAAAAAGTCTGTGGACAGCCTTC +GTCTTAGAAGGGGAGGAGTTAACACAATCACAAAACACCCGAAATATAGTCGTAAGCCTC +AAGTGCTTTTCCCATCTATAGATCGAGCTTTACCTATAAGAAACTGTAACTTGTTAAGCT +TTAGAGATAAGAACTCTTGCTATACTTAAGTCAGTCGATTTTGGAAGATTAGAAGCGTCG +GTCATCGCCACGTACTTACTATTCGTCTCATTAAGTGCAGACCGCGCAAGCCTATTGTAA +TTAATAAACTTACGCTAATAAATATATGGAAAATCTACTAAAATGATAATT +>DMCOPIA +TGTTGGAATATACTATTCAACCTACAAAAATAACGTTAAACAACACTACTTTATATTTGA +TATGAATGGCCACACCTTTTATGCCATAAAACATATTGTAAGAGAATACCACTCTTTTTA +TTCCTTCTTTCCTTCTTGTACGTTTTTTGCTGTGAGTAGGTCGTGGTGCTGGTGTTGCAG +TTGAAATAACTTAAAATATAAATCATAAAACTCAAACATAAACTTGACTATTTATTTATT +TATTAAGAAAGGAAATATAAATTATAAATTACAACAGGTTATGGGCCCAGTCCATGCCTA +ATAAACAATTAAATTGTGAATTAAAGATTGTGAAAATAAATTGTGAAATAGCATTTTTTC +ACATTCTTGTGAAATAGCTTTTTTTTTCACATTCTTGTGAAATTATTTCCTTCTCAGAAT +TTGAGTGAAAAATGGACAAGGCTAAACGTAATATTAAGCCGTTTGATGGCGAGAAGTACG +CGATTTGGAAATTTAGAATTAGGGCTCTTTTAGCCGAGCAAGATGTGCTTAAAGTAGTTG +ATGGTTTAATGCCTAACGAGGTAGATGACTCCTGGAAAAAGGCAGAGCGTTGTGCAAAAA +GTACAATAATAGAGTACCTAAGCGACTCGTTTTTAAATTTCGCAACAAGCGACATTACGG +CGCGTCAGATTCTTGAGAATTTGGACGCCGTTTATGAACGAAAAAGTTTGGCGTCGCAAC +TGGCGCTGCGAAAACGTTTGCTTTCTCTGAAGCTATCGAGTGAGATGTCACTATTAAGCC +ATTTTCATATTTTTGACGAACTTATAAGTGAATTGTTGGCAGCTGGTGCAAAAATAGAAG +AGATGGATAAAATTTCTCATCTACTGATCACATTGCCTTCGTGTTACGATGGAATTATTA +CAGCGATAGAGACATTATCTGAAGAAAATTTGACATTGGCGTTTGTGAAAAATAGATTGC +TGGATCAAGAAATTAAAATTAAAAATGACCACAACGATACAAGCAAGAAAGTTATGAACG +CGATCGTGCACAACAATAATAACACTTATAAAAATAATTTGTTTAAAAATCGGGTAACTA +AACCAAAGAAAATATTCAAGGGAAATTCAAAGTATAAAGTCAAGTGTCACCACTGTGGCA +GAGAAGGCCACATTAAAAAAGATTGTTTCCATTATAAAAGAATATTAAATAATAAAAATA +AAGAAAATGAAAAACAAGTTCAAACTGCAACATCACACGGCATTGCGTTTATGGTAAAAG +AAGTGAATAATACTTCAGTGATGGACAACTGCGGGTTTGTCCTTGATTCTGGTGCTAGTG +ACCATCTTATAAATGATGAGTCGCTGTATACCGACAGTGTGGAGGTTGTGCCTCCACTTA +AGATTGCAGTGGCCAAGCAAGGCGAATTTATTTATGCCACTAAGCGTGGTATTGTCCGAC +TACGGAATGACCATGAGATTACACTGGAGGATGTACTCTTTTGTAAGGAAGCTGCTGGTA +ATTTGATGTCCGTAAAGCGTCTCCAAGAGGCAGGAATGTCGATCGAATTTGACAAAAGCG +GTGTAACCATTTCGAAAAATGGGTTAATGGTTGTCAAAAATTCAGGTATGTTAAACAATG +TACCTGTGATCAATTTTCAAGCATATTCTATAAATGCTAAGCATAAAAATAATTTTCGTT +TATGGCATGAGAGGTTTGGCCATATAAGCGATGGCAAATTATTAGAAATAAAACGAAAGA +ATATGTTTAGTGATCAAAGTCTTCTAAACAACTTAGAGTTATCATGTGAAATTTGTGAAC +CCTGTTTAAATGGTAAACAGGCAAGACTTCCTTTTAAACAATTGAAAGATAAGACCCATA +TTAAAAGACCACTTTTTGTAGTACACTCAGATGTCTGTGGGCCTATTACTCCAGTTACTT +TAGATGATAAAAATTATTTTGTGATCTTTGTTGATCAGTTTACACATTATTGTGTAACTT +ATTTAATTAAATATAAATCTGATGTGTTTAGCATGTTTCAAGATTTTGTAGCCAAGAGTG +AAGCTCATTTTAATTTAAAGGTTGTGTACTTATACATTGACAATGGTAGAGAATACTTGT +CAAATGAGATGAGACAATTTTGTGTTAAGAAAGGAATTTCTTATCACTTAACAGTGCCAC +ATACACCTCAGTTAAATGGTGTTTCTGAGAGAATGATAAGAACCATTACGGAAAAAGCTC +GAACCATGGTTAGTGGTGCAAAGCTAGATAAAAGCTTTTGGGGCGAAGCAGTATTAACTG +CTACTTATTTAATCAACAGAATTCCTAGTAGAGCACTTGTTGATAGTTCAAAGACCCCAT +ATGAGATGTGGCACAATAAGAAGCCATACTTAAAACATTTGAGAGTGTTTGGTGCAACTG +TTTATGTGCATATTAAAAACAAACAAGGAAAGTTTGATGATAAATCATTTAAAAGTATTT +TTGTGGGCTATGAACCCAATGGTTTTAAGTTGTGGGATGCTGTAAATGAAAAATTTATTG +TCGCAAGAGATGTTGTTGTCGATGAAACCAATATGGTTAATTCTAGAGCTGTTAAATTTG +AAACAGTGTTCCTGAAAGATAGTAAGGAAAGTGAAAATAAAAATTTTCCGAATGACAGTA +GGAAAATAATACAAACAGAATTCCCGAATGAGAGTAAGGAATGCGACAACATACAATTCC +TGAAAGATAGTAAGGAAAGTGAAAATAAAAATTTTCCGAATGACAGTAGGAAAATAATAC +AAACAGAATTCCCGAATGAGAGTAAGGAATGCGACAACATACAATTCCTGAAAGATAGTA +AGGAAAGTAATAAATATTTTCTGAATGAGAGTAAGAAAAGAAAGCGAGATGATCACCTGA +ATGAAAGTAAGGGATCAGGCAACCCGAATGAGAGTAGGGAAAGTGAAACAGCAGAGCACT +TAAAAGAAATTGGAATTGATAATCCAACTAAAAATGATGGCATAGAAATTATTAATAGAA +GAAGTGAGAGATTAAAGACTAAGCCTCAGATATCCTATAATGAAGAGGATAATAGTCTAA +ATAAAGTTGTTCTAAATGCTCACACTATATTTAACGATGTCCCAAATTCATTTGATGAAA +TTCAATATAGGGATGATAAATCTTCTTGGGAAGAAGCCATCAATACAGAGTTAAATGCTC +ATAAAATTAATAATACTTGGACAATTACAAAAAGGCCTGAAAACAAAAATATTGTAGATA +GCAGATGGGTATTTTCTGTTAAATATAATGAACTTGGAAATCCAATTAGATACAAAGCTA +GATTGGTTGCACGAGGATTCACTCAAAAATACCAAATAGACTATGAAGAGACATTTGCTC +CTGTAGCTAGAATTTCAAGTTTCCGATTTATATTGTCATTAGTAATACAGTATAACTTGA +AAGTCCATCAAATGGATGTAAAAACAGCTTTCTTAAATGGCACGTTAAAAGAGGAAATTT +ATATGAGACTTCCTCAAGGTATATCGTGTAATAGTGACAATGTGTGTAAATTGAATAAGG +CAATTTACGGACTCAAGCAAGCGGCTAGATGCTGGTTTGAAGTATTTGAGCAAGCATTGA +AAGAGTGTGAGTTTGTAAACTCTTCAGTTGATCGCTGTATATATATTTTAGACAAAGGTA +ACATCAATGAAAACATATATGTATTATTATATGTAGATGATGTGGTTATAGCTACAGGAG +ATATGACAAGAATGAATAACTTCAAAAGGTATTTAATGGAAAAGTTTAGGATGACTGACC +TAAATGAAATAAAACATTTTATTGGAATTAGGATAGAGATGCAGGAAGATAAAATCTATT +TAAGCCAATCTGCATATGTTAAAAAAATTTTAAGTAAATTTAACATGGAAAATTGTAATG +CAGTTAGTACTCCTTTACCTAGTAAAATAAATTATGAATTACTTAATTCAGATGAAGACT +GCAATACCCCATGCCGTAGCCTCATAGGATGTTTAATGTACATAATGCTTTGTACACGCC +CAGATTTAACTACTGCAGTAAATATCTTGAGCAGATATAGTAGCAAAAATAACTCCGAAT +TATGGCAGAACTTAAAAAGAGTTCTTAGATATTTGAAGGGCACTATCGATATGAAATTGA +TTTTTAAAAAGAACTTGGCATTTGAAAATAAAATTATTGGTTATGTGGATTCTGATTGGG +CTGGTAGTGAAATTGATAGAAAAAGTACAACAGGGTATTTATTCAAAATGTTTGATTTTA +ATCTCATTTGTTGGAATACAAAGAGACAGAACTCAGTAGCAGCCTCATCAACTGAAGCTG +AGTATATGGCCCTATTTGAAGCCGTGAGAGAAGCTCTATGGCTTAAATTTTTATTAACTA +GTATTAACATTAAACTAGAAAACCCCATTAAAATTTACGAAGACAATCAAGGCTGTATTA +GCATAGCAAACAACCCCTCATGTCATAAACGAGCTAAACATATTGATATTAAATATCATT +TTGCCAGAGAGCAAGTTCAGAATAATGTGATTTGTCTTGAGTATATTCCTACAGAGAATC +AACTGGCTGACATATTTACAAAACCGTTGCCTGCTGCGAGATTTGTGGAGTTACGAGACA +AATTGGGTTTGCTGCAAGACGACCAATCGAATGCTGAATGAAATTTTTATATATATTTTT +CAAATTTAAATTCCTGTAAACATATTTTGTTACAATGATCTGATCGGGTTTTTCTGGGTT +TTCCCCGTATCCTCGCAGCAAATGCTGGATCAGTTAACACTTCCCAGAATGCACACCACC +CACATTTGATAGTTACTAATGAATATTATTGTTATGTTTTTAATTATAGACGTTATTTTT +GAGGGGGCGTGTTGGAATATACTATTCAACCTACAAAAATAACGTTAAACAACACTACTT +TATATTTGATATGAATGGCCACACCTTTTATGCCATAAAACATATTGTAAGAGAATACCA +CTCTTTTTATTCCTTCTTTCCTTCTTGTACGTTTTTTGCTGTGAGTAGGTCGTGGTGCTG +GTGTTGCAGTTGAAATAACTTAAAATATAAATCATAAAACTCAAACATAAACTTGACTAT +TTATTTATTATTAAGAAAGGAAAATAAATTATAAATTACAACA +>DMW1DOC +GACATTCGGCATTCCACAGTCTTCGGGTGGAGACGTGTTTCTTTCAAGCTACGAATAGCA +AGTTCTAAAAACTACAACAGTATAGTGAAAGTTAAACACAAAGTGTAAAGTGCAGTTTGC +ACAACTAACAATTATTGACTATAGTAATTATTTACTAAAATAAATAATTATTCCATATTG +TTCTGGTAATTGTTATATGTGGACTTAGAACAATGAATCAAAACGACATACGTTCTCAGC +GACAATGTGAACAAGACGAGCGCCGGCTCTCTTTACAACGCAACAATGCATACTTTTCTT +TCGTCTCACCGCAAATCGGTGATCGAGCACCCTCACCTTCAACTAACTCGAAACTTTTGC +CCTCAGCGAACGACAGACCGCGTTCTTGCTCTCCCTCTCTGCCTGCTTCGGCTCACAAGT +CGTGGAGCGAAGAGACCGCCTCTCCTACCCCGCTCCTCTCGCAGCGCCAAACGACCGTCC +CGGGTAACTGTAACACTGCAATAACGAGTGCAGTGACCTCACTGGCAACTGCCACAACAT +CAACTTCGTCAGCGGCCCAACTAATTATCGCTGTGCCAGCTGTAAATAATTCAGCAGCAC +TGACCGTTTGCAACAACAATAATGCACGTAAAGAAGAATCAAAACAAAAGCAGAAGTCGA +TTTCGACTGTGCAGACTGGCATGGATCGCTACATCCAAATCAAGAGAAAGCTCAGCCCTC +AAAACAATAAGGCAGGTAATCAACCCAAAATCAATCGAACCAACAACGGCAATGAAAACT +CTGCAGTAAATAATTCAAACCGATATGCTATCTTGGCTGATTCTGCGACCGAACAACCCA +ACGAAAAAACGGTAGGGGAACCAAAAAAGACCAGGCCTCCACCAATTTTCATACGAGAAC +AAAGTACAAATGCACTTGTAAATAAACTCGTTGCTTTGATTGGTGACAGCAAGTTCCACA +TTATCCCACTTAAAAAAGGAAATATTCATGAAATAAAACTACAGATCCAAACAGAAGCAG +ACCACCGTATAGTGACTAAATACCTAAATGATGCTGGTAAAAACTACTACACATACCAAT +TAAAAAGTTGCAAAGGGCTACAGGTAGTACTTAAGGGCATTGAAGCAACAGTGACACCAG +CTGAGATAATTGAGGCTCTGAAGGCCAAAAACTTTTCTGCAAAGACAGCTATTAATATTT +TAAACAAAGACAAAGTTCCGCAGCCACTATTCAAAATAGAACTCGAACCAGAGCTCCAGG +CACTAAAGAAAAACGAAGTGCACCCAATATACAATTTACAGTACTTGCTACATCGGAGGA +TCACCGTGGAGGAGCCGCACAAACGTATCAATCCAGTTCAATGTACTAATTGCCAAGAAT +ACGGCCACACCAAGGCATACTGCACCCTTAAGTCCGTATGTGTTGTCTGTAGCGAACCTC +ATACTACCGCAAACTGCCCCAAAAACAAGGACGATAAGTCTGTGAAGAAATGCAGTAACT +GCGGGGAAAAACATACTGCAAACTACAGAGGCTGTGTGGTGTACAAAGAATTGAAGAGCC +GCCTAAACAAACGTATTGCCACAGCACATACATACAACAAAGTCAATTTCTACTCTCCGC +AACCGATTTTTCAACCACCCCTAACTGTCCCAAGCACTACTCCAACAATTTCTTTCGCTA +GCGCCCTAAAATCCGGACTAGAAGTGCCCGCCCCACCGACAAGAACTGCTCATTCCGAAC +ATACACCGACAAACATCCAACAAACACAACAAAGTGGCATCGAAGCTATGATGCTATCCC +TACAGCAAAGCATGAAAGACTTCATGACGTTCATGCAAAATACTTTGCAAGAGCTCATGA +AAAACCAAAATATCCTGATTCAACTTCTTGTATCTTCAAAATCCCCATAATGGCTTCCCT +ACGGATATCTCTGTGGAACGCAAATGGCGTTTCACGGCATACACAAGAGCTCACACAGTT +CATTTACGAAAAAAACATCGACGTAATGCTACTATCAGAAACGCACCTCACAAATAAAAA +CAATTTTCATATACCAGGATACTTGTTCTATGGTACAAATCATCCAGATGGTAAAGCTCA +TGGAGGCACTGGAATACTCATCAGAAATCGCATAAAACACCACCACTTAAACAATTTTGA +CAAAAACTACTTACAATCTACGTCCATAGCCTTACAACTCAACAATGGTTCAACGACTCT +AGCCGCAGTCTACTGCCCACCGCGCTTTCCAATCTCTGAGGATCAATTCATGGAATTCTT +TAACACACTAGGTGACAGGTTCATCGCAGCGGGTGACTATAACGCCAAGCACACCCATTG +GGGATCTCGACTTGTGTCGCCAAAGGGTAAGCAATTGTACAATGCGCTTACGAAGCCAGA +AAACAAGCTAGACTATGTATCCCCGGGTAAGCCTACATACTGGCCAGCAGACCCAAGAAA +AATCCCAGACCTGATCGATTTTGCAATTACTAAACATGTCCCCCGCAACATGGTCACCGC +CGAAGCACTAGCAGATTTATCATCAGATCACTCACCTGTTTTTCTAAATATGCTAACTCG +CCCCCACATCGTCGACCCACCGTATAGACTCACAAATTTTAGAACAAACTGGCCAAGGTA +TCAAAAGTATGTCTGTTCACACATAGAACTAACGACGGCATTATCTACAAAGGAGGATAT +AGACAAGTCAACGGAAACTCTTGAAAACATTTTAGTTTCGGCTGCAAAGGCTTCAACCCC +GCCAGTGACGTATGCAAAACCAAACTACATCAAAACTAATCGCGAAATCGAGCGGCTGGT +ATTAGATAAACGACGCCTACGAAGGGATTGGCAGTCTAATAGATCACCAATTACTAAGCA +CATGCTTAAGATAGCCACACGCAGGCTTACCAATGCTCTCAAACAAGAGGAAAAAAACAG +CCAACGTTCATATATCGAGCAACTCTCTCCCACCAGCACTAAGTACCCTCTTTGGAGAGC +TCACAGAAACCTAAAGACTCCAATAGCGCCAATTATGCCACTCCGAAGTCCCTCTGGCAC +CTGGTTTCGAAGTGATGAAGAAAGAGCCAGTGCTTTCGCTGACCATTTACAAAATGTATT +CCGACCAAATCCCTCTACCAACACATTTATTCTCCCTCCTTTAATAGCAGCCAATCTAGA +TCCTCAAGAACCCTTTGAATTCCGACCATGTGAACTAGCAAAGGTTATCAAAGAGCAACT +GAACCCAAGAAAATCGCCTGGCTACGACCTAATAACTCCAAGAATGCTCATTGAACTCCC +AAAGTGTGCTATTCTTCACATCTGCCTGTTGTTCAACGCAATCGCCAAGCTTGGATACTT +CCCTCAAAAATGGAAAAAGTCGACCATAGTAATGATTCCAAAGCCAGGAAAAGATAAAAC +GCAGCCATCATCATATAGACCGATAAGCTTACTAACATGTCTTTCAAAGCTGTTTGAAAA +AATGCTACTCCTTCGGATTAGCCCTCATCTTAGAATAAACAACACACTTCCAACACATCA +ATTTGGCTTTAGAGAAAAACATGGAACCATCGAACAGGTCAACCGAATCACGTCAGAAAT +TCGTACTGCTTTTGAACATCGAGAATACTGCACAGCCATTTTTCTAGACGTCGCGCAGGC +ATTTGACAGAGTGTGGCTCGATGGACTTTTGTTTAAAATAATCAAGCTGTTGCCCCAAAA +CACACATAAGCTACTGAAGTCATACCTATATAACAGAGTGTTTGCAATAAGATGCGATAC +AAGCACTTCACGCGATTGCGCAATCGAAGCTGGAGTGCCGCAAGGCAGTGTACTGGGTCC +AATCTTATACACCCTGTATACGGCGGATTTCCCCATAGACTACAATCTAACAACCTCCAC +GTTCGCTGATGATACCGCGATACTCAGTCGCTCGAAATGCCCAATAAAAGCCACGGCACT +CCTATCCCGACACTTAACATCTGTAGAACGATGGCTTGCCGACTGGAGAATTTCAATAAA +TGTTCAAAAATGCAAGCAGGTTACCTTTACCTTAAACAAACAAACATGCCCACCACTGGT +CTTGAATAACATATGCATTCCACAAGCCGACGAGGTAACATATCTGGGAGTTCATCTGGA +CAGGCGGCTCACTTGGCGCAAACATATAGAAGCCAAATCGAAACATCTTAAACTTAAAGC +AAGGAACCTCCACTGGCTCATAAATGCTCGCTCTCCACTTAGTCTGGAGTTCAAAGCTCT +TCTATACAACTCCGTCTTAAAACCTATCTGGACTTATGGCTCCGAGCTGTGGGGCAACGC +ATCCAGAAGTAACATAGACATTATTCAGCGAGCACAGTCAAGAATTCTGAGAATTATCAC +TGGAGCGCCGTGGTACCTTCGAAACGAAAACATACACAGAGACCTAAAAATCAAATTAGT +AATCGAAGTAATAGCTGAGAAAAAAACGAAGTATAACGAAAAGCTGACCACCCATACAAA +TCCCCTCGCAAGAAAACTAATCCGAGTATGCAGTCAAAGCCGGCTGCACCGCAACGACCT +CCCAGCCCAGCAATAAACTTATTAGGGCATTAATGAAAAAAAAAAACTATCACTAAGTGA +AAGTTAATTAAGTTAGATTAAGATTTGAACACTTATTGTTAGTCTCTTAACACAAAGGGA +AGATTCAATAAATAATAAAAATTAAAAAAAAAAAAAAAAAAAAAA +>F +AATCAATTAATCAATTCGATCGCCGACGTGTGAAGACGTTTTTATCGTGCTCCGCACAAA +ATCGGTTGTTTTGAGTGAAGTGAACGCCAAATAAAATAAACTAAATAAAAAATCTGAAAG +CGAAAGAGACGCTCTATGCGATGCAAGATCGCTTAAATACATAGTGAATTGTTATCTTAA +ATAATAAAACTATGAGTCAGAATGACACTCGCGCCCAGCGTCAGCGCGAGCATGACGAAC +GCCGACTCTCAATTCAGCGCAACAACGCGTACTTCTCCTACGTCTCACCGACAATCCCAA +ACGCAGACATCGAGCGGTCAATAACCCATAGCCCAGGAAACCTTCTTCTACCAACAAATC +AAGAAAGAGCGCGCTCCTGCTCTCCCGCTCTATTGGCTCCGACAGAAGCCCCGCTACCTC +CAACAACAACAGCTGGAGAGGGACCGGCAGCCCGCTCTGCCTCGTCATCGGCTGCACCCG +CTCACGGTCTGACTAAGTCAGCGAAAGCAAAACCGCTAGCAATAAACGGTACTGCTGCAC +TGCCAGCAAAACAAAACGAAAACGTAAACAAAAAAGCTGGGTCGACCTGGCAGACTGGAA +TGGACCGCTACATTACAATAAAGCGAAAGCTCAGCCCGGAAAATTCAGATTTGGGAAACA +AGCCGAAAAATACACGCGATAACTCTACCTTGATCAAAAATGTAGCCCCTGCAAATACCA +ACAGATTTGCCTTGCTGGTAGATACCGCTGAGGACGTGCCGCTGGGATCCGTTGATATCG +AACCGAAGAAAACAAAGCCTCCGCCAATATACATCCGCGAGAAGAGCACAAGCCGTCTTG +TAAATACTTTGATTGGCCTTATTGGGAAAGATAGCTTTCATATAATTCCCCTCGTAAGAG +GTACTATCAACGAAATCAAACTTCAGACGAAAACGGAGGACGACTACAGAAAAGTCACAA +ACTATTTTACCGCACAAAAAATAGGCTTCTACACCTACCAGCTTAAAAGCAGCAAGGGCC +TGCAAGTAGTCCTGAAGGGCATTGAGTCTGATGTTACGCCCGAAGAGATAACTGAGGCGC +TAAAGGAAAAGGGATTTTACGCCAAAAACGTGTTCAATATCAAAAACAGAAACAGGCAGC +CCCAACCACTCTTCAAGATTGAGCTTGAACCAGAAAACAAGCCTCCTAGAAAAAACGAGG +TTCACCCAATTTACAAACTCCAGCTCCTTTTGCACCGTAGGATCACGGTAGAAGAGCCGC +ACAAACGCAACGCTCCTGTACAATGTACAAACTGCCAAGAGTATGGCCACACGAGGTCAT +ATTGTACACTTCGCCCGGTGTGCGTAGTCTGTGGAGATCTCCACGACTCCAAACAGTGTC +AAATTAACAAAGAAAATGCATGCGAGAAAAAATGTAATAACTGCGGGGGCAATCACACAG +CAAACTACAGAGGCTGTCCAATCTACAAAGAGCTGAAAATCCGTCTTCACAAAAGAATGA +ACACGGCGCGGGCACACCAAGGATCAGCTACCCTGATACCATCAGAGACAAATCCTGAAG +TAATTTTCTCGAAAGCAGCTAGTTTCGCTCCCTGGCCTACATTCAACACTAACAAGACAA +CATTTGCTAACGTTTTAAAATCAGGTATGACGCCTCCAACCCAAAACTCCCGAACTCCAC +ATGAAGTGCACACAAAATTAGACACACAACAAAACTATCACCCAGCTGCGCAGCAGGAAA +CAAAAACTGAAGCTATGATGCAAGCCTTACAACAGAGCATGATGGAATTTATGACATTTA +TGAAGACCACCATTCAAGACATGATGCGTAATCAAAACCTTTTGATACAAATGCTTGTAG +CCCAACAATCAAATAAATAATGGCTACCTTACGCATAGCTACGTGGAACGCCAATGGCGT +CTCACAGCGCAAACTTGAGCTAGCTCAATTCCTACATGAGAAGCATATCGACGTAATGCT +TCTTTCGGAAACTCATCTCACAAGCAAATACAATTTTCAAATAAGAGACTACCATTTCTA +CGGTACAAATCATCCCGACGGAAAAGCACACGGTGGCACCGCCATACTCATAAGGAACCG +TATGAAGCACCACTTTTACAAAGAATTTGCGGAAAATCATCTTCAGGCCACATCTATCAA +CATTCAGCTGGATGACAACACTCTCCTTACACTAGCGGCCGTATACTGCCCCCCCCGTTT +CACAGTATTAGAAGCTCAATTCCTGGATTTCTTCCAAGCACTAGGGCCACACTTCATTGC +AGCAGGCGACTACAACGCTAAACATACTCACTGGGGATCGCGACTTGTGAACCCAAAAGG +AAAACAGCTTTATAAGACGATAATAAAAGCCACTAATAAACTTGACCATGTTTCCCCCGG +GAGTCCTACATACTGGCCATCAGACCTCAATAAGCTGCCAGACCTGATCGACTTCGCAGT +TACGAAAAATATTTCCCGCAGTTTGGTTAAAGCTGAATGTCTGCCGGATCTCTCATCTGA +TCACTCGCCTGTACTAATTCACCTCCGCCGATACGCAGAAAACGTGAAACCACCAACCAG +ATTGACCTCTAGCAAAACAAACTGGCTCAGGTATAAAAAATATATAAGTTCACATATTGA +GCTAAGCCCAAAACTCAATACTGAATCTGATATAGAGAGCTGCACGTGTGCATTGCAATC +CATCCTTACTGCAGCAGCTCTTACTGCAACACCCAAAATAACAAATAATACAATTAATTC +AAAAAAGACCAACGTACAAATCGAGCAACTCGTCCACGTAAAACGTCGCTTACGCAGAGA +ATGGCAATCTTCCAGATCCCCAACTGCAAAACAAAAGCTAAAAGTAGCCACACGGAAACT +GGCCAACGCTCTGAAACAAGAAGAGGACGACGATCAGCGCCGATACATAGAGCAACTCAC +ACCAACAGGCACAAAACAAAAGTCACTGTGGCGAGCCCACTCAACTCTTCGCCCACCGAC +TGAAACCGTTTTGCCGATAAGGAATTCATCAGGTGGCTGGGCCCGTAGTGATGAAGACAG +AGCCAACACATTTGCCGCTCACCTACAAAATGTGTTCACGCCAAACCAGGCTACTAGCAC +ATTCGCGCTACCGTCCTATCCCGTAAACCGCCATCAGCAACACACCCCAATTGTGTTTCG +TCCTAAAGAAATAACTAAAATAATCAAAGACAATCTCAGCCCGAAAAAATCCCCCGGCTA +CGACCTTATAACACCGGAAATGATCATCCAGCTGCCACATTCTGCAGTTCGCTACATAAC +CAAGCTCTTTAATGCCATCACCAAACTTGGTTACTTTCCACAACGATGGAAGATGATGAA +GATCATAATGATTCCAAAGCCTGGTAAGAACCACACAGTCGCTTCATCTTACAGACCAAT +AAGTCTACTCTCATGCATTTCGAAACTATTCGAAAAATGCCTGCTGATCCGACTTAATCA +ACATCTGATATACCACAATATAATCCCAGCCCACCAATTTGGATTTCGCGAAAGCCACGG +AACCATTGAACAGGTGAATCGTATTACAACGGAAATAAGAACTGCATTTGAATATCGCGA +ATACTGTACAGCAGTATTTTTAGACGTATCCCAAGCATTCGACAAAGTCTGGCTCGACGG +CCTAATGTTTAAAATTAAAACATCCCTACCCGAAAGCACACACAAACTTCTAAAGTCTTA +CCTCTATGACAGAAAGTTTGCAGTGCGGTGCAACACTGCCACTTCCACTGTTCATACAAT +TGAGGCTGGAGTCCCCCAAGGCAGCGTTCTTGGGCCAACCTTATACCTCATCTATACAGC +CGACATCCCTACAAATAGTCGCTTAACGGTATCCACATTTGCCGACGATACAGCTATCCT +TAGCCGTTCAAGGTCCCCTATCCAAGCTACAGCACAGTTGGCACTGTACCTCATCGACAT +TGAGAAGTGGCTCTCTGACTGGCGAATAAAAGTAAACGAGCAAAAATGCAAGCACGTGAC +GTTTACGCTAAACAGACAAGACTGTCCTCCGCTCTTGTTGAACAGCATACCACTCCCGAA +AGCAGACGAGGTAACGTACCTAGGAGTACACCTAGACAGAAGACTCACATGGCGCAGGCA +CATTGAAGCCAAAAAAACCCAACTTAAACTCAAAGCCAACAACTTACACTGGCTCATCAA +CTCTGGTTCTCCGCTCAGCCTAGATCACAAGGTCTTGCTCTACAATTCTATATTGAAACC +AATCTGGACCTATGGCTCACAGTTATGGGGCAATGCCAGCAACAGCAATATTGACATCAT +TCAGCGAGCACAATCAAAGATTCTGAGAACCATCACTGGGGCACCGTGGTACGTTCGGAG +TGAAAACATCCAAAGAGACTTAAATATCCCATCAGTTACCAACGCAATCACGGAACTTAA +GGAAAAATACCATAGCAAGCTTCACACGCACCCCAACCACCTAGCGCGAGGTCTAATCCA +GCTCAGCAGCCGTTCCCGTCTCCGGCGAAAGGACCTACCAACCCAGCGAATAAATTATTA +GGGCCGTTTAAACATAGAACAGTTGGAAAAATAATACAACTGTTCAAAAAATACTTGTTA +TAGTTAAGATTTTTAAACTTATTGTTAGTTCTTATACAAGAAGATTCAATAAATAAAAGC +AAAGTAAAATAAAAAAAAAAAAAAAAAA +>FB +TATATTCTATTGCCCACCATATAAACACGTGCCACTTTCCTAGTTTTAGGATCTGCCTAC +ATAACACGTGCAGACGCACAGGTGTTTCTGGGTTTATATAGACCAAAAATTGGTTCCGAT +TGCCAATCTTGTAATTTACAGTTTACCAGGTAATTACATAATTTTCAAACCTCACTTTAT +GATAGGGTCCAATTTTTTACCTGTGACAAAGTGTTAAATTTTTTAAGAATGGGTTTTTCA +TGGCAGGTCAGAATCCTCTATAAAATCTAAAACACTTGTCGGTATTTGAAAATCGCTCTC +CTCCTTGATTCTCATATTAGGTGTAAAAGATAAATCCGGAACTCATAATTAAAATATTTT +TTATGTGAAAAAGTTGTGCGCGATTTTAACTACGCTTACCCAGTGCTGGAAAAGTTAAAG +TTGTTTTGTTTTTCAAAGAAAGTGAAAGTTGCTAAGCACGAACTTAAGAAATCTGAGTGA +TTGTGTTAAATTTATTTGAATCCTTGTGAATTTTGTTGACAGTCTTTTTAAAGACTTGCA +AAATTTTCATATTATTCGGTTCTTGCTTTTATTTTTATACAACGCGTTTTTCCTTTAGGC +ATACCTTTATACATTTACAGTGTAAACAACAGTGTAAAACGTGTAAATCAGTGCAAAATA +GTTTTTTTTATTTACTCCATAAAAAATAAGTGTTACTGTCAGGATGCCGGCCAAACCGCA +AGTCGATGGTCACACCTTAGTGGATGCATTTTGCTGCGCGAATATTTTTACGGAGACTGG +AGCTCTTAAGCCAAGAAGCGATAAAGTTTGGATGGATATAAGCAACCAATTGAAAGGAGC +GATCAGCGCGAAGACGCTTAATTTCTACGCCAGAATCAATAGGAATAACATGATAACTGT +GGTTAAAGAACGATGTGGAATTCAACAGCTGGATACTAGTGCCAATTTAACTTTAAATAG +CACATTTCCTGATGATGACCCGGAGTTCCAGATCACCGAAGCTTCAAAAAATGGACCATT +GCCTATTTTGTACTTTAACCTGGAGTTGGACCTGGAATTGTGGAGATCAATTGCCCCCAA +AAAGGATCAAAAAACTGAAAAACTGCAACCTAACTGGACGGATACTATGGCAAAGTTGAT +ATACAAAAAAGTTCCTCTTCCGTGTGCATTTAATTTTAGAAAAGCTAAACTTTCCGACAA +AGTGGATAATATTTGGCTACGAATTGAAGGCTATTGCAATGACTGCAGCTCAATTTTAAA +GGGACATTGCCTTGTGAAACCCGATGAACAATGCGGCATAATGATATCTGTTTCAGTACC +GGACACACGAGGTATACCTCATAATAAAAAACGACGGTGCACTGGATCGAGACGACTTGA +AATTGGGAACGAGTTGATTTTAAAAAAAGCTGCATTGTGGAGGAAGGAAGCCACCGACAA +CATGAATGATGACGACCCAGAACCGAGTTACATACCAAATTTACCAACCCTTCGGAAACT +TCGTGAAGAGGCAACTAACAGACACCTAGGAATTACCAAGGATCGGGATCCAGTTTCATC +ATTATACCTTAAAAAGTATGAGGGTGAATTGGCTGGATGCATTCTTGACATTGGATTGGA +TGAATTTTTCTGCATATACTGCACAGGAACCCAAGTAAAAACATATGCATCAAGGATAAA +AACTATTAGAAAGATTTCTATTGACGCAACTGGAAGCGTGGTGTTACCCATCCAAAAACC +AAACGGTGACTCTAGTTATGTTTTTCTGTACCAAATTGTAATGGAGGGTGACGACAGTAT +ATTTCCAGTTTTTCAGATGCTGTCGGCTAAACATGACACAGCCAGCATACAGTTTTGGTT +AAGCAGATTTATATCAAAGTCGGGGCATTTTCCACTGGAGGTTGTATCTGATTTTTCCTT +GGCATTGCTAAATGGAATAAGCTTAAGCTTTAATGAGTGTAGGATTGCGACGTATATAAA +AAAATGTTTCCACAGCCTTTTGATGGAGGAACGGACGGATCTGCCACCCTGCTATATTCG +ACTTGACATCGCCCACCTAATTAAAATGATATGCCGGAAGAACGTCTTCAAAAGTAAATT +ACCGAACCTCAAGGATTTTTATACTAGATGTATTGGTCTTGCAACAACGTGTGAGACAAA +GGACAGTTTTGCGGAATTAATTAAATCAGTACTGATTGTCGCACTGAGCCAATCCTCAGG +GGAAGATGAAAAAGGAGACATTCTTTCAAGTTACAGGAATGAAAAGTATCTGCTCGCCAG +AATAGCTACATTTACTGCCCCGGATCACAAGGAGACCATTGAGGACAACTGCATACCAGA +GGACCAGGAGGAAATTGACGAGGATGTTACGGACTTTATCTCTAATATTAAAATCGCTGC +CGAAGAAGAAGCGTTAAATTGCAATTCGGTCAACTGTCGGCCAAATCCGTATTTCCTACC +TGAGCTAATGCCACCATTAATTAAGTTGTGCAAATATTTTGTTTTATGGACAAACGTGAT +GAAGGAAAAGTTCTGTTCCAAATATGATGTCGGCTCTTCGGCTCTTGTGGAAGCCTATTT +CAAGGATTTAAAAAACACGGACATGAGCATATTCCACCGACCAGTGAGAGCGGATAAATT +CGTGGTGCAACATATCCGATGCATCGAAGCTGTTTGCAAGCTGGAACGAGCCGCGATGAA +ACGCAAGACCGTTAAAACTCCCAGCTTTATAAAAGAAAACGCTCCTAAGAAAATGTGCAG +TAAGGAAACCAAGGGATTTCTGGAGGAAATACTTGAAGAAAGCGAAGTGGAATACCTTTT +ACAAGAAGAAAACTGGAAGGTGAAGAATAAAACAATAAAGCCCACGGAAGGAAATGATGC +TGAAGACAACGACACTGATGATGAAAACAAGGAAATGGATTTAAGTGAACAGCCCAAAGA +AAAACCAAGGGGAAAATATCTCAAAAAATGCCCCAATGTGGAGTTATTATACAATCGACC +ACATCGAAGGAAACAGGACGAAATTTTGCATAATGGTGGATCAATGGGACCCGTCTGGAT +TGGCAAACAATTATTGCAATTCAAAAATACTTGTCCGTTTGACTCTCTAGTGGAAATATT +GTCGACCGCATACATAGACAATTTTTATTACAAAAGCCTATTGGATGATTTCTACACTGA +CAACTTGACGATAGAATTGGTGAAAAAGTATGCCGTCGAGGGAGTTTCGTCCAGTCTCTA +CTGCGACAGAGGTCTGGTCCTAAAAAGTTTTTTTGATGAAAAACACCAGATTATAAAATG +CGACGCAAATATTGGGTCTTTTATTGAAAAAGCGCTGAATGGAGTACCCAGTGCGTCAAG +TCATCGGACCCATATAAAAAACAACCATGATTGCAGGAACCAAAAATATATCCACCATCG +GCTGGAGGTTATAGATGTCGAAAAAGTTGGCCACCTCGACGTCCAGGAGGTAGTGATCCC +CTTTATTGATGAGTTTTTTGCAAGAACTGATGGAGAATGTAAAATATGCGGTGGACAACA +GATCCTTGAAAGGCAGCCAGGACCGCATGTCATACTTGATATAGAATTTGCAATGGATGC +TTTTCATCAAATTCATCATAACGGTTTACCAGGAACGACCACTTTACTTCAAGTGCCGGA +GGAAATTTTAATACAGGAAAAGAAATATATTTTAAGTGGTGCCATCGAATATGTTCCTGC +GATGGGAGGGGAAATTGGACATTACATTGCATATTGCCGCAGAGTCATTGGATCTTGGGA +AGTGCACAACGATATGTGCAGGCAATGGAAAAAGTTCTCAGCTCTAAATACCAAAATGAC +ACTCCACATTTTGATATACACCCGGAAAAATTAATGTTTATTTTTAAGCCTTGTTTAAAA +GTGTAAAAAATATTTGTTGTTAAAAATTACAATCTTAAGTCCTTTGCAAACGTTGTTTAA +AAATAAAATTAAATTAATTATTTTACAAAACTTAACCCTTTTTCACTTTTATACCTAATA +TAAAGAGGTCCGTAAAGTATCAAGGAGGAGAGCGATTTTCAAATACCGACAAGTGTTTTA +GATTTTATAGAGGATTCTGACCTGCCATGAAAAACCCATTCTTAAAAAATTTAACACTTT +GTCACAGGTAAAAAATTGGACCCTATCATAAAGTGAGGTTTGAAAATTATGTAATTACCT +GGTAAACTGTAAATTACAAGATTGGCAATCGGAACCAATTTTTGGTCTATATAAACCCAG +AAACACCTGTGCGTCTGCACGTGTTATGTAGGCAGATCCTAAAACTAGGAAAGTGGCACG +TGTTTATATGGTGGGCAATAGAATTTA +>DMTNFB +AGCTCAAAGAAGCTGGGGTCGGAAAAATCGAATTTTTGAAATTTGAAAGCTGGAATCGTT +TGCCCATTTTTTGCCCATGTTTGCCCACCAATTAGTTTTTTTTGCCCACGTCCAGTTTTT +GAGATATGGATTTTCGAAAAAGTTCGAAAATGTTCGAAAATCAAAAATTTCGCTTTTTTC +AAATTTTTTTTTTTTTAAATCGCAATAACATCGTTTGCCCACGTTTGCCCACCCTTTAGA +ATTTTGAAAAAATTTATACTTTAGAAAATATAAGGCTTTTAAGTTTACCTCGGTCTAATC +AGAGAGTAAATCGTTTGCCCATCTCTTAAAACCAAATATTATCAACAAAAAACGTTTGCC +CAACCATTATTATTAGTTTTTATCGTTTGCCCACCCTTTAAAAAACCTTTAACAAAATTT +TTTTTTCGATTGCCCACACTTGAAATACAACCAATTTCGTTAGCCCACCTCTTCAAAATA +AATATTTCCAATAAAAAACGTTTTCCCACCATTTAAAAATAAATAATTTCGATTGCCCAT +CCTTCAAAATTCATTTTAACGTTTGCCCACCCTTTAAAATTTGTTTTTTTCGTTTGCCCA +CTCTTAAAACTAAATAATTTCGATTGCCCACCTTTTAAAACTAAATAATTTCGTTTGCCC +ATCCTTTAAAATTCATTTTTAACGTTTGCCCACCCTTTAAAAATAAATTATTTCGTTTGC +CCACCCTTTAAAATTTGTTTTTTTCGTTTGCCCACTCTTAAAACTAAATAATTTCGATTG +CCCACCTTTTAAAACTAAATAATTTCGTTTGCCCATCCTTTAAAATTCATTTTAACGTTT +GCCCACCCTTTAAAAATAAATTATTTCGTTTGCCCACCCTTTAAAAGTTTTTTTTTTTCG +TTTGCCCACTCTTAAAACTAAATAATTTCGATTGCCCACCTTTTAAAACTAAATAATTTC +GTTTGCCCATCCTTTAAAATTCATTTTTAACGTTTGCCCACCCTTTAAAATTTGTTTTGT +AAGATGTGGCGCCAATTCAGATATTTTAGGATCGGCGGATAGAAGCACTTACTTATATGA +TGATGATGAACATACATAGACATAAT +>DMREPG +ACAGTCGCGATCGAACACTCAACGAGTGCAGACGTGCCTACGGACCGACGGCAAGTTATT +TTCGTGCTCAAAGTCCCGCTACTCTAAAACCGCTACGTAGTGTCGCGAGATTTCTTCGCG +CACCGTGATTGGTTCAGCCGGCGAACCTTACGGTATCGCTACCACTACCAACGCACTCGT +GCGTGCGTGTTATCGGTATCAACAGTTACATTCGGCTAAAGTTACTGCGAACAACTCAGC +AGCAGCCACGTGCTGAGGCTGGTACACCAACAAACGGTTCCTACCGTGCCCTCCTCCCCT +CCTTCCCTACTCCGGGACAACATGGACTGGCAAGCCCCCCCGCGACCCACCAAGCTGACC +AAAGTGCCTAGAAAGAAGGCGCTCAAAGAGGCGCCAGGAGAAGGTGAAAGCAGCTGCTCA +AGCGATAGCAGCTCCTCGGAGTCAGAGCCTGGGGAAGTCAAGCGCAAAGCAGCGAGCAGA +GACGCTAAGGAAGCCGCCGACAACGTGCCCAACACCAGCGCAGCTCTGCGCAAGAAGCTG +GAAAATAACTCCTTCGCCCTTCTGTCCAGCACTGAGGACGAAGACGATGACGACGACAAC +ACCGACAACGAGCAGCAAACCCCTGTTGGGGAATCTGCTCCAAAAACCATGAAAAAACCC +AACCCGACCCCGAAGACCATCAAGCCACCCCCGATCTACATCCCAGACGTGACCAACATC +TCAGCCCTTGTCAGGATGATTACGACTCTCGTCGGTGCCCACAAGGAATTCTCGTACAAA +ACTGAGAGAAACAACAATGTACGAGTAATGATGCCTGACAAGGAATCCTACTCAGCCTTT +CGTCAGCAGCTTGTGACCCAGAACAAAAGGCACCGCACATTTCAACTGTCAGGGACCTGC +ACAACCCAATTGGCAAAAAATCAAAGGAACCCCTGGGGATCTTCTTTGTAAACCTGGAAC +CTGCGAGCAACAATACAGACATCTACAAACTCAAGAGAATCTGCAGGTCGGTCGTCACCG +TTGAGCCGCCTCTGAAATTCAACGATGTTCCGCAGTGCTTCAGATGTCAAGGGTTCGGAC +ACACCCAGCGCTACTGCTTTTTAGAGTTTCGCTGCGTCAAGTGTGGTGGCCTCCACGACT +CCAGGGCGTGTGAAAAAAAGGAAGACGAGAAAGCATGCTGCCTACACTGTCAAGCCGACC +ATCCAGCGTCGTTCAAAGGGTGCCCCGCGTATAAGAAGGCAAAGGCTCAACAAGCTCCTA +AACCCAAAGCAAGGAGCATGGAAAGCAACAACAAGCCCTCCTTTGAGCTCCCAAATATTA +CAAACGGTATGAGCTATAGAGACGCGCTAAGTGGCACACGCAAGTCCCAAGCAAGCACTC +CCCCACCGACACCCCCAACCCCACCTGAAGCCCCACAACCTAACCACATGGAGGCTATGT +TCACTCGATTTGAGAGCCTGGTCGAAAGAATGATGGAGAAGATGTTTGCTCAGGTGACGC +AGCTTGTTGCTTCCATCCTCAACAGCAAGTCATGCAAATAAGTCTCAACATAGTCTTCTG +GAACGCGAACGGCTTGCAGAGAAGCAAAGCCGAAGTTGAGCACACCATCAAAACCGACAA +CATCGATATTTTATTGGTCTCAGAATCCCATTTTTGCCCCAGATCCCACTTCATCATCTC +CGGTTACGACCTCATCACAGCCAACCACCCATCAGGTAGAGCTCGAGGAGGAGCGGCCAT +GCTCATCAAAAGCGGCATACAGTTCACTGAACTGCCTGCGATACAGGAGGATTGGGCACA +GTGTGCAGTGGCCAGAGTCAATAGCCTACAGGGAGATATTACGGTTGGAGCGGTTTACTT +CCACCCCCAGGCACGCGATTACAGAGACTCACCTGCATGAGTTCTTCGAGTCCCTCGGAA +CTCGCTTCATTGCAGCCGGAGACTTCAATGCAAAGCACTCCTGGTGGGGGTCCGCACAAA +CAACCCCAAAGGCAAAACGCTCCACAAGTACCTGATGCGCAAAAACTTGGACTGCCACTC +TACTGGAGAGCCCACACACTGGCCCTCGGACCCTTCTAAGCAGCCGGATCTGCTGGACAT +CGCGATCTGCAAAGGCATAGGTCGTGCCAAACTCGTCTGCACTACATACGACAGGCTCGT +ATCGGACCACAGCGCCGTCAACCTGCTCCTCAACATCCCTGTCCTCAGGAAGACGCCGCT +CCGTAGACTCACGGGGAATCGCACCAATGCCCCCAAGTTCACGTTCTGGATGCTCTCCTC +CCTAAACCCAGACCCAGACCTCTCCACTCCAGGCAATATAGGCGCGGCCATCGAAAAACT +GAACAAGGAGATGCACAACGCCGCTGAGTTTGCGAACCCTCCTCCTCCTACAACCCCGAG +AACTCCCGCAAGAGACCTGCATTTGTGGTCCCCAGAAATCGCCGCCCTCGTGGCCGAGAA +GAGACGCCTCAGACGAGTATGGTTCCTCTCGCGTAACCCCAGGGACAAGACAGCGCTCAA +TCGCGCCTCCAAGGAACTCAAGGACAAACTAACCACCCTACGCCAAGACTCGTTTCAACG +ATTCCTTGAAGATCTGGAACCTGGAGACCCGCAGCACAACCTGTGGATCGTCACGCGGCA +CATCAAAAGACCCGCCAAGAAAATGGTACCAGTGCGTACAGCAGACTGCTCCTGGTGTCG +GTCTGAGGCAGAAAGAGCCGAAGCTTGCTGACCACCTTCGCTCTGCCTTCACTCCGTTTG +ACCGATGCACAGCTGCAGAGCAAGCTGACACCATCAGAGCTGTTGAAAGCCCATGTGCTC +CAGGACCTGCAATTCAGCCCGTCGCACCAGAGGAGATCGCGCAGGAAATTGCCTCGCTCA +GAAACGGCAAGTCTCCCGGCCCTGATCGCATCGACGCTACTGCGTTAAAAATGTTGCCCA +CATTCTGCTCACAGCTGCTTGCCAACATTTTTAACAGCTGCTTCCGGCTAGGGTATTTCC +CAAAACAATAGAAACGCGCCGAAGTGATTACCATCCCCAAGCCCGGCAAACCTGAAGCCA +ATCTTGCCTCCTATCGTCCGATAAGTCTGCTGGCAATCCTCTCCAAAATACTCGAAAGAG +TATTTCTGCGCAGAGTGCTGCCAGTACTGGATGAGGCTGGTTTGATCCCCGATCACCAGT +TTGGCTTCAGGCGCTCCCACGGAACACCAGAGCAATGCCACCGGCTTGTAGAGCAAATTT +TGGAGGCCTTCGAAAGGAAGCAATACTGCTGCGCCGTCATGCTGGATGTGAAGCAGGCCT +TCGACAAAGTCTGGCACCCTGGACTCCACTATAAAATCAAGACTCACCTTCCCGGATCCC +ACTTCGCCTTCCTCAAATCATTCACTGAGGGTAGAGAGTTCCAAGTTTGCTGCGGAACAG +CGACCAGCACGCCTAGGCCGATAAGAGCCGGAGTACCCCAAGGCAGCGTCCTTGGACCAA +TACTGTACACACTCTACACAGCAGACCTTCCTATCACACCCTCCCGGAGCCTAACAGTGG +CCACATATGCCGATGACACCGCCTTCCTAGCCTCCGCCTCAGACCCCCAAGAAGCATCAA +CCATCATTCTAAGCCAGCTGGATGCCCTCGACCCATGGTTGAAACGATGGACCATTGCCG +TGAACGCAGACAAATCCTCCCAAACCACTTTCTCCCTGCGCAGAGGAGACTGCCCCCCAG +TCACGCTCAACGGGGAAACTATTCCAACCTCAAGTTCCCCGAAATACCTTGGATTGACTC +TAGACCGGAGGCTCACTTGGCACACCAGGCTGACCTGCGCCTCAAGCAACTCCACTGGCT +CATCGGGAAAAGGTCCAAACTTAGGGAAAACCTTAAACTCCTCCTGTACAAGGCCATCCT +GAAGCCAATTTGGACTTATGGGATTCAGCTGTGGGGCACTGCCAGCATCTCAAACCGCAA +CCGCATACAGCGCTTCCAGAACAAGTGCCTGAGTCAATCGCTGACGCTCACCCATACCAT +GAAAACTCCGTTATCCACAAGGAGCTTGGAATGCCATGGGTAGCAGAGGAGATCTCCCGC +TTCAGCGAGAGATACGCTAAACGACTGGACAACCACCCTAACCATCTGGCTATTAACCTC +CTGGACAACAGTGAAACCATCAGACGCCTCCAGAGGAAACACCCGCTTGATCTCCACCAC +CTATAACCCACAACAATGAACCCCCGACCAATCTACAACTTTGTAATCCCTTAAGTTAAT +GCCCCCCCCACCCAAACATTTAATTATTGTCCACATGGACAGATTTTAAATTAATACATA +GATCGCTAAAAAAAAAAAAAAAAAAA +>DMGYPF1A +AGTTAACAACTAACAATGTATTGCTTCGTAGCAACTAAGTAGCTTTGTATGAACAATGCT +GACGCGCCAGAATTGGGTTCAACGCTCCACGCGAAGAATGCCTGGCAGCGGAAAGCTGAC +ACTTCCTACCGGGAGTGTTGCTTCACGCTGCAAGAAATGCTGAGTCGGCTTGCCGACTTG +TGGCGGCGCGATGCATTGCTCGAGGGTAAACTTAGTTTTCAATATTGTCTTCTACTCAGT +TCAAATCTTGTGTCGAAATAAACCACAGCTTGCTCCGGCTCATTGCCGTTAAACATCATT +GTTCTTATTTACAATCAAATCGCTATCGCCACAAGGCTAGTGATAATAACTAAGGGGGCG +AAGTCAAGCCCTCCAACCTAATCTCCATAAACAGTGTCTAAGACGAACCTCAGCGAAAGA +AGGAAGATCTCTAGACCTACTGGAAATAACATAACTCTGGACCTATTGGAACTTATATAA +TTGGCGCCCAACCAACAATCTGAACCCACCAATCTAATTTAACACACTTTGTCAGGCGAC +AAACAGGGTAGTTAAGTTAGAAAAGCATGTAAGTTTTACAAGACACTTCTTTGACGCAAT +CAAGAAATTTACGAGTGAAAAAAAAAAAAAAAAAAAGTTGTGTATCTGGCCACGTAATAA +GTGTGCGTTGAATTTATTCGCAAAAACATTGCATATTTTCGGCAAAGTAAAATTTTGTTG +CATACCTTATCAAAAAATAAGTGCTGCATACTTTTTAGAGAAACCAAATAATTTTTTATT +GCATACCCGTTTTTAATAAAATACATTGCATACCCTCTTTTAATAAAAAATATTGCATAC +TTTGACGAAACAAATTTTCGTTGCATACCCAATAAAAGATTATTATATTGCATACCCGTT +TTTAATAAAATACATTGCATACCCTCTTTTAATAAAAAATATTGCATACGTTGACGAAAC +AAATTTTCGTTGCATACCCAATAAAAGATTATTATATTGCATACCTTTTCTTGCCATACC +ATTTAGCCGATCAATTGTGCTCGGCAACAGTATATTTGTGGTGTGCCAACCAACAACCAA +TGAGTTGGGCACATAACTACAGAAAGGTTAAGGTCGAATACGAAAGCGAGGATAGCTGGG +AGGAGGAGCAAGTAGGCCAAGCATTAGGTCGGCCGTTAGATAGTGCCACGGTAGATATTA +CCATGGACCCCAATCAGATTCAAGCTCTTATCGACAATGCTGTCAGACAGGCATTGTCGC +AACAGCAATCCCAATTTCAGACACAACTCAATTCCCTAGCTGCGCGGGTACAGAGTTTGC +AGGTGGAAGCACCGCAAATCAAGATTTACGAAAAAGTCTCTGTTAACCCCGATGTTAGGT +GCGACATTCCCCTTGACATAATAAAGTCTGTACCAGAGTTCTCCGGTACCCAAGACGAGT +ATGTGGCCTGGAGACAATCGGCCATATACGCCTACGAGCTCTTCAAACCATACAATGGCA +GCAGTGCCCATTATCAGGCTGTTGCCATATTAAGGAATAAAATCCGTGGCGCAGCCGGGG +CTTTACTGGTCTCCCACAATACGGTATTGAACTTCGATGCTATTTTGGCCAGACTAGACT +GCACGTACTCGGACAAAACATCCTTACGCCTGTTGAGGCAAGGATTGGAAATGGTTAGGC +AAGGAGACCTACCACTAATGCAATACTACGATGAAGTTGAAAAGAAGCTAACGCTTGTCA +CTAACAAAATCGTAATGACGCATGAACAAGAGGGTGCTGACCTGCTTAACGCTGAGGTCA +GAGCCGACGCCCTGCATGCTTTTATTTCGGGGCTCAAAAAGGCCCTCAGAGCTGTGGTCT +TCCCGGCCCAACCAAAAGACCTGCCATCTGCACTGGCTTTAGCTAGAGAAGCAGAGGCAA +GCATAGAGAGAAGCATGTTCGCTAACTCCTACGCCAAGGCCGTAGAGGAGCGAGCGCATT +CGGGGGCAAACGGCAAGAGCCGTTTCCAGGGGAAGCCAAATAAAGAAGAACAGGGACAGG +ACAGGAATCCCCACTTCACCAAACGCCCCAAAAATAACGGACAAACCAACAAGGACACTC +AGGCGCAAGCACCCCAGCCAATGGAGGTCGATTCATCCTCCAGGTTTAGGCAGCGTACTG +AACATTATCAGAATCATCCTAACGAGTCGAACGCGTTTAAGAGGAGAAATTCCTCAGAAC +GCTCAACAGGACCGAGACGACAACGTCTGAATAACGTTGTCCAAGAGGCCCCTAAACAAA +AGGACCCCAAAGAAGAGTATGAAAAAACAGCAAAGGCTGCAGTCGAGGAAATCGACAGCG +AAAATGAGTACGCTCCCAGTGACGACTCGTTGAATTTTTTAGGGGGCGCTCCCGGTTGCC +GTTCATTGAACGACGGCTGGCTGGGAGAACCTTAAAGATGCTAATCGATACCGACGCGGC +AAAAAACTACATTAGGCCCGTAAAGGAGCTGAAAAATGTAATGCCGGTCGCCAGCCCTTT +CTCGGTGAGCTCAATACACGGCTCCACCGAAATCAAACACAAATGCTTGATGAAAGTCTT +CAAGCACATCTCCCCATTTTTTCTTTTGGATTCTCTCAATGCGTTCGACGCTATCATAGG +CTTGGACCTGTTAACACAGGCCGGGGTAAAACTCAACCTTGCAGAGGACTCCTTAGAATA +CCAGGGCATCGCTGAAAAGCTTCATTATTTCAGCTGCCCCAGTGTAAATTTCACTGATGT +AAACGATATTGTTGTACCTGACTCCGTTAAAAAGGAGTTCAAGGACACAATAATAAGGAG +GAAGAAAGCTTTCTCCACAACAAATGAAGCTCTTCCTTTTAACACCGCTGTCACTGCCAC +AATTCGGACAGTTGACAATGAACCGGTGTACTCAAGAGCGTACCCAACTCTTATGGGTGT +CTCCGACTTTGTGAACAACGAGGTCAAACAACTGCTGAAAGACGGCATTATCAGGCCCTC +AAGGTCTCCCTATAACAGCCCGACCTGGGTTGTTGACAAAAAGGGGACCGACGCCTTCGG +GAACCCAAACAAGAGGTTGGTCATTGACTTCAGGAAGCTAAATGAGAAAACTATTCCTGA +CCGGTACCCGATGCCTAGCATTCCCATGATTCTAGCGAATCTGGGCAAGGCAAAGTTCTT +CACTACCCTTGATCTTAAGTCAGGGTATCATCAAATTTACCTCGCGGAACACGACCGCGA +GAAGACATCGTTCTCGGTGAATGGTGGTAAATACGAGTTTTGCCGTCTACCGTTCGGCTT +GAGAAATGCAAGCAGCATTTTTCAAAGAGCCCTAGACGATGTGCTTAGAGAGCAAATCGG +GAAGATATGTTACGTCTATGTAGATGACGTCATAATTTTCTCTGAAAACGAGTCCGACCA +TGTCCGCCACATCGATACAGTACTAAAATGCCTGATCGATGCCAACATGAGAGTAAGCCA +GGAGAAAACTAGATTCTTTAAAGAGAGTGTAGAATACCTCGGCTTTATTGTCAGTAAGGA +CGGAACTAAATCCGATCCAGAGAAGGTGAAGGCCATTCAGGAGTACCCTGAACCAGACTG +CGTTTACAAGGTTAGGTCCTTCCTTGGTTTAGCCAGCTACTACAGAGTCTTCATCAAAGA +CTTTGCTGCCATAGCCCGCCCGATCACCGATATCCTAAAAGGGGAAAATGGTTCGGTGAG +CAAACACATGTCTAAAAAAATTCCTGTTGAGTTTAATGAAACTCAACGCAACGCGTTCCA +AAGACTGCGAAACATACTAGCATCCGAGGATGTCATACTCAAATACCCCGACTTTAAAAA +GCCTTTTGACCTTACTACAGATGCTTCGGCAAGTGGTATCGGTGCAGTCCTATCCCAGGA +GGGCAGGCCAATCACCATGATATCGCGTACCCTTAAACAGCCCGAGCAGAACTACGCCAC +AAACGAAAGGGAATTGCTGGCGATTGTATGGGCCCTAGGTAAGTTGCAGAACTTCCTGTA +TGGCTCTAGGGAGATTAATATATTTACCGACCATCAACCCCTCACTTTCGCTGTTGCCGA +CAGGAACACGAATGCCAAGATAAAGAGGTGGAAATCTTACATAGACCAGCATAATGCCAA +GGTTTTCTACAAACCTGGCAAAGAAAATTTCGTGGCAGACGCCCTCTCTAGGCAGAATCT +GAATGCCTTACAAAACGAACCCCAATCAGACGCTGCGACCATTCACAGTGAGCTCTCCCT +GACCTACACGGTCGAGACAACAGACAAACCGTTAAATTGCTTCAGGAACCAGATCATTCT +GGAGGCAGCACGTTTTCCGCTCAAACGAAACCTGGTGCTCTTTCGAAGCAAATCTCGCCA +CTTAATCAGCTTTACTGATAAAAGTTGGCTATTAAAAACACTTAAGGAGGTGGTAAACCC +TGACGTCGTGAACGCTATTCACTGCGACCTGCCCACTCTGGCAAGCTTCCAACACGACCT +CATTGCCCACTTTCCAGCCACCCAATTTCGTCACTGTAAGAATGTCGTGTTAGACATAAC +CGACAAAAACGAACAGATCGAAATCGTCACTGCCGAGCACAACCGCGCTCACAGAGCCGC +ACAAGAAAACATTAAACAAGTCCTTCGGGATTATTACTTTCCCAAAATGGGCAGTTTAGC +TAAAGAAGTAGTAGCTAATTGTAGGGTCTGCACCCAAGCAAAGTATGACAGGCACCCGAA +AAAGCAAGAGCTCGGGGAAACGCCCATACCCAGCTATACAGGTGAGATGGTGCATATTGA +CATATTCTCAACCGACAGGAAGCTATTCCTGACGTGTATTGACAAATTTTCTAAATATGC +AATAGTGCAACCAGTGGTGTCTAGAACAATAGTGGACATCACAGCACCCCTGTTGCAGAT +CATTAACCTGTTCCCCAATATCAAAACGGTCTATTGTGACAATGAGCCCGCATTTAACTC +AGAAACTGTCACCTCAATGCTCAAGAACAGCTTCGGCATTGACATAGTAAATGCGCCCCC +ACTCCACAGCTCATCCAATGGCCAAGTTGAACGGTTCCACAGCACATTGGCAGAAATCGC +CAGGTGCCTGAAGTTGGACAAAAAAACGAATGACACAGTAGAACTAATCTTGAGGGCGAC +GATAGAATATAACAAAACCGTGCACTCAGTTACTCGTGAGAGACCAATTGAGGTGGTTCA +CCCAGGGGCCCACGAGCGCTGCCTAGAAATCAAGGCAAGATTAGTAAAGGCTCAGCAAGA +CAGCATCGGAAGAAACAACCCTTCCCGACAAAACCGCGTGTTTGAGGTGGGAGAACGCGT +GTTTGTAAAAAACAACAAGAGGTTAGGAAATAAGCTAACTCCACTATGCACCGAGCAAAA +AGTGCAGGCAGACTTGGGAACGTCTGTTCTTATTAAGGGGAGGGTGGTCCACAAGGACAA +CCTCAAGTAGACATTCCCTCTACAGTTAGGTAGTAAGTTATGTCAAGGAAAATCCGAGCA +CTGTAGTATCACCTTGTCTTTAATTTCCAGGTTCACCCTCATGATGTTCATACCCTTGGT +AGTAGCGAATGCTCGGATCACCGACTTTTCGCATGCCAACTACATTCCTGTGTTAGATGG +GGATGTGCTGGTGTTTGAACAGCGTGACCTCTTGAAACATTCGAGTAACCTTTCCGAGTA +CGCTAGTATGATAGATGAAACACAGAAACTGTCCGAGTCCTTTCCCCACTCACATATGCG +TAAGTTGCTAGAGGTCGATACTGACCATCTTAGAACCTTGTTGTCCGTTCTCAAAGTCCA +CCATAGGATAGCTAGGAGTCTAGATTTCTTAGGTACAGCCTTAAAGGTTGTGGCGGGTAC +TCCCGATGCCACGGACCTCTTTAAAATTAAGATCACAGAGGCCCAACTAGTAGAATCTAA +TTCCAGGCAGATAGCTATAAACTCCGAAACCCAGAAACAGATAAATAAGTTAACTGACAC +CATCAATAAGGTGATCAATGCCCGTAAAGGCGACTTGGTTGACACTCCACACTTATATGA +AGCACTACTAGCAAGAAATAGGATGCTGTCTACAGAAATTCAAAATTTAATTCTCACTAT +TACTTTGGTCAAATCAAACATTATAAATCCCACAATTCTTGATCATGCCGACTTGAAGCC +TCTTGTAGAACAGGATACCCCAATTGTCAGCTTAATAGAAGCATCTAAGATCAGGGTCCT +CCAGTCCGAGAATAGCATTCATATTTTAATTGCCTATCCTAGAGTCAAGTTCAGTTGCAA +GAAAGTCGCCGTCTACCCTGTATCTCACCAACACACCATCTTGCGCCTCGACGAAGACAC +TTTGGCCGAATGCGAACATGACACCTTTGCGGTCACCGGATGCACAGACACCACACACTT +CACGTTCTGCGAGCGGTCTCGGCGCGAAACTTGCGTGCGCTCACTCCATGCTGGAAACGC +TGCTCAATGCCACACTCAACCCAGCCACTTGCGAGAAATAAACCCCGTAGATGATGGCGT +TGTGATTATCAACGAAGCCGCAGCTCACGTTAGCACTGATGGCAGCCCCGAAACACTGAT +AGAGGGAACCTACCTGGTAACCTTCGAGCGAACGGCAACCATCAACGGCTCTGAATTCGT +AAATCTAAGGAAAACACTAAGCAAGCAGCCAGGCATCGTGCGTTCACCACTACTTAACAT +CGTCGGCCACGACCCTGTGCTCAGTATACCTCTGCTACACCGGATGAGTAACGAAAACCT +ACATTCCATCCAAAACCTTATGGATGACGTGGAATCTGAAGGCTCGCCCAGACTCTGGTT +CGTGGCTGGTGTGGTCCTAAACTTCGGCTTGATTGGCTCTCTCGCCCTTTATCTGGCATT +AAGGAGAAGACGAGCCTCTAGGGAGATACAGCGCACCATCGATACTTTCAACATGACCGA +GGACGGTCATAAACTTGAGGGGGGAGTAGTTAACAACTAACAATGTATTGCTTCGTAGCA +ACTAAGTAGCTTTGTATGAACAATGCTGACGCGCCAGAATTGGGTTCAACGCTCCACGCG +AAGAATGCCTGGCAGCGGAAAGCTGACACTTCCTACCGGGAGTGTTGCTTCACGCTGCAA +GAAATGCTGAGTCGGCTTGCCGACTTGTGGCGGCGCGATGCATTGCTCGAGGGTAAACTT +AGTTTTCAATATTGTCTTCTACTCAGTTCAAATCTTGTGTCGAAATAAACCACAGCTTGC +TCCGGCTCATTGCCGTTAAACATCATTGTTCTTATTTACAATCAAATCGCTATCGCCACA +AGGCTAGTGATAATAACTAAGGGGGCGAAGTCAAGCCCTCCAACCTAATCTCCATAAACA +GTGTCTAAGACGAACCTCAGCGAAAGAAGGAAGATCTCTAGACCTACTGGAAATAACATA +ACTCTGGACCTATTGGAACTTATATAATT +>DMHFL1 +CAGAGAACTGCAAGGGTGGCACTTTTTTACCACTCGACTCACACCCTACAATTTTGTGTG +CGGGTGCTACTCGCCACGCACATCGCGGGTACTTACAAACACACAGTATAAATCTGAACA +TGCAGACAAGACACCCCGTTGTGTGCGCACCCGAATCAATACGGTGTTTTGCGTCGCGGG +TGCCGCTCACACAGTGCCTAAAAAGGGATGAGTGAGAAAAACACTTGTGGGTATACCGTT +AAACACATGGGTGTTTCCAAAAATACTCGGGTGTTTCCAAAAATACTCGAGTGGTCTCGT +AGGTAGTCGAGTCAAATGGCGCCATACATAATGATTGTTGAGTTCTTGTGTCTTTGGTCC +AGTGTCTCGGCTGTTAATTGCCCCTTTTTTGTTTTTTACGATGCAATTACTAGCTTGTTA +GGATTCAGTATTATTTGGAAGCCAAAGGAAAAGGTCACAATAATGGCAGAAGCGGCTGAT +TTCGTTAAAAATAAAATTAACAATGGAACATACTCAGTTGCCAATAAACATAAAGGAAAA +AGTGTTATTTGGAGCATTTTATGTGACATTTTAAAGGAAGATGAAACTGTTCTGGACGGA +TGGCTGTTCTGCAGGCAATGCCAGAAAGTGCTCAAATTTTTACACAAAAACACCTCCAAT +TTATCCCGCCATAAATGTTGTCTAACATTAAGACGACCAACGGAATTAAAAATTGTTTCG +GAAAACGACAAGAAAGTAGCTATTGAAAAATGCACCCAATGGGTTGTCCAAGATTGTCGG +CCGTTTTCTGCAGTAACCGGAGCCGGATTTAAAAATTTGGTGAAGTTTTTCCTACAAATC +GGCGCTATCTATGGGGAACAGGTAGACGTCGATGACTTACTACCTGATCCAACAACATTA +AGTCGGAAGGCCAAATCGGATGCAGAAGAGAAGAGGAGTCTAATCTCGTCCGAGATAAAA +AAAGCTGTGGATAGCGGAAGAGCAAGTGCGACCGTCGACATGTGGACTGACCAGTATGTC +CAAAGAAACTTTTTGGGCATCACTTTCCATTACGAAAAAGAATTTAAACTTTGTGACATG +ATTTTGGGACTAAAATCGATGAATTTTCAAAAATCGACTGCCGAAAACATTTTAATGAAA +ATTAAAGGTTTATTTTCGGAATTCAATGTTGAGAACATTGATAATGTTAAGTTTGTGACT +GACAGGGGAGCAAATATAAAAAAGGCTTTAGAGGGCAATACCCGTTTAAATTGTAGCAGT +CACCTGTTGTCAAATGTTTTAGAAAAATCGTTTAACGAGGCCAATGAACTCAAAAAAATT +GTGAAATCATGCAAAAAAATCGTGAAGTACTGCAAAAAATCAAATTTGCAGCATACTCTA +GAAACCACTTTGAAAAGCGCCTGTCCGACTAGATGGAACTCCAACTACAAAATGATGAAG +TCCATTCTGGATAACTGGCGTAGTGTGGATAAAATATTAGGTGAAGCTGATATCCATGTA +GATTTTAATAAATCATCTTTAAAAGTTGTGGTAGATATTCTAGGAGACTTTGAACGAATA +TTTAAGAAGTTGCAAACATCTAGCTCACCATCTATATGCTTCGTATTGCCATCCATCTCT +AAAATTTTAGAATTATGCGAGCCGAATATTTTAGACCTTTCTGCAGCAGCATTGCTTAAG +GAAAGAATTTTGGAAAATATTCGTAAGATTTGGATGGCAAATCTAAGCATATGGCATAAG +GCGGCATTTTTTTTATATCCACCCGCAGCACATCTTCAGGAAGAAGATATTCTTGAAATA +AAGGTGTTTTGCATTTCACAAATTCAAGTCCCAATTTCATACACATTAAGCTTAGAATCT +ACAGAAACTCCAAGAACTCCAGAAACTCCAGAAACTCCAGAAAGTCTAGAAAGTCCAAAC +TTATTTCCAAAAAAAAACAAAACAATATCTTCTGAAAACGAATTCTTCTTCCCAAAGTTA +GTAACTGAGTCTAATTCCAACTTCAATGAATCTCCATTAGATGAAATTGAACGATATATT +AGACAAAGAGTTCCATTGTCTCAAAATTTTGAAGTAATTGAGTGGTGGAAAAATAACGCA +AACTTATACCCTCAGTTGTCAAAGTTAGCATTAAAACTTTTATCAATACCAGCCAGTAGC +GCAGCAGCTGAAAGAGTGTTTTCCCTAGCAGGTAATATAATAACAGAAAAGCGAAATAGA +TTATGCCCAAAATCTGTAGATAGCCTCCTTTTTTTGCATTCCTATTACAAAAACCTAAAC +AACTCGCAATAGATATTCCTTCTTATAAGTATATTTTATATTATTAATTCTTATTATTTG +CTTAATTTTTGTATAAGTGTTAAGTATTAAGTATAAGTATTAATTAATAATATATAAGAT +TGTTATTTGTTAAGACATTAGATGCAAAATCCTAAAAATGTGAAAGTAATGAAGTTCCTT +ATATTTAATAGATACTTTTTAAGCCCACTATGTTTTTATTATTTAGATTGAGACATTAAA +AAACGTAAAAATCAACAAATGCCGTCTTTAATTGCAATTACTTTATGTGTTTGAAATGGG +AGGCACCCATTGAGTCCATCAAAGAGCAAAGACATGAGCACAAAAATTTTCTTGGGTATT +CCCTTTTACCCTTCATTTCTTATACCCGTCACGCTTCCACCCATACAAATTTTAGGCGTA +CAAAAAATGACCAGAGAACTGCAGCCCGCATACAAAAAATGACCTGCGGCCGATCGTTGA +CTGTGCGTCCACTCACCCATACGGCTCTTGCGCAGCAGGCCTCGGGTGGTTTTTTTACTC +GTAACAAAAACACAACGTCGGTAAAACACTCGAGTATTTTGTGTTGCCGCAAGTAGGGTG +TCAAAAAAAACGGGGTGCCTAGAGTACCGAGTGTTTATCGGGTGGACGTAGAGTGCGAGT +GGCGGGCTGCAGTTCTCTG +>DMTHB1 +ATGTACAGCTGTGTTCAGAAAAATAGCAGTGCGAAGGAAACTAAGTAATACAAAGGTATT +TTTCCATGTCCCTTTTCGGAATCGACTTTTTATTCCTCTTATTTTTGTTAAATGGAATGT +GTAGATAGGGAAAAAAAGAAAATCCGGTCAGTTTTTCTTGTTATCCTTTTTTTATTTACA +TTCTTGAGCAAAATCACAATTTTTAGGCTGTTCATAAGAATAGCAGTGTCTGGTTCTGAC +CAACGTAAAGTCCCGAAATGATCAATATTTTCTAAAAAGTGAGTTTGGTTAAGTTAATTC +GTATATTTAAAAGGACAATAAATTAAAAAAATTAAAAAAATTTTATTTTAGTGGGTAGAG +GACAGCACTACTCCCAGGGGAAAAGAATGTTAATTCTTAAGCTTAGAAAGGAAGGAAAAA +CATATAAGGACATTCAAAAAACCCTTAAATGTTCTGCCAAAATGGTATCCAATGCCATTA +AATATAAATGGAAGCCCGAAAACCGTGGTACCAAACATAAAACCACAGATATAGAGGATC +GACGCATTGTTTCTTACAGCAAAGTCTATCGTTTTGCATCCTTTAGGGACATAAAGTCTG +AGCTGAACTTGGGAATCAGCGACGTTACTATTCGTAGACGACTACTGAATCAAAATTTCA +GTGCGAGGAGTCCACGAAAGGTTCCCCTACCTAGCCCAAGGCATATTAAGGCAAGGTTAA +GCTTAGCTAAAACCTACCTAAACTGGCCAGTCTCCAAATGGCGTAATATCCTTTGGACTG +ATGGGTCAAAAATCATGCTATTTGGTGGAACTGGTTCACTACAGTATATCTGACGACCTC +CAAACACGGAGTATCACCCAAAACACCCAGTGAAGACTTTCAATCACGGTGGACCTAAAA +TCATGGTATGGGCTTGTTTTTTTTATAATGGTATGAGTCATGCTATGGATTATGATTTAT +GGTATTATAGACCAAAACGCATATGTAAATATACTTAGTGATGTCTTATTGTCATATTCT +GAATAAAATATACCCTTAAAATGGACATTCCAACAGGATAATGATCAGAAACGCAGATGT +AAATCGGCTAAGAATAGGTTCACCCAAAATAGAATAGATGCAATGCCGTGGCAAGCACCA +CCTTCCCATTTAAACCCGATTGAAAACCTGTATGGGGACATTAAACAGTTTGTGTCGAAG +AAGTCCCCGACGTCTAAGACTCAGATTTGGCAAGTTGTGCAGGATACATGGGCAAAAATT +CCTCCCAAACCTTGCTAGGACTTGGTGGACTTCATGCCGCGTGGGTGTAAGGCTGTGCTG +GCTAACAAAGGCTATCCAGCCAAGTATTAGGCCCGAATTAACATATTAAAAAGAAAAACT +AAGTTCGTTCTAGGTCAAGTTAAATTTTGTTACTATTTTTTCATAGCACTGCTATTTTAT +TGAACACCAGAATTTCTGCCTATTTATTGTTTTAATCTATATTTTCGAAACTATTGAAGA +AATAAAAGTGAAACATTTGTTAAATTGTTTGAAATGAAATACCTAATGATATTATTAAAA +AAAAATTCCCATTAAAACTGTAAATCATAGGAATTTTTTATCTTAAACTCTGAAGTCCAA +AGCACTGCTATTATTCTGAACACAGCTGTACAT +>DM06920 +TAAATAAATAAAATAAATTAAACAATTAACTAAATAATTAAATAACTAAAATTAATAATA +TAATCCGTTCGCTTGCCAAAGACTCTCACGCGCATAACTAATTAAAATCGATTTTCAAGT +TGACAAATAAATGGTTTAAAATTGTCCTCAGGCTGCAAAGAAAAGCCGCGGCAACAATAA +ACATTTAGTGACACGCGAAAAGCGAACATTTGATTAGTGTAATACTTGTGCAAACCGACA +AGCTGCCGCCATAACAAAACGGAGACGAAGAATCATAAAGAACAAAAGCTAAATCCACCA +GCATAGCAAAAATAAATTAACAAATAAAATAAAAGCAAATTTAAATAACATAATAAATTA +AACTTATTTAATAAACCAATTAATTTTAATTAATTCAATTAAACGCTAAATCTACATAAT +ACTCCACGCGCAAATTAATTGAAATCGTCTTTCTAGTTAATAAATTAAAAGTTTAAAAAT +TGTCTCCGGCCGCAAAATTTGAACCGCGACGATAAAAACATTTAATTGACAAACAAAAAG +CGAACAATTATTCAGTGAACTATTTGTGCAAAATTGACAAGCAGACGCCATAATTAAAAG +GAGAAGAAGCCAAAAGACGAAGAGAAGAAAGCAACCAGAAGAACTCAAAGAAGAAAAGGA +GGAAAGCCCAATTAAAGAAAGCCAGGGTATTTATACCTTACACTTATCGTTTAATATAAC +AAAAACCCAACATGTCCATGTCCGACAACCTTTTTTCTGACGATGAGGTACTTTCAATTT +CCTCAAGCCCAGAACAGCGATCTTCTCCGTTCTACCTCAATATATCGCCCATGTCCCACG +GATCAGACAATTCTCAGATTAATACAGTCATCATTAATTCGAAGAAATTGCCCTCAAATC +AAGCAGACATAAGTTTAAAAAACTCTTCTGGGGCTGCTATAAAAATTGTTAATTCCCTTT +CACACAAGAAGAAAGAGAACACAAACGTTAATAATGCCCAAAAAGACCCCCTCTCACTCA +CCAATACTACTGCAAGCACTTGTGGCGCCAAAAGCAGCATCTCAGAGGGGAAATTGTCTT +CTCCTCCGTCCACCTCACACACATATGAGGGGAAATTACTCACAAAACTTACTCACACAC +ACACAGACTTTAGAGGCGCCAAAACGAGCGATGCAATGGGAAGTTTCCCCTCTCTCTCGC +ACAGCGACAATAGCATAGAGAAAAATCTGAGTTCTTCCACCAAAATTGGACCAAACGCTT +CTTCCCCTCCTTCTCATGCACACACTCACACTAGCAAATCCACTGATATAAGCTTAGAAA +GCCGCTCAAAACATCCCGCGCTTGCCAATACGGACGCACGCTCTATAAAAGCCAATGCTA +ATGACAATGGGGAAATTTTCTCCTCACTTATACAAATTGACGAACGCAAGCAAGAGGAAA +GGCCTTGCACAACTATCAACGCTTTTTGGTCTATTTTTAAACCCAAGCCGGACGTTACTA +AACTAAGTCTAAAGAGGAAACCCACCAATCCCACTAAAAACACTGGGAAAAAATGCATCT +CCCCTCATAAAAAGAGCGCTTATTTATGCCCTTCCGCTCAGGATGATTTAAATTTAAATT +TAAACCCCAAATCTAGCGCCAAGCCCACTGTGGTGAATTTACCAGCTGCCCGCATCCTAA +GCCGGCCTGCAGCCAAGCGGGATTTATTTAAATCATCATCCTCCCGAAGCCCAGACGAGC +AGCCTATGAGTTTTTCGGAAGTGGTCGCTGGCACGGGTTCAATTTTTGCGGCACCCTGTG +TCCCGGCACCTTTAACGAAAACTCCAGGCAAGCGGACAAACGACGATCTGGACTGCTCCA +ACTTTAAGACGCCCAATAAAAAATTATGCGCGACTTCCAACTTTGTAACTCCCAGCATTT +TTCCGCCGCTCATCACTCCCGTTTTCAAGAGCAAGGCAGCTCAATCTGTTTACGAGGAAT +CCAAAGCCAGAAATGGACCCCCCCCGCCGGCCCTCGCCTGCAGCATCAATGCCTCTGCTC +GCAGCGCAGCGGCGCCACCCGGGATCGCCCCCCTACCCCCTCATAATACAGATGCAGAGC +TGCCTCCATGGAAAATCGTGCCCCAGAGCCGTAGAGCACCTCCTATACTCGTCAATGATG +TAAAGGAAATTGTACCTCTACTGGAAAAGCTGAACTACACAGCAGGAGTCTCCAGCTATA +CTACTAGGGCTATAGAAGGAAACGGGGTCAGGATACAGGCAAAGGACATGACCGCCTATA +ACAAAATTAAAGAAGTCCTGGTGGCCAACGGACTTCCTTTATTCACCAACCAGCCCAAGT +CCGAGAGAGGCTTCCGAGTCATCATCAGACATCTCCACCACTCCACACCATGCTCGTGGA +TAGTCGAGGAACTGCTGAAGCTCGGATTCCAAGCGCGATTCGTCAGAAATATGACGAATC +CGGCTACAGGTGGCCCCATGCGAATGTTTGAAGTGGAGATCGTCATGGCCAAAGACGGCA +GTCATGACAAAATACTCTCACTCAAACAAATCGGTGGGCAAAGGGTGGACATTGAAAGGA +AAAACAGGACACGGGAGCCAGTCCAGTGCTACAGATGCCAAGGCTTCAGGCATGCCAAAA +ACTCTTGCATGAGGCCGCCAAGATGCATGAAATGCGCTGGCGAACACCTGTCTTCCTGTT +GCACCAAACCAAGAACCACCCCCGCCACCTGCGTAAATTGCTCTGGGCAGCATATTAGCG +CGTACAAAGGATGCCCTGCATATAAGGCGGAAAAACAAAAGCTGGCGGCAAACAACGTTG +ACATAAACAAAATAAGAACAATCAAAGACGCAACAAATAACTTTTATAAACGTCAAGGCC +CCCCTCTACGCAACAACACCCCTCGGCTACCGCACAGCTCAGCAATCCTGAGCAAATCAA +TTGCCGAAGCTCGCCAGGAGGCAGCCAGAAAGTCGATGTTAAATCCATTCCGACAAAATA +TAAACGACAGAAGACCACGATTCTCCTCCCACGACACGGCCATTCAGAAGCGTCTGAATA +AATGGCGCCGAAACACCAACAAAATACCCAAAAAGGGTAGGATAGCCTTAAAGGATAATG +CAAAGCCACGACCGGCACATAGGACAAGTAACCCAGCGCAAAGACATCTGGAGGACTACC +AGGACATGCTCCGAAGGGAAAGGAGTGAAGAAAACGACCAGGAATCTGAGAAGGGCACCC +CCAATACCAAGCAGGTCGGCAATGACAGCCCTCCGACCACGAGCAGAGCAGCCAGAGCCA +GCTTTAAGCCAAGAATCATTGACGATACCACGCCATCGCCAAAAATCTGCAATCCCAACT +CACAAAAAGGCCTCTTGGACGACCCCACAACAAGCTTAGCTAATAGAGTCGACAATTTAG +AAAAGAAAATTGACATTTTAATGGCCTTAATCATACAAGGAAGAAATAACAATCTTGACA +TGGATACATCCAATTAATCTTACAACTACTTATATATTCTTTAATAAATATATCCAATAG +AAAAGCGCACGTCGGTCTGCTTTTAAAATCCTTCACCGTCATCACCTTCCTCGACGGAGC +CTAATTTATTGGAAAAATAAATCAATTATATGTTGGCACAAAAATGTAAACACACACTCA +CCTAAACGCACCCGGACGAACAAGCCTATGACAACGCACTCCAGCTGATCTGTAAGAAAC +AAAAAATATGAATAGATAGATCGATATGAAAAGGATATGTGCGGCAGAAACATGATGAGC +AAAAGGCGACTCGCTGCAGCAACTTATGCACAACGTCACTTACCTGAAATTTCTTGCCGT +ACGATCTCCTGTAGTATCCCTTATCACAGCTGCAATCTACTTGCAATGCTGCACTGCAAT +AAACGTACTACAAAAGCTGCATACGTTTTGATCAGGACACCTCGTGCGGACGTGCTAAAA +AAAATTTCCTTTCTGCTGCTCTTATTGACGCTAAAACCTTAAAACCTACAAACAAAACAA +TTAAATAATAACAAATCAAATAAGACAACCAAATAATACACTTACCTCATTGACTGCAGC +TAAATCGCTGACCCACATTCAGTGCAGCCGACAGCAGGAGACGGGCCCGCAAAAGCAAAA +CAAAATCGCCAATTTTGCGATTATAAACACGAAAAATTGACAATTTTGCGATGCCGTCTC +CGCCTCCTGATGCCACTGCATTGACAAGCATCACTAGCGAGGAGCTGACACCACACCAAA +AAGCTGTAAAATCCGTCCACAAATTGTATATTTTGCCTCAGTGTCGTATCTGCAATGTTT +TTCCGATAACCTGTAAGGAAAGAAAAATTAATAAGAAAATTATACAAAATTAATTAAGGA +CGACAGAAAATAGCAAACCAGACAGGCAAATTAACAGATACAAATATGAGACTCCATCCT +GCTGCCGACACACAAGTAAATCCTTCAACTCGACAACAGGAGACGGGCCTTGCAAAAGCA +AAACAAAATCGCCAACTTTTGCGATTATAAATACAAAAAATTGACAATTTTGCAACGCCG +TCTCCACCTCCTGTTGCCACTGCATTAATAAGGATCACCAGCGCGGCGTGACGCCACACT +AAAAGGCTGCAAAATCCGTCCACAAAATGTATACTTTTCCTCAGTACAATACTTTCTAAT +GAACTTCCGCCAACCTGCAATGAAAAGAAAAGAAATAGGTATATAAAACAAAACAAACAA +AAGGACAACCTAAAATTAGCAAACCAGACAGGCATACTAGTAGATGCTAATATGCAGCTC +CATCCTACTGACGACAACCACGCAACTCCTTTCTCCAAGACCGCAAATACTGAAACAAGG +AAGCACAAGCTAATACTGGGAATTATTTATTTAAACAAAAATACTTATCTAATTGCCAAT +TCGACGACTCCAAATCCGCGGCTAACCGGCGGCGATGGCCCATAAATAAAGGGCCTCCTA +ATTAATTACAAAATGTACCTGAAAAACATAAAATTAACGCAACTATAATTAACGCAATTA +ATAAATCAAATAAATACAAGTATAATACTTACCTCCAAGCAAACGTACCTGAAAAACAAA +ACCAAAAAAAAAATTAATGCAATAAATAAATCAAATAAATACAAACATAATACTTACCTC +CAATTTACCTCCCAGCCAATCTACCTGAAAAACATAATCTAATACAATCTCAAAAACAAA +TAACAAATGTAATACTTACCAAATTTTAATTTTGTATTCATTTCCATGACCCCAACGCTG +CAACTGTCCTCGGCAACAATTCCTGTTCCGGCGGCTCCATGCTGCCAATCCTGACGCACT +GGCCACAAGACGCGGCGCTGCTGGCAATCTCTCGATGAACAACCGATCTACAATTTCCAT +GACGACTCCTCTGTCACGATGAGACAGAAGACACCACCAACGCCAGCAGCTCCAAAACAA +TACAACAACGGCCGCGCGGAACCCATCTTCAGAATTCCCTCTTCCTGACGACCGGCGAAC +GAGTTCTGGAATAAACAATGTATTAATTGCAAACATCTACCGATGAGGGTAGAAGAGATA +CTCACCAAACGACTGCGGCGCGGGAACAAACTAACTGCAACGCCGGCCGGACCTATTTGT +TGCAAGTGGCGCGCATCCAGCGCCTGCAACATGCCCCAGCCCAAGTACACAACTACTTAC +CTGCAACGTCGCCAGAGGCTCCCAGCGAATCGGTGCTTCCGTCCTTCTGGCGGGGGTACC +TGAAAAGAAACAAATTAAACAATATTAATCCTAAATTTCAATGTTTTTTGTAAAATAATT +TAAATTGTTAAATGTAAACAAGCCTTGCAATATGTTAATGTTACCAGTCCATGCTACTGT +CTAAAAGCCAAGAATACAAAAAATACTAATTATAAACTAACTCACCACGCCCAACCCCCA +AACTCACCCCATGCAATGTTAAACCTATAAATTCAAATAATTGTACCTATATATTGCACA +TACTGTAATCAAAGGCAAAATAAATCGTGGATGCGGAACAGAATTTACTCTGTCTCCGTA +CCTCCACCAGCAAAGTTAAAAAA +>DMIFACA +CATTACCACTTCAACCTCCGAAGAGATAAGTCGTGCCTCTCAGTCTAAAGCCTCGCTTCG +CGTAAGCCCAAAACTCTTATCAGCAAAATCTTGATAAACAAATATCAACCACAAAGAGAA +AATAAAAAACTTAACAACAAAAACAACAATACCGCTAATCCGGGCTCAAGCCCTTAACCA +ACAATCATGACAGACCCACCAAACATTTACAAAATCACTTCAAAAACATACCAATCCCAA +TTAGGCGAACCTAAATTTATAATTATTAAAAGAAATGACAACAACTCTTTCGAAAGAACT +TCACCATTCATCATAAAAAAATCGGTGGACTTTGCCTGTGGAGGAGAAGTTGAGGGATGC +AAACGTACAAGAGACGGCAACCTGCTAATAAAAACCAAAAATGAATTACAAGCCAGAAAA +CTCCTAAAACTAACAAAAATTGCAGATGAGGATGTAACAGCAAGTGAACATAAAACATTA +AACTTCTCTAAGGGAGTTATTTACTGTAACGACCTTAGACACATCGACGAAGACACAATT +CTACAAGAACTAAAACCACAAAAAGTATCTGAAGTTAAAAAAATAATGAAACGGCAAAAC +CCCAACTCTAACTCCGACACCAACAACATCACATTAGTTGAAACTGGACTCATAATTATA +ACCTTTGAATCGCATAAGCTCCCCGAGATAGTACGAATCGGGTACGAAACAGTCCGAGTA +CGAGACTATATCCCACTCCCACTTCGATGCAAAAAATGCCTCCGCTTCGGTCATCCAACA +CCCATATGCAAAAGTGTAGAAACTTGCATCAATTGCTCTGAAACAAAACACACAAACGAC +GGAGAAAAATGCACAAACGAAAAAAACTGCTTAAATTGCCGAAATAACCCAGAACTTGAC +CATCAACACAGCCCAATTGACCGCAAATGCCCTACGTTCATAAAAAACCAGGAATTAACA +GCAATTAAAACCACACAAAAAGTTGACCATAAAACGGCCCAACACATATATTTCGAACGT +CACGGCTTCCAAACGAAAAACACCTACGCCAAAACACTTACAAACGGCACAACCCAGAGG +ACAACAAACACTCCATCACCTAATATTCACACAAACACAACCCAATCACAACAACAAAAT +CCGCACCACACACCCAAATCAGCAGCACAAAACACTTCAGCTAAGACACCAACAACTGAA +CCAGCCAAAACAACCTTACTATCCAACCAACCACACCAACACCACCACCACCACAGCTAC +GACAAACTAGAAGACATGGATACCGACTACACACCTACCAGAAAACCATCTACGACATAC +TCATCACAACTCACAGAAGACCTAAAAATAAAAATCTTCCCTAAAGATAAGTCCAATAAC +CTATCCATAAACCTTAAAGCATCAAAACTAAAGGCCAAAGCCCACAAAAACAAGCACACT +AACAACAGCGACAGCGAATCCATATAGAACTCTACACAAAACCCTAACCGTTAACACTAC +CTTTAAGTAAGTTATAAGCTTTAATTTTCTCACAAATGTCCCTAACTATAATCCAATGGA +ATCTAAAAGGATATCTAAACAACTACAGCCATCTCCTTATTCTAATCAAAAAATACTCCC +CCCACATAATTTCCCTCCAAGAAACCCATATACAATACACTAATAACATTCCAACCCCAA +TAAACTACAAACTATTAACAAATATTGCCACCAACAGATTTGGGGGGCGTACGACTACTA +GTGCATAAGTCAATACAACACACTGTCCTCAACATAACAATCGATATAGAAGCAATAGCC +ATAAATATAGAATCTAAACTTAAATTAAACATATTTTCCACATACATTTCTCCGACCAAA +AACATAACTAACCAGACACTCCATAACACATTTAACATACAACAAACACCCTCTCTAATT +ACGGGAGATTTTAATGGATGGCACCATCCTGGGGCTCCCCAACAACAAATAAACGAGGAA +AAATAACTCATAGATTCATTGACAACATGCACCTTATCCTGTTAAACGACAAATCTCCCA +CACACTTTTCAACACACAATACATACACACACATAGACCTCACACTCTGCTCTCCAATCC +TAGCCCCCCACGCCAAGTGGAAAATACTAAACGATCTTCACGGTAGCGACCATTTCCCTA +TTATCACAACACTATTCCCAACAACCAATCCACAAAAATTCTACAGACCCTTTTTTAAAC +TCAAAGAAGCCAACTGGGAACAGTTCAACGCTCTTACCCACCAAACCAACAAGAAATACC +CCACCTCCCACAACGTAAACAAAGAAGCCGCTCTAATCAATAGAATCATCCTTTATAGCG +CAAACCTCTCCATCCCACAAACCTCACCTAACACACATCCATACAGGGTTCCATGGTGGA +ATAAACACCTCGACCAATTACGTAAAGAAAAACAACTTGCCTGGAAAAAATTAAACCGCA +CAATTACTGTTGACAACATTCTAGACTATAGACGCAAAAACGCAATATTTAGATACGAAC +TAAAAAAGAGGAAAAAAGAAGCTTCCAGCTCTTTCACCTCAACCATCCATCCCACTACTC +CCTCATCCAAAATATGGGCCAATATAAGACGCTTCTGCGGACTTAACCCAGCAAAACAAA +TTCATGCCATCACAAACCCAGTAAATAACGAGACTACATTGGCTAGCAACGAAATTGCTA +ACATATTCGCACAACATTTCTCTGACCTCTCCGGCGACTGGAACTTCTCAGAGGAGTTCC +GGAACAATAAATATAGAAATAACATACATCTCTACACCCCCTCTCCAATAGCCCAAACCA +TAGAAGAGAACATAACGTATCTAGAACTTAGCTCAGCACTACAAACATTAAAAGGATGTG +CTCCAGGACTAAATAGAATCTCGTATCAAATGATCAAAAATAGCTCCCACACAACAAAAA +ACCGAATAACGAAACTATTTAATGAAATATTCAATAGCCACATACCTCAAGCCTACAAAA +CAAGCCTAATCATCCCAATCCTTAAGCCAAACACCGACAAAACGAAAACTTCCTCATACC +GACCCATCTCCCTCAACTGCTGTATAGCAAAGATACTTGATAAAATAATTGCGAAAAGAC +TCTGGTGGCTAGTGACATATAACAACCTAATTAACGACAAACAATTCGGGTTCAAAAAAG +GCAAATCGACTTCGGACTGTCTACTCTATGTAGACTATCTCATAACGAAGTCAAAAATGC +ACACCTCCCTCGTCACTCTTGATTTTTCAAGAGCCTTCGATCGAGTAGGTGTGCACTCCA +TAATCCAGCAATTGCAGGAATGGAAAACGGGTCCCAAAATAATAAAATACATTAAAAACT +TCATGAGCAACAGAAAAATAACTGTCCGCGTCGGTCCGCATACATCAAGCCCGTTACCCC +TATTCAACGGAATCCCCCAAGGTTCACCCATATCCGTAATACTTTTCCTCATAGCATTCA +ACAAATTATCCAACATCATATCCCTACATAAAGAAATTAAATTCAACGCATATGCCGACG +ACTTCTTCCTTATAATAAATTTCAACAAAAACACAAATACAAATTTCAACTTAGACAATC +TATTCGACGATATAGAAAATTGGTGCTCCTACTCAGGGGCATCGCTTTCCCTATCCAAAT +GTCAACACCTCCACATATGCAGAAAACGTCACTGCACATGCAAGATAAGCTGCAACAACT +TCCAAATTCCTAGCGTTACGTCCTTAAAAATTCTAGGAATAACCTTAAACAACAAATACA +AATGGAACACACACATAAACCTACTTCTACCCAAACTACACAACAAGCTAAATATAATAA +AATGCCTATCTAGTCTTAAATTTAACTGCAACACGCATACACTACTTAATGTCGCAAAAG +CAACAATTATAGCCAAACTAGAGTATGGTTTGTTTCTGTACGGCCATGCTCCCAAAAGCA +TTTTAAACAAAATAAAAACACCGTTTAACTCCGCTATCCGTCTAGCTCTCGGCGCATATC +GCTCTACCCCAATAAATAACTTACTTTACGAATCGAATACTCCCCCCTTAGAAATGAAAC +GAGACCTTCAAATAGCCAAACTATCCCAAAACCTAATCCTCTCCAAAAACACACCAATAC +ATAAGTTCTTAAAGCCTAAAAAAGCTAATAAGAAAAAAACATCAACAATAGACCGAACAA +TCAAACTTAGCCTAGAACTTAATCTACCCTACAAACCAATAAAACTCCATAAAAACAAAC +CACCATGGACCCTCCCCAATCTAATAGACACGTCACTTAGAATCCATAAGAAAGAACAAA +CATCTCCAGACCAATACAGAAAATTATACGAACACACAAAGAATAACCTCAAAACACACA +ATTTCATATTCACTGACGGTTCAAAAATTAATTACACAATATCATTCGCCATTACAACGG +AGACAGACGTCTTGAAATACGGCATACTGCCCCCATATTCATCCGTCCTCACCTCCGAAA +CAATCGCCATCCTAGAAGCAATAGAACTTACTAAAAACCGAAGAGGCAAATTTATTATCT +GCTCCGACTCCCTATCAGCAGTAGATTCAATTCAAAACACAAATAATAACAGCTTTTACC +CAAGCAGAATACGATCGCTAATAACGCAACACGCACCTAAAATTAAAATAATGTGGATTC +CTGGCCATTCAGGAATAAAAGGAAATGAATTAGCCGATCAAGCTGCAAAATCAGCAAGCA +GTATGCCACTTATCCTCACCCCAAACATAAATACCACAGATATAAAAAAACACCTTAAAG +CCGACCTTGCGACAAAACAGAAAGAACACATAATAAACTGCAGTCCATGGTACCAATCTA +TTAACACGAACACCTCACACCCATGCGATTACCTTAAACAATCCCACCCAAATTGGACCA +GACTCGACCAAATAAAAATAATACGACTTCGACTAGGACACACAAACATAACCCACCAAC +ACTACCTAAATCCCAATTCAATACCAACTTGCCCGTTTTGCCAAGGTGATATTTCTTTAA +ACCACATATTTAACTCATGCCCATCCCTCCTACAAACCAAGCAAGATATATTTAACAACA +CCAACCCTCTAGACCTTCTTAGCAAACCCAATCCAGATAACATACAAAAACTCATACTTT +TCCTCAAAAAAACTAAATTATACCACAAAATCTAAAAACAAAACAGGCATTTGTACATAA +CAAGCCAGCAATTAGTTACCAAATTAGATATTAACTAAATTAAGATATAATAACATTGTA +AATAAATATAGCTGTAAGCCCCGTAGCTAATGCTATACTATCTAAGTTAGTCTAGTTTTG +TAAACTATTCTATCTATCATAATAATAATAA +>DMLINEJA +AAAAATCATTCACATGGGAGATGAGCAATCGAGTGGACGTGTTCACAGAAGTCGCGAGAT +AAAACAAAAACGTAATTGTGATCCATCACAAACATCTGCGCAGATCGTGTGCTTATCTCA +CAAACAAAATCTATTTTTAGTCACTGCATAACGGTGACGGCTTCGGTTCGCGAAACTTAT +CAGCAACTAGCAATTTCTAAGCTGTGTTGTTTTTGCCCCTCGCCCTGCGCGCTGCGCAAG +CGGGAGGTTGTTACAATTTACCTTACAAGTAAACCGGTAAATCTTATCGTGTTTAGTAAA +TATCAATTGCATTATACGGCATAAGTATAAAGACAATTGATATAATGGAGAATTCATTTG +CTCAATCGCGACCTAGCAATGGGTGCGATAAATTTGAGAAAATGAGGAAAGTAGCAGGTG +TTGAGCCAGGAGAATTACGCTCCCAACTCCGCGCCAGCTGTGCAGTTGTTTCCCCTAACC +TGGAAGGTATGCCAACTCAATCTGCGGTCTCCAGCTTAATGGTGACAATCAGCAGCAACA +CCAATGCAAGTGTTACCTGCACTATTTCTAACGTACAGGCCAACATGATCTGTACTCCTA +CATACACTGATTGCACAACCGTGACCACTAGCATTTGCCCAACTACGCCTTATGACAATG +GACTGCCGACACCTCTGTCATCACTGCCCAATAAGCCATCTAAAGCGAATTGCCCCTTTC +AAGCACATGATCGTACTGTCAACAGGAAACGAAAAGGCGTGTCTCAGCCCCCATTACCTA +TCCTCACCCCTTCTCCAAGCCGTAAAACTAAAAGGCAGGCCACTATGCCACTCAATGAGG +AGGCCTCTACCTCCACTGCAGCAGCATTAAATAACAATCGCTTCGCGCTTTTGTCCGCTG +AAGCGGAGAATATGGAGCAAGACGTGTCGGATGCTGATTCTGACATTGAAGACTCTGCTG +CCCGAGATGGTGGTGGACAATCCGCTAAATATAGCAAACCCCCAGCCATATGCGTACCAA +GTGTAAGCGATCCGGTCACCTTGGAACGGGCTCTCAATCTGAGCACCGGCTCCTCAAACT +ACTACATCCGCATTTCTAGATTTGGTGTATCCAGAATCTATACAGCCAACCCTGATGCTT +TCCGCACCGCTGTAAAAGAACTAAATAAGTTAAATTGTCAATTCTGGCATCACCAACTTA +AAGAAGAAAAACCCTACAGAGTAGTGCTTAAAGGAATCCATGCTAATGTTCCTAGTTCGC +AGATAGAACAAGCATTTAGTGATCACGGCTATGAGGTCCTTAATATCTATTGCCCCAGAA +AGTCTGACTGGAAGAACATTCAGGTAAACGAAGATGATAATGAAGCTACAAAAAACTTCA +AAACTAGACAAAATTTGTTTTATATTAATCTTAAACAAGGCCCGAATGTTAAAGAGTCTC +TTAAGATAACTCGACTTGGCAGATACAGAGTCACTGTTGAGCGCGCTACACGTAGAAAAG +AACTGCTACAATGTCAAAGATGCCAAATTTTTGGACACTCTAAGAACTATTGCGCCCAGG +ATCCTATTTGTGGTAAATGTAGTGGTCCCCATATGACCGGGTTCGCTTTGTGCATAAGTG +ACGTATGTCTGTGTATAAATTGTGGTGGTGATCATGTCTCGACAGACAAAAGCTGCCCTG +TCAGAGCAGAGAAAGCCAAGAAGCTAAAACCAAGGTCCAGGCTACCGATGACTAATAATA +TTGCCACACTCAAACCTCCACAACGTTCTTCAAGCGGTTACATACCAGCTGAGGCATTAA +GAACCAACATCTCTTATGCTGATATTGCTCGACGCAACACGACTCAATCTAGGGCTCGTG +CTACTGTGCAGGCTGAAGTTATACCAACGTCGGACAATAGCCTTAACAATAAATTTATGA +CGTTAGACAACTCCATTCGGGCCATCAATACGAGAATGGACGAACTATTTAAGCTTATAC +ACGAAACTGTAGAGGCTAATAAAGCTTTCAGAGAACTGGTTCAGGTTCTAATTACACGTA +TTCCTAAATGACTCAACCAACCTTAAAAATCGGATTGTGGAACGCTCGCGGATTAACAAG +GGGCTCTGAGGAGCTTCGGATATTCCTCAGCGATCACGATATAGACGTAATGCTTACCAC +GGAAACACACATGCGAGTTGGTCAGCGCATCTATCTCCCAGGGTATCTTATGTATCACGC +CCACCACCCCAGTGGTAACAGTAGAGGTGGCTCTGCAGTCATCATAAAATCTAGACTTTG +TCACAGCCCTCTGACACCTATCTCTACTAATGACAGGCAGATAGCGAGAGTGCACCTGCA +AACATCGGTTGGGACCGTCACTGTAGCTGCTGTTTATCTACCTCCAGCAGAAAGATGGAT +AGTAGATGACTTCAAATCCATGTTTGCTGCGTTAGGCAACAAATTTATTGCTGGTGGTGA +TTACAATGCCAAACATGCATGGTGGGGGAACCCAAGATCCTGTCCTAGAGGTAAAATGTT +GCAAGAAGTCATTGCACATGGGCAATACCAAGTTCTGGCTACGGGCGAACCCACTTTCTA +CTCTTACAACCCTTTGTTAACACCATCAGCCCTTGATTTTTTTATAACCTGTGGGTACGG +CATGGGCAGGCTAGATGTACAAACTCTCCAGGAACTCTCGTCGGACCATCTTCCTATTCT +GGCTGTATTGCACGCTACGCCGTTAAAGAAACCACAACGCGTACGACTACTTGCCCATAA +TGCTGACATAAACATATTCAAAACCCATCTTGAACAGCTGAGTGAGGTAAATATGCAAAT +TCTGGAGGCGGTGGACATTGATAATGCCACAAGCCTTTTCATGAGCAAACTAAGTGAGGC +TGCTCAGCTTGCTGCACCGAGAAATCGGCATGAAGTAGAGGCCTTCAGACCACTTCAACT +TCCTTCCAGTATATTGGCACTGCTCAGGCTAAAACGAAGAGTTCGAAAAGAATATGCTAG +AACAGGTGATCCCCGCATGCAACAGATCCACAGTAGACTGGCCAACTGCCTGCATAAGGC +CCTTGCTCGAAGAAAGCAGGCCCAAATAGATACCTTCTTGGATAACTTGGGTGCTGACGC +GAGCACAAATTACTCACTGTGGCGTATCACGAAACGGTTCAAAGCTCAGCCCACCCCAAA +ATCAGCAATCAAAAATCCGTCTGGTGGCTGGTGTCGCACTAGCTTGGAAAAAACTGAAGT +GTTCGCTAACAACCTTGAGCAACGTTTTACACCCTATAACTATGCACCGGAAAGTCTCTG +TCGTCAGGTTGAAGAATACTTGGAATCGCCCTTTCAAATGAGCCTGCCTCTGAGTGCTGT +CACACTGGAAGAAGTGAAGAATTTAATAGCCAAGCTGCCACTTAAGAAAGCTCCTGGAGA +AGATCTTCTTGATAATAGAACCATTAGACTTCTCCCAGATCAAGCATTGCAGTTCCTTGC +CTTAATATTCAACAGCGTTCTTGATGTTGGCTACTTTCCGAAAGCTTGGAAATCGGCGAG +CATAATTATGATCCATAAGACTGGAAAAACACCGACAGACGTTGACTCGTACAGGCCCAC +CAGCTTACTCCCATCTCTGGGTAAAATTATGGAGAGGCTGATCCTAAACAGGCTGCTCAC +ATGCAAGGATGTTACCAAAGCGATTCCCAAATTTCAGTTTGGCTTCCGGTTGCAGCACGG +TACTCCTGAGCAACTACATAGAGTAGTGAACTTTGCTCTGGAAGCTATGGAAAACAAGGA +GTATGCAGTAGGTGCCTTTCTTGATATTCAACAGGCATTTGACAGAGTCTGGCACCCTGG +GCTCCTGTACAAAGCGAAGAGGCTGTTCCCGCCGCAGCTATATTTGGTTGTTAAAAGTTT +CCTGGAAGAACGCACATTCCACGTCTCTGTTGATGGGTACAAATCATCAATCAAGCCAAT +TGCAGCTGGAGTTCCTCAAGGAAGCGTTCTTGGCCCAACCCTATACTCAGTTTTTGCTTC +GGACATGCCTACTCACACACCAGTCACAGAGGTAGACGAAGAAGATGTGCTCATAGCCAC +CTACGCTGACGATACTGCTGTGCTCACGAAAAGTAAAAGTATCCTGGCTGCCACTTCTGG +TCTACAGGAATACCTGGATGCATTCCAGCAATGGGCTGAGAACTGGAATGTGCGCATCAA +CGCTGAGAAGTGTGCCAATGTGACGTTCGCCAACCGAACAGGTAGCTGTCCGGGTGTCAG +TCTGAATGGAAGACTGATCAGACACCATCAGGCTTATAAATACCTTGGTATTACCCTCGA +TAGGAAGCTCACCTTCAGCAGGCACATCACAAATATTCAGCAAGCGTTCAGGACCAAGGT +TGCTCGGATGTCTTGGCTCATTGCACCACGCAACAAACTGTCGCTTGGCTGCAAGGTCAA +TATTTACAAGTCCATATTGGCCCCCTGCCTGTTCTACGGCCTGCAGGTATACGGCATTGC +TGCGAAGAGTCACCTTAATAAGATCCGGATTTTACAGGCGAAGACCTTAAGAAGAATTTC +GGGGGCTCCTTGGTATATGAGAACAAGAGACATCGAACGCGACCTCAAGGTGCCCAAATT +AGGAGACAAGCTCCAGAACATCGCCCAAAAATATATGGAAAGGCTTAATGTACACCCCAA +CAGCCTAGCAAGGAAGCTAGGAACTGCAGCTGTGGTCAATGCTGACCCTCGGACTAGAGT +CAAAAGAAGACTCAAGCGACACCACCCTCATGACCTCCCTAACCTGGTTTTGACCTAGAA +AGTCTTAGTTTTAAAATTCATTAGAATAATCAAATAAATAATAATTACTATGTTATATCA +ACTATTATAATTCTCCCTATCATTTTTAGATTAAAAATCTGTTAGTCTTAAGTAACCAAG +ACACATTGTAAAATAAAATAATTTAAGCAGATCAAATTAAGTTGCCGCATGGGTAACAGT +GCGTTGATCAAATAATAAAAACATCATAAAAAAAAAAAAA +>DMTRDNA +CACTATGGGGCATTTGGCCTGTTTTTTTTACAAAAATTAATACCTCCTAAACTATTGGAG +ATATTTGGATGAATTTTTTTTTATGCGTTACACATGCCTCCAGGAATATTTTGGAAAAGT +GGGCGTGCCCCAACTCCGCCCCATTTTTTTTTTTTTTTTTTTTTTTTTTTAATAATATAT +TTTTAAAGTTTATTTTTAATTTCAATAATGTATAATTCATAACCGTCTTCCTCTTCACAA +TCAGTAGAGTCTGAAGAATTTTTATCAGGTTCAAATTCGCAAGCTAACATTTCAATGACT +TCTGGTGGAAGAGATAGTCGCTTATGTTTTCGCCTCTTTAAATTTATTGATGATATTATG +GGATCCGAAGTATCCATTGCTCTGTAAAAGACATCTGCGAAGCTACTAATAGTTTTTGCC +GTGGCTGGCTTCAACAAAAGAATTTTAAGTATGGCTGCAAGATCCCGCAGGCAGCACTTC +CGTGCAGCTTGAACCAAAAGACGTTCGTTGTGTTTCTGCGCCCTTACGAGTTCATCTGCT +TGCTGTCTTGGGCCACTCAAATTTTTTAAATAATATGACGTTTTCGGGAGTCCAACTAAT +TTCCTTTCCTATTTATTTTTCTCCTTTACCTTCAGGACTAGGTGTTCTTCTAACCAATTT +GAAAAAAATTTTAAAAATTCATATATTTTTCGATTGCATTTTCTCCAATTTCGTAAAAGA +TTGACTGAAATCATTCGTTATTATTATTATTAGTTAATCGTTTATTAAAGTCTAGCTTGC +TATCAGAAAAATGCCCACTGATAAAAGTGCAAATAGAATTTTCCTTTTGACGAACACCCT +TTTGCGTGCGCCACACTTCCAGCAGGGCAGCATTGGAAATCGAGATATTGCTCCCTAAAA +AATGAAATTTCTCAAAAAACCGCAAAAAACGCACATAGAGACTACCTGATATGAGTTAGG +AATTGAACACACTACAACATGGATATAAACACTTACTGAACAAATTTGAACAAATTGTTG +TAGCTCTATTCAAAGTTGAAAATTTTTTCAAACAACTACATCTTGACACCACTTGTTAAA +TGTACAAATTGTTAGAAATAGGCGCACACAATAAACAATATATTAATAACAACACATAAT +AAGAACCTAAAGATTGATTATCCATTTCAAATTATACTCTCCTTCTTCTTCTTTTTAAAT +TTTAACACTTTGAAAGTTAAGCTAAATTTTGTGCGCAAAGCAGCCACGTGGTATATGCTC +GCAACAGCCGACTTTAACAGCTGTTATTATAACAGTGCATTGTTAAATTAACTTATGCGG +GCTATATCATAACAGTTTAACGTATTTCCAATGTATTAATACTAAAATACTTCAAATTTG +CATACTTGTGAAAAACACATTATTGTAAAAAAAACAGGCCAAATGCCCCATAGTG +>DMRTMGD1 +TGTAGTATATACGAATATAATAACAATAATAATAACAATAATAATAATAATATTAATAAT +AATTATAATATGAATCATAATAATAAGTCAACTAATAAGTAAACTTAGGACCACCCTAAT +TCCTTAGGGTCACCCTAGTAGATCTTTAGATACACCCTAATACTAAATATGCGAATTCAG +GATGTACGCCTTTAGGGGTCGGACTCGACTCCCATTGGTTATCGAGTATGAACTTCATAC +ATACATATTGCAGAATTTGCTAGTGTCAGCACTTGGCTGTCACAAGAGATCTCCCTGTAG +ACCACACTAAGATCAGTTATAAATCAGGAATAGATCTGGAATGTACACTCGCTTAATAAA +AACCAAATAAAGATAAAATGACCAACTGCGTTTTGAGACTTTATTAACTACATCAGAAGT +ATTAGAATTCAAATTAACTACATGGCGACCGTGACAAAGGATCGTTATAAGTTGTAGCAG +AAGCTAAAGGAAACCGCTTGTGATAATTTTCAACTTCGATGCTCATCCACCAAGACGGCG +GCAATTATGAAGAAAAAAGCGATCTGAGTGAGTAGAGTGTCAGTGTGATGGGAAAAAACA +GGGGCGGAGTTCGACATAATATAAAAAAGAGAATAGCGCACATAAAGTGGCTATTATATA +CGAACACTCCACCACCCCAATGGTCGAAAGCTCAAAAACTACAAGCTGAGCTAGACCACT +GTGTCGAATATCTCAAGAAAAAAATCCCCACCACACGCGCTCACTCAGAAAATCAAATAA +AATCGTTAACAATTAACAAAACTCCAACTCCCAATCCGAAAAGCCTGCCTGTTTTCAAGA +AAAGATGCCCGAACGACTGCGAGGGACCACTGTTCACACCGCATTGTGAACATACGTGCA +GACATTGCAGCTCCACCACATAACCCCTAAATGAGGAAATCATCATCAACGTGGTGAGCA +GCCCGCTCATTACGTCATCGAGGGAGTGTCAGCGTGCCAACCCGGCGACGACCAGATGAC +GCAGGAGGGTCAGAGTGAAGCAAATAGGAGCTGAAAAATAAAATATTTTTTTTGTTGCCC +TGCGTGGCACACCCTCGATGCACTGCGCTGCATATTAATATTACACAAAATATTGTAACA +TTGAGCGGAACTTTTTCTGCCCGATGAGAAGAATGGCCCGTAAAGCCATACACCAACTAG +GTAGGAAAATGTAACTATATTGAACAAAAAAAAAAAAAATCAAAACAACATATTTTTAAA +GTAAAATAAACCAAAACCCAAAAATAAAAAAAAAAAAAAAAAAAAAAAAAATAAAAATAT +ACAAAAATGGGTTGGTTTGGATCTGACGATAGTCAGACAAAAGATAATACGGCCAATGTG +GTCAATAACTTAAAAATAGTCGACCATACAGATGACATTCAGTCACTGTGGTTACTCCTT +TTGATCATGACGATCGTAACAGTCGCTCAGTTTATATTAACGCTATATGTTAAGCATAAC +AAGATAATAAAGAGGCGTTATATAGGCAAAGCAGAGAATAGTTTGGATAAAATTTGAAAA +AAAAAAAAAAAAAAAAAAAAAAAAAAACATCCGAGATGTATTTTGAATTAAGATGATCTA +AAATTTTTATTTTTAATATCAGAAAACTAGAATGAAAAAAAAAAAAAAAGATTATTGAAG +AAACCTATTTGAGAGAGGCCAAAATTTATAAAGTTCGATTGCATAGATAAATCCATAGTA +TTCTTTAAATGGACTGGCAAGAAATACAAAACGAGCTTAAAGAAATTAAAACAACTTTTG +ACAAGTCTTATAAATGCATGACACCAAATAGAGAAGTGCAACAAGACACTCTCAACAAGC +ATGCGCAGATATTGGTAAGATGCTTTAATGGAGCACGCCAATTAATTTACAGAGAAAGGA +AAAGATTAACAAAAAATCATTTATCACAAGCAGTAAAATTTCTAAACAGGTTCCGTGAGA +ACTTGTTAAACGTCAAGTACAGACACAACTTAAATATTACAATCCCAACGATTTTAAGCA +CACCTATAGTGGCTGAGATCGGTGAGGATATCGAAAGTGTAGGAGAATCAGAAATAGAAA +TAAAAGAAGAGGATCTCCACGATCTTGCAATTCCAGCGGTAATAACATTACCCGAATTAC +TTGAAGAAGAACTTTCAGATTCAAATACAGGAATAAGAATACAGGAAACGGACAAAATGA +CAGACTCTGCCGCAACAGCAAGGGAATATGTGCGACAAATTTCGTCCACAATACCTGAGT +TTGACGGCAAAAAGTTAAACTTGAATAGATTCCTCACGGCTCTCCGGCTGATAGATCTGA +CAAAAGGAGATCAGGAGATGCTAGCGGTTGAGGTAATCAAGACAAAGATACTTGGTCCAT +TATCACACAAAGTTGAAAATGAAAAGACCATTATCGGTATAATAAATCTATTAAAAGCAT +CAGTTAAAGGCGAATCGCCCGATGTCATCAAAGCAAAAATGCTTAGTACACAACAGCGCG +GCAAAACTGCAGCGCAATATACCACGGAGATAGAAAACCTACGTGGGTTGCTCGAAGCAG +CCTATATAGATGATGGTTTAGATTCCAACAATGCAGACAAATTCGCTACAAAGGAAGCCA +TATCTGCAATGACCAAGAACTGTGGGCACGATAAGCTCAAAACCATATTGGAAGCTGGAA +ATTTCAACACGATGAATAGCGTGATTGAAAAATACATACACTGCAGTACAGAAATGACCG +GCAATTCAAATAGTGTATTATTCTATAATAATAGAGGACACTATCGAGGTAATAATTACC +GAGGAAATTACCAAAACAGAGGTAATGGCCGAGGAAATTATAACTCCTACAATAACAACT +ATAGAGGCAGAGGTGGTTACCATGGTGGAAACAGAGGACGAGGTGGTAACCAAAATTATA +ATAGAGGTGGAGGTTACTCAAGAGGTAACCAAAACCATAACTATAAAACAAGTCATGCCC +ACAATGTCCGAAACATACAATCGGAAAACGAACATACCCCCTTGAGCGACAATCTACAAT +AAAATTATACAAAATTAATCTCAATTTAAGCATTTTTATACGATTGAAGAATATGAGTAC +CAATTCATGGGTAACTCTTTTAATAGATACAGGTGCAGAAATTTCCCTGCTTAAATGCAG +AAACAATAATCTTAACGATTTAAATCCAAAAAATACAACAAATATATCAGGAATAGGGCA +AGGGACAATTCAGTCTCTAGGTACACTACATTTAGAAATGTGTATTGCTAATGCAGCAAT +ACCATATGAATTCCATATCGTACCTAACAATTTTCCTATACCAGGGGATGGTATAATTGG +CTTGGATTTCATTAAGAAATACAATTGTATTTTGGAATTCCACGACCAAGAAGATTGGTT +CACTTTGAGGCCCAAAAATTTCAGGAACATAAACATTCCTATTATACATACACTAGATAA +TGAAATAATTTTGCCAGCTAGATCAGAAGTGATTCGAAAGATTCAACTAACATCTACTGA +CACACATGTTCTCATTCCCAACCAAGAATTACAACCTAGCATAATAATCGCAAGTGCACT +CGTAAACACTCAGAACGTTTTGATTCGAATTATTAATACAACTGAAAAAGACGCTATAGT +TAGTAGCGCAAATATAAAAAGCGAATCATTGGATGATTATGATGTATACAACGCAAATAT +AGAAAATAGTGCACAAAGAACTTCAGAAGTATTAAAACTTCTTAAATTTCCATCGTTATT +CAAAAGCGATTTAACAAAATTATGCACCGAATATAGCGATATTTTTGGTCTTGAAACAGA +AACCATATCAGCTAATAATTTTTACAAGCAAAAATTGAGATTAAATGACAAAACTCCAGT +CTATATCAAAAACTATAGAATGCCAGAAAGTCAAAAACCAGAAATTCAAAGGCAAGTTGA +CAAATTAATAAAAGATGGCATTGTCGAACAATCTATTTCAGAATATAATAGCCCTCTTCT +CTTGGTACCCAAGAAATCACTGCCTAACTCGGAGGAAAAGAGATGGCGATTAGTAGTCGA +TTATCGCCAAATAAACAAGAAACTGCTAGCAGATAAATTCCCACTTCCAAGAATAGAAGA +CATTCTTGATCAATTAGGCCGAGCAAAATATTTCTCGTGCCTAGACCTGATGTCAGGATT +TCATCAAATAGAATTAGACGAAAGGTCAAGAAATATAACATCTTTCTCAACTTCAACGGG +AGCATACCGCTACACGCGATTACCATTTGGTTTAAAAATAGCCCCAAATTCTTTTCAAAG +AATGATGACCCTTGCATTTTCAGGTTTAACGCCTTCGCAAGCATTTCTGTATATGGATGA +TTTAGTAGTCATAGGCTGTTCTGAAAAGCACATGCTTAAAAATCTAACCGACGTTTTCAA +ATTATGTAGGCAACATAATTTAAAATTACATCCAGAAAAATGCACTTTCTTTATGAAAGA +GGTTACTTATTTAGGTCACAAGTGTACTGACAAAGGTATATTGCCAGATGACTCTAAATA +TGAGGTAATAAAGAACTACCCCAAACCAGTAAACGCAGACGAAGCTAGACGCTTCGTGGC +ATTTTGCAATTATTACAGAAGATTTATTAAGAACTTTTCTGAGAAATCACGCCACTTAAC +GAGGCTTTGTAAAAAGAATGTTCCATTTGAATGGACAAGCGAATGCAATGATGTATTCGA +ATATCTCAAAAGGAAATTAATGAAACCAACACTCCTTCAGTACCCAGATTTCAGCAAACA +ATTTTGCATAACCACAGATGCTAGTAAACAAGCATGTGGAGCGGTACTATCTCAAGACCA +TAACGGTCAACAGCTACCAGTGGCATACGCTTCAAGAAGCTTTACAAAAGGCGAAAGTAA +TAAGTCCACTACAGAGCAGGAGCTAGCAGCTATTCACTGGGCAATAAATCACTTCAGACC +ATACGTATATGGTAGACATTTCTTAGTACAAAGTGACCATAGGCCACTATCATATCTTTT +TTCAATGAGAAACCCCAGTTCAAAATTAACCAGAATGAGACTAGACTTGGAGGAGTTCGA +ATTCACAGTAGAATATCTCAAGGGGAAAGATAATCATGTCGCAGACGCATTGTTCCGAAT +AACAATCGGAGAACTTAAAGCAATAAATAGACAGATACTAAAGGTAACAACAAGATCAAC +AACAAGACAGAAAAATACCTGCGCAGGTGAAAAATTGCATGAACCAAATGAGAAAGAAAA +TATAAAAATGCCCAATATCTATCAGGTAATCAATAACATTGATGCCAAAAAATATGTTAT +ACTCAAAATAGACAAGCATAAGTGTTTGTTGAAAAGAGGAAAACAAATTATAACACGTTT +TGATATGACTAATTTTTATTCTAATGAAATAATCGATTTAGATCAATTCTTTCAAAGGCT +TAATGAAGAAGCAAGAATAAATAGCATCATTCAAACACAATTGTCACCAAGTGAACAAAT +CTTCGAATTTGTCACTATAAAGAACTTTAAAGAAAAGGGCAATAAAATACTAAAAAATTT +AAAAATAGCGCTATTAAACAAGGTGACTAAGATAGATAAAAATGATAAGGTTCAAATAAA +AGCAATACTGTCTAAATATCATGATGATCCATCAGAAGGAGGCCATTCAGGAATTTCTAG +AACCCTGAGGAAAATGAAAAACTGTTGTTGTTGGCCACGAATGACGAAGGCGATAAGTGA +ATATGTTGAAACATGTTTGAAATGTCAACAAGCCAAGACTACGAAACATACTAAAACACC +GTTGACAATAACAGAAACGCCAGCAACAGCATTTGATAAAGTTTTGATAGATACCATTGG +TCCACTGCCAAGATCAGAAAACGGAAATGAGTATGCTGTTACTATCATTTGCGATTTAAC +AAAATATTTGGTAACGGTACCAATTCCAAATAAAAGTGCAAAATCAGTTGCTAAGGCTAT +ATTCGAAAATTTTATTCTAAAGTACGGTCCAATGAAAACAATCACAACGGACATGGGAAC +GGAATATAAAAACCAAATTATAGACGACCTATGCAAATATATGAAGATAAAAAACATTAC +TTCAACAGCACACCATCACCAGACATTAGGAACAGTAGAACGAAGTCACAGAACTTTCAA +CGAGTATGTTCGCTCATATATATCTGTTGACAAAACCGATTGGGATATATGGATACAATA +TTTTACTTATTGTTTCAACACAACACCATCGGTAGTTCATGAATATTGTCCATATGAATT +AGTATTTGGAAGATTACCAAGACAGTTCATAGATTTTAACAGGATAGACAGAATAGATCC +TATTTACAACATGGATGATTATTCAAAAGAAGTTAAGCTACGATTAGAAATAGCATATAG +AAGAGCTAAAAATATGTTAGACAAGGCAAAAGCCGATAGAAAGATAAAATATGATAGAAA +TATTAGTAACTTTGAATTAAAGATAGGAGATAAGATATTACTTAAAAACGAAACGGGTCA +TAAACTTGACAATAATTATTTAGGACCATATTTAGTTTCAGAAATAGGAGATAATGACAA +CATTACAATTATAGGAAATAAAAATAAAAAACAGATAGTCCATAAAGATAGGTTAAAAAT +TTTTAATTCATAATACATTTTGTTTGGTTGGCCAACCACAAATAAAAAACCACAAATAAA +AAACCACAAATAAAAAACCACAAATAAAAAACCACAAATAAAAAACCACAAATAAAAAAC +CACAAATAAAAAACCACAAATAAAAAACCACAAATAAAAAACCACAAATAAAAAAACCAC +AAATAAAATAAAAACCAATAAAAACATTATAATACAAAACTTTTACTTTGCAAAATATAA +TGAAAATATATATATTTTTTTTAATATCTCTTTAATCATTCATTTCAAATATTAATGTAC +ATTTAAAAAAAAAAAAAAAAATATTATATACTTGAAAATAACTTCATGTTATTACGTTAT +TTTTCAAAAGGAGGGAGATGTAGTATATACGAATATAATAACAATAATAATAACAATAAT +AATAATAATATTAATAATAATTATAATATGAATCATAATAATAAGTCAACTAATAAGTAA +ACTTAGGACCACCCTAATTCCTTAGGGTCACCCTAGTAGATCTTTAGATACACCCTAATA +CTAAATATGCGAATTCAGGATGTACGCCTTTAGGGGTCGGACTCGACTCCCATTGGTTAT +CGAGTATGAACTTCATACATACATATTGCAGAATTTGCTAGTGTCAGCACTTGGCTGTCA +CAAGAGATCTCCCTGTAGACCACACTAAGATCAGTTATAAATCAGGAATAGATCTGGAAT +GTACACTCGCTTAATAAAAACCAAATAAAGATAAAATGACCAACTGCGTTTTGAGACTTT +ATTAACTACATCAGAAGTATTAGAATTCAAATTAACTACA +>DMMDG3 +TGTAGTAGGCTGCACCTTCTACCCTCTTCCTTTACTCTTAGTCATACATACCTAATTATA +CATAGCCAATCTAGTCATAAGCTTATACACTCATACACCCATCCTTAACATACAAATATT +ATCGAGAAACTTATCGACTAATCGACTCGCCACTCTGCAGAGAGCGCGGCAGTCAGTCGC +TGTTGAACCAAGCTAAAGGACAGATCAAAAATAAAAGAGACACGTGAAATTGTATTAGAA +TATTAACTTCTGTAAACGGCGGCTAAAATCTCAGAAGTGGGATTAATAATCCAAAATGGA +CGATAAAATCATCCTGAACGACTTTTCGCTGACAACCCTAAAAGATTGGCTACGTATTCT +GGGCCAAAATACGGAGGGCACAAAAACCGAATTAATCGCGAGGCTGCAAGACATCCCAAC +GGCAGTTCGGGGCGATTGTCCACCGGAGCACCCCCAGAAAAACGCTCCACCAGGAAACGA +CATTTTTTCTTCACTGGATTTTCAGAATTGTGAAATTAACACCGATCACGTAAGTGTGAA +TGCGATGAACAGAAAAGAATCAACCGAAACTGGCAGTGAGAGGGAGACAAACATGTTCGA +GCTACAGCAACTACGCGCAGAGCTAGCAGAAGCGAAGGCAATGCTTAACGGAACACGATC +GAGCTTGCAGTTCCAAGAACAACAACAACCAGAGCAAAGCAAGGCTACAGTTAGTTCCGT +TATCCAGACGGCGCAGTTTACGCAGGCTGGCGCCACAAAAGAGAACACAACATTTCACTC +GCCGCAGCGATCCAACGAGAGAGCGGAGAGCCAGCGTTTTCCAGTTGATGCTCTCGCTCT +CGCCAAAGAGACGATAACCGATTACGATGGGAAAACTTGCGCGCGTGCCTGGATAACAGT +GGTCAAAAATATCGCACGCACTTTCAACATCGATGACAACCATTTACGCATCTTACTCAT +CACTAAACTTAAAGGAAACGCGCAAGTCTGGTTACATGCGCACCCTGCTCGATTGATCGA +ACCAATTGACAATTTGCTTGATCAATTGTCATTGACTTTTGGCGAGCAATCATCCAAGGC +TGAGATCCGGCGAAAATTCGAGAGTCGCAAGTGGAAAACCGAGGAGAATTTCTGCAGTTA +TTACGACGAGAAGATGGCTCTCTCAAACGGGATAAACATCGACGACGACGAACTACTGGA +CCAGATGATAGAGGGCATACCGCTACAAAATTTCCGTACCCAAGCACGGATTCAATGCTT +CTCTACTCCATCGGAGATGCTACGCGCATTTTCGAACATCCGTTTGCCAGCTCGGAGGGA +GCCACCTGTACAGCCAACCGACTACAAAGATGCCATACGATGCGCAAACTGTAATTCAAG +AGGACACAAAGCTGACATCTGCAAGAAGCCCAAACGTGAACCAGGTTCGTGCTACGCCTG +TGGACAACTTGGACACCTGGTGGCACAATGTCCCACAAGGAAGAGCGTTTCATCTAATAA +TTATGTAAGATGGTTTAAAATTAATTTTTTTGAAAATGCTTATAAGCCCATAATTTCAGA +ATGCCTCATAGACTCTGGCAGTCCTATATCTATCATTAAAAAGTCACTTATTAACGAGAC +AATGAAGTTAGCCCTAGTTAATACTTGCTATTTTGGTTTAAACAACTGTATTCTCAAAAC +ACATGGACAAACCACATGTTATGTTTTGAAAGGATCAATAAAAATATATTTTCGTTTAAT +CATTGTTTGCGACCAGTCTATGAGGTATAATGTTATTCTCGGCAGAGATTTTTTAACTGC +ATGCAATTTAAATTTAGACCCGTACACCTTGGGAATGATTGCGTTGAGAAAACCCATGGA +AATAAACAAAATATCAATGTTTACTGAAAATGATAGTCCTGAGAAATCTTTAGAAAATGA +AATTGTTAGTCCAAAATCGTTAGAGAATGAAATTGTTAGTTCACAATCGTTAGAAAATGA +AATTGTTAGCCCCAAATCGTTAGAGAATGAAATTGTTAGTCCAAAATCGTTTAAAAATGC +AACTATTAGTCCGAAATCGTTAGAAAATAAAATCGTTAATCAACAGCATAAAGAAACTGG +TCCAATATCGTTAAGAGATGAAATAGTTAATCAACAAAAGAATGTCAGTAAATCAAAATT +ATCAGAAGATGAAATTGTTAACACTTCAAAAGAAATCGTTAGTTTTAAATTGCCAAAAGA +TAAAAACGTTTACGAACAATTAAATCACAACTTTGATAAGGAAGTACTAAGAATATGTCA +TGTAACTGAAAGTGAGTTAGAATACAAAATAGGAGAAAATGTTAGCAATAGGTTACAACT +AGAATTCGATAGGTTGTTTAGAAATTTTTATATAAATGCAAAAAGGCCAAATGAACCGAC +AGTTAGAAGTGAAATACAATTGTGTTTGAAAAACCCGAAACCGTTTAGCTGTTCTCCTAG +GAGGCTTTCATACACAGAAAAAGACAGGTTACAAAAACTATTAGACGAATATTTGGAAAA +CGGATTTATACGACCAAGCGACTCGGAATATGCATCGCCTATTGTTTTAGTGAAAAAGAA +AACTGGAGACTTACGTATGTGCGTCGACTTTAGAAAACTTAATAAAATGACAATGAAAGA +CAACTATCCTCTACCTCTTATAGATGACTTGTTAGATAGAATGAATGAGAAAACTGTTTT +CACCAAACTCGATCTTAAAAACGGTTTTTTCCACGTGCATGTTAAAAAAGAATCAATAAA +ATACACCTCTTTCGTTACACCATTAGGCCAATACGAGTGGCTGCGAATGCCATTTGGCCT +CAAAAACGCCCCGTCTGTGTTCCAAAGATTTGTTAACAAAATTTTTGCGGATATGATTAG +AGAAAACAAAGTAGTAGTATATATGGACGACATTCTATTGGCAACCGAAAATATAAACGA +ACACTTAGAAACGTTGAAAGAAATTTTTAAAAGATTAGTTGAAAATAAACTTGAATTAAG +AATAGACAAATGTGAGTTTATGCAATCAAGTATAAAATATCTTGGGTTCATAATAAATAA +AGACGGCATAATGCCCAATGACAAAGGAATCGAGGCAATAAAAAATTTCCCAATACCTAA +TAATGTTCATACAGTACAAAGTTTTTTGGGATTATGCTCATATTTTCGACGGTTTATAAA +AGATTTTTCTAGACTAGCTAAACCATTGCATGACATTCTAAAAAAAGATAAACCGTTCAA +ATTTGGTAGTGAAGAAATGATTTGTTTTAATATGTTAAAAGATAAATTAATACAGTCACC +GGTCTTAGCTATATACAACCATAAACACGAAACAGAATTGCATTGTGATGCAAGTTCTTC +TGGATTCGGTGCTGTACTTATGCAAAAGAAGGAGGACCAGAAATGGCACCCAGTTTCATT +CTTTTCAAAACGGACAACAGATATTGAATCAAAATACCACAGTTTCGAGTTAGAAACTTT +AGCCATTGTTTATTCGTTACGTAGATTTAGAGTTTATCTTCATTGGAGGACATTTAAAAT +AGTCACCGACTGCAACTCATTAATTTTGACCCTAAGCAAAAAAGAGCTAAACCCTAGGAT +AGCCAGGTGGGCTTTAGAATTCCAAGGTTATGATTTTGAAATTGTGCATAGGGCAGGTAG +CCGCATGCAACATGTTGACGCACTGAGTAGGTGTACAAATATTATGGTAATACAAACAAA +CAGTTTCGAAGATAATCTAGTTATATGTCAAGGGAAAGATACAAAATTAAAAGAAATCAG +GCAATTGTTAGAAAACACAGAAAATAAATTGTATGAGATGAGAAATGGTATAGTTTACAA +AAAGACAAATGAAAATAGATTGCTGTTCTACGTTCCGATAGAAATGGAAGAACAAGTGTT +ATACAAATATCACAACGAACTTGGACACGTAGGAAGAGACAAAATGATAGAAGCTATAAT +GAAAAACTATTGGTTTCCAAATTTAAAACAGAAGTGTAGCACACATATCAGCAACTGTTT +AAAATGTATTTCATTCAGTCCCAAAACAGGAAAAACAGAAGGATTTCTACACAACATACC +TAAGGGAAACAAACCTTTTGAAATAATCCATATTGACCATTATGGTCCAGTAGACTTGGC +TAGACCGAAGAAACATATTCTAGTGATAGTAGATGCATTCACAAAGTTTGTCAGACTATA +CGCAACAAAAACTACGAACACAAAAGAAGTCATACAATCGTTAAATGACTACTTCAGAGC +ATACAGTAGGCCTAAGTGTATCATATCAGATAGAGGAGCATGTTTCACGTCTGGCGATTT +TGACTCATTTTTGAAAGAATGCAATGTTAAACACATAAAAATTGCAACAGGATCGCCACA +AGCCAACGGTCAAGTTGAACGTATAAACCGAAGTCTTGGTCCAATGATTAGCAAGTTAAT +TGAACCTGATCAAGGTCTACACTGGGACTTAGTCTTAGAAAAGGTCGAATATACCCTGAA +CAATACACTACACCGCAGCATTAAACAGTATCCTAGCATAATGTTATTTGGGTTACAACA +AAAAGGACAAATTATGGATGAGTTAAAAGAAAAAATTGAGGAAATTGGAGAAACGATTGA +AGAAAGAGATTTAGAAAGTATTAGAAATAAAGGCGAGGCAAGTCAGAAAATAGCACAAGC +ATACAATAAAGAATATGTTGACAAAAAACGAAAACGATCAGGAGTGTTCACAAAAGGCAC +TACGTCATGGTTAAAAATTTTGACTCAACAACAGGCATAGCTAAGAAGTTAATTCCAAAG +CATAAAGGACCCTATGTCATAAGCAAAGTTCTCAAAAATGATCGCTTCCTTCTGGAAGAT +GTTGATGGATTTCAAATTTCTCGCAATCCTTACCGGGGTGTATGGAGCATACAGAATATA +AAACACTGGCAAAGAAAAATTAAGAGTCTACAAAATAGAAAGTATAATTTGAGAAACTCT +GTACAAAATAGAAAGTATAATTTGAGAAACTCTGTACAAAATAGAAAGTATAATTTAAGA +AACTCTGTACGAAATCGAAAGTATAATTTAAGAAGCAATTGTAAAACAAAGAAAACAAAC +AAGAAGAAAAGAAAACCAAAAAAATGTTTAAGACCGTTCAAAAGTATCTCCACTAAGAAG +AATAAAATAAGAAACAGGACCCTTAGCTTTAAGAAACGTTAATTGTTATAAAATCCTACG +ATCGGGAGATCTAGTTGTCAGGACGGCCGAGTTGTAGTAGGCTGCTCCTTCTACCCTCTT +CCTTTACTCTTAGTCATACATACCTAATTATACATAGCCAATCTAGTCATAAGCTTATAC +ACTCATACACCCATCCTTAACATACAAATATTATCGAGAAACTTATCGACTAATCGACTC +GCCACTCTGCAGAGAGCGCGGCAGTCAGTCGCTGTTGAACCAAGCTAAAGGACAGATCAA +AAATAAAAGAGACACGTGAAATTGTATTAGAATATTAACTTCTGTAAACGGCGGCTAAA +>DMDM11 +TGTCGTGGCGAAAATAATGAGTATGCGTGTAGTCGCTGTTTACTTCTTCTCCATGTTCCC +TTTGCTATTATGCGTGTTCCTATTTATGAACACGTGGCGAAAATAATAAATGCGTGTAGT +CGCCGTTTACTTCTTCTCCATGTTCCCTTTGCTATTATGCGTGTTCCTATTTATTGTCAA +TGTGTGAGGATGAATAGATGAATTATCTATGAACGGGATTTTGCAAAAACGACTTGCGCT +GCTTGGTTAGAAAGGGAAAACTATATAATGAAAAGGGAATGCCAAAAATTGAGAAGAGAC +AAAGCAGGCTGCACGAAGCTGGAGTGAGGGCATTAATCGTGGAGAAGCCAAAGCAGACGC +AAGTGGACTCGTTGACTGCGCACAGCTGCATAAAATTATATAGTAAAAAGAGATTTGAGC +GACGCTGATATGGACGGACGGACGGACGCGAGGCCCCTGATATTCTTAACCCGACATCAG +AAGTGGGATCTGTGCCACACCCTGCATTTTCTGAGGATCAGTGGCGTGCAGTAGTGGAAA +TGCAAAATCGGAATTTGGCTGAACTTGTAAAAATCATGCAAAAGACGCCGGCACGTGAGC +AGCAACCTAGTTATGATGTTAAGCTACCCAAATTTAACCCTGATGCTGCATGCGTAGAGG +CAGCAAAGTGGTGTTCAACAACCGATATAATTCTAACTGAGCACCCCCTTAAAGGAAGTA +AATTGATCACGGCACTAAGTAACTGCATGGAGGGAACTGCATCTCAGTGGCTAACACAAA +TCTCGTACCAGGGTATGACTTGGCAAGAGTTCCAGGAATTATTTCTGCAGCGCTTTGAAA +CCGAAGAGACGCCGGCCGCTACGTTTTTAAATTTACTCAACAGCCGCCCGACTGCCGCCG +AATGTTACGCGGTGTATGCGAGTCGGCTGGTGACGCAGCTGACTACAAAGTGGCGGAATA +TGGAAATAGAAGAAATTGCCGTTACAACTGTTCTTGCGCATATGGCAAACATTGACAGTC +GTTTGCAGCGCGTCCTCTTCACATCCAATGTGCGTACCAGAAGTAAGCTACAGGCGGAGT +TAAAAGCGTTTACGTTCGACAAGAAGCGACATGCTCGAGATGACAACCTTGGACCTGACC +AGAAGAACCGTAAGGCATCGCCAGTTGTATGCCACTTCTGTTCAAAGCCGGGACGTCGAA +TTGCTGAATGCCGAAGTAAAATGCGACAAGATAGACGGGCGAAACCGCAGCGTGAAAAAT +CAAATGTTACGTGCTATCGGTGCGGCCAACCGGGACATTTCTCCAACCAGTGCCCGAAAA +ACGGAACTGCAGCCAAACAAGATGTGACTCAACAGAAGACTGTTAACCAATGTTGTGTGA +CTGAGCCAAAGGGAAGCTTGCATCAACGAGGTGAGATCTATCCAATTTGTTTCGATTCCG +GTGCAGAGTGCTCCCTTATTAAAGACGACATTAGCAGTAAGTTATCTGGTAAACGTATAA +ACAATACTGTAATGATAAAAGGCATTGGTGGTGGCAGTGTGTGCAGTACATTGCAAATCT +TGAGTGAAGTCACTATAAACGAAAATATTATGGAAATATTATTTCATGTAGTCCCGAACG +AGGAAATGAGGAATGATATTCTGATAGGGCGAGAAATACTTAAACAAGGCTTTTATGTAA +TTTTGACATCCGATAATTTTAAAGTTGTAAAATCAAAAACTGTTAATAATTGTTCCGTTA +CTGAGCGATCGTTTACTTTGTCCGATATTGACACCGAATTAGTCGACAATGAGAAAGCTC +AATTAATTGAGTTACTTGAAAAGCACTCGACTTCATTTACCAACGGGATACCTCATACTC +GAGTAAATACAGGCGAAATGAAAATCCGTTTGATTGATCCAACTAAAACTGTTCAGCGCC +GACCTTACAGACTTAGCCCCGAAGAGAGAGAAGTAGTGCGAATGCAGGTGAGCGAATTGA +TAAGATGTAATATTGTTCGCCCAAGTTGCTCTCCCTTTGCTAGCCCCATGTTGCTCGTCA +AAAAGAAGAACGGAACCGACCGTCTATGTGTTGATTTTAGAGAGCTAAACTCGAACACGA +TTTCGGATAAATACCCCTTGCCGCTTATCAGCGATCAAATTGCTAGACTTCGCGGAGCAA +ATTATTTCACATGCCTGGATATGGCAAGTGGTTTCCACCAAATCCCGATTCACCCTGAAT +CCGTGGAATATACTGCATTTGTGCCCGACGGCCTCAAAAATGCGCCATCTGTTTTCCAGC +GCACAGTCATAAATGCACTTGGTGACCTTGCTAACTCTTTTGTAATCGTTTACATGGACG +ACATAATGGTAGTATCGCCAACCAAGGAATTGGCTTTGGAAAGGTTAAAAACTGTTTTGA +ATGTTCTTACAAAGGCTGGTTTTACCTTTAACCTTGCTAAATGCAGTTTTCTCAAAACAA +CGGTTCAGTATTTAGGCTATGAAGTGCGAGCGGGAGAAATTCGTCCGAATGTGCGAAAGA +TAGCTTCTTTAAGCTCCTTGCCTCCTCCTCAAACTGTCTCCGGCGTTAGACAATTCATTG +GCTTGGCCTCTTACTTTCGCAAATTCGTGTCTGGATTCTCCCAACTTATGAAACCATTGT +ATTCACTTTCGTCTGGTAGCGGCAAGATTACATGGAGCGCTGAGCTGGAAGAGATCAGAC +TTAAAGTTGTGACGATCCTCACAAATGAGCCTGCTCTGGTAATCTTCGACCCGCAATATC +CTATTGAGTTGCACACTGATGCAAGTGCCTGTGGATATGGAGCGATACTTTTGCACCGTA +TAGAAAGTAAGCCCCATGTAATCGAATACTTCAGCAAAACAACTACCTCTGTTGAATCTA +GATATCACTCCTACGAGCTGGAAACCTTGGCAGTGGTAAAAGCCGTTAAACATTTTCGCC +ATTACCTAATTGGCCGTGAGTTCGTTGTCTATACAGACTGCAATTCATTAAAAGCTTCTC +GCACAAAAATAGATTTAACCCCCAGAGTTCACCGCTGGTGGGCCTACTTACAATCGTTTA +ATTTCGAAATTCAGTATAGAGAGGGTAAGCGTATGGCTCATGTGGATTTCCTATCAAGAA +ATCCTTTATCACCCGAACACATTTTGTCAATAAACAAGATTCCCGAAAAACGAGTAAATC +TGTCTGAAATTTCAAGTACTTGGCTTCTTGCTGAGCAACGGTTAGACCTTGAGATAATAG +AAATTGTTAACAAATTGGAGTCAGATGAATTAGCCGAAAACTTGGCCAAAACGTATGATT +TGCGAAAAGGTGTATTATATCGCAAGGTCCAAAGACGAGGTAGAACAAGTTATTTACCAG +TTGTACCCAGAGCTTTCAAATGGTCAGTAATTAACCAGGTACACGAGTCGATAATGCATT +TAGGGTGGCAAAAGACACTTGATAAAGTGTACCAGTATTATTGGTTCGCTAAAATGAACA +AGTATGTTCGAAAATTTGTTTCAAACTGCATAACTTGTAGATCAGTGAAATCATCTTCCG +GGAAGGTTCAGGCGGAACTTCATTCCATTCCGAAGACAAGTATACCGTGGCACACCATCC +ACATAGATATAACGGGGAAATTAAGTGGCAAGAGCGATTTGAAGGAGTATGTCATTGTTC +AGATCGATGCCTATACAAAGTTTGTTTATCTGTATCACACCTTAAAGATAGATGCCGAAA +GCTGTGTTAATGCTATGAAATCTTCCATATCCTTATTTGGAGTACCAGATCGCATTATCG +CCGACCAGGGCAGATGTTTTACTAGCTCTAAGTTTTCAGAGTTTTGCGTATCGCAGAAAG +TTGAACTTCACTTGATTGCTACGGGAATGAGCCGTGCAAATGGGCAAGTGGAACGGGTGA +TGGAAACACTGAAAAATTTGTTGTCAGTGGTAGAATCAAGTCAACGATCGTGGCAGGACG +CACTTGGCGAAGTCCAACTTGCACTGAATTGTACAATTTCTCGTGCCACTGATGCAAGTC +CGTTAGAAATGTTAATTGGTAAACAGGCTCGACCCCTTGGATTAGTTCCCCCATGTGAGA +CCGAATGTGAAATAGATTTGGCAACTGTTAGAGCTCATGCGACAGAAAATATGAATTCCT +TAGCGTCTTACGACAAATCCCGATTTGATAGCAGTAGAGCAGCCGTTGACAAACACCACG +TAGGTGACTATGTGCTATTGAGGAATGAAGAAAGACACCAAACTAAGTTAGATCCGAAAT +TCAGAGGACCGTTTTTGGTAACTGAAGTATTAGAGGGTGACAGGTATACACTAAAGTCGT +TGACGAGTAACCGATCGTTCAAGTATTGCCATGAATCAATCAAAATGCCGGATGCAGAAA +TCCCGAATGAGTTAAACGAGAATGTAGAGCAATAGCTGAAATATAGAAACAGTTGAATGA +AAAGAAAAGCCCGCCAATGAGTTCTTTTGTGAACGAGAGATATCCGTCTAGGTGAGACGA +TGAATTGTGAGTTATCCGTCTAGGTGAGACGATGAATTGTGAGTTATCCGTCTAGGTGAG +ACGATGAATTGTCAGTTATCCGTCAGGTGAGACGATGAATTGTGAGTTATCCGTCCAGGA +GAGACGATGAGTTTGGATTGAATTAATAATCAAGTGTGTGTGAACTGGCGGAAGATCGAT +ATATAGAAATCGATAAATGATAATGTTAAGATAAGTTGTGAGCTGATGTATTACTGATCA +ATGGAACTGAATATGAAAATAGAATAAGTTATCCCAGCAACAGTGAAATAAGAGCTGTTT +TGTTTCTTCACAGAATTAAGATTTAAGAAATACACCTGATAAAGTCAAACTAATGAAATT +AAATGTTATTGAATAGTGATGAAAGTAGGTGATCTTGATATCTTGGTATCTCGGTATCAA +AAGCTTACACGAGGACGTGAAATGTCAGAATGGCCGTGTCGTGGCGAAAATAATGAGTAT +GCGTGTAGTCGCTGTTTACTTCTTCTCCATGTTCCCTTTGCTATTATGCGTGTTCCTATT +TATGAACACGTGGCGAAAATAATGAATGCGCGTAGTCCGGTTTACTTCTTCTCCATGTTC +CCTTTGCTATTATGCGTGTTCCTATTTATTGTCAATGTGTGAGGATGAATAGATGAATTA +TCTATGAACGGGATTTTGCAAAAACGAGAGCGATAGAGCTGTTGCTGAACGTGGCCACTT +GCGCTGCTTGGTTAGAAAGGGAAAACTATATAATGAAAAGGGAATGCCAAAAATTGAGAA +GAGACAAAGCAGGCTGCACGAAACTGGAGTGAGGGCATTAATCGTGGAGAAGCCAAAGCA +GACGCAAGTGGACTCGTTGACTGCGCACAGCTGCATAAAATTATATAGTAAAAAGAGATT +TGAGCGACGCTGATATGGACGGACGGACGGACGCGAGGCCCCTGATATTCTTAACCCGAC +A +>PPI251 +CATGATGAAATAACATAAGGTGGTCCCGTCGAAAGCCGAAGCTTACCGAAGTATACACTT +AAATTCAGTGCACGTTTGCTTGTTGAGAGGAAAGGTTGTGTGCGGACGAATTTTTTTTTG +AAAACATTAACCCTTACGTGGAATAAAAAAAAATGAAATATTGCAAATTTTGCTGCAAAG +CTGTGACTGGAGTAAAATTAATTCACGTGCCGAAGTGTGCTATTAAGAGAAAATTGTGGG +AGCAGAGCCTTGGGTGCAGCCTTGGTGAAAACTCCCAAATTTGTGATACCCACTTTAATG +ATTCGCAGTGGAAGGCTGCACCTGCAAAAGGTCAGACATTTAAAAGGAGGCGACTCAACG +CAGATGCCGTACCTAGTAAAGTGATAGAGCCTGAACCAGAAAAGATAAAAGAAGGCTATA +CCAGTGGGAGTACACAAACAGAGTAAGTTTGAATAGTAAAAAAAATCATTTATGTAAACA +ATAACGTGACTGTGCGTTAGGTCCTGTTCATTGTTTAATGAAAATAAGAGCTTGAGGGAA +AAAATTCGTACTTTGGAGTACGAAATGCGTCGTTTAGAGCAGCAGCTGAGGGAGTCTCAA +CAGTTGGAGGAGTCTCTACGCAAAATCTTCACGGACACGCAGATACGGATACTGAAGAAT +GGTGGACAAAGAGCTACGTTCAATTCCGACGACATTTCTACAGCTATTTGTCTCCACACC +GCAGGCCCTCGAGCGTATAACCATCTGTACAAAAAAGGATTTCCTTTGCCCAGTCGTACG +ACTTTGTACAGATGGTTATCAGATGTGGACATAAAAAGAGGATGTTTGGATGTGGTCATA +GACCTAATGGACAGTGATGGAGTTGATGACGCCGACAAGCTTTGCGTACTCGCTTTCGAC +GAGATGAAGGTCGCTGCTGCCTTCGAGTATGACAGCTCTGCTGATATTGTTTACGAGCCA +AGCGACTATGTCCAACTGGCTATTGTTCGTGGTCTAAAAAAATCGTGGAAGCAGCCAGTT +TTTTTCGATTTTAATACCCGAATGGACCCGGATACTCTTAACAATATATTAAGGAAACTG +CATAGGAAAGGATATTTAGTAGTTGCTATTGTATCCGATTTAGGTACCGGAAACCAAAAG +CTATGGACAGAGCTCGGTATATCAGAATGTAAGTTTCGTATATTACAAAAATCAGATAAT +CCTTGAAATTCCATTTTTTAGCAAAAACCTGGTTTAGCCATCCTGCAGATGACCATTTAA +AGATTTTCGTTTTTTCGGATACGCCACATTTAATTAAGTTAGTCCGTAACCACTATGTGG +ATTCCGGATTAACAATAAATGGGAAAAAATTAACAAAAAAAACAATTCAGGAGGCACTTC +ATCTTTGCAACAAGTCCGATCTGTCTATCCTCTTTAAAATTAATGAAAATCACATTAATG +TTCGATCGCTCGCAAAACAGAAGGTTAAATTGGCTACCCAGCTGTTTTCGAATACCACCG +CTAGCTCGATCAGACGCTGCTATTCATTGGGGTATGACATTGAAAATGCCACCGAAACTG +CGGACTTCTTCAAATTGATGAATGATTGGTTCGACATTTTTAATTCTAAATTGTCCACAT +CCAATTGCATTGAGTGCTCGCAACCTTATGGCAAGCAGTTGGATATACAGAATGATATTT +TGAATCGAATGTCGGAAATTATGCGAACAGGAATTCTGGATAAACCCAAAAGGCTCCCAT +TTCAAAAAGGTATCATTGTGAATAATGCTTCGCTTGATGGCTTGTATAAATATTTGCAAG +AAAACTTCAGTATGCAATACATATTAACAAGCCGTCTCAACCAAGACATTGTGGAGCATT +TTTTTGGCAGCATGCGATCGAGAGGTGGACAATTCGACCATCCCACTCCACTGCAGTTTA +AGTATAGGTTAAGAAAATATATAATAGGTATGACAAATTTAAAAGAATGCGTAAACAAAA +ATGTAATTCCATGATTTATAATTGTTTAATGTTTAGCTATATGTTTCAGGAAAGTTTCAG +TTGAGAATGTAGGTAGTTATGTGCTGTCTATTGTGTTTTGTCTTTTATCTGTTTCTTTTC +ATTTTATTATTTAATCATTATCCTTTTGCTTATCCAGCCAGGAATACAGAAATGTTAAGA +AATTCGGGAAATATCGAAGAGGACAACTCTGAAAGCTGGCTTAATTTAGATTTCAGTTCT +AAAGAAAACGAAAATAAAAGTAAAGATGATGAGCCTGTCGATGATGAGCCTGTCGATGAG +ATGTTAAGCAATATAGATTTCACCGAAATGGATGAGTTGACGGAGGATGCGATGGAATAT +ATCGCGGGCTATGTCATTAAAAAATTGAGAATCAGTGACAAAGTAAAAGAAAATTTGACA +TTTACATACGTCGACGAGGTGTCTCACGGCGGACTTATTAAGCCGTCCGAAAAATTTCAA +GAGAAGTTAAAAGAGCTAGAATGTATTTTTTTGCATTATACAAATAATAATAATTTTGAA +ATTACAAATAATGTAAAGGAAAAATTAATATTAGCAGCGCGAAACGTCGATGTTGATAAA +CAAGTAAAATCTTTTTATTTTAAAATTAGAATATATTTTAGAATTAAGTACTTCAACAAA +AAAATTGAAATTAAAAATCAAAAACAAAAGTTAATTGGAAACTCCAAATTATTAAAAATA +AAACTTTAAAAATAATTTCGTCTAATTAATATTATGAGTTAATTCAAACCCCACGGACAT +GCTAAGGGTTAATCAACAATCATATCGCTGTCTCACTCAGACTCAATACGACACTCAGAA +TACTATTCCTTTCACTCGCACTTATTGCAAGCATACGTTAAGTGGATGTCTCTTGCCGAC +GGGACCACCTTATGTTATTTCATCATG +>DMPOGOR11 +CAGTATAATTCGCTTAGCTGCATCGATAGTTAGCTGCATCGGCAAGATATCTGCATTATT +TTTCCATTTTTTTGTGTGAATAGAAAATTTGTACGAAAATTCATACGTTTGCTGCATCGC +AGATAACAGCCTTTTTAACTTAAGTGCATCATATCAGCTGTTTTTTTTGCCAATTTCAAT +GAATATCATCAAAGTTAGCTGCGCCATCTATGAATCATTTTTGCATATCTAAAAGATGCA +AGAATGCCAACTCGTTTCAGTATCTGCGCATGTCCGTTTTTGTTTTTGCTTTGATCGTGA +TTTTTGTGTTTTTGTTTCTTATGGCACAAAGTTATTAAAATGGGTAAAACAAAGCGTGTC +GTTGGACTAACACTAAAGGAAAAGCTTCAAATAATCGAGTTAGTGACCAACAAAGTGGAC +AAAAAGGAAATTTGTGCCAAGTTCAAATGCGACAGATCCACAGTCAACCGCATTTTACAA +AAAACAAATGAAATTCATGAAGCTGTGGCCGCGTCAGGTTTAAAAAGAAAGCGTCAAAGA +AAAGGAGCGCACGACTTAGTAGAAGAAGCCTTATACATTTGGTTCGGACAGCAGGAATCA +AAGAACGTAATTCTTGACCGGCACGTCATATTAGCAAAAGCGAAAGAATTTTGCCAAAAA +TTTAACGACGCCTTTGAACCTGACGCCAGCTGGCTTTGGCGCTGGCGCAAGCGCCACAAT +ATAAAGTATGGCAAAATACACGGCGAAACTGCTACAAATGATTCCGTATCAGCAAATGAG +TACAAAAATGATATTTTGCCAGGATTGCTTAAAGGTTATAACCCAGAAGACATTTTTAAC +GCTGACGAAACTGCACTCTTTTATAAAGCAATGCCGAATGCGACATTTTTTACTTGTGGA +AAGCAATTAAATGGCCAGAAATCTCAGAGAGTGAGACTTACTTTGCTGTTTATATGCAAT +GCAACTGGGACATACAAAAAAACTTTTGTAATCGGCAGATCTAAATCGCCACGATGCTTC +AAGAATGCTAATGTGCCCATTCCGTACTATGCAAATAAGAAGGCCTGGATGACTAAGGAT +CTCTGGCGAAAAATAATGACAGGATTTGACGAAGAAATGAAAAAGCAAAATCGAAAGATT +TTACTCTTCATCGACAATGCAACTAGTCACACGACTGTCAAGGACTTCGAAAACATAAAA +TTGTGCTTCATGCCACCAAACGCAACGGCTCTACTTCAACCTCTGGACCAAGGTATTATC +CACTCATTCAAATTAGAGTATAGGCGTATTTTGGTCAAACAGCAGCTCATTGCTGTTAAT +TGTGGTAAATCTACTGTGGAATTTTTAAAATCATTATCGTTATTGGATGCTCTATATTTT +GTCAACCAAGGATGGAAGAATGTTAAAATGTTAACTATTCAGAATTGTTTTAAAAAGGTA +AGATGGGATTATTATTGATATGTATCTCAAATAACGAATTTATTATTTTCAGGCTGGATT +TAAGTTCAGTTTTGAAAATGAAGACACCATTGCTGAAAAAGACAAACAATGCGTAGAAGT +TGACATTGTATCGAATATTAATTGGAATGAATATGCCAATGTTGATGCAGATGAGGCTTG +CCATGGTCAATTAGATGATGATGAAATCGTGCGCTCTTTAGTTCAAGATGCAAAAACCAG +CGATAACGAAGAAAGCCATAGTGATGAAGATGTGGACGATACTGAGCGTCCTACTTTTAA +GGATGGGTTTGCAGCAATTAAGGCTTTAAAGTCCATTTTTATGCGAAACAATAATGATGA +GTTTTTGCAAAACTTGAATTCTATGGAAGACAAGCTGTTTAATTTACATATAAACTCAGC +TGTATTGCAAAAAAAAATTACTGACTATTTTTAAGTTAGTTTTAAAAAGTGTTTTAATCA +ATTCACCATCACTTAAATTTATATGTCGATCTTACTTATCATTAAGAATGAAATTATCAG +TTCCTTTTATGTTTAACATTGTTATAAAGAAATAAATTCTTTATTTTTCCTTAAAAAAAA +AAATTAAGTTAGCTGCATTTTTAAGTTACCTGCATCGAGGCATTGTGCAAAGTACTCGAG +GCAGCTAAGCGAATTATACTG +>DMRER1DM +CGGACGTGTTTTCGTTGCGCTCGTGGACATAGTGCGAAGAACTTTGTTTTCCGTATTTGG +AAGTATACGGAATAAATAATTTAGTGTTCCGTGGAAGTGGTGCGCAAATTTTCGCGAATT +AAAAACAAGCGGTTTGGAAGTAATTGACAATAAATTATTGGAAATTTTCCACTCCGCACG +TGTTGAGCGGCGGAGCTTGCGGGTGAGCTTTTCGAACAGCTGAGAGAAGCTTATTGGTGG +TAGTCACCGCTAAGGATTGTGTCTTGGGACAGCTTAGTGCACTCTACCAATAGGTGGAGC +TATCACCATAGCAACTAGCCCGTGTCAGCGAGCATACGATTGCTGGACTCGTCAAAAGGA +GGAGCCACCATCGGAGCAACGCCGATGGAGAGCGACAGCAGTGTGAGTGCCTTGAGCGGA +AGCAGTGCCTCAAAGGTGTCAAGACGAGGCAGGCGTAGGAGCCATCTGGCCTCCAAGAGC +TCGGCGCCAACGCAGGCGAAACTGGTTGCCCTGGCCTCGAATGGAGTGCCGGAACCCGTT +GGTGTGCTGGAGGAGGCGTTTTCGTCGCTGGAGGATGCCCGGGCGGCTACGTCAAACGCT +GCCAACGATGCTGCCCCCCCCGCTGCTGCCCCCGCTGTTGATCACACTGTTGCCCCTGAT +GTTTCCACTGCTGCTAAAATCGCTGCCACCACTGCCACCGCTGCCACCGCTGCCGCCCGT +GCTGGGCAAGCAGCCATGATGGCAGAGCTGTCGGCCACCCAGCGCATGGTGCGAAACAGT +TTCCGCAGCCTAGGAGGCGTAGACACGGAAGAGCTCTCGTGTGCCATCAGCCGCTATGAT +GAGCTGGTGATGGCATTAATGCTCCGGTGTGGAGAACTGGAGACGCGGCTCGCTATGCCA +CCACCGCCGCCGCCGCCGTCCAAGGCGAACACTACTGCCGCCAATGCTCCCCAGATGCCT +CAGGTTGCACCCATCGCTGCCCCGCGGACAACCAAGGTTCGTGAGACGTGGTCAGCGGTG +GTGAAGTGCGACGACCCTGCGCTATCGGGGAAAGCCATAGCCGAAAAGGTGCGGACGATG +GTTGCACCCTCCCTCGGAGTCAGAGTACACGAGGTACGTGAGCTGCCGTCGAGGTGGTGG +TGCGATCATTCGTACTCTTCGGTTGGAGAGCTGCAGAAGGTGATGGCATCGAAAAGATTC +GCAGAACTTGGACTGAATGTGGCACGGAACGCGGCCGAGAAGCCGAAGGTCATAGTCTAT +GACGTCGACACAGCCATCGGCCCAGAAGAGTTCATGCAGGAGCTTCACGAGAACAACTTC +GACAGTGAAATGACTCTGGCCCAGTTCAAAAAGTCGGTGCACCTGGTGACCAAGGCGTGG +TCGGCTACTGACGGTGCCACCGTAAACGTGACGCTAGAGGTAGACGACCGGGCGATGGCG +AAACTTGATGTAGGACGTGTCTACATTAAGTGGTTTTCGTTCCGATGCCGATCGCAAGTC +CGCACCTATGCCTGCCACAGATGTGTGGGTTTCGACCACAAGGTTAGTGAATGCAGGCAG +AAGGAGAGTGTTTGCCGCCAGTGCGGGCAACAAGGCCACACCGCGGCAAAGTGCCAAAAC +CCGGTGGACTGCCGGAACTGCCGTCACAGAGGGCAACCTTCGGGGCATTATATGCTCTCG +AATGCTTGCCCGATATACGGAGCGTTGTTAGCGAGGGTGCAAGCTAGACACTAATGTTTA +GCTTCATCCAAGCGAACTGTGGCCGAGGCAGAGCTGCGACCATCGAGCTCGGAGTCCGAC +TCAGGAGATCGGAGTCAATGTTTGCTCTGGTGCAGGAGCCGTATCTTGGCGGGGATGAAA +TGGATGTGCTGCCTGAAGGAATGAGGGTTTTCACCGACCGGCGAGGGAAGGCAGCCATCC +TAGTGGATCATCAGGAAGCCATCTGCATGCCAGTGGAAACTCTCACCACAGATTATGGCG +TATGTCTGGTCGTTAAAGGGAGTTTTGGCTCAATCTTCCTTTGCGCCGCATACTGCCAGT +TCGATGCACCTCTGGAACCGTACCTCCGGTACATGGATGCGGTCCTGCTGCAGGCCAGCA +GAACCCCCGCAATCCTGGGCCTCGACGCGAATGCAGTGTCCCCCATGTGGCTTAGCAAAC +TCTCTCGTCATGCCGAGGGGCAAGCTAACTACAGACGGGGTGAGCTGCTGTCTGAGTGGA +TGCTGGAGGCAAGAGTCGCCGCCCTAAACCAGTCAACAGAGGTGTACACGTTCGATAATC +ACAGAGCGACTAGTGATATCGACGTGACAATCGTCAATGAAGCAGCATCTATGTGGGCCA +CATATGAGTGGAGAGTGGACGAGTGGGAATTGAGTGACCACAACATCATTACTGTTGTGG +CCGAACCAACTACCGCGCGCTCAGTTGAGAGCATAGCTCCTGTGCCGTCCTGGAACTTCT +CCAATGCACGTTGGCGATTGTTCAAGGAGGAAATGGTGAGTAGAATAGCCGAACTTCCGG +AAAACTTTTCAGAGTCGCCGTTGGACCAGCAAGTTTCGACCCTGCGCAGTATAGTACATA +GTGTATGTGATACTGCGCTAGGAAGGAAGTTGACTCGATCGCCCAGCAGGAGAGCACGTT +GGTGGACTGCCGACCTCTGCGCTGCAAGGCGCGAAGTCCGAAGACTTCGTCGCCTGCTCC +AAGATGGAAGGCGTCGAGATGACGATGCCGCTGTAGAGCTTGTAGTGGTCGAGCTGAGGC +GTGCCTCAGCCTACTACAAGAAGCTCATTGGAAGGGCGAAGATGGATGACTGGAAACGCT +TCGTGGGAGATCATGCCGACGACCCATGGGGGCGCGTCTACAAGATTTGCCGAGGTCGCA +GGAAGTGCACGGAGATTGGGTGCCTCCGCGTGAATGGCGAGCTGATCACTGATTGGGGTG +ACTGCGCACGAGTGCTCCTCCGCAATTTTTTCCCAGTTGCGGAGTCCGAAGCACCGACTG +CCATCGCGGAGGAAGTCCCACCGGCCCTCGAAGTATTCGAGGTTGATACATGTGTTGCCC +GGCTGAAGAGCAGGCGCTCTCCCGGGTTGGACGGCATCAATGGCACTATCTGCAAGGCAG +TCTGGCGCGCCATACCCGAGCACCTAGCATCATTGTTTTCCCGATGCATCCGATTGGGAT +ACTTTCCAGCCGAGTGGAAGTGCCCACGAGTTGTCTCGTTGCTCAAAGGGCCAGATAAGG +ACAAGTGTGAGCCCTCCTCATACAGAGGAATATGCTTGCTACCAGTCTTTGGAAAGGTGC +TCGAGGCCATCATGGTGAATCGTGTGAGAGAAGTTCTTCCGGAAGGCTGCAGATGGCAAT +TCGGATTTCGCCAAGGACGATGTGTGGAGGATGCTTGGAGGCACGTGAAGAGCAGTGTTG +GCGCCAGCGCGGCGCAATACGTGCTCGGCACATTCGTGGACTTCAAAGGAGCATTCGACA +ACGTCGAATGGAGTGCTGCACTCAGCCGACTAGCCGACTTGGGATGCCGGGAAATGGGCT +TGTGGCAGAGCTTTTTCTCCGGCCGAAGAGCAGTGATCCGAAGCAGTTCCGGTACTGTGG +AGGTACCGGTAACTAGAGGCTGCCCGCAGGGATCAATCAGCGGCCCATTTATCTGGGACA +TACTGATGGATGTACTGCTTCAGCGTCTCCAGCCGTATTGCCAGCTGAGTGCATACGCGG +ATGACTTGCTGCTTCTCGTCGAGGGAAATTCCCGAGCTGTGCTAGAGGAAAAAGGAGCGC +AACTAATGTCCATCGTAGAAACGTGGGGAGCGGAAGTTGGCGATTGCCTCTCGACCAGCA +AGACGGTAATCATGCTGCTGAAAGGTGCCTTGAGACGTGCGCCTACGGTGAGGTTTGCTG +GACGGAACCTTCCGTATGTGCGTAGCTGTCGGTACCTTGGCATCACGGTCAGTGAAGGAA +TGAAATTCCTCACGCACATAGCTTCGCTTCGCCAGCGGATGACAGGAGTCGTTGGAGCAT +TGGCGCGTGTGCTTCGAGCCGACTGGGGCTTCAGTCCTCGAGCCAGGCGGACCATATATG +ACGGACTCATGGCACCTTGTGTGCTGTTTGGTGCCCCGGTATGGTATGACACCGCGGAAC +AAGTAGCTGCCCAGAGGCGACTAGCCTCCTGCCAGAGGCTAATCCTGCTTGGATGCCTTT +CGGTATGCCGAACAGTATCCACAGTGGCACTGCAGGTACTTGGTGGAGCTCCCCCGCTTG +ATCTGGCTGCTAAGTTATTAGCGATCAAATACAAGCTAAAACGTGGATTCCCGCTGGAGG +AGAACGACTGGCTTTACGGCGAGGACATTGCGTGTCTTAGCTGGGAGCAGAGGAAGACTC +GCCTAGAGGAGTGTTTAATCCAGAGTTGGCAGAACAGATGGGACGATGACAGCGAACCAG +GACGGGTGACGCATAGGTTTATCCCATACGTCACTCTTGCCTATCGGGATCCAAGTTTTG +GATTCTCGATGAGGACGTCTTTCCTGCTTACAGGGCACGGGTCGTTCAATGCATTTTTGC +ACGGGAGAGCCCTCAGCGATACCACTGCTTGCGCATGTGGAGATCCATATGAGGACTGGA +TGCATATCTTGTGCGCTTGCCCCCTATATGCAGATCTGCGGGACCTAGATGGACTTGGAG +TGCAGCGCCTTGGCGAAAACTGGATCTTCGAGGGAATCCTGGATGATCAAGAGAAGACTC +AACGGCTGGCAATGTTTGCGGAAGAAGTGTTCCTGAGGAGGAGGGCCCTTTAGCTCAACA +TCTCTGCCGTGTGGTTAGCGGGCGAGAATACTACCACAGTCCGCTGTTGCTTGTCGTAAG +AGACGACTAATACAGCGATAGGATTCCTCTAACCCTGCTTGTCGGAGCAAAAGGGGGAGG +CCCACCGAGCCTCTTTTCGGTACCACGGGTTGAGCAGCTATCCAAGACTGCTCATTGAGG +TAGGCCCCCTGGTGGGAGTATCGTGGTGGCTGTGGTTGGTACCCATATCGCGGGTAGAGC +CTTCATGCTCGACGTTTGAGTTACGGTGCTAGTTGCGCAAAACTCGGGTGCTGTGACCCA +GAGATCAGTAGAGATTTTAGGTAGATCTCGCTCCTCAGCAAGGGGGAGTGCTTGCCCGGC +AAGCAAGTACTCGAATTGCTACCGGGGTGGTCGCTATGTACATAGCTATAGCTTCTAGTC +CGGGACGCTTGTCTGGCGTATCCAGACACATGCACCATATGCTCACTTGTGGGCGTATAG +GGTGCCGTGGTTGTAATCCCTTCAGTGTGGAACACGCCACGTAAAATAAGTTCGGAGGGA +TCCGAAAAGCATACAT +>DMRER2DM +TTGGGGATCATGGGGTATTTGAGAGCAGAGGGGGAGTATTCTTCTGTAATTCGTAAGTCA +TATCATATGATGTGCGGAAGGGGAATTTTACTCTGTAACTCACAAGTCTCTCCTTTACTC +AAGTCGACTCAAAACCTCCTCGTGGTGGTCCCGGTAATGCTAAACTCGTTTAGCAGCTAA +TTTGAGCGGAAAAACTTTTCCGATGGGCTGGTTCCCCAGAGGAAATTTATTCATATTGGA +ACTACAAGCACAAATAACGAGCCTCGGATACCTTTACACAATCTGATGACGACCCGACCC +TCCGTGGATATCTTCCCGGAGGACCAATATGAACCAAACGCAGCGGCTACTCTATCTAGG +GTTCCCTGCACAGTATGTGGCCGGTCCTTTAACAGCAAGAGAGGACTCGGTGTTCACATG +CGATCTCGGCACCCAGACGAACTTGATGAAGAACGTCGACGTGTCGATATAAAGGCAAGA +TGGAGTGATGAAGAGAAGTGGATGATGGCGAGAAAGGAGGTTGAGCTCACAGCAAATGGA +TGTAAACACATAAACAAGCAACTAGCGGTGTATTTTGCAAACCGCAGCGTCGAAGCCATC +AAAAAGCTAAGACAGAGGGGCGATTATAAGGAGAAAATAGAGCAGATAAGAGGGCAATCA +GCTCTCGCCCCGGAAGTTGCTAATCTAACCATAAGGCGCCGCCCTAGTAGAAGTGAGCAA +GACCACCAAGTAACAACATCGGAAACAACTCCAATCACTCCCTTCGAACAGTCGAACAGG +GAAATTTTGCGGACACTACGCGGGTATAGCCCCGTAGAATGCCATTCCAAATGGAGAGCC +CAAGAGTTGCAAACTATCATTGATAGGGCACATCTCGAGGGAAAGGAAACCACTCTCCAA +TGCTTATCGCTATATCTCCTGGGAATTTTTCCGGCACAGGGTGTACGACACACACTGACG +AGACCTCCTCGGAGACCTCGGAACAGGAGAGAAAGCAGAAGGCAGCAGTACGCTGTCGTC +CAGCGTAACTGGGATAAGCATAAAGGAAGATGCATCAAGTCCTTGCTAAATGGAACTGAT +GAGTCGGTAATGCCAAGCCAAGAAATAATGGTTCCCTACTGGAGAGAAGTAATGACTCAG +CCTAGCCCAAGCTCTTGCAGTGGAGAAGTGATACAAATGGATCACTCGCTTGAGAGGGTA +TGGTCTGCTATTACAGAGCAGGACCTTCGGGCGTCAAGAGTCTCATTATCCTCGTCTCCG +GGGCCTGACGGGATAACTCCAAAATCTGCCAGGGAGGTGCCGTCAGGTATTATGCTGCGC +ATAATGAACCTAATTCTATGGTGCGGTAATCTACCACACTCCATACGACTGGCCAGAACC +GTCTTCATCCCGAAGACGGTGACGGCGAAGCGACCGCAAGACTTTCGTCCAATATCAGTG +CCTTCAGTCCTGGTAAGACAGCTAAATGCAATATTGGCAACCCGGTTGAACTCATCAATC +AATTGGGACCCGCGCCAGCGGGGCTTCTTACCAACCGACGGATGCGCCGATAATGCGACG +ATAGTCGACTTAGTCTTGAGGCATAGCCATAAGCACTTTAGATCTTGCTACATCGCAAAT +TTAGATGTAAGCAAGGCATTTGATTCTCTATCACATGCATCTATATACGACACCTTACGT +GCTTATGGTGCGCCAAAGGGCTTCGTTGACTACGTACAGAACACGTACGAGGGCGGTGGT +ACCAGTCTCAATGGGGACGGTTGGAGTTCAGAGGAATTCGTCCCTGCTAGAGGAGTGAAG +CAGGGTGACCCTTTGTCTCCTATTCTATTTAACTTGGTAATGGACAGGTTACTTAGAACC +TTACCCAGCGAAATTGGTGCCAAAGTCGGAAATGCCATTACTAACGCGGCCGCGTTTGCA +GATGATTTGGTACTATTTGCGGAAACTCGGATGGGGCTTCAAGTATTGTTGGACAAGACG +TTGGATTTTCTATCTATCGTCGGCCTCAAACTTAATGCCGACAAATGTTTTACCGTTGGC +ATTAAGGGCCAGCCGAAACAGAAGTGTACCGTGTTAGAGGCACAGAGCTTCTACGTAGGC +TCGAGTGAGATTCCATCACTGAAGCGCACGGACGAGTGGAAGTACTTAGGCATCAACTTC +ACTGCAACCGGGAGGGTTCGATGCAATCCGGCCGAGGACATTGGTCCAAAGCTACAAAGA +TTGACAAAGGCCCCCCTCAAACCACAACAGAGGTTGTTCGCCCTTCGGACTGTCCTTATC +CCACAGCTCTACCACAAGTTAGCCCTTGGGAGTGTGGCGATAGGCGTCCTAAGAAAAACT +GATAAACTTATAAGATATTATGTGCGAAGATGGCTAAATCTTCCGCTGGATGTGCCGATA +GCATTTGTTCATGCACCCCCAAAAAGTGGAGGTCTCGGAATTCCATCACTAAGATGGGTA +GCTCCAATGTTAAGGCTAAGACGCTTGAGTAACATTAAATGGCCTCACCTCACGCAAAAC +GAGGTAGCCAGCTCTTTCCTCGAAGCCGAAAAACAACGGGCCCGAGATAGATTATTAGCT +GAACAAAATGAACTGTTATCGCGTCCGGCAATAGAAAAATATTGGGCGAACAAGTTGTAC +CTCTCAGTTGATGGTAGCGGACTCCGTGAAGGCGGCCATTATGGCCCGCAACACGGGTGG +GTTAGTCAACCCACGCGTTTATTAACAGGAAAGGAATATATGGACGGTATTCGTCTGCGG +ATAAATGCCCTACCCACAAAGTCTCGTACTACAAGGGGAAGGCACGAATTGGAACGACAG +TGTCGTGCAGGATGTGATGCTCCCGAAACAACAAACCACATAATGCAAAAATGCTACCGC +TCGCATGGGAGGCGGGTAGCTAGACACAACTGCGTAGTAAATCGAATCAAGCGGGGACTT +GAGGAGAGAGGCTGCGTGGTCATTGTTGAACCAAGTCTGCAGTGCGAATCCGGCCTTAAT +AAACCAGACCTGGTGGCACTACGACAAAATCACATTGATGTGATCGACACACAAATTGTG +ACAGACGGACACTCTATGGATGATGCGCACCAGCGCAAAATCAATAGATACGACAGACCG +GACATACGAACTGAATTGCGTCGCAGATTCGAAGCCGCAGGTGACATTGAATTCCATTCT +GCCACCCTGAACTGGAGGGGGATCTGGAGTGGTCAATCCGTTAAAAGATTGATAGCAAAG +GGTCTCCTCAGCAAATATGATAGTCATATCATTAGCGTCCAGGTTATGAGAGGCAGTCTC +GGTTGTTTTAAACAGTTCATGTACCTGAGCGGGTTTTCCCGAGATTGGACTTAGCTAAAT +CGTTTGGTTCAAAACATTTGCTTGCTGTCTTGGCATAACATCAATAAAGGCATAAACATC +GCAAAATAATGGTTATAATTAAATGGCTATGAGGATGGTTTTAGTACGTAGGCGTTGCGG +AACTTCGGTTCATATAGAGCAATGAATCGTGCATGCTAGGAAAACTGACCACACACAGTG +TTGGCAGACCTAGTATCTTTCGAAGATTTCCATACCTCCGCGATCAAAAAAAAAAAAAAA +AAAAAAA +>DM33463 +CAGTTTGTCAAGAAACTGTTTACACACCGCAAAATAAGTAGAATTTTTGACTTTAAAGGC +CAAAATTAAGGGTTTTTTGCTTAATTAAACGCAATTTTTTTATGAAATATAATTAAACAA +TATTTATTTTACTTATAAATTAAAAAACAAATTCAATATATCAAATATACAAGAAAATAA +ACAACAAATTTCTTGTTTACACACTTTTGAGAGTGCCAAGAAACTCTTTACACAGTTTTG +GGTTCCTACTTTGTTTTGCTCTTTTTCTTAGAAACAATCTCATTTTTCCGTTATTTTTGT +CTTATGCATTCCTTTTTACAACGCTTCTATTGCAATTTTTTCACTTTGCTTGTGAAATTT +TGTTGATCTAACGTGCTTAAAGCGAATTATTAAATTTAATGAAATGCCTGGAAAGAGATT +GGCTTTTGAAGTGACCCAGCTAATATACTATAACCACCAGTTGGGAAAATCTATTCCTGA +ATTAGTAGAAATATTTTCCGTATCCCGTAAAACCGTCTATAATATTTTAAATCGTNNNNA +AAAAGAGGGCAGGCTTGAACCTAAGAGTGGTGGTGGGTGTAAAACGAAAATTAACAAGCG +AGTAGACCGCCTTATTATGCGAAAAGCGATTGCGAACCCCCGAATCTCGGTCAGATCACT +TGCTCAGGATATCAGGGAAGAATGTCACCTAACTGTATCACACGAAACTGTGCGCCAAGT +CATCCTACGCCATAGGTACTCTTCAAGAGTTGCAAGAAAAAAGCCTTTGCTATCAGAGAT +CAATATTGAAAAGCGTCATTCATTCGCTGTGAGCATGATGGATCATGCGGAAGAGTACTG +GGATGACGTCATATTTTGTGACGAAACAAAAATGATGCTCTTTTATAACGATGGGCCAAG +CAGAGTATGGCGCAAACCGTTGAGTGCGCTAGAAACACAAAATATAATTCCAACAATCAA +ATTTGGAAAATTGTCAGTGATGATTTGGGGCTGTATTTCCAGCCATGGAGTGGGCAAACT +AGCCTTTATTGAAAGCACTATGAATGCCGTGCAATATCTAGATATTTTAAAAACAAATTT +GAAGGCCAGTGCAGAAAAATTTGGTTTGTTTAGCAACAACAAGCCAAATTTTAAGTTTTA +TCAGGACAATGATCCCAAACATAAAGAGTACAATGTACGCAACTGGCTACTCTATAACTG +TGGCAAGGTGATCGATACGCCCCCTCAGAGTCCTGATCTAAACCCCATTGAAAATTTGTG +GGCCTACTTAAAGAAGAAGGTTGCAAAAAGGGGCCCCAAAACTCGACAACAACTCATGGC +TGCGATAATCGAAGAGTGGGAAAAGATCCCGCTTGAATATGACCTAAAAAAACTCATACA +TTCCATGAAAAAAAGGCTTCAACTTGTAGCCAAAGCCAATGGGGGTCATACTAAATACTA +AAACTTTTCAAATATTATCAAAATAATTAAAAAATTTAGGATTAAACTTAGGTTTAGTGT +TTTGTGTAAAGAGTTTCTTGACACTCTCAAAAGTGTGTAAACTTGAAATTTGTTGTTTAT +TTTCTTGTATATTTGATATATTGAATTTGTTTTTTAATTTATAAGTAAAATAAATATTGT +TTAATTATATTTCATAAAAAAATTGCGTTTAATTAAGCGAAAAACCCTTAATTTTGACCT +TTAAAGTCAAAAATTCTACTTATTTTACGGTGTGTAAACAGTTTCTTGACAAACTG +>SPRINGER +AGTTAACTAAGTTAACCGGACTGATCGTCCGCACACCAGCACCGGTCAAACTGCTGACCA +AGCATTTGGCCGGAAGCTCATGCATAGCCGGCAGAAGCTCTGCGCATTGGCAGAGGCCGC +TATGATGTTTTTCCCTTTGTTAGCTTATAGTCAGTTTGATTTTGTATTCAATAAAGAGCG +CATCGCGCCTTCAATCAACTCCAGCTACTGCTGTTATCATTGAATTGGTTGGCTAGCCTT +AAGGGCAGTCAACAACGGAGAGACGTTCTCCCACCATATCTCCCAATCTAGGAGAAGAGG +TCTGCGGCAACCGCCCTGCCTCCCAGTGACAGAAGAACCCCCCGTTACCTGCAACCTACG +CCGGAGACCGCGGCGAGGGACCTGCACCTTATATTTAATTAATTGGCACCCAACTCCAGG +AACCCACACCACTACCCTGAATCATGTAAGTGGGATTCTCAACTTAAACACTACTCCAAA +CTGCGTCTAGAATTTTAAAATATTTGGGATGTTTGTGCGAGTTACATAAATAAATTAAGA +AAATCGGCATTTCCACTACAATAAACGTTTATATGTGTTGCGAATTAAGATTATGTTACT +GTTATGAAGTTTAAATATCGAATTTTGATTTGTGGTTGACTTTGCAATCCATATTGTGTG +CATTTCATTCCGCCTTCGCACATCCGCGGGACACTGTCGTTTCATTCGAAATTTAATTCG +CTACATTGGCTTCACAGCCCTTTCAAGCTTTGTTGTTTTTGACCCACTCCACTTCGCTAC +CCGATACTGGCGCATGCATTGCTGTGACAATTTTGTGCCTTTTATTTATCTCTTTGTCTT +TGCTGTGGCAATTTTTGTCTTTGGATATTTGTTTGCCTTATTGGAGACCCGCTCCCCGCA +GGCCCTTCACCTTATCGTTACTTAGCTGGACAGTGGCTCTGCTCGTTGAGTCTTCGTCCA +ATGCCTTCAAAGCGGCGACTCAGCCCCCGCGACCCCCTTGCCGTACTGTTTGGCCCCACG +GGCACAACGGCCTGAGTATTCACATACATAGCTACCCATGAGCGAGTCATTCCGACAATA +TAGGAATTCTAAAAAGTGCGCTAGCGACTCAGAGTCCGAAAGCGACGATTCGACAGAAAA +CTCTGTACGTAAAAACACCCCAACTAACGCATTCACTGCATATAAAATGTCCCTCGAAAC +GGAACAAATTAAAGCTCTCATAAGGGCATTACAAGAGCAAGCCTTAGAGAGTCAACGCAG +GGAGGCTGACTTGCGTAAAACAATTCAAGATCTGGCCGGCCAGGTCGCGGCCATACAGAT +TGCCCCTGCCCGGGCAGAAGCTCCCCCAATCAAAGTTTACAGACCAGTAGAAATCACCGG +ACTGGTCCCTTGTGGGGAAACATTGGATGCCGTTAAATGTCTTCCAGACTTTATGGGGAC +ACAGGAGACATACGTCTCCTGGCGGCAAGCGGCAAATGCCGCTTACCATATGTTCAGGAA +ATATGAGGATAGTTCGCGGCACTATCAAGCTGTGGTCATCATCAGGAGCAAAGTTAAAGG +CCCTGCTGATGCAGTTCTGTCGTCCTTTGGGACTATACTGAATTTCGATGCGATCATAAG +TCGCCTCGATTTCACGTATAGTGACAAACGCCCGATACACGTTATCGAGCAGGAGCTAGG +CACCCTCAGACAGGGAAGCCTGACGCTCCTCCAGTATTATGATGAGGTCGAGAAAAAACT +CACCTTACTCACCAATAAGGCGACTATGTCTTATGAAGCGTCGGCAGCAACGGTGCTGTG +TGAGAAGTTCCGAGATGATGCTTTGAGAGTTTTTGTCTCGGGGCTCAGGCGCAACCTCAC +AGACGTGCTATTCGCGGCAAAGCCTAAGGACATGCCGTCAGCGCTCGCCCTGGCGCAAGA +AGTAGAGTCCAATCATGAGCGGTACACTTTTGCAACTTCATTTGCACGAAGCCAAGAGGA +TAGGGACCACAAGCAATATCCCAAAGTGCAGGAGCGCCAACGGGCCCCCCCACAAGCCGG +CTCGCAGGGAAGTGCTGGGAAGAACCCGCACTTTACTAAGCAGCATAGAGCACAGGTGCA +CTCCGCTCCACGTAGCGACCGAATGGCCCGAGAAAACATGCCAGAACCCATGGACGTTGA +CCCGTCGTTGTCCAGGATGCAGCCATCTCACGCCCCGGCTTACCCGAAATCGAAGCCGGC +CGCGTCTGGCCGTTCGGTCCCACCAAAAAGGCAAAGGGTCAACCATGTTGCCCAGGCCTC +TGATGATTTGGACAAGGTTTATAACACCGCAGCCTCCAGTGCAGCAGTTAAAGTCGACGA +CGATTCCATCCTAGAGTACGACTCGGATACCATTAATTTTTTAGGGGAAAGTCCCTGCTA +CCCGTCATCAGACGAAGAGTAGCGGGGATCGACATGAAACTACTGATTGATACGGGCGCG +GCAAAAAATTTTATCCGACCATTTAAGGGGTTGAAAGGCGTCCGCCCGGTGCAGTCCCCA +TTTACAATCCATTCGATTCATGGTGTGACTACAATAACTAAGAAATGTTTCGTGTCCATT +TTTAATCTTAAAGCTACCTTTTTTTTATTACCAGACTTGACCTCCTTTGACGCGATCGTT +GGCCTAGACCTGTTAAAACAGGCCGGCGCGTCACTTTGCCTAGCTTCCGGCAAGCTCAAA +TGGGGCTCCGGAGCAGAGCAAATTGACTTTCATACTTGCCCCGATGTCAATTTCACCAAA +GTAGATTGCTCGGACGCACCGCCCTTAATTAAGGATGCTTTTTTAAAAATGCTCGGGAAT +AGGAAAAAAGCTTTTGCTGATCCTAATGAGGCTCTTCCTTACAATACGTCGGTGGTAGCC +ACCATCCGGACGGTTGATGAGGAGCCCATTTATGCCAAGTTATACCCATATCCCATGGGA +GCAGCTGACTTCGTCAACGGCGAAATTCAGGAACTGCTTAAAAATGGCATAATCCAAAAG +TCAAAGTCCCCCTACAATAACCCAATATGGGTCGTAGACAAAAAGGGCACTGACGATGCG +GGCAATAAAAAAATGCGCTTGGTGCTGGACTTTCGAAAACTTAACGAAAGGACGGTACCA +GACAGATACCCCATGCCAAATATCTCTATGATATTGGGGAATCTCGGCAAGGCCAAATAC +TTCACGACCCTCGATCTGAAGTCTGGCTACCACCAAATCACGCTCGCAGAACGCGACCGT +GAAAAGACAGCGTTCGCAGTAAACGGAGGGAAGTATGAGTTCCGAAGGCTGCCATTCGGA +CTCAGGAATGCTGCAAGCATCTTCCAAAGAACAATTGACGATATTCTGCGAGAGCAGATC +GGAAAGTTCTGCTACGTTTACGTCGATGACGTCATCATCTTTTCGGAAGATGAAAACGAC +CATGTCAAGCATGTAGATTGGGTTCTGAAGAGCCTGTACGACGCTAACATGAGAATATCG +GCAGAAAAGTCACGTTTTTTTAAGAAAAGCGTGAGCTTCCTGGGGTTCATCGTCACCAAC +AATGGGGCGGCGACTGACCCAGAAAAGGTTAAGGCCATAAAGGAATTTCCGGAACCCAAA +AACGTATTTGAGGTAAGGTCATTCTTGGGCTTAGCCAGCTATTATCGTTGCTTTATCAAA +GACTTCGCATCAATAGCTAGGCCCATTTCAGACATATTGAAGGGCGAGAACGGTAGTGTT +AGCCGACACAGGTCCAGGAGTATCCAGGTAGAATTTTCCGAAGCGCAACAACGTGCCTTC +GAAAAGCTACGCAATATCCTGGCGTCTGAGGACGTCATCCTGAGATACCCTGATTACAAA +AAAGCGTTTGATCTAACGACAGACGCTTCGGCCTACGGCATTGGCGCAGTGCTGTCCCAG +GAGGGACGTCCCATTACAATGATCTCAAGGACATTGTCTGACAGAGAGGTTAACTATGCT +ACCAACGAAAGGGAGCTGTTAGCCATAGTCTGGGCACTGGCTAAGTTGCGGCACTACCTG +TATGCGGTTAAAGAGATAAACATCTTTACCGATCACCAACCTCTGACGTTCGCGGTATCG +GAGTCCAATCCGAACGCCAAAATTAAGAGATGGAAAGCACGCATCGACGAGTCCGGCGCA +CGAATTTTTTACAAGCCTGGGAGAAACAACCTCGTTGCAGATGCCCTCTCGAGACAACAA +CTCAACGTTGTTGAAGAGCAAGAACCGGAGTCGTGCGCGGCCACGATTCACAGCGAACTT +TCGCTTACGCACACGATCGAGTCCACGGACAAACCCGTGAATTGCTTCCAGAACCAGATA +ATTTTGGAAGAGGCGCGCTCCCATTGGAAACGCACTTTTATATTATTTGGGAATAAGAGG +CGGCACTCGATCAATTTCTCGTGCAAACAAGCTTTGCTGGAGGAACTCGCCAACATCATT +ATCCCTAATGGTGTAAACGCCTTCCACTGTGATCTTCACACGCTGGCGCTAATCCAGGAC +GACGTAGTTCGACAGTTTCCAGCCACGAAATTCTGGCATTGTAAGAATAGGGTCACCGAC +ATCTTCGCGATGCAGGAGAGAAAAGAAATCCTCACCGTCGAGCACAACAGAGCTCACAGG +TCGGCCCAAGAAAACGTGAAACAAGTACTCTCCGAGTACTACTTCCCGAAAATGACCAAA +TTGGCGAGCGAAATAGCAGCCAATTGCAAAACTTGCGCAAAGGCGAAGTATGACAGACAT +CCGAAGAAGCAGGAGCTCGGTGAGACACCAGTCCCGACCCACGTAGGAGAAATATTGCAC +ATCGATATTTTCTCAACGGATAAAAAATACTTTCTCACCTGTGTTGACAAGTTTTCTAAA +TTCGCCATGGTACAGCCGATTCTGTCTAGAACCATAGAAGATTTGAAAGCACCCCTTTTA +CAACTTATGAATGTTTTCCCCAAAGCCAAAACCATCTACTGCGACAATGAACCATCATTG +AAATCGCAGACAATAGTGGCTATGCTGGAAAACCATTTTGGCGTCAGCATTTCGAATGCA +CCGCCCCTACATAGCGTCTCAAACGGACAGGTGGAACGATTCCACAGCACGTTAATTGAG +CTCGCCAGATGCCTAAAAATCGACAAAGGCATAAGTGACACAGTGGAATTGGTCTTGCTG +GCCACAGCCAGATATAACATGTCCATCCACTCCGTCATCAATAAAAAACCGGCCGAAGTC +ATGCGGGCAGATCCGGACGATCCACATACCGATGTCCAAGAAAAAATCAAAAACGCCCAG +ATTTTGACAAGAAAACGAGAGAACGCTTCTCGGCAGAACAGAGTGTTCCAGGTCGGCGAC +AAAGTCCTAGTAAAGTCAAACAGACGATTAGGCAACAAACTTACTCCTTTATGTGAGGAG +AAGACCATCGAGGCAGACTTGGGGACCACAGTCCTTATTAAAGGGAGGGTGGTCCATAAA +GACAACCTCAAGTGACCCAAGCAGAGCCTAGCCGCGGCTCCCTCGGAGGCACACTTTTAT +TCCTCCAATTTGTAGCCACTCGGCATAAGTTTTTTCATTGTTTTTATAGCCGCTTGGCAT +AAGTTTTTTATTTTTTAGCCACTTGGCATATTTTTTATATATTTTCGCTATTATTGGTGG +TGGGCAACTCCATTCCGAACAAGTAATAATTTATCACACACGTTACAGGTCGCTCCCAAC +CCTTCTTCTTTGTTTCCTGGCCACGACATCGGCCCACATTACTGACTATTCCCGAGCGAA +TTACATTCCCGTCATTGACGGTAAAGTCTTAGTCTGGGAGGAATTCGCCTATGTCAGACA +CTCGGCTAACCTCTCCGAGTATAGGCGGGTAATTGACGAAACCGACAGCATGCTCGATAT +GTTCCCCCAGTCCCATATGAAGAAGCTCCTGAGCGTTGATATCGCTCACCTCCGTGACAT +GCTTGATTCTTTGAGCATCCATCACAGAGTGGCAAGGAGCCTAGACTTCTTGGGAACTGC +GTTAAAGGTTGTCGCAGGGACACCTGACGCGGAAGACTTCGAGAAAGTCAAGTTCACTGA +AGCGCGGCTTGTTGATGCACACAATAGCCAAATCGAAATAAACACCAAAACACAAGTTCG +AATTAACGAACTCACTGATACCATAAATAAACTTTTAAAAATTTCCAAAAGCGCTCAGAT +TGATACAGGTCACCTGTATGAAACGCTTTCTACTCGCAACAGAATCATTGTAATGGAATT +GCAAAACTTAATGCTCACTATAACCCTCGCTAAAATTAACGTAGTGAGTCCAAACTTCTT +GGACCACGCAGATCTGGAGAGTATTTGGGGCGAGGAGCCCACCAACACCCCCATAAGGGA +GATTTTGTCCGTTGCGTCTGTAAAAGTCCTACAATCCCTTAACATCTTACACTTTATTAT +TAAATTCCCCAAGATTATCATGGCGTGCAACAAAGTCACTATCCTTCCAGTGGTACACCA +CGATACGGTGTTAAGGTTGAAAGATAATGTGGTAGCAGAGTGCAACAGAGAAATACGCAC +AGTAAAGAATTGCTCCATAACACCAGGGGCAACATTTTGCCAGTTATCTTCAGTGAGCTC +GTGTGCGCAGGAGCTCCACGCTGGGGTCGTAGCACATTGCGACGCACAGCAGAGTGATCT +ACATCCGATCACCTACGTCGACGAAGGAATAATCGTCATCAATGACAGACCAGCACTCGT +GCGTGTGGACAATGGAACGGCCATCCACATTAGAGGCACGCACCTCATAACATTCATTGA +GAGTGCCATGGTCAACGAGACCGTCTTCTTTAATCATGACATGGTCCAGAATAGGGCGCC +GGGAGTGGCTAATTCCCCAGTCCTTAATATCTCGATGAAACACGAGGTCCTGAGCCTCCC +ATACCTTCACCGTTTAAGTGAAAAGAACTTGGAGCAAATCAGGAACTTCGAGAAGGACGT +CGACGGATACCGACTAAGTCAGATAGCGTTAGTTGCGGGAGCAATTTTCTGCGCTCTTAT +CTGCATCGGTTTAACCTGGCAGCGAACCACTAGGGCCAAGAAATCTACAGCCCAACTGAA +GGAAGTTCTCGCCCAAATAGGGTCAGCCGAGGGCGGCCTTAATCTTGAGGAGGGAATAGT +TAACTAAGTTAACCGGACTGATCGTCCGCACACCAGCACCGGTCAAACTGCTGACCAAGC +ATTTGGCCGGAAGCTCATGCATAGCCGGCAGAAGCTCTGCGCATTGGCAGAGGCCGCTAT +GATGTTTTTCCCTTTGTTAGCTTATAGTCAGTTTGATTTTGTATTCAATAAAGAGCGCAT +CGCGCCTTCAATCAACTCCAGCTACTGCTGTTATCATTGAATTGGTTGGCTAGCCTTAAG +GGCAGTCAACAACGGAGAGACGTTCTCCCACCATATCTCCCAATCTAGGAGAAGAGGTCT +GCGGCAACCGCCCTGCCTCCCAGTGACAGAAGAACCCCCCGTTACCTGCAACCTACGCCG +GAGACCGCGGCGAGGGACCTGCACCTTATATTTAATTAATTTAACT +>TARTC +AAGCTTCGCGGGATATCGATAACAATCAGGTGGTTAAAAATACTATAACATCGAGTACCA +GCCGTGTTTTTCCTGTCGATTTATCGAAGTCCAACAGCCCGCCTTCGCTCCGAACACAAA +TCGGCAAGTCAGTAGCTTTTTTAACCCGGCAGTGGCGCCTGTGCAGCAGCTATTTAAAGT +GAAAAACACGAAACGCAACAACAAAATGGACGGCCATAATGGAGACATAAATGAAGGATG +GGCAACAGTACTATCTATCTCGTCGGATGATAGTAACCAACTTTCGTCGCCGCCGTCAAT +TATAGTCTCATCGCTGGACACCACGCCAACGTCAAACGAAACCACCATAGTAAGAAGAAG +CCTACACAACCCAAAAGCTGACATGAAATCTTACAGATTTGAAAATATTGTATTAAATGA +AAATAAAAATACCATATTGCCAGATCCTTTATTTGTTGATAAATGCGGAAATACTGCTAA +TACCACAGAAGCCAATGAAAAAAAGCCTGCCAATAGCCCCTTCCCCATTTCCATTATCAA +GAATCTTAGCACTTCCTCGCCACTAACACATGTAGACACGCCTACACAAGAAGATGACGC +CAGTGCATTCAATACATTGAAAGCAGCCAAAACAGCTAGAATAATTTTTCCCACACACAC +ACAGATAAAGCCCGCCAAACCCTCGCCCCCTTCCAAAGAATTAAGCACAAACTCAGCACC +CAAAACTCTTAGCTACACAGACAAAATTACAGTAACACAGAAAAATCTACCCGACAAAAC +ACATGTAGACAGACCTACACAAGATGACGACATTAATGCAACCAAAGCATCAAAAACCGC +CAAAATAATTTCTACACAGTTACACCTACGTGAAACCAAGCCAACACAGCCCGCCAAAGA +CCCCTCACCCCGCACCCAAAAGCCTATTGCAAACAAAGCAGCCGAGACACTCACCCACAC +AGACAAACTCATAGCATCACAAAACCTAGTTCCCGCCAAAACACATATAAACTCCCCCAC +ACAATATAACGACACTAATGCAACCAATGCATTAAAAACCGCTAAAATAAATTTCTCTTC +ACACTCACACCAAAGTGAAATCAAGCCAACACAGTCCGCCAAAAACATTTCACCCCTCAC +ACAAAAGCAATTCACAAGCGAATCAGCCGGGACACACACCCATACAGACAAACACAAAAA +CACAGCATCACAAAATCTCTTTTCCGCCAAAACACACATTAACTCACCCACACAACATAA +CGACACTAGTGCAGCCACAGCATCAAAAACCGCTAAATTAATTCTCTCCCCACACTCACA +CCTAAGTGAAACCAAGCCCACACAGCCCGCTTTAAGCCCCTCGCCCCTCTCCCAGAAGCA +AATAACAAGCATAGCAGCCAAGACACTCACCCACACAAACAAACACACAGCATCACAAAA +CTTTATTCCCGCCAAAACACATATAAACATACCCACACAATATAACGACACCAATGCAAC +CAAAGCATTAAAAACCGCAAAAGCAGCTTCTCCCTCCCACACATACTCACGTCAGACAAA +ACCAATAAAGCCCGCCATAAACGCATTGCATGCCGCCCAAGACACAAACCCAAGCCCAGC +AATCAGTGCTGTCACTTACACAGACAAACCCACAGCTACTCAGAATATTTTTCCTGTCAA +AACTTTTGCAGAGCTGATTAGAGAAAATGCAAAACGCTCACCAACTCCAATCGAAAATCC +CCCTCAAGCAAAACATGACTCTGCCGCCCTCGGACGCCCTCCGACTGCAGCTAGAAAAAA +TCTAAATAAAACACTGATTTCTCCTAAAACTCCTGGGAAGCGCCGTGGGGACTGTCTTGA +TGAAGGCCTACTTCAAACCTCTAACAAAAAGGTTAGAATACGCGACGACTTCTCTGATGA +TGATCTGGGGGTCACAAACCTACTCTCTGAAACACCCTTATTCAAAAGCAAAGCAGCTAT +TAAGATTCGGCAAGACTCGAGAAGAGAATCCCTGCAGAAGTCAGCTGAAATGGACACAGC +TCCAGCAATAAGTCCCTCAAACGCAGCAGCCGATCCCGACCTACCGCCCTGGAAAACTGT +TCCAGCTAGCAGAAAACCACCATCAATCTTCCTGTCCAATATACAGCAGATTATCCCGCT +AATAGAAAAACTAAACTATAAAGCCGGGGTAAATAGCTTTACTACCAAGTCTGAACTTGG +CAACAATATTAGAATCCAGGCTAAAACGATGGACGCCTACAATGCAATTCAGAATGTCCT +CCTTGAAGCAAACATTCCCCTACACTCTCACCAGCCAAAGAGTGCAAAGGGCTTCCAAAT +TGTAATTAGGCACCTCCACCAGTCAACCCCGACCAAATGGATTGAAAGCCAACTTCAAGA +CATCGGTATAGCTACAAAATTTATCAGGGCAATGCAGTTTAGGGACACGAGAAATCCTAT +GCGCATCCATGAGGTTGAGGTTGTACCCAAGGCTGACGGCAGCCATCTTAAGGTCCTGCT +AATAAAATCCCTTGGAGGACAAACGGTCAAGGTCGAAAGGAAACGGGTATCGAAGGATCC +TACACAATGCCACCGCTGCCAATGCTTTGGACACACAAAAAATTATTGCAGAAACCCGTT +TAAATGTATGAAATGTGGCCAGCTGCACGCCTCGGTCTCATGCACCAAACCCAAAAACCT +TCCGGCTACTTGTGCAAACTGCAATGGAAGCCACGTTAGCAGCTATAAAGGATGTCCTGT +TTTCCAAGAAGCAAAGCAAAGACTATCTATCAACAAAATTCAATCCCTTCACTCACAACC +CACCCACCTTCAGACCCCCCGCAATAAACATCCCTACCCAAAACCCACCCACATTCAGAC +GCCCCTCAATAAGCAGCCCTACACACACCCCCTCCCTCGCACATTAGTAAACAACACAAA +ACTACCTGCCAAAAGAATCCAAGGAAAGAAGATATCGCAAAGGAATCTATCTATAAATAA +ACGCTTAAACAGAATCAGGACATTGGACAGAAAACCGAGGAATGAGACAAGCCCGCCGAC +AACTAGCAAAAAGGTCTTGGCCTCTCTAGAAGAAAGCAGAAAAAACCCAAATAGCGCCCT +AAACCCGGCCAACACCCATCTCACTCATTTCCGCCCACCACCATTAGCACAAAATATTCC +TAATGACGAATCTAAGGAGCTGAGTGGGGAGCAATACCTTTTAAATCGCATTGAAGGGAT +GGAAAAGAAGCTCAACAACCTTCTTGAAATCGTCACCCGCCTACTAAGCCAAGGAAAAGA +CTGTCCAAAGTCTCCAAAAAATCCTTTCCGAGATCCAATCTTCGTTTAAATGCTCTTTCT +AGTAACATCAGAAGTGACGTTTCCTATGACTCGGGAGTGCAACAGGGACATCCTTAAAAT +CGCTTTCTGGAATGCTGGTGGGATCAACAATAAAATAGATGAGCTTAAGCTGTTCATTCT +AAATATTGATGCCCACATAATCATAGTCACCGAAACTAGACTAGACAACAATTCTACCAA +ACTAGAGCTGCCAGGATATTTCACATACTTAGCCCAAAATCCTGCCTCTAGCAAGAGAGG +AGGAGTCGCCACGATAGTAAACAGTAGTCTCCGCCACATGGCCTTAGAACCGATTGAAAA +GGAATGCATACAGAGTGCCCCAATAGTATTACTGCCTGAAAACAACAGACGCAGCGAAAT +GATTGTAATAGCATCTGTCTACTGTCCGCCTTCGCTAAGCTGGTCGCCCCACCATTTTAC +TGACGTTCTCAATTTTGCTGAGAAAACTATGGGAGGGCAGACTAAGCTCATTCTATGTGG +CGACTGGAACGCAAAACATAGACAATGGGGTTGTATACGCGCCTGCCAACGTGGCGCCGC +ACTCTACGATGCAATTCAAGCAGACTCCATGGCTGAAATCGTCGCGACTGGCAGCGCTAC +ACATTTCCCGCACGATACAAGGAAAAGCCCGTCAGCAATAGACTTCTCGATATGTAAACG +GCTTGGCAGGTATGAAAAAAGAATCTCCTCAAGTGCACACCTATCCTCAGACCATCTTCC +CATATTACTTGAGATAAACCTAGATATAAAAACCATCTCCCTGCAAAAACAAAACAACAA +TATCCTCAAGAAAACAACGAACATTGAGCTCTTTAAGAACGTTCTAGAAAGGAAGATACT +TCTAAACACTGAGATAAGGGTAGCAGAAGACATAAATGACGCCATAAACATCTTTATTAA +AAACATCAAGGACTCGGCTGCTGAATCAACTCCCTCCCCAAGAATTCCTGATAACCACAG +AAGAAGATATGGGCAAGCTAACAGAAATAGTCATACGCTCACACTAGACGAAAACACAAG +CAGATTGCTGGAAGAAAAACGTATACAAAGTAGAATTTTTAAAGCTACTAGAACGAACGA +GGACAAAACTAAACTAAAAGCAGCTGAAAATCGACTTAAAAAAGTAATCAAAATCTTAAG +AGAAAAGAGAATCAATGAGCAAATTGAAGGAATTGACACAAATAACCCGGACAGAATGAG +GAAAATTTGGAGGCTGCTGAGTGAAGGGAAAAAAATGAATCAACCCAACTTTCCCCTCAA +ATTAGAAACCAAAAAAGGCCCTAAATGGACTAAAACAATTAAGGAGACAACAGAAGCGTT +TGTCTCCCACCTGGAAGGAAGATTCAAGCCAAATAAAATTGTACCTGATTACCACATAGA +TAAGGTTAACACCGGACTAAGAATAATTAAGGAAAGCATGCTAACAGAACGACATAATCT +AAACAAAAACCCCCATAACCAACCCATTACGCTAAACGAATTAAATGAAGAAATAAAAAA +CTTAAAGAATAGCAAAGCACCTGGTAAAGACCTTATAACAAACCAGCTCATAAAAACCCT +ACCGACTAAAGCTACCCTGTACCTTATCCTAATCTATAACTCCATACTTAGATTAGGATA +CTACCCTGAAGCCTGGAAACATGCACAGGTAAAAATGATCCTGAAGCCAGGGAAAAGCTC +AAACGAGCCGAAGTCATACAGGCCGATTAGTCTACTCTCGGGACTCTCTAAAATGTTTGA +AAGACTACTCCTAAAAAGACTTTTTAGGGTAGATCTATTCAAAAAAGCCATACCACTGCA +CCAATTTGGCTTCAGAAAAGAGCACGGAACTGAGCAGCAAATAGCCAGGGTCACCCAGTT +CATCCTCGAGGCCTTCGAGCGGAAGGAATACTGCTCAGCGGTTTTCCTTGACATCTCTGA +GGCCTTTGATAGGGTATGGCACGAAGGCCTTTTACTTAAATTAGCTAAGATCCTACCTTA +CAACCTATACATTATACTGGAGAGCTACCTTACAAATAGAACGTTCGAAGTTAAAGACCA +AGCAGGAGAGACTTCGAGAACAGGACAAATAGGCGCAGGAGTGCCTCAAGGAAGCAATCT +CGGACCACTACTTTACTCTATCTTCTCCTCTGACATGCCCCTCCCATATATCTACCGCCC +TTCACCAACACAAAGAATTATGCTCTCAACATACGCAGACGACACTATAGTCCTCAGCTC +AGACACACTAGCAACTGCCGCCACAAGAAACAACGAAAACTACCTCAAGACATTTTCGGA +CTGGGCGGACAAATGGGGTATCTCAGTAAACGCTGCTAAAACCGGACATGTCATTTTTAC +ATTAAAAAACGACTTACCTACAAACTCAATGAATGTGAAGATCAAGGGTCAAACAATAAA +GAAGGAAAGCAAGCAATCATACCTTGGGGTAACCCTTGATAGCAAGCTAACCCTTAGCTC +TCACGTCACAAAGCTATTGGGTAAATACTCTACAGCCTACAGAAAATTGACATGGATCCT +AAACGGAAGAAGTAAACTCCCTACTAAAACTAAGATACTGATCCTTAAATCAGTTTTATC +ACCAATATGGCAGTATGCCATAGCAGCTTGGGGTCCCCTTGTGACAGATGCACAGATAAG +GAGGGTCCAGGTTGAGGAAAACAGAAAAATAAGAGACATATGTAGAGCGGGAAGATATAC +GAGAAACCAAACTATAAGGGACCTTTTTGGCGTCAAAACAGTAGAAGAATTCTATCAACA +GGCTATGCACAGGTTCTCAGAAACTATAAAATCGCACCCAAATATAGCTGTTCGCAGGAT +TCTCTCTAGGCACTATATCCCGAACAGACTAGAAAGAAGCAGGCAGAGGTACTTTAAAAT +GACAAATGATCATATCACGCAAAAGCAGACTGGACTTGCCCTCTCACCTAAACTCTTAAA +AATCCCTGATATAGATGACTGCAGAACCGTAAAAAAGCGTAGCGAGAGAGAGAAAATAAG +ACAAATGCATCTAACTGAACTCCCCACCTTGCTGAGACTAGAGGAAGAGGAGGAAGAGCT +CAAAAGAATAAAAAAACAGGAAGAAAGGGAAAAAAGAGAAAGGGAAAACCAAAAGTGGCC +TCCAGATAGATGGTGCGAATTGGAAATAAACCGATATAATAAACAATATAGAAAGGGCGA +CCTAACCAGGCAGGAAGTTATAGAAAAATTCAGAGGGCAACCATTAAATGTACAACGAAT +AATCCTACCCGACTATGAAGGGGACTAAAATTAAATCAAAACAAACCAGGACAGGAGCAG +AAGGCAGAAATAATCAAAACTGGCGGAAGGGGTGGCAAAATATTGAAAAGAGAGGAAAGA +AATATAAAAAGGCTAAAGGCTAAGTTACAGGTTACATAAAAAGGGAAATCTGCTTATAGA +TATTATGGTAAAATTAACTTAACTAAACACCTACTGGTTAACAAAATAATTATGCCTGCA +TGGCACAAGCTGCGTACTCAAATCATTTCTCCTGACGCTATTGAAAATCCATCTTTACTT +TCCAACCGAGGGACTTGCGACTGCGGTCTTTCCGCCTTATTGGCTCCTTATGGATCCATC +TGCTGCCGTATTGGGCGACACACCAGCGCTCCAACCTAAAAGAGAGATAACATGTTTTAA +TTCACTTTCCTTTTCTTATAACTAAATCACAACAACAGCAACAGCGCATCGGGCGACTGA +CAAAAGCATTAGCTCACCAAGTCAGCAACAACAGCAGCAGCAAGACCAGAATCAGTTGAG +GAGGAGGCCTGGTGGTGTGCTGAACATTTCGCCGCCCACACCCACCATTTCTGTAGGCCT +GTATGACCCTGAGCCCAACGCCGGCATGGCAAATCCGGTCTTCCTGAGGAGGCGGGGCTC +TAGTGTTAGGCGCGCTTTTGCCCCAAAAGCAACAACGACAGCGGCAGTAGGGTCGGCGCC +CCCTGCGTGACCGAGTCCATCTTAGCAATCGGTCCTTTTGGCGGTGTTATGCCGACGCGG +CGGTCGCGCTTATGAGGACTGCCTGCAATGCTTGGCCATGAGACGGCGTCATCGACAACA +TTTCAATCACGCTCAGCTGGTTGACCGGGGGCAACATGCTTGCCATGCAGCAACAATGGT +GCATGCAGTCCAGCATGCAGCAACAACAACAATATTGGCAGCAGCAGACTAATGTTTCGC +AGCAGATTCCATCTGGCAACTTCCGACGACCAGACTCCTCGCTTGGCCCCTGGAGACTCG +CTCTGGAAAAAAAAAGAAAGAAGCATGGATTAGTTTTTTTTTTTCCCTTTAGCTATTGGA +TTAAATTTCTTTCCTGGACAACCGGCGCCTTCATGCAGATGACGCTGGACTGCGGCGATT +CTTTCCCTCCAGCCACAGATGGGAAGCTCACATCATGGCATATATGCGGCATCGTGCTAA +TCAGCTCCCCATGCTGAGCGAGATCTTGATGCGGCGATGCACTCACTAGCGAGCAGCGGG +AACAGCATACAGCGTCAGCAACAGCAGGAAGAGACTTTGTAGCAGAAGCCTTTCGGCATT +CTCCGACGACCCGACTCCTCGATCGGGGTCAGGCAAATTCTCCTGGACCGACAAATTTTC +CCGGCGTTTCGTCCTGGAATAAGGAAGGAAGCACGGATTAATTTCTCCCCTTCAGCTTAC +GACCCTTCTCACCAACAGCAGCAACTACAACAACATCGGCAGCAGACGACTTGCAGCTGC +TTGGCTCACCTAATGCGACAGCAATAATCCCGGCAAGGCCAGAAACGGCACCGAGCAGAA +GCACGACAGGGTGAAGAACAACATGCCGCCCACGTCCACCAATCCGGAAGCCCTGCATTA +GGGGTCTGAAGCGCCATTAACTGGAGGATCCGGCAGCGTATGCCTACGCAGAAGCGGGGC +GTCGTAAATCCGGTGGCCGGAATAGCGCCTTGAACAGCATGCTGTGTATGTTTGCCCCAA +AAGCAGAAACTGCCGCAGCAAAGGAACCGCAAGCAGGATCATCACTCGTGGCAAACTGGC +GTATTCCTGTTGAAGACGCGGGACTGCGGCGCATTCTTCCTTTCCAACCGGGGGCTTTAG +CGCTGCGGTATTTCTGCTTTCACGGCTCCATTTGCTGCTGCATCTGACGCCTCATCAGCG +CTCCTCCCTGAAAGAAAGAGAATATGTATTAGTTTTCTTTCCATTCCTTACAATCTCTCT +CACCAAACCTCCACGACACAACAACAGCAGCAGAAACAGGTCTAGCCCACAATGGCAGCA +GCTACAGCAATCAGCAGAAGCAAGGCCGGCAAAAGCAACAACAAAAGCCCTCTCTGAAAG +CCCGGATGTGGAGACTGAAGCGCCGGAAACTTGAGGATCCGCCCCCGATGCACGCCCACC +AACAATAAGCTGGAGGAGAAGTTACTGAAGCATGGGAAGCAGCACCAGGGGTCGCATACG +CAGCGTCAGGGCTTTGCGAACCAGATGAATGAGGAGAGACTGGAACAGCATAACATCAGC +GGCAGCAACAACAGCGCCACGAGGGTCAGCGGCGTCTGCATGGCTGTGTCCAAAACAACT +CCAATTCAACTGCTGTATGATGCAGCGCACCAGCGGCTTTCACAGGGACCGTCTGAAACG +CTTGGCAGGAGCCGGCTGAAGGCCTGGGCGAAGACACTGGAGACACCAATGCGGCTCCTT +TCGGCCGACGGCAACAGGCTTGCCATGCAATAAGAACAGTAAATCCTGAAATAACAGCAG +AAGATACAGACGTCCAAATTGCGAACACTGACGCCAGCCCTCACCTGAACGACTCACTGT +GCAGCAGCAGCAACATCAGCACCGATGCCCTCAGCATCGGCAGCAGAGGGTGTTTTTGGC +CTTTGACAATTCCCTGCGACTTGACTTCTTCTTGGCATCTGGTCAATCATCACGTGCCAG +CAAACAGTGGCTTGTCACCCTGGAAGAAAGAAGACTGGATTAGCTTCTCCCCTTCTAATA +CATTTTGTGTGTTGAAATGCATCAGGCGGCGACACACTCACCAGCAACAGCAGCAACAAC +ACCAGCGGCACCGGTAGCAGGAAATGGATCCTCAGCAAAAACCATCGGCACTTTCAGACG +TCCCGTACTCCTCGCCTGGCCCTGGCCGGTAACAGGGGCTTGTTAGATGGAGAAGACGAC +GGTCATCCGACGGACAGCAGCCTGAAGATGGAAGCAGGCCTACGCTGCCCACCTCTCCGA +TGCCTGCAGCAGCAACGGCAGCGGCTCATAAATGCAAACTGGCGCCAGCCCTCGGCTCTT +CGGGCTCATGTAGGCGGTGACACACTCACTAGCAGCTAAAACAGCAACGGCGGAATTAGT +AGAAGCAATGTTTTGCCGCAGCTGCCAGATGGCATACTCCTAGCTTGGCCCCTGCCCAAA +CCGTATTGGACCGGCAAATGATTCGACAATCCGATCTGGAAAAAATAAGTATTGATTAAT +TTTTCCCCCACAGATTGGTATAAAATTGCATTTACGGCCAACCGGCTTCTTCCTGTTGAT +GACGTCACGCTGCGCCGCATGCTTTTCGCCAGCCACAGTTGGAATGCATGCATTGGGGTT +GACGGTCCGGATGGGCCGTTGCCTGTTATATGCTGGCATCTCCGCAGCGGCGTTGTGAGC +AACGACACTGAAAGCAACAATAATATTGTTAATTACTGCTCAAAACTATAACACATTTAA +TCACTTACACAATTTACACACGCTTCCTGCCTAGGAGTTGTGGGACCAGCTACCGATAAT +GCCAACAATACCGGGAAACGCGTCGCGGGACATCGATAACAATTTGGCGGTTAAAATGCT +AGAACATCGAGTACCAGACATGTTTTTCCTGCCGATATATCGAAGCCCAATAGCCGCCAA +CGCTCAAAACATAAATCGGAGTGTGAGACCAGATACTGAAGCCGTTAAAAGCTTTTACCG +GCATCGGTAGCTGGTCTCACACTCCGATTTAAATTTGGAGCGTTGGCGGGCTGTTTGACG +CGAAGCTTCGCGGGATATCGATAACAATCAGGTGGTTAAAAATACTATAACATCGAGTAC +CAGCCGTGTTTTTCCTGTCGATTTATCGAAGTCCAACAGCCCGCCTTCGCTCCGAACACA +AATCGGCAAGTCAGTAGCTTTTTTAACCCGGCAGTGGCGCCTGTGCAGCAGCTATTTAAA +GTGAAAAACACGAAACGCAACAACAAAATGGACGGCCATAATGGAGACATAAATGAAGGA +TGGGCAACAGTACTATCTATCTCGTCGGATGATAGTAACCAACTTTCGTCGCCGCCGTCA +ATTATAGTCTCATCGCTGGACACCACGCCAACGCCTGTCTAATGCAAATCAACTTACATA +TTACTCTAAAATCTACTTATAACTGTCCCCTCTAATGATAAGCAATTTTTATGTTTACTT +TAAACTTAAACCGATACCTTAAACTATGGCGCGCAAAATGACTACCAAGAAATCTAAAAC +TGTAAATTGTTGCAAACTATTTCTCCTAGTAATGTTAAATTTAAATGCGCGCATAACCGC +AGCCAAGTTAACCAAAAATGTCACTCGTAAATGTAATTCCTAAATTAACACTTGTAACTA +AGCGCGTATAAATACCGCAAATCCAAAAATGTAAATATGCCATAAATTGTTACTATATAT +TTTTAAAAAAGAAAAATCAGAGTACAATAAAAATGCCAGCGTCTATTAGGCGTTGAAAAT +TTAAAAAAAAAAAAAAAAAAAAAA +>AY561850 +CACGCTTTTTGGCCCCTGGCCGATCTTCATATATCTCAAATCGACGGCTGCTTTTACCCT +GGAAAAAAAAAAAGGAGCTTGGGTTATATTGAACTACACTAGGCGGCGACACACTCACCA +GCAGCAGCCAGAACAACAACAGCGGCAGAAGTAGCAGGAAATTATCTCACTGCAAAATCC +AATTGGCACTTTCCGAAGTCCGTATTTCTCGCCTGGCCCCTGGCCAGTAACAGGGGCCTG +TGCGACGGAGATGACGACGATGATCTGCCCTGTGGACGGCCTCAAGAAGGAATCGGCCCT +GTACTGCCCACCTGACCTGTGCCAGGATAGCAGCAATGTCAGCGGACCATGGATGGAAGA +GGCGGCACTGGCGACGGTCCTCAGTTTTGCGGTTTCCGCGGGGCGTAGGCGCAGTAATCG +GCGGCAGCAACAGTGGCGGCAGCAGAAGGGAATGTGTATCTGCAGTCGCCGAATGGCAAT +TTCCTGCCCAGCTGTAATGGACCGCCAAATGTTTTTTGGCATGTCGACCTGTAAGAAAGA +AGCAAGGATAAGTTTTTTCTTTACAAGATTGTATATGAATTTGTATTTACGGACAACTGG +CTTGTTTCCTGTCGACGATAAATGGCGCTTCATGTTTTCACTCTGCCAAAATCTGAGTGC +AAGCATCGGGGCTGACGGGCCGAATTTGCTGATGCCTTGTACATGCTAGCATCTTTATGC +CGCCGTGTAATTTTGCGACAGCAAAACACATGATGGAGAAGACGAAGGTGATCGATGGCG +CCCGGATGACGGATGCAGGCCCGTGCTACCCACTGGTCCGTTGCCAGGACAGCAGCGTTT +CAATTATGCGAACAGAGGCACTGGAGCCACTTCTCAGGCGATAGGGATCATGAGGCGACG +ACAACTCGCCAGCAGCAGTAACAACAACAGCGGCAGCAGCGATCTCGGACTTGCTGAACA +TTGCGGCTTTTTCCCAGCCTGGACCGTCATCACAAACGCTCTCAAAGATCGGTGCGCCTG +CAGCCTACGGAAGCGTACAACTGCCCAAAGTCGTGCTATTGCATAATGTTAGGTGTCCTG +GCTGCTCCGGCGGATGAGCTCCACCCGATTGAGAGAGGTAAGAAGGCCCAGCAAGTCGCC +CTTAAATAAAAGAAACAAGCATTAGACTCGGCTGAAATTGTAACATCAGTCAGACTGTAC +TCACGCATGCACTTAGACAAACCGAAGCCTATTCTATTGACGACGCGGACTCCAACACAT +GTTTTCCTCCACAAAAGGCTGTGAGTGCACCAAAGTTGACGGGCCACGCCGGCCGATGCT +TGCTGCATACCGGCATCTCCGCAGCAGCGACGTTACAAGCACCACTAAAATTAGAAAGAG +GCTTACTATAGGCAAAGCGCAGAAAAACAAATATTACAATAAGAAATAGCACGCGATTTT +TCTGCTTCGTTTCCGCTTGGTACAAGTGAGACCATTCTCCCTATATGCCATTCTAGTATA +TTTGCCCGATAAGCGATATGCTGGCGGCAAAAAAAAAAGATAATAGCCGATAAGCCCGCC +AAAAAAAAAGCGCGAAATATCGATAACGAGCTGGCACGAAAATTGCTGGCATATCGATCA +ACCGCTGTGTCTTTGAGCTATCGAAAAAGCCCGCCTACGCGCCTAGCCCAAATTTGCAAG +TCAGTTGAGATTATAAAACCGACAGAGGCGCGCGCGCAACAGTAGCTAAAAGTGAAGCCA +GCAGCAACAACAACAACTAATGGACGGCCAGAACGTGAACCAAAGCGGAGGATGGGCATC +GGTTTTATCCATCTCATCGGACGATGGTAACTGCTCATCCTCGCCGCCATCAGCTATAGT +CTCATCGCTGGATACCACGCCAACGTCAAATGAAACCACCATAGTAAGAAGAAGCCTATA +TCAAACAAATGCCGACATGAAATCTTACGATTTTGAAAATATTGTATTAAATGAAAATAA +AAATACCATATTGCCAGACCCTTTATTTGTTGATAAATGCGGGAGTACTGCTAATACCAC +AGAAGCCAATGAAAAACAGCCTGCCGATAGCCCCTTCCCCATTTCCATAAGCAAAAATTT +TAGCACTTCCTCGCCACTAACACATGTAGACACGCCTACACAAGAAGATGACGCCAGTGC +ATTTAATACATTGAAAGCAGCCAAAACAGCTAGAATAATTTTTCCCACACACACACAGAT +AGAGCCCGCCAAACCCTCGCCCCCCTCCAAAGAATTAAGCTCAAACTCAGCACCCAAAAC +TCTTAGCTACACAGACAAAATTACAGCAACACAGAAAAATTTCCCCACTAAAACACATGT +AGACACACCTACACAAGACGATGACACTAATGCAACCAAAGCATCAAAAACCGCCCAAAT +AGATTCATCACACTCACAACTACATGAAACCAAGCCAACACAGCCCGCCAAAAACCCTTC +ACCCCTCACCCAAAAGCTAACCACAAACAAAACAGCCAAGACACACACACACACAGACAA +ACCGACAGCGTCACAAAATCTTTTTCCCACCAAAACACATATAAACTCACCCACACAATA +TAACGACACTAATGCAAGCACAGCATCAAAAGACGGTAAAATAAACCTCTCTTCACACTC +ACACTTACGTGAAACCAAGCCAACACAGCCCGCCAAAAACCCCTCACCCCTCTCCCAGAA +GCAAATAACAAGCATAGCAGCCAATACACTCACCCACACAAACAAACACACAGCATCACA +AAACTTTATTCCCGCCAAAACACATATAAACATACCCACACAATATAACGACACCAATGC +AACCAAAGCATTAAAAACCGCAAAACCAGCTTCTCCCTCCCACACATACTCACGCCAGAC +AAAACCAATAAAGCCCGCCATAAACGCATTGCATCCCGCCCAAGACACAAACCCAAGTCC +AGCAATCAGTGCTGTCACTTACACAGACAAACCCACAGCTACTCAGAATATTTTTCCTGC +CAAAACTTTTGCAGAGCTGGTGAGAGAAAATGCTAAACGCTCACAAACTGCAATGCAAAA +TCCCCCTCATGCAAAACATGACTCTGCCGCCCTCGGACGCTTACCGAGTGCAGCTAGAAA +AAACCTAACTAAAACACTGAGTTCTCCTAAAACTCCTGGGAAGCGCCGCGGGGACTGTTT +GGATGAGGGCTTACTTCAAACCTCTAACAAAAAGGTTAGAATACGCGACGACTTCTCTGA +TGATGATCTGGGGGTCACAAATCTACTCTCCGAAACACCCATATTCAAAAGCAAAGTAGC +TATTAAAATTCGGCAAGACTCAAGAAGAGAATCCCTGCAGAAGTCAGTTGAAATGGACAC +AGCACCAGCAATTAGTCCCTCAAACACAGCAGCTGAGCCCGACCTACCGCCCTGGAAAAC +TGTTCCAGCTAGCAGAAAACCACCATCAATCTTCTTGTCCAATATTCAGCAGATTATCCC +GCTAATAGAAAAACTAAACTATAAAGCCGGGGTAAATAGCTTTACTACCAAATCTGAACT +TGGCAACAATATTAGAATCCAGGCTAAAACGATGGATGCCTATAAAGCAATTCAGAATGT +CCTCCTTGGGGCAAACATTCCCCTACACTCTCACCAGCCAAAGAGCGCAAAGGGCTTCCA +AATTGTAATTAGGCACCTCCACCAGTCAACCCCGACCAAATGGATTGAAAGCCAACTTCA +AGACATCGGTATAGCTACAAAATTCATCAGGGCAATGCAGTTTAGGGACACGAGAAATCC +TATGCGCATTCATGAGGTTGAGGTTGTACCCAAGGCTGACGGCAGCCATCTCAAGGTCCT +GCTACTAAAATCCCTTGGAGGTCAAACGGTCAAGGTTGAAAGGAAACGGGTATCGAAGGA +TCCCACACAATGTCATCGCTGCCAATGTTTTGGGCATACAAAAAATTATTGTAGAAACCC +GTTTAAATGTATGAAATGTGGCCAGCTGCACGCCACGGTTTCTTGCACTAAACCCAAAAA +CCTTCCGGCTACTTGTGCAAACTGCAATGGAAGCCACGTAAGCAGCTATAAAGGATGTCC +TGCTTTCCAAGAAGCAAAGCAAAGACTATCTATCAACAAAATTCAATCCCTACACTCACA +ACCCACGCACCTTCAGACCCCCCGCAATAAACATCCCTACCCAAAACCCACCCACTTTCA +GACGCCCCGCAATAAGCAGTCCTACACACACCCCCCTCCTCGAACAACAGTAAACAACAC +AAAATTACCTGCCAAAAGAATCCAAGGAAAAAAGTTATCGCAAAGGAACATATCTATAAA +TAAACGCTTAAATAGAATTAGGGCTTTTGACAAGAAACCGAGAAAGGAGACAAGCCCGCC +GACAACTAGCAAAAAGGTACTGGCCTCCCTAGAAGAAAGCAGCAAAAACCCAAACAGCGT +CCTAAACCCAGCCAACACCCATCTCACTCATTTCTGTCCACCCCCAATAACACAAGATAT +CCCTAATGACGAACCCACGGAGCCGAGTCAGGAGCAATACCTTCTAAATCGTATTGAAGG +GATGGAAAAGAAGCTCAACAATCTCCTGGAAATCGTCACCCGCCTACTAAACCAAGGAAG +AGAGTGTCCAAAATCTCCAAAAAATCCTTTCCGAGATCCAATCCTCATTTAAACGCTCTT +GCTAGTAGCATCAGAAAGTGACGTATCTTATGACTCGGGCGTGCAACAGGGATATCCTTA +AAATTGCTTTCTGGAACGCTGGTGGGATCAATAATAAAATAGACGAGCTCAAACTGTTCA +TTCTAAATATTGATGCCCACATAGTCATAGTCACTGAAACCAGACTTGACAACAAATCGA +CCAAACTAGAACTTCCAGGATATTTCACATACTTAGCCCAAAATCCTGTTTCTAGCAAGA +GAGGAGGAGTCGCCACTATAGTAAACAGCAGTATCCGACACATGGCCTTAGAACCGATTG +AAAAAGAATGCATACAGAGCGCCCCAATAGTCTTGCTGCCTGAAAACAACAGACGCAGCG +AAATGATAGTAATAGCATCTGTCTACTGTCCGCCTTCGCTAAGCTGGTCGCCCCACCACT +TTACTGACGTTCTCAATTTTGCCGAGAAAACTCTGGGAGGGCAGACAAAGTTCATTCTAT +GTGGCGACTGGAATGCAAAACACAGGCAATGGGGTTGTACCCGCGCCTGTCAACGCGGCA +CCGCACTCTACGAAGCAGTTCAAGCAGATCCCATGGCTGAGATTATTGCTACCGGCTGTG +CGACACATTTCCCGCACGACACACGGAAAAACCCGTCAGCAATAGATTTCTCCATATGCA +AAGGACTGGGCAGGCTCGAAAAGAGAATTTCCTCAAGTGCGGACTTATCTTCAGACCACC +TTCCCATCCTGCTTGAGATCAACTTAGATACAAGCACCCTCTTTCTGCAAAAGCAAAACA +ATAACATCCTCAAGAAAACTACGAACATTGAGCTCTTTAAGACTGTTCTTGAAAGAAAGA +TACTTCTTAATACGGAGATAAGAGTAGCAGAAGACATAAATGACGCCATAAATATCTTTA +TCAAAAACATCAAGGACTCGGCTGATGAATCAACTCCCTCCCCAAGAATCCCTGACAACC +TCAGAAGAATGCATGGACAAGCTAACAGAAATAGTCACACCCTCACACTAGACGAAAACA +CAAGCAGATTGTTGGAAGAAAAACGGATACTAAGTAGAATTTTTAAAGCTACTAGAACGG +ACGAGGACAAAGCTAAACTAAAAGCAGCTGAAAATCGACTAAAAAAAGCGGTAAAGATCT +TGAGAGAAAAGAGAATTAATAAACAAATTGAAGGAATAGACACGAAAAACCCGGACAGAA +TGAGGAAAATGTGGAGACTGCTAGATGAAGGAAAAAAGACAAACCAACCGAACTTTCCCC +TCAAACTGGAAACCAAAAGAGGCCCCAAATGGACAAAAACGATAAAGGAGACAACAGAAG +CATTTGTTTCCCACTTAGAAGGAAGATTTAAGCCAAATAACAACGTACCTGATTACCACA +TAAATACAGTTAACTCTGGACTAAGAACAATTAAAGAAAGCATGTTAACAGAAAGATATG +ATGTAAACAAGAATCCCTGTAACCAACCTATCACACTAAAGGAATTAAATGACGAAATAA +AAAACTTAAAGAATAGTAAAGCACCGGGAAAAGACCTTATAACAAACCAACTTATAAAAA +CCCTACCGACTAAAGCTACACTGTACCTTATCCTAATCTATAACTCTATACTTAGAATTG +GATACTACCCAGACGCCTGGAAACATGCCCAAGTGAAAATGATCTTAAAACCAGGGAAAA +GTGTGAACGACCCGAAGTCATATAGGCCGATCAGTCTACTCTCGGGACTCTCTAAAATGT +TTGAAAGACTACTTCTAAAAAGACTTTTTAGGGTAGATCTATTCAAAAAAGCCATACCAC +TGCACCAATTTGGCTTCAGAAAAGAGCACGGAACTGAGCAGCAAATAGCCAGGGTCACCC +AGTTCATCCTCGAGGCCTTTGAGCGAAAGGAATACTGCTCAGCGGTTTTCCTTGACATCT +CTGAGGCTTTCGATAGGGTCTGGCACGAAGGCCTTTTACTTAAACTAGCTAAAATATTAC +CATACAACCTATACATTATTCTCGAAAGCTACCTTACAAACAGAACATTTGAAGTTAAAG +ACCAAGCTGGAGAGACTTCGAGAGCAGGACAAATAGGCGCAGGGGTGCCCCAAGGAAGCA +ACCTTGGACCCATACTGTACTCTATCTTCTCCTCAGACATGCCACTCCCACACATATACC +ACCCCTCCCCAACAGAAAGAATTATGCTCTCAACATACGCAGACGACACTATAGTACTCA +GCTCAGACATACTAGCAACTGCTGCCACAAGAAACAACGAAAACTACCTCAAGACATTTT +CGGACTGGGCAGACAAATGGGGTATCTCAGTAAATGCTGCTAAAACAGGACATGTCATTT +ATACATTAAAAAACGACATACCTACAAATCTAAAGACCATGAAGATTAAGGGTCAAGCAA +TAAAAAAGGAAAGCAAGCAATCATACCTTGGCGTAATCCTTGATAGCAAGCTAACACTTA +GTCCTCACGTCACGAAGGTAGTAGGTAAATACTTGACAGCCTATAGAAAAATGTCATGGA +TCTTAAATGAAAGAAGCAAACTCCCTACTAATACTAAGATGCTGATCCTCAAATCAGTTC +TATCGCCAATATGGCAGTATGCCATAGCAGCCTGGGGTCCCCTTGTGACAGATGCACAGA +TAAGACGGATACAAGTTGAGGAAAACAGAAAAATGAGAGACATATGCAGAGCGGGAAGAT +ACACGAAAAACCAAACTATAAGGGACCGCTACTGTGTCAAAACAGTAGAAGAGTTCTATC +AACAGGCTGTCCACAGGTTCTCAGAAACTACAAAATCGCACCCTAATGTAGCTGTTCGCA +GGATATTCTCTAGGCACTATATCCCGAACAGACTAGAAAGAAGCAGGCAGAGGTACTTGA +AAATGACAATGGACCATATCACGCAAAAACAGACTGGACTGACCCTCTCACCTAAACTCT +TAAAAATCCCTGATCTAGATGACTGCAGAACCTTAAAAAAGCGAAGCGAGAGAGAGAAAA +TAAGACAAACGCATCTAACTGAACTCCCCACCCTGCTGAGACTAGAGGAAGAGGAGGCAG +AGCTCAAAAGAATAAAAAAACAGGAAGAGAGGGAAAGAAGGGAAAGGGAAAACCAAAAGT +GGCCTCCAGATAGGTGGTGTGAACTGGAAATAAACCGATATAATAAAAAATATAGAAATG +GCGATCTAACCAGGCAGGAAATTATAGAAAAATTCCGAGGGCAACCATTAAATGTACAAC +GAATAATCCTACCCGACTACGAAGGTGACTAAAAGTAAATCAAAACAAACTAGGGTCGGA +GCATAAAGCAGAAATAATTAACCTGGCGGAAGGGGCGGCAAAAATATTTAAAAGAAAGGA +AATAAATACAAAAAGGCTAAAGGCTAAGTTACAGGTTACATAAAAAGGGAAATGTGCTTA +TAGATATAATGGTAAAATTAACTTAACTAAACACCTACTGGAAAACAAAACCATGATGGC +TGCGTACTTAAAACGTTTCTCCTGGCGCGATTGAAAATCCATCTTTCCTATCCAACCGAG +GGATCTGCGACTGCGGCCTTCTGCCGTTCGGCTCCTGATGGATCCATCTGCTGCTGGAAT +GGGTGCCACACCGGCGCTCCAACCTAAAAGAAAGATAATATGTCTTAGTTTTCTTTCCCT +TTTTCTCATAAAAAACAAAAGCTCATCTGGAGTCTGATAATAGCTTTAGCTCACCAAGAC +AGCAAAAACAACAGCATCAAGGCCAGCAACAGTGGAGGCAGAGACCAAGCGGTTTGCTGA +ACATTTCGCTGCCCACACCCACCATTCCTGGAGGCTCTGAATGAGGGAGCTGAAGCCTCT +GAAAATTGAAGATCCTACTCCAATGTGACACTTTCGGCTCCGAGCTCAACGCCGGCGCTG +CAAATCCGGCGTTATAAGGAAAGGGTGCTCCAGCTTGTGGAGTGGTCTTTCCCCAGAGGC +AGCAGCAGCAGCAACGCCAGCGGCAATTGGCGACCTCTGCGTAGCCGAGTCAATCCCGTT +ATCGGTCCGTCTGGCGATGCGTTTCCGACGCGGCGGTATGCGTCCATAGGGACCGCCTAG +AATGCTTGGCCAGGAGACAGCAGTAGACCTGGGCGTGGGCGTCACCAGCAACATGGTAGC +CATGCGCAGTCAATTGGCCGGTGGCAACAATCTTGCCATGCAGCAATAGCGGCGCATGCT +ACCCTTGGAGCGACGTCAACAGCTACATATTTTTCAACAGTGTAGCGCGACCTTTAGGCG +CCTACACCTACACCAGCAGCAGCGATATTGGCAGTAGCAGCATTTAATGTCTTGCAGCAG +TTTCCATTTGACAACTTCCGACGACCAGACTCCTCGCTTGGCCCCTGGCGATTCGCCCTG +GAAGAAAGAAAGAAGCATGGATTAGTCAAATATCAAAGCACAACAAGCATGCACGAAATC +TTCGCAACAAGGACTATTCCAAGGCAAGCGATGGTGTGTTCTTTGGCTCTACATATATCG +TTGAAATCCGTCTCCAACTGCCGCGAGTCACCCACGACTTCCACTCCCTGCAGACGGACG +TAATGCACTACGATGTGTAAATTTTCCGGATCCAAGTGAACGCCAGGCGGAAGAGGATTC +CCTGGATGTGAAGGATCACAAACTGCTGCTTTTTCAAGAGTCCCCATTTAACAACTTCCG +ACGACCAGACTCCTCGCTTGGCCCCTGGCGATTCGCCCTGAAAGAAAGAAAGAAGCATGG +ATTAGTCAAATACCAAAGCACAACAAGCATGCACGAAATCTGCGCAACAAGGACTATTCC +AAGGCAAGCGATGACGGACGGAATGCACTACTATGTGTAAATTTTCCGGATCCAAGTGAA +CGCCAGGCGGAAGAGGATTCCCTGGATGTGAAGGATCACAAACTGCTGCTTCTTCAAGAG +GTAACCGGCCTCATTTCCACTTGGGTCACATCGATTGTGGAGGAAGCCGATTGGGACTTT +GAGCGAGCCCTAAAATTGTTCATTCAGAAGAACGCTGATCACGAAATCCCAGATCTAGCA +TTCGCCTAGAATATGTGATCTCGTTGGACTGCGTGCTGGACTGCGGCGCATGCTTTCCCT +CCCGCCAGAGACGGGATGCGCGCATCAGGATCGACGGGACAGACCGGCCGACGCCTGGCT +TCACGTCGGCATCTATGCGACGACGTGATAATCAGCTTCACAGTACCTGCGGATGAGGGC +ACAGGCGCCAGTCCTCTGCCTAGCGACACATACACCAACAGCAACATCTAAAACAGTCGC +AGTAGATGCAGGGAATTTTCTTGCTGCATTCTCCAACTGGAAAAATCCGACGGCCCAACT +CCTAGCTTAGCCCGGCCAATCTTCTTGGACTGGCAAACGATGTGATGAATCGTCCTGGAA +GAAAGAAGCATGGATTATTTCTTCATACACAGCTTGTCTACTAAAATGCATTTCCCGGCA +AACTGGCACTGGGGCGTTGAAAATACGACACTACTCACCAAACAGCAGCAAAAACAACAG +CATCGGCAGCAGGCGACCAGCAGCTGCTTTGGCTCACCCAATGCGACAGCAATATCTGCG +CATGGCCAGCAACATGCAGCAAGCAAAAGACCGGCATGGTGGTGAACAACATATCGCTCA +CGCCCAACGATCTGGAAGCCCTGAGCTAGGGAACTGAGTATCCGCCAGCGGATACTTATG +CAGCGGCGAGGCGTCGGAAATCCGATAGCCGGAAGAGAGGCCGGAGCAGCATGTTGGGCA +TTTTCGCCCCAGTAGCAGCTGCTGGGGCAGCAAGGGCAGAGGTAGCAGTGTCAGCGCTCC +TGGTAAACCGGCCTTTTCTGTTGAAGACGCGGGACTGCGGCGCAATTGTTCCTGCCAACC +GGGAGTTCTCTGCGCCTGAGGTCCTGTTGTGCTTCAGCGGCTCCATCTGCTGTTGCATCT +GGCGCTTCTCCAACTTTCCTCCCTGAAAGAAGAGAATATTAGTAGGAGCATGAGACCAAC +AACAGCCCTAGCTTACCACGTCAGCGGAAACAGCAACTGCAGAAGCCCGGTAACTTTCTG +ATAATATGCAGCAATAAGAGCGGCTGGATCAGCATGTTGTGTAGCTTGGCCCCAGAAGCA +GCAGCTGCGGTACCAAAGGCAGCGGAAGCAGGGTCAACATAGTCTGCTATGCTGTGTCCA +TACTAGCATAGTCAAGTCAGCGGTGGTGACGTTGCCGCAGCAGCTGATCCACAGGGTACG +GCCTGGAATGTTTTGTCAGAGACGGCAGTGGCCTGGGCGTATTAGTCAGATACGCCAACA +ACATGATACCCATGCGCAACCATTCTTCCGGTGGCGGCATGCTCGTAAAGTAGCGGCGGC +GCATGCATCTCTCGAAGCAGCAGCAGCAACAGAGGCGTCTCATAAGTGCATGCGCAGCAG +CGGTAGCAGCGGTGGTGGCAGCAGCAGGGAGATTTCATTGCTGCAGTCGCCAAATTACAT +GCATCCTACGACTCGACTCACGCTTTTTGGCCCCTGGCCGATCTTCATATATCTCAAATC +GACGGCTGCTTTTACCCTGGAAAAAAAAAAAGGAGCTTGGGTTATATTGAACTACACTAG +GCGGCGACACACTCACCAGCAGCAGCCAGAACAACAACAGCGGCAGAAGTAGCAGGAAAT +TATCTCACTGCAAAATCCAATTGGCACTTTCCGAAGTCCGTATTTCTCGCCTGGCCCCTG +GCCAGTAACAGGGGCCTGTGCGACGGAGATGACGACGATGATCTGCCCTGTGGACGGCCT +CAAGAAGGAATCGGCCCTGTACTGCCCACCTGACCTGTGCCAGGATAGCAGCAATGTCAG +CGGACCATGGATGGAAGAGGCGGCACTGGCGACGGTCCTCAGTTTTGCGGTTTCCGCGGG +GCGTAGGCGCAGTAATCGGCGGCAGCAACAGTGGCGGCAGCAGAAGGGAATGTGTATCTG +CAGTCGCCGAATGGCAATTTCCTGCCCAGCTGTAATGGACCGACAAATGTTTTTTGGCAT +GTCGACCTGTAAGAAAGAAGCAAGGATAAGTTTTTTCTTTACAAGATTGTATATGAATTT +GTATTTACGGACAACTGGCTTGTTTCCTGTCGACGATAAATGGCGCTTCATGTTTTCACT +CTGCCAAAATCTGAGTGCAAGCATCGGGGCTGACGGGCCGAATTTGCTGATGCCTTGTAC +ATGCTAGCATCTTTATGCCGCCGTGTAATTTTGCGACAGCAAAACACATGATGGAGAAGA +CGAAGGTGATCGATGGCGCCCGGATGACGGATGCAGGCCCGTGCTACCCACTGGTCCGTT +GCCAGGACAGCAGCGTTTCAATTATGCGAACAGAGGCACTGGAGCCACTTCTCAGGCGAT +AGGGATCATGAGGCGACGACAACTCGCCAGCAGCAGTAACAACAACAGCGGCAGCAGCGA +TCTCGGACTTGCTGAACATTGCGGCTTTTTCCCAGCCTGGACCGTCATCACAAACGCTCT +CAAAGATCGGTGCGCCTGCAGCCTACGGAAGCGTACAACTGCCCAAAGTCGTGCTATTGC +ATAATGTTAGGTGTCCTGGCTGCTCCGGCGGATGAGCTCCACCCGATTGAGAGAGGTAAG +AAGGCCCAGCAAGTCGCCCTTAAATAAAAGAAACAAGCATTAGACTCGGCTGAAATTGTA +ACATCAGTCAGACTGTACTCACGCATGCACTTAGACAAACCGAAGCCTATTCTATTGACG +ACGCGGACTCCAACACATGTTTTCCTCCACAAAAGGCTGTGAGTGCACCAAAGTTGACGG +GCCACGCCGGCCGATGCTTGCTGCATACCGGCATCTCCGCAGCAGCGACGTTACAAGCAC +CACTAAAATTAGAAAGAGGCTTACTATAGGCAAAGCGCAGAAAAACAAATATTACAATAA +GAAATAGCACGCGATTTTTCTGCTTCGTTTCCGCTTGGTACAAGTGAGACCATTCTCCCT +ATATGCCATTCTAGTATATTTGCCCGATAAGCGATATGCTGGCGGCAAAAAAAAAAGATA +ATAGCCGATAAGCCCGCCAAAAAAAAAGCGCGAAATATCGATAACGAGCTGGCACGAAAA +TTGCTGGCATATCGATCAACCGCTGTGTCTTTGAGCTATCGAAAAAGCCCGCCTACGCGC +CTAGCCCAAATTTGCAAGTCAGTTGAGATTATAAAACCGACAGAGGCGCGCGCCGAACAG +TAGCTAAAAGTGAAGCCAGCAGCAACAACAACAACTAATGGACGGCCAGAACGTGAACCA +AAGCGGAGGATGGGCATTGGTCTTATCCATCTCATCGGACGATGGTAACTGCTCATCCTT +GCCGCCATAGTCTCATCGCTGGATATCAAGTCATCGCTCAACTATACCTTAAAATTACTC +ACCAAAACTCTTTTCTCCTTTTCCATAAGATAAAGTAAAGTAAAGTAATGTAAAGTAAAG +TAAAGTAAATTAAAGTAAAGTAAAGTAACGTAAAGTAACATAATATTTAAATTTAAATTC +TACACTTGAACAATGGCGCGCAAAACTGCCGCAATGTAATTCAAAAATGTCTCCCGCAAA +TTTAAAACATAGATTAATACTTGTAAGTATGGCGCGCATATCTGCGGCCAAGAAATCCGA +AAATGTAATTTGCCACAAATTGTCACTATATATTTTTAAGCAAAAATCAGAGGACAATAA +ATGCCAACGTCATTAGACGTTGAAAATATTCAAAAAAAAAAAAA +>DM14101 +GATCCGGCCGGATGGCAGCTCGACGACGGTAGCAGGCCACCATGCCCGCCAGCCCGCAGC +TAGGATAGCAGCAACATCAGCGTCTTATTAACGCGAACGGCGGCACTGGCCCTTAGCTGA +CCAGCTGCAACAACATCAGCGACGCAGTCTCCACCAGCAGCAACAACAGCAGCGGCGCTT +GCGACAGCAGCAGCAGGGAATGGTTCTGCCGCAGTCGCCTATTGCTGCCTATAAAGAGCA +TTCCTTGCCAATTGGCTTTCTGTACGACGACGATGATCCTGCGGACAAATCCACCTTTCC +GGACGCCTGAGTATTATGGCGAGCCTGCTGATCATTGTTTCTCCGACTCCTTACTTGACC +ACTGGACAATCATACAATCACCGGCTTTTCACATCTGGAAGAAAGAAACCTGGATTAGTA +TTTGCCCTTCAGATTTGTATGAAACTGCATTTCTGGCCAACCGGAGTGTTTCCTGCAGAC +GACGCTGGACTGCGACGCACTTTTTTCTACCAACACAGATGGGACGCTTGCATCAGATCT +GACGGGCCAGACTGGCCGATGCCTGGTACACGATGGCATCTCCGCGGCGGCGAGATGTGC +AGCGACGCTGAAAGCAATAATAATTCTTTTACTTTGCAGTATCAAAAATGAGAAGCCACA +TCACAATTTACATCAGCAAAAATTACACGTGATATCTTTTTCTTTTGCCTAGGAGTAGTG +AGACCTGCTACCAAAATGACCAGTAATACCGGCTAACGGAAGCGAGATATCGATAATCAT +TCTGGCGGTAAAATAGCCAGAACATCGATAACCAGCTGTGCATTTTCCCTTCGATTTATC +GAAGTCAAATAGCCCGCCTAGGCTATCGGACCGGATCGGCAAGTCAGTAGTGATTAAAAA +TCCGGCAGAGGCGCCTGTGCAGCAGCTACCCAAAGTGAACACGACGAAACGCAACAACAA +AATGGACGGACATAATGGAGATCAAAGTGAAGGATGGGCAACAGTGCTATCTATCTCCTC +GGATGATAGTAACTCCTTGTCGTCGCCGCCGTCTATAATAGTTTCATCGCTGGACACCAC +GCCAACTTCGCACGAAACCACCATAGTAAGAAGAAGCCTATATCAAACAAATGCTGACAT +GAAATCTTACGATTTTGAAAATATTGTATTAAATGAGAATAAAAATACCATATTGCCAGA +CCCTTTATTTGTTGATAAATGCGGGAGTACTGCTAATACCACAGAAGCCAATGAAAAAAA +GCCTGCCAATAGCCCCTTCCCCATTTCCATTAGCAAGAATTTTAGCACTTCCTCGCCACT +AACACATGTAGACACGCCTACACAAGAAGATGACGCCAGTGCGTTCAATACATTGAAAGC +AGCTAAAACAGCTAGAATAATTTTTCCCACACACACACATATAAAGCCCACCAAACCCTC +GCCCCCCTCCAAAGAATTAAGCACAAACTCAGCACTAAAAACTCTCAGCTACACAGACAA +AATAACAGGAACACAGAAAAATCTACCCGACAAAACACATGTAGACACACCTACACAAGA +TGACGACATTAATGCAACCAAAGCATCAAAAACCGCTAAAATAATTTCTACACAGACACA +CCTAGGTGAAACCAAGCCAATACAGCCCGCCAAAGACCCCTCACCCCGCACCCAAAAGCC +TATTGCACACAAAGCTGACGAGACACTTACCCACACAGACAAACTCACAGCATCACAAAA +CCTCGTTCCCGCCAAAACACATATAAACACACCCACACAATATAACGACACTAATGCAAC +CAATGCATTAAAAACCGCTAAAATAAATTTCTCTTCACACTCACACCAAAGTGAAATCAA +GCCAACACAGTCCGCCAAAAACATTTCACCCCTCACACAAAAGCAATTCACAAGCGAATC +AGCCGGGACACACACCCATACAGACAAACACAAAAACACAGCATCACAAAATCTCTTTTC +CGCCAAAACACACATTAACTCACCCACACAACATAACTACACTAGTGCAGCCACAGCATC +AAAAACCGCTAAATTAATTCTCTCCCCACACTCACACCTAAGTGAAACCAAGCCAACACA +GCCCGCTTTAAGCCCCTCGCCCCTCTCCCAGAAGCAAATAACAAGCATAGCAGCCAAGAC +ACTCACCCACACAAACAAACACACAGCATCACAAAACTTTATTCCCGCCAAAACACATAT +AAACATACCCACACAATATAACGACACCAATGCAACCAAAGCATTAAAAACCGCAAAAGC +AGCTTCTCCCTCCCACACATACTCACGTCAGACAAAACCAATAAAGTCCGCCATAAACGC +ATTGCATCCCGCCCAAGACACAAACCCAAGCCCAGCAATCAGTGCTGTCACTTACACAGA +CAAACCCACAGCTACTCAGAATATTTTTCCTGTCAAAACTTTTGCAGAGCTGGTTAGGGA +AAATGCAAAACGCTTACCAACTCCAATGCAGAATTCCCATCAAGCTAAAAATGACTCTGC +CGCTCTCGGACGCCCCCCGACTGCAGCTAGAAAAAATCTAAATAAAACACTGATTTCTCC +TAAAACTCCTGGGAAGCGCCGTGGGGACTGTCTTGATGAAGGCCTACTACAAACCTCTAA +CAAAAAGGTTAGAATACGCGATGACTTCTCTGACGATGATCTTGGGGTCACAAATCTACT +CTCTGAAACACCCTTATTCAAAAGCAAAGCAGCTATCAAGATCCGGCAAGACTCGAGAAG +AGATTCCCTGCAGAAGTCAGCCGAAATGGACACAGCTCCAGCAATTAGTCCCTCAAACAC +AGCAGCCGATTCCGACCTACCGCCCTGGAAAACTGTTCCAGCTAGCAGAAAACCACCATC +AATCTTCTTGTCCAATATACAGCAGATTATCCCGCTAATAGAAAAACTAAACTATAAAGC +CGGGGTAAATAGCTTTACCACCAAATCTGAACTTGGCAACAATATTAGAATCCAGGCTAA +AACGATGGACGCCCACAATGCAATTCAGAATGTTCTCCTTGAGGCAAATATTCCCCTACA +CTCCCACCAGCCAAAGAGTGCAAAGGGCTTCCAAATTGTAATTAGGCACCTCCACCAGTC +AACCCCGACCAAATGGATTGAAAGCCAACTTCAAGACATCGGTATAGCTACAAAATTTAT +CAGGGCAATGCAGTTTAGGGACACGAGAAATCCTATGCGCATTCATGAGGTTGAAGTTGT +ACCCAAGGCTGACGGCAGCCATCTCAAGGTCCTGCTACTAAAATCCCTTGGAGGTCAAAC +GGTCAAGGTTGAAAGGAAACGGGTATCGAAGGATCCCACACAATGTCATCGCTGCCAATG +TTTTGGGCACACAAAAAATTATTGTAGAAACCCGTTTAAATGTATGAAATGTGGCCAGCT +GCACGCCACGGTTTCATGCACTAAACCCAAAAACCTTCCGGCTACTTGTGCAAACTGCAA +TGGAAGCCACGTAAGCAGCTATAAAGGATGTCCCGCTTTCCAAGAAGCAAAGCAAAGACT +ATCTATCAACAAAATTCAATCCCTACACTCACAACCCACGCACCTTCAGACCCCCCGCAA +TAAACATCCCTACCCAAAACCCACCCACCTTCAGACGCCCCGCAATAAGCAGCCCTACAC +ACACCCCCTCCCTCGCACATCAGTAAACAACACAAAACTACCTGCCAAAAGAATCCAAGG +AAAGAAGATATCGCAAAGGAATCTATCTATAAACAAACGCTTACACAGAATGAAAAAACC +GAGGAAGGAGACAAGCCCGCCGACAACTAGCAAAAAGGTCTTGGCCTCTCTAGAAGAAAG +CAGAAAAAACCCAAATAGCGTCCTAAACCCGGCCAACACCCATCTCACTCATTTCCGCCC +ACCCCCTTTAGCACAAAATATTCCTAATGACGAACCTAAGGAGCTGAGTGGGGAGCAATA +CCTTCTAAATCGCATTGAAGGGATGGAAAAGAAGATCAACAACCTTCTTGAAATCGTCAC +CCGCCTACTAAGACAAGGAAAAGACTGTCCAAAGTCTCCAAAAAATCCTTTCCGAGATCC +AATCTTCGTGTAAATGCTCTTTCTAGTAACATCAGAAAGTGACGTTTCCTATGACTCGGG +CTGACAACAGGGACATCCTTAAAATCGCTTTCTGGAATGCTGGTGGGATTAACAATAAAA +TAGATGAGCTTAAGCTGTTCATTCTAAATATTGATGCCCACATAATCATAGTCACCGAAA +CTAGACTAGACAACAATTCTACCAAACTAGAGCTGCCAGGATATTTCACATACTTAGCCC +AAAATCCTGTCTCTAGCAAGAGAGGAGGGGTCGCTACTATAGTAAACAGCAGTATCCGAC +ACATGGCCCTAAAACCGATCGAAAAAGAATGCATACAAAGCGCCCCAATAGTCCTGCTGC +CTGAAAACAACAGACGCAGCGAAATGATAGTAATAGCATCTGTCTACTGTCCGCCCTCGC +TAAGGTGGTTGCCCCACCACTTTACTGACGTTCTCAATTTTGCAGAGAAAACTTTAGGAG +GGCAGACCAAGTTTATCCTATGTGGCGACTGGAATGCAAAACATAGACAATGGGGTTGTA +CACGCGCCTGCCAACGTGGCACCGCACTCTACGAAGCAGTCCAAGCCGACTCCACTGCAG +AGATCATTGCCACTGGCTGTGCTACACATTTCCCACATGACACAAGAAAAAACCCGTCAG +CAATAGATTTCTCCATTTGCAAAGGGCTTGGCAGGTTTGAAAAAAGAATTTCTTCAGGGG +CGGATCTATCCTCAGACCATCTTCCCATCTTGTTAGAGATAAACCTAGACACAAACACCC +TCTTCTTGCAAAAACAAAACAACAATATACTCAAGAAAAATACAAACATCGAGCTGTTTA +AGAAAGTTCTAGAAAGAAAGATACTATTAAACACTGAGATAAGGGTAGCAGAAGATATAA +ATGACGCCATAAGCACCTTTATGAAAAACATCAAGGACTCGGCTGCGGAATCAACTCCCT +CCCCAAGAATACGTGACAACCCCAGAAGAAGACATAGGCAAGCCAACAGAAACAGTCATA +CCCTCGCACTAGACGAAAACACAAGCAGACTGCTTGAGGAAAAACGCATATTAAGTAGAG +TTTTCAAAGCTACCAAAAATTACGAGGACAAAGCTAAACTAAAGGCAGCTGAAAACCGAC +TAAAAAAAGCGATAAAAATATTGAGAGAAAACAGAATCAATGAGCAAGTTGAAGGAATAG +ATACAAGTAACCCGGACAGAATGAGAAAAATGTGGAAACTGCTAGATGAAGGGAAAAGGA +CAAATCAGCCTAATTTTCCCCTCAAATTAGAAACCCAAAAAGGACCCAAATGGACAAAAA +CGATTAAGGAGACAACAGAAACATTTGTCTCCCACTTGGAAGGAAGATTTAAGCCAAACA +ATAATGTACCTGATTACCACATAGATAGAGTCAATACTGGACTAAGAATAATTAAGGAAA +GCATGCTAACTGAACGACATAATCTGAACAAAAACCCCCATAACCAACCTATTACTCTAA +AGGAATTAAATGACGAAATAAAAAACTTAAAGAATAGTAAAGCACCGGGAAAAGACCTTA +TAACAAACCAGCTAATAAAAACCCTACCGACTAAAGCTACCCTTTACCTTATCCTAATCT +ATAACTCCATACTTAGACTAGGATACTACCCAGAAGCCTGGAAACATGCGCAGGTAAAAA +TGATTCTCAAGCCAGGGAAAAGTGCAAACGAGCCAAGGTCATATAGGCCGATTAGCCTAC +TCTCGGGACTCTCAAAAATCTTTGAAAGACTACTCTTAAAAAGACTTTTTAAGGTAGATT +TATTCAAAAAAGCTATTCCTCTGCACCAATTTGGCTTTAGAAAAGAACACGGATCGGAGC +AGCAAATAGCCAGGGTCACCCAGTTCATTCTTGAGGCCTTCGAGAGAAAGGAATACTGCT +CCGCGGTCTTCCTTGACATCTCTGAGGCTTTCGACAGGGTATGGCACGAAGGCCTTTTAC +TTAAATTAGCTAAGATCCTACCTTACAACTTGTACATTATACTGGAGAGCTACCTAACAA +ATAGAACGTTCGAAGTTAAAGACCAAGCTGGAGAGACTTCGAGAACAGGACAAATTGGTG +CTGGTGTGCCTCAAGGAAGCAATCTTGGACCACTACTCTACTCTATCTTCTCCTCAGACA +TGCCCCTTCCATATATCTACCGCCCCTCACCAACAGAAAGAATCATGCTCTCAACATACG +CAGACGACACTATAGTCCTCAGCTCAGACACACTAGCAACTGCCGCTACAAGAAACAACG +AAAACTACCTCAAGTCATTCTCGGACTGGGCGGACAAATGGGGTATATCAGTAAACGCTG +CTAAAACCGGACATGTCATTTTTACATTAAAAAACGACTTACCTACAAGTCTAAGGACTA +TGAAGATCAAGGGTCAAGTAATAAAGATTGAAAGCAAACAATCATACCTTGGCGTAATCC +TTGACAGCAAGCTAACCCTCAGCTCCCACGTCACAAAGCTGATGGGCAAATACACTACAG +CCTACAGAAAAATGACATGGATTCTAAACAGAAGAAGCAAACTCCCTACCAAGACTAAAA +TGCTGATCCTTAAGTCAGTCCTTTCACCAATATGGCAGTATGCCATAGCAGCTTGGGGTC +CCCTTGTGACGGATGCACAGATAAGACGGATCCAAGTCGAGGAAAATAGGAAAATGAGAG +ACATATGCAGAGCGGGTAGATACACGAGCAACCAAACTATAAGGGACCGCTATGGAATCA +AAACAGTAGAAGAATTCTATCAACAGGCACTCCACAGGTTCTCAGAAACAATAAAATCTC +ACCCAAATATAGCTGTACGCAGGATATTCACAAGGCACTATATCCCGAACAGACTAGAAA +GAAGCAGGCAGAGGTACTTGAAAATGACAAATGAACACATCACGCAAAAACAGACTGGAC +AAACACTCTCACCTAAACTCCTAAAAATCCCTGATCTAAATGACTGCAGAACCCTTAAAA +AGCGGAATGAAAGAGATAAAATAAGGCAAACCCATCTAATTGAACTCCCCACCCTGCTGA +GACTAGAGGAAGAAGAGGAAGAGCTTAGAAGAATAAAAAAACAGGAAGAGAGGGAAAGAA +GGGAAAAGGAAACCCAAAAGTGGCCTCCAGACAGATGGTGTGAATTAGAAATTAACCTAT +ATAATAAGCAATATAGAAGGGGCGATCTAACCAGGCAGGAAATCATACAAAAATTTAGAG +GACAACCACTAAATGTACAGAGGATAATTTTACCCGACTATAAAGGAGACCAGGAACACA +ATTAAAAGTAAATCATGGGAAAGCAGGGGAAAAAAAACAGAAGTAACAAAATGGCGGAAG +GGGTGGCAAAATATATATAAAAATAAGAAAAGATAGAAATAAAAAGGCTAAAGGCTCACT +TACAGGTTAATTCAAAAGGGAAACGTGCTTACATATCTAATGGTAAAAACTAACTTATAA +CACCTACTGGATGACATAGTGAGGATGCCACAGGTTGCGCACTTGAATCACGCTTTCCTG +GCGAGATTGTTAAGGCATCACCGGGATCCCGTCTCTCTTTCCTAACTGGAGGACTCATGC +CTGAAATCTTTTCCGCTTCACCGGCACCTGATGGCCATATCTGCTACTGCGCCTTGCGTC +CACGGACGCTCCTTCCTGAAAGAAAGAGAATTTGTTTTAGTTTTCCTTTCTCTTCTTAAA +AATATAACAAAAACAGCAGCAGTAGCCGACCAACAACATACTTAGCTTACCAAGGCAGCA +GCAATGATACCAACAGAAGCCCTACAGTGTGCTGAACAATATGCCGCCCACGCCCACCAC +TTCTGGAACTCAGGAATGGGGGGTACGGAATGCCGGAAACTGGAGGATTCGCCTCAAATG +TTACGCTTACATCTTTGAGCAAATCGCCTGCCTCCTCGTCTAACGGCCCGGCGTCTTGGT +ACGCCCAGAAGTAGCAGCGGTAGCAGGATTAGCAGCCTCCACAGAGATATGTTCATCCCA +GCATCAGTCCAGTTGGCATTGTGATGCCGCCGTAGCGTACGCCCTCAGAGACCCGACTGG +AATCCCAGGACAAGAGACGGCAGCACGCCTGGGCTTAGGCGCGGGACAACATGCAGAGAT +TCGTCAATGAGAATGGCGGCACTGGAATCACCTTTCAGCTGAGCGGGATAATGAGTCGGC +AACGCACCGCACTATCAGCAGCAATAACAACATCGGCAGATGACCTGGAAGAAAGGAAAA +AACATGTATCAGTCTTTTCTTTTCTTTTTTTTTCCCATTAGCATGCGTTTTTAAATTCCA +TTCCTGAAAACCGGCGTTTTCCTGTAAAAGACACTGGACGGCGGCGTTTGTTTTAAATGC +AAAGATTGGATGCTTGCATCAGGGCTGACGTCCTTGAATAGCCGATGCCTTGTAATTGCC +TGCATAGCCGCGGAGGTCCTGATGACGGATGCTGGCCTGTATTTGGCCACCACTCCGATG +CCATGACAGCAGCAACAGCAGCGGTTTTTGCAAATGAGAGGGATCAGGAGGCGGCAACAC +ATTCACCCGTAGCAGCAACAACAAGCAGTGGTAGCATCAGCAGGGAGTCTTCTCGCCACA +ATAGCCATTTGGAAATTTCTCGACGACCCGACTTCCTGCTTGGCCCATGGTCAATCACAC +TGGACCAGTTAACAGCGGCGTTTTACCCTGGAAGAAAGAAAACTTGTATTATTCATTCCC +TTTTCTCTCACAGTTGGGTATTTAAGTGCATTCCTGGCCAACCTAGCGTGTCTCCTGGCA +ATGACGTCGGACTCAACGCATGCTTCCCTTCCGACACAGTAAGGATGTTCGCATCTGGGC +TGACGGGCCAGGCCGGTCCGTTGCCATACATGCTAGCGTTTCCGCGGCGGCGTAGTGAAC +ATCAAACCGTATAATGGCGAAGACGACGATGATCCGGCCGGATGGCAGCTCGACGACGGT +AGCAGGCCACCATGCCCGCCAGCCCGCAGCTAGGATAGCAGCAACATCAGCGTCTTATTA +ACGCGAACGGCGGCACTGGCCCTTAGCTGACCAGCTGCAACAACATCAGCGACGCAGTCT +CCACCAGCAGCAACAACAGCAGCGGCGCTTGCGACAGCAGCAGCAGGGAATGGTTCTGCC +GCAGTCGCCTATTGCTGCCTATAAAGAGCATTCCTTGCCAATTGGCTTTCTGTACGACGA +CGATGATCCTGCGGACAAATCCACCTTTCCGGACGCCTGAGTATTATGGCGAGCCTGCTG +ATCATTGTTTCTCCGACTCCTTACTTGACCACTGGACAATCATACAATCACCGGCTTTTC +ACATCTGGAAGAAAGAAACCTGGATTAGTATTTGCCCTTCAGATTTGTATGAAACTGCAT +TTCTGGCCAACCGGAGTGTTTCCTGCAGACGACGCTGGACTGCGACGCACTTTTTTCTAC +CAACACAGATGGGACGCTTGCATCAGATCTGACGGGCCAGACTGGCCGATGCCTGGTACA +CGATGGCATCTCCGCGGCGGCGAGATGTGCAGCGACGCTGAAAGCAATAATAATTCTTTT +ACTTTGCAGTATCAAAAATGAGAAGCCACATCACAATTTACATCAGCAAAAATTACACGT +GATATCTTTTTCTTTTGCCTAGGAGTAGTGAGACCTGCTACCAAAATGACCAGTAATACC +GGCTAACGGAAGCGAGATATCGATAATCATTCTGGCGGTAAAATAGCCAGAACATCGATA +ACCAGCTGTGCATTTTCCCTTCGATTTATCGAAGTCAAATAGCCCGCCTAGGCTATCGGA +CCGGATCGGCAAGTCAGTAGTGATTAAAAATCCGGCAGAGGCGCCTGTGCAGCAGCTACC +CAAAGTGAACACGACGAAACGCAACAACAAAATGGACGGACATAATGGAGATCAAAGTGA +AGGATGGGCAACAGTGCTATCTATCTCCTCGGATGATAGTAACTCCTTGTCGTCGCTGCA +TATATAAAATAATAAATTTCTTAAAATAATTTCATCGCTGGATTCCTGCGCCACCATAAA +TTACTTATAGAATACACTTAACACTGTACCCACTAATGCTAAAAATTTTCTTATACAATT +TTACTTTAAAGCTAAAACTACTTAAACTATGGCGCGTAAAACGGCCGTCAAAAATATCCA +AAAATTGTACTTGCCATAAACAAATTCTAACATAATGTAAATCCTAAATCGTAAAATCAT +GGCGAACATAACCGCCGCCAAGCAAATCAAAAAATGTTCCTAGAAATTGTAAATCTTAAA +CCTACTTCTCTAACTAAAGCGCGCACAACTGCCGCTGATCCGAAATTGTAAAATGCCATA +AATTGTAACTATATATTTTATAAAAAAAATCAGAGTACAATAAAATGACAGCGCCGAAAG +GCACTGAAAATATTTAAAAAAAAAAAAAACTGCCGCTGATCCGAAATTGTAAAATGCCAT +AAATTGTAACTATATATTTTATAAAAAAAATCAGAGTACAATAAAATGACAGCGCCGAAA +GGCACTGAAAATATTTAAAAAAAAAAAAAAAAAA +>TIRANT +GGAGTTACCACCCCACCCCCTAAACCCCCACGCCTCTAAACAAATCATCGGACACTCAAC +CGGGAAGACGGCAACTGGAACACCGCATCCGGCCGAATGCTGACATTCCGGCCGAATGCT +GACATTACACAAAAGTCGCACTGCAACATTGTCCCCAGCTAGCCAGCCACATGCCGAGTC +GGCATGTTCATTATGCTTACAATTAAGAACCTATGTACTTATGTATAAGACGAAAACGGA +GGACTCGAGTAGCCACTCTCTGACAATAAACTTGATACTGATTTTGAACTTCAAGAAAGT +CAGTCGTATTCTTTATTGGAAATCTTCACACTACAACTATCTGCTGAAACTTAAAAACCT +TCATACATTTACACATCATATCTTCACAAAAGGCTCCACCCTCGATCACGGACTTAACTG +GCGCAGCCGGTAGGATGTCCTACCTATTAATAATTACCTACCTGTAAGTAAACATGTAAG +AAACGAAACAAACTATATGCAAGATGTCGACTGAAAGTGACTAGGAACAAATTTTTATAA +AACAAAATTGAAGTTGTGAAGTACCAAATGAAACTCAAACATATATTCAAACACAGGAAA +AAAAAAGAGAGAGGAAAAATGTAAAATAAATAAATATACAAAAAAAAGTGCAAGTGTACC +GTACTGCCGCGCTGACGTGGAATCTATCGCTGATCATCACGCCATCGGTATGTCCATACT +CTGCCGAACGTCATAATTTTTTTAAAAAAGTGCAAGTGTACCGTACTGCCGCACTGACGT +GGAATCTATCGCTGATCATCACGCCATCGGTATGTCCATACTCTGCCGAACGTCATAATT +TTTATAAAAAAGTGCAAGTGTACCGTACTGCCGCGCTGACGTGGAATCTATCGCTGATCA +TCACGCCATCGGTATGTCCATACTCTGCCAAACGTCATAATTTTTATAAAAAAGTGCAAG +TGTACCGTACTGCCGCGCTGACGTGGAATCTATCGCTGATCATCACGCCATCGGTATGTC +CATACTCTGCCAAACGTCATAATTTTTATAAAAAAAGTGCAAGTGTACCGTACTGCTGCG +CTGACGTGGAATCTATCGCTGATCACCACGCCATCGGTATGTCCATACTCTGCCAAACGT +CATAAGTTTTTATAAAAAAAAAGAGTGCAAGTGTACCGTACTGCCGCGCTGACGTGGAAT +CTATCGCTGATCATCACGTCATCGGCACTTACATACGCTGGCCAACGCATCGCCAAAGCC +TCTATATACACTTATATATGTGAGCATACAATATCAACTACAATCCAATACATCCACGTA +CTGTACCGCCTCGTTGGCATGGAATCAAACGCTGATCACCATGCCACCGTGGTAAACAAA +CAAAGCACCAAAGCCTCTCTAATACATTGTACACTCAAAACGCACACTGCCATACGTCGG +CGAAAAATCAAAACATAAGCAAAAATCATTTCAAACCAAGCGAGGCTCATTCTGCGTACC +ACAACGACAACGACACTGCATGTGTAGTGGCGCACCCATGTCTGGGTAGCCGAGGTAAGG +GGAAAACGCTTGAGTATCGTCAAGTGTTCTTGCCTTTCACTCTTCTACAATGGGTTGCTA +CGCTCATGTATTGCACATTCAAAATAACCAAAACAAATGTACTAAAGAAGTCGACATATA +CAGATATATTTTGTTTCCTTTCATTGTGTAATTTTGTATATCAAACAAATACTAATACCA +ATCACATTGCAGAATATAAAAGGGAAAATATAAAGCCAAAGACAGACACCCATACACTCT +AGTAAACAAGAAATTTGTTCATTATTTTTCAATCATACATAATATACTAAGTAACCTCAA +ATTTAATGTCAAAAAAGTTCGTTTACAACCTTAGGAAAACTACACGTTCAGTTGTTGGAG +TTCCACCAAACACTAATAGGCCCCCACATCCCGTTAGACGTCCTGACTCCCTTCTCCCGA +TTTCGGAAGAACCCAAATCAATATCTTCCCAAACCCCCAATATGGACTCGGGAAACGATT +CTGCCCGCCCCACTCCATCCCCTCTGGCGCCCACTGTCAGTGGTATTAGCTCCTTAATTT +CAACTACGTTCAAGCCTAAAGATATCATGGCATTTGTTGAGCATTTGCCAACCTTTGATG +GTACACCTCGTCTATTGGACAGGTTTATCACTAGCGTAGAAGAAATCCTGATGCTCATCA +GGGGAGCTGACCAAACACCGTATGGCCTGCTTACTCTGAGGACCATCAGGAACAAAATCA +TTGATAGGGCCGACGAAGCCTTGGAACTGGCAAATACCCCCTTGGTTTGGGATGAGATTA +AAAGCAATCTCATCCGCCTCTACTCGAGCAAGAAAAGCGAGGCCAACTTGTTAAGCGAGC +TTAACACATTTTCGGACAACCTGACCTTGGGCCAACTGTTCTTTGGTATATCAAAGGTGA +GAAGCCAACTCTTCTCCATACTCAAAAACAGCGAACACAACAACACTGTTGTAGATGCAA +AAAAGGTTGTCTACAACGAGGTTTGTCTCAATGCTTTTATGACTGGTTTGAAGGAACCTC +TCAAGACTTTCGTCAGGATAAAGTCCCCTTCTACACTTGAACAGGCGTACGAGCAATGCC +AAATAGAGCAGACCTTATATAGGGCACAAAACAAGCGAACCAACAGACCAGAGCAGGGAC +CCAATGGATCAGACAATAAAACCTACCGAAATAGCTACGACAGCAATTACCGCAGCGGAC +GTAACGACCGAAATGACCGTAGGGGACCCTACTCTAACTCTAACTCTAACTCTAACTCTG +GCCAAAATAGACCATTTAATTCACACAATCGCACACCCCAATCCGGCACCAAGGACAACC +GGGCCAATACATCAAACCCCTTTCGAGCACCTTCACATAGTTTGAATAATATAGAGGAGA +ACCCTCAACCTGATTCGAATTTTCAGCAAACGGCCTCGGGAAACCAACAGGGTACATAAG +CCCAGCCACGCACAACCCCTCGCTTCCTTTTATAAAAATCAAACTATCCCAGACAAACCC +CCTGAAGTTTTTAATTGACACAGGCTCTACACACTCCTTCATCGACCCAAAATATGTCGA +CCCTAGGAACTGTGTGACCTTAGATACGCCCATAACACTCAAAACAGCCCTGAACAGTTT +TAAAATATATCAAAACGTCTCTATACCATTTCCACCGGAATTCCAAATCACGGGCAAAAT +GACCCTTCTACCTTTCAAGTTCCACTCTTATTTTGACGGATTGATAGGAATGGACTTATT +ATCTTACCTAAAAACAGAAATAGATTTACTTAACCTAAATCTAAAAACCCCAAGTACCAT +TATACCCTTATGGACCCACAGTAACTCAACTTCAAACGTATTTAATATCTCTGGACATAC +GAAAACTATTTTGCCACTACCAGTGGAAACCAAACAGGGCGACTTCTACATCGATTCAAT +TACAATCAATGATGACTTAATAATATCAGACGGGATTTATAATGCCCAAAACAATATTGC +TAATTTCGTTATCACAAACTATAGCGAGAGGGATCAGTTATTGTACCTCGAGAGCCCGAT +AAAAGGCATGCCATACTCCACGGCCAACAATGTTGAACTTTTCAGTATCACTTCAGACAC +CCCACAGCCCCAAAACTCCGCAGCGTCGTTACAAGCCCTTGGCGTCGATCACCTCTCCTC +TGAAGAGAAACAAAGCCTACTTTCACTTTGCAAAAGTTATCTAGATATCTTCTACAATGA +AGACAAATCATTGACCTTCACCAACAAGATTACACACACGATTAAAACCACGGACGACAC +CCCCATTCATACAAAATCTTATAGATATCCTTACATTCATAAAGAGGAGGTCAAAAAACA +AATAGAGGCAATGTTAAATCAGGACATTATCAAATCCAGTTATTCCCCGTGGAGCGCCCC +CGTCTGGGTCGTCCCAAAGAAAATCACTCCTACGGGAGAGCAAAAATGGCGTCTAGTTAT +CGATTATAGAAAACTCAACGAGAAGACTATATCCGATAGATATCCAATACCTAACATCGC +GGATATCTTAGACAGATTGGGCAAAGCCAAATATTTCTCCACACTTGATCTGGCAAGTGG +ATTCCATCAGATAGAAATGAATCCCGACGACACACCCAAAACTGCATTTACAGTAGAGGG +GGGCCACTACGAGTTCATTAGAATGCCGTTTGGCCTCAAAAATGCCCCAGCCACATTCCA +AAGGGTGATGGACAATATTTTTGGAGACCTTATCGGAACTATCTGCCTAGTTTACCTAGA +TGATATAATAATTTTCTCAACCTCCTTACAAGAACACTTCATACACTTGAAAACTATTTT +TGGAAGACTCAGATCTGCCAACTTTAAAGTCCAACTCACAAAATCCTACTTCCTCAGGCG +GGAGACAGAATTCCTTGGCCACATCGTTTCACAAGAAGGTGTTAGGCCAAATCCCAATAA +GATCGAAGCTATAAAAAACTTTCCATGTCCCCACAGTAAAAAGTCAATTAAGTCTTTCCT +AGGCTTGTTGGGATATTACAGAAAATTTATCAGAGATTTTGCGAGACTTACCCAACCCAT +GACACAAAAATTAAGGGGAAACAATAAATCGATCATAATAGATGATGAATTCAAAAAGGC +CTTTGAATATTGCAAAACCTTACTGTCTAACGACCCAATCCTCCAATACCCGGACTTTAC +AAAACCTTTCACACTAACCACGGACGCAAGTAATTTCGCAATAGGAGCTGTCCTATCCCA +AGGTCCGGTGCATAGTGATAGGCCCGTATGTTTTGCTAGTAGAACCTTGTCGGCTGCGGA +AACAAATTATTCCACAATTGAGAAGGAAATGCTGGCCATTATATGGGCGGTCCAATACTT +CAGACCCTACCTCTTTGGCAGGAGATTCACTATAATCACCGATCACAAACCACTAACTTG +GTTAATGAATTTCAAACAACCAAATTCTAAAATAGTTAGGTGGAGACTCCAGCTTCAGGA +GTACGATTTCGAAGTCGTCTACAAGAAAGGCTCTCAAAATGTAATTGCTGATGCTCTCAG +TAGACCAGAGGCCTCTGTCAACCATAACGAAGCCCTATCAATTCCTCAAAATGTTTGCCC +CATCTCAGAGAAACCCCTTAATGATTTTAATATTCAGCTCCTGTTCAAAATAACCCCAGA +TACAAATAACGCCACACTGACCCCGTTTAAACACAAACTTAGGAGGGAATTCTGTAAACC +CAATTTTCAGTATGACGACGTAGTTTGCATTCTTAGGCAGTCGTTAAAACCAAACAAGAC +ATGCGCGGTATTTGCCCCCGACCACATTTTTCAAATGGTGGAACAAGCCTACCAAACCTA +CTTCTCAGCCCACAGTCAATTTAAACTCATTAGATGTTTGATCTTCCTCCCCGAAATTAC +TGATAGTACGGAGATCGAAAAAATTATAACCGACTATCACTATAATAGTAACCATCGAGG +GATCGATGAAACATATTTACACATAAAACGACAACAGTTCTTCCCACATATGAAGGAGAG +AATAACTCAGTTAATTCGAAAATGTGAAACATGTTTAAAATTAAAATACGACAGACAACC +TCAAAAGATCACTTACCAAATATCCGAACTACCTTCAAAACCGTTGGACATCTTACATAT +AGACATTTATACTATTAACAAAAATTATAACCTTACTATTATCGATAAATTTTCTAAATT +TGCGGCTGCCTACCCTATAACTAATAGGAATTGCATTAACGTAGTTAAAGCCTTAAAACA +TTTCATTTCCCAATTTGGTATTCCCAAAAAGCTGATCTATGATCAGGGAGCAGAATTCGC +TAGCGATATGTTCAATAAGTTCTGCACTCAATTTAACATTGACCTACACGTTACGTCCTT +TCAACAATCCTCTAGTAACTCTCCCGTTGAACGGCTTCACTCGACACTAACTGAGATTTA +CAGAATAATACTTGACGTCAGGAAACAACAGAAACTCAGTAGCGAGCATGACGAGATAAT +GTCCGAAACCCTAATCACATATAATAACGCTATTCATTCTGCAACTAAACATACCCCCTT +TGAACTATTTAACGGACGTACTCATATATTCAACCAAACAATCCAGTTCAATAACGAACA +CGACTACTTAACGAAATTAAATGAATTTCGCGAGAAGTTGTACCCCCTCATCACGGACAA +ACTTTCAAATGACGTAGTTAGGAGAACCCTAAAATTAAATGAAACCCGAACAGACCCCGT +AGACCTACAACCAGACACTTTAGTCCTTAGGAAGGAAAACAGACGTAATAAGATTACACC +CAGGTTTTCGATTCACAAAGTCAAACACGACAAAGGTCATACATTGATAACTGCTAGGAA +TCAAAAACTACACAAATCAAAAATTCGAAAAACAGTTTTGAAAAAAGACAAAAGCAACAA +CGTACCCAACACTGATAATAACTGACCCCACTACCTCTTAACTTACCATTTCAGGTTCAC +CCTTGTGCCAACTCAGGCTATCCATGTCCATTATTTAAATGATAACGCCCCTATAGCCAA +GATAGAACTAGGGAAAGCCTTACTAATTGAGAGGTACAAAATAATTAGTCATGTAATCAA +CCTACAAGACTACAGCAGATGTATGGAACAATTCCATCTGACCATTAATAAATTTAACCC +CGATTCCACGTTGACGGACTCCGTCACAATTTTAAAAACCAAATTAACCCAAGCCCAAGT +AAAGCTCAAAGCCCTTACACCTTCATATAGAAACAAACGGGGTTTGATTAACGGATTGGG +GAGTCTAGTAAAGGTGGTTACCGGCAACATGGATGCCAACGACAATAAAGAAATACATGA +AGAACTTGACAATATAAAGAAAAATTCCGAAGTCAGTAACGACAATCTCCAAAAACAAGT +AATGTTTAACAACGAAATACTTATCCGGTTCGAAAATATCACGGACCATATAAATAATGA +ACAAATTTTGATAAGTAAATTCTTTGATACCTCACAAAACAAAATATACAAACACTTAAA +CTTACAAGATACCCTTCTGGAAGAAATACAATATTTAAATAGGATTAATTATAACATAGA +ATTATTCATTAACCACCTAAACGACATAACAGAAAGTATGCTATTGGCGAAAATAAATAT +AATTCCCAAGTTCATCCTAAATGAACAAGAAATGGATAAAATAAAAACAATACTGGAAAA +ACAAAATATCACAGTCAAAAATGAACAAAGTATATACAATTTCCTACAAATGAATACACT +AAATTACGAACAAAAGATTATTTTTAATATCAAAGTCCCAATTTTTAAACAACCTTTTCA +TACCCTCGCCAGACTAGTTCCATTACCAATAAATAACACATATTTTGTAATAACCCCAAA +TTACCTAGCTTATAATATTAATAATAAGAAATTTCATATGACCCGTAAATGCCCCAAACT +GGATAATACATTCTTGTGCGACGAGAACTTCTACGTTGATACACCACAGAACAACACATG +CCTGGAACACCTTTTGAACGGAGAAAACAGTTCCTGCGATGTACGGGAAACCGGCCCCAT +CACCGACGTGTTCGAGGCAGAGAGAGGTTACATCTTCGCATTCAACGTGAACAAACTGAA +GGTATCCCTAACAAACGGCTCCGAGCTCTCAATAATGGGGTCAGCCATCATCAGATACAT +TAACGAAACAATACAGATTAACGGTATCGATTACGACGGCACGGTTGACACGTTCCCTGA +ACAGACGGATTTTGATCTTCCCCCCATGCGAAAAGTAACTAGGAATACCACTATTACGGT +ACTAAGCCTAGAAAAACTGCACCTCGAAGCCACCCAAACAATGGATAAAATCCTGGCCGT +CCATCACAATACTATACAGCACACCTGGACACTCTACACTCTGCTCGGATTGGTAACGTT +CCTAGCAGTCATCTTATGGCTGCACCGACGAACGAAACACATCGTCCACATCCACGAGGA +TCATCACGTACCAATCTACGCGTCATCCATACCTTCGCTATGGCCGTCACTTCGAACTGG +GGGGGGAGGAGTTACCACCCCACCCCCTAAACCCCCACGCCTCTAAACAAATCATCGGAC +ACTCAACCGGGAAGACGGCAACTGGAACACCGCATCCGGCCGAATGCTGACATTCCGGCC +GAATGCTGACATTACACAAAAGTCGCACTGCAACATTGTCCCCAGCTAGCCAGCCACATG +CCGAGTCGGCATGTTCATTATGCTTACAATTAAGAACCTATGTACTTATGTATAAGACGA +AAACGGAGGACTCGAGTAGCCACTCTCTGACAATAAACTTGATACTGATTTTGAACTTCA +AGAAAGTCAGTCGTATTCTTTATTGGAAATCTTCACACTACAACTATCTGCTGAAACTTA +AAAACCTTCATACATTTACACATCATATCTTCACAAAAGGCTCCACCCTCGATCACGGAC +TTAACT +>DMBLPP +TGTAACATGAGTAAGGCTGAAGGCTGGCAACAACCCGGTTGGCAGCGCTGTTGAGCAGCA +ACATGATTGTCGGAAATCCAAGTTATCGACAATCAGTCATCGAAGGACGATCGCAGGCAG +CAGTAGAGGCGAGTGGAAGTCAGCGTTGCAGTCAGTCGAGTTCTCAGCAGCAGTCGTTCG +GTCCACAAACTAAGAAATACTTTATATAATTACCGCATTTAGAATTAAACTAATAATTAA +ATTAATAATAAACAATAATAATAAACAATCTTACATGGGGGCTCGTCCAGTCCTAAATCG +GTTATATGAAGGTGCAGTTGTTTAAAGAAAAAAGACATTGTTGTGTGCGTGGGTATAGTC +TTTAAAACGTTGTAAAGTTGTGGCTATATCTATTGCATTTAAAGTTGGAAAAATCAGTTG +TACAGATTTTGTTTGAACACAAGTCGGTAAAAGTCGGGAAAGCTGCTAGAGAGAACTGAT +AAAGTTGAAATTGTCGTGTGCGTGGATTTAGTCTTTAAAGTTGTAAAGTTATGGCTACGT +CTACTGCATTGAAAGTTGAAAAAATCGATTGAACTCATACAGACTCAAGTCGTTTTGCTG +TTGTGGAATTTAAAACAATTAAATTGCAAAGGTGGTGAAATTCGTTTCTAACGAAAATCA +AAATTTGTCTTTTAACCGGTGGCGCCGTCTGCAAAATCGACTACCGTCGCGCCGTTAGAA +CATTGTCGTTGTTTGCTGGTGTTAGTGCCTTGTCGCGGAATGTTCACACGTACACCACCT +ACAAATAAAAAACTTAACACCGACCAAATACAAGCAATTCTAGAGAACGAAAGCGAGGAC +GAAAGCAGAAAAGAAAAAATGAACGAAGAAGATCAAAAGTTGGCGCCTGTAGGAGAAGCA +GAGGCAAAGAAGCAGAATAAAGACGCTAGTGCTAAAGTCGAAGAGAAATTTGAACAAATG +ATGAATACTCTAACCCAGAGCATGTTGGCAAAATCTAAACAAGAGGGGCAAGTAATTATC +GCTGCAGAAAAATTTGAAAAAGTTGTAAGTGACTGTGATGGCAAATCAATTCCTATTAAA +AAATGGTTTGAAATTTTTGAGAAAAATGCCGAGGCATATGAACTTTCGGAGAAACAAAAA +TATGTTCAAGCCAGAAGTAAGATGATTGGATCAGCAGAACTTTTCTTAGAATCTGAATGT +GTCAGTGGATACACTGAACTCAAAGAGTTACTAATTGAAGAATTTTCAGGCAGCTATAAT +AGCGCCGTTATTCACAAAAAGTTGCAAGACAGGAAGAAGAAGAGGGAGGAAACTCTACAC +GACTATTTGTTACAAATGAAGAAAATAGCAGCCTTAGGTGAAGTTGAAACAGTTGCTTTG +ATAACTCATATCGTAAACGGCCTCGACATTAAAAAGGAGTATAAGGGTGCTATGCTCCGT +TGTAAAACTCTTAAGGAATTAAAGCAAGAATTCGAAATCTACGAGAGTCTGAATATTGTT +GACAAGCCGAATATTCAACCAAAACCAAAGCAAATTACACAAGGTGTAAAAGCAGATCAC +TGCTTCAACTGTGGTTCGAGGGAACACAAACGAAAGGATTGTACACTTCCTACCAAATGT +TTCAGCTGTAATCAAGAGGGCCATATCTCAAGCAAGTGTCCGGAAAAAGTAAACAGCATG +CGCATTCACGTTGATAGTGCACGAACAAAGCCAGTAATCATAAATGGGATTATCATCAAC +TGTCTGGTGGACACAGGATCAGATGTGACCATAATTAAAGAAGCTATATTCAAGAAGATG +AAAGATGTTGATTTAAACCGCACTGCAACAGTATTGCGAGGTTTGGGAAATGCCTCAACA +CAGCCGATTGGATGCTTCAGAGCATTAATCAAGACCGACCAGGTGGAAGCAAGCCACAAC +GTTTTAGTCGTCCACGATTCTAAATTCAGTTGCGATGGAATAGTGGGACACGATTTTATC +AGCAAGTTTCGTCTTATCTGTAGTGCAGAAGGCTATACTTTTCTTGACCTGGAAGCAGAT +AAAAAACAAGCGGTTGAGTATTCCCAAATGTTTAATATTTGTGAAGAATCTTCTTTTACA +GTTGCACCACAATACCGAGAAGACGTTGAACGCATGATAGAGAGAACATACGAAACACCA +CCCAAGCAGATAAAGCAATGTCCAGTCGAACTCAAAATTATTCCTGATGGCGTGATTAAA +CCCTTTCGCCATGGACACACCCGACTATCTGAAGAAGAAGCTATAGCTGTAAAGAAGCAG +GTAGAGGAATGGGTCGAGCAGTCAATCGTCCGTAAATCTACATCAAATGTTGCCAGTCGC +ATAGTCGTTGTCAGGAAAAAGGATGGTACCCTACGCGTTTGCGTGGACTATAGAAAATTG +AACACCATGGTTCTGATGGATTGTTTTCCGGTACCCATAATGGAGGAGGTGCTTGAAAAA +CTGCAGAGTGCCAAATGGTTTACAACCATGGACTTACAGAACGGATTTTTTCATGTGGCC +GTAGAAGAAGCCAGCAAGCCGTACACAGCATTTGTTACCCGAGAAGGCTTATTCGAGTTT +AACAAAGCGCCCTTTGGTTTTAAGAATTCCCCAGCAGCGTTTATACGGTTCGTTCAATTT +ATTTTTCAAGAACTAATCAATTCCAATATAATGCAGCTATATATGGATGACATAATTGTA +TATGCCGCTACCCCAGAAGAATGCATGGAAAAGACGGAAATGGTACTTAAGAGAGCTGCA +GAATTTGGTCTAAAAATAAAATGGAAGAAGTGCAACTTTATGCAGAGGCGAATTCATTTC +CTGGGACATATTATCGAAGGTGGACAAATATGCCCTGGAAAAGAGAAAACATCAGCAGTG +AATTCCTTTGGAACACCTCAGAATGTAAAAGCCGTTCAAGGATTTCTGGGTCTCACAGGA +TTCTTCAGAAAATTCATACCTGGATACGCCCAAATTGCGAGACCACTGACGGACCTATTA +AAAAAAGATGCCATTTTCAACATTGGACCAGTAGAGCAGCAGTCGGTGAATAAGCTGAAA +GAGATTCTGGTAAACGAACCAGTATTGAGGATCTACTCACGAGAAGCAGAAACCGAACTT +CATACAGATGCCTCTAAGGACGGGTTAGGAGCCGTTTTATTGCAGAAGTTCGAAGGCAGT +TTTCACCCAGTCTGCTTTTGGAGCAGAAAAACTACAAAAGCCGAATCAAATCGTCATAGT +TATTACCTTGAAGTAAAAGCCGCATACTTAGCTCTGAAAAAGTTCAGACACTATTTATTG +GGAGTCCCTTTCAAGCTCGTCACGGACTGTGTCGCATTTAAACAGACAACAAAAAAAGCA +GATGTCCCAAGAGAAGTTGGCCCATGGATTCTCTATATGCAGGATTTTAATTTTCAACCC +GAACATCGTGCAGGAGAAAGAATGAGACACGTTGATTTTTTAAGCCGCCATCCCCAAGCA +TGCATGATGATAACATCCGAGTTGACAGCACGTATTAAAAAGTCGCAGCAGAACGATGAT +TCAATTAGAGCAATCCTGGAAATTCTAAAAGATCGTCTATTCCAACCCTACAAGCTAAAA +GGTGGCCTGTTGTATAGTATGGTCAATGGCAATGAACTACTGGTTGTCCCTGCACTAATG +GAGAGGGAGGTGATTCAAAGCGCACATGAAGTTGGCCATTTGTCGTTGCAAAAGACGATG +CATAGCATACAGCAGCAATTTTTTTATTTCCTCATTTGGGAATACAAGGTAAAAAAGCTA +ATTTCTAACTGTATAAAATGTATCATCCACAGCAAAAAGTTGGGAAAGCAGGAGGGATAT +CTAAATTGCATAGATAAAGGAGACGCACCGTTGCACACACTACACATCGATCATTTGGGG +CCAATGGATTCATCGGCCAAACAGTATAAATACATTCTGGCAACAGTCGATGCGTTTTCA +AAGTTTGTCTGGTTATTCCCAACCAAATCAACCGGACAGGAAGAAGTGGTCAAGAGGCTG +ACCGACTGGTCAAACATTTTTGGTTTCCCTAAGCGAATTGTTAGCGACAAAGGAACGGCC +TTTACGAGTGGTGCGTTCGAACAATTTATGAGCAGCCATAACGTGGAACACGTCTGCACA +ACTACTGGAGTGGCCAGAGGCAACGGCCAGATAGAACGAGTAAATCGTTTAATTTTGGCA +ATAATATCAAAGCTGTCTTCAGACGAACCGTCGAAGTGGTACAAATATGTGCCTGAGGTA +CAAAAGGCGATCAACTGTCACGTGCATTCATCACTGAAGCTGTCACCATTTGAGGTCATG +TTTGGCACCAAGATGTACACCCGAGTTGAGGATCGGTTACTGGAACTGCTCCAAGAAGAA +GTGGTCTGTCAATTCAACGAGGACCGCTATGAGATGAGACAGCTGGTAAAACGCAACATC +GAGCAGGCGCAGAAGGACTACAAGCGCAATTACGACAAAAAGCGCCGAGCTGAATACAAA +TACAAAGCAGGTGATCTGGTTGCAATTAAAAGGACCCAATTTGTAGCTGGCCGCAAGATG +GCAAGCGGGTATTTAGGTCCATACGAAGTCACAGGGGTCAAAGACAATGGCAGATATGAC +GTTAAAAAAGCAGCAAACGTCGAAGGACCCAATGTCACATCCACCAGCTGTGACAACATG +AAGTTGTGGAAGTACATAGCCGAAAATGCAGACCTATTGTCATCCGGGTCGGATGATGAT +GATCAGGAGGGCCGAATGTAACATGGAGTAAGGCTGAAGGCTGGCAACAACCCGGTTGGC +AGCGCTGTTGAGCAGCAACATGATTGTCGGAAATCGAAGTTATCGACAATCAGTCATCGA +AGGAACGATCGCAAGGCAGCAGTGGAGTAGGAGTGGAAGTCAGCGTTGCAGTCAGTCGTG +TTCTCAGCAGCAGTTCGTTCGGTCACAAACTAAGAATACTTTATATAATTACCGCATTTA +GAATTAAACTAATAATTAAATTAATAATAAACAATAATAATAAACAATCTTACA +>OPUS +AGTTAAGAACCCTCTTCTTGCGCTCTTCGTCAGGACTCACCAGCGCTCGGCTCTCGTGTT +TTCGGGCCCCGTCAGCAGGCGACTCGGGGCCTGTCTAGTAACATGTTCGTGTAAGTTACG +AACCCTCTTCTTGCGATCTTCGTCAGGACTCACCAGCGCTCGGCTCTCGTGTTTTCGGGC +CCCGTCAGCAGGCGACTCGGGGCCTGTCTAGGAACATGTTTGTGTATGTGTGCATTCGGA +ACAAGTGCCGTTGGTCGCACTCAGGGTGAGGGGTCAACGGGGGAAGCGGATATAAAAGCA +GCGGGGCGGGAGAAGAGGTCCCAGTCTCGAACGGACACATAACGGAACCGCTAGCAGATC +GCGAACTGAATCTTAAAATAAAGCTAATCGTAAACTCGAACCCTCTTAACTATCTTGACT +ATTATTTGGAGAACCACAGCATGTTGGTTGTCATATCAAGGTGAGGTATGCGGCAGCGAG +TGCCGAGAACCCTGATGCAAGTGGAACTTGCGTTAACTGGCGCCCGAACAGGGACCGGCA +ATGTCCGGCCGATAAAAGTGATACGAAAAAATTGTGGAAATTTGTGCGTAAAAATAGTGG +TGGTGTGCATAAGTCAGATTAAGATCTGAAATCCATAAATGAAAAAGAAGTGCTGCGTGA +GCTGTGTATAAAATGATAAAATAGCAATTACCCGCTGCCGGGGGGAACTACGCCCATCCC +GGGGCGCAACAAATATTGCATAATTCAATAAAAGGTGTAAAATTTCTAAAATAAAAATGT +AAACCTATGTTGCGCCAAGACCTAATTTAAATTAATAAAACAACGACCCGCTACCGGAGG +ACGCCACGTCGCCCATGCCGAGCGCAAAAGTTGTACGATACCTATAACATAATTAAAACA +CGATCAACCCACTGCGGCGGTACGGCTTGTGGGAAAATTTTTTTTTTTTTCTCTCCTTGC +CAATTCGCGAGTGCAAAAGATTGTGTATAATAAACCAATAATTAACCATTGCAGCAGTTT +ACCTGCGGCAGTACGAGTAATATGAGCGCCCAGAGTGATAAGGTGGTGTGTGGCAGCTTG +TTGGATACGTTAAGTGGTGTGGAATGCACCCAAAAAAAACCGCCCAACAAGTTGTGTGGC +GGCCGTACCTTAGTAGGCAACCAGCCAAAAGGGATACTACGGAACCACCGTGCCCAGTGC +CGAAATAAATTAGAGGTCATCAATAAAAAACTGTAACAGCACGCACGCAAGGAAAAAATA +TTGCAAAATGGAATAGCGCACAAAAATTGTATAAACACATGCACAACACCACAATTCAAA +GGAAAACAAAATATTCATGCTGTAGGGGTACAACCTAAACGACGAAAACTAATAAAGAGC +ATACAAGGGTGAGTGAAATATTTCATTAAACTTTATTGCCATATTTGCTAAATTTAGAGA +AATAAAGAAAAAGCAAAGAAGAACAGATATTCTTTTTTATCGGGTTAAAACCGTTGTCTC +ACATTTCCGTAAAGTAATAACGAATTCTGTTGCCTTGAAAGCTTCCTGCATCTTTCCAAC +GCAAACTAAAAATCAAAATGGAAGAGACCCTGCGTGCTCTTAGCGAGTCCCTCAATGCCC +TGACCAACGTGGTGACAGGCATTAAGGAAGATATTAAGAAAAATAATGATAGGTTGGCTA +TTTTAGAACAGGAGCGCGGGAACGCTGACCCTACGGTCGACCAACCGCAACCCCTGGTGC +GCGCACGCACCGAGTATGAGCTGAGAGAGATATCGGTCCTCCCTGACTGCGTCAAAGAAC +TGCAGGCGTTCGAAGGACGGCAGGAGGCTTACCTGTCTTGGATAAACAGGGCACAGTCAA +TACTGACCGAATATGACTTGATTAAAACCAGACCCCTGTATAGGGCAATTGTCTTGCATA +TTAGACAGAAAATAAGGGGACACGCCGACATGGCCTTGGCGGCCTATGGCGTCCAAGACG +ACGATTGGGACGACATAAAACGAGTCTTGGCGCTGCATTACGCAGACAAACGAGACTTAC +GTACGCTTGAGCATGAGCTTGGCGCTATGTGCCAAGGTTCTAGACCACTAGATAGGTTCT +ATATGGACGTTAATGGCCATCTCTCGTTGATCTTAAATAACTTGAAGGCCAGAAACCACC +CTCGTGAAGTAGTCAACGCTTTGATAGAAACCTATAGAGACAAGGCTTTGGATGTTTTTA +TCCGAGGAGTGGGGAGAGATTGTTCCAAACACTTACTTGTCCGCAGCCCGAAGAATCTAC +CAGAGGCTTACTCTTTTTGTATGGGATTGCAGAATGTAATGTCAAGAAATTTCACAGCTC +AGAACTATCAACCGTCAGGTGCCCCAAGATTCGCAGGCCCATATCAACATCAGGCCAGGC +CACCGTTCCGAACCCCTTTTTCTCCTGGTTCAGGCAGATTTTCGCAAAACTCCTACAGAA +CTCAGGGTCCTAGACAGGCCATAAAAATGGAATCCAATCGGTCGGGTCAATCTTACCAAT +CAGGATACAGTGGTCGCCAGGAAGAAGGCTCCGGTATTAAGAGAATGTCCGAAGGAAACA +ACCCATTCCAAAAGGCACAAAGATTGTACCACATGGAATTGGCACCACCCCCGCTAGCCC +CGGCGGCTAGTGGAGATAACCAAGGACGTTCACACGAGGGTTACTATGATGACGAGTCTC +AAGCTGTCGAGAGAAGCAACAATTATCCTCCGCAGAAAAACGTGGAAGGAGTTACAGATG +CTCCACATAACCTTGAGACTGAGGGAGGGGCAAATTTTATGACCAACGCCTCTCCAGTGT +ACCGTACTTAGAGTATGCTACGGAGAGGGGAGAAAGGCTGAAGTTTTTGATCGACACGGG +GGCGAACAAAAACTTTATTAGCCGAAGACTTGCAGCCGGGTGTACCACAGTCCGTAAACC +CTTCTCCGTACTGTCCGCTGCGGGTAACATCATGATAACGCACCGCCTAGTTGGTAAATT +CTTCAAACCACTAGGGAACGACTCGGATATTACCTTTTTCGTACTACCGAATTTACATTC +CTTTGATGGTATCATTGGCGACGATACTCTCAAAGACTTAAAAGCCATAGTGGATAGGAA +AAACAATTGTTTGATAATAACCCCAGGAATTAAAATCCCTCTTTTGGCGAGAGCTTCAAT +AAACGTTAACCCGCTACTCGCCGCCGAACACCCAGATGGTACACAAGAAATTTTGAATTC +CCTTCTCGGGGAATTTCCCCGCATCTTCGAGCCCCCCTTATCTGGAATGTCCGTGGAGAC +GGCCGTCAAGGCTGAAATCCGGACAAACACACAAGACCCGATCTATGCTAAAAGTTATCC +TTACCCAGTCAACATGCGCGGAGAAGTCGAACGTCAAATCGATGAACTGCTGCAGGACGG +TATAATTCGACCCTCTAATAGCCCTTACAATTCCCCTATCTGGATAGTCCCGAAGAAACC +TAAACCAAACGGAGAAAAACAATATCGCATGGTAGTCGATTTCAAGCGGTTAAATACCGT +CACCATACCCGACACTTACCCCATCCCAGATATAAACGCTACGCTAGCCAGCCTTGGCAA +TGCCAAATACTTTACCACCCTAGATTTGACTTCTGGATTCCATCAAATCCACATGAAGGA +AAGCGACATTCCAAAGACAGCTTTCTCTACTCTAAATGGAAAGTACGAGTTCCTCCGTCT +ACCATTCGGTTTGAAGAATGCACCTGCAATCTTCCAAAGAATGATCGATGATATTTTGCG +CGAGCATATTGGCAAGGTCTGCTACGTTTATATTGACGATATCATCGTCTTCAGTGAAGA +TTATGACACACACTGGAAAAATCTCCGATTGGTATTAGCGAGTTTATCAAAAGCTAACCT +CCAAGTGAACCTTGAGAAGTCGCATTTTTTAGACACGCAGGTAGAATTTTTAGGATATAT +CGTCACGGCCGATGGCATTAAGGCAGATCCGAAAAAGGTCAGAGCGATTAGCGAAATGCC +TCCTCCGACCTCTGTTAAGGAGTTAAAAAGATTTCTAGGCATGACCTCGTACTACAGGAA +GTTCATTCAGGACTATGCGAAGGTAGCAAAGCCCCTTACAAACTTGACGCGTGGATTGTA +CGCTAATATAAAGTCTTCACAATCAAGCAAAGTGCCAATTACATTAGACGAGACGGCCCT +ACAGTCTTTTAATGATTTAAAATCAATTCTCTGTTCTTCTGAAATACTGGCGTTCCCATG +TTTCACTAAACCTTTCCATCTAACCACGGACGCTTCTAACTGGGCCATCGGAGCTGTCCT +CTCACAGGACGACCAGGGTAGAGATAGGCCGATAGCGTACATTTCCCGTTCATTAAATAA +GACGGAGGAAAACTACGCTACTATCGAAAAGGAAATGCTCGCGATAATTTGGTCATTGGA +CAATCTTCGGGCTTACTTATATGGCGCTGGTACTATTAAAGTATATACTGACCATCAACC +TCTAACGTTTGCCCTAGGCAACAGAAATTTCAATGCGAAGCTAAAACGCTGGAAGGCTCG +TATAGAGGAATACAACTGCGAACTCATCTACAAGCCTGGGAAATCTAATGTGGTGGCTGA +CGCGCTTTCACGCATTCCGCCTCAGCTTAACCAGTTGAGCACCGATTTAGATGCTAATCC +CGAGGATGACATGCAGTCTTTGGCTACTGCCCATAGCGCTTTACATGACAGTTCACGATT +GATTCCCCACGTTGAATCTCCAATCAACGTTTTCAAGAATCAACTCATTTTTGACACAAC +CAGGTCAAAATACTTATGCGAGCACCCGTTCCCAGGTTATACTCGCCATCTGATTCCTCT +CAAAGACGGATCACTTGCCGATTTAACCAACTCGTTACAATCGTGTCTACGACCTGTAAT +AATTAACGGCGTCAAAATCCCGGAAGCACATTTGCAACGCTTTCAGTCCATCTGCTTAGC +GAATTTTCTTTTATACAAAATTCGGATAACGCAGCGCCTAGTGGCGGACGTGTCTGGCGC +AGAGGAAATTTGTGAAATAATTGAAAAAGAACACCGTAGAGCACATAGGGGCCCTACGGA +GATTCGTCTCCAACTTTTAGAAAAATATTATTTCCCGCGAATGTCCAGTACGATCCGTCT +GCAAACTTCCTCATGTCAGTGTTGCAAACTCTACAAGTACGAGAGACACCCTAACAAACC +AAACCTACAACCTACGCCAATTCCTAACTACCCATGTGAAATACTTCACATCGACATTTT +TGCGCTCGAAAAAAGGTTATACCTAAGTTGTATTGACAAATTTAGCAAGTTTGCCAAACT +TTTCCATCTGCAGTCAAAAGCATCTGTGCATTTGCGAGAAACTTTGGTGGAGGCCCTACA +TTACTTCACCGCCCCTAAGGTCTTGGTTTCGGATAACGAGCGAGGGTTGTTATGCCCCAC +AGTGCTCAACTATCTTCGGTCTCTAGATATCGATCTGTATTATGCTCCAACCCAGAAGAG +CGAAGTAAATGGTCAAGTCGAGAGATTCCACTCTACGTTCCTAGAAATTTATCGTTGCCT +TAAAGATGAGCTCCCTACCTTCAAACCCGTTGAGCTGGTACACATAGCAGTGGACCGCTA +CAACACTTCCGTTCACTCGGTAACGAATCGAAAACCAGCAGACGTTTTTTTCGACCGCTC +GTCAAGGGTAAACTATCAGGGTCTGACAGATTTCCGGCGGCAGACTTTAGAGGACATCAA +GGGCTTAATTGAGTATAAGCAAATTAGAGGTAATATGGCTCGGAATAAAAATAGGGACGA +GCCAAAGTCTTATGGGCCGGGAGATGAAGTTTTTGTTGCAAATAAGCAAATAAAAACAAA +GGAAAAAGCGAGGTTCAGATGCGAAAAGGTACAGGAAGACAACAAGATAACAGTTAAAAC +CAGATCAGGAAAAATTTTCCACAAATCTGATCTAAGAAATTGAGACGTGGCTTTCACATT +TAAAAAAGAAACGCGAAAAAGAATAACGAAAGTAATAAAAGTACGTTGTGGCAGCTAATG +AAATATTCCACCCATGCATACCCTATATAAAAAAAACATTAATAAAAAAAAAAAAAAAAA +AAAAAAAAAAAAAAAAAAATGAGTTAAGAAATACAAAAAGAAATACAAAAAAAACTATAA +AAAAAATAATATAAAAAAATACAGATTATAAGAAATAAGAAATAAGAAATATAAAAAAAT +AAAAATATAAGTACACAAAATGTACCGTACCCCCACACACTACGTAGTCTTAGAACAACT +TAGACGACCAGATATTTACGAATTGTCTTTTTGTAAGCGCGATTTCTGCATGCGGCGCAA +ATCCCGCTCACTGGACTGGCTGGGGTCGGCTTGGAAATGGGTAGCTGGATCTCCAGATGC +TGCTGATTGGAACGCCGTCTTGGCCGCGCAAGCGACGGCTTCGAGGAACTGCAAAAACTG +GAGGAGGCTAGCTGTATCCCTCGGCTACTGAAGTAACCAACGAGTGGTTAAGCAAGTCGA +CGATGGAATGCTCCTCCTGACCAACTTCAACGGAACTCTAAGAACGGCTGCAGAGAACTA +CGACCTGATCGGCTCCTTTATCATCCAATTCGACAATGAGACGATAATGGTCAACGGTCA +AAACTATTCCAGTTACTCGGTCAGTCATCTAATGGCGATGCCGGCCGTGTTGAGCCACAT +AACGGCCAGCAACTTTCAACTTTCTCTGGAATACGTCCACGACGTGAGCATGAAGAATTT +GGAAAAGATGTCCAACATGGCGAGTGAGCTACTAGCCTCTCTTCTCACCGAGGCGGCACT +CGCAATCTGCATATTCCTAGGCTTTTATTTCCTATGGAAGAAGCTGATGTCCACCAAAGG +CATGCCCGATGTCCGCGAGATTGCCGCAAACTTAGAAGCATTGGGCCAAACCGAGCTGAA +CAAGGCTCACTAATCTGCGGGACGCAGATCTTGAGGGGGGAGGAGTTAAGAACCCTCTTC +TTGCGCTCTTCGTCAGGACTCACCAGCGCTCGGCTCTCGTGTTTTCGGGCCCCGTCAGCA +GGCGACTCGGGGCCTGTCTAGTAACATGTTCGTGTAAGTTACGAACCCTCTTCTTGCGAT +CTTCGTCAGGACTCACCAGCGCTCGGCTCTCGTGTTTTCGGGCCCCGTCAGCAGGCGACT +CGGGGCCTGTCTAGGAACATGTTTGTGTATGTGTGCATTCGGAACAAGTGCCGTTGGTCG +CACTCAGGGTGAGGGGTCAACGGGGGAAGCGGATATAAAAGCAGCGGGGCGGGAGAAGAG +GTCCCAGTCTCGAACGGACACATAACGGAACCGCTAGCAGATCGCGAACTGAATCTTAAA +ATAAAGCTAATCGTAAACTCGAACCCTCTTAACTATCTTGACTATTATTTGGAGAACCAC +AGCATGTTGGTTGTCATATCAAGGTGAGGTATGCGGCAGCGAGTGCCGAGAACCCTGATG +CAAGTGGAACTTGCGTTAACT +>DM_ROO +TGTTCACACATGAACACGAATATATTTAAAGACTTACAATTTTGGGCTCCGTTCATATCT +TATGTAAATGAATCGAGAGCGATAAATTATATTTAGGATTTTGTTATCTAAGGCGACATG +GGTGCATTGCTCAAAAACATGTAATTTAAGTGCACACTACATGAGTCAGTCACTTGAGAT +CGTTCCCCGCCTCCTAAAATAGTCCCTTAGTGGGAGACCACAGATAAGGTCCTCGCCGCT +CAAGATAGGCAGATGTGCCCGAGCGTGGGACCTCGATAAGGCGGGGACTATTTACGTAGG +CCTCTGCGTAGGCCATTTACTTTAAGATGCGATTCTCATGTCACCTATTTAAACCGAAGA +TATTTCCAAATAAAATCAGTTTTTTTACAAAAACTCAACGAGTAAAGTCTTCTTATTTGG +GATTTTACATTTGGTCAATCGAGCCTTTAATCGACTCTGCAGTTTCCCCCTACCAAAGGT +AAGGAACTCAGAGAAAGGCCAGCTCCTTTAAGCATCTTACAGCTAAAGGTAGCAAAAATA +AGTGACTCTTGTTTCCCCCTACCAAAGGTAAGGAACAGAGTATAAATATAAAAAGCAAAA +GATACAAAAGAATCTTTTATGTTTTAAAACAAGCACCTTATAGTCTATAGCTAAAGGTTG +CTTTGTGTACCATTATAAATTGTGGTAAGGCGTGCTTGAGGCCATACATCAGCAATTGTG +AAATTAAAAAGTGCATAACAAAAGTGCCTTATAAATGCTCTAATAGCATTAAATCAGCTC +ATAAATAGAGTGCAGTGTATATGCCATAAGAGCATAAATTAAATAAAAAGTGCCTGAAAA +CAGTGCCTTATAAATGCTCTAATAGCATTAAATCAGCTCATAAATAGAGTGCAGTGTATA +TGCCAAAAGAGCATAAATGCCGAAATAAATGGCTAAAAAACAAAAAATCTGACTGGACTA +CAAAAATAATAAAACGTGCCAAAAAAAAAAAAAAAATCATCTTTAAACATCGACGGAGCC +TTAAAGAAGAGAAGGAAGTCAAATTCAAAGGAGCCTCTACCAGCAGCAGAAGCAGCAACA +ACAGCAGCAGCAGAAGCAGCAACAGCAGTAGCAACAGCAGCAACAACAGCAGCAACAGCA +GCAGCAACAACAACGACATCAGCTAAGTCAAAACAAGAATTTTCTGTTTATCCAAACACA +CATATATATATAAATACATATAAAATACATATACACGTACTATATATATTAAGAAATTAC +AAAAAATTTTCAAAATGATGTCAGAAAAGACTATTCAATTCCTTAAGAAGCAGTCCGAAA +TTATTTTGGAAATTAGAAAGTTGGAAGTAAAACCAACATTAACAGATGTAGAAATTCTAA +AATTAAATGAGCTTCAAAAATGTTTCATTGCTAATCATAGCAATTTGTTAAAGATCGGCG +TTGTCGATCATGAATATTTTAACGCGAAGCAGTATGATTTAATAATGATGGTGTTAGAAA +AAATTAAAAATAAAAATGAAAAAATTAAGGGCGAGTCGGTAGAAAACACTTTCCCTAAAT +CAAACACTGTCCCTAAATCAAACCCTCCCCCTACATTAAACCTTGAAATGCGTGGTCACC +CTGAAAAAGAGGGTATAGCACAAAACAACGCTTTAAAAGTAGAGCAGGCATTTCGTAATA +ATGTTGGCCAATTTCGAGTATATCTAGAAGATACGTCTAAACTAATAGACAGTAGTCCAG +ATTTCCTTAAAATAAGGAAAAATAAAATTGAATTTTTATGGCATAAAATAGATAACCTGA +TTGAACAGGTGAATAGTCGTTTTGAGAGTTCGCTATTCGAAGAAGAAATTAGCGAACTTG +AATTTGACAAACAAAATATTCTTACAGCCATTAATAGTCGACTCAGTGGCACAATAAATA +AAGCTGAAATGTCGACGGTTGTTAAGGCGGAGGAGTTACCAACCCTGCCTAAAATACAGA +TTCCCACCTTCTTTGGTGATTCCAAAGAATGGGATCTTTTTAATGAACTCTTTACAGAGC +TCATACATGTGAGAGAGGATCTCAGTCCTTCTCTCAAATTTAATTATCTAAAGTCAGCAT +TAAAAGGAGAAGCCAGAAATGTGGTTACTCATTTACTGCTCGGCTCTGGAGAAAATTATG +AAGCCACTTGGGAGTTTTTGACCAAGCGATATGAGAATAAAAGAAACATATTCTCAGATC +ATATGAATAGGCTTATGGATATGCCAAATTTAAATTTAGAATCCAATAAGCAAATAAAGA +CATTTATTGACACGATTAACGAGTCAATTTATATTATAAAATTAAAGGCACAATTACCAG +AAGATGTGGATGCAATTTTCGCTCACATAATTCTTCGGAAATTCAATAAAGAATCACTCA +ATTTATATGAAAGCCATGTTAAAAAGACAAAAGAAATACAGGCACTTTCTGATGTCATGG +ACTTTTTAGAGCAAAGGCTCAATTCTATATCATCATTCTCACAGGAAGTAAAACCTGTAA +AGAAAATGATTAATAATAACAAGAATAAAAATTATAGTGACAATTGTGCATATTGCAAAC +TACCAGGGCATTATTTAATTCAATGCCATAAATTTAAAATAATGAATCCAGCAGAACGGT +CTGACTGGGTAAGAAAAAATGGGATTTGCCTAAGATGTCTGAGGCATCCGTTTGGTAAAA +AATGTATAAGCGAGCAGCTTTGTTCGACTTGTCGTAAACCTCACCACACGTTACTTCACT +TTGCAGGTCATAATCCAGAAAAAGTGAATACGTGTAGAACAACAGGTCAAGCCTTGTTGG +CCACGGCCTTGATTCAAGTAAAGTCGAGGTATGGAGGCTTTGAACAATTAAGAGCATTGA +TTGATAGTGGCTCTCAAAGCACAATTATTTCAGAAGAGTCTGCACAGATTCTAAAATTGA +AAAAATTTCGGTCTCATACTGAAATAAGTGGAGTATCTTCCACAGGAACGTGCATCTCCA +AGCACAAAGCGGTTATTTCGATAAGAAATTCTCCGAAAAATTTAGAAATTGAAGCAATTA +TTCTCCCAAAACTTATGAAGGCACTTCCAGTCAACACGATTAATGTTGATCAGAAAAAAT +GGAAGAACTTTAAATTAGCCGACCCCGATTTTAATAAACCGGGTCGCATTGATTTAATCA +TTGGAGCAGACGTATATACTCACATTCTGCAAAATGGAGTTATAAAAATAGACGGTCTCC +TTGGGCAAAAAACTGATTTCGGGTGGATAGTTTCTGGATGTAAAAAATCCAAAGGAAAAG +AAACCATTGTAGCCACAACAATAGAAATAAAAGAGTTAGATCGCTACTGGGAAGTGGAAG +AAGAAGAAAAAGATGATATCGAGTCTGAAATCTGTGAAAATAAATTTATCAAAACGACAA +AAAAAGATTCAGATGGGCGATACATTGTGTCAATTCCATTCAAGGAGGATGTCACCTTAG +GAGATTCAAAGAAACAAGCGATAGCTCGTTACATGAATCTGGAGAAAAAACTAAAAAGAA +ATGAAAAACTTAAGGTTGACTACACTAAATTCATGAATGAATACATGGATTTAGGACACA +TGATTGAAGTGAGTGATGAAGGCAAATATTTTTTACCGCACCAGGCAGTGATTAGAGATT +CAAGCCTTACGACCAAATTGAGAGTAGTTTTTGATGCTTCAGCAAAAACTACGAATAACA +AAAGTTTGAACGACATAATGTGGGTTGGGCCACGAGTTCAAAAAGATATTTTTGACATTA +TTATTAAATGGAGAAAATGGGAATTTGTTGTTTCGGCAGACATTGAAAAGATGTACCGAC +AAATTAAAATAGATAATAATGATCAAAAATATCAATATATTTTATGGAGAAATTCTCCAA +AAGAAAAAATTAAAACATATAAATTAACCACAGTCACTTACGGAACTGCATCTGCACCAT +ATTTGGCTACCAGGGTTCTGGTAGATATTGCAGATAAATGTAAAAACCAAGTTATTAGTG +CAATAATTAGGAATGATTTCTATATGGATGACCTAATGACTGGAGCTGATTCGGTAGAAG +AAGCTAATAAATTAATAACATTAATTCCCCATGAATTGCAGAAAGTTGGATTCAACTTAA +GGAAATGGATTTCCAACAATTCCAAAATATTAACCACTGTGGAGGACACAGGGGACAATA +AGGTTCTCAATATTATCGAAAATGAATGTGTTAAAACTTTAGGACTAAAATGGGAACCTC +AAAAGGATTTATTTAAGTTCAGCGTAAATTGTAATGATGAATCAAAAAATATAAATAAGC +GCGTTGTGTTATCAACGCTAGCAAAAATATTTGATCCGTTAGGATGGTTGGCACCAGTCA +CGGTTTCAGGAAAACTTTTTATTCAAAAACTTTGGATAAATAAAAGTGAATGGGATCAGG +AATTATCCATAGAAGATAAAAATTATTGGGAAAAATATAAAGAAAATTTATTATTGTTAG +AGAATATTCGAATCCCAAGGTGGATTAATTCAAACAGTTCTTCAGTCATTCAGATTCACG +GATTTGCGGACGCCTCCGAAAAAGCATATGCTGCAGTAGTCTATGCTAAAGTAGGACCTC +ATGTTAATATAATAGCTAGCAAAAGTAGAGTCAACCCTATAAAAAATAGGAAGACAATTC +CCAAACTCGAGCTGTGTGCAGCTCACCTGCTTAGTGAATTAATCCAAAGACTAAAAGGAT +CAATTGACAATATAATGGAGATCTATGCTTGGAGTGATTCCACGATTACCTTAGCATGGA +TTAACAGTGGTCAAAGTAAGATCAAATTTATAAAAAGAAGAACGGATGACATTCGGAAAT +TAAAAAATACTGAATGGAATCATGTTAAGTCAGAGGATAATCCAGCAGATTTAGCATCCA +GGGGAGTGGATTCTAACCAGTTGATCAACTGTGATTTTTGGTGGAAAGGTCCGAAATGGC +TAGCAGACCCAAAAGAACTTTGGCCTCGGCAGCAGTCTGTAGAAGAACCTGTCTTAATAA +ATACGGTATTAAATGACAAAATAGATGATCCTATTTACGAATTAATAGAAAGGTATTCCA +GTATAGAAAAACTTATACGTATAATAGCATACATAAATAGATTCGTGCAGATGAAAACAA +GAAATAAAGCCTATTCATCAATTATTTCAGTAAAGGAGATAAGAATAGCGGAAACAGTTG +TTATTAAGAAACAACAAGAATACCAGTTTAGGCAAGAGATAAAGTGCCTTAAAATCAAAA +AGGAAATCAAGACAAATAATAAAATATTGTCATTGAATCCATTTTTGGACAAGGGTGGGG +TTCTAAGAGTTGGAGGAAGATTGCAAAATTCCAATGCAGAATTTAATGTTAAACATCCAA +TCATTTTAGAAAAATGCCACCTAACAAGCTTATTAATAAAAAATGCTCATAAGGAAACAT +TGCATGGAGGGATAAACCTAATGCGAAACTATATCCAAAGAAAGTATTGGATTTTCGGGT +TGAAAAATTCGTTGAAAAAGTATTTAAGAGAATGTGTAACGTGTGCAAGGTATAAACAAA +ATACAGCTCAGCAAATAATGGGTAACTTGCCAAAATATAGAGTGACGATGACATTCCCGT +TTCTTAATACTGGAATAGATTACGCAGGTCCTTATTATGTTAAATGTTCAAAAAATCGTG +GCCAAAAAACATTTAAAGGATACGTTGCTGTATTCGTTTGCATGGCCACCAAAGCCATAC +ACTTAGAAATGGTAAGCGATCTAACTTCAGACGCATTTTTAGCAGCACTCAGAAGATTTA +TTGCTAGACGGGGAAAATGTTCCAATATCTATTCAGACAACGGAACAAATTTTGTAGGAG +CTGCAAGAAAATTAGATCAAGAGTTATTTAATGCAATACAAGAAAATATAACGATTGCAG +CGCAACTTGAAAAGGACAGGATTGATTGGCATTTTATTCCCCCGGCAGGACCTCACTTCG +GAGGTATTTGGGAAGCTGGAGTTAAGTCAATGAAATACCATTTAAAGCGTATAATCGGCG +ACACTATTTTTACTTATGAAGAAATGTCAACTCTTTTATGTCAAATAGAAGCATGCTTAA +ATTCAAGGCCATTATACACTATAGTTAGTGAGAAGGACCAACAAGAAGTTTTAACACCAG +GTCATTTTTTAATTGGAAGACCACCTTTAGAAATAGTCGAACCAATGGAAGATGAAAAAA +TCGGAAATTTGGATAGGTGGAGACTTATCCAAAAAATAAAGAAAGATTTCTGGGTTAAGT +GGAAAAGTGAATATTTGCATACGCTCCAGCAAAGGAATAAATGGAAAAAGGAAATTCCTA +ATATAGAAGAAGGGCAAATAGTTTTATTAAAGGATGAGAATTGTCATCCTGCAAGATGGC +CTTTAGGAAAGGTGGAAAAGGTGCATAAGGGGAATGATGATAAGGTCCGAGTGGCTAAAG +TAAAGATGCAGGAAGGATATATCACTAGACCCATTACTAAAATTTGTCCCTTGGAAGGAA +TAAAGTCTGTTGACAAAAATGAGGCTGACCAAGAGCCAAAAAGACGAACTAGAGCGACAT +CGGGAATGTCCAAGATCGGAATCATTATGGCAATGTTGTTGTTTGTGTTAAGTTGTCAAG +TTTCTAGCGCATTACCTAAAGATATAGCACCAAGATATTCTATAGACAAAATAAATAAAA +CCTCAGCAATATATCTAGACCCGCTAGGAGATGTTGAGATTGTGAGTACTTCTTGGAATT +TGGTTATCTATTATAAAATGGATCCATATTTTAAAATGTTAACAAAGGGTAATGCGCTTA +TACAAAGTATGAGGAAAGTTTGCGAAAGACTTCATAGCTTTGAAGAGCAATGTAGTCTAG +TCTTAGATAATATGCAAAGTCAGTTATCGGAACTTGAAGAAAACAATAAATTGTTTATGA +TGCAGTCTAGATCTAGAAGCAAGCGTGCTCCTTTCGAATTTATGGGTTCCTTGTATCATA +TTTTATTTGGTATAATGGATGAAGATGATAGAGAGCAATTAGAAGAAAATATGAAGAATT +TGTTAGATAACCAGAACAACCTTGATAAACTAATTCAAAAACAAACATCTGTGGTTGATT +CAACTTCTAATCTATTAAAGAGAACAACAGAAGATGTTAACTCCAATTTTAGAAGTATGC +AAATAAGAATTGAGAACATGACAGAAGTTCTTAAAGAAAATTATTATGTTTATAAGGAAT +CAATAAAATTCTTTATGATTACGAAACAGCTACACTCATTGATTGAAGAAGGCGAAAAAA +TTCAAGCAGGCATTATAAGCCTGTTGATTGATATTAATCACGGTAGGCTAAATACAAATA +TTCTCAGGCCAAATCAGCTTAAAAAAGAAATTGCCAAAATTCAGCAGAGTCTTTCAGAGA +ACCTAGTAATTCCAGGAAAACGGTCAGGTACGGAACTTAAGGAGGTGTATACACTGTTAA +CAGCCAGGGGTTTATTCATCGACGATAAATTGATCATTAGTGCAAAAGTGCCTCTGTTTA +GCAGGCATCCATCCAAATTGTTCAGGCTTATTCCGGTGCCAATTCGAAATGAAGATCGGA +TAATAATGGTGCATACAACGTCCGAATATTTAATTTATAATTTTGAGATAGATTCCTATC +ACATAATGACGGAAGCCACATTAAATCAATGTCAGAAATGGCAACTAAATAAGAGAATAT +GCAAAGGAAGTTGGCCCTGGAATTCAGCGAATGATAATGCATGTGAGATTCAGCCTCTAA +AGCCAGATAAAGCGGCGAACTGCATCTATAAAACAGTAGTCGACTCTAAAAGTTACTGGG +TAGAGTTAGAAAAGAAAAGTAGTTGGTTGTTTAAGGTTCCTGCGAATTCAAAAGTCCGTC +TGCAATGTACTGGCTCTCAAATTGAATTGTTTGATTTGCCTCAGCAAGGAGTTTTAAGCA +TTGCGCCATATTGTACGGCAAGAACCGACGATAAAATTCTAGTTGCCCACCATAACATTC +AGTCCGAAAGTGAAGAATTATTATCAACACCTTATATAGGAGAAGTTAGTGGAGTGCCGA +AGATTATTTGGGATCCGCTGAAACTATCAATATTAAATCATACTGAGGAATTTGAACGAT +TGAATAATGAAATTAAATTTATGAAAGAGAACCATCAAAAATTGAAAGATTTACATTTCC +ATCATATTTCCGGACATGCTGGATTAATTATTGCTTTAATACTAATGATAGTATTAATAA +TATATTTCATACGGAAATGTGCTGTGCAACAAAGAATGCAAGCAATAACCTTTGCAGGTC +CGTTGCCAGTACTATAAATATCAATAGTAAATAAACAATAAAATAATATAACAAATAAAA +ATATACAGTCCACTAATAGAAAATGTACTTCTACATAGAAAAAGCAAAATGTTTAAAATA +AGTTAATTAAGTACAAATTGTTGAATTAAAAATAATATAAACCATAATTGTAATCCAATA +AAATTAAAAGCCAGAAAAACTAGGCCCATTGAAATCTTAGTTGCAAAATAAATGAACATA +TATCAAATAAATACAGTCCACTACTGTTATAAATGCAACTAATATACTAATGTACATCTC +AGCTTTGCTGGCCCTTTGGCAGAATGTTCACACATGAACACGAATATATTTAAAGACTTA +CAATTTTGGGCTCCGTTCATATCTTATGTAAATGAATCGAGAGCGATAAATTATATTTAG +GATTTTGTTATCTAAGGCGACATGGGTGCATTGCTCAAAAACATGTAATTTAAGTGCACA +CTACATGAGTCAGTCACTTGAGATCGTTCCCCGCCTCCTAAAATAGTCCCTTAGTGGGAG +ACCACAGATAAGGTCCTCGCCGCTCAAGATAGGCAGATGTGCCCGAGCGTGGGACCTCGA +TAAGGCGGGGACTATTTACGTAGGCCTCTGCGTAGGCCATTTACTTTAAGATGCGATTCT +CATGTCACCTATTTAAACCGAAGATATTTCCAAATAAAATCAGTTTCTTACAAAAACTCA +ACGAGTAAAGTCTTCTCATTTGGGATTTTACA +>BLOOD +TGTAGTATGTGCATATATCGAGGGTACACTGTACCTATAAGTACACAGCAACACTTAGTT +GCATTGCATAAATAAATGTCTCAAGTGAGCGTGATATAAGATCACCCATTTATGCTTTAA +GCTAAGTCAGCATCCCCACGCTGGCCGCTGGCCATATATGCGCATAAGCTCTCTCTCTCT +CTCTCTTATACATATATATATACGCTGCTCTTCTGCCGCTGTCGACGGCGGCGCAGTCGC +AGTATTTAGGTAAGATTAGACACTCTGTAGAGGTTAAGCGGGCAGAACCGTTTCTGCTAC +TCGAAGAGATAAGAAGAAATAAAAAGGTGCCTGACGGCTGCACCCAACTGCAAGGAAAAC +ACGTGTTCTCAATTGGTGGCATATATTGGTTTATTACATGGCGACCGTGAGGCAGGAGCC +TGCGATCTGAGGACTACTGAGGAAATGCTGCTAATATTGCCGATTTGATTTGGGAATTCT +AAACAGCGACAACAGGTGTGAGAAGCAGGCCGCCCCTTACACCAGTGCGGGAGACCTAGA +GACGGGACACTGATGAAAAAAAAAGAAACAAAAATACTGAGTGAGTAGAGTGTGGTAATG +GGCAAACGCGGATGTCAGGAAATCAAAAATAAAGGTATAGCACATATTAAGTGGCTATGA +TATACAAATAAAACACCGCCCCCATGGGCAACGGCACAGAAATTAACTGCCGAATTAGAC +TTTCTGAAAGAAAACCTCCAGCAAAGAAAGCCGAATACCACAACTCACTCAGCAAAAATA +GAAATAATCAATGAAGAAATAACTGAAAATTCAACATCACCCAAGCCGAAAAGACCCGAC +GTCTGCATGAAAGACTGCCCTCGACCATTGTAAGCCGCAACAGCAATTAGCACGGCATCC +TGCGAGGGTAGGATTAGGATAAAGGATAAAGGATTCCACCGGCGCGCCGCACATGACAAC +AGCGAATGTCTACCAAGCAGACGTTCGAACACCCTGCTCCTGTCGAGCAAAGGGATCTGC +CAAGTATCAAAGAGGTAATAGAGGTAGATCCGTCCGCGGGACCAAAGCCCTTGACCATAC +AAGAGTACAAGGCACGGACTGCAGCGAGGGAGCAGCCACCTAAAAAGAAGAGGGGTGGCC +GCCGGATTAAGTTGCTCAGCGCCCGGAGGCTCAACATCGAACTACTGAAGACGGCAACTA +ATGAGGAAGACCGGCAGCGCTACAAAGAGCGCCTTGCAGCCATCAATCAACAACTTCGTG +GTGCGAAGTAAAGCGGCGGGCTGCGTTATACGCCATAGCCTCAACCGCCCAAATATTATA +TTAATGTTGTCGATGCGGTTTCCGCTGCAACAAAATTACTAACTTATCAGGGACCCATTT +CATAACTAACACATTATACTCAGTCCTAAACTTAAAATAAGTAATAATATTGTAAAATTG +CAAATTGCAACCGATGTAAACTGAGTATAATGAATTCATCTATCAAGTAAAAATATGTTT +AACAACAGTTTAGACCTATTAAAATTTCGAGCTATATTTATATCTGATCGAGATAACAAT +AATTGACCAATTCTCAAAGTTAAAATTCTATTTGTACTTTTGATATACAAATAAAGACTA +ATTTTCCCCATATCAAAATGGGACATAAGTCGTGGATACAACCCCACAGTTAAATTCAAT +GTACTTACTATTTTTGATTTTAGTTATCCTATCAGCCTTTTTACCTTGGCCTTAAAACTT +TATCAGTTTCACACAAGATCGTTGAAAAGACTTACATGAGTCGAGCCAATGATTTAGACA +AAATCTAATAGAAACTACACCAAAAAGGTACAAGGTCGATTACATCGCTAAAAGGTACAT +ACATGGAATGGCTAAACTTAACCATATCCATAAACAATATTAGAGATGCTTTTGATAAAT +CCTATAAATGTATTAATAAAACCGCGCTGATCAAAACTCAGACGCTTATTTTTCACATAA +AGGTATTGATAACACAATACAACACATTACAAAACCTAATAGTAACAAACAAAAGCAAAC +TCACTGAAGAACATAAAGTCCAATGCTTCAAAGTTCTCAGTTCATTTGGTAAAAGACTAC +ATAATACCAGCGTTAGACACAGTATTATAATAGAAGTCCCAACAGAACTAACCAAAATAG +CAGAATTCGACGAAAGCCAGTTAAGAGACTTGGACGAGTCGCAGCCGTTAGAAGATTTAG +ATATCGAAAGCGATATCGAATCAATAGAAGAATTAAAATTTAATACCGTACAACCAAATA +CAAGAAACATGGCCAACGCATTAGAAGCTCAGAGAGCATACGTTAAACAGGTATCTGCCA +CAGTACCTGATTTCGATGGTAAGAAACTCCATTTAAACAGGTTTGTGACAGCACTTAAGT +TGACGGATCTAACTAAAGGAGATCAAGAAACTTTAGCAGTAGAGGTCATAAAGACCAAAA +TTATTGGCCCATTAAACTATAAAGTAGAACATGCGACAACGATACAGGCAATAATTACCA +TATTGCAGGCAAACGTAAAAGGCGAATCGCCTGACGTTATAAAGGCCAAATTAATAAATG +CCCAACAAAGAGGCAAGACCGCGTCTCAGTATGTTACAGAAATAGACAGTATGCGTAAGC +AGCTCGAGGCAGCTTACATAGACGGCGGATTAGACGCCGATAATGCTGACAAATTCGCGA +CTAAAGAGTCGATATCAGCAATGACCAAAAACTGTGCCAACGAGGCACTTAAAATGATCT +TAACTGCAGGTACATTTAGTACATTCAACGACGCAATGGAAAAATACCTACATTGCAGTA +CAGAAATAACCGGCAATTCAAATACAGTCTTATTCTATAATGGGAATAATAGACGTGGTA +ATTATAATGCCTACTATCGTGGTAGAGGCAGAAATAATTATAACCATAATTATAACCAGA +ATTATAACCAAGGTTATAATAATAACAACAGAGGTCGCGGAGGCTACCGCGGCCACGGTA +ATAACAGAGACGGAGGTAACCGAAGGGGTAACCAAAGTCAGAATAATAATAACAACCGAA +ATGTGCGTAACGTACAATCGGAAAACAGCCAGACCCCCTTAAGCGATCAACAGTAAAAGT +GTTTAAAGTAAACCTAAATCTGAGTATTTTCATTAAGACAAAAAACCATGAAACAAACAC +AGTTCTTACATTACTAATAGACACAGGTGCAGAAATTTCATTGCTAAAAGCCAAAGCAAA +GGAATATAATAATATAAATTTCAGTAATATATCAAATATTACAGGTATTGGGCAAGGAAC +CATACAGTCTATAGGTACAGTAGATCTTGACATACGCATTCAGGATGTTCTAGTGCCACA +TGAATTTCATGTAGTACCTGAGAATTTTCCGATACCATGCGATGGCATAATCGGAATAGA +TTTTATCAAGAAATACAATTGCGTATTAGAGTTTCAAAATAACAAAGACTGGTTCACAAT +AAGACCCAATAACTTCAGTAGACAGATTAGTGTACCAATTACACATAACTTAGACTCCAA +CACACTCTTATTGCCAGCTAGATGCGAAGTAATCAGACAAGTCAAATTACTCACTAACGA +AAAAACGGTGGTAGTACCAAATCAGGAGCTGCAACCAGGTATAATAGTAGCAAGCACCAT +TGCCGATAGCAAAAACGCATTGATTCGCATTATAAATACAAATAATAAAGACGCCATAAT +AGATAGCGCGAAGATCAAATGCGAATCAATGAAAGACTATGACATTTTTACAACACCAGT +AGAAAAGGAAAATAGAACTGAAGAAATTTTAAAACAATTAAGATTCCCTAAACAATTCAA +TAATGAACTAACTAAGTTATGCACCGAGTTTAGCGATATTTTTGGTCTAGAAACAGAACC +AATATCGGCTAACAATTTCTACAAACAAAAACTCAGATTAGGGGAAAAAACACCGGTCTA +TATAAAAAACTATCGCATGGCAGATAGCCAAAAACCAGAAATCGCCAGACAGGTAAAAAA +ATTAATAGATGATGGAATAGTTGAACCATCAATGTCTGAATATAATAGTCCATTACTTTT +GGTTCCAAAGAAACCACTTCCGAATTCCACGGAAAAAAGATGGCGATTAGCAGTTGACTA +TCGTCAAATAAATAAGAAACTATTATCAGACAAATTTCCACTTCCAAGAATAGAAGATAT +TCTTGATCAATTAGGAAGAGCAAAGTATTTTTCATGTCTCGACCTAATGTCTGGATTCCA +CCAGATAGAACTAGAAAAAAGGTATAGAGATATAACGTCATTTTCAACAGCCAATGGCTC +ATATCGCTTCACGCGATTACCATACGGACTGAAAGTAGCACCAAACTCCTTCCAACGTAG +GATGACACTTGCATTTTCTGGTCTTGAACCATCGCAAGCATTTCTATATATGGATGACTT +AGTAGTAATAGGTTGTTCAGAAAAACATATGCTCAAAAATTTGACTAACGTATTCGAGCT +ATGTAGACGACATAATTTGAAACTACATCCAGGGAAATGTTCTTTCTTTATGAAAGAAGT +AACATATTTGGGTCACAAATGTACCGATAAAGGTATACTCCCAGATGACACCAAATATGA +AGTTATAGAAAAATATCCTATACCAACAGATGCCGACAGTGCTAGGCGTTTCGTAGCCTT +CTGTAATTATTACAGACGTTTCATTAAAAATTTTTCTGATCATTCACGCCACTTAACGAG +GCTTTGTAAAAAGAATGTTCAATTCGAATGGACAGCAGAATGCAATGATGCATTCGAATA +CCTTAAAACAGAATTAATGAAACCAACATTACTACAGTACCCAGATTTCGGTAAAGAATT +TTGCATAACAACCGATGCTAGTAAACAGGCATGCGGAGCGGTACTTACACAAGATCACAA +TGGTCAACAACTTCCAGTGGCATACGCTTCAAGAATGTTCACTCAAGGTGAAAGTAATAA +GTCCACTACAGAACAAGAATTAACGGCCATTCATTGGGCCATAAATCATTTTCGACCATA +CATATATGGCAAGCATTTCATGGTAAAAAGCGATCATAGACCATTGTCATACCTATTCTC +TATGAAAAATCCAAGTTCAAAACTCACTCGTATGAGGCTGGATTTAGAAGAGTATGACTT +TACTGTAGAATATCTTAAGGGGAAAGATAACCATATTGCGGACGCCTTGTCTCGCATAAC +AATAAAAGATCTGAAAACAATCAACAGAGAAATATTAAAAGTTACCACCAGATCAAAAGC +TAAACAGGAAAATTCCTGTAAGGACGAAGCAATAGTCAAAATACAAGAGGAAAAAGAGCA +AACAATAGAAAAGCCCAAAGTCTATGAAGTTGTCAATAATAATGACACAAAGAAATATGT +TTTAATCAAAATAGATAAACACAAGTGTTTATTAAAACGAGGAAAAACAATTGTTTCACG +CTTTGATGTTGATGACTTGTATTCTAATGAAACATTTGATCTAAATCAATTCTTTCAAAG +GCTTATTTCAAAAGCCGGAATGCATAAAATAACAAAAATGCGAATATCACCAAGCGAACA +GATGTTCCAATTTGTATCACTAAATGAATTTAAAATAAAGGGCAACCGAGTACTCGAAAA +AGTAGAACTAGCTATTCTACAAAAGGTGATAATTATAGACAAAAATGACGAAGCTCAGAT +TAAAGAAATTTTGACAAAATTCCATGATGATCCTATAGAAGGAGGCCACACTGGTATTTC +GCGAACCCAGTCAAAAATCAAAAGATTTTATTATTGGCCCCAGATGACCAAGACAATCTC +AAAGTATGTAAAGACTTGTTTGAAATGTCAACAAGCCAAAATTACAACACATACGAAAAC +TCCATTAACATTGATGCCAACGCCAGCAACAGCATTTGATACTGTTTTAATTGATACCAT +TGGTCCACTACCGAAATCGGAAGACGGAAATGAGTATGCAGTTACAATCATATGCGATCT +AACCAAGTTTTTAGTAACTATTCCAACACCAAATAAAAGTGCTAAAACAGTTGCAAAGGC +TATATTTGAATTATTTGTACTGAAGTACGGTCCAATGAAGACGTTCATTACAGATCAAGG +TACGGAATACAAAAATTCACTTATGAATGAATTATGCAAATATATGCATATAGAAAATCT +AACATCTAGCGCTCACCATCATCAAACTTTAGGAACAATAGAAAGAAGCCACCGAACTTT +TAATGAATATATACGTTCATACATATCGGTTAACAAAAGTGATTGGGACATTTGGTTACC +ATATTTCACTTATTGCTTCAATACAACACCCTCAATAGTCCATGACTATTGCCCATACGA +ACTAGTATTTGGCAGACTACCCAGACAATTCAAAGATTTCAGTAAGATAAACAAAATAGA +CCCAATATACAACTTAGACGACTACTCTAAAGAGCTTAAATGCAGACTAGAATTGTCGTA +CAACAGAGCAAGAAGAATGTTAGAAAAAGCAAAAGCGGATAGAAAATTAAGATATGATAG +GAATACAAATAATTTCGAATTAAAAATAGGAGATAAAGTATTACTTAGAAAAGAAACAGG +TCATAAGTTAGATAAAAGATATGAAGGTCCTTATGACGTAGTAGATATAGGAATAAATGA +CAATATAACCATTAAAACAGGAAGTAAGAAACAACAAATAGTACATAAAGATAGGCTAAA +AAAGCACAAATAGAATGAAAAAAAAAAAGGGCAATCAATGCCAAACCTTTCATAATAAAA +CTTAAATAACGGCCTGATCAGCCAAAACAATATAACAAAGACATAGACATAATCGAATTT +TTATTAATTCAAAATACATACATATTTTTTCTTTATTCATTTAAAAATTCTATATCATAA +ATAATGTTAATTCATTAAAAATAATATTTAAGTAATTTTTATTTTATAATGGTAATATAG +TTGATAGAAAATAACTTCATTTCTTTACGTTATTTTAAAAAAGAGGGGAGGTGTAGTATG +TGCATATATCGAGGGTACACTGTACCTATAAGTACACAGCAACACTTAGTTGCATTGCAT +AAATAAATGTCTCAAGTGAGCGTGATATAAGATCACCCATTTATGCTTTAAGCTAAGTCA +GCATCCCCACGCTGGCCGCTGGCCATATATGCGCATAAGCTCTCTCTCTCTCTCTCTTAT +ACATATATATATACGCTGCTCTTCTGCCGCTGTCGACGGCGGCGCAGTCGCAGTATTTAG +GTAAGATTAGACACTCTGTAGAGGTTAAGCGGGCAGAACCGTTTCTGCTACTCGAAGAGA +TAAGAAGAAATAAAAAGGTGGCCTGACGGCTGCACCCAACTGCAAGGAAAACACGTGTTC +TCAATTGGTGGCATATATTGGTTTATTACA +>DMZAM +AGTTACCGACCCATCGGTACCATACACCACCCCTCCCTCTAAGCCACCACGCCTACACAA +GTAGAAGACATCGAACCGGGAAGCTTTGCGATACAAAGTTGCAGCATAAACATCAACAAC +GGGTCAGACGCCGACATCCGCCCAAAATGCTGACACCACATCCTTTTCGCTCAGACAGAA +CAACGCATACAATTCCATATACATACGTATAAACATACTCATACTTTCTGCTGTGTCAGA +TACTTTATTTCTAAGAACTTTAACATTGTAATACATACACACATATTCACTGTTAGCCCA +TTTAAGACGAAGAATAAAGACGACCACAGTCGAGTGCAAGCAGCAAACACTTGTAGACGT +ACATAATCTCCGATCAAAATTCTCCCAAGACGACCGTGGCTACGTTCTGGACCCGCATAA +CTCCTCTATCTTTCTGAGTGATAATACCTCCGCAAGACTCCCCGGAGGTAACTGGCGCAG +CCGGAAAACTGGAATGGAAAATACTTTATTAAACCTTCTATTAGTTCTATTGTAAGTAGT +TGTGGAAAAAGAGTGAGAATGAAGTGCAGAAATGTCTAAAAGTGATTACAACAAAAATCC +TAATACAATACATAAACCGCCTTAACAAACATACAAAACACGCATATAAAAAAAAAAAAA +AAAAAAAAAAGAAAAAAAAAAACCCAAAACTTAAAAATGCCGTAACCGCGAAACATGATA +TGCGTTGTACTTGTGTGAAATCAATCGCTGATAGTCACTGCCGAAGTTTATTAAGGCCAA +GTACCATATCATTACTTTCATGTTTACATACATATATATGCCCCACAATTAAAACAACAT +ACACACACACAAATATTTCAAATGCAAAAAAAAAAAAAAGAATGTAGTGTACCTGCGTGG +CATCAATCGCTGATAAACCACTGCCGAAATATTAAAGGCCCGGTACTACATCACAAAACA +CGTATATATGCAACAAAAATATACACAACAAAACCATATATACAAACGTGTATGAGTGAC +GTGTAATGTACTTGTGTGAAATCAATCGCTGATAATCACTGCCGAAGCTTAGTAAGGCCA +AGTACCACATCATTACTAACATGTGTACATATATATATATGCAAAACAATTAAAACAACA +TACACACACACAAATATTTCAAATGCAAAAAAAAAAAAAAAAGAGGAAATGTTGTGTACC +TGCGTGGCATCAATCGCTGATAAACCACTGCCGAAATATTAAAGGCCCGGTACTACATCA +CAAAACACGTATATATGCAACAAAAATATACACAACAAAACCATATATACAAACGTGTAT +GAGTGACGTGTAATGTACTTGTGTGAAATCAATCGCTGATAATCACTGCCGAAGCTTAGT +AAGGCCAAGTACCACATCATTACTAACATGTGTACATATATATATGCAAACCACCAAAAC +AAATACATATACACATACAAACACTCCAAAAAAAAAAACAAATAATACTATATGAACGGC +GAAGCGTATGTTTTCTAAGGCTGGATACAAAACCACAAAACCAAATATAAATTGCACACC +TTAATAAAGAAAAGAACAAAAATGATAATAAACAAAAGAAATTTTTTTTGGAACATGCAC +CCATACTCTCACTCTTTCAACACAAATAAAGTATTCAAATTATACATACATACAATAATA +CCACTATATTACAGAAATTAACGCACAAGAAAACACACACACTATCCAACAACAAACAAG +TAATTAAGAGTTATTAAGTACATTGTAAACTACATATTTTTATCTTAAATGTCAAAGAAA +TTAACACAAACTATTAAACAAACAACTCGCTCCGTGTTAGAATCACACACATTTCCCAAA +AGAGTTACACGATCAGTTTCGAAAACAAACACCCTCCCCGTAATAAGAGAAAGCACCCCC +TTACCGCCCCTTCAACCTATAAATATGGATTCGGGCAACGCCTCCGTAGGTAATTCCGCC +CCCGTAACACCTACTGTCAGTGGCTTTAGCAGTATTGCTACGGCACTTAGTGCCACCGAT +ATTTTAGCCTTCGTTAAAGAACTTCCGACCTTCGATGGTACTCCAGGCCAACTCGACAAA +TATATAACTAGCGTTGAGGAAATAATCATGCTCATTAGGGGTACCGACCAAACTCCGTAC +GGACTTCTGACACTCAGGGCAATTAGGAATAAAATAGTTGGAAGAGCAGACGAAGCTCTA +AACCTAGCCAACACCAAACTTATATGGGACGATATCAAAAGTAACCTACTACGTTTATAC +TCTAGCAAGAAAAGCGAAGCTACCCTCTTAGGCGAGCTCCAATCTCTCCCAGATAACCTA +ACCCTAGGGCAATTGTTCTTCGGCTTATCGAGGATTAGGAGCCAACTTATATCCATTACT +TCCAATAGTGGACAGTCGGCCACAATCATCGAAGCCAAGAAAACACTATATGACGAAGTC +TGTTTAAACGCCTTCATCTCAAGAATTAGAGAACCACTTAAAACAGTCATCAGATTGAAA +GACCCCAAGACTATCGAAACAGCTTACGAGCTATGTCAAGGAGAAAGGGCTCGTTACCAG +AACAGAAACCCATATCCCCCAACACAAAACAACACCGAACGACGAACTAACAACTACAAT +AACAATAACAACAACAATCACAGAGACAACAACAACCGCAACAACGTAACTCGTCTTACA +CCCAAAACCACTCAAACCATTACTCAAACCCCAATTCCCAATATCGTCAATCAAACAACG +GCAACAGAACTAGTAACCCGTTTAAAGATAATAAAACAAATTATGGGCTACACAACATAG +AAGAAGAAAAACTCACCCAACACTGCCTTACCAACTTAAATTTTCAGGCACCCGCCTCAG +GAACCCAACAGGATACATAAATCCTACCACACATGCAACATCCCTTCCATACATAACTCT +AAACCTCCAACAAAAATTCCCTTTATCATTTCTTATCGATACAGGATCCAATAACTCCTT +CATTGACCCAGAATCTGCAAACCAACTAGAGTGCACAATTCTACCAACATCCACTTCAAT +TACAACAGCATTAAATAGTTTCAAAATTGAAGAAAAGGCAATATTCCCAATGCCACCCGA +GTTCAAAACCGAAGGTCAAATTACCCTACTTAAATTCAAATTTCACTCTTATTTCAATGG +CCTCATAGGAATGGACCTATTATCACACCTAGAAGCAAAAGTAGACCTAGTAAACTTACA +ACTAGTAACTTCAAAGTCTACACTCCCAATATTCTTATACACTAACCAGGCTTCAAAAAT +TTTTAACATCCCCGCCTACAGTAAAGTTATCTTACCACTACCAGTAAAGACTAATCATGG +GGAATTCTATTGTTGTACTACACAACTAAATAATGAGTTATCGTTGTCAGAAGGACTATA +TAAATCAAACAATAATATTGCCAATGTCGAAATCTCTAACCAATCCGACTCAGATAAACT +ATTATACCTAGAATACCCCCTAGAAACCATTCCATACAATAAAAACGACCATATAGAGCT +CTTTAATATATCAGCTACACCTCTTAATAACGATACCCCTCAAGCCCCATTACATATCCT +CACAGAACACCTCAATCCAGAGGAAAAAACAGCCTTAACAACCCTATGTAAACAATTTCG +CGACATATTCTACAACCCAGAAACACCATTAACTTTTACCAACAAAATCACACACTCCAT +CCCAACCATAGATAACACTCCTATCCACACAAAATCCTACAGATACCCTTTTGTCCATAA +AACAGAAGTCAAAAAACAAATCGAATCCATGTTAGACCAACAAATTATTAGATCTAGCCA +CTCCCCTTGGAGCGCCCCGGTGTGGGTGGTCCCAAAAAAACTAGACGGGACAGGGAACAG +GAAATGGCGACTTGTAATAGACTACCGGAAACTCAACGACAAAACCATTTCGGACAGATA +CCCCATCCCAAACATAAATGACATATTAGATAGCATAGGCAAAGCAAAATATTTCTCAAC +GCTCGACCTAACTAGCGGTTTTCATCAAATCGAGATGAATCCAAAAGATATCGCCAAAAC +AGCCTTTACAGTCGAAGGGGGTCACTACGAATTCACACGGATGCCCTTCGGCTTAAAAAA +CGCACCGGCTACCTTTCAACGGGTTATGGACAGCGTTCTTGGCGATCTCAACGGCACCAT +TTGCCTATTCTATCTTGACGATATTATAATTTTCTCGCCTTCCCTACAAAAACACCTGTT +GGACATAAAAATGGTATTCGAAAAACTCAGAGCGGCAAACTTTAAACTACAACCTTCAAA +ATCAGAATTCCTAAGGAAAGAGATAGAATTTCTAGGCCACATAGTCACACAAGACGGAGT +TAAACCAAACCCGAACAAAATAAGTGCGATCAAAAAATTTCCTTGCCCCACCAACAGAAG +AGCTATCAAATCTTTTCTCGGGTTACTGGGTTATTATAGGAAGTTTATAAGAGACTTTGC +ACGAATAACGAAGCCCATGACTAAACAATTGAAAGGGAAAAGACAAGTTACTACAGACAA +AGACTTTGTAGACGCATTCGAACAGTGCAAAACTCTTCTGTCCAATGACCCAATACTCAT +ACACCCAGACTTCGAAAAACCATTCATTCTTACTACGGATGCTAGTAACTTCGCGTTAGG +AGCCGTACTATCTCAAGGCTCCTTACAAAACGATAGACCTGTATGTTTTGCCAGCAGGAC +CCTCTCCGACACCGAAGTCAACTATTCAACCATAGAAAAAGAAATGTTGGCAATAATATG +GGCAGTAAAATACTTCAGACCATATATTTATGGCGTAAAATTTACTATTGTTACAGATCA +CAAGCCACTAATATGGCTTATGAATTTCAAAGAACCCAACTCAAAAATAATTCGTTGGAG +ACTCCAACTCATGGAATACAATTTTGAAATAATTCACAAGAAAGGTTCACAAAATGTAAT +TGCAGACGCCTTAAGTAGAGCGGACCCAAATTTAAACTACAACGAAACACTGACTGTTAA +GCCTTGCCCCACATCCGAAAAACCTATTAACGAATTTAACACGCAACTCATACTAGAAAT +AGATACAAATACGTCTTACCAAACTACAACACCATTTAAACAAAAGATTAGGAAAAAATA +TTCACAGCCTTGCTTCGATTTCGATAATATTGTTAAAATCTTGAAAGGAACCCTAAAACC +TAACAGGATTTGCGCATTCTTGGCGGACGATAATAATTCCGCATTAATCGAAAAAGCATT +CTCAACGTATTTTGCACATAAAAAACACTTTAAAATTATCAGATGCAAATCACTTCTCCA +CGAAATCGTAGGAAACCCCGAACAAAACAAATTCATTCAGGAATATCACACTAACAGCAA +CCACAGAGGCATAGACGAAACATTCCTTCACCTCAAACGAGAAACCTACTTCCCCAATAT +GAAAAACAAAATCTCTGAATTAATTAGGAATTGCGAAACCTGTCTAAAACTCAAATACGA +CAGGCAACCACAAAATATAGTATTTGAAACCCCAGAAACCCCATCGAAACCCCTCGACAT +AATACACATAGACATCTATACTATTAACAATAATTTTAACCTGACAATCATAGACAAATT +CTCAAAATTCGCAGCTGTCTACCCCATCCCAAATAGAAACGGCATCAATTGCATCAAAGC +AATCAAAAATTTTTTCAGTCAATTCGGACTACCCAAAAAACTAATACACGACCAAGGAGT +AGAATTTTGCAACGACATATTTCGAAAGTTTTGCTCTCAATATAATATACTTCTCCATGT +CACATCCTTCCAGCAATCTTCAAGTAATTCTCCAGTAGAACGTTTACACTCCTCTTTGAC +AGAGATTTACAGAATAATACTAGACACACGGAAAAAACACAAATTACCTACAGACCACGA +AGAAATAATGTCAGAAACTGTAATAACATATAACAACGCAATCCACTCCACCACCAAACA +CACCCCTTTTGAACTTTTTAATGGTAGGACCCATTTATTCGAGAAAACAATAATACCCAA +TAATGAGCATGACTATTTAAATAAACTAAATACGTTCCAAGACAAACTATACTCCGAAAT +AAAAGAAAAATTGTCCACAAACACCCAACAAAGGATAGAAAAGCTAAACACAAGCAGAGT +AGAACCAACAACAGTACAACCTAACAGCACAATTTTCAGAAAAGAAAACAGGAGAAATAA +ATTAACACCACGGTTTTCCTTACACAGAACAGCAAAAGACAAAGGAAAAACTCTAGTAAC +CACAAGAAATCAAAAAATCCACAAATCAAAAATTAGGAAAATATCCAAACCTCCAAATGA +CTTAAGCCTTTCCACCTGCATTCCAGATCTTGCCATGGGGCATACCAATCTATCTTCATC +CACAACTTCAATAGCACCAACCTCCTAGCAAAAGTGCCGGTAGGGAAAACACTCGTGATA +GGAAACTATAAAAAAATTAGCCACATAATCGATCTGTCCGAATACACCAACTGTATTGAA +AAATTATACCACACCATCGATACCCTAAGACAAGATGAAACACTCACCGATTCTATATCA +ATACTAAATGCTAAACTGGCCCAAACTCAAAGTAAAATAGACGCACTAACACCCTTTTCA +CGCCACAAAAGAGGTCTTATTAACGGGTTAGGTAGTTTAGTCAAAGTCGTCACCGGCAAC +ATGGACGCCAATGATGCAAAGAATATAGAAACAGAAATTAACCACTTAAAAAGCCAGTCC +ACCACTATCTCAGATAACTTCGAAATACAGAACTCGTTCAATGATGAAGTTCAACTACGG +TTCAAAAACTTAACAAGACACATTAACAATGAACAGAATTTGATTAAAAACTTCTTCGAA +AACACTCAAAATACAATTTACACAAAAATATACAACAACGAAGAAGAAATAAAGAAACTA +CAATATATAAATAGGCTTAACTACAATATAGATTTATTAGTTAGCCACCTAAGCGACATT +ATAGAAAGTACACTGCTTGCCAAAATTAATGTTATCCCAAAACTCATCTTAGACAAGACA +GAAATAACCAAAATCAAACAAATTTTTAAAACACAAAACTACACAATAAAATCCGAGCAA +CACATTTATAACCTCTTAAAAATGAACGCACTCAATTACCAAAACAAAATAATTTTTAGT +ATCAAAATTCCTATTTTTTTAAGTTGTAACTACGAAATGGCAAGATTAATTCCACTTCCA +ATAAATTCCACACAATTTGTAATAGCACCTAAGTACTTAATATATAATAACAAAAGTAAC +AGCATGTTTTCAACTATGTATAAATGTCCTGTAATAGAAGAACAATTCGTCTGCGAAATC +GACTCCATCAATAATCTTAAAAATAATACTTGCCTGGGACACCTTATCCAAAATAAGACC +AGCTACTGCGACATAAAGGAAACGGGACTCACGACTGATGTGTTCGAACCGGAAAAAGGC +TTCATACTTGTATTTAACGGGAACAACCTCCCAATCATCTCCTCCAACCAGACCATAACT +AGTATCAATGGATCAGCTATAATAAAGTATAACAATTGCACATTAAAAATCAATGAAATA +AACTACGACAACAGGGCGGTATCAACAGAAGAGCACCCCGACTTCTTCCTACCACCAATG +CGGAAACTAATAAAAAATGCCACTATCAACATACTCACCTTGGAAAGACTTCACCTGGAT +ACACTCACAACATCCAATAAGCTACTGGTCGTCGCCGCAGGAAACTCTCGACACTCGACA +ACCTTGTATATCCTCTTCACCGTATCCCTAGTCGCCGTAATACTCACCTGGACACTTCGA +AGGGACACCCACATCTTCCATACCGGGCCCGACCACATTCTTCCAATCGTCGCTCCACCA +ATTCCTCCGTCTATGGCCTTCGCTCCAAACTGGGGGGGGAGGAGTTACCGACCCATCGGT +ACCATACACCACCCCTCCCTCTAAGCCACCACGCCTACACAAGTAGAAGACATCGAACCG +GGAAGCTTTGCGATACAAAGTTGCAGCATAAACATCAACAACGGGTCAGACGCCGACATC +CGCCCAAAATGCTGACACCACATCCTTTTCGCTCAGACAGAACAACGCATACAATTCCAT +ATACATACGTATAAACATACTCATACTTTCTGCTGTGTCAGATACTTTATTTCTAAGAAC +TTTAACATTGTAATACATACACACATATTCACTGTTAGCCTATTTAAGACGAAGAATAAA +GACGACCACAGTCGAGTGCAAGCAGCAAACACTTGTAGACGTACATAATCTCCGATCAAA +ATTCTCCCAAGACGACCGTGGCTACGTTCTGGACCCGCATAACTCCTCTATCTTTCTGAG +TGATAATACCTCCGCAAGACTCCCCGGAGGTAACT +>DME010298 +TGTTCAAGTTACGCTCACCCGCTGTCACCCGCTGTCACCCGCTCTCCGCTCCCTCTTACG +CTCTCCCGCTCTTCACCTCAGAGTCTCCAAGGAGTCCTCGGGCTTGGGATAGCCTAACTA +ATTAGAATAAGCATCAGTGTAAAAACTAACCACGCTGAATAAACATACGCCCGGTCGCCG +CGCAATTACGAAAAGTCTAGTGTTTGCTTTCCTTCGAGTGTTTCTTTTCAGCATATTTGA +ATTCAGGACAGCCATCCCCCTACATCCCAACATTTTGGTCCTTCGAGCCGGATCACCTGG +ATTTTCAAGTTTGTCCACCAGCGAACAAATTATAAGATAAGTACGAAATTTCCATTCCTT +TTAATTGCCGGTCTGCAGCAAAAGGTTCGAAAATCCAATTTCGTTCAATTTGCTGTAAGA +TTTATTGTCAAATCTAACGGATTTCTCCGACAAAAGGCAATTAAAGAAAAGTACTTATCC +AATCTCACGGGCGCCGCATATTACTCGCCGTTCTCCGTTCTCCTTTCACCCTCATTCGTG +AAAATTTCTAAAGTCCAAATGGGCGAATATATTTAAATATTAATCCAGTGCGATAATGCA +AAATTCCAAATGTGAAAAAGTGAATAATTTGTGCCAAGTTCAGTGAAACTTTCTAAGTCC +AAAGCTCTGCCAAAATTGGCAAAAATTCTGTTCTCGTTTCACTGTGTCAAAGCGAAGCCA +AACTTCTTTTCGCAACACATTTTTGCTTTAACTCCGCAGTCCACTTAATACCATTTGCTT +TGCTATCGAAGAATACCACAACGAAACAAACAACACCATACCCTCTGGCCATTCAAATAA +CATATTAATTAACATTTCCGCAGTTCCATATCTCTTACATCAACATATACCTACTCCATA +CTCTTGCATATATTCACATCTTACACAATATATCCTCACCATATATTACATATATTACAT +CAACATATAATATCCACATATATTACCGACATACATTGCGCATATTATCAGCATTCCTTT +AACGTATACCAAAGTTTAAATTCGATCCCGTCGGCAAATCCAACCACAAATAAAATTTAT +TCCAAGTGCCGACGCGGAAAGGCGTTTTCTTTTCCATCAATTTTTTCCGTAAATTTCCAA +ATTAATTTCCGAGCAATAAATTAAAAGCGGTTTTTTCTTTTTTTTTAACAAATAACTTAT +TGTTGAAAACATTTATTAAATTATTAAAAATTATATAAATAATACGACCGCCAAATACAA +GTCGTTCACCCGACAAATATTTTTTCCTGTATTGCTTGGATATTAATTTGTGTTTGTTTT +AGAAGTACTTACAACGCGGAGAAAAGACTCCAAATCCACCATTCCATTTTCTCCGTTTCC +AGTTATAAACAAAAAAATAAATAAAATTTTCTTCCTTCTAATAAACATTTTATTTTACCG +TGTTCACATTCCAAGTGTTCCAACCGTAAATAAGGTGGACCTAATTACCATAAATCACAG +GTCATTTATACAATTCGCTGTTCACTCCGAGTCACCTGTCCAATTAGTCTAAACTACGGC +GTTTCCACTTCGCAAATTCAACACCACTTTCTCACCCATTACATCCTATACGGTCCTTTT +CCGCTGCTTTATACCGTTCACGGCAGGAAGCTTAAATTTATTAAGTGGAATCTGTCTACT +TTTTCAAAAGTGTGACCGGGCTCCAAAAACGCTTCCCTTCCATTTCGTATTTCTTCGATT +ATGCCCATCGGGGACGATAAGAAGAAATTGTCCGCTGACAAACCCAGGTCTATTTTTTCA +CCACAAGGGCCCAAGAGTCCAAGAATCCCAAGCATTTCGGTGAAAACGCCTGCGCAGATT +TCCGACGACTGTGCCACTCCATCCAAAGCCACAGTACAGCGCACAGCTAAAAATATGGCT +GCTTCCGATCTAGCGCTAGCCAAATTCATTTCGGTTTCTGACGCTCAAGCGAATTTGAGG +CTCAGATCAACACTCCGGAATCCGCAGCTCCAACCGTCACGATGCTTAGCGTCCGTCGCG +ACCAAGTCCGAAGCCTATGGGACAAGGTTGAAAAGAATTCGACCTCTGCTCAGAGTGCCT +TGTGTCAGCAGGCGAGCGGCAGCAAGCGGCATGCCTATTCTCAGGGCTAGTTACAGTTAT +TGCTATTCAGTCTATGAAAGGTGTGTTGCCCAGCTCGTTGATAAAATCGAGCAGGGGCAC +TTCTCAGTCCATCCCAAGCGAACGCTGCGGCCCAGGCCTACATTTCCTCTGGCTGTCGGT +TGCCTCCATGCGATACAGGAGTTTTCGCAGGTGACTATCTTCGCTGGCCGCTTTCCGGAT +CTTTTACACGCCATTTATATTAATAATCCACGGCTGACTCCGTTCGAAAAGTTATTCCAC +TTAAATGCCAAAACAAGTGGCGACGCGCATGCCATAGTTTCGATTTCGCCTCTCACCAAA +CGAGGGTTTTCCTCTGCGTGGGAAAACCTAATAGAGCGTTTCGAAAATAAACGATTGTTG +GTAAACAGTCAATTGAAAATACTGTTTAATGTGCAGTCGATACCACAGGAATCTGGGGCG +GCCTTGAAGGTAATGCAAAGTACTGTTCAAGGTTGCTTGACTGCCTTAGAACTGTCAGGC +ATCAACACTGAGAACTGGGACTGCCTGCTGGAATATCTGTGTTCATCCAAGCTCCCGAAG +ATAACTCTCTCCTTATGGGAGCAGTCTCTACATAAGAAAGCCGACATCCCGACATGGGGA +GAACTGAACACCTTCCTCACAGAACGTCATCGAACCCTAGAGGCCATCGATGATGTGAGA +CCGTCCGTACCAAGTCAGTCGCACTCCAAAGCGATGAACTCAAGTGGGCCCTCTAGAGAT +GGCAAGCTGGCGTCCGACTTGTGCAACAAGGAAAACCATCCTGTCCGTGTATGTCGCGTT +TTCTCCAAATGGTCGGTTGACGACCGGTCAGCCTACATTAAACGGAAGCAGTTATGCTTA +AACTACTTTGCAAAGGGACATCAGCTTCGTGAGTGCAAAGATCGACAAAGTTTTACTTGG +TGGCCGGCATCACACGTTGTTGCACCGAAACAACCTCTTTTCCAGCAATTCAAGCCCTTC +AAATCCTGCAAGCCCAATTTCCGCTACTCAGGCCAATTTCGTTCCAAACGAGCAAGCCGG +TGTTCAAAATTATTTTGCCACGGCTCAAGAGCTATCCTTCTTGGCAGTGCCATAATCAAT +AGTTCCCATCTTGGCACTAACTTTAAGGCACGCGCCCTGATCGACTCCGGATCAGAGGCG +ACATTCATAACCGAGCCACTGTTCAATCTAATTAGATTGCCATTCCAGGTGGTTCAAGCC +CAAGTCTCGGGCTTAAACCAAACAGTAGCTGCTCAGTTCAAGAACGCTGCAGTTTCACCA +TCCGATCTCCGACTAGGCCGCGTTGCAGTTGGAGACGACGGCCTATGTCCTCCCTCAACT +AGCCGGAAATCTGCCTTCCTACCCAATTCCGCAAAATTTCTTCGGGATCTTCCCGATTTT +CCACTGGCGGATCCAAAATTCTATGAGAGCGCCCCAATAGATGTACTTATCCGGAGCCCA +CATCCTGCTTCGGTGCTTCTGAGTGGAGCAAAAACCAACATCTGTGGCTCTCTCTTGGGG +CAAGAGACCATTTTCCGCTGGGTACTAACTGGGCCAGTGTCAGCCTCAGCCCAAAGCAGG +ATTCCTCTTTTTCGACACAGATCTCCCACGCGTACGATAATTCACTGGACAAACTCCTCA +CAAAATTTGGGGAGGTGGAGGATATACCAACAAAGTTGCAAAAGAATCCGATTCCATGTG +CGAGAACGGGTTGGTAAATGCTTACGACGACACCAGTGCGGCAAATATGTCGTTACTCTG +CCTTTTCGCGACCCAGAACATATCGGTTGCGGGCTAGGGCATTCTAGGTCTTGGGCGTTG +GCTCAGTTCTTGAAGAATGAGCAGCGTCTAAAAAAAGATGAGGCCTTGAAAGCGAGATAC +GATTCGGTGATCCAGGAATATCTCGACTTAAAGCACATGCGACAAGTTCTGCCTACCCAT +GATTGCAACGCCTATTATATGCCACATCACGCCGTCTTAAAACCGGAGAGTGTAACTACT +AAACTCCGTGTAGTATTCAATGCCTCCAGCCCTTCATCGAATGGTACCAGTTTAAATGAT +ATCCTTCATGCTGGCCCTGTCTTGCAGTCCGACTTGACAGTGCAAATTCTGAAGTGGCGC +GATTTCCGATACGTGTTCAGTGCCGATATTCAAAAAATGTATCGGCAGATCTGGGTAGAT +CCGAAACACACTCCATTCCAGCGAATACTTTTCCGTAACAATAGAGGGGAAATCAGAGAT +TTCGAATTGAAAACAGTAACCTTTGGAGTCAATTGCGCGCCCTTGCTGGCGATCCGAGTA +CTGCAGCAGCTAGCAGCTGACGAAGAACTCAGCCATCCAAAAGCTAGCAATGTCATTCGA +AATTTCATGTATGTGGATGATGTTTTAGCCGGAGCGGACTCTACGGAAGAAGCTCAGCTC +ATGGTGCACGAGCTCCGAGACGCTCTGAATTCTTCTTCGTCCCGCCAGAGATGGCTATCG +AAACGTCCTTTACAACGCCAAGTCCTGTCCCAAATTGCCAAATTGTTCGACCCTGCAGGC +TGGTTAGCACCGTTTATCGTTCGAGCTAAAATTTTCATGCAGGAGATTTGGCTACAGGAG +CTTGGGTGGGACGAAAACGTTCCAAATGACCTTTTTCAGCGATGGCTTAATTTTCTCCAA +AGTTATTCGGTTTTCGAGCAGATACGCATTCCACGCTGGCTATCGTTTCATCCAGATTTC +AAGGTCGAGCATCATGGCTTTTGCGATGCATCGCAAAAGGCTTATGGCGCCGCAATATAT +GTCCGCGGAGAAGTGGGCAGCGCCATTATGGTGCAACTCCTAACCGCCAAAACCCGGGTA +GCACCAGTCAAAACGGTTTCGCTCCCAAGACTCGAGCTCTGCGGAGCGTTATTGCTTTCC +GAAATGGCTGCAGCCATCATTCCGCAGATGCCTACGATTAACTCCAAACTTTACTGTTGG +ACGGACTCCACCATAGTGCTTGCATGGTTAAGCAAGCCAGCATGCCAGTGGACCACATTT +GTAGCCAATAGGGAGACGAAGATCGCCCAGGCCACAAAAACAGAGAATTGGTCTCATGTT +CAATCTGAGCATAATCCAGCAGACCTGGCAAGTAGAGGAGTTTCCCTCCAAGATCTAGCC +GATAGCCAGTTATGGTGGCACGGACCGACTTGGTTGCAAAATCCACGCAACCAATGGCCT +ACTCAGGTCAACGCTCCGGTGACCGACCTGGAGAAGCGTGCTCTAAAAGTCCATCTCGCG +AAAGCTCCTTCTGAAGAGTTGTTGGCACGTTTCTCCAAGCTAGAGAAAGCTCTACGAGTC +CTTGCCTATGTTTATCGCTTCATTCAGCGGTGCAGGAAGCAGACATCTCCATCTGATGTT +CATCTACTGGCCACTGAAATCGCCGCCGCCGAGCGGTTCCTAATTTCGAACACTCAACGC +AGAGAATTCCCTGTGGAATATCACTGCCTAAGTGAAAAGCGTCCAGTGCCAAGTTCAAGT +GCCATCCTAAGCATGAACCCGTTTCTAGATCCGCAAGGACTGATCAGGGCATGCGGCCGT +GTGGCGGCTTCCGAAAGCCCTCAATACAATGAACGCCATCCAGTGATTCTTCCGTATAAC +TGCCTGCTTTCTCGCCTCCTTGCGAAGTTCACGCATCGCACAACTCTCCATGGTGGTAAC +CAGTTAATGGTGCGCCTCATCCGGTCGAAATACTGGATTCCGAGAATCAAGAACCTGATG +AAAGCAGTGGTAAATTCGTGCAAAGTATGTGTGATCCACAAAAGGCGGTTGCAAAGCCAA +CTGATGGGTGTCCTGCCCAAAGAAAGAGCATCGTTCTCCCGACCATTCACGGTATCGGCA +TGGATTACGCCGGTCCGCGATATAAAGAACTATACGGGAAGAGCATGTGTTATTACAAAG +GGGTATGTGTTAGTTTTTGTTTGTTTCTCCACCAAGGCCATCCACTTAGAGCCTACATCT +GACTTAACGACCGAGAAGTTTCTTGCCGCTTTCTCTCGTTTTGTATCCAGGAGAGGGTGT +CCACGTCAAGTCCAGTCAGACAATGGCAAAACCTTTGTTGGCGCTGCCACCCTGCTTTCC +CGCGATTTCCTTCAAGCCGTAAAAGAGTCGGTGACGAATGCCTATATTCATCAAGAGATG +CAATGGCAATTATTCTCCGGGGGCACCCAATATGGGAGGCCTTTGGGAAGCAGGCGTAAA +AAGCTTCAAGACGCTATTTTACAAATGCACGGCCACACGAAAATACACGTTCGAAGAACT +CTCCACGCTCTTGGCAAAAATAGAAGCGTGCCTTAACTCCAGGCCGCTCTCTCCTATGTC +TGAAGATCCGACAGACTTGCTGGCTCTGACGCCAGGGCATTTCCTTGTCGGGGGACCCCT +TATGTCCACGGTGGAACCCGAAGTAAAGGGGGAAACGAAATCCCTTCTTAATCGGTGGCA +GCATTTGAAGGCTCTCCATCAGCAGTTCCGTGTGCGATGGAAAGAAGAGTACCTCAAAGA +ACTCCACAAGCGTTCTAAATGGCAGGTCCCGTGAACTTCGAGCTAAAATACTCGTGCATG +TGGAGCAGCGTGTGGTGGGATCGGTCGCACTTCTTGCAACGATCACCGCTTCGGCAGTCT +CCCGTGGAATGCTCGTGAGCGAGGCAATTGGCGCTAGTATGTTGGTAATGAGGACTGCTC +GCAAACGCTTTTCAGCGCTGAGCTTTAGGAACCTCGCGCACGTCCGAAGAGGATGGATTA +CCGCGGCAGACTCGGCATCGGTAGGATTTAATACCTCGGGTACGTCTGCTCTCCACGGCA +CGACCTGCGTGCGTTTTGTTGACGAGGAGCCATGTGCGCGTAGTCGAATGTCGAAAGGAG +ATCGAAAACGAAATGAAAAATAACGGATGATTAGTGATAGTGAACTACAACTAAGGACGA +GAGGAGAGACCTATTATTGTGGAGATTCGGAACTCCGTCGGCAAAAGCACCTTTTTTGCC +ACTGGACGTTTAATAACTCCACGTGCAGTACGGATGTTTACTACACGACGTTGCCGTCAG +CTCCTGGGAAAACAGACTCAATTCTGCCGAGCCGCCACTCATTAGAGGGCAAGTTGTCGT +CCTTGATGACGACTGTTGAGTTACGGGGTTTGGACTGTCACCGTCTCCGCTCCCTCTTAC +GTTCTCCACTCCCTCTTACGCTCTCCCGCTCTTCACCACAGAGTCTCCGAGGAGTCTCTG +GCGCTTGGGAGAACCCAACGCATTAGAATAAGTTTTAGTGTAAAACTAACCACGATCAAT +AAAACATACGCCCGGTGCCCGCGCTAATTCTACAAGTCTTCGAGTGTTTTTTCGAGTGGT +CTTTTTTTCAGCAAACTAGGAACTTTCCAGGACCAGCACCCCCCATCACCCCAACAACGA +CCATGTCATCGATGGCGTCGCCAACCGGCGCCAACCCTGCAAGCAGCTTCGGCCTCGTCC +CAACGTTCCCGCCGGCACAATCCGCCAACTCAGCGTAGGAGTTCACCGCCACGACGACCG +GAATCGACGACGCCAGGCCCATCACTCTCGTCGCCGCTGCAACGCCACAGCGTGAACATC +CTTCCCACAGCGCTGGTCAAGATGGAGACCGGGACGAAGACCTTCAGACCGCAGCACTCA +TCGATCCGTGCAGCCCCATGAGCTGCATCGACGCTTCGTTGGCGTCAGCCTTTAAGCTTT +CGATGACCAATGTTGGCGACGAGAAGGTCTGCACGACGACGATTCGCTCCAGGATCGACG +CGAACACGAAGCTCGAGGTCGTGCTCAAGATCGAGCCCAGGGTGCGGATCCGTACACCTG +TCCGGGCATTGAGCGACACCGTAGTGTCCAAGTACAGGGACATCATGCTGGCGGATGACG +GGTTCCATCGGCCTGCTACCGTATCCATGGTCTTAGGAGCAGACATTTATCCTAAGGTTA +TCCAATCCGGATTCCTGACCTTCGACGAGGGAATGCCGGTCGCTCAAAAGACCGTGTTTG +GGTGGATCGTGTCCGGTGCCTGCAGCTTGCCTAGATGGCTATGTTGCAACCCCAGTGATT +GCAAGGGGGGCGGAATGTTCAAGTTACGCTCACCCGCTGTCACCCGCTGTCACCCGCTCT +CCGCTCCCTCTTACGCTCTCCCGCTCTTCACCTCAGAGTCTCCAAGGAGTCCTCGGGCTT +GGGATAGCCTAACTAATTAGAATAAGCATCAGTGTAAAAACTAACCACGCTGAATAAACA +TACGCCCGGTCGCCGCGCAATTACGAAAAGTCTAGTGTTTGCTTTCCTTCGAGTGTTTCT +TTTCAGCATATTTGAATTCAGGACAGCCATCCCCCTACATCCCAACA +>ROXELEMENT +AATGTTAAATAAAGGTTCGTGTCTAACAATACGCACCTGACAAAGTGGATTAAGTGAAAT +TAGTTTTCGCGGTAATAAACTTATGGACAAGACCAGAATACTGGCACACATAGCAAATAG +TGACCCCCCAAGTCACTAACAGTGAAATAATAGTGAAACGAAAACATTTTCATTCAAAAA +TACAAAGTTAAGTTTCTCGAACTGGGGCTCCGCTGCCCAGCTGCCACGCGATCGCACAAA +CAGCTGTTTGCGAGCTTAAAGCTTTCTATCCCAGGGTTCAAGTTTTGGCTAGAACCCTGG +TGATTTGGTGCACACTTCAATATGAACACTTTAAATGAAACCGCTGCGGCTGATGAATCG +TTGGATACTGCGTTTCTCTCGAGCCCCCAATGTGCTGCCCCGCAGCGCTTTCAAAAAATA +AAGCGAAAGTCTCGTGCTTCTCCGGAGACTGAAAGGAAAAAACCCAAATCAACCATCGGC +AAACAAGGGGAAAACCCTTCGGCTACAGAACCTAGATATGGCGGCAATTCAAACCGATTT +GGTTTACTTGCGCATCTCACAGCTGACAAACAAGTAGGCAATGAAATTGGCGATCTGTAT +GACCAGCCCAGTACCAGTCATCAAGCTGCAATTGCTGCCGCTAAGCGGGATGCAGCCTCC +GCTGGTACCACTAGCTCAGCCAAAAGAGCGCAGTCCAAACCACCTCCTATAGTAATGGAG +GGAGTGGACGACGTATACCTGATGATGCAGAGCATCGAAAATATAGTGGACCTAGAAAAG +ATTGAGGCTAGGGCGTCAATGAGCGGTGTCCTAAGGCTTTACGCGGCTGACGCTAATACA +TTTCGCACCATAGTGAACTGGCTCGAGATCGAAGAGTATGAGTTCCACTGCTACCAGCTT +AAAGAGGACAGGCCTTACAGGGTATGCGTGAAAGGCCTGCACCACAGTACGCTACATCAC +CAAATCAAGGATGAGCTGGAAAAGATCGGGCACAAGGTTCTCGATATTCACACACCGCTT +AGGCGAAACGAACCGGGTACCTCAAAAGCGTCGCCAGTCAATATGTTCTTCCTAAATATT +GCTGCTGCGGCAAACAATAAGGAGATCCTGGCGGTAAAGGCACTATGCCATATGAGAGTA +GTTATTGAGCCTCTCCGCAAGCGTAACGCTATTGTCCAGTGCCATCGTTGTCAGCAGATT +GGCCACACAGCCAAATACTGCCGTAAGGCCCACATTTGTGTGAAATGTGCCGGCGAACAC +CCAGCCAAGGACTGTACCAGGCCACGCATCGAGCTGTGCACTTGCTACAACTGTGGCGGC +CAGCATCCTGCAAACTATAAAGGTTGCAGCAAGCTACAAGCGTTCCTGCAGCGATCCAGA +CCCAGAAGTGGAGTGGCTGGAAGAACAGAAGTAAGCGATCGACCAACTCCACGGGGCTTA +GCTGGAGGTAAGGAGATCCCCTCTTCTCGAGGCGGAATATCTTATGCAGATGTGGCTAGA +GGGTCCATTCACCACAAGCAACCAATGAGCCTGACGCACCAGCAACAGAAGCAAAAGCAA +CAGCCCTATGATGGAAGCCCCAGTCGTCAAAGGAGCCGCAGCCGGACAAGGGCGTCTAGG +GGTACACTCCAGCGCTCGACGGATGCTAGCAGCAGCATTGAAGCCATCCTGCAGACGCTT +AATGAGAACATTAATTCTTTGCGCTCGATTCAAGAGAAGCAAATGGAATTAATGATGATG +ATGATGAAGCAACAGCAACAACAGTCACATCAGCAGGGGCAGATTATCAATCTGCTCACT +GCTCTCCAAGCGCGTCAAGCGCCATAATGATGCCGCTGCGCATCCTAGTGTGGAACGCCG +ACGGCGTATCCACGAAGTTGCCTGAAGTAGAGTGCTTCGTGCGACGTCACGAAATCGATG +TATTACTGCTCAGCGAGACACACTGCAAGGGGGCAGAGACGCCTAAGCTATTCGGATTTG +TAGCCTACACTGCCAATGATCCGAGTGGTGGCAACGCCAAAGGCGGAGCAGCTATCTTAA +TCAAAAATAGCCTTGCCCACTTTCCGCTAACACCAATAGCCACTGCCAAGGTGCAACTTG +CGCCGGCGGTTATTGAAACGGCACTTGGTCCTATAAGCTTTGGAGCGGTCTACTGCCCAC +CGAGATTTGCATGGACTACGGACGAGTTTAAGGACATTTTGGAAGAGTTCCAGACGAAGT +TCATTGTTGCAGGCGATTGGAACGCGTCCCACTGGCTCTGGGGTGCGGGAAGGAGCAACC +AAAGAGGCATTGCATTAGCGAATCTCGTCCTAAATTCGGAGGTGGACTCGCTAGCAACAG +GAGGACCAACAAGATACCCGTACGGCTGTAGAGGCTCACCAGGGTACATCGATTTTGCAC +TGACAAAGGGTGTGCTGGGCATCCACGCTAACATAAGTGCGGTTGTTGAGCTTAGCTCCG +ACCACCTGCCTCTGGTAATTACGCTGGATGCGGGGGCAATATCCTACCCTAAGATGGAGC +GGCTTATCACTAGGCGTACTAACCTGGAGGTATTCCAATCGCAACTGGAGTCCACACTGC +CCCTCAACACTGCCATAAACTCTGGACAGGACGTTGATGATGCTATCGAACTGCTCACCA +ACAATATCAAGTCAGCAGCTAGATTGGCAACTCGCAGCATATCTCGGCAGCCCGCGGCAG +ATCGAATCCCAATACCCAGGGAGATCCTGCTGCTTATAGCTGAGAAGAGGCGCTTACGCA +CTAGGTGGATGAGGTCTCGGCACCCGTCGGACAAAACGGAATGGAACCGAGCTCTGAGTA +GGCTCCGATGCGCGTTGGTGCTGCACAAAGCCGCATGGTTCGACGAAAGGCTTGCCAATA +CCGGAGTCGAAAGCGAAGCGACGCATTCGCTGTGGAAGGCCACGCGCGCAATCAAAAGGC +GTTGCACGAGGAAGGCGCCTCTAGTCGATAGCAACGGGACATGGTGTCGGACCGACTTGG +GACAAGCGGAGGTATTCGCTGCGCACCTCGCCGAGCGATTTCAACCATTCAAGCTTGCCA +GCCTGCAACAGGTTGAAGAAACTCAGGACCAGCTGAACCAAGCGCTTCAAATGGATATGC +CAATCACGCCGTTTGAACCCTGCGAGGTAGCCGAAGTCATTGTGCGCCAGAGTAACAACA +AAGCACCTGGACATGACGTCATCTGCAACGCCACATTGAAGGCCCTGCCCAGACAAGCGA +TCCTCTACATAACGTTGGTTTTCAACGCTATTGTGAGGTTGCAATACTTCCCTTATCAGT +GGAAGCTCGGGATAATCTCCATGATCCACAAACCTGGCAAGCCGGAAAGGGAGCCCGCCT +CCTACCGGCCGATCAGTCTCCTCCCTTCAATTTCGAAGGTGTTTGAGAGACTGATTGCTG +TCCGGATTGTAAGCATTATGGAAGCCCAGGGGATTACCCCTGAGCACCAGTTCGGTTTCC +GTGCTGGCCACTGTACTGTCGAGCAGCTCCATCGAGTCGTCGAGCAAATTCTGACTGCCT +ACGACAGTAAGGAATATTGTAACAGCCTCTTCTTGGACATTCGAGAAGCGTTTGATCGAG +TGTGGCACATTGGACTCCAACTGAAAATCAAGCAGACGCTGCCTGCCCCATATTTTGGGT +TGCTGAAATCGTACCTGGAAGGAAGGAGGTTCGCTGTGCGCTTTCATTCAGCAATTTCCA +CCGAGCACAACGTGGCAGCTGGTGTTCCACAAGGTAGTGTCCTCGGCCCCCTGCTCTACT +GCCTGTATAGCCACGACATGCCGCAGCCAGATGTAAGCCTTTACGGGAAATCTATGTTGG +CCACATTTGCCGATGACGTGTGCGTCACCTACAGGTCCCGATGCGAGCACGACGCAGCCG +ATGGTATCCAGGACTTTGCATACCGGTTCTCGGAATGGGCAAGACGATGGAATATTGGCA +TCAATAGCAGTAAATCCAACAACGTCTGCTTCACTTTAAAGCGGAGAACGCCACCGCCCG +TCTACATCGAGGAAGTCCCCGTACCACAGCCGAACGCAGCAAAGTACCTTGGAGTGCTTC +TGGATCGCAGACTCACATTTTCCAAGCATGTGACCGACATCAGAACGCGCCTACGTGCTA +AGGTGGCGAAGCACTACTGGCTACTTTCTTCGCGCAGTAAATTGTCGCTATCCAACAAGC +TGACAATTTACAAACAGATCCTAGCACCAAACTGGAAGTATGGGTGCCAAATCTGGGGCT +TAGCCTGCGACAGCCACATCAAAAGGATCCAGGCTATTCAAAATAAGGTAGCAAGACTCA +TCACCGGCTGCGAGTGGTTTGTTCGAAACACCACCCTGCACAGAGACCTGAAACTCGCAA +CGGTATTTGACGAAATAAACAAGCACTCGAGCAGATACCATGACAGGCTGGAGCGCCACA +GAAATCGGCTGGCCAGCGCTTTAAACAGATCTCGCCCACCAAGGAGGCTCAATAGAAGGC +AACCGAGGGATCTCATTACCCGATCTCCTTTGACAAGGGTCCGCAGAAGCTGACGCTTAT +CTTAAATCCTATTTGTTATATGTGATTGTTATGTAATTGTAGTTAAATTACTGTAAATTT +GAAAAAGCTAACTATAGTTAGCCGGCGAGCCCAAATGGGCTGAATTAATAGATAAGAAGG +ACACAAAGGGGCTTCAAGACTTCCCCGTATGCCTTAATAAATAAATTAAATAAAAAAAAA