view test-data/transposon_sequence_set_v9.5.embl.txt @ 0:3c8c9911cf2a draft

planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/embl2fa commit 6e5860cedc0ed0bc807ff64f752e62355c1b19d4
author artbio
date Sun, 13 Nov 2022 00:23:23 +0000
parents
children
line wrap: on
line source


ID   DME9736    standard; DNA; INV; 7411 BP.
XX
AC   AJ009736;
XX
DR   FLYBASE; FBte0000104; Dmel\Idefix.
XX
FT   source          AJ009736:1..7411
FT   SO_feature      five_prime_LTR ; SO:0000425:1..600
FT   SO_feature      three_prime_LTR ; SO:0000426:6841..7411
FT   SO_feature      CDS ; SO:0000316:<988..2031
FT                   /name="Dmel\Idefix\gag"
FT                   /db_xref="FLYBASE:FBgn0027381"
FT                   /db_xref="SPTREMBL:O96739"
FT                   /db_xref="NCBI_PROTEIN:CAA08806.1"
FT                   /translation="ARKLKDIMAVPQLSETHLNQLLNQIKELNYYDGAPGKLSGFVNQV
FT                   EQLLSLYPTQEARQAHVIYGAVKRLLVDSALEVVTQERANTWLDMKKALAMAFKDHRPY
FT                   VTLIRQLEDISYPGSICKFIEKLETQYWIMFDKLELESDHVDKSNYTEMLNKTVKSVID
FT                   RKLPDRIYMSLARKDIDTIYKLKQASMELGLYDAIPENHRSNRTEMNKRRNRGNYNQNN
FT                   NQKYYNNRNHNYSNYYPSMNQNHNTQPPQNPTQPMTNQNQYSPRFIPNNQRGNYYAFRR
FT                   DLTQAQQNNPLNNTLNFQPSTSNNINRQGPVKRQRESQSDQSRMDVNFHQAASDTQMIE
FT                   KDIQVPM"
FT   SO_feature      CDS ; SO:0000316:<1950..5402
FT                   /name="Dmel\Idefix\pol"
FT                   /db_xref="FLYBASE:FBgn0027380"
FT                   /db_xref="SPTREMBL:O96740"
FT                   /db_xref="NCBI_PROTEIN:CAA08807.1"
FT                   /translation="PKQDGCKFSSSCLGHSNDREGHTSPYVKIIHHNKNYKGMIDTGSS
FT                   INIIRENFENLEEKEENLIVYTIKGPITLKRSIIIKPTSVCPSAQKFYIHKFSDNYDFL
FT                   LGRKYLEDTKAKIDYANETVTLGSKVFKFLYEEKKGETASKCLDPQEKNDSALVDRTKP
FT                   KMQKVKTAPKCLKPKHQQQKKETALPKCLISNVVKDTVDNDVTHLDPMSVDNDIVNFAI
FT                   NNELRECNEYRLEHLNAEEVECLKKFLYEYRDIQYKEGENLTFTSTIKHVIQTQHEDPV
FT                   YRKPYKYPQSVDQEVNKQIKEMIEQGIVRKSKSPYCSPIWVVPKKADASGKQKFRLVVD
FT                   YRNLNEITVNDKFPIPRMDEILDKLGRCQYFTTIDLAKGFHQIQMDENSIAKTAFSTKH
FT                   GHYEYTRMPFGLKNAPATFQRCMNNLLEDLIYKDCLVYLDDIIVYSTPLEEHILSLKKV
FT                   FEKLRDANLKLQLDKCEFMKKETEFLGHIVTTNGIKPNPNKTKAITNFPLPKTPKQIKS
FT                   FLGLCGFYRKFIPNFAKIVKPMTLKLKKGAIIDTKCKEYIESFEKLKVLITSDPILIYP
FT                   DFSKPFSLTTDASNVAIGAVLSQNHKPVCYASRTLNEHEINYATIEKELLAIVWATKYF
FT                   RSYLFGRPFEVLSDHKPLVWLNNIKEPNMKLQRWKIKLNEFDYKIKYLPGKENHVADAL
FT                   SRTKIEVMVGEVANSADATIHSAIEDNLNYIPITERPINYFSRQIEIEKGDNDTTSVQH
FT                   LFQKLKIKIVYKEMTPELAKNLIKEYVCTKKSAIYFPNDEDFLIFQRAFTEIISPNNFT
FT                   KLLRCTTKLIDILTYAEFKDLILKKHKELLHPGIEKTINLFKEEYYYPDSQKLIQTIIN
FT                   ECQICYLAKTEHQTQMTYETTPEIFNTREKYMIDFYLTGNQIFLSCIDIYSKFASLVEL
FT                   KSRDWLEAKRAITKIFNDMGKPQEIKADKDSAFMCLALQNWLRSEGVQISISTSKNGIS
FT                   DIERFHKTVNEKLRIIGSQQNVEDRCTKFERILYIYNHKTKHNSTKRFPADIFLYAGSP
FT                   DFNVQQNKIDRIEYLNKNRHDFEVDIKYRQAPLVKSKITNPFKKTGRIGQVDDKHFEET
FT                   NRGRKIVHYKSKFKKQKKFNKSKYDNSRPTKEAQSTQHTSNNA"
FT   SO_feature      CDS ; SO:0000316:5248..6780
FT                   /name="Dmel\Idefix\env"
FT                   /db_xref="FLYBASE:FBgn0027382"
FT                   /db_xref="SPTREMBL:O96741"
FT                   /db_xref="NCBI_PROTEIN:CAA08808.1"
FT                   /translation="MINISKKQIVAGRSFTISQNLRNRKSLIRANMIIPDQPKKHKVHN
FT                   ILLIMLSCILSLIITVKCNNIEVNPVNAKNGYLIFQTGTMEIPTSYEYHYLSINITKTM
FT                   LMFEDIVSEANNYPNVPQIQYLVDKLKREINGLRIISRSKRGLLNVVGKAYKYLFGTLD
FT                   EDDREELEEKINNMSEDSVKTHDLNTILDVINSGIDIINKLKVDKEQHQQIAVLIFNLE
FT                   QFTEYIEDIELGLQLTRLGIFNPRLLKHDYLKHVNSEKMLKIKTSTWLKTDTNEILIIS
FT                   HIPSEVTKVPIFQIVPYPDEHNYILTEQIFDKFYIFDNQVFHKDTNRDIFDKCIIGIIK
FT                   QEQTQCKYIKTHKNYQINYIEPNILLTWNIPETAVNQDCTHNKILISGNNIIKIKNCTI
FT                   QIDEFLISNNLADFTQTIYITNNVTRLEPINHLQTREMIETHVKHYNFFQIICITTFVI
FT                   MIISLTLYVAYKFKNIPKKIIVNIVSKKNTRTLKIMSMKIFNKEIILPYTQI"
XX
CC   Derived from AJ009736 (e1371475) (Rel. 58, Last updated, Version 1).
CC   Takis Benos and Michael Ashburner, 1-Feb-1999.
CC   Any changes to original sequence record are annotated in an FT line.
XX
SQ   Sequence 7411 BP; 3047 A; 1363 C; 1109 G; 1892 T; 0 other;
     GTGACATATC CATAAGTCCC TAAGACTTAA GCATATGCCT ACATACTAAT ACACTTACAA        60
     CACATACACC CCAATACAAC ATACACTACT CCGGATGTAC CCAACAGATA CCAGATAAGA       120
     ATAAGATTGT TATATGATCC TCGAGAATGG AAAAAACCCC AATTCTAGAT AAGTCACCCA       180
     CTGGTAGACT AAACATCCGT CCCCTAATTT AAACAATTCC TTGCTTAAGC CTCACCCCAT       240
     CGTCACATTC CCACGTTCAA AGCTCGGAGC CGCAATCCCG AAAAACAAAA GTATCGATTT       300
     CAATAAACAA ATTATAAGAA TCTAAGAGCA CTTGTATCCA AGAGCAAATG CACTTGAATC       360
     CAAGAGAAAC GCAAAGCTTT TTCTCTTTAC GATCAGAATC CTAAAGTCTA AAGTCCATAT       420
     TAGAAAAGCT CGATACCGAG GCTTGAACGT CAACCAAATC AGAATAATTA TCAGAGTTCA       480
     GTTTGAGACC TAATTGTAAA AGGTTCGGTG TTCTTCTCAA ATAAAAAGAT TGTAATCATT       540
     TAGTGAAATA AAAATTATAT TTTTTTCACT TATAAATATT GCAAGTATTT AATTGGCGCA       600
     GTCGGTTAGG ATCCAATAAA ATAAAAGAGT CCTTTTAGTA CGGTACTGAT CAACTGAAGG       660
     ATATGCTATA CGACTAGCTA TCCAAGATCA GCGAATTAAA ATAGTGATTC AAAAATATTT       720
     TTTAATCCGC AAAAGAATCT ACGTGAAAGT AGTATTCAAA ATAAAATCCC GTGCGGTCGG       780
     AAACAAAAAT TAATTTAAAT TTTTTAATTC CGAAACTTAA AACCAAGTTT AAAGAAAACT       840
     TAAAATCAAG AAAACTTAAA ACCAAGTTTA AAGAAAACTT AAAATCAAGA AAACTTAAAA       900
     CCAAGTTTAA AGAAAACTTA AAATCAAGAA AACTTAAAAC CAAGTTTAAA GAAAACTCAA       960
     AATCAAGAAA ACTTAAAGCC AAAATAAGCT AGAAAACTAA AAGACATCAT GGCAGTCCCA      1020
     CAACTCTCAG AAACACACCT AAACCAACTG CTAAACCAAA TCAAAGAATT AAACTACTAC      1080
     GATGGCGCAC CTGGCAAATT ATCTGGATTC GTCAACCAAG TGGAACAACT GCTCAGTTTA      1140
     TACCCAACAC AGGAAGCAAG ACAGGCACAC GTCATATATG GAGCAGTGAA GCGGTTATTA      1200
     GTGGATTCAG CCTTAGAAGT CGTAACCCAG GAAAGAGCTA ACACATGGCT GGACATGAAG      1260
     AAAGCACTGG CAATGGCATT CAAAGACCAT AGACCTTATG TAACTCTCAT CAGACAATTA      1320
     GAAGACATAT CATACCCAGG AAGTATCTGT AAGTTTATAG AAAAATTAGA AACACAATAC      1380
     TGGATTATGT TCGATAAGTT AGAATTAGAA AGTGACCATG TTGATAAATC GAATTATACC      1440
     GAAATGTTAA ACAAAACTGT TAAATCAGTA ATAGATCGAA AACTGCCGGA TAGAATTTAT      1500
     ATGTCTTTGG CACGTAAAGA TATTGATACA ATTTATAAAT TAAAACAAGC ATCAATGGAA      1560
     TTAGGCCTTT ATGATGCTAT TCCAGAAAAT CACCGTTCTA ATAGAACAGA AATGAATAAA      1620
     CGTAGGAACA GGGGAAACTA TAATCAAAAT AATAATCAAA AATATTACAA TAATAGAAAT      1680
     CACAACTACA GTAATTATTA TCCTAGCATG AATCAGAATC ATAATACACA ACCACCTCAG      1740
     AATCCGACTC AACCTATGAC AAATCAAAAC CAATATTCAC CGCGTTTCAT ACCGAATAAT      1800
     CAAAGAGGGA ATTATTATGC ATTTAGACGA GACTTAACAC AAGCTCAGCA GAACAACCCA      1860
     CTTAATAACA CCCTTAACTT CCAACCTTCG ACATCGAATA ATATTAACAG ACAAGGGCCA      1920
     GTAAAAAGAC AACGCGAGAG TCAGAGTGAC CAAAGCAGGA TGGATGTAAA TTTTCATCAA      1980
     GCTGCCTCGG ACACTCAAAT GATAGAGAAG GACATACAAG TCCCTATGTA AAAATAATTC      2040
     ATCATAATAA AAATTATAAG GGAATGATCG ATACAGGATC ATCAATTAAC ATCATAAGAG      2100
     AAAATTTTGA GAACTTAGAA GAAAAGGAAG AAAACCTAAT AGTATACACT ATTAAAGGAC      2160
     CAATAACACT AAAGAGAAGT ATAATAATAA AACCTACTTC AGTATGTCCG TCTGCTCAAA      2220
     AATTCTACAT TCACAAATTT TCTGATAACT ATGATTTCTT GTTAGGTCGA AAGTATTTAG      2280
     AAGATACAAA AGCTAAAATA GATTATGCTA ACGAAACAGT AACACTAGGC TCAAAAGTAT      2340
     TTAAGTTTCT CTATGAAGAA AAGAAGGGCG AGACCGCATC CAAATGCCTT GACCCACAAG      2400
     AAAAGAATGA TTCCGCTCTA GTGGACAGAA CCAAACCAAA AATGCAAAAG GTTAAGACCG      2460
     CACCTAAGTG CCTTAAACCA AAGCATCAAC AGCAGAAGAA AGAGACCGCA TTACCCAAAT      2520
     GCCTCATTTC AAATGTTGTT AAAGACACAG TGGACAATGA TGTAACACAT CTCGATCCCA      2580
     TGTCCGTTGA CAACGATATA GTCAACTTCG CGATTAACAA TGAGTTACGC GAATGTAACG      2640
     AGTATAGACT CGAACACTTA AATGCAGAGG AAGTTGAATG TTTAAAGAAG TTCCTATACG      2700
     AATATAGAGA CATTCAGTAC AAAGAGGGCG AAAATTTGAC CTTCACCAGT ACTATTAAAC      2760
     ATGTCATCCA GACTCAACAC GAAGACCCAG TATACCGTAA ACCCTACAAG TACCCTCAAA      2820
     GCGTTGACCA AGAAGTTAAC AAACAAATTA AAGAAATGAT AGAACAAGGG ATTGTTCGCA      2880
     AATCGAAGTC CCCTTATTGT TCTCCTATTT GGGTGGTCCC CAAGAAGGCA GACGCCTCTG      2940
     GGAAACAAAA ATTCAGGTTG GTAGTCGATT ACAGGAACCT AAATGAGATA ACTGTTAACG      3000
     ACAAATTTCC CATTCCCCGA ATGGATGAGA TATTGGACAA ACTAGGTAGA TGCCAATACT      3060
     TTACCACTAT AGATCTAGCC AAGGGTTTTC ACCAAATCCA AATGGATGAA AATTCTATTG      3120
     CAAAAACAGC TTTTTCAACT AAGCATGGGC ATTATGAATA TACTCGTATG CCCTTTGGTT      3180
     TAAAAAACGC TCCAGCTACT TTTCAGAGAT GCATGAATAA TCTTCTGGAA GATTTAATCT      3240
     ACAAAGACTG TTTAGTCTAT TTAGACGATA TTATTGTTTA TTCCACTCCA TTGGAAGAAC      3300
     ACATTTTATC CCTAAAGAAA GTCTTTGAAA AACTGAGAGA CGCTAATTTA AAGTTGCAAC      3360
     TAGATAAATG TGAATTCATG AAGAAAGAAA CTGAATTCCT AGGACACATC GTCACAACAA      3420
     ATGGCATCAA ACCAAATCCA AATAAAACTA AAGCAATTAC AAATTTTCCA TTACCCAAGA      3480
     CACCTAAGCA AATAAAATCA TTTTTGGGAT TATGTGGATT CTATCGCAAG TTTATTCCTA      3540
     ACTTTGCCAA AATAGTTAAA CCCATGACCC TCAAATTAAA GAAAGGTGCT ATAATAGACA      3600
     CCAAATGTAA AGAATACATC GAATCATTTG AAAAATTAAA AGTTTTGATA ACTTCAGACC      3660
     CGATATTAAT CTATCCTGAT TTTTCAAAAC CTTTTTCTTT GACAACTGAT GCTAGCAACG      3720
     TAGCTATTGG TGCAGTGTTA TCACAAAATC ACAAGCCAGT TTGTTATGCC AGTAGAACGC      3780
     TAAACGAACA TGAAATCAAC TATGCTACGA TTGAAAAAGA ATTGTTAGCT ATAGTTTGGG      3840
     CTACAAAATA TTTCAGGTCA TACTTATTCG GCAGACCATT TGAAGTATTA AGTGATCACA      3900
     AGCCACTGGT ATGGCTCAAC AACATTAAAG AACCAAACAT GAAATTGCAA AGATGGAAAA      3960
     TAAAACTTAA TGAATTCGAT TATAAAATCA AATATCTTCC AGGCAAAGAA AACCATGTCG      4020
     CGGATGCTCT TTCCCGCACG AAAATAGAAG TTATGGTTGG CGAGGTCGCA AATAGCGCAG      4080
     ACGCAACTAT ACACAGTGCC ATTGAAGATA ATCTAAATTA CATACCCATA ACAGAAAGAC      4140
     CAATAAATTA CTTCTCTAGA CAAATAGAGA TAGAAAAAGG CGATAACGAT ACAACAAGTG      4200
     TACAACATTT GTTTCAAAAA TTAAAGATTA AGATAGTCTA TAAAGAAATG ACACCTGAAC      4260
     TCGCCAAAAA CCTCATTAAG GAATATGTGT GCACCAAAAA GAGTGCAATT TATTTCCCTA      4320
     ATGACGAAGA TTTTCTGATC TTCCAGAGAG CGTTTACCGA AATTATAAGC CCTAACAATT      4380
     TCACAAAACT CTTGAGATGT ACCACAAAGT TAATTGATAT ACTAACGTAT GCAGAATTCA      4440
     AAGATTTAAT CTTAAAGAAA CATAAGGAAC TTTTACATCC GGGTATAGAA AAAACAATCA      4500
     ATTTATTTAA AGAAGAATAT TACTATCCTG ATAGTCAAAA GCTTATTCAA ACCATTATCA      4560
     ATGAATGTCA AATTTGTTAT CTAGCAAAAA CGGAACATCA AACACAAATG ACATATGAGA      4620
     CTACACCAGA AATATTTAAC ACAAGAGAAA AATACATGAT AGATTTTTAT CTCACAGGAA      4680
     ACCAGATCTT CTTATCTTGC ATTGATATCT ATTCGAAATT TGCATCACTA GTTGAATTAA      4740
     AAAGTAGAGA TTGGCTAGAA GCAAAAAGAG CCATTACTAA AATATTCAAT GACATGGGAA      4800
     AACCGCAAGA AATTAAAGCA GACAAAGACT CAGCTTTTAT GTGTTTAGCC TTACAAAATT      4860
     GGTTAAGATC TGAAGGTGTA CAAATTTCTA TAAGCACTAG CAAAAATGGT ATATCTGATA      4920
     TAGAAAGATT CCACAAGACC GTAAACGAAA AGCTAAGAAT CATTGGTAGC CAACAAAATG      4980
     TTGAAGATAG GTGCACAAAA TTCGAAAGAA TTCTATACAT ATACAATCAC AAAACTAAAC      5040
     ATAATAGTAC TAAAAGATTT CCAGCAGACA TTTTCCTATA TGCAGGCAGT CCAGATTTTA      5100
     ATGTACAACA AAACAAAATC GATAGGATAG AATACCTCAA TAAGAATAGA CACGATTTTG      5160
     AAGTTGATAT AAAATATAGA CAAGCCCCAC TTGTAAAAAG TAAAATAACC AATCCATTTA      5220
     AAAAGACAGG AAGAATTGGA CAAGTAGATG ATAAACATTT CGAAGAACAA AATCGTGGCA      5280
     GGAAGATCGT TCACTATAAG TCAAAATTTA AGAAACAGAA AAAGTTTAAT AAGAGCAAAT      5340
     ATGATAATTC CAGACCAACC AAAGAAGCAC AAAGTACACA ACATACTTCT AATAATGCTT      5400
     AGTTGCATAC TATCACTTAT CATCACGGTC AAGTGCAACA ATATAGAAGT AAATCCAGTA      5460
     AACGCGAAAA ATGGATACCT TATATTCCAA ACAGGAACAA TGGAAATTCC AACCAGCTAT      5520
     GAATACCATT ATTTAAGCAT AAACATAACA AAGACAATGC TCATGTTCGA AGATATAGTA      5580
     AGTGAAGCAA ACAACTATCC TAATGTACCA CAAATACAAT ATTTAGTCGA CAAATTAAAA      5640
     CGAGAAATAA ATGGGTTAAG AATTATTAGT CGAAGTAAAA GAGGTCTTTT AAACGTAGTA      5700
     GGAAAAGCAT ACAAATACTT ATTCGGCACA TTAGATGAGG ATGACAGAGA AGAGTTAGAA      5760
     GAAAAAATAA ACAACATGTC AGAAGACTCT GTAAAAACCC ATGACCTAAA CACGATTCTA      5820
     GATGTAATCA ATAGTGGTAT AGATATAATT AATAAGCTCA AAGTAGATAA AGAACAACAC      5880
     CAACAAATTG CGGTACTAAT ATTTAACCTA GAGCAATTTA CAGAATATAT AGAAGACATA      5940
     GAATTGGGTC TGCAATTAAC CAGACTAGGA ATTTTCAATC CAAGATTACT AAAGCATGAC      6000
     TATTTAAAAC ATGTAAATTC AGAAAAAATG CTAAAGATAA AAACGTCAAC CTGGCTTAAA      6060
     ACAGACACGA ACGAAATTTT GATTATTTCC CATATTCCTA GCGAAGTTAC TAAAGTTCCA      6120
     ATATTCCAAA TTGTTCCGTA CCCAGATGAA CATAATTATA TTCTAACCGA GCAAATATTC      6180
     GATAAATTCT ACATATTTGA TAACCAAGTA TTCCATAAAG ATACCAATAG GGATATATTC      6240
     GACAAATGTA TTATTGGAAT CATCAAACAA GAGCAAACTC AATGCAAATA TATTAAAACA      6300
     CATAAAAATT ACCAAATAAA TTATATAGAA CCAAATATAC TATTAACATG GAATATTCCT      6360
     GAAACAGCTG TTAACCAAGA CTGTACACAC AATAAAATAT TAATTTCAGG AAACAACATC      6420
     ATTAAAATTA AAAATTGTAC CATACAAATA GATGAATTCT TAATCTCTAA TAATCTAGCA      6480
     GACTTTACAC AAACAATTTA TATCACCAAC AATGTAACAC GTCTAGAACC AATAAATCAC      6540
     TTACAAACGA GAGAAATGAT AGAAACCCAT GTAAAACACT ATAACTTTTT TCAAATTATA      6600
     TGCATTACAA CGTTCGTCAT AATGATAATT AGTTTGACTC TGTATGTAGC ATATAAGTTT      6660
     AAAAATATAC CTAAGAAAAT TATTGTCAAT ATCGTAAGCA AAAAGAACAC ACGCACCTTG      6720
     AAAATAATGT CAATGAAAAT ATTCAACAAG GAAATAATAT TACCTTATAC CCAAATTTAA      6780
     CGACCTGAGG ACAGGCCAAA TTCAAAGGTT GGGGGAGTGA CATATCCATA AGTCCCTAAG      6840
     ACTTAAGCAT ATGCCTACAT ACTAATACAC TTACAACACA TACACCCCAA TACAACATAC      6900
     ACTACTCCGG ATGTACCCAA CAGATACCAG ATAAGAATAA GATTGTTATA TGATCCTCGA      6960
     GAATGGAAAA AACCCCAATT CTAGATAAGT CACCCACTGG TAGACTAAAC ATCCGTTCCC      7020
     CTAATTTAAA CAATTCCTTG CTTAAGCCTC ACCCCATCGT CACATTCCCA CGTTCAAAGC      7080
     TCGGAGCCGC AATCCCGAAA AACAAAAGTA TCGATTTCAA TAAACAAATT ATAAGAATCT      7140
     AAGAGCACTT GTATCCAAGA GCAAATGCAC TTGAATCCAA GAGAAACGCA AAGCTTTTTC      7200
     TCTTTACGAT CAGAATCCTA AAGTCTAAAG TCCATATTAG AAAAGCTCGA TACCGAGGCT      7260
     TGAACGTCAA CCAAATCAGA ATAATTATCA GAGTTCAGTT TGAGACCTAA TTGTAAAAGG      7320
     TTCGGTGTTC TTCTCAAATA AAAAGATTGT AATCATTTAG TGAAATAAAA ATTATATTTT      7380
     TTTCACTTAT AAATATTGCA AGTATTTAAT T                                     7411
//
ID   DMIS176    standard; DNA; INV; 7439 BP.
XX
AC   X01472; J01060; J01061;
XX
DR   FLYBASE; FBte0000109; Dmel\17.6.
XX
FT   source          X01472:1..7439
FT   SO_feature      five_prime_LTR ; SO:0000425:1..512
FT   SO_feature      three_prime_LTR ; SO:0000426:6928..7439
FT   SO_feature      TATA_box ; SO:0000174:372..377
FT   SO_feature      TATA_box ; SO:0000174:7271..7277
FT   SO_feature      primer_binding_site ; SO:0005850:511..529
FT   SO_feature      polyA_signal_sequence ; SO:0000551:372..377
FT   SO_feature      polyA_signal_sequence ; SO:0000551:7299.7304
FT   SO_feature      RR_tract ; SO:0000435:6917..6927
FT   SO_feature      CDS ; SO:0000316:1074..2393
FT                   /name="Dmel\17.6\gag"
FT                   /db_xref="FLYBASE:FBgn0044339"
FT                   /db_xref="SWISS-PROT:P04282"
FT                   /db_xref="NCBI_PROTEIN:CAA25701.1"
FT                   /translation="MAQEPAIVPPLSDSNMTQVAYQIGNVEKFNGDPGSLYTFVSRIDY
FT                   ILALYATGDERQQQIIFGHIERSISGEVMRCIGAYDMYTWQQLRRQLVLNYKPQTPNHV
FT                   LLEEFRKTPFRGNVRAFLEEAESRRQTLTSKLELEQDLEEKTFYLKLIKSSIESLIEKL
FT                   PTHIYLRINNHNIPDLRSLINLLQEKGMYEQINHTSTHVQKQNFSDKPQKSFNQNTNQS
FT                   NNIRKYPTPFLHYNSPIPYQAPQIYQTPPTNNPLYRHPIPYHPNPNNVFQPSQQNNVFQ
FT                   PSQQNNAFQPNQRTNFTSRPIFNTNRNNAFDQNRFGQQPQYQNQQSTQNSSSYVPNRPI
FT                   KRLRPANSGQTGMSVDETLYQEDAFYQQCVPYDYFYYPTYDHSDYYPENQYQIDENNQN
FT                   LQRTQQLQQINTDETNNDNQEPNVEQAENFQPQALENPNI"
FT   SO_feature      CDS ; SO:0000316:2345..5518
FT                   /name="Dmel\17.6\pol"
FT                   /db_xref="FLYBASE:FBgn0014453"
FT                   /db_xref="SWISS-PROT:P04323"
FT                   /db_xref="NCBI_PROTEIN:CAA25702.1"
FT                   /translation="TGRKFSATSLGKPQYITIKYKENNLKCLIDTGSTVNMTSKNIFDL
FT                   PIQNTSTFIHTSNGPLIVNKSIIIPSKILFPTTNEFLLHPFSENYDLLLGRKLLAEAKA
FT                   TISYRDQEVTLYNNKYKLIEGIATHEQSHFQNVNMIPDTMLRQPNKISPILESDLYRLE
FT                   HLNNEEKQRLCALLQKYHDIQYHEGDKLTFTNQTKHTINTKHNLPLYSKYSYPQAYEQE
FT                   VESQIQDMLNQGIIRTSNSPYNSPIWVVPKKQDASGKQKFRIVIDYRKLNEITVGDRHP
FT                   IPNMDEILGKLGRCNYFTTIDLAKGFHQIEMDPESVSKTAFSTKHGHYEYLRMPFGLKN
FT                   APATFQRCMNDILRPLLNKHCLVYLDDIIVFSTSLDEHLQSLGLVFEKLAKANLKLQLD
FT                   KCEFLKQETTFLGHVLTPDGIKPNPEKIEAIQKYPIPTKPKEIKAFLGLTGYYRKFIPN
FT                   FADIAKPMTKCLKKNMKIDTTNPEYDSAFKKLKYLISEDPILKVPDFTKKFTLTTDASD
FT                   VALGAVLSQDGHPLSYISRTLNEHEINYSTIEKELLAIVWATKTFRHYLLGRHFEISSD
FT                   HQPLSWLYRMKDPNSKLTRWRVKLSEFDFDIKYIKGKENCVADALSRIKLEETYLSEQT
FT                   QHSAEEDNSDLIFITERPLNTFNRQVIFSKGPPDIKVTKYFKKHITQIFYDIMTREKAE
FT                   QYLIDHFCGKKSALYIESDADFEVIQAAHKLAINTKYTKILRSTILLKNITTYAEFKEL
FT                   ILTAHEKLLHPGIQKTTKLFGETYYFPNSQLLIQNIINECSICNLAKTEHRNTDMPTKT
FT                   TPKPEHCREKFMIDIYSSEGKHYVSCIDIYSKFATLEEIKTKDWIECKNALMRIFNQLG
FT                   KPKLLKADRDGAFSSLALKRWLESEEVELQLNTTKTGVADIERLHKTINEKIRIIKTSD
FT                   DEETKLSKMETVLNIYNHKTKHDTTGQTPAHIFLYAGQPILDTQQNKENKINKINNDRV
FT                   EYEVDTRYRKGPLQKGKLENPFKPTKNVEQTDSDHYKITNRNRITHYYKTQFKKRKKNN
FT                   QLSISQAPGT"
FT   SO_feature      CDS ; SO:0000316:5488..6903
FT                   /name="17.6\env"
FT                   /db_xref="FLYBASE:FBgn0027624"
FT                   /db_xref="SWISS-PROT:P04283"
FT                   /db_xref="NCBI_PROTEIN:CAA25703.1"
FT                   /translation="SALNFTGTWHLITLLLMLITTVHGQQIEINNIDTNHGYLLFSDKP
FT                   VQIPSSFEHHCLRINLTEIDTIADYFEQRLRTDYHAPQVKFLYNKMRRELAGIALRHRN
FT                   KRGLINIVGSVFKYLFGTLDENDRVDIQRKLETNAHNSVNLHELNDAIQLINDGMQKIQ
FT                   NYENNSNIINSLLYELMQFTEYIEDVEMGMQLSRLGLFNPKLLNYDKLENVNSQNILNI
FT                   KTSTWINYNDNQLLIISHIPINFSLINTVKIIPYPDSNGYQLEYTDTQSYFERENKVYN
FT                   NENKEINNECVTNIIKHLKPICNFESIHTDEIIKYIEPNTIVTWNLTQTSLKQNCQNSF
FT                   NNIKIKGNKMIKVTQCKIEINSIILSENLFKPEIDLTPLYTPLNITKIKTVKHNDINEM
FT                   ISQNNITLYIFMTTVIIILILLYLYLRYVSFNPFMMLYAKLKLRKNQNQNTAQQIEMED
FT                   VPLPLLYPSIPAQV"
XX
CC   Derived from X01472 (g8142) (Rel. 36, Last updated, Version 2).
CC   Takis Benos and Michael Ashburner, 20-Aug-1997.
CC   Any changes to original sequence record are annotated in an FT line.
XX
SQ   Sequence 7439 BP;  2985 A; 1512 C; 1048 G; 1894 T; 0 other;
     AGTGACATAT TCACATACAA AACCACATAA CATAGAGTAA ACATATTGAA AAGCCGCATA        60
     CGTAAACAAT AAGTGACCAC CATGCTAATG TGGATCAAAT AACAAAAATA TCCACTCTGC       120
     ATTTTGACAC CCCCATACTG TATGCCATCT GCGCAGTATG CATTCTAATA AACAAATTCT       180
     TTGACAGCGG CACTTAGCCA TTCTTGTAAA CAAATCTTAA AGTCTGCCTG CTCTCTCTGA       240
     GGCTTCTCCT CCACTTAAGA ATCCAAGAGC AATGCTCTCC CAAAAACACT AACATATTCT       300
     TTAAGCAAGC ACAGAGGCTT CTCCTCATTT TCACTTTCAT TTGATTTTCA GTCTTAAGCT       360
     GAACGTTAAT CAATAAACAA CACAATCGAT ACCGAAATTT TGATTCGTTT TATTTTGGCA       420
     AAACTCAATT TTCAGCGTTG GTCTTAGTTC ATATTCGGAA CGGTCCATTT AATAGACTCA       480
     AAACTATTTA TTGCAACCAT TTATTTGCAA TTGGCGCAGT CGATGTGATC AGTGTTAAAG       540
     TTCCTTGATG CGGTAACCAG ATTTGCCAAT TCCTGTGTTC TTTTTGTTCT CTGACAAAAG       600
     TACCACGATA ACGGGCACCC ACGTGACGGT TAATATCGCT TTAAGTTTTT AATTAAACCT       660
     CGACAATAAA GTGAAACCGA AAAATCACAA TTTGCCTAAA CAAACCTGAA TTTATTATCA       720
     GGAAGACGCT ATTGAATTTG TGAGAGGCTG TAAATCCAAT TGGTTACCTC AAAGACCCAC       780
     GAAAAAGCTA TAGTGCAACC CTTGCGAAAA TCAAAACCTA TCTTAAAAAA AAAAAAAAAA       840
     TATAAATAAT AAATTAATAA GCGAAAATTA AAACGTATTA AAAGTAAGAA TAATAAATAA       900
     ATAAGTGAAA ATTCTATATG ATAAAAATTA AAAATAAGAA TAATAAATAA AAAGACAACA       960
     TTTTAAATTA AACAATATTA AAAAAATATA AAAATATTAA AAACTATATT AAAAAAAAAA      1020
     AAAAAACAAA AAAACAAAAA AAAAAAAATA AATAAATAAT CCAAAAATCA AAAATGGCTC      1080
     AAGAACCAGC AATTGTGCCA CCACTATCAG ACAGCAACAT GACCCAGGTT GCCTACCAGA      1140
     TTGGCAATGT GGAGAAATTC AACGGTGATC CAGGCTCACT ATACACCTTT GTGAGTCGAA      1200
     TTGATTACAT ACTGGCTCTT TATGCTACCG GAGATGAACG CCAACAGCAG ATCATATTTG      1260
     GGCATATTGA ACGCAGCATC AGCGGAGAAG TTATGCGCTG CATTGGAGCC TATGACATGT      1320
     ACACCTGGCA GCAGCTTAGA AGACAATTGG TACTCAACTA TAAACCCCAG ACCCCTAACC      1380
     ACGTTCTTTT AGAAGAGTTT CGAAAGACCC CATTTCGAGG CAATGTACGA GCATTCCTGG      1440
     AAGAAGCAGA AAGCCGCAGA CAAACACTTA CTAGTAAGCT TGAATTAGAG CAAGATCTTG      1500
     AAGAAAAGAC TTTTTATTTG AAATTAATAA AATCCAGTAT AGAATCACTA ATTGAAAAAT      1560
     TACCTACACA CATTTATTTA AGAATAAATA ACCACAACAT ACCAGATTTG CGATCACTTA      1620
     TAAACCTTTT ACAAGAGAAG GGCATGTACG AACAAATAAA TCATACAAGT ACACATGTCC      1680
     AAAAACAAAA TTTCTCTGAT AAGCCACAAA AGTCCTTTAA TCAAAATACT AATCAGTCTA      1740
     ACAATATCAG AAAATATCCA ACACCTTTCC TACATTATAA TTCACCAATA CCATATCAAG      1800
     CTCCACAAAT TTATCAAACA CCACCAACTA ATAACCCACT TTATCGTCAT CCAATACCCT      1860
     ACCACCCTAA TCCAAACAAT GTTTTTCAAC CAAGCCAACA AAACAATGTT TTCCAACCAA      1920
     GCCAACAAAA CAATGCTTTT CAACCAAATC AACGAACAAA CTTTACATCT CGACCAATTT      1980
     TTAACACCAA TCGAAACAAT GCATTCGATC AGAATAGGTT CGGACAACAA CCCCAATATC      2040
     AAAATCAACA ATCAACACAA AATTCAAGTT CCTATGTACC CAATCGACCA ATAAAACGAT      2100
     TAAGACCAGC TAATAGTGGA CAGACTGGGA TGAGTGTTGA CGAAACATTA TATCAAGAGG      2160
     ACGCTTTTTA TCAGCAGTGT GTTCCATATG ACTATTTTTA TTATCCAACT TACGACCATT      2220
     CAGACTATTA TCCAGAAAAT CAATATCAAA TTGACGAAAA CAACCAAAAT TTACAAAGAA      2280
     CACAACAGTT ACAGCAGATT AATACAGACG AGACAAACAA TGACAACCAA GAACCCAATG      2340
     TTGAACAGGC CGAAAATTTT CAGCCACAAG CCTTGGAAAA CCCCAATATA TAACAATTAA      2400
     ATACAAAGAA AATAATTTGA AATGCCTTAT TGATACCGGA TCAACAGTTA ACATGACATC      2460
     TAAAAATATA TTTGATTTAC CAATCCAGAA TACTAGTACT TTTATTCATA CCAGCAATGG      2520
     ACCGCTCATT GTCAACAAAA GTATAATCAT ACCTTCAAAG ATTTTGTTCC CAACAACAAA      2580
     TGAATTTTTA TTGCACCCTT TCTCTGAGAA TTACGATCTT TTATTAGGAA GAAAACTTTT      2640
     AGCAGAAGCA AAAGCAACAA TAAGTTACCG CGATCAAGAG GTAACTCTTT ACAACAACAA      2700
     ATACAAATTA ATAGAAGGAA TAGCAACACA TGAACAGAGT CATTTTCAAA ATGTAAATAT      2760
     GATACCTGAC ACCATGCTCA GACAGCCAAA TAAAATTTCA CCCATTTTAG AATCAGACCT      2820
     ATACAGATTG GAACATTTAA ATAACGAAGA AAAACAAAGA TTGTGCGCAC TCCTGCAGAA      2880
     ATACCATGAC ATACAGTACC ATGAAGGTGA TAAGTTGACA TTTACTAATC AAACCAAACA      2940
     TACTATCAAT ACAAAGCACA ATCTACCACT TTACTCTAAA TACAGTTACC CACAGGCTTA      3000
     TGAACAGGAG GTCGAAAGCC AAATACAAGA TATGCTAAAT CAAGGTATTA TACGTACCAG      3060
     TAATTCACCT TACAATAGCC CCATCTGGGT GGTTCCAAAG AAACAAGATG CATCAGGCAA      3120
     ACAGAAATTT AGAATTGTAA TAGACTACCG AAAATTAAAT GAAATAACAG TAGGAGACAG      3180
     ACACCCAATC CCAAACATGG ACGAAATCTT GGGAAAATTG GGCAGATGTA ATTACTTCAC      3240
     AACTATAGAC TTGGCAAAGG GTTTCCACCA GATCGAAATG GATCCAGAAT CAGTTTCAAA      3300
     GACAGCCTTT TCTACCAAGC ACGGTCATTA TGAATATTTG CGCATGCCAT TCGGATTAAA      3360
     AAACGCGCCA GCCACCTTTC AACGGTGCAT GAATGATATT TTAAGACCAC TCTTAAACAA      3420
     ACACTGTCTT GTGTATTTGG ACGACATAAT TGTATTCTCG ACATCCCTTG ATGAACACCT      3480
     GCAATCGCTC GGACTAGTTT TCGAAAAATT AGCAAAAGCC AACCTTAAAT TACAACTTGA      3540
     CAAATGTGAG TTTCTCAAGC AAGAAACCAC ATTTTTAGGA CATGTTCTAA CACCAGATGG      3600
     AATAAAACCA AACCCTGAAA AAATTGAAGC CATTCAAAAA TATCCAATTC CCACTAAACC      3660
     AAAAGAAATA AAAGCTTTTC TTGGACTGAC AGGATATTAT CGTAAATTTA TTCCAAACTT      3720
     TGCAGACATA GCCAAACCCA TGACTAAGTG TTTAAAAAAG AACATGAAAA TTGACACTAC      3780
     CAACCCAGAA TATGACTCTG CATTTAAAAA ATTAAAATAT CTAATATCAG AAGACCCAAT      3840
     TCTTAAAGTA CCCGACTTTA CAAAGAAATT CACTTTAACC ACAGACGCAA GTGATGTCGC      3900
     TTTGGGGGCA GTACTGTCAC AAGATGGACA CCCACTTAGC TACATTAGCC GAACACTTAA      3960
     TGAACACGAA ATAAATTACA GCACAATTGA AAAAGAACTC TTAGCAATTG TATGGGCGAC      4020
     AAAGACTTTT CGACACTACC TACTTGGAAG ACACTTTGAA ATATCCAGTG ACCATCAACC      4080
     ATTGAGCTGG TTGTACCGTA TGAAAGACCC AAATTCAAAA CTGACCCGAT GGAGAGTAAA      4140
     ATTATCCGAA TTCGATTTTG ATATAAAATA TATAAAAGGA AAAGAAAATT GCGTGGCGGA      4200
     TGCTCTGTCC AGAATAAAAC TTGAGGAGAC ATATTTGAGC GAACAAACCC AACATAGTGC      4260
     AGAAGAGGAC AATAGTGATT TAATTTTTAT TACAGAAAGA CCTCTAAATA CATTTAACAG      4320
     ACAAGTTATA TTTTCAAAAG GACCACCAGA CATTAAAGTT ACGAAATATT TCAAAAAACA      4380
     CATCACCCAA ATATTTTACG ACATTATGAC CAGGGAAAAA GCCGAACAAT ATTTGATAGA      4440
     CCATTTTTGT GGTAAGAAAA GTGCGTTGTA TATTGAGAGT GACGCTGATT TCGAAGTCAT      4500
     TCAAGCCGCA CATAAATTAG CCATAAACAC CAAATATACA AAAATCCTGC GTAGCACGAT      4560
     TTTGTTAAAA AACATAACCA CTTATGCGGA ATTTAAGGAA TTGATCTTGA CTGCTCATGA      4620
     AAAACTTCTA CACCCAGGCA TACAGAAAAC TACTAAACTT TTCGGAGAAA CTTACTATTT      4680
     CCCTAATAGC CAGCTACTTA TTCAGAATAT AATAAATGAG TGCAGTATTT GCAATCTGGC      4740
     AAAAACAGAG CACCGAAATA CAGACATGCC AACGAAAACC ACACCCAAAC CAGAACATTG      4800
     CCGCGAAAAA TTCATGATAG ACATTTACTC ATCCGAAGGC AAACATTACG TTAGTTGCAT      4860
     AGACATTTAT TCGAAATTTG CCACATTAGA AGAAATAAAA ACAAAAGACT GGATAGAATG      4920
     CAAAAACGCG CTTATGCGCA TATTCAACCA GCTTGGCAAG CCAAAGTTAC TAAAGGCGGA      4980
     CAGAGACGGC GCATTTTCCA GTTTAGCCCT CAAGAGATGG CTGGAGAGTG AGGAAGTCGA      5040
     ATTGCAGCTT AACACAACAA AAACTGGTGT GGCGGACATA GAAAGACTAC ATAAAACAAT      5100
     TAATGAAAAG ATTCGCATAA TCAAAACATC CGATGACGAA GAAACCAAAT TGAGCAAAAT      5160
     GGAAACAGTA CTTAACATAT ACAATCATAA AACCAAACAC GACACCACTG GACAGACCCC      5220
     TGCACACATA TTTCTCTACG CTGGACAACC AATATTAGAT ACCCAACAAA ACAAAGAAAA      5280
     CAAAATAAAC AAAATAAATA ATGACAGAGT GGAGTACGAA GTCGACACAA GATACAGAAA      5340
     AGGTCCACTA CAGAAAGGCA AATTAGAAAA TCCTTTTAAG CCAACAAAAA ATGTGGAGCA      5400
     GACTGACTCT GATCATTATA AAATTACTAA TAGAAATAGA ATTACTCACT ACTACAAAAC      5460
     ACAATTCAAA AAACGAAAGA AAAATAATCA GCTCTCAATT TCACAGGCAC CTGGCACTTG      5520
     ATAACATTGC TGCTGATGCT GATCACAACA GTTCATGGAC AACAAATTGA AATTAATAAT      5580
     ATTGACACAA ACCACGGATA TCTCCTTTTT TCTGATAAAC CAGTCCAGAT ACCATCATCC      5640
     TTTGAACATC ATTGCTTGAG AATCAATTTA ACTGAAATAG ACACCATAGC TGATTATTTT      5700
     GAGCAAAGAC TACGTACCGA CTACCATGCA CCCCAGGTCA AATTTTTATA CAACAAAATG      5760
     AGAAGAGAAC TAGCTGGAAT AGCCTTGCGA CATAGAAATA AACGGGGACT TATTAACATT      5820
     GTAGGTTCAG TTTTTAAATA CCTATTTGGC ACACTTGACG AAAATGATCG AGTGGATATA      5880
     CAGAGGAAAC TTGAAACAAA CGCCCATAAC TCGGTAAATT TACATGAACT CAATGACGCT      5940
     ATTCAATTAA TAAATGACGG AATGCAAAAG ATACAGAATT ATGAAAACAA CAGCAACATC      6000
     ATTAACAGTC TTTTATATGA ACTCATGCAG TTTACAGAAT ACATAGAAGA TGTGGAAATG      6060
     GGAATGCAGC TTTCCAGACT CGGTCTATTT AATCCCAAAC TACTAAACTA CGATAAACTT      6120
     GAGAATGTAA ACAGCCAAAA TATTTTAAAC ATTAAAACAT CCACTTGGAT TAATTACAAT      6180
     GATAACCAAT TATTAATCAT ATCTCACATA CCTATTAACT TTTCATTAAT AAATACAGTA      6240
     AAAATAATCC CTTACCCAGA CTCGAACGGC TATCAGCTAG AATACACAGA CACACAATCA      6300
     TATTTTGAAA GAGAAAATAA AGTTTACAAT AACGAAAATA AAGAAATAAA CAATGAGTGT      6360
     GTCACCAACA TTATTAAACA TTTAAAACCA ATTTGTAATT TTGAGTCAAT CCACACAGAT      6420
     GAAATAATAA AATACATAGA ACCAAACACA ATTGTAACCT GGAATTTAAC CCAAACAAGT      6480
     CTCAAACAAA ATTGTCAAAA TTCATTTAAT AATATAAAAA TAAAAGGAAA CAAAATGATA      6540
     AAAGTAACCC AATGTAAAAT AGAAATCAAT AGCATAATTC TAAGTGAAAA TCTCTTTAAA      6600
     CCAGAAATAG ATTTGACACC ATTATACACA CCACTTAACA TAACAAAAAT AAAAACTGTT      6660
     AAACACAACG ACATTAATGA AATGATTTCA CAAAACAATA TTACACTTTA CATATTTATG      6720
     ACTACTGTCA TCATTATACT TATTTTATTG TACTTATATT TAAGATACGT ATCATTTAAC      6780
     CCATTCATGA TGCTGTATGC AAAACTAAAA TTAAGAAAAA ATCAAAATCA AAACACAGCA      6840
     CAACAAATAG AAATGGAAGA CGTTCCATTA CCCCTACTAT ATCCATCAAT CCCAGCCCAA      6900
     GTATAGGCTT CTCTTTAAGG GAAGGGAAGT GACATATTCA CATACAAAAC CACATAACGT      6960
     AGAGTAAACA TATTGAAAAG CCGCATACGT CAACAATAAG TGACCACCAT GCTAATGTGG      7020
     ATCAAATAAC AAAAATATCC ACTCTGCATT TTGACACCCC CATACTGTAT GCCATCTGCG      7080
     CAGTATGCAT TCTAATAAAC AAATTCTTTG ACAGCGGCAC TTAGCCATTC TTGTAAACAA      7140
     ATCTTAAAGT CTGCCTGCTC TCTCTGAGGC TTCTCCTCCA CTTAAGAATC CAAGAGCAAT      7200
     GCTCTCCCAA AAACACTAAC ATATTCTTTA AGCAAGCACA GAGGCTTCTC CTCATTTTCA      7260
     CTTTCATTTG ATTTTCAGTC TTAAGCTGAA CGTTAATCAA TAAACAACAC AATCGATACC      7320
     GAAATTTTGA TTCGTTTTAT TTTGGCAAAA CTCAATTTTC AGCGTTGGTC TTAGTTCATA      7380
     TTCGGAACGG TCCATTTAAT AGACTCAAAA CTATTTATTG CAACCATTTA TTTGCAATT       7439
//
ID   DMTN1731   standard; DNA; INV; 4648 BP.
XX
AC   X07656;
XX
DR   FLYBASE; FBte0000003; Dmel\1731.
XX
FT   source          X07656:1..4648
FT   SO_feature      five_prime_LTR ; SO:0000425:1..336
FT   SO_feature      three_prime_LTR ; SO:0000426:4313..4648
FT   SO_feature      TATA_box ; SO:0000174:110..116
FT   SO_feature      primer_binding_site ; SO:0005850:342..352
FT   SO_feature      CDS ; SO:0000316:431..1252
FT                   /name="Dmel\1731\gag"
FT                   /db_xref="FLYBASE:FBgn0020768"
FT                   /db_xref="REMTREMBL:CAA30502"
FT                   /db_xref="NCBI_PROTEIN:CAA30502.1"
FT                   /translation="MSNLYQIDKLEDGSYETWSIQMRSVLVHACLWKVVSGESVKPEVD
FT                   TGGAWQSQDEKALATIILSVKSSQLGYVKGCLTAAEAWKVLQDVHQPKGPLRTVMLYKK
FT                   LLSKRLLEGQSISSHIKEFKEIFDALDAVEIGITEKLRSVVLLSSLPESFENFVVAIET
FT                   RDDVPLFDALCIKLIEEDTRRGGAEQQREKQTESAKAFTAVHKPQAPAREARPSAKKRK
FT                   DVVCYNCGERRHFKANCRREKVNKESATQEQCSLLNALDSGGFWQNTVVSR"
FT   SO_feature      CDS ; SO:0000316:1203..4151
FT                   /name="Dmel\1731\RTase"
FT                   /db_xref="FLYBASE:FBgn0012032"
FT                   /db_xref="REMTREMBL:CAA30503"
FT                   /db_xref="NCBI_PROTEIN:CAA30503.1"
FT                   /translation="MRWIVVVFGKTQWCLDSGATSHMCCDRSVFTEFEEHTEKISLAGN
FT                   GFLLAKGIGTVKLKTDLCTLVLNNVLFVPDLNGNFMSVSRAAQYKCFVNFGPHYADVIQ
FT                   EGERILRVMRAGNLYMFQGKHNSCFAAVDADGSLWHKRNGHLNTSSLQEMVRKKMVYGV
FT                   EKVVFKPDAVCKTCMLAKIHVQPFPKTTRSRAEELLDMIHSDLCGPFSTPSLAGSKYFL
FT                   TFIDDKSRRIFVYFLRKKDEVFTKFVEFKKLVERQTGRKIKCIRSDNGGEFVNNVFDDY
FT                   LKAHGIARQLTIPHTPQQNGVAERANRTLVEMARCMLLQSELGEALWAEAINTAVYLRN
FT                   RSTSRALQSKTPMEEWTGKIPAVSHLRVFGAIAVALDKGVHKGKFESKGKEYRMIGYSI
FT                   AAKGYRLFDKEKRCVIEKQDVLFDESGSLVNHGNTIEFQFPATDDPEPQSDSNAREGDD
FT                   TEPVGSSDDYESAAEAEEAEVHVGPGRPKIVRTGRPGRPKKQYNVLGVLMASDVEIPKS
FT                   YEEAINSQYSAKWEEAMGLEYKALLANETWKLADLPRNRRCVACKWVYSLKRDVSGRIE
FT                   RFKARLVAKGCSQKFGVDYFETFSPVCRLESVRLILALAAEMQLYLHHMDVCTAYLNSE
FT                   LKDTVYMKQPQGFTDAANPDQVLLLRKAIYGLKQSGREWNSKLDGVLKDLGFKACNHEP
FT                   CLYQQSGQGNLMLILVYVDDLILACQSREDMEDLKAKISESFECTDKGPLHLFLGMEVQ
FT                   RDGDLGEITLGHSQYIKELLRDYGSENCRPATTPLDAGHQVLCAGEQCQKVDAGQYQST
FT                   IGELMWLGLTTRPDMLHSVAKLAQRNQDPHSEHMVAVKHILRYLASTVDVKLHYQKCGQ
FT                   AFTGFVDADWGGDRLDRKSYTGYVFFLSGGPVSWRSEKQQSVALSSTEAEYMALTTACK
FT                   EAIALRRLIVEIVCGDLKTPTVMHGDNLKCAAQLAKNPVHHSRTKHIDIRYH"
XX
CC   Derived from X07656 (g8700) (Rel. 36, Last updated, Version 6).
CC   Takis Benos and Michael Ashburner, 20-Aug-1997.
CC   Any changes to original sequence record are annotated in an FT line.
XX
SQ   Sequence 4648 BP;  1316 A; 880 C; 1268 G; 1184 T; 0 other;
     TGTTGAATAT AGGCAATGCC CACATGTGTG TTGAATATAG GCAATTTCCA CATGTGCATA        60
     TGTAATTTTG TATGAGAACA TACATACATA CACATGAACT GTATGTATGT ATATATATTA       120
     GCAAATAAGC AGCCGCATGA AGGTGGCATT TTTATGTGTA TCAGTTTCAG TTTCAAATAA       180
     AACTTCTTCG TGTTCGGACA CGCGGCTCAA GACTTTTTAT TTCGCGTTTA CTCTTTCAGC       240
     CTTTGCTCTC AATTCGCTGA GTTTGGGTGA AGATTAGGAT CTTCCCATTA TGATTGTCAG       300
     TGTTCCACAC TTGGAGCACC TTTTCAATAA ACAACAGGTT AATGGGCCCA GCGCCCTAGG       360
     AGCTGCCTAA AGGAGAAACG TGTAGTGAAA CTCAGGAGTT AGATTTTGGA GTCTACTCAA       420
     GATTGCCGGA ATGAGTAACC TGTATCAGAT CGATAAGCTG GAGGATGGAT CCTATGAAAC       480
     GTGGAGCATC CAGATGCGTT CAGTGTTGGT GCACGCATGT TTGTGGAAGG TGGTTTCAGG       540
     AGAGTCCGTG AAACCTGAGG TTGATACTGG AGGTGCTTGG CAATCCCAAG ATGAAAAAGC       600
     ATTGGCCACG ATCATCTTGA GTGTGAAGTC TTCGCAACTT GGTTATGTAA AAGGGTGTCT       660
     CACTGCGGCT GAGGCATGGA AAGTTTTACA GGATGTCCAC CAGCCGAAAG GGCCGTTACG       720
     AACGGTCATG CTGTATAAGA AGTTGCTGAG CAAACGTCTG TTGGAAGGGC AGAGTATATC       780
     GTCACATATT AAAGAATTTA AGGAAATCTT TGATGCCCTT GATGCGGTGG AAATTGGTAT       840
     CACCGAGAAA TTGCGCAGTG TTGTTTTGCT GTCGAGCCTT CCAGAGAGTT TCGAGAATTT       900
     CGTTGTCGCC ATTGAGACGC GCGACGACGT GCCGCTTTTC GATGCTCTAT GTATAAAGCT       960
     GATCGAGGAA GACACGAGAA GGGGAGGAGC GGAGCAGCAG AGAGAAAAAC AAACGGAGAG      1020
     CGCAAAGGCA TTTACTGCAG TACATAAGCC ACAGGCGCCG GCGAGAGAAG CTCGGCCGAG      1080
     CGCAAAGAAG AGGAAAGACG TAGTTTGTTA TAACTGTGGA GAGCGTAGGC ATTTTAAAGC      1140
     GAACTGTCGT CGCGAGAAAG TAAACAAAGA GAGCGCGACA CAAGAACAAT GCAGTTTGTT      1200
     AAATGCGCTG GATAGTGGTG GTTTTTGGCA AAACACAGTG GTGTCTCGAT AGCGGGGCTA      1260
     CCAGTCACAT GTGCTGTGAC AGAAGTGTTT TTACTGAGTT TGAAGAGCAC ACTGAAAAAA      1320
     TTAGTCTTGC TGGAAATGGA TTCCTACTAG CAAAGGGCAT AGGAACAGTG AAGCTGAAGA      1380
     CTGATTTATG TACTCTGGTA TTGAATAACG TACTCTTCGT CCCAGATTTG AACGGCAACT      1440
     TTATGTCAGT CAGCCGTGCA GCTCAGTATA AATGTTTTGT CAATTTTGGA CCACATTACG      1500
     CTGACGTCAT TCAGGAAGGC GAGCGAATAC TGCGTGTAAT GAGAGCTGGT AATTTATATA      1560
     TGTTTCAAGG GAAACATAAC AGTTGTTTTG CGGCCGTTGA TGCTGATGGT TCACTATGGC      1620
     ATAAAAGGAA TGGCCATTTG AATACAAGCA GCCTACAGGA GATGGTGAGG AAGAAGATGG      1680
     TGTACGGTGT TGAAAAGGTC GTTTTCAAAC CAGACGCAGT ATGCAAGACG TGCATGCTGG      1740
     CAAAAATCCA TGTGCAACCA TTTCCGAAGA CAACGAGGAG CAGAGCTGAG GAGCTGTTGG      1800
     ATATGATCCA TTCAGACCTG TGCGGGCCAT TTAGCACACC GTCACTTGCT GGATCAAAGT      1860
     ACTTTCTCAC TTTCATAGAC GACAAGTCCA GGCGGATTTT TGTATATTTC TTGCGGAAGA      1920
     AGGACGAAGT CTTCACTAAG TTTGTCGAGT TTAAGAAACT GGTCGAGCGA CAAACAGGTA      1980
     GAAAGATAAA ATGTATCCGG AGCGATAATG GTGGTGAGTT CGTCAATAAT GTTTTTGATG      2040
     ACTATTTAAA GGCACATGGG ATCGCTAGAC AGCTGACTAT TCCACACACT CCCCAACAAA      2100
     ATGGAGTTGC AGAACGAGCC AACCGCACGC TAGTAGAAAT GGCTAGGTGC ATGTTGCTGC      2160
     AATCGGAGTT GGGTGAGGCT CTATGGGCTG AGGCGATAAA CACTGCGGTG TATCTGAGGA      2220
     ACCGATCAAC GAGCAGAGCA TTACAAAGCA AAACCCCTAT GGAAGAGTGG ACCGGAAAAA      2280
     TACCAGCAGT GAGCCACTTG AGGGTTTTTG GTGCCATAGC AGTGGCATTG GACAAAGGAG      2340
     TCCATAAAGG CAAATTCGAA TCCAAAGGAA AGGAATATCG TATGATTGGA TATTCAATAG      2400
     CTGCTAAGGG GTACCGTCTG TTTGACAAAG AGAAGCGGTG TGTGATCGAG AAGCAAGATG      2460
     TCCTTTTTGA TGAGTCTGGT AGTTTGGTAA ATCATGGAAA TACCATTGAG TTCCAGTTTC      2520
     CCGCAACTGA TGACCCGGAG CCGCAGAGTG ATTCGAATGC ACGGGAAGGT GACGATACAG      2580
     AACCCGTGGG CAGCAGCGAC GACTATGAGA GTGCAGCTGA GGCAGAAGAA GCTGAAGTAC      2640
     ATGTGGGGCC TGGACGGCCA AAGATTGTTC GGACGGGCAG ACCAGGGCGC CCGAAGAAGC      2700
     AATACAATGT ACTTGGCGTG TTGATGGCTA GCGACGTCGA AATTCCCAAG TCCTATGAGG      2760
     AGGCCATCAA TTCGCAGTAT TCTGCAAAGT GGGAAGAGGC AATGGGCCTG GAGTACAAGG      2820
     CGCTACTTGC AAATGAGACA TGGAAGCTGG CTGACTTACC AAGAAATCGC CGGTGTGTGG      2880
     CTTGCAAGTG GGTGTATTCC CTGAAACGAG ACGTCTCTGG TAGAATTGAG CGCTTCAAGG      2940
     CACGACTAGT AGCAAAGGGG TGTTCGCAGA AGTTCGGAGT GGACTACTTC GAGACTTTTT      3000
     CACCCGTGTG CAGGCTCGAG AGTGTGAGGC TCATTTTGGC ATTGGCAGCA GAGATGCAAT      3060
     TGTACTTGCA TCACATGGAC GTATGCACGG CGTACTTAAA TAGCGAGCTA AAGGATACTG      3120
     TGTACATGAA GCAGCCCCAA GGGTTCACAG ATGCTGCTAA TCCCGACCAG GTGTTATTGC      3180
     TGAGGAAGGC AATATACGGC TTGAAGCAGT CAGGCAGAGA GTGGAACTCC AAGCTCGACG      3240
     GTGTTCTAAA AGACTTGGGA TTTAAGGCCT GTAATCATGA ACCATGTCTT TATCAGCAAA      3300
     GTGGTCAAGG TAATCTGATG CTCATCTTAG TATATGTTGA TGATTTAATT CTAGCGTGCC      3360
     AGTCAAGAGA AGATATGGAG GATCTGAAAG CCAAGATTTC AGAGTCTTTC GAGTGCACGG      3420
     ACAAGGGTCC ACTGCATTTG TTCTTAGGCA TGGAGGTGCA ACGAGATGGC GACCTTGGAG      3480
     AAATCACTTT GGGCCATTCG CAATATATCA AGGAACTATT GCGGGATTAT GGCAGCGAGA      3540
     ACTGTAGACC AGCGACGACA CCTTTGGATG CAGGGCATCA AGTTTTGTGC GCGGGTGAGC      3600
     AGTGCCAGAA GGTCGACGCA GGGCAGTATC AGTCTACAAT TGGTGAGCTA ATGTGGCTTG      3660
     GGCTTACTAC CAGACCAGAC ATGCTACATT CGGTGGCGAA GTTGGCTCAG AGGAATCAGG      3720
     ACCCGCATTC TGAGCACATG GTGGCTGTGA AGCACATCCT CCGGTACTTG GCGTCAACTG      3780
     TGGACGTCAA GCTGCATTAT CAAAAGTGCG GTCAGGCATT TACCGGCTTT GTGGATGCAG      3840
     ATTGGGGAGG CGACCGTTTG GACCGAAAGT CATACACAGG GTATGTGTTT TTCCTGTCTG      3900
     GCGGACCAGT ATCATGGAGG TCCGAGAAGC AGCAGAGCGT GGCGTTGAGC AGTACTGAAG      3960
     CCGAGTATAT GGCTCTGACC ACGGCTTGCA AGGAAGCTAT AGCTTTACGA AGGCTAATAG      4020
     TGGAGATCGT ATGCGGTGAT CTGAAGACCC CGACGGTTAT GCATGGCGAC AACCTGAAGT      4080
     GCGCAGCACA GTTAGCGAAG AACCCGGTTC ATCACTCTAG GACGAAGCAC ATCGACATTC      4140
     GATATCATTA GAGAAGTCAT GAAAGAGGGT CACGTTGTGT TAGAGTACAC TTCTACGAAT      4200
     GAGATGATAG CAGACATTAT GACAAAGAAT CTTTCAAAGG GAAAGCATAA TGGGTTTATG      4260
     AAAATGTTAA ATTTGTTTTA ATTTTTGTAA ACATGTTGGC ATTGAGGAAG GCTGTTGAAT      4320
     ATAGGCAATG CCCACATGTG TGTTGAATAT AGGCAATTTC CACATGTGCA TATGTAATTT      4380
     TGTATGAGAA CATACATACA TACACATGAA CTATATGTAT GTATATATAT TAGTAAATAA      4440
     GCAGCCGCAT GAAGCTGGCA TTTTTATGTG TATCAGTTTC AGTTTCAAAT AAAACTTCTT      4500
     CGTGTTCGGA CGCTCGGCTC AAGACTTTTT ATTTCGCGTT TACTCATTCG GCCTTTGCTC      4560
     TCAATGCGCT GAGTTTGGGT GAAGATTAGG ATCTTCCCAT TATGGTTGTC AGTGTTCCAC      4620
     ACTGGGAGCA CCTTTTCAAC AAACCACA                                         4648
//
ID   DMIS297    standard; DNA; INV; 6995 BP.
XX
AC   X03431;
XX
DR   FLYBASE; FBte0000675; Dmel\297.
XX
FT   source          X03431:1..6995
FT   SO_feature      five_prime_LTR ; SO:0000425:1..414
FT   SO_feature      three_prime_LTR ; SO:0000426:6582..6995
FT   SO_feature      TATA_box ; SO:0000174:276..282
FT   SO_feature      TATA_box ; SO:0000174:6857..6863
FT   SO_feature      polyA_signal_sequence ; SO:0000551:304..309
FT   SO_feature      polyA_signal_sequence ; SO:0000551:6885..6890
FT   SO_feature      primer_binding_site ; SO:0005850:414..431
FT   SO_feature      RR_tract ; SO:0000435:6571..6581
FT   SO_feature      CDS ; SO:0000316:803..2047
FT   SO_feature      start_codon ; SO:0000318:1..3
FT                   /name="Dmel\297\gag"
FT                   /db_xref="FLYBASE:FBgn0044338"
FT                   /db_xref="SWISS-PROT:P20828"
FT                   /db_xref="NCBI_PROTEIN:CAA27159.1"
FT                   /translation="MSQPIIALSDINLAEARRQLKDIMPFKGDPETLHTFISRVDYVIS
FT                   LYQTNDVRQQRILLGAIERNLDGQITRSLGLPNVEDWPTLKARLIAEFKIQTPNYKLLE
FT                   NFRETPYRGSLRAFCEEAERRRQLLISKLHLEGNQSDFLIYIQGIKESIKILIRKLPIQ
FT                   LFTILAHHDITDLRSLITIAQNEGIYEEHINFEFYEKPEYRNKNSNSNQNSKTQKFNTN
FT                   VQTQNRPSYSQYSQPFQPNFNQYIQPFRPSYTQQITNNPPMWHAPNYFRPNQYINPQPI
FT                   IQKNHFQQYPNKAQFPQTTHFRGNTYPRLQQPSTYKNTNFPITKRLRPSDSEQTKMSID
FT                   EIRFQDAHEFEQVQPNYYEQQYFNQNQYNPYQNHSFINEGQQQVQFVQINNKQNQNNSE
FT                   LNENFRLTVPENTNT"
FT   SO_feature      CDS ; SO:0000316:<1999..5178
FT                   /name="Dmel\297\pol"
FT                   /db_xref="FLYBASE:FBgn0027622"
FT                   /db_xref="SWISS-PROT:P20825"
FT                   /db_xref="NCBI_PROTEIN:CAB57796.1"
FT                   /translation="TKRKFSVNSSGKYEYIKIVYKGRSYKCLLDTGSTINMINENIFCL
FT                   PIQNSRCEVLTSNGPITLNDLIMLPRNSIFKKTEPFYVHRFSNNYDMLIGRKLLKNAQS
FT                   VINYKNDTVTLFDQTYKLITSESERNQNLYIQRTPESIASSDQESIKKLDFSQFRLDHL
FT                   NQEETFKLKGLLNKFRNLEYKEGEKLTFTNTIKHVLNTTHNSPIYSKQYPLAQTHEIEV
FT                   ENQVQEMLNQGLIRESNSPYNSPTWVVPKKPDASGANKYRVVIDYRKLNEITIPDRYPI
FT                   PNMDEILGKLGKCQYFTTIDLAKGFHQIEMDEESISKTAFSTKSGHYEYLRMPFGLRNA
FT                   PATFQRCMNNILRPLLNKHCLVYLDDIIIFSTSLTEHLNSIQLVFTKLADANLKLQLDK
FT                   CEFLKKEANFLGHIVTPDGIKPNPIKVKAIVSYPIPTKDKEIRAFLGLTGYYRKFIPNY
FT                   ADIAKPMTSCLKKRTKIDTQKLEYIEAFEKLKALIIRDPILQLPDFEKKFVLTTDASNL
FT                   ALGAVLSQNGHPISFISRTLNDHELNYSAIEKELLAIVWATKTFRHYLLGRQFLIASDH
FT                   QPLRWLHNLKEPGAKLERWRVRLSEYQFKIDYIKGKENSVADALSRIKIEENHHSEATQ
FT                   HSAEEDNSNLIHLTEKPINYFKKQIIFIKSDKNKVEHSKIFGNSITTIQYDVMTLEKAK
FT                   QILLDHFIHRNITIYIESDVDFEIVQRAHIEIVNTTYTKVIRSLFLLKNVGSYAEFKEI
FT                   ILQSHEKLLHPGIQKMTKLFKENHFFPNSQLLIQNIINECNICNLAKTEHRNTKMPLKI
FT                   TPNPEHCREKFVVDIYSSEGKHYISCIDIYSKFATLEQIKTKDWIECRNALMRIFNQLG
FT                   KPKLLKADRDGAFSSLALKRWLEEEEVELQLNTAKNGVADVERLHKTINEKIRIINSSD
FT                   DEEVKLSKIETILYTYNQKIKHDTTGQRPAQIFLYAGHPILDTQKIKEKKIEKINEDRR
FT                   EFNIDTNYRKGPLQKGKLENPFKPTKNVEQTDPDHYKITNRNRVTHYYKTQFKKQKKNN
FT                   KLSISQAPGTR"
FT   SO_feature      CDS ; SO:0000316:5145..6560
FT   SO_feature      start_codon ; SO:0000318:1..3
FT                   /name="297\env"
FT                   /db_xref="FLYBASE:FBgn0027623"
FT                   /db_xref="SWISS-PROT:P20829"
FT                   /db_xref="NCBI_PROTEIN:CAB57797.1"
FT                   /translation="TLNFTGTWYPITLLFILITAVHGQQIQINNIDTNHGYLLFSDKPV
FT                   QIPSSFEHHSLKINLTEIDIVVDYFEQRLRTDYHAPQINFLYNKIKRELARITLKHRNK
FT                   RGFINIVGSGFKYLFGTLDENDRVEIQKKLEINVHNSVKLHELNDAIRLINDGMQKIQN
FT                   YENNHTIIDSLLFELMQFTEYIEDLEMAMQLSRLGLFNPKLLNYDKLENVNSQNILNIK
FT                   TSTWINYNDNQVLIISHIPIYLSLISTIKIIPYPDSNGYQLDYTDTQSYFEKENKVYNT
FT                   ENKEVKNECVTNIIKHLNPICNFKPVHTNEIIKYIEPNTIVTWNLTQTILNQNCQNSIN
FT                   KIKIEGNKMIRVTQCKIEINNINFSETLLEPEIDLTPLYTPLNITKIKIVKHNDIIEMI
FT                   SENNITLYIQMIIVIIALILLYSYLRYVSFKPFMMLYAKLKIRKNQNQNTPQQTEIEEI
FT                   PFPTLYPSIPAQV"
XX
CC   Derived from X03431 (g8146) (Rel. 36, Last updated, Version 2).
CC   Takis Benos and Michael Ashburner, 20-Aug-1997.
CC   Any changes to original sequence record are annotated in an FT line.
XX
SQ   Sequence 6995 BP;  2811 A; 1356 C; 972 G; 1856 T; 0 other;
     AGTGACGTAT TTGGGTGGTC CAAACCAGCC ACTTCCATTA TTTCAAAGAA ATCAGTAATG        60
     CACTCTAGTA ATTTTCCATA ACTGTATCCC AGCTGCGCAG ACTCGTTTAT CTTTTGCAGC       120
     GCAGCGTTCT TTGTAAACAT CCTAAAGACC TGCCTAAGCA GATTTGACTG CCCTCTTTCA       180
     ACGCTACCTA ATCTTAAGAA CCCAAGAGCG AGGCTCTCCC GAAATACAAA TATTGTTCAA       240
     ATACTGAGGC TTCTCCTCAA TCCAATTTGC ATTTGATTTT TAGTCTTAAG CTGAGATCCA       300
     AAGAATAAAG TCGTGAAACT ATTTCTCCTA AAAACTATTT TTTATTTCTT GGCGTTGTCC       360
     TTAGTCAACT GACGGGACAT TAGTTCGACT CATAAATAAA ACAACAATTT TACTGGCGCA       420
     GTCGGTAGGA TACAAAAGTA TCCGAAAAAA AAGAACCTTC GAATGGAAAA TAAGTTAAAT       480
     TTTATAGTCC TGTGCTCGAA ACATCTCCCA AAATAAATTC GTGAAAACTC TTCAACTTCA       540
     ATTATAATTC CAATTCGGTT ATCCAATAAT AAGTGGAAGT GAAATACGAA ACAAAAATAT       600
     TAAGTCCAAA GGCAACTAAG TTTTAAAACC AACATATAAA AATAAAAAAT TAAAACAATA       660
     TAGAATTTTA ATAATACAAC ACAAAAATTT ACAAAACAAA AAAACAAACA AGTGAAACTA       720
     GAAAGCTTAA AAATAATAAT AACATTGAAT CCGAAACAAA ACAAAAAAAT AAAACACAAA       780
     AGTTAAAAAT TTTACAATAA AAATGTCACA ACCAATTATT GCGCTGAGCG ACATAAACCT       840
     TGCCGAAGCC CGTCGGCAGC TTAAAGACAT TATGCCATTC AAGGGTGATC CAGAAACCCT       900
     TCACACCTTT ATCAGCAGAG TGGATTACGT AATTTCGCTC TACCAAACAA ATGATGTCCG       960
     ACAACAGAGG ATTCTACTGG GAGCCATCGA AAGGAACTTG GACGGACAAA TTACACGATC      1020
     TTTGGGACTT CCGAACGTCG AAGATTGGCC TACCCTTAAA GCAAGACTCA TCGCGGAATT      1080
     TAAAATTCAA ACACCAAACT ACAAACTTCT GGAGAACTTC AGGGAGACAC CATACAGAGG      1140
     AAGCCTAAGA GCATTCTGCG AAGAAGCGGA GAGACGACGT CAATTACTAA TTTCGAAACT      1200
     ACACCTGGAA GGTAACCAAT CGGATTTTCT TATTTATATT CAGGGTATTA AAGAATCTAT      1260
     TAAGATACTG ATAAGGAAAC TACCAATACA ATTATTCACT ATTTTAGCCC ATCACGATAT      1320
     TACAGACTTA AGATCCTTAA TTACCATTGC ACAAAATGAG GGAATTTATG AAGAACACAT      1380
     TAATTTTGAA TTTTATGAAA AACCAGAATA TCGTAATAAA AATTCAAATT CTAACCAGAA      1440
     TTCGAAAACA CAAAAATTCA ATACAAATGT TCAAACTCAA AATCGACCAA GTTACTCACA      1500
     ATATTCCCAA CCCTTCCAAC CTAATTTTAA TCAATACATT CAACCATTTA GACCTAGCTA      1560
     TACACAGCAG ATAACTAACA ACCCACCCAT GTGGCACGCA CCTAATTATT TCAGACCCAA      1620
     CCAATACATA AACCCACAAC CCATTATTCA AAAAAATCAT TTCCAACAAT ATCCCAACAA      1680
     AGCCCAATTT CCCCAAACAA CGCATTTTAG AGGAAATACA TACCCTCGAC TACAACAACC      1740
     CTCTACATAT AAAAATACTA ACTTCCCGAT TACTAAACGA CTAAGACCAT CGGACAGTGA      1800
     ACAAACTAAA ATGTCTATTG ACGAAATTAG ATTCCAAGAC GCGCATGAAT TCGAACAAGT      1860
     CCAACCTAAT TATTACGAGC AACAGTATTT TAACCAAAAT CAATACAATC CGTATCAAAA      1920
     TCATAGCTTC ATTAATGAAG GGCAACAACA AGTTCAATTT GTACAAATTA ATAACAAACA      1980
     AAACCAAAAT AATTCTGAAC TAAACGAAAA TTTTCGGTTA ACAGTTCCGG AAAATACGAA      2040
     TACATAAAAA TAGTATACAA AGGGCGTTCA TACAAATGCC TTCTAGACAC AGGATCAACA      2100
     ATTAATATGA TCAATGAAAA TATATTTTGT CTTCCCATTC AAAATAGTAG ATGTGAAGTT      2160
     TTAACATCAA ATGGCCCTAT TACCTTGAAC GACTTGATTA TGTTACCCAG AAATAGTATT      2220
     TTCAAAAAAA CCGAACCATT TTATGTGCAC AGATTTTCTA ATAATTACGA TATGCTAATT      2280
     GGCAGAAAAT TGTTGAAAAA TGCTCAATCA GTTATTAATT ACAAAAATGA TACAGTTACC      2340
     CTTTTTGATC AAACATACAA ATTAATTACT TCAGAATCCG AAAGAAACCA AAATTTGTAT      2400
     ATCCAAAGGA CACCAGAATC AATTGCAAGC TCAGATCAGG AATCAATAAA AAAATTAGAT      2460
     TTTTCACAGT TTCGATTAGA TCACCTAAAT CAGGAGGAAA CTTTTAAGTT AAAAGGCTTG      2520
     TTAAATAAAT TTAGAAATCT TGAATATAAG GAGGGAGAGA AATTAACATT TACAAATACA      2580
     ATTAAACACG TACTAAATAC AACACATAAC TCCCCAATTT ATTCGAAACA ATACCCACTT      2640
     GCGCAAACAC ACGAAATCGA AGTAGAAAAC CAAGTACAGG AAATGCTGAA TCAGGGATTA      2700
     ATTAGGGAAA GTAATTCTCC ATACAATAGT CCTACTTGGG TCGTACCAAA GAAACCGGAT      2760
     GCTTCTGGTG CAAATAAGTA CAGGGTAGTA ATTGATTATA GAAAGCTAAA TGAAATAACC      2820
     ATACCTGACA GATATCCAAT TCCAAATATG GACGAAATTC TTGGCAAACT GGGTAAATGC      2880
     CAATATTTTA CAACGATCGA TCTGGCAAAG GGATTTCATC AAATAGAAAT GGACGAAGAA      2940
     TCAATTTCTA AAACTGCATT CTCCACAAAA AGCGGTCATT ACGAATACCT TCGAATGCCA      3000
     TTTGGCCTTA GGAATGCACC CGCTACTTTT CAAAGGTGCA TGAATAATAT CCTTCGACCG      3060
     TTGCTTAACA AACACTGTTT GGTGTATCTG GATGATATTA TAATTTTTTC AACATCCCTT      3120
     ACAGAACATT TAAATTCAAT ACAATTAGTT TTTACAAAGC TTGCAGATGC AAATTTAAAA      3180
     TTGCAACTAG ACAAATGTGA GTTCTTAAAA AAGGAAGCTA ACTTTCTTGG TCACATAGTT      3240
     ACCCCTGATG GTATTAAACC AAATCCTATT AAAGTTAAAG CCATAGTTTC ATACCCAATT      3300
     CCGACAAAAG ATAAAGAGAT AAGAGCTTTC CTTGGATTAA CAGGTTATTA TCGCAAATTT      3360
     ATTCCAAATT ACGCAGACAT AGCAAAACCC ATGACCAGCT GCTTAAAAAA AAGGACAAAG      3420
     ATAGATACAC AAAAACTTGA GTACATAGAG GCATTCGAAA AACTTAAGGC TTTGATAATT      3480
     CGTGACCCAA TTTTACAATT ACCTGATTTT GAAAAGAAAT TTGTTTTAAC CACAGATGCA      3540
     AGTAACTTGG CCCTCGGGGC TGTCCTTTCT CAAAACGGTC ATCCTATATC TTTTATTAGT      3600
     AGAACACTTA ACGATCACGA ATTAAATTAC AGTGCTATCG AAAAAGAATT ACTTGCCATA      3660
     GTTTGGGCCA CAAAAACTTT TCGACATTAT TTACTAGGAC GACAATTTCT CATTGCCAGT      3720
     GACCATCAAC CTCTTAGATG GCTTCATAAC TTAAAGGAAC CAGGTGCTAA GTTAGAAAGA      3780
     TGGAGAGTTA GATTAAGCGA ATACCAATTT AAAATAGATT ATATTAAAGG GAAAGAAAAT      3840
     TCAGTTGCCG ATGCATTATC AAGAATTAAA ATTGAAGAAA ATCATCATAG TGAAGCTACT      3900
     CAACATAGTG CAGAAGAGGA CAATAGCAAC CTTATTCATT TAACAGAAAA ACCAATAAAT      3960
     TATTTCAAAA AACAAATAAT CTTTATTAAA TCCGATAAAA ATAAAGTAGA GCATTCAAAA      4020
     ATATTCGGTA ACTCCATTAC CACAATTCAA TATGACGTAA TGACACTTGA AAAGGCCAAA      4080
     CAAATTTTAC TCGATCACTT TATCCATAGA AACATTACCA TTTATATTGA GAGCGATGTA      4140
     GATTTTGAAA TCGTTCAAAG AGCACACATA GAAATTGTTA ATACCACCTA CACAAAAGTA      4200
     ATTCGCAGTC TTTTCCTATT AAAGAACGTT GGTTCATACG CCGAATTCAA AGAAATCATA      4260
     CTTCAATCAC ATGAAAAACT TTTACACCCT GGTATACAGA AAATGACAAA ATTATTTAAA      4320
     GAAAATCACT TCTTTCCAAA TAGCCAACTA TTAATTCAGA ATATAATAAA CGAATGCAAC      4380
     ATATGCAATT TGGCCAAAAC AGAACATAGA AACACCAAAA TGCCTTTAAA AATCACACCC      4440
     AACCCGGAAC ATTGCCGAGA AAAATTTGTA GTAGATATTT ATTCATCTGA GGGAAAACAT      4500
     TACATCAGTT GCATTGATAT TTATTCTAAA TTCGCTACAC TTGAGCAAAT TAAAACTAAG      4560
     GATTGGATAG AATGCAGAAA CGCATTAATG CGCATTTTTA ATCAACTAGG AAAACCCAAA      4620
     TTATTAAAGG CAGACAGAGA CGGAGCTTTC TCCAGTTTAG CTTTAAAGCG ATGGCTTGAA      4680
     GAAGAAGAAG TCGAATTACA GCTCAATACA GCAAAAAACG GAGTAGCAGA CGTCGAAAGA      4740
     TTACACAAAA CAATAAATGA AAAAATTCGT ATAATCAATT CATCTGATGA TGAAGAAGTA      4800
     AAATTAAGCA AGATAGAAAC AATCCTCTAC ACATACAACC AAAAAATTAA ACATGACACT      4860
     ACTGGACAGA GACCTGCTCA AATTTTCTTA TACGCTGGGC ATCCCATATT AGACACTCAA      4920
     AAAATTAAAG AGAAGAAAAT AGAGAAAATA AATGAAGACA GACGGGAATT TAATATTGAC      4980
     ACTAATTACA GAAAAGGTCC ACTACAGAAA GGCAAATTAG AAAACCCATT TAAACCAACC      5040
     AAAAATGTAG AACAGACAGA CCCTGACCAT TACAAAATCA CTAATAGAAA TAGAGTTACG      5100
     CACTACTACA AAACACAATT CAAAAAACAA AAGAAAAATA ATAAACTCTC AATTTCACAG      5160
     GCACCTGGTA CCCGATAACA CTATTGTTTA TACTGATCAC AGCTGTTCAT GGACAACAAA      5220
     TTCAAATTAA TAATATTGAC ACCAACCACG GATATCTCCT TTTTTCTGAT AAGCCAGTAC      5280
     AGATACCATC CTCCTTTGAA CATCACTCCT TAAAAATCAA TTTAACTGAA ATAGACATCG      5340
     TGGTTGACTA TTTTGAGCAA AGACTACGAA CCGATTACCA TGCACCCCAG ATCAATTTTT      5400
     TATACAATAA AATAAAAAGA GAACTAGCCA GAATAACCCT GAAACATAGA AACAAACGGG      5460
     GTTTTATTAA CATTGTGGGT TCAGGTTTTA AATACCTATT TGGAACACTA GATGAAAATG      5520
     ATCGAGTCGA AATACAGAAA AAACTTGAAA TCAACGTCCA TAACTCAGTA AAATTACATG      5580
     AACTCAACGA CGCCATACGA TTGATAAATG ACGGAATGCA AAAAATACAG AATTATGAAA      5640
     ATAACCACAC CATCATTGAC AGTCTTTTGT TCGAACTAAT GCAGTTTACG GAATACATAG      5700
     AAGATTTGGA AATGGCTATG CAGCTTTCCA GACTTGGACT GTTTAACCCC AAATTACTAA      5760
     ACTACGACAA ACTTGAAAAT GTGAACAGCC AAAACATTTT GAACATTAAA ACATCCACTT      5820
     GGATTAACTA CAATGATAAC CAAGTATTAA TCATATCCCA CATACCCATT TACCTTTCAC      5880
     TAATAAGCAC AATTAAAATA ATTCCTTACC CAGACTCCAA CGGCTATCAG CTAGATTACA      5940
     CAGACACACA ATCATATTTT GAAAAAGAAA ATAAAGTTTA TAATACCGAA AATAAAGAAG      6000
     TAAAAAATGA ATGTGTCACC AATATTATTA AACACTTAAA TCCAATTTGT AATTTTAAGC      6060
     CAGTACACAC GAACGAAATA ATAAAATACA TAGAACCAAA CACAATTGTA ACTTGGAACT      6120
     TAACCCAAAC AATTCTTAAC CAAAATTGCC AAAATTCAAT TAATAAAATA AAAATAGAAG      6180
     GAAACAAAAT GATAAGAGTA ACGCAATGCA AAATAGAAAT CAATAATATA AATTTTAGTG      6240
     AAACTCTGTT AGAACCAGAA ATAGATTTGA CACCACTATA CACACCACTT AATATAACAA      6300
     AAATAAAAAT TGTAAAACAC AACGACATTA TTGAGATGAT TTCAGAGAAC AATATTACAC      6360
     TTTACATACA AATGATCATT GTAATAATCG CACTAATTTT GTTGTACTCA TATTTAAGAT      6420
     ATGTATCATT TAAACCATTT ATGATGTTGT ATGCAAAACT TAAAATAAGA AAAAATCAAA      6480
     ATCAAAACAC ACCACAACAA ACAGAAATAG AAGAAATTCC ATTTCCCACA CTATATCCAT      6540
     CAATCCCAGC CCAAGTATAG GCTTCTCTTT AAGGGAAGGG GAGTGACGTA TTTGGGTGGT      6600
     CCAAACCAGC CACTTCCATT ATTTCAAAGA AATCAGTAAT GCACTCTAGT AATTTTCCAT      6660
     AACTGTATCC CAGCTGCGCA GACTCGTTTA TCTTTTGCAG CGCAGCGTTC TTTGTAAACA      6720
     TCCTAAAGAC CTGCCTAAGC AGATTTGACT GCCCTCTTTC AACGCTACCT AATCTTAAGA      6780
     ACCCAAGAGC GAGGCTCTCC CGAAATACAA ATATTGTTCA AATACTGAGG CTTCTCCTCA      6840
     ATCCAATTTG CATTTGATTT TTAGTCTTAA GCTGAGATCC AAAGAATAAA GTCGTGAAAC      6900
     TATTTCTCCT AAAAACTATT TTTTATTTCT TGGCGTTGTC CTTAGTCAAC TGACGGGACA      6960
     TTAGTTCGAC TCATAAATAA AACAACAATT TTACT                                 6995
//
ID   DM23420    standard; DNA; INV; 6126 BP.
XX
AC   U23420;
XX
DR   FLYBASE; FBte0000266; Dmel\3S18.
XX
SY   synonym: BEL
XX
FT   source          U23420:1..6126
FT   SO_feature      five_prime_LTR ; SO:0000425:1..361
FT   SO_feature      three_prime_LTR ; SO:0000426:5766..6126
FT   SO_feature      CDS ; SO:0000316:919..5742
FT   SO_feature      start_codon ; SO:0000318:1..3
FT                   /name="Dmel\3S18\ORF"
FT                   /db_xref="FLYBASE:FBgn0044337"
FT                   /db_xref="REMTREMBL:AAB03640"
FT                   /db_xref="NCBI_PROTEIN:AAB03640.1"
FT                   /translation="MFIGSIASNSSLTDCQRFHYLKSYLAGDALALVKHIPVTNDNYRE
FT                   AWERLEQRYNKQSLIIRSFLNSFMSLPSAINSNIGTVRKIADGADEVIRGLRALNCEER
FT                   DPWLIFILLSKLDSDTRQAWAQCAESEEKGVTINRFLKFLTSRCDTLEAFELTRSTQAR
FT                   RAATTHHADTHPRREEPKCTSCQQNHQLFKCPQFIALDIASRRDFLKSRKLCFNCLSPA
FT                   HMVGNCTSRHTCRICRRKHHTLVHGSSQPIQNGNNIDTASVDSRDRPAVSHAGSTIGHN
FT                   QPLAREGHRLGSETPAENNFTHHTLENIPAAGSQTLLPTILADVIDAWGNTTTCRLLLD
FT                   TGSTITLASESFVQRIGVRRTHARISILGLAANSAGVTRGRAHIKLRSRHSGQTVELVS
FT                   FILTSLTSSLPAQVIDTSSSTWRQICELPLADPTFCTPGAIDVIVGSDQLWSLYTGDRK
FT                   HFGNDFPIALNTVFGWILAGSYSAFDDHPTSAVTHHADLDTMVRSFMEMDSIQPNQALL
FT                   DASDPTERHFAATHKRSTDGVYVVEYPFKEKAPPIDSTLPQAINRFFSLERKFRRYPEL
FT                   KQQYEAFLDDYLQRGHMEKLTSAQVEESPDTCFYLPHHAVIKLDSLTTKCRVVFDGSGK
FT                   DSSGVSLNDRLHIGPPIQRDLFGVCLRFRQHQYVLCADVEKMFRGIKVFKPHTNFQRIV
FT                   WRTTENEPLLHFRLLTVTYGLAPSPFLAVRVLKQLADDHGHEYPAAAHALLHDAYVDDI
FT                   PTGANTFEELMILKDELIALLDKGKFKLRKWSSNSWRLLKSLPEEDRCFEPIQLLNKSA
FT                   ADSPVKVLGIQWNPGKDVLYLNLKGCDATISPTKRELLSQLSRIYDPLGLVAPVTVLLK
FT                   LIFQESWTSVLQWDDPIPESLRTRWRALVEDLPALTQCQVPRYIASPFRDVQLHGFADA
FT                   SSHAYGAVVYARVAVGCSFQVTLVAAKTRVAPIKPVSIPRLELNAALLLSRLLSIVKTS
FT                   LTIPLFSTSCWTDSEIVLHWLSAPPRRWNTYVCNRTSEILSDFPRSCWNHVRTEDNPAD
FT                   CASRGLHPSKLLEHRLWWKGPSWLATPTSEWPPSTSKFSVSSSFDVNTEERAIKPTTLH
FT                   NFPDESIHELLIHKFSTWTRLIRVSSYCHRFIHTLRSHHRNSAPFLTSEELLDAQRRLI
FT                   RHVQQKSFAREYEQLENRRQLNAKSHLIRFSPFLDDYGVMRVGGRIEQSTLNYNAKHPI
FT                   LIPKDTPLAGLLVRHFHVSYLHTGVDATFTNLRQQYWILGARNLVRKAVFQCKSCFLQR
FT                   KGTSNQIMGELPIPRVQASRCFQHTGLDYAGPIAIKESKGRTPRIGKAWFSIFVCLTTK
FT                   ALHIEVVSELTTQAFIAAFQRFIARRAKPTDLYSDNGTTFHGGKKTLDDMRRLAIQQAK
FT                   DEELAGFFANEGISWHFIPPSAPHFGGMWEAGVRSIKLHMKRILGSKALTFEELSTVLT
FT                   QIEAILNSRPLCPTGDNSLDPLTPAHFLTGSPYTALPEPCRLDMQVNRLERWNQLQAMV
FT                   QGFWKRWHMEYLTSLHERTKWHLETENLKIDTLVVLKEPNLPPSKWILGRITAVHAGID
FT                   NKVRVVTVKTAHGLYKRPIAKIAVLPLC"
XX
CC   Derived from U23420 (g733531) (Rel. 48, Last updated, Version 3).
CC   Takis Benos and Michael Ashburner, 20-Aug-1997.
CC   Any changes to original sequence record are annotated in an FT line.
XX
SQ   Sequence 6126 BP;  1623 A; 1556 C; 1346 G; 1601 T; 0 other;
     TGTTTGGGAA CGAGACACCC TGTATACGCG AACAAGTCAC CCTTTATCTT TATTTACATT        60
     CTTATTTGTC TGCAGCTTCA TCGGAGCTTA TCAGCGGAAT CAATGTAAGC ATCGCACCGC       120
     TGTAATTGTC CGCGAGCTTG CCCAGTACTT TTCCAAACTT CTAACTCCCT TCTAACTGTA       180
     ACTTGTTTAC GTCTTATGCT AGACTAATCG TATGGCGTGA TTACAGCCAA AGCTGAAGTC       240
     AGTCACAATT TTGATCTGCG AGAAAACGTA CGCATCGGTG TCGAAATAAT TAATATTAAG       300
     TGTCTGAACT TAACCAATAA ATGAAAATTA ACAGTAACAC TGGCGGTTTT ATTTATAAAC       360
     ATAAAAATTG GTCCTTCGAG CCGGATAACC GGAAGTGCGT TTCGTTCGGG CATTTGATTT       420
     TGATTATTGG CCTTTTGGCA AACGATAATC TATAGATTCC TACATCGTGT AGAATCGTTC       480
     CCTTCTTTCG ACCACCATGC GGAGTGTGAT TCAACAACGG GGCTTCTGCA AAAGCCAAAT       540
     TACTCGTGCG CATAATAATG CCTTAAAATT TGTTGATGAC ATTCACTCAG TGCAAACAAT       600
     AGTTGTCCGC CTGGCGCAAC TACAGGAAAA TTATTTGCGG TTCGTACGGC TCTCGGAAGA       660
     GCTGTATGCA TTTCAATCGG AAGCCGATTG GGAGAACCCT GACGAGGATT TTGACGCATA       720
     TGAGGACAAA CATTATGCTA CACACGCTAT TCTCAGCAAT ACTTTGGAGG AGTTGAGACG       780
     GGATGTCACC TCAAACAGTA TTGATGCCAC AGTTCAAGCG CAGGCACACC CCAGAGAAGT       840
     CATGTCGATT TTCAGTTCGA GAGAATTAAA CTTCCGACTT TTTCTGGAAA TTATGAGGAC       900
     TGGAAACATT TTTCGGACAT GTTTATTGGA TCGATTGCTT CCAATTCGAG CCTGACGGAT       960
     TGCCAACGAT TTCATTATTT AAAATCGTAC CTTGCCGGAG ACGCGCTTGC ATTAGTTAAA      1020
     CATATTCCAG TTACTAATGA CAACTATCGG GAAGCATGGG AGCGGCTGGA ACAGCGATAT      1080
     AACAAACAAT CGCTAATTAT TCGATCGTTC TTAAACAGTT TCATGAGCCT TCCGAGTGCT      1140
     ATAAATTCAA ATATCGGCAC AGTGCGGAAA ATTGCCGATG GTGCAGACGA AGTTATTCGT      1200
     GGTCTACGAG CTCTTAATTG CGAAGAGAGG GATCCCTGGC TAATTTTCAT TCTACTTTCA      1260
     AAATTAGATA GCGATACCCG CCAAGCCTGG GCTCAGTGCG CAGAATCCGA GGAAAAAGGT      1320
     GTGACCATCA ACCGATTCTT GAAATTTCTC ACATCACGCT GCGATACGTT GGAGGCTTTT      1380
     GAATTAACTC GATCAACCCA AGCTCGACGC GCAGCTACCA CGCACCACGC AGACACGCAT      1440
     CCAAGACGGG AAGAGCCGAA GTGCACATCG TGCCAGCAGA ATCACCAACT GTTTAAGTGT      1500
     CCTCAATTCA TCGCACTCGA CATTGCATCT CGCCGAGACT TCCTCAAATC AAGAAAGCTC      1560
     TGTTTCAATT GCCTCAGCCC GGCTCATATG GTGGGCAACT GTACATCGAG GCATACTTGT      1620
     CGGATCTGCC GCCGCAAGCA TCATACTTTG GTTCATGGCT CGTCGCAGCC AATTCAAAAT      1680
     GGCAACAACA TTGACACAGC AAGTGTTGAC AGCCGCGATC GACCAGCAGT CTCACATGCG      1740
     GGATCTACAA TTGGCCACAA TCAACCGCTA GCTCGAGAAG GTCATCGCTT GGGAAGCGAG      1800
     ACTCCCGCGG AAAACAACTT TACGCATCAT ACTCTGGAGA ATATTCCGGC GGCTGGTTCT      1860
     CAGACTCTGT TGCCAACCAT CCTTGCTGAC GTCATCGACG CCTGGGGAAA CACTACAACC      1920
     TGCAGGCTGC TCCTGGACAC TGGATCTACA ATAACCTTGG CATCGGAATC ATTTGTTCAG      1980
     CGAATAGGCG TGCGTCGAAC GCACGCACGG ATTTCTATTC TCGGTCTCGC CGCCAACAGC      2040
     GCGGGCGTTA CCCGAGGACG CGCACATATC AAGCTGCGCT CTCGTCATTC GGGCCAAACT      2100
     GTCGAATTGG TCTCGTTCAT TCTCACCTCG CTGACGTCAT CACTTCCTGC CCAAGTTATT      2160
     GACACCTCAT CCTCTACGTG GAGGCAAATC TGCGAGCTTC CTTTGGCAGA CCCAACGTTC      2220
     TGCACACCTG GAGCAATCGA TGTCATTGTT GGATCGGATC AACTTTGGTC TCTATACACA      2280
     GGAGATCGGA AACACTTTGG TAACGACTTT CCTATCGCTC TCAATACTGT ATTTGGTTGG      2340
     ATTCTTGCAG GCTCTTACTC TGCATTCGAT GATCACCCTA CTTCTGCGGT TACTCATCAC      2400
     GCGGACCTAG ACACGATGGT TCGTTCATTC ATGGAGATGG ACAGCATTCA GCCTAACCAG      2460
     GCTCTCCTGG ACGCCAGCGA TCCCACAGAG CGTCATTTTG CTGCCACACA CAAGCGCTCG      2520
     ACGGACGGGG TGTACGTCGT CGAGTATCCC TTCAAGGAAA AGGCACCGCC TATTGATTCG      2580
     ACCTTGCCAC AGGCCATCAA TCGCTTCTTC TCGCTGGAAC GCAAATTTCG TCGGTATCCA      2640
     GAATTGAAGC AGCAGTACGA AGCTTTCCTG GACGACTACT TGCAACGTGG ACATATGGAA      2700
     AAACTGACCT CGGCTCAGGT TGAAGAGTCC CCAGACACCT GCTTCTATTT GCCGCACCAC      2760
     GCTGTCATCA AACTGGACAG TCTGACTACC AAATGTCGTG TAGTTTTTGA TGGATCAGGA      2820
     AAAGACAGCT CTGGAGTATC GCTCAATGAC AGACTACATA TTGGTCCACC GATTCAACGC      2880
     GATCTTTTTG GCGTTTGTCT ACGCTTCCGG CAGCACCAAT ATGTTTTATG TGCAGATGTC      2940
     GAAAAGATGT TTCGAGGCAT TAAAGTCTTT AAGCCACACA CCAATTTTCA GCGCATTGTT      3000
     TGGCGCACGA CTGAGAATGA ACCTCTGCTT CATTTTCGCC TGCTGACGGT TACCTACGGA      3060
     TTGGCACCGT CACCATTTCT GGCTGTTCGA GTTCTAAAGC AACTTGCCGA CGATCATGGC      3120
     CATGAATACC CTGCAGCAGC TCACGCTCTT CTGCACGATG CCTATGTGGA CGATATCCCG      3180
     ACAGGCGCCA ACACATTCGA GGAGCTTATG ATTCTCAAGG ACGAGCTTAT AGCCCTCTTG      3240
     GATAAGGGAA AATTCAAGCT ACGCAAATGG AGTTCTAATA GTTGGCGTCT TCTGAAATCA      3300
     TTACCAGAGG AAGATAGATG TTTTGAACCT ATCCAGCTCC TCAACAAATC AGCTGCGGAT      3360
     TCACCTGTCA AAGTTCTTGG TATCCAATGG AACCCTGGGA AGGACGTCCT GTATCTCAAC      3420
     CTAAAGGGAT GCGATGCGAC CATTTCTCCG ACGAAAAGAG AACTCTTGTC TCAGCTATCA      3480
     AGAATTTATG ATCCGCTTGG ACTGGTAGCG CCGGTCACAG TTCTACTCAA GCTAATCTTC      3540
     CAAGAAAGCT GGACAAGTGT CCTGCAGTGG GACGACCCCA TACCTGAAAG TCTACGTACG      3600
     CGCTGGAGAG CCTTAGTAGA GGATTTGCCA GCACTTACGC AATGCCAAGT ACCACGGTAT      3660
     ATTGCGTCAC CATTTCGAGA TGTTCAACTA CACGGATTCG CCGACGCATC CTCGCACGCC      3720
     TACGGTGCGG TAGTTTACGC TCGAGTTGCA GTTGGATGCA GCTTTCAAGT AACTCTGGTT      3780
     GCCGCCAAAA CACGGGTGGC CCCGATCAAG CCCGTATCAA TTCCACGTTT GGAGCTAAAC      3840
     GCTGCGTTAC TTCTATCTCG ATTGCTTTCT ATTGTCAAAA CATCACTAAC AATTCCTCTT      3900
     TTCAGCACGA GCTGCTGGAC AGATTCAGAA ATTGTGCTAC ACTGGCTTTC AGCTCCCCCT      3960
     CGACGGTGGA ACACCTACGT CTGCAACCGA ACTTCTGAGA TATTGAGCGA CTTTCCCCGT      4020
     AGCTGCTGGA ACCATGTTCG CACGGAAGAC AATCCTGCAG ATTGTGCTTC CCGAGGACTT      4080
     CATCCGTCAA AGCTTCTGGA GCATCGACTG TGGTGGAAAG GTCCGTCTTG GCTGGCCACA      4140
     CCCACCTCTG AGTGGCCACC TTCTACAAGC AAGTTCAGCG TATCTTCAAG TTTCGATGTC      4200
     AACACCGAAG AACGAGCCAT AAAGCCCACG ACTCTACATA ACTTTCCTGA TGAAAGTATA      4260
     CACGAGTTAC TCATCCACAA ATTCTCAACC TGGACGCGTC TTATAAGGGT ATCTAGCTAC      4320
     TGTCATCGCT TTATTCACAC TCTTCGATCC CATCATAGGA ATTCGGCACC ATTCCTTACG      4380
     TCTGAAGAGT TGCTGGACGC ACAGCGCCGA CTTATTCGAC ATGTGCAACA AAAATCCTTT      4440
     GCCAGAGAAT ATGAGCAGCT AGAGAATCGA CGCCAGCTTA ACGCTAAATC GCATCTTATC      4500
     CGGTTTTCTC CGTTTCTGGA TGATTATGGA GTAATGCGAG TCGGTGGGAG AATCGAGCAA      4560
     TCTACACTCA ACTATAACGC CAAGCACCCG ATTCTGATAC CTAAAGATAC ACCACTAGCT      4620
     GGACTCCTGG TTCGACATTT TCATGTCTCC TATCTGCACA CTGGAGTTGA TGCAACGTTC      4680
     ACCAATCTTC GTCAGCAGTA CTGGATTCTG GGAGCCCGCA ATCTCGTCAG AAAGGCAGTC      4740
     TTCCAATGCA AATCCTGTTT TCTTCAACGA AAGGGCACAA GCAACCAGAT CATGGGAGAG      4800
     CTACCAATTC CTCGAGTTCA AGCTAGCCGC TGCTTTCAAC ACACAGGGCT GGACTACGCT      4860
     GGACCGATCG CAATCAAGGA ATCAAAGGGA AGAACTCCAC GCATCGGAAA GGCATGGTTT      4920
     TCTATTTTCG TGTGTCTCAC TACAAAGGCA CTTCACATCG AGGTTGTTAG TGAGCTAACT      4980
     ACACAGGCTT TCATCGCAGC CTTTCAACGA TTCATTGCCC GCCGAGCGAA GCCTACTGAC      5040
     CTGTATTCGG ATAATGGAAC AACATTTCAT GGAGGCAAGA AAACTTTGGA TGACATGAGA      5100
     CGTCTGGCCA TTCAACAAGC CAAAGATGAG GAACTAGCAG GATTCTTTGC CAATGAAGGG      5160
     ATTTCTTGGC ACTTTATACC CCCGTCTGCT CCACATTTTG GAGGGATGTG GGAAGCTGGA      5220
     GTTCGCTCAA TTAAACTCCA TATGAAACGA ATACTTGGAT CAAAGGCTTT AACGTTTGAG      5280
     GAGCTCTCTA CTGTCCTGAC CCAAATTGAA GCTATCCTGA ATTCACGCCC GCTGTGCCCA      5340
     ACTGGGGATA ATTCTTTGGA TCCACTGACG CCTGCTCATT TTTTGACTGG ATCTCCGTAT      5400
     ACTGCATTGC CTGAACCCTG TCGTCTGGAT ATGCAAGTCA ATCGATTGGA GAGGTGGAAT      5460
     CAGCTGCAAG CCATGGTTCA AGGCTTTTGG AAAAGGTGGC ATATGGAATA CCTGACATCT      5520
     CTTCATGAGC GGACAAAGTG GCATCTGGAA ACCGAGAATC TGAAGATCGA CACACTGGTA      5580
     GTACTCAAGG AGCCCAATCT ACCGCCCTCT AAATGGATTC TTGGCCGCAT CACAGCAGTG      5640
     CACGCAGGAA TCGACAACAA GGTCCGAGTC GTTACAGTGA AGACTGCTCA CGGATTATAC      5700
     AAACGCCCAA TTGCCAAAAT CGCTGTACTG CCTCTCTGCT GAACAACCGT TCAGGGGGGC      5760
     CGGTATGTTT GGGAACGAGA CACCCTGTAT ACGCGAACAA GTCACCCTTT ATCTTTATTT      5820
     ACATTCTTAT TTGTCTGCAG CTTCATCGGA GCTTATCAGC GGAATCAATG TAAGCATCGC      5880
     ACCGCTGTAA TTGTCCGCGA GCTTGCCCAG TACTTTTCCA AACTTCTAAC TCCCTTCTAA      5940
     CTGTAACTTG TTTACGTCTT ATGCTAGACT AATCGTATGG CGTGATTACA GCCAAAGCTG      6000
     AAGTCAGTCA CAATTTTGAT CTGCGAGAAA ACGTACGCAT CGGTGTCGAA ATAATTAATA      6060
     TTAAGTGTCT GAACTTAACC AATAAATGAA AATTAACAGT AACACTGGCG GTTTTATTTA      6120
     TAAACA                                                                 6126
//
ID   412      standard; DNA; INV; 7567 BP.
XX
AC   nnnnnnnn;
XX
DR   FLYBASE; FBte0000007; Dmel\412.
XX
SY   synonym: mdg2
XX
FT   source          nnnnnnnn:1..7567
FT   SO_feature      five_prime_LTR ; SO:0000425:1..514
FT   SO_feature      three_prime_LTR ; SO:0000426:7054..7567
FT   SO_feature      CDS ; SO:0000316:679..1044
FT   SO_feature      CDS ; SO:0000316:1408..1722
FT   SO_feature      CDS ; SO:0000316:1888..3243
FT   SO_feature      CDS ; SO:0000316:3864..6866
XX
CC   Berkeley Drosophila Genome Project.
XX
SQ   Sequence 7567 BP; 2982 A; 1367 C; 1323 G; 1895 T; 0 other;
     TGTAGTATGT GCCTATGCAA TATTAAGAAC AATTAAATAA AATAGCATAT TAACTTATGG        60
     CAGCACTTTG TTGCTATGTT TATGTTTATG TTTATGCACG CAGTTAGGCC AGGGCGGATG       120
     TAACATGATC ACCCACTCGA AGGCCACAAA GTATAAGTGC ATTGCCCAAT CGAAGGCAAA       180
     AAGTATAAGT GCATGGTCAG CATTCACACG CCGACCAAAT ACATATTACA TACGTACATA       240
     CATATCTCGC TCTCCCGATA AGCCTAGATA TATAAGATAT ACATAAGAAC GCCGCTCCGC       300
     TGCTGGCGTA CCCGGCAGCG CAGCTACGCG GATTAGCCTA AGTCCAAATA TATAAAAAAC       360
     TGTAAAATCG GAGAGACTCT GTAGACGTTG AGCTGACAGA ACCATTTCTG CCTACTCTAA       420
     AATCAAAAGA AGAAATTGAA TAAATATATG TCAGCCCGAC GGCTGCCTTA AACTTAAAAC       480
     GGACTTGTGT TCTTAATTGG AGTTCATCAT TACATGGCGA CCGTGACAGT CGTCCAACGC       540
     TGGACGAATT GACCAAAGCT GGTGAAAACA AAGGAACAAA GGAACACTGG ACTGGAAGAA       600
     GACTGGACTA ATTAAATGGA ACTGCAAAAA CCAAGGAAAA ATCTGAGTGA GTAGAGTTCT       660
     ATTGAGTATG GGCAAACACC GTGGCGGTTT GAAAACTAAG CTGAATAAAC GTATAGCCCA       720
     CGTAAGGTGG CTAATATACG GTCAGCAAAC GCCACCGGTT TGGTCGAAAG CTCTAAAGCT       780
     ACATGCAGAG CTAGACCACT TGTTGCAATA TCAGCAAGAA TTAAAGACCC ATAAGCTCGA       840
     GAAAACTCAC TCAGATAATA TTAAAAATAT ACCCACAATT AATGAAGTTC CAAAATACCA       900
     GGCATGTCCA GCACCAGCAC CAGCATTAAC AAAACCAAAG AAGTCCTGCC CCCCTGGCTG       960
     CGAAGGAATC TGGAGTCCCC ACTGCCTGGG GACTTGTGAG CGACCATCGA CGTCTTCAGC      1020
     GGCGAAGAAA TAGACAGCAG CGAGGGAGTG TCAGCGTGCC ACCCCCGGCG ACGCCCAGCT      1080
     GACACCCAAC AAATAGACAG CAGCGAGGGA GTGTCAGCGT GCCACCCCCG GCGACGCCCA      1140
     GCTGACACCT GATGAGCATC ATCAACAGCA GAATATAATA ATAAATATAT ATAAATATAA      1200
     AGTAAATATA AAATATATAT AGATAAGAAA AATTGTAAGA AATATTGTAA AACGGAGCAT      1260
     ATACTATTAT GCCCTGTTAA CCCAATATGG CCCGTGAAGC CATAGCTAGA ATCAGGCAGG      1320
     CAACAATGTA AAATACAATT TTTTTTTACT CTTGCGAACA TTGAAAGATT TTATAAATAG      1380
     ATAATTCCAA ACATAAATGT CTATAGAGAC AAATGAAATA AGTAAAACTG AAAATAAAAG      1440
     TATATACAAA GGAAATTTTC TATTCTATTC TCCAAAATAT AAAATTAGTA TACCCAAAAT      1500
     GGGTCTAATA GACACTAAAA CTGTGGACTC TACAGCCAAT GTAATAAATA AAGTAGAAGT      1560
     CCAAAATGCA GACTTGTTCT GGATAACCAT AATACTAATT GTAATTGCAT TAATTATGGT      1620
     ATCCAATGCA TTAATAAAAA TATACAAACT GCATAACAAG TGTCTTAAGA AACGATACCG      1680
     TAGCACTGCT AACGGTATAG ATAATATTTA AGGAAGATCT TTAATAAAGT CAATTATGAA      1740
     TGAAAATATG AGAAAAATTA TATGAAAAAA AAAAATAATA AATAAAAAAA AAATATAAAA      1800
     CGTAATATTG AATTTATCTA CATTAAAAAA AAATATATAC AAATGAATAA ATTTGAAGTT      1860
     ATGAGTATAC CACAGCATGG ACTGGGAAAA GCTTGTTGAT CAGATAAAAG ATCAAAATGA      1920
     AAATTTCAGA AAATCCTATA AGTGCTTAAC GCAAAACAGA TCAACACAAG CTGTAACAAT      1980
     CAATAGGAAT GCCCAAGTCT TGGTAAATAG TTATAATGAA ATCAGAGAGT TGATCCAACA      2040
     AAATAGAAAG AATTTGGAAC GCAAACAGTG TGCTAAGGCT TTGAACCTAC TGGTGACATT      2100
     AAGAGAAAAA TTAATATTTA TAAAAAATAA ATTCAGTCTC CAGATAGAAA TTCCAACCAT      2160
     AGTAAACACC CCACTAAGAA TAAATTTGAA TGAAGACAGC ACTAACTCTG ACGAGGAAGA      2220
     TAGGACTATA GTCAAGGAAG ACATTAAAGA GGAAGATCTT CACGATCTAA CTATACCAGC      2280
     AAAATTAATG CTGAAGAACG ACGATAAAAC AAATAACGCA GCCGACTCCG AAAATAACTT      2340
     AACCATGGCA GAAGAAGCAG CTGCCATTAG GTCTTACATT AGGGAAGTCG CCTGCACAGT      2400
     GCCAGAATTT GATGGGCAAA AGATCCATTT ACAAAGATTC ATTAAGGCAA TCAAATTGGT      2460
     AGACCTAGCT AAGGGACCAT TTGAAGACAT TGCAGTTGAG GTCATTAAGT CAAAAATAGT      2520
     TGGCACAATT TTGAACTCAG TTGACAATGA AACGACAATT CCAGCAATTA TAAACAAATT      2580
     GCAGAAAGTA GTTGTCGGTG AGACATCCAG TAATGTCAAA GCAAAGCTAG CAACAGTTCA      2640
     GCAGAGAGGT AAAACTGCAA CGCAATTTAC CGCTGAAGTT GATAGCCTGA GAAAACTTTT      2700
     AGAAGCTTCC TATATCGATG AGGGTATACC TCTAGAACAT GCCACTGGTC TAAGCACCAA      2760
     AGAGGCAATT GAAACCATGA TACATCGTGC TGAGCACGAA AGTATCAAAA CAGTACTGGA      2820
     AGCAGGGACT TGCACCACTA TGGATGCAGC GATAAGCGCA TACATAAGAA CGAGTACAAG      2880
     AGTTACCGGT GACATCAATA AAGTGATGTA CTTTAGAGGT AACAGACCCA ATAGAGGATA      2940
     CGGAAATGCC AATAGAGGTA GTAACCGCGG TAGAGGCTTT AATAACAATA GTATTAGAGG      3000
     CAACTACCAT AACGGTTACC AAAATAACGG TTACCAAAAT AACGGTTACC AGAATAACGG      3060
     TTATCAAAAC CGCTATAATG GAAATAATAA CCGTTATAAT GGCTATAACA GAGGCCGTTA      3120
     TAATGGAAAC AGAGGCCGTA ACAACAGTCA GAACAACTAC AACAGAAACA ATGCCAATGT      3180
     ACGAGTAATC CAAGAACAGG GAAACTCGCA ACAGCCTTTA GGTACTCAGT AGAAGAAGAT      3240
     CGTAGAGTAT ACACCATCAA TTATAATCTC AACATATTTT CTACATTCAT TCATGCCAAA      3300
     ACAGGCGTAA AACTAGTTTT TCTACTTGAT ACAGGTGCAG ATATCTCTAT TCTCAAAGAG      3360
     AACTCTGACA AATTTTCTAA TATTCAAATA ACCAATAAAA TAAACATTCA AGGCATAGGC      3420
     CAACAGAAAA TTCAGTCTCG AGGACAGACT TTTATTGAGA TACAGACAGG TAAATACGTT      3480
     ATCCCACACG ATTTTCATTT AGTAGATAAA AACTTTCCAA TACCGTGTGA TGGAATAATC      3540
     GGAATAGATT TCATAAAAAA ATATAATTGC CAAATCGATT TAAACCAAGA AGAAGATTGG      3600
     TTTATAATTA GACCAAACAA TTTGAAATTT CCAATATATA TTCCCATAGC ATACAGCTCT      3660
     GGTATTAACA CAACGTTATT ACCAGCAAGA TCCCAAGTTG TCCGAAGATT AATAGTATCA      3720
     TCAAAAGATG ATAACATTTT AATTCCAAAC CAGGAAATTC AAACTGGTAT TTATGTTGCA      3780
     AATACAATCG CAACATCAAG TAATACATTT GTCCGAATTT TAAATACAAC CGATTCCGAC      3840
     CAATTAGTCA ATATGGACAC TCTAAAATAT GAGCCACTTT CGAACTACAA TGTAGTTCAG      3900
     GCAAATAGTG AACACAGAAA TAAAACTGTC TTATCTCAAT TAAAGAAAAA TTTCCCCGAA      3960
     TTGTTTAAAT CACAATTAGA AAATATATGC AGCGAATATA TAGATATATT TGCATTAGAA      4020
     TCAGAACCTA TAACAGTTAA TAATTTGTAT AAACAACAGT TGAGATTAAA AGATGATGAG      4080
     CCAGTATACA CGAAAAATTA TAGAAGTCCT CATAGTCAAG TGGAAGAAAT ACAAGCCCAA      4140
     GTTCAGAAAT TAATAAAAGA TAAAATAGTT GAACCATCAG TTTCACAGTA CAATAGCCCT      4200
     TTGCTATTAG TACCCAAAAA GTCAAGCCCG AATTCTGATA AAAAGAAATG GAGATTAGTA      4260
     ATAGACTATC GCCAAATTAA TAAGAAACTT TTAGCTGACA AATTTCCACT ACCGAGAATA      4320
     GATGATATTT TGGACCAACT TGGTCGAGCA AAATATTTCT CCTGCCTTGA TTTAATGTCA      4380
     GGTTTTCATC AAATCGAACT GGATGAAGGC TCGAGAGATA TAACATCTTT CTCAACCAGC      4440
     AATGGCTCAT ATCGTTTCAC GCGATTGCCA TTTGGCTTAA AAATAGCGCC TAATTCATTC      4500
     CAAAGAATGA TGACTATAGC ATTCTCCGGA ATAGAACCGT CTCAAGCATT CCTTTATATG      4560
     GATGACTTAA TAGTCATAGG TTGTTCCGAA AAACATATGC TTAAAAACCT CACTGAAGTT      4620
     TTTGGTAAAT GCAGGGAATA CAACCTAAAG TTACATCCTG AAAAATGTTC ATTTTTCATG      4680
     CATGAAGTCA CATTTTTGGG ACACAAATGC ACAGACAAAG GAATTTTGCC GGATGACAAA      4740
     AAATATGATG TCATTCAGAA CTACCCAGTT CCACATGATG CGGACAGCGC TAGACGTTTT      4800
     GTAGCATTTT GCAATTACTA CAGACGTTTT ATCAAAAATT TCGCCGACTA TTCGCGGCAC      4860
     ATAACAAGAT TATGTAAAAA GAATGTTCCA TTCGAGTGGA CAGATGAATG TCAAAAAGCA      4920
     TTCATACATT TAAAATCTCA GCTAATTAAC CCAACACTCT TGCAGTACCC AGACTTCAGC      4980
     AAAGAATTTT GCATAACAAC AGATGCAAGC AAGCAAGCGT GTGGCGCAGT TTTAACTCAA      5040
     AACCATAATG GCCACCAACT CCCAGTTGCT TATGCATCCA GAGCTTTTAC GAAAGGTGAA      5100
     AGCAATAAGA GTACAACAGA ACAAGAGTTA GCAGCAATTC ATTGGGCAAT AATACATTTC      5160
     AGACCATACA TTTACGGAAA ACATTTCACT GTGAAAACAG ACCATAGACC ATTGACATAT      5220
     TTATTCTCGA TGGTGAACCC CAGCTCTAAA TTAACTAGAA TAAGGCTTGA ACTAGAGGAA      5280
     TATAATTTTA CAGTAGAGTA TCTAAAGGGC AAGGACAATC ATGTAGCAGA TGCGTTATCA      5340
     AGAATAACCA TCAAAGAGCT AAAAGATATA ACTGGAAATA TATTAAAAGT CACTACAAGA      5400
     TTTCAAAGTA GACAAAAATC CTGCGCAGGA AAAGAACAAT TGGATTTGCA AAAGCAAACC      5460
     AAAGAAATAG CTTCAGAGCC CAACGTATAC GAAGTCATAA CAAATGACGA GGTACGAAAA      5520
     GTAGTGACAT TGCAATTGAA TGACTCGATA TGTTTATTTA AACATGGAAA GAAAATTATT      5580
     GCAAGATATG ATGTTGGTGA TCTTTATACT AATGGAATTC TTGATTTAGA TCAATTTCTC      5640
     CAAAGGCTTG AATTGCAGGC CGGTATATAT GATATCAGCC AAATCAAAAT GGCACCGTGG      5700
     AAAAAAATCT TTGAACACGT TTCAATAGAT AAATTTAAAA ATATGGGCAA TAAAATATTA      5760
     AAGAATTTAA AAGTAGCGCT ACTTAACCCG GTGACCCAAA TAAATAATGA AAAAGAAAAA      5820
     GAAGCTATAT TGTCTACATT ACATGATGAT CCAATACAAG GAGGGCATAC AGGCATTACA      5880
     AAAACCTTGG CCAAGGTCAA AAGACATTAT TACTGGAAAA ATATGAGTAA ATACATAAAA      5940
     GAGTACGTAA GAAAATGTCA AAAATGCCAA AAAGCAAAAA CAACAAAGCA CACAAAGACT      6000
     CCAATGACGA TAACTGAAAC ACCAGAACAT GCTTTCGATA GAGTTGTTGT GGACACAATT      6060
     GGTCCACTAC CCAAGTCAGA AAATGGTAAC GAGTACGCAG TCACTCTCAT ATGTGATTTA      6120
     ACCAAGTACT TAGTTGCCAT ACCAATAGCA AATAAAAGCG CAAAAACAGT CGCAAAAGCT      6180
     ATATTTGAAT CTTTTATTCT AAAGTACGGT CCAATGAAGA CGTTCATAAC GGACATGGGA      6240
     ACAGAGTATA AGAATTCAAT AATTACTGAC CTGTGTAAAT ATTTGAAAAT AAAAAATATA      6300
     ACATCAACAG CTCATCACCA CCAGACAGTT GGAGTAGTAG AAAGAAGTCA TAGAACCTTA      6360
     AACGAGTATA TACGATCCTA CATATCGACG GACAAAACCG ATTGGGACGT ATGGCTTCAA      6420
     TATTTCGTAT ACTGCTTCAA CACGACCCAA TCTATGGTAC ATAATTATTG TCCATATGAA      6480
     TTAGTTTTCG GTAGAACAAG TAATTTACCA AAACATTTTA ATAAACTACA TAGCATAGAA      6540
     CCAATATATA ACATAGATGA TTACGCTAAG GAGAGTAAAT ATAGGTTAGA GGTAGCATAT      6600
     GCTCGAGCAA GAAAACTTCT CGAAGCACAC AAAGAAAAAA ATAAAGAAAA TTATGACTTA      6660
     AAAATAAAAG ACATAGAATT AGAAGTAGGA GATAAAGTTT TACTAAGAAA TGAGGTAGGT      6720
     CATAAATTAG ACTTTAAATA TACGGGGCCC TATAAGATAG AAAGCATAGG AGATAATAAC      6780
     AATATTACGC TACTTACTAA TAAAAACAAA AAACAAATAG TTCATAAAGA TAGATTAAAG      6840
     AAATTTCATT CATGATTGAA TTTAAACTTA TATTTTCCTT AATCATTTAC ACAAATTTTC      6900
     CATACACTAC GTATATTTTT ATCTTTGCAT TATAAAATCA ACTATTGTTG TTCAAACAAA      6960
     AACACAAACA AAATAAAAAT AAAAATAAAA TAATTTGCAT TTAATAATCA AAATAACTTC      7020
     ACTAGGTTAC GTTATTTTTC AAAAGGAGGG AGATGTAGTA TGTGCCTATG CAATATTAAG      7080
     AACAATTAAA TAAAATAGCA TATTAACTTA TGGCAGCACT TTGTTGCTAT GTTTATGTTT      7140
     ATGTTTATGC ACGCAGTTAG GCCAGGGCGG ATGTAACATG ATCACCCACT CGAAGGCCAC      7200
     AAAGTATAAG TGCATTGCCC AATCGAAGGC AAAAAGTATA AGTGCATGGT CAGCATTCAC      7260
     ACGCCGACCA AATACATATT ACATACGTAC ATACATATCT CGCTCTCCCG ATAAGCCTAG      7320
     ATATATAAGA TATACATAAG AACGCCGCTC CGCTGCTGGC GTACCCGGCA GCGCAGCTAC      7380
     GCGGATTAGC CTAAGTCCAA ATATATAAAA AACTGTAAAA TCGGAGAGAC TCTGTAGACG      7440
     TTGAGCTGAC AGAACCATTT CTGCCTACTC TAAAATCAAA AGAAGAAATT GAATAAATAT      7500
     ATGTCAGCCC GACGGCTGCC TTAAACTTAA AACGGACTTG TGTTCTTAAT TGGAGTTCAT      7560
     CATTACA                                                                7567
//
ID   DMAURA     standard; DNA; INV; 4581 BP.
XX
AC   nnnnnnnn;
XX
DR   FLYBASE; FBte0000112; Dmel\aurora-element.
XX
FT   source          nnnnnnnn:1..4581
FT   SO_feature      five_prime_LTR ; SO:0000425:1..324
FT   SO_feature      three_prime_LTR ; SO:0000426:4258..4581
FT   SO_feature      transcription_start_site ; SO:0000315:191..196
FT   SO_feature      polyA_signal_sequence ; SO:0000551:4482..4487
FT   SO_feature      primer_binding_site ; SO:0005850:331..346
FT   SO_feature      RR_tract ; SO:0000435:4247..4256
XX
CC   Composite sequence derived from AB022762, X70361 and X70362
CC   Assembly based on strategy described in PMID: 10333568
CC   Defective element with incomplete ORFs
CC   Casey Bergman, 21-June-2016.
XX
SQ   Sequence 4581 BP; 1102 A; 1074 C; 1456 G; 949 T; 0 other;
     TGTCGCGGAT CGAATATTGT TATCGATAGG CTCTAGTTAG TATTTTTGAG AAGTCCGAAT        60
     GTGGAAGGAT TTGTAAGCCC ATATGTGTCT GGGCACGTTG TTTTTGGCCA TTGTAAATTA       120
     CCGGGAAAAT TTAGCTTTTC ATTGTCGTGT AAGAGTTGGA GGACACACTG CGGTGAGCTA       180
     ATAAGTTAAG TTAGTTGCAA TTGTGAAACA TTGAATTCTT CAAGAATAAA ACGTGTTCTA       240
     CTACCACGGA TTAGTCTGCC CTTTCTTTCG GGAACCAATG TGTGGGGTAG CCGTTTAAGG       300
     CAACTCCCTG GACGCACGAC GACAACCTTT TATTCGCAGT CCTAGGGCGA CTGCAGGGGC       360
     AACTTGCGCT GGAATGACGG TTTAGACGGC CAGCTAGAGA GTTGCCGGAG CTGGAGTGAC       420
     GGTTTAGACG GCCAGCGAGG AGGATTTGTG TGAGCGCAGC CAGCGCTACG TACCGGCAGA       480
     GGAGTCGCAG TCAGCGACAT AGAGGGACGC AGCCAGCGTC GAACGCCGGT ACGAAAGGGT       540
     CGCAGCCAGC GACAAGGAGA CGCAAGAAGC GTCATTTGTG GAGACCGCAG CCAAGCATCC       600
     GTGGCCGCAG CCAGCGGCAC GAGGCGTCAG AGACGCCATT TCGGACGCGC AGAGGCGCCG       660
     CCATTTTTGG AGCTGGGAAA GATGCAGCAT TCCCCCAGGA AGAGTGCCCG GCTGAACGGA       720
     GGGGAAGTCA CCCCTATAAC AACAGTGAGT CAGCAGCCAG CCAGTAGTGG AGCAGGAACT       780
     CGGACGCGGG TGAACATCAC GGCGGCGTCG ATTCCTTGCC CGGCCACTAC GGTGACTACA       840
     GTAGCTTCCC AACCTAGAAG TACTGCTGTC ACAGCTGCGA GTTCAGTACC GGAGGTGAAC       900
     CAGCCCCTCG TGTTGGAACT CATGGAGAGG ATCGCAGCGT TGGAGAGGGA GCTGGAGAAG       960
     ACTAGATCCC TAGAAAGTGT GAGCACCGCC AATTGCGCGC CAATCGCAGT TGGCCCAAGC      1020
     GCAGTTGGCG CCAACAGTGG AGCGTCGGGG CGGCCGCCAT TTTGGAGCGG CCAGCTAATA      1080
     CCCACATCTA ACGGAGAGGC CTTACATAAC GGGGACTGGG CCAGGCATGC TGCAACGATT      1140
     GCGCCCTTTC CCACTGTAGT CCACTTCAGC GCGTGGCTAC AGGAGTACGC AAACGTGGTG      1200
     TGCACGGTTT TGGACGTCGA GGGAAAGGAG CCGAGGCGTC GACTTCTACA TGCAAGCGTC      1260
     GACCATAATG AATGCGATCA ACAGGATGAT CGGCATGGAG GTTGTCCCAT CTGTGGAGGA      1320
     CAGCATGAAA TATTGAACTG CAGAAAATTT ATTGGAGCTT CGCCACAGGA AAGGTGGAGC      1380
     AATGTGAAGA GGCATCGGCT CTGCTTCAAT TGCCTGCGAA GCGGGCACAC GGCTAGATCC      1440
     TGCTATACGC AAGGTGAGTG CCAGGTTAAT GGATGCCGAA GGGAGCATCA CCGTCTGCTA      1500
     CATGGTGCGG ACGGAGGAAC GAAGGCCGCT GCAGCGAGGT GGCTTCAGAC GCCACGAAGG      1560
     GAACCAGCAG CCAGCAGTTT CCAGACGCAG CCTAAAGGGG AGGCCTTCGC TACGAGATGG      1620
     TCACAGGGAC CAGGAGAGGA ACCGGCAGCC AGCCGTTCCA AGCAACAGTC TGGAGAGAGG      1680
     AGCTCCACGT GAAGCGGGAG CGCCCATGCA GAGGAATTTG AGCTGCGTTG ACGCCGAAGG      1740
     AGGCCGTCTA CTGTTCCGTA TACTGCCGGT TACGCTGTAC GGAGCGGGGC GAAAGGTGGA      1800
     TACATATGCG CTCCTAGATG AGGGATCCTC CGTCACGATG ATCGATGACG AACTACGAAG      1860
     GGATCTTGGA GTGCAAGGAG AGCGTCGGCA GCTAAATATC CAATGGTTTG GTGGTAAGGC      1920
     AACCAGAGAG CCTACCAACG TGGTGAGTCC GAAGATAAGT GGAGTTGGAA AGCCCACTCG      1980
     CCATGTATTG AGAAACGTTT ATGCCGTTTC GAGCTTGAGT TTGCCGATGC AGACATTGAG      2040
     CCGACGAGAT GTCCAGGGCG TGCACAGGGA TGCGCGTCTG CCCGATGAAG CCTTACAGCA      2100
     ACGTGGTGCC GAAGCTGCTC ATCGGTCTGG ATCACGGACA TCTGGGGTTG CCACTTAGGA      2160
     CGAGGCGGTT CGCTCGAGAG GGACCGTATG CGGCCGCAAC CGAGCTGGGC TGGGTTGTGT      2220
     TTGGGCCTGT AAGTGGGCAA CCGACCACGC CGTCACCGAG GTCCTGCCTA CTTGCCGTGT      2280
     CAGTGGATGA CGCGATGGAG AAGATGGTGG AGGACTATTT CGACATGGAG AACTTTGGAG      2340
     TGAAGACCGC GCCGCCGGTC GCAGCCAGCG ACGATGTCCG GGCCCAAAGG ATACTCGAAG      2400
     ACACCACGGT GAAAGTGGGG CGTCGCTACC AGACGGGATT ACTCTGGAAG GACGACCACG      2460
     TTGTGCTGCC ACCGAGATAT GAGGACGACG ACGTGCAAGT GAGCTTCGTG AGTGCGAGGA      2520
     CGAAGTGTGC CCCAATGAGA ACGATGACGA TCCCACGGCT GGAGCTGCAA GCAGCAGTTC      2580
     TTGGAACCAG GCTGATGAAC ACTGTCAAGG AGGAGCACAG TGTGGTCATC ACGGACCTGG      2640
     TGTTATGGAC GGACTCTAAG ACGGTGCTGA GATGGATCGG CAGCACCCAC CGCCGCTGAC      2700
     AATGCGGCTG ATGATGCGAC GCGGTCGCAG AAAAGGAGTC GACCTTAGCC AGGAATCAAG      2760
     GTGGCTAAGA GGACCTGCAT TTTTGATGCA GCCAGCAGCC AGCTGGCCGG GGTCTGAGGA      2820
     AGGAACTGAG CGTGTTCCAG ATGTCCCTGA TGAAGAAGAG ATGCCCAGTG AGTTTGCATT      2880
     AGTTGCGGTA GACGATTTTG TCATTCCGTT TCAGAGATTC TCGAGCTTCA GTCGCCTGGT      2940
     GAGGACCACA GCCTGGGTCC TACGGTTTGC GCGCTGGTGC CGCAAACAGC GAAACGATCT      3000
     CGAGGAATAC GGCCTTACCG CAGCCAGAAT GTAAGGCCGC CGGAACCGCA CTGTGCATCC      3060
     CGTACAGTGC GAGGAGGGCC GTATTACTGT CACACAGGCA CAGTCTGACG GAGCTGATTG      3120
     TGAGAGACTT CCACGCCAGG ATGAAGCATC AAAATGTGGA TGCTACGATC GCGGAGATCC      3180
     GGACAATGTT CTGGGTCACA AAGATGAGGC GTGTGATGCG GAGAGTCATC TCATCGTGCA      3240
     ACGAGTGCAA GTTGCAGCGA GCGCGGCCGA TGCCGCCGAT AATGGGACCC CATCCGGAAG      3300
     ACAAACTGGA TGCGGGTGGA TGGCCATTCA AATACACAGG ACTGGACTAC TTTGGGCCAC      3360
     TGCTGGTGAC TGTGTCCCGT CACAAGGAGA AGCTTGGGTC GCCTTGTTTA CGTGTTTGAC      3420
     GACAAGGGCG ATTCACCTGG AGCTGGCGCA TGACCTGTCG ACGGATTCCT GCATAATTGC      3480
     GATCAGGAAC TTCGTCTGCC GTAGAGGGCC AGTATATAGA CTGCGCAGCG ATAACGGCAA      3540
     GAACTTCGTG GGAGCTGACA GGGAAGCCAG GCGCTTTGGC GACGTATTCG AGATGGAGAA      3600
     GCTTCAGAGT GAGTTGACAA GCAGAAGCAT TGAATGGGTG TTTAATTGTC CAGCGAACCC      3660
     GTCTGAGGGC GGAGTTTGGG AGCGCATGGT GCAGTGCGTC AAGAGAGTAC TGCGTCATAC      3720
     CCAGAAGGAA GTTGCGCCGA GGGACCATGT ATTGGAGAGT TTCCTGATTG AGGCGGAGAA      3780
     TATTGTAAAC TCGCGTCCGC TCACCCACTT GCCTGTGGAT GTGGACCAGG AGGCGCCGTT      3840
     GACGCCAAAC GATCTTCTCA AGGGAGTAGC CAATCTGCCG GATACGCCTG GATTGGATGC      3900
     GGAGCTGCCC AAGGAAGGTA CTACGAGGAA GCAGTGGAGA ATTTCTCGCC TGCTACGAGA      3960
     CCGTTTCTGG AGGAAGTGGG TCATGGAGTA CCTGCCTACG CTTGTGCGCC GCGAGAAGTG      4020
     GTGCCGACGA ACGGAGCCCA TCCACCAGGG TGATGTGGTC TTCGTCTGCG ATCCTGCCTT      4080
     GGCCCGACGA GAGTGCCGCA AGGGTATCGT GGAGGAGATC TACAGCGGAG CTGATGGAGT      4140
     TGTCAGACGC GCTAAGGTGC GCGTGAACGA AAACGGCCTA TCTAGGACAA TGATGCGACC      4200
     CGTCTCTAAA CTTGCAGTTA TGGATTTGAG TGAAGCGGTT CTTCACGGGG TCGGGGATGT      4260
     CGCGGATCGA ATATTGTTAT CGATAGGCTC TAGTTAGTAT TTTTGAGAAG TCCGAATGTG      4320
     GAAGGATTTG TAAGCCCATA TGTGTCTGGG CACGTTGTTT TTGGCCATTG TAAATTACCG      4380
     GGAAAATTTA GCTTTTCATT GTCGTGTAAG AGTTGGAGGA CACACTGCGG TGAGCTAATA      4440
     AGTTAAGTTA GTTGCAATTG TGAAACATTG AATTCTTCCA GAATAAAACG TGTTCTACTA      4500
     CCACGGATTA GTCTGCCCTT TCTTTCGGGA ACCAATGTGT GGGGTAGCCG TTTAAGGCAA      4560
     CTCCCTGGAC GCACGACGAC A                                                4581
//
ID   DMBARI1    standard; DNA; INV; 1728 BP.
XX
AC   X67681; S55767;
XX
DR   FLYBASE; FBte0000034; Dmel\Bari1.
XX
FT   source          X67681:1..1728
FT   SO_feature      terminal_inverted_repeat ; SO:0000481:1..28
FT   SO_feature      terminal_inverted_repeat ; SO:0000481:1701..1728
FT   SO_feature      CDS ; SO:0000316:379..1398
FT                   /name="Dmel\Bari1\ORF"
FT                   /db_xref="FLYBASE:FBgn0043784"
FT                   /db_xref="SPTREMBL:Q24258"
FT                   /db_xref="NCBI_PROTEIN:CAA47913.1"
FT                   /translation="MPKTKELTVEARAGIVARFKAGTPAAKIAEIYQISRRTVYYLIKK
FT                   FDTVGTLKNKKRSGRKPVLDQRQCRQILGVVAKNPSASPVKIALESKNTIGKQVSSSTI
FT                   RRRLKEADFKTYVVRKTIEITPTNKTKRLRFALEYVKKPLDFWFNILWTDESAFQYQGS
FT                   YSKHFMHLKNNQKHLAAQPTNRFGGGTVMFWGCLSYYGFGDLVPIEGTLNQNGYLLILN
FT                   NHAFTSGNRLFPTTEWILQQDNAPCHKGRIPTKFLNDLNLAVLPWPPQSPDLNIIENVW
FT                   AFIKNQRTIDKNRKREGAIIEIAEIWSKLTLEFAQTLVRSIPKRLQAVIDAKGGVTKY"
XX
CC   Derived from X67681 (g7640) (Rel. 36, Last updated, Version 6).
CC   Takis Benos and Michael Ashburner, 20-Aug-1997.
CC   Any changes to original sequence record are annotated in an FT line.
XX
SQ   Sequence 1728 BP;  596 A; 291 C; 332 G; 509 T; 0 other;
     ACAGTCATGG TCAAAATTAT TTTCACAAAG TGCATTTTTG TGCATGGGTC ACAAACAGTT        60
     GCTTGTGCAG CAAGTGGGGG GAGGTGAAAT GCAAAAAAAC TTTTGCTTTT GCAAATTCAA       120
     ACCTATGCAG AGTCAGATGA AAGAAGAATT GAAAAAATAA CTGTTCCTAT GCGCAAGGAA       180
     GAGGCAAATG AAGAGATCTT TATCAGTTGT CAGAAGTATT TGCACACGGT TTCGTCGCAT       240
     CACAATTATT TTCACAACGC AATTTCTTCT TCAGTGATTG GTTTAGAGTG ACAAGTGCCG       300
     GTTTGTTTGC TTAAATACAT TTAAATTATT GAATAAAAAT TAGATTTAAT CATTTTCCTA       360
     TTACAGTTAT TAAATAAAAT GCCCAAAACA AAAGAGTTAA CAGTTGAGGC CCGGGCTGGT       420
     ATTGTTGCTA GGTTTAAAGC CGGTACACCT GCGGCCAAAA TAGCTGAAAT ATATCAAATT       480
     TCGCGTAGAA CTGTCTACTA CTTAATAAAA AAGTTTGATA CAGTTGGCAC ATTAAAAAAT       540
     AAAAAAAGAT CAGGCCGAAA ACCTGTGCTG GACCAAAGGC AATGCAGGCA AATACTTGGA       600
     GTTGTGGCGA AGAATCCTAG TGCCAGTCCG GTAAAAATTG CCTTAGAATC AAAAAATACA       660
     ATTGGCAAAC AAGTTAGTAG TTCTACAATT CGTCGCAGGC TAAAAGAAGC TGATTTTAAG       720
     ACATACGTTG TTCGCAAAAC GATTGAGATC ACACCAACCA ACAAAACAAA ACGTCTTCGA       780
     TTTGCGTTGG AATATGTTAA GAAGCCTCTT GACTTTTGGT TTAATATTTT ATGGACTGAT       840
     GAGTCTGCAT TTCAGTACCA GGGGTCATAC AGCAAGCATT TTATGCATTT GAAAAATAAT       900
     CAAAAGCATT TGGCAGCCCA GCCAACCAAT AGATTTGGTG GGGGCACAGT CATGTTTTGG       960
     GGATGTCTTT CCTATTATGG ATTCGGAGAC TTGGTACCGA TAGAAGGAAC TTTAAATCAG      1020
     AACGGATACC TTCTTATCTT AAACAACCAT GCTTTTACGT CTGGAAATAG ACTTTTTCCA      1080
     ACTACTGAAT GGATTCTTCA GCAGGACAAT GCTCCATGCC ATAAGGGTAG GATACCAACA      1140
     AAATTTTTAA ACGACCTTAA TCTGGCGGTT CTTCCGTGGC CCCCCCAAAG CCCAGACCTT      1200
     AATATCATTG AAAACGTTTG GGCTTTTATT AAAAACCAAC GAACTATTGA TAAAAATAGA      1260
     AAACGAGAGG GAGCCATCAT TGAAATAGCG GAGATTTGGT CCAAATTGAC ATTAGAATTT      1320
     GCACAAACTT TGGTAAGGTC AATACCAAAA AGACTTCAAG CAGTTATTGA TGCCAAAGGT      1380
     GGTGTTACAA AATATTAGTA TTGTATTTAT ATAAAATAAA GAAATTCTTA TGTTGAAATT      1440
     AGATGTTAAG CTGAAATTTA CTAAATTAAG TTGAGTGAAA ATACTTTTGA AGCGCAATAA      1500
     ACATGTGAAA ATACTATTGA CAACTTGCAT GCATATTTTC TTTTGCTTTA AGCTTTGTAC      1560
     TATGAACCGT TATCTTTCGT ATTTCTTTTC GACTACCTTC TGCATAGATC AAGCTAAGCG      1620
     ATAAGAACTA TTTCAGGCAA ATCGGACAAC AACAAGAAGA AATATAACAA AAAGAAGTTG      1680
     AAGTTTGCAA ATATTGTGCG TTGTGAAAAT ACTTTTGACC ACCTCTGT                   1728
//
ID   BS     standard; DNA; INV; 5142 BP.
XX
AC   nnnnnnnn;
XX
DR   FLYBASE; FBte0000780; Dmel\BS.
XX
FT   source          nnnnnnnn:1..5142
FT   SO_feature      CDS ; SO:0000316:341..2248
FT   SO_feature      CDS ; SO:0000316:2245..2965
XX
CC   Sequence identified by REPBASE:
CC   http://www.girinst.org/server/RepBase/RepBase6.6.embl/drorep.ref
CC   Assembled and annotated by Josh Kaminker & Michael Ashburner.
CC   REPBASE states this to be a consensus sequence.
CC   This replaces that from complement(X77571:651..5776) in versions
CC   previous to 4.8.
XX
SQ   Sequence 5142 BP; 1652 A; 1222 C; 1075 G; 1193 T; 0 other;
     AAATCTGCAT TCATAGAGAT CGGTTGTGTC GCGCGTATGC AAAAGTGATC TATTTTGCTT        60
     TATTGTTGCA ATTTCTTGGG TGCTTAAAAT AGCACTCACC AGTACATTCG GGCGCTGCTT       120
     CGTGCGGTGT CGGCATCTGG CCAACAACAA AAAGCGTTAA TCGAAGTGCG GTGTAGCTAC       180
     GATACCTGCC CTTCGGGCAA CTTATTCCCC TCACCCCGCG CAAAGCCGCT GAAGGGGGCA       240
     ATAAAATCTA TGCTTATCAG CAAAACTGAT CCGTATTTGA TCTGTTTTGT GGTCAGTTAA       300
     GCAAGCTATT TTGTAAATAT TAAGAATTAT TATTAAGACA ATGGATGAGA ACAATTCTGA       360
     TGACACCCAG CTTTTAAATA AGCAGAGTAA CCATAGAACA ATGTTCTCAA TAGCTGGCAA       420
     ATTACCTCAC GAGATTAGAA ACGAGTGCCG ATCAGCAATT CAACGCTTTA CAAGCAGCGT       480
     AACTCAAAGC AGTAGCGTCA CCACAACAAC GGTGACATTT ACTAGTGCCA ATAACAGCAC       540
     CATATATACA ATGGCAAATG CCGCAATAAG CAGCCCGTGC CTTGGAACAA GATCCACTCA       600
     CCAGGAAAGT TCCACATTGA TAAACTCCGG AATCGTAGAA GATAATCTCA GCGATGCTGC       660
     CAGAAGGTTA TTAAATGACC AAAATCAGAG AGCGGGTAAA AGGAAAAATG GAAAGCCCTT       720
     GTCCCCCATC TCCAACCCGA AAAGAGGGAG TAGCAGCCAA GTTTTACACT CGCCCCCTAC       780
     GACTAGCCTG AAGATAAGCT CTAATAATAG GTTTGCCATT CTGGACACGG ATATTTCTAC       840
     TAACGAAGAA AGCGTGGAAG GCATGATGAT AGAGGGTGCT GATATTGACA GTGCCCATAT       900
     GGATGATTCT CAACTCGATG GTTCCAATAC TGGTCGAAAC TTGCAGGAAA CACACAATAC       960
     AGCCAATCAA CTTAATGATC ACAAAAAACC ACCACAAATT GTTGTAAATA TCAGAAACTT      1020
     GAATGATCTG TTTGAGCTTA TAAAAGAAAA GACAAGCTTA GATAACGTTG TCGTTAAAGC      1080
     TAATCAAGGG GAAACGGTCA GAATATTTCC AAAAGACAGC GACACTTACA GGAAAATAGT      1140
     GAGCCATATG GATGACATTG GTATTCAGTT TCACACTTAC CAAATGCTGA CAGATAAGCC      1200
     ACACAGAATT GTAGTAAGGG ACTTACATCA CAGTACATCA AACAAAGACA TAACCGCCGA      1260
     TCTGAAATGT TTAGGCTACG AAGTGCTCCA CATTCACAAC CCTAGTTCTA GGACTAATAA      1320
     GGACGAAAAA CTAAACATCT TTTTCATTAA TATAAAGCCC TGTGCAAAAA TTAATGAAAT      1380
     TTACCATGTC AAGACCCTTT GCCGACAGAA AATACGGATT GAAAGGATGA GAAAGTCTTC      1440
     TGAAATTGCG CAATGTCGTC GTTGTCAGGA GTACGGCCAT ACAGCTAAAT ACTGCCGCAG      1500
     ACACCCAAAT TGTGCCAGAT GTGGCGAAAA TCACCAAACC ATGCAATGCA CCCGACCGAT      1560
     AGACGCACTG CCCACATGTT ACCATTGCTC TGAAAATCAT ACGGCTAGCT TCAAAGGTTG      1620
     CCTAAAGTAT CAGGAGCTTC TTCGCAGATC TATGGGGCCT GCAAGAAATG GAAACAGGTT      1680
     AAATAAGAAC ACCCATCATC ACTCTCCTAG AGACCGGCAA GAGCTTCCTG CCTTGCAGCC      1740
     CAATTACCGC AAGAACAACA CCCAATCAAC AGTACAGCAG TTATCGACAC AACCACAGCT      1800
     TAATTTTGCC CAAAGCCAAC CATCTATAGG CACTGGTGGA AACAGAGCAG TATCCTATGC      1860
     TACAGTAGTA AAAGGATACC CAAAAATAGC GCCCTCCAAG GACGGACCAG CCCAGCGTCA      1920
     ACGCTTAAAC AACCCACAAA CGAAACAAAT ACTGCAGCAA CACCGATCGA ATACACAGCA      1980
     GAATAACTCA TCTGATGTGC AAGTATTCTT ACAACAGCAA CAACAACAGT TTCTGGAATG      2040
     GCAACAGCAG ATCCAACAAC AACAACACCA ACAGTTTCTT ATGTGGTTGC AACAGCAGCA      2100
     GCAAGAACAA CTACAGTATA AAAGCCAAAC CAATCAACGA CTGGAAAAGC TTGAAAAAAT      2160
     GGTTCTTGAA CTAGCGAATA TGTTAAAAGA ATGGGCTGGG AGTGAACTTA AGCCCCAGCT      2220
     CTTTAACAAC GTCTCAGCCT CCCTATGAAT CCACTAAAGA TTCTTATTTG GAATGCTAAC      2280
     GGCATTTCAA GAAAAGCCAA AGATGTTGAG CTGTTCGCGC ACAACAAAAA GATAGACATC      2340
     CTTCTTGTGA CTGAACTAAG ACTCAAAAGA GGGGAAACTG TAAAGATATA TGGATATGCG      2400
     TACTATCCAG CATATAGGCC ATCCCTTAAT AATAATAGTG TTGGCGGAGT AGCGGTGTTC      2460
     GTGAGGACAA CTCTTCGCCA CTTTCCACAA AGGGTCATTG AGACACGCCA CATACAATTG      2520
     TCATCAGTAA AAGTAGCCAC AGGACTCGGG GACCTGCAGT TTAGCGCTAT TTACTGCTCC      2580
     CCAAGTACTA GAATCGAGGA AAGACATTTT ACTGACATAA TACGCGCCTG CGGCCAAAGG      2640
     TACTTGGTAG GTGGCGACTG GAATGCCCGC CACTGGCTTT GGGGCGACAC TTGCAATTCA      2700
     CCTCGCGGGC GGGAACTAGC AGAAGCCTTG TCCGTGACTG GAGCTAAGAT CCTCGCAACT      2760
     GGCTCTCCGA CAAGGTATCC GTATGTGCCC AGCCATACGC CCTCATGCAT AGATTTCGCA      2820
     GTGTATCATG GTATACCAGA CCACCTAGCA ACTATAACAC AAAGCTGGGA CTTGGATTCT      2880
     GATCACTTGC CTCTTATCAT TAGCATTGAG ACAGACAGTA TTCATGTCAA TCCAAGTCCC      2940
     AGGCTAGTCA CCAAACACAC TGACCTCCTT GCCTTTAGCC GACAATTGGA GAGCCTTATT      3000
     TCGCTGAACA CCACGCTTAA TTCTGGTGAG GAAATTGAAA TGGCTGTTGA CAACCTAACT      3060
     GAAAGCATAC ATAGGGCCGC GGCTGTCTCT ACTTCTCCCG TCCCTCGGAT AGGCACCACA      3120
     TATGGGATAG TCTTGACAAG AGAGGCTAGA GAGCTTCTGA CACAGAAAAG AAGACTCCGA      3180
     AGGCGAGCAA TCCGATCTCA AGACCCCTGG GACCGACTTT TATGGAACCG TGCTGCAAAG      3240
     CAACTACGAA ACGTCCTCAG AGAACTTCGA AGCAACTTTT TTGAGCAGAA ACTAGCTAGT      3300
     ATGGACTACA CAGTGGATGC TGGATACTCG CTATGGAAAT GCACCAAGTC CCTTAAAAGA      3360
     CAGCCGTTTA GACAGGTTCC TATAAGGTGT CCGGGAGGCG AACTTGCTAA AAATGAAGAG      3420
     GAGCAGGCTA ATTGTTTTGC AAATCATCTG GAGACAAGGT TCACCCACTT CCAATTCGCT      3480
     ACAACGGAGC AGTATCAAGA GACGCTTGAT AGCCTAGAGA CACCTCTGCA AATGTCACTA      3540
     CCCATTAAGC CCATCAGGGT TGAGGAAATT GTCGAAGCTA TCAAATCTCT TCCGTTAAAG      3600
     AAGTCTCCTG GCATCGACAA CGTTTGCAAT GCCACACTAA AAGCACTACC TGTTCGAGCA      3660
     ATTCTCTACT TGGCGCTGAT ATATAATGCC ATACTCAGGG TGCAGTTTTT CCCAAAGCAG      3720
     TGGAAAATGG CAGCAATCCT AATGATACAT AAGCCTGGTA AACCTGAAGA GAGCCCTGAA      3780
     TCGTACCGAC CCATAAGTCT TTTATCTTCG CTATCCAAGC TATGGGAACG ACTGATTGCC      3840
     AACAGATTAA ATGACATTAT GACCGAGCGT CGTATCCTGC CGGATCATCA GTTTGGCTTT      3900
     CGTCAGGGAC ACAGTACTGT GGAGCAGGTA CACAGACTGA CAAAACATAT CCTTCAGGCC      3960
     TTTGATGATA AGGAATACTG CAATGCTGTG TTCATTGACA TGCAACAGGC ATTCGATAGG      4020
     GTCTGGCATG ACGGCCTTAT CAGCAAAGTT AAAAAGTTAT TCCCAGCACC ATACTATGGA      4080
     GTCCTAAAAT CATACTTGGA AGATCGGAGA TTCATGGTCA GGGTCAGAAA CTCCTACTCG      4140
     ATTCCCCGCG TTATGAGAGC TGGAGTTCCG CAGGGCAGCG TACTGGGACC GTTGCTCTAC      4200
     TCAGTATTTA CTGCAGATCT GCCCTGCCCA AACGCCTATC ATATGGCAGA TCCCAGGAAG      4260
     GCCCTTCTTG CTACGTACGC TGACGATATT GCCCTGCTGT ACAGCTCTAA TTGTTGCAAC      4320
     GAGGCAGCAA GGGGTCTCCA AGAGTACCTC ACCACTCTGG CTGCATGGTG CAAAAGATGG      4380
     AATTTAAAGG TCAATCCGCA AAAGACCATC AATCCCTGCT TCACCTTGAA GACCTTAAGT      4440
     CCCGTCACCG CACCCATAGA GCTGGAAGGT GTAATCCTAG ATCAACCTTC ACAGGCTAAG      4500
     TACCTCGGGA TTACCCTTGA TAAACGGTTG ACTTTCGGCC CGCACCTGAA AGCTACGACT      4560
     CGGAGATGTT ATCAAAGGAT GCAACAACTT CGATGGCTGT TAAACAGAAA AAGCACCATG      4620
     ACACTGAGAG CCAAAAGAGC AGTCTACGTC CACTGCGTAG CCCCGATCTG GCTGTACGGA      4680
     ATACAGATCT GGGGTATCGC AGCAAAATCC AACTACAACC GCATTCAGGT ATTGCAAAAT      4740
     CGTGCCATGC GTGCAATTAC AGACTGCCCA TACTATGTAC GTGGCACTAC CCTTCACCGT      4800
     GATCTGAATC TTCATACAGT GGAAGAGCAG ATCTCCAGGC ACACCAGCAG ATATAGTGAT      4860
     AGACTAAGAC GACACCACAG TATACTTGCT AGACGCTTAC TCCCTGCTAG GCCTCTAAGG      4920
     AGATTAAAAA GGAAGGGTTT CGCCAAAACA CTTGGACAAC CCTAAAGACC CCCTCGAAAT      4980
     ATGAGACAAA GTTGTAAGTC CTCACATGAT TAGTGAGAGG TTTGGTTCTA TCTTTTATAT      5040
     GTTAATTGCG CTGTTATGTT ACTGTTATTG CATTGTATTG ATTCATCGCT TCTAAATAAA      5100
     TAATAAAAAA AAAAAAAAAA AAAAAAAAAA AAAAAAAAAA AA                         5142
//
ID   DMU89994   standard; DNA; INV; 6411 BP.
XX
AC   U89994;
XX
DR   FLYBASE; FBte0000739; Dmel\Burdock.
XX
FT   source          U89994:1..6411
FT   SO_feature      five_prime_LTR ; SO:0000425:1..275
FT   SO_feature      three_prime_LTR ; SO:0000426:6136..6411
FT   SO_feature      CDS ; SO:0000316:564..2057
FT   SO_feature      start_codon ; SO:0000318:1..3
FT                   /name="Dmel\Burdock\gag"
FT                   /db_xref="FLYBASE:FBgn0043782"
FT                   /db_xref="SPTREMBL:O01350"
FT                   /db_xref="NCBI_PROTEIN:AAB50147.1"
FT                   /translation="MSDSDNLLDNLVSSLNKWSAHQASRQNSAEKNNKSSDNWWSKTKT
FT                   TSEMEFEAQLKAIVESAVAGALAVQKQSFEKQLQEMNERIGKLTVNTPEVETYVDAEIR
FT                   PGVVCSEPLDILKSLPDFDGKSETYVSWRKAAHVAFKVFKDYEGSSTFYQALGIMRNKI
FT                   KGPANTVLASFNTPLHFKAMISRLDFTYSDKRPIYLIEQELSTLRQGDMTLTEFYDEVE
FT                   KKLTLLTNKTIMTFDSALAMSLNEKYRTDALRVFVTGAKKSLSDILFAKGPKDLPTALA
FT                   LAQEVESNHERYQFALIYSKNIGDRGQKIEQRHSDKDRNSIMPMQTKNPYFSKRQVHTY
FT                   DNQERQDPVQLTNPDVSMRSRRTGNFGQTPFPTQGNIWPSQQQNSWPSQQQYSWPSQQQ
FT                   NSFRTQNQFASQPQQQNTSQAQGHFGYAQASKRPTSGSARFTGPKQQRINYLPHEKGQC
FT                   EEDTDGYQKEAEAEVDDYEDELVNYDHVHFLATNPCYRT"
FT   SO_feature      CDS ; SO:0000316:<1994..5119
FT   SO_feature      start_codon ; SO:0000318:1..3
FT                   /name="Dmel\Burdock\pol"
FT                   /db_xref="FLYBASE:FBgn0043781"
FT                   /db_xref="SPTREMBL:O01351"
FT                   /db_xref="NCBI_PROTEIN:AAB50148.1"
FT                   /translation="GRTSELRSCSFFSHKSLLPYIEREIAGRTIKLLIDTGASKNYIQP
FT                   LPELKNIMPVQNKFTVKSLHGCNTVKQKCFIKLFNTSVQFFILPSLSSFDAIIGLDLLK
FT                   QGNATLDFKNKTLNINNEVESIQFLRCDSVNFANIENIVVPNQISNKFHTMLRNRLAVF
FT                   AEPEEALPYNTNIVATIRTEDDQPIYSKLYPYPMGVSDFVNKETHALLKDGIIRPSSSP
FT                   YNNPVWVVDKKGTDEEGNTKKRLVIDFRKLNLKTIDDKYPIPNVVWILSNLGKARFFTT
FT                   LDLKSAFHQILLAEKDRAKTAFSVGNGKYEFCRLPFGLKNAPSIFQRAIDDVVRDRIGK
FT                   SCYVYVDDVIIFSNGIEDHVNDVAWVLDRLSGANMRVSKEKSFFFKESVEYLGFMVSSG
FT                   GITTSPSKVEAIQKYNQPTNLFSVRSFLGLASYYRCFIKDFASIARPLTDILKGENGKV
FT                   SASQSKKIPISFDERQCSAFEKLKNVLVSENVMLLYPDYRKAFDLTTDASAFGLGAVLS
FT                   QDGKPVTMISRTLQDRELNFATNERELLAIVWALKSLRNYLYGVKNLNIFTDHQPLTYA
FT                   VSDRNPNAKIKRWKAFIDEHNAKIFYKPGKETYVADALSRQAIHVLEDEPQSDIATIHS
FT                   EISLTFTIETIDKPVNCFRNQIVIDEGTADSTRTFVIFGSKTRHLIQFLDKETLIGRIR
FT                   DVVKPDVVNAIHCELPVLAFIQNSLVNDFPATTFRHTMKMVSDIFNQTEQREIVSLEHN
FT                   RAHRAAQENVKQILQYYFFPKMSQIAATFVSNCLVCQKAKYDRHPQKQILGRTPIPSHV
FT                   GETLHIDIFSTGRNYFLTCIDKFSKFAIVQPIGSRTITDLEPAIMQLMNFFPHSKTIFC
FT                   DNEPSINSESIKSLLKNRFNVDIANAPPLHSTSNGQVERFHSTLLEIARCLKLDSGMND
FT                   TVNLILQATIEYNKTVHSVTNRRPIDIIHSTPPELANEIVEMVNEAQEKQLRRENVTRR
FT                   DRTFEVGETVMVKQNNRLGNKLTPRYREELIEADLGTTVLIKGRVVHKDNLR"
XX
CC   Derived from U89994 (g1905850) (Rel. 51, Last updated, Version 1).
CC   Takis Benos and Michael Ashburner, 20-Aug-1997.
CC   Any changes to original sequence record are annotated in an FT line.
XX
SQ   Sequence 6411 BP;  2219 A; 1259 C; 1204 G; 1729 T; 0 other;
     AGTTAACACA ATCACAAAAC ACCCGAAATA TAGTCGTAAG CCTCAAGTGC TTTTCCCATC        60
     TATAGATCGA GCTTTACCTA TAAGAAACTG TAACTTGTTA AGCTTTAGAG ATAAGAACTC       120
     TTGCTATACT TAAGTCAGTC GATTTTGGAA GATTAGAAGC GTCGGTCATC GCCACGTACT       180
     TACTATTCGT CTCATTAAGT GCAGACCGCG CAAGCCTATT GTAATTAATA AACTTACGCT       240
     AATAAATATA TGGAAAATCT ACTAAAATGA TAATTGGCGC CCAAACGGAT ATAAAAACCT       300
     ACGATAACTG AATAATTATA AATAAATAAC AAAAGGAGGA TCCGGAGACA AAACCAGCGG       360
     CTTTGGCTAA TTAACTCTAA CCTAAGAAAT AAAAATTTGC TGATTACATA AAATATAATA       420
     TTAATTACTA AGACCATCTA CCTTAAAATT GTTTGTTAAT CACTATTATT ATATTGTAAG       480
     TATAACGCTT ATTGAACGAA TTAAAAATAT TATTATTATT ATTATATTAT AACCTATGCA       540
     AAGAGTATTG ATAATAAAAA TACATGAGTG ACAGTGATAA CCTTTTAGAC AACCTAGTGT       600
     CAAGCTTAAA TAAATGGTCA GCGCACCAGG CAAGTAGGCA AAACAGTGCA GAAAAAAATA       660
     ATAAGTCATC AGATAATTGG TGGTCAAAAA CAAAGACAAC TAGCGAAATG GAATTTGAAG       720
     CTCAGTTAAA AGCGATCGTA GAGAGTGCTG TTGCCGGTGC GCTCGCAGTC CAAAAACAAT       780
     CATTTGAAAA GCAATTGCAG GAGATGAATG AGCGAATCGG GAAATTAACA GTGAACACCC       840
     CAGAGGTGGA AACTTATGTA GATGCTGAAA TTAGACCAGG TGTTGTCTGT AGCGAGCCTC       900
     TAGATATACT TAAATCTCTG CCAGATTTTG ATGGCAAAAG TGAAACATAT GTGTCGTGGA       960
     GAAAAGCGGC TCATGTCGCT TTTAAAGTTT TCAAAGATTA CGAGGGAAGT TCAACATTTT      1020
     ACCAAGCTCT TGGTATTATG CGAAATAAAA TAAAAGGTCC AGCGAATACA GTATTGGCTT      1080
     CTTTTAATAC TCCGTTACAT TTCAAAGCAA TGATCAGCCG TCTTGATTTC ACATATTCTG      1140
     ACAAAAGGCC GATCTATCTA ATCGAACAAG AGCTATCAAC TTTGCGACAG GGAGACATGA      1200
     CTCTTACTGA ATTCTACGAT GAAGTCGAGA AAAAACTGAC CCTACTTACC AACAAGACAA      1260
     TAATGACATT TGATAGTGCC TTGGCGATGT CACTGAATGA AAAGTACAGG ACGGACGCGT      1320
     TACGTGTATT TGTAACCGGA GCTAAGAAAT CGTTGAGCGA CATTCTTTTT GCAAAAGGTC      1380
     CAAAAGATTT ACCAACTGCT CTCGCTTTAG CGCAAGAGGT CGAGTCGAAC CATGAGCGTT      1440
     ACCAATTCGC CCTTATTTAT TCTAAAAATA TTGGAGACAG GGGTCAGAAA ATCGAACAAA      1500
     GGCACAGCGA TAAGGATAGA AACTCAATCA TGCCCATGCA AACTAAAAAC CCATATTTTA      1560
     GCAAGCGTCA GGTGCATACT TATGATAACC AGGAAAGACA AGATCCAGTC CAGTTAACAA      1620
     ATCCTGATGT ATCCATGCGA TCTAGAAGAA CTGGAAATTT TGGACAAACT CCATTTCCGA      1680
     CTCAGGGAAA TATTTGGCCA TCCCAACAGC AAAATTCTTG GCCATCTCAA CAACAATATT      1740
     CTTGGCCATC CCAACAACAA AATTCATTTC GAACACAAAA TCAATTCGCA TCGCAACCCC      1800
     AACAGCAAAA CACAAGTCAG GCTCAGGGAC ATTTTGGGTA TGCGCAAGCA TCAAAAAGAC      1860
     CAACGAGTGG CAGTGCAAGG TTTACAGGGC CAAAACAGCA GAGGATCAAC TACTTACCTC      1920
     ATGAGAAAGG TCAATGTGAG GAAGATACAG ACGGTTATCA AAAGGAGGCA GAAGCGGAGG      1980
     TTGATGATTA TGAGGACGAA CTAGTGAATT ACGATCATGT TCATTTTTTA GCCACAAATC      2040
     CCTGCTACCG TACATAGAAA GAGAGATAGC AGGGAGAACC ATAAAACTTT TGATTGACAC      2100
     CGGGGCTTCG AAAAATTACA TACAGCCCCT CCCTGAATTA AAAAACATAA TGCCGGTACA      2160
     AAATAAATTC ACGGTAAAAT CGCTTCATGG TTGCAACACC GTCAAACAGA AATGCTTTAT      2220
     TAAGCTATTT AACACATCTG TTCAATTCTT TATTCTTCCA AGTCTCTCTA GTTTTGACGC      2280
     AATAATAGGA CTTGACCTTT TGAAACAGGG AAATGCAACG TTAGATTTTA AGAACAAAAC      2340
     GTTGAATATC AACAATGAAG TGGAATCTAT TCAGTTTTTG AGATGTGACA GCGTAAATTT      2400
     CGCCAACATA GAGAATATTG TGGTTCCAAA TCAGATATCT AATAAATTCC ATACAATGCT      2460
     TCGAAACCGA TTGGCCGTCT TTGCGGAACC GGAAGAAGCA CTGCCGTATA ATACCAACAT      2520
     TGTTGCCACA ATACGTACTG AGGACGACCA ACCCATTTAC TCAAAACTCT ATCCGTACCC      2580
     CATGGGCGTA TCGGATTTTG TGAATAAGGA GACACATGCT TTGTTAAAGG ACGGAATTAT      2640
     CAGGCCCTCG TCGTCACCTT ACAACAATCC GGTTTGGGTA GTCGATAAAA AAGGTACAGA      2700
     TGAAGAGGGA AATACTAAGA AAAGGTTGGT TATAGATTTT AGAAAACTAA ATTTAAAAAC      2760
     AATCGACGAC AAGTACCCTA TACCAAACGT AGTATGGATC TTGTCAAATT TGGGAAAAGC      2820
     CAGATTCTTT ACAACCCTTG ACCTTAAATC GGCGTTTCAC CAAATTCTGC TCGCAGAAAA      2880
     GGATAGAGCG AAAACTGCCT TTTCAGTAGG AAATGGAAAA TACGAGTTTT GCCGTTTGCC      2940
     GTTTGGCTTG AAAAATGCCC CAAGTATTTT TCAACGTGCT ATTGATGATG TTGTTAGGGA      3000
     CCGTATAGGA AAGTCATGTT ACGTTTACGT TGACGACGTA ATAATATTTT CAAACGGAAT      3060
     TGAGGACCAC GTAAACGACG TTGCTTGGGT ACTAGACAGA CTGTCTGGGG CAAACATGAG      3120
     GGTTTCTAAA GAGAAATCGT TTTTCTTCAA GGAAAGCGTC GAGTATCTCG GATTCATGGT      3180
     GTCAAGTGGA GGTATCACAA CCAGTCCTAG CAAAGTAGAG GCTATTCAGA AATATAATCA      3240
     ACCTACTAAT CTGTTTAGTG TTCGATCGTT TTTAGGGCTA GCAAGTTATT ACCGCTGCTT      3300
     TATTAAGGAC TTCGCCTCTA TTGCTAGACC ACTCACTGAC ATTCTGAAGG GTGAAAACGG      3360
     AAAGGTTTCC GCAAGCCAGT CTAAAAAGAT ACCAATTTCT TTCGATGAAA GACAATGTTC      3420
     TGCTTTTGAG AAGCTTAAAA ATGTTCTTGT CTCCGAAAAT GTAATGTTAT TGTATCCCGA      3480
     TTATAGAAAA GCCTTTGACT TAACAACAGA CGCTTCGGCT TTTGGCCTGG GGGCAGTCTT      3540
     ATCACAGGAT GGCAAGCCTG TTACAATGAT TTCGAGAACT TTACAGGATA GAGAACTTAA      3600
     TTTCGCAACA AATGAACGAG AACTTTTGGC CATCGTTTGG GCTTTAAAGT CTCTTAGGAA      3660
     CTATCTATAT GGTGTCAAAA ACTTAAACAT TTTTACAGAT CACCAGCCGT TAACATACGC      3720
     CGTGTCAGAT AGGAATCCAA ATGCAAAAAT CAAGAGATGG AAGGCGTTTA TAGACGAACA      3780
     TAATGCTAAA ATTTTCTATA AACCTGGCAA GGAGACCTAT GTTGCCGATG CACTATCCAG      3840
     GCAGGCTATT CATGTCCTAG AGGACGAACC CCAGTCAGAC ATTGCAACAA TACATAGCGA      3900
     AATTTCATTG ACTTTTACAA TCGAAACTAT CGACAAGCCG GTTAACTGTT TTAGAAACCA      3960
     AATTGTGATA GATGAGGGCA CCGCAGACTC AACTCGAACT TTTGTTATTT TCGGAAGCAA      4020
     GACAAGGCAT CTAATACAGT TTCTAGACAA AGAGACCTTA ATCGGAAGAA TTCGTGATGT      4080
     GGTTAAGCCG GATGTAGTGA ATGCGATACA CTGCGAATTA CCTGTACTAG CTTTCATTCA      4140
     AAACAGTCTT GTAAATGACT TTCCAGCAAC AACCTTCCGA CACACTATGA AAATGGTCAG      4200
     CGACATTTTT AATCAAACTG AGCAACGGGA AATAGTGTCT TTGGAGCACA ACAGAGCGCA      4260
     TAGGGCAGCA CAGGAGAATG TAAAACAAAT TCTTCAATAC TACTTTTTCC CTAAAATGTC      4320
     ACAAATAGCC GCTACCTTTG TTTCTAACTG CTTGGTTTGT CAAAAAGCCA AATACGACCG      4380
     CCATCCGCAA AAGCAAATCC TCGGGAGAAC ACCTATTCCG TCACATGTAG GCGAGACATT      4440
     GCATATTGAT ATATTTTCTA CGGGCAGGAA TTACTTTTTG ACATGTATTG ACAAATTTTC      4500
     CAAATTCGCT ATTGTGCAAC CAATCGGCTC TCGAACGATA ACTGATTTAG AACCTGCAAT      4560
     TATGCAACTA ATGAACTTTT TTCCCCATTC AAAGACAATA TTTTGTGACA ATGAACCGTC      4620
     CATAAATTCC GAGTCAATCA AGTCACTTTT GAAAAATCGT TTTAATGTTG ACATAGCGAA      4680
     CGCACCTCCA CTTCATAGTA CCTCAAACGG ACAGGTTGAA AGGTTTCACA GCACGCTTTT      4740
     AGAAATAGCT CGATGCCTGA AACTTGACAG TGGAATGAAT GATACAGTCA ACCTTATTCT      4800
     TCAGGCAACA ATAGAATACA ATAAGACGGT GCACTCAGTC ACCAATAGAA GACCGATCGA      4860
     CATTATTCAT TCAACTCCTC CCGAATTGGC TAACGAGATA GTAGAAATGG TTAACGAAGC      4920
     TCAGGAAAAA CAGCTAAGAA GAGAAAATGT AACAAGACGA GACAGAACCT TTGAGGTGGG      4980
     AGAAACCGTC ATGGTAAAAC AAAACAATCG CTTGGGAAAT AAACTAACCC CACGGTATAG      5040
     GGAAGAACTA ATCGAAGCAG ACCTCGGGAC AACGGTCCTC ATAAAAGGGA GGGTCGTTCA      5100
     TAAAGATAAT CTACGCTAGG TTTAGTATTT CTTTTCCTTT TGTGACCATC GCCAAGTTAG      5160
     CAAAATACAA ACGTGAAATC TGAACACTAG TAAAAGAGTT TGCAAACATT TTTCAATTAA      5220
     ATATTTGTCA AATCCTTCTT ATTTAATCTT TAAACATTTT GTATTATTTC CGCTTCATCC      5280
     TCTTTAGAAA ATTTTAAAGG TATGTGATGA AATGCTAGAC CCGAATGATT TGAAAACTTA      5340
     AAGTCCACGC AACCACAAAT ATTTCCTGAA ACTACCATAG AAAATAAATG CATTACCAAA      5400
     ACGGCATAAT AACAGTATAG CGCACTCACT CTAATTAGAT TTCAAATTCC CGATTAAAAA      5460
     AAAAATAAAA CACTAATGTT ATCAATACCC TTTCCTGATT CTGTTCAACT AAAATAGGAA      5520
     AATCAATACT TGCAATCAAT AAGCGTTTTA CTACATACTT TAATATCAAA ATATCTGAAT      5580
     GAACTTTATT ATAAAATTAT AATTGTTATA CTTAATTATT GTCAAAACTT TAGTATTAAA      5640
     ACTGTAACTA CCTCTTAAGT AGATGAGAAG AGTAGAAGAG GGAATTAAGA TCTATCAACG      5700
     TAGTATCTGC TAAAGACGTA AAGATGCGGC AACTATTTCT GCGCCTGGGT ACTGAAACGA      5760
     CGAACTGAAT AATATCTGCC ATCAGACGCC AACCAGAGTG CGTTCAACAC ATACGTTTTG      5820
     ATGGTCAACT AGTTCAACCA ACATCAGCAT CATCGTCGTC AACAAGTCGA CGGTTACAAT      5880
     AAAGATTTTT TCCAAGTTCG CTACGATCAT CTCCAGAACC TTGTTGCGAA CCCATGACAT      5940
     GGAGAATCAG CAGCATTTAC GAACTTCTCG GATCATCCAG ACACGCAGAG CTGCCTTCCC      6000
     TTCGATGGTT TAACGCAGTA CCAGGTTGGC AGTATGGGAA CTTAGTGCAC AACCAATGTT      6060
     ACCCGTAAGA TCCGCTTTCA AATAGATTTG CCAATTGTAA AAAGTCTGTG GACAGCCTTC      6120
     GTCTTAGAAG GGGAGGAGTT AACACAATCA CAAAACACCC GAAATATAGT CGTAAGCCTC      6180
     AAGTGCTTTT CCCATCTATA GATCGAGCTT TACCTATAAG AAACTGTAAC TTGTTAAGCT      6240
     TTAGAGATAA GAACTCTTGC TATACTTAAG TCAGTCGATT TTGGAAGATT AGAAGCGTCG      6300
     GTCATCGCCA CGTACTTACT ATTCGTCTCA TTAAGTGCAG ACCGCGCAAG CCTATTGTAA      6360
     TTAATAAACT TACGCTAATA AATATATGGA AAATCTACTA AAATGATAAT T               6411
//
ID   DMCOPIA    standard; DNA; INV; 5143 BP.
XX
AC   X02599;
XX
DR   FLYBASE; FBte0000023; Dmel\copia.
XX
FT   source          X02599:21..5163
FT   SO_feature      five_prime_LTR ; SO:0000425:1..276
FT   SO_feature      three_prime_LTR ; SO:0000426:4867..5143
FT   SO_feature      polyA_signal_sequence ; SO:0000551:1990..1999
FT   SO_feature      polyA_signal_sequence ; SO:0000551:5063..5073
FT   SO_feature      primer_binding_site ; SO:0005850:277..291
FT                   /bound_moiety="tRNA:M-i-RB"
FT   SO_feature      CDS ; SO:0000316:432..4661
FT                   /name="Dmel\copia\GIP"
FT                   /db_xref="FLYBASE:FBgn0013437"
FT                   /db_xref="SWISS-PROT:P04146"
FT                   /db_xref="NCBI_PROTEIN:CAA26444.1"
FT                   /translation="MDKAKRNIKPFDGEKYAIWKFRIRALLAEQDVLKVVDGLMPNEVD
FT                   DSWKKAERCAKSTIIEYLSDSFLNFATSDITARQILENLDAVYERKSLASQLALRKRLL
FT                   SLKLSSEMSLLSHFHIFDELISELLAAGAKIEEMDKISHLLITLPSCYDGIITAIETLS
FT                   EENLTLAFVKNRLLDQEIKIKNDHNDTSKKVMNAIVHNNNNTYKNNLFKNRVTKPKKIF
FT                   KGNSKYKVKCHHCGREGHIKKDCFHYKRILNNKNKENEKQVQTATSHGIAFMVKEVNNT
FT                   SVMDNCGFVLDSGASDHLINDESLYTDSVEVVPPLKIAVAKQGEFIYATKRGIVRLRND
FT                   HEITLEDVLFCKEAAGNLMSVKRLQEAGMSIEFDKSGVTISKNGLMVVKNSGMLNNVPV
FT                   INFQAYSINAKHKNNFRLWHERFGHISDGKLLEIKRKNMFSDQSLLNNLELSCEICEPC
FT                   LNGKQARLPFKQLKDKTHIKRPLFVVHSDVCGPITPVTLDDKNYFVIFVDQFTHYCVTY
FT                   LIKYKSDVFSMFQDFVAKSEAHFNLKVVYLYIDNGREYLSNEMRQFCVKKGISYHLTVP
FT                   HTPQLNGVSERMIRTITEKARTMVSGAKLDKSFWGEAVLTATYLINRIPSRALVDSSKT
FT                   PYEMWHNKKPYLKHLRVFGATVYVHIKNKQGKFDDKSFKSIFVGYEPNGFKLWDAVNEK
FT                   FIVARDVVVDETNMVNSRAVKFETVFLKDSKESENKNFPNDSRKIIQTEFPNESKECDN
FT                   IQFLKDSKESENKNFPNDSRKIIQTEFPNESKECDNIQFLKDSKESNKYFLNESKKRKR
FT                   DDHLNESKGSGNPNESRESETAEHLKEIGIDNPTKNDGIEIINRRSERLKTKPQISYNE
FT                   EDNSLNKVVLNAHTIFNDVPNSFDEIQYRDDKSSWEEAINTELNAHKINNTWTITKRPE
FT                   NKNIVDSRWVFSVKYNELGNPIRYKARLVARGFTQKYQIDYEETFAPVARISSFRFILS
FT                   LVIQYNLKVHQMDVKTAFLNGTLKEEIYMRLPQGISCNSDNVCKLNKAIYGLKQAARCW
FT                   FEVFEQALKECEFVNSSVDRCIYILDKGNINENIYVLLYVDDVVIATGDMTRMNNFKRY
FT                   LMEKFRMTDLNEIKHFIGIRIEMQEDKIYLSQSAYVKKILSKFNMENCNAVSTPLPSKI
FT                   NYELLNSDEDCNTPCRSLIGCLMYIMLCTRPDLTTAVNILSRYSSKNNSELWQNLKRVL
FT                   RYLKGTIDMKLIFKKNLAFENKIIGYVDSDWAGSEIDRKSTTGYLFKMFDFNLICWNTK
FT                   RQNSVAASSTEAEYMALFEAVREALWLKFLLTSINIKLENPIKIYEDNQGCISIANNPS
FT                   CHKRAKHIDIKYHFAREQVQNNVICLEYIPTENQLADIFTKPLPAARFVELRDKLGLLQ
FT                   DDQSNAE"
FT   SO_feature      CDS ; SO:0000316:join(432..1605,4555..4661)
FT                   /name="Dmel\copia\GIP-RB"
FT                   /db_xref="FLYBASE:FBgnXXXXXXX"
FT                   /db_xref="SWISS-PROT:P04146"
FT                   /db_xref="NCBI_PROTEIN:CAA26445.1"
FT                   /translation="MDKAKRNIKPFDGEKYAIWKFRIRALLAEQDVLKVVDGLMPNEVD
FT                   DSWKKAERCAKSTIIEYLSDSFLNFATSDITARQILENLDAVYERKSLASQLALRKRLL
FT                   SLKLSSEMSLLSHFHIFDELISELLAAGAKIEEMDKISHLLITLPSCYDGIITAIETLS
FT                   EENLTLAFVKNRLLDQEIKIKNDHNDTSKKVMNAIVHNNNNTYKNNLFKNRVTKPKKIF
FT                   KGNSKYKVKCHHCGREGHIKKDCFHYKRILNNKNKENEKQVQTATSHGIAFMVKEVNNT
FT                   SVMDNCGFVLDSGASDHLINDESLYTDSVEVVPPLKIAVAKQGEFIYATKRGIVRLRND
FT                   HEITLEDVLFCKEAAGNLMSVKRLQEAGMSIEFDKSGVTISKNGLMVVKNSENQLADIF
FT                   TKPLPAARFVELRDKLGLLQDDQSNAE"
XX
CC   Derived from X02599 (g7740) (Rel. 49, Last updated, Version 4).
CC   Takis Benos and Michael Ashburner, 20-Aug-1997.
CC   Any changes to original sequence record are annotated in an FT line.
XX
SQ   Sequence 5143 BP;  1874 A; 727 C; 971 G; 1571 T; 0 other;
     TGTTGGAATA TACTATTCAA CCTACAAAAA TAACGTTAAA CAACACTACT TTATATTTGA        60
     TATGAATGGC CACACCTTTT ATGCCATAAA ACATATTGTA AGAGAATACC ACTCTTTTTA       120
     TTCCTTCTTT CCTTCTTGTA CGTTTTTTGC TGTGAGTAGG TCGTGGTGCT GGTGTTGCAG       180
     TTGAAATAAC TTAAAATATA AATCATAAAA CTCAAACATA AACTTGACTA TTTATTTATT       240
     TATTAAGAAA GGAAATATAA ATTATAAATT ACAACAGGTT ATGGGCCCAG TCCATGCCTA       300
     ATAAACAATT AAATTGTGAA TTAAAGATTG TGAAAATAAA TTGTGAAATA GCATTTTTTC       360
     ACATTCTTGT GAAATAGCTT TTTTTTTCAC ATTCTTGTGA AATTATTTCC TTCTCAGAAT       420
     TTGAGTGAAA AATGGACAAG GCTAAACGTA ATATTAAGCC GTTTGATGGC GAGAAGTACG       480
     CGATTTGGAA ATTTAGAATT AGGGCTCTTT TAGCCGAGCA AGATGTGCTT AAAGTAGTTG       540
     ATGGTTTAAT GCCTAACGAG GTAGATGACT CCTGGAAAAA GGCAGAGCGT TGTGCAAAAA       600
     GTACAATAAT AGAGTACCTA AGCGACTCGT TTTTAAATTT CGCAACAAGC GACATTACGG       660
     CGCGTCAGAT TCTTGAGAAT TTGGACGCCG TTTATGAACG AAAAAGTTTG GCGTCGCAAC       720
     TGGCGCTGCG AAAACGTTTG CTTTCTCTGA AGCTATCGAG TGAGATGTCA CTATTAAGCC       780
     ATTTTCATAT TTTTGACGAA CTTATAAGTG AATTGTTGGC AGCTGGTGCA AAAATAGAAG       840
     AGATGGATAA AATTTCTCAT CTACTGATCA CATTGCCTTC GTGTTACGAT GGAATTATTA       900
     CAGCGATAGA GACATTATCT GAAGAAAATT TGACATTGGC GTTTGTGAAA AATAGATTGC       960
     TGGATCAAGA AATTAAAATT AAAAATGACC ACAACGATAC AAGCAAGAAA GTTATGAACG      1020
     CGATCGTGCA CAACAATAAT AACACTTATA AAAATAATTT GTTTAAAAAT CGGGTAACTA      1080
     AACCAAAGAA AATATTCAAG GGAAATTCAA AGTATAAAGT CAAGTGTCAC CACTGTGGCA      1140
     GAGAAGGCCA CATTAAAAAA GATTGTTTCC ATTATAAAAG AATATTAAAT AATAAAAATA      1200
     AAGAAAATGA AAAACAAGTT CAAACTGCAA CATCACACGG CATTGCGTTT ATGGTAAAAG      1260
     AAGTGAATAA TACTTCAGTG ATGGACAACT GCGGGTTTGT CCTTGATTCT GGTGCTAGTG      1320
     ACCATCTTAT AAATGATGAG TCGCTGTATA CCGACAGTGT GGAGGTTGTG CCTCCACTTA      1380
     AGATTGCAGT GGCCAAGCAA GGCGAATTTA TTTATGCCAC TAAGCGTGGT ATTGTCCGAC      1440
     TACGGAATGA CCATGAGATT ACACTGGAGG ATGTACTCTT TTGTAAGGAA GCTGCTGGTA      1500
     ATTTGATGTC CGTAAAGCGT CTCCAAGAGG CAGGAATGTC GATCGAATTT GACAAAAGCG      1560
     GTGTAACCAT TTCGAAAAAT GGGTTAATGG TTGTCAAAAA TTCAGGTATG TTAAACAATG      1620
     TACCTGTGAT CAATTTTCAA GCATATTCTA TAAATGCTAA GCATAAAAAT AATTTTCGTT      1680
     TATGGCATGA GAGGTTTGGC CATATAAGCG ATGGCAAATT ATTAGAAATA AAACGAAAGA      1740
     ATATGTTTAG TGATCAAAGT CTTCTAAACA ACTTAGAGTT ATCATGTGAA ATTTGTGAAC      1800
     CCTGTTTAAA TGGTAAACAG GCAAGACTTC CTTTTAAACA ATTGAAAGAT AAGACCCATA      1860
     TTAAAAGACC ACTTTTTGTA GTACACTCAG ATGTCTGTGG GCCTATTACT CCAGTTACTT      1920
     TAGATGATAA AAATTATTTT GTGATCTTTG TTGATCAGTT TACACATTAT TGTGTAACTT      1980
     ATTTAATTAA ATATAAATCT GATGTGTTTA GCATGTTTCA AGATTTTGTA GCCAAGAGTG      2040
     AAGCTCATTT TAATTTAAAG GTTGTGTACT TATACATTGA CAATGGTAGA GAATACTTGT      2100
     CAAATGAGAT GAGACAATTT TGTGTTAAGA AAGGAATTTC TTATCACTTA ACAGTGCCAC      2160
     ATACACCTCA GTTAAATGGT GTTTCTGAGA GAATGATAAG AACCATTACG GAAAAAGCTC      2220
     GAACCATGGT TAGTGGTGCA AAGCTAGATA AAAGCTTTTG GGGCGAAGCA GTATTAACTG      2280
     CTACTTATTT AATCAACAGA ATTCCTAGTA GAGCACTTGT TGATAGTTCA AAGACCCCAT      2340
     ATGAGATGTG GCACAATAAG AAGCCATACT TAAAACATTT GAGAGTGTTT GGTGCAACTG      2400
     TTTATGTGCA TATTAAAAAC AAACAAGGAA AGTTTGATGA TAAATCATTT AAAAGTATTT      2460
     TTGTGGGCTA TGAACCCAAT GGTTTTAAGT TGTGGGATGC TGTAAATGAA AAATTTATTG      2520
     TCGCAAGAGA TGTTGTTGTC GATGAAACCA ATATGGTTAA TTCTAGAGCT GTTAAATTTG      2580
     AAACAGTGTT CCTGAAAGAT AGTAAGGAAA GTGAAAATAA AAATTTTCCG AATGACAGTA      2640
     GGAAAATAAT ACAAACAGAA TTCCCGAATG AGAGTAAGGA ATGCGACAAC ATACAATTCC      2700
     TGAAAGATAG TAAGGAAAGT GAAAATAAAA ATTTTCCGAA TGACAGTAGG AAAATAATAC      2760
     AAACAGAATT CCCGAATGAG AGTAAGGAAT GCGACAACAT ACAATTCCTG AAAGATAGTA      2820
     AGGAAAGTAA TAAATATTTT CTGAATGAGA GTAAGAAAAG AAAGCGAGAT GATCACCTGA      2880
     ATGAAAGTAA GGGATCAGGC AACCCGAATG AGAGTAGGGA AAGTGAAACA GCAGAGCACT      2940
     TAAAAGAAAT TGGAATTGAT AATCCAACTA AAAATGATGG CATAGAAATT ATTAATAGAA      3000
     GAAGTGAGAG ATTAAAGACT AAGCCTCAGA TATCCTATAA TGAAGAGGAT AATAGTCTAA      3060
     ATAAAGTTGT TCTAAATGCT CACACTATAT TTAACGATGT CCCAAATTCA TTTGATGAAA      3120
     TTCAATATAG GGATGATAAA TCTTCTTGGG AAGAAGCCAT CAATACAGAG TTAAATGCTC      3180
     ATAAAATTAA TAATACTTGG ACAATTACAA AAAGGCCTGA AAACAAAAAT ATTGTAGATA      3240
     GCAGATGGGT ATTTTCTGTT AAATATAATG AACTTGGAAA TCCAATTAGA TACAAAGCTA      3300
     GATTGGTTGC ACGAGGATTC ACTCAAAAAT ACCAAATAGA CTATGAAGAG ACATTTGCTC      3360
     CTGTAGCTAG AATTTCAAGT TTCCGATTTA TATTGTCATT AGTAATACAG TATAACTTGA      3420
     AAGTCCATCA AATGGATGTA AAAACAGCTT TCTTAAATGG CACGTTAAAA GAGGAAATTT      3480
     ATATGAGACT TCCTCAAGGT ATATCGTGTA ATAGTGACAA TGTGTGTAAA TTGAATAAGG      3540
     CAATTTACGG ACTCAAGCAA GCGGCTAGAT GCTGGTTTGA AGTATTTGAG CAAGCATTGA      3600
     AAGAGTGTGA GTTTGTAAAC TCTTCAGTTG ATCGCTGTAT ATATATTTTA GACAAAGGTA      3660
     ACATCAATGA AAACATATAT GTATTATTAT ATGTAGATGA TGTGGTTATA GCTACAGGAG      3720
     ATATGACAAG AATGAATAAC TTCAAAAGGT ATTTAATGGA AAAGTTTAGG ATGACTGACC      3780
     TAAATGAAAT AAAACATTTT ATTGGAATTA GGATAGAGAT GCAGGAAGAT AAAATCTATT      3840
     TAAGCCAATC TGCATATGTT AAAAAAATTT TAAGTAAATT TAACATGGAA AATTGTAATG      3900
     CAGTTAGTAC TCCTTTACCT AGTAAAATAA ATTATGAATT ACTTAATTCA GATGAAGACT      3960
     GCAATACCCC ATGCCGTAGC CTCATAGGAT GTTTAATGTA CATAATGCTT TGTACACGCC      4020
     CAGATTTAAC TACTGCAGTA AATATCTTGA GCAGATATAG TAGCAAAAAT AACTCCGAAT      4080
     TATGGCAGAA CTTAAAAAGA GTTCTTAGAT ATTTGAAGGG CACTATCGAT ATGAAATTGA      4140
     TTTTTAAAAA GAACTTGGCA TTTGAAAATA AAATTATTGG TTATGTGGAT TCTGATTGGG      4200
     CTGGTAGTGA AATTGATAGA AAAAGTACAA CAGGGTATTT ATTCAAAATG TTTGATTTTA      4260
     ATCTCATTTG TTGGAATACA AAGAGACAGA ACTCAGTAGC AGCCTCATCA ACTGAAGCTG      4320
     AGTATATGGC CCTATTTGAA GCCGTGAGAG AAGCTCTATG GCTTAAATTT TTATTAACTA      4380
     GTATTAACAT TAAACTAGAA AACCCCATTA AAATTTACGA AGACAATCAA GGCTGTATTA      4440
     GCATAGCAAA CAACCCCTCA TGTCATAAAC GAGCTAAACA TATTGATATT AAATATCATT      4500
     TTGCCAGAGA GCAAGTTCAG AATAATGTGA TTTGTCTTGA GTATATTCCT ACAGAGAATC      4560
     AACTGGCTGA CATATTTACA AAACCGTTGC CTGCTGCGAG ATTTGTGGAG TTACGAGACA      4620
     AATTGGGTTT GCTGCAAGAC GACCAATCGA ATGCTGAATG AAATTTTTAT ATATATTTTT      4680
     CAAATTTAAA TTCCTGTAAA CATATTTTGT TACAATGATC TGATCGGGTT TTTCTGGGTT      4740
     TTCCCCGTAT CCTCGCAGCA AATGCTGGAT CAGTTAACAC TTCCCAGAAT GCACACCACC      4800
     CACATTTGAT AGTTACTAAT GAATATTATT GTTATGTTTT TAATTATAGA CGTTATTTTT      4860
     GAGGGGGCGT GTTGGAATAT ACTATTCAAC CTACAAAAAT AACGTTAAAC AACACTACTT      4920
     TATATTTGAT ATGAATGGCC ACACCTTTTA TGCCATAAAA CATATTGTAA GAGAATACCA      4980
     CTCTTTTTAT TCCTTCTTTC CTTCTTGTAC GTTTTTTGCT GTGAGTAGGT CGTGGTGCTG      5040
     GTGTTGCAGT TGAAATAACT TAAAATATAA ATCATAAAAC TCAAACATAA ACTTGACTAT      5100
     TTATTTATTA TTAAGAAAGG AAAATAAATT ATAAATTACA ACA                        5143
//
ID   DMW1DOC    standard; DNA; INV; 4725 BP.
XX
AC   X17551;
XX
DR   FLYBASE; FBte0000341; Dmel\Doc.
XX
FT   source          X17551:1..4725
FT   SO_feature      CDS ; SO:0000316:213..1910
FT                   /name="Dmel\Doc\gag"
FT                   /db_xref="FLYBASE:FBgn0024789"
FT                   /db_xref="SPTREMBL:Q04134"
FT                   /db_xref="NCBI_PROTEIN:CAA35586.1"
FT                   /translation="MNQNDIRSQRQCEQDERRLSLQRNNAYFSFVSPQIGDRAPSPSTN
FT                   SKLLPSANDRPRSCSPSLPASAHKSWSEETASPTPLLSQRQTTVPGNCNTAITSAVTSL
FT                   ATATTSTSSAAQLIIAVPAVNNSAALTVCNNNNARKEESKQKQKSISTVQTGMDRYIQI
FT                   KRKLSPQNNKAGNQPKINRTNNGNENSAVNNSNRYAILADSATEQPNEKTVGEPKKTRP
FT                   PPIFIREQSTNALVNKLVALIGDSKFHIIPLKKGNIHEIKLQIQTEADHRIVTKYLNDA
FT                   GKNYYTYQLKSCKGLQVVLKGIEATVTPAEIIEALKAKNFSAKTAINILNKDKVPQPLF
FT                   KIELEPELQALKKNEVHPIYNLQYLLHRRITVEEPHKRINPVQCTNCQEYGHTKAYCTL
FT                   KSVCVVCSEPHTTANCPKNKDDKSVKKCSNCGEKHTANYRGCVVYKELKSRLNKRIATA
FT                   HTYNKVNFYSPQPIFQPPLTVPSTTPTISFASALKSGLEVPAPPTRTAHSEHTPTNIQQ
FT                   TQQSGIEAMMLSLQQSMKDFMTFMQNTLQELMKNQNILIQLLVSSKSP"
FT   SO_feature      CDS ; SO:0000316:1910..4576
FT                   /name="Dmel\Doc\RTase"
FT                   /db_xref="FLYBASE:FBgn0024790"
FT                   /db_xref="SPTREMBL:Q04135"
FT                   /db_xref="NCBI_PROTEIN:CAA35587.1"
FT                   /translation="MASLRISLWNANGVSRHTQELTQFIYEKNIDVMLLSETHLTNKNN
FT                   FHIPGYLFYGTNHPDGKAHGGTGILIRNRIKHHHLNNFDKNYLQSTSIALQLNNGSTTL
FT                   AAVYCPPRFPISEDQFMEFFNTLGDRFIAAGDYNAKHTHWGSRLVSPKGKQLYNALTKP
FT                   ENKLDYVSPGKPTYWPADPRKIPDLIDFAITKHVPRNMVTAEALADLSSDHSPVFLNML
FT                   TRPHIVDPPYRLTNFRTNWPRYQKYVCSHIELTTALSTKEDIDKSTETLENILVSAAKA
FT                   STPPVTYAKPNYIKTNREIERLVLDKRRLRRDWQSNRSPITKHMLKIATRRLTNALKQE
FT                   EKNSQRSYIEQLSPTSTKYPLWRAHRNLKTPIAPIMPLRSPSGTWFRSDEERASAFADH
FT                   LQNVFRPNPSTNTFILPPLIAANLDPQEPFEFRPCELAKVIKEQLNPRKSPGYDLITPR
FT                   MLIELPKCAILHICLLFNAIAKLGYFPQKWKKSTIVMIPKPGKDKTQPSSYRPISLLTC
FT                   LSKLFEKMLLLRISPHLRINNTLPTHQFGFREKHGTIEQVNRITSEIRTAFEHREYCTA
FT                   IFLDVAQAFDRVWLDGLLFKIIKLLPQNTHKLLKSYLYNRVFAIRCDTSTSRDCAIEAG
FT                   VPQGSVLGPILYTLYTADFPIDYNLTTSTFADDTAILSRSKCPIKATALLSRHLTSVER
FT                   WLADWRISINVQKCKQVTFTLNKQTCPPLVLNNICIPQADEVTYLGVHLDRRLTWRKHI
FT                   EAKSKHLKLKARNLHWLINARSPLSLEFKALLYNSVLKPIWTYGSELWGNASRSNIDII
FT                   QRAQSRILRIITGAPWYLRNENIHRDLKIKLVIEVIAEKKTKYNEKLTTHTNPLARKLI
FT                   RVCSQSRLHRNDLPAQQ"
XX
CC   Derived from X17551 (g8821) (Rel. 29, Last updated, Version 2).
CC   Takis Benos and Michael Ashburner, 20-Aug-1997.
CC   Any changes to original sequence record are annotated in an FT line.
XX
SQ   Sequence 4725 BP;  1647 A; 1192 C; 822 G; 1064 T; 0 other;
     GACATTCGGC ATTCCACAGT CTTCGGGTGG AGACGTGTTT CTTTCAAGCT ACGAATAGCA        60
     AGTTCTAAAA ACTACAACAG TATAGTGAAA GTTAAACACA AAGTGTAAAG TGCAGTTTGC       120
     ACAACTAACA ATTATTGACT ATAGTAATTA TTTACTAAAA TAAATAATTA TTCCATATTG       180
     TTCTGGTAAT TGTTATATGT GGACTTAGAA CAATGAATCA AAACGACATA CGTTCTCAGC       240
     GACAATGTGA ACAAGACGAG CGCCGGCTCT CTTTACAACG CAACAATGCA TACTTTTCTT       300
     TCGTCTCACC GCAAATCGGT GATCGAGCAC CCTCACCTTC AACTAACTCG AAACTTTTGC       360
     CCTCAGCGAA CGACAGACCG CGTTCTTGCT CTCCCTCTCT GCCTGCTTCG GCTCACAAGT       420
     CGTGGAGCGA AGAGACCGCC TCTCCTACCC CGCTCCTCTC GCAGCGCCAA ACGACCGTCC       480
     CGGGTAACTG TAACACTGCA ATAACGAGTG CAGTGACCTC ACTGGCAACT GCCACAACAT       540
     CAACTTCGTC AGCGGCCCAA CTAATTATCG CTGTGCCAGC TGTAAATAAT TCAGCAGCAC       600
     TGACCGTTTG CAACAACAAT AATGCACGTA AAGAAGAATC AAAACAAAAG CAGAAGTCGA       660
     TTTCGACTGT GCAGACTGGC ATGGATCGCT ACATCCAAAT CAAGAGAAAG CTCAGCCCTC       720
     AAAACAATAA GGCAGGTAAT CAACCCAAAA TCAATCGAAC CAACAACGGC AATGAAAACT       780
     CTGCAGTAAA TAATTCAAAC CGATATGCTA TCTTGGCTGA TTCTGCGACC GAACAACCCA       840
     ACGAAAAAAC GGTAGGGGAA CCAAAAAAGA CCAGGCCTCC ACCAATTTTC ATACGAGAAC       900
     AAAGTACAAA TGCACTTGTA AATAAACTCG TTGCTTTGAT TGGTGACAGC AAGTTCCACA       960
     TTATCCCACT TAAAAAAGGA AATATTCATG AAATAAAACT ACAGATCCAA ACAGAAGCAG      1020
     ACCACCGTAT AGTGACTAAA TACCTAAATG ATGCTGGTAA AAACTACTAC ACATACCAAT      1080
     TAAAAAGTTG CAAAGGGCTA CAGGTAGTAC TTAAGGGCAT TGAAGCAACA GTGACACCAG      1140
     CTGAGATAAT TGAGGCTCTG AAGGCCAAAA ACTTTTCTGC AAAGACAGCT ATTAATATTT      1200
     TAAACAAAGA CAAAGTTCCG CAGCCACTAT TCAAAATAGA ACTCGAACCA GAGCTCCAGG      1260
     CACTAAAGAA AAACGAAGTG CACCCAATAT ACAATTTACA GTACTTGCTA CATCGGAGGA      1320
     TCACCGTGGA GGAGCCGCAC AAACGTATCA ATCCAGTTCA ATGTACTAAT TGCCAAGAAT      1380
     ACGGCCACAC CAAGGCATAC TGCACCCTTA AGTCCGTATG TGTTGTCTGT AGCGAACCTC      1440
     ATACTACCGC AAACTGCCCC AAAAACAAGG ACGATAAGTC TGTGAAGAAA TGCAGTAACT      1500
     GCGGGGAAAA ACATACTGCA AACTACAGAG GCTGTGTGGT GTACAAAGAA TTGAAGAGCC      1560
     GCCTAAACAA ACGTATTGCC ACAGCACATA CATACAACAA AGTCAATTTC TACTCTCCGC      1620
     AACCGATTTT TCAACCACCC CTAACTGTCC CAAGCACTAC TCCAACAATT TCTTTCGCTA      1680
     GCGCCCTAAA ATCCGGACTA GAAGTGCCCG CCCCACCGAC AAGAACTGCT CATTCCGAAC      1740
     ATACACCGAC AAACATCCAA CAAACACAAC AAAGTGGCAT CGAAGCTATG ATGCTATCCC      1800
     TACAGCAAAG CATGAAAGAC TTCATGACGT TCATGCAAAA TACTTTGCAA GAGCTCATGA      1860
     AAAACCAAAA TATCCTGATT CAACTTCTTG TATCTTCAAA ATCCCCATAA TGGCTTCCCT      1920
     ACGGATATCT CTGTGGAACG CAAATGGCGT TTCACGGCAT ACACAAGAGC TCACACAGTT      1980
     CATTTACGAA AAAAACATCG ACGTAATGCT ACTATCAGAA ACGCACCTCA CAAATAAAAA      2040
     CAATTTTCAT ATACCAGGAT ACTTGTTCTA TGGTACAAAT CATCCAGATG GTAAAGCTCA      2100
     TGGAGGCACT GGAATACTCA TCAGAAATCG CATAAAACAC CACCACTTAA ACAATTTTGA      2160
     CAAAAACTAC TTACAATCTA CGTCCATAGC CTTACAACTC AACAATGGTT CAACGACTCT      2220
     AGCCGCAGTC TACTGCCCAC CGCGCTTTCC AATCTCTGAG GATCAATTCA TGGAATTCTT      2280
     TAACACACTA GGTGACAGGT TCATCGCAGC GGGTGACTAT AACGCCAAGC ACACCCATTG      2340
     GGGATCTCGA CTTGTGTCGC CAAAGGGTAA GCAATTGTAC AATGCGCTTA CGAAGCCAGA      2400
     AAACAAGCTA GACTATGTAT CCCCGGGTAA GCCTACATAC TGGCCAGCAG ACCCAAGAAA      2460
     AATCCCAGAC CTGATCGATT TTGCAATTAC TAAACATGTC CCCCGCAACA TGGTCACCGC      2520
     CGAAGCACTA GCAGATTTAT CATCAGATCA CTCACCTGTT TTTCTAAATA TGCTAACTCG      2580
     CCCCCACATC GTCGACCCAC CGTATAGACT CACAAATTTT AGAACAAACT GGCCAAGGTA      2640
     TCAAAAGTAT GTCTGTTCAC ACATAGAACT AACGACGGCA TTATCTACAA AGGAGGATAT      2700
     AGACAAGTCA ACGGAAACTC TTGAAAACAT TTTAGTTTCG GCTGCAAAGG CTTCAACCCC      2760
     GCCAGTGACG TATGCAAAAC CAAACTACAT CAAAACTAAT CGCGAAATCG AGCGGCTGGT      2820
     ATTAGATAAA CGACGCCTAC GAAGGGATTG GCAGTCTAAT AGATCACCAA TTACTAAGCA      2880
     CATGCTTAAG ATAGCCACAC GCAGGCTTAC CAATGCTCTC AAACAAGAGG AAAAAAACAG      2940
     CCAACGTTCA TATATCGAGC AACTCTCTCC CACCAGCACT AAGTACCCTC TTTGGAGAGC      3000
     TCACAGAAAC CTAAAGACTC CAATAGCGCC AATTATGCCA CTCCGAAGTC CCTCTGGCAC      3060
     CTGGTTTCGA AGTGATGAAG AAAGAGCCAG TGCTTTCGCT GACCATTTAC AAAATGTATT      3120
     CCGACCAAAT CCCTCTACCA ACACATTTAT TCTCCCTCCT TTAATAGCAG CCAATCTAGA      3180
     TCCTCAAGAA CCCTTTGAAT TCCGACCATG TGAACTAGCA AAGGTTATCA AAGAGCAACT      3240
     GAACCCAAGA AAATCGCCTG GCTACGACCT AATAACTCCA AGAATGCTCA TTGAACTCCC      3300
     AAAGTGTGCT ATTCTTCACA TCTGCCTGTT GTTCAACGCA ATCGCCAAGC TTGGATACTT      3360
     CCCTCAAAAA TGGAAAAAGT CGACCATAGT AATGATTCCA AAGCCAGGAA AAGATAAAAC      3420
     GCAGCCATCA TCATATAGAC CGATAAGCTT ACTAACATGT CTTTCAAAGC TGTTTGAAAA      3480
     AATGCTACTC CTTCGGATTA GCCCTCATCT TAGAATAAAC AACACACTTC CAACACATCA      3540
     ATTTGGCTTT AGAGAAAAAC ATGGAACCAT CGAACAGGTC AACCGAATCA CGTCAGAAAT      3600
     TCGTACTGCT TTTGAACATC GAGAATACTG CACAGCCATT TTTCTAGACG TCGCGCAGGC      3660
     ATTTGACAGA GTGTGGCTCG ATGGACTTTT GTTTAAAATA ATCAAGCTGT TGCCCCAAAA      3720
     CACACATAAG CTACTGAAGT CATACCTATA TAACAGAGTG TTTGCAATAA GATGCGATAC      3780
     AAGCACTTCA CGCGATTGCG CAATCGAAGC TGGAGTGCCG CAAGGCAGTG TACTGGGTCC      3840
     AATCTTATAC ACCCTGTATA CGGCGGATTT CCCCATAGAC TACAATCTAA CAACCTCCAC      3900
     GTTCGCTGAT GATACCGCGA TACTCAGTCG CTCGAAATGC CCAATAAAAG CCACGGCACT      3960
     CCTATCCCGA CACTTAACAT CTGTAGAACG ATGGCTTGCC GACTGGAGAA TTTCAATAAA      4020
     TGTTCAAAAA TGCAAGCAGG TTACCTTTAC CTTAAACAAA CAAACATGCC CACCACTGGT      4080
     CTTGAATAAC ATATGCATTC CACAAGCCGA CGAGGTAACA TATCTGGGAG TTCATCTGGA      4140
     CAGGCGGCTC ACTTGGCGCA AACATATAGA AGCCAAATCG AAACATCTTA AACTTAAAGC      4200
     AAGGAACCTC CACTGGCTCA TAAATGCTCG CTCTCCACTT AGTCTGGAGT TCAAAGCTCT      4260
     TCTATACAAC TCCGTCTTAA AACCTATCTG GACTTATGGC TCCGAGCTGT GGGGCAACGC      4320
     ATCCAGAAGT AACATAGACA TTATTCAGCG AGCACAGTCA AGAATTCTGA GAATTATCAC      4380
     TGGAGCGCCG TGGTACCTTC GAAACGAAAA CATACACAGA GACCTAAAAA TCAAATTAGT      4440
     AATCGAAGTA ATAGCTGAGA AAAAAACGAA GTATAACGAA AAGCTGACCA CCCATACAAA      4500
     TCCCCTCGCA AGAAAACTAA TCCGAGTATG CAGTCAAAGC CGGCTGCACC GCAACGACCT      4560
     CCCAGCCCAG CAATAAACTT ATTAGGGCAT TAATGAAAAA AAAAAACTAT CACTAAGTGA      4620
     AAGTTAATTA AGTTAGATTA AGATTTGAAC ACTTATTGTT AGTCTCTTAA CACAAAGGGA      4680
     AGATTCAATA AATAATAAAA ATTAAAAAAA AAAAAAAAAA AAAAA                      4725
//
ID   F     standard; DNA; INV; 4708 BP.
XX
AC   AC005198;
XX
DR   FLYBASE; FBte0000005; Dmel\F-element.
XX
SY   synonym: Jiminy
XX
FT   source          AC005198:38639..43358
FT   SO_feature      CDS ; SO:0000316:192..1880
FT                   /name="Dmel\F-element\gag-r"
FT                   /db_xref="FLYBASE:FBgn0041632"
FT                   /db_xref="TREMBL:P91787"
FT                   /translation="MSQNDTRAQRQREHDERRLSIQRNNAYFSYVSPTIPNADIERSI
FT                   THSPGNLLLPTNQERARSCSPALLAPTEAPLPPTTTAGEGPAARSASSSAAPAHGLTK
FT                   SAKAKPLAINGTAALPAKQNENVNKKAGSTWQTGMDRYITIKRKLSPENSDLGNKPKN
FT                   TRDNSTLIKNVAPANTNRFALLVDTAEDVPLGSVDIEPKKTKPPPIYIREKSTSRLVN
FT                   TLIGLIGKDSFHIIPLVRGTINEIKLQTKTEDDYRKVTNYFTAQKIGFYTYQLKSSKG
FT                   LQVVLKGIESDVTPEEITEALKEKGFYAKNVFNIKNRNRQPQPLFKIELEPENKPPRK
FT                   NEVHPIYKLQLLLHRRITVEEPHKRNAPVQCTNCQEYGHTRSYCTLRPVCVVCGDLHD
FT                   SKQCQINKENACEKKCNNCGGNHTANYRGCPIYKELKIRLHKRMNTARAHQGSATLIP
FT                   SETNPEVIFSKAASFAPWPTFNTNKTTFANVLKSGMTPPTQNSRTPHEVHTKLDTQQN
FT                   YHPAAQQETKTEAMMQALQQSMMEFMTFMKTTIQDMMRNQNLLIQMLVAQQSNK"
FT   SO_feature      CDS ; SO:0000316:1880..4561
FT                   /name="Dmel\F-element\RTase"
FT                   /db_xref="FLYBASE:FBgn0041633"
FT                   /db_xref="TREMBL:Q24335"
FT                   /translation="MATLRIATWNANGVSQRKLELAQFLHEKHIDVMLLSETHLTSKY
FT                   NFQIRDYHFYGTNHPDGKAHGGTAILIRNRMKHHFYKEFAENHLQATSINIQLDDNTL
FT                   LTLAAVYCPPRFTVLEAQFLDFFQALGPHFIAAGDYNAKHTHWGSRLVNPKGKQLYKT
FT                   IIKATNKLDHVSPGSPTYWPSDLNKLPDLIDFAVTKNISRSLVKAECLPDLSSDHSPV
FT                   LIHLRRYAENVKPPTRLTSSKTNWLRYKKYISSHIELSPKLNTESDIESCTCALQSIL
FT                   TAAALTATPKITNNTINSKKTNVQIEQLVHVKRRLRREWQSSRSPTAKQKLKVATRKL
FT                   ANALKQEEDDDQRRYIEQLTPTGTKQKSLWRAHSTLRPPTETVLPIKNSSGGWARSDE
FT                   DRANTFAAHLQNVFTPNQATSTFALPSYPVNRHQQHTPIVFRPKEITKIIKDNLSPKK
FT                   SPGYDLITPEMIIQLPHSAVRYITKLFNAITKLGYFPQRWKMMKIIMIPKPGKNHTVA
FT                   SSYRPISLLSCISKLFEKCLLIRLNQHQTYHNIIPAHQFGFRESHGTIEQVNRITTEI
FT                   RTAFEYREYCTAVFLDVSQAFDKVWLDGLMFKIKISLPESTHKLLKSYLYDRKFAVRC
FT                   NTATSTVHTIEAGVPQGSVLGPTLYLIYTADIPTNSRLTVSTFADDTAILSRSRSPIQ
FT                   ATAQLALYLIDIKKWLSDWRIKVNEQKCKHVTFTLNRQDCPPLLLNSIPLPKADEVTY
FT                   LGVHLDRRLTWRRHIEAKKTQLKLKANNLHWLINSGSPLSLDHKVLLYNSILKPIWTY
FT                   GSQLWGNASNSNIDIIQRAQSKILRTITGAPWYVRSENIQRDLNIPSVTNAITELKEK
FT                   YL"
XX
CC   K. O'Hare, Personal communication to FlyBase, 1 May 2000.
CC   CDS2 translation from M17214; AC005198 has a 1-bp deletion.
XX
SQ   Sequence 4708 BP;  1618 A; 1242 C; 857 G; 991 T; 0 other;
     AATCAATTAA TCAATTCGAT CGCCGACGTG TGAAGACGTT TTTATCGTGC TCCGCACAAA        60
     ATCGGTTGTT TTGAGTGAAG TGAACGCCAA ATAAAATAAA CTAAATAAAA AATCTGAAAG       120
     CGAAAGAGAC GCTCTATGCG ATGCAAGATC GCTTAAATAC ATAGTGAATT GTTATCTTAA       180
     ATAATAAAAC TATGAGTCAG AATGACACTC GCGCCCAGCG TCAGCGCGAG CATGACGAAC       240
     GCCGACTCTC AATTCAGCGC AACAACGCGT ACTTCTCCTA CGTCTCACCG ACAATCCCAA       300
     ACGCAGACAT CGAGCGGTCA ATAACCCATA GCCCAGGAAA CCTTCTTCTA CCAACAAATC       360
     AAGAAAGAGC GCGCTCCTGC TCTCCCGCTC TATTGGCTCC GACAGAAGCC CCGCTACCTC       420
     CAACAACAAC AGCTGGAGAG GGACCGGCAG CCCGCTCTGC CTCGTCATCG GCTGCACCCG       480
     CTCACGGTCT GACTAAGTCA GCGAAAGCAA AACCGCTAGC AATAAACGGT ACTGCTGCAC       540
     TGCCAGCAAA ACAAAACGAA AACGTAAACA AAAAAGCTGG GTCGACCTGG CAGACTGGAA       600
     TGGACCGCTA CATTACAATA AAGCGAAAGC TCAGCCCGGA AAATTCAGAT TTGGGAAACA       660
     AGCCGAAAAA TACACGCGAT AACTCTACCT TGATCAAAAA TGTAGCCCCT GCAAATACCA       720
     ACAGATTTGC CTTGCTGGTA GATACCGCTG AGGACGTGCC GCTGGGATCC GTTGATATCG       780
     AACCGAAGAA AACAAAGCCT CCGCCAATAT ACATCCGCGA GAAGAGCACA AGCCGTCTTG       840
     TAAATACTTT GATTGGCCTT ATTGGGAAAG ATAGCTTTCA TATAATTCCC CTCGTAAGAG       900
     GTACTATCAA CGAAATCAAA CTTCAGACGA AAACGGAGGA CGACTACAGA AAAGTCACAA       960
     ACTATTTTAC CGCACAAAAA ATAGGCTTCT ACACCTACCA GCTTAAAAGC AGCAAGGGCC      1020
     TGCAAGTAGT CCTGAAGGGC ATTGAGTCTG ATGTTACGCC CGAAGAGATA ACTGAGGCGC      1080
     TAAAGGAAAA GGGATTTTAC GCCAAAAACG TGTTCAATAT CAAAAACAGA AACAGGCAGC      1140
     CCCAACCACT CTTCAAGATT GAGCTTGAAC CAGAAAACAA GCCTCCTAGA AAAAACGAGG      1200
     TTCACCCAAT TTACAAACTC CAGCTCCTTT TGCACCGTAG GATCACGGTA GAAGAGCCGC      1260
     ACAAACGCAA CGCTCCTGTA CAATGTACAA ACTGCCAAGA GTATGGCCAC ACGAGGTCAT      1320
     ATTGTACACT TCGCCCGGTG TGCGTAGTCT GTGGAGATCT CCACGACTCC AAACAGTGTC      1380
     AAATTAACAA AGAAAATGCA TGCGAGAAAA AATGTAATAA CTGCGGGGGC AATCACACAG      1440
     CAAACTACAG AGGCTGTCCA ATCTACAAAG AGCTGAAAAT CCGTCTTCAC AAAAGAATGA      1500
     ACACGGCGCG GGCACACCAA GGATCAGCTA CCCTGATACC ATCAGAGACA AATCCTGAAG      1560
     TAATTTTCTC GAAAGCAGCT AGTTTCGCTC CCTGGCCTAC ATTCAACACT AACAAGACAA      1620
     CATTTGCTAA CGTTTTAAAA TCAGGTATGA CGCCTCCAAC CCAAAACTCC CGAACTCCAC      1680
     ATGAAGTGCA CACAAAATTA GACACACAAC AAAACTATCA CCCAGCTGCG CAGCAGGAAA      1740
     CAAAAACTGA AGCTATGATG CAAGCCTTAC AACAGAGCAT GATGGAATTT ATGACATTTA      1800
     TGAAGACCAC CATTCAAGAC ATGATGCGTA ATCAAAACCT TTTGATACAA ATGCTTGTAG      1860
     CCCAACAATC AAATAAATAA TGGCTACCTT ACGCATAGCT ACGTGGAACG CCAATGGCGT      1920
     CTCACAGCGC AAACTTGAGC TAGCTCAATT CCTACATGAG AAGCATATCG ACGTAATGCT      1980
     TCTTTCGGAA ACTCATCTCA CAAGCAAATA CAATTTTCAA ATAAGAGACT ACCATTTCTA      2040
     CGGTACAAAT CATCCCGACG GAAAAGCACA CGGTGGCACC GCCATACTCA TAAGGAACCG      2100
     TATGAAGCAC CACTTTTACA AAGAATTTGC GGAAAATCAT CTTCAGGCCA CATCTATCAA      2160
     CATTCAGCTG GATGACAACA CTCTCCTTAC ACTAGCGGCC GTATACTGCC CCCCCCGTTT      2220
     CACAGTATTA GAAGCTCAAT TCCTGGATTT CTTCCAAGCA CTAGGGCCAC ACTTCATTGC      2280
     AGCAGGCGAC TACAACGCTA AACATACTCA CTGGGGATCG CGACTTGTGA ACCCAAAAGG      2340
     AAAACAGCTT TATAAGACGA TAATAAAAGC CACTAATAAA CTTGACCATG TTTCCCCCGG      2400
     GAGTCCTACA TACTGGCCAT CAGACCTCAA TAAGCTGCCA GACCTGATCG ACTTCGCAGT      2460
     TACGAAAAAT ATTTCCCGCA GTTTGGTTAA AGCTGAATGT CTGCCGGATC TCTCATCTGA      2520
     TCACTCGCCT GTACTAATTC ACCTCCGCCG ATACGCAGAA AACGTGAAAC CACCAACCAG      2580
     ATTGACCTCT AGCAAAACAA ACTGGCTCAG GTATAAAAAA TATATAAGTT CACATATTGA      2640
     GCTAAGCCCA AAACTCAATA CTGAATCTGA TATAGAGAGC TGCACGTGTG CATTGCAATC      2700
     CATCCTTACT GCAGCAGCTC TTACTGCAAC ACCCAAAATA ACAAATAATA CAATTAATTC      2760
     AAAAAAGACC AACGTACAAA TCGAGCAACT CGTCCACGTA AAACGTCGCT TACGCAGAGA      2820
     ATGGCAATCT TCCAGATCCC CAACTGCAAA ACAAAAGCTA AAAGTAGCCA CACGGAAACT      2880
     GGCCAACGCT CTGAAACAAG AAGAGGACGA CGATCAGCGC CGATACATAG AGCAACTCAC      2940
     ACCAACAGGC ACAAAACAAA AGTCACTGTG GCGAGCCCAC TCAACTCTTC GCCCACCGAC      3000
     TGAAACCGTT TTGCCGATAA GGAATTCATC AGGTGGCTGG GCCCGTAGTG ATGAAGACAG      3060
     AGCCAACACA TTTGCCGCTC ACCTACAAAA TGTGTTCACG CCAAACCAGG CTACTAGCAC      3120
     ATTCGCGCTA CCGTCCTATC CCGTAAACCG CCATCAGCAA CACACCCCAA TTGTGTTTCG      3180
     TCCTAAAGAA ATAACTAAAA TAATCAAAGA CAATCTCAGC CCGAAAAAAT CCCCCGGCTA      3240
     CGACCTTATA ACACCGGAAA TGATCATCCA GCTGCCACAT TCTGCAGTTC GCTACATAAC      3300
     CAAGCTCTTT AATGCCATCA CCAAACTTGG TTACTTTCCA CAACGATGGA AGATGATGAA      3360
     GATCATAATG ATTCCAAAGC CTGGTAAGAA CCACACAGTC GCTTCATCTT ACAGACCAAT      3420
     AAGTCTACTC TCATGCATTT CGAAACTATT CGAAAAATGC CTGCTGATCC GACTTAATCA      3480
     ACATCTGATA TACCACAATA TAATCCCAGC CCACCAATTT GGATTTCGCG AAAGCCACGG      3540
     AACCATTGAA CAGGTGAATC GTATTACAAC GGAAATAAGA ACTGCATTTG AATATCGCGA      3600
     ATACTGTACA GCAGTATTTT TAGACGTATC CCAAGCATTC GACAAAGTCT GGCTCGACGG      3660
     CCTAATGTTT AAAATTAAAA CATCCCTACC CGAAAGCACA CACAAACTTC TAAAGTCTTA      3720
     CCTCTATGAC AGAAAGTTTG CAGTGCGGTG CAACACTGCC ACTTCCACTG TTCATACAAT      3780
     TGAGGCTGGA GTCCCCCAAG GCAGCGTTCT TGGGCCAACC TTATACCTCA TCTATACAGC      3840
     CGACATCCCT ACAAATAGTC GCTTAACGGT ATCCACATTT GCCGACGATA CAGCTATCCT      3900
     TAGCCGTTCA AGGTCCCCTA TCCAAGCTAC AGCACAGTTG GCACTGTACC TCATCGACAT      3960
     TGAGAAGTGG CTCTCTGACT GGCGAATAAA AGTAAACGAG CAAAAATGCA AGCACGTGAC      4020
     GTTTACGCTA AACAGACAAG ACTGTCCTCC GCTCTTGTTG AACAGCATAC CACTCCCGAA      4080
     AGCAGACGAG GTAACGTACC TAGGAGTACA CCTAGACAGA AGACTCACAT GGCGCAGGCA      4140
     CATTGAAGCC AAAAAAACCC AACTTAAACT CAAAGCCAAC AACTTACACT GGCTCATCAA      4200
     CTCTGGTTCT CCGCTCAGCC TAGATCACAA GGTCTTGCTC TACAATTCTA TATTGAAACC      4260
     AATCTGGACC TATGGCTCAC AGTTATGGGG CAATGCCAGC AACAGCAATA TTGACATCAT      4320
     TCAGCGAGCA CAATCAAAGA TTCTGAGAAC CATCACTGGG GCACCGTGGT ACGTTCGGAG      4380
     TGAAAACATC CAAAGAGACT TAAATATCCC ATCAGTTACC AACGCAATCA CGGAACTTAA      4440
     GGAAAAATAC CATAGCAAGC TTCACACGCA CCCCAACCAC CTAGCGCGAG GTCTAATCCA      4500
     GCTCAGCAGC CGTTCCCGTC TCCGGCGAAA GGACCTACCA ACCCAGCGAA TAAATTATTA      4560
     GGGCCGTTTA AACATAGAAC AGTTGGAAAA ATAATACAAC TGTTCAAAAA ATACTTGTTA      4620
     TAGTTAAGAT TTTTAAACTT ATTGTTAGTT CTTATACAAG AAGATTCAAT AAATAAAAGC      4680
     AAAGTAAAAT AAAAAAAAAA AAAAAAAA                                         4708
//
ID   FB   standard; DNA; INV; 4347 BP.
XX
AC   X51937;
AC   X15469;
XX
DR   FLYBASE; FBte0000466; Dmel\NOF.
XX
FT   source          join(X15469:94..1010,X51937:1..3430)
FT   SO_feature      CDS ; SO:0000316:797..3874
FT                   /name="Dmel\NOF\ORF"
FT                   /db_xref="FLYBASE:FBgn0044029"
FT                   /db_xref="SWISS-PROT:P16320"
FT                   /db_xref="NCBI_PROTEIN:CAA36201.1"
FT                   /translation="IQQLDTSANLTLNSTFPDDDPEFQITEASKNGPLPILYFNLELDL
FT                   ELWRSIAPKKDQKTEKLQPNWTDTMAKLIYKKVPLPCAFNFRKAKLSDKVDNIWLRIEG
FT                   YCNDCSSILKGHCLVKPDEQCGIMISVSVPDTRGIPHNKKRRCTGSRRLEIGNELILKK
FT                   AALWRKEATDNMNDDDPEPSYIPNLPTLRKLREEATNRHLGITKDRDPVSSLYLKKYEG
FT                   ELAGCILDIGLDEFFCIYCTGTQVKTYASRIKTIRKISIDATGSVVLPIQKPNGDSSYV
FT                   FLYQIVMEGDDSIFPVFQMLSAKHDTASIQFWLSRFISKSGHFPLEVVSDFSLALLNGI
FT                   SLSFNECRIATYIKKCFHSLLMEERTDLPPCYIRLDIAHLIKMICRKNVFKSKLPNLKD
FT                   FYTRCIGLATTCETKDSFAELIKSVLIVALSQSSGEDEKGDILSSYRNEKYLLARIATF
FT                   TAPDHKETIEDNCIPEDQEEIDEDVTDFISNIKIAAEEEALNCNSVNCRPNPYFLPELM
FT                   PPLIKLCKYFVLWTNVMKEKFCSKYDVGSSALVEAYFKDLKNTDMSIFHRPVRADKFVV
FT                   QHIRCIEAVCKLERAAMKRKTVKTPSFIKENAPKKMCSKETKGFLEEILEESEVEYLLQ
FT                   EENWKVKNKTIKPTEGNDAEDNDTDDENKEMDLSEQPKEKPRGKYLKKCPNVELLYNRP
FT                   HRRKQDEILHNGGSMGPVWIGKQLLQFKNTCPFDSLVEILSTAYIDNFYYKSLLDDFYT
FT                   DNLTIELVKKYAVEGVSSSLYCDRGLVLKSFFDEKHQIIKCDANIGSFIEKALNGVPSA
FT                   SSHRTHIKNNHDCRNQKYIHHRLEVIDVEKVGHLDVQEVVIPFIDEFFARTDGECKICG
FT                   GQQILERQPGPHVILDIEFAMDAFHQIHHNGLPGTTTLLQVPEEILIQEKKYILSGAIE
FT                   YVPAMGGEIGHYIAYCRRVIGSWEVHNDMCRQWKKFSALNTKMTLHILIYTRKN"
XX
CC   Derived from X15469 (g7962) (Rel. 36, Last updated, Version 3).
CC   Derived from X51937 (g8297) (Rel. 44, Last updated, Version 6).
CC   Takis Benos and Michael Ashburner, 25-Aug-1997.
CC   Any changes to original sequence record are annotated in an FT line.
XX
SQ   Sequence 4347 BP;  1461 A; 775 C; 885 G; 1226 T; 0 other;
     TATATTCTAT TGCCCACCAT ATAAACACGT GCCACTTTCC TAGTTTTAGG ATCTGCCTAC        60
     ATAACACGTG CAGACGCACA GGTGTTTCTG GGTTTATATA GACCAAAAAT TGGTTCCGAT       120
     TGCCAATCTT GTAATTTACA GTTTACCAGG TAATTACATA ATTTTCAAAC CTCACTTTAT       180
     GATAGGGTCC AATTTTTTAC CTGTGACAAA GTGTTAAATT TTTTAAGAAT GGGTTTTTCA       240
     TGGCAGGTCA GAATCCTCTA TAAAATCTAA AACACTTGTC GGTATTTGAA AATCGCTCTC       300
     CTCCTTGATT CTCATATTAG GTGTAAAAGA TAAATCCGGA ACTCATAATT AAAATATTTT       360
     TTATGTGAAA AAGTTGTGCG CGATTTTAAC TACGCTTACC CAGTGCTGGA AAAGTTAAAG       420
     TTGTTTTGTT TTTCAAAGAA AGTGAAAGTT GCTAAGCACG AACTTAAGAA ATCTGAGTGA       480
     TTGTGTTAAA TTTATTTGAA TCCTTGTGAA TTTTGTTGAC AGTCTTTTTA AAGACTTGCA       540
     AAATTTTCAT ATTATTCGGT TCTTGCTTTT ATTTTTATAC AACGCGTTTT TCCTTTAGGC       600
     ATACCTTTAT ACATTTACAG TGTAAACAAC AGTGTAAAAC GTGTAAATCA GTGCAAAATA       660
     GTTTTTTTTA TTTACTCCAT AAAAAATAAG TGTTACTGTC AGGATGCCGG CCAAACCGCA       720
     AGTCGATGGT CACACCTTAG TGGATGCATT TTGCTGCGCG AATATTTTTA CGGAGACTGG       780
     AGCTCTTAAG CCAAGAAGCG ATAAAGTTTG GATGGATATA AGCAACCAAT TGAAAGGAGC       840
     GATCAGCGCG AAGACGCTTA ATTTCTACGC CAGAATCAAT AGGAATAACA TGATAACTGT       900
     GGTTAAAGAA CGATGTGGAA TTCAACAGCT GGATACTAGT GCCAATTTAA CTTTAAATAG       960
     CACATTTCCT GATGATGACC CGGAGTTCCA GATCACCGAA GCTTCAAAAA ATGGACCATT      1020
     GCCTATTTTG TACTTTAACC TGGAGTTGGA CCTGGAATTG TGGAGATCAA TTGCCCCCAA      1080
     AAAGGATCAA AAAACTGAAA AACTGCAACC TAACTGGACG GATACTATGG CAAAGTTGAT      1140
     ATACAAAAAA GTTCCTCTTC CGTGTGCATT TAATTTTAGA AAAGCTAAAC TTTCCGACAA      1200
     AGTGGATAAT ATTTGGCTAC GAATTGAAGG CTATTGCAAT GACTGCAGCT CAATTTTAAA      1260
     GGGACATTGC CTTGTGAAAC CCGATGAACA ATGCGGCATA ATGATATCTG TTTCAGTACC      1320
     GGACACACGA GGTATACCTC ATAATAAAAA ACGACGGTGC ACTGGATCGA GACGACTTGA      1380
     AATTGGGAAC GAGTTGATTT TAAAAAAAGC TGCATTGTGG AGGAAGGAAG CCACCGACAA      1440
     CATGAATGAT GACGACCCAG AACCGAGTTA CATACCAAAT TTACCAACCC TTCGGAAACT      1500
     TCGTGAAGAG GCAACTAACA GACACCTAGG AATTACCAAG GATCGGGATC CAGTTTCATC      1560
     ATTATACCTT AAAAAGTATG AGGGTGAATT GGCTGGATGC ATTCTTGACA TTGGATTGGA      1620
     TGAATTTTTC TGCATATACT GCACAGGAAC CCAAGTAAAA ACATATGCAT CAAGGATAAA      1680
     AACTATTAGA AAGATTTCTA TTGACGCAAC TGGAAGCGTG GTGTTACCCA TCCAAAAACC      1740
     AAACGGTGAC TCTAGTTATG TTTTTCTGTA CCAAATTGTA ATGGAGGGTG ACGACAGTAT      1800
     ATTTCCAGTT TTTCAGATGC TGTCGGCTAA ACATGACACA GCCAGCATAC AGTTTTGGTT      1860
     AAGCAGATTT ATATCAAAGT CGGGGCATTT TCCACTGGAG GTTGTATCTG ATTTTTCCTT      1920
     GGCATTGCTA AATGGAATAA GCTTAAGCTT TAATGAGTGT AGGATTGCGA CGTATATAAA      1980
     AAAATGTTTC CACAGCCTTT TGATGGAGGA ACGGACGGAT CTGCCACCCT GCTATATTCG      2040
     ACTTGACATC GCCCACCTAA TTAAAATGAT ATGCCGGAAG AACGTCTTCA AAAGTAAATT      2100
     ACCGAACCTC AAGGATTTTT ATACTAGATG TATTGGTCTT GCAACAACGT GTGAGACAAA      2160
     GGACAGTTTT GCGGAATTAA TTAAATCAGT ACTGATTGTC GCACTGAGCC AATCCTCAGG      2220
     GGAAGATGAA AAAGGAGACA TTCTTTCAAG TTACAGGAAT GAAAAGTATC TGCTCGCCAG      2280
     AATAGCTACA TTTACTGCCC CGGATCACAA GGAGACCATT GAGGACAACT GCATACCAGA      2340
     GGACCAGGAG GAAATTGACG AGGATGTTAC GGACTTTATC TCTAATATTA AAATCGCTGC      2400
     CGAAGAAGAA GCGTTAAATT GCAATTCGGT CAACTGTCGG CCAAATCCGT ATTTCCTACC      2460
     TGAGCTAATG CCACCATTAA TTAAGTTGTG CAAATATTTT GTTTTATGGA CAAACGTGAT      2520
     GAAGGAAAAG TTCTGTTCCA AATATGATGT CGGCTCTTCG GCTCTTGTGG AAGCCTATTT      2580
     CAAGGATTTA AAAAACACGG ACATGAGCAT ATTCCACCGA CCAGTGAGAG CGGATAAATT      2640
     CGTGGTGCAA CATATCCGAT GCATCGAAGC TGTTTGCAAG CTGGAACGAG CCGCGATGAA      2700
     ACGCAAGACC GTTAAAACTC CCAGCTTTAT AAAAGAAAAC GCTCCTAAGA AAATGTGCAG      2760
     TAAGGAAACC AAGGGATTTC TGGAGGAAAT ACTTGAAGAA AGCGAAGTGG AATACCTTTT      2820
     ACAAGAAGAA AACTGGAAGG TGAAGAATAA AACAATAAAG CCCACGGAAG GAAATGATGC      2880
     TGAAGACAAC GACACTGATG ATGAAAACAA GGAAATGGAT TTAAGTGAAC AGCCCAAAGA      2940
     AAAACCAAGG GGAAAATATC TCAAAAAATG CCCCAATGTG GAGTTATTAT ACAATCGACC      3000
     ACATCGAAGG AAACAGGACG AAATTTTGCA TAATGGTGGA TCAATGGGAC CCGTCTGGAT      3060
     TGGCAAACAA TTATTGCAAT TCAAAAATAC TTGTCCGTTT GACTCTCTAG TGGAAATATT      3120
     GTCGACCGCA TACATAGACA ATTTTTATTA CAAAAGCCTA TTGGATGATT TCTACACTGA      3180
     CAACTTGACG ATAGAATTGG TGAAAAAGTA TGCCGTCGAG GGAGTTTCGT CCAGTCTCTA      3240
     CTGCGACAGA GGTCTGGTCC TAAAAAGTTT TTTTGATGAA AAACACCAGA TTATAAAATG      3300
     CGACGCAAAT ATTGGGTCTT TTATTGAAAA AGCGCTGAAT GGAGTACCCA GTGCGTCAAG      3360
     TCATCGGACC CATATAAAAA ACAACCATGA TTGCAGGAAC CAAAAATATA TCCACCATCG      3420
     GCTGGAGGTT ATAGATGTCG AAAAAGTTGG CCACCTCGAC GTCCAGGAGG TAGTGATCCC      3480
     CTTTATTGAT GAGTTTTTTG CAAGAACTGA TGGAGAATGT AAAATATGCG GTGGACAACA      3540
     GATCCTTGAA AGGCAGCCAG GACCGCATGT CATACTTGAT ATAGAATTTG CAATGGATGC      3600
     TTTTCATCAA ATTCATCATA ACGGTTTACC AGGAACGACC ACTTTACTTC AAGTGCCGGA      3660
     GGAAATTTTA ATACAGGAAA AGAAATATAT TTTAAGTGGT GCCATCGAAT ATGTTCCTGC      3720
     GATGGGAGGG GAAATTGGAC ATTACATTGC ATATTGCCGC AGAGTCATTG GATCTTGGGA      3780
     AGTGCACAAC GATATGTGCA GGCAATGGAA AAAGTTCTCA GCTCTAAATA CCAAAATGAC      3840
     ACTCCACATT TTGATATACA CCCGGAAAAA TTAATGTTTA TTTTTAAGCC TTGTTTAAAA      3900
     GTGTAAAAAA TATTTGTTGT TAAAAATTAC AATCTTAAGT CCTTTGCAAA CGTTGTTTAA      3960
     AAATAAAATT AAATTAATTA TTTTACAAAA CTTAACCCTT TTTCACTTTT ATACCTAATA      4020
     TAAAGAGGTC CGTAAAGTAT CAAGGAGGAG AGCGATTTTC AAATACCGAC AAGTGTTTTA      4080
     GATTTTATAG AGGATTCTGA CCTGCCATGA AAAACCCATT CTTAAAAAAT TTAACACTTT      4140
     GTCACAGGTA AAAAATTGGA CCCTATCATA AAGTGAGGTT TGAAAATTAT GTAATTACCT      4200
     GGTAAACTGT AAATTACAAG ATTGGCAATC GGAACCAATT TTTGGTCTAT ATAAACCCAG      4260
     AAACACCTGT GCGTCTGCAC GTGTTATGTA GGCAGATCCT AAAACTAGGA AAGTGGCACG      4320
     TGTTTATATG GTGGGCAATA GAATTTA                                          4347
//
ID   DMTNFB     standard; DNA; INV; 1106 BP.
XX
AC   V00246; J01084;
XX
DR   FLYBASE; FBte0000288; Dmel\FB.
XX
FT   source          V00246:1..1106
XX
CC   Derived from V00246 (g8708) (Rel. 36, Last updated, Version 3).
CC   Josh Kaminker 2 Aug 2002.
CC   Any changes to original sequence record are annotated in an FT line.
XX
SQ   Sequence 1106 BP; 340 A; 228 C; 119 G; 419 T; 0 other;
     AGCTCAAAGA AGCTGGGGTC GGAAAAATCG AATTTTTGAA ATTTGAAAGC TGGAATCGTT        60
     TGCCCATTTT TTGCCCATGT TTGCCCACCA ATTAGTTTTT TTTGCCCACG TCCAGTTTTT       120
     GAGATATGGA TTTTCGAAAA AGTTCGAAAA TGTTCGAAAA TCAAAAATTT CGCTTTTTTC       180
     AAATTTTTTT TTTTTTAAAT CGCAATAACA TCGTTTGCCC ACGTTTGCCC ACCCTTTAGA       240
     ATTTTGAAAA AATTTATACT TTAGAAAATA TAAGGCTTTT AAGTTTACCT CGGTCTAATC       300
     AGAGAGTAAA TCGTTTGCCC ATCTCTTAAA ACCAAATATT ATCAACAAAA AACGTTTGCC       360
     CAACCATTAT TATTAGTTTT TATCGTTTGC CCACCCTTTA AAAAACCTTT AACAAAATTT       420
     TTTTTTCGAT TGCCCACACT TGAAATACAA CCAATTTCGT TAGCCCACCT CTTCAAAATA       480
     AATATTTCCA ATAAAAAACG TTTTCCCACC ATTTAAAAAT AAATAATTTC GATTGCCCAT       540
     CCTTCAAAAT TCATTTTAAC GTTTGCCCAC CCTTTAAAAT TTGTTTTTTT CGTTTGCCCA       600
     CTCTTAAAAC TAAATAATTT CGATTGCCCA CCTTTTAAAA CTAAATAATT TCGTTTGCCC       660
     ATCCTTTAAA ATTCATTTTT AACGTTTGCC CACCCTTTAA AAATAAATTA TTTCGTTTGC       720
     CCACCCTTTA AAATTTGTTT TTTTCGTTTG CCCACTCTTA AAACTAAATA ATTTCGATTG       780
     CCCACCTTTT AAAACTAAAT AATTTCGTTT GCCCATCCTT TAAAATTCAT TTTAACGTTT       840
     GCCCACCCTT TAAAAATAAA TTATTTCGTT TGCCCACCCT TTAAAAGTTT TTTTTTTTCG       900
     TTTGCCCACT CTTAAAACTA AATAATTTCG ATTGCCCACC TTTTAAAACT AAATAATTTC       960
     GTTTGCCCAT CCTTTAAAAT TCATTTTTAA CGTTTGCCCA CCCTTTAAAA TTTGTTTTGT      1020
     AAGATGTGGC GCCAATTCAG ATATTTTAGG ATCGGCGGAT AGAAGCACTT ACTTATATGA      1080
     TGATGATGAA CATACATAGA CATAAT                                           1106
//
ID   DMREPG     standard; DNA; INV; 4346 BP.
XX
AC   X06950;
XX
DR   FLYBASE; FBte0000657; Dmel\G-element.
XX
FT   source          X06950:1..4346
FT   SO_feature      CDS ; SO:0000316:220..951
FT                   /name="Dmel\G-element\ORF0"
FT                   /db_xref="FLYBASE:FBgnXXXXXXX"
FT   SO_feature      CDS ; SO:0000316:819..1539
FT                   /name="Dmel\G-element\ORF1"
FT                   /db_xref="FLYBASE:FBgnXXXXXXX"
FT   SO_feature      CDS ; SO:0000316:join(1530..1858,1866..1973,1982..2719,2727..3008,3012..3800,3806..3991,4006..4095)
FT                   /name="Dmel\G-element\ORF2"
FT                   /db_xref="FLYBASE:FBgnXXXXXXX"
XX
CC   Derived from X06950 (g8427) (Rel. 16, Last updated, Version 1).
CC   Takis Benos and Michael Ashburner, 20-Aug-1997.
CC   Any changes to original sequence record are annotated in an FT line.
XX
SQ   Sequence 4346 BP;  1215 A; 1356 C; 959 G; 816 T; 0 other;
     ACAGTCGCGA TCGAACACTC AACGAGTGCA GACGTGCCTA CGGACCGACG GCAAGTTATT        60
     TTCGTGCTCA AAGTCCCGCT ACTCTAAAAC CGCTACGTAG TGTCGCGAGA TTTCTTCGCG       120
     CACCGTGATT GGTTCAGCCG GCGAACCTTA CGGTATCGCT ACCACTACCA ACGCACTCGT       180
     GCGTGCGTGT TATCGGTATC AACAGTTACA TTCGGCTAAA GTTACTGCGA ACAACTCAGC       240
     AGCAGCCACG TGCTGAGGCT GGTACACCAA CAAACGGTTC CTACCGTGCC CTCCTCCCCT       300
     CCTTCCCTAC TCCGGGACAA CATGGACTGG CAAGCCCCCC CGCGACCCAC CAAGCTGACC       360
     AAAGTGCCTA GAAAGAAGGC GCTCAAAGAG GCGCCAGGAG AAGGTGAAAG CAGCTGCTCA       420
     AGCGATAGCA GCTCCTCGGA GTCAGAGCCT GGGGAAGTCA AGCGCAAAGC AGCGAGCAGA       480
     GACGCTAAGG AAGCCGCCGA CAACGTGCCC AACACCAGCG CAGCTCTGCG CAAGAAGCTG       540
     GAAAATAACT CCTTCGCCCT TCTGTCCAGC ACTGAGGACG AAGACGATGA CGACGACAAC       600
     ACCGACAACG AGCAGCAAAC CCCTGTTGGG GAATCTGCTC CAAAAACCAT GAAAAAACCC       660
     AACCCGACCC CGAAGACCAT CAAGCCACCC CCGATCTACA TCCCAGACGT GACCAACATC       720
     TCAGCCCTTG TCAGGATGAT TACGACTCTC GTCGGTGCCC ACAAGGAATT CTCGTACAAA       780
     ACTGAGAGAA ACAACAATGT ACGAGTAATG ATGCCTGACA AGGAATCCTA CTCAGCCTTT       840
     CGTCAGCAGC TTGTGACCCA GAACAAAAGG CACCGCACAT TTCAACTGTC AGGGACCTGC       900
     ACAACCCAAT TGGCAAAAAA TCAAAGGAAC CCCTGGGGAT CTTCTTTGTA AACCTGGAAC       960
     CTGCGAGCAA CAATACAGAC ATCTACAAAC TCAAGAGAAT CTGCAGGTCG GTCGTCACCG      1020
     TTGAGCCGCC TCTGAAATTC AACGATGTTC CGCAGTGCTT CAGATGTCAA GGGTTCGGAC      1080
     ACACCCAGCG CTACTGCTTT TTAGAGTTTC GCTGCGTCAA GTGTGGTGGC CTCCACGACT      1140
     CCAGGGCGTG TGAAAAAAAG GAAGACGAGA AAGCATGCTG CCTACACTGT CAAGCCGACC      1200
     ATCCAGCGTC GTTCAAAGGG TGCCCCGCGT ATAAGAAGGC AAAGGCTCAA CAAGCTCCTA      1260
     AACCCAAAGC AAGGAGCATG GAAAGCAACA ACAAGCCCTC CTTTGAGCTC CCAAATATTA      1320
     CAAACGGTAT GAGCTATAGA GACGCGCTAA GTGGCACACG CAAGTCCCAA GCAAGCACTC      1380
     CCCCACCGAC ACCCCCAACC CCACCTGAAG CCCCACAACC TAACCACATG GAGGCTATGT      1440
     TCACTCGATT TGAGAGCCTG GTCGAAAGAA TGATGGAGAA GATGTTTGCT CAGGTGACGC      1500
     AGCTTGTTGC TTCCATCCTC AACAGCAAGT CATGCAAATA AGTCTCAACA TAGTCTTCTG      1560
     GAACGCGAAC GGCTTGCAGA GAAGCAAAGC CGAAGTTGAG CACACCATCA AAACCGACAA      1620
     CATCGATATT TTATTGGTCT CAGAATCCCA TTTTTGCCCC AGATCCCACT TCATCATCTC      1680
     CGGTTACGAC CTCATCACAG CCAACCACCC ATCAGGTAGA GCTCGAGGAG GAGCGGCCAT      1740
     GCTCATCAAA AGCGGCATAC AGTTCACTGA ACTGCCTGCG ATACAGGAGG ATTGGGCACA      1800
     GTGTGCAGTG GCCAGAGTCA ATAGCCTACA GGGAGATATT ACGGTTGGAG CGGTTTACTT      1860
     CCACCCCCAG GCACGCGATT ACAGAGACTC ACCTGCATGA GTTCTTCGAG TCCCTCGGAA      1920
     CTCGCTTCAT TGCAGCCGGA GACTTCAATG CAAAGCACTC CTGGTGGGGG TCCGCACAAA      1980
     CAACCCCAAA GGCAAAACGC TCCACAAGTA CCTGATGCGC AAAAACTTGG ACTGCCACTC      2040
     TACTGGAGAG CCCACACACT GGCCCTCGGA CCCTTCTAAG CAGCCGGATC TGCTGGACAT      2100
     CGCGATCTGC AAAGGCATAG GTCGTGCCAA ACTCGTCTGC ACTACATACG ACAGGCTCGT      2160
     ATCGGACCAC AGCGCCGTCA ACCTGCTCCT CAACATCCCT GTCCTCAGGA AGACGCCGCT      2220
     CCGTAGACTC ACGGGGAATC GCACCAATGC CCCCAAGTTC ACGTTCTGGA TGCTCTCCTC      2280
     CCTAAACCCA GACCCAGACC TCTCCACTCC AGGCAATATA GGCGCGGCCA TCGAAAAACT      2340
     GAACAAGGAG ATGCACAACG CCGCTGAGTT TGCGAACCCT CCTCCTCCTA CAACCCCGAG      2400
     AACTCCCGCA AGAGACCTGC ATTTGTGGTC CCCAGAAATC GCCGCCCTCG TGGCCGAGAA      2460
     GAGACGCCTC AGACGAGTAT GGTTCCTCTC GCGTAACCCC AGGGACAAGA CAGCGCTCAA      2520
     TCGCGCCTCC AAGGAACTCA AGGACAAACT AACCACCCTA CGCCAAGACT CGTTTCAACG      2580
     ATTCCTTGAA GATCTGGAAC CTGGAGACCC GCAGCACAAC CTGTGGATCG TCACGCGGCA      2640
     CATCAAAAGA CCCGCCAAGA AAATGGTACC AGTGCGTACA GCAGACTGCT CCTGGTGTCG      2700
     GTCTGAGGCA GAAAGAGCCG AAGCTTGCTG ACCACCTTCG CTCTGCCTTC ACTCCGTTTG      2760
     ACCGATGCAC AGCTGCAGAG CAAGCTGACA CCATCAGAGC TGTTGAAAGC CCATGTGCTC      2820
     CAGGACCTGC AATTCAGCCC GTCGCACCAG AGGAGATCGC GCAGGAAATT GCCTCGCTCA      2880
     GAAACGGCAA GTCTCCCGGC CCTGATCGCA TCGACGCTAC TGCGTTAAAA ATGTTGCCCA      2940
     CATTCTGCTC ACAGCTGCTT GCCAACATTT TTAACAGCTG CTTCCGGCTA GGGTATTTCC      3000
     CAAAACAATA GAAACGCGCC GAAGTGATTA CCATCCCCAA GCCCGGCAAA CCTGAAGCCA      3060
     ATCTTGCCTC CTATCGTCCG ATAAGTCTGC TGGCAATCCT CTCCAAAATA CTCGAAAGAG      3120
     TATTTCTGCG CAGAGTGCTG CCAGTACTGG ATGAGGCTGG TTTGATCCCC GATCACCAGT      3180
     TTGGCTTCAG GCGCTCCCAC GGAACACCAG AGCAATGCCA CCGGCTTGTA GAGCAAATTT      3240
     TGGAGGCCTT CGAAAGGAAG CAATACTGCT GCGCCGTCAT GCTGGATGTG AAGCAGGCCT      3300
     TCGACAAAGT CTGGCACCCT GGACTCCACT ATAAAATCAA GACTCACCTT CCCGGATCCC      3360
     ACTTCGCCTT CCTCAAATCA TTCACTGAGG GTAGAGAGTT CCAAGTTTGC TGCGGAACAG      3420
     CGACCAGCAC GCCTAGGCCG ATAAGAGCCG GAGTACCCCA AGGCAGCGTC CTTGGACCAA      3480
     TACTGTACAC ACTCTACACA GCAGACCTTC CTATCACACC CTCCCGGAGC CTAACAGTGG      3540
     CCACATATGC CGATGACACC GCCTTCCTAG CCTCCGCCTC AGACCCCCAA GAAGCATCAA      3600
     CCATCATTCT AAGCCAGCTG GATGCCCTCG ACCCATGGTT GAAACGATGG ACCATTGCCG      3660
     TGAACGCAGA CAAATCCTCC CAAACCACTT TCTCCCTGCG CAGAGGAGAC TGCCCCCCAG      3720
     TCACGCTCAA CGGGGAAACT ATTCCAACCT CAAGTTCCCC GAAATACCTT GGATTGACTC      3780
     TAGACCGGAG GCTCACTTGG CACACCAGGC TGACCTGCGC CTCAAGCAAC TCCACTGGCT      3840
     CATCGGGAAA AGGTCCAAAC TTAGGGAAAA CCTTAAACTC CTCCTGTACA AGGCCATCCT      3900
     GAAGCCAATT TGGACTTATG GGATTCAGCT GTGGGGCACT GCCAGCATCT CAAACCGCAA      3960
     CCGCATACAG CGCTTCCAGA ACAAGTGCCT GAGTCAATCG CTGACGCTCA CCCATACCAT      4020
     GAAAACTCCG TTATCCACAA GGAGCTTGGA ATGCCATGGG TAGCAGAGGA GATCTCCCGC      4080
     TTCAGCGAGA GATACGCTAA ACGACTGGAC AACCACCCTA ACCATCTGGC TATTAACCTC      4140
     CTGGACAACA GTGAAACCAT CAGACGCCTC CAGAGGAAAC ACCCGCTTGA TCTCCACCAC      4200
     CTATAACCCA CAACAATGAA CCCCCGACCA ATCTACAACT TTGTAATCCC TTAAGTTAAT      4260
     GCCCCCCCCA CCCAAACATT TAATTATTGT CCACATGGAC AGATTTTAAA TTAATACATA      4320
     GATCGCTAAA AAAAAAAAAA AAAAAA                                           4346
//
ID   DMGYPF1A   standard; DNA; INV; 7469 BP.
XX
AC   M12927;
XX
DR   FLYBASE; FBte0000021; Dmel\gypsy.
XX
SY   synonym: mdg4
XX
FT   source          M12927:1..7469
FT   SO_feature      five_prime_LTR ; SO:0000425:1..482
FT   SO_feature      three_prime_LTR ; SO:0000426:6841..7411
FT   SO_feature      polyA_site ; SO:0000553:7277..7280
FT   SO_feature      primer_binding_site ; SO:0005850:482..492
FT                   /bound_moiety="tRNA:lys2"
FT   SO_feature      CDS ; SO:0000316:1080..2435
FT   SO_feature      start_codon ; SO:0000318:1..3
FT                   /name="Dmel\gypsy\gag"
FT                   /db_xref="FLYBASE:FBgn0014965"
FT                   /db_xref="SWISS-PROT:P10405"
FT                   /db_xref="NCBI_PROTEIN:AAA70218.1"
FT                   /translation="MSWAHNYRKVKVEYESEDSWEEEQVGQALGRPLDSATVDITMDPN
FT                   QIQALIDNAVRQALSQQQSQFQTQLNSLAARVQSLQVEAPQIKIYEKVSVNPDVRCDIP
FT                   LDIIKSVPEFSGTQDEYVAWRQSAIYAYELFKPYNGSSAHYQAVAILRNKIRGAAGALL
FT                   VSHNTVLNFDAILARLDCTYSDKTSLRLLRQGLEMVRQGDLPLMQYYDEVEKKLTLVTN
FT                   KIVMTHEQEGADLLNAEVRADALHAFISGLKKALRAVVFPAQPKDLPSALALAREAEAS
FT                   IERSMFANSYAKAVEERAHSGANGKSRFQGKPNKEEQGQDRNPHFTKRPKNNGQTNKDT
FT                   QAQAPQPMEVDSSSRFRQRTEHYQNHPNESNAFKRRNSSERSTGPRRQRLNNVVQEAPK
FT                   QKDPKEEYEKTAKAAVEEIDSENEYAPSDDSLNFLGGAPGCRSLNDGWLGEP"
FT   SO_feature      CDS ; SO:0000316:2438..5470
FT   SO_feature      start_codon ; SO:0000318:1..3
FT                   /name="Dmel\gypsy\pol"
FT                   /db_xref="FLYBASE:FBgn0014966"
FT                   /db_xref="SWISS-PROT:P10401"
FT                   /db_xref="NCBI_PROTEIN:AAA70219.1"
FT                   /translation="MLIDTDAAKNYIRPVKELKNVMPVASPFSVSSIHGSTEIKHKCLM
FT                   KVFKHISPFFLLDSLNAFDAIIGLDLLTQAGVKLNLAEDSLEYQGIAEKLHYFSCPSVN
FT                   FTDVNDIVVPDSVKKEFKDTIIRRKKAFSTTNEALPFNTAVTATIRTVDNEPVYSRAYP
FT                   TLMGVSDFVNNEVKQLLKDGIIRPSRSPYNSPTWVVDKKGTDAFGNPNKRLVIDFRKLN
FT                   EKTIPDRYPMPSIPMILANLGKAKFFTTLDLKSGYHQIYLAEHDREKTSFSVNGGKYEF
FT                   CRLPFGLRNASSIFQRALDDVLREQIGKICYVYVDDVIIFSENESDHVRHIDTVLKCLI
FT                   DANMRVSQEKTRFFKESVEYLGFIVSKDGTKSDPEKVKAIQEYPEPDCVYKVRSFLGLA
FT                   SYYRVFIKDFAAIARPITDILKGENGSVSKHMSKKIPVEFNETQRNAFQRLRNILASED
FT                   VILKYPDFKKPFDLTTDASASGIGAVLSQEGRPITMISRTLKQPEQNYATNERELLAIV
FT                   WALGKLQNFLYGSREINIFTDHQPLTFAVADRNTNAKIKRWKSYIDQHNAKVFYKPGKE
FT                   NFVADALSRQNLNALQNEPQSDAATIHSELSLTYTVETTDKPLNCFRNQIILEAARFPL
FT                   KRNLVLFRSKSRHLISFTDKSWLLKTLKEVVNPDVVNAIHCDLPTLASFQHDLIAHFPA
FT                   TQFRHCKNVVLDITDKNEQIEIVTAEHNRAHRAAQENIKQVLRDYYFPKMGSLAKEVVA
FT                   NCRVCTQAKYDRHPKKQELGETPIPSYTGEMVHIDIFSTDRKLFLTCIDKFSKYAIVQP
FT                   VVSRTIVDITAPLLQIINLFPNIKTVYCDNEPAFNSETVTSMLKNSFGIDIVNAPPLHS
FT                   SSNGQVERFHSTLAEIARCLKLDKKTNDTVELILRATIEYNKTVHSVTRERPIEVVHPG
FT                   AHERCLEIKARLVKAQQDSIGRNNPSRQNRVFEVGERVFVKNNKRLGNKLTPLCTEQKV
FT                   QADLGTSVLIKGRVVHKDNLK"
FT   SO_feature      CDS ; SO:0000316:join(567..568,5551..7000)
FT   SO_feature      start_codon ; SO:0000318:1..3
FT                   /name="gypsy\env"
FT                   /db_xref="FLYBASE:FBgn0014964"
FT                   /translation="
FT                   MFTLMMFIPLVVANARITDFSHANYIPVLDGDVLVFEQRDLLKHSSNLSE
FT                   YASMIDETQKLSESFPHSHMRKLLEVDTDHLRTLLSVLKVHHRIARSLDF
FT                   LGTALKVVAGTPDATDLFKIKITEAQLVESNSRQIAINSETQKQINKLTD
FT                   TINKVINARKGDLVDTPHLYEALLARNRMLSTEIQNLILTITLVKSNIIN
FT                   PTILDHADLKPLVEQDTPIVSLIEASKIRVLQSENSIHILIAYPRVKFSC
FT                   KKVAVYPVSHQHTILRLDEDTLAECEHDTFAVTGCTDTTHFTFCERSRRE
FT                   TCVRSLHAGNAAQCHTQPSHLREINPVDDGVVIINEAAAHVSTDGSPETL
FT                   IEGTYLVTFERTATINGSEFVNLRKTLSKQPGIVRSPLLNIVGHDPVLSI
FT                   PLLHRMSNENLHSIQNLMDDVESEGSPRLWFVAGVVLNFGLIGSLALYLA
FT                   LRRRRASREIQRTIDTFNMTEDGHKLEGGVVNN"
XX
CC   Derived from M12927 (g157583) (Rel. 44, Last updated, Version 6).
CC   Takis Benos and Michael Ashburner, 20-Aug-1997.
CC   Any changes to original sequence record are annotated in an FT line.
CC   [See also:AF033821; alignments in /alignments/gypsy]
XX
SQ   Sequence 7469 BP;  2301 A; 1808 C; 1602 G; 1758 T; 0 other;
     AGTTAACAAC TAACAATGTA TTGCTTCGTA GCAACTAAGT AGCTTTGTAT GAACAATGCT        60
     GACGCGCCAG AATTGGGTTC AACGCTCCAC GCGAAGAATG CCTGGCAGCG GAAAGCTGAC       120
     ACTTCCTACC GGGAGTGTTG CTTCACGCTG CAAGAAATGC TGAGTCGGCT TGCCGACTTG       180
     TGGCGGCGCG ATGCATTGCT CGAGGGTAAA CTTAGTTTTC AATATTGTCT TCTACTCAGT       240
     TCAAATCTTG TGTCGAAATA AACCACAGCT TGCTCCGGCT CATTGCCGTT AAACATCATT       300
     GTTCTTATTT ACAATCAAAT CGCTATCGCC ACAAGGCTAG TGATAATAAC TAAGGGGGCG       360
     AAGTCAAGCC CTCCAACCTA ATCTCCATAA ACAGTGTCTA AGACGAACCT CAGCGAAAGA       420
     AGGAAGATCT CTAGACCTAC TGGAAATAAC ATAACTCTGG ACCTATTGGA ACTTATATAA       480
     TTGGCGCCCA ACCAACAATC TGAACCCACC AATCTAATTT AACACACTTT GTCAGGCGAC       540
     AAACAGGGTA GTTAAGTTAG AAAAGCATGT AAGTTTTACA AGACACTTCT TTGACGCAAT       600
     CAAGAAATTT ACGAGTGAAA AAAAAAAAAA AAAAAAGTTG TGTATCTGGC CACGTAATAA       660
     GTGTGCGTTG AATTTATTCG CAAAAACATT GCATATTTTC GGCAAAGTAA AATTTTGTTG       720
     CATACCTTAT CAAAAAATAA GTGCTGCATA CTTTTTAGAG AAACCAAATA ATTTTTTATT       780
     GCATACCCGT TTTTAATAAA ATACATTGCA TACCCTCTTT TAATAAAAAA TATTGCATAC       840
     TTTGACGAAA CAAATTTTCG TTGCATACCC AATAAAAGAT TATTATATTG CATACCCGTT       900
     TTTAATAAAA TACATTGCAT ACCCTCTTTT AATAAAAAAT ATTGCATACG TTGACGAAAC       960
     AAATTTTCGT TGCATACCCA ATAAAAGATT ATTATATTGC ATACCTTTTC TTGCCATACC      1020
     ATTTAGCCGA TCAATTGTGC TCGGCAACAG TATATTTGTG GTGTGCCAAC CAACAACCAA      1080
     TGAGTTGGGC ACATAACTAC AGAAAGGTTA AGGTCGAATA CGAAAGCGAG GATAGCTGGG      1140
     AGGAGGAGCA AGTAGGCCAA GCATTAGGTC GGCCGTTAGA TAGTGCCACG GTAGATATTA      1200
     CCATGGACCC CAATCAGATT CAAGCTCTTA TCGACAATGC TGTCAGACAG GCATTGTCGC      1260
     AACAGCAATC CCAATTTCAG ACACAACTCA ATTCCCTAGC TGCGCGGGTA CAGAGTTTGC      1320
     AGGTGGAAGC ACCGCAAATC AAGATTTACG AAAAAGTCTC TGTTAACCCC GATGTTAGGT      1380
     GCGACATTCC CCTTGACATA ATAAAGTCTG TACCAGAGTT CTCCGGTACC CAAGACGAGT      1440
     ATGTGGCCTG GAGACAATCG GCCATATACG CCTACGAGCT CTTCAAACCA TACAATGGCA      1500
     GCAGTGCCCA TTATCAGGCT GTTGCCATAT TAAGGAATAA AATCCGTGGC GCAGCCGGGG      1560
     CTTTACTGGT CTCCCACAAT ACGGTATTGA ACTTCGATGC TATTTTGGCC AGACTAGACT      1620
     GCACGTACTC GGACAAAACA TCCTTACGCC TGTTGAGGCA AGGATTGGAA ATGGTTAGGC      1680
     AAGGAGACCT ACCACTAATG CAATACTACG ATGAAGTTGA AAAGAAGCTA ACGCTTGTCA      1740
     CTAACAAAAT CGTAATGACG CATGAACAAG AGGGTGCTGA CCTGCTTAAC GCTGAGGTCA      1800
     GAGCCGACGC CCTGCATGCT TTTATTTCGG GGCTCAAAAA GGCCCTCAGA GCTGTGGTCT      1860
     TCCCGGCCCA ACCAAAAGAC CTGCCATCTG CACTGGCTTT AGCTAGAGAA GCAGAGGCAA      1920
     GCATAGAGAG AAGCATGTTC GCTAACTCCT ACGCCAAGGC CGTAGAGGAG CGAGCGCATT      1980
     CGGGGGCAAA CGGCAAGAGC CGTTTCCAGG GGAAGCCAAA TAAAGAAGAA CAGGGACAGG      2040
     ACAGGAATCC CCACTTCACC AAACGCCCCA AAAATAACGG ACAAACCAAC AAGGACACTC      2100
     AGGCGCAAGC ACCCCAGCCA ATGGAGGTCG ATTCATCCTC CAGGTTTAGG CAGCGTACTG      2160
     AACATTATCA GAATCATCCT AACGAGTCGA ACGCGTTTAA GAGGAGAAAT TCCTCAGAAC      2220
     GCTCAACAGG ACCGAGACGA CAACGTCTGA ATAACGTTGT CCAAGAGGCC CCTAAACAAA      2280
     AGGACCCCAA AGAAGAGTAT GAAAAAACAG CAAAGGCTGC AGTCGAGGAA ATCGACAGCG      2340
     AAAATGAGTA CGCTCCCAGT GACGACTCGT TGAATTTTTT AGGGGGCGCT CCCGGTTGCC      2400
     GTTCATTGAA CGACGGCTGG CTGGGAGAAC CTTAAAGATG CTAATCGATA CCGACGCGGC      2460
     AAAAAACTAC ATTAGGCCCG TAAAGGAGCT GAAAAATGTA ATGCCGGTCG CCAGCCCTTT      2520
     CTCGGTGAGC TCAATACACG GCTCCACCGA AATCAAACAC AAATGCTTGA TGAAAGTCTT      2580
     CAAGCACATC TCCCCATTTT TTCTTTTGGA TTCTCTCAAT GCGTTCGACG CTATCATAGG      2640
     CTTGGACCTG TTAACACAGG CCGGGGTAAA ACTCAACCTT GCAGAGGACT CCTTAGAATA      2700
     CCAGGGCATC GCTGAAAAGC TTCATTATTT CAGCTGCCCC AGTGTAAATT TCACTGATGT      2760
     AAACGATATT GTTGTACCTG ACTCCGTTAA AAAGGAGTTC AAGGACACAA TAATAAGGAG      2820
     GAAGAAAGCT TTCTCCACAA CAAATGAAGC TCTTCCTTTT AACACCGCTG TCACTGCCAC      2880
     AATTCGGACA GTTGACAATG AACCGGTGTA CTCAAGAGCG TACCCAACTC TTATGGGTGT      2940
     CTCCGACTTT GTGAACAACG AGGTCAAACA ACTGCTGAAA GACGGCATTA TCAGGCCCTC      3000
     AAGGTCTCCC TATAACAGCC CGACCTGGGT TGTTGACAAA AAGGGGACCG ACGCCTTCGG      3060
     GAACCCAAAC AAGAGGTTGG TCATTGACTT CAGGAAGCTA AATGAGAAAA CTATTCCTGA      3120
     CCGGTACCCG ATGCCTAGCA TTCCCATGAT TCTAGCGAAT CTGGGCAAGG CAAAGTTCTT      3180
     CACTACCCTT GATCTTAAGT CAGGGTATCA TCAAATTTAC CTCGCGGAAC ACGACCGCGA      3240
     GAAGACATCG TTCTCGGTGA ATGGTGGTAA ATACGAGTTT TGCCGTCTAC CGTTCGGCTT      3300
     GAGAAATGCA AGCAGCATTT TTCAAAGAGC CCTAGACGAT GTGCTTAGAG AGCAAATCGG      3360
     GAAGATATGT TACGTCTATG TAGATGACGT CATAATTTTC TCTGAAAACG AGTCCGACCA      3420
     TGTCCGCCAC ATCGATACAG TACTAAAATG CCTGATCGAT GCCAACATGA GAGTAAGCCA      3480
     GGAGAAAACT AGATTCTTTA AAGAGAGTGT AGAATACCTC GGCTTTATTG TCAGTAAGGA      3540
     CGGAACTAAA TCCGATCCAG AGAAGGTGAA GGCCATTCAG GAGTACCCTG AACCAGACTG      3600
     CGTTTACAAG GTTAGGTCCT TCCTTGGTTT AGCCAGCTAC TACAGAGTCT TCATCAAAGA      3660
     CTTTGCTGCC ATAGCCCGCC CGATCACCGA TATCCTAAAA GGGGAAAATG GTTCGGTGAG      3720
     CAAACACATG TCTAAAAAAA TTCCTGTTGA GTTTAATGAA ACTCAACGCA ACGCGTTCCA      3780
     AAGACTGCGA AACATACTAG CATCCGAGGA TGTCATACTC AAATACCCCG ACTTTAAAAA      3840
     GCCTTTTGAC CTTACTACAG ATGCTTCGGC AAGTGGTATC GGTGCAGTCC TATCCCAGGA      3900
     GGGCAGGCCA ATCACCATGA TATCGCGTAC CCTTAAACAG CCCGAGCAGA ACTACGCCAC      3960
     AAACGAAAGG GAATTGCTGG CGATTGTATG GGCCCTAGGT AAGTTGCAGA ACTTCCTGTA      4020
     TGGCTCTAGG GAGATTAATA TATTTACCGA CCATCAACCC CTCACTTTCG CTGTTGCCGA      4080
     CAGGAACACG AATGCCAAGA TAAAGAGGTG GAAATCTTAC ATAGACCAGC ATAATGCCAA      4140
     GGTTTTCTAC AAACCTGGCA AAGAAAATTT CGTGGCAGAC GCCCTCTCTA GGCAGAATCT      4200
     GAATGCCTTA CAAAACGAAC CCCAATCAGA CGCTGCGACC ATTCACAGTG AGCTCTCCCT      4260
     GACCTACACG GTCGAGACAA CAGACAAACC GTTAAATTGC TTCAGGAACC AGATCATTCT      4320
     GGAGGCAGCA CGTTTTCCGC TCAAACGAAA CCTGGTGCTC TTTCGAAGCA AATCTCGCCA      4380
     CTTAATCAGC TTTACTGATA AAAGTTGGCT ATTAAAAACA CTTAAGGAGG TGGTAAACCC      4440
     TGACGTCGTG AACGCTATTC ACTGCGACCT GCCCACTCTG GCAAGCTTCC AACACGACCT      4500
     CATTGCCCAC TTTCCAGCCA CCCAATTTCG TCACTGTAAG AATGTCGTGT TAGACATAAC      4560
     CGACAAAAAC GAACAGATCG AAATCGTCAC TGCCGAGCAC AACCGCGCTC ACAGAGCCGC      4620
     ACAAGAAAAC ATTAAACAAG TCCTTCGGGA TTATTACTTT CCCAAAATGG GCAGTTTAGC      4680
     TAAAGAAGTA GTAGCTAATT GTAGGGTCTG CACCCAAGCA AAGTATGACA GGCACCCGAA      4740
     AAAGCAAGAG CTCGGGGAAA CGCCCATACC CAGCTATACA GGTGAGATGG TGCATATTGA      4800
     CATATTCTCA ACCGACAGGA AGCTATTCCT GACGTGTATT GACAAATTTT CTAAATATGC      4860
     AATAGTGCAA CCAGTGGTGT CTAGAACAAT AGTGGACATC ACAGCACCCC TGTTGCAGAT      4920
     CATTAACCTG TTCCCCAATA TCAAAACGGT CTATTGTGAC AATGAGCCCG CATTTAACTC      4980
     AGAAACTGTC ACCTCAATGC TCAAGAACAG CTTCGGCATT GACATAGTAA ATGCGCCCCC      5040
     ACTCCACAGC TCATCCAATG GCCAAGTTGA ACGGTTCCAC AGCACATTGG CAGAAATCGC      5100
     CAGGTGCCTG AAGTTGGACA AAAAAACGAA TGACACAGTA GAACTAATCT TGAGGGCGAC      5160
     GATAGAATAT AACAAAACCG TGCACTCAGT TACTCGTGAG AGACCAATTG AGGTGGTTCA      5220
     CCCAGGGGCC CACGAGCGCT GCCTAGAAAT CAAGGCAAGA TTAGTAAAGG CTCAGCAAGA      5280
     CAGCATCGGA AGAAACAACC CTTCCCGACA AAACCGCGTG TTTGAGGTGG GAGAACGCGT      5340
     GTTTGTAAAA AACAACAAGA GGTTAGGAAA TAAGCTAACT CCACTATGCA CCGAGCAAAA      5400
     AGTGCAGGCA GACTTGGGAA CGTCTGTTCT TATTAAGGGG AGGGTGGTCC ACAAGGACAA      5460
     CCTCAAGTAG ACATTCCCTC TACAGTTAGG TAGTAAGTTA TGTCAAGGAA AATCCGAGCA      5520
     CTGTAGTATC ACCTTGTCTT TAATTTCCAG GTTCACCCTC ATGATGTTCA TACCCTTGGT      5580
     AGTAGCGAAT GCTCGGATCA CCGACTTTTC GCATGCCAAC TACATTCCTG TGTTAGATGG      5640
     GGATGTGCTG GTGTTTGAAC AGCGTGACCT CTTGAAACAT TCGAGTAACC TTTCCGAGTA      5700
     CGCTAGTATG ATAGATGAAA CACAGAAACT GTCCGAGTCC TTTCCCCACT CACATATGCG      5760
     TAAGTTGCTA GAGGTCGATA CTGACCATCT TAGAACCTTG TTGTCCGTTC TCAAAGTCCA      5820
     CCATAGGATA GCTAGGAGTC TAGATTTCTT AGGTACAGCC TTAAAGGTTG TGGCGGGTAC      5880
     TCCCGATGCC ACGGACCTCT TTAAAATTAA GATCACAGAG GCCCAACTAG TAGAATCTAA      5940
     TTCCAGGCAG ATAGCTATAA ACTCCGAAAC CCAGAAACAG ATAAATAAGT TAACTGACAC      6000
     CATCAATAAG GTGATCAATG CCCGTAAAGG CGACTTGGTT GACACTCCAC ACTTATATGA      6060
     AGCACTACTA GCAAGAAATA GGATGCTGTC TACAGAAATT CAAAATTTAA TTCTCACTAT      6120
     TACTTTGGTC AAATCAAACA TTATAAATCC CACAATTCTT GATCATGCCG ACTTGAAGCC      6180
     TCTTGTAGAA CAGGATACCC CAATTGTCAG CTTAATAGAA GCATCTAAGA TCAGGGTCCT      6240
     CCAGTCCGAG AATAGCATTC ATATTTTAAT TGCCTATCCT AGAGTCAAGT TCAGTTGCAA      6300
     GAAAGTCGCC GTCTACCCTG TATCTCACCA ACACACCATC TTGCGCCTCG ACGAAGACAC      6360
     TTTGGCCGAA TGCGAACATG ACACCTTTGC GGTCACCGGA TGCACAGACA CCACACACTT      6420
     CACGTTCTGC GAGCGGTCTC GGCGCGAAAC TTGCGTGCGC TCACTCCATG CTGGAAACGC      6480
     TGCTCAATGC CACACTCAAC CCAGCCACTT GCGAGAAATA AACCCCGTAG ATGATGGCGT      6540
     TGTGATTATC AACGAAGCCG CAGCTCACGT TAGCACTGAT GGCAGCCCCG AAACACTGAT      6600
     AGAGGGAACC TACCTGGTAA CCTTCGAGCG AACGGCAACC ATCAACGGCT CTGAATTCGT      6660
     AAATCTAAGG AAAACACTAA GCAAGCAGCC AGGCATCGTG CGTTCACCAC TACTTAACAT      6720
     CGTCGGCCAC GACCCTGTGC TCAGTATACC TCTGCTACAC CGGATGAGTA ACGAAAACCT      6780
     ACATTCCATC CAAAACCTTA TGGATGACGT GGAATCTGAA GGCTCGCCCA GACTCTGGTT      6840
     CGTGGCTGGT GTGGTCCTAA ACTTCGGCTT GATTGGCTCT CTCGCCCTTT ATCTGGCATT      6900
     AAGGAGAAGA CGAGCCTCTA GGGAGATACA GCGCACCATC GATACTTTCA ACATGACCGA      6960
     GGACGGTCAT AAACTTGAGG GGGGAGTAGT TAACAACTAA CAATGTATTG CTTCGTAGCA      7020
     ACTAAGTAGC TTTGTATGAA CAATGCTGAC GCGCCAGAAT TGGGTTCAAC GCTCCACGCG      7080
     AAGAATGCCT GGCAGCGGAA AGCTGACACT TCCTACCGGG AGTGTTGCTT CACGCTGCAA      7140
     GAAATGCTGA GTCGGCTTGC CGACTTGTGG CGGCGCGATG CATTGCTCGA GGGTAAACTT      7200
     AGTTTTCAAT ATTGTCTTCT ACTCAGTTCA AATCTTGTGT CGAAATAAAC CACAGCTTGC      7260
     TCCGGCTCAT TGCCGTTAAA CATCATTGTT CTTATTTACA ATCAAATCGC TATCGCCACA      7320
     AGGCTAGTGA TAATAACTAA GGGGGCGAAG TCAAGCCCTC CAACCTAATC TCCATAAACA      7380
     GTGTCTAAGA CGAACCTCAG CGAAAGAAGG AAGATCTCTA GACCTACTGG AAATAACATA      7440
     ACTCTGGACC TATTGGAACT TATATAATT                                        7469
//
ID   DMHFL1     standard; DNA; INV; 2959 BP.
XX
AC   M69216;
XX
DR   FLYBASE; FBte0000154; Dmel\hobo.
XX
SY   synonym: H-element
XX
XX
FT   source          M69216:1..2959
FT   SO_feature      terminal_inverted_repeat ; SO:0000481:1..12
FT   SO_feature      terminal_inverted_repeat ; SO:0000481:2948..2959
FT   SO_feature      TATA_box ; SO:0000174:107..112
FT   SO_feature      polyA_signal_sequence ; SO:0000551:2382..2394
FT   SO_feature      CDS ; SO:0000316:316..2292
FT   SO_feature      start_codon ; SO:0000318:1..3
FT                   /name="Dmel\hobo\T"
FT                   /db_xref="FLYBASE:FBgn0014191"
FT                   /translation="
FT                   MAPYIMIVEFLCLWSSVSAVNCPFFVFYDAITSLLGFSIIWKPKEKVTIM
FT                   AEAADFVKNKINNGTYSVANKHKGKSVIWSILCDILKEDETVLDGWLFCR
FT                   QCQKVLKFLHKNTSNLSRHKCCLTLRRPTELKIVSENDKKVAIEKCTQWV
FT                   VQDCRPFSAVTGAGFKNLVKFFLQIGAIYGEQVDVDDLLPDPTTLSRKAK
FT                   SDAEEKRSLISSEIKKAVDSGRASATVDMWTDQYVQRNFLGITFHYEKEF
FT                   KLCDMILGLKSMNFQKSTAENILMKIKGLFSEFNVENIDNVKFVTDRGAN
FT                   IKKALEGNTRLNCSSHLLSNVLEKSFNEANELKKIVKSCKKIVKYCKKSN
FT                   LQHTLETTLKSACPTRWNSNYKMMKSILDNWRSVDKILGEADIHVDFNKS
FT                   SLKVVVDILGDFERIFKKLQTSSSPSICFVLPSISKILELCEPNILDLSA
FT                   AALLKERILENIRKIWMANLSIWHKAAFFLYPPAAHLQEEDILEIKVFCI
FT                   SQIQVPISYTLSLESTETPRTPETPETPESLESPNLFPKKNKTISSENEF
FT                   FFPKLVTESNSNFNESPLDEIERYIRQRVPLSQNFEVIEWWKNNANLYPQ
FT                   LSKLALKLLSIPASSAAAERVFSLAGNIITEKRNRLCPKSVDSLLFLHSY
FT                   YKNLNNSQ"
XX
CC   Derived from M69216 (g157606) (Rel. 41, Last updated, Version 3).
CC   Takis Benos and Michael Ashburner, 20-Aug-1997.
CC   Any changes to original sequence record are annotated in an FT line.
CC   CDS annotation from Lynn Crosby's annotation 'H-element.v004'.
XX
SQ   Sequence 2959 BP;  994 A; 541 C; 571 G; 853 T; 0 other;
     CAGAGAACTG CAAGGGTGGC ACTTTTTTAC CACTCGACTC ACACCCTACA ATTTTGTGTG        60
     CGGGTGCTAC TCGCCACGCA CATCGCGGGT ACTTACAAAC ACACAGTATA AATCTGAACA       120
     TGCAGACAAG ACACCCCGTT GTGTGCGCAC CCGAATCAAT ACGGTGTTTT GCGTCGCGGG       180
     TGCCGCTCAC ACAGTGCCTA AAAAGGGATG AGTGAGAAAA ACACTTGTGG GTATACCGTT       240
     AAACACATGG GTGTTTCCAA AAATACTCGG GTGTTTCCAA AAATACTCGA GTGGTCTCGT       300
     AGGTAGTCGA GTCAAATGGC GCCATACATA ATGATTGTTG AGTTCTTGTG TCTTTGGTCC       360
     AGTGTCTCGG CTGTTAATTG CCCCTTTTTT GTTTTTTACG ATGCAATTAC TAGCTTGTTA       420
     GGATTCAGTA TTATTTGGAA GCCAAAGGAA AAGGTCACAA TAATGGCAGA AGCGGCTGAT       480
     TTCGTTAAAA ATAAAATTAA CAATGGAACA TACTCAGTTG CCAATAAACA TAAAGGAAAA       540
     AGTGTTATTT GGAGCATTTT ATGTGACATT TTAAAGGAAG ATGAAACTGT TCTGGACGGA       600
     TGGCTGTTCT GCAGGCAATG CCAGAAAGTG CTCAAATTTT TACACAAAAA CACCTCCAAT       660
     TTATCCCGCC ATAAATGTTG TCTAACATTA AGACGACCAA CGGAATTAAA AATTGTTTCG       720
     GAAAACGACA AGAAAGTAGC TATTGAAAAA TGCACCCAAT GGGTTGTCCA AGATTGTCGG       780
     CCGTTTTCTG CAGTAACCGG AGCCGGATTT AAAAATTTGG TGAAGTTTTT CCTACAAATC       840
     GGCGCTATCT ATGGGGAACA GGTAGACGTC GATGACTTAC TACCTGATCC AACAACATTA       900
     AGTCGGAAGG CCAAATCGGA TGCAGAAGAG AAGAGGAGTC TAATCTCGTC CGAGATAAAA       960
     AAAGCTGTGG ATAGCGGAAG AGCAAGTGCG ACCGTCGACA TGTGGACTGA CCAGTATGTC      1020
     CAAAGAAACT TTTTGGGCAT CACTTTCCAT TACGAAAAAG AATTTAAACT TTGTGACATG      1080
     ATTTTGGGAC TAAAATCGAT GAATTTTCAA AAATCGACTG CCGAAAACAT TTTAATGAAA      1140
     ATTAAAGGTT TATTTTCGGA ATTCAATGTT GAGAACATTG ATAATGTTAA GTTTGTGACT      1200
     GACAGGGGAG CAAATATAAA AAAGGCTTTA GAGGGCAATA CCCGTTTAAA TTGTAGCAGT      1260
     CACCTGTTGT CAAATGTTTT AGAAAAATCG TTTAACGAGG CCAATGAACT CAAAAAAATT      1320
     GTGAAATCAT GCAAAAAAAT CGTGAAGTAC TGCAAAAAAT CAAATTTGCA GCATACTCTA      1380
     GAAACCACTT TGAAAAGCGC CTGTCCGACT AGATGGAACT CCAACTACAA AATGATGAAG      1440
     TCCATTCTGG ATAACTGGCG TAGTGTGGAT AAAATATTAG GTGAAGCTGA TATCCATGTA      1500
     GATTTTAATA AATCATCTTT AAAAGTTGTG GTAGATATTC TAGGAGACTT TGAACGAATA      1560
     TTTAAGAAGT TGCAAACATC TAGCTCACCA TCTATATGCT TCGTATTGCC ATCCATCTCT      1620
     AAAATTTTAG AATTATGCGA GCCGAATATT TTAGACCTTT CTGCAGCAGC ATTGCTTAAG      1680
     GAAAGAATTT TGGAAAATAT TCGTAAGATT TGGATGGCAA ATCTAAGCAT ATGGCATAAG      1740
     GCGGCATTTT TTTTATATCC ACCCGCAGCA CATCTTCAGG AAGAAGATAT TCTTGAAATA      1800
     AAGGTGTTTT GCATTTCACA AATTCAAGTC CCAATTTCAT ACACATTAAG CTTAGAATCT      1860
     ACAGAAACTC CAAGAACTCC AGAAACTCCA GAAACTCCAG AAAGTCTAGA AAGTCCAAAC      1920
     TTATTTCCAA AAAAAAACAA AACAATATCT TCTGAAAACG AATTCTTCTT CCCAAAGTTA      1980
     GTAACTGAGT CTAATTCCAA CTTCAATGAA TCTCCATTAG ATGAAATTGA ACGATATATT      2040
     AGACAAAGAG TTCCATTGTC TCAAAATTTT GAAGTAATTG AGTGGTGGAA AAATAACGCA      2100
     AACTTATACC CTCAGTTGTC AAAGTTAGCA TTAAAACTTT TATCAATACC AGCCAGTAGC      2160
     GCAGCAGCTG AAAGAGTGTT TTCCCTAGCA GGTAATATAA TAACAGAAAA GCGAAATAGA      2220
     TTATGCCCAA AATCTGTAGA TAGCCTCCTT TTTTTGCATT CCTATTACAA AAACCTAAAC      2280
     AACTCGCAAT AGATATTCCT TCTTATAAGT ATATTTTATA TTATTAATTC TTATTATTTG      2340
     CTTAATTTTT GTATAAGTGT TAAGTATTAA GTATAAGTAT TAATTAATAA TATATAAGAT      2400
     TGTTATTTGT TAAGACATTA GATGCAAAAT CCTAAAAATG TGAAAGTAAT GAAGTTCCTT      2460
     ATATTTAATA GATACTTTTT AAGCCCACTA TGTTTTTATT ATTTAGATTG AGACATTAAA      2520
     AAACGTAAAA ATCAACAAAT GCCGTCTTTA ATTGCAATTA CTTTATGTGT TTGAAATGGG      2580
     AGGCACCCAT TGAGTCCATC AAAGAGCAAA GACATGAGCA CAAAAATTTT CTTGGGTATT      2640
     CCCTTTTACC CTTCATTTCT TATACCCGTC ACGCTTCCAC CCATACAAAT TTTAGGCGTA      2700
     CAAAAAATGA CCAGAGAACT GCAGCCCGCA TACAAAAAAT GACCTGCGGC CGATCGTTGA      2760
     CTGTGCGTCC ACTCACCCAT ACGGCTCTTG CGCAGCAGGC CTCGGGTGGT TTTTTTACTC      2820
     GTAACAAAAA CACAACGTCG GTAAAACACT CGAGTATTTT GTGTTGCCGC AAGTAGGGTG      2880
     TCAAAAAAAA CGGGGTGCCT AGAGTACCGA GTGTTTATCG GGTGGACGTA GAGTGCGAGT      2940
     GGCGGGCTGC AGTTCTCTG                                                   2959
//
ID   DMTHB1     standard; DNA; INV; 1653 BP.
XX
AC   X01748;
XX
DR   FLYBASE; FBte0000414; Dmel\HB.
XX
FT   source          X01748:189..1841
FT   SO_feature      terminal_inverted_repeat ; SO:0000481:1..31
FT   SO_feature      terminal_inverted_repeat ; SO:0000481:1622..1653
FT   SO_feature      CDS ; SO:0000316:387..534
FT                   /name="Dmel\HB\T"
FT                   /db_xref="FLYBASE:FBgn0044055"
FT                   /db_xref="SPTREMBL:Q27293"
FT                   /db_xref="NCBI_PROTEIN:CAA25884.1"
FT                   /translation="MLILKLRKEGKTYKDIQKTLKCSAKMVSNAIKYKWKPENRGTKHK
FT                   TTDIEDRRIVSYSKVYRFASFRDIKSELNLGISDVTIRRRLLNQNFSARSPRKVPLPSP
FT                   RHIKARLSLAKTYLNWPVSKWRNILWTDGSKIMLFGGTGSLQYI"
XX
CC   Derived from X01748 (g8693) (Rel. 49, Last updated, Version 3).
CC   Takis Benos and Michael Ashburner, 20-Aug-1997.
CC   Any changes to original sequence record are annotated in an FT line.
XX
SQ   Sequence 1653 BP;  568 A; 288 C; 302 G; 495 T; 0 other;
     ATGTACAGCT GTGTTCAGAA AAATAGCAGT GCGAAGGAAA CTAAGTAATA CAAAGGTATT        60
     TTTCCATGTC CCTTTTCGGA ATCGACTTTT TATTCCTCTT ATTTTTGTTA AATGGAATGT       120
     GTAGATAGGG AAAAAAAGAA AATCCGGTCA GTTTTTCTTG TTATCCTTTT TTTATTTACA       180
     TTCTTGAGCA AAATCACAAT TTTTAGGCTG TTCATAAGAA TAGCAGTGTC TGGTTCTGAC       240
     CAACGTAAAG TCCCGAAATG ATCAATATTT TCTAAAAAGT GAGTTTGGTT AAGTTAATTC       300
     GTATATTTAA AAGGACAATA AATTAAAAAA ATTAAAAAAA TTTTATTTTA GTGGGTAGAG       360
     GACAGCACTA CTCCCAGGGG AAAAGAATGT TAATTCTTAA GCTTAGAAAG GAAGGAAAAA       420
     CATATAAGGA CATTCAAAAA ACCCTTAAAT GTTCTGCCAA AATGGTATCC AATGCCATTA       480
     AATATAAATG GAAGCCCGAA AACCGTGGTA CCAAACATAA AACCACAGAT ATAGAGGATC       540
     GACGCATTGT TTCTTACAGC AAAGTCTATC GTTTTGCATC CTTTAGGGAC ATAAAGTCTG       600
     AGCTGAACTT GGGAATCAGC GACGTTACTA TTCGTAGACG ACTACTGAAT CAAAATTTCA       660
     GTGCGAGGAG TCCACGAAAG GTTCCCCTAC CTAGCCCAAG GCATATTAAG GCAAGGTTAA       720
     GCTTAGCTAA AACCTACCTA AACTGGCCAG TCTCCAAATG GCGTAATATC CTTTGGACTG       780
     ATGGGTCAAA AATCATGCTA TTTGGTGGAA CTGGTTCACT ACAGTATATC TGACGACCTC       840
     CAAACACGGA GTATCACCCA AAACACCCAG TGAAGACTTT CAATCACGGT GGACCTAAAA       900
     TCATGGTATG GGCTTGTTTT TTTTATAATG GTATGAGTCA TGCTATGGAT TATGATTTAT       960
     GGTATTATAG ACCAAAACGC ATATGTAAAT ATACTTAGTG ATGTCTTATT GTCATATTCT      1020
     GAATAAAATA TACCCTTAAA ATGGACATTC CAACAGGATA ATGATCAGAA ACGCAGATGT      1080
     AAATCGGCTA AGAATAGGTT CACCCAAAAT AGAATAGATG CAATGCCGTG GCAAGCACCA      1140
     CCTTCCCATT TAAACCCGAT TGAAAACCTG TATGGGGACA TTAAACAGTT TGTGTCGAAG      1200
     AAGTCCCCGA CGTCTAAGAC TCAGATTTGG CAAGTTGTGC AGGATACATG GGCAAAAATT      1260
     CCTCCCAAAC CTTGCTAGGA CTTGGTGGAC TTCATGCCGC GTGGGTGTAA GGCTGTGCTG      1320
     GCTAACAAAG GCTATCCAGC CAAGTATTAG GCCCGAATTA ACATATTAAA AAGAAAAACT      1380
     AAGTTCGTTC TAGGTCAAGT TAAATTTTGT TACTATTTTT TCATAGCACT GCTATTTTAT      1440
     TGAACACCAG AATTTCTGCC TATTTATTGT TTTAATCTAT ATTTTCGAAA CTATTGAAGA      1500
     AATAAAAGTG AAACATTTGT TAAATTGTTT GAAATGAAAT ACCTAATGAT ATTATTAAAA      1560
     AAAAATTCCC ATTAAAACTG TAAATCATAG GAATTTTTTA TCTTAAACTC TGAAGTCCAA      1620
     AGCACTGCTA TTATTCTGAA CACAGCTGTA CAT                                   1653
//
ID   DM06920    standard; DNA; INV; 6083 BP.
XX
AC   U06920;
XX
DR   FLYBASE; FBte0000143; Dmel\HeT-A.
XX
FT   source          U06920:1015..7097
FT   SO_feature      five_prime_UTR ; SO:0000204:1..731
FT   SO_feature      three_prime_UTR ; SO:0000205:3497..6083
FT   SO_feature      polyA_sequence ; SO:0000610:6077..6083
FT   SO_feature      CDS ; SO:0000316:732..3497
FT   SO_feature      start_codon ; SO:0000318:1..3
FT                   /name="Dmel\HeT-A\gag"
FT                   /db_xref="FLYBASE:FBgn0016662"
FT                   /db_xref="REMTREMBL:AAC17188"
FT                   /db_xref="NCBI_PROTEIN:AAC17188.3"
FT                   /translation="MSMSDNLFSDDEVLSISSSPEQRSSPFYLNISPMSHGSDNSQINT
FT                   VIINSKKLPSNQADISLKNSSGAAIKIVNSLSHKKKENTNVNNAQKDPLSLTNTTASTC
FT                   GAKSSISEGKLSSPPSTSHTYEGKLLTKLTHTHTDFRGAKTSDAMGSFPSLSHSDNSIE
FT                   KNLSSSTKIGPNASSPPSHAHTHTSKSTDISLESRSKHPALANTDARSIKANANDNGEI
FT                   FSSLIQIDERKQEERPCTTINAFWSIFKPKPDVTKLSLKRKPTNPTKNTGKKCISPHKK
FT                   SAYLCPSAQDDLNLNLNPKSSAKPTVVNLPAARILSRPAAKRDLFKSSSSRSPDEQPMS
FT                   FSEVVAGTGSIFAAPCVPAPLTKTPGKRTNDDLDCSNFKTPNKKLCATSNFVTPSIFPP
FT                   LITPVFKSKAAQSVYEESKARNGPPPPALACSINASARSAAAPPGIAPLPPHNTDAELP
FT                   PWKIVPQSRRAPPILVNDVKEIVPLLEKLNYTAGVSSYTTRAIEGNGVRIQAKDMTAYN
FT                   KIKEVLVANGLPLFTNQPKSERGFRVIIRHLHHSTPCSWIVEELLKLGFQARFVRNMTN
FT                   PATGGPMRMFEVEIVMAKDGSHDKILSLKQIGGQRVDIERKNRTREPVQCYRCQGFRHA
FT                   KNSCMRPPRCMKCAGEHLSSCCTKPRTTPATCVNCSGQHISAYKGCPAYKAEKQKLAAN
FT                   NVDINKIRTIKDATNNFYKRQGPPLRNNTPRLPHSSAILSKSIAEARQEAARKSMLNPF
FT                   RQNINDRRPRFSSHDTAIQKRLNKWRRNTNKIPKKGRIALKDNAKPRPAHRTSNPAQRH
FT                   LEDYQDMLRRERSEENDQESEKGTPNTKQVGNDSPPTTSRAARASFKPRIIDDTTPSPK
FT                   ICNPNSQKGLLDDPTTSLANRVDNLEKKIDILMALIIQGRNNNLDMDTSN"
XX
CC   Derived from U06920.2 (Rel. 67, Last updated, Version 14).
CC   Michael Ashburner, 26-Jan-2002.
CC   Any changes to original sequence record are annotated in an FT line.
XX
SQ   Sequence 6083 BP; 2199 A; 1545 C; 1033 G; 1306 T; 0 other;
     TAAATAAATA AAATAAATTA AACAATTAAC TAAATAATTA AATAACTAAA ATTAATAATA        60
     TAATCCGTTC GCTTGCCAAA GACTCTCACG CGCATAACTA ATTAAAATCG ATTTTCAAGT       120
     TGACAAATAA ATGGTTTAAA ATTGTCCTCA GGCTGCAAAG AAAAGCCGCG GCAACAATAA       180
     ACATTTAGTG ACACGCGAAA AGCGAACATT TGATTAGTGT AATACTTGTG CAAACCGACA       240
     AGCTGCCGCC ATAACAAAAC GGAGACGAAG AATCATAAAG AACAAAAGCT AAATCCACCA       300
     GCATAGCAAA AATAAATTAA CAAATAAAAT AAAAGCAAAT TTAAATAACA TAATAAATTA       360
     AACTTATTTA ATAAACCAAT TAATTTTAAT TAATTCAATT AAACGCTAAA TCTACATAAT       420
     ACTCCACGCG CAAATTAATT GAAATCGTCT TTCTAGTTAA TAAATTAAAA GTTTAAAAAT       480
     TGTCTCCGGC CGCAAAATTT GAACCGCGAC GATAAAAACA TTTAATTGAC AAACAAAAAG       540
     CGAACAATTA TTCAGTGAAC TATTTGTGCA AAATTGACAA GCAGACGCCA TAATTAAAAG       600
     GAGAAGAAGC CAAAAGACGA AGAGAAGAAA GCAACCAGAA GAACTCAAAG AAGAAAAGGA       660
     GGAAAGCCCA ATTAAAGAAA GCCAGGGTAT TTATACCTTA CACTTATCGT TTAATATAAC       720
     AAAAACCCAA CATGTCCATG TCCGACAACC TTTTTTCTGA CGATGAGGTA CTTTCAATTT       780
     CCTCAAGCCC AGAACAGCGA TCTTCTCCGT TCTACCTCAA TATATCGCCC ATGTCCCACG       840
     GATCAGACAA TTCTCAGATT AATACAGTCA TCATTAATTC GAAGAAATTG CCCTCAAATC       900
     AAGCAGACAT AAGTTTAAAA AACTCTTCTG GGGCTGCTAT AAAAATTGTT AATTCCCTTT       960
     CACACAAGAA GAAAGAGAAC ACAAACGTTA ATAATGCCCA AAAAGACCCC CTCTCACTCA      1020
     CCAATACTAC TGCAAGCACT TGTGGCGCCA AAAGCAGCAT CTCAGAGGGG AAATTGTCTT      1080
     CTCCTCCGTC CACCTCACAC ACATATGAGG GGAAATTACT CACAAAACTT ACTCACACAC      1140
     ACACAGACTT TAGAGGCGCC AAAACGAGCG ATGCAATGGG AAGTTTCCCC TCTCTCTCGC      1200
     ACAGCGACAA TAGCATAGAG AAAAATCTGA GTTCTTCCAC CAAAATTGGA CCAAACGCTT      1260
     CTTCCCCTCC TTCTCATGCA CACACTCACA CTAGCAAATC CACTGATATA AGCTTAGAAA      1320
     GCCGCTCAAA ACATCCCGCG CTTGCCAATA CGGACGCACG CTCTATAAAA GCCAATGCTA      1380
     ATGACAATGG GGAAATTTTC TCCTCACTTA TACAAATTGA CGAACGCAAG CAAGAGGAAA      1440
     GGCCTTGCAC AACTATCAAC GCTTTTTGGT CTATTTTTAA ACCCAAGCCG GACGTTACTA      1500
     AACTAAGTCT AAAGAGGAAA CCCACCAATC CCACTAAAAA CACTGGGAAA AAATGCATCT      1560
     CCCCTCATAA AAAGAGCGCT TATTTATGCC CTTCCGCTCA GGATGATTTA AATTTAAATT      1620
     TAAACCCCAA ATCTAGCGCC AAGCCCACTG TGGTGAATTT ACCAGCTGCC CGCATCCTAA      1680
     GCCGGCCTGC AGCCAAGCGG GATTTATTTA AATCATCATC CTCCCGAAGC CCAGACGAGC      1740
     AGCCTATGAG TTTTTCGGAA GTGGTCGCTG GCACGGGTTC AATTTTTGCG GCACCCTGTG      1800
     TCCCGGCACC TTTAACGAAA ACTCCAGGCA AGCGGACAAA CGACGATCTG GACTGCTCCA      1860
     ACTTTAAGAC GCCCAATAAA AAATTATGCG CGACTTCCAA CTTTGTAACT CCCAGCATTT      1920
     TTCCGCCGCT CATCACTCCC GTTTTCAAGA GCAAGGCAGC TCAATCTGTT TACGAGGAAT      1980
     CCAAAGCCAG AAATGGACCC CCCCCGCCGG CCCTCGCCTG CAGCATCAAT GCCTCTGCTC      2040
     GCAGCGCAGC GGCGCCACCC GGGATCGCCC CCCTACCCCC TCATAATACA GATGCAGAGC      2100
     TGCCTCCATG GAAAATCGTG CCCCAGAGCC GTAGAGCACC TCCTATACTC GTCAATGATG      2160
     TAAAGGAAAT TGTACCTCTA CTGGAAAAGC TGAACTACAC AGCAGGAGTC TCCAGCTATA      2220
     CTACTAGGGC TATAGAAGGA AACGGGGTCA GGATACAGGC AAAGGACATG ACCGCCTATA      2280
     ACAAAATTAA AGAAGTCCTG GTGGCCAACG GACTTCCTTT ATTCACCAAC CAGCCCAAGT      2340
     CCGAGAGAGG CTTCCGAGTC ATCATCAGAC ATCTCCACCA CTCCACACCA TGCTCGTGGA      2400
     TAGTCGAGGA ACTGCTGAAG CTCGGATTCC AAGCGCGATT CGTCAGAAAT ATGACGAATC      2460
     CGGCTACAGG TGGCCCCATG CGAATGTTTG AAGTGGAGAT CGTCATGGCC AAAGACGGCA      2520
     GTCATGACAA AATACTCTCA CTCAAACAAA TCGGTGGGCA AAGGGTGGAC ATTGAAAGGA      2580
     AAAACAGGAC ACGGGAGCCA GTCCAGTGCT ACAGATGCCA AGGCTTCAGG CATGCCAAAA      2640
     ACTCTTGCAT GAGGCCGCCA AGATGCATGA AATGCGCTGG CGAACACCTG TCTTCCTGTT      2700
     GCACCAAACC AAGAACCACC CCCGCCACCT GCGTAAATTG CTCTGGGCAG CATATTAGCG      2760
     CGTACAAAGG ATGCCCTGCA TATAAGGCGG AAAAACAAAA GCTGGCGGCA AACAACGTTG      2820
     ACATAAACAA AATAAGAACA ATCAAAGACG CAACAAATAA CTTTTATAAA CGTCAAGGCC      2880
     CCCCTCTACG CAACAACACC CCTCGGCTAC CGCACAGCTC AGCAATCCTG AGCAAATCAA      2940
     TTGCCGAAGC TCGCCAGGAG GCAGCCAGAA AGTCGATGTT AAATCCATTC CGACAAAATA      3000
     TAAACGACAG AAGACCACGA TTCTCCTCCC ACGACACGGC CATTCAGAAG CGTCTGAATA      3060
     AATGGCGCCG AAACACCAAC AAAATACCCA AAAAGGGTAG GATAGCCTTA AAGGATAATG      3120
     CAAAGCCACG ACCGGCACAT AGGACAAGTA ACCCAGCGCA AAGACATCTG GAGGACTACC      3180
     AGGACATGCT CCGAAGGGAA AGGAGTGAAG AAAACGACCA GGAATCTGAG AAGGGCACCC      3240
     CCAATACCAA GCAGGTCGGC AATGACAGCC CTCCGACCAC GAGCAGAGCA GCCAGAGCCA      3300
     GCTTTAAGCC AAGAATCATT GACGATACCA CGCCATCGCC AAAAATCTGC AATCCCAACT      3360
     CACAAAAAGG CCTCTTGGAC GACCCCACAA CAAGCTTAGC TAATAGAGTC GACAATTTAG      3420
     AAAAGAAAAT TGACATTTTA ATGGCCTTAA TCATACAAGG AAGAAATAAC AATCTTGACA      3480
     TGGATACATC CAATTAATCT TACAACTACT TATATATTCT TTAATAAATA TATCCAATAG      3540
     AAAAGCGCAC GTCGGTCTGC TTTTAAAATC CTTCACCGTC ATCACCTTCC TCGACGGAGC      3600
     CTAATTTATT GGAAAAATAA ATCAATTATA TGTTGGCACA AAAATGTAAA CACACACTCA      3660
     CCTAAACGCA CCCGGACGAA CAAGCCTATG ACAACGCACT CCAGCTGATC TGTAAGAAAC      3720
     AAAAAATATG AATAGATAGA TCGATATGAA AAGGATATGT GCGGCAGAAA CATGATGAGC      3780
     AAAAGGCGAC TCGCTGCAGC AACTTATGCA CAACGTCACT TACCTGAAAT TTCTTGCCGT      3840
     ACGATCTCCT GTAGTATCCC TTATCACAGC TGCAATCTAC TTGCAATGCT GCACTGCAAT      3900
     AAACGTACTA CAAAAGCTGC ATACGTTTTG ATCAGGACAC CTCGTGCGGA CGTGCTAAAA      3960
     AAAATTTCCT TTCTGCTGCT CTTATTGACG CTAAAACCTT AAAACCTACA AACAAAACAA      4020
     TTAAATAATA ACAAATCAAA TAAGACAACC AAATAATACA CTTACCTCAT TGACTGCAGC      4080
     TAAATCGCTG ACCCACATTC AGTGCAGCCG ACAGCAGGAG ACGGGCCCGC AAAAGCAAAA      4140
     CAAAATCGCC AATTTTGCGA TTATAAACAC GAAAAATTGA CAATTTTGCG ATGCCGTCTC      4200
     CGCCTCCTGA TGCCACTGCA TTGACAAGCA TCACTAGCGA GGAGCTGACA CCACACCAAA      4260
     AAGCTGTAAA ATCCGTCCAC AAATTGTATA TTTTGCCTCA GTGTCGTATC TGCAATGTTT      4320
     TTCCGATAAC CTGTAAGGAA AGAAAAATTA ATAAGAAAAT TATACAAAAT TAATTAAGGA      4380
     CGACAGAAAA TAGCAAACCA GACAGGCAAA TTAACAGATA CAAATATGAG ACTCCATCCT      4440
     GCTGCCGACA CACAAGTAAA TCCTTCAACT CGACAACAGG AGACGGGCCT TGCAAAAGCA      4500
     AAACAAAATC GCCAACTTTT GCGATTATAA ATACAAAAAA TTGACAATTT TGCAACGCCG      4560
     TCTCCACCTC CTGTTGCCAC TGCATTAATA AGGATCACCA GCGCGGCGTG ACGCCACACT      4620
     AAAAGGCTGC AAAATCCGTC CACAAAATGT ATACTTTTCC TCAGTACAAT ACTTTCTAAT      4680
     GAACTTCCGC CAACCTGCAA TGAAAAGAAA AGAAATAGGT ATATAAAACA AAACAAACAA      4740
     AAGGACAACC TAAAATTAGC AAACCAGACA GGCATACTAG TAGATGCTAA TATGCAGCTC      4800
     CATCCTACTG ACGACAACCA CGCAACTCCT TTCTCCAAGA CCGCAAATAC TGAAACAAGG      4860
     AAGCACAAGC TAATACTGGG AATTATTTAT TTAAACAAAA ATACTTATCT AATTGCCAAT      4920
     TCGACGACTC CAAATCCGCG GCTAACCGGC GGCGATGGCC CATAAATAAA GGGCCTCCTA      4980
     ATTAATTACA AAATGTACCT GAAAAACATA AAATTAACGC AACTATAATT AACGCAATTA      5040
     ATAAATCAAA TAAATACAAG TATAATACTT ACCTCCAAGC AAACGTACCT GAAAAACAAA      5100
     ACCAAAAAAA AAATTAATGC AATAAATAAA TCAAATAAAT ACAAACATAA TACTTACCTC      5160
     CAATTTACCT CCCAGCCAAT CTACCTGAAA AACATAATCT AATACAATCT CAAAAACAAA      5220
     TAACAAATGT AATACTTACC AAATTTTAAT TTTGTATTCA TTTCCATGAC CCCAACGCTG      5280
     CAACTGTCCT CGGCAACAAT TCCTGTTCCG GCGGCTCCAT GCTGCCAATC CTGACGCACT      5340
     GGCCACAAGA CGCGGCGCTG CTGGCAATCT CTCGATGAAC AACCGATCTA CAATTTCCAT      5400
     GACGACTCCT CTGTCACGAT GAGACAGAAG ACACCACCAA CGCCAGCAGC TCCAAAACAA      5460
     TACAACAACG GCCGCGCGGA ACCCATCTTC AGAATTCCCT CTTCCTGACG ACCGGCGAAC      5520
     GAGTTCTGGA ATAAACAATG TATTAATTGC AAACATCTAC CGATGAGGGT AGAAGAGATA      5580
     CTCACCAAAC GACTGCGGCG CGGGAACAAA CTAACTGCAA CGCCGGCCGG ACCTATTTGT      5640
     TGCAAGTGGC GCGCATCCAG CGCCTGCAAC ATGCCCCAGC CCAAGTACAC AACTACTTAC      5700
     CTGCAACGTC GCCAGAGGCT CCCAGCGAAT CGGTGCTTCC GTCCTTCTGG CGGGGGTACC      5760
     TGAAAAGAAA CAAATTAAAC AATATTAATC CTAAATTTCA ATGTTTTTTG TAAAATAATT      5820
     TAAATTGTTA AATGTAAACA AGCCTTGCAA TATGTTAATG TTACCAGTCC ATGCTACTGT      5880
     CTAAAAGCCA AGAATACAAA AAATACTAAT TATAAACTAA CTCACCACGC CCAACCCCCA      5940
     AACTCACCCC ATGCAATGTT AAACCTATAA ATTCAAATAA TTGTACCTAT ATATTGCACA      6000
     TACTGTAATC AAAGGCAAAA TAAATCGTGG ATGCGGAACA GAATTTACTC TGTCTCCGTA      6060
     CCTCCACCAG CAAAGTTAAA AAA                                              6083
//
ID   DMIFACA    standard; DNA; INV; 5371 BP.
XX
AC   M14954;
XX
DR   FLYBASE; FBte0000133; Dmel\I-element.
XX
FT   source          M14954:100..5470
FT   SO_feature      CDS ; SO:0000316:187..1467
FT   SO_feature      start_codon ; SO:0000318:1..3
FT                   /name="Dmel\I-element\gag"
FT                   /db_xref="FLYBASE:FBgn0020417"
FT                   /db_xref="SPTREMBL:Q24362"
FT                   /db_xref="NCBI_PROTEIN:AAA70221.1"
FT                   /translation="MTDPPNIYKITSKTYQSQLGEPKFIIIKRNDNNSFERTSPFIIKK
FT                   SVDFACGGEVEGCKRTRDGNLLIKTKNELQARKLLKLTKIADEDVTASEHKTLNFSKGV
FT                   IYCNDLRHIDEDTILQELKPQKVSEVKKIMKRQNPNSNSDTNNITLVETGLIIITFESH
FT                   KLPEIVRIGYETVRVRDYIPLPLRCKKCLRFGHPTPICKSVETCINCSETKHTNDGEKC
FT                   TNEKNCLNCRNNPELDHQHSPIDRKCPTFIKNQELTAIKTTQKVDHKTAQHIYFERHGF
FT                   QTKNTYAKTLTNGTTQRTTNTPSPNIHTNTTQSQQQNPHHTPKSAAQNTSAKTPTTEPA
FT                   KTTLLSNQPHQHHHHHSYDKLEDMDTDYTPTRKPSTTYSSQLTEDLKIKIFPKDKSNNL
FT                   SINLKASKLKAKAHKNKHTNNSDSESI"
FT   SO_feature      CDS ; SO:0000316:1938..5195
FT   SO_feature      start_codon ; SO:0000318:1..3
FT                   /name="Dmel\I-element\RTase"
FT                   /db_xref="FLYBASE:FBgn0020418"
FT                   /db_xref="SPTREMBL:Q24363"
FT                   /db_xref="NCBI_PROTEIN:AAA70222.1"
FT                   /translation="MAPSWGSPTTNKRGKITHRFIDNMHLILLNDKSPTHFSTHNTYTH
FT                   IDLTLCSPILAPHAKWKILNDLHGSDHFPIITTLFPTTNPQKFYRPFFKLKEANWEQFN
FT                   ALTHQTNKKYPTSHNVNKEAALINRIILYSANLSIPQTSPNTHPYRVPWWNKHLDQLRK
FT                   EKQLAWKKLNRTITVDNILDYRRKNAIFRYELKKRKKEASSSFTSTIHPTTPSSKIWAN
FT                   IRRFCGLNPAKQIHAITNPVNNETTLASNEIANIFAQHFSDLSGDWNFSEEFRNNKYRN
FT                   NIHLYTPSPIAQTIEENITYLELSSALQTLKGCAPGLNRISYQMIKNSSHTTKNRITKL
FT                   FNEIFNSHIPQAYKTSLIIPILKPNTDKTKTSSYRPISLNCCIAKILDKIIAKRLWWLV
FT                   TYNNLINDKQFGFKKGKSTSDCLLYVDYLITKSKMHTSLVTLDFSRAFDRVGVHSIIQQ
FT                   LQEWKTGPKIIKYIKNFMSNRKITVRVGPHTSSPLPLFNGIPQGSPISVILFLIAFNKL
FT                   SNIISLHKEIKFNAYADDFFLIINFNKNTNTNFNLDNLFDDIENWCSYSGASLSLSKCQ
FT                   HLHICRKRHCTCKISCNNFQIPSVTSLKILGITLNNKYKWNTHINLLLPKLHNKLNIIK
FT                   CLSSLKFNCNTHTLLNVAKATIIAKLEYGLFLYGHAPKSILNKIKTPFNSAIRLALGAY
FT                   RSTPINNLLYESNTPPLEMKRDLQIAKLSQNLILSKNTPIHKFLKPKKANKKKTSTIDR
FT                   TIKLSLELNLPYKPIKLHKNKPPWTLPNLIDTSLRIHKKEQTSPDQYRKLYEHTKNNLK
FT                   THNFIFTDGSKINYTISFAITTETDVLKYGILPPYSSVLTSETIAILEAIELTKNRRGK
FT                   FIICSDSLSAVDSIQNTNNNSFYPSRIRSLITQHAPKIKIMWIPGHSGIKGNELADQAA
FT                   KSASSMPLILTPNINTTDIKKHLKADLATKQKEHIINCSPWYQSINTNTSHPCDYLKQS
FT                   HPNWTRLDQIKIIRLRLGHTNITHQHYLNPNSIPTCPFCQGDISLNHIFNSCPSLLQTK
FT                   QDIFNNTNPLDLLSKPNPDNIQKLILFLKKTKLYHKI"
XX
CC   Derived from M14954 (g157749) (Rel. 44, Last updated, Version 2).
CC   Takis Benos and Michael Ashburner, 20-Aug-1997.
CC   Any changes to original sequence record are annotated in an FT line.
XX
SQ   Sequence 5371 BP;  2176 A; 1446 C; 606 G; 1143 T; 0 other;
     CATTACCACT TCAACCTCCG AAGAGATAAG TCGTGCCTCT CAGTCTAAAG CCTCGCTTCG        60
     CGTAAGCCCA AAACTCTTAT CAGCAAAATC TTGATAAACA AATATCAACC ACAAAGAGAA       120
     AATAAAAAAC TTAACAACAA AAACAACAAT ACCGCTAATC CGGGCTCAAG CCCTTAACCA       180
     ACAATCATGA CAGACCCACC AAACATTTAC AAAATCACTT CAAAAACATA CCAATCCCAA       240
     TTAGGCGAAC CTAAATTTAT AATTATTAAA AGAAATGACA ACAACTCTTT CGAAAGAACT       300
     TCACCATTCA TCATAAAAAA ATCGGTGGAC TTTGCCTGTG GAGGAGAAGT TGAGGGATGC       360
     AAACGTACAA GAGACGGCAA CCTGCTAATA AAAACCAAAA ATGAATTACA AGCCAGAAAA       420
     CTCCTAAAAC TAACAAAAAT TGCAGATGAG GATGTAACAG CAAGTGAACA TAAAACATTA       480
     AACTTCTCTA AGGGAGTTAT TTACTGTAAC GACCTTAGAC ACATCGACGA AGACACAATT       540
     CTACAAGAAC TAAAACCACA AAAAGTATCT GAAGTTAAAA AAATAATGAA ACGGCAAAAC       600
     CCCAACTCTA ACTCCGACAC CAACAACATC ACATTAGTTG AAACTGGACT CATAATTATA       660
     ACCTTTGAAT CGCATAAGCT CCCCGAGATA GTACGAATCG GGTACGAAAC AGTCCGAGTA       720
     CGAGACTATA TCCCACTCCC ACTTCGATGC AAAAAATGCC TCCGCTTCGG TCATCCAACA       780
     CCCATATGCA AAAGTGTAGA AACTTGCATC AATTGCTCTG AAACAAAACA CACAAACGAC       840
     GGAGAAAAAT GCACAAACGA AAAAAACTGC TTAAATTGCC GAAATAACCC AGAACTTGAC       900
     CATCAACACA GCCCAATTGA CCGCAAATGC CCTACGTTCA TAAAAAACCA GGAATTAACA       960
     GCAATTAAAA CCACACAAAA AGTTGACCAT AAAACGGCCC AACACATATA TTTCGAACGT      1020
     CACGGCTTCC AAACGAAAAA CACCTACGCC AAAACACTTA CAAACGGCAC AACCCAGAGG      1080
     ACAACAAACA CTCCATCACC TAATATTCAC ACAAACACAA CCCAATCACA ACAACAAAAT      1140
     CCGCACCACA CACCCAAATC AGCAGCACAA AACACTTCAG CTAAGACACC AACAACTGAA      1200
     CCAGCCAAAA CAACCTTACT ATCCAACCAA CCACACCAAC ACCACCACCA CCACAGCTAC      1260
     GACAAACTAG AAGACATGGA TACCGACTAC ACACCTACCA GAAAACCATC TACGACATAC      1320
     TCATCACAAC TCACAGAAGA CCTAAAAATA AAAATCTTCC CTAAAGATAA GTCCAATAAC      1380
     CTATCCATAA ACCTTAAAGC ATCAAAACTA AAGGCCAAAG CCCACAAAAA CAAGCACACT      1440
     AACAACAGCG ACAGCGAATC CATATAGAAC TCTACACAAA ACCCTAACCG TTAACACTAC      1500
     CTTTAAGTAA GTTATAAGCT TTAATTTTCT CACAAATGTC CCTAACTATA ATCCAATGGA      1560
     ATCTAAAAGG ATATCTAAAC AACTACAGCC ATCTCCTTAT TCTAATCAAA AAATACTCCC      1620
     CCCACATAAT TTCCCTCCAA GAAACCCATA TACAATACAC TAATAACATT CCAACCCCAA      1680
     TAAACTACAA ACTATTAACA AATATTGCCA CCAACAGATT TGGGGGGCGT ACGACTACTA      1740
     GTGCATAAGT CAATACAACA CACTGTCCTC AACATAACAA TCGATATAGA AGCAATAGCC      1800
     ATAAATATAG AATCTAAACT TAAATTAAAC ATATTTTCCA CATACATTTC TCCGACCAAA      1860
     AACATAACTA ACCAGACACT CCATAACACA TTTAACATAC AACAAACACC CTCTCTAATT      1920
     ACGGGAGATT TTAATGGATG GCACCATCCT GGGGCTCCCC AACAACAAAT AAACGAGGAA      1980
     AAATAACTCA TAGATTCATT GACAACATGC ACCTTATCCT GTTAAACGAC AAATCTCCCA      2040
     CACACTTTTC AACACACAAT ACATACACAC ACATAGACCT CACACTCTGC TCTCCAATCC      2100
     TAGCCCCCCA CGCCAAGTGG AAAATACTAA ACGATCTTCA CGGTAGCGAC CATTTCCCTA      2160
     TTATCACAAC ACTATTCCCA ACAACCAATC CACAAAAATT CTACAGACCC TTTTTTAAAC      2220
     TCAAAGAAGC CAACTGGGAA CAGTTCAACG CTCTTACCCA CCAAACCAAC AAGAAATACC      2280
     CCACCTCCCA CAACGTAAAC AAAGAAGCCG CTCTAATCAA TAGAATCATC CTTTATAGCG      2340
     CAAACCTCTC CATCCCACAA ACCTCACCTA ACACACATCC ATACAGGGTT CCATGGTGGA      2400
     ATAAACACCT CGACCAATTA CGTAAAGAAA AACAACTTGC CTGGAAAAAA TTAAACCGCA      2460
     CAATTACTGT TGACAACATT CTAGACTATA GACGCAAAAA CGCAATATTT AGATACGAAC      2520
     TAAAAAAGAG GAAAAAAGAA GCTTCCAGCT CTTTCACCTC AACCATCCAT CCCACTACTC      2580
     CCTCATCCAA AATATGGGCC AATATAAGAC GCTTCTGCGG ACTTAACCCA GCAAAACAAA      2640
     TTCATGCCAT CACAAACCCA GTAAATAACG AGACTACATT GGCTAGCAAC GAAATTGCTA      2700
     ACATATTCGC ACAACATTTC TCTGACCTCT CCGGCGACTG GAACTTCTCA GAGGAGTTCC      2760
     GGAACAATAA ATATAGAAAT AACATACATC TCTACACCCC CTCTCCAATA GCCCAAACCA      2820
     TAGAAGAGAA CATAACGTAT CTAGAACTTA GCTCAGCACT ACAAACATTA AAAGGATGTG      2880
     CTCCAGGACT AAATAGAATC TCGTATCAAA TGATCAAAAA TAGCTCCCAC ACAACAAAAA      2940
     ACCGAATAAC GAAACTATTT AATGAAATAT TCAATAGCCA CATACCTCAA GCCTACAAAA      3000
     CAAGCCTAAT CATCCCAATC CTTAAGCCAA ACACCGACAA AACGAAAACT TCCTCATACC      3060
     GACCCATCTC CCTCAACTGC TGTATAGCAA AGATACTTGA TAAAATAATT GCGAAAAGAC      3120
     TCTGGTGGCT AGTGACATAT AACAACCTAA TTAACGACAA ACAATTCGGG TTCAAAAAAG      3180
     GCAAATCGAC TTCGGACTGT CTACTCTATG TAGACTATCT CATAACGAAG TCAAAAATGC      3240
     ACACCTCCCT CGTCACTCTT GATTTTTCAA GAGCCTTCGA TCGAGTAGGT GTGCACTCCA      3300
     TAATCCAGCA ATTGCAGGAA TGGAAAACGG GTCCCAAAAT AATAAAATAC ATTAAAAACT      3360
     TCATGAGCAA CAGAAAAATA ACTGTCCGCG TCGGTCCGCA TACATCAAGC CCGTTACCCC      3420
     TATTCAACGG AATCCCCCAA GGTTCACCCA TATCCGTAAT ACTTTTCCTC ATAGCATTCA      3480
     ACAAATTATC CAACATCATA TCCCTACATA AAGAAATTAA ATTCAACGCA TATGCCGACG      3540
     ACTTCTTCCT TATAATAAAT TTCAACAAAA ACACAAATAC AAATTTCAAC TTAGACAATC      3600
     TATTCGACGA TATAGAAAAT TGGTGCTCCT ACTCAGGGGC ATCGCTTTCC CTATCCAAAT      3660
     GTCAACACCT CCACATATGC AGAAAACGTC ACTGCACATG CAAGATAAGC TGCAACAACT      3720
     TCCAAATTCC TAGCGTTACG TCCTTAAAAA TTCTAGGAAT AACCTTAAAC AACAAATACA      3780
     AATGGAACAC ACACATAAAC CTACTTCTAC CCAAACTACA CAACAAGCTA AATATAATAA      3840
     AATGCCTATC TAGTCTTAAA TTTAACTGCA ACACGCATAC ACTACTTAAT GTCGCAAAAG      3900
     CAACAATTAT AGCCAAACTA GAGTATGGTT TGTTTCTGTA CGGCCATGCT CCCAAAAGCA      3960
     TTTTAAACAA AATAAAAACA CCGTTTAACT CCGCTATCCG TCTAGCTCTC GGCGCATATC      4020
     GCTCTACCCC AATAAATAAC TTACTTTACG AATCGAATAC TCCCCCCTTA GAAATGAAAC      4080
     GAGACCTTCA AATAGCCAAA CTATCCCAAA ACCTAATCCT CTCCAAAAAC ACACCAATAC      4140
     ATAAGTTCTT AAAGCCTAAA AAAGCTAATA AGAAAAAAAC ATCAACAATA GACCGAACAA      4200
     TCAAACTTAG CCTAGAACTT AATCTACCCT ACAAACCAAT AAAACTCCAT AAAAACAAAC      4260
     CACCATGGAC CCTCCCCAAT CTAATAGACA CGTCACTTAG AATCCATAAG AAAGAACAAA      4320
     CATCTCCAGA CCAATACAGA AAATTATACG AACACACAAA GAATAACCTC AAAACACACA      4380
     ATTTCATATT CACTGACGGT TCAAAAATTA ATTACACAAT ATCATTCGCC ATTACAACGG      4440
     AGACAGACGT CTTGAAATAC GGCATACTGC CCCCATATTC ATCCGTCCTC ACCTCCGAAA      4500
     CAATCGCCAT CCTAGAAGCA ATAGAACTTA CTAAAAACCG AAGAGGCAAA TTTATTATCT      4560
     GCTCCGACTC CCTATCAGCA GTAGATTCAA TTCAAAACAC AAATAATAAC AGCTTTTACC      4620
     CAAGCAGAAT ACGATCGCTA ATAACGCAAC ACGCACCTAA AATTAAAATA ATGTGGATTC      4680
     CTGGCCATTC AGGAATAAAA GGAAATGAAT TAGCCGATCA AGCTGCAAAA TCAGCAAGCA      4740
     GTATGCCACT TATCCTCACC CCAAACATAA ATACCACAGA TATAAAAAAA CACCTTAAAG      4800
     CCGACCTTGC GACAAAACAG AAAGAACACA TAATAAACTG CAGTCCATGG TACCAATCTA      4860
     TTAACACGAA CACCTCACAC CCATGCGATT ACCTTAAACA ATCCCACCCA AATTGGACCA      4920
     GACTCGACCA AATAAAAATA ATACGACTTC GACTAGGACA CACAAACATA ACCCACCAAC      4980
     ACTACCTAAA TCCCAATTCA ATACCAACTT GCCCGTTTTG CCAAGGTGAT ATTTCTTTAA      5040
     ACCACATATT TAACTCATGC CCATCCCTCC TACAAACCAA GCAAGATATA TTTAACAACA      5100
     CCAACCCTCT AGACCTTCTT AGCAAACCCA ATCCAGATAA CATACAAAAA CTCATACTTT      5160
     TCCTCAAAAA AACTAAATTA TACCACAAAA TCTAAAAACA AAACAGGCAT TTGTACATAA      5220
     CAAGCCAGCA ATTAGTTACC AAATTAGATA TTAACTAAAT TAAGATATAA TAACATTGTA      5280
     AATAAATATA GCTGTAAGCC CCGTAGCTAA TGCTATACTA TCTAAGTTAG TCTAGTTTTG      5340
     TAAACTATTC TATCTATCAT AATAATAATA A                                     5371
//
ID   DMLINEJA   standard; DNA; INV; 5020 BP.
XX
AC   M22874;
XX
DR   FLYBASE; FBte0000088; Dmel\jockey.
XX
SY   synonym: wallaby
SY   synonym: sancho
XX
FT   source          M22874:115..5134
FT   SO_feature      CDS ; SO:0000316:300..2051
FT   SO_feature      start_codon ; SO:0000318:1..3
FT                   /name="Dmel\jockey\gag"
FT                   /db_xref="FLYBASE:FBgn0020297"
FT                   /db_xref="SWISS-PROT:P21330"
FT                   /db_xref="NCBI_PROTEIN:AAA28674.1"
FT                   /translation="ISIALYGISIKTIDIMENSFAQSRPSNGCDKFEKMRKVAGVEPGE
FT                   LRSQLRASCAVVSPNLEGMPTQSAVSSLMVTISSNTNASVTCTISNVQANMICTPTYTD
FT                   CTTVTTSICPTTPYDNGLPTPLSSLPNKPSKANCPFQAHDRTVNRKRKGVSQPPLPILT
FT                   PSPSRKTKRQATMPLNEEASTSTAAALNNNRFALLSAEAENMEQDVSDADSDIEDSAAR
FT                   DGGGQSAKYSKPPAICVPSVSDPVTLERALNLSTGSSNYYIRISRFGVSRIYTANPDAF
FT                   RTAVKELNKLNCQFWHHQLKEEKPYRVVLKGIHANVPSSQIEQAFSDHGYEVLNIYCPR
FT                   KSDWKNIQVNEDDNEATKNFKTRQNLFYINLKQGPNVKESLKITRLGRYRVTVERATRR
FT                   KELLQCQRCQIFGHSKNYCAQDPICGKCSGPHMTGFALCISDVCLCINCGGDHVSTDKS
FT                   CPVRAEKAKKLKPRSRLPMTNNIATLKPPQRSSSGYIPAEALRTNISYADIARRNTTQS
FT                   RARATVQAEVIPTSDNSLNNKFMTLDNSIRAINTRMDELFKLIHETVEANKAFRELVQV
FT                   LITRIPK"
FT   SO_feature      CDS ; SO:0000316:2048..4798
FT   SO_feature      start_codon ; SO:0000318:1..3
FT                   /name="Dmel\jockey\pol"
FT                   /db_xref="FLYBASE:FBgn0015952"
FT                   /db_xref="SWISS-PROT:P21328"
FT                   /db_xref="NCBI_PROTEIN:AAA28675.1"
FT                   /translation="MTQPTLKIGLWNARGLTRGSEELRIFLSDHDIDVMLTTETHMRVG
FT                   QRIYLPGYLMYHAHHPSGNSRGGSAVIIKSRLCHSPLTPISTNDRQIARVHLQTSVGTV
FT                   TVAAVYLPPAERWIVDDFKSMFAALGNKFIAGGDYNAKHAWWGNPRSCPRGKMLQEVIA
FT                   HGQYQVLATGEPTFYSYNPLLTPSALDFFITCGYGMGRLDVQTLQELSSDHLPILAVLH
FT                   ATPLKKPQRVRLLAHNADINIFKTHLEQLSEVNMQILEAVDIDNATSLFMSKLSEAAQL
FT                   AAPRNRHEVEAFRPLQLPSSILALLRLKRRVRKEYARTGDPRMQQIHSRLANCLHKALA
FT                   RRKQAQIDTFLDNLGADASTNYSLWRITKRFKAQPTPKSAIKNPSGGWCRTSLEKTEVF
FT                   ANNLEQRFTPYNYAPESLCRQVEEYLESPFQMSLPLSAVTLEEVKNLIAKLPLKKAPGE
FT                   DLLDNRTIRLLPDQALQFLALIFNSVLDVGYFPKAWKSASIIMIHKTGKTPTDVDSYRP
FT                   TSLLPSLGKIMERLILNRLLTCKDVTKAIPKFQFGFRLQHGTPEQLHRVVNFALEAMEN
FT                   KEYAVGAFLDIQQAFDRVWHPGLLYKAKRLFPPQLYLVVKSFLEERTFHVSVDGYKSSI
FT                   KPIAAGVPQGSVLGPTLYSVFASDMPTHTPVTEVDEEDVLIATYADDTAVLTKSKSILA
FT                   ATSGLQEYLDAFQQWAENWNVRINAEKCANVTFANRTGSCPGVSLNGRLIRHHQAYKYL
FT                   GITLDRKLTFSRHITNIQQAFRTKVARMSWLIAPRNKLSLGCKVNIYKSILAPCLFYGL
FT                   QVYGIAAKSHLNKIRILQAKTLRRISGAPWYMRTRDIERDLKVPKLGDKLQNIAQKYME
FT                   RLNVHPNSLARKLGTAAVVNADPRTRVKRRLKRHHPHDLPNLVLT"
XX
CC   Derived from M22874 (g157823) (Rel. 47, Last updated, Version 5).
CC   Takis Benos and Michael Ashburner, 20-Aug-1997.
CC   Any changes to original sequence record are annotated in an FT line.
XX
SQ   Sequence 5020 BP;  1527 A; 1198 C; 1055 G; 1240 T; 0 other;
     AAAAATCATT CACATGGGAG ATGAGCAATC GAGTGGACGT GTTCACAGAA GTCGCGAGAT        60
     AAAACAAAAA CGTAATTGTG ATCCATCACA AACATCTGCG CAGATCGTGT GCTTATCTCA       120
     CAAACAAAAT CTATTTTTAG TCACTGCATA ACGGTGACGG CTTCGGTTCG CGAAACTTAT       180
     CAGCAACTAG CAATTTCTAA GCTGTGTTGT TTTTGCCCCT CGCCCTGCGC GCTGCGCAAG       240
     CGGGAGGTTG TTACAATTTA CCTTACAAGT AAACCGGTAA ATCTTATCGT GTTTAGTAAA       300
     TATCAATTGC ATTATACGGC ATAAGTATAA AGACAATTGA TATAATGGAG AATTCATTTG       360
     CTCAATCGCG ACCTAGCAAT GGGTGCGATA AATTTGAGAA AATGAGGAAA GTAGCAGGTG       420
     TTGAGCCAGG AGAATTACGC TCCCAACTCC GCGCCAGCTG TGCAGTTGTT TCCCCTAACC       480
     TGGAAGGTAT GCCAACTCAA TCTGCGGTCT CCAGCTTAAT GGTGACAATC AGCAGCAACA       540
     CCAATGCAAG TGTTACCTGC ACTATTTCTA ACGTACAGGC CAACATGATC TGTACTCCTA       600
     CATACACTGA TTGCACAACC GTGACCACTA GCATTTGCCC AACTACGCCT TATGACAATG       660
     GACTGCCGAC ACCTCTGTCA TCACTGCCCA ATAAGCCATC TAAAGCGAAT TGCCCCTTTC       720
     AAGCACATGA TCGTACTGTC AACAGGAAAC GAAAAGGCGT GTCTCAGCCC CCATTACCTA       780
     TCCTCACCCC TTCTCCAAGC CGTAAAACTA AAAGGCAGGC CACTATGCCA CTCAATGAGG       840
     AGGCCTCTAC CTCCACTGCA GCAGCATTAA ATAACAATCG CTTCGCGCTT TTGTCCGCTG       900
     AAGCGGAGAA TATGGAGCAA GACGTGTCGG ATGCTGATTC TGACATTGAA GACTCTGCTG       960
     CCCGAGATGG TGGTGGACAA TCCGCTAAAT ATAGCAAACC CCCAGCCATA TGCGTACCAA      1020
     GTGTAAGCGA TCCGGTCACC TTGGAACGGG CTCTCAATCT GAGCACCGGC TCCTCAAACT      1080
     ACTACATCCG CATTTCTAGA TTTGGTGTAT CCAGAATCTA TACAGCCAAC CCTGATGCTT      1140
     TCCGCACCGC TGTAAAAGAA CTAAATAAGT TAAATTGTCA ATTCTGGCAT CACCAACTTA      1200
     AAGAAGAAAA ACCCTACAGA GTAGTGCTTA AAGGAATCCA TGCTAATGTT CCTAGTTCGC      1260
     AGATAGAACA AGCATTTAGT GATCACGGCT ATGAGGTCCT TAATATCTAT TGCCCCAGAA      1320
     AGTCTGACTG GAAGAACATT CAGGTAAACG AAGATGATAA TGAAGCTACA AAAAACTTCA      1380
     AAACTAGACA AAATTTGTTT TATATTAATC TTAAACAAGG CCCGAATGTT AAAGAGTCTC      1440
     TTAAGATAAC TCGACTTGGC AGATACAGAG TCACTGTTGA GCGCGCTACA CGTAGAAAAG      1500
     AACTGCTACA ATGTCAAAGA TGCCAAATTT TTGGACACTC TAAGAACTAT TGCGCCCAGG      1560
     ATCCTATTTG TGGTAAATGT AGTGGTCCCC ATATGACCGG GTTCGCTTTG TGCATAAGTG      1620
     ACGTATGTCT GTGTATAAAT TGTGGTGGTG ATCATGTCTC GACAGACAAA AGCTGCCCTG      1680
     TCAGAGCAGA GAAAGCCAAG AAGCTAAAAC CAAGGTCCAG GCTACCGATG ACTAATAATA      1740
     TTGCCACACT CAAACCTCCA CAACGTTCTT CAAGCGGTTA CATACCAGCT GAGGCATTAA      1800
     GAACCAACAT CTCTTATGCT GATATTGCTC GACGCAACAC GACTCAATCT AGGGCTCGTG      1860
     CTACTGTGCA GGCTGAAGTT ATACCAACGT CGGACAATAG CCTTAACAAT AAATTTATGA      1920
     CGTTAGACAA CTCCATTCGG GCCATCAATA CGAGAATGGA CGAACTATTT AAGCTTATAC      1980
     ACGAAACTGT AGAGGCTAAT AAAGCTTTCA GAGAACTGGT TCAGGTTCTA ATTACACGTA      2040
     TTCCTAAATG ACTCAACCAA CCTTAAAAAT CGGATTGTGG AACGCTCGCG GATTAACAAG      2100
     GGGCTCTGAG GAGCTTCGGA TATTCCTCAG CGATCACGAT ATAGACGTAA TGCTTACCAC      2160
     GGAAACACAC ATGCGAGTTG GTCAGCGCAT CTATCTCCCA GGGTATCTTA TGTATCACGC      2220
     CCACCACCCC AGTGGTAACA GTAGAGGTGG CTCTGCAGTC ATCATAAAAT CTAGACTTTG      2280
     TCACAGCCCT CTGACACCTA TCTCTACTAA TGACAGGCAG ATAGCGAGAG TGCACCTGCA      2340
     AACATCGGTT GGGACCGTCA CTGTAGCTGC TGTTTATCTA CCTCCAGCAG AAAGATGGAT      2400
     AGTAGATGAC TTCAAATCCA TGTTTGCTGC GTTAGGCAAC AAATTTATTG CTGGTGGTGA      2460
     TTACAATGCC AAACATGCAT GGTGGGGGAA CCCAAGATCC TGTCCTAGAG GTAAAATGTT      2520
     GCAAGAAGTC ATTGCACATG GGCAATACCA AGTTCTGGCT ACGGGCGAAC CCACTTTCTA      2580
     CTCTTACAAC CCTTTGTTAA CACCATCAGC CCTTGATTTT TTTATAACCT GTGGGTACGG      2640
     CATGGGCAGG CTAGATGTAC AAACTCTCCA GGAACTCTCG TCGGACCATC TTCCTATTCT      2700
     GGCTGTATTG CACGCTACGC CGTTAAAGAA ACCACAACGC GTACGACTAC TTGCCCATAA      2760
     TGCTGACATA AACATATTCA AAACCCATCT TGAACAGCTG AGTGAGGTAA ATATGCAAAT      2820
     TCTGGAGGCG GTGGACATTG ATAATGCCAC AAGCCTTTTC ATGAGCAAAC TAAGTGAGGC      2880
     TGCTCAGCTT GCTGCACCGA GAAATCGGCA TGAAGTAGAG GCCTTCAGAC CACTTCAACT      2940
     TCCTTCCAGT ATATTGGCAC TGCTCAGGCT AAAACGAAGA GTTCGAAAAG AATATGCTAG      3000
     AACAGGTGAT CCCCGCATGC AACAGATCCA CAGTAGACTG GCCAACTGCC TGCATAAGGC      3060
     CCTTGCTCGA AGAAAGCAGG CCCAAATAGA TACCTTCTTG GATAACTTGG GTGCTGACGC      3120
     GAGCACAAAT TACTCACTGT GGCGTATCAC GAAACGGTTC AAAGCTCAGC CCACCCCAAA      3180
     ATCAGCAATC AAAAATCCGT CTGGTGGCTG GTGTCGCACT AGCTTGGAAA AAACTGAAGT      3240
     GTTCGCTAAC AACCTTGAGC AACGTTTTAC ACCCTATAAC TATGCACCGG AAAGTCTCTG      3300
     TCGTCAGGTT GAAGAATACT TGGAATCGCC CTTTCAAATG AGCCTGCCTC TGAGTGCTGT      3360
     CACACTGGAA GAAGTGAAGA ATTTAATAGC CAAGCTGCCA CTTAAGAAAG CTCCTGGAGA      3420
     AGATCTTCTT GATAATAGAA CCATTAGACT TCTCCCAGAT CAAGCATTGC AGTTCCTTGC      3480
     CTTAATATTC AACAGCGTTC TTGATGTTGG CTACTTTCCG AAAGCTTGGA AATCGGCGAG      3540
     CATAATTATG ATCCATAAGA CTGGAAAAAC ACCGACAGAC GTTGACTCGT ACAGGCCCAC      3600
     CAGCTTACTC CCATCTCTGG GTAAAATTAT GGAGAGGCTG ATCCTAAACA GGCTGCTCAC      3660
     ATGCAAGGAT GTTACCAAAG CGATTCCCAA ATTTCAGTTT GGCTTCCGGT TGCAGCACGG      3720
     TACTCCTGAG CAACTACATA GAGTAGTGAA CTTTGCTCTG GAAGCTATGG AAAACAAGGA      3780
     GTATGCAGTA GGTGCCTTTC TTGATATTCA ACAGGCATTT GACAGAGTCT GGCACCCTGG      3840
     GCTCCTGTAC AAAGCGAAGA GGCTGTTCCC GCCGCAGCTA TATTTGGTTG TTAAAAGTTT      3900
     CCTGGAAGAA CGCACATTCC ACGTCTCTGT TGATGGGTAC AAATCATCAA TCAAGCCAAT      3960
     TGCAGCTGGA GTTCCTCAAG GAAGCGTTCT TGGCCCAACC CTATACTCAG TTTTTGCTTC      4020
     GGACATGCCT ACTCACACAC CAGTCACAGA GGTAGACGAA GAAGATGTGC TCATAGCCAC      4080
     CTACGCTGAC GATACTGCTG TGCTCACGAA AAGTAAAAGT ATCCTGGCTG CCACTTCTGG      4140
     TCTACAGGAA TACCTGGATG CATTCCAGCA ATGGGCTGAG AACTGGAATG TGCGCATCAA      4200
     CGCTGAGAAG TGTGCCAATG TGACGTTCGC CAACCGAACA GGTAGCTGTC CGGGTGTCAG      4260
     TCTGAATGGA AGACTGATCA GACACCATCA GGCTTATAAA TACCTTGGTA TTACCCTCGA      4320
     TAGGAAGCTC ACCTTCAGCA GGCACATCAC AAATATTCAG CAAGCGTTCA GGACCAAGGT      4380
     TGCTCGGATG TCTTGGCTCA TTGCACCACG CAACAAACTG TCGCTTGGCT GCAAGGTCAA      4440
     TATTTACAAG TCCATATTGG CCCCCTGCCT GTTCTACGGC CTGCAGGTAT ACGGCATTGC      4500
     TGCGAAGAGT CACCTTAATA AGATCCGGAT TTTACAGGCG AAGACCTTAA GAAGAATTTC      4560
     GGGGGCTCCT TGGTATATGA GAACAAGAGA CATCGAACGC GACCTCAAGG TGCCCAAATT      4620
     AGGAGACAAG CTCCAGAACA TCGCCCAAAA ATATATGGAA AGGCTTAATG TACACCCCAA      4680
     CAGCCTAGCA AGGAAGCTAG GAACTGCAGC TGTGGTCAAT GCTGACCCTC GGACTAGAGT      4740
     CAAAAGAAGA CTCAAGCGAC ACCACCCTCA TGACCTCCCT AACCTGGTTT TGACCTAGAA      4800
     AGTCTTAGTT TTAAAATTCA TTAGAATAAT CAAATAAATA ATAATTACTA TGTTATATCA      4860
     ACTATTATAA TTCTCCCTAT CATTTTTAGA TTAAAAATCT GTTAGTCTTA AGTAACCAAG      4920
     ACACATTGTA AAATAAAATA ATTTAAGCAG ATCAAATTAA GTTGCCGCAT GGGTAACAGT      4980
     GCGTTGATCA AATAATAAAA ACATCATAAA AAAAAAAAAA                            5020
//
ID   DMTRDNA    standard; DNA; INV; 1435 BP.
XX
AC   X80025;
XX
DR   FLYBASE; FBte0000670; Dmel\hopper.
XX
SY   synonym: M4
XX
FT   source          X80025:1..1435
FT   SO_feature      terminal_inverted_repeat ; SO:0000481:1..33
FT   SO_feature      terminal_inverted_repeat ; SO:0000481:1403..1435
XX
CC   Derived from X80025 (g510507) (Rel. 44, Last updated, Version 11).
CC   Takis Benos and Michael Ashburner, 20-Aug-1997.
CC   Any changes to original sequence record are annotated in an FT line.
XX
SQ   Sequence 1435 BP;  456 A; 265 C; 212 G; 502 T; 0 other;
     CACTATGGGG CATTTGGCCT GTTTTTTTTA CAAAAATTAA TACCTCCTAA ACTATTGGAG        60
     ATATTTGGAT GAATTTTTTT TTATGCGTTA CACATGCCTC CAGGAATATT TTGGAAAAGT       120
     GGGCGTGCCC CAACTCCGCC CCATTTTTTT TTTTTTTTTT TTTTTTTTTT AATAATATAT       180
     TTTTAAAGTT TATTTTTAAT TTCAATAATG TATAATTCAT AACCGTCTTC CTCTTCACAA       240
     TCAGTAGAGT CTGAAGAATT TTTATCAGGT TCAAATTCGC AAGCTAACAT TTCAATGACT       300
     TCTGGTGGAA GAGATAGTCG CTTATGTTTT CGCCTCTTTA AATTTATTGA TGATATTATG       360
     GGATCCGAAG TATCCATTGC TCTGTAAAAG ACATCTGCGA AGCTACTAAT AGTTTTTGCC       420
     GTGGCTGGCT TCAACAAAAG AATTTTAAGT ATGGCTGCAA GATCCCGCAG GCAGCACTTC       480
     CGTGCAGCTT GAACCAAAAG ACGTTCGTTG TGTTTCTGCG CCCTTACGAG TTCATCTGCT       540
     TGCTGTCTTG GGCCACTCAA ATTTTTTAAA TAATATGACG TTTTCGGGAG TCCAACTAAT       600
     TTCCTTTCCT ATTTATTTTT CTCCTTTACC TTCAGGACTA GGTGTTCTTC TAACCAATTT       660
     GAAAAAAATT TTAAAAATTC ATATATTTTT CGATTGCATT TTCTCCAATT TCGTAAAAGA       720
     TTGACTGAAA TCATTCGTTA TTATTATTAT TAGTTAATCG TTTATTAAAG TCTAGCTTGC       780
     TATCAGAAAA ATGCCCACTG ATAAAAGTGC AAATAGAATT TTCCTTTTGA CGAACACCCT       840
     TTTGCGTGCG CCACACTTCC AGCAGGGCAG CATTGGAAAT CGAGATATTG CTCCCTAAAA       900
     AATGAAATTT CTCAAAAAAC CGCAAAAAAC GCACATAGAG ACTACCTGAT ATGAGTTAGG       960
     AATTGAACAC ACTACAACAT GGATATAAAC ACTTACTGAA CAAATTTGAA CAAATTGTTG      1020
     TAGCTCTATT CAAAGTTGAA AATTTTTTCA AACAACTACA TCTTGACACC ACTTGTTAAA      1080
     TGTACAAATT GTTAGAAATA GGCGCACACA ATAAACAATA TATTAATAAC AACACATAAT      1140
     AAGAACCTAA AGATTGATTA TCCATTTCAA ATTATACTCT CCTTCTTCTT CTTTTTAAAT      1200
     TTTAACACTT TGAAAGTTAA GCTAAATTTT GTGCGCAAAG CAGCCACGTG GTATATGCTC      1260
     GCAACAGCCG ACTTTAACAG CTGTTATTAT AACAGTGCAT TGTTAAATTA ACTTATGCGG      1320
     GCTATATCAT AACAGTTTAA CGTATTTCCA ATGTATTAAT ACTAAAATAC TTCAAATTTG      1380
     CATACTTGTG AAAAACACAT TATTGTAAAA AAAACAGGCC AAATGCCCCA TAGTG           1435
//
ID   DMRTMGD1   standard; DNA; INV; 7480 BP.
XX
AC   X59545;
XX
DR   FLYBASE; FBte0000015; Dmel\mdg1.
XX
FT   source          X59545:1..7480
FT   SO_feature      five_prime_LTR ; SO:0000425:1..441
FT   SO_feature      three_prime_LTR ; SO:0000426:7039..7480
FT   SO_feature      CDS ; SO:0000316:548..923
FT   SO_feature      CDS ; SO:0000316:1327..1557
FT   SO_feature      CDS ; SO:0000316:1749..3062
FT   SO_feature      CDS ; SO:0000316:2987..6673
XX
CC   Derived from X59545 (g8507) (Rel. 49, Last updated, Version 4).
CC   Takis Benos and Michael Ashburner, 20-Aug-1997.
CC   Any changes to original sequence record are annotated in an FT line.
XX
SQ   Sequence 7480 BP;  3067 A; 1298 C; 1235 G; 1880 T; 0 other;
     TGTAGTATAT ACGAATATAA TAACAATAAT AATAACAATA ATAATAATAA TATTAATAAT        60
     AATTATAATA TGAATCATAA TAATAAGTCA ACTAATAAGT AAACTTAGGA CCACCCTAAT       120
     TCCTTAGGGT CACCCTAGTA GATCTTTAGA TACACCCTAA TACTAAATAT GCGAATTCAG       180
     GATGTACGCC TTTAGGGGTC GGACTCGACT CCCATTGGTT ATCGAGTATG AACTTCATAC       240
     ATACATATTG CAGAATTTGC TAGTGTCAGC ACTTGGCTGT CACAAGAGAT CTCCCTGTAG       300
     ACCACACTAA GATCAGTTAT AAATCAGGAA TAGATCTGGA ATGTACACTC GCTTAATAAA       360
     AACCAAATAA AGATAAAATG ACCAACTGCG TTTTGAGACT TTATTAACTA CATCAGAAGT       420
     ATTAGAATTC AAATTAACTA CATGGCGACC GTGACAAAGG ATCGTTATAA GTTGTAGCAG       480
     AAGCTAAAGG AAACCGCTTG TGATAATTTT CAACTTCGAT GCTCATCCAC CAAGACGGCG       540
     GCAATTATGA AGAAAAAAGC GATCTGAGTG AGTAGAGTGT CAGTGTGATG GGAAAAAACA       600
     GGGGCGGAGT TCGACATAAT ATAAAAAAGA GAATAGCGCA CATAAAGTGG CTATTATATA       660
     CGAACACTCC ACCACCCCAA TGGTCGAAAG CTCAAAAACT ACAAGCTGAG CTAGACCACT       720
     GTGTCGAATA TCTCAAGAAA AAAATCCCCA CCACACGCGC TCACTCAGAA AATCAAATAA       780
     AATCGTTAAC AATTAACAAA ACTCCAACTC CCAATCCGAA AAGCCTGCCT GTTTTCAAGA       840
     AAAGATGCCC GAACGACTGC GAGGGACCAC TGTTCACACC GCATTGTGAA CATACGTGCA       900
     GACATTGCAG CTCCACCACA TAACCCCTAA ATGAGGAAAT CATCATCAAC GTGGTGAGCA       960
     GCCCGCTCAT TACGTCATCG AGGGAGTGTC AGCGTGCCAA CCCGGCGACG ACCAGATGAC      1020
     GCAGGAGGGT CAGAGTGAAG CAAATAGGAG CTGAAAAATA AAATATTTTT TTTGTTGCCC      1080
     TGCGTGGCAC ACCCTCGATG CACTGCGCTG CATATTAATA TTACACAAAA TATTGTAACA      1140
     TTGAGCGGAA CTTTTTCTGC CCGATGAGAA GAATGGCCCG TAAAGCCATA CACCAACTAG      1200
     GTAGGAAAAT GTAACTATAT TGAACAAAAA AAAAAAAAAT CAAAACAACA TATTTTTAAA      1260
     GTAAAATAAA CCAAAACCCA AAAATAAAAA AAAAAAAAAA AAAAAAAAAA ATAAAAATAT      1320
     ACAAAAATGG GTTGGTTTGG ATCTGACGAT AGTCAGACAA AAGATAATAC GGCCAATGTG      1380
     GTCAATAACT TAAAAATAGT CGACCATACA GATGACATTC AGTCACTGTG GTTACTCCTT      1440
     TTGATCATGA CGATCGTAAC AGTCGCTCAG TTTATATTAA CGCTATATGT TAAGCATAAC      1500
     AAGATAATAA AGAGGCGTTA TATAGGCAAA GCAGAGAATA GTTTGGATAA AATTTGAAAA      1560
     AAAAAAAAAA AAAAAAAAAA AAAAAAACAT CCGAGATGTA TTTTGAATTA AGATGATCTA      1620
     AAATTTTTAT TTTTAATATC AGAAAACTAG AATGAAAAAA AAAAAAAAAG ATTATTGAAG      1680
     AAACCTATTT GAGAGAGGCC AAAATTTATA AAGTTCGATT GCATAGATAA ATCCATAGTA      1740
     TTCTTTAAAT GGACTGGCAA GAAATACAAA ACGAGCTTAA AGAAATTAAA ACAACTTTTG      1800
     ACAAGTCTTA TAAATGCATG ACACCAAATA GAGAAGTGCA ACAAGACACT CTCAACAAGC      1860
     ATGCGCAGAT ATTGGTAAGA TGCTTTAATG GAGCACGCCA ATTAATTTAC AGAGAAAGGA      1920
     AAAGATTAAC AAAAAATCAT TTATCACAAG CAGTAAAATT TCTAAACAGG TTCCGTGAGA      1980
     ACTTGTTAAA CGTCAAGTAC AGACACAACT TAAATATTAC AATCCCAACG ATTTTAAGCA      2040
     CACCTATAGT GGCTGAGATC GGTGAGGATA TCGAAAGTGT AGGAGAATCA GAAATAGAAA      2100
     TAAAAGAAGA GGATCTCCAC GATCTTGCAA TTCCAGCGGT AATAACATTA CCCGAATTAC      2160
     TTGAAGAAGA ACTTTCAGAT TCAAATACAG GAATAAGAAT ACAGGAAACG GACAAAATGA      2220
     CAGACTCTGC CGCAACAGCA AGGGAATATG TGCGACAAAT TTCGTCCACA ATACCTGAGT      2280
     TTGACGGCAA AAAGTTAAAC TTGAATAGAT TCCTCACGGC TCTCCGGCTG ATAGATCTGA      2340
     CAAAAGGAGA TCAGGAGATG CTAGCGGTTG AGGTAATCAA GACAAAGATA CTTGGTCCAT      2400
     TATCACACAA AGTTGAAAAT GAAAAGACCA TTATCGGTAT AATAAATCTA TTAAAAGCAT      2460
     CAGTTAAAGG CGAATCGCCC GATGTCATCA AAGCAAAAAT GCTTAGTACA CAACAGCGCG      2520
     GCAAAACTGC AGCGCAATAT ACCACGGAGA TAGAAAACCT ACGTGGGTTG CTCGAAGCAG      2580
     CCTATATAGA TGATGGTTTA GATTCCAACA ATGCAGACAA ATTCGCTACA AAGGAAGCCA      2640
     TATCTGCAAT GACCAAGAAC TGTGGGCACG ATAAGCTCAA AACCATATTG GAAGCTGGAA      2700
     ATTTCAACAC GATGAATAGC GTGATTGAAA AATACATACA CTGCAGTACA GAAATGACCG      2760
     GCAATTCAAA TAGTGTATTA TTCTATAATA ATAGAGGACA CTATCGAGGT AATAATTACC      2820
     GAGGAAATTA CCAAAACAGA GGTAATGGCC GAGGAAATTA TAACTCCTAC AATAACAACT      2880
     ATAGAGGCAG AGGTGGTTAC CATGGTGGAA ACAGAGGACG AGGTGGTAAC CAAAATTATA      2940
     ATAGAGGTGG AGGTTACTCA AGAGGTAACC AAAACCATAA CTATAAAACA AGTCATGCCC      3000
     ACAATGTCCG AAACATACAA TCGGAAAACG AACATACCCC CTTGAGCGAC AATCTACAAT      3060
     AAAATTATAC AAAATTAATC TCAATTTAAG CATTTTTATA CGATTGAAGA ATATGAGTAC      3120
     CAATTCATGG GTAACTCTTT TAATAGATAC AGGTGCAGAA ATTTCCCTGC TTAAATGCAG      3180
     AAACAATAAT CTTAACGATT TAAATCCAAA AAATACAACA AATATATCAG GAATAGGGCA      3240
     AGGGACAATT CAGTCTCTAG GTACACTACA TTTAGAAATG TGTATTGCTA ATGCAGCAAT      3300
     ACCATATGAA TTCCATATCG TACCTAACAA TTTTCCTATA CCAGGGGATG GTATAATTGG      3360
     CTTGGATTTC ATTAAGAAAT ACAATTGTAT TTTGGAATTC CACGACCAAG AAGATTGGTT      3420
     CACTTTGAGG CCCAAAAATT TCAGGAACAT AAACATTCCT ATTATACATA CACTAGATAA      3480
     TGAAATAATT TTGCCAGCTA GATCAGAAGT GATTCGAAAG ATTCAACTAA CATCTACTGA      3540
     CACACATGTT CTCATTCCCA ACCAAGAATT ACAACCTAGC ATAATAATCG CAAGTGCACT      3600
     CGTAAACACT CAGAACGTTT TGATTCGAAT TATTAATACA ACTGAAAAAG ACGCTATAGT      3660
     TAGTAGCGCA AATATAAAAA GCGAATCATT GGATGATTAT GATGTATACA ACGCAAATAT      3720
     AGAAAATAGT GCACAAAGAA CTTCAGAAGT ATTAAAACTT CTTAAATTTC CATCGTTATT      3780
     CAAAAGCGAT TTAACAAAAT TATGCACCGA ATATAGCGAT ATTTTTGGTC TTGAAACAGA      3840
     AACCATATCA GCTAATAATT TTTACAAGCA AAAATTGAGA TTAAATGACA AAACTCCAGT      3900
     CTATATCAAA AACTATAGAA TGCCAGAAAG TCAAAAACCA GAAATTCAAA GGCAAGTTGA      3960
     CAAATTAATA AAAGATGGCA TTGTCGAACA ATCTATTTCA GAATATAATA GCCCTCTTCT      4020
     CTTGGTACCC AAGAAATCAC TGCCTAACTC GGAGGAAAAG AGATGGCGAT TAGTAGTCGA      4080
     TTATCGCCAA ATAAACAAGA AACTGCTAGC AGATAAATTC CCACTTCCAA GAATAGAAGA      4140
     CATTCTTGAT CAATTAGGCC GAGCAAAATA TTTCTCGTGC CTAGACCTGA TGTCAGGATT      4200
     TCATCAAATA GAATTAGACG AAAGGTCAAG AAATATAACA TCTTTCTCAA CTTCAACGGG      4260
     AGCATACCGC TACACGCGAT TACCATTTGG TTTAAAAATA GCCCCAAATT CTTTTCAAAG      4320
     AATGATGACC CTTGCATTTT CAGGTTTAAC GCCTTCGCAA GCATTTCTGT ATATGGATGA      4380
     TTTAGTAGTC ATAGGCTGTT CTGAAAAGCA CATGCTTAAA AATCTAACCG ACGTTTTCAA      4440
     ATTATGTAGG CAACATAATT TAAAATTACA TCCAGAAAAA TGCACTTTCT TTATGAAAGA      4500
     GGTTACTTAT TTAGGTCACA AGTGTACTGA CAAAGGTATA TTGCCAGATG ACTCTAAATA      4560
     TGAGGTAATA AAGAACTACC CCAAACCAGT AAACGCAGAC GAAGCTAGAC GCTTCGTGGC      4620
     ATTTTGCAAT TATTACAGAA GATTTATTAA GAACTTTTCT GAGAAATCAC GCCACTTAAC      4680
     GAGGCTTTGT AAAAAGAATG TTCCATTTGA ATGGACAAGC GAATGCAATG ATGTATTCGA      4740
     ATATCTCAAA AGGAAATTAA TGAAACCAAC ACTCCTTCAG TACCCAGATT TCAGCAAACA      4800
     ATTTTGCATA ACCACAGATG CTAGTAAACA AGCATGTGGA GCGGTACTAT CTCAAGACCA      4860
     TAACGGTCAA CAGCTACCAG TGGCATACGC TTCAAGAAGC TTTACAAAAG GCGAAAGTAA      4920
     TAAGTCCACT ACAGAGCAGG AGCTAGCAGC TATTCACTGG GCAATAAATC ACTTCAGACC      4980
     ATACGTATAT GGTAGACATT TCTTAGTACA AAGTGACCAT AGGCCACTAT CATATCTTTT      5040
     TTCAATGAGA AACCCCAGTT CAAAATTAAC CAGAATGAGA CTAGACTTGG AGGAGTTCGA      5100
     ATTCACAGTA GAATATCTCA AGGGGAAAGA TAATCATGTC GCAGACGCAT TGTTCCGAAT      5160
     AACAATCGGA GAACTTAAAG CAATAAATAG ACAGATACTA AAGGTAACAA CAAGATCAAC      5220
     AACAAGACAG AAAAATACCT GCGCAGGTGA AAAATTGCAT GAACCAAATG AGAAAGAAAA      5280
     TATAAAAATG CCCAATATCT ATCAGGTAAT CAATAACATT GATGCCAAAA AATATGTTAT      5340
     ACTCAAAATA GACAAGCATA AGTGTTTGTT GAAAAGAGGA AAACAAATTA TAACACGTTT      5400
     TGATATGACT AATTTTTATT CTAATGAAAT AATCGATTTA GATCAATTCT TTCAAAGGCT      5460
     TAATGAAGAA GCAAGAATAA ATAGCATCAT TCAAACACAA TTGTCACCAA GTGAACAAAT      5520
     CTTCGAATTT GTCACTATAA AGAACTTTAA AGAAAAGGGC AATAAAATAC TAAAAAATTT      5580
     AAAAATAGCG CTATTAAACA AGGTGACTAA GATAGATAAA AATGATAAGG TTCAAATAAA      5640
     AGCAATACTG TCTAAATATC ATGATGATCC ATCAGAAGGA GGCCATTCAG GAATTTCTAG      5700
     AACCCTGAGG AAAATGAAAA ACTGTTGTTG TTGGCCACGA ATGACGAAGG CGATAAGTGA      5760
     ATATGTTGAA ACATGTTTGA AATGTCAACA AGCCAAGACT ACGAAACATA CTAAAACACC      5820
     GTTGACAATA ACAGAAACGC CAGCAACAGC ATTTGATAAA GTTTTGATAG ATACCATTGG      5880
     TCCACTGCCA AGATCAGAAA ACGGAAATGA GTATGCTGTT ACTATCATTT GCGATTTAAC      5940
     AAAATATTTG GTAACGGTAC CAATTCCAAA TAAAAGTGCA AAATCAGTTG CTAAGGCTAT      6000
     ATTCGAAAAT TTTATTCTAA AGTACGGTCC AATGAAAACA ATCACAACGG ACATGGGAAC      6060
     GGAATATAAA AACCAAATTA TAGACGACCT ATGCAAATAT ATGAAGATAA AAAACATTAC      6120
     TTCAACAGCA CACCATCACC AGACATTAGG AACAGTAGAA CGAAGTCACA GAACTTTCAA      6180
     CGAGTATGTT CGCTCATATA TATCTGTTGA CAAAACCGAT TGGGATATAT GGATACAATA      6240
     TTTTACTTAT TGTTTCAACA CAACACCATC GGTAGTTCAT GAATATTGTC CATATGAATT      6300
     AGTATTTGGA AGATTACCAA GACAGTTCAT AGATTTTAAC AGGATAGACA GAATAGATCC      6360
     TATTTACAAC ATGGATGATT ATTCAAAAGA AGTTAAGCTA CGATTAGAAA TAGCATATAG      6420
     AAGAGCTAAA AATATGTTAG ACAAGGCAAA AGCCGATAGA AAGATAAAAT ATGATAGAAA      6480
     TATTAGTAAC TTTGAATTAA AGATAGGAGA TAAGATATTA CTTAAAAACG AAACGGGTCA      6540
     TAAACTTGAC AATAATTATT TAGGACCATA TTTAGTTTCA GAAATAGGAG ATAATGACAA      6600
     CATTACAATT ATAGGAAATA AAAATAAAAA ACAGATAGTC CATAAAGATA GGTTAAAAAT      6660
     TTTTAATTCA TAATACATTT TGTTTGGTTG GCCAACCACA AATAAAAAAC CACAAATAAA      6720
     AAACCACAAA TAAAAAACCA CAAATAAAAA ACCACAAATA AAAAACCACA AATAAAAAAC      6780
     CACAAATAAA AAACCACAAA TAAAAAACCA CAAATAAAAA ACCACAAATA AAAAAACCAC      6840
     AAATAAAATA AAAACCAATA AAAACATTAT AATACAAAAC TTTTACTTTG CAAAATATAA      6900
     TGAAAATATA TATATTTTTT TTAATATCTC TTTAATCATT CATTTCAAAT ATTAATGTAC      6960
     ATTTAAAAAA AAAAAAAAAA ATATTATATA CTTGAAAATA ACTTCATGTT ATTACGTTAT      7020
     TTTTCAAAAG GAGGGAGATG TAGTATATAC GAATATAATA ACAATAATAA TAACAATAAT      7080
     AATAATAATA TTAATAATAA TTATAATATG AATCATAATA ATAAGTCAAC TAATAAGTAA      7140
     ACTTAGGACC ACCCTAATTC CTTAGGGTCA CCCTAGTAGA TCTTTAGATA CACCCTAATA      7200
     CTAAATATGC GAATTCAGGA TGTACGCCTT TAGGGGTCGG ACTCGACTCC CATTGGTTAT      7260
     CGAGTATGAA CTTCATACAT ACATATTGCA GAATTTGCTA GTGTCAGCAC TTGGCTGTCA      7320
     CAAGAGATCT CCCTGTAGAC CACACTAAGA TCAGTTATAA ATCAGGAATA GATCTGGAAT      7380
     GTACACTCGC TTAATAAAAA CCAAATAAAG ATAAAATGAC CAACTGCGTT TTGAGACTTT      7440
     ATTAACTACA TCAGAAGTAT TAGAATTCAA ATTAACTACA                            7480
//
ID   DMMDG3     standard; DNA; INV; 5519 BP.
XX
AC   X95908;
XX
DR   FLYBASE; FBte0000010; Dmel\mdg3.
XX
FT   source          X95908:1..5519
FT   SO_feature      five_prime_LTR ; SO:0000425:1..267
FT   SO_feature      three_prime_LTR ; SO:0000426:5253..5519
FT   SO_feature      transcription_start_site ; SO:0000315:178
FT   SO_feature      polyA_signal_sequence ; SO:0000551:5253..5519
FT   SO_feature      CDS ; SO:0000316:296..4780
FT                   /name="Dmel\mdg3\ORF"
FT                   /db_xref="FLYBASE:FBgn0043882"
FT                   /db_xref="SPTREMBL:Q94885"
FT                   /db_xref="NCBI_PROTEIN:CAA65152.1"
FT                   /translation="MDDKIILNDFSLTTLKDWLRILGQNTEGTKTELIARLQDIPTAVR
FT                   GDCPPEHPQKNAPPGNDIFSSLDFQNCEINTDHVSVNAMNRKESTETGSERETNMFELQ
FT                   QLRAELAEAKAMLNGTRSSLQFQEQQQPEQSKATVSSVIQTAQFTQAGATKENTTFHSP
FT                   QRSNERAESQRFPVDALALAKETITDYDGKTCARAWITVVKNIARTFNIDDNHLRILLI
FT                   TKLKGNAQVWLHAHPARLIEPIDNLLDQLSLTFGEQSSKAEIRRKFESRKWKTEENFCS
FT                   YYDEKMALSNGINIDDDELLDQMIEGIPLQNFRTQARIQCFSTPSEMLRAFSNIRLPAR
FT                   REPPVQPTDYKDAIRCANCNSRGHKADICKKPKREPGSCYACGQLGHLVAQCPTRKSVS
FT                   SNNYVRWFKINFFENAYKPIISECLIDSGSPISIIKKSLINETMKLALVNTCYFGLNNC
FT                   ILKTHGQTTCYVLKGSIKIYFRLIIVCDQSMRYNVILGRDFLTACNLNLDPYTLGMIAL
FT                   RKPMEINKISMFTENDSPEKSLENEIVSPKSLENEIVSSQSLENEIVSPKSLENEIVSP
FT                   KSFKNATISPKSLENKIVNQQHKETGPISLRDEIVNQQKNVSKSKLSEDEIVNTSKEIV
FT                   SFKLPKDKNVYEQLNHNFDKEVLRICHVTESELEYKIGENVSNRLQLEFDRLFRNFYIN
FT                   AKRPNEPTVRSEIQLCLKNPKPFSCSPRRLSYTEKDRLQKLLDEYLENGFIRPSDSEYA
FT                   SPIVLVKKKTGDLRMCVDFRKLNKMTMKDNYPLPLIDDLLDRMNEKTVFTKLDLKNGFF
FT                   HVHVKKESIKYTSFVTPLGQYEWLRMPFGLKNAPSVFQRFVNKIFADMIRENKVVVYMD
FT                   DILLATENINEHLETLKEIFKRLVENKLELRIDKCEFMQSSIKYLGFIINKDGIMPNDK
FT                   GIEAIKNFPIPNNVHTVQSFLGLCSYFRRFIKDFSRLAKPLHDILKKDKPFKFGSEEMI
FT                   CFNMLKDKLIQSPVLAIYNHKHETELHCDASSSGFGAVLMQKKEDQKWHPVSFFSKRTT
FT                   DIESKYHSFELETLAIVYSLRRFRVYLHWRTFKIVTDCNSLILTLSKKELNPRIARWAL
FT                   EFQGYDFEIVHRAGSRMQHVDALSRCTNIMVIQTNSFEDNLVICQGKDTKLKEIRQLLE
FT                   NTENKLYEMRNGIVYKKTNENRLLFYVPIEMEEQVLYKYHNELGHVGRDKMIEAIMKNY
FT                   WFPNLKQKCSTHISNCLKCISFSPKTGKTEGFLHNIPKGNKPFEIIHIDHYGPVDLARP
FT                   KKHILVIVDAFTKFVRLYATKTTNTKEVIQSLNDYFRAYSRPKCIISDRGACFTSGDFD
FT                   SFLKECNVKHIKIATGSPQANGQVERINRSLGPMISKLIEPDQGLHWDLVLEKVEYTLN
FT                   NTLHRSIKQYPSIMLFGLQQKGQIMDELKEKIEEIGETIEERDLESIRNKGEASQKIAQ
FT                   AYNKEYVDKKRKRSGVFTKGTTSWLKILTQQQA"
XX
CC   Derived from X95908 (e990667) (Rel. 49, Last updated, Version 3).
CC   Takis Benos and Michael Ashburner, 20-Aug-1997.
CC   Any changes to original sequence record are annotated in an FT line.
XX
SQ   Sequence 5519 BP;  2078 A; 1005 C; 1029 G; 1407 T; 0 other;
     TGTAGTAGGC TGCACCTTCT ACCCTCTTCC TTTACTCTTA GTCATACATA CCTAATTATA        60
     CATAGCCAAT CTAGTCATAA GCTTATACAC TCATACACCC ATCCTTAACA TACAAATATT       120
     ATCGAGAAAC TTATCGACTA ATCGACTCGC CACTCTGCAG AGAGCGCGGC AGTCAGTCGC       180
     TGTTGAACCA AGCTAAAGGA CAGATCAAAA ATAAAAGAGA CACGTGAAAT TGTATTAGAA       240
     TATTAACTTC TGTAAACGGC GGCTAAAATC TCAGAAGTGG GATTAATAAT CCAAAATGGA       300
     CGATAAAATC ATCCTGAACG ACTTTTCGCT GACAACCCTA AAAGATTGGC TACGTATTCT       360
     GGGCCAAAAT ACGGAGGGCA CAAAAACCGA ATTAATCGCG AGGCTGCAAG ACATCCCAAC       420
     GGCAGTTCGG GGCGATTGTC CACCGGAGCA CCCCCAGAAA AACGCTCCAC CAGGAAACGA       480
     CATTTTTTCT TCACTGGATT TTCAGAATTG TGAAATTAAC ACCGATCACG TAAGTGTGAA       540
     TGCGATGAAC AGAAAAGAAT CAACCGAAAC TGGCAGTGAG AGGGAGACAA ACATGTTCGA       600
     GCTACAGCAA CTACGCGCAG AGCTAGCAGA AGCGAAGGCA ATGCTTAACG GAACACGATC       660
     GAGCTTGCAG TTCCAAGAAC AACAACAACC AGAGCAAAGC AAGGCTACAG TTAGTTCCGT       720
     TATCCAGACG GCGCAGTTTA CGCAGGCTGG CGCCACAAAA GAGAACACAA CATTTCACTC       780
     GCCGCAGCGA TCCAACGAGA GAGCGGAGAG CCAGCGTTTT CCAGTTGATG CTCTCGCTCT       840
     CGCCAAAGAG ACGATAACCG ATTACGATGG GAAAACTTGC GCGCGTGCCT GGATAACAGT       900
     GGTCAAAAAT ATCGCACGCA CTTTCAACAT CGATGACAAC CATTTACGCA TCTTACTCAT       960
     CACTAAACTT AAAGGAAACG CGCAAGTCTG GTTACATGCG CACCCTGCTC GATTGATCGA      1020
     ACCAATTGAC AATTTGCTTG ATCAATTGTC ATTGACTTTT GGCGAGCAAT CATCCAAGGC      1080
     TGAGATCCGG CGAAAATTCG AGAGTCGCAA GTGGAAAACC GAGGAGAATT TCTGCAGTTA      1140
     TTACGACGAG AAGATGGCTC TCTCAAACGG GATAAACATC GACGACGACG AACTACTGGA      1200
     CCAGATGATA GAGGGCATAC CGCTACAAAA TTTCCGTACC CAAGCACGGA TTCAATGCTT      1260
     CTCTACTCCA TCGGAGATGC TACGCGCATT TTCGAACATC CGTTTGCCAG CTCGGAGGGA      1320
     GCCACCTGTA CAGCCAACCG ACTACAAAGA TGCCATACGA TGCGCAAACT GTAATTCAAG      1380
     AGGACACAAA GCTGACATCT GCAAGAAGCC CAAACGTGAA CCAGGTTCGT GCTACGCCTG      1440
     TGGACAACTT GGACACCTGG TGGCACAATG TCCCACAAGG AAGAGCGTTT CATCTAATAA      1500
     TTATGTAAGA TGGTTTAAAA TTAATTTTTT TGAAAATGCT TATAAGCCCA TAATTTCAGA      1560
     ATGCCTCATA GACTCTGGCA GTCCTATATC TATCATTAAA AAGTCACTTA TTAACGAGAC      1620
     AATGAAGTTA GCCCTAGTTA ATACTTGCTA TTTTGGTTTA AACAACTGTA TTCTCAAAAC      1680
     ACATGGACAA ACCACATGTT ATGTTTTGAA AGGATCAATA AAAATATATT TTCGTTTAAT      1740
     CATTGTTTGC GACCAGTCTA TGAGGTATAA TGTTATTCTC GGCAGAGATT TTTTAACTGC      1800
     ATGCAATTTA AATTTAGACC CGTACACCTT GGGAATGATT GCGTTGAGAA AACCCATGGA      1860
     AATAAACAAA ATATCAATGT TTACTGAAAA TGATAGTCCT GAGAAATCTT TAGAAAATGA      1920
     AATTGTTAGT CCAAAATCGT TAGAGAATGA AATTGTTAGT TCACAATCGT TAGAAAATGA      1980
     AATTGTTAGC CCCAAATCGT TAGAGAATGA AATTGTTAGT CCAAAATCGT TTAAAAATGC      2040
     AACTATTAGT CCGAAATCGT TAGAAAATAA AATCGTTAAT CAACAGCATA AAGAAACTGG      2100
     TCCAATATCG TTAAGAGATG AAATAGTTAA TCAACAAAAG AATGTCAGTA AATCAAAATT      2160
     ATCAGAAGAT GAAATTGTTA ACACTTCAAA AGAAATCGTT AGTTTTAAAT TGCCAAAAGA      2220
     TAAAAACGTT TACGAACAAT TAAATCACAA CTTTGATAAG GAAGTACTAA GAATATGTCA      2280
     TGTAACTGAA AGTGAGTTAG AATACAAAAT AGGAGAAAAT GTTAGCAATA GGTTACAACT      2340
     AGAATTCGAT AGGTTGTTTA GAAATTTTTA TATAAATGCA AAAAGGCCAA ATGAACCGAC      2400
     AGTTAGAAGT GAAATACAAT TGTGTTTGAA AAACCCGAAA CCGTTTAGCT GTTCTCCTAG      2460
     GAGGCTTTCA TACACAGAAA AAGACAGGTT ACAAAAACTA TTAGACGAAT ATTTGGAAAA      2520
     CGGATTTATA CGACCAAGCG ACTCGGAATA TGCATCGCCT ATTGTTTTAG TGAAAAAGAA      2580
     AACTGGAGAC TTACGTATGT GCGTCGACTT TAGAAAACTT AATAAAATGA CAATGAAAGA      2640
     CAACTATCCT CTACCTCTTA TAGATGACTT GTTAGATAGA ATGAATGAGA AAACTGTTTT      2700
     CACCAAACTC GATCTTAAAA ACGGTTTTTT CCACGTGCAT GTTAAAAAAG AATCAATAAA      2760
     ATACACCTCT TTCGTTACAC CATTAGGCCA ATACGAGTGG CTGCGAATGC CATTTGGCCT      2820
     CAAAAACGCC CCGTCTGTGT TCCAAAGATT TGTTAACAAA ATTTTTGCGG ATATGATTAG      2880
     AGAAAACAAA GTAGTAGTAT ATATGGACGA CATTCTATTG GCAACCGAAA ATATAAACGA      2940
     ACACTTAGAA ACGTTGAAAG AAATTTTTAA AAGATTAGTT GAAAATAAAC TTGAATTAAG      3000
     AATAGACAAA TGTGAGTTTA TGCAATCAAG TATAAAATAT CTTGGGTTCA TAATAAATAA      3060
     AGACGGCATA ATGCCCAATG ACAAAGGAAT CGAGGCAATA AAAAATTTCC CAATACCTAA      3120
     TAATGTTCAT ACAGTACAAA GTTTTTTGGG ATTATGCTCA TATTTTCGAC GGTTTATAAA      3180
     AGATTTTTCT AGACTAGCTA AACCATTGCA TGACATTCTA AAAAAAGATA AACCGTTCAA      3240
     ATTTGGTAGT GAAGAAATGA TTTGTTTTAA TATGTTAAAA GATAAATTAA TACAGTCACC      3300
     GGTCTTAGCT ATATACAACC ATAAACACGA AACAGAATTG CATTGTGATG CAAGTTCTTC      3360
     TGGATTCGGT GCTGTACTTA TGCAAAAGAA GGAGGACCAG AAATGGCACC CAGTTTCATT      3420
     CTTTTCAAAA CGGACAACAG ATATTGAATC AAAATACCAC AGTTTCGAGT TAGAAACTTT      3480
     AGCCATTGTT TATTCGTTAC GTAGATTTAG AGTTTATCTT CATTGGAGGA CATTTAAAAT      3540
     AGTCACCGAC TGCAACTCAT TAATTTTGAC CCTAAGCAAA AAAGAGCTAA ACCCTAGGAT      3600
     AGCCAGGTGG GCTTTAGAAT TCCAAGGTTA TGATTTTGAA ATTGTGCATA GGGCAGGTAG      3660
     CCGCATGCAA CATGTTGACG CACTGAGTAG GTGTACAAAT ATTATGGTAA TACAAACAAA      3720
     CAGTTTCGAA GATAATCTAG TTATATGTCA AGGGAAAGAT ACAAAATTAA AAGAAATCAG      3780
     GCAATTGTTA GAAAACACAG AAAATAAATT GTATGAGATG AGAAATGGTA TAGTTTACAA      3840
     AAAGACAAAT GAAAATAGAT TGCTGTTCTA CGTTCCGATA GAAATGGAAG AACAAGTGTT      3900
     ATACAAATAT CACAACGAAC TTGGACACGT AGGAAGAGAC AAAATGATAG AAGCTATAAT      3960
     GAAAAACTAT TGGTTTCCAA ATTTAAAACA GAAGTGTAGC ACACATATCA GCAACTGTTT      4020
     AAAATGTATT TCATTCAGTC CCAAAACAGG AAAAACAGAA GGATTTCTAC ACAACATACC      4080
     TAAGGGAAAC AAACCTTTTG AAATAATCCA TATTGACCAT TATGGTCCAG TAGACTTGGC      4140
     TAGACCGAAG AAACATATTC TAGTGATAGT AGATGCATTC ACAAAGTTTG TCAGACTATA      4200
     CGCAACAAAA ACTACGAACA CAAAAGAAGT CATACAATCG TTAAATGACT ACTTCAGAGC      4260
     ATACAGTAGG CCTAAGTGTA TCATATCAGA TAGAGGAGCA TGTTTCACGT CTGGCGATTT      4320
     TGACTCATTT TTGAAAGAAT GCAATGTTAA ACACATAAAA ATTGCAACAG GATCGCCACA      4380
     AGCCAACGGT CAAGTTGAAC GTATAAACCG AAGTCTTGGT CCAATGATTA GCAAGTTAAT      4440
     TGAACCTGAT CAAGGTCTAC ACTGGGACTT AGTCTTAGAA AAGGTCGAAT ATACCCTGAA      4500
     CAATACACTA CACCGCAGCA TTAAACAGTA TCCTAGCATA ATGTTATTTG GGTTACAACA      4560
     AAAAGGACAA ATTATGGATG AGTTAAAAGA AAAAATTGAG GAAATTGGAG AAACGATTGA      4620
     AGAAAGAGAT TTAGAAAGTA TTAGAAATAA AGGCGAGGCA AGTCAGAAAA TAGCACAAGC      4680
     ATACAATAAA GAATATGTTG ACAAAAAACG AAAACGATCA GGAGTGTTCA CAAAAGGCAC      4740
     TACGTCATGG TTAAAAATTT TGACTCAACA ACAGGCATAG CTAAGAAGTT AATTCCAAAG      4800
     CATAAAGGAC CCTATGTCAT AAGCAAAGTT CTCAAAAATG ATCGCTTCCT TCTGGAAGAT      4860
     GTTGATGGAT TTCAAATTTC TCGCAATCCT TACCGGGGTG TATGGAGCAT ACAGAATATA      4920
     AAACACTGGC AAAGAAAAAT TAAGAGTCTA CAAAATAGAA AGTATAATTT GAGAAACTCT      4980
     GTACAAAATA GAAAGTATAA TTTGAGAAAC TCTGTACAAA ATAGAAAGTA TAATTTAAGA      5040
     AACTCTGTAC GAAATCGAAA GTATAATTTA AGAAGCAATT GTAAAACAAA GAAAACAAAC      5100
     AAGAAGAAAA GAAAACCAAA AAAATGTTTA AGACCGTTCA AAAGTATCTC CACTAAGAAG      5160
     AATAAAATAA GAAACAGGAC CCTTAGCTTT AAGAAACGTT AATTGTTATA AAATCCTACG      5220
     ATCGGGAGAT CTAGTTGTCA GGACGGCCGA GTTGTAGTAG GCTGCTCCTT CTACCCTCTT      5280
     CCTTTACTCT TAGTCATACA TACCTAATTA TACATAGCCA ATCTAGTCAT AAGCTTATAC      5340
     ACTCATACAC CCATCCTTAA CATACAAATA TTATCGAGAA ACTTATCGAC TAATCGACTC      5400
     GCCACTCTGC AGAGAGCGCG GCAGTCAGTC GCTGTTGAAC CAAGCTAAAG GACAGATCAA      5460
     AAATAAAAGA GACACGTGAA ATTGTATTAG AATATTAACT TCTGTAAACG GCGGCTAAA       5519
//
ID   DMDM11     standard; DNA; INV; 5461 BP.
XX
AC   X14037;
AC   X15066;
XX
DR   FLYBASE; FBte0000042; Dmel\micropia.
XX
FT   source          join(X14037:5..3664,X15066:3534..3593,X14037:3721..5461)
FT   SO_feature      five_prime_LTR ; SO:0000425:1..476
FT   SO_feature      three_prime_LTR ; SO:0000426:4957..5461
FT   SO_feature      primer_binding_site ; SO:0005850:477..489
FT                   /bound_moiety="tRNA-leu"
FT   SO_feature      primer_binding_site ; SO:0005850:4939..4956
FT   SO_feature      CDS ; SO:0000316:540..4415
FT                   /name="Dmel\micropia\polyprotein"
FT                   /db_xref="FLYBASE:FBgn0043876"
FT                   /translation="
FT                   MQNRNLAELVKIMQKTPAREQQPSYDVKLPKFNPDAACVEAAKWCSTTDI
FT                   ILTEHPLKGSKLITALSNCMEGTASQWLTQISYQGMTWQEFQELFLQRFE
FT                   TEETPAATFLNLLNSRPTAAECYAVYASRLVTQLTTKWRNMEIEEIAVTT
FT                   VLAHMANIDSRLQRVLFTSNVRTRSKLQAELKAFTFDKKRHARDDNLGPD
FT                   QKNRKASPVVCHFCSKPGRRIAECRSKMRQDRRAKPQREKSNVTCYRCGQ
FT                   PGHFSNQCPKNGTAAKQDVTQQKTVNQCCVTEPKGSLHQRGEIYPICFDS
FT                   GAECSLIKDDISSKLSGKRINNTVMIKGIGGGSVCSTLQILSEVTINENI
FT                   MEILFHVVPNEEMRNDILIGREILKQGFYVILTSDNFKVVKSKTVNNCSV
FT                   TERSFTLSDIDTELVDNEKAQLIELLEKHSTSFTNGIPHTRVNTGEMKIR
FT                   LIDPTKTVQRRPYRLSPEEREVVRMQVSELIRCNIVRPSCSPFASPMLLV
FT                   KKKNGTDRLCVDFRELNSNTISDKYPLPLISDQIARLRGANYFTCLDMAS
FT                   GFHQIPIHPESVEYTAFVPDGLKNAPSVFQRTVINALGDLANSFVIVYMD
FT                   DIMVVSPTKELALERLKTVLNVLTKAGFTFNLAKCSFLKTTVQYLGYEVR
FT                   AGEIRPNVRKIASLSSLPPPQTVSGVRQFIGLASYFRKFVSGFSQLMKPL
FT                   YSLSSGSGKITWSAELEEIRLKVVTILTNEPALVIFDPQYPIELHTDASA
FT                   CGYGAILLHRIESKPHVIEYFSKTTTSVESRYHSYELETLAVVKAVKHFR
FT                   HYLIGREFVVYTDCNSLKASRTKIDLTPRVHRWWAYLQSFNFEIQYREGK
FT                   RMAHVDFLSRNPLSPEHILSINKIPEKRVNLSEISSTWLLAEQRLDLEII
FT                   EIVNKLESDELAENLAKTYDLRKGVLYRKVQRRGRTSYLPVVPRAFKWSV
FT                   INQVHESIMHLGWQKTLDKVYQYYWFAKMNKYVRKFVSNCITCRSVKSSS
FT                   GKVQAELHSIPKTSIPWHTIHIDITGKLSGKSDLKEYVIVQIDAYTKFVY
FT                   LYHTLKIDAESCVNAMKSSISLFGVPDRIIADQGRCFTSSKFSEFCVSQK
FT                   VELHLIATGMSRANGQVERVMETLKNLLSVVESSQRSWQDALGEVQLALN
FT                   CTISRATDASPLEMLIGKQARPLGLVPPCETECEIDLATVRAHATENMNS
FT                   LASYDKSRFDSSRAAVDKHHVGDYVLLRNEERHQTKLDPKFRGPFLVTEV
FT                   LEGDRYTLKSLTSNRSFKYCHESIKMPDAEIPNELNENVEQ"
XX
CC   Sequence assembled by Lynn Crosby (FlyBase), 'micropia.v006'.
CC   Any changes to original sequence record are annotated in an FT line.
XX
SQ   Sequence 5461 BP; 1679 A; 1051 C; 1264 G; 1467 T; 0 other;
     TGTCGTGGCG AAAATAATGA GTATGCGTGT AGTCGCTGTT TACTTCTTCT CCATGTTCCC        60
     TTTGCTATTA TGCGTGTTCC TATTTATGAA CACGTGGCGA AAATAATAAA TGCGTGTAGT       120
     CGCCGTTTAC TTCTTCTCCA TGTTCCCTTT GCTATTATGC GTGTTCCTAT TTATTGTCAA       180
     TGTGTGAGGA TGAATAGATG AATTATCTAT GAACGGGATT TTGCAAAAAC GACTTGCGCT       240
     GCTTGGTTAG AAAGGGAAAA CTATATAATG AAAAGGGAAT GCCAAAAATT GAGAAGAGAC       300
     AAAGCAGGCT GCACGAAGCT GGAGTGAGGG CATTAATCGT GGAGAAGCCA AAGCAGACGC       360
     AAGTGGACTC GTTGACTGCG CACAGCTGCA TAAAATTATA TAGTAAAAAG AGATTTGAGC       420
     GACGCTGATA TGGACGGACG GACGGACGCG AGGCCCCTGA TATTCTTAAC CCGACATCAG       480
     AAGTGGGATC TGTGCCACAC CCTGCATTTT CTGAGGATCA GTGGCGTGCA GTAGTGGAAA       540
     TGCAAAATCG GAATTTGGCT GAACTTGTAA AAATCATGCA AAAGACGCCG GCACGTGAGC       600
     AGCAACCTAG TTATGATGTT AAGCTACCCA AATTTAACCC TGATGCTGCA TGCGTAGAGG       660
     CAGCAAAGTG GTGTTCAACA ACCGATATAA TTCTAACTGA GCACCCCCTT AAAGGAAGTA       720
     AATTGATCAC GGCACTAAGT AACTGCATGG AGGGAACTGC ATCTCAGTGG CTAACACAAA       780
     TCTCGTACCA GGGTATGACT TGGCAAGAGT TCCAGGAATT ATTTCTGCAG CGCTTTGAAA       840
     CCGAAGAGAC GCCGGCCGCT ACGTTTTTAA ATTTACTCAA CAGCCGCCCG ACTGCCGCCG       900
     AATGTTACGC GGTGTATGCG AGTCGGCTGG TGACGCAGCT GACTACAAAG TGGCGGAATA       960
     TGGAAATAGA AGAAATTGCC GTTACAACTG TTCTTGCGCA TATGGCAAAC ATTGACAGTC      1020
     GTTTGCAGCG CGTCCTCTTC ACATCCAATG TGCGTACCAG AAGTAAGCTA CAGGCGGAGT      1080
     TAAAAGCGTT TACGTTCGAC AAGAAGCGAC ATGCTCGAGA TGACAACCTT GGACCTGACC      1140
     AGAAGAACCG TAAGGCATCG CCAGTTGTAT GCCACTTCTG TTCAAAGCCG GGACGTCGAA      1200
     TTGCTGAATG CCGAAGTAAA ATGCGACAAG ATAGACGGGC GAAACCGCAG CGTGAAAAAT      1260
     CAAATGTTAC GTGCTATCGG TGCGGCCAAC CGGGACATTT CTCCAACCAG TGCCCGAAAA      1320
     ACGGAACTGC AGCCAAACAA GATGTGACTC AACAGAAGAC TGTTAACCAA TGTTGTGTGA      1380
     CTGAGCCAAA GGGAAGCTTG CATCAACGAG GTGAGATCTA TCCAATTTGT TTCGATTCCG      1440
     GTGCAGAGTG CTCCCTTATT AAAGACGACA TTAGCAGTAA GTTATCTGGT AAACGTATAA      1500
     ACAATACTGT AATGATAAAA GGCATTGGTG GTGGCAGTGT GTGCAGTACA TTGCAAATCT      1560
     TGAGTGAAGT CACTATAAAC GAAAATATTA TGGAAATATT ATTTCATGTA GTCCCGAACG      1620
     AGGAAATGAG GAATGATATT CTGATAGGGC GAGAAATACT TAAACAAGGC TTTTATGTAA      1680
     TTTTGACATC CGATAATTTT AAAGTTGTAA AATCAAAAAC TGTTAATAAT TGTTCCGTTA      1740
     CTGAGCGATC GTTTACTTTG TCCGATATTG ACACCGAATT AGTCGACAAT GAGAAAGCTC      1800
     AATTAATTGA GTTACTTGAA AAGCACTCGA CTTCATTTAC CAACGGGATA CCTCATACTC      1860
     GAGTAAATAC AGGCGAAATG AAAATCCGTT TGATTGATCC AACTAAAACT GTTCAGCGCC      1920
     GACCTTACAG ACTTAGCCCC GAAGAGAGAG AAGTAGTGCG AATGCAGGTG AGCGAATTGA      1980
     TAAGATGTAA TATTGTTCGC CCAAGTTGCT CTCCCTTTGC TAGCCCCATG TTGCTCGTCA      2040
     AAAAGAAGAA CGGAACCGAC CGTCTATGTG TTGATTTTAG AGAGCTAAAC TCGAACACGA      2100
     TTTCGGATAA ATACCCCTTG CCGCTTATCA GCGATCAAAT TGCTAGACTT CGCGGAGCAA      2160
     ATTATTTCAC ATGCCTGGAT ATGGCAAGTG GTTTCCACCA AATCCCGATT CACCCTGAAT      2220
     CCGTGGAATA TACTGCATTT GTGCCCGACG GCCTCAAAAA TGCGCCATCT GTTTTCCAGC      2280
     GCACAGTCAT AAATGCACTT GGTGACCTTG CTAACTCTTT TGTAATCGTT TACATGGACG      2340
     ACATAATGGT AGTATCGCCA ACCAAGGAAT TGGCTTTGGA AAGGTTAAAA ACTGTTTTGA      2400
     ATGTTCTTAC AAAGGCTGGT TTTACCTTTA ACCTTGCTAA ATGCAGTTTT CTCAAAACAA      2460
     CGGTTCAGTA TTTAGGCTAT GAAGTGCGAG CGGGAGAAAT TCGTCCGAAT GTGCGAAAGA      2520
     TAGCTTCTTT AAGCTCCTTG CCTCCTCCTC AAACTGTCTC CGGCGTTAGA CAATTCATTG      2580
     GCTTGGCCTC TTACTTTCGC AAATTCGTGT CTGGATTCTC CCAACTTATG AAACCATTGT      2640
     ATTCACTTTC GTCTGGTAGC GGCAAGATTA CATGGAGCGC TGAGCTGGAA GAGATCAGAC      2700
     TTAAAGTTGT GACGATCCTC ACAAATGAGC CTGCTCTGGT AATCTTCGAC CCGCAATATC      2760
     CTATTGAGTT GCACACTGAT GCAAGTGCCT GTGGATATGG AGCGATACTT TTGCACCGTA      2820
     TAGAAAGTAA GCCCCATGTA ATCGAATACT TCAGCAAAAC AACTACCTCT GTTGAATCTA      2880
     GATATCACTC CTACGAGCTG GAAACCTTGG CAGTGGTAAA AGCCGTTAAA CATTTTCGCC      2940
     ATTACCTAAT TGGCCGTGAG TTCGTTGTCT ATACAGACTG CAATTCATTA AAAGCTTCTC      3000
     GCACAAAAAT AGATTTAACC CCCAGAGTTC ACCGCTGGTG GGCCTACTTA CAATCGTTTA      3060
     ATTTCGAAAT TCAGTATAGA GAGGGTAAGC GTATGGCTCA TGTGGATTTC CTATCAAGAA      3120
     ATCCTTTATC ACCCGAACAC ATTTTGTCAA TAAACAAGAT TCCCGAAAAA CGAGTAAATC      3180
     TGTCTGAAAT TTCAAGTACT TGGCTTCTTG CTGAGCAACG GTTAGACCTT GAGATAATAG      3240
     AAATTGTTAA CAAATTGGAG TCAGATGAAT TAGCCGAAAA CTTGGCCAAA ACGTATGATT      3300
     TGCGAAAAGG TGTATTATAT CGCAAGGTCC AAAGACGAGG TAGAACAAGT TATTTACCAG      3360
     TTGTACCCAG AGCTTTCAAA TGGTCAGTAA TTAACCAGGT ACACGAGTCG ATAATGCATT      3420
     TAGGGTGGCA AAAGACACTT GATAAAGTGT ACCAGTATTA TTGGTTCGCT AAAATGAACA      3480
     AGTATGTTCG AAAATTTGTT TCAAACTGCA TAACTTGTAG ATCAGTGAAA TCATCTTCCG      3540
     GGAAGGTTCA GGCGGAACTT CATTCCATTC CGAAGACAAG TATACCGTGG CACACCATCC      3600
     ACATAGATAT AACGGGGAAA TTAAGTGGCA AGAGCGATTT GAAGGAGTAT GTCATTGTTC      3660
     AGATCGATGC CTATACAAAG TTTGTTTATC TGTATCACAC CTTAAAGATA GATGCCGAAA      3720
     GCTGTGTTAA TGCTATGAAA TCTTCCATAT CCTTATTTGG AGTACCAGAT CGCATTATCG      3780
     CCGACCAGGG CAGATGTTTT ACTAGCTCTA AGTTTTCAGA GTTTTGCGTA TCGCAGAAAG      3840
     TTGAACTTCA CTTGATTGCT ACGGGAATGA GCCGTGCAAA TGGGCAAGTG GAACGGGTGA      3900
     TGGAAACACT GAAAAATTTG TTGTCAGTGG TAGAATCAAG TCAACGATCG TGGCAGGACG      3960
     CACTTGGCGA AGTCCAACTT GCACTGAATT GTACAATTTC TCGTGCCACT GATGCAAGTC      4020
     CGTTAGAAAT GTTAATTGGT AAACAGGCTC GACCCCTTGG ATTAGTTCCC CCATGTGAGA      4080
     CCGAATGTGA AATAGATTTG GCAACTGTTA GAGCTCATGC GACAGAAAAT ATGAATTCCT      4140
     TAGCGTCTTA CGACAAATCC CGATTTGATA GCAGTAGAGC AGCCGTTGAC AAACACCACG      4200
     TAGGTGACTA TGTGCTATTG AGGAATGAAG AAAGACACCA AACTAAGTTA GATCCGAAAT      4260
     TCAGAGGACC GTTTTTGGTA ACTGAAGTAT TAGAGGGTGA CAGGTATACA CTAAAGTCGT      4320
     TGACGAGTAA CCGATCGTTC AAGTATTGCC ATGAATCAAT CAAAATGCCG GATGCAGAAA      4380
     TCCCGAATGA GTTAAACGAG AATGTAGAGC AATAGCTGAA ATATAGAAAC AGTTGAATGA      4440
     AAAGAAAAGC CCGCCAATGA GTTCTTTTGT GAACGAGAGA TATCCGTCTA GGTGAGACGA      4500
     TGAATTGTGA GTTATCCGTC TAGGTGAGAC GATGAATTGT GAGTTATCCG TCTAGGTGAG      4560
     ACGATGAATT GTCAGTTATC CGTCAGGTGA GACGATGAAT TGTGAGTTAT CCGTCCAGGA      4620
     GAGACGATGA GTTTGGATTG AATTAATAAT CAAGTGTGTG TGAACTGGCG GAAGATCGAT      4680
     ATATAGAAAT CGATAAATGA TAATGTTAAG ATAAGTTGTG AGCTGATGTA TTACTGATCA      4740
     ATGGAACTGA ATATGAAAAT AGAATAAGTT ATCCCAGCAA CAGTGAAATA AGAGCTGTTT      4800
     TGTTTCTTCA CAGAATTAAG ATTTAAGAAA TACACCTGAT AAAGTCAAAC TAATGAAATT      4860
     AAATGTTATT GAATAGTGAT GAAAGTAGGT GATCTTGATA TCTTGGTATC TCGGTATCAA      4920
     AAGCTTACAC GAGGACGTGA AATGTCAGAA TGGCCGTGTC GTGGCGAAAA TAATGAGTAT      4980
     GCGTGTAGTC GCTGTTTACT TCTTCTCCAT GTTCCCTTTG CTATTATGCG TGTTCCTATT      5040
     TATGAACACG TGGCGAAAAT AATGAATGCG CGTAGTCCGG TTTACTTCTT CTCCATGTTC      5100
     CCTTTGCTAT TATGCGTGTT CCTATTTATT GTCAATGTGT GAGGATGAAT AGATGAATTA      5160
     TCTATGAACG GGATTTTGCA AAAACGAGAG CGATAGAGCT GTTGCTGAAC GTGGCCACTT      5220
     GCGCTGCTTG GTTAGAAAGG GAAAACTATA TAATGAAAAG GGAATGCCAA AAATTGAGAA      5280
     GAGACAAAGC AGGCTGCACG AAACTGGAGT GAGGGCATTA ATCGTGGAGA AGCCAAAGCA      5340
     GACGCAAGTG GACTCGTTGA CTGCGCACAG CTGCATAAAA TTATATAGTA AAAAGAGATT      5400
     TGAGCGACGC TGATATGGAC GGACGGACGG ACGCGAGGCC CCTGATATTC TTAACCCGAC      5460
     A                                                                      5461
//
ID   PPI251     standard; DNA; SYN; 2907 BP.
XX
AC   X06779; V01520; X69493;
XX
DR   FLYBASE; FBte0000037; Dmel\P-element.
XX
FT   source          X06779:996..3902
FT   SO_feature      terminal_inverted_repeat ; SO:0000481:1..31
FT   SO_feature      terminal_inverted_repeat ; SO:0000481:2877..2907
FT   SO_feature      CDS ; SO:0000316:join(153..442,501..1168,1222..1947,2138..2709)
FT                   /name="Dmel\P\T"
FT                   /db_xref="FLYBASE:FBgn0013311"
FT                   /translation="
FT                   MKYCKFCCKAVTGVKLIHVPKCAIKRKLWEQSLGCSLGENSQICDTHFND
FT                   SQWKAAPAKGQTFKRRRLNADAVPSKVIEPEPEKIKEGYTSGSTQTESCS
FT                   LFNENKSLREKIRTLEYEMRRLEQQLRESQQLEESLRKIFTDTQIRILKN
FT                   GGQRATFNSDDISTAICLHTAGPRAYNHLYKKGFPLPSRTTLYRWLSDVD
FT                   IKRGCLDVVIDLMDSDGVDDADKLCVLAFDEMKVAAAFEYDSSADIVYEP
FT                   SDYVQLAIVRGLKKSWKQPVFFDFNTRMDPDTLNNILRKLHRKGYLVVAI
FT                   VSDLGTGNQKLWTELGISESKTWFSHPADDHLKIFVFSDTPHLIKLVRNH
FT                   YVDSGLTINGKKLTKKTIQEALHLCNKSDLSILFKINENHINVRSLAKQK
FT                   VKLATQLFSNTTASSIRRCYSLGYDIENATETADFFKLMNDWFDIFNSKL
FT                   STSNCIECSQPYGKQLDIQNDILNRMSEIMRTGILDKPKRLPFQKGIIVN
FT                   NASLDGLYKYLQENFSMQYILTSRLNQDIVEHFFGSMRSRGGQFDHPTPL
FT                   QFKYRLRKYIIARNTEMLRNSGNIEEDNSESWLNLDFSSKENENKSKDDE
FT                   PVDDEPVDEMLSNIDFTEMDELTEDAMEYIAGYVIKKLRISDKVKENLTF
FT                   TYVDEVSHGGLIKPSEKFQEKLKELECIFLHYTNNNNFEITNNVKEKLIL
FT                   AARNVDVDKQVKSFYFKIRIYFRIKYFNKKIEIKNQKQKLIGNSKLLKIK
FT                   L"
FT   SO_feature      CDS ; SO:0000316:join(153..442,501..1168,1222..1994)
FT                   /db_xref="FLYBASE:FBgnXXXXXXX"
FT                   /translation="
FT                   MKYCKFCCKAVTGVKLIHVPKCAIKRKLWEQSLGCSLGENSQICDTHFND
FT                   SQWKAAPAKGQTFKRRRLNADAVPSKVIEPEPEKIKEGYTSGSTQTESCS
FT                   LFNENKSLREKIRTLEYEMRRLEQQLRESQQLEESLRKIFTDTQIRILKN
FT                   GGQRATFNSDDISTAICLHTAGPRAYNHLYKKGFPLPSRTTLYRWLSDVD
FT                   IKRGCLDVVIDLMDSDGVDDADKLCVLAFDEMKVAAAFEYDSSADIVYEP
FT                   SDYVQLAIVRGLKKSWKQPVFFDFNTRMDPDTLNNILRKLHRKGYLVVAI
FT                   VSDLGTGNQKLWTELGISESKTWFSHPADDHLKIFVFSDTPHLIKLVRNH
FT                   YVDSGLTINGKKLTKKTIQEALHLCNKSDLSILFKINENHINVRSLAKQK
FT                   VKLATQLFSNTTASSIRRCYSLGYDIENATETADFFKLMNDWFDIFNSKL
FT                   STSNCIECSQPYGKQLDIQNDILNRMSEIMRTGILDKPKRLPFQKGIIVN
FT                   NASLDGLYKYLQENFSMQYILTSRLNQDIVEHFFGSMRSRGGQFDHPTPL
FT                   QFKYRLRKYIIGMTNLKECVNKNVIP"
FT   SO_feature      intron ; SO:0000188:443..500
FT   SO_feature      intron ; SO:0000188:1169..1221
FT   SO_feature      intron ; SO:0000188:1948..2137
XX
CC   Derived from X06779 (g58305) (Rel. 49, Last updated, Version 8).
CC   Takis Benos and Michael Ashburner, 20-Aug-1997.
CC   Any changes to original sequence record are annotated in an FT line.
CC   CDS annotation from Lynn Crosby's annotation 'P-element.v010'.
XX
SQ   Sequence 2907 BP;  989 A; 491 C; 582 G; 845 T; 0 other;
     CATGATGAAA TAACATAAGG TGGTCCCGTC GAAAGCCGAA GCTTACCGAA GTATACACTT        60
     AAATTCAGTG CACGTTTGCT TGTTGAGAGG AAAGGTTGTG TGCGGACGAA TTTTTTTTTG       120
     AAAACATTAA CCCTTACGTG GAATAAAAAA AAATGAAATA TTGCAAATTT TGCTGCAAAG       180
     CTGTGACTGG AGTAAAATTA ATTCACGTGC CGAAGTGTGC TATTAAGAGA AAATTGTGGG       240
     AGCAGAGCCT TGGGTGCAGC CTTGGTGAAA ACTCCCAAAT TTGTGATACC CACTTTAATG       300
     ATTCGCAGTG GAAGGCTGCA CCTGCAAAAG GTCAGACATT TAAAAGGAGG CGACTCAACG       360
     CAGATGCCGT ACCTAGTAAA GTGATAGAGC CTGAACCAGA AAAGATAAAA GAAGGCTATA       420
     CCAGTGGGAG TACACAAACA GAGTAAGTTT GAATAGTAAA AAAAATCATT TATGTAAACA       480
     ATAACGTGAC TGTGCGTTAG GTCCTGTTCA TTGTTTAATG AAAATAAGAG CTTGAGGGAA       540
     AAAATTCGTA CTTTGGAGTA CGAAATGCGT CGTTTAGAGC AGCAGCTGAG GGAGTCTCAA       600
     CAGTTGGAGG AGTCTCTACG CAAAATCTTC ACGGACACGC AGATACGGAT ACTGAAGAAT       660
     GGTGGACAAA GAGCTACGTT CAATTCCGAC GACATTTCTA CAGCTATTTG TCTCCACACC       720
     GCAGGCCCTC GAGCGTATAA CCATCTGTAC AAAAAAGGAT TTCCTTTGCC CAGTCGTACG       780
     ACTTTGTACA GATGGTTATC AGATGTGGAC ATAAAAAGAG GATGTTTGGA TGTGGTCATA       840
     GACCTAATGG ACAGTGATGG AGTTGATGAC GCCGACAAGC TTTGCGTACT CGCTTTCGAC       900
     GAGATGAAGG TCGCTGCTGC CTTCGAGTAT GACAGCTCTG CTGATATTGT TTACGAGCCA       960
     AGCGACTATG TCCAACTGGC TATTGTTCGT GGTCTAAAAA AATCGTGGAA GCAGCCAGTT      1020
     TTTTTCGATT TTAATACCCG AATGGACCCG GATACTCTTA ACAATATATT AAGGAAACTG      1080
     CATAGGAAAG GATATTTAGT AGTTGCTATT GTATCCGATT TAGGTACCGG AAACCAAAAG      1140
     CTATGGACAG AGCTCGGTAT ATCAGAATGT AAGTTTCGTA TATTACAAAA ATCAGATAAT      1200
     CCTTGAAATT CCATTTTTTA GCAAAAACCT GGTTTAGCCA TCCTGCAGAT GACCATTTAA      1260
     AGATTTTCGT TTTTTCGGAT ACGCCACATT TAATTAAGTT AGTCCGTAAC CACTATGTGG      1320
     ATTCCGGATT AACAATAAAT GGGAAAAAAT TAACAAAAAA AACAATTCAG GAGGCACTTC      1380
     ATCTTTGCAA CAAGTCCGAT CTGTCTATCC TCTTTAAAAT TAATGAAAAT CACATTAATG      1440
     TTCGATCGCT CGCAAAACAG AAGGTTAAAT TGGCTACCCA GCTGTTTTCG AATACCACCG      1500
     CTAGCTCGAT CAGACGCTGC TATTCATTGG GGTATGACAT TGAAAATGCC ACCGAAACTG      1560
     CGGACTTCTT CAAATTGATG AATGATTGGT TCGACATTTT TAATTCTAAA TTGTCCACAT      1620
     CCAATTGCAT TGAGTGCTCG CAACCTTATG GCAAGCAGTT GGATATACAG AATGATATTT      1680
     TGAATCGAAT GTCGGAAATT ATGCGAACAG GAATTCTGGA TAAACCCAAA AGGCTCCCAT      1740
     TTCAAAAAGG TATCATTGTG AATAATGCTT CGCTTGATGG CTTGTATAAA TATTTGCAAG      1800
     AAAACTTCAG TATGCAATAC ATATTAACAA GCCGTCTCAA CCAAGACATT GTGGAGCATT      1860
     TTTTTGGCAG CATGCGATCG AGAGGTGGAC AATTCGACCA TCCCACTCCA CTGCAGTTTA      1920
     AGTATAGGTT AAGAAAATAT ATAATAGGTA TGACAAATTT AAAAGAATGC GTAAACAAAA      1980
     ATGTAATTCC ATGATTTATA ATTGTTTAAT GTTTAGCTAT ATGTTTCAGG AAAGTTTCAG      2040
     TTGAGAATGT AGGTAGTTAT GTGCTGTCTA TTGTGTTTTG TCTTTTATCT GTTTCTTTTC      2100
     ATTTTATTAT TTAATCATTA TCCTTTTGCT TATCCAGCCA GGAATACAGA AATGTTAAGA      2160
     AATTCGGGAA ATATCGAAGA GGACAACTCT GAAAGCTGGC TTAATTTAGA TTTCAGTTCT      2220
     AAAGAAAACG AAAATAAAAG TAAAGATGAT GAGCCTGTCG ATGATGAGCC TGTCGATGAG      2280
     ATGTTAAGCA ATATAGATTT CACCGAAATG GATGAGTTGA CGGAGGATGC GATGGAATAT      2340
     ATCGCGGGCT ATGTCATTAA AAAATTGAGA ATCAGTGACA AAGTAAAAGA AAATTTGACA      2400
     TTTACATACG TCGACGAGGT GTCTCACGGC GGACTTATTA AGCCGTCCGA AAAATTTCAA      2460
     GAGAAGTTAA AAGAGCTAGA ATGTATTTTT TTGCATTATA CAAATAATAA TAATTTTGAA      2520
     ATTACAAATA ATGTAAAGGA AAAATTAATA TTAGCAGCGC GAAACGTCGA TGTTGATAAA      2580
     CAAGTAAAAT CTTTTTATTT TAAAATTAGA ATATATTTTA GAATTAAGTA CTTCAACAAA      2640
     AAAATTGAAA TTAAAAATCA AAAACAAAAG TTAATTGGAA ACTCCAAATT ATTAAAAATA      2700
     AAACTTTAAA AATAATTTCG TCTAATTAAT ATTATGAGTT AATTCAAACC CCACGGACAT      2760
     GCTAAGGGTT AATCAACAAT CATATCGCTG TCTCACTCAG ACTCAATACG ACACTCAGAA      2820
     TACTATTCCT TTCACTCGCA CTTATTGCAA GCATACGTTA AGTGGATGTC TCTTGCCGAC      2880
     GGGACCACCT TATGTTATTT CATCATG                                          2907
//
ID   DMPOGOR11  standard; DNA; INV; 2121 BP.
XX
AC   X59837; S90749;
XX
DR   FLYBASE; FBte0000568; Dmel\pogo.
XX
FT   source          X59837:1..2121
FT   SO_feature      terminal_inverted_repeat ; SO:0000481:1..21
FT   SO_feature      terminal_inverted_repeat ; SO:0000481:2101..2121
FT   SO_feature      intron ; SO:0000188:1438..1541
XX
CC   Derived from X59837 (g8354) (Rel. 45, Last updated, Version 10).
CC   Takis Benos and Michael Ashburner, 20-Aug-1997.
CC   Any changes to original sequence record are annotated in an FT line.
CC   K. O'Hare, Personal communication to FlyBase, 1 May 2000.
CC   This is probably complete element.
XX
SQ   Sequence 2121 BP;  724 A; 353 C; 399 G; 645 T; 0 other;
     CAGTATAATT CGCTTAGCTG CATCGATAGT TAGCTGCATC GGCAAGATAT CTGCATTATT        60
     TTTCCATTTT TTTGTGTGAA TAGAAAATTT GTACGAAAAT TCATACGTTT GCTGCATCGC       120
     AGATAACAGC CTTTTTAACT TAAGTGCATC ATATCAGCTG TTTTTTTTGC CAATTTCAAT       180
     GAATATCATC AAAGTTAGCT GCGCCATCTA TGAATCATTT TTGCATATCT AAAAGATGCA       240
     AGAATGCCAA CTCGTTTCAG TATCTGCGCA TGTCCGTTTT TGTTTTTGCT TTGATCGTGA       300
     TTTTTGTGTT TTTGTTTCTT ATGGCACAAA GTTATTAAAA TGGGTAAAAC AAAGCGTGTC       360
     GTTGGACTAA CACTAAAGGA AAAGCTTCAA ATAATCGAGT TAGTGACCAA CAAAGTGGAC       420
     AAAAAGGAAA TTTGTGCCAA GTTCAAATGC GACAGATCCA CAGTCAACCG CATTTTACAA       480
     AAAACAAATG AAATTCATGA AGCTGTGGCC GCGTCAGGTT TAAAAAGAAA GCGTCAAAGA       540
     AAAGGAGCGC ACGACTTAGT AGAAGAAGCC TTATACATTT GGTTCGGACA GCAGGAATCA       600
     AAGAACGTAA TTCTTGACCG GCACGTCATA TTAGCAAAAG CGAAAGAATT TTGCCAAAAA       660
     TTTAACGACG CCTTTGAACC TGACGCCAGC TGGCTTTGGC GCTGGCGCAA GCGCCACAAT       720
     ATAAAGTATG GCAAAATACA CGGCGAAACT GCTACAAATG ATTCCGTATC AGCAAATGAG       780
     TACAAAAATG ATATTTTGCC AGGATTGCTT AAAGGTTATA ACCCAGAAGA CATTTTTAAC       840
     GCTGACGAAA CTGCACTCTT TTATAAAGCA ATGCCGAATG CGACATTTTT TACTTGTGGA       900
     AAGCAATTAA ATGGCCAGAA ATCTCAGAGA GTGAGACTTA CTTTGCTGTT TATATGCAAT       960
     GCAACTGGGA CATACAAAAA AACTTTTGTA ATCGGCAGAT CTAAATCGCC ACGATGCTTC      1020
     AAGAATGCTA ATGTGCCCAT TCCGTACTAT GCAAATAAGA AGGCCTGGAT GACTAAGGAT      1080
     CTCTGGCGAA AAATAATGAC AGGATTTGAC GAAGAAATGA AAAAGCAAAA TCGAAAGATT      1140
     TTACTCTTCA TCGACAATGC AACTAGTCAC ACGACTGTCA AGGACTTCGA AAACATAAAA      1200
     TTGTGCTTCA TGCCACCAAA CGCAACGGCT CTACTTCAAC CTCTGGACCA AGGTATTATC      1260
     CACTCATTCA AATTAGAGTA TAGGCGTATT TTGGTCAAAC AGCAGCTCAT TGCTGTTAAT      1320
     TGTGGTAAAT CTACTGTGGA ATTTTTAAAA TCATTATCGT TATTGGATGC TCTATATTTT      1380
     GTCAACCAAG GATGGAAGAA TGTTAAAATG TTAACTATTC AGAATTGTTT TAAAAAGGTA      1440
     AGATGGGATT ATTATTGATA TGTATCTCAA ATAACGAATT TATTATTTTC AGGCTGGATT      1500
     TAAGTTCAGT TTTGAAAATG AAGACACCAT TGCTGAAAAA GACAAACAAT GCGTAGAAGT      1560
     TGACATTGTA TCGAATATTA ATTGGAATGA ATATGCCAAT GTTGATGCAG ATGAGGCTTG      1620
     CCATGGTCAA TTAGATGATG ATGAAATCGT GCGCTCTTTA GTTCAAGATG CAAAAACCAG      1680
     CGATAACGAA GAAAGCCATA GTGATGAAGA TGTGGACGAT ACTGAGCGTC CTACTTTTAA      1740
     GGATGGGTTT GCAGCAATTA AGGCTTTAAA GTCCATTTTT ATGCGAAACA ATAATGATGA      1800
     GTTTTTGCAA AACTTGAATT CTATGGAAGA CAAGCTGTTT AATTTACATA TAAACTCAGC      1860
     TGTATTGCAA AAAAAAATTA CTGACTATTT TTAAGTTAGT TTTAAAAAGT GTTTTAATCA      1920
     ATTCACCATC ACTTAAATTT ATATGTCGAT CTTACTTATC ATTAAGAATG AAATTATCAG      1980
     TTCCTTTTAT GTTTAACATT GTTATAAAGA AATAAATTCT TTATTTTTCC TTAAAAAAAA      2040
     AAATTAAGTT AGCTGCATTT TTAAGTTACC TGCATCGAGG CATTGTGCAA AGTACTCGAG      2100
     GCAGCTAAGC GAATTATACT G                                                2121
//
ID   DMRER1DM   standard; DNA; INV; 5356 BP.
XX
AC   X51968;
XX
DR   FLYBASE; FBte0000118; Dmel\R1A1-element.
XX
FT   source          X51968:1..5356
FT   SO_feature      CDS ; SO:0000316:319..1731
FT                   /name="Dmel\R1A1-element\ORF1"
FT                   /db_xref="FLYBASE:FBgn0044825"
FT                   /db_xref="SWISS-PROT:P16424"
FT                   /db_xref="NCBI_PROTEIN:CAA36226.1"
FT                   /translation="PVSASIRLLDSSKGGATIGATPMESDSSVSALSGSSASKVSRRGR
FT                   RRSHLASKSSAPTQAKLVALASNGVPEPVGVLEEAFSSLEDARAATSNAANDAAPPAAA
FT                   PAVDHTVAPDVSTAAKIAATTATAATAAARAGQAAMMAELSATQRMVRNSFRSLGGVDT
FT                   EELSCAISRYDELVMALMLRCGELETRLAMPPPPPPPSKANTTAANAPQMPQVAPIAAP
FT                   RTTKVRETWSAVVKCDDPALSGKAIAEKVRTMVAPSLGVRVHEVRELPSRWWCDHSYSS
FT                   VGELQKVMASKRFAELGLNVARNAAEKPKVIVYDVDTAIGPEEFMQELHENNFDSEMTL
FT                   AQFKKSVHLVTKAWSATDGATVNVTLEVDDRAMAKLDVGRVYIKWFSFRCRSQVRTYAC
FT                   HRCVGFDHKVSECRQKESVCRQCGQQGHTAAKCQNPVDCRNCRHRGQPSGHYMLSNACP
FT                   IYGALLARVQARH"
FT   SO_feature      CDS ; SO:0000316:1728..4790
FT                   /name="Dmel\R1A1-element\ORF2"
FT                   /db_xref="FLYBASE:FBgn0044824"
FT                   /db_xref="SWISS-PROT:P16425"
FT                   /db_xref="NCBI_PROTEIN:CAA36227.1"
FT                   /translation="TLMFSFIQANCGRGRAATIELGVRLRRSESMFALVQEPYLGGDEM
FT                   DVLPEGMRVFTDRRGKAAILVDHQEAICMPVETLTTDYGVCLVVKGSFGSIFLCAAYCQ
FT                   FDAPLEPYLRYMDAVLLQASRTPAILGLDANAVSPMWLSKLSRHAEGQANYRRGELLSE
FT                   WMLEARVAALNQSTEVYTFDNHRATSDIDVTIVNEAASMWATYEWRVDEWELSDHNIIT
FT                   VVAEPTTARSVESIAPVPSWNFSNARWRLFKEEMVSRIAELPENFSESPLDQQVSTLRS
FT                   IVHSVCDTALGRKLTRSPSRRARWWTADLCAARREVRRLRRLLQDGRRRDDDAAVELVV
FT                   VELRRASAYYKKLIGRAKMDDWKRFVGDHADDPWGRVYKICRGRRKCTEIGCLRVNGEL
FT                   ITDWGDCARVLLRNFFPVAESEAPTAIAEEVPPALEVFEVDTCVARLKSRRSPGLDGIN
FT                   GTICKAVWRAIPEHLASLFSRCIRLGYFPAEWKCPRVVSLLKGPDKDKCEPSSYRGICL
FT                   LPVFGKVLEAIMVNRVREVLPEGCRWQFGFRQGRCVEDAWRHVKSSVGASAAQYVLGTF
FT                   VDFKGAFDNVEWSAALSRLADLGCREMGLWQSFFSGRRAVIRSSSGTVEVPVTRGCPQG
FT                   SISGPFIWDILMDVLLQRLQPYCQLSAYADDLLLLVEGNSRAVLEEKGAQLMSIVETWG
FT                   AEVGDCLSTSKTVIMLLKGALRRAPTVRFAGRNLPYVRSCRYLGITVSEGMKFLTHIAS
FT                   LRQRMTGVVGALARVLRADWGFSPRARRTIYDGLMAPCVLFGAPVWYDTAEQVAAQRRL
FT                   ASCQRLILLGCLSVCRTVSTVALQVLGGAPPLDLAAKLLAIKYKLKRGFPLEENDWLYG
FT                   EDIACLSWEQRKTRLEECLIQSWQNRWDDDSEPGRVTHRFIPYVTLAYRDPSFGFSMRT
FT                   SFLLTGHGSFNAFLHGRALSDTTACACGDPYEDWMHILCACPLYADLRDLDGLGVQRLG
FT                   ENWIFEGILDDQEKTQRLAMFAEEVFLRRRAL"
XX
CC   Derived from X51968 (g8429) (Rel. 23, Last updated, Version 1).
CC   Takis Benos and Michael Ashburner, 20-Aug-1997.
CC   Any changes to original sequence record are annotated in an FT line.
XX
SQ   Sequence 5356 BP;  1213 A; 1340 C; 1634 G; 1169 T; 0 other;
     CGGACGTGTT TTCGTTGCGC TCGTGGACAT AGTGCGAAGA ACTTTGTTTT CCGTATTTGG        60
     AAGTATACGG AATAAATAAT TTAGTGTTCC GTGGAAGTGG TGCGCAAATT TTCGCGAATT       120
     AAAAACAAGC GGTTTGGAAG TAATTGACAA TAAATTATTG GAAATTTTCC ACTCCGCACG       180
     TGTTGAGCGG CGGAGCTTGC GGGTGAGCTT TTCGAACAGC TGAGAGAAGC TTATTGGTGG       240
     TAGTCACCGC TAAGGATTGT GTCTTGGGAC AGCTTAGTGC ACTCTACCAA TAGGTGGAGC       300
     TATCACCATA GCAACTAGCC CGTGTCAGCG AGCATACGAT TGCTGGACTC GTCAAAAGGA       360
     GGAGCCACCA TCGGAGCAAC GCCGATGGAG AGCGACAGCA GTGTGAGTGC CTTGAGCGGA       420
     AGCAGTGCCT CAAAGGTGTC AAGACGAGGC AGGCGTAGGA GCCATCTGGC CTCCAAGAGC       480
     TCGGCGCCAA CGCAGGCGAA ACTGGTTGCC CTGGCCTCGA ATGGAGTGCC GGAACCCGTT       540
     GGTGTGCTGG AGGAGGCGTT TTCGTCGCTG GAGGATGCCC GGGCGGCTAC GTCAAACGCT       600
     GCCAACGATG CTGCCCCCCC CGCTGCTGCC CCCGCTGTTG ATCACACTGT TGCCCCTGAT       660
     GTTTCCACTG CTGCTAAAAT CGCTGCCACC ACTGCCACCG CTGCCACCGC TGCCGCCCGT       720
     GCTGGGCAAG CAGCCATGAT GGCAGAGCTG TCGGCCACCC AGCGCATGGT GCGAAACAGT       780
     TTCCGCAGCC TAGGAGGCGT AGACACGGAA GAGCTCTCGT GTGCCATCAG CCGCTATGAT       840
     GAGCTGGTGA TGGCATTAAT GCTCCGGTGT GGAGAACTGG AGACGCGGCT CGCTATGCCA       900
     CCACCGCCGC CGCCGCCGTC CAAGGCGAAC ACTACTGCCG CCAATGCTCC CCAGATGCCT       960
     CAGGTTGCAC CCATCGCTGC CCCGCGGACA ACCAAGGTTC GTGAGACGTG GTCAGCGGTG      1020
     GTGAAGTGCG ACGACCCTGC GCTATCGGGG AAAGCCATAG CCGAAAAGGT GCGGACGATG      1080
     GTTGCACCCT CCCTCGGAGT CAGAGTACAC GAGGTACGTG AGCTGCCGTC GAGGTGGTGG      1140
     TGCGATCATT CGTACTCTTC GGTTGGAGAG CTGCAGAAGG TGATGGCATC GAAAAGATTC      1200
     GCAGAACTTG GACTGAATGT GGCACGGAAC GCGGCCGAGA AGCCGAAGGT CATAGTCTAT      1260
     GACGTCGACA CAGCCATCGG CCCAGAAGAG TTCATGCAGG AGCTTCACGA GAACAACTTC      1320
     GACAGTGAAA TGACTCTGGC CCAGTTCAAA AAGTCGGTGC ACCTGGTGAC CAAGGCGTGG      1380
     TCGGCTACTG ACGGTGCCAC CGTAAACGTG ACGCTAGAGG TAGACGACCG GGCGATGGCG      1440
     AAACTTGATG TAGGACGTGT CTACATTAAG TGGTTTTCGT TCCGATGCCG ATCGCAAGTC      1500
     CGCACCTATG CCTGCCACAG ATGTGTGGGT TTCGACCACA AGGTTAGTGA ATGCAGGCAG      1560
     AAGGAGAGTG TTTGCCGCCA GTGCGGGCAA CAAGGCCACA CCGCGGCAAA GTGCCAAAAC      1620
     CCGGTGGACT GCCGGAACTG CCGTCACAGA GGGCAACCTT CGGGGCATTA TATGCTCTCG      1680
     AATGCTTGCC CGATATACGG AGCGTTGTTA GCGAGGGTGC AAGCTAGACA CTAATGTTTA      1740
     GCTTCATCCA AGCGAACTGT GGCCGAGGCA GAGCTGCGAC CATCGAGCTC GGAGTCCGAC      1800
     TCAGGAGATC GGAGTCAATG TTTGCTCTGG TGCAGGAGCC GTATCTTGGC GGGGATGAAA      1860
     TGGATGTGCT GCCTGAAGGA ATGAGGGTTT TCACCGACCG GCGAGGGAAG GCAGCCATCC      1920
     TAGTGGATCA TCAGGAAGCC ATCTGCATGC CAGTGGAAAC TCTCACCACA GATTATGGCG      1980
     TATGTCTGGT CGTTAAAGGG AGTTTTGGCT CAATCTTCCT TTGCGCCGCA TACTGCCAGT      2040
     TCGATGCACC TCTGGAACCG TACCTCCGGT ACATGGATGC GGTCCTGCTG CAGGCCAGCA      2100
     GAACCCCCGC AATCCTGGGC CTCGACGCGA ATGCAGTGTC CCCCATGTGG CTTAGCAAAC      2160
     TCTCTCGTCA TGCCGAGGGG CAAGCTAACT ACAGACGGGG TGAGCTGCTG TCTGAGTGGA      2220
     TGCTGGAGGC AAGAGTCGCC GCCCTAAACC AGTCAACAGA GGTGTACACG TTCGATAATC      2280
     ACAGAGCGAC TAGTGATATC GACGTGACAA TCGTCAATGA AGCAGCATCT ATGTGGGCCA      2340
     CATATGAGTG GAGAGTGGAC GAGTGGGAAT TGAGTGACCA CAACATCATT ACTGTTGTGG      2400
     CCGAACCAAC TACCGCGCGC TCAGTTGAGA GCATAGCTCC TGTGCCGTCC TGGAACTTCT      2460
     CCAATGCACG TTGGCGATTG TTCAAGGAGG AAATGGTGAG TAGAATAGCC GAACTTCCGG      2520
     AAAACTTTTC AGAGTCGCCG TTGGACCAGC AAGTTTCGAC CCTGCGCAGT ATAGTACATA      2580
     GTGTATGTGA TACTGCGCTA GGAAGGAAGT TGACTCGATC GCCCAGCAGG AGAGCACGTT      2640
     GGTGGACTGC CGACCTCTGC GCTGCAAGGC GCGAAGTCCG AAGACTTCGT CGCCTGCTCC      2700
     AAGATGGAAG GCGTCGAGAT GACGATGCCG CTGTAGAGCT TGTAGTGGTC GAGCTGAGGC      2760
     GTGCCTCAGC CTACTACAAG AAGCTCATTG GAAGGGCGAA GATGGATGAC TGGAAACGCT      2820
     TCGTGGGAGA TCATGCCGAC GACCCATGGG GGCGCGTCTA CAAGATTTGC CGAGGTCGCA      2880
     GGAAGTGCAC GGAGATTGGG TGCCTCCGCG TGAATGGCGA GCTGATCACT GATTGGGGTG      2940
     ACTGCGCACG AGTGCTCCTC CGCAATTTTT TCCCAGTTGC GGAGTCCGAA GCACCGACTG      3000
     CCATCGCGGA GGAAGTCCCA CCGGCCCTCG AAGTATTCGA GGTTGATACA TGTGTTGCCC      3060
     GGCTGAAGAG CAGGCGCTCT CCCGGGTTGG ACGGCATCAA TGGCACTATC TGCAAGGCAG      3120
     TCTGGCGCGC CATACCCGAG CACCTAGCAT CATTGTTTTC CCGATGCATC CGATTGGGAT      3180
     ACTTTCCAGC CGAGTGGAAG TGCCCACGAG TTGTCTCGTT GCTCAAAGGG CCAGATAAGG      3240
     ACAAGTGTGA GCCCTCCTCA TACAGAGGAA TATGCTTGCT ACCAGTCTTT GGAAAGGTGC      3300
     TCGAGGCCAT CATGGTGAAT CGTGTGAGAG AAGTTCTTCC GGAAGGCTGC AGATGGCAAT      3360
     TCGGATTTCG CCAAGGACGA TGTGTGGAGG ATGCTTGGAG GCACGTGAAG AGCAGTGTTG      3420
     GCGCCAGCGC GGCGCAATAC GTGCTCGGCA CATTCGTGGA CTTCAAAGGA GCATTCGACA      3480
     ACGTCGAATG GAGTGCTGCA CTCAGCCGAC TAGCCGACTT GGGATGCCGG GAAATGGGCT      3540
     TGTGGCAGAG CTTTTTCTCC GGCCGAAGAG CAGTGATCCG AAGCAGTTCC GGTACTGTGG      3600
     AGGTACCGGT AACTAGAGGC TGCCCGCAGG GATCAATCAG CGGCCCATTT ATCTGGGACA      3660
     TACTGATGGA TGTACTGCTT CAGCGTCTCC AGCCGTATTG CCAGCTGAGT GCATACGCGG      3720
     ATGACTTGCT GCTTCTCGTC GAGGGAAATT CCCGAGCTGT GCTAGAGGAA AAAGGAGCGC      3780
     AACTAATGTC CATCGTAGAA ACGTGGGGAG CGGAAGTTGG CGATTGCCTC TCGACCAGCA      3840
     AGACGGTAAT CATGCTGCTG AAAGGTGCCT TGAGACGTGC GCCTACGGTG AGGTTTGCTG      3900
     GACGGAACCT TCCGTATGTG CGTAGCTGTC GGTACCTTGG CATCACGGTC AGTGAAGGAA      3960
     TGAAATTCCT CACGCACATA GCTTCGCTTC GCCAGCGGAT GACAGGAGTC GTTGGAGCAT      4020
     TGGCGCGTGT GCTTCGAGCC GACTGGGGCT TCAGTCCTCG AGCCAGGCGG ACCATATATG      4080
     ACGGACTCAT GGCACCTTGT GTGCTGTTTG GTGCCCCGGT ATGGTATGAC ACCGCGGAAC      4140
     AAGTAGCTGC CCAGAGGCGA CTAGCCTCCT GCCAGAGGCT AATCCTGCTT GGATGCCTTT      4200
     CGGTATGCCG AACAGTATCC ACAGTGGCAC TGCAGGTACT TGGTGGAGCT CCCCCGCTTG      4260
     ATCTGGCTGC TAAGTTATTA GCGATCAAAT ACAAGCTAAA ACGTGGATTC CCGCTGGAGG      4320
     AGAACGACTG GCTTTACGGC GAGGACATTG CGTGTCTTAG CTGGGAGCAG AGGAAGACTC      4380
     GCCTAGAGGA GTGTTTAATC CAGAGTTGGC AGAACAGATG GGACGATGAC AGCGAACCAG      4440
     GACGGGTGAC GCATAGGTTT ATCCCATACG TCACTCTTGC CTATCGGGAT CCAAGTTTTG      4500
     GATTCTCGAT GAGGACGTCT TTCCTGCTTA CAGGGCACGG GTCGTTCAAT GCATTTTTGC      4560
     ACGGGAGAGC CCTCAGCGAT ACCACTGCTT GCGCATGTGG AGATCCATAT GAGGACTGGA      4620
     TGCATATCTT GTGCGCTTGC CCCCTATATG CAGATCTGCG GGACCTAGAT GGACTTGGAG      4680
     TGCAGCGCCT TGGCGAAAAC TGGATCTTCG AGGGAATCCT GGATGATCAA GAGAAGACTC      4740
     AACGGCTGGC AATGTTTGCG GAAGAAGTGT TCCTGAGGAG GAGGGCCCTT TAGCTCAACA      4800
     TCTCTGCCGT GTGGTTAGCG GGCGAGAATA CTACCACAGT CCGCTGTTGC TTGTCGTAAG      4860
     AGACGACTAA TACAGCGATA GGATTCCTCT AACCCTGCTT GTCGGAGCAA AAGGGGGAGG      4920
     CCCACCGAGC CTCTTTTCGG TACCACGGGT TGAGCAGCTA TCCAAGACTG CTCATTGAGG      4980
     TAGGCCCCCT GGTGGGAGTA TCGTGGTGGC TGTGGTTGGT ACCCATATCG CGGGTAGAGC      5040
     CTTCATGCTC GACGTTTGAG TTACGGTGCT AGTTGCGCAA AACTCGGGTG CTGTGACCCA      5100
     GAGATCAGTA GAGATTTTAG GTAGATCTCG CTCCTCAGCA AGGGGGAGTG CTTGCCCGGC      5160
     AAGCAAGTAC TCGAATTGCT ACCGGGGTGG TCGCTATGTA CATAGCTATA GCTTCTAGTC      5220
     CGGGACGCTT GTCTGGCGTA TCCAGACACA TGCACCATAT GCTCACTTGT GGGCGTATAG      5280
     GGTGCCGTGG TTGTAATCCC TTCAGTGTGG AACACGCCAC GTAAAATAAG TTCGGAGGGA      5340
     TCCGAAAAGC ATACAT                                                      5356
//
ID   DMRER2DM   standard; DNA; INV; 3607 BP.
XX
AC   X51967;
XX
DR   FLYBASE; FBte0000030; Dmel\R2-element.
XX
FT   source          X51967:1..3607
FT   SO_feature      CDS ; SO:0000316:181..3351
FT                   /name="Dmel\R2-element\ORF"
FT                   /db_xref="FLYBASE:FBgn0016699"
FT                   /db_xref="SWISS-PROT:P16423"
FT                   /db_xref="NCBI_PROTEIN:CAA36225.1"
FT                   /translation="FERKNFSDGLVPQRKFIHIGTTSTNNEPRIPLHNLMTTRPSVDIF
FT                   PEDQYEPNAAATLSRVPCTVCGRSFNSKRGLGVHMRSRHPDELDEERRRVDIKARWSDE
FT                   EKWMMARKEVELTANGCKHINKQLAVYFANRSVEAIKKLRQRGDYKEKIEQIRGQSALA
FT                   PEVANLTIRRRPSRSEQDHQVTTSETTPITPFEQSNREILRTLRGYSPVECHSKWRAQE
FT                   LQTIIDRAHLEGKETTLQCLSLYLLGIFPAQGVRHTLTRPPRRPRNRRESRRQQYAVVQ
FT                   RNWDKHKGRCIKSLLNGTDESVMPSQEIMVPYWREVMTQPSPSSCSGEVIQMDHSLERV
FT                   WSAITEQDLRASRVSLSSSPGPDGITPKSAREVPSGIMLRIMNLILWCGNLPHSIRLAR
FT                   TVFIPKTVTAKRPQDFRPISVPSVLVRQLNAILATRLNSSINWDPRQRGFLPTDGCADN
FT                   ATIVDLVLRHSHKHFRSCYIANLDVSKAFDSLSHASIYDTLRAYGAPKGFVDYVQNTYE
FT                   GGGTSLNGDGWSSEEFVPARGVKQGDPLSPILFNLVMDRLLRTLPSEIGAKVGNAITNA
FT                   AAFADDLVLFAETRMGLQVLLDKTLDFLSIVGLKLNADKCFTVGIKGQPKQKCTVLEAQ
FT                   SFYVGSSEIPSLKRTDEWKYLGINFTATGRVRCNPAEDIGPKLQRLTKAPLKPQQRLFA
FT                   LRTVLIPQLYHKLALGSVAIGVLRKTDKLIRYYVRRWLNLPLDVPIAFVHAPPKSGGLG
FT                   IPSLRWVAPMLRLRRLSNIKWPHLTQNEVASSFLEAEKQRARDRLLAEQNELLSRPAIE
FT                   KYWANKLYLSVDGSGLREGGHYGPQHGWVSQPTRLLTGKEYMDGIRLRINALPTKSRTT
FT                   RGRHELERQCRAGCDAPETTNHIMQKCYRSHGRRVARHNCVVNRIKRGLEERGCVVIVE
FT                   PSLQCESGLNKPDLVALRQNHIDVIDTQIVTDGHSMDDAHQRKINRYDRPDIRTELRRR
FT                   FEAAGDIEFHSATLNWRGIWSGQSVKRLIAKGLLSKYDSHIISVQVMRGSLGCFKQFMY
FT                   LSGFSRDWT"
XX
CC   Derived from X51967 (g8432) (Rel. 24, Last updated, Version 1).
CC   Takis Benos and Michael Ashburner, 20-Aug-1997.
CC   Any changes to original sequence record are annotated in an FT line.
XX
SQ   Sequence 3607 BP;  1064 A; 818 C; 900 G; 825 T; 0 other;
     TTGGGGATCA TGGGGTATTT GAGAGCAGAG GGGGAGTATT CTTCTGTAAT TCGTAAGTCA        60
     TATCATATGA TGTGCGGAAG GGGAATTTTA CTCTGTAACT CACAAGTCTC TCCTTTACTC       120
     AAGTCGACTC AAAACCTCCT CGTGGTGGTC CCGGTAATGC TAAACTCGTT TAGCAGCTAA       180
     TTTGAGCGGA AAAACTTTTC CGATGGGCTG GTTCCCCAGA GGAAATTTAT TCATATTGGA       240
     ACTACAAGCA CAAATAACGA GCCTCGGATA CCTTTACACA ATCTGATGAC GACCCGACCC       300
     TCCGTGGATA TCTTCCCGGA GGACCAATAT GAACCAAACG CAGCGGCTAC TCTATCTAGG       360
     GTTCCCTGCA CAGTATGTGG CCGGTCCTTT AACAGCAAGA GAGGACTCGG TGTTCACATG       420
     CGATCTCGGC ACCCAGACGA ACTTGATGAA GAACGTCGAC GTGTCGATAT AAAGGCAAGA       480
     TGGAGTGATG AAGAGAAGTG GATGATGGCG AGAAAGGAGG TTGAGCTCAC AGCAAATGGA       540
     TGTAAACACA TAAACAAGCA ACTAGCGGTG TATTTTGCAA ACCGCAGCGT CGAAGCCATC       600
     AAAAAGCTAA GACAGAGGGG CGATTATAAG GAGAAAATAG AGCAGATAAG AGGGCAATCA       660
     GCTCTCGCCC CGGAAGTTGC TAATCTAACC ATAAGGCGCC GCCCTAGTAG AAGTGAGCAA       720
     GACCACCAAG TAACAACATC GGAAACAACT CCAATCACTC CCTTCGAACA GTCGAACAGG       780
     GAAATTTTGC GGACACTACG CGGGTATAGC CCCGTAGAAT GCCATTCCAA ATGGAGAGCC       840
     CAAGAGTTGC AAACTATCAT TGATAGGGCA CATCTCGAGG GAAAGGAAAC CACTCTCCAA       900
     TGCTTATCGC TATATCTCCT GGGAATTTTT CCGGCACAGG GTGTACGACA CACACTGACG       960
     AGACCTCCTC GGAGACCTCG GAACAGGAGA GAAAGCAGAA GGCAGCAGTA CGCTGTCGTC      1020
     CAGCGTAACT GGGATAAGCA TAAAGGAAGA TGCATCAAGT CCTTGCTAAA TGGAACTGAT      1080
     GAGTCGGTAA TGCCAAGCCA AGAAATAATG GTTCCCTACT GGAGAGAAGT AATGACTCAG      1140
     CCTAGCCCAA GCTCTTGCAG TGGAGAAGTG ATACAAATGG ATCACTCGCT TGAGAGGGTA      1200
     TGGTCTGCTA TTACAGAGCA GGACCTTCGG GCGTCAAGAG TCTCATTATC CTCGTCTCCG      1260
     GGGCCTGACG GGATAACTCC AAAATCTGCC AGGGAGGTGC CGTCAGGTAT TATGCTGCGC      1320
     ATAATGAACC TAATTCTATG GTGCGGTAAT CTACCACACT CCATACGACT GGCCAGAACC      1380
     GTCTTCATCC CGAAGACGGT GACGGCGAAG CGACCGCAAG ACTTTCGTCC AATATCAGTG      1440
     CCTTCAGTCC TGGTAAGACA GCTAAATGCA ATATTGGCAA CCCGGTTGAA CTCATCAATC      1500
     AATTGGGACC CGCGCCAGCG GGGCTTCTTA CCAACCGACG GATGCGCCGA TAATGCGACG      1560
     ATAGTCGACT TAGTCTTGAG GCATAGCCAT AAGCACTTTA GATCTTGCTA CATCGCAAAT      1620
     TTAGATGTAA GCAAGGCATT TGATTCTCTA TCACATGCAT CTATATACGA CACCTTACGT      1680
     GCTTATGGTG CGCCAAAGGG CTTCGTTGAC TACGTACAGA ACACGTACGA GGGCGGTGGT      1740
     ACCAGTCTCA ATGGGGACGG TTGGAGTTCA GAGGAATTCG TCCCTGCTAG AGGAGTGAAG      1800
     CAGGGTGACC CTTTGTCTCC TATTCTATTT AACTTGGTAA TGGACAGGTT ACTTAGAACC      1860
     TTACCCAGCG AAATTGGTGC CAAAGTCGGA AATGCCATTA CTAACGCGGC CGCGTTTGCA      1920
     GATGATTTGG TACTATTTGC GGAAACTCGG ATGGGGCTTC AAGTATTGTT GGACAAGACG      1980
     TTGGATTTTC TATCTATCGT CGGCCTCAAA CTTAATGCCG ACAAATGTTT TACCGTTGGC      2040
     ATTAAGGGCC AGCCGAAACA GAAGTGTACC GTGTTAGAGG CACAGAGCTT CTACGTAGGC      2100
     TCGAGTGAGA TTCCATCACT GAAGCGCACG GACGAGTGGA AGTACTTAGG CATCAACTTC      2160
     ACTGCAACCG GGAGGGTTCG ATGCAATCCG GCCGAGGACA TTGGTCCAAA GCTACAAAGA      2220
     TTGACAAAGG CCCCCCTCAA ACCACAACAG AGGTTGTTCG CCCTTCGGAC TGTCCTTATC      2280
     CCACAGCTCT ACCACAAGTT AGCCCTTGGG AGTGTGGCGA TAGGCGTCCT AAGAAAAACT      2340
     GATAAACTTA TAAGATATTA TGTGCGAAGA TGGCTAAATC TTCCGCTGGA TGTGCCGATA      2400
     GCATTTGTTC ATGCACCCCC AAAAAGTGGA GGTCTCGGAA TTCCATCACT AAGATGGGTA      2460
     GCTCCAATGT TAAGGCTAAG ACGCTTGAGT AACATTAAAT GGCCTCACCT CACGCAAAAC      2520
     GAGGTAGCCA GCTCTTTCCT CGAAGCCGAA AAACAACGGG CCCGAGATAG ATTATTAGCT      2580
     GAACAAAATG AACTGTTATC GCGTCCGGCA ATAGAAAAAT ATTGGGCGAA CAAGTTGTAC      2640
     CTCTCAGTTG ATGGTAGCGG ACTCCGTGAA GGCGGCCATT ATGGCCCGCA ACACGGGTGG      2700
     GTTAGTCAAC CCACGCGTTT ATTAACAGGA AAGGAATATA TGGACGGTAT TCGTCTGCGG      2760
     ATAAATGCCC TACCCACAAA GTCTCGTACT ACAAGGGGAA GGCACGAATT GGAACGACAG      2820
     TGTCGTGCAG GATGTGATGC TCCCGAAACA ACAAACCACA TAATGCAAAA ATGCTACCGC      2880
     TCGCATGGGA GGCGGGTAGC TAGACACAAC TGCGTAGTAA ATCGAATCAA GCGGGGACTT      2940
     GAGGAGAGAG GCTGCGTGGT CATTGTTGAA CCAAGTCTGC AGTGCGAATC CGGCCTTAAT      3000
     AAACCAGACC TGGTGGCACT ACGACAAAAT CACATTGATG TGATCGACAC ACAAATTGTG      3060
     ACAGACGGAC ACTCTATGGA TGATGCGCAC CAGCGCAAAA TCAATAGATA CGACAGACCG      3120
     GACATACGAA CTGAATTGCG TCGCAGATTC GAAGCCGCAG GTGACATTGA ATTCCATTCT      3180
     GCCACCCTGA ACTGGAGGGG GATCTGGAGT GGTCAATCCG TTAAAAGATT GATAGCAAAG      3240
     GGTCTCCTCA GCAAATATGA TAGTCATATC ATTAGCGTCC AGGTTATGAG AGGCAGTCTC      3300
     GGTTGTTTTA AACAGTTCAT GTACCTGAGC GGGTTTTCCC GAGATTGGAC TTAGCTAAAT      3360
     CGTTTGGTTC AAAACATTTG CTTGCTGTCT TGGCATAACA TCAATAAAGG CATAAACATC      3420
     GCAAAATAAT GGTTATAATT AAATGGCTAT GAGGATGGTT TTAGTACGTA GGCGTTGCGG      3480
     AACTTCGGTT CATATAGAGC AATGAATCGT GCATGCTAGG AAAACTGACC ACACACAGTG      3540
     TTGGCAGACC TAGTATCTTT CGAAGATTTC CATACCTCCG CGATCAAAAA AAAAAAAAAA      3600
     AAAAAAA                                                                3607
//
ID   DM33463    standard; DNA; INV; 1736 BP.
XX
AC   U33463;
XX
DR   FLYBASE; FBte0001005; Dmel\S-element.
XX
FT   source          U33463:37..1772
FT   SO_feature      terminal_inverted_repeat ; SO:0000481:1..234
FT   SO_feature      terminal_inverted_repeat ; SO:0000481:1503..1736
FT   SO_feature      CDS ; SO:0000316:404..1441
FT   SO_feature      start_codon ; SO:0000318:1..3
FT                   /name="Dmel\S-element\T"
FT                   /db_xref="FLYBASE:FBgn0044019"
FT                   /db_xref="REMTREMBL:AAC47095"
FT                   /db_xref="NCBI_PROTEIN:AAC47095.1"
FT                   /translation="MPGKRLAFEVTQLIYYNHQLGKSIPELVEIFSVSRKTVYNILNRX
FT                   XKEGRLEPKSGGGCKTKINKRVDRLIMRKAIANPRISVRSLAQDIREECHLTVSHETVR
FT                   QVILRHRYSSRVARKKPLLSEINIEKRHSFAVSMMDHAEEYWDDVIFCDETKMMLFYND
FT                   GPSRVWRKPLSALETQNIIPTIKFGKLSVMIWGCISSHGVGKLAFIESTMNAVQYLDIL
FT                   KTNLKASAEKFGLFSNNKPNFKFYQDNDPKHKEYNVRNWLLYNCGKVIDTPPQSPDLNP
FT                   IENLWAYLKKKVAKRGPKTRQQLMAAIIEEWEKIPLEYDLKKLIHSMKKRLQLVAKANG
FT                   GHTKY"
XX
CC   Derived from U33463 (g1006788) (Rel. 47, Last updated, Version 5).
CC   Takis Benos and Michael Ashburner, 20-Aug-1997.
CC   Any changes to original sequence record are annotated in an FT line.
XX
SQ   Sequence 1736 BP;  600 A; 287 C; 300 G; 545 T; 4 other;
     CAGTTTGTCA AGAAACTGTT TACACACCGC AAAATAAGTA GAATTTTTGA CTTTAAAGGC        60
     CAAAATTAAG GGTTTTTTGC TTAATTAAAC GCAATTTTTT TATGAAATAT AATTAAACAA       120
     TATTTATTTT ACTTATAAAT TAAAAAACAA ATTCAATATA TCAAATATAC AAGAAAATAA       180
     ACAACAAATT TCTTGTTTAC ACACTTTTGA GAGTGCCAAG AAACTCTTTA CACAGTTTTG       240
     GGTTCCTACT TTGTTTTGCT CTTTTTCTTA GAAACAATCT CATTTTTCCG TTATTTTTGT       300
     CTTATGCATT CCTTTTTACA ACGCTTCTAT TGCAATTTTT TCACTTTGCT TGTGAAATTT       360
     TGTTGATCTA ACGTGCTTAA AGCGAATTAT TAAATTTAAT GAAATGCCTG GAAAGAGATT       420
     GGCTTTTGAA GTGACCCAGC TAATATACTA TAACCACCAG TTGGGAAAAT CTATTCCTGA       480
     ATTAGTAGAA ATATTTTCCG TATCCCGTAA AACCGTCTAT AATATTTTAA ATCGTNNNNA       540
     AAAAGAGGGC AGGCTTGAAC CTAAGAGTGG TGGTGGGTGT AAAACGAAAA TTAACAAGCG       600
     AGTAGACCGC CTTATTATGC GAAAAGCGAT TGCGAACCCC CGAATCTCGG TCAGATCACT       660
     TGCTCAGGAT ATCAGGGAAG AATGTCACCT AACTGTATCA CACGAAACTG TGCGCCAAGT       720
     CATCCTACGC CATAGGTACT CTTCAAGAGT TGCAAGAAAA AAGCCTTTGC TATCAGAGAT       780
     CAATATTGAA AAGCGTCATT CATTCGCTGT GAGCATGATG GATCATGCGG AAGAGTACTG       840
     GGATGACGTC ATATTTTGTG ACGAAACAAA AATGATGCTC TTTTATAACG ATGGGCCAAG       900
     CAGAGTATGG CGCAAACCGT TGAGTGCGCT AGAAACACAA AATATAATTC CAACAATCAA       960
     ATTTGGAAAA TTGTCAGTGA TGATTTGGGG CTGTATTTCC AGCCATGGAG TGGGCAAACT      1020
     AGCCTTTATT GAAAGCACTA TGAATGCCGT GCAATATCTA GATATTTTAA AAACAAATTT      1080
     GAAGGCCAGT GCAGAAAAAT TTGGTTTGTT TAGCAACAAC AAGCCAAATT TTAAGTTTTA      1140
     TCAGGACAAT GATCCCAAAC ATAAAGAGTA CAATGTACGC AACTGGCTAC TCTATAACTG      1200
     TGGCAAGGTG ATCGATACGC CCCCTCAGAG TCCTGATCTA AACCCCATTG AAAATTTGTG      1260
     GGCCTACTTA AAGAAGAAGG TTGCAAAAAG GGGCCCCAAA ACTCGACAAC AACTCATGGC      1320
     TGCGATAATC GAAGAGTGGG AAAAGATCCC GCTTGAATAT GACCTAAAAA AACTCATACA      1380
     TTCCATGAAA AAAAGGCTTC AACTTGTAGC CAAAGCCAAT GGGGGTCATA CTAAATACTA      1440
     AAACTTTTCA AATATTATCA AAATAATTAA AAAATTTAGG ATTAAACTTA GGTTTAGTGT      1500
     TTTGTGTAAA GAGTTTCTTG ACACTCTCAA AAGTGTGTAA ACTTGAAATT TGTTGTTTAT      1560
     TTTCTTGTAT ATTTGATATA TTGAATTTGT TTTTTAATTT ATAAGTAAAA TAAATATTGT      1620
     TTAATTATAT TTCATAAAAA AATTGCGTTT AATTAAGCGA AAAACCCTTA ATTTTGACCT      1680
     TTAAAGTCAA AAATTCTACT TATTTTACGG TGTGTAAACA GTTTCTTGAC AAACTG          1736
//
ID   SPRINGER    standard; DNA; INV; 7546 BP.
XX
AC   AF364549;
XX
DR   FLYBASE; FBte0000333; Dmel\springer.
XX
FT   source          AF364549:1..7546
FT   SO_feature      five_prime_LTR ; SO:0000425:1..403
FT   SO_feature      three_prime_LTR ; SO:0000426:7143..7546
FT   SO_feature      CDS ; SO:0000316:1058..2422
FT   SO_feature      start_codon ; SO:0000318:1..3
FT                   /name="Dmel\springer\gag"
FT                   /db_xref="FLYBASE:FBgn0044343"
FT                   /db_xref="SPTREMBL:Q967T6"
FT                   /db_xref="NCBI_PROTEIN:AAK52057.1"
FT                   /translation="MSESFRQYRNSKKCASDSESESDDSTENSVRKNTPTNAFTAYKMS
FT                   LETEQIKALIRALQEQALESQRREADLRKTIQDLAGQVAAIQIAPARAEAPPIKVYRPV
FT                   EITGLVPCGETLDAVKCLPDFMGTQETYVSWRQAANAAYHMFRKYEDSSRHYQAVVIIR
FT                   SKVKGPADAVLSSFGTILNFDAIISRLDFTYSDKRPIHVIEQELGTLRQGSLTLLQYYD
FT                   EVEKKLTLLTNKATMSYEASAATVLCEKFRDDALRVFVSGLRRNLTDVLFAAKPKDMPS
FT                   ALALAQEVESNHERYTFATSFARSQEDRDHKQYPKVQERQRAPPQAGSQGSAGKNPHFT
FT                   KQHRAQVHSAPRSDRMARENMPEPMDVDPSLSRMQPSHAPAYPKSKPAASGRSVPPKRQ
FT                   RVNHVAQASDDLDKVYNTAASSAAVKVDDDSILEYDSDTINFLGESPCYPSSDEE"
FT   SO_feature      CDS ; SO:0000316:2434..5475
FT   SO_feature      start_codon ; SO:0000318:1..3
FT                   /name="Dmel\springer\pol"
FT                   /db_xref="FLYBASE:FBgn0044342"
FT                   /db_xref="SPTREMBL:Q967T5"
FT                   /db_xref="NCBI_PROTEIN:AAK52055.1"
FT                   /translation="MKLLIDTGAAKNFIRPFKGLKGVRPVQSPFTIHSIHGVTTITKKC
FT                   FVSIFNLKATFFLLPDLTSFDAIVGLDLLKQAGASLCLASGKLKWGSGAEQIDFHTCPD
FT                   VNFTKVDCSDAPPLIKDAFLKMLGNRKKAFADPNEALPYNTSVVATIRTVDEEPIYAKL
FT                   YPYPMGAADFVNGEIQELLKNGIIQKSKSPYNNPIWVVDKKGTDDAGNKKMRLVLDFRK
FT                   LNERTVPDRYPMPNISMILGNLGKAKYFTTLDLKSGYHQITLAERDREKTAFAVNGGKY
FT                   EFRRLPFGLRNAASIFQRTIDDILREQIGKFCYVYVDDVIIFSEDENDHVKHVDWVLKS
FT                   LYDANMRISAEKSRFFKKSVSFLGFIVTNNGAATDPEKVKAIKEFPEPKNVFEVRSFLG
FT                   LASYYRCFIKDFASIARPISDILKGENGSVSRHRSRSIQVEFSEAQQRAFEKLRNILAS
FT                   EDVILRYPDYKKAFDLTTDASAYGIGAVLSQEGRPITMISRTLSDREVNYATNERELLA
FT                   IVWALAKLRHYLYAVKEINIFTDHQPLTFAVSESNPNAKIKRWKARIDESGARIFYKPG
FT                   RNNLVADALSRQQLNVVEEQEPESCAATIHSELSLTHTIESTDKPVNCFQNQIILEEAR
FT                   SHWKRTFILFGNKRRHSINFSCKQALLEELANIIIPNGVNAFHCDLHTLALIQDDVVRQ
FT                   FPATKFWHCKNRVTDIFAMQERKEILTVEHNRAHRSAQENVKQVLSEYYFPKMTKLASE
FT                   IAANCKTCAKAKYDRHPKKQELGETPVPTHVGEILHIDIFSTDKKYFLTCVDKFSKFAM
FT                   VQPILSRTIEDLKAPLLQLMNVFPKAKTIYCDNEPSLKSQTIVAMLENHFGVSISNAPP
FT                   LHSVSNGQVERFHSTLIELARCLKIDKGISDTVELVLLATARYNMSIHSVINKKPAEVM
FT                   RADPDDPHTDVQEKIKNAQILTRKRENASRQNRVFQVGDKVLVKSNRRLGNKLTPLCEE
FT                   KTIEADLGTTVLIKGRVVHKDNLK"
FT   SO_feature      CDS ; SO:0000316:5870..7147
FT   SO_feature      start_codon ; SO:0000318:1..3
FT                   /name="Dmel\springer\env"
FT                   /db_xref="FLYBASE:FBgn0044344"
FT                   /db_xref="SPTREMBL:Q967T4"
FT                   /db_xref="NCBI_PROTEIN:AAK52056.1"
FT                   /translation="MLDMFPQSHMKKLLSVDIAHLRDMLDSLSIHHRVARSLDFLGTAL
FT                   KVVAGTPDAEDFEKVKFTEARLVDAHNSQIEINTKTQVRINELTDTINKLLKISKSAQI
FT                   DTGHLYETLSTRNRIIVMELQNLMLTITLAKINVVSPNFLDHADLESIWGEEPTNTPIR
FT                   EILSVASVKVLQSLNILHFIIKFPKIIMACNKVTILPVVHHDTVLRLKDNVVAECNREI
FT                   RTVKNCSITPGATFCQLSSVSSCAQELHAGVVAHCDAQQSDLHPITYVDEGIIVINDRP
FT                   ALVRVDNGTAIHIRGTHLITFIESAMVNETVFFNHDMVQNRAPGVANSPVLNISMKHEV
FT                   LSLPYLHRLSEKNLEQIRNFEKDVDGYRLSQIALVAGAIFCALICIGLTWQRTTRAKKS
FT                   TAQLKEVLAQIGSAEGGLNLEEGIVN"
XX
CC   Derived from BACR06P08 by Sue Celniker, 29 March 2001.
CC   Michael Ashburner, 9-Apr-2001.
CC   Any changes to original sequence record are annotated in an FT line.
XX
SQ   Sequence 7546 BP; 2131 A; 1909 C; 1712 G; 1794 T; 0 other;
     AGTTAACTAA GTTAACCGGA CTGATCGTCC GCACACCAGC ACCGGTCAAA CTGCTGACCA        60
     AGCATTTGGC CGGAAGCTCA TGCATAGCCG GCAGAAGCTC TGCGCATTGG CAGAGGCCGC       120
     TATGATGTTT TTCCCTTTGT TAGCTTATAG TCAGTTTGAT TTTGTATTCA ATAAAGAGCG       180
     CATCGCGCCT TCAATCAACT CCAGCTACTG CTGTTATCAT TGAATTGGTT GGCTAGCCTT       240
     AAGGGCAGTC AACAACGGAG AGACGTTCTC CCACCATATC TCCCAATCTA GGAGAAGAGG       300
     TCTGCGGCAA CCGCCCTGCC TCCCAGTGAC AGAAGAACCC CCCGTTACCT GCAACCTACG       360
     CCGGAGACCG CGGCGAGGGA CCTGCACCTT ATATTTAATT AATTGGCACC CAACTCCAGG       420
     AACCCACACC ACTACCCTGA ATCATGTAAG TGGGATTCTC AACTTAAACA CTACTCCAAA       480
     CTGCGTCTAG AATTTTAAAA TATTTGGGAT GTTTGTGCGA GTTACATAAA TAAATTAAGA       540
     AAATCGGCAT TTCCACTACA ATAAACGTTT ATATGTGTTG CGAATTAAGA TTATGTTACT       600
     GTTATGAAGT TTAAATATCG AATTTTGATT TGTGGTTGAC TTTGCAATCC ATATTGTGTG       660
     CATTTCATTC CGCCTTCGCA CATCCGCGGG ACACTGTCGT TTCATTCGAA ATTTAATTCG       720
     CTACATTGGC TTCACAGCCC TTTCAAGCTT TGTTGTTTTT GACCCACTCC ACTTCGCTAC       780
     CCGATACTGG CGCATGCATT GCTGTGACAA TTTTGTGCCT TTTATTTATC TCTTTGTCTT       840
     TGCTGTGGCA ATTTTTGTCT TTGGATATTT GTTTGCCTTA TTGGAGACCC GCTCCCCGCA       900
     GGCCCTTCAC CTTATCGTTA CTTAGCTGGA CAGTGGCTCT GCTCGTTGAG TCTTCGTCCA       960
     ATGCCTTCAA AGCGGCGACT CAGCCCCCGC GACCCCCTTG CCGTACTGTT TGGCCCCACG      1020
     GGCACAACGG CCTGAGTATT CACATACATA GCTACCCATG AGCGAGTCAT TCCGACAATA      1080
     TAGGAATTCT AAAAAGTGCG CTAGCGACTC AGAGTCCGAA AGCGACGATT CGACAGAAAA      1140
     CTCTGTACGT AAAAACACCC CAACTAACGC ATTCACTGCA TATAAAATGT CCCTCGAAAC      1200
     GGAACAAATT AAAGCTCTCA TAAGGGCATT ACAAGAGCAA GCCTTAGAGA GTCAACGCAG      1260
     GGAGGCTGAC TTGCGTAAAA CAATTCAAGA TCTGGCCGGC CAGGTCGCGG CCATACAGAT      1320
     TGCCCCTGCC CGGGCAGAAG CTCCCCCAAT CAAAGTTTAC AGACCAGTAG AAATCACCGG      1380
     ACTGGTCCCT TGTGGGGAAA CATTGGATGC CGTTAAATGT CTTCCAGACT TTATGGGGAC      1440
     ACAGGAGACA TACGTCTCCT GGCGGCAAGC GGCAAATGCC GCTTACCATA TGTTCAGGAA      1500
     ATATGAGGAT AGTTCGCGGC ACTATCAAGC TGTGGTCATC ATCAGGAGCA AAGTTAAAGG      1560
     CCCTGCTGAT GCAGTTCTGT CGTCCTTTGG GACTATACTG AATTTCGATG CGATCATAAG      1620
     TCGCCTCGAT TTCACGTATA GTGACAAACG CCCGATACAC GTTATCGAGC AGGAGCTAGG      1680
     CACCCTCAGA CAGGGAAGCC TGACGCTCCT CCAGTATTAT GATGAGGTCG AGAAAAAACT      1740
     CACCTTACTC ACCAATAAGG CGACTATGTC TTATGAAGCG TCGGCAGCAA CGGTGCTGTG      1800
     TGAGAAGTTC CGAGATGATG CTTTGAGAGT TTTTGTCTCG GGGCTCAGGC GCAACCTCAC      1860
     AGACGTGCTA TTCGCGGCAA AGCCTAAGGA CATGCCGTCA GCGCTCGCCC TGGCGCAAGA      1920
     AGTAGAGTCC AATCATGAGC GGTACACTTT TGCAACTTCA TTTGCACGAA GCCAAGAGGA      1980
     TAGGGACCAC AAGCAATATC CCAAAGTGCA GGAGCGCCAA CGGGCCCCCC CACAAGCCGG      2040
     CTCGCAGGGA AGTGCTGGGA AGAACCCGCA CTTTACTAAG CAGCATAGAG CACAGGTGCA      2100
     CTCCGCTCCA CGTAGCGACC GAATGGCCCG AGAAAACATG CCAGAACCCA TGGACGTTGA      2160
     CCCGTCGTTG TCCAGGATGC AGCCATCTCA CGCCCCGGCT TACCCGAAAT CGAAGCCGGC      2220
     CGCGTCTGGC CGTTCGGTCC CACCAAAAAG GCAAAGGGTC AACCATGTTG CCCAGGCCTC      2280
     TGATGATTTG GACAAGGTTT ATAACACCGC AGCCTCCAGT GCAGCAGTTA AAGTCGACGA      2340
     CGATTCCATC CTAGAGTACG ACTCGGATAC CATTAATTTT TTAGGGGAAA GTCCCTGCTA      2400
     CCCGTCATCA GACGAAGAGT AGCGGGGATC GACATGAAAC TACTGATTGA TACGGGCGCG      2460
     GCAAAAAATT TTATCCGACC ATTTAAGGGG TTGAAAGGCG TCCGCCCGGT GCAGTCCCCA      2520
     TTTACAATCC ATTCGATTCA TGGTGTGACT ACAATAACTA AGAAATGTTT CGTGTCCATT      2580
     TTTAATCTTA AAGCTACCTT TTTTTTATTA CCAGACTTGA CCTCCTTTGA CGCGATCGTT      2640
     GGCCTAGACC TGTTAAAACA GGCCGGCGCG TCACTTTGCC TAGCTTCCGG CAAGCTCAAA      2700
     TGGGGCTCCG GAGCAGAGCA AATTGACTTT CATACTTGCC CCGATGTCAA TTTCACCAAA      2760
     GTAGATTGCT CGGACGCACC GCCCTTAATT AAGGATGCTT TTTTAAAAAT GCTCGGGAAT      2820
     AGGAAAAAAG CTTTTGCTGA TCCTAATGAG GCTCTTCCTT ACAATACGTC GGTGGTAGCC      2880
     ACCATCCGGA CGGTTGATGA GGAGCCCATT TATGCCAAGT TATACCCATA TCCCATGGGA      2940
     GCAGCTGACT TCGTCAACGG CGAAATTCAG GAACTGCTTA AAAATGGCAT AATCCAAAAG      3000
     TCAAAGTCCC CCTACAATAA CCCAATATGG GTCGTAGACA AAAAGGGCAC TGACGATGCG      3060
     GGCAATAAAA AAATGCGCTT GGTGCTGGAC TTTCGAAAAC TTAACGAAAG GACGGTACCA      3120
     GACAGATACC CCATGCCAAA TATCTCTATG ATATTGGGGA ATCTCGGCAA GGCCAAATAC      3180
     TTCACGACCC TCGATCTGAA GTCTGGCTAC CACCAAATCA CGCTCGCAGA ACGCGACCGT      3240
     GAAAAGACAG CGTTCGCAGT AAACGGAGGG AAGTATGAGT TCCGAAGGCT GCCATTCGGA      3300
     CTCAGGAATG CTGCAAGCAT CTTCCAAAGA ACAATTGACG ATATTCTGCG AGAGCAGATC      3360
     GGAAAGTTCT GCTACGTTTA CGTCGATGAC GTCATCATCT TTTCGGAAGA TGAAAACGAC      3420
     CATGTCAAGC ATGTAGATTG GGTTCTGAAG AGCCTGTACG ACGCTAACAT GAGAATATCG      3480
     GCAGAAAAGT CACGTTTTTT TAAGAAAAGC GTGAGCTTCC TGGGGTTCAT CGTCACCAAC      3540
     AATGGGGCGG CGACTGACCC AGAAAAGGTT AAGGCCATAA AGGAATTTCC GGAACCCAAA      3600
     AACGTATTTG AGGTAAGGTC ATTCTTGGGC TTAGCCAGCT ATTATCGTTG CTTTATCAAA      3660
     GACTTCGCAT CAATAGCTAG GCCCATTTCA GACATATTGA AGGGCGAGAA CGGTAGTGTT      3720
     AGCCGACACA GGTCCAGGAG TATCCAGGTA GAATTTTCCG AAGCGCAACA ACGTGCCTTC      3780
     GAAAAGCTAC GCAATATCCT GGCGTCTGAG GACGTCATCC TGAGATACCC TGATTACAAA      3840
     AAAGCGTTTG ATCTAACGAC AGACGCTTCG GCCTACGGCA TTGGCGCAGT GCTGTCCCAG      3900
     GAGGGACGTC CCATTACAAT GATCTCAAGG ACATTGTCTG ACAGAGAGGT TAACTATGCT      3960
     ACCAACGAAA GGGAGCTGTT AGCCATAGTC TGGGCACTGG CTAAGTTGCG GCACTACCTG      4020
     TATGCGGTTA AAGAGATAAA CATCTTTACC GATCACCAAC CTCTGACGTT CGCGGTATCG      4080
     GAGTCCAATC CGAACGCCAA AATTAAGAGA TGGAAAGCAC GCATCGACGA GTCCGGCGCA      4140
     CGAATTTTTT ACAAGCCTGG GAGAAACAAC CTCGTTGCAG ATGCCCTCTC GAGACAACAA      4200
     CTCAACGTTG TTGAAGAGCA AGAACCGGAG TCGTGCGCGG CCACGATTCA CAGCGAACTT      4260
     TCGCTTACGC ACACGATCGA GTCCACGGAC AAACCCGTGA ATTGCTTCCA GAACCAGATA      4320
     ATTTTGGAAG AGGCGCGCTC CCATTGGAAA CGCACTTTTA TATTATTTGG GAATAAGAGG      4380
     CGGCACTCGA TCAATTTCTC GTGCAAACAA GCTTTGCTGG AGGAACTCGC CAACATCATT      4440
     ATCCCTAATG GTGTAAACGC CTTCCACTGT GATCTTCACA CGCTGGCGCT AATCCAGGAC      4500
     GACGTAGTTC GACAGTTTCC AGCCACGAAA TTCTGGCATT GTAAGAATAG GGTCACCGAC      4560
     ATCTTCGCGA TGCAGGAGAG AAAAGAAATC CTCACCGTCG AGCACAACAG AGCTCACAGG      4620
     TCGGCCCAAG AAAACGTGAA ACAAGTACTC TCCGAGTACT ACTTCCCGAA AATGACCAAA      4680
     TTGGCGAGCG AAATAGCAGC CAATTGCAAA ACTTGCGCAA AGGCGAAGTA TGACAGACAT      4740
     CCGAAGAAGC AGGAGCTCGG TGAGACACCA GTCCCGACCC ACGTAGGAGA AATATTGCAC      4800
     ATCGATATTT TCTCAACGGA TAAAAAATAC TTTCTCACCT GTGTTGACAA GTTTTCTAAA      4860
     TTCGCCATGG TACAGCCGAT TCTGTCTAGA ACCATAGAAG ATTTGAAAGC ACCCCTTTTA      4920
     CAACTTATGA ATGTTTTCCC CAAAGCCAAA ACCATCTACT GCGACAATGA ACCATCATTG      4980
     AAATCGCAGA CAATAGTGGC TATGCTGGAA AACCATTTTG GCGTCAGCAT TTCGAATGCA      5040
     CCGCCCCTAC ATAGCGTCTC AAACGGACAG GTGGAACGAT TCCACAGCAC GTTAATTGAG      5100
     CTCGCCAGAT GCCTAAAAAT CGACAAAGGC ATAAGTGACA CAGTGGAATT GGTCTTGCTG      5160
     GCCACAGCCA GATATAACAT GTCCATCCAC TCCGTCATCA ATAAAAAACC GGCCGAAGTC      5220
     ATGCGGGCAG ATCCGGACGA TCCACATACC GATGTCCAAG AAAAAATCAA AAACGCCCAG      5280
     ATTTTGACAA GAAAACGAGA GAACGCTTCT CGGCAGAACA GAGTGTTCCA GGTCGGCGAC      5340
     AAAGTCCTAG TAAAGTCAAA CAGACGATTA GGCAACAAAC TTACTCCTTT ATGTGAGGAG      5400
     AAGACCATCG AGGCAGACTT GGGGACCACA GTCCTTATTA AAGGGAGGGT GGTCCATAAA      5460
     GACAACCTCA AGTGACCCAA GCAGAGCCTA GCCGCGGCTC CCTCGGAGGC ACACTTTTAT      5520
     TCCTCCAATT TGTAGCCACT CGGCATAAGT TTTTTCATTG TTTTTATAGC CGCTTGGCAT      5580
     AAGTTTTTTA TTTTTTAGCC ACTTGGCATA TTTTTTATAT ATTTTCGCTA TTATTGGTGG      5640
     TGGGCAACTC CATTCCGAAC AAGTAATAAT TTATCACACA CGTTACAGGT CGCTCCCAAC      5700
     CCTTCTTCTT TGTTTCCTGG CCACGACATC GGCCCACATT ACTGACTATT CCCGAGCGAA      5760
     TTACATTCCC GTCATTGACG GTAAAGTCTT AGTCTGGGAG GAATTCGCCT ATGTCAGACA      5820
     CTCGGCTAAC CTCTCCGAGT ATAGGCGGGT AATTGACGAA ACCGACAGCA TGCTCGATAT      5880
     GTTCCCCCAG TCCCATATGA AGAAGCTCCT GAGCGTTGAT ATCGCTCACC TCCGTGACAT      5940
     GCTTGATTCT TTGAGCATCC ATCACAGAGT GGCAAGGAGC CTAGACTTCT TGGGAACTGC      6000
     GTTAAAGGTT GTCGCAGGGA CACCTGACGC GGAAGACTTC GAGAAAGTCA AGTTCACTGA      6060
     AGCGCGGCTT GTTGATGCAC ACAATAGCCA AATCGAAATA AACACCAAAA CACAAGTTCG      6120
     AATTAACGAA CTCACTGATA CCATAAATAA ACTTTTAAAA ATTTCCAAAA GCGCTCAGAT      6180
     TGATACAGGT CACCTGTATG AAACGCTTTC TACTCGCAAC AGAATCATTG TAATGGAATT      6240
     GCAAAACTTA ATGCTCACTA TAACCCTCGC TAAAATTAAC GTAGTGAGTC CAAACTTCTT      6300
     GGACCACGCA GATCTGGAGA GTATTTGGGG CGAGGAGCCC ACCAACACCC CCATAAGGGA      6360
     GATTTTGTCC GTTGCGTCTG TAAAAGTCCT ACAATCCCTT AACATCTTAC ACTTTATTAT      6420
     TAAATTCCCC AAGATTATCA TGGCGTGCAA CAAAGTCACT ATCCTTCCAG TGGTACACCA      6480
     CGATACGGTG TTAAGGTTGA AAGATAATGT GGTAGCAGAG TGCAACAGAG AAATACGCAC      6540
     AGTAAAGAAT TGCTCCATAA CACCAGGGGC AACATTTTGC CAGTTATCTT CAGTGAGCTC      6600
     GTGTGCGCAG GAGCTCCACG CTGGGGTCGT AGCACATTGC GACGCACAGC AGAGTGATCT      6660
     ACATCCGATC ACCTACGTCG ACGAAGGAAT AATCGTCATC AATGACAGAC CAGCACTCGT      6720
     GCGTGTGGAC AATGGAACGG CCATCCACAT TAGAGGCACG CACCTCATAA CATTCATTGA      6780
     GAGTGCCATG GTCAACGAGA CCGTCTTCTT TAATCATGAC ATGGTCCAGA ATAGGGCGCC      6840
     GGGAGTGGCT AATTCCCCAG TCCTTAATAT CTCGATGAAA CACGAGGTCC TGAGCCTCCC      6900
     ATACCTTCAC CGTTTAAGTG AAAAGAACTT GGAGCAAATC AGGAACTTCG AGAAGGACGT      6960
     CGACGGATAC CGACTAAGTC AGATAGCGTT AGTTGCGGGA GCAATTTTCT GCGCTCTTAT      7020
     CTGCATCGGT TTAACCTGGC AGCGAACCAC TAGGGCCAAG AAATCTACAG CCCAACTGAA      7080
     GGAAGTTCTC GCCCAAATAG GGTCAGCCGA GGGCGGCCTT AATCTTGAGG AGGGAATAGT      7140
     TAACTAAGTT AACCGGACTG ATCGTCCGCA CACCAGCACC GGTCAAACTG CTGACCAAGC      7200
     ATTTGGCCGG AAGCTCATGC ATAGCCGGCA GAAGCTCTGC GCATTGGCAG AGGCCGCTAT      7260
     GATGTTTTTC CCTTTGTTAG CTTATAGTCA GTTTGATTTT GTATTCAATA AAGAGCGCAT      7320
     CGCGCCTTCA ATCAACTCCA GCTACTGCTG TTATCATTGA ATTGGTTGGC TAGCCTTAAG      7380
     GGCAGTCAAC AACGGAGAGA CGTTCTCCCA CCATATCTCC CAATCTAGGA GAAGAGGTCT      7440
     GCGGCAACCG CCCTGCCTCC CAGTGACAGA AGAACCCCCC GTTACCTGCA ACCTACGCCG      7500
     GAGACCGCGG CGAGGGACCT GCACCTTATA TTTAATTAAT TTAACT                     7546
//
ID   TARTC    standard; DNA; INV; 11124 BP.
XX
AC   AY600955;
XX
DR   FLYBASE; FBte0001208; Dmel\TART-C.
XX
FT   source          AY600955:1..11124
FT   SO_feature      non_LTR_retrotransposon ; SO:0000189
CC                   telomeric retrotransposon
FT   SO_feature      direct_repeat ; SO:0000314:1..331
FT   SO_feature      direct_repeat ; SO:0000314:10383..10713
FT   SO_feature      five_prime_UTR ; SO:0000204:1..205
FT   SO_feature      three_prime_UTR ; SO:0000205:6629..11102
FT   SO_feature      non_LTR_retrotransposon_polymeric_tract ; SO:0000433:11103..11124
CC                   derived from polyA tail of RNA transposition intermediate
FT   SO_feature      CDS ; SO:0000316:206..3349
FT   SO_feature      start_codon ; SO:0000318:1..3
FT                   /name="Dmel\TART-element\gag"
FT                   /db_xref="FLYBASE:FBgn0014071"
FT                   /db_xref="NCBI_PROTEIN:AAT12844.1"
FT                   /db_xref="SPTREMBL:Q6J4U8"
FT                   /translation="MDGHNGDINEGWATVLSISSDDSNQLSSPPSIIVSSLDTTPTSN
FT                   ETTIVRRSLHNPKADMKSYRFENIVLNENKNTILPDPLFVDKCGNTANTTEANEKKPA
FT                   NSPFPISIIKNLSTSSPLTHVDTPTQEDDASAFNTLKAAKTARIIFPTHTQIKPAKPS
FT                   PPSKELSTNSAPKTLSYTDKITVTQKNLPDKTHVDRPTQDDDINATKASKTAKIISTQ
FT                   LHLRETKPTQPAKDPSPRTQKPIANKAAETLTHTDKLIASQNLVPAKTHINSPTQYND
FT                   TNATNALKTAKINFSSHSHQSEIKPTQSAKNISPLTQKQFTSESAGTHTHTDKHKNTA
FT                   SQNLFSAKTHINSPTQHNDTSAATASKTAKLILSPHSHLSETKPTQPALSPSPLSQKQ
FT                   ITSIAAKTLTHTNKHTASQNFIPAKTHINIPTQYNDTNATKALKTAKAASPSHTYSRQ
FT                   TKPIKPAINALHAAQDTNPSPAISAVTYTDKPTATQNIFPVKTFAELIRENAKRSPTP
FT                   IENPPQAKHDSAALGRPPTAARKNLNKTLISPKTPGKRRGDCLDEGLLQTSNKKVRIR
FT                   DDFSDDDLGVTNLLSETPLFKSKAAIKIRQDSRRESLQKSAEMDTAPAISPSNAAADP
FT                   DLPPWKTVPASRKPPSIFLSNIQQIIPLIEKLNYKAGVNSFTTKSELGNNIRIQAKTM
FT                   DAYNAIQNVLLEANIPLHSHQPKSAKGFQIVIRHLHQSTPTKWIESQLQDIGIATKFI
FT                   RAMQFRDTRNPMRIHEVEVVPKADGSHLKVLLIKSLGGQTVKVERKRVSKDPTQCHRC
FT                   QCFGHTKNYCRNPFKCMKCGQLHASVSCTKPKNLPATCANCNGSHVSSYKGCPVFQEA
FT                   KQRLSINKIQSLHSQPTHLQTPRNKHPYPKPTHIQTPLNKQPYTHPLPRTLVNNTKLP
FT                   AKRIQGKKISQRNLSINKRLNRIRTLDRKPRNETSPPTTSKKVLASLEESRKNPNSAL
FT                   NPANTHLTHFRPPPLAQNIPNDESKELSGEQYLLNRIEGMEKKLNNLLEIVTRLLSQG
FT                   KDCPKSPKNPFRDPIFV"
FT   SO_feature      CDS ; SO:0000316:3350..6628
FT   SO_feature      start_codon ; SO:0000318:1..3
FT                   /name="Dmel\TART-element\pol"
FT                   /db_xref="FLYBASE:FBgn0014072"
FT                   /db_xref="NCBI_PROTEIN:AAT12845.1"
FT                   /db_xref="SPTREMBL:Q6J4U7"
FT                   /translation="MLFLVTSEVTFPMTRECNRDILKIAFWNAGGINNKIDELKLFIL
FT                   NIDAHIIIVTETRLDNNSTKLELPGYFTYLAQNPASSKRGGVATIVNSSLRHMALEPI
FT                   EKECIQSAPIVLLPENNRRSEMIVIASVYCPPSLSWSPHHFTDVLNFAEKTMGGQTKL
FT                   ILCGDWNAKHRQWGCIRACQRGAALYDAIQADSMAEIVATGSATHFPHDTRKSPSAID
FT                   FSICKRLGRYEKRISSSAHLSSDHLPILLEINLDIKTISLQKQNNNILKKTTNIELFK
FT                   NVLERKILLNTEIRVAEDINDAINIFIKNIKDSAAESTPSPRIPDNHRRRYGQANRNS
FT                   HTLTLDENTSRLLEEKRIQSRIFKATRTNEDKTKLKAAENRLKKVIKILREKRINEQI
FT                   EGIDTNNPDRMRKIWRLLSEGKKMNQPNFPLKLETKKGPKWTKTIKETTEAFVSHLEG
FT                   RFKPNKIVPDYHIDKVNTGLRIIKESMLTERHNLNKNPHNQPITLNELNEEIKNLKNS
FT                   KAPGKDLITNQLIKTLPTKATLYLILIYNSILRLGYYPEAWKHAQVKMILKPGKSSNE
FT                   PKSYRPISLLSGLSKMFERLLLKRLFRVDLFKKAIPLHQFGFRKEHGTEQQIARVTQF
FT                   ILEAFERKEYCSAVFLDISEAFDRVWHEGLLLKLAKILPYNLYIILESYLTNRTFEVK
FT                   DQAGETSRTGQIGAGVPQGSNLGPLLYSIFSSDMPLPYIYRPSPTQRIMLSTYADDTI
FT                   VLSSDTLATAATRNNENYLKTFSDWADKWGISVNAAKTGHVIFTLKNDLPTNSMNVKI
FT                   KGQTIKKESKQSYLGVTLDSKLTLSSHVTKLLGKYSTAYRKLTWILNGRSKLPTKTKI
FT                   LILKSVLSPIWQYAIAAWGPLVTDAQIRRVQVEENRKIRDICRAGRYTRNQTIRDLFG
FT                   VKTVEEFYQQAMHRFSETIKSHPNIAVRRILSRHYIPNRLERSRQRYFKMTNDHITQK
FT                   QTGLALSPKLLKIPDIDDCRTVKKRSEREKIRQMHLTELPTLLRLEEEEEELKRIKKQ
FT                   EEREKRERENQKWPPDRWCELEINRYNKQYRKGDLTRQEVIEKFRGQPLNVQRIILPD
FT                   YEGD"
XX
CC   A PNTR (Perfect Non-Terminal Repeat) is a perfect direct repeat partially
CC   overlapping the UTRs (annotated as "direct_repeat ; SO:0000314").
CC   Distinguishing characteristics of PNTR’s are that the 3’ repeat terminates
CC   upstream of the 3’ end of the element and that the 5’ PNTR extends a short
CC   distance into ORF-1. The 5’ ends of TART-C elements are variable and the
CC   minimal size for functionality has not been determined.  Thus, this
CC   canonical sequence, AY600955, may be 5’ truncated within the 5’ PNTR (M-L
CC   Pardue, 2009).
XX
CC   Derived from AY600955, Michael Ashburner, 6-Apr-2004; updated Jan-2009 as
CC   per Mary-Lou Pardue and Greg DeBaryshe.
CC   Any changes to original sequence record are annotated in an FT line.
XX
SQ   Sequence 11124 BP; 3774 A; 2893 C; 2173 G; 2284 T; 0 other;
     AAGCTTCGCG GGATATCGAT AACAATCAGG TGGTTAAAAA TACTATAACA TCGAGTACCA        60
     GCCGTGTTTT TCCTGTCGAT TTATCGAAGT CCAACAGCCC GCCTTCGCTC CGAACACAAA       120
     TCGGCAAGTC AGTAGCTTTT TTAACCCGGC AGTGGCGCCT GTGCAGCAGC TATTTAAAGT       180
     GAAAAACACG AAACGCAACA ACAAAATGGA CGGCCATAAT GGAGACATAA ATGAAGGATG       240
     GGCAACAGTA CTATCTATCT CGTCGGATGA TAGTAACCAA CTTTCGTCGC CGCCGTCAAT       300
     TATAGTCTCA TCGCTGGACA CCACGCCAAC GTCAAACGAA ACCACCATAG TAAGAAGAAG       360
     CCTACACAAC CCAAAAGCTG ACATGAAATC TTACAGATTT GAAAATATTG TATTAAATGA       420
     AAATAAAAAT ACCATATTGC CAGATCCTTT ATTTGTTGAT AAATGCGGAA ATACTGCTAA       480
     TACCACAGAA GCCAATGAAA AAAAGCCTGC CAATAGCCCC TTCCCCATTT CCATTATCAA       540
     GAATCTTAGC ACTTCCTCGC CACTAACACA TGTAGACACG CCTACACAAG AAGATGACGC       600
     CAGTGCATTC AATACATTGA AAGCAGCCAA AACAGCTAGA ATAATTTTTC CCACACACAC       660
     ACAGATAAAG CCCGCCAAAC CCTCGCCCCC TTCCAAAGAA TTAAGCACAA ACTCAGCACC       720
     CAAAACTCTT AGCTACACAG ACAAAATTAC AGTAACACAG AAAAATCTAC CCGACAAAAC       780
     ACATGTAGAC AGACCTACAC AAGATGACGA CATTAATGCA ACCAAAGCAT CAAAAACCGC       840
     CAAAATAATT TCTACACAGT TACACCTACG TGAAACCAAG CCAACACAGC CCGCCAAAGA       900
     CCCCTCACCC CGCACCCAAA AGCCTATTGC AAACAAAGCA GCCGAGACAC TCACCCACAC       960
     AGACAAACTC ATAGCATCAC AAAACCTAGT TCCCGCCAAA ACACATATAA ACTCCCCCAC      1020
     ACAATATAAC GACACTAATG CAACCAATGC ATTAAAAACC GCTAAAATAA ATTTCTCTTC      1080
     ACACTCACAC CAAAGTGAAA TCAAGCCAAC ACAGTCCGCC AAAAACATTT CACCCCTCAC      1140
     ACAAAAGCAA TTCACAAGCG AATCAGCCGG GACACACACC CATACAGACA AACACAAAAA      1200
     CACAGCATCA CAAAATCTCT TTTCCGCCAA AACACACATT AACTCACCCA CACAACATAA      1260
     CGACACTAGT GCAGCCACAG CATCAAAAAC CGCTAAATTA ATTCTCTCCC CACACTCACA      1320
     CCTAAGTGAA ACCAAGCCCA CACAGCCCGC TTTAAGCCCC TCGCCCCTCT CCCAGAAGCA      1380
     AATAACAAGC ATAGCAGCCA AGACACTCAC CCACACAAAC AAACACACAG CATCACAAAA      1440
     CTTTATTCCC GCCAAAACAC ATATAAACAT ACCCACACAA TATAACGACA CCAATGCAAC      1500
     CAAAGCATTA AAAACCGCAA AAGCAGCTTC TCCCTCCCAC ACATACTCAC GTCAGACAAA      1560
     ACCAATAAAG CCCGCCATAA ACGCATTGCA TGCCGCCCAA GACACAAACC CAAGCCCAGC      1620
     AATCAGTGCT GTCACTTACA CAGACAAACC CACAGCTACT CAGAATATTT TTCCTGTCAA      1680
     AACTTTTGCA GAGCTGATTA GAGAAAATGC AAAACGCTCA CCAACTCCAA TCGAAAATCC      1740
     CCCTCAAGCA AAACATGACT CTGCCGCCCT CGGACGCCCT CCGACTGCAG CTAGAAAAAA      1800
     TCTAAATAAA ACACTGATTT CTCCTAAAAC TCCTGGGAAG CGCCGTGGGG ACTGTCTTGA      1860
     TGAAGGCCTA CTTCAAACCT CTAACAAAAA GGTTAGAATA CGCGACGACT TCTCTGATGA      1920
     TGATCTGGGG GTCACAAACC TACTCTCTGA AACACCCTTA TTCAAAAGCA AAGCAGCTAT      1980
     TAAGATTCGG CAAGACTCGA GAAGAGAATC CCTGCAGAAG TCAGCTGAAA TGGACACAGC      2040
     TCCAGCAATA AGTCCCTCAA ACGCAGCAGC CGATCCCGAC CTACCGCCCT GGAAAACTGT      2100
     TCCAGCTAGC AGAAAACCAC CATCAATCTT CCTGTCCAAT ATACAGCAGA TTATCCCGCT      2160
     AATAGAAAAA CTAAACTATA AAGCCGGGGT AAATAGCTTT ACTACCAAGT CTGAACTTGG      2220
     CAACAATATT AGAATCCAGG CTAAAACGAT GGACGCCTAC AATGCAATTC AGAATGTCCT      2280
     CCTTGAAGCA AACATTCCCC TACACTCTCA CCAGCCAAAG AGTGCAAAGG GCTTCCAAAT      2340
     TGTAATTAGG CACCTCCACC AGTCAACCCC GACCAAATGG ATTGAAAGCC AACTTCAAGA      2400
     CATCGGTATA GCTACAAAAT TTATCAGGGC AATGCAGTTT AGGGACACGA GAAATCCTAT      2460
     GCGCATCCAT GAGGTTGAGG TTGTACCCAA GGCTGACGGC AGCCATCTTA AGGTCCTGCT      2520
     AATAAAATCC CTTGGAGGAC AAACGGTCAA GGTCGAAAGG AAACGGGTAT CGAAGGATCC      2580
     TACACAATGC CACCGCTGCC AATGCTTTGG ACACACAAAA AATTATTGCA GAAACCCGTT      2640
     TAAATGTATG AAATGTGGCC AGCTGCACGC CTCGGTCTCA TGCACCAAAC CCAAAAACCT      2700
     TCCGGCTACT TGTGCAAACT GCAATGGAAG CCACGTTAGC AGCTATAAAG GATGTCCTGT      2760
     TTTCCAAGAA GCAAAGCAAA GACTATCTAT CAACAAAATT CAATCCCTTC ACTCACAACC      2820
     CACCCACCTT CAGACCCCCC GCAATAAACA TCCCTACCCA AAACCCACCC ACATTCAGAC      2880
     GCCCCTCAAT AAGCAGCCCT ACACACACCC CCTCCCTCGC ACATTAGTAA ACAACACAAA      2940
     ACTACCTGCC AAAAGAATCC AAGGAAAGAA GATATCGCAA AGGAATCTAT CTATAAATAA      3000
     ACGCTTAAAC AGAATCAGGA CATTGGACAG AAAACCGAGG AATGAGACAA GCCCGCCGAC      3060
     AACTAGCAAA AAGGTCTTGG CCTCTCTAGA AGAAAGCAGA AAAAACCCAA ATAGCGCCCT      3120
     AAACCCGGCC AACACCCATC TCACTCATTT CCGCCCACCA CCATTAGCAC AAAATATTCC      3180
     TAATGACGAA TCTAAGGAGC TGAGTGGGGA GCAATACCTT TTAAATCGCA TTGAAGGGAT      3240
     GGAAAAGAAG CTCAACAACC TTCTTGAAAT CGTCACCCGC CTACTAAGCC AAGGAAAAGA      3300
     CTGTCCAAAG TCTCCAAAAA ATCCTTTCCG AGATCCAATC TTCGTTTAAA TGCTCTTTCT      3360
     AGTAACATCA GAAGTGACGT TTCCTATGAC TCGGGAGTGC AACAGGGACA TCCTTAAAAT      3420
     CGCTTTCTGG AATGCTGGTG GGATCAACAA TAAAATAGAT GAGCTTAAGC TGTTCATTCT      3480
     AAATATTGAT GCCCACATAA TCATAGTCAC CGAAACTAGA CTAGACAACA ATTCTACCAA      3540
     ACTAGAGCTG CCAGGATATT TCACATACTT AGCCCAAAAT CCTGCCTCTA GCAAGAGAGG      3600
     AGGAGTCGCC ACGATAGTAA ACAGTAGTCT CCGCCACATG GCCTTAGAAC CGATTGAAAA      3660
     GGAATGCATA CAGAGTGCCC CAATAGTATT ACTGCCTGAA AACAACAGAC GCAGCGAAAT      3720
     GATTGTAATA GCATCTGTCT ACTGTCCGCC TTCGCTAAGC TGGTCGCCCC ACCATTTTAC      3780
     TGACGTTCTC AATTTTGCTG AGAAAACTAT GGGAGGGCAG ACTAAGCTCA TTCTATGTGG      3840
     CGACTGGAAC GCAAAACATA GACAATGGGG TTGTATACGC GCCTGCCAAC GTGGCGCCGC      3900
     ACTCTACGAT GCAATTCAAG CAGACTCCAT GGCTGAAATC GTCGCGACTG GCAGCGCTAC      3960
     ACATTTCCCG CACGATACAA GGAAAAGCCC GTCAGCAATA GACTTCTCGA TATGTAAACG      4020
     GCTTGGCAGG TATGAAAAAA GAATCTCCTC AAGTGCACAC CTATCCTCAG ACCATCTTCC      4080
     CATATTACTT GAGATAAACC TAGATATAAA AACCATCTCC CTGCAAAAAC AAAACAACAA      4140
     TATCCTCAAG AAAACAACGA ACATTGAGCT CTTTAAGAAC GTTCTAGAAA GGAAGATACT      4200
     TCTAAACACT GAGATAAGGG TAGCAGAAGA CATAAATGAC GCCATAAACA TCTTTATTAA      4260
     AAACATCAAG GACTCGGCTG CTGAATCAAC TCCCTCCCCA AGAATTCCTG ATAACCACAG      4320
     AAGAAGATAT GGGCAAGCTA ACAGAAATAG TCATACGCTC ACACTAGACG AAAACACAAG      4380
     CAGATTGCTG GAAGAAAAAC GTATACAAAG TAGAATTTTT AAAGCTACTA GAACGAACGA      4440
     GGACAAAACT AAACTAAAAG CAGCTGAAAA TCGACTTAAA AAAGTAATCA AAATCTTAAG      4500
     AGAAAAGAGA ATCAATGAGC AAATTGAAGG AATTGACACA AATAACCCGG ACAGAATGAG      4560
     GAAAATTTGG AGGCTGCTGA GTGAAGGGAA AAAAATGAAT CAACCCAACT TTCCCCTCAA      4620
     ATTAGAAACC AAAAAAGGCC CTAAATGGAC TAAAACAATT AAGGAGACAA CAGAAGCGTT      4680
     TGTCTCCCAC CTGGAAGGAA GATTCAAGCC AAATAAAATT GTACCTGATT ACCACATAGA      4740
     TAAGGTTAAC ACCGGACTAA GAATAATTAA GGAAAGCATG CTAACAGAAC GACATAATCT      4800
     AAACAAAAAC CCCCATAACC AACCCATTAC GCTAAACGAA TTAAATGAAG AAATAAAAAA      4860
     CTTAAAGAAT AGCAAAGCAC CTGGTAAAGA CCTTATAACA AACCAGCTCA TAAAAACCCT      4920
     ACCGACTAAA GCTACCCTGT ACCTTATCCT AATCTATAAC TCCATACTTA GATTAGGATA      4980
     CTACCCTGAA GCCTGGAAAC ATGCACAGGT AAAAATGATC CTGAAGCCAG GGAAAAGCTC      5040
     AAACGAGCCG AAGTCATACA GGCCGATTAG TCTACTCTCG GGACTCTCTA AAATGTTTGA      5100
     AAGACTACTC CTAAAAAGAC TTTTTAGGGT AGATCTATTC AAAAAAGCCA TACCACTGCA      5160
     CCAATTTGGC TTCAGAAAAG AGCACGGAAC TGAGCAGCAA ATAGCCAGGG TCACCCAGTT      5220
     CATCCTCGAG GCCTTCGAGC GGAAGGAATA CTGCTCAGCG GTTTTCCTTG ACATCTCTGA      5280
     GGCCTTTGAT AGGGTATGGC ACGAAGGCCT TTTACTTAAA TTAGCTAAGA TCCTACCTTA      5340
     CAACCTATAC ATTATACTGG AGAGCTACCT TACAAATAGA ACGTTCGAAG TTAAAGACCA      5400
     AGCAGGAGAG ACTTCGAGAA CAGGACAAAT AGGCGCAGGA GTGCCTCAAG GAAGCAATCT      5460
     CGGACCACTA CTTTACTCTA TCTTCTCCTC TGACATGCCC CTCCCATATA TCTACCGCCC      5520
     TTCACCAACA CAAAGAATTA TGCTCTCAAC ATACGCAGAC GACACTATAG TCCTCAGCTC      5580
     AGACACACTA GCAACTGCCG CCACAAGAAA CAACGAAAAC TACCTCAAGA CATTTTCGGA      5640
     CTGGGCGGAC AAATGGGGTA TCTCAGTAAA CGCTGCTAAA ACCGGACATG TCATTTTTAC      5700
     ATTAAAAAAC GACTTACCTA CAAACTCAAT GAATGTGAAG ATCAAGGGTC AAACAATAAA      5760
     GAAGGAAAGC AAGCAATCAT ACCTTGGGGT AACCCTTGAT AGCAAGCTAA CCCTTAGCTC      5820
     TCACGTCACA AAGCTATTGG GTAAATACTC TACAGCCTAC AGAAAATTGA CATGGATCCT      5880
     AAACGGAAGA AGTAAACTCC CTACTAAAAC TAAGATACTG ATCCTTAAAT CAGTTTTATC      5940
     ACCAATATGG CAGTATGCCA TAGCAGCTTG GGGTCCCCTT GTGACAGATG CACAGATAAG      6000
     GAGGGTCCAG GTTGAGGAAA ACAGAAAAAT AAGAGACATA TGTAGAGCGG GAAGATATAC      6060
     GAGAAACCAA ACTATAAGGG ACCTTTTTGG CGTCAAAACA GTAGAAGAAT TCTATCAACA      6120
     GGCTATGCAC AGGTTCTCAG AAACTATAAA ATCGCACCCA AATATAGCTG TTCGCAGGAT      6180
     TCTCTCTAGG CACTATATCC CGAACAGACT AGAAAGAAGC AGGCAGAGGT ACTTTAAAAT      6240
     GACAAATGAT CATATCACGC AAAAGCAGAC TGGACTTGCC CTCTCACCTA AACTCTTAAA      6300
     AATCCCTGAT ATAGATGACT GCAGAACCGT AAAAAAGCGT AGCGAGAGAG AGAAAATAAG      6360
     ACAAATGCAT CTAACTGAAC TCCCCACCTT GCTGAGACTA GAGGAAGAGG AGGAAGAGCT      6420
     CAAAAGAATA AAAAAACAGG AAGAAAGGGA AAAAAGAGAA AGGGAAAACC AAAAGTGGCC      6480
     TCCAGATAGA TGGTGCGAAT TGGAAATAAA CCGATATAAT AAACAATATA GAAAGGGCGA      6540
     CCTAACCAGG CAGGAAGTTA TAGAAAAATT CAGAGGGCAA CCATTAAATG TACAACGAAT      6600
     AATCCTACCC GACTATGAAG GGGACTAAAA TTAAATCAAA ACAAACCAGG ACAGGAGCAG      6660
     AAGGCAGAAA TAATCAAAAC TGGCGGAAGG GGTGGCAAAA TATTGAAAAG AGAGGAAAGA      6720
     AATATAAAAA GGCTAAAGGC TAAGTTACAG GTTACATAAA AAGGGAAATC TGCTTATAGA      6780
     TATTATGGTA AAATTAACTT AACTAAACAC CTACTGGTTA ACAAAATAAT TATGCCTGCA      6840
     TGGCACAAGC TGCGTACTCA AATCATTTCT CCTGACGCTA TTGAAAATCC ATCTTTACTT      6900
     TCCAACCGAG GGACTTGCGA CTGCGGTCTT TCCGCCTTAT TGGCTCCTTA TGGATCCATC      6960
     TGCTGCCGTA TTGGGCGACA CACCAGCGCT CCAACCTAAA AGAGAGATAA CATGTTTTAA      7020
     TTCACTTTCC TTTTCTTATA ACTAAATCAC AACAACAGCA ACAGCGCATC GGGCGACTGA      7080
     CAAAAGCATT AGCTCACCAA GTCAGCAACA ACAGCAGCAG CAAGACCAGA ATCAGTTGAG      7140
     GAGGAGGCCT GGTGGTGTGC TGAACATTTC GCCGCCCACA CCCACCATTT CTGTAGGCCT      7200
     GTATGACCCT GAGCCCAACG CCGGCATGGC AAATCCGGTC TTCCTGAGGA GGCGGGGCTC      7260
     TAGTGTTAGG CGCGCTTTTG CCCCAAAAGC AACAACGACA GCGGCAGTAG GGTCGGCGCC      7320
     CCCTGCGTGA CCGAGTCCAT CTTAGCAATC GGTCCTTTTG GCGGTGTTAT GCCGACGCGG      7380
     CGGTCGCGCT TATGAGGACT GCCTGCAATG CTTGGCCATG AGACGGCGTC ATCGACAACA      7440
     TTTCAATCAC GCTCAGCTGG TTGACCGGGG GCAACATGCT TGCCATGCAG CAACAATGGT      7500
     GCATGCAGTC CAGCATGCAG CAACAACAAC AATATTGGCA GCAGCAGACT AATGTTTCGC      7560
     AGCAGATTCC ATCTGGCAAC TTCCGACGAC CAGACTCCTC GCTTGGCCCC TGGAGACTCG      7620
     CTCTGGAAAA AAAAAGAAAG AAGCATGGAT TAGTTTTTTT TTTTCCCTTT AGCTATTGGA      7680
     TTAAATTTCT TTCCTGGACA ACCGGCGCCT TCATGCAGAT GACGCTGGAC TGCGGCGATT      7740
     CTTTCCCTCC AGCCACAGAT GGGAAGCTCA CATCATGGCA TATATGCGGC ATCGTGCTAA      7800
     TCAGCTCCCC ATGCTGAGCG AGATCTTGAT GCGGCGATGC ACTCACTAGC GAGCAGCGGG      7860
     AACAGCATAC AGCGTCAGCA ACAGCAGGAA GAGACTTTGT AGCAGAAGCC TTTCGGCATT      7920
     CTCCGACGAC CCGACTCCTC GATCGGGGTC AGGCAAATTC TCCTGGACCG ACAAATTTTC      7980
     CCGGCGTTTC GTCCTGGAAT AAGGAAGGAA GCACGGATTA ATTTCTCCCC TTCAGCTTAC      8040
     GACCCTTCTC ACCAACAGCA GCAACTACAA CAACATCGGC AGCAGACGAC TTGCAGCTGC      8100
     TTGGCTCACC TAATGCGACA GCAATAATCC CGGCAAGGCC AGAAACGGCA CCGAGCAGAA      8160
     GCACGACAGG GTGAAGAACA ACATGCCGCC CACGTCCACC AATCCGGAAG CCCTGCATTA      8220
     GGGGTCTGAA GCGCCATTAA CTGGAGGATC CGGCAGCGTA TGCCTACGCA GAAGCGGGGC      8280
     GTCGTAAATC CGGTGGCCGG AATAGCGCCT TGAACAGCAT GCTGTGTATG TTTGCCCCAA      8340
     AAGCAGAAAC TGCCGCAGCA AAGGAACCGC AAGCAGGATC ATCACTCGTG GCAAACTGGC      8400
     GTATTCCTGT TGAAGACGCG GGACTGCGGC GCATTCTTCC TTTCCAACCG GGGGCTTTAG      8460
     CGCTGCGGTA TTTCTGCTTT CACGGCTCCA TTTGCTGCTG CATCTGACGC CTCATCAGCG      8520
     CTCCTCCCTG AAAGAAAGAG AATATGTATT AGTTTTCTTT CCATTCCTTA CAATCTCTCT      8580
     CACCAAACCT CCACGACACA ACAACAGCAG CAGAAACAGG TCTAGCCCAC AATGGCAGCA      8640
     GCTACAGCAA TCAGCAGAAG CAAGGCCGGC AAAAGCAACA ACAAAAGCCC TCTCTGAAAG      8700
     CCCGGATGTG GAGACTGAAG CGCCGGAAAC TTGAGGATCC GCCCCCGATG CACGCCCACC      8760
     AACAATAAGC TGGAGGAGAA GTTACTGAAG CATGGGAAGC AGCACCAGGG GTCGCATACG      8820
     CAGCGTCAGG GCTTTGCGAA CCAGATGAAT GAGGAGAGAC TGGAACAGCA TAACATCAGC      8880
     GGCAGCAACA ACAGCGCCAC GAGGGTCAGC GGCGTCTGCA TGGCTGTGTC CAAAACAACT      8940
     CCAATTCAAC TGCTGTATGA TGCAGCGCAC CAGCGGCTTT CACAGGGACC GTCTGAAACG      9000
     CTTGGCAGGA GCCGGCTGAA GGCCTGGGCG AAGACACTGG AGACACCAAT GCGGCTCCTT      9060
     TCGGCCGACG GCAACAGGCT TGCCATGCAA TAAGAACAGT AAATCCTGAA ATAACAGCAG      9120
     AAGATACAGA CGTCCAAATT GCGAACACTG ACGCCAGCCC TCACCTGAAC GACTCACTGT      9180
     GCAGCAGCAG CAACATCAGC ACCGATGCCC TCAGCATCGG CAGCAGAGGG TGTTTTTGGC      9240
     CTTTGACAAT TCCCTGCGAC TTGACTTCTT CTTGGCATCT GGTCAATCAT CACGTGCCAG      9300
     CAAACAGTGG CTTGTCACCC TGGAAGAAAG AAGACTGGAT TAGCTTCTCC CCTTCTAATA      9360
     CATTTTGTGT GTTGAAATGC ATCAGGCGGC GACACACTCA CCAGCAACAG CAGCAACAAC      9420
     ACCAGCGGCA CCGGTAGCAG GAAATGGATC CTCAGCAAAA ACCATCGGCA CTTTCAGACG      9480
     TCCCGTACTC CTCGCCTGGC CCTGGCCGGT AACAGGGGCT TGTTAGATGG AGAAGACGAC      9540
     GGTCATCCGA CGGACAGCAG CCTGAAGATG GAAGCAGGCC TACGCTGCCC ACCTCTCCGA      9600
     TGCCTGCAGC AGCAACGGCA GCGGCTCATA AATGCAAACT GGCGCCAGCC CTCGGCTCTT      9660
     CGGGCTCATG TAGGCGGTGA CACACTCACT AGCAGCTAAA ACAGCAACGG CGGAATTAGT      9720
     AGAAGCAATG TTTTGCCGCA GCTGCCAGAT GGCATACTCC TAGCTTGGCC CCTGCCCAAA      9780
     CCGTATTGGA CCGGCAAATG ATTCGACAAT CCGATCTGGA AAAAATAAGT ATTGATTAAT      9840
     TTTTCCCCCA CAGATTGGTA TAAAATTGCA TTTACGGCCA ACCGGCTTCT TCCTGTTGAT      9900
     GACGTCACGC TGCGCCGCAT GCTTTTCGCC AGCCACAGTT GGAATGCATG CATTGGGGTT      9960
     GACGGTCCGG ATGGGCCGTT GCCTGTTATA TGCTGGCATC TCCGCAGCGG CGTTGTGAGC     10020
     AACGACACTG AAAGCAACAA TAATATTGTT AATTACTGCT CAAAACTATA ACACATTTAA     10080
     TCACTTACAC AATTTACACA CGCTTCCTGC CTAGGAGTTG TGGGACCAGC TACCGATAAT     10140
     GCCAACAATA CCGGGAAACG CGTCGCGGGA CATCGATAAC AATTTGGCGG TTAAAATGCT     10200
     AGAACATCGA GTACCAGACA TGTTTTTCCT GCCGATATAT CGAAGCCCAA TAGCCGCCAA     10260
     CGCTCAAAAC ATAAATCGGA GTGTGAGACC AGATACTGAA GCCGTTAAAA GCTTTTACCG     10320
     GCATCGGTAG CTGGTCTCAC ACTCCGATTT AAATTTGGAG CGTTGGCGGG CTGTTTGACG     10380
     CGAAGCTTCG CGGGATATCG ATAACAATCA GGTGGTTAAA AATACTATAA CATCGAGTAC     10440
     CAGCCGTGTT TTTCCTGTCG ATTTATCGAA GTCCAACAGC CCGCCTTCGC TCCGAACACA     10500
     AATCGGCAAG TCAGTAGCTT TTTTAACCCG GCAGTGGCGC CTGTGCAGCA GCTATTTAAA     10560
     GTGAAAAACA CGAAACGCAA CAACAAAATG GACGGCCATA ATGGAGACAT AAATGAAGGA     10620
     TGGGCAACAG TACTATCTAT CTCGTCGGAT GATAGTAACC AACTTTCGTC GCCGCCGTCA     10680
     ATTATAGTCT CATCGCTGGA CACCACGCCA ACGCCTGTCT AATGCAAATC AACTTACATA     10740
     TTACTCTAAA ATCTACTTAT AACTGTCCCC TCTAATGATA AGCAATTTTT ATGTTTACTT     10800
     TAAACTTAAA CCGATACCTT AAACTATGGC GCGCAAAATG ACTACCAAGA AATCTAAAAC     10860
     TGTAAATTGT TGCAAACTAT TTCTCCTAGT AATGTTAAAT TTAAATGCGC GCATAACCGC     10920
     AGCCAAGTTA ACCAAAAATG TCACTCGTAA ATGTAATTCC TAAATTAACA CTTGTAACTA     10980
     AGCGCGTATA AATACCGCAA ATCCAAAAAT GTAAATATGC CATAAATTGT TACTATATAT     11040
     TTTTAAAAAA GAAAAATCAG AGTACAATAA AAATGCCAGC GTCTATTAGG CGTTGAAAAT     11100
     TTAAAAAAAA AAAAAAAAAA AAAA                                            11124
//
ID   AY561850    standard; DNA; INV; 13424 BP.
XX
AC   AY561850;
XX
DR   FLYBASE; FBte0001206; Dmel\TART-A.
XX
FT   source          AY561850:1..13424
FT   SO_feature      non_LTR_retrotransposon ; SO:0000189
CC                   telomeric retrotransposon
FT   SO_feature      direct_repeat ; SO:0000314:1..1850
FT   SO_feature      direct_repeat ; SO:0000314:11179..13028
FT   SO_feature      five_prime_UTR ; SO:0000204:1..1759
FT   SO_feature      three_prime_UTR ; SO:0000205:7953..13411
FT   SO_feature      non_LTR_retrotransposon_polymeric_tract ; SO:0000433:13412..13424
CC                   derived from polyA tail of RNA transposition intermediate
FT   SO_feature      CDS ; SO:0000316:1760..4672
FT   SO_feature      start_codon ; SO:0000318:1..3
FT                   /db_xref="FLYBASE:FBgnXXXXXXX"
FT                   /db_xref="GI:45594384"
FT                   /db_xref="NCBI_PROTEIN:AAS68533.1"
FT                   /translation="MDGQNVNQSGGWASVLSISSDDGNCSSSPPSAIVSSLDTTPTSN
FT                   ETTIVRRSLYQTNADMKSYDFENIVLNENKNTILPDPLFVDKCGSTANTTEANEKQPA
FT                   DSPFPISISKNFSTSSPLTHVDTPTQEDDASAFNTLKAAKTARIIFPTHTQIEPAKPS
FT                   PPSKELSSNSAPKTLSYTDKITATQKNFPTKTHVDTPTQDDDTNATKASKTAQIDSSH
FT                   SQLHETKPTQPAKNPSPLTQKLTTNKTAKTHTHTDKPTASQNLFPTKTHINSPTQYND
FT                   TNASTASKDGKINLSSHSHLRETKPTQPAKNPSPLSQKQITSIAANTLTHTNKHTASQ
FT                   NFIPAKTHINIPTQYNDTNATKALKTAKPASPSHTYSRQTKPIKPAINALHPAQDTNP
FT                   SPAISAVTYTDKPTATQNIFPAKTFAELVRENAKRSQTAMQNPPHAKHDSAALGRLPS
FT                   AARKNLTKTLSSPKTPGKRRGDCLDEGLLQTSNKKVRIRDDFSDDDLGVTNLLSETPI
FT                   FKSKVAIKIRQDSRRESLQKSVEMDTAPAISPSNTAAEPDLPPWKTVPASRKPPSIFL
FT                   SNIQQIIPLIEKLNYKAGVNSFTTKSELGNNIRIQAKTMDAYKAIQNVLLGANIPLHS
FT                   HQPKSAKGFQIVIRHLHQSTPTKWIESQLQDIGIATKFIRAMQFRDTRNPMRIHEVEV
FT                   VPKADGSHLKVLLLKSLGGQTVKVERKRVSKDPTQCHRCQCFGHTKNYCRNPFKCMKC
FT                   GQLHATVSCTKPKNLPATCANCNGSHVSSYKGCPAFQEAKQRLSINKIQSLHSQPTHL
FT                   QTPRNKHPYPKPTHFQTPRNKQSYTHPPPRTTVNNTKLPAKRIQGKKLSQRNISINKR
FT                   LNRIRAFDKKPRKETSPPTTSKKVLASLEESSKNPNSVLNPANTHLTHFCPPPITQDI
FT                   PNDEPTEPSQEQYLLNRIEGMEKKLNNLLEIVTRLLNQGRECPKSPKNPFRDPILI"
FT   SO_feature      CDS ; SO:0000316:4710..7952
FT   SO_feature      start_codon ; SO:0000318:1..3
FT                   /db_xref="FLYBASE:FBgnXXXXXXX"
FT                   /db_xref="GI:45594385"
FT                   /db_xref="NCBI_PROTEIN:AAS68534.1"
FT                   /translation="MTRACNRDILKIAFWNAGGINNKIDELKLFILNIDAHIVIVTET
FT                   RLDNKSTKLELPGYFTYLAQNPVSSKRGGVATIVNSSIRHMALEPIEKECIQSAPIVL
FT                   LPENNRRSEMIVIASVYCPPSLSWSPHHFTDVLNFAEKTLGGQTKFILCGDWNAKHRQ
FT                   WGCTRACQRGTALYEAVQADPMAEIIATGCATHFPHDTRKNPSAIDFSICKGLGRLEK
FT                   RISSSADLSSDHLPILLEINLDTSTLFLQKQNNNILKKTTNIELFKTVLERKILLNTE
FT                   IRVAEDINDAINIFIKNIKDSADESTPSPRIPDNLRRMHGQANRNSHTLTLDENTSRL
FT                   LEEKRILSRIFKATRTDEDKAKLKAAENRLKKAVKILREKRINKQIEGIDTKNPDRMR
FT                   KMWRLLDEGKKTNQPNFPLKLETKRGPKWTKTIKETTEAFVSHLEGRFKPNNNVPDYH
FT                   INTVNSGLRTIKESMLTERYDVNKNPCNQPITLKELNDEIKNLKNSKAPGKDLITNQL
FT                   IKTLPTKATLYLILIYNSILRIGYYPDAWKHAQVKMILKPGKSVNDPKSYRPISLLSG
FT                   LSKMFERLLLKRLFRVDLFKKAIPLHQFGFRKEHGTEQQIARVTQFILEAFERKEYCS
FT                   AVFLDISEAFDRVWHEGLLLKLAKILPYNLYIILESYLTNRTFEVKDQAGETSRAGQI
FT                   GAGVPQGSNLGPILYSIFSSDMPLPHIYHPSPTERIMLSTYADDTIVLSSDILATAAT
FT                   RNNENYLKTFSDWADKWGISVNAAKTGHVIYTLKNDIPTNLKTMKIKGQAIKKESKQS
FT                   YLGVILDSKLTLSPHVTKVVGKYLTAYRKMSWILNERSKLPTNTKMLILKSVLSPIWQ
FT                   YAIAAWGPLVTDAQIRRIQVEENRKMRDICRAGRYTKNQTIRDRYCVKTVEEFYQQAV
FT                   HRFSETTKSHPNVAVRRIFSRHYIPNRLERSRQRYLKMTMDHITQKQTGLTLSPKLLK
FT                   IPDLDDCRTLKKRSEREKIRQTHLTELPTLLRLEEEEAELKRIKKQEERERRERENQK
FT                   WPPDRWCELEINRYNKKYRNGDLTRQEIIEKFRGQPLNVQRIILPDYEGD"
XX
CC   A PNTR (Perfect Non-Terminal Repeat) is a perfect direct repeat partially
CC   overlapping the UTRs (annotated as "direct_repeat ; SO:0000314").
CC   Distinguishing characteristics of PNTR’s are that the 3’ repeat terminates
CC   upstream of the 3’ end of the element and that the 5’ PNTR extends a short
CC   distance into ORF-1. The 5’ ends of TART-A elements are variable and the
CC   minimal size for functionality has not been determined.  Thus, this
CC   canonical sequence, AY561850, may be 5’ truncated within the 5’ PNTR (M-L
CC   Pardue, 2009).
XX
CC   Derived from AY561850, Michael Ashburner, 6-Apr-2004; updated Jan-2009 as
CC   per Mary-Lou Pardue and Greg DeBaryshe.
CC   Any changes to original sequence record are annotated in an FT line.
XX
SQ   Sequence 13424 BP; 4373 A; 3415 C; 2870 G; 2766 T; 0 other;
     CACGCTTTTT GGCCCCTGGC CGATCTTCAT ATATCTCAAA TCGACGGCTG CTTTTACCCT        60
     GGAAAAAAAA AAAGGAGCTT GGGTTATATT GAACTACACT AGGCGGCGAC ACACTCACCA       120
     GCAGCAGCCA GAACAACAAC AGCGGCAGAA GTAGCAGGAA ATTATCTCAC TGCAAAATCC       180
     AATTGGCACT TTCCGAAGTC CGTATTTCTC GCCTGGCCCC TGGCCAGTAA CAGGGGCCTG       240
     TGCGACGGAG ATGACGACGA TGATCTGCCC TGTGGACGGC CTCAAGAAGG AATCGGCCCT       300
     GTACTGCCCA CCTGACCTGT GCCAGGATAG CAGCAATGTC AGCGGACCAT GGATGGAAGA       360
     GGCGGCACTG GCGACGGTCC TCAGTTTTGC GGTTTCCGCG GGGCGTAGGC GCAGTAATCG       420
     GCGGCAGCAA CAGTGGCGGC AGCAGAAGGG AATGTGTATC TGCAGTCGCC GAATGGCAAT       480
     TTCCTGCCCA GCTGTAATGG ACCGCCAAAT GTTTTTTGGC ATGTCGACCT GTAAGAAAGA       540
     AGCAAGGATA AGTTTTTTCT TTACAAGATT GTATATGAAT TTGTATTTAC GGACAACTGG       600
     CTTGTTTCCT GTCGACGATA AATGGCGCTT CATGTTTTCA CTCTGCCAAA ATCTGAGTGC       660
     AAGCATCGGG GCTGACGGGC CGAATTTGCT GATGCCTTGT ACATGCTAGC ATCTTTATGC       720
     CGCCGTGTAA TTTTGCGACA GCAAAACACA TGATGGAGAA GACGAAGGTG ATCGATGGCG       780
     CCCGGATGAC GGATGCAGGC CCGTGCTACC CACTGGTCCG TTGCCAGGAC AGCAGCGTTT       840
     CAATTATGCG AACAGAGGCA CTGGAGCCAC TTCTCAGGCG ATAGGGATCA TGAGGCGACG       900
     ACAACTCGCC AGCAGCAGTA ACAACAACAG CGGCAGCAGC GATCTCGGAC TTGCTGAACA       960
     TTGCGGCTTT TTCCCAGCCT GGACCGTCAT CACAAACGCT CTCAAAGATC GGTGCGCCTG      1020
     CAGCCTACGG AAGCGTACAA CTGCCCAAAG TCGTGCTATT GCATAATGTT AGGTGTCCTG      1080
     GCTGCTCCGG CGGATGAGCT CCACCCGATT GAGAGAGGTA AGAAGGCCCA GCAAGTCGCC      1140
     CTTAAATAAA AGAAACAAGC ATTAGACTCG GCTGAAATTG TAACATCAGT CAGACTGTAC      1200
     TCACGCATGC ACTTAGACAA ACCGAAGCCT ATTCTATTGA CGACGCGGAC TCCAACACAT      1260
     GTTTTCCTCC ACAAAAGGCT GTGAGTGCAC CAAAGTTGAC GGGCCACGCC GGCCGATGCT      1320
     TGCTGCATAC CGGCATCTCC GCAGCAGCGA CGTTACAAGC ACCACTAAAA TTAGAAAGAG      1380
     GCTTACTATA GGCAAAGCGC AGAAAAACAA ATATTACAAT AAGAAATAGC ACGCGATTTT      1440
     TCTGCTTCGT TTCCGCTTGG TACAAGTGAG ACCATTCTCC CTATATGCCA TTCTAGTATA      1500
     TTTGCCCGAT AAGCGATATG CTGGCGGCAA AAAAAAAAGA TAATAGCCGA TAAGCCCGCC      1560
     AAAAAAAAAG CGCGAAATAT CGATAACGAG CTGGCACGAA AATTGCTGGC ATATCGATCA      1620
     ACCGCTGTGT CTTTGAGCTA TCGAAAAAGC CCGCCTACGC GCCTAGCCCA AATTTGCAAG      1680
     TCAGTTGAGA TTATAAAACC GACAGAGGCG CGCGCGCAAC AGTAGCTAAA AGTGAAGCCA      1740
     GCAGCAACAA CAACAACTAA TGGACGGCCA GAACGTGAAC CAAAGCGGAG GATGGGCATC      1800
     GGTTTTATCC ATCTCATCGG ACGATGGTAA CTGCTCATCC TCGCCGCCAT CAGCTATAGT      1860
     CTCATCGCTG GATACCACGC CAACGTCAAA TGAAACCACC ATAGTAAGAA GAAGCCTATA      1920
     TCAAACAAAT GCCGACATGA AATCTTACGA TTTTGAAAAT ATTGTATTAA ATGAAAATAA      1980
     AAATACCATA TTGCCAGACC CTTTATTTGT TGATAAATGC GGGAGTACTG CTAATACCAC      2040
     AGAAGCCAAT GAAAAACAGC CTGCCGATAG CCCCTTCCCC ATTTCCATAA GCAAAAATTT      2100
     TAGCACTTCC TCGCCACTAA CACATGTAGA CACGCCTACA CAAGAAGATG ACGCCAGTGC      2160
     ATTTAATACA TTGAAAGCAG CCAAAACAGC TAGAATAATT TTTCCCACAC ACACACAGAT      2220
     AGAGCCCGCC AAACCCTCGC CCCCCTCCAA AGAATTAAGC TCAAACTCAG CACCCAAAAC      2280
     TCTTAGCTAC ACAGACAAAA TTACAGCAAC ACAGAAAAAT TTCCCCACTA AAACACATGT      2340
     AGACACACCT ACACAAGACG ATGACACTAA TGCAACCAAA GCATCAAAAA CCGCCCAAAT      2400
     AGATTCATCA CACTCACAAC TACATGAAAC CAAGCCAACA CAGCCCGCCA AAAACCCTTC      2460
     ACCCCTCACC CAAAAGCTAA CCACAAACAA AACAGCCAAG ACACACACAC ACACAGACAA      2520
     ACCGACAGCG TCACAAAATC TTTTTCCCAC CAAAACACAT ATAAACTCAC CCACACAATA      2580
     TAACGACACT AATGCAAGCA CAGCATCAAA AGACGGTAAA ATAAACCTCT CTTCACACTC      2640
     ACACTTACGT GAAACCAAGC CAACACAGCC CGCCAAAAAC CCCTCACCCC TCTCCCAGAA      2700
     GCAAATAACA AGCATAGCAG CCAATACACT CACCCACACA AACAAACACA CAGCATCACA      2760
     AAACTTTATT CCCGCCAAAA CACATATAAA CATACCCACA CAATATAACG ACACCAATGC      2820
     AACCAAAGCA TTAAAAACCG CAAAACCAGC TTCTCCCTCC CACACATACT CACGCCAGAC      2880
     AAAACCAATA AAGCCCGCCA TAAACGCATT GCATCCCGCC CAAGACACAA ACCCAAGTCC      2940
     AGCAATCAGT GCTGTCACTT ACACAGACAA ACCCACAGCT ACTCAGAATA TTTTTCCTGC      3000
     CAAAACTTTT GCAGAGCTGG TGAGAGAAAA TGCTAAACGC TCACAAACTG CAATGCAAAA      3060
     TCCCCCTCAT GCAAAACATG ACTCTGCCGC CCTCGGACGC TTACCGAGTG CAGCTAGAAA      3120
     AAACCTAACT AAAACACTGA GTTCTCCTAA AACTCCTGGG AAGCGCCGCG GGGACTGTTT      3180
     GGATGAGGGC TTACTTCAAA CCTCTAACAA AAAGGTTAGA ATACGCGACG ACTTCTCTGA      3240
     TGATGATCTG GGGGTCACAA ATCTACTCTC CGAAACACCC ATATTCAAAA GCAAAGTAGC      3300
     TATTAAAATT CGGCAAGACT CAAGAAGAGA ATCCCTGCAG AAGTCAGTTG AAATGGACAC      3360
     AGCACCAGCA ATTAGTCCCT CAAACACAGC AGCTGAGCCC GACCTACCGC CCTGGAAAAC      3420
     TGTTCCAGCT AGCAGAAAAC CACCATCAAT CTTCTTGTCC AATATTCAGC AGATTATCCC      3480
     GCTAATAGAA AAACTAAACT ATAAAGCCGG GGTAAATAGC TTTACTACCA AATCTGAACT      3540
     TGGCAACAAT ATTAGAATCC AGGCTAAAAC GATGGATGCC TATAAAGCAA TTCAGAATGT      3600
     CCTCCTTGGG GCAAACATTC CCCTACACTC TCACCAGCCA AAGAGCGCAA AGGGCTTCCA      3660
     AATTGTAATT AGGCACCTCC ACCAGTCAAC CCCGACCAAA TGGATTGAAA GCCAACTTCA      3720
     AGACATCGGT ATAGCTACAA AATTCATCAG GGCAATGCAG TTTAGGGACA CGAGAAATCC      3780
     TATGCGCATT CATGAGGTTG AGGTTGTACC CAAGGCTGAC GGCAGCCATC TCAAGGTCCT      3840
     GCTACTAAAA TCCCTTGGAG GTCAAACGGT CAAGGTTGAA AGGAAACGGG TATCGAAGGA      3900
     TCCCACACAA TGTCATCGCT GCCAATGTTT TGGGCATACA AAAAATTATT GTAGAAACCC      3960
     GTTTAAATGT ATGAAATGTG GCCAGCTGCA CGCCACGGTT TCTTGCACTA AACCCAAAAA      4020
     CCTTCCGGCT ACTTGTGCAA ACTGCAATGG AAGCCACGTA AGCAGCTATA AAGGATGTCC      4080
     TGCTTTCCAA GAAGCAAAGC AAAGACTATC TATCAACAAA ATTCAATCCC TACACTCACA      4140
     ACCCACGCAC CTTCAGACCC CCCGCAATAA ACATCCCTAC CCAAAACCCA CCCACTTTCA      4200
     GACGCCCCGC AATAAGCAGT CCTACACACA CCCCCCTCCT CGAACAACAG TAAACAACAC      4260
     AAAATTACCT GCCAAAAGAA TCCAAGGAAA AAAGTTATCG CAAAGGAACA TATCTATAAA      4320
     TAAACGCTTA AATAGAATTA GGGCTTTTGA CAAGAAACCG AGAAAGGAGA CAAGCCCGCC      4380
     GACAACTAGC AAAAAGGTAC TGGCCTCCCT AGAAGAAAGC AGCAAAAACC CAAACAGCGT      4440
     CCTAAACCCA GCCAACACCC ATCTCACTCA TTTCTGTCCA CCCCCAATAA CACAAGATAT      4500
     CCCTAATGAC GAACCCACGG AGCCGAGTCA GGAGCAATAC CTTCTAAATC GTATTGAAGG      4560
     GATGGAAAAG AAGCTCAACA ATCTCCTGGA AATCGTCACC CGCCTACTAA ACCAAGGAAG      4620
     AGAGTGTCCA AAATCTCCAA AAAATCCTTT CCGAGATCCA ATCCTCATTT AAACGCTCTT      4680
     GCTAGTAGCA TCAGAAAGTG ACGTATCTTA TGACTCGGGC GTGCAACAGG GATATCCTTA      4740
     AAATTGCTTT CTGGAACGCT GGTGGGATCA ATAATAAAAT AGACGAGCTC AAACTGTTCA      4800
     TTCTAAATAT TGATGCCCAC ATAGTCATAG TCACTGAAAC CAGACTTGAC AACAAATCGA      4860
     CCAAACTAGA ACTTCCAGGA TATTTCACAT ACTTAGCCCA AAATCCTGTT TCTAGCAAGA      4920
     GAGGAGGAGT CGCCACTATA GTAAACAGCA GTATCCGACA CATGGCCTTA GAACCGATTG      4980
     AAAAAGAATG CATACAGAGC GCCCCAATAG TCTTGCTGCC TGAAAACAAC AGACGCAGCG      5040
     AAATGATAGT AATAGCATCT GTCTACTGTC CGCCTTCGCT AAGCTGGTCG CCCCACCACT      5100
     TTACTGACGT TCTCAATTTT GCCGAGAAAA CTCTGGGAGG GCAGACAAAG TTCATTCTAT      5160
     GTGGCGACTG GAATGCAAAA CACAGGCAAT GGGGTTGTAC CCGCGCCTGT CAACGCGGCA      5220
     CCGCACTCTA CGAAGCAGTT CAAGCAGATC CCATGGCTGA GATTATTGCT ACCGGCTGTG      5280
     CGACACATTT CCCGCACGAC ACACGGAAAA ACCCGTCAGC AATAGATTTC TCCATATGCA      5340
     AAGGACTGGG CAGGCTCGAA AAGAGAATTT CCTCAAGTGC GGACTTATCT TCAGACCACC      5400
     TTCCCATCCT GCTTGAGATC AACTTAGATA CAAGCACCCT CTTTCTGCAA AAGCAAAACA      5460
     ATAACATCCT CAAGAAAACT ACGAACATTG AGCTCTTTAA GACTGTTCTT GAAAGAAAGA      5520
     TACTTCTTAA TACGGAGATA AGAGTAGCAG AAGACATAAA TGACGCCATA AATATCTTTA      5580
     TCAAAAACAT CAAGGACTCG GCTGATGAAT CAACTCCCTC CCCAAGAATC CCTGACAACC      5640
     TCAGAAGAAT GCATGGACAA GCTAACAGAA ATAGTCACAC CCTCACACTA GACGAAAACA      5700
     CAAGCAGATT GTTGGAAGAA AAACGGATAC TAAGTAGAAT TTTTAAAGCT ACTAGAACGG      5760
     ACGAGGACAA AGCTAAACTA AAAGCAGCTG AAAATCGACT AAAAAAAGCG GTAAAGATCT      5820
     TGAGAGAAAA GAGAATTAAT AAACAAATTG AAGGAATAGA CACGAAAAAC CCGGACAGAA      5880
     TGAGGAAAAT GTGGAGACTG CTAGATGAAG GAAAAAAGAC AAACCAACCG AACTTTCCCC      5940
     TCAAACTGGA AACCAAAAGA GGCCCCAAAT GGACAAAAAC GATAAAGGAG ACAACAGAAG      6000
     CATTTGTTTC CCACTTAGAA GGAAGATTTA AGCCAAATAA CAACGTACCT GATTACCACA      6060
     TAAATACAGT TAACTCTGGA CTAAGAACAA TTAAAGAAAG CATGTTAACA GAAAGATATG      6120
     ATGTAAACAA GAATCCCTGT AACCAACCTA TCACACTAAA GGAATTAAAT GACGAAATAA      6180
     AAAACTTAAA GAATAGTAAA GCACCGGGAA AAGACCTTAT AACAAACCAA CTTATAAAAA      6240
     CCCTACCGAC TAAAGCTACA CTGTACCTTA TCCTAATCTA TAACTCTATA CTTAGAATTG      6300
     GATACTACCC AGACGCCTGG AAACATGCCC AAGTGAAAAT GATCTTAAAA CCAGGGAAAA      6360
     GTGTGAACGA CCCGAAGTCA TATAGGCCGA TCAGTCTACT CTCGGGACTC TCTAAAATGT      6420
     TTGAAAGACT ACTTCTAAAA AGACTTTTTA GGGTAGATCT ATTCAAAAAA GCCATACCAC      6480
     TGCACCAATT TGGCTTCAGA AAAGAGCACG GAACTGAGCA GCAAATAGCC AGGGTCACCC      6540
     AGTTCATCCT CGAGGCCTTT GAGCGAAAGG AATACTGCTC AGCGGTTTTC CTTGACATCT      6600
     CTGAGGCTTT CGATAGGGTC TGGCACGAAG GCCTTTTACT TAAACTAGCT AAAATATTAC      6660
     CATACAACCT ATACATTATT CTCGAAAGCT ACCTTACAAA CAGAACATTT GAAGTTAAAG      6720
     ACCAAGCTGG AGAGACTTCG AGAGCAGGAC AAATAGGCGC AGGGGTGCCC CAAGGAAGCA      6780
     ACCTTGGACC CATACTGTAC TCTATCTTCT CCTCAGACAT GCCACTCCCA CACATATACC      6840
     ACCCCTCCCC AACAGAAAGA ATTATGCTCT CAACATACGC AGACGACACT ATAGTACTCA      6900
     GCTCAGACAT ACTAGCAACT GCTGCCACAA GAAACAACGA AAACTACCTC AAGACATTTT      6960
     CGGACTGGGC AGACAAATGG GGTATCTCAG TAAATGCTGC TAAAACAGGA CATGTCATTT      7020
     ATACATTAAA AAACGACATA CCTACAAATC TAAAGACCAT GAAGATTAAG GGTCAAGCAA      7080
     TAAAAAAGGA AAGCAAGCAA TCATACCTTG GCGTAATCCT TGATAGCAAG CTAACACTTA      7140
     GTCCTCACGT CACGAAGGTA GTAGGTAAAT ACTTGACAGC CTATAGAAAA ATGTCATGGA      7200
     TCTTAAATGA AAGAAGCAAA CTCCCTACTA ATACTAAGAT GCTGATCCTC AAATCAGTTC      7260
     TATCGCCAAT ATGGCAGTAT GCCATAGCAG CCTGGGGTCC CCTTGTGACA GATGCACAGA      7320
     TAAGACGGAT ACAAGTTGAG GAAAACAGAA AAATGAGAGA CATATGCAGA GCGGGAAGAT      7380
     ACACGAAAAA CCAAACTATA AGGGACCGCT ACTGTGTCAA AACAGTAGAA GAGTTCTATC      7440
     AACAGGCTGT CCACAGGTTC TCAGAAACTA CAAAATCGCA CCCTAATGTA GCTGTTCGCA      7500
     GGATATTCTC TAGGCACTAT ATCCCGAACA GACTAGAAAG AAGCAGGCAG AGGTACTTGA      7560
     AAATGACAAT GGACCATATC ACGCAAAAAC AGACTGGACT GACCCTCTCA CCTAAACTCT      7620
     TAAAAATCCC TGATCTAGAT GACTGCAGAA CCTTAAAAAA GCGAAGCGAG AGAGAGAAAA      7680
     TAAGACAAAC GCATCTAACT GAACTCCCCA CCCTGCTGAG ACTAGAGGAA GAGGAGGCAG      7740
     AGCTCAAAAG AATAAAAAAA CAGGAAGAGA GGGAAAGAAG GGAAAGGGAA AACCAAAAGT      7800
     GGCCTCCAGA TAGGTGGTGT GAACTGGAAA TAAACCGATA TAATAAAAAA TATAGAAATG      7860
     GCGATCTAAC CAGGCAGGAA ATTATAGAAA AATTCCGAGG GCAACCATTA AATGTACAAC      7920
     GAATAATCCT ACCCGACTAC GAAGGTGACT AAAAGTAAAT CAAAACAAAC TAGGGTCGGA      7980
     GCATAAAGCA GAAATAATTA ACCTGGCGGA AGGGGCGGCA AAAATATTTA AAAGAAAGGA      8040
     AATAAATACA AAAAGGCTAA AGGCTAAGTT ACAGGTTACA TAAAAAGGGA AATGTGCTTA      8100
     TAGATATAAT GGTAAAATTA ACTTAACTAA ACACCTACTG GAAAACAAAA CCATGATGGC      8160
     TGCGTACTTA AAACGTTTCT CCTGGCGCGA TTGAAAATCC ATCTTTCCTA TCCAACCGAG      8220
     GGATCTGCGA CTGCGGCCTT CTGCCGTTCG GCTCCTGATG GATCCATCTG CTGCTGGAAT      8280
     GGGTGCCACA CCGGCGCTCC AACCTAAAAG AAAGATAATA TGTCTTAGTT TTCTTTCCCT      8340
     TTTTCTCATA AAAAACAAAA GCTCATCTGG AGTCTGATAA TAGCTTTAGC TCACCAAGAC      8400
     AGCAAAAACA ACAGCATCAA GGCCAGCAAC AGTGGAGGCA GAGACCAAGC GGTTTGCTGA      8460
     ACATTTCGCT GCCCACACCC ACCATTCCTG GAGGCTCTGA ATGAGGGAGC TGAAGCCTCT      8520
     GAAAATTGAA GATCCTACTC CAATGTGACA CTTTCGGCTC CGAGCTCAAC GCCGGCGCTG      8580
     CAAATCCGGC GTTATAAGGA AAGGGTGCTC CAGCTTGTGG AGTGGTCTTT CCCCAGAGGC      8640
     AGCAGCAGCA GCAACGCCAG CGGCAATTGG CGACCTCTGC GTAGCCGAGT CAATCCCGTT      8700
     ATCGGTCCGT CTGGCGATGC GTTTCCGACG CGGCGGTATG CGTCCATAGG GACCGCCTAG      8760
     AATGCTTGGC CAGGAGACAG CAGTAGACCT GGGCGTGGGC GTCACCAGCA ACATGGTAGC      8820
     CATGCGCAGT CAATTGGCCG GTGGCAACAA TCTTGCCATG CAGCAATAGC GGCGCATGCT      8880
     ACCCTTGGAG CGACGTCAAC AGCTACATAT TTTTCAACAG TGTAGCGCGA CCTTTAGGCG      8940
     CCTACACCTA CACCAGCAGC AGCGATATTG GCAGTAGCAG CATTTAATGT CTTGCAGCAG      9000
     TTTCCATTTG ACAACTTCCG ACGACCAGAC TCCTCGCTTG GCCCCTGGCG ATTCGCCCTG      9060
     GAAGAAAGAA AGAAGCATGG ATTAGTCAAA TATCAAAGCA CAACAAGCAT GCACGAAATC      9120
     TTCGCAACAA GGACTATTCC AAGGCAAGCG ATGGTGTGTT CTTTGGCTCT ACATATATCG      9180
     TTGAAATCCG TCTCCAACTG CCGCGAGTCA CCCACGACTT CCACTCCCTG CAGACGGACG      9240
     TAATGCACTA CGATGTGTAA ATTTTCCGGA TCCAAGTGAA CGCCAGGCGG AAGAGGATTC      9300
     CCTGGATGTG AAGGATCACA AACTGCTGCT TTTTCAAGAG TCCCCATTTA ACAACTTCCG      9360
     ACGACCAGAC TCCTCGCTTG GCCCCTGGCG ATTCGCCCTG AAAGAAAGAA AGAAGCATGG      9420
     ATTAGTCAAA TACCAAAGCA CAACAAGCAT GCACGAAATC TGCGCAACAA GGACTATTCC      9480
     AAGGCAAGCG ATGACGGACG GAATGCACTA CTATGTGTAA ATTTTCCGGA TCCAAGTGAA      9540
     CGCCAGGCGG AAGAGGATTC CCTGGATGTG AAGGATCACA AACTGCTGCT TCTTCAAGAG      9600
     GTAACCGGCC TCATTTCCAC TTGGGTCACA TCGATTGTGG AGGAAGCCGA TTGGGACTTT      9660
     GAGCGAGCCC TAAAATTGTT CATTCAGAAG AACGCTGATC ACGAAATCCC AGATCTAGCA      9720
     TTCGCCTAGA ATATGTGATC TCGTTGGACT GCGTGCTGGA CTGCGGCGCA TGCTTTCCCT      9780
     CCCGCCAGAG ACGGGATGCG CGCATCAGGA TCGACGGGAC AGACCGGCCG ACGCCTGGCT      9840
     TCACGTCGGC ATCTATGCGA CGACGTGATA ATCAGCTTCA CAGTACCTGC GGATGAGGGC      9900
     ACAGGCGCCA GTCCTCTGCC TAGCGACACA TACACCAACA GCAACATCTA AAACAGTCGC      9960
     AGTAGATGCA GGGAATTTTC TTGCTGCATT CTCCAACTGG AAAAATCCGA CGGCCCAACT     10020
     CCTAGCTTAG CCCGGCCAAT CTTCTTGGAC TGGCAAACGA TGTGATGAAT CGTCCTGGAA     10080
     GAAAGAAGCA TGGATTATTT CTTCATACAC AGCTTGTCTA CTAAAATGCA TTTCCCGGCA     10140
     AACTGGCACT GGGGCGTTGA AAATACGACA CTACTCACCA AACAGCAGCA AAAACAACAG     10200
     CATCGGCAGC AGGCGACCAG CAGCTGCTTT GGCTCACCCA ATGCGACAGC AATATCTGCG     10260
     CATGGCCAGC AACATGCAGC AAGCAAAAGA CCGGCATGGT GGTGAACAAC ATATCGCTCA     10320
     CGCCCAACGA TCTGGAAGCC CTGAGCTAGG GAACTGAGTA TCCGCCAGCG GATACTTATG     10380
     CAGCGGCGAG GCGTCGGAAA TCCGATAGCC GGAAGAGAGG CCGGAGCAGC ATGTTGGGCA     10440
     TTTTCGCCCC AGTAGCAGCT GCTGGGGCAG CAAGGGCAGA GGTAGCAGTG TCAGCGCTCC     10500
     TGGTAAACCG GCCTTTTCTG TTGAAGACGC GGGACTGCGG CGCAATTGTT CCTGCCAACC     10560
     GGGAGTTCTC TGCGCCTGAG GTCCTGTTGT GCTTCAGCGG CTCCATCTGC TGTTGCATCT     10620
     GGCGCTTCTC CAACTTTCCT CCCTGAAAGA AGAGAATATT AGTAGGAGCA TGAGACCAAC     10680
     AACAGCCCTA GCTTACCACG TCAGCGGAAA CAGCAACTGC AGAAGCCCGG TAACTTTCTG     10740
     ATAATATGCA GCAATAAGAG CGGCTGGATC AGCATGTTGT GTAGCTTGGC CCCAGAAGCA     10800
     GCAGCTGCGG TACCAAAGGC AGCGGAAGCA GGGTCAACAT AGTCTGCTAT GCTGTGTCCA     10860
     TACTAGCATA GTCAAGTCAG CGGTGGTGAC GTTGCCGCAG CAGCTGATCC ACAGGGTACG     10920
     GCCTGGAATG TTTTGTCAGA GACGGCAGTG GCCTGGGCGT ATTAGTCAGA TACGCCAACA     10980
     ACATGATACC CATGCGCAAC CATTCTTCCG GTGGCGGCAT GCTCGTAAAG TAGCGGCGGC     11040
     GCATGCATCT CTCGAAGCAG CAGCAGCAAC AGAGGCGTCT CATAAGTGCA TGCGCAGCAG     11100
     CGGTAGCAGC GGTGGTGGCA GCAGCAGGGA GATTTCATTG CTGCAGTCGC CAAATTACAT     11160
     GCATCCTACG ACTCGACTCA CGCTTTTTGG CCCCTGGCCG ATCTTCATAT ATCTCAAATC     11220
     GACGGCTGCT TTTACCCTGG AAAAAAAAAA AGGAGCTTGG GTTATATTGA ACTACACTAG     11280
     GCGGCGACAC ACTCACCAGC AGCAGCCAGA ACAACAACAG CGGCAGAAGT AGCAGGAAAT     11340
     TATCTCACTG CAAAATCCAA TTGGCACTTT CCGAAGTCCG TATTTCTCGC CTGGCCCCTG     11400
     GCCAGTAACA GGGGCCTGTG CGACGGAGAT GACGACGATG ATCTGCCCTG TGGACGGCCT     11460
     CAAGAAGGAA TCGGCCCTGT ACTGCCCACC TGACCTGTGC CAGGATAGCA GCAATGTCAG     11520
     CGGACCATGG ATGGAAGAGG CGGCACTGGC GACGGTCCTC AGTTTTGCGG TTTCCGCGGG     11580
     GCGTAGGCGC AGTAATCGGC GGCAGCAACA GTGGCGGCAG CAGAAGGGAA TGTGTATCTG     11640
     CAGTCGCCGA ATGGCAATTT CCTGCCCAGC TGTAATGGAC CGACAAATGT TTTTTGGCAT     11700
     GTCGACCTGT AAGAAAGAAG CAAGGATAAG TTTTTTCTTT ACAAGATTGT ATATGAATTT     11760
     GTATTTACGG ACAACTGGCT TGTTTCCTGT CGACGATAAA TGGCGCTTCA TGTTTTCACT     11820
     CTGCCAAAAT CTGAGTGCAA GCATCGGGGC TGACGGGCCG AATTTGCTGA TGCCTTGTAC     11880
     ATGCTAGCAT CTTTATGCCG CCGTGTAATT TTGCGACAGC AAAACACATG ATGGAGAAGA     11940
     CGAAGGTGAT CGATGGCGCC CGGATGACGG ATGCAGGCCC GTGCTACCCA CTGGTCCGTT     12000
     GCCAGGACAG CAGCGTTTCA ATTATGCGAA CAGAGGCACT GGAGCCACTT CTCAGGCGAT     12060
     AGGGATCATG AGGCGACGAC AACTCGCCAG CAGCAGTAAC AACAACAGCG GCAGCAGCGA     12120
     TCTCGGACTT GCTGAACATT GCGGCTTTTT CCCAGCCTGG ACCGTCATCA CAAACGCTCT     12180
     CAAAGATCGG TGCGCCTGCA GCCTACGGAA GCGTACAACT GCCCAAAGTC GTGCTATTGC     12240
     ATAATGTTAG GTGTCCTGGC TGCTCCGGCG GATGAGCTCC ACCCGATTGA GAGAGGTAAG     12300
     AAGGCCCAGC AAGTCGCCCT TAAATAAAAG AAACAAGCAT TAGACTCGGC TGAAATTGTA     12360
     ACATCAGTCA GACTGTACTC ACGCATGCAC TTAGACAAAC CGAAGCCTAT TCTATTGACG     12420
     ACGCGGACTC CAACACATGT TTTCCTCCAC AAAAGGCTGT GAGTGCACCA AAGTTGACGG     12480
     GCCACGCCGG CCGATGCTTG CTGCATACCG GCATCTCCGC AGCAGCGACG TTACAAGCAC     12540
     CACTAAAATT AGAAAGAGGC TTACTATAGG CAAAGCGCAG AAAAACAAAT ATTACAATAA     12600
     GAAATAGCAC GCGATTTTTC TGCTTCGTTT CCGCTTGGTA CAAGTGAGAC CATTCTCCCT     12660
     ATATGCCATT CTAGTATATT TGCCCGATAA GCGATATGCT GGCGGCAAAA AAAAAAGATA     12720
     ATAGCCGATA AGCCCGCCAA AAAAAAAGCG CGAAATATCG ATAACGAGCT GGCACGAAAA     12780
     TTGCTGGCAT ATCGATCAAC CGCTGTGTCT TTGAGCTATC GAAAAAGCCC GCCTACGCGC     12840
     CTAGCCCAAA TTTGCAAGTC AGTTGAGATT ATAAAACCGA CAGAGGCGCG CGCCGAACAG     12900
     TAGCTAAAAG TGAAGCCAGC AGCAACAACA ACAACTAATG GACGGCCAGA ACGTGAACCA     12960
     AAGCGGAGGA TGGGCATTGG TCTTATCCAT CTCATCGGAC GATGGTAACT GCTCATCCTT     13020
     GCCGCCATAG TCTCATCGCT GGATATCAAG TCATCGCTCA ACTATACCTT AAAATTACTC     13080
     ACCAAAACTC TTTTCTCCTT TTCCATAAGA TAAAGTAAAG TAAAGTAATG TAAAGTAAAG     13140
     TAAAGTAAAT TAAAGTAAAG TAAAGTAACG TAAAGTAACA TAATATTTAA ATTTAAATTC     13200
     TACACTTGAA CAATGGCGCG CAAAACTGCC GCAATGTAAT TCAAAAATGT CTCCCGCAAA     13260
     TTTAAAACAT AGATTAATAC TTGTAAGTAT GGCGCGCATA TCTGCGGCCA AGAAATCCGA     13320
     AAATGTAATT TGCCACAAAT TGTCACTATA TATTTTTAAG CAAAAATCAG AGGACAATAA     13380
     ATGCCAACGT CATTAGACGT TGAAAATATT CAAAAAAAAA AAAA                      13424
//
ID   DM14101    standard; DNA; INV; 10654 BP.
XX
AC   U14101;
XX
DR   FLYBASE; FBte0001207; Dmel\TART-B.
XX
FT   source          U14101:1..10654
FT   SO_feature      non_LTR_retrotransposon ; SO:0000189
CC                   telomeric retrotransposon
FT   SO_feature      direct_repeat ; SO:0000314:1..1046
FT   SO_feature      direct_repeat ; SO:0000314:9031..10076
FT   SO_feature      five_prime_UTR ; SO:0000204:1..961
FT   SO_feature      three_prime_UTR ; SO:0000205:7386..10637
FT   SO_feature      polyA_signal_sequence ; SO:0000551:10479..10484
FT   SO_feature      polyA_signal_sequence ; SO:0000551:10600..10605
FT   SO_feature      non_LTR_retrotransposon_polymeric_tract ; SO:0000433:10638..10654
CC                   derived from polyA tail of RNA transposition intermediate
FT   SO_feature      CDS ; SO:0000316:962..4093
FT   SO_feature      start_codon ; SO:0000318:1..3
FT                   /name="Dmel\TART-element\gag"
FT                   /db_xref="FLYBASE:FBgn0014071"
FT                   /db_xref="SPTREMBL:Q23999"
FT                   /db_xref="GI:603663"
FT                   /db_xref="NCBI_PROTEIN:AAC46493.1"
FT                   /translation="MDGHNGDQSEGWATVLSISSDDSNSLSSPPSIIVSSLDTTPTSHE
FT                   TTIVRRSLYQTNADMKSYDFENIVLNENKNTILPDPLFVDKCGSTANTTEANEKKPANS
FT                   PFPISISKNFSTSSPLTHVDTPTQEDDASAFNTLKAAKTARIIFPTHTHIKPTKPSPPS
FT                   KELSTNSALKTLSYTDKITGTQKNLPDKTHVDTPTQDDDINATKASKTAKIISTQTHLG
FT                   ETKPIQPAKDPSPRTQKPIAHKADETLTHTDKLTASQNLVPAKTHINTPTQYNDTNATN
FT                   ALKTAKINFSSHSHQSEIKPTQSAKNISPLTQKQFTSESAGTHTHTDKHKNTASQNLFS
FT                   AKTHINSPTQHNYTSAATASKTAKLILSPHSHLSETKPTQPALSPSPLSQKQITSIAAK
FT                   TLTHTNKHTASQNFIPAKTHINIPTQYNDTNATKALKTAKAASPSHTYSRQTKPIKSAI
FT                   NALHPAQDTNPSPAISAVTYTDKPTATQNIFPVKTFAELVRENAKRLPTPMQNSHQAKN
FT                   DSAALGRPPTAARKNLNKTLISPKTPGKRRGDCLDEGLLQTSNKKVRIRDDFSDDDLGV
FT                   TNLLSETPLFKSKAAIKIRQDSRRDSLQKSAEMDTAPAISPSNTAADSDLPPWKTVPAS
FT                   RKPPSIFLSNIQQIIPLIEKLNYKAGVNSFTTKSELGNNIRIQAKTMDAHNAIQNVLLE
FT                   ANIPLHSHQPKSAKGFQIVIRHLHQSTPTKWIESQLQDIGIATKFIRAMQFRDTRNPMR
FT                   IHEVEVVPKADGSHLKVLLLKSLGGQTVKVERKRVSKDPTQCHRCQCFGHTKNYCRNPF
FT                   KCMKCGQLHATVSCTKPKNLPATCANCNGSHVSSYKGCPAFQEAKQRLSINKIQSLHSQ
FT                   PTHLQTPRNKHPYPKPTHLQTPRNKQPYTHPLPRTSVNNTKLPAKRIQGKKISQRNLSI
FT                   NKRLHRMKKPRKETSPPTTSKKVLASLEESRKNPNSVLNPANTHLTHFRPPPLAQNIPN
FT                   DEPKELSGEQYLLNRIEGMEKKINNLLEIVTRLLRQGKDCPKSPKNPFRDPIFV"
FT   SO_feature      CDS ; SO:0000316:4131..7385
FT   SO_feature      start_codon ; SO:0000318:1..3
FT                   /name="Dmel\TART-element\pol"
FT                   /db_xref="FLYBASE:FBgn0014072"
FT                   /db_xref="REMTREMBL:AAC46494"
FT                   /db_xref="GI:603664"
FT                   /db_xref="NCBI_PROTEIN:AAC46494.1"
FT                   /translation="MTRADNRDILKIAFWNAGGINNKIDELKLFILNIDAHIIIVTETR
FT                   LDNNSTKLELPGYFTYLAQNPVSSKRGGVATIVNSSIRHMALKPIEKECIQSAPIVLLP
FT                   ENNRRSEMIVIASVYCPPSLRWLPHHFTDVLNFAEKTLGGQTKFILCGDWNAKHRQWGC
FT                   TRACQRGTALYEAVQADSTAEIIATGCATHFPHDTRKNPSAIDFSICKGLGRFEKRISS
FT                   GADLSSDHLPILLEINLDTNTLFLQKQNNNILKKNTNIELFKKVLERKILLNTEIRVAE
FT                   DINDAISTFMKNIKDSAAESTPSPRIRDNPRRRHRQANRNSHTLALDENTSRLLEEKRI
FT                   LSRVFKATKNYEDKAKLKAAENRLKKAIKILRENRINEQVEGIDTSNPDRMRKMWKLLD
FT                   EGKRTNQPNFPLKLETQKGPKWTKTIKETTETFVSHLEGRFKPNNNVPDYHIDRVNTGL
FT                   RIIKESMLTERHNLNKNPHNQPITLKELNDEIKNLKNSKAPGKDLITNQLIKTLPTKAT
FT                   LYLILIYNSILRLGYYPEAWKHAQVKMILKPGKSANEPRSYRPISLLSGLSKIFERLLL
FT                   KRLFKVDLFKKAIPLHQFGFRKEHGSEQQIARVTQFILEAFERKEYCSAVFLDISEAFD
FT                   RVWHEGLLLKLAKILPYNLYIILESYLTNRTFEVKDQAGETSRTGQIGAGVPQGSNLGP
FT                   LLYSIFSSDMPLPYIYRPSPTERIMLSTYADDTIVLSSDTLATAATRNNENYLKSFSDW
FT                   ADKWGISVNAAKTGHVIFTLKNDLPTSLRTMKIKGQVIKIESKQSYLGVILDSKLTLSS
FT                   HVTKLMGKYTTAYRKMTWILNRRSKLPTKTKMLILKSVLSPIWQYAIAAWGPLVTDAQI
FT                   RRIQVEENRKMRDICRAGRYTSNQTIRDRYGIKTVEEFYQQALHRFSETIKSHPNIAVR
FT                   RIFTRHYIPNRLERSRQRYLKMTNEHITQKQTGQTLSPKLLKIPDLNDCRTLKKRNERD
FT                   KIRQTHLIELPTLLRLEEEEEELRRIKKQEERERREKETQKWPPDRWCELEINLYNKQY
FT                   RRGDLTRQEIIQKFRGQPLNVQRIILPDYKGDQEHN"
XX
CC   A PNTR (Perfect Non-Terminal Repeat) is a perfect direct repeat partially
CC   overlapping the UTRs (annotated as "direct_repeat ; SO:0000314").
CC   Distinguishing characteristics of PNTR’s are that the 3’ repeat terminates
CC   upstream of the 3’ end of the element and that the 5’ PNTR extends a short
CC   distance into ORF-1. The 5’ ends of TART-B elements are variable and the
CC   minimal size for functionality has not been determined.  Thus, this
CC   canonical sequence, U14101, may be 5’ truncated within the 5’ PNTR (M-L
CC   Pardue, 2009).
XX
CC   Derived from U14101 (g603662) (Rel. 42, Last updated, Version 1).
CC   Takis Benos and Michael Ashburner, 20-Aug-1997; updated Jan-2009 as per
CC   Mary-Lou Pardue and Greg DeBaryshe.
CC   Any changes to original sequence record are annotated in an FT line.
XX
SQ   Sequence 10654 BP;  3669 A; 2717 C; 2036 G; 2232 T; 0 other;
     GATCCGGCCG GATGGCAGCT CGACGACGGT AGCAGGCCAC CATGCCCGCC AGCCCGCAGC        60
     TAGGATAGCA GCAACATCAG CGTCTTATTA ACGCGAACGG CGGCACTGGC CCTTAGCTGA       120
     CCAGCTGCAA CAACATCAGC GACGCAGTCT CCACCAGCAG CAACAACAGC AGCGGCGCTT       180
     GCGACAGCAG CAGCAGGGAA TGGTTCTGCC GCAGTCGCCT ATTGCTGCCT ATAAAGAGCA       240
     TTCCTTGCCA ATTGGCTTTC TGTACGACGA CGATGATCCT GCGGACAAAT CCACCTTTCC       300
     GGACGCCTGA GTATTATGGC GAGCCTGCTG ATCATTGTTT CTCCGACTCC TTACTTGACC       360
     ACTGGACAAT CATACAATCA CCGGCTTTTC ACATCTGGAA GAAAGAAACC TGGATTAGTA       420
     TTTGCCCTTC AGATTTGTAT GAAACTGCAT TTCTGGCCAA CCGGAGTGTT TCCTGCAGAC       480
     GACGCTGGAC TGCGACGCAC TTTTTTCTAC CAACACAGAT GGGACGCTTG CATCAGATCT       540
     GACGGGCCAG ACTGGCCGAT GCCTGGTACA CGATGGCATC TCCGCGGCGG CGAGATGTGC       600
     AGCGACGCTG AAAGCAATAA TAATTCTTTT ACTTTGCAGT ATCAAAAATG AGAAGCCACA       660
     TCACAATTTA CATCAGCAAA AATTACACGT GATATCTTTT TCTTTTGCCT AGGAGTAGTG       720
     AGACCTGCTA CCAAAATGAC CAGTAATACC GGCTAACGGA AGCGAGATAT CGATAATCAT       780
     TCTGGCGGTA AAATAGCCAG AACATCGATA ACCAGCTGTG CATTTTCCCT TCGATTTATC       840
     GAAGTCAAAT AGCCCGCCTA GGCTATCGGA CCGGATCGGC AAGTCAGTAG TGATTAAAAA       900
     TCCGGCAGAG GCGCCTGTGC AGCAGCTACC CAAAGTGAAC ACGACGAAAC GCAACAACAA       960
     AATGGACGGA CATAATGGAG ATCAAAGTGA AGGATGGGCA ACAGTGCTAT CTATCTCCTC      1020
     GGATGATAGT AACTCCTTGT CGTCGCCGCC GTCTATAATA GTTTCATCGC TGGACACCAC      1080
     GCCAACTTCG CACGAAACCA CCATAGTAAG AAGAAGCCTA TATCAAACAA ATGCTGACAT      1140
     GAAATCTTAC GATTTTGAAA ATATTGTATT AAATGAGAAT AAAAATACCA TATTGCCAGA      1200
     CCCTTTATTT GTTGATAAAT GCGGGAGTAC TGCTAATACC ACAGAAGCCA ATGAAAAAAA      1260
     GCCTGCCAAT AGCCCCTTCC CCATTTCCAT TAGCAAGAAT TTTAGCACTT CCTCGCCACT      1320
     AACACATGTA GACACGCCTA CACAAGAAGA TGACGCCAGT GCGTTCAATA CATTGAAAGC      1380
     AGCTAAAACA GCTAGAATAA TTTTTCCCAC ACACACACAT ATAAAGCCCA CCAAACCCTC      1440
     GCCCCCCTCC AAAGAATTAA GCACAAACTC AGCACTAAAA ACTCTCAGCT ACACAGACAA      1500
     AATAACAGGA ACACAGAAAA ATCTACCCGA CAAAACACAT GTAGACACAC CTACACAAGA      1560
     TGACGACATT AATGCAACCA AAGCATCAAA AACCGCTAAA ATAATTTCTA CACAGACACA      1620
     CCTAGGTGAA ACCAAGCCAA TACAGCCCGC CAAAGACCCC TCACCCCGCA CCCAAAAGCC      1680
     TATTGCACAC AAAGCTGACG AGACACTTAC CCACACAGAC AAACTCACAG CATCACAAAA      1740
     CCTCGTTCCC GCCAAAACAC ATATAAACAC ACCCACACAA TATAACGACA CTAATGCAAC      1800
     CAATGCATTA AAAACCGCTA AAATAAATTT CTCTTCACAC TCACACCAAA GTGAAATCAA      1860
     GCCAACACAG TCCGCCAAAA ACATTTCACC CCTCACACAA AAGCAATTCA CAAGCGAATC      1920
     AGCCGGGACA CACACCCATA CAGACAAACA CAAAAACACA GCATCACAAA ATCTCTTTTC      1980
     CGCCAAAACA CACATTAACT CACCCACACA ACATAACTAC ACTAGTGCAG CCACAGCATC      2040
     AAAAACCGCT AAATTAATTC TCTCCCCACA CTCACACCTA AGTGAAACCA AGCCAACACA      2100
     GCCCGCTTTA AGCCCCTCGC CCCTCTCCCA GAAGCAAATA ACAAGCATAG CAGCCAAGAC      2160
     ACTCACCCAC ACAAACAAAC ACACAGCATC ACAAAACTTT ATTCCCGCCA AAACACATAT      2220
     AAACATACCC ACACAATATA ACGACACCAA TGCAACCAAA GCATTAAAAA CCGCAAAAGC      2280
     AGCTTCTCCC TCCCACACAT ACTCACGTCA GACAAAACCA ATAAAGTCCG CCATAAACGC      2340
     ATTGCATCCC GCCCAAGACA CAAACCCAAG CCCAGCAATC AGTGCTGTCA CTTACACAGA      2400
     CAAACCCACA GCTACTCAGA ATATTTTTCC TGTCAAAACT TTTGCAGAGC TGGTTAGGGA      2460
     AAATGCAAAA CGCTTACCAA CTCCAATGCA GAATTCCCAT CAAGCTAAAA ATGACTCTGC      2520
     CGCTCTCGGA CGCCCCCCGA CTGCAGCTAG AAAAAATCTA AATAAAACAC TGATTTCTCC      2580
     TAAAACTCCT GGGAAGCGCC GTGGGGACTG TCTTGATGAA GGCCTACTAC AAACCTCTAA      2640
     CAAAAAGGTT AGAATACGCG ATGACTTCTC TGACGATGAT CTTGGGGTCA CAAATCTACT      2700
     CTCTGAAACA CCCTTATTCA AAAGCAAAGC AGCTATCAAG ATCCGGCAAG ACTCGAGAAG      2760
     AGATTCCCTG CAGAAGTCAG CCGAAATGGA CACAGCTCCA GCAATTAGTC CCTCAAACAC      2820
     AGCAGCCGAT TCCGACCTAC CGCCCTGGAA AACTGTTCCA GCTAGCAGAA AACCACCATC      2880
     AATCTTCTTG TCCAATATAC AGCAGATTAT CCCGCTAATA GAAAAACTAA ACTATAAAGC      2940
     CGGGGTAAAT AGCTTTACCA CCAAATCTGA ACTTGGCAAC AATATTAGAA TCCAGGCTAA      3000
     AACGATGGAC GCCCACAATG CAATTCAGAA TGTTCTCCTT GAGGCAAATA TTCCCCTACA      3060
     CTCCCACCAG CCAAAGAGTG CAAAGGGCTT CCAAATTGTA ATTAGGCACC TCCACCAGTC      3120
     AACCCCGACC AAATGGATTG AAAGCCAACT TCAAGACATC GGTATAGCTA CAAAATTTAT      3180
     CAGGGCAATG CAGTTTAGGG ACACGAGAAA TCCTATGCGC ATTCATGAGG TTGAAGTTGT      3240
     ACCCAAGGCT GACGGCAGCC ATCTCAAGGT CCTGCTACTA AAATCCCTTG GAGGTCAAAC      3300
     GGTCAAGGTT GAAAGGAAAC GGGTATCGAA GGATCCCACA CAATGTCATC GCTGCCAATG      3360
     TTTTGGGCAC ACAAAAAATT ATTGTAGAAA CCCGTTTAAA TGTATGAAAT GTGGCCAGCT      3420
     GCACGCCACG GTTTCATGCA CTAAACCCAA AAACCTTCCG GCTACTTGTG CAAACTGCAA      3480
     TGGAAGCCAC GTAAGCAGCT ATAAAGGATG TCCCGCTTTC CAAGAAGCAA AGCAAAGACT      3540
     ATCTATCAAC AAAATTCAAT CCCTACACTC ACAACCCACG CACCTTCAGA CCCCCCGCAA      3600
     TAAACATCCC TACCCAAAAC CCACCCACCT TCAGACGCCC CGCAATAAGC AGCCCTACAC      3660
     ACACCCCCTC CCTCGCACAT CAGTAAACAA CACAAAACTA CCTGCCAAAA GAATCCAAGG      3720
     AAAGAAGATA TCGCAAAGGA ATCTATCTAT AAACAAACGC TTACACAGAA TGAAAAAACC      3780
     GAGGAAGGAG ACAAGCCCGC CGACAACTAG CAAAAAGGTC TTGGCCTCTC TAGAAGAAAG      3840
     CAGAAAAAAC CCAAATAGCG TCCTAAACCC GGCCAACACC CATCTCACTC ATTTCCGCCC      3900
     ACCCCCTTTA GCACAAAATA TTCCTAATGA CGAACCTAAG GAGCTGAGTG GGGAGCAATA      3960
     CCTTCTAAAT CGCATTGAAG GGATGGAAAA GAAGATCAAC AACCTTCTTG AAATCGTCAC      4020
     CCGCCTACTA AGACAAGGAA AAGACTGTCC AAAGTCTCCA AAAAATCCTT TCCGAGATCC      4080
     AATCTTCGTG TAAATGCTCT TTCTAGTAAC ATCAGAAAGT GACGTTTCCT ATGACTCGGG      4140
     CTGACAACAG GGACATCCTT AAAATCGCTT TCTGGAATGC TGGTGGGATT AACAATAAAA      4200
     TAGATGAGCT TAAGCTGTTC ATTCTAAATA TTGATGCCCA CATAATCATA GTCACCGAAA      4260
     CTAGACTAGA CAACAATTCT ACCAAACTAG AGCTGCCAGG ATATTTCACA TACTTAGCCC      4320
     AAAATCCTGT CTCTAGCAAG AGAGGAGGGG TCGCTACTAT AGTAAACAGC AGTATCCGAC      4380
     ACATGGCCCT AAAACCGATC GAAAAAGAAT GCATACAAAG CGCCCCAATA GTCCTGCTGC      4440
     CTGAAAACAA CAGACGCAGC GAAATGATAG TAATAGCATC TGTCTACTGT CCGCCCTCGC      4500
     TAAGGTGGTT GCCCCACCAC TTTACTGACG TTCTCAATTT TGCAGAGAAA ACTTTAGGAG      4560
     GGCAGACCAA GTTTATCCTA TGTGGCGACT GGAATGCAAA ACATAGACAA TGGGGTTGTA      4620
     CACGCGCCTG CCAACGTGGC ACCGCACTCT ACGAAGCAGT CCAAGCCGAC TCCACTGCAG      4680
     AGATCATTGC CACTGGCTGT GCTACACATT TCCCACATGA CACAAGAAAA AACCCGTCAG      4740
     CAATAGATTT CTCCATTTGC AAAGGGCTTG GCAGGTTTGA AAAAAGAATT TCTTCAGGGG      4800
     CGGATCTATC CTCAGACCAT CTTCCCATCT TGTTAGAGAT AAACCTAGAC ACAAACACCC      4860
     TCTTCTTGCA AAAACAAAAC AACAATATAC TCAAGAAAAA TACAAACATC GAGCTGTTTA      4920
     AGAAAGTTCT AGAAAGAAAG ATACTATTAA ACACTGAGAT AAGGGTAGCA GAAGATATAA      4980
     ATGACGCCAT AAGCACCTTT ATGAAAAACA TCAAGGACTC GGCTGCGGAA TCAACTCCCT      5040
     CCCCAAGAAT ACGTGACAAC CCCAGAAGAA GACATAGGCA AGCCAACAGA AACAGTCATA      5100
     CCCTCGCACT AGACGAAAAC ACAAGCAGAC TGCTTGAGGA AAAACGCATA TTAAGTAGAG      5160
     TTTTCAAAGC TACCAAAAAT TACGAGGACA AAGCTAAACT AAAGGCAGCT GAAAACCGAC      5220
     TAAAAAAAGC GATAAAAATA TTGAGAGAAA ACAGAATCAA TGAGCAAGTT GAAGGAATAG      5280
     ATACAAGTAA CCCGGACAGA ATGAGAAAAA TGTGGAAACT GCTAGATGAA GGGAAAAGGA      5340
     CAAATCAGCC TAATTTTCCC CTCAAATTAG AAACCCAAAA AGGACCCAAA TGGACAAAAA      5400
     CGATTAAGGA GACAACAGAA ACATTTGTCT CCCACTTGGA AGGAAGATTT AAGCCAAACA      5460
     ATAATGTACC TGATTACCAC ATAGATAGAG TCAATACTGG ACTAAGAATA ATTAAGGAAA      5520
     GCATGCTAAC TGAACGACAT AATCTGAACA AAAACCCCCA TAACCAACCT ATTACTCTAA      5580
     AGGAATTAAA TGACGAAATA AAAAACTTAA AGAATAGTAA AGCACCGGGA AAAGACCTTA      5640
     TAACAAACCA GCTAATAAAA ACCCTACCGA CTAAAGCTAC CCTTTACCTT ATCCTAATCT      5700
     ATAACTCCAT ACTTAGACTA GGATACTACC CAGAAGCCTG GAAACATGCG CAGGTAAAAA      5760
     TGATTCTCAA GCCAGGGAAA AGTGCAAACG AGCCAAGGTC ATATAGGCCG ATTAGCCTAC      5820
     TCTCGGGACT CTCAAAAATC TTTGAAAGAC TACTCTTAAA AAGACTTTTT AAGGTAGATT      5880
     TATTCAAAAA AGCTATTCCT CTGCACCAAT TTGGCTTTAG AAAAGAACAC GGATCGGAGC      5940
     AGCAAATAGC CAGGGTCACC CAGTTCATTC TTGAGGCCTT CGAGAGAAAG GAATACTGCT      6000
     CCGCGGTCTT CCTTGACATC TCTGAGGCTT TCGACAGGGT ATGGCACGAA GGCCTTTTAC      6060
     TTAAATTAGC TAAGATCCTA CCTTACAACT TGTACATTAT ACTGGAGAGC TACCTAACAA      6120
     ATAGAACGTT CGAAGTTAAA GACCAAGCTG GAGAGACTTC GAGAACAGGA CAAATTGGTG      6180
     CTGGTGTGCC TCAAGGAAGC AATCTTGGAC CACTACTCTA CTCTATCTTC TCCTCAGACA      6240
     TGCCCCTTCC ATATATCTAC CGCCCCTCAC CAACAGAAAG AATCATGCTC TCAACATACG      6300
     CAGACGACAC TATAGTCCTC AGCTCAGACA CACTAGCAAC TGCCGCTACA AGAAACAACG      6360
     AAAACTACCT CAAGTCATTC TCGGACTGGG CGGACAAATG GGGTATATCA GTAAACGCTG      6420
     CTAAAACCGG ACATGTCATT TTTACATTAA AAAACGACTT ACCTACAAGT CTAAGGACTA      6480
     TGAAGATCAA GGGTCAAGTA ATAAAGATTG AAAGCAAACA ATCATACCTT GGCGTAATCC      6540
     TTGACAGCAA GCTAACCCTC AGCTCCCACG TCACAAAGCT GATGGGCAAA TACACTACAG      6600
     CCTACAGAAA AATGACATGG ATTCTAAACA GAAGAAGCAA ACTCCCTACC AAGACTAAAA      6660
     TGCTGATCCT TAAGTCAGTC CTTTCACCAA TATGGCAGTA TGCCATAGCA GCTTGGGGTC      6720
     CCCTTGTGAC GGATGCACAG ATAAGACGGA TCCAAGTCGA GGAAAATAGG AAAATGAGAG      6780
     ACATATGCAG AGCGGGTAGA TACACGAGCA ACCAAACTAT AAGGGACCGC TATGGAATCA      6840
     AAACAGTAGA AGAATTCTAT CAACAGGCAC TCCACAGGTT CTCAGAAACA ATAAAATCTC      6900
     ACCCAAATAT AGCTGTACGC AGGATATTCA CAAGGCACTA TATCCCGAAC AGACTAGAAA      6960
     GAAGCAGGCA GAGGTACTTG AAAATGACAA ATGAACACAT CACGCAAAAA CAGACTGGAC      7020
     AAACACTCTC ACCTAAACTC CTAAAAATCC CTGATCTAAA TGACTGCAGA ACCCTTAAAA      7080
     AGCGGAATGA AAGAGATAAA ATAAGGCAAA CCCATCTAAT TGAACTCCCC ACCCTGCTGA      7140
     GACTAGAGGA AGAAGAGGAA GAGCTTAGAA GAATAAAAAA ACAGGAAGAG AGGGAAAGAA      7200
     GGGAAAAGGA AACCCAAAAG TGGCCTCCAG ACAGATGGTG TGAATTAGAA ATTAACCTAT      7260
     ATAATAAGCA ATATAGAAGG GGCGATCTAA CCAGGCAGGA AATCATACAA AAATTTAGAG      7320
     GACAACCACT AAATGTACAG AGGATAATTT TACCCGACTA TAAAGGAGAC CAGGAACACA      7380
     ATTAAAAGTA AATCATGGGA AAGCAGGGGA AAAAAAACAG AAGTAACAAA ATGGCGGAAG      7440
     GGGTGGCAAA ATATATATAA AAATAAGAAA AGATAGAAAT AAAAAGGCTA AAGGCTCACT      7500
     TACAGGTTAA TTCAAAAGGG AAACGTGCTT ACATATCTAA TGGTAAAAAC TAACTTATAA      7560
     CACCTACTGG ATGACATAGT GAGGATGCCA CAGGTTGCGC ACTTGAATCA CGCTTTCCTG      7620
     GCGAGATTGT TAAGGCATCA CCGGGATCCC GTCTCTCTTT CCTAACTGGA GGACTCATGC      7680
     CTGAAATCTT TTCCGCTTCA CCGGCACCTG ATGGCCATAT CTGCTACTGC GCCTTGCGTC      7740
     CACGGACGCT CCTTCCTGAA AGAAAGAGAA TTTGTTTTAG TTTTCCTTTC TCTTCTTAAA      7800
     AATATAACAA AAACAGCAGC AGTAGCCGAC CAACAACATA CTTAGCTTAC CAAGGCAGCA      7860
     GCAATGATAC CAACAGAAGC CCTACAGTGT GCTGAACAAT ATGCCGCCCA CGCCCACCAC      7920
     TTCTGGAACT CAGGAATGGG GGGTACGGAA TGCCGGAAAC TGGAGGATTC GCCTCAAATG      7980
     TTACGCTTAC ATCTTTGAGC AAATCGCCTG CCTCCTCGTC TAACGGCCCG GCGTCTTGGT      8040
     ACGCCCAGAA GTAGCAGCGG TAGCAGGATT AGCAGCCTCC ACAGAGATAT GTTCATCCCA      8100
     GCATCAGTCC AGTTGGCATT GTGATGCCGC CGTAGCGTAC GCCCTCAGAG ACCCGACTGG      8160
     AATCCCAGGA CAAGAGACGG CAGCACGCCT GGGCTTAGGC GCGGGACAAC ATGCAGAGAT      8220
     TCGTCAATGA GAATGGCGGC ACTGGAATCA CCTTTCAGCT GAGCGGGATA ATGAGTCGGC      8280
     AACGCACCGC ACTATCAGCA GCAATAACAA CATCGGCAGA TGACCTGGAA GAAAGGAAAA      8340
     AACATGTATC AGTCTTTTCT TTTCTTTTTT TTTCCCATTA GCATGCGTTT TTAAATTCCA      8400
     TTCCTGAAAA CCGGCGTTTT CCTGTAAAAG ACACTGGACG GCGGCGTTTG TTTTAAATGC      8460
     AAAGATTGGA TGCTTGCATC AGGGCTGACG TCCTTGAATA GCCGATGCCT TGTAATTGCC      8520
     TGCATAGCCG CGGAGGTCCT GATGACGGAT GCTGGCCTGT ATTTGGCCAC CACTCCGATG      8580
     CCATGACAGC AGCAACAGCA GCGGTTTTTG CAAATGAGAG GGATCAGGAG GCGGCAACAC      8640
     ATTCACCCGT AGCAGCAACA ACAAGCAGTG GTAGCATCAG CAGGGAGTCT TCTCGCCACA      8700
     ATAGCCATTT GGAAATTTCT CGACGACCCG ACTTCCTGCT TGGCCCATGG TCAATCACAC      8760
     TGGACCAGTT AACAGCGGCG TTTTACCCTG GAAGAAAGAA AACTTGTATT ATTCATTCCC      8820
     TTTTCTCTCA CAGTTGGGTA TTTAAGTGCA TTCCTGGCCA ACCTAGCGTG TCTCCTGGCA      8880
     ATGACGTCGG ACTCAACGCA TGCTTCCCTT CCGACACAGT AAGGATGTTC GCATCTGGGC      8940
     TGACGGGCCA GGCCGGTCCG TTGCCATACA TGCTAGCGTT TCCGCGGCGG CGTAGTGAAC      9000
     ATCAAACCGT ATAATGGCGA AGACGACGAT GATCCGGCCG GATGGCAGCT CGACGACGGT      9060
     AGCAGGCCAC CATGCCCGCC AGCCCGCAGC TAGGATAGCA GCAACATCAG CGTCTTATTA      9120
     ACGCGAACGG CGGCACTGGC CCTTAGCTGA CCAGCTGCAA CAACATCAGC GACGCAGTCT      9180
     CCACCAGCAG CAACAACAGC AGCGGCGCTT GCGACAGCAG CAGCAGGGAA TGGTTCTGCC      9240
     GCAGTCGCCT ATTGCTGCCT ATAAAGAGCA TTCCTTGCCA ATTGGCTTTC TGTACGACGA      9300
     CGATGATCCT GCGGACAAAT CCACCTTTCC GGACGCCTGA GTATTATGGC GAGCCTGCTG      9360
     ATCATTGTTT CTCCGACTCC TTACTTGACC ACTGGACAAT CATACAATCA CCGGCTTTTC      9420
     ACATCTGGAA GAAAGAAACC TGGATTAGTA TTTGCCCTTC AGATTTGTAT GAAACTGCAT      9480
     TTCTGGCCAA CCGGAGTGTT TCCTGCAGAC GACGCTGGAC TGCGACGCAC TTTTTTCTAC      9540
     CAACACAGAT GGGACGCTTG CATCAGATCT GACGGGCCAG ACTGGCCGAT GCCTGGTACA      9600
     CGATGGCATC TCCGCGGCGG CGAGATGTGC AGCGACGCTG AAAGCAATAA TAATTCTTTT      9660
     ACTTTGCAGT ATCAAAAATG AGAAGCCACA TCACAATTTA CATCAGCAAA AATTACACGT      9720
     GATATCTTTT TCTTTTGCCT AGGAGTAGTG AGACCTGCTA CCAAAATGAC CAGTAATACC      9780
     GGCTAACGGA AGCGAGATAT CGATAATCAT TCTGGCGGTA AAATAGCCAG AACATCGATA      9840
     ACCAGCTGTG CATTTTCCCT TCGATTTATC GAAGTCAAAT AGCCCGCCTA GGCTATCGGA      9900
     CCGGATCGGC AAGTCAGTAG TGATTAAAAA TCCGGCAGAG GCGCCTGTGC AGCAGCTACC      9960
     CAAAGTGAAC ACGACGAAAC GCAACAACAA AATGGACGGA CATAATGGAG ATCAAAGTGA     10020
     AGGATGGGCA ACAGTGCTAT CTATCTCCTC GGATGATAGT AACTCCTTGT CGTCGCTGCA     10080
     TATATAAAAT AATAAATTTC TTAAAATAAT TTCATCGCTG GATTCCTGCG CCACCATAAA     10140
     TTACTTATAG AATACACTTA ACACTGTACC CACTAATGCT AAAAATTTTC TTATACAATT     10200
     TTACTTTAAA GCTAAAACTA CTTAAACTAT GGCGCGTAAA ACGGCCGTCA AAAATATCCA     10260
     AAAATTGTAC TTGCCATAAA CAAATTCTAA CATAATGTAA ATCCTAAATC GTAAAATCAT     10320
     GGCGAACATA ACCGCCGCCA AGCAAATCAA AAAATGTTCC TAGAAATTGT AAATCTTAAA     10380
     CCTACTTCTC TAACTAAAGC GCGCACAACT GCCGCTGATC CGAAATTGTA AAATGCCATA     10440
     AATTGTAACT ATATATTTTA TAAAAAAAAT CAGAGTACAA TAAAATGACA GCGCCGAAAG     10500
     GCACTGAAAA TATTTAAAAA AAAAAAAAAC TGCCGCTGAT CCGAAATTGT AAAATGCCAT     10560
     AAATTGTAAC TATATATTTT ATAAAAAAAA TCAGAGTACA ATAAAATGAC AGCGCCGAAA     10620
     GGCACTGAAA ATATTTAAAA AAAAAAAAAA AAAA                                 10654
//
ID   TIRANT   standard; DNA; INV; 8526 BP.
XX
AC   nnnnnnnn;
XX
DR   FLYBASE; FBte0000179; Dmel\Tirant.
XX
SY   synonym: prygun
XX
FT   source          X93507:1..2484
FT   SO_feature      five_prime_LTR ; SO:0000425:1..417
FT   SO_feature      three_prime_LTR ; SO:0000426:8109..8526
FT   SO_feature      CDS ; SO:0000316:1866..2999
FT   SO_feature      CDS ; SO:0000316:3239..6505
FT   SO_feature      CDS ; SO:0000316:6683..8146
XX
CC   Sequence identified by REPBASE:
CC   http://www.girinst.org/server/RepBase/RepBase6.6.embl/drorep.ref
CC   Assembled and annotated by Josh Kaminker & Michael Ashburner.
CC   REPBASE states this to be a consensus sequence.
CC   This replaces that from X93507 in versions previous to 4.8.
XX
SQ   Sequence 8526 BP; 2961 A; 2097 C; 1384 G; 2084 T; 0 other;
     GGAGTTACCA CCCCACCCCC TAAACCCCCA CGCCTCTAAA CAAATCATCG GACACTCAAC        60
     CGGGAAGACG GCAACTGGAA CACCGCATCC GGCCGAATGC TGACATTCCG GCCGAATGCT       120
     GACATTACAC AAAAGTCGCA CTGCAACATT GTCCCCAGCT AGCCAGCCAC ATGCCGAGTC       180
     GGCATGTTCA TTATGCTTAC AATTAAGAAC CTATGTACTT ATGTATAAGA CGAAAACGGA       240
     GGACTCGAGT AGCCACTCTC TGACAATAAA CTTGATACTG ATTTTGAACT TCAAGAAAGT       300
     CAGTCGTATT CTTTATTGGA AATCTTCACA CTACAACTAT CTGCTGAAAC TTAAAAACCT       360
     TCATACATTT ACACATCATA TCTTCACAAA AGGCTCCACC CTCGATCACG GACTTAACTG       420
     GCGCAGCCGG TAGGATGTCC TACCTATTAA TAATTACCTA CCTGTAAGTA AACATGTAAG       480
     AAACGAAACA AACTATATGC AAGATGTCGA CTGAAAGTGA CTAGGAACAA ATTTTTATAA       540
     AACAAAATTG AAGTTGTGAA GTACCAAATG AAACTCAAAC ATATATTCAA ACACAGGAAA       600
     AAAAAAGAGA GAGGAAAAAT GTAAAATAAA TAAATATACA AAAAAAAGTG CAAGTGTACC       660
     GTACTGCCGC GCTGACGTGG AATCTATCGC TGATCATCAC GCCATCGGTA TGTCCATACT       720
     CTGCCGAACG TCATAATTTT TTTAAAAAAG TGCAAGTGTA CCGTACTGCC GCACTGACGT       780
     GGAATCTATC GCTGATCATC ACGCCATCGG TATGTCCATA CTCTGCCGAA CGTCATAATT       840
     TTTATAAAAA AGTGCAAGTG TACCGTACTG CCGCGCTGAC GTGGAATCTA TCGCTGATCA       900
     TCACGCCATC GGTATGTCCA TACTCTGCCA AACGTCATAA TTTTTATAAA AAAGTGCAAG       960
     TGTACCGTAC TGCCGCGCTG ACGTGGAATC TATCGCTGAT CATCACGCCA TCGGTATGTC      1020
     CATACTCTGC CAAACGTCAT AATTTTTATA AAAAAAGTGC AAGTGTACCG TACTGCTGCG      1080
     CTGACGTGGA ATCTATCGCT GATCACCACG CCATCGGTAT GTCCATACTC TGCCAAACGT      1140
     CATAAGTTTT TATAAAAAAA AAGAGTGCAA GTGTACCGTA CTGCCGCGCT GACGTGGAAT      1200
     CTATCGCTGA TCATCACGTC ATCGGCACTT ACATACGCTG GCCAACGCAT CGCCAAAGCC      1260
     TCTATATACA CTTATATATG TGAGCATACA ATATCAACTA CAATCCAATA CATCCACGTA      1320
     CTGTACCGCC TCGTTGGCAT GGAATCAAAC GCTGATCACC ATGCCACCGT GGTAAACAAA      1380
     CAAAGCACCA AAGCCTCTCT AATACATTGT ACACTCAAAA CGCACACTGC CATACGTCGG      1440
     CGAAAAATCA AAACATAAGC AAAAATCATT TCAAACCAAG CGAGGCTCAT TCTGCGTACC      1500
     ACAACGACAA CGACACTGCA TGTGTAGTGG CGCACCCATG TCTGGGTAGC CGAGGTAAGG      1560
     GGAAAACGCT TGAGTATCGT CAAGTGTTCT TGCCTTTCAC TCTTCTACAA TGGGTTGCTA      1620
     CGCTCATGTA TTGCACATTC AAAATAACCA AAACAAATGT ACTAAAGAAG TCGACATATA      1680
     CAGATATATT TTGTTTCCTT TCATTGTGTA ATTTTGTATA TCAAACAAAT ACTAATACCA      1740
     ATCACATTGC AGAATATAAA AGGGAAAATA TAAAGCCAAA GACAGACACC CATACACTCT      1800
     AGTAAACAAG AAATTTGTTC ATTATTTTTC AATCATACAT AATATACTAA GTAACCTCAA      1860
     ATTTAATGTC AAAAAAGTTC GTTTACAACC TTAGGAAAAC TACACGTTCA GTTGTTGGAG      1920
     TTCCACCAAA CACTAATAGG CCCCCACATC CCGTTAGACG TCCTGACTCC CTTCTCCCGA      1980
     TTTCGGAAGA ACCCAAATCA ATATCTTCCC AAACCCCCAA TATGGACTCG GGAAACGATT      2040
     CTGCCCGCCC CACTCCATCC CCTCTGGCGC CCACTGTCAG TGGTATTAGC TCCTTAATTT      2100
     CAACTACGTT CAAGCCTAAA GATATCATGG CATTTGTTGA GCATTTGCCA ACCTTTGATG      2160
     GTACACCTCG TCTATTGGAC AGGTTTATCA CTAGCGTAGA AGAAATCCTG ATGCTCATCA      2220
     GGGGAGCTGA CCAAACACCG TATGGCCTGC TTACTCTGAG GACCATCAGG AACAAAATCA      2280
     TTGATAGGGC CGACGAAGCC TTGGAACTGG CAAATACCCC CTTGGTTTGG GATGAGATTA      2340
     AAAGCAATCT CATCCGCCTC TACTCGAGCA AGAAAAGCGA GGCCAACTTG TTAAGCGAGC      2400
     TTAACACATT TTCGGACAAC CTGACCTTGG GCCAACTGTT CTTTGGTATA TCAAAGGTGA      2460
     GAAGCCAACT CTTCTCCATA CTCAAAAACA GCGAACACAA CAACACTGTT GTAGATGCAA      2520
     AAAAGGTTGT CTACAACGAG GTTTGTCTCA ATGCTTTTAT GACTGGTTTG AAGGAACCTC      2580
     TCAAGACTTT CGTCAGGATA AAGTCCCCTT CTACACTTGA ACAGGCGTAC GAGCAATGCC      2640
     AAATAGAGCA GACCTTATAT AGGGCACAAA ACAAGCGAAC CAACAGACCA GAGCAGGGAC      2700
     CCAATGGATC AGACAATAAA ACCTACCGAA ATAGCTACGA CAGCAATTAC CGCAGCGGAC      2760
     GTAACGACCG AAATGACCGT AGGGGACCCT ACTCTAACTC TAACTCTAAC TCTAACTCTG      2820
     GCCAAAATAG ACCATTTAAT TCACACAATC GCACACCCCA ATCCGGCACC AAGGACAACC      2880
     GGGCCAATAC ATCAAACCCC TTTCGAGCAC CTTCACATAG TTTGAATAAT ATAGAGGAGA      2940
     ACCCTCAACC TGATTCGAAT TTTCAGCAAA CGGCCTCGGG AAACCAACAG GGTACATAAG      3000
     CCCAGCCACG CACAACCCCT CGCTTCCTTT TATAAAAATC AAACTATCCC AGACAAACCC      3060
     CCTGAAGTTT TTAATTGACA CAGGCTCTAC ACACTCCTTC ATCGACCCAA AATATGTCGA      3120
     CCCTAGGAAC TGTGTGACCT TAGATACGCC CATAACACTC AAAACAGCCC TGAACAGTTT      3180
     TAAAATATAT CAAAACGTCT CTATACCATT TCCACCGGAA TTCCAAATCA CGGGCAAAAT      3240
     GACCCTTCTA CCTTTCAAGT TCCACTCTTA TTTTGACGGA TTGATAGGAA TGGACTTATT      3300
     ATCTTACCTA AAAACAGAAA TAGATTTACT TAACCTAAAT CTAAAAACCC CAAGTACCAT      3360
     TATACCCTTA TGGACCCACA GTAACTCAAC TTCAAACGTA TTTAATATCT CTGGACATAC      3420
     GAAAACTATT TTGCCACTAC CAGTGGAAAC CAAACAGGGC GACTTCTACA TCGATTCAAT      3480
     TACAATCAAT GATGACTTAA TAATATCAGA CGGGATTTAT AATGCCCAAA ACAATATTGC      3540
     TAATTTCGTT ATCACAAACT ATAGCGAGAG GGATCAGTTA TTGTACCTCG AGAGCCCGAT      3600
     AAAAGGCATG CCATACTCCA CGGCCAACAA TGTTGAACTT TTCAGTATCA CTTCAGACAC      3660
     CCCACAGCCC CAAAACTCCG CAGCGTCGTT ACAAGCCCTT GGCGTCGATC ACCTCTCCTC      3720
     TGAAGAGAAA CAAAGCCTAC TTTCACTTTG CAAAAGTTAT CTAGATATCT TCTACAATGA      3780
     AGACAAATCA TTGACCTTCA CCAACAAGAT TACACACACG ATTAAAACCA CGGACGACAC      3840
     CCCCATTCAT ACAAAATCTT ATAGATATCC TTACATTCAT AAAGAGGAGG TCAAAAAACA      3900
     AATAGAGGCA ATGTTAAATC AGGACATTAT CAAATCCAGT TATTCCCCGT GGAGCGCCCC      3960
     CGTCTGGGTC GTCCCAAAGA AAATCACTCC TACGGGAGAG CAAAAATGGC GTCTAGTTAT      4020
     CGATTATAGA AAACTCAACG AGAAGACTAT ATCCGATAGA TATCCAATAC CTAACATCGC      4080
     GGATATCTTA GACAGATTGG GCAAAGCCAA ATATTTCTCC ACACTTGATC TGGCAAGTGG      4140
     ATTCCATCAG ATAGAAATGA ATCCCGACGA CACACCCAAA ACTGCATTTA CAGTAGAGGG      4200
     GGGCCACTAC GAGTTCATTA GAATGCCGTT TGGCCTCAAA AATGCCCCAG CCACATTCCA      4260
     AAGGGTGATG GACAATATTT TTGGAGACCT TATCGGAACT ATCTGCCTAG TTTACCTAGA      4320
     TGATATAATA ATTTTCTCAA CCTCCTTACA AGAACACTTC ATACACTTGA AAACTATTTT      4380
     TGGAAGACTC AGATCTGCCA ACTTTAAAGT CCAACTCACA AAATCCTACT TCCTCAGGCG      4440
     GGAGACAGAA TTCCTTGGCC ACATCGTTTC ACAAGAAGGT GTTAGGCCAA ATCCCAATAA      4500
     GATCGAAGCT ATAAAAAACT TTCCATGTCC CCACAGTAAA AAGTCAATTA AGTCTTTCCT      4560
     AGGCTTGTTG GGATATTACA GAAAATTTAT CAGAGATTTT GCGAGACTTA CCCAACCCAT      4620
     GACACAAAAA TTAAGGGGAA ACAATAAATC GATCATAATA GATGATGAAT TCAAAAAGGC      4680
     CTTTGAATAT TGCAAAACCT TACTGTCTAA CGACCCAATC CTCCAATACC CGGACTTTAC      4740
     AAAACCTTTC ACACTAACCA CGGACGCAAG TAATTTCGCA ATAGGAGCTG TCCTATCCCA      4800
     AGGTCCGGTG CATAGTGATA GGCCCGTATG TTTTGCTAGT AGAACCTTGT CGGCTGCGGA      4860
     AACAAATTAT TCCACAATTG AGAAGGAAAT GCTGGCCATT ATATGGGCGG TCCAATACTT      4920
     CAGACCCTAC CTCTTTGGCA GGAGATTCAC TATAATCACC GATCACAAAC CACTAACTTG      4980
     GTTAATGAAT TTCAAACAAC CAAATTCTAA AATAGTTAGG TGGAGACTCC AGCTTCAGGA      5040
     GTACGATTTC GAAGTCGTCT ACAAGAAAGG CTCTCAAAAT GTAATTGCTG ATGCTCTCAG      5100
     TAGACCAGAG GCCTCTGTCA ACCATAACGA AGCCCTATCA ATTCCTCAAA ATGTTTGCCC      5160
     CATCTCAGAG AAACCCCTTA ATGATTTTAA TATTCAGCTC CTGTTCAAAA TAACCCCAGA      5220
     TACAAATAAC GCCACACTGA CCCCGTTTAA ACACAAACTT AGGAGGGAAT TCTGTAAACC      5280
     CAATTTTCAG TATGACGACG TAGTTTGCAT TCTTAGGCAG TCGTTAAAAC CAAACAAGAC      5340
     ATGCGCGGTA TTTGCCCCCG ACCACATTTT TCAAATGGTG GAACAAGCCT ACCAAACCTA      5400
     CTTCTCAGCC CACAGTCAAT TTAAACTCAT TAGATGTTTG ATCTTCCTCC CCGAAATTAC      5460
     TGATAGTACG GAGATCGAAA AAATTATAAC CGACTATCAC TATAATAGTA ACCATCGAGG      5520
     GATCGATGAA ACATATTTAC ACATAAAACG ACAACAGTTC TTCCCACATA TGAAGGAGAG      5580
     AATAACTCAG TTAATTCGAA AATGTGAAAC ATGTTTAAAA TTAAAATACG ACAGACAACC      5640
     TCAAAAGATC ACTTACCAAA TATCCGAACT ACCTTCAAAA CCGTTGGACA TCTTACATAT      5700
     AGACATTTAT ACTATTAACA AAAATTATAA CCTTACTATT ATCGATAAAT TTTCTAAATT      5760
     TGCGGCTGCC TACCCTATAA CTAATAGGAA TTGCATTAAC GTAGTTAAAG CCTTAAAACA      5820
     TTTCATTTCC CAATTTGGTA TTCCCAAAAA GCTGATCTAT GATCAGGGAG CAGAATTCGC      5880
     TAGCGATATG TTCAATAAGT TCTGCACTCA ATTTAACATT GACCTACACG TTACGTCCTT      5940
     TCAACAATCC TCTAGTAACT CTCCCGTTGA ACGGCTTCAC TCGACACTAA CTGAGATTTA      6000
     CAGAATAATA CTTGACGTCA GGAAACAACA GAAACTCAGT AGCGAGCATG ACGAGATAAT      6060
     GTCCGAAACC CTAATCACAT ATAATAACGC TATTCATTCT GCAACTAAAC ATACCCCCTT      6120
     TGAACTATTT AACGGACGTA CTCATATATT CAACCAAACA ATCCAGTTCA ATAACGAACA      6180
     CGACTACTTA ACGAAATTAA ATGAATTTCG CGAGAAGTTG TACCCCCTCA TCACGGACAA      6240
     ACTTTCAAAT GACGTAGTTA GGAGAACCCT AAAATTAAAT GAAACCCGAA CAGACCCCGT      6300
     AGACCTACAA CCAGACACTT TAGTCCTTAG GAAGGAAAAC AGACGTAATA AGATTACACC      6360
     CAGGTTTTCG ATTCACAAAG TCAAACACGA CAAAGGTCAT ACATTGATAA CTGCTAGGAA      6420
     TCAAAAACTA CACAAATCAA AAATTCGAAA AACAGTTTTG AAAAAAGACA AAAGCAACAA      6480
     CGTACCCAAC ACTGATAATA ACTGACCCCA CTACCTCTTA ACTTACCATT TCAGGTTCAC      6540
     CCTTGTGCCA ACTCAGGCTA TCCATGTCCA TTATTTAAAT GATAACGCCC CTATAGCCAA      6600
     GATAGAACTA GGGAAAGCCT TACTAATTGA GAGGTACAAA ATAATTAGTC ATGTAATCAA      6660
     CCTACAAGAC TACAGCAGAT GTATGGAACA ATTCCATCTG ACCATTAATA AATTTAACCC      6720
     CGATTCCACG TTGACGGACT CCGTCACAAT TTTAAAAACC AAATTAACCC AAGCCCAAGT      6780
     AAAGCTCAAA GCCCTTACAC CTTCATATAG AAACAAACGG GGTTTGATTA ACGGATTGGG      6840
     GAGTCTAGTA AAGGTGGTTA CCGGCAACAT GGATGCCAAC GACAATAAAG AAATACATGA      6900
     AGAACTTGAC AATATAAAGA AAAATTCCGA AGTCAGTAAC GACAATCTCC AAAAACAAGT      6960
     AATGTTTAAC AACGAAATAC TTATCCGGTT CGAAAATATC ACGGACCATA TAAATAATGA      7020
     ACAAATTTTG ATAAGTAAAT TCTTTGATAC CTCACAAAAC AAAATATACA AACACTTAAA      7080
     CTTACAAGAT ACCCTTCTGG AAGAAATACA ATATTTAAAT AGGATTAATT ATAACATAGA      7140
     ATTATTCATT AACCACCTAA ACGACATAAC AGAAAGTATG CTATTGGCGA AAATAAATAT      7200
     AATTCCCAAG TTCATCCTAA ATGAACAAGA AATGGATAAA ATAAAAACAA TACTGGAAAA      7260
     ACAAAATATC ACAGTCAAAA ATGAACAAAG TATATACAAT TTCCTACAAA TGAATACACT      7320
     AAATTACGAA CAAAAGATTA TTTTTAATAT CAAAGTCCCA ATTTTTAAAC AACCTTTTCA      7380
     TACCCTCGCC AGACTAGTTC CATTACCAAT AAATAACACA TATTTTGTAA TAACCCCAAA      7440
     TTACCTAGCT TATAATATTA ATAATAAGAA ATTTCATATG ACCCGTAAAT GCCCCAAACT      7500
     GGATAATACA TTCTTGTGCG ACGAGAACTT CTACGTTGAT ACACCACAGA ACAACACATG      7560
     CCTGGAACAC CTTTTGAACG GAGAAAACAG TTCCTGCGAT GTACGGGAAA CCGGCCCCAT      7620
     CACCGACGTG TTCGAGGCAG AGAGAGGTTA CATCTTCGCA TTCAACGTGA ACAAACTGAA      7680
     GGTATCCCTA ACAAACGGCT CCGAGCTCTC AATAATGGGG TCAGCCATCA TCAGATACAT      7740
     TAACGAAACA ATACAGATTA ACGGTATCGA TTACGACGGC ACGGTTGACA CGTTCCCTGA      7800
     ACAGACGGAT TTTGATCTTC CCCCCATGCG AAAAGTAACT AGGAATACCA CTATTACGGT      7860
     ACTAAGCCTA GAAAAACTGC ACCTCGAAGC CACCCAAACA ATGGATAAAA TCCTGGCCGT      7920
     CCATCACAAT ACTATACAGC ACACCTGGAC ACTCTACACT CTGCTCGGAT TGGTAACGTT      7980
     CCTAGCAGTC ATCTTATGGC TGCACCGACG AACGAAACAC ATCGTCCACA TCCACGAGGA      8040
     TCATCACGTA CCAATCTACG CGTCATCCAT ACCTTCGCTA TGGCCGTCAC TTCGAACTGG      8100
     GGGGGGAGGA GTTACCACCC CACCCCCTAA ACCCCCACGC CTCTAAACAA ATCATCGGAC      8160
     ACTCAACCGG GAAGACGGCA ACTGGAACAC CGCATCCGGC CGAATGCTGA CATTCCGGCC      8220
     GAATGCTGAC ATTACACAAA AGTCGCACTG CAACATTGTC CCCAGCTAGC CAGCCACATG      8280
     CCGAGTCGGC ATGTTCATTA TGCTTACAAT TAAGAACCTA TGTACTTATG TATAAGACGA      8340
     AAACGGAGGA CTCGAGTAGC CACTCTCTGA CAATAAACTT GATACTGATT TTGAACTTCA      8400
     AGAAAGTCAG TCGTATTCTT TATTGGAAAT CTTCACACTA CAACTATCTG CTGAAACTTA      8460
     AAAACCTTCA TACATTTACA CATCATATCT TCACAAAAGG CTCCACCCTC GATCACGGAC      8520
     TTAACT                                                                 8526
//
ID   DMBLPP     standard; DNA; INV; 5034 BP.
XX
AC   Z27119;
XX
DR   FLYBASE; FBte0000660; Dmel\flea.
XX
SY   synonym: blastopia
SY   synonym: Kermit
XX
FT   source          Z27119:372..5405
FT   SO_feature      five_prime_LTR ; SO:0000425:1..275
FT   SO_feature      three_prime_LTR ; SO:0000426:4757..5034
FT   SO_feature      polyA_site ; SO:0000553:5006..5011
FT   SO_feature      polyA_site ; SO:0000553:5019..5024
FT   SO_feature      CDS ; SO:0000316:760..4761
FT                   /name="Dmel\flea\polyprotein"
FT                   /db_xref="FLYBASE:FBgn0043491"
FT                   /db_xref="SPTREMBL:Q24262"
FT                   /db_xref="NCBI_PROTEIN:CAA81643.1"
FT                   /translation="MFTRTPPTNKKLNTDQIQAILENESEDESRKEKMNEEDQKLAPVG
FT                   EAEAKKQNKDASAKVEEKFEQMMNTLTQSMLAKSKQEGQVIIAAEKFEKVVSDCDGKSI
FT                   PIKKWFEIFEKNAEAYELSEKQKYVQARSKMIGSAELFLESECVSGYTELKELLIEEFS
FT                   GSYNSAVIHKKLQDRKKKREETLHDYLLQMKKIAALGEVETVALITHIVNGLDIKKEYK
FT                   GAMLRCKTLKELKQEFEIYESLNIVDKPNIQPKPKQITQGVKADHCFNCGSREHKRKDC
FT                   TLPTKCFSCNQEGHISSKCPEKVNSMRIHVDSARTKPVIINGIIINCLVDTGSDVTIIK
FT                   EAIFKKMKDVDLNRTATVLRGLGNASTQPIGCFRALIKTDQVEASHNVLVVHDSKFSCD
FT                   GIVGHDFISKFRLICSAEGYTFLDLEADKKQAVEYSQMFNICEESSFTVAPQYREDVER
FT                   MIERTYETPPKQIKQCPVELKIIPDGVIKPFRHGHTRLSEEEAIAVKKQVEEWVEQSIV
FT                   RKSTSNVASRIVVVRKKDGTLRVCVDYRKLNTMVLMDCFPVPIMEEVLEKLQSAKWFTT
FT                   MDLQNGFFHVAVEEASKPYTAFVTREGLFEFNKAPFGFKNSPAAFIRFVQFIFQELINS
FT                   NIMQLYMDDIIVYAATPEECMEKTEMVLKRAAEFGLKIKWKKCNFMQRRIHFLGHIIEG
FT                   GQICPGKEKTSAVNSFGTPQNVKAVQGFLGLTGFFRKFIPGYAQIARPLTDLLKKDAIF
FT                   NIGPVEQQSVNKLKEILVNEPVLRIYSREAETELHTDASKDGLGAVLLQKFEGSFHPVC
FT                   FWSRKTTKAESNRHSYYLEVKAAYLALKKFRHYLLGVPFKLVTDCVAFKQTTKKADVPR
FT                   EVGPWILYMQDFNFQPEHRAGERMRHVDFLSRHPQACMMITSELTARIKKSQQNDDSIR
FT                   AILEILKDRLFQPYKLKGGLLYSMVNGNELLVVPALMEREVIQSAHEVGHLSLQKTMHS
FT                   IQQQFFYFLIWEYKVKKLISNCIKCIIHSKKLGKQEGYLNCIDKGDAPLHTLHIDHLGP
FT                   MDSSAKQYKYILATVDAFSKFVWLFPTKSTGQEEVVKRLTDWSNIFGFPKRIVSDKGTA
FT                   FTSGAFEQFMSSHNVEHVCTTTGVARGNGQIERVNRLILAIISKLSSDEPSKWYKYVPE
FT                   VQKAINCHVHSSLKLSPFEVMFGTKMYTRVEDRLLELLQEEVVCQFNEDRYEMRQLVKR
FT                   NIEQAQKDYKRNYDKKRRAEYKYKAGDLVAIKRTQFVAGRKMASGYLGPYEVTGVKDNG
FT                   RYDVKKAANVEGPNVTSTSCDNMKLWKYIAENADLLSSGSDDDDQEGRM"
XX
CC   Derived from Z27119 (g415797) (Rel. 50, Last updated, Version 6).
CC   Takis Benos and Michael Ashburner, 20-Aug-1997.
CC   Any changes to original sequence record are annotated in an FT line.
XX
SQ   Sequence 5034 BP;  1719 A; 938 C; 1145 G; 1232 T; 0 other;
     TGTAACATGA GTAAGGCTGA AGGCTGGCAA CAACCCGGTT GGCAGCGCTG TTGAGCAGCA        60
     ACATGATTGT CGGAAATCCA AGTTATCGAC AATCAGTCAT CGAAGGACGA TCGCAGGCAG       120
     CAGTAGAGGC GAGTGGAAGT CAGCGTTGCA GTCAGTCGAG TTCTCAGCAG CAGTCGTTCG       180
     GTCCACAAAC TAAGAAATAC TTTATATAAT TACCGCATTT AGAATTAAAC TAATAATTAA       240
     ATTAATAATA AACAATAATA ATAAACAATC TTACATGGGG GCTCGTCCAG TCCTAAATCG       300
     GTTATATGAA GGTGCAGTTG TTTAAAGAAA AAAGACATTG TTGTGTGCGT GGGTATAGTC       360
     TTTAAAACGT TGTAAAGTTG TGGCTATATC TATTGCATTT AAAGTTGGAA AAATCAGTTG       420
     TACAGATTTT GTTTGAACAC AAGTCGGTAA AAGTCGGGAA AGCTGCTAGA GAGAACTGAT       480
     AAAGTTGAAA TTGTCGTGTG CGTGGATTTA GTCTTTAAAG TTGTAAAGTT ATGGCTACGT       540
     CTACTGCATT GAAAGTTGAA AAAATCGATT GAACTCATAC AGACTCAAGT CGTTTTGCTG       600
     TTGTGGAATT TAAAACAATT AAATTGCAAA GGTGGTGAAA TTCGTTTCTA ACGAAAATCA       660
     AAATTTGTCT TTTAACCGGT GGCGCCGTCT GCAAAATCGA CTACCGTCGC GCCGTTAGAA       720
     CATTGTCGTT GTTTGCTGGT GTTAGTGCCT TGTCGCGGAA TGTTCACACG TACACCACCT       780
     ACAAATAAAA AACTTAACAC CGACCAAATA CAAGCAATTC TAGAGAACGA AAGCGAGGAC       840
     GAAAGCAGAA AAGAAAAAAT GAACGAAGAA GATCAAAAGT TGGCGCCTGT AGGAGAAGCA       900
     GAGGCAAAGA AGCAGAATAA AGACGCTAGT GCTAAAGTCG AAGAGAAATT TGAACAAATG       960
     ATGAATACTC TAACCCAGAG CATGTTGGCA AAATCTAAAC AAGAGGGGCA AGTAATTATC      1020
     GCTGCAGAAA AATTTGAAAA AGTTGTAAGT GACTGTGATG GCAAATCAAT TCCTATTAAA      1080
     AAATGGTTTG AAATTTTTGA GAAAAATGCC GAGGCATATG AACTTTCGGA GAAACAAAAA      1140
     TATGTTCAAG CCAGAAGTAA GATGATTGGA TCAGCAGAAC TTTTCTTAGA ATCTGAATGT      1200
     GTCAGTGGAT ACACTGAACT CAAAGAGTTA CTAATTGAAG AATTTTCAGG CAGCTATAAT      1260
     AGCGCCGTTA TTCACAAAAA GTTGCAAGAC AGGAAGAAGA AGAGGGAGGA AACTCTACAC      1320
     GACTATTTGT TACAAATGAA GAAAATAGCA GCCTTAGGTG AAGTTGAAAC AGTTGCTTTG      1380
     ATAACTCATA TCGTAAACGG CCTCGACATT AAAAAGGAGT ATAAGGGTGC TATGCTCCGT      1440
     TGTAAAACTC TTAAGGAATT AAAGCAAGAA TTCGAAATCT ACGAGAGTCT GAATATTGTT      1500
     GACAAGCCGA ATATTCAACC AAAACCAAAG CAAATTACAC AAGGTGTAAA AGCAGATCAC      1560
     TGCTTCAACT GTGGTTCGAG GGAACACAAA CGAAAGGATT GTACACTTCC TACCAAATGT      1620
     TTCAGCTGTA ATCAAGAGGG CCATATCTCA AGCAAGTGTC CGGAAAAAGT AAACAGCATG      1680
     CGCATTCACG TTGATAGTGC ACGAACAAAG CCAGTAATCA TAAATGGGAT TATCATCAAC      1740
     TGTCTGGTGG ACACAGGATC AGATGTGACC ATAATTAAAG AAGCTATATT CAAGAAGATG      1800
     AAAGATGTTG ATTTAAACCG CACTGCAACA GTATTGCGAG GTTTGGGAAA TGCCTCAACA      1860
     CAGCCGATTG GATGCTTCAG AGCATTAATC AAGACCGACC AGGTGGAAGC AAGCCACAAC      1920
     GTTTTAGTCG TCCACGATTC TAAATTCAGT TGCGATGGAA TAGTGGGACA CGATTTTATC      1980
     AGCAAGTTTC GTCTTATCTG TAGTGCAGAA GGCTATACTT TTCTTGACCT GGAAGCAGAT      2040
     AAAAAACAAG CGGTTGAGTA TTCCCAAATG TTTAATATTT GTGAAGAATC TTCTTTTACA      2100
     GTTGCACCAC AATACCGAGA AGACGTTGAA CGCATGATAG AGAGAACATA CGAAACACCA      2160
     CCCAAGCAGA TAAAGCAATG TCCAGTCGAA CTCAAAATTA TTCCTGATGG CGTGATTAAA      2220
     CCCTTTCGCC ATGGACACAC CCGACTATCT GAAGAAGAAG CTATAGCTGT AAAGAAGCAG      2280
     GTAGAGGAAT GGGTCGAGCA GTCAATCGTC CGTAAATCTA CATCAAATGT TGCCAGTCGC      2340
     ATAGTCGTTG TCAGGAAAAA GGATGGTACC CTACGCGTTT GCGTGGACTA TAGAAAATTG      2400
     AACACCATGG TTCTGATGGA TTGTTTTCCG GTACCCATAA TGGAGGAGGT GCTTGAAAAA      2460
     CTGCAGAGTG CCAAATGGTT TACAACCATG GACTTACAGA ACGGATTTTT TCATGTGGCC      2520
     GTAGAAGAAG CCAGCAAGCC GTACACAGCA TTTGTTACCC GAGAAGGCTT ATTCGAGTTT      2580
     AACAAAGCGC CCTTTGGTTT TAAGAATTCC CCAGCAGCGT TTATACGGTT CGTTCAATTT      2640
     ATTTTTCAAG AACTAATCAA TTCCAATATA ATGCAGCTAT ATATGGATGA CATAATTGTA      2700
     TATGCCGCTA CCCCAGAAGA ATGCATGGAA AAGACGGAAA TGGTACTTAA GAGAGCTGCA      2760
     GAATTTGGTC TAAAAATAAA ATGGAAGAAG TGCAACTTTA TGCAGAGGCG AATTCATTTC      2820
     CTGGGACATA TTATCGAAGG TGGACAAATA TGCCCTGGAA AAGAGAAAAC ATCAGCAGTG      2880
     AATTCCTTTG GAACACCTCA GAATGTAAAA GCCGTTCAAG GATTTCTGGG TCTCACAGGA      2940
     TTCTTCAGAA AATTCATACC TGGATACGCC CAAATTGCGA GACCACTGAC GGACCTATTA      3000
     AAAAAAGATG CCATTTTCAA CATTGGACCA GTAGAGCAGC AGTCGGTGAA TAAGCTGAAA      3060
     GAGATTCTGG TAAACGAACC AGTATTGAGG ATCTACTCAC GAGAAGCAGA AACCGAACTT      3120
     CATACAGATG CCTCTAAGGA CGGGTTAGGA GCCGTTTTAT TGCAGAAGTT CGAAGGCAGT      3180
     TTTCACCCAG TCTGCTTTTG GAGCAGAAAA ACTACAAAAG CCGAATCAAA TCGTCATAGT      3240
     TATTACCTTG AAGTAAAAGC CGCATACTTA GCTCTGAAAA AGTTCAGACA CTATTTATTG      3300
     GGAGTCCCTT TCAAGCTCGT CACGGACTGT GTCGCATTTA AACAGACAAC AAAAAAAGCA      3360
     GATGTCCCAA GAGAAGTTGG CCCATGGATT CTCTATATGC AGGATTTTAA TTTTCAACCC      3420
     GAACATCGTG CAGGAGAAAG AATGAGACAC GTTGATTTTT TAAGCCGCCA TCCCCAAGCA      3480
     TGCATGATGA TAACATCCGA GTTGACAGCA CGTATTAAAA AGTCGCAGCA GAACGATGAT      3540
     TCAATTAGAG CAATCCTGGA AATTCTAAAA GATCGTCTAT TCCAACCCTA CAAGCTAAAA      3600
     GGTGGCCTGT TGTATAGTAT GGTCAATGGC AATGAACTAC TGGTTGTCCC TGCACTAATG      3660
     GAGAGGGAGG TGATTCAAAG CGCACATGAA GTTGGCCATT TGTCGTTGCA AAAGACGATG      3720
     CATAGCATAC AGCAGCAATT TTTTTATTTC CTCATTTGGG AATACAAGGT AAAAAAGCTA      3780
     ATTTCTAACT GTATAAAATG TATCATCCAC AGCAAAAAGT TGGGAAAGCA GGAGGGATAT      3840
     CTAAATTGCA TAGATAAAGG AGACGCACCG TTGCACACAC TACACATCGA TCATTTGGGG      3900
     CCAATGGATT CATCGGCCAA ACAGTATAAA TACATTCTGG CAACAGTCGA TGCGTTTTCA      3960
     AAGTTTGTCT GGTTATTCCC AACCAAATCA ACCGGACAGG AAGAAGTGGT CAAGAGGCTG      4020
     ACCGACTGGT CAAACATTTT TGGTTTCCCT AAGCGAATTG TTAGCGACAA AGGAACGGCC      4080
     TTTACGAGTG GTGCGTTCGA ACAATTTATG AGCAGCCATA ACGTGGAACA CGTCTGCACA      4140
     ACTACTGGAG TGGCCAGAGG CAACGGCCAG ATAGAACGAG TAAATCGTTT AATTTTGGCA      4200
     ATAATATCAA AGCTGTCTTC AGACGAACCG TCGAAGTGGT ACAAATATGT GCCTGAGGTA      4260
     CAAAAGGCGA TCAACTGTCA CGTGCATTCA TCACTGAAGC TGTCACCATT TGAGGTCATG      4320
     TTTGGCACCA AGATGTACAC CCGAGTTGAG GATCGGTTAC TGGAACTGCT CCAAGAAGAA      4380
     GTGGTCTGTC AATTCAACGA GGACCGCTAT GAGATGAGAC AGCTGGTAAA ACGCAACATC      4440
     GAGCAGGCGC AGAAGGACTA CAAGCGCAAT TACGACAAAA AGCGCCGAGC TGAATACAAA      4500
     TACAAAGCAG GTGATCTGGT TGCAATTAAA AGGACCCAAT TTGTAGCTGG CCGCAAGATG      4560
     GCAAGCGGGT ATTTAGGTCC ATACGAAGTC ACAGGGGTCA AAGACAATGG CAGATATGAC      4620
     GTTAAAAAAG CAGCAAACGT CGAAGGACCC AATGTCACAT CCACCAGCTG TGACAACATG      4680
     AAGTTGTGGA AGTACATAGC CGAAAATGCA GACCTATTGT CATCCGGGTC GGATGATGAT      4740
     GATCAGGAGG GCCGAATGTA ACATGGAGTA AGGCTGAAGG CTGGCAACAA CCCGGTTGGC      4800
     AGCGCTGTTG AGCAGCAACA TGATTGTCGG AAATCGAAGT TATCGACAAT CAGTCATCGA      4860
     AGGAACGATC GCAAGGCAGC AGTGGAGTAG GAGTGGAAGT CAGCGTTGCA GTCAGTCGTG      4920
     TTCTCAGCAG CAGTTCGTTC GGTCACAAAC TAAGAATACT TTATATAATT ACCGCATTTA      4980
     GAATTAAACT AATAATTAAA TTAATAATAA ACAATAATAA TAAACAATCT TACA            5034
//
ID   OPUS    standard; DNA; INV; 7521 BP.
XX
AC   AY180918;
XX
DR   FLYBASE; FBte0000918; Dmel\opus.
XX
SY   synonym: nomad
SY   synonym: yoyo
XX
FT   source          AY180918:1..7521
FT   SO_feature      five_prime_LTR ; SO:0000425:1..518
FT   SO_feature      three_prime_LTR ; SO:0000426:7004..7521
FT   SO_feature      CDS ; SO:0000316:1578..2831
FT                   /name="Dmel\opus\gag"
FT                   /db_xref="FLYBASE:FBgn0025876"
FT                   /db_xref="SPTREMBL:Q8I7Q0"
FT                   /db_xref="NCBI_PROTEIN:AAN87270.1"
FT                   /translation="MEETLRALSESLNALTNVVTGIKEDIKKNNDRLAILEQERGNAD
FT                   PTVDQPQPLVRARTEYELREISVLPDCVKELQAFEGRQEAYLSWINRAQSILTEYDLI
FT                   KTRPLYRAIVLHIRQKIRGHADMALAAYGVQDDDWDDIKRVLALHYADKRDLRTLEHE
FT                   LGAMCQGSRPLDRFYMDVNGHLSLILNNLKARNHPREVVNALIETYRDKALDVFIRGV
FT                   GRDCSKHLLVRSPKNLPEAYSFCMGLQNVMSRNFTAQNYQPSGAPRFAGPYQHQARPP
FT                   FRTPFSPGSGRFSQNSYRTQGPRQAIKMESNRSGQSYQSGYSGRQEEGSGIKRMSEGN
FT                   NPFQKAQRLYHMELAPPPLAPAASGDNQGRSHEGYYDDESQAVERSNNYPPQKNVEGV
FT                   TDAPHNLETEGGANFMTNASPVYRT"
FT   SO_feature      CDS ; SO:0000316:2972..5983
FT                   /name="Dmel\opus\pol"
FT                   /db_xref="FLYBASE:FBgn0025875"
FT                   /db_xref="SPTREMBL:Q8I7P9"
FT                   /db_xref="NCBI_PROTEIN:AAN87271.1"
FT                   /translation="MITHRLVGKFFKPLGNDSDITFFVLPNLHSFDGIIGDDTLKDLK
FT                   AIVDRKNNCLIITPGIKIPLLARASINVNPLLAAEHPDGTQEILNSLLGEFPRIFEPP
FT                   LSGMSVETAVKAEIRTNTQDPIYAKSYPYPVNMRGEVERQIDELLQDGIIRPSNSPYN
FT                   SPIWIVPKKPKPNGEKQYRMVVDFKRLNTVTIPDTYPIPDINATLASLGNAKYFTTLD
FT                   LTSGFHQIHMKESDIPKTAFSTLNGKYEFLRLPFGLKNAPAIFQRMIDDILREHIGKV
FT                   CYVYIDDIIVFSEDYDTHWKNLRLVLASLSKANLQVNLEKSHFLDTQVEFLGYIVTAD
FT                   GIKADPKKVRAISEMPPPTSVKELKRFLGMTSYYRKFIQDYAKVAKPLTNLTRGLYAN
FT                   IKSSQSSKVPITLDETALQSFNDLKSILCSSEILAFPCFTKPFHLTTDASNWAIGAVL
FT                   SQDDQGRDRPIAYISRSLNKTEENYATIEKEMLAIIWSLDNLRAYLYGAGTIKVYTDH
FT                   QPLTFALGNRNFNAKLKRWKARIEEYNCELIYKPGKSNVVADALSRIPPQLNQLSTDL
FT                   DANPEDDMQSLATAHSALHDSSRLIPHVESPINVFKNQLIFDTTRSKYLCEHPFPGYT
FT                   RHLIPLKDGSLADLTNSLQSCLRPVIINGVKIPEAHLQRFQSICLANFLLYKIRITQR
FT                   LVADVSGAEEICEIIEKEHRRAHRGPTEIRLQLLEKYYFPRMSSTIRLQTSSCQCCKL
FT                   YKYERHPNKPNLQPTPIPNYPCEILHIDIFALEKRLYLSCIDKFSKFAKLFHLQSKAS
FT                   VHLRETLVEALHYFTAPKVLVSDNERGLLCPTVLNYLRSLDIDLYYAPTQKSEVNGQV
FT                   ERFHSTFLEIYRCLKDELPTFKPVELVHIAVDRYNTSVHSVTNRKPADVFFDRSSRVN
FT                   YQGLTDFRRQTLEDIKGLIEYKQIRGNMARNKNRDEPKSYGPGDEVFVANKQIKTKEK
FT                   ARFRCEKVQEDNKITVKTRSGKIFHKSDLRN"
XX
CC   Sequence from P1 DS01219.2:861..8381 provided by Guochon Liao
CC   Berkeley Drosophila Genome Project.
XX
SQ   Sequence 7521 BP;  2322 A; 1740 C; 1677 G; 1782 T; 0 other;
     AGTTAAGAAC CCTCTTCTTG CGCTCTTCGT CAGGACTCAC CAGCGCTCGG CTCTCGTGTT        60
     TTCGGGCCCC GTCAGCAGGC GACTCGGGGC CTGTCTAGTA ACATGTTCGT GTAAGTTACG       120
     AACCCTCTTC TTGCGATCTT CGTCAGGACT CACCAGCGCT CGGCTCTCGT GTTTTCGGGC       180
     CCCGTCAGCA GGCGACTCGG GGCCTGTCTA GGAACATGTT TGTGTATGTG TGCATTCGGA       240
     ACAAGTGCCG TTGGTCGCAC TCAGGGTGAG GGGTCAACGG GGGAAGCGGA TATAAAAGCA       300
     GCGGGGCGGG AGAAGAGGTC CCAGTCTCGA ACGGACACAT AACGGAACCG CTAGCAGATC       360
     GCGAACTGAA TCTTAAAATA AAGCTAATCG TAAACTCGAA CCCTCTTAAC TATCTTGACT       420
     ATTATTTGGA GAACCACAGC ATGTTGGTTG TCATATCAAG GTGAGGTATG CGGCAGCGAG       480
     TGCCGAGAAC CCTGATGCAA GTGGAACTTG CGTTAACTGG CGCCCGAACA GGGACCGGCA       540
     ATGTCCGGCC GATAAAAGTG ATACGAAAAA ATTGTGGAAA TTTGTGCGTA AAAATAGTGG       600
     TGGTGTGCAT AAGTCAGATT AAGATCTGAA ATCCATAAAT GAAAAAGAAG TGCTGCGTGA       660
     GCTGTGTATA AAATGATAAA ATAGCAATTA CCCGCTGCCG GGGGGAACTA CGCCCATCCC       720
     GGGGCGCAAC AAATATTGCA TAATTCAATA AAAGGTGTAA AATTTCTAAA ATAAAAATGT       780
     AAACCTATGT TGCGCCAAGA CCTAATTTAA ATTAATAAAA CAACGACCCG CTACCGGAGG       840
     ACGCCACGTC GCCCATGCCG AGCGCAAAAG TTGTACGATA CCTATAACAT AATTAAAACA       900
     CGATCAACCC ACTGCGGCGG TACGGCTTGT GGGAAAATTT TTTTTTTTTT CTCTCCTTGC       960
     CAATTCGCGA GTGCAAAAGA TTGTGTATAA TAAACCAATA ATTAACCATT GCAGCAGTTT      1020
     ACCTGCGGCA GTACGAGTAA TATGAGCGCC CAGAGTGATA AGGTGGTGTG TGGCAGCTTG      1080
     TTGGATACGT TAAGTGGTGT GGAATGCACC CAAAAAAAAC CGCCCAACAA GTTGTGTGGC      1140
     GGCCGTACCT TAGTAGGCAA CCAGCCAAAA GGGATACTAC GGAACCACCG TGCCCAGTGC      1200
     CGAAATAAAT TAGAGGTCAT CAATAAAAAA CTGTAACAGC ACGCACGCAA GGAAAAAATA      1260
     TTGCAAAATG GAATAGCGCA CAAAAATTGT ATAAACACAT GCACAACACC ACAATTCAAA      1320
     GGAAAACAAA ATATTCATGC TGTAGGGGTA CAACCTAAAC GACGAAAACT AATAAAGAGC      1380
     ATACAAGGGT GAGTGAAATA TTTCATTAAA CTTTATTGCC ATATTTGCTA AATTTAGAGA      1440
     AATAAAGAAA AAGCAAAGAA GAACAGATAT TCTTTTTTAT CGGGTTAAAA CCGTTGTCTC      1500
     ACATTTCCGT AAAGTAATAA CGAATTCTGT TGCCTTGAAA GCTTCCTGCA TCTTTCCAAC      1560
     GCAAACTAAA AATCAAAATG GAAGAGACCC TGCGTGCTCT TAGCGAGTCC CTCAATGCCC      1620
     TGACCAACGT GGTGACAGGC ATTAAGGAAG ATATTAAGAA AAATAATGAT AGGTTGGCTA      1680
     TTTTAGAACA GGAGCGCGGG AACGCTGACC CTACGGTCGA CCAACCGCAA CCCCTGGTGC      1740
     GCGCACGCAC CGAGTATGAG CTGAGAGAGA TATCGGTCCT CCCTGACTGC GTCAAAGAAC      1800
     TGCAGGCGTT CGAAGGACGG CAGGAGGCTT ACCTGTCTTG GATAAACAGG GCACAGTCAA      1860
     TACTGACCGA ATATGACTTG ATTAAAACCA GACCCCTGTA TAGGGCAATT GTCTTGCATA      1920
     TTAGACAGAA AATAAGGGGA CACGCCGACA TGGCCTTGGC GGCCTATGGC GTCCAAGACG      1980
     ACGATTGGGA CGACATAAAA CGAGTCTTGG CGCTGCATTA CGCAGACAAA CGAGACTTAC      2040
     GTACGCTTGA GCATGAGCTT GGCGCTATGT GCCAAGGTTC TAGACCACTA GATAGGTTCT      2100
     ATATGGACGT TAATGGCCAT CTCTCGTTGA TCTTAAATAA CTTGAAGGCC AGAAACCACC      2160
     CTCGTGAAGT AGTCAACGCT TTGATAGAAA CCTATAGAGA CAAGGCTTTG GATGTTTTTA      2220
     TCCGAGGAGT GGGGAGAGAT TGTTCCAAAC ACTTACTTGT CCGCAGCCCG AAGAATCTAC      2280
     CAGAGGCTTA CTCTTTTTGT ATGGGATTGC AGAATGTAAT GTCAAGAAAT TTCACAGCTC      2340
     AGAACTATCA ACCGTCAGGT GCCCCAAGAT TCGCAGGCCC ATATCAACAT CAGGCCAGGC      2400
     CACCGTTCCG AACCCCTTTT TCTCCTGGTT CAGGCAGATT TTCGCAAAAC TCCTACAGAA      2460
     CTCAGGGTCC TAGACAGGCC ATAAAAATGG AATCCAATCG GTCGGGTCAA TCTTACCAAT      2520
     CAGGATACAG TGGTCGCCAG GAAGAAGGCT CCGGTATTAA GAGAATGTCC GAAGGAAACA      2580
     ACCCATTCCA AAAGGCACAA AGATTGTACC ACATGGAATT GGCACCACCC CCGCTAGCCC      2640
     CGGCGGCTAG TGGAGATAAC CAAGGACGTT CACACGAGGG TTACTATGAT GACGAGTCTC      2700
     AAGCTGTCGA GAGAAGCAAC AATTATCCTC CGCAGAAAAA CGTGGAAGGA GTTACAGATG      2760
     CTCCACATAA CCTTGAGACT GAGGGAGGGG CAAATTTTAT GACCAACGCC TCTCCAGTGT      2820
     ACCGTACTTA GAGTATGCTA CGGAGAGGGG AGAAAGGCTG AAGTTTTTGA TCGACACGGG      2880
     GGCGAACAAA AACTTTATTA GCCGAAGACT TGCAGCCGGG TGTACCACAG TCCGTAAACC      2940
     CTTCTCCGTA CTGTCCGCTG CGGGTAACAT CATGATAACG CACCGCCTAG TTGGTAAATT      3000
     CTTCAAACCA CTAGGGAACG ACTCGGATAT TACCTTTTTC GTACTACCGA ATTTACATTC      3060
     CTTTGATGGT ATCATTGGCG ACGATACTCT CAAAGACTTA AAAGCCATAG TGGATAGGAA      3120
     AAACAATTGT TTGATAATAA CCCCAGGAAT TAAAATCCCT CTTTTGGCGA GAGCTTCAAT      3180
     AAACGTTAAC CCGCTACTCG CCGCCGAACA CCCAGATGGT ACACAAGAAA TTTTGAATTC      3240
     CCTTCTCGGG GAATTTCCCC GCATCTTCGA GCCCCCCTTA TCTGGAATGT CCGTGGAGAC      3300
     GGCCGTCAAG GCTGAAATCC GGACAAACAC ACAAGACCCG ATCTATGCTA AAAGTTATCC      3360
     TTACCCAGTC AACATGCGCG GAGAAGTCGA ACGTCAAATC GATGAACTGC TGCAGGACGG      3420
     TATAATTCGA CCCTCTAATA GCCCTTACAA TTCCCCTATC TGGATAGTCC CGAAGAAACC      3480
     TAAACCAAAC GGAGAAAAAC AATATCGCAT GGTAGTCGAT TTCAAGCGGT TAAATACCGT      3540
     CACCATACCC GACACTTACC CCATCCCAGA TATAAACGCT ACGCTAGCCA GCCTTGGCAA      3600
     TGCCAAATAC TTTACCACCC TAGATTTGAC TTCTGGATTC CATCAAATCC ACATGAAGGA      3660
     AAGCGACATT CCAAAGACAG CTTTCTCTAC TCTAAATGGA AAGTACGAGT TCCTCCGTCT      3720
     ACCATTCGGT TTGAAGAATG CACCTGCAAT CTTCCAAAGA ATGATCGATG ATATTTTGCG      3780
     CGAGCATATT GGCAAGGTCT GCTACGTTTA TATTGACGAT ATCATCGTCT TCAGTGAAGA      3840
     TTATGACACA CACTGGAAAA ATCTCCGATT GGTATTAGCG AGTTTATCAA AAGCTAACCT      3900
     CCAAGTGAAC CTTGAGAAGT CGCATTTTTT AGACACGCAG GTAGAATTTT TAGGATATAT      3960
     CGTCACGGCC GATGGCATTA AGGCAGATCC GAAAAAGGTC AGAGCGATTA GCGAAATGCC      4020
     TCCTCCGACC TCTGTTAAGG AGTTAAAAAG ATTTCTAGGC ATGACCTCGT ACTACAGGAA      4080
     GTTCATTCAG GACTATGCGA AGGTAGCAAA GCCCCTTACA AACTTGACGC GTGGATTGTA      4140
     CGCTAATATA AAGTCTTCAC AATCAAGCAA AGTGCCAATT ACATTAGACG AGACGGCCCT      4200
     ACAGTCTTTT AATGATTTAA AATCAATTCT CTGTTCTTCT GAAATACTGG CGTTCCCATG      4260
     TTTCACTAAA CCTTTCCATC TAACCACGGA CGCTTCTAAC TGGGCCATCG GAGCTGTCCT      4320
     CTCACAGGAC GACCAGGGTA GAGATAGGCC GATAGCGTAC ATTTCCCGTT CATTAAATAA      4380
     GACGGAGGAA AACTACGCTA CTATCGAAAA GGAAATGCTC GCGATAATTT GGTCATTGGA      4440
     CAATCTTCGG GCTTACTTAT ATGGCGCTGG TACTATTAAA GTATATACTG ACCATCAACC      4500
     TCTAACGTTT GCCCTAGGCA ACAGAAATTT CAATGCGAAG CTAAAACGCT GGAAGGCTCG      4560
     TATAGAGGAA TACAACTGCG AACTCATCTA CAAGCCTGGG AAATCTAATG TGGTGGCTGA      4620
     CGCGCTTTCA CGCATTCCGC CTCAGCTTAA CCAGTTGAGC ACCGATTTAG ATGCTAATCC      4680
     CGAGGATGAC ATGCAGTCTT TGGCTACTGC CCATAGCGCT TTACATGACA GTTCACGATT      4740
     GATTCCCCAC GTTGAATCTC CAATCAACGT TTTCAAGAAT CAACTCATTT TTGACACAAC      4800
     CAGGTCAAAA TACTTATGCG AGCACCCGTT CCCAGGTTAT ACTCGCCATC TGATTCCTCT      4860
     CAAAGACGGA TCACTTGCCG ATTTAACCAA CTCGTTACAA TCGTGTCTAC GACCTGTAAT      4920
     AATTAACGGC GTCAAAATCC CGGAAGCACA TTTGCAACGC TTTCAGTCCA TCTGCTTAGC      4980
     GAATTTTCTT TTATACAAAA TTCGGATAAC GCAGCGCCTA GTGGCGGACG TGTCTGGCGC      5040
     AGAGGAAATT TGTGAAATAA TTGAAAAAGA ACACCGTAGA GCACATAGGG GCCCTACGGA      5100
     GATTCGTCTC CAACTTTTAG AAAAATATTA TTTCCCGCGA ATGTCCAGTA CGATCCGTCT      5160
     GCAAACTTCC TCATGTCAGT GTTGCAAACT CTACAAGTAC GAGAGACACC CTAACAAACC      5220
     AAACCTACAA CCTACGCCAA TTCCTAACTA CCCATGTGAA ATACTTCACA TCGACATTTT      5280
     TGCGCTCGAA AAAAGGTTAT ACCTAAGTTG TATTGACAAA TTTAGCAAGT TTGCCAAACT      5340
     TTTCCATCTG CAGTCAAAAG CATCTGTGCA TTTGCGAGAA ACTTTGGTGG AGGCCCTACA      5400
     TTACTTCACC GCCCCTAAGG TCTTGGTTTC GGATAACGAG CGAGGGTTGT TATGCCCCAC      5460
     AGTGCTCAAC TATCTTCGGT CTCTAGATAT CGATCTGTAT TATGCTCCAA CCCAGAAGAG      5520
     CGAAGTAAAT GGTCAAGTCG AGAGATTCCA CTCTACGTTC CTAGAAATTT ATCGTTGCCT      5580
     TAAAGATGAG CTCCCTACCT TCAAACCCGT TGAGCTGGTA CACATAGCAG TGGACCGCTA      5640
     CAACACTTCC GTTCACTCGG TAACGAATCG AAAACCAGCA GACGTTTTTT TCGACCGCTC      5700
     GTCAAGGGTA AACTATCAGG GTCTGACAGA TTTCCGGCGG CAGACTTTAG AGGACATCAA      5760
     GGGCTTAATT GAGTATAAGC AAATTAGAGG TAATATGGCT CGGAATAAAA ATAGGGACGA      5820
     GCCAAAGTCT TATGGGCCGG GAGATGAAGT TTTTGTTGCA AATAAGCAAA TAAAAACAAA      5880
     GGAAAAAGCG AGGTTCAGAT GCGAAAAGGT ACAGGAAGAC AACAAGATAA CAGTTAAAAC      5940
     CAGATCAGGA AAAATTTTCC ACAAATCTGA TCTAAGAAAT TGAGACGTGG CTTTCACATT      6000
     TAAAAAAGAA ACGCGAAAAA GAATAACGAA AGTAATAAAA GTACGTTGTG GCAGCTAATG      6060
     AAATATTCCA CCCATGCATA CCCTATATAA AAAAAACATT AATAAAAAAA AAAAAAAAAA      6120
     AAAAAAAAAA AAAAAAAAAT GAGTTAAGAA ATACAAAAAG AAATACAAAA AAAACTATAA      6180
     AAAAAATAAT ATAAAAAAAT ACAGATTATA AGAAATAAGA AATAAGAAAT ATAAAAAAAT      6240
     AAAAATATAA GTACACAAAA TGTACCGTAC CCCCACACAC TACGTAGTCT TAGAACAACT      6300
     TAGACGACCA GATATTTACG AATTGTCTTT TTGTAAGCGC GATTTCTGCA TGCGGCGCAA      6360
     ATCCCGCTCA CTGGACTGGC TGGGGTCGGC TTGGAAATGG GTAGCTGGAT CTCCAGATGC      6420
     TGCTGATTGG AACGCCGTCT TGGCCGCGCA AGCGACGGCT TCGAGGAACT GCAAAAACTG      6480
     GAGGAGGCTA GCTGTATCCC TCGGCTACTG AAGTAACCAA CGAGTGGTTA AGCAAGTCGA      6540
     CGATGGAATG CTCCTCCTGA CCAACTTCAA CGGAACTCTA AGAACGGCTG CAGAGAACTA      6600
     CGACCTGATC GGCTCCTTTA TCATCCAATT CGACAATGAG ACGATAATGG TCAACGGTCA      6660
     AAACTATTCC AGTTACTCGG TCAGTCATCT AATGGCGATG CCGGCCGTGT TGAGCCACAT      6720
     AACGGCCAGC AACTTTCAAC TTTCTCTGGA ATACGTCCAC GACGTGAGCA TGAAGAATTT      6780
     GGAAAAGATG TCCAACATGG CGAGTGAGCT ACTAGCCTCT CTTCTCACCG AGGCGGCACT      6840
     CGCAATCTGC ATATTCCTAG GCTTTTATTT CCTATGGAAG AAGCTGATGT CCACCAAAGG      6900
     CATGCCCGAT GTCCGCGAGA TTGCCGCAAA CTTAGAAGCA TTGGGCCAAA CCGAGCTGAA      6960
     CAAGGCTCAC TAATCTGCGG GACGCAGATC TTGAGGGGGG AGGAGTTAAG AACCCTCTTC      7020
     TTGCGCTCTT CGTCAGGACT CACCAGCGCT CGGCTCTCGT GTTTTCGGGC CCCGTCAGCA      7080
     GGCGACTCGG GGCCTGTCTA GTAACATGTT CGTGTAAGTT ACGAACCCTC TTCTTGCGAT      7140
     CTTCGTCAGG ACTCACCAGC GCTCGGCTCT CGTGTTTTCG GGCCCCGTCA GCAGGCGACT      7200
     CGGGGCCTGT CTAGGAACAT GTTTGTGTAT GTGTGCATTC GGAACAAGTG CCGTTGGTCG      7260
     CACTCAGGGT GAGGGGTCAA CGGGGGAAGC GGATATAAAA GCAGCGGGGC GGGAGAAGAG      7320
     GTCCCAGTCT CGAACGGACA CATAACGGAA CCGCTAGCAG ATCGCGAACT GAATCTTAAA      7380
     ATAAAGCTAA TCGTAAACTC GAACCCTCTT AACTATCTTG ACTATTATTT GGAGAACCAC      7440
     AGCATGTTGG TTGTCATATC AAGGTGAGGT ATGCGGCAGC GAGTGCCGAG AACCCTGATG      7500
     CAAGTGGAAC TTGCGTTAAC T                                                7521
//
ID   DM_ROO  standard; DNA; INV; 9092 BP.
XX
AC   AY180917;
XX
DR   FLYBASE; FBte0000100; Dmel\roo.
XX
SY   synonym: B104
XX
FT   source          AY180917:1..9092
FT   SO_feature      five_prime_LTR ; SO:0000425:1..429
FT   SO_feature      three_prime_LTR ; SO:0000426:8665..9092
FT   SO_feature      CDS ; SO:0000316:1275..8357
FT                   /name="Dmel\roo\ORF"
FT                   /db_xref="FLYBASE:FBgn0043856"
FT                   /db_xref="NCBI_PROTEIN:AAN87269.1"
FT                   /translation="MMSEKTIQFLKKQSEIILEIRKLEVKPTLTDVEILKLNELQKCF
FT                   IANHSNLLKIGVVDHEYFNAKQYDLIMMVLEKIKNKNEKIKGESVENTFPKSNTVPKS
FT                   NPPPTLNLEMRGHPEKEGIAQNNALKVEQAFRNNVGQFRVYLEDTSKLIDSSPDFLKI
FT                   RKNKIEFLWHKIDNLIEQVNSRFESSLFEEEISELEFDKQNILTAINSRLSGTINKAE
FT                   MSTVVKAEELPTLPKIQIPTFFGDSKEWDLFNELFTELIHVREDLSPSLKFNYLKSAL
FT                   KGEARNVVTHLLLGSGENYEATWEFLTKRYENKRNIFSDHMNRLMDMPNLNLESNKQI
FT                   KTFIDTINESIYIIKLKAQLPEDVDAIFAHIILRKFNKESLNLYESHVKKTKEIQALS
FT                   DVMDFLEQRLNSISSFSQEVKPVKKMINNNKNKNYSDNCAYCKLPGHYLIQCHKFKIM
FT                   NPAERSDWVRKNGICLRCLRHPFGKKCISEQLCSTCRKPHHTLLHFAGHNPEKVNTCR
FT                   TTGQALLATALIQVKSRYGGFEQLRALIDSGSQSTIISEESAQILKLKKFRSHTEISG
FT                   VSSTGTCISKHKAVISIRNSPKNLEIEAIILPKLMKALPVNTINVDQKKWKNFKLADP
FT                   DFNKPGRIDLIIGADVYTHILQNGVIKIDGLLGQKTDFGWIVSGCKKSKGKETIVATT
FT                   IEIKELDRYWEVEEEEKDDIESEICENKFIKTTKKDSDGRYIVSIPFKEDVTLGDSKK
FT                   QAIARYMNLEKKLKRNEKLKVDYTKFMNEYMDLGHMIEVSDEGKYFLPHQAVIRDSSL
FT                   TTKLRVVFDASAKTTNNKSLNDIMWVGPRVQKDIFDIIIKWRKWEFVVSADIEKMYRQ
FT                   IKIDNNDQKYQYILWRNSPKEKIKTYKLTTVTYGTASAPYLATRVLVDIADKCKNQVI
FT                   SAIIRNDFYMDDLMTGADSVEEANKLITLIPHELQKVGFNLRKWISNNSKILTTVEDT
FT                   GDNKVLNIIENECVKTLGLKWEPQKDLFKFSVNCNDESKNINKRVVLSTLAKIFDPLG
FT                   WLAPVTVSGKLFIQKLWINKSEWDQELSIEDKNYWEKYKENLLLLENIRIPRWINSNS
FT                   SSVIQIHGFADASEKAYAAVVYAKVGPHVNIIASKSRVNPIKNRKTIPKLELCAAHLL
FT                   SELIQRLKGSIDNIMEIYAWSDSTITLAWINSGQSKIKFIKRRTDDIRKLKNTEWNHV
FT                   KSEDNPADLASRGVDSNQLINCDFWWKGPKWLADPKELWPRQQSVEEPVLINTVLNDK
FT                   IDDPIYELIERYSSIEKLIRIIAYINRFVQMKTRNKAYSSIISVKEIRIAETVVIKKQ
FT                   QEYQFRQEIKCLKIKKEIKTNNKILSLNPFLDKGGVLRVGGRLQNSNAEFNVKHPIIL
FT                   EKCHLTSLLIKNAHKETLHGGINLMRNYIQRKYWIFGLKNSLKKYLRECVTCARYKQN
FT                   TAQQIMGNLPKYRVTMTFPFLNTGIDYAGPYYVKCSKNRGQKTFKGYVAVFVCMATKA
FT                   IHLEMVSDLTSDAFLAALRRFIARRGKCSNIYSDNGTNFVGAARKLDQELFNAIQENI
FT                   TIAAQLEKDRIDWHFIPPAGPHFGGIWEAGVKSMKYHLKRIIGDTIFTYEEMSTLLCQ
FT                   IEACLNSRPLYTIVSEKDQQEVLTPGHFLIGRPPLEIVEPMEDEKIGNLDRWRLIQKI
FT                   KKDFWVKWKSEYLHTLQQRNKWKKEIPNIEEGQIVLLKDENCHPARWPLGKVEKVHKG
FT                   NDDKVRVAKVKMQEGYITRPITKICPLEGIKSVDKNEADQEPKRRTRATSGMSKIGII
FT                   MAMLLFVLSCQVSSALPKDIAPRYSIDKINKTSAIYLDPLGDVEIVSTSWNLVIYYKM
FT                   DPYFKMLTKGNALIQSMRKVCERLHSFEEQCSLVLDNMQSQLSELEENNKLFMMQSRS
FT                   RSKRAPFEFMGSLYHILFGIMDEDDREQLEENMKNLLDNQNNLDKLIQKQTSVVDSTS
FT                   NLLKRTTEDVNSNFRSMQIRIENMTEVLKENYYVYKESIKFFMITKQLHSLIEEGEKI
FT                   QAGIISLLIDINHGRLNTNILRPNQLKKEIAKIQQSLSENLVIPGKRSGTELKEVYTL
FT                   LTARGLFIDDKLIISAKVPLFSRHPSKLFRLIPVPIRNEDRIIMVHTTSEYLIYNFEI
FT                   DSYHIMTEATLNQCQKWQLNKRICKGSWPWNSANDNACEIQPLKPDKAANCIYKTVVD
FT                   SKSYWVELEKKSSWLFKVPANSKVRLQCTGSQIELFDLPQQGVLSIAPYCTARTDDKI
FT                   LVAHHNIQSESEELLSTPYIGEVSGVPKIIWDPLKLSILNHTEEFERLNNEIKFMKEN
FT                   HQKLKDLHFHHISGHAGLIIALILMIVLIIYFIRKCAVQQRMQAITFAGPLPVLXX"
XX
CC   Sequence from P1 sequence DS00941:20448..29535 provided by
CC   Guochun Liao, Berkeley Drosophila Genome Project.
XX
SQ   Sequence 9092 BP;  3468 A; 1442 C; 1710 G; 2472 T; 0 other;
     TGTTCACACA TGAACACGAA TATATTTAAA GACTTACAAT TTTGGGCTCC GTTCATATCT        60
     TATGTAAATG AATCGAGAGC GATAAATTAT ATTTAGGATT TTGTTATCTA AGGCGACATG       120
     GGTGCATTGC TCAAAAACAT GTAATTTAAG TGCACACTAC ATGAGTCAGT CACTTGAGAT       180
     CGTTCCCCGC CTCCTAAAAT AGTCCCTTAG TGGGAGACCA CAGATAAGGT CCTCGCCGCT       240
     CAAGATAGGC AGATGTGCCC GAGCGTGGGA CCTCGATAAG GCGGGGACTA TTTACGTAGG       300
     CCTCTGCGTA GGCCATTTAC TTTAAGATGC GATTCTCATG TCACCTATTT AAACCGAAGA       360
     TATTTCCAAA TAAAATCAGT TTTTTTACAA AAACTCAACG AGTAAAGTCT TCTTATTTGG       420
     GATTTTACAT TTGGTCAATC GAGCCTTTAA TCGACTCTGC AGTTTCCCCC TACCAAAGGT       480
     AAGGAACTCA GAGAAAGGCC AGCTCCTTTA AGCATCTTAC AGCTAAAGGT AGCAAAAATA       540
     AGTGACTCTT GTTTCCCCCT ACCAAAGGTA AGGAACAGAG TATAAATATA AAAAGCAAAA       600
     GATACAAAAG AATCTTTTAT GTTTTAAAAC AAGCACCTTA TAGTCTATAG CTAAAGGTTG       660
     CTTTGTGTAC CATTATAAAT TGTGGTAAGG CGTGCTTGAG GCCATACATC AGCAATTGTG       720
     AAATTAAAAA GTGCATAACA AAAGTGCCTT ATAAATGCTC TAATAGCATT AAATCAGCTC       780
     ATAAATAGAG TGCAGTGTAT ATGCCATAAG AGCATAAATT AAATAAAAAG TGCCTGAAAA       840
     CAGTGCCTTA TAAATGCTCT AATAGCATTA AATCAGCTCA TAAATAGAGT GCAGTGTATA       900
     TGCCAAAAGA GCATAAATGC CGAAATAAAT GGCTAAAAAA CAAAAAATCT GACTGGACTA       960
     CAAAAATAAT AAAACGTGCC AAAAAAAAAA AAAAAATCAT CTTTAAACAT CGACGGAGCC      1020
     TTAAAGAAGA GAAGGAAGTC AAATTCAAAG GAGCCTCTAC CAGCAGCAGA AGCAGCAACA      1080
     ACAGCAGCAG CAGAAGCAGC AACAGCAGTA GCAACAGCAG CAACAACAGC AGCAACAGCA      1140
     GCAGCAACAA CAACGACATC AGCTAAGTCA AAACAAGAAT TTTCTGTTTA TCCAAACACA      1200
     CATATATATA TAAATACATA TAAAATACAT ATACACGTAC TATATATATT AAGAAATTAC      1260
     AAAAAATTTT CAAAATGATG TCAGAAAAGA CTATTCAATT CCTTAAGAAG CAGTCCGAAA      1320
     TTATTTTGGA AATTAGAAAG TTGGAAGTAA AACCAACATT AACAGATGTA GAAATTCTAA      1380
     AATTAAATGA GCTTCAAAAA TGTTTCATTG CTAATCATAG CAATTTGTTA AAGATCGGCG      1440
     TTGTCGATCA TGAATATTTT AACGCGAAGC AGTATGATTT AATAATGATG GTGTTAGAAA      1500
     AAATTAAAAA TAAAAATGAA AAAATTAAGG GCGAGTCGGT AGAAAACACT TTCCCTAAAT      1560
     CAAACACTGT CCCTAAATCA AACCCTCCCC CTACATTAAA CCTTGAAATG CGTGGTCACC      1620
     CTGAAAAAGA GGGTATAGCA CAAAACAACG CTTTAAAAGT AGAGCAGGCA TTTCGTAATA      1680
     ATGTTGGCCA ATTTCGAGTA TATCTAGAAG ATACGTCTAA ACTAATAGAC AGTAGTCCAG      1740
     ATTTCCTTAA AATAAGGAAA AATAAAATTG AATTTTTATG GCATAAAATA GATAACCTGA      1800
     TTGAACAGGT GAATAGTCGT TTTGAGAGTT CGCTATTCGA AGAAGAAATT AGCGAACTTG      1860
     AATTTGACAA ACAAAATATT CTTACAGCCA TTAATAGTCG ACTCAGTGGC ACAATAAATA      1920
     AAGCTGAAAT GTCGACGGTT GTTAAGGCGG AGGAGTTACC AACCCTGCCT AAAATACAGA      1980
     TTCCCACCTT CTTTGGTGAT TCCAAAGAAT GGGATCTTTT TAATGAACTC TTTACAGAGC      2040
     TCATACATGT GAGAGAGGAT CTCAGTCCTT CTCTCAAATT TAATTATCTA AAGTCAGCAT      2100
     TAAAAGGAGA AGCCAGAAAT GTGGTTACTC ATTTACTGCT CGGCTCTGGA GAAAATTATG      2160
     AAGCCACTTG GGAGTTTTTG ACCAAGCGAT ATGAGAATAA AAGAAACATA TTCTCAGATC      2220
     ATATGAATAG GCTTATGGAT ATGCCAAATT TAAATTTAGA ATCCAATAAG CAAATAAAGA      2280
     CATTTATTGA CACGATTAAC GAGTCAATTT ATATTATAAA ATTAAAGGCA CAATTACCAG      2340
     AAGATGTGGA TGCAATTTTC GCTCACATAA TTCTTCGGAA ATTCAATAAA GAATCACTCA      2400
     ATTTATATGA AAGCCATGTT AAAAAGACAA AAGAAATACA GGCACTTTCT GATGTCATGG      2460
     ACTTTTTAGA GCAAAGGCTC AATTCTATAT CATCATTCTC ACAGGAAGTA AAACCTGTAA      2520
     AGAAAATGAT TAATAATAAC AAGAATAAAA ATTATAGTGA CAATTGTGCA TATTGCAAAC      2580
     TACCAGGGCA TTATTTAATT CAATGCCATA AATTTAAAAT AATGAATCCA GCAGAACGGT      2640
     CTGACTGGGT AAGAAAAAAT GGGATTTGCC TAAGATGTCT GAGGCATCCG TTTGGTAAAA      2700
     AATGTATAAG CGAGCAGCTT TGTTCGACTT GTCGTAAACC TCACCACACG TTACTTCACT      2760
     TTGCAGGTCA TAATCCAGAA AAAGTGAATA CGTGTAGAAC AACAGGTCAA GCCTTGTTGG      2820
     CCACGGCCTT GATTCAAGTA AAGTCGAGGT ATGGAGGCTT TGAACAATTA AGAGCATTGA      2880
     TTGATAGTGG CTCTCAAAGC ACAATTATTT CAGAAGAGTC TGCACAGATT CTAAAATTGA      2940
     AAAAATTTCG GTCTCATACT GAAATAAGTG GAGTATCTTC CACAGGAACG TGCATCTCCA      3000
     AGCACAAAGC GGTTATTTCG ATAAGAAATT CTCCGAAAAA TTTAGAAATT GAAGCAATTA      3060
     TTCTCCCAAA ACTTATGAAG GCACTTCCAG TCAACACGAT TAATGTTGAT CAGAAAAAAT      3120
     GGAAGAACTT TAAATTAGCC GACCCCGATT TTAATAAACC GGGTCGCATT GATTTAATCA      3180
     TTGGAGCAGA CGTATATACT CACATTCTGC AAAATGGAGT TATAAAAATA GACGGTCTCC      3240
     TTGGGCAAAA AACTGATTTC GGGTGGATAG TTTCTGGATG TAAAAAATCC AAAGGAAAAG      3300
     AAACCATTGT AGCCACAACA ATAGAAATAA AAGAGTTAGA TCGCTACTGG GAAGTGGAAG      3360
     AAGAAGAAAA AGATGATATC GAGTCTGAAA TCTGTGAAAA TAAATTTATC AAAACGACAA      3420
     AAAAAGATTC AGATGGGCGA TACATTGTGT CAATTCCATT CAAGGAGGAT GTCACCTTAG      3480
     GAGATTCAAA GAAACAAGCG ATAGCTCGTT ACATGAATCT GGAGAAAAAA CTAAAAAGAA      3540
     ATGAAAAACT TAAGGTTGAC TACACTAAAT TCATGAATGA ATACATGGAT TTAGGACACA      3600
     TGATTGAAGT GAGTGATGAA GGCAAATATT TTTTACCGCA CCAGGCAGTG ATTAGAGATT      3660
     CAAGCCTTAC GACCAAATTG AGAGTAGTTT TTGATGCTTC AGCAAAAACT ACGAATAACA      3720
     AAAGTTTGAA CGACATAATG TGGGTTGGGC CACGAGTTCA AAAAGATATT TTTGACATTA      3780
     TTATTAAATG GAGAAAATGG GAATTTGTTG TTTCGGCAGA CATTGAAAAG ATGTACCGAC      3840
     AAATTAAAAT AGATAATAAT GATCAAAAAT ATCAATATAT TTTATGGAGA AATTCTCCAA      3900
     AAGAAAAAAT TAAAACATAT AAATTAACCA CAGTCACTTA CGGAACTGCA TCTGCACCAT      3960
     ATTTGGCTAC CAGGGTTCTG GTAGATATTG CAGATAAATG TAAAAACCAA GTTATTAGTG      4020
     CAATAATTAG GAATGATTTC TATATGGATG ACCTAATGAC TGGAGCTGAT TCGGTAGAAG      4080
     AAGCTAATAA ATTAATAACA TTAATTCCCC ATGAATTGCA GAAAGTTGGA TTCAACTTAA      4140
     GGAAATGGAT TTCCAACAAT TCCAAAATAT TAACCACTGT GGAGGACACA GGGGACAATA      4200
     AGGTTCTCAA TATTATCGAA AATGAATGTG TTAAAACTTT AGGACTAAAA TGGGAACCTC      4260
     AAAAGGATTT ATTTAAGTTC AGCGTAAATT GTAATGATGA ATCAAAAAAT ATAAATAAGC      4320
     GCGTTGTGTT ATCAACGCTA GCAAAAATAT TTGATCCGTT AGGATGGTTG GCACCAGTCA      4380
     CGGTTTCAGG AAAACTTTTT ATTCAAAAAC TTTGGATAAA TAAAAGTGAA TGGGATCAGG      4440
     AATTATCCAT AGAAGATAAA AATTATTGGG AAAAATATAA AGAAAATTTA TTATTGTTAG      4500
     AGAATATTCG AATCCCAAGG TGGATTAATT CAAACAGTTC TTCAGTCATT CAGATTCACG      4560
     GATTTGCGGA CGCCTCCGAA AAAGCATATG CTGCAGTAGT CTATGCTAAA GTAGGACCTC      4620
     ATGTTAATAT AATAGCTAGC AAAAGTAGAG TCAACCCTAT AAAAAATAGG AAGACAATTC      4680
     CCAAACTCGA GCTGTGTGCA GCTCACCTGC TTAGTGAATT AATCCAAAGA CTAAAAGGAT      4740
     CAATTGACAA TATAATGGAG ATCTATGCTT GGAGTGATTC CACGATTACC TTAGCATGGA      4800
     TTAACAGTGG TCAAAGTAAG ATCAAATTTA TAAAAAGAAG AACGGATGAC ATTCGGAAAT      4860
     TAAAAAATAC TGAATGGAAT CATGTTAAGT CAGAGGATAA TCCAGCAGAT TTAGCATCCA      4920
     GGGGAGTGGA TTCTAACCAG TTGATCAACT GTGATTTTTG GTGGAAAGGT CCGAAATGGC      4980
     TAGCAGACCC AAAAGAACTT TGGCCTCGGC AGCAGTCTGT AGAAGAACCT GTCTTAATAA      5040
     ATACGGTATT AAATGACAAA ATAGATGATC CTATTTACGA ATTAATAGAA AGGTATTCCA      5100
     GTATAGAAAA ACTTATACGT ATAATAGCAT ACATAAATAG ATTCGTGCAG ATGAAAACAA      5160
     GAAATAAAGC CTATTCATCA ATTATTTCAG TAAAGGAGAT AAGAATAGCG GAAACAGTTG      5220
     TTATTAAGAA ACAACAAGAA TACCAGTTTA GGCAAGAGAT AAAGTGCCTT AAAATCAAAA      5280
     AGGAAATCAA GACAAATAAT AAAATATTGT CATTGAATCC ATTTTTGGAC AAGGGTGGGG      5340
     TTCTAAGAGT TGGAGGAAGA TTGCAAAATT CCAATGCAGA ATTTAATGTT AAACATCCAA      5400
     TCATTTTAGA AAAATGCCAC CTAACAAGCT TATTAATAAA AAATGCTCAT AAGGAAACAT      5460
     TGCATGGAGG GATAAACCTA ATGCGAAACT ATATCCAAAG AAAGTATTGG ATTTTCGGGT      5520
     TGAAAAATTC GTTGAAAAAG TATTTAAGAG AATGTGTAAC GTGTGCAAGG TATAAACAAA      5580
     ATACAGCTCA GCAAATAATG GGTAACTTGC CAAAATATAG AGTGACGATG ACATTCCCGT      5640
     TTCTTAATAC TGGAATAGAT TACGCAGGTC CTTATTATGT TAAATGTTCA AAAAATCGTG      5700
     GCCAAAAAAC ATTTAAAGGA TACGTTGCTG TATTCGTTTG CATGGCCACC AAAGCCATAC      5760
     ACTTAGAAAT GGTAAGCGAT CTAACTTCAG ACGCATTTTT AGCAGCACTC AGAAGATTTA      5820
     TTGCTAGACG GGGAAAATGT TCCAATATCT ATTCAGACAA CGGAACAAAT TTTGTAGGAG      5880
     CTGCAAGAAA ATTAGATCAA GAGTTATTTA ATGCAATACA AGAAAATATA ACGATTGCAG      5940
     CGCAACTTGA AAAGGACAGG ATTGATTGGC ATTTTATTCC CCCGGCAGGA CCTCACTTCG      6000
     GAGGTATTTG GGAAGCTGGA GTTAAGTCAA TGAAATACCA TTTAAAGCGT ATAATCGGCG      6060
     ACACTATTTT TACTTATGAA GAAATGTCAA CTCTTTTATG TCAAATAGAA GCATGCTTAA      6120
     ATTCAAGGCC ATTATACACT ATAGTTAGTG AGAAGGACCA ACAAGAAGTT TTAACACCAG      6180
     GTCATTTTTT AATTGGAAGA CCACCTTTAG AAATAGTCGA ACCAATGGAA GATGAAAAAA      6240
     TCGGAAATTT GGATAGGTGG AGACTTATCC AAAAAATAAA GAAAGATTTC TGGGTTAAGT      6300
     GGAAAAGTGA ATATTTGCAT ACGCTCCAGC AAAGGAATAA ATGGAAAAAG GAAATTCCTA      6360
     ATATAGAAGA AGGGCAAATA GTTTTATTAA AGGATGAGAA TTGTCATCCT GCAAGATGGC      6420
     CTTTAGGAAA GGTGGAAAAG GTGCATAAGG GGAATGATGA TAAGGTCCGA GTGGCTAAAG      6480
     TAAAGATGCA GGAAGGATAT ATCACTAGAC CCATTACTAA AATTTGTCCC TTGGAAGGAA      6540
     TAAAGTCTGT TGACAAAAAT GAGGCTGACC AAGAGCCAAA AAGACGAACT AGAGCGACAT      6600
     CGGGAATGTC CAAGATCGGA ATCATTATGG CAATGTTGTT GTTTGTGTTA AGTTGTCAAG      6660
     TTTCTAGCGC ATTACCTAAA GATATAGCAC CAAGATATTC TATAGACAAA ATAAATAAAA      6720
     CCTCAGCAAT ATATCTAGAC CCGCTAGGAG ATGTTGAGAT TGTGAGTACT TCTTGGAATT      6780
     TGGTTATCTA TTATAAAATG GATCCATATT TTAAAATGTT AACAAAGGGT AATGCGCTTA      6840
     TACAAAGTAT GAGGAAAGTT TGCGAAAGAC TTCATAGCTT TGAAGAGCAA TGTAGTCTAG      6900
     TCTTAGATAA TATGCAAAGT CAGTTATCGG AACTTGAAGA AAACAATAAA TTGTTTATGA      6960
     TGCAGTCTAG ATCTAGAAGC AAGCGTGCTC CTTTCGAATT TATGGGTTCC TTGTATCATA      7020
     TTTTATTTGG TATAATGGAT GAAGATGATA GAGAGCAATT AGAAGAAAAT ATGAAGAATT      7080
     TGTTAGATAA CCAGAACAAC CTTGATAAAC TAATTCAAAA ACAAACATCT GTGGTTGATT      7140
     CAACTTCTAA TCTATTAAAG AGAACAACAG AAGATGTTAA CTCCAATTTT AGAAGTATGC      7200
     AAATAAGAAT TGAGAACATG ACAGAAGTTC TTAAAGAAAA TTATTATGTT TATAAGGAAT      7260
     CAATAAAATT CTTTATGATT ACGAAACAGC TACACTCATT GATTGAAGAA GGCGAAAAAA      7320
     TTCAAGCAGG CATTATAAGC CTGTTGATTG ATATTAATCA CGGTAGGCTA AATACAAATA      7380
     TTCTCAGGCC AAATCAGCTT AAAAAAGAAA TTGCCAAAAT TCAGCAGAGT CTTTCAGAGA      7440
     ACCTAGTAAT TCCAGGAAAA CGGTCAGGTA CGGAACTTAA GGAGGTGTAT ACACTGTTAA      7500
     CAGCCAGGGG TTTATTCATC GACGATAAAT TGATCATTAG TGCAAAAGTG CCTCTGTTTA      7560
     GCAGGCATCC ATCCAAATTG TTCAGGCTTA TTCCGGTGCC AATTCGAAAT GAAGATCGGA      7620
     TAATAATGGT GCATACAACG TCCGAATATT TAATTTATAA TTTTGAGATA GATTCCTATC      7680
     ACATAATGAC GGAAGCCACA TTAAATCAAT GTCAGAAATG GCAACTAAAT AAGAGAATAT      7740
     GCAAAGGAAG TTGGCCCTGG AATTCAGCGA ATGATAATGC ATGTGAGATT CAGCCTCTAA      7800
     AGCCAGATAA AGCGGCGAAC TGCATCTATA AAACAGTAGT CGACTCTAAA AGTTACTGGG      7860
     TAGAGTTAGA AAAGAAAAGT AGTTGGTTGT TTAAGGTTCC TGCGAATTCA AAAGTCCGTC      7920
     TGCAATGTAC TGGCTCTCAA ATTGAATTGT TTGATTTGCC TCAGCAAGGA GTTTTAAGCA      7980
     TTGCGCCATA TTGTACGGCA AGAACCGACG ATAAAATTCT AGTTGCCCAC CATAACATTC      8040
     AGTCCGAAAG TGAAGAATTA TTATCAACAC CTTATATAGG AGAAGTTAGT GGAGTGCCGA      8100
     AGATTATTTG GGATCCGCTG AAACTATCAA TATTAAATCA TACTGAGGAA TTTGAACGAT      8160
     TGAATAATGA AATTAAATTT ATGAAAGAGA ACCATCAAAA ATTGAAAGAT TTACATTTCC      8220
     ATCATATTTC CGGACATGCT GGATTAATTA TTGCTTTAAT ACTAATGATA GTATTAATAA      8280
     TATATTTCAT ACGGAAATGT GCTGTGCAAC AAAGAATGCA AGCAATAACC TTTGCAGGTC      8340
     CGTTGCCAGT ACTATAAATA TCAATAGTAA ATAAACAATA AAATAATATA ACAAATAAAA      8400
     ATATACAGTC CACTAATAGA AAATGTACTT CTACATAGAA AAAGCAAAAT GTTTAAAATA      8460
     AGTTAATTAA GTACAAATTG TTGAATTAAA AATAATATAA ACCATAATTG TAATCCAATA      8520
     AAATTAAAAG CCAGAAAAAC TAGGCCCATT GAAATCTTAG TTGCAAAATA AATGAACATA      8580
     TATCAAATAA ATACAGTCCA CTACTGTTAT AAATGCAACT AATATACTAA TGTACATCTC      8640
     AGCTTTGCTG GCCCTTTGGC AGAATGTTCA CACATGAACA CGAATATATT TAAAGACTTA      8700
     CAATTTTGGG CTCCGTTCAT ATCTTATGTA AATGAATCGA GAGCGATAAA TTATATTTAG      8760
     GATTTTGTTA TCTAAGGCGA CATGGGTGCA TTGCTCAAAA ACATGTAATT TAAGTGCACA      8820
     CTACATGAGT CAGTCACTTG AGATCGTTCC CCGCCTCCTA AAATAGTCCC TTAGTGGGAG      8880
     ACCACAGATA AGGTCCTCGC CGCTCAAGAT AGGCAGATGT GCCCGAGCGT GGGACCTCGA      8940
     TAAGGCGGGG ACTATTTACG TAGGCCTCTG CGTAGGCCAT TTACTTTAAG ATGCGATTCT      9000
     CATGTCACCT ATTTAAACCG AAGATATTTC CAAATAAAAT CAGTTTCTTA CAAAAACTCA      9060
     ACGAGTAAAG TCTTCTCATT TGGGATTTTA CA                                    9092
//
ID   BLOOD    standard; DNA; INV; 7410 BP.
XX
AC   AY180916;
XX
DR   FLYBASE; FBte0000279; Dmel\blood.
XX
FT   source          AY180916:1..7410
FT   SO_feature      five_prime_LTR ; SO:0000425:1..398
FT   SO_feature      three_prime_LTR ; SO:0000426:7011..7410
FT   SO_feature      CDS ; SO:0000316:966..1271
FT                   /name="Dmel\blood\sORF"
FT                   /db_xref="FLYBASE:FBgn0045863"
FT                   /db_xref="NCBI_PROTEIN:AAN87266.1"
FT                   /translation="MSTKQTFEHPAPVEQRDLPSIKEVIEVDPSAGPKPLTIQEYKAR
FT                   TAAREQPPKKKRGGRRIKLLSARRLNIELLKTATNEEDRQRYKERLAAINQQLRGAK"
FT   SO_feature      CDS ; SO:0000316:1863..3116
FT                   /name="Dmel\blood\ORF1"
FT                   /db_xref="FLYBASE:FBgn0045865"
FT                   /db_xref="NCBI_PROTEIN:AAN87267.1"
FT                   /translation="MEWLNLTISINNIRDAFDKSYKCINKTALIKTQTLIFHIKVLIT
FT                   QYNTLQNLIVTNKSKLTEEHKVQCFKVLSSFGKRLHNTSVRHSIIIEVPTELTKIAEF
FT                   DESQLRDLDESQPLEDLDIESDIESIEELKFNTVQPNTRNMANALEAQRAYVKQVSAT
FT                   VPDFDGKKLHLNRFVTALKLTDLTKGDQETLAVEVIKTKIIGPLNYKVEHATTIQAII
FT                   TILQANVKGESPDVIKAKLINAQQRGKTASQYVTEIDSMRKQLEAAYIDGGLDADNAD
FT                   KFATKESISAMTKNCANEALKMILTAGTFSTFNDAMEKYLHCSTEITGNSNTVLFYNG
FT                   NNRRGNYNAYYRGRGRNNYNHNYNQNYNQGYNNNNRGRGGYRGHGNNRDGGNRRGNQS
FT                   QNNNNNRNVRNVQSENSQTPLSDQQ"
FT   SO_feature      CDS ; SO:0000316:3749..6733
FT                   /name="Dmel\blood\ORF2"
FT                   /db_xref="FLYBASE:FBgn0045864"
FT                   /db_xref="NCBI_PROTEIN:AAN87268.1"
FT                   /translation="MKDYDIFTTPVEKENRTEEILKQLRFPKQFNNELTKLCTEFSDI
FT                   FGLETEPISANNFYKQKLRLGEKTPVYIKNYRMADSQKPEIARQVKKLIDDGIVEPSM
FT                   SEYNSPLLLVPKKPLPNSTEKRWRLAVDYRQINKKLLSDKFPLPRIEDILDQLGRAKY
FT                   FSCLDLMSGFHQIELEKRYRDITSFSTANGSYRFTRLPYGLKVAPNSFQRRMTLAFSG
FT                   LEPSQAFLYMDDLVVIGCSEKHMLKNLTNVFELCRRHNLKLHPGKCSFFMKEVTYLGH
FT                   KCTDKGILPDDTKYEVIEKYPIPTDADSARRFVAFCNYYRRFIKNFSDHSRHLTRLCK
FT                   KNVQFEWTAECNDAFEYLKTELMKPTLLQYPDFGKEFCITTDASKQACGAVLTQDHNG
FT                   QQLPVAYASRMFTQGESNKSTTEQELTAIHWAINHFRPYIYGKHFMVKSDHRPLSYLF
FT                   SMKNPSSKLTRMRLDLEEYDFTVEYLKGKDNHIADALSRITIKDLKTINREILKVTTR
FT                   SKAKQENSCKDEAIVKIQEEKEQTIEKPKVYEVVNNNDTKKYVLIKIDKHKCLLKRGK
FT                   TIVSRFDVDDLYSNETFDLNQFFQRLISKAGMHKITKMRISPSEQMFQFVSLNEFKIK
FT                   GNRVLEKVELAILQKVIIIDKNDEAQIKEILTKFHDDPIEGGHTGISRTQSKIKRFYY
FT                   WPQMTKTISKYVKTCLKCQQAKITTHTKTPLTLMPTPATAFDTVLIDTIGPLPKSEDG
FT                   NEYAVTIICDLTKFLVTIPTPNKSAKTVAKAIFELFVLKYGPMKTFITDQGTEYKNSL
FT                   MNELCKYMHIENLTSSAHHHQTLGTIERSHRTFNEYIRSYISVNKSDWDIWLPYFTYC
FT                   FNTTPSIVHDYCPYELVFGRLPRQFKDFSKINKIDPIYNLDDYSKELKCRLELSYNRA
FT                   RRMLEKAKADRKLRYDRNTNNFELKIGDKVLLRKETGHKLDKRYEGPYDVVDIGINDN
FT                   ITIKTGSKKQQIVHKDRLKKHK"
XX
CC   Sequence from P1 (complement)DS03023:69372..76782 provided by Guochon Liao,
CC   Berkeley Drosophila Genome Project.
XX
SQ   Sequence 7410 BP;  2840 A; 1403 C; 1328 G; 1839 T; 0 other;
     TGTAGTATGT GCATATATCG AGGGTACACT GTACCTATAA GTACACAGCA ACACTTAGTT        60
     GCATTGCATA AATAAATGTC TCAAGTGAGC GTGATATAAG ATCACCCATT TATGCTTTAA       120
     GCTAAGTCAG CATCCCCACG CTGGCCGCTG GCCATATATG CGCATAAGCT CTCTCTCTCT       180
     CTCTCTTATA CATATATATA TACGCTGCTC TTCTGCCGCT GTCGACGGCG GCGCAGTCGC       240
     AGTATTTAGG TAAGATTAGA CACTCTGTAG AGGTTAAGCG GGCAGAACCG TTTCTGCTAC       300
     TCGAAGAGAT AAGAAGAAAT AAAAAGGTGC CTGACGGCTG CACCCAACTG CAAGGAAAAC       360
     ACGTGTTCTC AATTGGTGGC ATATATTGGT TTATTACATG GCGACCGTGA GGCAGGAGCC       420
     TGCGATCTGA GGACTACTGA GGAAATGCTG CTAATATTGC CGATTTGATT TGGGAATTCT       480
     AAACAGCGAC AACAGGTGTG AGAAGCAGGC CGCCCCTTAC ACCAGTGCGG GAGACCTAGA       540
     GACGGGACAC TGATGAAAAA AAAAGAAACA AAAATACTGA GTGAGTAGAG TGTGGTAATG       600
     GGCAAACGCG GATGTCAGGA AATCAAAAAT AAAGGTATAG CACATATTAA GTGGCTATGA       660
     TATACAAATA AAACACCGCC CCCATGGGCA ACGGCACAGA AATTAACTGC CGAATTAGAC       720
     TTTCTGAAAG AAAACCTCCA GCAAAGAAAG CCGAATACCA CAACTCACTC AGCAAAAATA       780
     GAAATAATCA ATGAAGAAAT AACTGAAAAT TCAACATCAC CCAAGCCGAA AAGACCCGAC       840
     GTCTGCATGA AAGACTGCCC TCGACCATTG TAAGCCGCAA CAGCAATTAG CACGGCATCC       900
     TGCGAGGGTA GGATTAGGAT AAAGGATAAA GGATTCCACC GGCGCGCCGC ACATGACAAC       960
     AGCGAATGTC TACCAAGCAG ACGTTCGAAC ACCCTGCTCC TGTCGAGCAA AGGGATCTGC      1020
     CAAGTATCAA AGAGGTAATA GAGGTAGATC CGTCCGCGGG ACCAAAGCCC TTGACCATAC      1080
     AAGAGTACAA GGCACGGACT GCAGCGAGGG AGCAGCCACC TAAAAAGAAG AGGGGTGGCC      1140
     GCCGGATTAA GTTGCTCAGC GCCCGGAGGC TCAACATCGA ACTACTGAAG ACGGCAACTA      1200
     ATGAGGAAGA CCGGCAGCGC TACAAAGAGC GCCTTGCAGC CATCAATCAA CAACTTCGTG      1260
     GTGCGAAGTA AAGCGGCGGG CTGCGTTATA CGCCATAGCC TCAACCGCCC AAATATTATA      1320
     TTAATGTTGT CGATGCGGTT TCCGCTGCAA CAAAATTACT AACTTATCAG GGACCCATTT      1380
     CATAACTAAC ACATTATACT CAGTCCTAAA CTTAAAATAA GTAATAATAT TGTAAAATTG      1440
     CAAATTGCAA CCGATGTAAA CTGAGTATAA TGAATTCATC TATCAAGTAA AAATATGTTT      1500
     AACAACAGTT TAGACCTATT AAAATTTCGA GCTATATTTA TATCTGATCG AGATAACAAT      1560
     AATTGACCAA TTCTCAAAGT TAAAATTCTA TTTGTACTTT TGATATACAA ATAAAGACTA      1620
     ATTTTCCCCA TATCAAAATG GGACATAAGT CGTGGATACA ACCCCACAGT TAAATTCAAT      1680
     GTACTTACTA TTTTTGATTT TAGTTATCCT ATCAGCCTTT TTACCTTGGC CTTAAAACTT      1740
     TATCAGTTTC ACACAAGATC GTTGAAAAGA CTTACATGAG TCGAGCCAAT GATTTAGACA      1800
     AAATCTAATA GAAACTACAC CAAAAAGGTA CAAGGTCGAT TACATCGCTA AAAGGTACAT      1860
     ACATGGAATG GCTAAACTTA ACCATATCCA TAAACAATAT TAGAGATGCT TTTGATAAAT      1920
     CCTATAAATG TATTAATAAA ACCGCGCTGA TCAAAACTCA GACGCTTATT TTTCACATAA      1980
     AGGTATTGAT AACACAATAC AACACATTAC AAAACCTAAT AGTAACAAAC AAAAGCAAAC      2040
     TCACTGAAGA ACATAAAGTC CAATGCTTCA AAGTTCTCAG TTCATTTGGT AAAAGACTAC      2100
     ATAATACCAG CGTTAGACAC AGTATTATAA TAGAAGTCCC AACAGAACTA ACCAAAATAG      2160
     CAGAATTCGA CGAAAGCCAG TTAAGAGACT TGGACGAGTC GCAGCCGTTA GAAGATTTAG      2220
     ATATCGAAAG CGATATCGAA TCAATAGAAG AATTAAAATT TAATACCGTA CAACCAAATA      2280
     CAAGAAACAT GGCCAACGCA TTAGAAGCTC AGAGAGCATA CGTTAAACAG GTATCTGCCA      2340
     CAGTACCTGA TTTCGATGGT AAGAAACTCC ATTTAAACAG GTTTGTGACA GCACTTAAGT      2400
     TGACGGATCT AACTAAAGGA GATCAAGAAA CTTTAGCAGT AGAGGTCATA AAGACCAAAA      2460
     TTATTGGCCC ATTAAACTAT AAAGTAGAAC ATGCGACAAC GATACAGGCA ATAATTACCA      2520
     TATTGCAGGC AAACGTAAAA GGCGAATCGC CTGACGTTAT AAAGGCCAAA TTAATAAATG      2580
     CCCAACAAAG AGGCAAGACC GCGTCTCAGT ATGTTACAGA AATAGACAGT ATGCGTAAGC      2640
     AGCTCGAGGC AGCTTACATA GACGGCGGAT TAGACGCCGA TAATGCTGAC AAATTCGCGA      2700
     CTAAAGAGTC GATATCAGCA ATGACCAAAA ACTGTGCCAA CGAGGCACTT AAAATGATCT      2760
     TAACTGCAGG TACATTTAGT ACATTCAACG ACGCAATGGA AAAATACCTA CATTGCAGTA      2820
     CAGAAATAAC CGGCAATTCA AATACAGTCT TATTCTATAA TGGGAATAAT AGACGTGGTA      2880
     ATTATAATGC CTACTATCGT GGTAGAGGCA GAAATAATTA TAACCATAAT TATAACCAGA      2940
     ATTATAACCA AGGTTATAAT AATAACAACA GAGGTCGCGG AGGCTACCGC GGCCACGGTA      3000
     ATAACAGAGA CGGAGGTAAC CGAAGGGGTA ACCAAAGTCA GAATAATAAT AACAACCGAA      3060
     ATGTGCGTAA CGTACAATCG GAAAACAGCC AGACCCCCTT AAGCGATCAA CAGTAAAAGT      3120
     GTTTAAAGTA AACCTAAATC TGAGTATTTT CATTAAGACA AAAAACCATG AAACAAACAC      3180
     AGTTCTTACA TTACTAATAG ACACAGGTGC AGAAATTTCA TTGCTAAAAG CCAAAGCAAA      3240
     GGAATATAAT AATATAAATT TCAGTAATAT ATCAAATATT ACAGGTATTG GGCAAGGAAC      3300
     CATACAGTCT ATAGGTACAG TAGATCTTGA CATACGCATT CAGGATGTTC TAGTGCCACA      3360
     TGAATTTCAT GTAGTACCTG AGAATTTTCC GATACCATGC GATGGCATAA TCGGAATAGA      3420
     TTTTATCAAG AAATACAATT GCGTATTAGA GTTTCAAAAT AACAAAGACT GGTTCACAAT      3480
     AAGACCCAAT AACTTCAGTA GACAGATTAG TGTACCAATT ACACATAACT TAGACTCCAA      3540
     CACACTCTTA TTGCCAGCTA GATGCGAAGT AATCAGACAA GTCAAATTAC TCACTAACGA      3600
     AAAAACGGTG GTAGTACCAA ATCAGGAGCT GCAACCAGGT ATAATAGTAG CAAGCACCAT      3660
     TGCCGATAGC AAAAACGCAT TGATTCGCAT TATAAATACA AATAATAAAG ACGCCATAAT      3720
     AGATAGCGCG AAGATCAAAT GCGAATCAAT GAAAGACTAT GACATTTTTA CAACACCAGT      3780
     AGAAAAGGAA AATAGAACTG AAGAAATTTT AAAACAATTA AGATTCCCTA AACAATTCAA      3840
     TAATGAACTA ACTAAGTTAT GCACCGAGTT TAGCGATATT TTTGGTCTAG AAACAGAACC      3900
     AATATCGGCT AACAATTTCT ACAAACAAAA ACTCAGATTA GGGGAAAAAA CACCGGTCTA      3960
     TATAAAAAAC TATCGCATGG CAGATAGCCA AAAACCAGAA ATCGCCAGAC AGGTAAAAAA      4020
     ATTAATAGAT GATGGAATAG TTGAACCATC AATGTCTGAA TATAATAGTC CATTACTTTT      4080
     GGTTCCAAAG AAACCACTTC CGAATTCCAC GGAAAAAAGA TGGCGATTAG CAGTTGACTA      4140
     TCGTCAAATA AATAAGAAAC TATTATCAGA CAAATTTCCA CTTCCAAGAA TAGAAGATAT      4200
     TCTTGATCAA TTAGGAAGAG CAAAGTATTT TTCATGTCTC GACCTAATGT CTGGATTCCA      4260
     CCAGATAGAA CTAGAAAAAA GGTATAGAGA TATAACGTCA TTTTCAACAG CCAATGGCTC      4320
     ATATCGCTTC ACGCGATTAC CATACGGACT GAAAGTAGCA CCAAACTCCT TCCAACGTAG      4380
     GATGACACTT GCATTTTCTG GTCTTGAACC ATCGCAAGCA TTTCTATATA TGGATGACTT      4440
     AGTAGTAATA GGTTGTTCAG AAAAACATAT GCTCAAAAAT TTGACTAACG TATTCGAGCT      4500
     ATGTAGACGA CATAATTTGA AACTACATCC AGGGAAATGT TCTTTCTTTA TGAAAGAAGT      4560
     AACATATTTG GGTCACAAAT GTACCGATAA AGGTATACTC CCAGATGACA CCAAATATGA      4620
     AGTTATAGAA AAATATCCTA TACCAACAGA TGCCGACAGT GCTAGGCGTT TCGTAGCCTT      4680
     CTGTAATTAT TACAGACGTT TCATTAAAAA TTTTTCTGAT CATTCACGCC ACTTAACGAG      4740
     GCTTTGTAAA AAGAATGTTC AATTCGAATG GACAGCAGAA TGCAATGATG CATTCGAATA      4800
     CCTTAAAACA GAATTAATGA AACCAACATT ACTACAGTAC CCAGATTTCG GTAAAGAATT      4860
     TTGCATAACA ACCGATGCTA GTAAACAGGC ATGCGGAGCG GTACTTACAC AAGATCACAA      4920
     TGGTCAACAA CTTCCAGTGG CATACGCTTC AAGAATGTTC ACTCAAGGTG AAAGTAATAA      4980
     GTCCACTACA GAACAAGAAT TAACGGCCAT TCATTGGGCC ATAAATCATT TTCGACCATA      5040
     CATATATGGC AAGCATTTCA TGGTAAAAAG CGATCATAGA CCATTGTCAT ACCTATTCTC      5100
     TATGAAAAAT CCAAGTTCAA AACTCACTCG TATGAGGCTG GATTTAGAAG AGTATGACTT      5160
     TACTGTAGAA TATCTTAAGG GGAAAGATAA CCATATTGCG GACGCCTTGT CTCGCATAAC      5220
     AATAAAAGAT CTGAAAACAA TCAACAGAGA AATATTAAAA GTTACCACCA GATCAAAAGC      5280
     TAAACAGGAA AATTCCTGTA AGGACGAAGC AATAGTCAAA ATACAAGAGG AAAAAGAGCA      5340
     AACAATAGAA AAGCCCAAAG TCTATGAAGT TGTCAATAAT AATGACACAA AGAAATATGT      5400
     TTTAATCAAA ATAGATAAAC ACAAGTGTTT ATTAAAACGA GGAAAAACAA TTGTTTCACG      5460
     CTTTGATGTT GATGACTTGT ATTCTAATGA AACATTTGAT CTAAATCAAT TCTTTCAAAG      5520
     GCTTATTTCA AAAGCCGGAA TGCATAAAAT AACAAAAATG CGAATATCAC CAAGCGAACA      5580
     GATGTTCCAA TTTGTATCAC TAAATGAATT TAAAATAAAG GGCAACCGAG TACTCGAAAA      5640
     AGTAGAACTA GCTATTCTAC AAAAGGTGAT AATTATAGAC AAAAATGACG AAGCTCAGAT      5700
     TAAAGAAATT TTGACAAAAT TCCATGATGA TCCTATAGAA GGAGGCCACA CTGGTATTTC      5760
     GCGAACCCAG TCAAAAATCA AAAGATTTTA TTATTGGCCC CAGATGACCA AGACAATCTC      5820
     AAAGTATGTA AAGACTTGTT TGAAATGTCA ACAAGCCAAA ATTACAACAC ATACGAAAAC      5880
     TCCATTAACA TTGATGCCAA CGCCAGCAAC AGCATTTGAT ACTGTTTTAA TTGATACCAT      5940
     TGGTCCACTA CCGAAATCGG AAGACGGAAA TGAGTATGCA GTTACAATCA TATGCGATCT      6000
     AACCAAGTTT TTAGTAACTA TTCCAACACC AAATAAAAGT GCTAAAACAG TTGCAAAGGC      6060
     TATATTTGAA TTATTTGTAC TGAAGTACGG TCCAATGAAG ACGTTCATTA CAGATCAAGG      6120
     TACGGAATAC AAAAATTCAC TTATGAATGA ATTATGCAAA TATATGCATA TAGAAAATCT      6180
     AACATCTAGC GCTCACCATC ATCAAACTTT AGGAACAATA GAAAGAAGCC ACCGAACTTT      6240
     TAATGAATAT ATACGTTCAT ACATATCGGT TAACAAAAGT GATTGGGACA TTTGGTTACC      6300
     ATATTTCACT TATTGCTTCA ATACAACACC CTCAATAGTC CATGACTATT GCCCATACGA      6360
     ACTAGTATTT GGCAGACTAC CCAGACAATT CAAAGATTTC AGTAAGATAA ACAAAATAGA      6420
     CCCAATATAC AACTTAGACG ACTACTCTAA AGAGCTTAAA TGCAGACTAG AATTGTCGTA      6480
     CAACAGAGCA AGAAGAATGT TAGAAAAAGC AAAAGCGGAT AGAAAATTAA GATATGATAG      6540
     GAATACAAAT AATTTCGAAT TAAAAATAGG AGATAAAGTA TTACTTAGAA AAGAAACAGG      6600
     TCATAAGTTA GATAAAAGAT ATGAAGGTCC TTATGACGTA GTAGATATAG GAATAAATGA      6660
     CAATATAACC ATTAAAACAG GAAGTAAGAA ACAACAAATA GTACATAAAG ATAGGCTAAA      6720
     AAAGCACAAA TAGAATGAAA AAAAAAAAGG GCAATCAATG CCAAACCTTT CATAATAAAA      6780
     CTTAAATAAC GGCCTGATCA GCCAAAACAA TATAACAAAG ACATAGACAT AATCGAATTT      6840
     TTATTAATTC AAAATACATA CATATTTTTT CTTTATTCAT TTAAAAATTC TATATCATAA      6900
     ATAATGTTAA TTCATTAAAA ATAATATTTA AGTAATTTTT ATTTTATAAT GGTAATATAG      6960
     TTGATAGAAA ATAACTTCAT TTCTTTACGT TATTTTAAAA AAGAGGGGAG GTGTAGTATG      7020
     TGCATATATC GAGGGTACAC TGTACCTATA AGTACACAGC AACACTTAGT TGCATTGCAT      7080
     AAATAAATGT CTCAAGTGAG CGTGATATAA GATCACCCAT TTATGCTTTA AGCTAAGTCA      7140
     GCATCCCCAC GCTGGCCGCT GGCCATATAT GCGCATAAGC TCTCTCTCTC TCTCTCTTAT      7200
     ACATATATAT ATACGCTGCT CTTCTGCCGC TGTCGACGGC GGCGCAGTCG CAGTATTTAG      7260
     GTAAGATTAG ACACTCTGTA GAGGTTAAGC GGGCAGAACC GTTTCTGCTA CTCGAAGAGA      7320
     TAAGAAGAAA TAAAAAGGTG GCCTGACGGC TGCACCCAAC TGCAAGGAAA ACACGTGTTC      7380
     TCAATTGGTG GCATATATTG GTTTATTACA                                       7410
//
ID   DMZAM      standard; DNA; INV; 8435 BP.
XX
AC   AJ000387;
XX
DR   FLYBASE; FBte0000217; Dmel\ZAM.
XX
FT   source          AJ000387:1..8435
FT   SO_feature      five_prime_LTR ; SO:0000425:1..473
FT   SO_feature      three_prime_LTR ; SO:0000426:7963..8435
FT   SO_feature      CDS ; SO:0000316:join(494..531,6387..8004)
FT   SO_feature      start_codon ; SO:0000318:1..3
FT                   /name="Dmel\ZAM\env"
FT                   /db_xref="FLYBASE:FBgn0024272"
FT                   /db_xref="SPTREMBL:O46113"
FT                   /db_xref="NCBI_PROTEIN:CAA04048.1"
FT                   /translation="MENTLLNLLLVLLSCHGAYQSIFIHNFNSTNLLAKVPVGKTLVIG
FT                   NYKKISHIIDLSEYTNCIEKLYHTIDTLRQDETLTDSISILNAKLAQTQSKIDALTPFS
FT                   RHKRGLINGLGSLVKVVTGNMDANDAKNIETEINHLKSQSTTISDNFEIQNSFNDEVQL
FT                   RFKNLTRHINNEQNLIKNFFENTQNTIYTKIYNNEEEIKKLQYINRLNYNIDLLVSHLS
FT                   DIIESTLLAKINVIPKLILDKTEITKIKQIFKTQNYTIKSEQHIYNLLKMNALNYQNKI
FT                   IFSIKIPIFLSCNYEMARLIPLPINSTQFVIAPKYLIYNNKSNSMFSTMYKCPVIEEQF
FT                   VCEIDSINNLKNNTCLGHLIQNKTSYCDIKETGLTTDVFEPEKGFILVFNGNNLPIISS
FT                   NQTITSINGSAIIKYNNCTLKINEINYDNRAVSTEEHPDFFLPPMRKLIKNATINILTL
FT                   ERLHLDTLTTSNKLLVVAAGNSRHSTTLYILFTVSLVAVILTWTLRRDTHIFHTGPDHI
FT                   LPIVAPPIPPSMAFAPNWGGRSYRPIGTIHHPSL"
FT   SO_feature      CDS ; SO:0000316:1789..2820
FT   SO_feature      start_codon ; SO:0000318:1..3
FT                   /name="Dmel\ZAM\gag"
FT                   /db_xref="FLYBASE:FBgn0024271"
FT                   /db_xref="SPTREMBL:O46114"
FT                   /db_xref="NCBI_PROTEIN:CAA04049.1"
FT                   /translation="MSKKLTQTIKQTTRSVLESHTFPKRVTRSVSKTNTLPVIRESTPL
FT                   PPLQPINMDSGNASVGNSAPVTPTVSGFSSIATALSATDILAFVKELPTFDGTPGQLDK
FT                   YITSVEEIIMLIRGTDQTPYGLLTLRAIRNKIVGRADEALNLANTKLIWDDIKSNLLRL
FT                   YSSKKSEATLLGELQSLPDNLTLGQLFFGLSRIRSQLISITSNSGQSATIIEAKKTLYD
FT                   EVCLNAFISRIREPLKTVIRLKDPKTIETAYELCQGERARYQNRNPYPPTQNNTERRTN
FT                   NYNNNNNNNHRDNNNRNNVTRLTPKTTQTITQTPIPNIVNQTTATELVTRLKIIKQIMG
FT                   YTT"
FT   SO_feature      CDS ; SO:0000316:<2795..6448
FT   SO_feature      start_codon ; SO:0000318:1..3
FT                   /name="Dmel\ZAM\pol"
FT                   /db_xref="FLYBASE:FBgn0024270"
FT                   /db_xref="SPTREMBL:O46115"
FT                   /db_xref="NCBI_PROTEIN:CAA04050.1"
FT                   /translation="NKLWATQHRRRKTHPTLPYQLKFSGTRLRNPTGYINPTTHATSLP
FT                   YITLNLQQKFPLSFLIDTGSNNSFIDPESANQLECTILPTSTSITTALNSFKIEEKAIF
FT                   PMPPEFKTEGQITLLKFKFHSYFNGLIGMDLLSHLEAKVDLVNLQLVTSKSTLPIFLYT
FT                   NQASKIFNIPAYSKVILPLPVKTNHGEFYCCTTQLNNELSLSEGLYKSNNNIANVEISN
FT                   QSDSDKLLYLEYPLETIPYNKNDHIELFNISATPLNNDTPQAPLHILTEHLNPEEKTAL
FT                   TTLCKQFRDIFYNPETPLTFTNKITHSIPTIDNTPIHTKSYRYPFVHKTEVKKQIESML
FT                   DQQIIRSSHSPWSAPVWVVPKKLDGTGNRKWRLVIDYRKLNDKTISDRYPIPNINDILD
FT                   SIGKAKYFSTLDLTSGFHQIEMNPKDIAKTAFTVEGGHYEFTRMPFGLKNAPATFQRVM
FT                   DSVLGDLNGTICLFYLDDIIIFSPSLQKHLLDIKMVFEKLRAANFKLQPSKSEFLRKEI
FT                   EFLGHIVTQDGVKPNPNKISAIKKFPCPTNRRAIKSFLGLLGYYRKFIRDFARITKPMT
FT                   KQLKGKRQVTTDKDFVDAFEQCKTLLSNDPILIHPDFEKPFILTTDASNFALGAVLSQG
FT                   SLQNDRPVCFASRTLSDTEVNYSTIEKEMLAIIWAVKYFRPYIYGVKFTIVTDHKPLIW
FT                   LMNFKEPNSKIIRWRLQLMEYNFEIIHKKGSQNVIADALSRADPNLNYNETLTVKPCPT
FT                   SEKPINEFNTQLILEIDTNTSYQTTTPFKQKIRKKYSQPCFDFDNIVKILKGTLKPNRI
FT                   CAFLADDNNSALIEKAFSTYFAHKKHFKIIRCKSLLHEIVGNPEQNKFIQEYHTNSNHR
FT                   GIDETFLHLKRETYFPNMKNKISELIRNCETCLKLKYDRQPQNIVFETPETPSKPLDII
FT                   HIDIYTINNNFNLTIIDKFSKFAAVYPIPNRNGINCIKAIKNFFSQFGLPKKLIHDQGV
FT                   EFCNDIFRKFCSQYNILLHVTSFQQSSSNSPVERLHSSLTEIYRIILDTRKKHKLPTDH
FT                   EEIMSETVITYNNAIHSTTKHTPFELFNGRTHLFEKTIIPNNEHDYLNKLNTFQDKLYS
FT                   EIKEKLSTNTQQRIEKLNTSRVEPTTVQPNSTIFRKENRRNKLTPRFSLHRTAKDKGKT
FT                   LVTTRNQKIHKSKIRKISKPPNDLSLSTCIPDLAMGHTNLSSSTTSIAPTS"
XX
CC   Derived from AJ000387 (e1237231) ((Rel. 54, Last updated, Version 1).
CC   Takis Benos and Michael Ashburner, 19-Jan-1998.
CC   Any changes to original sequence record are annotated in an FT line.
XX
SQ   Sequence 8435 BP; 3286 A; 2055 C; 1151 G; 1943 T; 0 other;
     AGTTACCGAC CCATCGGTAC CATACACCAC CCCTCCCTCT AAGCCACCAC GCCTACACAA        60
     GTAGAAGACA TCGAACCGGG AAGCTTTGCG ATACAAAGTT GCAGCATAAA CATCAACAAC       120
     GGGTCAGACG CCGACATCCG CCCAAAATGC TGACACCACA TCCTTTTCGC TCAGACAGAA       180
     CAACGCATAC AATTCCATAT ACATACGTAT AAACATACTC ATACTTTCTG CTGTGTCAGA       240
     TACTTTATTT CTAAGAACTT TAACATTGTA ATACATACAC ACATATTCAC TGTTAGCCCA       300
     TTTAAGACGA AGAATAAAGA CGACCACAGT CGAGTGCAAG CAGCAAACAC TTGTAGACGT       360
     ACATAATCTC CGATCAAAAT TCTCCCAAGA CGACCGTGGC TACGTTCTGG ACCCGCATAA       420
     CTCCTCTATC TTTCTGAGTG ATAATACCTC CGCAAGACTC CCCGGAGGTA ACTGGCGCAG       480
     CCGGAAAACT GGAATGGAAA ATACTTTATT AAACCTTCTA TTAGTTCTAT TGTAAGTAGT       540
     TGTGGAAAAA GAGTGAGAAT GAAGTGCAGA AATGTCTAAA AGTGATTACA ACAAAAATCC       600
     TAATACAATA CATAAACCGC CTTAACAAAC ATACAAAACA CGCATATAAA AAAAAAAAAA       660
     AAAAAAAAAA GAAAAAAAAA AACCCAAAAC TTAAAAATGC CGTAACCGCG AAACATGATA       720
     TGCGTTGTAC TTGTGTGAAA TCAATCGCTG ATAGTCACTG CCGAAGTTTA TTAAGGCCAA       780
     GTACCATATC ATTACTTTCA TGTTTACATA CATATATATG CCCCACAATT AAAACAACAT       840
     ACACACACAC AAATATTTCA AATGCAAAAA AAAAAAAAAG AATGTAGTGT ACCTGCGTGG       900
     CATCAATCGC TGATAAACCA CTGCCGAAAT ATTAAAGGCC CGGTACTACA TCACAAAACA       960
     CGTATATATG CAACAAAAAT ATACACAACA AAACCATATA TACAAACGTG TATGAGTGAC      1020
     GTGTAATGTA CTTGTGTGAA ATCAATCGCT GATAATCACT GCCGAAGCTT AGTAAGGCCA      1080
     AGTACCACAT CATTACTAAC ATGTGTACAT ATATATATAT GCAAAACAAT TAAAACAACA      1140
     TACACACACA CAAATATTTC AAATGCAAAA AAAAAAAAAA AAGAGGAAAT GTTGTGTACC      1200
     TGCGTGGCAT CAATCGCTGA TAAACCACTG CCGAAATATT AAAGGCCCGG TACTACATCA      1260
     CAAAACACGT ATATATGCAA CAAAAATATA CACAACAAAA CCATATATAC AAACGTGTAT      1320
     GAGTGACGTG TAATGTACTT GTGTGAAATC AATCGCTGAT AATCACTGCC GAAGCTTAGT      1380
     AAGGCCAAGT ACCACATCAT TACTAACATG TGTACATATA TATATGCAAA CCACCAAAAC      1440
     AAATACATAT ACACATACAA ACACTCCAAA AAAAAAAACA AATAATACTA TATGAACGGC      1500
     GAAGCGTATG TTTTCTAAGG CTGGATACAA AACCACAAAA CCAAATATAA ATTGCACACC      1560
     TTAATAAAGA AAAGAACAAA AATGATAATA AACAAAAGAA ATTTTTTTTG GAACATGCAC      1620
     CCATACTCTC ACTCTTTCAA CACAAATAAA GTATTCAAAT TATACATACA TACAATAATA      1680
     CCACTATATT ACAGAAATTA ACGCACAAGA AAACACACAC ACTATCCAAC AACAAACAAG      1740
     TAATTAAGAG TTATTAAGTA CATTGTAAAC TACATATTTT TATCTTAAAT GTCAAAGAAA      1800
     TTAACACAAA CTATTAAACA AACAACTCGC TCCGTGTTAG AATCACACAC ATTTCCCAAA      1860
     AGAGTTACAC GATCAGTTTC GAAAACAAAC ACCCTCCCCG TAATAAGAGA AAGCACCCCC      1920
     TTACCGCCCC TTCAACCTAT AAATATGGAT TCGGGCAACG CCTCCGTAGG TAATTCCGCC      1980
     CCCGTAACAC CTACTGTCAG TGGCTTTAGC AGTATTGCTA CGGCACTTAG TGCCACCGAT      2040
     ATTTTAGCCT TCGTTAAAGA ACTTCCGACC TTCGATGGTA CTCCAGGCCA ACTCGACAAA      2100
     TATATAACTA GCGTTGAGGA AATAATCATG CTCATTAGGG GTACCGACCA AACTCCGTAC      2160
     GGACTTCTGA CACTCAGGGC AATTAGGAAT AAAATAGTTG GAAGAGCAGA CGAAGCTCTA      2220
     AACCTAGCCA ACACCAAACT TATATGGGAC GATATCAAAA GTAACCTACT ACGTTTATAC      2280
     TCTAGCAAGA AAAGCGAAGC TACCCTCTTA GGCGAGCTCC AATCTCTCCC AGATAACCTA      2340
     ACCCTAGGGC AATTGTTCTT CGGCTTATCG AGGATTAGGA GCCAACTTAT ATCCATTACT      2400
     TCCAATAGTG GACAGTCGGC CACAATCATC GAAGCCAAGA AAACACTATA TGACGAAGTC      2460
     TGTTTAAACG CCTTCATCTC AAGAATTAGA GAACCACTTA AAACAGTCAT CAGATTGAAA      2520
     GACCCCAAGA CTATCGAAAC AGCTTACGAG CTATGTCAAG GAGAAAGGGC TCGTTACCAG      2580
     AACAGAAACC CATATCCCCC AACACAAAAC AACACCGAAC GACGAACTAA CAACTACAAT      2640
     AACAATAACA ACAACAATCA CAGAGACAAC AACAACCGCA ACAACGTAAC TCGTCTTACA      2700
     CCCAAAACCA CTCAAACCAT TACTCAAACC CCAATTCCCA ATATCGTCAA TCAAACAACG      2760
     GCAACAGAAC TAGTAACCCG TTTAAAGATA ATAAAACAAA TTATGGGCTA CACAACATAG      2820
     AAGAAGAAAA ACTCACCCAA CACTGCCTTA CCAACTTAAA TTTTCAGGCA CCCGCCTCAG      2880
     GAACCCAACA GGATACATAA ATCCTACCAC ACATGCAACA TCCCTTCCAT ACATAACTCT      2940
     AAACCTCCAA CAAAAATTCC CTTTATCATT TCTTATCGAT ACAGGATCCA ATAACTCCTT      3000
     CATTGACCCA GAATCTGCAA ACCAACTAGA GTGCACAATT CTACCAACAT CCACTTCAAT      3060
     TACAACAGCA TTAAATAGTT TCAAAATTGA AGAAAAGGCA ATATTCCCAA TGCCACCCGA      3120
     GTTCAAAACC GAAGGTCAAA TTACCCTACT TAAATTCAAA TTTCACTCTT ATTTCAATGG      3180
     CCTCATAGGA ATGGACCTAT TATCACACCT AGAAGCAAAA GTAGACCTAG TAAACTTACA      3240
     ACTAGTAACT TCAAAGTCTA CACTCCCAAT ATTCTTATAC ACTAACCAGG CTTCAAAAAT      3300
     TTTTAACATC CCCGCCTACA GTAAAGTTAT CTTACCACTA CCAGTAAAGA CTAATCATGG      3360
     GGAATTCTAT TGTTGTACTA CACAACTAAA TAATGAGTTA TCGTTGTCAG AAGGACTATA      3420
     TAAATCAAAC AATAATATTG CCAATGTCGA AATCTCTAAC CAATCCGACT CAGATAAACT      3480
     ATTATACCTA GAATACCCCC TAGAAACCAT TCCATACAAT AAAAACGACC ATATAGAGCT      3540
     CTTTAATATA TCAGCTACAC CTCTTAATAA CGATACCCCT CAAGCCCCAT TACATATCCT      3600
     CACAGAACAC CTCAATCCAG AGGAAAAAAC AGCCTTAACA ACCCTATGTA AACAATTTCG      3660
     CGACATATTC TACAACCCAG AAACACCATT AACTTTTACC AACAAAATCA CACACTCCAT      3720
     CCCAACCATA GATAACACTC CTATCCACAC AAAATCCTAC AGATACCCTT TTGTCCATAA      3780
     AACAGAAGTC AAAAAACAAA TCGAATCCAT GTTAGACCAA CAAATTATTA GATCTAGCCA      3840
     CTCCCCTTGG AGCGCCCCGG TGTGGGTGGT CCCAAAAAAA CTAGACGGGA CAGGGAACAG      3900
     GAAATGGCGA CTTGTAATAG ACTACCGGAA ACTCAACGAC AAAACCATTT CGGACAGATA      3960
     CCCCATCCCA AACATAAATG ACATATTAGA TAGCATAGGC AAAGCAAAAT ATTTCTCAAC      4020
     GCTCGACCTA ACTAGCGGTT TTCATCAAAT CGAGATGAAT CCAAAAGATA TCGCCAAAAC      4080
     AGCCTTTACA GTCGAAGGGG GTCACTACGA ATTCACACGG ATGCCCTTCG GCTTAAAAAA      4140
     CGCACCGGCT ACCTTTCAAC GGGTTATGGA CAGCGTTCTT GGCGATCTCA ACGGCACCAT      4200
     TTGCCTATTC TATCTTGACG ATATTATAAT TTTCTCGCCT TCCCTACAAA AACACCTGTT      4260
     GGACATAAAA ATGGTATTCG AAAAACTCAG AGCGGCAAAC TTTAAACTAC AACCTTCAAA      4320
     ATCAGAATTC CTAAGGAAAG AGATAGAATT TCTAGGCCAC ATAGTCACAC AAGACGGAGT      4380
     TAAACCAAAC CCGAACAAAA TAAGTGCGAT CAAAAAATTT CCTTGCCCCA CCAACAGAAG      4440
     AGCTATCAAA TCTTTTCTCG GGTTACTGGG TTATTATAGG AAGTTTATAA GAGACTTTGC      4500
     ACGAATAACG AAGCCCATGA CTAAACAATT GAAAGGGAAA AGACAAGTTA CTACAGACAA      4560
     AGACTTTGTA GACGCATTCG AACAGTGCAA AACTCTTCTG TCCAATGACC CAATACTCAT      4620
     ACACCCAGAC TTCGAAAAAC CATTCATTCT TACTACGGAT GCTAGTAACT TCGCGTTAGG      4680
     AGCCGTACTA TCTCAAGGCT CCTTACAAAA CGATAGACCT GTATGTTTTG CCAGCAGGAC      4740
     CCTCTCCGAC ACCGAAGTCA ACTATTCAAC CATAGAAAAA GAAATGTTGG CAATAATATG      4800
     GGCAGTAAAA TACTTCAGAC CATATATTTA TGGCGTAAAA TTTACTATTG TTACAGATCA      4860
     CAAGCCACTA ATATGGCTTA TGAATTTCAA AGAACCCAAC TCAAAAATAA TTCGTTGGAG      4920
     ACTCCAACTC ATGGAATACA ATTTTGAAAT AATTCACAAG AAAGGTTCAC AAAATGTAAT      4980
     TGCAGACGCC TTAAGTAGAG CGGACCCAAA TTTAAACTAC AACGAAACAC TGACTGTTAA      5040
     GCCTTGCCCC ACATCCGAAA AACCTATTAA CGAATTTAAC ACGCAACTCA TACTAGAAAT      5100
     AGATACAAAT ACGTCTTACC AAACTACAAC ACCATTTAAA CAAAAGATTA GGAAAAAATA      5160
     TTCACAGCCT TGCTTCGATT TCGATAATAT TGTTAAAATC TTGAAAGGAA CCCTAAAACC      5220
     TAACAGGATT TGCGCATTCT TGGCGGACGA TAATAATTCC GCATTAATCG AAAAAGCATT      5280
     CTCAACGTAT TTTGCACATA AAAAACACTT TAAAATTATC AGATGCAAAT CACTTCTCCA      5340
     CGAAATCGTA GGAAACCCCG AACAAAACAA ATTCATTCAG GAATATCACA CTAACAGCAA      5400
     CCACAGAGGC ATAGACGAAA CATTCCTTCA CCTCAAACGA GAAACCTACT TCCCCAATAT      5460
     GAAAAACAAA ATCTCTGAAT TAATTAGGAA TTGCGAAACC TGTCTAAAAC TCAAATACGA      5520
     CAGGCAACCA CAAAATATAG TATTTGAAAC CCCAGAAACC CCATCGAAAC CCCTCGACAT      5580
     AATACACATA GACATCTATA CTATTAACAA TAATTTTAAC CTGACAATCA TAGACAAATT      5640
     CTCAAAATTC GCAGCTGTCT ACCCCATCCC AAATAGAAAC GGCATCAATT GCATCAAAGC      5700
     AATCAAAAAT TTTTTCAGTC AATTCGGACT ACCCAAAAAA CTAATACACG ACCAAGGAGT      5760
     AGAATTTTGC AACGACATAT TTCGAAAGTT TTGCTCTCAA TATAATATAC TTCTCCATGT      5820
     CACATCCTTC CAGCAATCTT CAAGTAATTC TCCAGTAGAA CGTTTACACT CCTCTTTGAC      5880
     AGAGATTTAC AGAATAATAC TAGACACACG GAAAAAACAC AAATTACCTA CAGACCACGA      5940
     AGAAATAATG TCAGAAACTG TAATAACATA TAACAACGCA ATCCACTCCA CCACCAAACA      6000
     CACCCCTTTT GAACTTTTTA ATGGTAGGAC CCATTTATTC GAGAAAACAA TAATACCCAA      6060
     TAATGAGCAT GACTATTTAA ATAAACTAAA TACGTTCCAA GACAAACTAT ACTCCGAAAT      6120
     AAAAGAAAAA TTGTCCACAA ACACCCAACA AAGGATAGAA AAGCTAAACA CAAGCAGAGT      6180
     AGAACCAACA ACAGTACAAC CTAACAGCAC AATTTTCAGA AAAGAAAACA GGAGAAATAA      6240
     ATTAACACCA CGGTTTTCCT TACACAGAAC AGCAAAAGAC AAAGGAAAAA CTCTAGTAAC      6300
     CACAAGAAAT CAAAAAATCC ACAAATCAAA AATTAGGAAA ATATCCAAAC CTCCAAATGA      6360
     CTTAAGCCTT TCCACCTGCA TTCCAGATCT TGCCATGGGG CATACCAATC TATCTTCATC      6420
     CACAACTTCA ATAGCACCAA CCTCCTAGCA AAAGTGCCGG TAGGGAAAAC ACTCGTGATA      6480
     GGAAACTATA AAAAAATTAG CCACATAATC GATCTGTCCG AATACACCAA CTGTATTGAA      6540
     AAATTATACC ACACCATCGA TACCCTAAGA CAAGATGAAA CACTCACCGA TTCTATATCA      6600
     ATACTAAATG CTAAACTGGC CCAAACTCAA AGTAAAATAG ACGCACTAAC ACCCTTTTCA      6660
     CGCCACAAAA GAGGTCTTAT TAACGGGTTA GGTAGTTTAG TCAAAGTCGT CACCGGCAAC      6720
     ATGGACGCCA ATGATGCAAA GAATATAGAA ACAGAAATTA ACCACTTAAA AAGCCAGTCC      6780
     ACCACTATCT CAGATAACTT CGAAATACAG AACTCGTTCA ATGATGAAGT TCAACTACGG      6840
     TTCAAAAACT TAACAAGACA CATTAACAAT GAACAGAATT TGATTAAAAA CTTCTTCGAA      6900
     AACACTCAAA ATACAATTTA CACAAAAATA TACAACAACG AAGAAGAAAT AAAGAAACTA      6960
     CAATATATAA ATAGGCTTAA CTACAATATA GATTTATTAG TTAGCCACCT AAGCGACATT      7020
     ATAGAAAGTA CACTGCTTGC CAAAATTAAT GTTATCCCAA AACTCATCTT AGACAAGACA      7080
     GAAATAACCA AAATCAAACA AATTTTTAAA ACACAAAACT ACACAATAAA ATCCGAGCAA      7140
     CACATTTATA ACCTCTTAAA AATGAACGCA CTCAATTACC AAAACAAAAT AATTTTTAGT      7200
     ATCAAAATTC CTATTTTTTT AAGTTGTAAC TACGAAATGG CAAGATTAAT TCCACTTCCA      7260
     ATAAATTCCA CACAATTTGT AATAGCACCT AAGTACTTAA TATATAATAA CAAAAGTAAC      7320
     AGCATGTTTT CAACTATGTA TAAATGTCCT GTAATAGAAG AACAATTCGT CTGCGAAATC      7380
     GACTCCATCA ATAATCTTAA AAATAATACT TGCCTGGGAC ACCTTATCCA AAATAAGACC      7440
     AGCTACTGCG ACATAAAGGA AACGGGACTC ACGACTGATG TGTTCGAACC GGAAAAAGGC      7500
     TTCATACTTG TATTTAACGG GAACAACCTC CCAATCATCT CCTCCAACCA GACCATAACT      7560
     AGTATCAATG GATCAGCTAT AATAAAGTAT AACAATTGCA CATTAAAAAT CAATGAAATA      7620
     AACTACGACA ACAGGGCGGT ATCAACAGAA GAGCACCCCG ACTTCTTCCT ACCACCAATG      7680
     CGGAAACTAA TAAAAAATGC CACTATCAAC ATACTCACCT TGGAAAGACT TCACCTGGAT      7740
     ACACTCACAA CATCCAATAA GCTACTGGTC GTCGCCGCAG GAAACTCTCG ACACTCGACA      7800
     ACCTTGTATA TCCTCTTCAC CGTATCCCTA GTCGCCGTAA TACTCACCTG GACACTTCGA      7860
     AGGGACACCC ACATCTTCCA TACCGGGCCC GACCACATTC TTCCAATCGT CGCTCCACCA      7920
     ATTCCTCCGT CTATGGCCTT CGCTCCAAAC TGGGGGGGGA GGAGTTACCG ACCCATCGGT      7980
     ACCATACACC ACCCCTCCCT CTAAGCCACC ACGCCTACAC AAGTAGAAGA CATCGAACCG      8040
     GGAAGCTTTG CGATACAAAG TTGCAGCATA AACATCAACA ACGGGTCAGA CGCCGACATC      8100
     CGCCCAAAAT GCTGACACCA CATCCTTTTC GCTCAGACAG AACAACGCAT ACAATTCCAT      8160
     ATACATACGT ATAAACATAC TCATACTTTC TGCTGTGTCA GATACTTTAT TTCTAAGAAC      8220
     TTTAACATTG TAATACATAC ACACATATTC ACTGTTAGCC TATTTAAGAC GAAGAATAAA      8280
     GACGACCACA GTCGAGTGCA AGCAGCAAAC ACTTGTAGAC GTACATAATC TCCGATCAAA      8340
     ATTCTCCCAA GACGACCGTG GCTACGTTCT GGACCCGCAT AACTCCTCTA TCTTTCTGAG      8400
     TGATAATACC TCCGCAAGAC TCCCCGGAGG TAACT                                 8435
//
ID   DME010298  standard; DNA; INV; 8507 BP.
XX
AC   AJ010298;
XX
DR   FLYBASE; FBte0000359; Dmel\GATE.
XX
SY   synonym: Batumi
XX
FT   source          AJ010298:1..8507
FT   SO_feature      five_prime_LTR ; SO:0000425:1..272
FT   SO_feature      three_prime_LTR ; SO:0000426:8236..8507
FT   SO_feature      polyA_signal_sequence ; SO:0000551:158..163
FT   SO_feature      polyA_signal_sequence ; SO:0000551:8383..8398
FT   SO_feature      primer_binding_site ; SO:0005850:276..293
FT   SO_feature      RR_tract ; SO:0000435:8236..8507
FT   SO_feature      CDS ; SO:0000316:1741..6456
FT                   /name="Dmel\GATE\polyprotein"
FT                   /db_xref="FLYBASE:FBgn0044067"
FT                   /db_xref="SPTREMBL:O76925"
FT                   /db_xref="NCBI_PROTEIN:CAA09069.1"
FT                   /translation="MPIGDDKKKLSADKPRSIFSPQGPKSPRIPSISVKTPAQISDDCA
FT                   TPSKATVQRTAKNMAASDLALAKFISVSDAQANLRLRSTLRNPQLQPSRCLASVATKSE
FT                   AYGTRLKRIRPLLRVPCVSRRAAASGMPILRASYSYCYSVYERCVAQLVDKIEQGHFSV
FT                   HPKRTLRPRPTFPLAVGCLHAIQEFSQVTIFAGRFPDLLHAIYINNPRLTPFEKLFHLN
FT                   AKTSGDAHAIVSISPLTKRGFSSAWENLIERFENKRLLVNSQLKILFNVQSIPQESGAA
FT                   LKVMQSTVQGCLTALELSGINTENWDCLLEYLCSSKLPKITLSLWEQSLHKKADIPTWG
FT                   ELNTFLTERHRTLEAIDDVRPSVPSQSHSKAMNSSGPSRDGKLASDLCNKENHPVRVCR
FT                   VFSKWSVDDRSAYIKRKQLCLNYFAKGHQLRECKDRQSFTWWPASHVVAPKQPLFQQFK
FT                   PFKSCKPNFRYSGQFRSKRASRCSKLFCHGSRAILLGSAIINSSHLGTNFKARALIDSG
FT                   SEATFITEPLFNLIRLPFQVVQAQVSGLNQTVAAQFKNAAVSPSDLRLGRVAVGDDGLC
FT                   PPSTSRKSAFLPNSAKFLRDLPDFPLADPKFYESAPIDVLIRSPHPASVLLSGAKTNIC
FT                   GSLLGQETIFRWVLTGPVSASAQSRIPLFRHRSPTRTIIHWTNSSQNLGRWRIYQQSCK
FT                   RIRFHVRERVGKCLRRHQCGKYVVTLPFRDPEHIGCGLGHSRSWALAQFLKNEQRLKKD
FT                   EALKARYDSVIQEYLDLKHMRQVLPTHDCNAYYMPHHAVLKPESVTTKLRVVFNASSPS
FT                   SNGTSLNDILHAGPVLQSDLTVQILKWRDFRYVFSADIQKMYRQIWVDPKHTPFQRILF
FT                   RNNRGEIRDFELKTVTFGVNCAPLLAIRVLQQLAADEELSHPKASNVIRNFMYVDDVLA
FT                   GADSTEEAQLMVHELRDALNSSSSRQRWLSKRPLQRQVLSQIAKLFDPAGWLAPFIVRA
FT                   KIFMQEIWLQELGWDENVPNDLFQRWLNFLQSYSVFEQIRIPRWLSFHPDFKVEHHGFC
FT                   DASQKAYGAAIYVRGEVGSAIMVQLLTAKTRVAPVKTVSLPRLELCGALLLSEMAAAII
FT                   PQMPTINSKLYCWTDSTIVLAWLSKPACQWTTFVANRETKIAQATKTENWSHVQSEHNP
FT                   ADLASRGVSLQDLADSQLWWHGPTWLQNPRNQWPTQVNAPVTDLEKRALKVHLAKAPSE
FT                   ELLARFSKLEKALRVLAYVYRFIQRCRKQTSPSDVHLLATEIAAAERFLISNTQRREFP
FT                   VEYHCLSEKRPVPSSSAILSMNPFLDPQGLIRACGRVAASESPQYNERHPVILPYNCLL
FT                   SRLLAKFTHRTTLHGGNQLMVRLIRSKYWIPRIKNLMKAVVNSCKVCVIHKRRLQSQLM
FT                   GVLPKERASFSRPFTVSAWITPVRDIKNYTGRACVITKGYVLVFVCFSTKAIHLEPTSD
FT                   LTTEKFLAAFSRFVSRRGCPRQVQSDNGKTFVGAATLLSRDFLQAVKESVTNAYIHQEM
FT                   QWQLFSGGTQYGRPLGSRRKKLQDAILQMHGHTKIHVRRTLHALGKNRSVP"
XX
CC   Derived from AJ010298 (e1315889) (Rel. 56, Last updated, Version 1).
CC   Takis Benos and Michael Ashburner, 08-Sept-1998.
CC   Any changes to original sequence record are annotated in an FT line.
XX
SQ   Sequence 8507 BP; 2245 A; 2251 C; 1836 G; 2175 T; 0 other;
     TGTTCAAGTT ACGCTCACCC GCTGTCACCC GCTGTCACCC GCTCTCCGCT CCCTCTTACG        60
     CTCTCCCGCT CTTCACCTCA GAGTCTCCAA GGAGTCCTCG GGCTTGGGAT AGCCTAACTA       120
     ATTAGAATAA GCATCAGTGT AAAAACTAAC CACGCTGAAT AAACATACGC CCGGTCGCCG       180
     CGCAATTACG AAAAGTCTAG TGTTTGCTTT CCTTCGAGTG TTTCTTTTCA GCATATTTGA       240
     ATTCAGGACA GCCATCCCCC TACATCCCAA CATTTTGGTC CTTCGAGCCG GATCACCTGG       300
     ATTTTCAAGT TTGTCCACCA GCGAACAAAT TATAAGATAA GTACGAAATT TCCATTCCTT       360
     TTAATTGCCG GTCTGCAGCA AAAGGTTCGA AAATCCAATT TCGTTCAATT TGCTGTAAGA       420
     TTTATTGTCA AATCTAACGG ATTTCTCCGA CAAAAGGCAA TTAAAGAAAA GTACTTATCC       480
     AATCTCACGG GCGCCGCATA TTACTCGCCG TTCTCCGTTC TCCTTTCACC CTCATTCGTG       540
     AAAATTTCTA AAGTCCAAAT GGGCGAATAT ATTTAAATAT TAATCCAGTG CGATAATGCA       600
     AAATTCCAAA TGTGAAAAAG TGAATAATTT GTGCCAAGTT CAGTGAAACT TTCTAAGTCC       660
     AAAGCTCTGC CAAAATTGGC AAAAATTCTG TTCTCGTTTC ACTGTGTCAA AGCGAAGCCA       720
     AACTTCTTTT CGCAACACAT TTTTGCTTTA ACTCCGCAGT CCACTTAATA CCATTTGCTT       780
     TGCTATCGAA GAATACCACA ACGAAACAAA CAACACCATA CCCTCTGGCC ATTCAAATAA       840
     CATATTAATT AACATTTCCG CAGTTCCATA TCTCTTACAT CAACATATAC CTACTCCATA       900
     CTCTTGCATA TATTCACATC TTACACAATA TATCCTCACC ATATATTACA TATATTACAT       960
     CAACATATAA TATCCACATA TATTACCGAC ATACATTGCG CATATTATCA GCATTCCTTT      1020
     AACGTATACC AAAGTTTAAA TTCGATCCCG TCGGCAAATC CAACCACAAA TAAAATTTAT      1080
     TCCAAGTGCC GACGCGGAAA GGCGTTTTCT TTTCCATCAA TTTTTTCCGT AAATTTCCAA      1140
     ATTAATTTCC GAGCAATAAA TTAAAAGCGG TTTTTTCTTT TTTTTTAACA AATAACTTAT      1200
     TGTTGAAAAC ATTTATTAAA TTATTAAAAA TTATATAAAT AATACGACCG CCAAATACAA      1260
     GTCGTTCACC CGACAAATAT TTTTTCCTGT ATTGCTTGGA TATTAATTTG TGTTTGTTTT      1320
     AGAAGTACTT ACAACGCGGA GAAAAGACTC CAAATCCACC ATTCCATTTT CTCCGTTTCC      1380
     AGTTATAAAC AAAAAAATAA ATAAAATTTT CTTCCTTCTA ATAAACATTT TATTTTACCG      1440
     TGTTCACATT CCAAGTGTTC CAACCGTAAA TAAGGTGGAC CTAATTACCA TAAATCACAG      1500
     GTCATTTATA CAATTCGCTG TTCACTCCGA GTCACCTGTC CAATTAGTCT AAACTACGGC      1560
     GTTTCCACTT CGCAAATTCA ACACCACTTT CTCACCCATT ACATCCTATA CGGTCCTTTT      1620
     CCGCTGCTTT ATACCGTTCA CGGCAGGAAG CTTAAATTTA TTAAGTGGAA TCTGTCTACT      1680
     TTTTCAAAAG TGTGACCGGG CTCCAAAAAC GCTTCCCTTC CATTTCGTAT TTCTTCGATT      1740
     ATGCCCATCG GGGACGATAA GAAGAAATTG TCCGCTGACA AACCCAGGTC TATTTTTTCA      1800
     CCACAAGGGC CCAAGAGTCC AAGAATCCCA AGCATTTCGG TGAAAACGCC TGCGCAGATT      1860
     TCCGACGACT GTGCCACTCC ATCCAAAGCC ACAGTACAGC GCACAGCTAA AAATATGGCT      1920
     GCTTCCGATC TAGCGCTAGC CAAATTCATT TCGGTTTCTG ACGCTCAAGC GAATTTGAGG      1980
     CTCAGATCAA CACTCCGGAA TCCGCAGCTC CAACCGTCAC GATGCTTAGC GTCCGTCGCG      2040
     ACCAAGTCCG AAGCCTATGG GACAAGGTTG AAAAGAATTC GACCTCTGCT CAGAGTGCCT      2100
     TGTGTCAGCA GGCGAGCGGC AGCAAGCGGC ATGCCTATTC TCAGGGCTAG TTACAGTTAT      2160
     TGCTATTCAG TCTATGAAAG GTGTGTTGCC CAGCTCGTTG ATAAAATCGA GCAGGGGCAC      2220
     TTCTCAGTCC ATCCCAAGCG AACGCTGCGG CCCAGGCCTA CATTTCCTCT GGCTGTCGGT      2280
     TGCCTCCATG CGATACAGGA GTTTTCGCAG GTGACTATCT TCGCTGGCCG CTTTCCGGAT      2340
     CTTTTACACG CCATTTATAT TAATAATCCA CGGCTGACTC CGTTCGAAAA GTTATTCCAC      2400
     TTAAATGCCA AAACAAGTGG CGACGCGCAT GCCATAGTTT CGATTTCGCC TCTCACCAAA      2460
     CGAGGGTTTT CCTCTGCGTG GGAAAACCTA ATAGAGCGTT TCGAAAATAA ACGATTGTTG      2520
     GTAAACAGTC AATTGAAAAT ACTGTTTAAT GTGCAGTCGA TACCACAGGA ATCTGGGGCG      2580
     GCCTTGAAGG TAATGCAAAG TACTGTTCAA GGTTGCTTGA CTGCCTTAGA ACTGTCAGGC      2640
     ATCAACACTG AGAACTGGGA CTGCCTGCTG GAATATCTGT GTTCATCCAA GCTCCCGAAG      2700
     ATAACTCTCT CCTTATGGGA GCAGTCTCTA CATAAGAAAG CCGACATCCC GACATGGGGA      2760
     GAACTGAACA CCTTCCTCAC AGAACGTCAT CGAACCCTAG AGGCCATCGA TGATGTGAGA      2820
     CCGTCCGTAC CAAGTCAGTC GCACTCCAAA GCGATGAACT CAAGTGGGCC CTCTAGAGAT      2880
     GGCAAGCTGG CGTCCGACTT GTGCAACAAG GAAAACCATC CTGTCCGTGT ATGTCGCGTT      2940
     TTCTCCAAAT GGTCGGTTGA CGACCGGTCA GCCTACATTA AACGGAAGCA GTTATGCTTA      3000
     AACTACTTTG CAAAGGGACA TCAGCTTCGT GAGTGCAAAG ATCGACAAAG TTTTACTTGG      3060
     TGGCCGGCAT CACACGTTGT TGCACCGAAA CAACCTCTTT TCCAGCAATT CAAGCCCTTC      3120
     AAATCCTGCA AGCCCAATTT CCGCTACTCA GGCCAATTTC GTTCCAAACG AGCAAGCCGG      3180
     TGTTCAAAAT TATTTTGCCA CGGCTCAAGA GCTATCCTTC TTGGCAGTGC CATAATCAAT      3240
     AGTTCCCATC TTGGCACTAA CTTTAAGGCA CGCGCCCTGA TCGACTCCGG ATCAGAGGCG      3300
     ACATTCATAA CCGAGCCACT GTTCAATCTA ATTAGATTGC CATTCCAGGT GGTTCAAGCC      3360
     CAAGTCTCGG GCTTAAACCA AACAGTAGCT GCTCAGTTCA AGAACGCTGC AGTTTCACCA      3420
     TCCGATCTCC GACTAGGCCG CGTTGCAGTT GGAGACGACG GCCTATGTCC TCCCTCAACT      3480
     AGCCGGAAAT CTGCCTTCCT ACCCAATTCC GCAAAATTTC TTCGGGATCT TCCCGATTTT      3540
     CCACTGGCGG ATCCAAAATT CTATGAGAGC GCCCCAATAG ATGTACTTAT CCGGAGCCCA      3600
     CATCCTGCTT CGGTGCTTCT GAGTGGAGCA AAAACCAACA TCTGTGGCTC TCTCTTGGGG      3660
     CAAGAGACCA TTTTCCGCTG GGTACTAACT GGGCCAGTGT CAGCCTCAGC CCAAAGCAGG      3720
     ATTCCTCTTT TTCGACACAG ATCTCCCACG CGTACGATAA TTCACTGGAC AAACTCCTCA      3780
     CAAAATTTGG GGAGGTGGAG GATATACCAA CAAAGTTGCA AAAGAATCCG ATTCCATGTG      3840
     CGAGAACGGG TTGGTAAATG CTTACGACGA CACCAGTGCG GCAAATATGT CGTTACTCTG      3900
     CCTTTTCGCG ACCCAGAACA TATCGGTTGC GGGCTAGGGC ATTCTAGGTC TTGGGCGTTG      3960
     GCTCAGTTCT TGAAGAATGA GCAGCGTCTA AAAAAAGATG AGGCCTTGAA AGCGAGATAC      4020
     GATTCGGTGA TCCAGGAATA TCTCGACTTA AAGCACATGC GACAAGTTCT GCCTACCCAT      4080
     GATTGCAACG CCTATTATAT GCCACATCAC GCCGTCTTAA AACCGGAGAG TGTAACTACT      4140
     AAACTCCGTG TAGTATTCAA TGCCTCCAGC CCTTCATCGA ATGGTACCAG TTTAAATGAT      4200
     ATCCTTCATG CTGGCCCTGT CTTGCAGTCC GACTTGACAG TGCAAATTCT GAAGTGGCGC      4260
     GATTTCCGAT ACGTGTTCAG TGCCGATATT CAAAAAATGT ATCGGCAGAT CTGGGTAGAT      4320
     CCGAAACACA CTCCATTCCA GCGAATACTT TTCCGTAACA ATAGAGGGGA AATCAGAGAT      4380
     TTCGAATTGA AAACAGTAAC CTTTGGAGTC AATTGCGCGC CCTTGCTGGC GATCCGAGTA      4440
     CTGCAGCAGC TAGCAGCTGA CGAAGAACTC AGCCATCCAA AAGCTAGCAA TGTCATTCGA      4500
     AATTTCATGT ATGTGGATGA TGTTTTAGCC GGAGCGGACT CTACGGAAGA AGCTCAGCTC      4560
     ATGGTGCACG AGCTCCGAGA CGCTCTGAAT TCTTCTTCGT CCCGCCAGAG ATGGCTATCG      4620
     AAACGTCCTT TACAACGCCA AGTCCTGTCC CAAATTGCCA AATTGTTCGA CCCTGCAGGC      4680
     TGGTTAGCAC CGTTTATCGT TCGAGCTAAA ATTTTCATGC AGGAGATTTG GCTACAGGAG      4740
     CTTGGGTGGG ACGAAAACGT TCCAAATGAC CTTTTTCAGC GATGGCTTAA TTTTCTCCAA      4800
     AGTTATTCGG TTTTCGAGCA GATACGCATT CCACGCTGGC TATCGTTTCA TCCAGATTTC      4860
     AAGGTCGAGC ATCATGGCTT TTGCGATGCA TCGCAAAAGG CTTATGGCGC CGCAATATAT      4920
     GTCCGCGGAG AAGTGGGCAG CGCCATTATG GTGCAACTCC TAACCGCCAA AACCCGGGTA      4980
     GCACCAGTCA AAACGGTTTC GCTCCCAAGA CTCGAGCTCT GCGGAGCGTT ATTGCTTTCC      5040
     GAAATGGCTG CAGCCATCAT TCCGCAGATG CCTACGATTA ACTCCAAACT TTACTGTTGG      5100
     ACGGACTCCA CCATAGTGCT TGCATGGTTA AGCAAGCCAG CATGCCAGTG GACCACATTT      5160
     GTAGCCAATA GGGAGACGAA GATCGCCCAG GCCACAAAAA CAGAGAATTG GTCTCATGTT      5220
     CAATCTGAGC ATAATCCAGC AGACCTGGCA AGTAGAGGAG TTTCCCTCCA AGATCTAGCC      5280
     GATAGCCAGT TATGGTGGCA CGGACCGACT TGGTTGCAAA ATCCACGCAA CCAATGGCCT      5340
     ACTCAGGTCA ACGCTCCGGT GACCGACCTG GAGAAGCGTG CTCTAAAAGT CCATCTCGCG      5400
     AAAGCTCCTT CTGAAGAGTT GTTGGCACGT TTCTCCAAGC TAGAGAAAGC TCTACGAGTC      5460
     CTTGCCTATG TTTATCGCTT CATTCAGCGG TGCAGGAAGC AGACATCTCC ATCTGATGTT      5520
     CATCTACTGG CCACTGAAAT CGCCGCCGCC GAGCGGTTCC TAATTTCGAA CACTCAACGC      5580
     AGAGAATTCC CTGTGGAATA TCACTGCCTA AGTGAAAAGC GTCCAGTGCC AAGTTCAAGT      5640
     GCCATCCTAA GCATGAACCC GTTTCTAGAT CCGCAAGGAC TGATCAGGGC ATGCGGCCGT      5700
     GTGGCGGCTT CCGAAAGCCC TCAATACAAT GAACGCCATC CAGTGATTCT TCCGTATAAC      5760
     TGCCTGCTTT CTCGCCTCCT TGCGAAGTTC ACGCATCGCA CAACTCTCCA TGGTGGTAAC      5820
     CAGTTAATGG TGCGCCTCAT CCGGTCGAAA TACTGGATTC CGAGAATCAA GAACCTGATG      5880
     AAAGCAGTGG TAAATTCGTG CAAAGTATGT GTGATCCACA AAAGGCGGTT GCAAAGCCAA      5940
     CTGATGGGTG TCCTGCCCAA AGAAAGAGCA TCGTTCTCCC GACCATTCAC GGTATCGGCA      6000
     TGGATTACGC CGGTCCGCGA TATAAAGAAC TATACGGGAA GAGCATGTGT TATTACAAAG      6060
     GGGTATGTGT TAGTTTTTGT TTGTTTCTCC ACCAAGGCCA TCCACTTAGA GCCTACATCT      6120
     GACTTAACGA CCGAGAAGTT TCTTGCCGCT TTCTCTCGTT TTGTATCCAG GAGAGGGTGT      6180
     CCACGTCAAG TCCAGTCAGA CAATGGCAAA ACCTTTGTTG GCGCTGCCAC CCTGCTTTCC      6240
     CGCGATTTCC TTCAAGCCGT AAAAGAGTCG GTGACGAATG CCTATATTCA TCAAGAGATG      6300
     CAATGGCAAT TATTCTCCGG GGGCACCCAA TATGGGAGGC CTTTGGGAAG CAGGCGTAAA      6360
     AAGCTTCAAG ACGCTATTTT ACAAATGCAC GGCCACACGA AAATACACGT TCGAAGAACT      6420
     CTCCACGCTC TTGGCAAAAA TAGAAGCGTG CCTTAACTCC AGGCCGCTCT CTCCTATGTC      6480
     TGAAGATCCG ACAGACTTGC TGGCTCTGAC GCCAGGGCAT TTCCTTGTCG GGGGACCCCT      6540
     TATGTCCACG GTGGAACCCG AAGTAAAGGG GGAAACGAAA TCCCTTCTTA ATCGGTGGCA      6600
     GCATTTGAAG GCTCTCCATC AGCAGTTCCG TGTGCGATGG AAAGAAGAGT ACCTCAAAGA      6660
     ACTCCACAAG CGTTCTAAAT GGCAGGTCCC GTGAACTTCG AGCTAAAATA CTCGTGCATG      6720
     TGGAGCAGCG TGTGGTGGGA TCGGTCGCAC TTCTTGCAAC GATCACCGCT TCGGCAGTCT      6780
     CCCGTGGAAT GCTCGTGAGC GAGGCAATTG GCGCTAGTAT GTTGGTAATG AGGACTGCTC      6840
     GCAAACGCTT TTCAGCGCTG AGCTTTAGGA ACCTCGCGCA CGTCCGAAGA GGATGGATTA      6900
     CCGCGGCAGA CTCGGCATCG GTAGGATTTA ATACCTCGGG TACGTCTGCT CTCCACGGCA      6960
     CGACCTGCGT GCGTTTTGTT GACGAGGAGC CATGTGCGCG TAGTCGAATG TCGAAAGGAG      7020
     ATCGAAAACG AAATGAAAAA TAACGGATGA TTAGTGATAG TGAACTACAA CTAAGGACGA      7080
     GAGGAGAGAC CTATTATTGT GGAGATTCGG AACTCCGTCG GCAAAAGCAC CTTTTTTGCC      7140
     ACTGGACGTT TAATAACTCC ACGTGCAGTA CGGATGTTTA CTACACGACG TTGCCGTCAG      7200
     CTCCTGGGAA AACAGACTCA ATTCTGCCGA GCCGCCACTC ATTAGAGGGC AAGTTGTCGT      7260
     CCTTGATGAC GACTGTTGAG TTACGGGGTT TGGACTGTCA CCGTCTCCGC TCCCTCTTAC      7320
     GTTCTCCACT CCCTCTTACG CTCTCCCGCT CTTCACCACA GAGTCTCCGA GGAGTCTCTG      7380
     GCGCTTGGGA GAACCCAACG CATTAGAATA AGTTTTAGTG TAAAACTAAC CACGATCAAT      7440
     AAAACATACG CCCGGTGCCC GCGCTAATTC TACAAGTCTT CGAGTGTTTT TTCGAGTGGT      7500
     CTTTTTTTCA GCAAACTAGG AACTTTCCAG GACCAGCACC CCCCATCACC CCAACAACGA      7560
     CCATGTCATC GATGGCGTCG CCAACCGGCG CCAACCCTGC AAGCAGCTTC GGCCTCGTCC      7620
     CAACGTTCCC GCCGGCACAA TCCGCCAACT CAGCGTAGGA GTTCACCGCC ACGACGACCG      7680
     GAATCGACGA CGCCAGGCCC ATCACTCTCG TCGCCGCTGC AACGCCACAG CGTGAACATC      7740
     CTTCCCACAG CGCTGGTCAA GATGGAGACC GGGACGAAGA CCTTCAGACC GCAGCACTCA      7800
     TCGATCCGTG CAGCCCCATG AGCTGCATCG ACGCTTCGTT GGCGTCAGCC TTTAAGCTTT      7860
     CGATGACCAA TGTTGGCGAC GAGAAGGTCT GCACGACGAC GATTCGCTCC AGGATCGACG      7920
     CGAACACGAA GCTCGAGGTC GTGCTCAAGA TCGAGCCCAG GGTGCGGATC CGTACACCTG      7980
     TCCGGGCATT GAGCGACACC GTAGTGTCCA AGTACAGGGA CATCATGCTG GCGGATGACG      8040
     GGTTCCATCG GCCTGCTACC GTATCCATGG TCTTAGGAGC AGACATTTAT CCTAAGGTTA      8100
     TCCAATCCGG ATTCCTGACC TTCGACGAGG GAATGCCGGT CGCTCAAAAG ACCGTGTTTG      8160
     GGTGGATCGT GTCCGGTGCC TGCAGCTTGC CTAGATGGCT ATGTTGCAAC CCCAGTGATT      8220
     GCAAGGGGGG CGGAATGTTC AAGTTACGCT CACCCGCTGT CACCCGCTGT CACCCGCTCT      8280
     CCGCTCCCTC TTACGCTCTC CCGCTCTTCA CCTCAGAGTC TCCAAGGAGT CCTCGGGCTT      8340
     GGGATAGCCT AACTAATTAG AATAAGCATC AGTGTAAAAA CTAACCACGC TGAATAAACA      8400
     TACGCCCGGT CGCCGCGCAA TTACGAAAAG TCTAGTGTTT GCTTTCCTTC GAGTGTTTCT      8460
     TTTCAGCATA TTTGAATTCA GGACAGCCAT CCCCCTACAT CCCAACA                    8507
//
ID   ROXELEMENT     standard; DNA; INV; 4740 BP.
XX
AC   AF237761;
XX
XX
DR   FLYBASE; FBte0001160; Dmel\X-element.
XX
SY   synonym: BS2
XX
FT   source          AF237761:1..4740
FT   SO_feature      CDS ; SO:0000316:322..1827
FT   SO_feature      start_codon ; SO:0000318:1..3
FT                   /name="Dmel\X-element\ORF1"
FT                   /db_xref="FLYBASE:FBgn0041613"
FT                   /db_xref="SPTREMBL:Q9NBX5"
FT                   /db_xref="NCBI_PROTEIN:AAF81410.1"
FT                   /translation="MNTLNETAAADESLDTAFLSSPQCAAPQRFQKIKRKSRASPETER
FT                   KKPKSTIGKQGENPSATEPRYGGNSNRFGLLAHLTADKQVGNEIGDLYDQPSTSHQAAI
FT                   AAAKRDAASAGTTSSAKRAQSKPPPIVMEGVDDVYLMMQSIENIVDLEKIEARASMSGV
FT                   LRLYAADANTFRTIVNWLEIEEYEFHCYQLKEDRPYRVCVKGLHHSTLHHQIKDELEKI
FT                   GHKVLDIHTPLRRNEPGTSKASPVNMFFLNIAAAANNKEILAVKALCHMRVVIEPLRKR
FT                   NAIVQCHRCQQIGHTAKYCRKAHICVKCAGEHPAKDCTRPRIELCTCYNCGGQHPANYK
FT                   GCSKLQAFLQRSRPRSGVAGRTEVSDRPTPRGLAGGKEIPSSRGGISYADVARGSIHHK
FT                   QPMSLTHQQQKQKQQPYDGSPSRQRSRSRTRASRGTLQRSTDASSSIEAILQTLNENIN
FT                   SLRSIQEKQMELMMMMMKQQQQQSHQQGQIINLLTALQARQAP"
FT   SO_feature      CDS ; SO:0000316:1827..4553
FT   SO_feature      start_codon ; SO:0000318:1..3
FT                   /name="Dmel\X-element\ORF2"
FT                   /db_xref="FLYBASE:FBgn0041612"
FT                   /db_xref="SPTREMBL:Q9NBX4"
FT                   /db_xref="NCBI_PROTEIN:AAF81411.1"
FT                   /translation="MMPLRILVWNADGVSTKLPEVECFVRRHEIDVLLLSETHCKGAET
FT                   PKLFGFVAYTANDPSGGNAKGGAAILIKNSLAHFPLTPIATAKVQLAPAVIETALGPIS
FT                   FGAVYCPPRFAWTTDEFKDILEEFQTKFIVAGDWNASHWLWGAGRSNQRGIALANLVLN
FT                   SEVDSLATGGPTRYPYGCRGSPGYIDFALTKGVLGIHANISAVVELSSDHLPLVITLDA
FT                   GAISYPKMERLITRRTNLEVFQSQLESTLPLNTAINSGQDVDDAIELLTNNIKSAARLA
FT                   TRSISRQPAADRIPIPREILLLIAEKRRLRTRWMRSRHPSDKTEWNRALSRLRCALVLH
FT                   KAAWFDERLANTGVESEATHSLWKATRAIKRRCTRKAPLVDSNGTWCRTDLGQAEVFAA
FT                   HLAERFQPFKLASLQQVEETQDQLNQALQMDMPITPFEPCEVAEVIVRQSNNKAPGHDV
FT                   ICNATLKALPRQAILYITLVFNAIVRLQYFPYQWKLGIISMIHKPGKPEREPASYRPIS
FT                   LLPSISKVFERLIAVRIVSIMEAQGITPEHQFGFRAGHCTVEQLHRVVEQILTAYDSKE
FT                   YCNSLFLDIREAFDRVWHIGLQLKIKQTLPAPYFGLLKSYLEGRRFAVRFHSAISTEHN
FT                   VAAGVPQGSVLGPLLYCLYSHDMPQPDVSLYGKSMLATFADDVCVTYRSRCEHDAADGI
FT                   QDFAYRFSEWARRWNIGINSSKSNNVCFTLKRRTPPPVYIEEVPVPQPNAAKYLGVLLD
FT                   RRLTFSKHVTDIRTRLRAKVAKHYWLLSSRSKLSLSNKLTIYKQILAPNWKYGCQIWGL
FT                   ACDSHIKRIQAIQNKVARLITGCEWFVRNTTLHRDLKLATVFDEINKHSSRYHDRLERH
FT                   RNRLASALNRSRPPRRLNRRQPRDLITRSPLTRVRRS"
XX
SQ   Sequence 4740 BP;  1336 A; 1215 C; 1183 G; 1006 T; 0 other;
     AATGTTAAAT AAAGGTTCGT GTCTAACAAT ACGCACCTGA CAAAGTGGAT TAAGTGAAAT        60
     TAGTTTTCGC GGTAATAAAC TTATGGACAA GACCAGAATA CTGGCACACA TAGCAAATAG       120
     TGACCCCCCA AGTCACTAAC AGTGAAATAA TAGTGAAACG AAAACATTTT CATTCAAAAA       180
     TACAAAGTTA AGTTTCTCGA ACTGGGGCTC CGCTGCCCAG CTGCCACGCG ATCGCACAAA       240
     CAGCTGTTTG CGAGCTTAAA GCTTTCTATC CCAGGGTTCA AGTTTTGGCT AGAACCCTGG       300
     TGATTTGGTG CACACTTCAA TATGAACACT TTAAATGAAA CCGCTGCGGC TGATGAATCG       360
     TTGGATACTG CGTTTCTCTC GAGCCCCCAA TGTGCTGCCC CGCAGCGCTT TCAAAAAATA       420
     AAGCGAAAGT CTCGTGCTTC TCCGGAGACT GAAAGGAAAA AACCCAAATC AACCATCGGC       480
     AAACAAGGGG AAAACCCTTC GGCTACAGAA CCTAGATATG GCGGCAATTC AAACCGATTT       540
     GGTTTACTTG CGCATCTCAC AGCTGACAAA CAAGTAGGCA ATGAAATTGG CGATCTGTAT       600
     GACCAGCCCA GTACCAGTCA TCAAGCTGCA ATTGCTGCCG CTAAGCGGGA TGCAGCCTCC       660
     GCTGGTACCA CTAGCTCAGC CAAAAGAGCG CAGTCCAAAC CACCTCCTAT AGTAATGGAG       720
     GGAGTGGACG ACGTATACCT GATGATGCAG AGCATCGAAA ATATAGTGGA CCTAGAAAAG       780
     ATTGAGGCTA GGGCGTCAAT GAGCGGTGTC CTAAGGCTTT ACGCGGCTGA CGCTAATACA       840
     TTTCGCACCA TAGTGAACTG GCTCGAGATC GAAGAGTATG AGTTCCACTG CTACCAGCTT       900
     AAAGAGGACA GGCCTTACAG GGTATGCGTG AAAGGCCTGC ACCACAGTAC GCTACATCAC       960
     CAAATCAAGG ATGAGCTGGA AAAGATCGGG CACAAGGTTC TCGATATTCA CACACCGCTT      1020
     AGGCGAAACG AACCGGGTAC CTCAAAAGCG TCGCCAGTCA ATATGTTCTT CCTAAATATT      1080
     GCTGCTGCGG CAAACAATAA GGAGATCCTG GCGGTAAAGG CACTATGCCA TATGAGAGTA      1140
     GTTATTGAGC CTCTCCGCAA GCGTAACGCT ATTGTCCAGT GCCATCGTTG TCAGCAGATT      1200
     GGCCACACAG CCAAATACTG CCGTAAGGCC CACATTTGTG TGAAATGTGC CGGCGAACAC      1260
     CCAGCCAAGG ACTGTACCAG GCCACGCATC GAGCTGTGCA CTTGCTACAA CTGTGGCGGC      1320
     CAGCATCCTG CAAACTATAA AGGTTGCAGC AAGCTACAAG CGTTCCTGCA GCGATCCAGA      1380
     CCCAGAAGTG GAGTGGCTGG AAGAACAGAA GTAAGCGATC GACCAACTCC ACGGGGCTTA      1440
     GCTGGAGGTA AGGAGATCCC CTCTTCTCGA GGCGGAATAT CTTATGCAGA TGTGGCTAGA      1500
     GGGTCCATTC ACCACAAGCA ACCAATGAGC CTGACGCACC AGCAACAGAA GCAAAAGCAA      1560
     CAGCCCTATG ATGGAAGCCC CAGTCGTCAA AGGAGCCGCA GCCGGACAAG GGCGTCTAGG      1620
     GGTACACTCC AGCGCTCGAC GGATGCTAGC AGCAGCATTG AAGCCATCCT GCAGACGCTT      1680
     AATGAGAACA TTAATTCTTT GCGCTCGATT CAAGAGAAGC AAATGGAATT AATGATGATG      1740
     ATGATGAAGC AACAGCAACA ACAGTCACAT CAGCAGGGGC AGATTATCAA TCTGCTCACT      1800
     GCTCTCCAAG CGCGTCAAGC GCCATAATGA TGCCGCTGCG CATCCTAGTG TGGAACGCCG      1860
     ACGGCGTATC CACGAAGTTG CCTGAAGTAG AGTGCTTCGT GCGACGTCAC GAAATCGATG      1920
     TATTACTGCT CAGCGAGACA CACTGCAAGG GGGCAGAGAC GCCTAAGCTA TTCGGATTTG      1980
     TAGCCTACAC TGCCAATGAT CCGAGTGGTG GCAACGCCAA AGGCGGAGCA GCTATCTTAA      2040
     TCAAAAATAG CCTTGCCCAC TTTCCGCTAA CACCAATAGC CACTGCCAAG GTGCAACTTG      2100
     CGCCGGCGGT TATTGAAACG GCACTTGGTC CTATAAGCTT TGGAGCGGTC TACTGCCCAC      2160
     CGAGATTTGC ATGGACTACG GACGAGTTTA AGGACATTTT GGAAGAGTTC CAGACGAAGT      2220
     TCATTGTTGC AGGCGATTGG AACGCGTCCC ACTGGCTCTG GGGTGCGGGA AGGAGCAACC      2280
     AAAGAGGCAT TGCATTAGCG AATCTCGTCC TAAATTCGGA GGTGGACTCG CTAGCAACAG      2340
     GAGGACCAAC AAGATACCCG TACGGCTGTA GAGGCTCACC AGGGTACATC GATTTTGCAC      2400
     TGACAAAGGG TGTGCTGGGC ATCCACGCTA ACATAAGTGC GGTTGTTGAG CTTAGCTCCG      2460
     ACCACCTGCC TCTGGTAATT ACGCTGGATG CGGGGGCAAT ATCCTACCCT AAGATGGAGC      2520
     GGCTTATCAC TAGGCGTACT AACCTGGAGG TATTCCAATC GCAACTGGAG TCCACACTGC      2580
     CCCTCAACAC TGCCATAAAC TCTGGACAGG ACGTTGATGA TGCTATCGAA CTGCTCACCA      2640
     ACAATATCAA GTCAGCAGCT AGATTGGCAA CTCGCAGCAT ATCTCGGCAG CCCGCGGCAG      2700
     ATCGAATCCC AATACCCAGG GAGATCCTGC TGCTTATAGC TGAGAAGAGG CGCTTACGCA      2760
     CTAGGTGGAT GAGGTCTCGG CACCCGTCGG ACAAAACGGA ATGGAACCGA GCTCTGAGTA      2820
     GGCTCCGATG CGCGTTGGTG CTGCACAAAG CCGCATGGTT CGACGAAAGG CTTGCCAATA      2880
     CCGGAGTCGA AAGCGAAGCG ACGCATTCGC TGTGGAAGGC CACGCGCGCA ATCAAAAGGC      2940
     GTTGCACGAG GAAGGCGCCT CTAGTCGATA GCAACGGGAC ATGGTGTCGG ACCGACTTGG      3000
     GACAAGCGGA GGTATTCGCT GCGCACCTCG CCGAGCGATT TCAACCATTC AAGCTTGCCA      3060
     GCCTGCAACA GGTTGAAGAA ACTCAGGACC AGCTGAACCA AGCGCTTCAA ATGGATATGC      3120
     CAATCACGCC GTTTGAACCC TGCGAGGTAG CCGAAGTCAT TGTGCGCCAG AGTAACAACA      3180
     AAGCACCTGG ACATGACGTC ATCTGCAACG CCACATTGAA GGCCCTGCCC AGACAAGCGA      3240
     TCCTCTACAT AACGTTGGTT TTCAACGCTA TTGTGAGGTT GCAATACTTC CCTTATCAGT      3300
     GGAAGCTCGG GATAATCTCC ATGATCCACA AACCTGGCAA GCCGGAAAGG GAGCCCGCCT      3360
     CCTACCGGCC GATCAGTCTC CTCCCTTCAA TTTCGAAGGT GTTTGAGAGA CTGATTGCTG      3420
     TCCGGATTGT AAGCATTATG GAAGCCCAGG GGATTACCCC TGAGCACCAG TTCGGTTTCC      3480
     GTGCTGGCCA CTGTACTGTC GAGCAGCTCC ATCGAGTCGT CGAGCAAATT CTGACTGCCT      3540
     ACGACAGTAA GGAATATTGT AACAGCCTCT TCTTGGACAT TCGAGAAGCG TTTGATCGAG      3600
     TGTGGCACAT TGGACTCCAA CTGAAAATCA AGCAGACGCT GCCTGCCCCA TATTTTGGGT      3660
     TGCTGAAATC GTACCTGGAA GGAAGGAGGT TCGCTGTGCG CTTTCATTCA GCAATTTCCA      3720
     CCGAGCACAA CGTGGCAGCT GGTGTTCCAC AAGGTAGTGT CCTCGGCCCC CTGCTCTACT      3780
     GCCTGTATAG CCACGACATG CCGCAGCCAG ATGTAAGCCT TTACGGGAAA TCTATGTTGG      3840
     CCACATTTGC CGATGACGTG TGCGTCACCT ACAGGTCCCG ATGCGAGCAC GACGCAGCCG      3900
     ATGGTATCCA GGACTTTGCA TACCGGTTCT CGGAATGGGC AAGACGATGG AATATTGGCA      3960
     TCAATAGCAG TAAATCCAAC AACGTCTGCT TCACTTTAAA GCGGAGAACG CCACCGCCCG      4020
     TCTACATCGA GGAAGTCCCC GTACCACAGC CGAACGCAGC AAAGTACCTT GGAGTGCTTC      4080
     TGGATCGCAG ACTCACATTT TCCAAGCATG TGACCGACAT CAGAACGCGC CTACGTGCTA      4140
     AGGTGGCGAA GCACTACTGG CTACTTTCTT CGCGCAGTAA ATTGTCGCTA TCCAACAAGC      4200
     TGACAATTTA CAAACAGATC CTAGCACCAA ACTGGAAGTA TGGGTGCCAA ATCTGGGGCT      4260
     TAGCCTGCGA CAGCCACATC AAAAGGATCC AGGCTATTCA AAATAAGGTA GCAAGACTCA      4320
     TCACCGGCTG CGAGTGGTTT GTTCGAAACA CCACCCTGCA CAGAGACCTG AAACTCGCAA      4380
     CGGTATTTGA CGAAATAAAC AAGCACTCGA GCAGATACCA TGACAGGCTG GAGCGCCACA      4440
     GAAATCGGCT GGCCAGCGCT TTAAACAGAT CTCGCCCACC AAGGAGGCTC AATAGAAGGC      4500
     AACCGAGGGA TCTCATTACC CGATCTCCTT TGACAAGGGT CCGCAGAAGC TGACGCTTAT      4560
     CTTAAATCCT ATTTGTTATA TGTGATTGTT ATGTAATTGT AGTTAAATTA CTGTAAATTT      4620
     GAAAAAGCTA ACTATAGTTA GCCGGCGAGC CCAAATGGGC TGAATTAATA GATAAGAAGG      4680
     ACACAAAGGG GCTTCAAGAC TTCCCCGTAT GCCTTAATAA ATAAATTAAA TAAAAAAAAA      4740
//