Mercurial > repos > artbio > embl2fa
view test-data/transposon_sequence_set_v9.5.embl.txt @ 1:a0b6fec3b066 draft default tip
planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/main/tools/embl2fa commit 27cf3dbac49e5392d8b454668d9c09eabc8acb89
author | artbio |
---|---|
date | Sat, 14 Oct 2023 20:00:57 +0000 |
parents | 3c8c9911cf2a |
children |
line wrap: on
line source
ID DME9736 standard; DNA; INV; 7411 BP. XX AC AJ009736; XX DR FLYBASE; FBte0000104; Dmel\Idefix. XX FT source AJ009736:1..7411 FT SO_feature five_prime_LTR ; SO:0000425:1..600 FT SO_feature three_prime_LTR ; SO:0000426:6841..7411 FT SO_feature CDS ; SO:0000316:<988..2031 FT /name="Dmel\Idefix\gag" FT /db_xref="FLYBASE:FBgn0027381" FT /db_xref="SPTREMBL:O96739" FT /db_xref="NCBI_PROTEIN:CAA08806.1" FT /translation="ARKLKDIMAVPQLSETHLNQLLNQIKELNYYDGAPGKLSGFVNQV FT EQLLSLYPTQEARQAHVIYGAVKRLLVDSALEVVTQERANTWLDMKKALAMAFKDHRPY FT VTLIRQLEDISYPGSICKFIEKLETQYWIMFDKLELESDHVDKSNYTEMLNKTVKSVID FT RKLPDRIYMSLARKDIDTIYKLKQASMELGLYDAIPENHRSNRTEMNKRRNRGNYNQNN FT NQKYYNNRNHNYSNYYPSMNQNHNTQPPQNPTQPMTNQNQYSPRFIPNNQRGNYYAFRR FT DLTQAQQNNPLNNTLNFQPSTSNNINRQGPVKRQRESQSDQSRMDVNFHQAASDTQMIE FT KDIQVPM" FT SO_feature CDS ; SO:0000316:<1950..5402 FT /name="Dmel\Idefix\pol" FT /db_xref="FLYBASE:FBgn0027380" FT /db_xref="SPTREMBL:O96740" FT /db_xref="NCBI_PROTEIN:CAA08807.1" FT /translation="PKQDGCKFSSSCLGHSNDREGHTSPYVKIIHHNKNYKGMIDTGSS FT INIIRENFENLEEKEENLIVYTIKGPITLKRSIIIKPTSVCPSAQKFYIHKFSDNYDFL FT LGRKYLEDTKAKIDYANETVTLGSKVFKFLYEEKKGETASKCLDPQEKNDSALVDRTKP FT KMQKVKTAPKCLKPKHQQQKKETALPKCLISNVVKDTVDNDVTHLDPMSVDNDIVNFAI FT NNELRECNEYRLEHLNAEEVECLKKFLYEYRDIQYKEGENLTFTSTIKHVIQTQHEDPV FT YRKPYKYPQSVDQEVNKQIKEMIEQGIVRKSKSPYCSPIWVVPKKADASGKQKFRLVVD FT YRNLNEITVNDKFPIPRMDEILDKLGRCQYFTTIDLAKGFHQIQMDENSIAKTAFSTKH FT GHYEYTRMPFGLKNAPATFQRCMNNLLEDLIYKDCLVYLDDIIVYSTPLEEHILSLKKV FT FEKLRDANLKLQLDKCEFMKKETEFLGHIVTTNGIKPNPNKTKAITNFPLPKTPKQIKS FT FLGLCGFYRKFIPNFAKIVKPMTLKLKKGAIIDTKCKEYIESFEKLKVLITSDPILIYP FT DFSKPFSLTTDASNVAIGAVLSQNHKPVCYASRTLNEHEINYATIEKELLAIVWATKYF FT RSYLFGRPFEVLSDHKPLVWLNNIKEPNMKLQRWKIKLNEFDYKIKYLPGKENHVADAL FT SRTKIEVMVGEVANSADATIHSAIEDNLNYIPITERPINYFSRQIEIEKGDNDTTSVQH FT LFQKLKIKIVYKEMTPELAKNLIKEYVCTKKSAIYFPNDEDFLIFQRAFTEIISPNNFT FT KLLRCTTKLIDILTYAEFKDLILKKHKELLHPGIEKTINLFKEEYYYPDSQKLIQTIIN FT ECQICYLAKTEHQTQMTYETTPEIFNTREKYMIDFYLTGNQIFLSCIDIYSKFASLVEL FT KSRDWLEAKRAITKIFNDMGKPQEIKADKDSAFMCLALQNWLRSEGVQISISTSKNGIS FT DIERFHKTVNEKLRIIGSQQNVEDRCTKFERILYIYNHKTKHNSTKRFPADIFLYAGSP FT DFNVQQNKIDRIEYLNKNRHDFEVDIKYRQAPLVKSKITNPFKKTGRIGQVDDKHFEET FT NRGRKIVHYKSKFKKQKKFNKSKYDNSRPTKEAQSTQHTSNNA" FT SO_feature CDS ; SO:0000316:5248..6780 FT /name="Dmel\Idefix\env" FT /db_xref="FLYBASE:FBgn0027382" FT /db_xref="SPTREMBL:O96741" FT /db_xref="NCBI_PROTEIN:CAA08808.1" FT /translation="MINISKKQIVAGRSFTISQNLRNRKSLIRANMIIPDQPKKHKVHN FT ILLIMLSCILSLIITVKCNNIEVNPVNAKNGYLIFQTGTMEIPTSYEYHYLSINITKTM FT LMFEDIVSEANNYPNVPQIQYLVDKLKREINGLRIISRSKRGLLNVVGKAYKYLFGTLD FT EDDREELEEKINNMSEDSVKTHDLNTILDVINSGIDIINKLKVDKEQHQQIAVLIFNLE FT QFTEYIEDIELGLQLTRLGIFNPRLLKHDYLKHVNSEKMLKIKTSTWLKTDTNEILIIS FT HIPSEVTKVPIFQIVPYPDEHNYILTEQIFDKFYIFDNQVFHKDTNRDIFDKCIIGIIK FT QEQTQCKYIKTHKNYQINYIEPNILLTWNIPETAVNQDCTHNKILISGNNIIKIKNCTI FT QIDEFLISNNLADFTQTIYITNNVTRLEPINHLQTREMIETHVKHYNFFQIICITTFVI FT MIISLTLYVAYKFKNIPKKIIVNIVSKKNTRTLKIMSMKIFNKEIILPYTQI" XX CC Derived from AJ009736 (e1371475) (Rel. 58, Last updated, Version 1). CC Takis Benos and Michael Ashburner, 1-Feb-1999. CC Any changes to original sequence record are annotated in an FT line. XX SQ Sequence 7411 BP; 3047 A; 1363 C; 1109 G; 1892 T; 0 other; GTGACATATC CATAAGTCCC TAAGACTTAA GCATATGCCT ACATACTAAT ACACTTACAA 60 CACATACACC CCAATACAAC ATACACTACT CCGGATGTAC CCAACAGATA CCAGATAAGA 120 ATAAGATTGT TATATGATCC TCGAGAATGG AAAAAACCCC AATTCTAGAT AAGTCACCCA 180 CTGGTAGACT AAACATCCGT CCCCTAATTT AAACAATTCC TTGCTTAAGC CTCACCCCAT 240 CGTCACATTC CCACGTTCAA AGCTCGGAGC CGCAATCCCG AAAAACAAAA GTATCGATTT 300 CAATAAACAA ATTATAAGAA TCTAAGAGCA CTTGTATCCA AGAGCAAATG CACTTGAATC 360 CAAGAGAAAC GCAAAGCTTT TTCTCTTTAC GATCAGAATC CTAAAGTCTA AAGTCCATAT 420 TAGAAAAGCT CGATACCGAG GCTTGAACGT CAACCAAATC AGAATAATTA TCAGAGTTCA 480 GTTTGAGACC TAATTGTAAA AGGTTCGGTG TTCTTCTCAA ATAAAAAGAT TGTAATCATT 540 TAGTGAAATA AAAATTATAT TTTTTTCACT TATAAATATT GCAAGTATTT AATTGGCGCA 600 GTCGGTTAGG ATCCAATAAA ATAAAAGAGT CCTTTTAGTA CGGTACTGAT CAACTGAAGG 660 ATATGCTATA CGACTAGCTA TCCAAGATCA GCGAATTAAA ATAGTGATTC AAAAATATTT 720 TTTAATCCGC AAAAGAATCT ACGTGAAAGT AGTATTCAAA ATAAAATCCC GTGCGGTCGG 780 AAACAAAAAT TAATTTAAAT TTTTTAATTC CGAAACTTAA AACCAAGTTT AAAGAAAACT 840 TAAAATCAAG AAAACTTAAA ACCAAGTTTA AAGAAAACTT AAAATCAAGA AAACTTAAAA 900 CCAAGTTTAA AGAAAACTTA AAATCAAGAA AACTTAAAAC CAAGTTTAAA GAAAACTCAA 960 AATCAAGAAA ACTTAAAGCC AAAATAAGCT AGAAAACTAA AAGACATCAT GGCAGTCCCA 1020 CAACTCTCAG AAACACACCT AAACCAACTG CTAAACCAAA TCAAAGAATT AAACTACTAC 1080 GATGGCGCAC CTGGCAAATT ATCTGGATTC GTCAACCAAG TGGAACAACT GCTCAGTTTA 1140 TACCCAACAC AGGAAGCAAG ACAGGCACAC GTCATATATG GAGCAGTGAA GCGGTTATTA 1200 GTGGATTCAG CCTTAGAAGT CGTAACCCAG GAAAGAGCTA ACACATGGCT GGACATGAAG 1260 AAAGCACTGG CAATGGCATT CAAAGACCAT AGACCTTATG TAACTCTCAT CAGACAATTA 1320 GAAGACATAT CATACCCAGG AAGTATCTGT AAGTTTATAG AAAAATTAGA AACACAATAC 1380 TGGATTATGT TCGATAAGTT AGAATTAGAA AGTGACCATG TTGATAAATC GAATTATACC 1440 GAAATGTTAA ACAAAACTGT TAAATCAGTA ATAGATCGAA AACTGCCGGA TAGAATTTAT 1500 ATGTCTTTGG CACGTAAAGA TATTGATACA ATTTATAAAT TAAAACAAGC ATCAATGGAA 1560 TTAGGCCTTT ATGATGCTAT TCCAGAAAAT CACCGTTCTA ATAGAACAGA AATGAATAAA 1620 CGTAGGAACA GGGGAAACTA TAATCAAAAT AATAATCAAA AATATTACAA TAATAGAAAT 1680 CACAACTACA GTAATTATTA TCCTAGCATG AATCAGAATC ATAATACACA ACCACCTCAG 1740 AATCCGACTC AACCTATGAC AAATCAAAAC CAATATTCAC CGCGTTTCAT ACCGAATAAT 1800 CAAAGAGGGA ATTATTATGC ATTTAGACGA GACTTAACAC AAGCTCAGCA GAACAACCCA 1860 CTTAATAACA CCCTTAACTT CCAACCTTCG ACATCGAATA ATATTAACAG ACAAGGGCCA 1920 GTAAAAAGAC AACGCGAGAG TCAGAGTGAC CAAAGCAGGA TGGATGTAAA TTTTCATCAA 1980 GCTGCCTCGG ACACTCAAAT GATAGAGAAG GACATACAAG TCCCTATGTA AAAATAATTC 2040 ATCATAATAA AAATTATAAG GGAATGATCG ATACAGGATC ATCAATTAAC ATCATAAGAG 2100 AAAATTTTGA GAACTTAGAA GAAAAGGAAG AAAACCTAAT AGTATACACT ATTAAAGGAC 2160 CAATAACACT AAAGAGAAGT ATAATAATAA AACCTACTTC AGTATGTCCG TCTGCTCAAA 2220 AATTCTACAT TCACAAATTT TCTGATAACT ATGATTTCTT GTTAGGTCGA AAGTATTTAG 2280 AAGATACAAA AGCTAAAATA GATTATGCTA ACGAAACAGT AACACTAGGC TCAAAAGTAT 2340 TTAAGTTTCT CTATGAAGAA AAGAAGGGCG AGACCGCATC CAAATGCCTT GACCCACAAG 2400 AAAAGAATGA TTCCGCTCTA GTGGACAGAA CCAAACCAAA AATGCAAAAG GTTAAGACCG 2460 CACCTAAGTG CCTTAAACCA AAGCATCAAC AGCAGAAGAA AGAGACCGCA TTACCCAAAT 2520 GCCTCATTTC AAATGTTGTT AAAGACACAG TGGACAATGA TGTAACACAT CTCGATCCCA 2580 TGTCCGTTGA CAACGATATA GTCAACTTCG CGATTAACAA TGAGTTACGC GAATGTAACG 2640 AGTATAGACT CGAACACTTA AATGCAGAGG AAGTTGAATG TTTAAAGAAG TTCCTATACG 2700 AATATAGAGA CATTCAGTAC AAAGAGGGCG AAAATTTGAC CTTCACCAGT ACTATTAAAC 2760 ATGTCATCCA GACTCAACAC GAAGACCCAG TATACCGTAA ACCCTACAAG TACCCTCAAA 2820 GCGTTGACCA AGAAGTTAAC AAACAAATTA AAGAAATGAT AGAACAAGGG ATTGTTCGCA 2880 AATCGAAGTC CCCTTATTGT TCTCCTATTT GGGTGGTCCC CAAGAAGGCA GACGCCTCTG 2940 GGAAACAAAA ATTCAGGTTG GTAGTCGATT ACAGGAACCT AAATGAGATA ACTGTTAACG 3000 ACAAATTTCC CATTCCCCGA ATGGATGAGA TATTGGACAA ACTAGGTAGA TGCCAATACT 3060 TTACCACTAT AGATCTAGCC AAGGGTTTTC ACCAAATCCA AATGGATGAA AATTCTATTG 3120 CAAAAACAGC TTTTTCAACT AAGCATGGGC ATTATGAATA TACTCGTATG CCCTTTGGTT 3180 TAAAAAACGC TCCAGCTACT TTTCAGAGAT GCATGAATAA TCTTCTGGAA GATTTAATCT 3240 ACAAAGACTG TTTAGTCTAT TTAGACGATA TTATTGTTTA TTCCACTCCA TTGGAAGAAC 3300 ACATTTTATC CCTAAAGAAA GTCTTTGAAA AACTGAGAGA CGCTAATTTA AAGTTGCAAC 3360 TAGATAAATG TGAATTCATG AAGAAAGAAA CTGAATTCCT AGGACACATC GTCACAACAA 3420 ATGGCATCAA ACCAAATCCA AATAAAACTA AAGCAATTAC AAATTTTCCA TTACCCAAGA 3480 CACCTAAGCA AATAAAATCA TTTTTGGGAT TATGTGGATT CTATCGCAAG TTTATTCCTA 3540 ACTTTGCCAA AATAGTTAAA CCCATGACCC TCAAATTAAA GAAAGGTGCT ATAATAGACA 3600 CCAAATGTAA AGAATACATC GAATCATTTG AAAAATTAAA AGTTTTGATA ACTTCAGACC 3660 CGATATTAAT CTATCCTGAT TTTTCAAAAC CTTTTTCTTT GACAACTGAT GCTAGCAACG 3720 TAGCTATTGG TGCAGTGTTA TCACAAAATC ACAAGCCAGT TTGTTATGCC AGTAGAACGC 3780 TAAACGAACA TGAAATCAAC TATGCTACGA TTGAAAAAGA ATTGTTAGCT ATAGTTTGGG 3840 CTACAAAATA TTTCAGGTCA TACTTATTCG GCAGACCATT TGAAGTATTA AGTGATCACA 3900 AGCCACTGGT ATGGCTCAAC AACATTAAAG AACCAAACAT GAAATTGCAA AGATGGAAAA 3960 TAAAACTTAA TGAATTCGAT TATAAAATCA AATATCTTCC AGGCAAAGAA AACCATGTCG 4020 CGGATGCTCT TTCCCGCACG AAAATAGAAG TTATGGTTGG CGAGGTCGCA AATAGCGCAG 4080 ACGCAACTAT ACACAGTGCC ATTGAAGATA ATCTAAATTA CATACCCATA ACAGAAAGAC 4140 CAATAAATTA CTTCTCTAGA CAAATAGAGA TAGAAAAAGG CGATAACGAT ACAACAAGTG 4200 TACAACATTT GTTTCAAAAA TTAAAGATTA AGATAGTCTA TAAAGAAATG ACACCTGAAC 4260 TCGCCAAAAA CCTCATTAAG GAATATGTGT GCACCAAAAA GAGTGCAATT TATTTCCCTA 4320 ATGACGAAGA TTTTCTGATC TTCCAGAGAG CGTTTACCGA AATTATAAGC CCTAACAATT 4380 TCACAAAACT CTTGAGATGT ACCACAAAGT TAATTGATAT ACTAACGTAT GCAGAATTCA 4440 AAGATTTAAT CTTAAAGAAA CATAAGGAAC TTTTACATCC GGGTATAGAA AAAACAATCA 4500 ATTTATTTAA AGAAGAATAT TACTATCCTG ATAGTCAAAA GCTTATTCAA ACCATTATCA 4560 ATGAATGTCA AATTTGTTAT CTAGCAAAAA CGGAACATCA AACACAAATG ACATATGAGA 4620 CTACACCAGA AATATTTAAC ACAAGAGAAA AATACATGAT AGATTTTTAT CTCACAGGAA 4680 ACCAGATCTT CTTATCTTGC ATTGATATCT ATTCGAAATT TGCATCACTA GTTGAATTAA 4740 AAAGTAGAGA TTGGCTAGAA GCAAAAAGAG CCATTACTAA AATATTCAAT GACATGGGAA 4800 AACCGCAAGA AATTAAAGCA GACAAAGACT CAGCTTTTAT GTGTTTAGCC TTACAAAATT 4860 GGTTAAGATC TGAAGGTGTA CAAATTTCTA TAAGCACTAG CAAAAATGGT ATATCTGATA 4920 TAGAAAGATT CCACAAGACC GTAAACGAAA AGCTAAGAAT CATTGGTAGC CAACAAAATG 4980 TTGAAGATAG GTGCACAAAA TTCGAAAGAA TTCTATACAT ATACAATCAC AAAACTAAAC 5040 ATAATAGTAC TAAAAGATTT CCAGCAGACA TTTTCCTATA TGCAGGCAGT CCAGATTTTA 5100 ATGTACAACA AAACAAAATC GATAGGATAG AATACCTCAA TAAGAATAGA CACGATTTTG 5160 AAGTTGATAT AAAATATAGA CAAGCCCCAC TTGTAAAAAG TAAAATAACC AATCCATTTA 5220 AAAAGACAGG AAGAATTGGA CAAGTAGATG ATAAACATTT CGAAGAACAA AATCGTGGCA 5280 GGAAGATCGT TCACTATAAG TCAAAATTTA AGAAACAGAA AAAGTTTAAT AAGAGCAAAT 5340 ATGATAATTC CAGACCAACC AAAGAAGCAC AAAGTACACA ACATACTTCT AATAATGCTT 5400 AGTTGCATAC TATCACTTAT CATCACGGTC AAGTGCAACA ATATAGAAGT AAATCCAGTA 5460 AACGCGAAAA ATGGATACCT TATATTCCAA ACAGGAACAA TGGAAATTCC AACCAGCTAT 5520 GAATACCATT ATTTAAGCAT AAACATAACA AAGACAATGC TCATGTTCGA AGATATAGTA 5580 AGTGAAGCAA ACAACTATCC TAATGTACCA CAAATACAAT ATTTAGTCGA CAAATTAAAA 5640 CGAGAAATAA ATGGGTTAAG AATTATTAGT CGAAGTAAAA GAGGTCTTTT AAACGTAGTA 5700 GGAAAAGCAT ACAAATACTT ATTCGGCACA TTAGATGAGG ATGACAGAGA AGAGTTAGAA 5760 GAAAAAATAA ACAACATGTC AGAAGACTCT GTAAAAACCC ATGACCTAAA CACGATTCTA 5820 GATGTAATCA ATAGTGGTAT AGATATAATT AATAAGCTCA AAGTAGATAA AGAACAACAC 5880 CAACAAATTG CGGTACTAAT ATTTAACCTA GAGCAATTTA CAGAATATAT AGAAGACATA 5940 GAATTGGGTC TGCAATTAAC CAGACTAGGA ATTTTCAATC CAAGATTACT AAAGCATGAC 6000 TATTTAAAAC ATGTAAATTC AGAAAAAATG CTAAAGATAA AAACGTCAAC CTGGCTTAAA 6060 ACAGACACGA ACGAAATTTT GATTATTTCC CATATTCCTA GCGAAGTTAC TAAAGTTCCA 6120 ATATTCCAAA TTGTTCCGTA CCCAGATGAA CATAATTATA TTCTAACCGA GCAAATATTC 6180 GATAAATTCT ACATATTTGA TAACCAAGTA TTCCATAAAG ATACCAATAG GGATATATTC 6240 GACAAATGTA TTATTGGAAT CATCAAACAA GAGCAAACTC AATGCAAATA TATTAAAACA 6300 CATAAAAATT ACCAAATAAA TTATATAGAA CCAAATATAC TATTAACATG GAATATTCCT 6360 GAAACAGCTG TTAACCAAGA CTGTACACAC AATAAAATAT TAATTTCAGG AAACAACATC 6420 ATTAAAATTA AAAATTGTAC CATACAAATA GATGAATTCT TAATCTCTAA TAATCTAGCA 6480 GACTTTACAC AAACAATTTA TATCACCAAC AATGTAACAC GTCTAGAACC AATAAATCAC 6540 TTACAAACGA GAGAAATGAT AGAAACCCAT GTAAAACACT ATAACTTTTT TCAAATTATA 6600 TGCATTACAA CGTTCGTCAT AATGATAATT AGTTTGACTC TGTATGTAGC ATATAAGTTT 6660 AAAAATATAC CTAAGAAAAT TATTGTCAAT ATCGTAAGCA AAAAGAACAC ACGCACCTTG 6720 AAAATAATGT CAATGAAAAT ATTCAACAAG GAAATAATAT TACCTTATAC CCAAATTTAA 6780 CGACCTGAGG ACAGGCCAAA TTCAAAGGTT GGGGGAGTGA CATATCCATA AGTCCCTAAG 6840 ACTTAAGCAT ATGCCTACAT ACTAATACAC TTACAACACA TACACCCCAA TACAACATAC 6900 ACTACTCCGG ATGTACCCAA CAGATACCAG ATAAGAATAA GATTGTTATA TGATCCTCGA 6960 GAATGGAAAA AACCCCAATT CTAGATAAGT CACCCACTGG TAGACTAAAC ATCCGTTCCC 7020 CTAATTTAAA CAATTCCTTG CTTAAGCCTC ACCCCATCGT CACATTCCCA CGTTCAAAGC 7080 TCGGAGCCGC AATCCCGAAA AACAAAAGTA TCGATTTCAA TAAACAAATT ATAAGAATCT 7140 AAGAGCACTT GTATCCAAGA GCAAATGCAC TTGAATCCAA GAGAAACGCA AAGCTTTTTC 7200 TCTTTACGAT CAGAATCCTA AAGTCTAAAG TCCATATTAG AAAAGCTCGA TACCGAGGCT 7260 TGAACGTCAA CCAAATCAGA ATAATTATCA GAGTTCAGTT TGAGACCTAA TTGTAAAAGG 7320 TTCGGTGTTC TTCTCAAATA AAAAGATTGT AATCATTTAG TGAAATAAAA ATTATATTTT 7380 TTTCACTTAT AAATATTGCA AGTATTTAAT T 7411 // ID DMIS176 standard; DNA; INV; 7439 BP. XX AC X01472; J01060; J01061; XX DR FLYBASE; FBte0000109; Dmel\17.6. XX FT source X01472:1..7439 FT SO_feature five_prime_LTR ; SO:0000425:1..512 FT SO_feature three_prime_LTR ; SO:0000426:6928..7439 FT SO_feature TATA_box ; SO:0000174:372..377 FT SO_feature TATA_box ; SO:0000174:7271..7277 FT SO_feature primer_binding_site ; SO:0005850:511..529 FT SO_feature polyA_signal_sequence ; SO:0000551:372..377 FT SO_feature polyA_signal_sequence ; SO:0000551:7299.7304 FT SO_feature RR_tract ; SO:0000435:6917..6927 FT SO_feature CDS ; SO:0000316:1074..2393 FT /name="Dmel\17.6\gag" FT /db_xref="FLYBASE:FBgn0044339" FT /db_xref="SWISS-PROT:P04282" FT /db_xref="NCBI_PROTEIN:CAA25701.1" FT /translation="MAQEPAIVPPLSDSNMTQVAYQIGNVEKFNGDPGSLYTFVSRIDY FT ILALYATGDERQQQIIFGHIERSISGEVMRCIGAYDMYTWQQLRRQLVLNYKPQTPNHV FT LLEEFRKTPFRGNVRAFLEEAESRRQTLTSKLELEQDLEEKTFYLKLIKSSIESLIEKL FT PTHIYLRINNHNIPDLRSLINLLQEKGMYEQINHTSTHVQKQNFSDKPQKSFNQNTNQS FT NNIRKYPTPFLHYNSPIPYQAPQIYQTPPTNNPLYRHPIPYHPNPNNVFQPSQQNNVFQ FT PSQQNNAFQPNQRTNFTSRPIFNTNRNNAFDQNRFGQQPQYQNQQSTQNSSSYVPNRPI FT KRLRPANSGQTGMSVDETLYQEDAFYQQCVPYDYFYYPTYDHSDYYPENQYQIDENNQN FT LQRTQQLQQINTDETNNDNQEPNVEQAENFQPQALENPNI" FT SO_feature CDS ; SO:0000316:2345..5518 FT /name="Dmel\17.6\pol" FT /db_xref="FLYBASE:FBgn0014453" FT /db_xref="SWISS-PROT:P04323" FT /db_xref="NCBI_PROTEIN:CAA25702.1" FT /translation="TGRKFSATSLGKPQYITIKYKENNLKCLIDTGSTVNMTSKNIFDL FT PIQNTSTFIHTSNGPLIVNKSIIIPSKILFPTTNEFLLHPFSENYDLLLGRKLLAEAKA FT TISYRDQEVTLYNNKYKLIEGIATHEQSHFQNVNMIPDTMLRQPNKISPILESDLYRLE FT HLNNEEKQRLCALLQKYHDIQYHEGDKLTFTNQTKHTINTKHNLPLYSKYSYPQAYEQE FT VESQIQDMLNQGIIRTSNSPYNSPIWVVPKKQDASGKQKFRIVIDYRKLNEITVGDRHP FT IPNMDEILGKLGRCNYFTTIDLAKGFHQIEMDPESVSKTAFSTKHGHYEYLRMPFGLKN FT APATFQRCMNDILRPLLNKHCLVYLDDIIVFSTSLDEHLQSLGLVFEKLAKANLKLQLD FT KCEFLKQETTFLGHVLTPDGIKPNPEKIEAIQKYPIPTKPKEIKAFLGLTGYYRKFIPN FT FADIAKPMTKCLKKNMKIDTTNPEYDSAFKKLKYLISEDPILKVPDFTKKFTLTTDASD FT VALGAVLSQDGHPLSYISRTLNEHEINYSTIEKELLAIVWATKTFRHYLLGRHFEISSD FT HQPLSWLYRMKDPNSKLTRWRVKLSEFDFDIKYIKGKENCVADALSRIKLEETYLSEQT FT QHSAEEDNSDLIFITERPLNTFNRQVIFSKGPPDIKVTKYFKKHITQIFYDIMTREKAE FT QYLIDHFCGKKSALYIESDADFEVIQAAHKLAINTKYTKILRSTILLKNITTYAEFKEL FT ILTAHEKLLHPGIQKTTKLFGETYYFPNSQLLIQNIINECSICNLAKTEHRNTDMPTKT FT TPKPEHCREKFMIDIYSSEGKHYVSCIDIYSKFATLEEIKTKDWIECKNALMRIFNQLG FT KPKLLKADRDGAFSSLALKRWLESEEVELQLNTTKTGVADIERLHKTINEKIRIIKTSD FT DEETKLSKMETVLNIYNHKTKHDTTGQTPAHIFLYAGQPILDTQQNKENKINKINNDRV FT EYEVDTRYRKGPLQKGKLENPFKPTKNVEQTDSDHYKITNRNRITHYYKTQFKKRKKNN FT QLSISQAPGT" FT SO_feature CDS ; SO:0000316:5488..6903 FT /name="17.6\env" FT /db_xref="FLYBASE:FBgn0027624" FT /db_xref="SWISS-PROT:P04283" FT /db_xref="NCBI_PROTEIN:CAA25703.1" FT /translation="SALNFTGTWHLITLLLMLITTVHGQQIEINNIDTNHGYLLFSDKP FT VQIPSSFEHHCLRINLTEIDTIADYFEQRLRTDYHAPQVKFLYNKMRRELAGIALRHRN FT KRGLINIVGSVFKYLFGTLDENDRVDIQRKLETNAHNSVNLHELNDAIQLINDGMQKIQ FT NYENNSNIINSLLYELMQFTEYIEDVEMGMQLSRLGLFNPKLLNYDKLENVNSQNILNI FT KTSTWINYNDNQLLIISHIPINFSLINTVKIIPYPDSNGYQLEYTDTQSYFERENKVYN FT NENKEINNECVTNIIKHLKPICNFESIHTDEIIKYIEPNTIVTWNLTQTSLKQNCQNSF FT NNIKIKGNKMIKVTQCKIEINSIILSENLFKPEIDLTPLYTPLNITKIKTVKHNDINEM FT ISQNNITLYIFMTTVIIILILLYLYLRYVSFNPFMMLYAKLKLRKNQNQNTAQQIEMED FT VPLPLLYPSIPAQV" XX CC Derived from X01472 (g8142) (Rel. 36, Last updated, Version 2). CC Takis Benos and Michael Ashburner, 20-Aug-1997. CC Any changes to original sequence record are annotated in an FT line. XX SQ Sequence 7439 BP; 2985 A; 1512 C; 1048 G; 1894 T; 0 other; AGTGACATAT TCACATACAA AACCACATAA CATAGAGTAA ACATATTGAA AAGCCGCATA 60 CGTAAACAAT AAGTGACCAC CATGCTAATG TGGATCAAAT AACAAAAATA TCCACTCTGC 120 ATTTTGACAC CCCCATACTG TATGCCATCT GCGCAGTATG CATTCTAATA AACAAATTCT 180 TTGACAGCGG CACTTAGCCA TTCTTGTAAA CAAATCTTAA AGTCTGCCTG CTCTCTCTGA 240 GGCTTCTCCT CCACTTAAGA ATCCAAGAGC AATGCTCTCC CAAAAACACT AACATATTCT 300 TTAAGCAAGC ACAGAGGCTT CTCCTCATTT TCACTTTCAT TTGATTTTCA GTCTTAAGCT 360 GAACGTTAAT CAATAAACAA CACAATCGAT ACCGAAATTT TGATTCGTTT TATTTTGGCA 420 AAACTCAATT TTCAGCGTTG GTCTTAGTTC ATATTCGGAA CGGTCCATTT AATAGACTCA 480 AAACTATTTA TTGCAACCAT TTATTTGCAA TTGGCGCAGT CGATGTGATC AGTGTTAAAG 540 TTCCTTGATG CGGTAACCAG ATTTGCCAAT TCCTGTGTTC TTTTTGTTCT CTGACAAAAG 600 TACCACGATA ACGGGCACCC ACGTGACGGT TAATATCGCT TTAAGTTTTT AATTAAACCT 660 CGACAATAAA GTGAAACCGA AAAATCACAA TTTGCCTAAA CAAACCTGAA TTTATTATCA 720 GGAAGACGCT ATTGAATTTG TGAGAGGCTG TAAATCCAAT TGGTTACCTC AAAGACCCAC 780 GAAAAAGCTA TAGTGCAACC CTTGCGAAAA TCAAAACCTA TCTTAAAAAA AAAAAAAAAA 840 TATAAATAAT AAATTAATAA GCGAAAATTA AAACGTATTA AAAGTAAGAA TAATAAATAA 900 ATAAGTGAAA ATTCTATATG ATAAAAATTA AAAATAAGAA TAATAAATAA AAAGACAACA 960 TTTTAAATTA AACAATATTA AAAAAATATA AAAATATTAA AAACTATATT AAAAAAAAAA 1020 AAAAAACAAA AAAACAAAAA AAAAAAAATA AATAAATAAT CCAAAAATCA AAAATGGCTC 1080 AAGAACCAGC AATTGTGCCA CCACTATCAG ACAGCAACAT GACCCAGGTT GCCTACCAGA 1140 TTGGCAATGT GGAGAAATTC AACGGTGATC CAGGCTCACT ATACACCTTT GTGAGTCGAA 1200 TTGATTACAT ACTGGCTCTT TATGCTACCG GAGATGAACG CCAACAGCAG ATCATATTTG 1260 GGCATATTGA ACGCAGCATC AGCGGAGAAG TTATGCGCTG CATTGGAGCC TATGACATGT 1320 ACACCTGGCA GCAGCTTAGA AGACAATTGG TACTCAACTA TAAACCCCAG ACCCCTAACC 1380 ACGTTCTTTT AGAAGAGTTT CGAAAGACCC CATTTCGAGG CAATGTACGA GCATTCCTGG 1440 AAGAAGCAGA AAGCCGCAGA CAAACACTTA CTAGTAAGCT TGAATTAGAG CAAGATCTTG 1500 AAGAAAAGAC TTTTTATTTG AAATTAATAA AATCCAGTAT AGAATCACTA ATTGAAAAAT 1560 TACCTACACA CATTTATTTA AGAATAAATA ACCACAACAT ACCAGATTTG CGATCACTTA 1620 TAAACCTTTT ACAAGAGAAG GGCATGTACG AACAAATAAA TCATACAAGT ACACATGTCC 1680 AAAAACAAAA TTTCTCTGAT AAGCCACAAA AGTCCTTTAA TCAAAATACT AATCAGTCTA 1740 ACAATATCAG AAAATATCCA ACACCTTTCC TACATTATAA TTCACCAATA CCATATCAAG 1800 CTCCACAAAT TTATCAAACA CCACCAACTA ATAACCCACT TTATCGTCAT CCAATACCCT 1860 ACCACCCTAA TCCAAACAAT GTTTTTCAAC CAAGCCAACA AAACAATGTT TTCCAACCAA 1920 GCCAACAAAA CAATGCTTTT CAACCAAATC AACGAACAAA CTTTACATCT CGACCAATTT 1980 TTAACACCAA TCGAAACAAT GCATTCGATC AGAATAGGTT CGGACAACAA CCCCAATATC 2040 AAAATCAACA ATCAACACAA AATTCAAGTT CCTATGTACC CAATCGACCA ATAAAACGAT 2100 TAAGACCAGC TAATAGTGGA CAGACTGGGA TGAGTGTTGA CGAAACATTA TATCAAGAGG 2160 ACGCTTTTTA TCAGCAGTGT GTTCCATATG ACTATTTTTA TTATCCAACT TACGACCATT 2220 CAGACTATTA TCCAGAAAAT CAATATCAAA TTGACGAAAA CAACCAAAAT TTACAAAGAA 2280 CACAACAGTT ACAGCAGATT AATACAGACG AGACAAACAA TGACAACCAA GAACCCAATG 2340 TTGAACAGGC CGAAAATTTT CAGCCACAAG CCTTGGAAAA CCCCAATATA TAACAATTAA 2400 ATACAAAGAA AATAATTTGA AATGCCTTAT TGATACCGGA TCAACAGTTA ACATGACATC 2460 TAAAAATATA TTTGATTTAC CAATCCAGAA TACTAGTACT TTTATTCATA CCAGCAATGG 2520 ACCGCTCATT GTCAACAAAA GTATAATCAT ACCTTCAAAG ATTTTGTTCC CAACAACAAA 2580 TGAATTTTTA TTGCACCCTT TCTCTGAGAA TTACGATCTT TTATTAGGAA GAAAACTTTT 2640 AGCAGAAGCA AAAGCAACAA TAAGTTACCG CGATCAAGAG GTAACTCTTT ACAACAACAA 2700 ATACAAATTA ATAGAAGGAA TAGCAACACA TGAACAGAGT CATTTTCAAA ATGTAAATAT 2760 GATACCTGAC ACCATGCTCA GACAGCCAAA TAAAATTTCA CCCATTTTAG AATCAGACCT 2820 ATACAGATTG GAACATTTAA ATAACGAAGA AAAACAAAGA TTGTGCGCAC TCCTGCAGAA 2880 ATACCATGAC ATACAGTACC ATGAAGGTGA TAAGTTGACA TTTACTAATC AAACCAAACA 2940 TACTATCAAT ACAAAGCACA ATCTACCACT TTACTCTAAA TACAGTTACC CACAGGCTTA 3000 TGAACAGGAG GTCGAAAGCC AAATACAAGA TATGCTAAAT CAAGGTATTA TACGTACCAG 3060 TAATTCACCT TACAATAGCC CCATCTGGGT GGTTCCAAAG AAACAAGATG CATCAGGCAA 3120 ACAGAAATTT AGAATTGTAA TAGACTACCG AAAATTAAAT GAAATAACAG TAGGAGACAG 3180 ACACCCAATC CCAAACATGG ACGAAATCTT GGGAAAATTG GGCAGATGTA ATTACTTCAC 3240 AACTATAGAC TTGGCAAAGG GTTTCCACCA GATCGAAATG GATCCAGAAT CAGTTTCAAA 3300 GACAGCCTTT TCTACCAAGC ACGGTCATTA TGAATATTTG CGCATGCCAT TCGGATTAAA 3360 AAACGCGCCA GCCACCTTTC AACGGTGCAT GAATGATATT TTAAGACCAC TCTTAAACAA 3420 ACACTGTCTT GTGTATTTGG ACGACATAAT TGTATTCTCG ACATCCCTTG ATGAACACCT 3480 GCAATCGCTC GGACTAGTTT TCGAAAAATT AGCAAAAGCC AACCTTAAAT TACAACTTGA 3540 CAAATGTGAG TTTCTCAAGC AAGAAACCAC ATTTTTAGGA CATGTTCTAA CACCAGATGG 3600 AATAAAACCA AACCCTGAAA AAATTGAAGC CATTCAAAAA TATCCAATTC CCACTAAACC 3660 AAAAGAAATA AAAGCTTTTC TTGGACTGAC AGGATATTAT CGTAAATTTA TTCCAAACTT 3720 TGCAGACATA GCCAAACCCA TGACTAAGTG TTTAAAAAAG AACATGAAAA TTGACACTAC 3780 CAACCCAGAA TATGACTCTG CATTTAAAAA ATTAAAATAT CTAATATCAG AAGACCCAAT 3840 TCTTAAAGTA CCCGACTTTA CAAAGAAATT CACTTTAACC ACAGACGCAA GTGATGTCGC 3900 TTTGGGGGCA GTACTGTCAC AAGATGGACA CCCACTTAGC TACATTAGCC GAACACTTAA 3960 TGAACACGAA ATAAATTACA GCACAATTGA AAAAGAACTC TTAGCAATTG TATGGGCGAC 4020 AAAGACTTTT CGACACTACC TACTTGGAAG ACACTTTGAA ATATCCAGTG ACCATCAACC 4080 ATTGAGCTGG TTGTACCGTA TGAAAGACCC AAATTCAAAA CTGACCCGAT GGAGAGTAAA 4140 ATTATCCGAA TTCGATTTTG ATATAAAATA TATAAAAGGA AAAGAAAATT GCGTGGCGGA 4200 TGCTCTGTCC AGAATAAAAC TTGAGGAGAC ATATTTGAGC GAACAAACCC AACATAGTGC 4260 AGAAGAGGAC AATAGTGATT TAATTTTTAT TACAGAAAGA CCTCTAAATA CATTTAACAG 4320 ACAAGTTATA TTTTCAAAAG GACCACCAGA CATTAAAGTT ACGAAATATT TCAAAAAACA 4380 CATCACCCAA ATATTTTACG ACATTATGAC CAGGGAAAAA GCCGAACAAT ATTTGATAGA 4440 CCATTTTTGT GGTAAGAAAA GTGCGTTGTA TATTGAGAGT GACGCTGATT TCGAAGTCAT 4500 TCAAGCCGCA CATAAATTAG CCATAAACAC CAAATATACA AAAATCCTGC GTAGCACGAT 4560 TTTGTTAAAA AACATAACCA CTTATGCGGA ATTTAAGGAA TTGATCTTGA CTGCTCATGA 4620 AAAACTTCTA CACCCAGGCA TACAGAAAAC TACTAAACTT TTCGGAGAAA CTTACTATTT 4680 CCCTAATAGC CAGCTACTTA TTCAGAATAT AATAAATGAG TGCAGTATTT GCAATCTGGC 4740 AAAAACAGAG CACCGAAATA CAGACATGCC AACGAAAACC ACACCCAAAC CAGAACATTG 4800 CCGCGAAAAA TTCATGATAG ACATTTACTC ATCCGAAGGC AAACATTACG TTAGTTGCAT 4860 AGACATTTAT TCGAAATTTG CCACATTAGA AGAAATAAAA ACAAAAGACT GGATAGAATG 4920 CAAAAACGCG CTTATGCGCA TATTCAACCA GCTTGGCAAG CCAAAGTTAC TAAAGGCGGA 4980 CAGAGACGGC GCATTTTCCA GTTTAGCCCT CAAGAGATGG CTGGAGAGTG AGGAAGTCGA 5040 ATTGCAGCTT AACACAACAA AAACTGGTGT GGCGGACATA GAAAGACTAC ATAAAACAAT 5100 TAATGAAAAG ATTCGCATAA TCAAAACATC CGATGACGAA GAAACCAAAT TGAGCAAAAT 5160 GGAAACAGTA CTTAACATAT ACAATCATAA AACCAAACAC GACACCACTG GACAGACCCC 5220 TGCACACATA TTTCTCTACG CTGGACAACC AATATTAGAT ACCCAACAAA ACAAAGAAAA 5280 CAAAATAAAC AAAATAAATA ATGACAGAGT GGAGTACGAA GTCGACACAA GATACAGAAA 5340 AGGTCCACTA CAGAAAGGCA AATTAGAAAA TCCTTTTAAG CCAACAAAAA ATGTGGAGCA 5400 GACTGACTCT GATCATTATA AAATTACTAA TAGAAATAGA ATTACTCACT ACTACAAAAC 5460 ACAATTCAAA AAACGAAAGA AAAATAATCA GCTCTCAATT TCACAGGCAC CTGGCACTTG 5520 ATAACATTGC TGCTGATGCT GATCACAACA GTTCATGGAC AACAAATTGA AATTAATAAT 5580 ATTGACACAA ACCACGGATA TCTCCTTTTT TCTGATAAAC CAGTCCAGAT ACCATCATCC 5640 TTTGAACATC ATTGCTTGAG AATCAATTTA ACTGAAATAG ACACCATAGC TGATTATTTT 5700 GAGCAAAGAC TACGTACCGA CTACCATGCA CCCCAGGTCA AATTTTTATA CAACAAAATG 5760 AGAAGAGAAC TAGCTGGAAT AGCCTTGCGA CATAGAAATA AACGGGGACT TATTAACATT 5820 GTAGGTTCAG TTTTTAAATA CCTATTTGGC ACACTTGACG AAAATGATCG AGTGGATATA 5880 CAGAGGAAAC TTGAAACAAA CGCCCATAAC TCGGTAAATT TACATGAACT CAATGACGCT 5940 ATTCAATTAA TAAATGACGG AATGCAAAAG ATACAGAATT ATGAAAACAA CAGCAACATC 6000 ATTAACAGTC TTTTATATGA ACTCATGCAG TTTACAGAAT ACATAGAAGA TGTGGAAATG 6060 GGAATGCAGC TTTCCAGACT CGGTCTATTT AATCCCAAAC TACTAAACTA CGATAAACTT 6120 GAGAATGTAA ACAGCCAAAA TATTTTAAAC ATTAAAACAT CCACTTGGAT TAATTACAAT 6180 GATAACCAAT TATTAATCAT ATCTCACATA CCTATTAACT TTTCATTAAT AAATACAGTA 6240 AAAATAATCC CTTACCCAGA CTCGAACGGC TATCAGCTAG AATACACAGA CACACAATCA 6300 TATTTTGAAA GAGAAAATAA AGTTTACAAT AACGAAAATA AAGAAATAAA CAATGAGTGT 6360 GTCACCAACA TTATTAAACA TTTAAAACCA ATTTGTAATT TTGAGTCAAT CCACACAGAT 6420 GAAATAATAA AATACATAGA ACCAAACACA ATTGTAACCT GGAATTTAAC CCAAACAAGT 6480 CTCAAACAAA ATTGTCAAAA TTCATTTAAT AATATAAAAA TAAAAGGAAA CAAAATGATA 6540 AAAGTAACCC AATGTAAAAT AGAAATCAAT AGCATAATTC TAAGTGAAAA TCTCTTTAAA 6600 CCAGAAATAG ATTTGACACC ATTATACACA CCACTTAACA TAACAAAAAT AAAAACTGTT 6660 AAACACAACG ACATTAATGA AATGATTTCA CAAAACAATA TTACACTTTA CATATTTATG 6720 ACTACTGTCA TCATTATACT TATTTTATTG TACTTATATT TAAGATACGT ATCATTTAAC 6780 CCATTCATGA TGCTGTATGC AAAACTAAAA TTAAGAAAAA ATCAAAATCA AAACACAGCA 6840 CAACAAATAG AAATGGAAGA CGTTCCATTA CCCCTACTAT ATCCATCAAT CCCAGCCCAA 6900 GTATAGGCTT CTCTTTAAGG GAAGGGAAGT GACATATTCA CATACAAAAC CACATAACGT 6960 AGAGTAAACA TATTGAAAAG CCGCATACGT CAACAATAAG TGACCACCAT GCTAATGTGG 7020 ATCAAATAAC AAAAATATCC ACTCTGCATT TTGACACCCC CATACTGTAT GCCATCTGCG 7080 CAGTATGCAT TCTAATAAAC AAATTCTTTG ACAGCGGCAC TTAGCCATTC TTGTAAACAA 7140 ATCTTAAAGT CTGCCTGCTC TCTCTGAGGC TTCTCCTCCA CTTAAGAATC CAAGAGCAAT 7200 GCTCTCCCAA AAACACTAAC ATATTCTTTA AGCAAGCACA GAGGCTTCTC CTCATTTTCA 7260 CTTTCATTTG ATTTTCAGTC TTAAGCTGAA CGTTAATCAA TAAACAACAC AATCGATACC 7320 GAAATTTTGA TTCGTTTTAT TTTGGCAAAA CTCAATTTTC AGCGTTGGTC TTAGTTCATA 7380 TTCGGAACGG TCCATTTAAT AGACTCAAAA CTATTTATTG CAACCATTTA TTTGCAATT 7439 // ID DMTN1731 standard; DNA; INV; 4648 BP. XX AC X07656; XX DR FLYBASE; FBte0000003; Dmel\1731. XX FT source X07656:1..4648 FT SO_feature five_prime_LTR ; SO:0000425:1..336 FT SO_feature three_prime_LTR ; SO:0000426:4313..4648 FT SO_feature TATA_box ; SO:0000174:110..116 FT SO_feature primer_binding_site ; SO:0005850:342..352 FT SO_feature CDS ; SO:0000316:431..1252 FT /name="Dmel\1731\gag" FT /db_xref="FLYBASE:FBgn0020768" FT /db_xref="REMTREMBL:CAA30502" FT /db_xref="NCBI_PROTEIN:CAA30502.1" FT /translation="MSNLYQIDKLEDGSYETWSIQMRSVLVHACLWKVVSGESVKPEVD FT TGGAWQSQDEKALATIILSVKSSQLGYVKGCLTAAEAWKVLQDVHQPKGPLRTVMLYKK FT LLSKRLLEGQSISSHIKEFKEIFDALDAVEIGITEKLRSVVLLSSLPESFENFVVAIET FT RDDVPLFDALCIKLIEEDTRRGGAEQQREKQTESAKAFTAVHKPQAPAREARPSAKKRK FT DVVCYNCGERRHFKANCRREKVNKESATQEQCSLLNALDSGGFWQNTVVSR" FT SO_feature CDS ; SO:0000316:1203..4151 FT /name="Dmel\1731\RTase" FT /db_xref="FLYBASE:FBgn0012032" FT /db_xref="REMTREMBL:CAA30503" FT /db_xref="NCBI_PROTEIN:CAA30503.1" FT /translation="MRWIVVVFGKTQWCLDSGATSHMCCDRSVFTEFEEHTEKISLAGN FT GFLLAKGIGTVKLKTDLCTLVLNNVLFVPDLNGNFMSVSRAAQYKCFVNFGPHYADVIQ FT EGERILRVMRAGNLYMFQGKHNSCFAAVDADGSLWHKRNGHLNTSSLQEMVRKKMVYGV FT EKVVFKPDAVCKTCMLAKIHVQPFPKTTRSRAEELLDMIHSDLCGPFSTPSLAGSKYFL FT TFIDDKSRRIFVYFLRKKDEVFTKFVEFKKLVERQTGRKIKCIRSDNGGEFVNNVFDDY FT LKAHGIARQLTIPHTPQQNGVAERANRTLVEMARCMLLQSELGEALWAEAINTAVYLRN FT RSTSRALQSKTPMEEWTGKIPAVSHLRVFGAIAVALDKGVHKGKFESKGKEYRMIGYSI FT AAKGYRLFDKEKRCVIEKQDVLFDESGSLVNHGNTIEFQFPATDDPEPQSDSNAREGDD FT TEPVGSSDDYESAAEAEEAEVHVGPGRPKIVRTGRPGRPKKQYNVLGVLMASDVEIPKS FT YEEAINSQYSAKWEEAMGLEYKALLANETWKLADLPRNRRCVACKWVYSLKRDVSGRIE FT RFKARLVAKGCSQKFGVDYFETFSPVCRLESVRLILALAAEMQLYLHHMDVCTAYLNSE FT LKDTVYMKQPQGFTDAANPDQVLLLRKAIYGLKQSGREWNSKLDGVLKDLGFKACNHEP FT CLYQQSGQGNLMLILVYVDDLILACQSREDMEDLKAKISESFECTDKGPLHLFLGMEVQ FT RDGDLGEITLGHSQYIKELLRDYGSENCRPATTPLDAGHQVLCAGEQCQKVDAGQYQST FT IGELMWLGLTTRPDMLHSVAKLAQRNQDPHSEHMVAVKHILRYLASTVDVKLHYQKCGQ FT AFTGFVDADWGGDRLDRKSYTGYVFFLSGGPVSWRSEKQQSVALSSTEAEYMALTTACK FT EAIALRRLIVEIVCGDLKTPTVMHGDNLKCAAQLAKNPVHHSRTKHIDIRYH" XX CC Derived from X07656 (g8700) (Rel. 36, Last updated, Version 6). CC Takis Benos and Michael Ashburner, 20-Aug-1997. CC Any changes to original sequence record are annotated in an FT line. XX SQ Sequence 4648 BP; 1316 A; 880 C; 1268 G; 1184 T; 0 other; TGTTGAATAT AGGCAATGCC CACATGTGTG TTGAATATAG GCAATTTCCA CATGTGCATA 60 TGTAATTTTG TATGAGAACA TACATACATA CACATGAACT GTATGTATGT ATATATATTA 120 GCAAATAAGC AGCCGCATGA AGGTGGCATT TTTATGTGTA TCAGTTTCAG TTTCAAATAA 180 AACTTCTTCG TGTTCGGACA CGCGGCTCAA GACTTTTTAT TTCGCGTTTA CTCTTTCAGC 240 CTTTGCTCTC AATTCGCTGA GTTTGGGTGA AGATTAGGAT CTTCCCATTA TGATTGTCAG 300 TGTTCCACAC TTGGAGCACC TTTTCAATAA ACAACAGGTT AATGGGCCCA GCGCCCTAGG 360 AGCTGCCTAA AGGAGAAACG TGTAGTGAAA CTCAGGAGTT AGATTTTGGA GTCTACTCAA 420 GATTGCCGGA ATGAGTAACC TGTATCAGAT CGATAAGCTG GAGGATGGAT CCTATGAAAC 480 GTGGAGCATC CAGATGCGTT CAGTGTTGGT GCACGCATGT TTGTGGAAGG TGGTTTCAGG 540 AGAGTCCGTG AAACCTGAGG TTGATACTGG AGGTGCTTGG CAATCCCAAG ATGAAAAAGC 600 ATTGGCCACG ATCATCTTGA GTGTGAAGTC TTCGCAACTT GGTTATGTAA AAGGGTGTCT 660 CACTGCGGCT GAGGCATGGA AAGTTTTACA GGATGTCCAC CAGCCGAAAG GGCCGTTACG 720 AACGGTCATG CTGTATAAGA AGTTGCTGAG CAAACGTCTG TTGGAAGGGC AGAGTATATC 780 GTCACATATT AAAGAATTTA AGGAAATCTT TGATGCCCTT GATGCGGTGG AAATTGGTAT 840 CACCGAGAAA TTGCGCAGTG TTGTTTTGCT GTCGAGCCTT CCAGAGAGTT TCGAGAATTT 900 CGTTGTCGCC ATTGAGACGC GCGACGACGT GCCGCTTTTC GATGCTCTAT GTATAAAGCT 960 GATCGAGGAA GACACGAGAA GGGGAGGAGC GGAGCAGCAG AGAGAAAAAC AAACGGAGAG 1020 CGCAAAGGCA TTTACTGCAG TACATAAGCC ACAGGCGCCG GCGAGAGAAG CTCGGCCGAG 1080 CGCAAAGAAG AGGAAAGACG TAGTTTGTTA TAACTGTGGA GAGCGTAGGC ATTTTAAAGC 1140 GAACTGTCGT CGCGAGAAAG TAAACAAAGA GAGCGCGACA CAAGAACAAT GCAGTTTGTT 1200 AAATGCGCTG GATAGTGGTG GTTTTTGGCA AAACACAGTG GTGTCTCGAT AGCGGGGCTA 1260 CCAGTCACAT GTGCTGTGAC AGAAGTGTTT TTACTGAGTT TGAAGAGCAC ACTGAAAAAA 1320 TTAGTCTTGC TGGAAATGGA TTCCTACTAG CAAAGGGCAT AGGAACAGTG AAGCTGAAGA 1380 CTGATTTATG TACTCTGGTA TTGAATAACG TACTCTTCGT CCCAGATTTG AACGGCAACT 1440 TTATGTCAGT CAGCCGTGCA GCTCAGTATA AATGTTTTGT CAATTTTGGA CCACATTACG 1500 CTGACGTCAT TCAGGAAGGC GAGCGAATAC TGCGTGTAAT GAGAGCTGGT AATTTATATA 1560 TGTTTCAAGG GAAACATAAC AGTTGTTTTG CGGCCGTTGA TGCTGATGGT TCACTATGGC 1620 ATAAAAGGAA TGGCCATTTG AATACAAGCA GCCTACAGGA GATGGTGAGG AAGAAGATGG 1680 TGTACGGTGT TGAAAAGGTC GTTTTCAAAC CAGACGCAGT ATGCAAGACG TGCATGCTGG 1740 CAAAAATCCA TGTGCAACCA TTTCCGAAGA CAACGAGGAG CAGAGCTGAG GAGCTGTTGG 1800 ATATGATCCA TTCAGACCTG TGCGGGCCAT TTAGCACACC GTCACTTGCT GGATCAAAGT 1860 ACTTTCTCAC TTTCATAGAC GACAAGTCCA GGCGGATTTT TGTATATTTC TTGCGGAAGA 1920 AGGACGAAGT CTTCACTAAG TTTGTCGAGT TTAAGAAACT GGTCGAGCGA CAAACAGGTA 1980 GAAAGATAAA ATGTATCCGG AGCGATAATG GTGGTGAGTT CGTCAATAAT GTTTTTGATG 2040 ACTATTTAAA GGCACATGGG ATCGCTAGAC AGCTGACTAT TCCACACACT CCCCAACAAA 2100 ATGGAGTTGC AGAACGAGCC AACCGCACGC TAGTAGAAAT GGCTAGGTGC ATGTTGCTGC 2160 AATCGGAGTT GGGTGAGGCT CTATGGGCTG AGGCGATAAA CACTGCGGTG TATCTGAGGA 2220 ACCGATCAAC GAGCAGAGCA TTACAAAGCA AAACCCCTAT GGAAGAGTGG ACCGGAAAAA 2280 TACCAGCAGT GAGCCACTTG AGGGTTTTTG GTGCCATAGC AGTGGCATTG GACAAAGGAG 2340 TCCATAAAGG CAAATTCGAA TCCAAAGGAA AGGAATATCG TATGATTGGA TATTCAATAG 2400 CTGCTAAGGG GTACCGTCTG TTTGACAAAG AGAAGCGGTG TGTGATCGAG AAGCAAGATG 2460 TCCTTTTTGA TGAGTCTGGT AGTTTGGTAA ATCATGGAAA TACCATTGAG TTCCAGTTTC 2520 CCGCAACTGA TGACCCGGAG CCGCAGAGTG ATTCGAATGC ACGGGAAGGT GACGATACAG 2580 AACCCGTGGG CAGCAGCGAC GACTATGAGA GTGCAGCTGA GGCAGAAGAA GCTGAAGTAC 2640 ATGTGGGGCC TGGACGGCCA AAGATTGTTC GGACGGGCAG ACCAGGGCGC CCGAAGAAGC 2700 AATACAATGT ACTTGGCGTG TTGATGGCTA GCGACGTCGA AATTCCCAAG TCCTATGAGG 2760 AGGCCATCAA TTCGCAGTAT TCTGCAAAGT GGGAAGAGGC AATGGGCCTG GAGTACAAGG 2820 CGCTACTTGC AAATGAGACA TGGAAGCTGG CTGACTTACC AAGAAATCGC CGGTGTGTGG 2880 CTTGCAAGTG GGTGTATTCC CTGAAACGAG ACGTCTCTGG TAGAATTGAG CGCTTCAAGG 2940 CACGACTAGT AGCAAAGGGG TGTTCGCAGA AGTTCGGAGT GGACTACTTC GAGACTTTTT 3000 CACCCGTGTG CAGGCTCGAG AGTGTGAGGC TCATTTTGGC ATTGGCAGCA GAGATGCAAT 3060 TGTACTTGCA TCACATGGAC GTATGCACGG CGTACTTAAA TAGCGAGCTA AAGGATACTG 3120 TGTACATGAA GCAGCCCCAA GGGTTCACAG ATGCTGCTAA TCCCGACCAG GTGTTATTGC 3180 TGAGGAAGGC AATATACGGC TTGAAGCAGT CAGGCAGAGA GTGGAACTCC AAGCTCGACG 3240 GTGTTCTAAA AGACTTGGGA TTTAAGGCCT GTAATCATGA ACCATGTCTT TATCAGCAAA 3300 GTGGTCAAGG TAATCTGATG CTCATCTTAG TATATGTTGA TGATTTAATT CTAGCGTGCC 3360 AGTCAAGAGA AGATATGGAG GATCTGAAAG CCAAGATTTC AGAGTCTTTC GAGTGCACGG 3420 ACAAGGGTCC ACTGCATTTG TTCTTAGGCA TGGAGGTGCA ACGAGATGGC GACCTTGGAG 3480 AAATCACTTT GGGCCATTCG CAATATATCA AGGAACTATT GCGGGATTAT GGCAGCGAGA 3540 ACTGTAGACC AGCGACGACA CCTTTGGATG CAGGGCATCA AGTTTTGTGC GCGGGTGAGC 3600 AGTGCCAGAA GGTCGACGCA GGGCAGTATC AGTCTACAAT TGGTGAGCTA ATGTGGCTTG 3660 GGCTTACTAC CAGACCAGAC ATGCTACATT CGGTGGCGAA GTTGGCTCAG AGGAATCAGG 3720 ACCCGCATTC TGAGCACATG GTGGCTGTGA AGCACATCCT CCGGTACTTG GCGTCAACTG 3780 TGGACGTCAA GCTGCATTAT CAAAAGTGCG GTCAGGCATT TACCGGCTTT GTGGATGCAG 3840 ATTGGGGAGG CGACCGTTTG GACCGAAAGT CATACACAGG GTATGTGTTT TTCCTGTCTG 3900 GCGGACCAGT ATCATGGAGG TCCGAGAAGC AGCAGAGCGT GGCGTTGAGC AGTACTGAAG 3960 CCGAGTATAT GGCTCTGACC ACGGCTTGCA AGGAAGCTAT AGCTTTACGA AGGCTAATAG 4020 TGGAGATCGT ATGCGGTGAT CTGAAGACCC CGACGGTTAT GCATGGCGAC AACCTGAAGT 4080 GCGCAGCACA GTTAGCGAAG AACCCGGTTC ATCACTCTAG GACGAAGCAC ATCGACATTC 4140 GATATCATTA GAGAAGTCAT GAAAGAGGGT CACGTTGTGT TAGAGTACAC TTCTACGAAT 4200 GAGATGATAG CAGACATTAT GACAAAGAAT CTTTCAAAGG GAAAGCATAA TGGGTTTATG 4260 AAAATGTTAA ATTTGTTTTA ATTTTTGTAA ACATGTTGGC ATTGAGGAAG GCTGTTGAAT 4320 ATAGGCAATG CCCACATGTG TGTTGAATAT AGGCAATTTC CACATGTGCA TATGTAATTT 4380 TGTATGAGAA CATACATACA TACACATGAA CTATATGTAT GTATATATAT TAGTAAATAA 4440 GCAGCCGCAT GAAGCTGGCA TTTTTATGTG TATCAGTTTC AGTTTCAAAT AAAACTTCTT 4500 CGTGTTCGGA CGCTCGGCTC AAGACTTTTT ATTTCGCGTT TACTCATTCG GCCTTTGCTC 4560 TCAATGCGCT GAGTTTGGGT GAAGATTAGG ATCTTCCCAT TATGGTTGTC AGTGTTCCAC 4620 ACTGGGAGCA CCTTTTCAAC AAACCACA 4648 // ID DMIS297 standard; DNA; INV; 6995 BP. XX AC X03431; XX DR FLYBASE; FBte0000675; Dmel\297. XX FT source X03431:1..6995 FT SO_feature five_prime_LTR ; SO:0000425:1..414 FT SO_feature three_prime_LTR ; SO:0000426:6582..6995 FT SO_feature TATA_box ; SO:0000174:276..282 FT SO_feature TATA_box ; SO:0000174:6857..6863 FT SO_feature polyA_signal_sequence ; SO:0000551:304..309 FT SO_feature polyA_signal_sequence ; SO:0000551:6885..6890 FT SO_feature primer_binding_site ; SO:0005850:414..431 FT SO_feature RR_tract ; SO:0000435:6571..6581 FT SO_feature CDS ; SO:0000316:803..2047 FT SO_feature start_codon ; SO:0000318:1..3 FT /name="Dmel\297\gag" FT /db_xref="FLYBASE:FBgn0044338" FT /db_xref="SWISS-PROT:P20828" FT /db_xref="NCBI_PROTEIN:CAA27159.1" FT /translation="MSQPIIALSDINLAEARRQLKDIMPFKGDPETLHTFISRVDYVIS FT LYQTNDVRQQRILLGAIERNLDGQITRSLGLPNVEDWPTLKARLIAEFKIQTPNYKLLE FT NFRETPYRGSLRAFCEEAERRRQLLISKLHLEGNQSDFLIYIQGIKESIKILIRKLPIQ FT LFTILAHHDITDLRSLITIAQNEGIYEEHINFEFYEKPEYRNKNSNSNQNSKTQKFNTN FT VQTQNRPSYSQYSQPFQPNFNQYIQPFRPSYTQQITNNPPMWHAPNYFRPNQYINPQPI FT IQKNHFQQYPNKAQFPQTTHFRGNTYPRLQQPSTYKNTNFPITKRLRPSDSEQTKMSID FT EIRFQDAHEFEQVQPNYYEQQYFNQNQYNPYQNHSFINEGQQQVQFVQINNKQNQNNSE FT LNENFRLTVPENTNT" FT SO_feature CDS ; SO:0000316:<1999..5178 FT /name="Dmel\297\pol" FT /db_xref="FLYBASE:FBgn0027622" FT /db_xref="SWISS-PROT:P20825" FT /db_xref="NCBI_PROTEIN:CAB57796.1" FT /translation="TKRKFSVNSSGKYEYIKIVYKGRSYKCLLDTGSTINMINENIFCL FT PIQNSRCEVLTSNGPITLNDLIMLPRNSIFKKTEPFYVHRFSNNYDMLIGRKLLKNAQS FT VINYKNDTVTLFDQTYKLITSESERNQNLYIQRTPESIASSDQESIKKLDFSQFRLDHL FT NQEETFKLKGLLNKFRNLEYKEGEKLTFTNTIKHVLNTTHNSPIYSKQYPLAQTHEIEV FT ENQVQEMLNQGLIRESNSPYNSPTWVVPKKPDASGANKYRVVIDYRKLNEITIPDRYPI FT PNMDEILGKLGKCQYFTTIDLAKGFHQIEMDEESISKTAFSTKSGHYEYLRMPFGLRNA FT PATFQRCMNNILRPLLNKHCLVYLDDIIIFSTSLTEHLNSIQLVFTKLADANLKLQLDK FT CEFLKKEANFLGHIVTPDGIKPNPIKVKAIVSYPIPTKDKEIRAFLGLTGYYRKFIPNY FT ADIAKPMTSCLKKRTKIDTQKLEYIEAFEKLKALIIRDPILQLPDFEKKFVLTTDASNL FT ALGAVLSQNGHPISFISRTLNDHELNYSAIEKELLAIVWATKTFRHYLLGRQFLIASDH FT QPLRWLHNLKEPGAKLERWRVRLSEYQFKIDYIKGKENSVADALSRIKIEENHHSEATQ FT HSAEEDNSNLIHLTEKPINYFKKQIIFIKSDKNKVEHSKIFGNSITTIQYDVMTLEKAK FT QILLDHFIHRNITIYIESDVDFEIVQRAHIEIVNTTYTKVIRSLFLLKNVGSYAEFKEI FT ILQSHEKLLHPGIQKMTKLFKENHFFPNSQLLIQNIINECNICNLAKTEHRNTKMPLKI FT TPNPEHCREKFVVDIYSSEGKHYISCIDIYSKFATLEQIKTKDWIECRNALMRIFNQLG FT KPKLLKADRDGAFSSLALKRWLEEEEVELQLNTAKNGVADVERLHKTINEKIRIINSSD FT DEEVKLSKIETILYTYNQKIKHDTTGQRPAQIFLYAGHPILDTQKIKEKKIEKINEDRR FT EFNIDTNYRKGPLQKGKLENPFKPTKNVEQTDPDHYKITNRNRVTHYYKTQFKKQKKNN FT KLSISQAPGTR" FT SO_feature CDS ; SO:0000316:5145..6560 FT SO_feature start_codon ; SO:0000318:1..3 FT /name="297\env" FT /db_xref="FLYBASE:FBgn0027623" FT /db_xref="SWISS-PROT:P20829" FT /db_xref="NCBI_PROTEIN:CAB57797.1" FT /translation="TLNFTGTWYPITLLFILITAVHGQQIQINNIDTNHGYLLFSDKPV FT QIPSSFEHHSLKINLTEIDIVVDYFEQRLRTDYHAPQINFLYNKIKRELARITLKHRNK FT RGFINIVGSGFKYLFGTLDENDRVEIQKKLEINVHNSVKLHELNDAIRLINDGMQKIQN FT YENNHTIIDSLLFELMQFTEYIEDLEMAMQLSRLGLFNPKLLNYDKLENVNSQNILNIK FT TSTWINYNDNQVLIISHIPIYLSLISTIKIIPYPDSNGYQLDYTDTQSYFEKENKVYNT FT ENKEVKNECVTNIIKHLNPICNFKPVHTNEIIKYIEPNTIVTWNLTQTILNQNCQNSIN FT KIKIEGNKMIRVTQCKIEINNINFSETLLEPEIDLTPLYTPLNITKIKIVKHNDIIEMI FT SENNITLYIQMIIVIIALILLYSYLRYVSFKPFMMLYAKLKIRKNQNQNTPQQTEIEEI FT PFPTLYPSIPAQV" XX CC Derived from X03431 (g8146) (Rel. 36, Last updated, Version 2). CC Takis Benos and Michael Ashburner, 20-Aug-1997. CC Any changes to original sequence record are annotated in an FT line. XX SQ Sequence 6995 BP; 2811 A; 1356 C; 972 G; 1856 T; 0 other; AGTGACGTAT TTGGGTGGTC CAAACCAGCC ACTTCCATTA TTTCAAAGAA ATCAGTAATG 60 CACTCTAGTA ATTTTCCATA ACTGTATCCC AGCTGCGCAG ACTCGTTTAT CTTTTGCAGC 120 GCAGCGTTCT TTGTAAACAT CCTAAAGACC TGCCTAAGCA GATTTGACTG CCCTCTTTCA 180 ACGCTACCTA ATCTTAAGAA CCCAAGAGCG AGGCTCTCCC GAAATACAAA TATTGTTCAA 240 ATACTGAGGC TTCTCCTCAA TCCAATTTGC ATTTGATTTT TAGTCTTAAG CTGAGATCCA 300 AAGAATAAAG TCGTGAAACT ATTTCTCCTA AAAACTATTT TTTATTTCTT GGCGTTGTCC 360 TTAGTCAACT GACGGGACAT TAGTTCGACT CATAAATAAA ACAACAATTT TACTGGCGCA 420 GTCGGTAGGA TACAAAAGTA TCCGAAAAAA AAGAACCTTC GAATGGAAAA TAAGTTAAAT 480 TTTATAGTCC TGTGCTCGAA ACATCTCCCA AAATAAATTC GTGAAAACTC TTCAACTTCA 540 ATTATAATTC CAATTCGGTT ATCCAATAAT AAGTGGAAGT GAAATACGAA ACAAAAATAT 600 TAAGTCCAAA GGCAACTAAG TTTTAAAACC AACATATAAA AATAAAAAAT TAAAACAATA 660 TAGAATTTTA ATAATACAAC ACAAAAATTT ACAAAACAAA AAAACAAACA AGTGAAACTA 720 GAAAGCTTAA AAATAATAAT AACATTGAAT CCGAAACAAA ACAAAAAAAT AAAACACAAA 780 AGTTAAAAAT TTTACAATAA AAATGTCACA ACCAATTATT GCGCTGAGCG ACATAAACCT 840 TGCCGAAGCC CGTCGGCAGC TTAAAGACAT TATGCCATTC AAGGGTGATC CAGAAACCCT 900 TCACACCTTT ATCAGCAGAG TGGATTACGT AATTTCGCTC TACCAAACAA ATGATGTCCG 960 ACAACAGAGG ATTCTACTGG GAGCCATCGA AAGGAACTTG GACGGACAAA TTACACGATC 1020 TTTGGGACTT CCGAACGTCG AAGATTGGCC TACCCTTAAA GCAAGACTCA TCGCGGAATT 1080 TAAAATTCAA ACACCAAACT ACAAACTTCT GGAGAACTTC AGGGAGACAC CATACAGAGG 1140 AAGCCTAAGA GCATTCTGCG AAGAAGCGGA GAGACGACGT CAATTACTAA TTTCGAAACT 1200 ACACCTGGAA GGTAACCAAT CGGATTTTCT TATTTATATT CAGGGTATTA AAGAATCTAT 1260 TAAGATACTG ATAAGGAAAC TACCAATACA ATTATTCACT ATTTTAGCCC ATCACGATAT 1320 TACAGACTTA AGATCCTTAA TTACCATTGC ACAAAATGAG GGAATTTATG AAGAACACAT 1380 TAATTTTGAA TTTTATGAAA AACCAGAATA TCGTAATAAA AATTCAAATT CTAACCAGAA 1440 TTCGAAAACA CAAAAATTCA ATACAAATGT TCAAACTCAA AATCGACCAA GTTACTCACA 1500 ATATTCCCAA CCCTTCCAAC CTAATTTTAA TCAATACATT CAACCATTTA GACCTAGCTA 1560 TACACAGCAG ATAACTAACA ACCCACCCAT GTGGCACGCA CCTAATTATT TCAGACCCAA 1620 CCAATACATA AACCCACAAC CCATTATTCA AAAAAATCAT TTCCAACAAT ATCCCAACAA 1680 AGCCCAATTT CCCCAAACAA CGCATTTTAG AGGAAATACA TACCCTCGAC TACAACAACC 1740 CTCTACATAT AAAAATACTA ACTTCCCGAT TACTAAACGA CTAAGACCAT CGGACAGTGA 1800 ACAAACTAAA ATGTCTATTG ACGAAATTAG ATTCCAAGAC GCGCATGAAT TCGAACAAGT 1860 CCAACCTAAT TATTACGAGC AACAGTATTT TAACCAAAAT CAATACAATC CGTATCAAAA 1920 TCATAGCTTC ATTAATGAAG GGCAACAACA AGTTCAATTT GTACAAATTA ATAACAAACA 1980 AAACCAAAAT AATTCTGAAC TAAACGAAAA TTTTCGGTTA ACAGTTCCGG AAAATACGAA 2040 TACATAAAAA TAGTATACAA AGGGCGTTCA TACAAATGCC TTCTAGACAC AGGATCAACA 2100 ATTAATATGA TCAATGAAAA TATATTTTGT CTTCCCATTC AAAATAGTAG ATGTGAAGTT 2160 TTAACATCAA ATGGCCCTAT TACCTTGAAC GACTTGATTA TGTTACCCAG AAATAGTATT 2220 TTCAAAAAAA CCGAACCATT TTATGTGCAC AGATTTTCTA ATAATTACGA TATGCTAATT 2280 GGCAGAAAAT TGTTGAAAAA TGCTCAATCA GTTATTAATT ACAAAAATGA TACAGTTACC 2340 CTTTTTGATC AAACATACAA ATTAATTACT TCAGAATCCG AAAGAAACCA AAATTTGTAT 2400 ATCCAAAGGA CACCAGAATC AATTGCAAGC TCAGATCAGG AATCAATAAA AAAATTAGAT 2460 TTTTCACAGT TTCGATTAGA TCACCTAAAT CAGGAGGAAA CTTTTAAGTT AAAAGGCTTG 2520 TTAAATAAAT TTAGAAATCT TGAATATAAG GAGGGAGAGA AATTAACATT TACAAATACA 2580 ATTAAACACG TACTAAATAC AACACATAAC TCCCCAATTT ATTCGAAACA ATACCCACTT 2640 GCGCAAACAC ACGAAATCGA AGTAGAAAAC CAAGTACAGG AAATGCTGAA TCAGGGATTA 2700 ATTAGGGAAA GTAATTCTCC ATACAATAGT CCTACTTGGG TCGTACCAAA GAAACCGGAT 2760 GCTTCTGGTG CAAATAAGTA CAGGGTAGTA ATTGATTATA GAAAGCTAAA TGAAATAACC 2820 ATACCTGACA GATATCCAAT TCCAAATATG GACGAAATTC TTGGCAAACT GGGTAAATGC 2880 CAATATTTTA CAACGATCGA TCTGGCAAAG GGATTTCATC AAATAGAAAT GGACGAAGAA 2940 TCAATTTCTA AAACTGCATT CTCCACAAAA AGCGGTCATT ACGAATACCT TCGAATGCCA 3000 TTTGGCCTTA GGAATGCACC CGCTACTTTT CAAAGGTGCA TGAATAATAT CCTTCGACCG 3060 TTGCTTAACA AACACTGTTT GGTGTATCTG GATGATATTA TAATTTTTTC AACATCCCTT 3120 ACAGAACATT TAAATTCAAT ACAATTAGTT TTTACAAAGC TTGCAGATGC AAATTTAAAA 3180 TTGCAACTAG ACAAATGTGA GTTCTTAAAA AAGGAAGCTA ACTTTCTTGG TCACATAGTT 3240 ACCCCTGATG GTATTAAACC AAATCCTATT AAAGTTAAAG CCATAGTTTC ATACCCAATT 3300 CCGACAAAAG ATAAAGAGAT AAGAGCTTTC CTTGGATTAA CAGGTTATTA TCGCAAATTT 3360 ATTCCAAATT ACGCAGACAT AGCAAAACCC ATGACCAGCT GCTTAAAAAA AAGGACAAAG 3420 ATAGATACAC AAAAACTTGA GTACATAGAG GCATTCGAAA AACTTAAGGC TTTGATAATT 3480 CGTGACCCAA TTTTACAATT ACCTGATTTT GAAAAGAAAT TTGTTTTAAC CACAGATGCA 3540 AGTAACTTGG CCCTCGGGGC TGTCCTTTCT CAAAACGGTC ATCCTATATC TTTTATTAGT 3600 AGAACACTTA ACGATCACGA ATTAAATTAC AGTGCTATCG AAAAAGAATT ACTTGCCATA 3660 GTTTGGGCCA CAAAAACTTT TCGACATTAT TTACTAGGAC GACAATTTCT CATTGCCAGT 3720 GACCATCAAC CTCTTAGATG GCTTCATAAC TTAAAGGAAC CAGGTGCTAA GTTAGAAAGA 3780 TGGAGAGTTA GATTAAGCGA ATACCAATTT AAAATAGATT ATATTAAAGG GAAAGAAAAT 3840 TCAGTTGCCG ATGCATTATC AAGAATTAAA ATTGAAGAAA ATCATCATAG TGAAGCTACT 3900 CAACATAGTG CAGAAGAGGA CAATAGCAAC CTTATTCATT TAACAGAAAA ACCAATAAAT 3960 TATTTCAAAA AACAAATAAT CTTTATTAAA TCCGATAAAA ATAAAGTAGA GCATTCAAAA 4020 ATATTCGGTA ACTCCATTAC CACAATTCAA TATGACGTAA TGACACTTGA AAAGGCCAAA 4080 CAAATTTTAC TCGATCACTT TATCCATAGA AACATTACCA TTTATATTGA GAGCGATGTA 4140 GATTTTGAAA TCGTTCAAAG AGCACACATA GAAATTGTTA ATACCACCTA CACAAAAGTA 4200 ATTCGCAGTC TTTTCCTATT AAAGAACGTT GGTTCATACG CCGAATTCAA AGAAATCATA 4260 CTTCAATCAC ATGAAAAACT TTTACACCCT GGTATACAGA AAATGACAAA ATTATTTAAA 4320 GAAAATCACT TCTTTCCAAA TAGCCAACTA TTAATTCAGA ATATAATAAA CGAATGCAAC 4380 ATATGCAATT TGGCCAAAAC AGAACATAGA AACACCAAAA TGCCTTTAAA AATCACACCC 4440 AACCCGGAAC ATTGCCGAGA AAAATTTGTA GTAGATATTT ATTCATCTGA GGGAAAACAT 4500 TACATCAGTT GCATTGATAT TTATTCTAAA TTCGCTACAC TTGAGCAAAT TAAAACTAAG 4560 GATTGGATAG AATGCAGAAA CGCATTAATG CGCATTTTTA ATCAACTAGG AAAACCCAAA 4620 TTATTAAAGG CAGACAGAGA CGGAGCTTTC TCCAGTTTAG CTTTAAAGCG ATGGCTTGAA 4680 GAAGAAGAAG TCGAATTACA GCTCAATACA GCAAAAAACG GAGTAGCAGA CGTCGAAAGA 4740 TTACACAAAA CAATAAATGA AAAAATTCGT ATAATCAATT CATCTGATGA TGAAGAAGTA 4800 AAATTAAGCA AGATAGAAAC AATCCTCTAC ACATACAACC AAAAAATTAA ACATGACACT 4860 ACTGGACAGA GACCTGCTCA AATTTTCTTA TACGCTGGGC ATCCCATATT AGACACTCAA 4920 AAAATTAAAG AGAAGAAAAT AGAGAAAATA AATGAAGACA GACGGGAATT TAATATTGAC 4980 ACTAATTACA GAAAAGGTCC ACTACAGAAA GGCAAATTAG AAAACCCATT TAAACCAACC 5040 AAAAATGTAG AACAGACAGA CCCTGACCAT TACAAAATCA CTAATAGAAA TAGAGTTACG 5100 CACTACTACA AAACACAATT CAAAAAACAA AAGAAAAATA ATAAACTCTC AATTTCACAG 5160 GCACCTGGTA CCCGATAACA CTATTGTTTA TACTGATCAC AGCTGTTCAT GGACAACAAA 5220 TTCAAATTAA TAATATTGAC ACCAACCACG GATATCTCCT TTTTTCTGAT AAGCCAGTAC 5280 AGATACCATC CTCCTTTGAA CATCACTCCT TAAAAATCAA TTTAACTGAA ATAGACATCG 5340 TGGTTGACTA TTTTGAGCAA AGACTACGAA CCGATTACCA TGCACCCCAG ATCAATTTTT 5400 TATACAATAA AATAAAAAGA GAACTAGCCA GAATAACCCT GAAACATAGA AACAAACGGG 5460 GTTTTATTAA CATTGTGGGT TCAGGTTTTA AATACCTATT TGGAACACTA GATGAAAATG 5520 ATCGAGTCGA AATACAGAAA AAACTTGAAA TCAACGTCCA TAACTCAGTA AAATTACATG 5580 AACTCAACGA CGCCATACGA TTGATAAATG ACGGAATGCA AAAAATACAG AATTATGAAA 5640 ATAACCACAC CATCATTGAC AGTCTTTTGT TCGAACTAAT GCAGTTTACG GAATACATAG 5700 AAGATTTGGA AATGGCTATG CAGCTTTCCA GACTTGGACT GTTTAACCCC AAATTACTAA 5760 ACTACGACAA ACTTGAAAAT GTGAACAGCC AAAACATTTT GAACATTAAA ACATCCACTT 5820 GGATTAACTA CAATGATAAC CAAGTATTAA TCATATCCCA CATACCCATT TACCTTTCAC 5880 TAATAAGCAC AATTAAAATA ATTCCTTACC CAGACTCCAA CGGCTATCAG CTAGATTACA 5940 CAGACACACA ATCATATTTT GAAAAAGAAA ATAAAGTTTA TAATACCGAA AATAAAGAAG 6000 TAAAAAATGA ATGTGTCACC AATATTATTA AACACTTAAA TCCAATTTGT AATTTTAAGC 6060 CAGTACACAC GAACGAAATA ATAAAATACA TAGAACCAAA CACAATTGTA ACTTGGAACT 6120 TAACCCAAAC AATTCTTAAC CAAAATTGCC AAAATTCAAT TAATAAAATA AAAATAGAAG 6180 GAAACAAAAT GATAAGAGTA ACGCAATGCA AAATAGAAAT CAATAATATA AATTTTAGTG 6240 AAACTCTGTT AGAACCAGAA ATAGATTTGA CACCACTATA CACACCACTT AATATAACAA 6300 AAATAAAAAT TGTAAAACAC AACGACATTA TTGAGATGAT TTCAGAGAAC AATATTACAC 6360 TTTACATACA AATGATCATT GTAATAATCG CACTAATTTT GTTGTACTCA TATTTAAGAT 6420 ATGTATCATT TAAACCATTT ATGATGTTGT ATGCAAAACT TAAAATAAGA AAAAATCAAA 6480 ATCAAAACAC ACCACAACAA ACAGAAATAG AAGAAATTCC ATTTCCCACA CTATATCCAT 6540 CAATCCCAGC CCAAGTATAG GCTTCTCTTT AAGGGAAGGG GAGTGACGTA TTTGGGTGGT 6600 CCAAACCAGC CACTTCCATT ATTTCAAAGA AATCAGTAAT GCACTCTAGT AATTTTCCAT 6660 AACTGTATCC CAGCTGCGCA GACTCGTTTA TCTTTTGCAG CGCAGCGTTC TTTGTAAACA 6720 TCCTAAAGAC CTGCCTAAGC AGATTTGACT GCCCTCTTTC AACGCTACCT AATCTTAAGA 6780 ACCCAAGAGC GAGGCTCTCC CGAAATACAA ATATTGTTCA AATACTGAGG CTTCTCCTCA 6840 ATCCAATTTG CATTTGATTT TTAGTCTTAA GCTGAGATCC AAAGAATAAA GTCGTGAAAC 6900 TATTTCTCCT AAAAACTATT TTTTATTTCT TGGCGTTGTC CTTAGTCAAC TGACGGGACA 6960 TTAGTTCGAC TCATAAATAA AACAACAATT TTACT 6995 // ID DM23420 standard; DNA; INV; 6126 BP. XX AC U23420; XX DR FLYBASE; FBte0000266; Dmel\3S18. XX SY synonym: BEL XX FT source U23420:1..6126 FT SO_feature five_prime_LTR ; SO:0000425:1..361 FT SO_feature three_prime_LTR ; SO:0000426:5766..6126 FT SO_feature CDS ; SO:0000316:919..5742 FT SO_feature start_codon ; SO:0000318:1..3 FT /name="Dmel\3S18\ORF" FT /db_xref="FLYBASE:FBgn0044337" FT /db_xref="REMTREMBL:AAB03640" FT /db_xref="NCBI_PROTEIN:AAB03640.1" FT /translation="MFIGSIASNSSLTDCQRFHYLKSYLAGDALALVKHIPVTNDNYRE FT AWERLEQRYNKQSLIIRSFLNSFMSLPSAINSNIGTVRKIADGADEVIRGLRALNCEER FT DPWLIFILLSKLDSDTRQAWAQCAESEEKGVTINRFLKFLTSRCDTLEAFELTRSTQAR FT RAATTHHADTHPRREEPKCTSCQQNHQLFKCPQFIALDIASRRDFLKSRKLCFNCLSPA FT HMVGNCTSRHTCRICRRKHHTLVHGSSQPIQNGNNIDTASVDSRDRPAVSHAGSTIGHN FT QPLAREGHRLGSETPAENNFTHHTLENIPAAGSQTLLPTILADVIDAWGNTTTCRLLLD FT TGSTITLASESFVQRIGVRRTHARISILGLAANSAGVTRGRAHIKLRSRHSGQTVELVS FT FILTSLTSSLPAQVIDTSSSTWRQICELPLADPTFCTPGAIDVIVGSDQLWSLYTGDRK FT HFGNDFPIALNTVFGWILAGSYSAFDDHPTSAVTHHADLDTMVRSFMEMDSIQPNQALL FT DASDPTERHFAATHKRSTDGVYVVEYPFKEKAPPIDSTLPQAINRFFSLERKFRRYPEL FT KQQYEAFLDDYLQRGHMEKLTSAQVEESPDTCFYLPHHAVIKLDSLTTKCRVVFDGSGK FT DSSGVSLNDRLHIGPPIQRDLFGVCLRFRQHQYVLCADVEKMFRGIKVFKPHTNFQRIV FT WRTTENEPLLHFRLLTVTYGLAPSPFLAVRVLKQLADDHGHEYPAAAHALLHDAYVDDI FT PTGANTFEELMILKDELIALLDKGKFKLRKWSSNSWRLLKSLPEEDRCFEPIQLLNKSA FT ADSPVKVLGIQWNPGKDVLYLNLKGCDATISPTKRELLSQLSRIYDPLGLVAPVTVLLK FT LIFQESWTSVLQWDDPIPESLRTRWRALVEDLPALTQCQVPRYIASPFRDVQLHGFADA FT SSHAYGAVVYARVAVGCSFQVTLVAAKTRVAPIKPVSIPRLELNAALLLSRLLSIVKTS FT LTIPLFSTSCWTDSEIVLHWLSAPPRRWNTYVCNRTSEILSDFPRSCWNHVRTEDNPAD FT CASRGLHPSKLLEHRLWWKGPSWLATPTSEWPPSTSKFSVSSSFDVNTEERAIKPTTLH FT NFPDESIHELLIHKFSTWTRLIRVSSYCHRFIHTLRSHHRNSAPFLTSEELLDAQRRLI FT RHVQQKSFAREYEQLENRRQLNAKSHLIRFSPFLDDYGVMRVGGRIEQSTLNYNAKHPI FT LIPKDTPLAGLLVRHFHVSYLHTGVDATFTNLRQQYWILGARNLVRKAVFQCKSCFLQR FT KGTSNQIMGELPIPRVQASRCFQHTGLDYAGPIAIKESKGRTPRIGKAWFSIFVCLTTK FT ALHIEVVSELTTQAFIAAFQRFIARRAKPTDLYSDNGTTFHGGKKTLDDMRRLAIQQAK FT DEELAGFFANEGISWHFIPPSAPHFGGMWEAGVRSIKLHMKRILGSKALTFEELSTVLT FT QIEAILNSRPLCPTGDNSLDPLTPAHFLTGSPYTALPEPCRLDMQVNRLERWNQLQAMV FT QGFWKRWHMEYLTSLHERTKWHLETENLKIDTLVVLKEPNLPPSKWILGRITAVHAGID FT NKVRVVTVKTAHGLYKRPIAKIAVLPLC" XX CC Derived from U23420 (g733531) (Rel. 48, Last updated, Version 3). CC Takis Benos and Michael Ashburner, 20-Aug-1997. CC Any changes to original sequence record are annotated in an FT line. XX SQ Sequence 6126 BP; 1623 A; 1556 C; 1346 G; 1601 T; 0 other; TGTTTGGGAA CGAGACACCC TGTATACGCG AACAAGTCAC CCTTTATCTT TATTTACATT 60 CTTATTTGTC TGCAGCTTCA TCGGAGCTTA TCAGCGGAAT CAATGTAAGC ATCGCACCGC 120 TGTAATTGTC CGCGAGCTTG CCCAGTACTT TTCCAAACTT CTAACTCCCT TCTAACTGTA 180 ACTTGTTTAC GTCTTATGCT AGACTAATCG TATGGCGTGA TTACAGCCAA AGCTGAAGTC 240 AGTCACAATT TTGATCTGCG AGAAAACGTA CGCATCGGTG TCGAAATAAT TAATATTAAG 300 TGTCTGAACT TAACCAATAA ATGAAAATTA ACAGTAACAC TGGCGGTTTT ATTTATAAAC 360 ATAAAAATTG GTCCTTCGAG CCGGATAACC GGAAGTGCGT TTCGTTCGGG CATTTGATTT 420 TGATTATTGG CCTTTTGGCA AACGATAATC TATAGATTCC TACATCGTGT AGAATCGTTC 480 CCTTCTTTCG ACCACCATGC GGAGTGTGAT TCAACAACGG GGCTTCTGCA AAAGCCAAAT 540 TACTCGTGCG CATAATAATG CCTTAAAATT TGTTGATGAC ATTCACTCAG TGCAAACAAT 600 AGTTGTCCGC CTGGCGCAAC TACAGGAAAA TTATTTGCGG TTCGTACGGC TCTCGGAAGA 660 GCTGTATGCA TTTCAATCGG AAGCCGATTG GGAGAACCCT GACGAGGATT TTGACGCATA 720 TGAGGACAAA CATTATGCTA CACACGCTAT TCTCAGCAAT ACTTTGGAGG AGTTGAGACG 780 GGATGTCACC TCAAACAGTA TTGATGCCAC AGTTCAAGCG CAGGCACACC CCAGAGAAGT 840 CATGTCGATT TTCAGTTCGA GAGAATTAAA CTTCCGACTT TTTCTGGAAA TTATGAGGAC 900 TGGAAACATT TTTCGGACAT GTTTATTGGA TCGATTGCTT CCAATTCGAG CCTGACGGAT 960 TGCCAACGAT TTCATTATTT AAAATCGTAC CTTGCCGGAG ACGCGCTTGC ATTAGTTAAA 1020 CATATTCCAG TTACTAATGA CAACTATCGG GAAGCATGGG AGCGGCTGGA ACAGCGATAT 1080 AACAAACAAT CGCTAATTAT TCGATCGTTC TTAAACAGTT TCATGAGCCT TCCGAGTGCT 1140 ATAAATTCAA ATATCGGCAC AGTGCGGAAA ATTGCCGATG GTGCAGACGA AGTTATTCGT 1200 GGTCTACGAG CTCTTAATTG CGAAGAGAGG GATCCCTGGC TAATTTTCAT TCTACTTTCA 1260 AAATTAGATA GCGATACCCG CCAAGCCTGG GCTCAGTGCG CAGAATCCGA GGAAAAAGGT 1320 GTGACCATCA ACCGATTCTT GAAATTTCTC ACATCACGCT GCGATACGTT GGAGGCTTTT 1380 GAATTAACTC GATCAACCCA AGCTCGACGC GCAGCTACCA CGCACCACGC AGACACGCAT 1440 CCAAGACGGG AAGAGCCGAA GTGCACATCG TGCCAGCAGA ATCACCAACT GTTTAAGTGT 1500 CCTCAATTCA TCGCACTCGA CATTGCATCT CGCCGAGACT TCCTCAAATC AAGAAAGCTC 1560 TGTTTCAATT GCCTCAGCCC GGCTCATATG GTGGGCAACT GTACATCGAG GCATACTTGT 1620 CGGATCTGCC GCCGCAAGCA TCATACTTTG GTTCATGGCT CGTCGCAGCC AATTCAAAAT 1680 GGCAACAACA TTGACACAGC AAGTGTTGAC AGCCGCGATC GACCAGCAGT CTCACATGCG 1740 GGATCTACAA TTGGCCACAA TCAACCGCTA GCTCGAGAAG GTCATCGCTT GGGAAGCGAG 1800 ACTCCCGCGG AAAACAACTT TACGCATCAT ACTCTGGAGA ATATTCCGGC GGCTGGTTCT 1860 CAGACTCTGT TGCCAACCAT CCTTGCTGAC GTCATCGACG CCTGGGGAAA CACTACAACC 1920 TGCAGGCTGC TCCTGGACAC TGGATCTACA ATAACCTTGG CATCGGAATC ATTTGTTCAG 1980 CGAATAGGCG TGCGTCGAAC GCACGCACGG ATTTCTATTC TCGGTCTCGC CGCCAACAGC 2040 GCGGGCGTTA CCCGAGGACG CGCACATATC AAGCTGCGCT CTCGTCATTC GGGCCAAACT 2100 GTCGAATTGG TCTCGTTCAT TCTCACCTCG CTGACGTCAT CACTTCCTGC CCAAGTTATT 2160 GACACCTCAT CCTCTACGTG GAGGCAAATC TGCGAGCTTC CTTTGGCAGA CCCAACGTTC 2220 TGCACACCTG GAGCAATCGA TGTCATTGTT GGATCGGATC AACTTTGGTC TCTATACACA 2280 GGAGATCGGA AACACTTTGG TAACGACTTT CCTATCGCTC TCAATACTGT ATTTGGTTGG 2340 ATTCTTGCAG GCTCTTACTC TGCATTCGAT GATCACCCTA CTTCTGCGGT TACTCATCAC 2400 GCGGACCTAG ACACGATGGT TCGTTCATTC ATGGAGATGG ACAGCATTCA GCCTAACCAG 2460 GCTCTCCTGG ACGCCAGCGA TCCCACAGAG CGTCATTTTG CTGCCACACA CAAGCGCTCG 2520 ACGGACGGGG TGTACGTCGT CGAGTATCCC TTCAAGGAAA AGGCACCGCC TATTGATTCG 2580 ACCTTGCCAC AGGCCATCAA TCGCTTCTTC TCGCTGGAAC GCAAATTTCG TCGGTATCCA 2640 GAATTGAAGC AGCAGTACGA AGCTTTCCTG GACGACTACT TGCAACGTGG ACATATGGAA 2700 AAACTGACCT CGGCTCAGGT TGAAGAGTCC CCAGACACCT GCTTCTATTT GCCGCACCAC 2760 GCTGTCATCA AACTGGACAG TCTGACTACC AAATGTCGTG TAGTTTTTGA TGGATCAGGA 2820 AAAGACAGCT CTGGAGTATC GCTCAATGAC AGACTACATA TTGGTCCACC GATTCAACGC 2880 GATCTTTTTG GCGTTTGTCT ACGCTTCCGG CAGCACCAAT ATGTTTTATG TGCAGATGTC 2940 GAAAAGATGT TTCGAGGCAT TAAAGTCTTT AAGCCACACA CCAATTTTCA GCGCATTGTT 3000 TGGCGCACGA CTGAGAATGA ACCTCTGCTT CATTTTCGCC TGCTGACGGT TACCTACGGA 3060 TTGGCACCGT CACCATTTCT GGCTGTTCGA GTTCTAAAGC AACTTGCCGA CGATCATGGC 3120 CATGAATACC CTGCAGCAGC TCACGCTCTT CTGCACGATG CCTATGTGGA CGATATCCCG 3180 ACAGGCGCCA ACACATTCGA GGAGCTTATG ATTCTCAAGG ACGAGCTTAT AGCCCTCTTG 3240 GATAAGGGAA AATTCAAGCT ACGCAAATGG AGTTCTAATA GTTGGCGTCT TCTGAAATCA 3300 TTACCAGAGG AAGATAGATG TTTTGAACCT ATCCAGCTCC TCAACAAATC AGCTGCGGAT 3360 TCACCTGTCA AAGTTCTTGG TATCCAATGG AACCCTGGGA AGGACGTCCT GTATCTCAAC 3420 CTAAAGGGAT GCGATGCGAC CATTTCTCCG ACGAAAAGAG AACTCTTGTC TCAGCTATCA 3480 AGAATTTATG ATCCGCTTGG ACTGGTAGCG CCGGTCACAG TTCTACTCAA GCTAATCTTC 3540 CAAGAAAGCT GGACAAGTGT CCTGCAGTGG GACGACCCCA TACCTGAAAG TCTACGTACG 3600 CGCTGGAGAG CCTTAGTAGA GGATTTGCCA GCACTTACGC AATGCCAAGT ACCACGGTAT 3660 ATTGCGTCAC CATTTCGAGA TGTTCAACTA CACGGATTCG CCGACGCATC CTCGCACGCC 3720 TACGGTGCGG TAGTTTACGC TCGAGTTGCA GTTGGATGCA GCTTTCAAGT AACTCTGGTT 3780 GCCGCCAAAA CACGGGTGGC CCCGATCAAG CCCGTATCAA TTCCACGTTT GGAGCTAAAC 3840 GCTGCGTTAC TTCTATCTCG ATTGCTTTCT ATTGTCAAAA CATCACTAAC AATTCCTCTT 3900 TTCAGCACGA GCTGCTGGAC AGATTCAGAA ATTGTGCTAC ACTGGCTTTC AGCTCCCCCT 3960 CGACGGTGGA ACACCTACGT CTGCAACCGA ACTTCTGAGA TATTGAGCGA CTTTCCCCGT 4020 AGCTGCTGGA ACCATGTTCG CACGGAAGAC AATCCTGCAG ATTGTGCTTC CCGAGGACTT 4080 CATCCGTCAA AGCTTCTGGA GCATCGACTG TGGTGGAAAG GTCCGTCTTG GCTGGCCACA 4140 CCCACCTCTG AGTGGCCACC TTCTACAAGC AAGTTCAGCG TATCTTCAAG TTTCGATGTC 4200 AACACCGAAG AACGAGCCAT AAAGCCCACG ACTCTACATA ACTTTCCTGA TGAAAGTATA 4260 CACGAGTTAC TCATCCACAA ATTCTCAACC TGGACGCGTC TTATAAGGGT ATCTAGCTAC 4320 TGTCATCGCT TTATTCACAC TCTTCGATCC CATCATAGGA ATTCGGCACC ATTCCTTACG 4380 TCTGAAGAGT TGCTGGACGC ACAGCGCCGA CTTATTCGAC ATGTGCAACA AAAATCCTTT 4440 GCCAGAGAAT ATGAGCAGCT AGAGAATCGA CGCCAGCTTA ACGCTAAATC GCATCTTATC 4500 CGGTTTTCTC CGTTTCTGGA TGATTATGGA GTAATGCGAG TCGGTGGGAG AATCGAGCAA 4560 TCTACACTCA ACTATAACGC CAAGCACCCG ATTCTGATAC CTAAAGATAC ACCACTAGCT 4620 GGACTCCTGG TTCGACATTT TCATGTCTCC TATCTGCACA CTGGAGTTGA TGCAACGTTC 4680 ACCAATCTTC GTCAGCAGTA CTGGATTCTG GGAGCCCGCA ATCTCGTCAG AAAGGCAGTC 4740 TTCCAATGCA AATCCTGTTT TCTTCAACGA AAGGGCACAA GCAACCAGAT CATGGGAGAG 4800 CTACCAATTC CTCGAGTTCA AGCTAGCCGC TGCTTTCAAC ACACAGGGCT GGACTACGCT 4860 GGACCGATCG CAATCAAGGA ATCAAAGGGA AGAACTCCAC GCATCGGAAA GGCATGGTTT 4920 TCTATTTTCG TGTGTCTCAC TACAAAGGCA CTTCACATCG AGGTTGTTAG TGAGCTAACT 4980 ACACAGGCTT TCATCGCAGC CTTTCAACGA TTCATTGCCC GCCGAGCGAA GCCTACTGAC 5040 CTGTATTCGG ATAATGGAAC AACATTTCAT GGAGGCAAGA AAACTTTGGA TGACATGAGA 5100 CGTCTGGCCA TTCAACAAGC CAAAGATGAG GAACTAGCAG GATTCTTTGC CAATGAAGGG 5160 ATTTCTTGGC ACTTTATACC CCCGTCTGCT CCACATTTTG GAGGGATGTG GGAAGCTGGA 5220 GTTCGCTCAA TTAAACTCCA TATGAAACGA ATACTTGGAT CAAAGGCTTT AACGTTTGAG 5280 GAGCTCTCTA CTGTCCTGAC CCAAATTGAA GCTATCCTGA ATTCACGCCC GCTGTGCCCA 5340 ACTGGGGATA ATTCTTTGGA TCCACTGACG CCTGCTCATT TTTTGACTGG ATCTCCGTAT 5400 ACTGCATTGC CTGAACCCTG TCGTCTGGAT ATGCAAGTCA ATCGATTGGA GAGGTGGAAT 5460 CAGCTGCAAG CCATGGTTCA AGGCTTTTGG AAAAGGTGGC ATATGGAATA CCTGACATCT 5520 CTTCATGAGC GGACAAAGTG GCATCTGGAA ACCGAGAATC TGAAGATCGA CACACTGGTA 5580 GTACTCAAGG AGCCCAATCT ACCGCCCTCT AAATGGATTC TTGGCCGCAT CACAGCAGTG 5640 CACGCAGGAA TCGACAACAA GGTCCGAGTC GTTACAGTGA AGACTGCTCA CGGATTATAC 5700 AAACGCCCAA TTGCCAAAAT CGCTGTACTG CCTCTCTGCT GAACAACCGT TCAGGGGGGC 5760 CGGTATGTTT GGGAACGAGA CACCCTGTAT ACGCGAACAA GTCACCCTTT ATCTTTATTT 5820 ACATTCTTAT TTGTCTGCAG CTTCATCGGA GCTTATCAGC GGAATCAATG TAAGCATCGC 5880 ACCGCTGTAA TTGTCCGCGA GCTTGCCCAG TACTTTTCCA AACTTCTAAC TCCCTTCTAA 5940 CTGTAACTTG TTTACGTCTT ATGCTAGACT AATCGTATGG CGTGATTACA GCCAAAGCTG 6000 AAGTCAGTCA CAATTTTGAT CTGCGAGAAA ACGTACGCAT CGGTGTCGAA ATAATTAATA 6060 TTAAGTGTCT GAACTTAACC AATAAATGAA AATTAACAGT AACACTGGCG GTTTTATTTA 6120 TAAACA 6126 // ID 412 standard; DNA; INV; 7567 BP. XX AC nnnnnnnn; XX DR FLYBASE; FBte0000007; Dmel\412. XX SY synonym: mdg2 XX FT source nnnnnnnn:1..7567 FT SO_feature five_prime_LTR ; SO:0000425:1..514 FT SO_feature three_prime_LTR ; SO:0000426:7054..7567 FT SO_feature CDS ; SO:0000316:679..1044 FT SO_feature CDS ; SO:0000316:1408..1722 FT SO_feature CDS ; SO:0000316:1888..3243 FT SO_feature CDS ; SO:0000316:3864..6866 XX CC Berkeley Drosophila Genome Project. XX SQ Sequence 7567 BP; 2982 A; 1367 C; 1323 G; 1895 T; 0 other; TGTAGTATGT GCCTATGCAA TATTAAGAAC AATTAAATAA AATAGCATAT TAACTTATGG 60 CAGCACTTTG TTGCTATGTT TATGTTTATG TTTATGCACG CAGTTAGGCC AGGGCGGATG 120 TAACATGATC ACCCACTCGA AGGCCACAAA GTATAAGTGC ATTGCCCAAT CGAAGGCAAA 180 AAGTATAAGT GCATGGTCAG CATTCACACG CCGACCAAAT ACATATTACA TACGTACATA 240 CATATCTCGC TCTCCCGATA AGCCTAGATA TATAAGATAT ACATAAGAAC GCCGCTCCGC 300 TGCTGGCGTA CCCGGCAGCG CAGCTACGCG GATTAGCCTA AGTCCAAATA TATAAAAAAC 360 TGTAAAATCG GAGAGACTCT GTAGACGTTG AGCTGACAGA ACCATTTCTG CCTACTCTAA 420 AATCAAAAGA AGAAATTGAA TAAATATATG TCAGCCCGAC GGCTGCCTTA AACTTAAAAC 480 GGACTTGTGT TCTTAATTGG AGTTCATCAT TACATGGCGA CCGTGACAGT CGTCCAACGC 540 TGGACGAATT GACCAAAGCT GGTGAAAACA AAGGAACAAA GGAACACTGG ACTGGAAGAA 600 GACTGGACTA ATTAAATGGA ACTGCAAAAA CCAAGGAAAA ATCTGAGTGA GTAGAGTTCT 660 ATTGAGTATG GGCAAACACC GTGGCGGTTT GAAAACTAAG CTGAATAAAC GTATAGCCCA 720 CGTAAGGTGG CTAATATACG GTCAGCAAAC GCCACCGGTT TGGTCGAAAG CTCTAAAGCT 780 ACATGCAGAG CTAGACCACT TGTTGCAATA TCAGCAAGAA TTAAAGACCC ATAAGCTCGA 840 GAAAACTCAC TCAGATAATA TTAAAAATAT ACCCACAATT AATGAAGTTC CAAAATACCA 900 GGCATGTCCA GCACCAGCAC CAGCATTAAC AAAACCAAAG AAGTCCTGCC CCCCTGGCTG 960 CGAAGGAATC TGGAGTCCCC ACTGCCTGGG GACTTGTGAG CGACCATCGA CGTCTTCAGC 1020 GGCGAAGAAA TAGACAGCAG CGAGGGAGTG TCAGCGTGCC ACCCCCGGCG ACGCCCAGCT 1080 GACACCCAAC AAATAGACAG CAGCGAGGGA GTGTCAGCGT GCCACCCCCG GCGACGCCCA 1140 GCTGACACCT GATGAGCATC ATCAACAGCA GAATATAATA ATAAATATAT ATAAATATAA 1200 AGTAAATATA AAATATATAT AGATAAGAAA AATTGTAAGA AATATTGTAA AACGGAGCAT 1260 ATACTATTAT GCCCTGTTAA CCCAATATGG CCCGTGAAGC CATAGCTAGA ATCAGGCAGG 1320 CAACAATGTA AAATACAATT TTTTTTTACT CTTGCGAACA TTGAAAGATT TTATAAATAG 1380 ATAATTCCAA ACATAAATGT CTATAGAGAC AAATGAAATA AGTAAAACTG AAAATAAAAG 1440 TATATACAAA GGAAATTTTC TATTCTATTC TCCAAAATAT AAAATTAGTA TACCCAAAAT 1500 GGGTCTAATA GACACTAAAA CTGTGGACTC TACAGCCAAT GTAATAAATA AAGTAGAAGT 1560 CCAAAATGCA GACTTGTTCT GGATAACCAT AATACTAATT GTAATTGCAT TAATTATGGT 1620 ATCCAATGCA TTAATAAAAA TATACAAACT GCATAACAAG TGTCTTAAGA AACGATACCG 1680 TAGCACTGCT AACGGTATAG ATAATATTTA AGGAAGATCT TTAATAAAGT CAATTATGAA 1740 TGAAAATATG AGAAAAATTA TATGAAAAAA AAAAATAATA AATAAAAAAA AAATATAAAA 1800 CGTAATATTG AATTTATCTA CATTAAAAAA AAATATATAC AAATGAATAA ATTTGAAGTT 1860 ATGAGTATAC CACAGCATGG ACTGGGAAAA GCTTGTTGAT CAGATAAAAG ATCAAAATGA 1920 AAATTTCAGA AAATCCTATA AGTGCTTAAC GCAAAACAGA TCAACACAAG CTGTAACAAT 1980 CAATAGGAAT GCCCAAGTCT TGGTAAATAG TTATAATGAA ATCAGAGAGT TGATCCAACA 2040 AAATAGAAAG AATTTGGAAC GCAAACAGTG TGCTAAGGCT TTGAACCTAC TGGTGACATT 2100 AAGAGAAAAA TTAATATTTA TAAAAAATAA ATTCAGTCTC CAGATAGAAA TTCCAACCAT 2160 AGTAAACACC CCACTAAGAA TAAATTTGAA TGAAGACAGC ACTAACTCTG ACGAGGAAGA 2220 TAGGACTATA GTCAAGGAAG ACATTAAAGA GGAAGATCTT CACGATCTAA CTATACCAGC 2280 AAAATTAATG CTGAAGAACG ACGATAAAAC AAATAACGCA GCCGACTCCG AAAATAACTT 2340 AACCATGGCA GAAGAAGCAG CTGCCATTAG GTCTTACATT AGGGAAGTCG CCTGCACAGT 2400 GCCAGAATTT GATGGGCAAA AGATCCATTT ACAAAGATTC ATTAAGGCAA TCAAATTGGT 2460 AGACCTAGCT AAGGGACCAT TTGAAGACAT TGCAGTTGAG GTCATTAAGT CAAAAATAGT 2520 TGGCACAATT TTGAACTCAG TTGACAATGA AACGACAATT CCAGCAATTA TAAACAAATT 2580 GCAGAAAGTA GTTGTCGGTG AGACATCCAG TAATGTCAAA GCAAAGCTAG CAACAGTTCA 2640 GCAGAGAGGT AAAACTGCAA CGCAATTTAC CGCTGAAGTT GATAGCCTGA GAAAACTTTT 2700 AGAAGCTTCC TATATCGATG AGGGTATACC TCTAGAACAT GCCACTGGTC TAAGCACCAA 2760 AGAGGCAATT GAAACCATGA TACATCGTGC TGAGCACGAA AGTATCAAAA CAGTACTGGA 2820 AGCAGGGACT TGCACCACTA TGGATGCAGC GATAAGCGCA TACATAAGAA CGAGTACAAG 2880 AGTTACCGGT GACATCAATA AAGTGATGTA CTTTAGAGGT AACAGACCCA ATAGAGGATA 2940 CGGAAATGCC AATAGAGGTA GTAACCGCGG TAGAGGCTTT AATAACAATA GTATTAGAGG 3000 CAACTACCAT AACGGTTACC AAAATAACGG TTACCAAAAT AACGGTTACC AGAATAACGG 3060 TTATCAAAAC CGCTATAATG GAAATAATAA CCGTTATAAT GGCTATAACA GAGGCCGTTA 3120 TAATGGAAAC AGAGGCCGTA ACAACAGTCA GAACAACTAC AACAGAAACA ATGCCAATGT 3180 ACGAGTAATC CAAGAACAGG GAAACTCGCA ACAGCCTTTA GGTACTCAGT AGAAGAAGAT 3240 CGTAGAGTAT ACACCATCAA TTATAATCTC AACATATTTT CTACATTCAT TCATGCCAAA 3300 ACAGGCGTAA AACTAGTTTT TCTACTTGAT ACAGGTGCAG ATATCTCTAT TCTCAAAGAG 3360 AACTCTGACA AATTTTCTAA TATTCAAATA ACCAATAAAA TAAACATTCA AGGCATAGGC 3420 CAACAGAAAA TTCAGTCTCG AGGACAGACT TTTATTGAGA TACAGACAGG TAAATACGTT 3480 ATCCCACACG ATTTTCATTT AGTAGATAAA AACTTTCCAA TACCGTGTGA TGGAATAATC 3540 GGAATAGATT TCATAAAAAA ATATAATTGC CAAATCGATT TAAACCAAGA AGAAGATTGG 3600 TTTATAATTA GACCAAACAA TTTGAAATTT CCAATATATA TTCCCATAGC ATACAGCTCT 3660 GGTATTAACA CAACGTTATT ACCAGCAAGA TCCCAAGTTG TCCGAAGATT AATAGTATCA 3720 TCAAAAGATG ATAACATTTT AATTCCAAAC CAGGAAATTC AAACTGGTAT TTATGTTGCA 3780 AATACAATCG CAACATCAAG TAATACATTT GTCCGAATTT TAAATACAAC CGATTCCGAC 3840 CAATTAGTCA ATATGGACAC TCTAAAATAT GAGCCACTTT CGAACTACAA TGTAGTTCAG 3900 GCAAATAGTG AACACAGAAA TAAAACTGTC TTATCTCAAT TAAAGAAAAA TTTCCCCGAA 3960 TTGTTTAAAT CACAATTAGA AAATATATGC AGCGAATATA TAGATATATT TGCATTAGAA 4020 TCAGAACCTA TAACAGTTAA TAATTTGTAT AAACAACAGT TGAGATTAAA AGATGATGAG 4080 CCAGTATACA CGAAAAATTA TAGAAGTCCT CATAGTCAAG TGGAAGAAAT ACAAGCCCAA 4140 GTTCAGAAAT TAATAAAAGA TAAAATAGTT GAACCATCAG TTTCACAGTA CAATAGCCCT 4200 TTGCTATTAG TACCCAAAAA GTCAAGCCCG AATTCTGATA AAAAGAAATG GAGATTAGTA 4260 ATAGACTATC GCCAAATTAA TAAGAAACTT TTAGCTGACA AATTTCCACT ACCGAGAATA 4320 GATGATATTT TGGACCAACT TGGTCGAGCA AAATATTTCT CCTGCCTTGA TTTAATGTCA 4380 GGTTTTCATC AAATCGAACT GGATGAAGGC TCGAGAGATA TAACATCTTT CTCAACCAGC 4440 AATGGCTCAT ATCGTTTCAC GCGATTGCCA TTTGGCTTAA AAATAGCGCC TAATTCATTC 4500 CAAAGAATGA TGACTATAGC ATTCTCCGGA ATAGAACCGT CTCAAGCATT CCTTTATATG 4560 GATGACTTAA TAGTCATAGG TTGTTCCGAA AAACATATGC TTAAAAACCT CACTGAAGTT 4620 TTTGGTAAAT GCAGGGAATA CAACCTAAAG TTACATCCTG AAAAATGTTC ATTTTTCATG 4680 CATGAAGTCA CATTTTTGGG ACACAAATGC ACAGACAAAG GAATTTTGCC GGATGACAAA 4740 AAATATGATG TCATTCAGAA CTACCCAGTT CCACATGATG CGGACAGCGC TAGACGTTTT 4800 GTAGCATTTT GCAATTACTA CAGACGTTTT ATCAAAAATT TCGCCGACTA TTCGCGGCAC 4860 ATAACAAGAT TATGTAAAAA GAATGTTCCA TTCGAGTGGA CAGATGAATG TCAAAAAGCA 4920 TTCATACATT TAAAATCTCA GCTAATTAAC CCAACACTCT TGCAGTACCC AGACTTCAGC 4980 AAAGAATTTT GCATAACAAC AGATGCAAGC AAGCAAGCGT GTGGCGCAGT TTTAACTCAA 5040 AACCATAATG GCCACCAACT CCCAGTTGCT TATGCATCCA GAGCTTTTAC GAAAGGTGAA 5100 AGCAATAAGA GTACAACAGA ACAAGAGTTA GCAGCAATTC ATTGGGCAAT AATACATTTC 5160 AGACCATACA TTTACGGAAA ACATTTCACT GTGAAAACAG ACCATAGACC ATTGACATAT 5220 TTATTCTCGA TGGTGAACCC CAGCTCTAAA TTAACTAGAA TAAGGCTTGA ACTAGAGGAA 5280 TATAATTTTA CAGTAGAGTA TCTAAAGGGC AAGGACAATC ATGTAGCAGA TGCGTTATCA 5340 AGAATAACCA TCAAAGAGCT AAAAGATATA ACTGGAAATA TATTAAAAGT CACTACAAGA 5400 TTTCAAAGTA GACAAAAATC CTGCGCAGGA AAAGAACAAT TGGATTTGCA AAAGCAAACC 5460 AAAGAAATAG CTTCAGAGCC CAACGTATAC GAAGTCATAA CAAATGACGA GGTACGAAAA 5520 GTAGTGACAT TGCAATTGAA TGACTCGATA TGTTTATTTA AACATGGAAA GAAAATTATT 5580 GCAAGATATG ATGTTGGTGA TCTTTATACT AATGGAATTC TTGATTTAGA TCAATTTCTC 5640 CAAAGGCTTG AATTGCAGGC CGGTATATAT GATATCAGCC AAATCAAAAT GGCACCGTGG 5700 AAAAAAATCT TTGAACACGT TTCAATAGAT AAATTTAAAA ATATGGGCAA TAAAATATTA 5760 AAGAATTTAA AAGTAGCGCT ACTTAACCCG GTGACCCAAA TAAATAATGA AAAAGAAAAA 5820 GAAGCTATAT TGTCTACATT ACATGATGAT CCAATACAAG GAGGGCATAC AGGCATTACA 5880 AAAACCTTGG CCAAGGTCAA AAGACATTAT TACTGGAAAA ATATGAGTAA ATACATAAAA 5940 GAGTACGTAA GAAAATGTCA AAAATGCCAA AAAGCAAAAA CAACAAAGCA CACAAAGACT 6000 CCAATGACGA TAACTGAAAC ACCAGAACAT GCTTTCGATA GAGTTGTTGT GGACACAATT 6060 GGTCCACTAC CCAAGTCAGA AAATGGTAAC GAGTACGCAG TCACTCTCAT ATGTGATTTA 6120 ACCAAGTACT TAGTTGCCAT ACCAATAGCA AATAAAAGCG CAAAAACAGT CGCAAAAGCT 6180 ATATTTGAAT CTTTTATTCT AAAGTACGGT CCAATGAAGA CGTTCATAAC GGACATGGGA 6240 ACAGAGTATA AGAATTCAAT AATTACTGAC CTGTGTAAAT ATTTGAAAAT AAAAAATATA 6300 ACATCAACAG CTCATCACCA CCAGACAGTT GGAGTAGTAG AAAGAAGTCA TAGAACCTTA 6360 AACGAGTATA TACGATCCTA CATATCGACG GACAAAACCG ATTGGGACGT ATGGCTTCAA 6420 TATTTCGTAT ACTGCTTCAA CACGACCCAA TCTATGGTAC ATAATTATTG TCCATATGAA 6480 TTAGTTTTCG GTAGAACAAG TAATTTACCA AAACATTTTA ATAAACTACA TAGCATAGAA 6540 CCAATATATA ACATAGATGA TTACGCTAAG GAGAGTAAAT ATAGGTTAGA GGTAGCATAT 6600 GCTCGAGCAA GAAAACTTCT CGAAGCACAC AAAGAAAAAA ATAAAGAAAA TTATGACTTA 6660 AAAATAAAAG ACATAGAATT AGAAGTAGGA GATAAAGTTT TACTAAGAAA TGAGGTAGGT 6720 CATAAATTAG ACTTTAAATA TACGGGGCCC TATAAGATAG AAAGCATAGG AGATAATAAC 6780 AATATTACGC TACTTACTAA TAAAAACAAA AAACAAATAG TTCATAAAGA TAGATTAAAG 6840 AAATTTCATT CATGATTGAA TTTAAACTTA TATTTTCCTT AATCATTTAC ACAAATTTTC 6900 CATACACTAC GTATATTTTT ATCTTTGCAT TATAAAATCA ACTATTGTTG TTCAAACAAA 6960 AACACAAACA AAATAAAAAT AAAAATAAAA TAATTTGCAT TTAATAATCA AAATAACTTC 7020 ACTAGGTTAC GTTATTTTTC AAAAGGAGGG AGATGTAGTA TGTGCCTATG CAATATTAAG 7080 AACAATTAAA TAAAATAGCA TATTAACTTA TGGCAGCACT TTGTTGCTAT GTTTATGTTT 7140 ATGTTTATGC ACGCAGTTAG GCCAGGGCGG ATGTAACATG ATCACCCACT CGAAGGCCAC 7200 AAAGTATAAG TGCATTGCCC AATCGAAGGC AAAAAGTATA AGTGCATGGT CAGCATTCAC 7260 ACGCCGACCA AATACATATT ACATACGTAC ATACATATCT CGCTCTCCCG ATAAGCCTAG 7320 ATATATAAGA TATACATAAG AACGCCGCTC CGCTGCTGGC GTACCCGGCA GCGCAGCTAC 7380 GCGGATTAGC CTAAGTCCAA ATATATAAAA AACTGTAAAA TCGGAGAGAC TCTGTAGACG 7440 TTGAGCTGAC AGAACCATTT CTGCCTACTC TAAAATCAAA AGAAGAAATT GAATAAATAT 7500 ATGTCAGCCC GACGGCTGCC TTAAACTTAA AACGGACTTG TGTTCTTAAT TGGAGTTCAT 7560 CATTACA 7567 // ID DMAURA standard; DNA; INV; 4581 BP. XX AC nnnnnnnn; XX DR FLYBASE; FBte0000112; Dmel\aurora-element. XX FT source nnnnnnnn:1..4581 FT SO_feature five_prime_LTR ; SO:0000425:1..324 FT SO_feature three_prime_LTR ; SO:0000426:4258..4581 FT SO_feature transcription_start_site ; SO:0000315:191..196 FT SO_feature polyA_signal_sequence ; SO:0000551:4482..4487 FT SO_feature primer_binding_site ; SO:0005850:331..346 FT SO_feature RR_tract ; SO:0000435:4247..4256 XX CC Composite sequence derived from AB022762, X70361 and X70362 CC Assembly based on strategy described in PMID: 10333568 CC Defective element with incomplete ORFs CC Casey Bergman, 21-June-2016. XX SQ Sequence 4581 BP; 1102 A; 1074 C; 1456 G; 949 T; 0 other; TGTCGCGGAT CGAATATTGT TATCGATAGG CTCTAGTTAG TATTTTTGAG AAGTCCGAAT 60 GTGGAAGGAT TTGTAAGCCC ATATGTGTCT GGGCACGTTG TTTTTGGCCA TTGTAAATTA 120 CCGGGAAAAT TTAGCTTTTC ATTGTCGTGT AAGAGTTGGA GGACACACTG CGGTGAGCTA 180 ATAAGTTAAG TTAGTTGCAA TTGTGAAACA TTGAATTCTT CAAGAATAAA ACGTGTTCTA 240 CTACCACGGA TTAGTCTGCC CTTTCTTTCG GGAACCAATG TGTGGGGTAG CCGTTTAAGG 300 CAACTCCCTG GACGCACGAC GACAACCTTT TATTCGCAGT CCTAGGGCGA CTGCAGGGGC 360 AACTTGCGCT GGAATGACGG TTTAGACGGC CAGCTAGAGA GTTGCCGGAG CTGGAGTGAC 420 GGTTTAGACG GCCAGCGAGG AGGATTTGTG TGAGCGCAGC CAGCGCTACG TACCGGCAGA 480 GGAGTCGCAG TCAGCGACAT AGAGGGACGC AGCCAGCGTC GAACGCCGGT ACGAAAGGGT 540 CGCAGCCAGC GACAAGGAGA CGCAAGAAGC GTCATTTGTG GAGACCGCAG CCAAGCATCC 600 GTGGCCGCAG CCAGCGGCAC GAGGCGTCAG AGACGCCATT TCGGACGCGC AGAGGCGCCG 660 CCATTTTTGG AGCTGGGAAA GATGCAGCAT TCCCCCAGGA AGAGTGCCCG GCTGAACGGA 720 GGGGAAGTCA CCCCTATAAC AACAGTGAGT CAGCAGCCAG CCAGTAGTGG AGCAGGAACT 780 CGGACGCGGG TGAACATCAC GGCGGCGTCG ATTCCTTGCC CGGCCACTAC GGTGACTACA 840 GTAGCTTCCC AACCTAGAAG TACTGCTGTC ACAGCTGCGA GTTCAGTACC GGAGGTGAAC 900 CAGCCCCTCG TGTTGGAACT CATGGAGAGG ATCGCAGCGT TGGAGAGGGA GCTGGAGAAG 960 ACTAGATCCC TAGAAAGTGT GAGCACCGCC AATTGCGCGC CAATCGCAGT TGGCCCAAGC 1020 GCAGTTGGCG CCAACAGTGG AGCGTCGGGG CGGCCGCCAT TTTGGAGCGG CCAGCTAATA 1080 CCCACATCTA ACGGAGAGGC CTTACATAAC GGGGACTGGG CCAGGCATGC TGCAACGATT 1140 GCGCCCTTTC CCACTGTAGT CCACTTCAGC GCGTGGCTAC AGGAGTACGC AAACGTGGTG 1200 TGCACGGTTT TGGACGTCGA GGGAAAGGAG CCGAGGCGTC GACTTCTACA TGCAAGCGTC 1260 GACCATAATG AATGCGATCA ACAGGATGAT CGGCATGGAG GTTGTCCCAT CTGTGGAGGA 1320 CAGCATGAAA TATTGAACTG CAGAAAATTT ATTGGAGCTT CGCCACAGGA AAGGTGGAGC 1380 AATGTGAAGA GGCATCGGCT CTGCTTCAAT TGCCTGCGAA GCGGGCACAC GGCTAGATCC 1440 TGCTATACGC AAGGTGAGTG CCAGGTTAAT GGATGCCGAA GGGAGCATCA CCGTCTGCTA 1500 CATGGTGCGG ACGGAGGAAC GAAGGCCGCT GCAGCGAGGT GGCTTCAGAC GCCACGAAGG 1560 GAACCAGCAG CCAGCAGTTT CCAGACGCAG CCTAAAGGGG AGGCCTTCGC TACGAGATGG 1620 TCACAGGGAC CAGGAGAGGA ACCGGCAGCC AGCCGTTCCA AGCAACAGTC TGGAGAGAGG 1680 AGCTCCACGT GAAGCGGGAG CGCCCATGCA GAGGAATTTG AGCTGCGTTG ACGCCGAAGG 1740 AGGCCGTCTA CTGTTCCGTA TACTGCCGGT TACGCTGTAC GGAGCGGGGC GAAAGGTGGA 1800 TACATATGCG CTCCTAGATG AGGGATCCTC CGTCACGATG ATCGATGACG AACTACGAAG 1860 GGATCTTGGA GTGCAAGGAG AGCGTCGGCA GCTAAATATC CAATGGTTTG GTGGTAAGGC 1920 AACCAGAGAG CCTACCAACG TGGTGAGTCC GAAGATAAGT GGAGTTGGAA AGCCCACTCG 1980 CCATGTATTG AGAAACGTTT ATGCCGTTTC GAGCTTGAGT TTGCCGATGC AGACATTGAG 2040 CCGACGAGAT GTCCAGGGCG TGCACAGGGA TGCGCGTCTG CCCGATGAAG CCTTACAGCA 2100 ACGTGGTGCC GAAGCTGCTC ATCGGTCTGG ATCACGGACA TCTGGGGTTG CCACTTAGGA 2160 CGAGGCGGTT CGCTCGAGAG GGACCGTATG CGGCCGCAAC CGAGCTGGGC TGGGTTGTGT 2220 TTGGGCCTGT AAGTGGGCAA CCGACCACGC CGTCACCGAG GTCCTGCCTA CTTGCCGTGT 2280 CAGTGGATGA CGCGATGGAG AAGATGGTGG AGGACTATTT CGACATGGAG AACTTTGGAG 2340 TGAAGACCGC GCCGCCGGTC GCAGCCAGCG ACGATGTCCG GGCCCAAAGG ATACTCGAAG 2400 ACACCACGGT GAAAGTGGGG CGTCGCTACC AGACGGGATT ACTCTGGAAG GACGACCACG 2460 TTGTGCTGCC ACCGAGATAT GAGGACGACG ACGTGCAAGT GAGCTTCGTG AGTGCGAGGA 2520 CGAAGTGTGC CCCAATGAGA ACGATGACGA TCCCACGGCT GGAGCTGCAA GCAGCAGTTC 2580 TTGGAACCAG GCTGATGAAC ACTGTCAAGG AGGAGCACAG TGTGGTCATC ACGGACCTGG 2640 TGTTATGGAC GGACTCTAAG ACGGTGCTGA GATGGATCGG CAGCACCCAC CGCCGCTGAC 2700 AATGCGGCTG ATGATGCGAC GCGGTCGCAG AAAAGGAGTC GACCTTAGCC AGGAATCAAG 2760 GTGGCTAAGA GGACCTGCAT TTTTGATGCA GCCAGCAGCC AGCTGGCCGG GGTCTGAGGA 2820 AGGAACTGAG CGTGTTCCAG ATGTCCCTGA TGAAGAAGAG ATGCCCAGTG AGTTTGCATT 2880 AGTTGCGGTA GACGATTTTG TCATTCCGTT TCAGAGATTC TCGAGCTTCA GTCGCCTGGT 2940 GAGGACCACA GCCTGGGTCC TACGGTTTGC GCGCTGGTGC CGCAAACAGC GAAACGATCT 3000 CGAGGAATAC GGCCTTACCG CAGCCAGAAT GTAAGGCCGC CGGAACCGCA CTGTGCATCC 3060 CGTACAGTGC GAGGAGGGCC GTATTACTGT CACACAGGCA CAGTCTGACG GAGCTGATTG 3120 TGAGAGACTT CCACGCCAGG ATGAAGCATC AAAATGTGGA TGCTACGATC GCGGAGATCC 3180 GGACAATGTT CTGGGTCACA AAGATGAGGC GTGTGATGCG GAGAGTCATC TCATCGTGCA 3240 ACGAGTGCAA GTTGCAGCGA GCGCGGCCGA TGCCGCCGAT AATGGGACCC CATCCGGAAG 3300 ACAAACTGGA TGCGGGTGGA TGGCCATTCA AATACACAGG ACTGGACTAC TTTGGGCCAC 3360 TGCTGGTGAC TGTGTCCCGT CACAAGGAGA AGCTTGGGTC GCCTTGTTTA CGTGTTTGAC 3420 GACAAGGGCG ATTCACCTGG AGCTGGCGCA TGACCTGTCG ACGGATTCCT GCATAATTGC 3480 GATCAGGAAC TTCGTCTGCC GTAGAGGGCC AGTATATAGA CTGCGCAGCG ATAACGGCAA 3540 GAACTTCGTG GGAGCTGACA GGGAAGCCAG GCGCTTTGGC GACGTATTCG AGATGGAGAA 3600 GCTTCAGAGT GAGTTGACAA GCAGAAGCAT TGAATGGGTG TTTAATTGTC CAGCGAACCC 3660 GTCTGAGGGC GGAGTTTGGG AGCGCATGGT GCAGTGCGTC AAGAGAGTAC TGCGTCATAC 3720 CCAGAAGGAA GTTGCGCCGA GGGACCATGT ATTGGAGAGT TTCCTGATTG AGGCGGAGAA 3780 TATTGTAAAC TCGCGTCCGC TCACCCACTT GCCTGTGGAT GTGGACCAGG AGGCGCCGTT 3840 GACGCCAAAC GATCTTCTCA AGGGAGTAGC CAATCTGCCG GATACGCCTG GATTGGATGC 3900 GGAGCTGCCC AAGGAAGGTA CTACGAGGAA GCAGTGGAGA ATTTCTCGCC TGCTACGAGA 3960 CCGTTTCTGG AGGAAGTGGG TCATGGAGTA CCTGCCTACG CTTGTGCGCC GCGAGAAGTG 4020 GTGCCGACGA ACGGAGCCCA TCCACCAGGG TGATGTGGTC TTCGTCTGCG ATCCTGCCTT 4080 GGCCCGACGA GAGTGCCGCA AGGGTATCGT GGAGGAGATC TACAGCGGAG CTGATGGAGT 4140 TGTCAGACGC GCTAAGGTGC GCGTGAACGA AAACGGCCTA TCTAGGACAA TGATGCGACC 4200 CGTCTCTAAA CTTGCAGTTA TGGATTTGAG TGAAGCGGTT CTTCACGGGG TCGGGGATGT 4260 CGCGGATCGA ATATTGTTAT CGATAGGCTC TAGTTAGTAT TTTTGAGAAG TCCGAATGTG 4320 GAAGGATTTG TAAGCCCATA TGTGTCTGGG CACGTTGTTT TTGGCCATTG TAAATTACCG 4380 GGAAAATTTA GCTTTTCATT GTCGTGTAAG AGTTGGAGGA CACACTGCGG TGAGCTAATA 4440 AGTTAAGTTA GTTGCAATTG TGAAACATTG AATTCTTCCA GAATAAAACG TGTTCTACTA 4500 CCACGGATTA GTCTGCCCTT TCTTTCGGGA ACCAATGTGT GGGGTAGCCG TTTAAGGCAA 4560 CTCCCTGGAC GCACGACGAC A 4581 // ID DMBARI1 standard; DNA; INV; 1728 BP. XX AC X67681; S55767; XX DR FLYBASE; FBte0000034; Dmel\Bari1. XX FT source X67681:1..1728 FT SO_feature terminal_inverted_repeat ; SO:0000481:1..28 FT SO_feature terminal_inverted_repeat ; SO:0000481:1701..1728 FT SO_feature CDS ; SO:0000316:379..1398 FT /name="Dmel\Bari1\ORF" FT /db_xref="FLYBASE:FBgn0043784" FT /db_xref="SPTREMBL:Q24258" FT /db_xref="NCBI_PROTEIN:CAA47913.1" FT /translation="MPKTKELTVEARAGIVARFKAGTPAAKIAEIYQISRRTVYYLIKK FT FDTVGTLKNKKRSGRKPVLDQRQCRQILGVVAKNPSASPVKIALESKNTIGKQVSSSTI FT RRRLKEADFKTYVVRKTIEITPTNKTKRLRFALEYVKKPLDFWFNILWTDESAFQYQGS FT YSKHFMHLKNNQKHLAAQPTNRFGGGTVMFWGCLSYYGFGDLVPIEGTLNQNGYLLILN FT NHAFTSGNRLFPTTEWILQQDNAPCHKGRIPTKFLNDLNLAVLPWPPQSPDLNIIENVW FT AFIKNQRTIDKNRKREGAIIEIAEIWSKLTLEFAQTLVRSIPKRLQAVIDAKGGVTKY" XX CC Derived from X67681 (g7640) (Rel. 36, Last updated, Version 6). CC Takis Benos and Michael Ashburner, 20-Aug-1997. CC Any changes to original sequence record are annotated in an FT line. XX SQ Sequence 1728 BP; 596 A; 291 C; 332 G; 509 T; 0 other; ACAGTCATGG TCAAAATTAT TTTCACAAAG TGCATTTTTG TGCATGGGTC ACAAACAGTT 60 GCTTGTGCAG CAAGTGGGGG GAGGTGAAAT GCAAAAAAAC TTTTGCTTTT GCAAATTCAA 120 ACCTATGCAG AGTCAGATGA AAGAAGAATT GAAAAAATAA CTGTTCCTAT GCGCAAGGAA 180 GAGGCAAATG AAGAGATCTT TATCAGTTGT CAGAAGTATT TGCACACGGT TTCGTCGCAT 240 CACAATTATT TTCACAACGC AATTTCTTCT TCAGTGATTG GTTTAGAGTG ACAAGTGCCG 300 GTTTGTTTGC TTAAATACAT TTAAATTATT GAATAAAAAT TAGATTTAAT CATTTTCCTA 360 TTACAGTTAT TAAATAAAAT GCCCAAAACA AAAGAGTTAA CAGTTGAGGC CCGGGCTGGT 420 ATTGTTGCTA GGTTTAAAGC CGGTACACCT GCGGCCAAAA TAGCTGAAAT ATATCAAATT 480 TCGCGTAGAA CTGTCTACTA CTTAATAAAA AAGTTTGATA CAGTTGGCAC ATTAAAAAAT 540 AAAAAAAGAT CAGGCCGAAA ACCTGTGCTG GACCAAAGGC AATGCAGGCA AATACTTGGA 600 GTTGTGGCGA AGAATCCTAG TGCCAGTCCG GTAAAAATTG CCTTAGAATC AAAAAATACA 660 ATTGGCAAAC AAGTTAGTAG TTCTACAATT CGTCGCAGGC TAAAAGAAGC TGATTTTAAG 720 ACATACGTTG TTCGCAAAAC GATTGAGATC ACACCAACCA ACAAAACAAA ACGTCTTCGA 780 TTTGCGTTGG AATATGTTAA GAAGCCTCTT GACTTTTGGT TTAATATTTT ATGGACTGAT 840 GAGTCTGCAT TTCAGTACCA GGGGTCATAC AGCAAGCATT TTATGCATTT GAAAAATAAT 900 CAAAAGCATT TGGCAGCCCA GCCAACCAAT AGATTTGGTG GGGGCACAGT CATGTTTTGG 960 GGATGTCTTT CCTATTATGG ATTCGGAGAC TTGGTACCGA TAGAAGGAAC TTTAAATCAG 1020 AACGGATACC TTCTTATCTT AAACAACCAT GCTTTTACGT CTGGAAATAG ACTTTTTCCA 1080 ACTACTGAAT GGATTCTTCA GCAGGACAAT GCTCCATGCC ATAAGGGTAG GATACCAACA 1140 AAATTTTTAA ACGACCTTAA TCTGGCGGTT CTTCCGTGGC CCCCCCAAAG CCCAGACCTT 1200 AATATCATTG AAAACGTTTG GGCTTTTATT AAAAACCAAC GAACTATTGA TAAAAATAGA 1260 AAACGAGAGG GAGCCATCAT TGAAATAGCG GAGATTTGGT CCAAATTGAC ATTAGAATTT 1320 GCACAAACTT TGGTAAGGTC AATACCAAAA AGACTTCAAG CAGTTATTGA TGCCAAAGGT 1380 GGTGTTACAA AATATTAGTA TTGTATTTAT ATAAAATAAA GAAATTCTTA TGTTGAAATT 1440 AGATGTTAAG CTGAAATTTA CTAAATTAAG TTGAGTGAAA ATACTTTTGA AGCGCAATAA 1500 ACATGTGAAA ATACTATTGA CAACTTGCAT GCATATTTTC TTTTGCTTTA AGCTTTGTAC 1560 TATGAACCGT TATCTTTCGT ATTTCTTTTC GACTACCTTC TGCATAGATC AAGCTAAGCG 1620 ATAAGAACTA TTTCAGGCAA ATCGGACAAC AACAAGAAGA AATATAACAA AAAGAAGTTG 1680 AAGTTTGCAA ATATTGTGCG TTGTGAAAAT ACTTTTGACC ACCTCTGT 1728 // ID BS standard; DNA; INV; 5142 BP. XX AC nnnnnnnn; XX DR FLYBASE; FBte0000780; Dmel\BS. XX FT source nnnnnnnn:1..5142 FT SO_feature CDS ; SO:0000316:341..2248 FT SO_feature CDS ; SO:0000316:2245..2965 XX CC Sequence identified by REPBASE: CC http://www.girinst.org/server/RepBase/RepBase6.6.embl/drorep.ref CC Assembled and annotated by Josh Kaminker & Michael Ashburner. CC REPBASE states this to be a consensus sequence. CC This replaces that from complement(X77571:651..5776) in versions CC previous to 4.8. XX SQ Sequence 5142 BP; 1652 A; 1222 C; 1075 G; 1193 T; 0 other; AAATCTGCAT TCATAGAGAT CGGTTGTGTC GCGCGTATGC AAAAGTGATC TATTTTGCTT 60 TATTGTTGCA ATTTCTTGGG TGCTTAAAAT AGCACTCACC AGTACATTCG GGCGCTGCTT 120 CGTGCGGTGT CGGCATCTGG CCAACAACAA AAAGCGTTAA TCGAAGTGCG GTGTAGCTAC 180 GATACCTGCC CTTCGGGCAA CTTATTCCCC TCACCCCGCG CAAAGCCGCT GAAGGGGGCA 240 ATAAAATCTA TGCTTATCAG CAAAACTGAT CCGTATTTGA TCTGTTTTGT GGTCAGTTAA 300 GCAAGCTATT TTGTAAATAT TAAGAATTAT TATTAAGACA ATGGATGAGA ACAATTCTGA 360 TGACACCCAG CTTTTAAATA AGCAGAGTAA CCATAGAACA ATGTTCTCAA TAGCTGGCAA 420 ATTACCTCAC GAGATTAGAA ACGAGTGCCG ATCAGCAATT CAACGCTTTA CAAGCAGCGT 480 AACTCAAAGC AGTAGCGTCA CCACAACAAC GGTGACATTT ACTAGTGCCA ATAACAGCAC 540 CATATATACA ATGGCAAATG CCGCAATAAG CAGCCCGTGC CTTGGAACAA GATCCACTCA 600 CCAGGAAAGT TCCACATTGA TAAACTCCGG AATCGTAGAA GATAATCTCA GCGATGCTGC 660 CAGAAGGTTA TTAAATGACC AAAATCAGAG AGCGGGTAAA AGGAAAAATG GAAAGCCCTT 720 GTCCCCCATC TCCAACCCGA AAAGAGGGAG TAGCAGCCAA GTTTTACACT CGCCCCCTAC 780 GACTAGCCTG AAGATAAGCT CTAATAATAG GTTTGCCATT CTGGACACGG ATATTTCTAC 840 TAACGAAGAA AGCGTGGAAG GCATGATGAT AGAGGGTGCT GATATTGACA GTGCCCATAT 900 GGATGATTCT CAACTCGATG GTTCCAATAC TGGTCGAAAC TTGCAGGAAA CACACAATAC 960 AGCCAATCAA CTTAATGATC ACAAAAAACC ACCACAAATT GTTGTAAATA TCAGAAACTT 1020 GAATGATCTG TTTGAGCTTA TAAAAGAAAA GACAAGCTTA GATAACGTTG TCGTTAAAGC 1080 TAATCAAGGG GAAACGGTCA GAATATTTCC AAAAGACAGC GACACTTACA GGAAAATAGT 1140 GAGCCATATG GATGACATTG GTATTCAGTT TCACACTTAC CAAATGCTGA CAGATAAGCC 1200 ACACAGAATT GTAGTAAGGG ACTTACATCA CAGTACATCA AACAAAGACA TAACCGCCGA 1260 TCTGAAATGT TTAGGCTACG AAGTGCTCCA CATTCACAAC CCTAGTTCTA GGACTAATAA 1320 GGACGAAAAA CTAAACATCT TTTTCATTAA TATAAAGCCC TGTGCAAAAA TTAATGAAAT 1380 TTACCATGTC AAGACCCTTT GCCGACAGAA AATACGGATT GAAAGGATGA GAAAGTCTTC 1440 TGAAATTGCG CAATGTCGTC GTTGTCAGGA GTACGGCCAT ACAGCTAAAT ACTGCCGCAG 1500 ACACCCAAAT TGTGCCAGAT GTGGCGAAAA TCACCAAACC ATGCAATGCA CCCGACCGAT 1560 AGACGCACTG CCCACATGTT ACCATTGCTC TGAAAATCAT ACGGCTAGCT TCAAAGGTTG 1620 CCTAAAGTAT CAGGAGCTTC TTCGCAGATC TATGGGGCCT GCAAGAAATG GAAACAGGTT 1680 AAATAAGAAC ACCCATCATC ACTCTCCTAG AGACCGGCAA GAGCTTCCTG CCTTGCAGCC 1740 CAATTACCGC AAGAACAACA CCCAATCAAC AGTACAGCAG TTATCGACAC AACCACAGCT 1800 TAATTTTGCC CAAAGCCAAC CATCTATAGG CACTGGTGGA AACAGAGCAG TATCCTATGC 1860 TACAGTAGTA AAAGGATACC CAAAAATAGC GCCCTCCAAG GACGGACCAG CCCAGCGTCA 1920 ACGCTTAAAC AACCCACAAA CGAAACAAAT ACTGCAGCAA CACCGATCGA ATACACAGCA 1980 GAATAACTCA TCTGATGTGC AAGTATTCTT ACAACAGCAA CAACAACAGT TTCTGGAATG 2040 GCAACAGCAG ATCCAACAAC AACAACACCA ACAGTTTCTT ATGTGGTTGC AACAGCAGCA 2100 GCAAGAACAA CTACAGTATA AAAGCCAAAC CAATCAACGA CTGGAAAAGC TTGAAAAAAT 2160 GGTTCTTGAA CTAGCGAATA TGTTAAAAGA ATGGGCTGGG AGTGAACTTA AGCCCCAGCT 2220 CTTTAACAAC GTCTCAGCCT CCCTATGAAT CCACTAAAGA TTCTTATTTG GAATGCTAAC 2280 GGCATTTCAA GAAAAGCCAA AGATGTTGAG CTGTTCGCGC ACAACAAAAA GATAGACATC 2340 CTTCTTGTGA CTGAACTAAG ACTCAAAAGA GGGGAAACTG TAAAGATATA TGGATATGCG 2400 TACTATCCAG CATATAGGCC ATCCCTTAAT AATAATAGTG TTGGCGGAGT AGCGGTGTTC 2460 GTGAGGACAA CTCTTCGCCA CTTTCCACAA AGGGTCATTG AGACACGCCA CATACAATTG 2520 TCATCAGTAA AAGTAGCCAC AGGACTCGGG GACCTGCAGT TTAGCGCTAT TTACTGCTCC 2580 CCAAGTACTA GAATCGAGGA AAGACATTTT ACTGACATAA TACGCGCCTG CGGCCAAAGG 2640 TACTTGGTAG GTGGCGACTG GAATGCCCGC CACTGGCTTT GGGGCGACAC TTGCAATTCA 2700 CCTCGCGGGC GGGAACTAGC AGAAGCCTTG TCCGTGACTG GAGCTAAGAT CCTCGCAACT 2760 GGCTCTCCGA CAAGGTATCC GTATGTGCCC AGCCATACGC CCTCATGCAT AGATTTCGCA 2820 GTGTATCATG GTATACCAGA CCACCTAGCA ACTATAACAC AAAGCTGGGA CTTGGATTCT 2880 GATCACTTGC CTCTTATCAT TAGCATTGAG ACAGACAGTA TTCATGTCAA TCCAAGTCCC 2940 AGGCTAGTCA CCAAACACAC TGACCTCCTT GCCTTTAGCC GACAATTGGA GAGCCTTATT 3000 TCGCTGAACA CCACGCTTAA TTCTGGTGAG GAAATTGAAA TGGCTGTTGA CAACCTAACT 3060 GAAAGCATAC ATAGGGCCGC GGCTGTCTCT ACTTCTCCCG TCCCTCGGAT AGGCACCACA 3120 TATGGGATAG TCTTGACAAG AGAGGCTAGA GAGCTTCTGA CACAGAAAAG AAGACTCCGA 3180 AGGCGAGCAA TCCGATCTCA AGACCCCTGG GACCGACTTT TATGGAACCG TGCTGCAAAG 3240 CAACTACGAA ACGTCCTCAG AGAACTTCGA AGCAACTTTT TTGAGCAGAA ACTAGCTAGT 3300 ATGGACTACA CAGTGGATGC TGGATACTCG CTATGGAAAT GCACCAAGTC CCTTAAAAGA 3360 CAGCCGTTTA GACAGGTTCC TATAAGGTGT CCGGGAGGCG AACTTGCTAA AAATGAAGAG 3420 GAGCAGGCTA ATTGTTTTGC AAATCATCTG GAGACAAGGT TCACCCACTT CCAATTCGCT 3480 ACAACGGAGC AGTATCAAGA GACGCTTGAT AGCCTAGAGA CACCTCTGCA AATGTCACTA 3540 CCCATTAAGC CCATCAGGGT TGAGGAAATT GTCGAAGCTA TCAAATCTCT TCCGTTAAAG 3600 AAGTCTCCTG GCATCGACAA CGTTTGCAAT GCCACACTAA AAGCACTACC TGTTCGAGCA 3660 ATTCTCTACT TGGCGCTGAT ATATAATGCC ATACTCAGGG TGCAGTTTTT CCCAAAGCAG 3720 TGGAAAATGG CAGCAATCCT AATGATACAT AAGCCTGGTA AACCTGAAGA GAGCCCTGAA 3780 TCGTACCGAC CCATAAGTCT TTTATCTTCG CTATCCAAGC TATGGGAACG ACTGATTGCC 3840 AACAGATTAA ATGACATTAT GACCGAGCGT CGTATCCTGC CGGATCATCA GTTTGGCTTT 3900 CGTCAGGGAC ACAGTACTGT GGAGCAGGTA CACAGACTGA CAAAACATAT CCTTCAGGCC 3960 TTTGATGATA AGGAATACTG CAATGCTGTG TTCATTGACA TGCAACAGGC ATTCGATAGG 4020 GTCTGGCATG ACGGCCTTAT CAGCAAAGTT AAAAAGTTAT TCCCAGCACC ATACTATGGA 4080 GTCCTAAAAT CATACTTGGA AGATCGGAGA TTCATGGTCA GGGTCAGAAA CTCCTACTCG 4140 ATTCCCCGCG TTATGAGAGC TGGAGTTCCG CAGGGCAGCG TACTGGGACC GTTGCTCTAC 4200 TCAGTATTTA CTGCAGATCT GCCCTGCCCA AACGCCTATC ATATGGCAGA TCCCAGGAAG 4260 GCCCTTCTTG CTACGTACGC TGACGATATT GCCCTGCTGT ACAGCTCTAA TTGTTGCAAC 4320 GAGGCAGCAA GGGGTCTCCA AGAGTACCTC ACCACTCTGG CTGCATGGTG CAAAAGATGG 4380 AATTTAAAGG TCAATCCGCA AAAGACCATC AATCCCTGCT TCACCTTGAA GACCTTAAGT 4440 CCCGTCACCG CACCCATAGA GCTGGAAGGT GTAATCCTAG ATCAACCTTC ACAGGCTAAG 4500 TACCTCGGGA TTACCCTTGA TAAACGGTTG ACTTTCGGCC CGCACCTGAA AGCTACGACT 4560 CGGAGATGTT ATCAAAGGAT GCAACAACTT CGATGGCTGT TAAACAGAAA AAGCACCATG 4620 ACACTGAGAG CCAAAAGAGC AGTCTACGTC CACTGCGTAG CCCCGATCTG GCTGTACGGA 4680 ATACAGATCT GGGGTATCGC AGCAAAATCC AACTACAACC GCATTCAGGT ATTGCAAAAT 4740 CGTGCCATGC GTGCAATTAC AGACTGCCCA TACTATGTAC GTGGCACTAC CCTTCACCGT 4800 GATCTGAATC TTCATACAGT GGAAGAGCAG ATCTCCAGGC ACACCAGCAG ATATAGTGAT 4860 AGACTAAGAC GACACCACAG TATACTTGCT AGACGCTTAC TCCCTGCTAG GCCTCTAAGG 4920 AGATTAAAAA GGAAGGGTTT CGCCAAAACA CTTGGACAAC CCTAAAGACC CCCTCGAAAT 4980 ATGAGACAAA GTTGTAAGTC CTCACATGAT TAGTGAGAGG TTTGGTTCTA TCTTTTATAT 5040 GTTAATTGCG CTGTTATGTT ACTGTTATTG CATTGTATTG ATTCATCGCT TCTAAATAAA 5100 TAATAAAAAA AAAAAAAAAA AAAAAAAAAA AAAAAAAAAA AA 5142 // ID DMU89994 standard; DNA; INV; 6411 BP. XX AC U89994; XX DR FLYBASE; FBte0000739; Dmel\Burdock. XX FT source U89994:1..6411 FT SO_feature five_prime_LTR ; SO:0000425:1..275 FT SO_feature three_prime_LTR ; SO:0000426:6136..6411 FT SO_feature CDS ; SO:0000316:564..2057 FT SO_feature start_codon ; SO:0000318:1..3 FT /name="Dmel\Burdock\gag" FT /db_xref="FLYBASE:FBgn0043782" FT /db_xref="SPTREMBL:O01350" FT /db_xref="NCBI_PROTEIN:AAB50147.1" FT /translation="MSDSDNLLDNLVSSLNKWSAHQASRQNSAEKNNKSSDNWWSKTKT FT TSEMEFEAQLKAIVESAVAGALAVQKQSFEKQLQEMNERIGKLTVNTPEVETYVDAEIR FT PGVVCSEPLDILKSLPDFDGKSETYVSWRKAAHVAFKVFKDYEGSSTFYQALGIMRNKI FT KGPANTVLASFNTPLHFKAMISRLDFTYSDKRPIYLIEQELSTLRQGDMTLTEFYDEVE FT KKLTLLTNKTIMTFDSALAMSLNEKYRTDALRVFVTGAKKSLSDILFAKGPKDLPTALA FT LAQEVESNHERYQFALIYSKNIGDRGQKIEQRHSDKDRNSIMPMQTKNPYFSKRQVHTY FT DNQERQDPVQLTNPDVSMRSRRTGNFGQTPFPTQGNIWPSQQQNSWPSQQQYSWPSQQQ FT NSFRTQNQFASQPQQQNTSQAQGHFGYAQASKRPTSGSARFTGPKQQRINYLPHEKGQC FT EEDTDGYQKEAEAEVDDYEDELVNYDHVHFLATNPCYRT" FT SO_feature CDS ; SO:0000316:<1994..5119 FT SO_feature start_codon ; SO:0000318:1..3 FT /name="Dmel\Burdock\pol" FT /db_xref="FLYBASE:FBgn0043781" FT /db_xref="SPTREMBL:O01351" FT /db_xref="NCBI_PROTEIN:AAB50148.1" FT /translation="GRTSELRSCSFFSHKSLLPYIEREIAGRTIKLLIDTGASKNYIQP FT LPELKNIMPVQNKFTVKSLHGCNTVKQKCFIKLFNTSVQFFILPSLSSFDAIIGLDLLK FT QGNATLDFKNKTLNINNEVESIQFLRCDSVNFANIENIVVPNQISNKFHTMLRNRLAVF FT AEPEEALPYNTNIVATIRTEDDQPIYSKLYPYPMGVSDFVNKETHALLKDGIIRPSSSP FT YNNPVWVVDKKGTDEEGNTKKRLVIDFRKLNLKTIDDKYPIPNVVWILSNLGKARFFTT FT LDLKSAFHQILLAEKDRAKTAFSVGNGKYEFCRLPFGLKNAPSIFQRAIDDVVRDRIGK FT SCYVYVDDVIIFSNGIEDHVNDVAWVLDRLSGANMRVSKEKSFFFKESVEYLGFMVSSG FT GITTSPSKVEAIQKYNQPTNLFSVRSFLGLASYYRCFIKDFASIARPLTDILKGENGKV FT SASQSKKIPISFDERQCSAFEKLKNVLVSENVMLLYPDYRKAFDLTTDASAFGLGAVLS FT QDGKPVTMISRTLQDRELNFATNERELLAIVWALKSLRNYLYGVKNLNIFTDHQPLTYA FT VSDRNPNAKIKRWKAFIDEHNAKIFYKPGKETYVADALSRQAIHVLEDEPQSDIATIHS FT EISLTFTIETIDKPVNCFRNQIVIDEGTADSTRTFVIFGSKTRHLIQFLDKETLIGRIR FT DVVKPDVVNAIHCELPVLAFIQNSLVNDFPATTFRHTMKMVSDIFNQTEQREIVSLEHN FT RAHRAAQENVKQILQYYFFPKMSQIAATFVSNCLVCQKAKYDRHPQKQILGRTPIPSHV FT GETLHIDIFSTGRNYFLTCIDKFSKFAIVQPIGSRTITDLEPAIMQLMNFFPHSKTIFC FT DNEPSINSESIKSLLKNRFNVDIANAPPLHSTSNGQVERFHSTLLEIARCLKLDSGMND FT TVNLILQATIEYNKTVHSVTNRRPIDIIHSTPPELANEIVEMVNEAQEKQLRRENVTRR FT DRTFEVGETVMVKQNNRLGNKLTPRYREELIEADLGTTVLIKGRVVHKDNLR" XX CC Derived from U89994 (g1905850) (Rel. 51, Last updated, Version 1). CC Takis Benos and Michael Ashburner, 20-Aug-1997. CC Any changes to original sequence record are annotated in an FT line. XX SQ Sequence 6411 BP; 2219 A; 1259 C; 1204 G; 1729 T; 0 other; AGTTAACACA ATCACAAAAC ACCCGAAATA TAGTCGTAAG CCTCAAGTGC TTTTCCCATC 60 TATAGATCGA GCTTTACCTA TAAGAAACTG TAACTTGTTA AGCTTTAGAG ATAAGAACTC 120 TTGCTATACT TAAGTCAGTC GATTTTGGAA GATTAGAAGC GTCGGTCATC GCCACGTACT 180 TACTATTCGT CTCATTAAGT GCAGACCGCG CAAGCCTATT GTAATTAATA AACTTACGCT 240 AATAAATATA TGGAAAATCT ACTAAAATGA TAATTGGCGC CCAAACGGAT ATAAAAACCT 300 ACGATAACTG AATAATTATA AATAAATAAC AAAAGGAGGA TCCGGAGACA AAACCAGCGG 360 CTTTGGCTAA TTAACTCTAA CCTAAGAAAT AAAAATTTGC TGATTACATA AAATATAATA 420 TTAATTACTA AGACCATCTA CCTTAAAATT GTTTGTTAAT CACTATTATT ATATTGTAAG 480 TATAACGCTT ATTGAACGAA TTAAAAATAT TATTATTATT ATTATATTAT AACCTATGCA 540 AAGAGTATTG ATAATAAAAA TACATGAGTG ACAGTGATAA CCTTTTAGAC AACCTAGTGT 600 CAAGCTTAAA TAAATGGTCA GCGCACCAGG CAAGTAGGCA AAACAGTGCA GAAAAAAATA 660 ATAAGTCATC AGATAATTGG TGGTCAAAAA CAAAGACAAC TAGCGAAATG GAATTTGAAG 720 CTCAGTTAAA AGCGATCGTA GAGAGTGCTG TTGCCGGTGC GCTCGCAGTC CAAAAACAAT 780 CATTTGAAAA GCAATTGCAG GAGATGAATG AGCGAATCGG GAAATTAACA GTGAACACCC 840 CAGAGGTGGA AACTTATGTA GATGCTGAAA TTAGACCAGG TGTTGTCTGT AGCGAGCCTC 900 TAGATATACT TAAATCTCTG CCAGATTTTG ATGGCAAAAG TGAAACATAT GTGTCGTGGA 960 GAAAAGCGGC TCATGTCGCT TTTAAAGTTT TCAAAGATTA CGAGGGAAGT TCAACATTTT 1020 ACCAAGCTCT TGGTATTATG CGAAATAAAA TAAAAGGTCC AGCGAATACA GTATTGGCTT 1080 CTTTTAATAC TCCGTTACAT TTCAAAGCAA TGATCAGCCG TCTTGATTTC ACATATTCTG 1140 ACAAAAGGCC GATCTATCTA ATCGAACAAG AGCTATCAAC TTTGCGACAG GGAGACATGA 1200 CTCTTACTGA ATTCTACGAT GAAGTCGAGA AAAAACTGAC CCTACTTACC AACAAGACAA 1260 TAATGACATT TGATAGTGCC TTGGCGATGT CACTGAATGA AAAGTACAGG ACGGACGCGT 1320 TACGTGTATT TGTAACCGGA GCTAAGAAAT CGTTGAGCGA CATTCTTTTT GCAAAAGGTC 1380 CAAAAGATTT ACCAACTGCT CTCGCTTTAG CGCAAGAGGT CGAGTCGAAC CATGAGCGTT 1440 ACCAATTCGC CCTTATTTAT TCTAAAAATA TTGGAGACAG GGGTCAGAAA ATCGAACAAA 1500 GGCACAGCGA TAAGGATAGA AACTCAATCA TGCCCATGCA AACTAAAAAC CCATATTTTA 1560 GCAAGCGTCA GGTGCATACT TATGATAACC AGGAAAGACA AGATCCAGTC CAGTTAACAA 1620 ATCCTGATGT ATCCATGCGA TCTAGAAGAA CTGGAAATTT TGGACAAACT CCATTTCCGA 1680 CTCAGGGAAA TATTTGGCCA TCCCAACAGC AAAATTCTTG GCCATCTCAA CAACAATATT 1740 CTTGGCCATC CCAACAACAA AATTCATTTC GAACACAAAA TCAATTCGCA TCGCAACCCC 1800 AACAGCAAAA CACAAGTCAG GCTCAGGGAC ATTTTGGGTA TGCGCAAGCA TCAAAAAGAC 1860 CAACGAGTGG CAGTGCAAGG TTTACAGGGC CAAAACAGCA GAGGATCAAC TACTTACCTC 1920 ATGAGAAAGG TCAATGTGAG GAAGATACAG ACGGTTATCA AAAGGAGGCA GAAGCGGAGG 1980 TTGATGATTA TGAGGACGAA CTAGTGAATT ACGATCATGT TCATTTTTTA GCCACAAATC 2040 CCTGCTACCG TACATAGAAA GAGAGATAGC AGGGAGAACC ATAAAACTTT TGATTGACAC 2100 CGGGGCTTCG AAAAATTACA TACAGCCCCT CCCTGAATTA AAAAACATAA TGCCGGTACA 2160 AAATAAATTC ACGGTAAAAT CGCTTCATGG TTGCAACACC GTCAAACAGA AATGCTTTAT 2220 TAAGCTATTT AACACATCTG TTCAATTCTT TATTCTTCCA AGTCTCTCTA GTTTTGACGC 2280 AATAATAGGA CTTGACCTTT TGAAACAGGG AAATGCAACG TTAGATTTTA AGAACAAAAC 2340 GTTGAATATC AACAATGAAG TGGAATCTAT TCAGTTTTTG AGATGTGACA GCGTAAATTT 2400 CGCCAACATA GAGAATATTG TGGTTCCAAA TCAGATATCT AATAAATTCC ATACAATGCT 2460 TCGAAACCGA TTGGCCGTCT TTGCGGAACC GGAAGAAGCA CTGCCGTATA ATACCAACAT 2520 TGTTGCCACA ATACGTACTG AGGACGACCA ACCCATTTAC TCAAAACTCT ATCCGTACCC 2580 CATGGGCGTA TCGGATTTTG TGAATAAGGA GACACATGCT TTGTTAAAGG ACGGAATTAT 2640 CAGGCCCTCG TCGTCACCTT ACAACAATCC GGTTTGGGTA GTCGATAAAA AAGGTACAGA 2700 TGAAGAGGGA AATACTAAGA AAAGGTTGGT TATAGATTTT AGAAAACTAA ATTTAAAAAC 2760 AATCGACGAC AAGTACCCTA TACCAAACGT AGTATGGATC TTGTCAAATT TGGGAAAAGC 2820 CAGATTCTTT ACAACCCTTG ACCTTAAATC GGCGTTTCAC CAAATTCTGC TCGCAGAAAA 2880 GGATAGAGCG AAAACTGCCT TTTCAGTAGG AAATGGAAAA TACGAGTTTT GCCGTTTGCC 2940 GTTTGGCTTG AAAAATGCCC CAAGTATTTT TCAACGTGCT ATTGATGATG TTGTTAGGGA 3000 CCGTATAGGA AAGTCATGTT ACGTTTACGT TGACGACGTA ATAATATTTT CAAACGGAAT 3060 TGAGGACCAC GTAAACGACG TTGCTTGGGT ACTAGACAGA CTGTCTGGGG CAAACATGAG 3120 GGTTTCTAAA GAGAAATCGT TTTTCTTCAA GGAAAGCGTC GAGTATCTCG GATTCATGGT 3180 GTCAAGTGGA GGTATCACAA CCAGTCCTAG CAAAGTAGAG GCTATTCAGA AATATAATCA 3240 ACCTACTAAT CTGTTTAGTG TTCGATCGTT TTTAGGGCTA GCAAGTTATT ACCGCTGCTT 3300 TATTAAGGAC TTCGCCTCTA TTGCTAGACC ACTCACTGAC ATTCTGAAGG GTGAAAACGG 3360 AAAGGTTTCC GCAAGCCAGT CTAAAAAGAT ACCAATTTCT TTCGATGAAA GACAATGTTC 3420 TGCTTTTGAG AAGCTTAAAA ATGTTCTTGT CTCCGAAAAT GTAATGTTAT TGTATCCCGA 3480 TTATAGAAAA GCCTTTGACT TAACAACAGA CGCTTCGGCT TTTGGCCTGG GGGCAGTCTT 3540 ATCACAGGAT GGCAAGCCTG TTACAATGAT TTCGAGAACT TTACAGGATA GAGAACTTAA 3600 TTTCGCAACA AATGAACGAG AACTTTTGGC CATCGTTTGG GCTTTAAAGT CTCTTAGGAA 3660 CTATCTATAT GGTGTCAAAA ACTTAAACAT TTTTACAGAT CACCAGCCGT TAACATACGC 3720 CGTGTCAGAT AGGAATCCAA ATGCAAAAAT CAAGAGATGG AAGGCGTTTA TAGACGAACA 3780 TAATGCTAAA ATTTTCTATA AACCTGGCAA GGAGACCTAT GTTGCCGATG CACTATCCAG 3840 GCAGGCTATT CATGTCCTAG AGGACGAACC CCAGTCAGAC ATTGCAACAA TACATAGCGA 3900 AATTTCATTG ACTTTTACAA TCGAAACTAT CGACAAGCCG GTTAACTGTT TTAGAAACCA 3960 AATTGTGATA GATGAGGGCA CCGCAGACTC AACTCGAACT TTTGTTATTT TCGGAAGCAA 4020 GACAAGGCAT CTAATACAGT TTCTAGACAA AGAGACCTTA ATCGGAAGAA TTCGTGATGT 4080 GGTTAAGCCG GATGTAGTGA ATGCGATACA CTGCGAATTA CCTGTACTAG CTTTCATTCA 4140 AAACAGTCTT GTAAATGACT TTCCAGCAAC AACCTTCCGA CACACTATGA AAATGGTCAG 4200 CGACATTTTT AATCAAACTG AGCAACGGGA AATAGTGTCT TTGGAGCACA ACAGAGCGCA 4260 TAGGGCAGCA CAGGAGAATG TAAAACAAAT TCTTCAATAC TACTTTTTCC CTAAAATGTC 4320 ACAAATAGCC GCTACCTTTG TTTCTAACTG CTTGGTTTGT CAAAAAGCCA AATACGACCG 4380 CCATCCGCAA AAGCAAATCC TCGGGAGAAC ACCTATTCCG TCACATGTAG GCGAGACATT 4440 GCATATTGAT ATATTTTCTA CGGGCAGGAA TTACTTTTTG ACATGTATTG ACAAATTTTC 4500 CAAATTCGCT ATTGTGCAAC CAATCGGCTC TCGAACGATA ACTGATTTAG AACCTGCAAT 4560 TATGCAACTA ATGAACTTTT TTCCCCATTC AAAGACAATA TTTTGTGACA ATGAACCGTC 4620 CATAAATTCC GAGTCAATCA AGTCACTTTT GAAAAATCGT TTTAATGTTG ACATAGCGAA 4680 CGCACCTCCA CTTCATAGTA CCTCAAACGG ACAGGTTGAA AGGTTTCACA GCACGCTTTT 4740 AGAAATAGCT CGATGCCTGA AACTTGACAG TGGAATGAAT GATACAGTCA ACCTTATTCT 4800 TCAGGCAACA ATAGAATACA ATAAGACGGT GCACTCAGTC ACCAATAGAA GACCGATCGA 4860 CATTATTCAT TCAACTCCTC CCGAATTGGC TAACGAGATA GTAGAAATGG TTAACGAAGC 4920 TCAGGAAAAA CAGCTAAGAA GAGAAAATGT AACAAGACGA GACAGAACCT TTGAGGTGGG 4980 AGAAACCGTC ATGGTAAAAC AAAACAATCG CTTGGGAAAT AAACTAACCC CACGGTATAG 5040 GGAAGAACTA ATCGAAGCAG ACCTCGGGAC AACGGTCCTC ATAAAAGGGA GGGTCGTTCA 5100 TAAAGATAAT CTACGCTAGG TTTAGTATTT CTTTTCCTTT TGTGACCATC GCCAAGTTAG 5160 CAAAATACAA ACGTGAAATC TGAACACTAG TAAAAGAGTT TGCAAACATT TTTCAATTAA 5220 ATATTTGTCA AATCCTTCTT ATTTAATCTT TAAACATTTT GTATTATTTC CGCTTCATCC 5280 TCTTTAGAAA ATTTTAAAGG TATGTGATGA AATGCTAGAC CCGAATGATT TGAAAACTTA 5340 AAGTCCACGC AACCACAAAT ATTTCCTGAA ACTACCATAG AAAATAAATG CATTACCAAA 5400 ACGGCATAAT AACAGTATAG CGCACTCACT CTAATTAGAT TTCAAATTCC CGATTAAAAA 5460 AAAAATAAAA CACTAATGTT ATCAATACCC TTTCCTGATT CTGTTCAACT AAAATAGGAA 5520 AATCAATACT TGCAATCAAT AAGCGTTTTA CTACATACTT TAATATCAAA ATATCTGAAT 5580 GAACTTTATT ATAAAATTAT AATTGTTATA CTTAATTATT GTCAAAACTT TAGTATTAAA 5640 ACTGTAACTA CCTCTTAAGT AGATGAGAAG AGTAGAAGAG GGAATTAAGA TCTATCAACG 5700 TAGTATCTGC TAAAGACGTA AAGATGCGGC AACTATTTCT GCGCCTGGGT ACTGAAACGA 5760 CGAACTGAAT AATATCTGCC ATCAGACGCC AACCAGAGTG CGTTCAACAC ATACGTTTTG 5820 ATGGTCAACT AGTTCAACCA ACATCAGCAT CATCGTCGTC AACAAGTCGA CGGTTACAAT 5880 AAAGATTTTT TCCAAGTTCG CTACGATCAT CTCCAGAACC TTGTTGCGAA CCCATGACAT 5940 GGAGAATCAG CAGCATTTAC GAACTTCTCG GATCATCCAG ACACGCAGAG CTGCCTTCCC 6000 TTCGATGGTT TAACGCAGTA CCAGGTTGGC AGTATGGGAA CTTAGTGCAC AACCAATGTT 6060 ACCCGTAAGA TCCGCTTTCA AATAGATTTG CCAATTGTAA AAAGTCTGTG GACAGCCTTC 6120 GTCTTAGAAG GGGAGGAGTT AACACAATCA CAAAACACCC GAAATATAGT CGTAAGCCTC 6180 AAGTGCTTTT CCCATCTATA GATCGAGCTT TACCTATAAG AAACTGTAAC TTGTTAAGCT 6240 TTAGAGATAA GAACTCTTGC TATACTTAAG TCAGTCGATT TTGGAAGATT AGAAGCGTCG 6300 GTCATCGCCA CGTACTTACT ATTCGTCTCA TTAAGTGCAG ACCGCGCAAG CCTATTGTAA 6360 TTAATAAACT TACGCTAATA AATATATGGA AAATCTACTA AAATGATAAT T 6411 // ID DMCOPIA standard; DNA; INV; 5143 BP. XX AC X02599; XX DR FLYBASE; FBte0000023; Dmel\copia. XX FT source X02599:21..5163 FT SO_feature five_prime_LTR ; SO:0000425:1..276 FT SO_feature three_prime_LTR ; SO:0000426:4867..5143 FT SO_feature polyA_signal_sequence ; SO:0000551:1990..1999 FT SO_feature polyA_signal_sequence ; SO:0000551:5063..5073 FT SO_feature primer_binding_site ; SO:0005850:277..291 FT /bound_moiety="tRNA:M-i-RB" FT SO_feature CDS ; SO:0000316:432..4661 FT /name="Dmel\copia\GIP" FT /db_xref="FLYBASE:FBgn0013437" FT /db_xref="SWISS-PROT:P04146" FT /db_xref="NCBI_PROTEIN:CAA26444.1" FT /translation="MDKAKRNIKPFDGEKYAIWKFRIRALLAEQDVLKVVDGLMPNEVD FT DSWKKAERCAKSTIIEYLSDSFLNFATSDITARQILENLDAVYERKSLASQLALRKRLL FT SLKLSSEMSLLSHFHIFDELISELLAAGAKIEEMDKISHLLITLPSCYDGIITAIETLS FT EENLTLAFVKNRLLDQEIKIKNDHNDTSKKVMNAIVHNNNNTYKNNLFKNRVTKPKKIF FT KGNSKYKVKCHHCGREGHIKKDCFHYKRILNNKNKENEKQVQTATSHGIAFMVKEVNNT FT SVMDNCGFVLDSGASDHLINDESLYTDSVEVVPPLKIAVAKQGEFIYATKRGIVRLRND FT HEITLEDVLFCKEAAGNLMSVKRLQEAGMSIEFDKSGVTISKNGLMVVKNSGMLNNVPV FT INFQAYSINAKHKNNFRLWHERFGHISDGKLLEIKRKNMFSDQSLLNNLELSCEICEPC FT LNGKQARLPFKQLKDKTHIKRPLFVVHSDVCGPITPVTLDDKNYFVIFVDQFTHYCVTY FT LIKYKSDVFSMFQDFVAKSEAHFNLKVVYLYIDNGREYLSNEMRQFCVKKGISYHLTVP FT HTPQLNGVSERMIRTITEKARTMVSGAKLDKSFWGEAVLTATYLINRIPSRALVDSSKT FT PYEMWHNKKPYLKHLRVFGATVYVHIKNKQGKFDDKSFKSIFVGYEPNGFKLWDAVNEK FT FIVARDVVVDETNMVNSRAVKFETVFLKDSKESENKNFPNDSRKIIQTEFPNESKECDN FT IQFLKDSKESENKNFPNDSRKIIQTEFPNESKECDNIQFLKDSKESNKYFLNESKKRKR FT DDHLNESKGSGNPNESRESETAEHLKEIGIDNPTKNDGIEIINRRSERLKTKPQISYNE FT EDNSLNKVVLNAHTIFNDVPNSFDEIQYRDDKSSWEEAINTELNAHKINNTWTITKRPE FT NKNIVDSRWVFSVKYNELGNPIRYKARLVARGFTQKYQIDYEETFAPVARISSFRFILS FT LVIQYNLKVHQMDVKTAFLNGTLKEEIYMRLPQGISCNSDNVCKLNKAIYGLKQAARCW FT FEVFEQALKECEFVNSSVDRCIYILDKGNINENIYVLLYVDDVVIATGDMTRMNNFKRY FT LMEKFRMTDLNEIKHFIGIRIEMQEDKIYLSQSAYVKKILSKFNMENCNAVSTPLPSKI FT NYELLNSDEDCNTPCRSLIGCLMYIMLCTRPDLTTAVNILSRYSSKNNSELWQNLKRVL FT RYLKGTIDMKLIFKKNLAFENKIIGYVDSDWAGSEIDRKSTTGYLFKMFDFNLICWNTK FT RQNSVAASSTEAEYMALFEAVREALWLKFLLTSINIKLENPIKIYEDNQGCISIANNPS FT CHKRAKHIDIKYHFAREQVQNNVICLEYIPTENQLADIFTKPLPAARFVELRDKLGLLQ FT DDQSNAE" FT SO_feature CDS ; SO:0000316:join(432..1605,4555..4661) FT /name="Dmel\copia\GIP-RB" FT /db_xref="FLYBASE:FBgnXXXXXXX" FT /db_xref="SWISS-PROT:P04146" FT /db_xref="NCBI_PROTEIN:CAA26445.1" FT /translation="MDKAKRNIKPFDGEKYAIWKFRIRALLAEQDVLKVVDGLMPNEVD FT DSWKKAERCAKSTIIEYLSDSFLNFATSDITARQILENLDAVYERKSLASQLALRKRLL FT SLKLSSEMSLLSHFHIFDELISELLAAGAKIEEMDKISHLLITLPSCYDGIITAIETLS FT EENLTLAFVKNRLLDQEIKIKNDHNDTSKKVMNAIVHNNNNTYKNNLFKNRVTKPKKIF FT KGNSKYKVKCHHCGREGHIKKDCFHYKRILNNKNKENEKQVQTATSHGIAFMVKEVNNT FT SVMDNCGFVLDSGASDHLINDESLYTDSVEVVPPLKIAVAKQGEFIYATKRGIVRLRND FT HEITLEDVLFCKEAAGNLMSVKRLQEAGMSIEFDKSGVTISKNGLMVVKNSENQLADIF FT TKPLPAARFVELRDKLGLLQDDQSNAE" XX CC Derived from X02599 (g7740) (Rel. 49, Last updated, Version 4). CC Takis Benos and Michael Ashburner, 20-Aug-1997. CC Any changes to original sequence record are annotated in an FT line. XX SQ Sequence 5143 BP; 1874 A; 727 C; 971 G; 1571 T; 0 other; TGTTGGAATA TACTATTCAA CCTACAAAAA TAACGTTAAA CAACACTACT TTATATTTGA 60 TATGAATGGC CACACCTTTT ATGCCATAAA ACATATTGTA AGAGAATACC ACTCTTTTTA 120 TTCCTTCTTT CCTTCTTGTA CGTTTTTTGC TGTGAGTAGG TCGTGGTGCT GGTGTTGCAG 180 TTGAAATAAC TTAAAATATA AATCATAAAA CTCAAACATA AACTTGACTA TTTATTTATT 240 TATTAAGAAA GGAAATATAA ATTATAAATT ACAACAGGTT ATGGGCCCAG TCCATGCCTA 300 ATAAACAATT AAATTGTGAA TTAAAGATTG TGAAAATAAA TTGTGAAATA GCATTTTTTC 360 ACATTCTTGT GAAATAGCTT TTTTTTTCAC ATTCTTGTGA AATTATTTCC TTCTCAGAAT 420 TTGAGTGAAA AATGGACAAG GCTAAACGTA ATATTAAGCC GTTTGATGGC GAGAAGTACG 480 CGATTTGGAA ATTTAGAATT AGGGCTCTTT TAGCCGAGCA AGATGTGCTT AAAGTAGTTG 540 ATGGTTTAAT GCCTAACGAG GTAGATGACT CCTGGAAAAA GGCAGAGCGT TGTGCAAAAA 600 GTACAATAAT AGAGTACCTA AGCGACTCGT TTTTAAATTT CGCAACAAGC GACATTACGG 660 CGCGTCAGAT TCTTGAGAAT TTGGACGCCG TTTATGAACG AAAAAGTTTG GCGTCGCAAC 720 TGGCGCTGCG AAAACGTTTG CTTTCTCTGA AGCTATCGAG TGAGATGTCA CTATTAAGCC 780 ATTTTCATAT TTTTGACGAA CTTATAAGTG AATTGTTGGC AGCTGGTGCA AAAATAGAAG 840 AGATGGATAA AATTTCTCAT CTACTGATCA CATTGCCTTC GTGTTACGAT GGAATTATTA 900 CAGCGATAGA GACATTATCT GAAGAAAATT TGACATTGGC GTTTGTGAAA AATAGATTGC 960 TGGATCAAGA AATTAAAATT AAAAATGACC ACAACGATAC AAGCAAGAAA GTTATGAACG 1020 CGATCGTGCA CAACAATAAT AACACTTATA AAAATAATTT GTTTAAAAAT CGGGTAACTA 1080 AACCAAAGAA AATATTCAAG GGAAATTCAA AGTATAAAGT CAAGTGTCAC CACTGTGGCA 1140 GAGAAGGCCA CATTAAAAAA GATTGTTTCC ATTATAAAAG AATATTAAAT AATAAAAATA 1200 AAGAAAATGA AAAACAAGTT CAAACTGCAA CATCACACGG CATTGCGTTT ATGGTAAAAG 1260 AAGTGAATAA TACTTCAGTG ATGGACAACT GCGGGTTTGT CCTTGATTCT GGTGCTAGTG 1320 ACCATCTTAT AAATGATGAG TCGCTGTATA CCGACAGTGT GGAGGTTGTG CCTCCACTTA 1380 AGATTGCAGT GGCCAAGCAA GGCGAATTTA TTTATGCCAC TAAGCGTGGT ATTGTCCGAC 1440 TACGGAATGA CCATGAGATT ACACTGGAGG ATGTACTCTT TTGTAAGGAA GCTGCTGGTA 1500 ATTTGATGTC CGTAAAGCGT CTCCAAGAGG CAGGAATGTC GATCGAATTT GACAAAAGCG 1560 GTGTAACCAT TTCGAAAAAT GGGTTAATGG TTGTCAAAAA TTCAGGTATG TTAAACAATG 1620 TACCTGTGAT CAATTTTCAA GCATATTCTA TAAATGCTAA GCATAAAAAT AATTTTCGTT 1680 TATGGCATGA GAGGTTTGGC CATATAAGCG ATGGCAAATT ATTAGAAATA AAACGAAAGA 1740 ATATGTTTAG TGATCAAAGT CTTCTAAACA ACTTAGAGTT ATCATGTGAA ATTTGTGAAC 1800 CCTGTTTAAA TGGTAAACAG GCAAGACTTC CTTTTAAACA ATTGAAAGAT AAGACCCATA 1860 TTAAAAGACC ACTTTTTGTA GTACACTCAG ATGTCTGTGG GCCTATTACT CCAGTTACTT 1920 TAGATGATAA AAATTATTTT GTGATCTTTG TTGATCAGTT TACACATTAT TGTGTAACTT 1980 ATTTAATTAA ATATAAATCT GATGTGTTTA GCATGTTTCA AGATTTTGTA GCCAAGAGTG 2040 AAGCTCATTT TAATTTAAAG GTTGTGTACT TATACATTGA CAATGGTAGA GAATACTTGT 2100 CAAATGAGAT GAGACAATTT TGTGTTAAGA AAGGAATTTC TTATCACTTA ACAGTGCCAC 2160 ATACACCTCA GTTAAATGGT GTTTCTGAGA GAATGATAAG AACCATTACG GAAAAAGCTC 2220 GAACCATGGT TAGTGGTGCA AAGCTAGATA AAAGCTTTTG GGGCGAAGCA GTATTAACTG 2280 CTACTTATTT AATCAACAGA ATTCCTAGTA GAGCACTTGT TGATAGTTCA AAGACCCCAT 2340 ATGAGATGTG GCACAATAAG AAGCCATACT TAAAACATTT GAGAGTGTTT GGTGCAACTG 2400 TTTATGTGCA TATTAAAAAC AAACAAGGAA AGTTTGATGA TAAATCATTT AAAAGTATTT 2460 TTGTGGGCTA TGAACCCAAT GGTTTTAAGT TGTGGGATGC TGTAAATGAA AAATTTATTG 2520 TCGCAAGAGA TGTTGTTGTC GATGAAACCA ATATGGTTAA TTCTAGAGCT GTTAAATTTG 2580 AAACAGTGTT CCTGAAAGAT AGTAAGGAAA GTGAAAATAA AAATTTTCCG AATGACAGTA 2640 GGAAAATAAT ACAAACAGAA TTCCCGAATG AGAGTAAGGA ATGCGACAAC ATACAATTCC 2700 TGAAAGATAG TAAGGAAAGT GAAAATAAAA ATTTTCCGAA TGACAGTAGG AAAATAATAC 2760 AAACAGAATT CCCGAATGAG AGTAAGGAAT GCGACAACAT ACAATTCCTG AAAGATAGTA 2820 AGGAAAGTAA TAAATATTTT CTGAATGAGA GTAAGAAAAG AAAGCGAGAT GATCACCTGA 2880 ATGAAAGTAA GGGATCAGGC AACCCGAATG AGAGTAGGGA AAGTGAAACA GCAGAGCACT 2940 TAAAAGAAAT TGGAATTGAT AATCCAACTA AAAATGATGG CATAGAAATT ATTAATAGAA 3000 GAAGTGAGAG ATTAAAGACT AAGCCTCAGA TATCCTATAA TGAAGAGGAT AATAGTCTAA 3060 ATAAAGTTGT TCTAAATGCT CACACTATAT TTAACGATGT CCCAAATTCA TTTGATGAAA 3120 TTCAATATAG GGATGATAAA TCTTCTTGGG AAGAAGCCAT CAATACAGAG TTAAATGCTC 3180 ATAAAATTAA TAATACTTGG ACAATTACAA AAAGGCCTGA AAACAAAAAT ATTGTAGATA 3240 GCAGATGGGT ATTTTCTGTT AAATATAATG AACTTGGAAA TCCAATTAGA TACAAAGCTA 3300 GATTGGTTGC ACGAGGATTC ACTCAAAAAT ACCAAATAGA CTATGAAGAG ACATTTGCTC 3360 CTGTAGCTAG AATTTCAAGT TTCCGATTTA TATTGTCATT AGTAATACAG TATAACTTGA 3420 AAGTCCATCA AATGGATGTA AAAACAGCTT TCTTAAATGG CACGTTAAAA GAGGAAATTT 3480 ATATGAGACT TCCTCAAGGT ATATCGTGTA ATAGTGACAA TGTGTGTAAA TTGAATAAGG 3540 CAATTTACGG ACTCAAGCAA GCGGCTAGAT GCTGGTTTGA AGTATTTGAG CAAGCATTGA 3600 AAGAGTGTGA GTTTGTAAAC TCTTCAGTTG ATCGCTGTAT ATATATTTTA GACAAAGGTA 3660 ACATCAATGA AAACATATAT GTATTATTAT ATGTAGATGA TGTGGTTATA GCTACAGGAG 3720 ATATGACAAG AATGAATAAC TTCAAAAGGT ATTTAATGGA AAAGTTTAGG ATGACTGACC 3780 TAAATGAAAT AAAACATTTT ATTGGAATTA GGATAGAGAT GCAGGAAGAT AAAATCTATT 3840 TAAGCCAATC TGCATATGTT AAAAAAATTT TAAGTAAATT TAACATGGAA AATTGTAATG 3900 CAGTTAGTAC TCCTTTACCT AGTAAAATAA ATTATGAATT ACTTAATTCA GATGAAGACT 3960 GCAATACCCC ATGCCGTAGC CTCATAGGAT GTTTAATGTA CATAATGCTT TGTACACGCC 4020 CAGATTTAAC TACTGCAGTA AATATCTTGA GCAGATATAG TAGCAAAAAT AACTCCGAAT 4080 TATGGCAGAA CTTAAAAAGA GTTCTTAGAT ATTTGAAGGG CACTATCGAT ATGAAATTGA 4140 TTTTTAAAAA GAACTTGGCA TTTGAAAATA AAATTATTGG TTATGTGGAT TCTGATTGGG 4200 CTGGTAGTGA AATTGATAGA AAAAGTACAA CAGGGTATTT ATTCAAAATG TTTGATTTTA 4260 ATCTCATTTG TTGGAATACA AAGAGACAGA ACTCAGTAGC AGCCTCATCA ACTGAAGCTG 4320 AGTATATGGC CCTATTTGAA GCCGTGAGAG AAGCTCTATG GCTTAAATTT TTATTAACTA 4380 GTATTAACAT TAAACTAGAA AACCCCATTA AAATTTACGA AGACAATCAA GGCTGTATTA 4440 GCATAGCAAA CAACCCCTCA TGTCATAAAC GAGCTAAACA TATTGATATT AAATATCATT 4500 TTGCCAGAGA GCAAGTTCAG AATAATGTGA TTTGTCTTGA GTATATTCCT ACAGAGAATC 4560 AACTGGCTGA CATATTTACA AAACCGTTGC CTGCTGCGAG ATTTGTGGAG TTACGAGACA 4620 AATTGGGTTT GCTGCAAGAC GACCAATCGA ATGCTGAATG AAATTTTTAT ATATATTTTT 4680 CAAATTTAAA TTCCTGTAAA CATATTTTGT TACAATGATC TGATCGGGTT TTTCTGGGTT 4740 TTCCCCGTAT CCTCGCAGCA AATGCTGGAT CAGTTAACAC TTCCCAGAAT GCACACCACC 4800 CACATTTGAT AGTTACTAAT GAATATTATT GTTATGTTTT TAATTATAGA CGTTATTTTT 4860 GAGGGGGCGT GTTGGAATAT ACTATTCAAC CTACAAAAAT AACGTTAAAC AACACTACTT 4920 TATATTTGAT ATGAATGGCC ACACCTTTTA TGCCATAAAA CATATTGTAA GAGAATACCA 4980 CTCTTTTTAT TCCTTCTTTC CTTCTTGTAC GTTTTTTGCT GTGAGTAGGT CGTGGTGCTG 5040 GTGTTGCAGT TGAAATAACT TAAAATATAA ATCATAAAAC TCAAACATAA ACTTGACTAT 5100 TTATTTATTA TTAAGAAAGG AAAATAAATT ATAAATTACA ACA 5143 // ID DMW1DOC standard; DNA; INV; 4725 BP. XX AC X17551; XX DR FLYBASE; FBte0000341; Dmel\Doc. XX FT source X17551:1..4725 FT SO_feature CDS ; SO:0000316:213..1910 FT /name="Dmel\Doc\gag" FT /db_xref="FLYBASE:FBgn0024789" FT /db_xref="SPTREMBL:Q04134" FT /db_xref="NCBI_PROTEIN:CAA35586.1" FT /translation="MNQNDIRSQRQCEQDERRLSLQRNNAYFSFVSPQIGDRAPSPSTN FT SKLLPSANDRPRSCSPSLPASAHKSWSEETASPTPLLSQRQTTVPGNCNTAITSAVTSL FT ATATTSTSSAAQLIIAVPAVNNSAALTVCNNNNARKEESKQKQKSISTVQTGMDRYIQI FT KRKLSPQNNKAGNQPKINRTNNGNENSAVNNSNRYAILADSATEQPNEKTVGEPKKTRP FT PPIFIREQSTNALVNKLVALIGDSKFHIIPLKKGNIHEIKLQIQTEADHRIVTKYLNDA FT GKNYYTYQLKSCKGLQVVLKGIEATVTPAEIIEALKAKNFSAKTAINILNKDKVPQPLF FT KIELEPELQALKKNEVHPIYNLQYLLHRRITVEEPHKRINPVQCTNCQEYGHTKAYCTL FT KSVCVVCSEPHTTANCPKNKDDKSVKKCSNCGEKHTANYRGCVVYKELKSRLNKRIATA FT HTYNKVNFYSPQPIFQPPLTVPSTTPTISFASALKSGLEVPAPPTRTAHSEHTPTNIQQ FT TQQSGIEAMMLSLQQSMKDFMTFMQNTLQELMKNQNILIQLLVSSKSP" FT SO_feature CDS ; SO:0000316:1910..4576 FT /name="Dmel\Doc\RTase" FT /db_xref="FLYBASE:FBgn0024790" FT /db_xref="SPTREMBL:Q04135" FT /db_xref="NCBI_PROTEIN:CAA35587.1" FT /translation="MASLRISLWNANGVSRHTQELTQFIYEKNIDVMLLSETHLTNKNN FT FHIPGYLFYGTNHPDGKAHGGTGILIRNRIKHHHLNNFDKNYLQSTSIALQLNNGSTTL FT AAVYCPPRFPISEDQFMEFFNTLGDRFIAAGDYNAKHTHWGSRLVSPKGKQLYNALTKP FT ENKLDYVSPGKPTYWPADPRKIPDLIDFAITKHVPRNMVTAEALADLSSDHSPVFLNML FT TRPHIVDPPYRLTNFRTNWPRYQKYVCSHIELTTALSTKEDIDKSTETLENILVSAAKA FT STPPVTYAKPNYIKTNREIERLVLDKRRLRRDWQSNRSPITKHMLKIATRRLTNALKQE FT EKNSQRSYIEQLSPTSTKYPLWRAHRNLKTPIAPIMPLRSPSGTWFRSDEERASAFADH FT LQNVFRPNPSTNTFILPPLIAANLDPQEPFEFRPCELAKVIKEQLNPRKSPGYDLITPR FT MLIELPKCAILHICLLFNAIAKLGYFPQKWKKSTIVMIPKPGKDKTQPSSYRPISLLTC FT LSKLFEKMLLLRISPHLRINNTLPTHQFGFREKHGTIEQVNRITSEIRTAFEHREYCTA FT IFLDVAQAFDRVWLDGLLFKIIKLLPQNTHKLLKSYLYNRVFAIRCDTSTSRDCAIEAG FT VPQGSVLGPILYTLYTADFPIDYNLTTSTFADDTAILSRSKCPIKATALLSRHLTSVER FT WLADWRISINVQKCKQVTFTLNKQTCPPLVLNNICIPQADEVTYLGVHLDRRLTWRKHI FT EAKSKHLKLKARNLHWLINARSPLSLEFKALLYNSVLKPIWTYGSELWGNASRSNIDII FT QRAQSRILRIITGAPWYLRNENIHRDLKIKLVIEVIAEKKTKYNEKLTTHTNPLARKLI FT RVCSQSRLHRNDLPAQQ" XX CC Derived from X17551 (g8821) (Rel. 29, Last updated, Version 2). CC Takis Benos and Michael Ashburner, 20-Aug-1997. CC Any changes to original sequence record are annotated in an FT line. XX SQ Sequence 4725 BP; 1647 A; 1192 C; 822 G; 1064 T; 0 other; GACATTCGGC ATTCCACAGT CTTCGGGTGG AGACGTGTTT CTTTCAAGCT ACGAATAGCA 60 AGTTCTAAAA ACTACAACAG TATAGTGAAA GTTAAACACA AAGTGTAAAG TGCAGTTTGC 120 ACAACTAACA ATTATTGACT ATAGTAATTA TTTACTAAAA TAAATAATTA TTCCATATTG 180 TTCTGGTAAT TGTTATATGT GGACTTAGAA CAATGAATCA AAACGACATA CGTTCTCAGC 240 GACAATGTGA ACAAGACGAG CGCCGGCTCT CTTTACAACG CAACAATGCA TACTTTTCTT 300 TCGTCTCACC GCAAATCGGT GATCGAGCAC CCTCACCTTC AACTAACTCG AAACTTTTGC 360 CCTCAGCGAA CGACAGACCG CGTTCTTGCT CTCCCTCTCT GCCTGCTTCG GCTCACAAGT 420 CGTGGAGCGA AGAGACCGCC TCTCCTACCC CGCTCCTCTC GCAGCGCCAA ACGACCGTCC 480 CGGGTAACTG TAACACTGCA ATAACGAGTG CAGTGACCTC ACTGGCAACT GCCACAACAT 540 CAACTTCGTC AGCGGCCCAA CTAATTATCG CTGTGCCAGC TGTAAATAAT TCAGCAGCAC 600 TGACCGTTTG CAACAACAAT AATGCACGTA AAGAAGAATC AAAACAAAAG CAGAAGTCGA 660 TTTCGACTGT GCAGACTGGC ATGGATCGCT ACATCCAAAT CAAGAGAAAG CTCAGCCCTC 720 AAAACAATAA GGCAGGTAAT CAACCCAAAA TCAATCGAAC CAACAACGGC AATGAAAACT 780 CTGCAGTAAA TAATTCAAAC CGATATGCTA TCTTGGCTGA TTCTGCGACC GAACAACCCA 840 ACGAAAAAAC GGTAGGGGAA CCAAAAAAGA CCAGGCCTCC ACCAATTTTC ATACGAGAAC 900 AAAGTACAAA TGCACTTGTA AATAAACTCG TTGCTTTGAT TGGTGACAGC AAGTTCCACA 960 TTATCCCACT TAAAAAAGGA AATATTCATG AAATAAAACT ACAGATCCAA ACAGAAGCAG 1020 ACCACCGTAT AGTGACTAAA TACCTAAATG ATGCTGGTAA AAACTACTAC ACATACCAAT 1080 TAAAAAGTTG CAAAGGGCTA CAGGTAGTAC TTAAGGGCAT TGAAGCAACA GTGACACCAG 1140 CTGAGATAAT TGAGGCTCTG AAGGCCAAAA ACTTTTCTGC AAAGACAGCT ATTAATATTT 1200 TAAACAAAGA CAAAGTTCCG CAGCCACTAT TCAAAATAGA ACTCGAACCA GAGCTCCAGG 1260 CACTAAAGAA AAACGAAGTG CACCCAATAT ACAATTTACA GTACTTGCTA CATCGGAGGA 1320 TCACCGTGGA GGAGCCGCAC AAACGTATCA ATCCAGTTCA ATGTACTAAT TGCCAAGAAT 1380 ACGGCCACAC CAAGGCATAC TGCACCCTTA AGTCCGTATG TGTTGTCTGT AGCGAACCTC 1440 ATACTACCGC AAACTGCCCC AAAAACAAGG ACGATAAGTC TGTGAAGAAA TGCAGTAACT 1500 GCGGGGAAAA ACATACTGCA AACTACAGAG GCTGTGTGGT GTACAAAGAA TTGAAGAGCC 1560 GCCTAAACAA ACGTATTGCC ACAGCACATA CATACAACAA AGTCAATTTC TACTCTCCGC 1620 AACCGATTTT TCAACCACCC CTAACTGTCC CAAGCACTAC TCCAACAATT TCTTTCGCTA 1680 GCGCCCTAAA ATCCGGACTA GAAGTGCCCG CCCCACCGAC AAGAACTGCT CATTCCGAAC 1740 ATACACCGAC AAACATCCAA CAAACACAAC AAAGTGGCAT CGAAGCTATG ATGCTATCCC 1800 TACAGCAAAG CATGAAAGAC TTCATGACGT TCATGCAAAA TACTTTGCAA GAGCTCATGA 1860 AAAACCAAAA TATCCTGATT CAACTTCTTG TATCTTCAAA ATCCCCATAA TGGCTTCCCT 1920 ACGGATATCT CTGTGGAACG CAAATGGCGT TTCACGGCAT ACACAAGAGC TCACACAGTT 1980 CATTTACGAA AAAAACATCG ACGTAATGCT ACTATCAGAA ACGCACCTCA CAAATAAAAA 2040 CAATTTTCAT ATACCAGGAT ACTTGTTCTA TGGTACAAAT CATCCAGATG GTAAAGCTCA 2100 TGGAGGCACT GGAATACTCA TCAGAAATCG CATAAAACAC CACCACTTAA ACAATTTTGA 2160 CAAAAACTAC TTACAATCTA CGTCCATAGC CTTACAACTC AACAATGGTT CAACGACTCT 2220 AGCCGCAGTC TACTGCCCAC CGCGCTTTCC AATCTCTGAG GATCAATTCA TGGAATTCTT 2280 TAACACACTA GGTGACAGGT TCATCGCAGC GGGTGACTAT AACGCCAAGC ACACCCATTG 2340 GGGATCTCGA CTTGTGTCGC CAAAGGGTAA GCAATTGTAC AATGCGCTTA CGAAGCCAGA 2400 AAACAAGCTA GACTATGTAT CCCCGGGTAA GCCTACATAC TGGCCAGCAG ACCCAAGAAA 2460 AATCCCAGAC CTGATCGATT TTGCAATTAC TAAACATGTC CCCCGCAACA TGGTCACCGC 2520 CGAAGCACTA GCAGATTTAT CATCAGATCA CTCACCTGTT TTTCTAAATA TGCTAACTCG 2580 CCCCCACATC GTCGACCCAC CGTATAGACT CACAAATTTT AGAACAAACT GGCCAAGGTA 2640 TCAAAAGTAT GTCTGTTCAC ACATAGAACT AACGACGGCA TTATCTACAA AGGAGGATAT 2700 AGACAAGTCA ACGGAAACTC TTGAAAACAT TTTAGTTTCG GCTGCAAAGG CTTCAACCCC 2760 GCCAGTGACG TATGCAAAAC CAAACTACAT CAAAACTAAT CGCGAAATCG AGCGGCTGGT 2820 ATTAGATAAA CGACGCCTAC GAAGGGATTG GCAGTCTAAT AGATCACCAA TTACTAAGCA 2880 CATGCTTAAG ATAGCCACAC GCAGGCTTAC CAATGCTCTC AAACAAGAGG AAAAAAACAG 2940 CCAACGTTCA TATATCGAGC AACTCTCTCC CACCAGCACT AAGTACCCTC TTTGGAGAGC 3000 TCACAGAAAC CTAAAGACTC CAATAGCGCC AATTATGCCA CTCCGAAGTC CCTCTGGCAC 3060 CTGGTTTCGA AGTGATGAAG AAAGAGCCAG TGCTTTCGCT GACCATTTAC AAAATGTATT 3120 CCGACCAAAT CCCTCTACCA ACACATTTAT TCTCCCTCCT TTAATAGCAG CCAATCTAGA 3180 TCCTCAAGAA CCCTTTGAAT TCCGACCATG TGAACTAGCA AAGGTTATCA AAGAGCAACT 3240 GAACCCAAGA AAATCGCCTG GCTACGACCT AATAACTCCA AGAATGCTCA TTGAACTCCC 3300 AAAGTGTGCT ATTCTTCACA TCTGCCTGTT GTTCAACGCA ATCGCCAAGC TTGGATACTT 3360 CCCTCAAAAA TGGAAAAAGT CGACCATAGT AATGATTCCA AAGCCAGGAA AAGATAAAAC 3420 GCAGCCATCA TCATATAGAC CGATAAGCTT ACTAACATGT CTTTCAAAGC TGTTTGAAAA 3480 AATGCTACTC CTTCGGATTA GCCCTCATCT TAGAATAAAC AACACACTTC CAACACATCA 3540 ATTTGGCTTT AGAGAAAAAC ATGGAACCAT CGAACAGGTC AACCGAATCA CGTCAGAAAT 3600 TCGTACTGCT TTTGAACATC GAGAATACTG CACAGCCATT TTTCTAGACG TCGCGCAGGC 3660 ATTTGACAGA GTGTGGCTCG ATGGACTTTT GTTTAAAATA ATCAAGCTGT TGCCCCAAAA 3720 CACACATAAG CTACTGAAGT CATACCTATA TAACAGAGTG TTTGCAATAA GATGCGATAC 3780 AAGCACTTCA CGCGATTGCG CAATCGAAGC TGGAGTGCCG CAAGGCAGTG TACTGGGTCC 3840 AATCTTATAC ACCCTGTATA CGGCGGATTT CCCCATAGAC TACAATCTAA CAACCTCCAC 3900 GTTCGCTGAT GATACCGCGA TACTCAGTCG CTCGAAATGC CCAATAAAAG CCACGGCACT 3960 CCTATCCCGA CACTTAACAT CTGTAGAACG ATGGCTTGCC GACTGGAGAA TTTCAATAAA 4020 TGTTCAAAAA TGCAAGCAGG TTACCTTTAC CTTAAACAAA CAAACATGCC CACCACTGGT 4080 CTTGAATAAC ATATGCATTC CACAAGCCGA CGAGGTAACA TATCTGGGAG TTCATCTGGA 4140 CAGGCGGCTC ACTTGGCGCA AACATATAGA AGCCAAATCG AAACATCTTA AACTTAAAGC 4200 AAGGAACCTC CACTGGCTCA TAAATGCTCG CTCTCCACTT AGTCTGGAGT TCAAAGCTCT 4260 TCTATACAAC TCCGTCTTAA AACCTATCTG GACTTATGGC TCCGAGCTGT GGGGCAACGC 4320 ATCCAGAAGT AACATAGACA TTATTCAGCG AGCACAGTCA AGAATTCTGA GAATTATCAC 4380 TGGAGCGCCG TGGTACCTTC GAAACGAAAA CATACACAGA GACCTAAAAA TCAAATTAGT 4440 AATCGAAGTA ATAGCTGAGA AAAAAACGAA GTATAACGAA AAGCTGACCA CCCATACAAA 4500 TCCCCTCGCA AGAAAACTAA TCCGAGTATG CAGTCAAAGC CGGCTGCACC GCAACGACCT 4560 CCCAGCCCAG CAATAAACTT ATTAGGGCAT TAATGAAAAA AAAAAACTAT CACTAAGTGA 4620 AAGTTAATTA AGTTAGATTA AGATTTGAAC ACTTATTGTT AGTCTCTTAA CACAAAGGGA 4680 AGATTCAATA AATAATAAAA ATTAAAAAAA AAAAAAAAAA AAAAA 4725 // ID F standard; DNA; INV; 4708 BP. XX AC AC005198; XX DR FLYBASE; FBte0000005; Dmel\F-element. XX SY synonym: Jiminy XX FT source AC005198:38639..43358 FT SO_feature CDS ; SO:0000316:192..1880 FT /name="Dmel\F-element\gag-r" FT /db_xref="FLYBASE:FBgn0041632" FT /db_xref="TREMBL:P91787" FT /translation="MSQNDTRAQRQREHDERRLSIQRNNAYFSYVSPTIPNADIERSI FT THSPGNLLLPTNQERARSCSPALLAPTEAPLPPTTTAGEGPAARSASSSAAPAHGLTK FT SAKAKPLAINGTAALPAKQNENVNKKAGSTWQTGMDRYITIKRKLSPENSDLGNKPKN FT TRDNSTLIKNVAPANTNRFALLVDTAEDVPLGSVDIEPKKTKPPPIYIREKSTSRLVN FT TLIGLIGKDSFHIIPLVRGTINEIKLQTKTEDDYRKVTNYFTAQKIGFYTYQLKSSKG FT LQVVLKGIESDVTPEEITEALKEKGFYAKNVFNIKNRNRQPQPLFKIELEPENKPPRK FT NEVHPIYKLQLLLHRRITVEEPHKRNAPVQCTNCQEYGHTRSYCTLRPVCVVCGDLHD FT SKQCQINKENACEKKCNNCGGNHTANYRGCPIYKELKIRLHKRMNTARAHQGSATLIP FT SETNPEVIFSKAASFAPWPTFNTNKTTFANVLKSGMTPPTQNSRTPHEVHTKLDTQQN FT YHPAAQQETKTEAMMQALQQSMMEFMTFMKTTIQDMMRNQNLLIQMLVAQQSNK" FT SO_feature CDS ; SO:0000316:1880..4561 FT /name="Dmel\F-element\RTase" FT /db_xref="FLYBASE:FBgn0041633" FT /db_xref="TREMBL:Q24335" FT /translation="MATLRIATWNANGVSQRKLELAQFLHEKHIDVMLLSETHLTSKY FT NFQIRDYHFYGTNHPDGKAHGGTAILIRNRMKHHFYKEFAENHLQATSINIQLDDNTL FT LTLAAVYCPPRFTVLEAQFLDFFQALGPHFIAAGDYNAKHTHWGSRLVNPKGKQLYKT FT IIKATNKLDHVSPGSPTYWPSDLNKLPDLIDFAVTKNISRSLVKAECLPDLSSDHSPV FT LIHLRRYAENVKPPTRLTSSKTNWLRYKKYISSHIELSPKLNTESDIESCTCALQSIL FT TAAALTATPKITNNTINSKKTNVQIEQLVHVKRRLRREWQSSRSPTAKQKLKVATRKL FT ANALKQEEDDDQRRYIEQLTPTGTKQKSLWRAHSTLRPPTETVLPIKNSSGGWARSDE FT DRANTFAAHLQNVFTPNQATSTFALPSYPVNRHQQHTPIVFRPKEITKIIKDNLSPKK FT SPGYDLITPEMIIQLPHSAVRYITKLFNAITKLGYFPQRWKMMKIIMIPKPGKNHTVA FT SSYRPISLLSCISKLFEKCLLIRLNQHQTYHNIIPAHQFGFRESHGTIEQVNRITTEI FT RTAFEYREYCTAVFLDVSQAFDKVWLDGLMFKIKISLPESTHKLLKSYLYDRKFAVRC FT NTATSTVHTIEAGVPQGSVLGPTLYLIYTADIPTNSRLTVSTFADDTAILSRSRSPIQ FT ATAQLALYLIDIKKWLSDWRIKVNEQKCKHVTFTLNRQDCPPLLLNSIPLPKADEVTY FT LGVHLDRRLTWRRHIEAKKTQLKLKANNLHWLINSGSPLSLDHKVLLYNSILKPIWTY FT GSQLWGNASNSNIDIIQRAQSKILRTITGAPWYVRSENIQRDLNIPSVTNAITELKEK FT YL" XX CC K. O'Hare, Personal communication to FlyBase, 1 May 2000. CC CDS2 translation from M17214; AC005198 has a 1-bp deletion. XX SQ Sequence 4708 BP; 1618 A; 1242 C; 857 G; 991 T; 0 other; AATCAATTAA TCAATTCGAT CGCCGACGTG TGAAGACGTT TTTATCGTGC TCCGCACAAA 60 ATCGGTTGTT TTGAGTGAAG TGAACGCCAA ATAAAATAAA CTAAATAAAA AATCTGAAAG 120 CGAAAGAGAC GCTCTATGCG ATGCAAGATC GCTTAAATAC ATAGTGAATT GTTATCTTAA 180 ATAATAAAAC TATGAGTCAG AATGACACTC GCGCCCAGCG TCAGCGCGAG CATGACGAAC 240 GCCGACTCTC AATTCAGCGC AACAACGCGT ACTTCTCCTA CGTCTCACCG ACAATCCCAA 300 ACGCAGACAT CGAGCGGTCA ATAACCCATA GCCCAGGAAA CCTTCTTCTA CCAACAAATC 360 AAGAAAGAGC GCGCTCCTGC TCTCCCGCTC TATTGGCTCC GACAGAAGCC CCGCTACCTC 420 CAACAACAAC AGCTGGAGAG GGACCGGCAG CCCGCTCTGC CTCGTCATCG GCTGCACCCG 480 CTCACGGTCT GACTAAGTCA GCGAAAGCAA AACCGCTAGC AATAAACGGT ACTGCTGCAC 540 TGCCAGCAAA ACAAAACGAA AACGTAAACA AAAAAGCTGG GTCGACCTGG CAGACTGGAA 600 TGGACCGCTA CATTACAATA AAGCGAAAGC TCAGCCCGGA AAATTCAGAT TTGGGAAACA 660 AGCCGAAAAA TACACGCGAT AACTCTACCT TGATCAAAAA TGTAGCCCCT GCAAATACCA 720 ACAGATTTGC CTTGCTGGTA GATACCGCTG AGGACGTGCC GCTGGGATCC GTTGATATCG 780 AACCGAAGAA AACAAAGCCT CCGCCAATAT ACATCCGCGA GAAGAGCACA AGCCGTCTTG 840 TAAATACTTT GATTGGCCTT ATTGGGAAAG ATAGCTTTCA TATAATTCCC CTCGTAAGAG 900 GTACTATCAA CGAAATCAAA CTTCAGACGA AAACGGAGGA CGACTACAGA AAAGTCACAA 960 ACTATTTTAC CGCACAAAAA ATAGGCTTCT ACACCTACCA GCTTAAAAGC AGCAAGGGCC 1020 TGCAAGTAGT CCTGAAGGGC ATTGAGTCTG ATGTTACGCC CGAAGAGATA ACTGAGGCGC 1080 TAAAGGAAAA GGGATTTTAC GCCAAAAACG TGTTCAATAT CAAAAACAGA AACAGGCAGC 1140 CCCAACCACT CTTCAAGATT GAGCTTGAAC CAGAAAACAA GCCTCCTAGA AAAAACGAGG 1200 TTCACCCAAT TTACAAACTC CAGCTCCTTT TGCACCGTAG GATCACGGTA GAAGAGCCGC 1260 ACAAACGCAA CGCTCCTGTA CAATGTACAA ACTGCCAAGA GTATGGCCAC ACGAGGTCAT 1320 ATTGTACACT TCGCCCGGTG TGCGTAGTCT GTGGAGATCT CCACGACTCC AAACAGTGTC 1380 AAATTAACAA AGAAAATGCA TGCGAGAAAA AATGTAATAA CTGCGGGGGC AATCACACAG 1440 CAAACTACAG AGGCTGTCCA ATCTACAAAG AGCTGAAAAT CCGTCTTCAC AAAAGAATGA 1500 ACACGGCGCG GGCACACCAA GGATCAGCTA CCCTGATACC ATCAGAGACA AATCCTGAAG 1560 TAATTTTCTC GAAAGCAGCT AGTTTCGCTC CCTGGCCTAC ATTCAACACT AACAAGACAA 1620 CATTTGCTAA CGTTTTAAAA TCAGGTATGA CGCCTCCAAC CCAAAACTCC CGAACTCCAC 1680 ATGAAGTGCA CACAAAATTA GACACACAAC AAAACTATCA CCCAGCTGCG CAGCAGGAAA 1740 CAAAAACTGA AGCTATGATG CAAGCCTTAC AACAGAGCAT GATGGAATTT ATGACATTTA 1800 TGAAGACCAC CATTCAAGAC ATGATGCGTA ATCAAAACCT TTTGATACAA ATGCTTGTAG 1860 CCCAACAATC AAATAAATAA TGGCTACCTT ACGCATAGCT ACGTGGAACG CCAATGGCGT 1920 CTCACAGCGC AAACTTGAGC TAGCTCAATT CCTACATGAG AAGCATATCG ACGTAATGCT 1980 TCTTTCGGAA ACTCATCTCA CAAGCAAATA CAATTTTCAA ATAAGAGACT ACCATTTCTA 2040 CGGTACAAAT CATCCCGACG GAAAAGCACA CGGTGGCACC GCCATACTCA TAAGGAACCG 2100 TATGAAGCAC CACTTTTACA AAGAATTTGC GGAAAATCAT CTTCAGGCCA CATCTATCAA 2160 CATTCAGCTG GATGACAACA CTCTCCTTAC ACTAGCGGCC GTATACTGCC CCCCCCGTTT 2220 CACAGTATTA GAAGCTCAAT TCCTGGATTT CTTCCAAGCA CTAGGGCCAC ACTTCATTGC 2280 AGCAGGCGAC TACAACGCTA AACATACTCA CTGGGGATCG CGACTTGTGA ACCCAAAAGG 2340 AAAACAGCTT TATAAGACGA TAATAAAAGC CACTAATAAA CTTGACCATG TTTCCCCCGG 2400 GAGTCCTACA TACTGGCCAT CAGACCTCAA TAAGCTGCCA GACCTGATCG ACTTCGCAGT 2460 TACGAAAAAT ATTTCCCGCA GTTTGGTTAA AGCTGAATGT CTGCCGGATC TCTCATCTGA 2520 TCACTCGCCT GTACTAATTC ACCTCCGCCG ATACGCAGAA AACGTGAAAC CACCAACCAG 2580 ATTGACCTCT AGCAAAACAA ACTGGCTCAG GTATAAAAAA TATATAAGTT CACATATTGA 2640 GCTAAGCCCA AAACTCAATA CTGAATCTGA TATAGAGAGC TGCACGTGTG CATTGCAATC 2700 CATCCTTACT GCAGCAGCTC TTACTGCAAC ACCCAAAATA ACAAATAATA CAATTAATTC 2760 AAAAAAGACC AACGTACAAA TCGAGCAACT CGTCCACGTA AAACGTCGCT TACGCAGAGA 2820 ATGGCAATCT TCCAGATCCC CAACTGCAAA ACAAAAGCTA AAAGTAGCCA CACGGAAACT 2880 GGCCAACGCT CTGAAACAAG AAGAGGACGA CGATCAGCGC CGATACATAG AGCAACTCAC 2940 ACCAACAGGC ACAAAACAAA AGTCACTGTG GCGAGCCCAC TCAACTCTTC GCCCACCGAC 3000 TGAAACCGTT TTGCCGATAA GGAATTCATC AGGTGGCTGG GCCCGTAGTG ATGAAGACAG 3060 AGCCAACACA TTTGCCGCTC ACCTACAAAA TGTGTTCACG CCAAACCAGG CTACTAGCAC 3120 ATTCGCGCTA CCGTCCTATC CCGTAAACCG CCATCAGCAA CACACCCCAA TTGTGTTTCG 3180 TCCTAAAGAA ATAACTAAAA TAATCAAAGA CAATCTCAGC CCGAAAAAAT CCCCCGGCTA 3240 CGACCTTATA ACACCGGAAA TGATCATCCA GCTGCCACAT TCTGCAGTTC GCTACATAAC 3300 CAAGCTCTTT AATGCCATCA CCAAACTTGG TTACTTTCCA CAACGATGGA AGATGATGAA 3360 GATCATAATG ATTCCAAAGC CTGGTAAGAA CCACACAGTC GCTTCATCTT ACAGACCAAT 3420 AAGTCTACTC TCATGCATTT CGAAACTATT CGAAAAATGC CTGCTGATCC GACTTAATCA 3480 ACATCTGATA TACCACAATA TAATCCCAGC CCACCAATTT GGATTTCGCG AAAGCCACGG 3540 AACCATTGAA CAGGTGAATC GTATTACAAC GGAAATAAGA ACTGCATTTG AATATCGCGA 3600 ATACTGTACA GCAGTATTTT TAGACGTATC CCAAGCATTC GACAAAGTCT GGCTCGACGG 3660 CCTAATGTTT AAAATTAAAA CATCCCTACC CGAAAGCACA CACAAACTTC TAAAGTCTTA 3720 CCTCTATGAC AGAAAGTTTG CAGTGCGGTG CAACACTGCC ACTTCCACTG TTCATACAAT 3780 TGAGGCTGGA GTCCCCCAAG GCAGCGTTCT TGGGCCAACC TTATACCTCA TCTATACAGC 3840 CGACATCCCT ACAAATAGTC GCTTAACGGT ATCCACATTT GCCGACGATA CAGCTATCCT 3900 TAGCCGTTCA AGGTCCCCTA TCCAAGCTAC AGCACAGTTG GCACTGTACC TCATCGACAT 3960 TGAGAAGTGG CTCTCTGACT GGCGAATAAA AGTAAACGAG CAAAAATGCA AGCACGTGAC 4020 GTTTACGCTA AACAGACAAG ACTGTCCTCC GCTCTTGTTG AACAGCATAC CACTCCCGAA 4080 AGCAGACGAG GTAACGTACC TAGGAGTACA CCTAGACAGA AGACTCACAT GGCGCAGGCA 4140 CATTGAAGCC AAAAAAACCC AACTTAAACT CAAAGCCAAC AACTTACACT GGCTCATCAA 4200 CTCTGGTTCT CCGCTCAGCC TAGATCACAA GGTCTTGCTC TACAATTCTA TATTGAAACC 4260 AATCTGGACC TATGGCTCAC AGTTATGGGG CAATGCCAGC AACAGCAATA TTGACATCAT 4320 TCAGCGAGCA CAATCAAAGA TTCTGAGAAC CATCACTGGG GCACCGTGGT ACGTTCGGAG 4380 TGAAAACATC CAAAGAGACT TAAATATCCC ATCAGTTACC AACGCAATCA CGGAACTTAA 4440 GGAAAAATAC CATAGCAAGC TTCACACGCA CCCCAACCAC CTAGCGCGAG GTCTAATCCA 4500 GCTCAGCAGC CGTTCCCGTC TCCGGCGAAA GGACCTACCA ACCCAGCGAA TAAATTATTA 4560 GGGCCGTTTA AACATAGAAC AGTTGGAAAA ATAATACAAC TGTTCAAAAA ATACTTGTTA 4620 TAGTTAAGAT TTTTAAACTT ATTGTTAGTT CTTATACAAG AAGATTCAAT AAATAAAAGC 4680 AAAGTAAAAT AAAAAAAAAA AAAAAAAA 4708 // ID FB standard; DNA; INV; 4347 BP. XX AC X51937; AC X15469; XX DR FLYBASE; FBte0000466; Dmel\NOF. XX FT source join(X15469:94..1010,X51937:1..3430) FT SO_feature CDS ; SO:0000316:797..3874 FT /name="Dmel\NOF\ORF" FT /db_xref="FLYBASE:FBgn0044029" FT /db_xref="SWISS-PROT:P16320" FT /db_xref="NCBI_PROTEIN:CAA36201.1" FT /translation="IQQLDTSANLTLNSTFPDDDPEFQITEASKNGPLPILYFNLELDL FT ELWRSIAPKKDQKTEKLQPNWTDTMAKLIYKKVPLPCAFNFRKAKLSDKVDNIWLRIEG FT YCNDCSSILKGHCLVKPDEQCGIMISVSVPDTRGIPHNKKRRCTGSRRLEIGNELILKK FT AALWRKEATDNMNDDDPEPSYIPNLPTLRKLREEATNRHLGITKDRDPVSSLYLKKYEG FT ELAGCILDIGLDEFFCIYCTGTQVKTYASRIKTIRKISIDATGSVVLPIQKPNGDSSYV FT FLYQIVMEGDDSIFPVFQMLSAKHDTASIQFWLSRFISKSGHFPLEVVSDFSLALLNGI FT SLSFNECRIATYIKKCFHSLLMEERTDLPPCYIRLDIAHLIKMICRKNVFKSKLPNLKD FT FYTRCIGLATTCETKDSFAELIKSVLIVALSQSSGEDEKGDILSSYRNEKYLLARIATF FT TAPDHKETIEDNCIPEDQEEIDEDVTDFISNIKIAAEEEALNCNSVNCRPNPYFLPELM FT PPLIKLCKYFVLWTNVMKEKFCSKYDVGSSALVEAYFKDLKNTDMSIFHRPVRADKFVV FT QHIRCIEAVCKLERAAMKRKTVKTPSFIKENAPKKMCSKETKGFLEEILEESEVEYLLQ FT EENWKVKNKTIKPTEGNDAEDNDTDDENKEMDLSEQPKEKPRGKYLKKCPNVELLYNRP FT HRRKQDEILHNGGSMGPVWIGKQLLQFKNTCPFDSLVEILSTAYIDNFYYKSLLDDFYT FT DNLTIELVKKYAVEGVSSSLYCDRGLVLKSFFDEKHQIIKCDANIGSFIEKALNGVPSA FT SSHRTHIKNNHDCRNQKYIHHRLEVIDVEKVGHLDVQEVVIPFIDEFFARTDGECKICG FT GQQILERQPGPHVILDIEFAMDAFHQIHHNGLPGTTTLLQVPEEILIQEKKYILSGAIE FT YVPAMGGEIGHYIAYCRRVIGSWEVHNDMCRQWKKFSALNTKMTLHILIYTRKN" XX CC Derived from X15469 (g7962) (Rel. 36, Last updated, Version 3). CC Derived from X51937 (g8297) (Rel. 44, Last updated, Version 6). CC Takis Benos and Michael Ashburner, 25-Aug-1997. CC Any changes to original sequence record are annotated in an FT line. XX SQ Sequence 4347 BP; 1461 A; 775 C; 885 G; 1226 T; 0 other; TATATTCTAT TGCCCACCAT ATAAACACGT GCCACTTTCC TAGTTTTAGG ATCTGCCTAC 60 ATAACACGTG CAGACGCACA GGTGTTTCTG GGTTTATATA GACCAAAAAT TGGTTCCGAT 120 TGCCAATCTT GTAATTTACA GTTTACCAGG TAATTACATA ATTTTCAAAC CTCACTTTAT 180 GATAGGGTCC AATTTTTTAC CTGTGACAAA GTGTTAAATT TTTTAAGAAT GGGTTTTTCA 240 TGGCAGGTCA GAATCCTCTA TAAAATCTAA AACACTTGTC GGTATTTGAA AATCGCTCTC 300 CTCCTTGATT CTCATATTAG GTGTAAAAGA TAAATCCGGA ACTCATAATT AAAATATTTT 360 TTATGTGAAA AAGTTGTGCG CGATTTTAAC TACGCTTACC CAGTGCTGGA AAAGTTAAAG 420 TTGTTTTGTT TTTCAAAGAA AGTGAAAGTT GCTAAGCACG AACTTAAGAA ATCTGAGTGA 480 TTGTGTTAAA TTTATTTGAA TCCTTGTGAA TTTTGTTGAC AGTCTTTTTA AAGACTTGCA 540 AAATTTTCAT ATTATTCGGT TCTTGCTTTT ATTTTTATAC AACGCGTTTT TCCTTTAGGC 600 ATACCTTTAT ACATTTACAG TGTAAACAAC AGTGTAAAAC GTGTAAATCA GTGCAAAATA 660 GTTTTTTTTA TTTACTCCAT AAAAAATAAG TGTTACTGTC AGGATGCCGG CCAAACCGCA 720 AGTCGATGGT CACACCTTAG TGGATGCATT TTGCTGCGCG AATATTTTTA CGGAGACTGG 780 AGCTCTTAAG CCAAGAAGCG ATAAAGTTTG GATGGATATA AGCAACCAAT TGAAAGGAGC 840 GATCAGCGCG AAGACGCTTA ATTTCTACGC CAGAATCAAT AGGAATAACA TGATAACTGT 900 GGTTAAAGAA CGATGTGGAA TTCAACAGCT GGATACTAGT GCCAATTTAA CTTTAAATAG 960 CACATTTCCT GATGATGACC CGGAGTTCCA GATCACCGAA GCTTCAAAAA ATGGACCATT 1020 GCCTATTTTG TACTTTAACC TGGAGTTGGA CCTGGAATTG TGGAGATCAA TTGCCCCCAA 1080 AAAGGATCAA AAAACTGAAA AACTGCAACC TAACTGGACG GATACTATGG CAAAGTTGAT 1140 ATACAAAAAA GTTCCTCTTC CGTGTGCATT TAATTTTAGA AAAGCTAAAC TTTCCGACAA 1200 AGTGGATAAT ATTTGGCTAC GAATTGAAGG CTATTGCAAT GACTGCAGCT CAATTTTAAA 1260 GGGACATTGC CTTGTGAAAC CCGATGAACA ATGCGGCATA ATGATATCTG TTTCAGTACC 1320 GGACACACGA GGTATACCTC ATAATAAAAA ACGACGGTGC ACTGGATCGA GACGACTTGA 1380 AATTGGGAAC GAGTTGATTT TAAAAAAAGC TGCATTGTGG AGGAAGGAAG CCACCGACAA 1440 CATGAATGAT GACGACCCAG AACCGAGTTA CATACCAAAT TTACCAACCC TTCGGAAACT 1500 TCGTGAAGAG GCAACTAACA GACACCTAGG AATTACCAAG GATCGGGATC CAGTTTCATC 1560 ATTATACCTT AAAAAGTATG AGGGTGAATT GGCTGGATGC ATTCTTGACA TTGGATTGGA 1620 TGAATTTTTC TGCATATACT GCACAGGAAC CCAAGTAAAA ACATATGCAT CAAGGATAAA 1680 AACTATTAGA AAGATTTCTA TTGACGCAAC TGGAAGCGTG GTGTTACCCA TCCAAAAACC 1740 AAACGGTGAC TCTAGTTATG TTTTTCTGTA CCAAATTGTA ATGGAGGGTG ACGACAGTAT 1800 ATTTCCAGTT TTTCAGATGC TGTCGGCTAA ACATGACACA GCCAGCATAC AGTTTTGGTT 1860 AAGCAGATTT ATATCAAAGT CGGGGCATTT TCCACTGGAG GTTGTATCTG ATTTTTCCTT 1920 GGCATTGCTA AATGGAATAA GCTTAAGCTT TAATGAGTGT AGGATTGCGA CGTATATAAA 1980 AAAATGTTTC CACAGCCTTT TGATGGAGGA ACGGACGGAT CTGCCACCCT GCTATATTCG 2040 ACTTGACATC GCCCACCTAA TTAAAATGAT ATGCCGGAAG AACGTCTTCA AAAGTAAATT 2100 ACCGAACCTC AAGGATTTTT ATACTAGATG TATTGGTCTT GCAACAACGT GTGAGACAAA 2160 GGACAGTTTT GCGGAATTAA TTAAATCAGT ACTGATTGTC GCACTGAGCC AATCCTCAGG 2220 GGAAGATGAA AAAGGAGACA TTCTTTCAAG TTACAGGAAT GAAAAGTATC TGCTCGCCAG 2280 AATAGCTACA TTTACTGCCC CGGATCACAA GGAGACCATT GAGGACAACT GCATACCAGA 2340 GGACCAGGAG GAAATTGACG AGGATGTTAC GGACTTTATC TCTAATATTA AAATCGCTGC 2400 CGAAGAAGAA GCGTTAAATT GCAATTCGGT CAACTGTCGG CCAAATCCGT ATTTCCTACC 2460 TGAGCTAATG CCACCATTAA TTAAGTTGTG CAAATATTTT GTTTTATGGA CAAACGTGAT 2520 GAAGGAAAAG TTCTGTTCCA AATATGATGT CGGCTCTTCG GCTCTTGTGG AAGCCTATTT 2580 CAAGGATTTA AAAAACACGG ACATGAGCAT ATTCCACCGA CCAGTGAGAG CGGATAAATT 2640 CGTGGTGCAA CATATCCGAT GCATCGAAGC TGTTTGCAAG CTGGAACGAG CCGCGATGAA 2700 ACGCAAGACC GTTAAAACTC CCAGCTTTAT AAAAGAAAAC GCTCCTAAGA AAATGTGCAG 2760 TAAGGAAACC AAGGGATTTC TGGAGGAAAT ACTTGAAGAA AGCGAAGTGG AATACCTTTT 2820 ACAAGAAGAA AACTGGAAGG TGAAGAATAA AACAATAAAG CCCACGGAAG GAAATGATGC 2880 TGAAGACAAC GACACTGATG ATGAAAACAA GGAAATGGAT TTAAGTGAAC AGCCCAAAGA 2940 AAAACCAAGG GGAAAATATC TCAAAAAATG CCCCAATGTG GAGTTATTAT ACAATCGACC 3000 ACATCGAAGG AAACAGGACG AAATTTTGCA TAATGGTGGA TCAATGGGAC CCGTCTGGAT 3060 TGGCAAACAA TTATTGCAAT TCAAAAATAC TTGTCCGTTT GACTCTCTAG TGGAAATATT 3120 GTCGACCGCA TACATAGACA ATTTTTATTA CAAAAGCCTA TTGGATGATT TCTACACTGA 3180 CAACTTGACG ATAGAATTGG TGAAAAAGTA TGCCGTCGAG GGAGTTTCGT CCAGTCTCTA 3240 CTGCGACAGA GGTCTGGTCC TAAAAAGTTT TTTTGATGAA AAACACCAGA TTATAAAATG 3300 CGACGCAAAT ATTGGGTCTT TTATTGAAAA AGCGCTGAAT GGAGTACCCA GTGCGTCAAG 3360 TCATCGGACC CATATAAAAA ACAACCATGA TTGCAGGAAC CAAAAATATA TCCACCATCG 3420 GCTGGAGGTT ATAGATGTCG AAAAAGTTGG CCACCTCGAC GTCCAGGAGG TAGTGATCCC 3480 CTTTATTGAT GAGTTTTTTG CAAGAACTGA TGGAGAATGT AAAATATGCG GTGGACAACA 3540 GATCCTTGAA AGGCAGCCAG GACCGCATGT CATACTTGAT ATAGAATTTG CAATGGATGC 3600 TTTTCATCAA ATTCATCATA ACGGTTTACC AGGAACGACC ACTTTACTTC AAGTGCCGGA 3660 GGAAATTTTA ATACAGGAAA AGAAATATAT TTTAAGTGGT GCCATCGAAT ATGTTCCTGC 3720 GATGGGAGGG GAAATTGGAC ATTACATTGC ATATTGCCGC AGAGTCATTG GATCTTGGGA 3780 AGTGCACAAC GATATGTGCA GGCAATGGAA AAAGTTCTCA GCTCTAAATA CCAAAATGAC 3840 ACTCCACATT TTGATATACA CCCGGAAAAA TTAATGTTTA TTTTTAAGCC TTGTTTAAAA 3900 GTGTAAAAAA TATTTGTTGT TAAAAATTAC AATCTTAAGT CCTTTGCAAA CGTTGTTTAA 3960 AAATAAAATT AAATTAATTA TTTTACAAAA CTTAACCCTT TTTCACTTTT ATACCTAATA 4020 TAAAGAGGTC CGTAAAGTAT CAAGGAGGAG AGCGATTTTC AAATACCGAC AAGTGTTTTA 4080 GATTTTATAG AGGATTCTGA CCTGCCATGA AAAACCCATT CTTAAAAAAT TTAACACTTT 4140 GTCACAGGTA AAAAATTGGA CCCTATCATA AAGTGAGGTT TGAAAATTAT GTAATTACCT 4200 GGTAAACTGT AAATTACAAG ATTGGCAATC GGAACCAATT TTTGGTCTAT ATAAACCCAG 4260 AAACACCTGT GCGTCTGCAC GTGTTATGTA GGCAGATCCT AAAACTAGGA AAGTGGCACG 4320 TGTTTATATG GTGGGCAATA GAATTTA 4347 // ID DMTNFB standard; DNA; INV; 1106 BP. XX AC V00246; J01084; XX DR FLYBASE; FBte0000288; Dmel\FB. XX FT source V00246:1..1106 XX CC Derived from V00246 (g8708) (Rel. 36, Last updated, Version 3). CC Josh Kaminker 2 Aug 2002. CC Any changes to original sequence record are annotated in an FT line. XX SQ Sequence 1106 BP; 340 A; 228 C; 119 G; 419 T; 0 other; AGCTCAAAGA AGCTGGGGTC GGAAAAATCG AATTTTTGAA ATTTGAAAGC TGGAATCGTT 60 TGCCCATTTT TTGCCCATGT TTGCCCACCA ATTAGTTTTT TTTGCCCACG TCCAGTTTTT 120 GAGATATGGA TTTTCGAAAA AGTTCGAAAA TGTTCGAAAA TCAAAAATTT CGCTTTTTTC 180 AAATTTTTTT TTTTTTAAAT CGCAATAACA TCGTTTGCCC ACGTTTGCCC ACCCTTTAGA 240 ATTTTGAAAA AATTTATACT TTAGAAAATA TAAGGCTTTT AAGTTTACCT CGGTCTAATC 300 AGAGAGTAAA TCGTTTGCCC ATCTCTTAAA ACCAAATATT ATCAACAAAA AACGTTTGCC 360 CAACCATTAT TATTAGTTTT TATCGTTTGC CCACCCTTTA AAAAACCTTT AACAAAATTT 420 TTTTTTCGAT TGCCCACACT TGAAATACAA CCAATTTCGT TAGCCCACCT CTTCAAAATA 480 AATATTTCCA ATAAAAAACG TTTTCCCACC ATTTAAAAAT AAATAATTTC GATTGCCCAT 540 CCTTCAAAAT TCATTTTAAC GTTTGCCCAC CCTTTAAAAT TTGTTTTTTT CGTTTGCCCA 600 CTCTTAAAAC TAAATAATTT CGATTGCCCA CCTTTTAAAA CTAAATAATT TCGTTTGCCC 660 ATCCTTTAAA ATTCATTTTT AACGTTTGCC CACCCTTTAA AAATAAATTA TTTCGTTTGC 720 CCACCCTTTA AAATTTGTTT TTTTCGTTTG CCCACTCTTA AAACTAAATA ATTTCGATTG 780 CCCACCTTTT AAAACTAAAT AATTTCGTTT GCCCATCCTT TAAAATTCAT TTTAACGTTT 840 GCCCACCCTT TAAAAATAAA TTATTTCGTT TGCCCACCCT TTAAAAGTTT TTTTTTTTCG 900 TTTGCCCACT CTTAAAACTA AATAATTTCG ATTGCCCACC TTTTAAAACT AAATAATTTC 960 GTTTGCCCAT CCTTTAAAAT TCATTTTTAA CGTTTGCCCA CCCTTTAAAA TTTGTTTTGT 1020 AAGATGTGGC GCCAATTCAG ATATTTTAGG ATCGGCGGAT AGAAGCACTT ACTTATATGA 1080 TGATGATGAA CATACATAGA CATAAT 1106 // ID DMREPG standard; DNA; INV; 4346 BP. XX AC X06950; XX DR FLYBASE; FBte0000657; Dmel\G-element. XX FT source X06950:1..4346 FT SO_feature CDS ; SO:0000316:220..951 FT /name="Dmel\G-element\ORF0" FT /db_xref="FLYBASE:FBgnXXXXXXX" FT SO_feature CDS ; SO:0000316:819..1539 FT /name="Dmel\G-element\ORF1" FT /db_xref="FLYBASE:FBgnXXXXXXX" FT SO_feature CDS ; SO:0000316:join(1530..1858,1866..1973,1982..2719,2727..3008,3012..3800,3806..3991,4006..4095) FT /name="Dmel\G-element\ORF2" FT /db_xref="FLYBASE:FBgnXXXXXXX" XX CC Derived from X06950 (g8427) (Rel. 16, Last updated, Version 1). CC Takis Benos and Michael Ashburner, 20-Aug-1997. CC Any changes to original sequence record are annotated in an FT line. XX SQ Sequence 4346 BP; 1215 A; 1356 C; 959 G; 816 T; 0 other; ACAGTCGCGA TCGAACACTC AACGAGTGCA GACGTGCCTA CGGACCGACG GCAAGTTATT 60 TTCGTGCTCA AAGTCCCGCT ACTCTAAAAC CGCTACGTAG TGTCGCGAGA TTTCTTCGCG 120 CACCGTGATT GGTTCAGCCG GCGAACCTTA CGGTATCGCT ACCACTACCA ACGCACTCGT 180 GCGTGCGTGT TATCGGTATC AACAGTTACA TTCGGCTAAA GTTACTGCGA ACAACTCAGC 240 AGCAGCCACG TGCTGAGGCT GGTACACCAA CAAACGGTTC CTACCGTGCC CTCCTCCCCT 300 CCTTCCCTAC TCCGGGACAA CATGGACTGG CAAGCCCCCC CGCGACCCAC CAAGCTGACC 360 AAAGTGCCTA GAAAGAAGGC GCTCAAAGAG GCGCCAGGAG AAGGTGAAAG CAGCTGCTCA 420 AGCGATAGCA GCTCCTCGGA GTCAGAGCCT GGGGAAGTCA AGCGCAAAGC AGCGAGCAGA 480 GACGCTAAGG AAGCCGCCGA CAACGTGCCC AACACCAGCG CAGCTCTGCG CAAGAAGCTG 540 GAAAATAACT CCTTCGCCCT TCTGTCCAGC ACTGAGGACG AAGACGATGA CGACGACAAC 600 ACCGACAACG AGCAGCAAAC CCCTGTTGGG GAATCTGCTC CAAAAACCAT GAAAAAACCC 660 AACCCGACCC CGAAGACCAT CAAGCCACCC CCGATCTACA TCCCAGACGT GACCAACATC 720 TCAGCCCTTG TCAGGATGAT TACGACTCTC GTCGGTGCCC ACAAGGAATT CTCGTACAAA 780 ACTGAGAGAA ACAACAATGT ACGAGTAATG ATGCCTGACA AGGAATCCTA CTCAGCCTTT 840 CGTCAGCAGC TTGTGACCCA GAACAAAAGG CACCGCACAT TTCAACTGTC AGGGACCTGC 900 ACAACCCAAT TGGCAAAAAA TCAAAGGAAC CCCTGGGGAT CTTCTTTGTA AACCTGGAAC 960 CTGCGAGCAA CAATACAGAC ATCTACAAAC TCAAGAGAAT CTGCAGGTCG GTCGTCACCG 1020 TTGAGCCGCC TCTGAAATTC AACGATGTTC CGCAGTGCTT CAGATGTCAA GGGTTCGGAC 1080 ACACCCAGCG CTACTGCTTT TTAGAGTTTC GCTGCGTCAA GTGTGGTGGC CTCCACGACT 1140 CCAGGGCGTG TGAAAAAAAG GAAGACGAGA AAGCATGCTG CCTACACTGT CAAGCCGACC 1200 ATCCAGCGTC GTTCAAAGGG TGCCCCGCGT ATAAGAAGGC AAAGGCTCAA CAAGCTCCTA 1260 AACCCAAAGC AAGGAGCATG GAAAGCAACA ACAAGCCCTC CTTTGAGCTC CCAAATATTA 1320 CAAACGGTAT GAGCTATAGA GACGCGCTAA GTGGCACACG CAAGTCCCAA GCAAGCACTC 1380 CCCCACCGAC ACCCCCAACC CCACCTGAAG CCCCACAACC TAACCACATG GAGGCTATGT 1440 TCACTCGATT TGAGAGCCTG GTCGAAAGAA TGATGGAGAA GATGTTTGCT CAGGTGACGC 1500 AGCTTGTTGC TTCCATCCTC AACAGCAAGT CATGCAAATA AGTCTCAACA TAGTCTTCTG 1560 GAACGCGAAC GGCTTGCAGA GAAGCAAAGC CGAAGTTGAG CACACCATCA AAACCGACAA 1620 CATCGATATT TTATTGGTCT CAGAATCCCA TTTTTGCCCC AGATCCCACT TCATCATCTC 1680 CGGTTACGAC CTCATCACAG CCAACCACCC ATCAGGTAGA GCTCGAGGAG GAGCGGCCAT 1740 GCTCATCAAA AGCGGCATAC AGTTCACTGA ACTGCCTGCG ATACAGGAGG ATTGGGCACA 1800 GTGTGCAGTG GCCAGAGTCA ATAGCCTACA GGGAGATATT ACGGTTGGAG CGGTTTACTT 1860 CCACCCCCAG GCACGCGATT ACAGAGACTC ACCTGCATGA GTTCTTCGAG TCCCTCGGAA 1920 CTCGCTTCAT TGCAGCCGGA GACTTCAATG CAAAGCACTC CTGGTGGGGG TCCGCACAAA 1980 CAACCCCAAA GGCAAAACGC TCCACAAGTA CCTGATGCGC AAAAACTTGG ACTGCCACTC 2040 TACTGGAGAG CCCACACACT GGCCCTCGGA CCCTTCTAAG CAGCCGGATC TGCTGGACAT 2100 CGCGATCTGC AAAGGCATAG GTCGTGCCAA ACTCGTCTGC ACTACATACG ACAGGCTCGT 2160 ATCGGACCAC AGCGCCGTCA ACCTGCTCCT CAACATCCCT GTCCTCAGGA AGACGCCGCT 2220 CCGTAGACTC ACGGGGAATC GCACCAATGC CCCCAAGTTC ACGTTCTGGA TGCTCTCCTC 2280 CCTAAACCCA GACCCAGACC TCTCCACTCC AGGCAATATA GGCGCGGCCA TCGAAAAACT 2340 GAACAAGGAG ATGCACAACG CCGCTGAGTT TGCGAACCCT CCTCCTCCTA CAACCCCGAG 2400 AACTCCCGCA AGAGACCTGC ATTTGTGGTC CCCAGAAATC GCCGCCCTCG TGGCCGAGAA 2460 GAGACGCCTC AGACGAGTAT GGTTCCTCTC GCGTAACCCC AGGGACAAGA CAGCGCTCAA 2520 TCGCGCCTCC AAGGAACTCA AGGACAAACT AACCACCCTA CGCCAAGACT CGTTTCAACG 2580 ATTCCTTGAA GATCTGGAAC CTGGAGACCC GCAGCACAAC CTGTGGATCG TCACGCGGCA 2640 CATCAAAAGA CCCGCCAAGA AAATGGTACC AGTGCGTACA GCAGACTGCT CCTGGTGTCG 2700 GTCTGAGGCA GAAAGAGCCG AAGCTTGCTG ACCACCTTCG CTCTGCCTTC ACTCCGTTTG 2760 ACCGATGCAC AGCTGCAGAG CAAGCTGACA CCATCAGAGC TGTTGAAAGC CCATGTGCTC 2820 CAGGACCTGC AATTCAGCCC GTCGCACCAG AGGAGATCGC GCAGGAAATT GCCTCGCTCA 2880 GAAACGGCAA GTCTCCCGGC CCTGATCGCA TCGACGCTAC TGCGTTAAAA ATGTTGCCCA 2940 CATTCTGCTC ACAGCTGCTT GCCAACATTT TTAACAGCTG CTTCCGGCTA GGGTATTTCC 3000 CAAAACAATA GAAACGCGCC GAAGTGATTA CCATCCCCAA GCCCGGCAAA CCTGAAGCCA 3060 ATCTTGCCTC CTATCGTCCG ATAAGTCTGC TGGCAATCCT CTCCAAAATA CTCGAAAGAG 3120 TATTTCTGCG CAGAGTGCTG CCAGTACTGG ATGAGGCTGG TTTGATCCCC GATCACCAGT 3180 TTGGCTTCAG GCGCTCCCAC GGAACACCAG AGCAATGCCA CCGGCTTGTA GAGCAAATTT 3240 TGGAGGCCTT CGAAAGGAAG CAATACTGCT GCGCCGTCAT GCTGGATGTG AAGCAGGCCT 3300 TCGACAAAGT CTGGCACCCT GGACTCCACT ATAAAATCAA GACTCACCTT CCCGGATCCC 3360 ACTTCGCCTT CCTCAAATCA TTCACTGAGG GTAGAGAGTT CCAAGTTTGC TGCGGAACAG 3420 CGACCAGCAC GCCTAGGCCG ATAAGAGCCG GAGTACCCCA AGGCAGCGTC CTTGGACCAA 3480 TACTGTACAC ACTCTACACA GCAGACCTTC CTATCACACC CTCCCGGAGC CTAACAGTGG 3540 CCACATATGC CGATGACACC GCCTTCCTAG CCTCCGCCTC AGACCCCCAA GAAGCATCAA 3600 CCATCATTCT AAGCCAGCTG GATGCCCTCG ACCCATGGTT GAAACGATGG ACCATTGCCG 3660 TGAACGCAGA CAAATCCTCC CAAACCACTT TCTCCCTGCG CAGAGGAGAC TGCCCCCCAG 3720 TCACGCTCAA CGGGGAAACT ATTCCAACCT CAAGTTCCCC GAAATACCTT GGATTGACTC 3780 TAGACCGGAG GCTCACTTGG CACACCAGGC TGACCTGCGC CTCAAGCAAC TCCACTGGCT 3840 CATCGGGAAA AGGTCCAAAC TTAGGGAAAA CCTTAAACTC CTCCTGTACA AGGCCATCCT 3900 GAAGCCAATT TGGACTTATG GGATTCAGCT GTGGGGCACT GCCAGCATCT CAAACCGCAA 3960 CCGCATACAG CGCTTCCAGA ACAAGTGCCT GAGTCAATCG CTGACGCTCA CCCATACCAT 4020 GAAAACTCCG TTATCCACAA GGAGCTTGGA ATGCCATGGG TAGCAGAGGA GATCTCCCGC 4080 TTCAGCGAGA GATACGCTAA ACGACTGGAC AACCACCCTA ACCATCTGGC TATTAACCTC 4140 CTGGACAACA GTGAAACCAT CAGACGCCTC CAGAGGAAAC ACCCGCTTGA TCTCCACCAC 4200 CTATAACCCA CAACAATGAA CCCCCGACCA ATCTACAACT TTGTAATCCC TTAAGTTAAT 4260 GCCCCCCCCA CCCAAACATT TAATTATTGT CCACATGGAC AGATTTTAAA TTAATACATA 4320 GATCGCTAAA AAAAAAAAAA AAAAAA 4346 // ID DMGYPF1A standard; DNA; INV; 7469 BP. XX AC M12927; XX DR FLYBASE; FBte0000021; Dmel\gypsy. XX SY synonym: mdg4 XX FT source M12927:1..7469 FT SO_feature five_prime_LTR ; SO:0000425:1..482 FT SO_feature three_prime_LTR ; SO:0000426:6841..7411 FT SO_feature polyA_site ; SO:0000553:7277..7280 FT SO_feature primer_binding_site ; SO:0005850:482..492 FT /bound_moiety="tRNA:lys2" FT SO_feature CDS ; SO:0000316:1080..2435 FT SO_feature start_codon ; SO:0000318:1..3 FT /name="Dmel\gypsy\gag" FT /db_xref="FLYBASE:FBgn0014965" FT /db_xref="SWISS-PROT:P10405" FT /db_xref="NCBI_PROTEIN:AAA70218.1" FT /translation="MSWAHNYRKVKVEYESEDSWEEEQVGQALGRPLDSATVDITMDPN FT QIQALIDNAVRQALSQQQSQFQTQLNSLAARVQSLQVEAPQIKIYEKVSVNPDVRCDIP FT LDIIKSVPEFSGTQDEYVAWRQSAIYAYELFKPYNGSSAHYQAVAILRNKIRGAAGALL FT VSHNTVLNFDAILARLDCTYSDKTSLRLLRQGLEMVRQGDLPLMQYYDEVEKKLTLVTN FT KIVMTHEQEGADLLNAEVRADALHAFISGLKKALRAVVFPAQPKDLPSALALAREAEAS FT IERSMFANSYAKAVEERAHSGANGKSRFQGKPNKEEQGQDRNPHFTKRPKNNGQTNKDT FT QAQAPQPMEVDSSSRFRQRTEHYQNHPNESNAFKRRNSSERSTGPRRQRLNNVVQEAPK FT QKDPKEEYEKTAKAAVEEIDSENEYAPSDDSLNFLGGAPGCRSLNDGWLGEP" FT SO_feature CDS ; SO:0000316:2438..5470 FT SO_feature start_codon ; SO:0000318:1..3 FT /name="Dmel\gypsy\pol" FT /db_xref="FLYBASE:FBgn0014966" FT /db_xref="SWISS-PROT:P10401" FT /db_xref="NCBI_PROTEIN:AAA70219.1" FT /translation="MLIDTDAAKNYIRPVKELKNVMPVASPFSVSSIHGSTEIKHKCLM FT KVFKHISPFFLLDSLNAFDAIIGLDLLTQAGVKLNLAEDSLEYQGIAEKLHYFSCPSVN FT FTDVNDIVVPDSVKKEFKDTIIRRKKAFSTTNEALPFNTAVTATIRTVDNEPVYSRAYP FT TLMGVSDFVNNEVKQLLKDGIIRPSRSPYNSPTWVVDKKGTDAFGNPNKRLVIDFRKLN FT EKTIPDRYPMPSIPMILANLGKAKFFTTLDLKSGYHQIYLAEHDREKTSFSVNGGKYEF FT CRLPFGLRNASSIFQRALDDVLREQIGKICYVYVDDVIIFSENESDHVRHIDTVLKCLI FT DANMRVSQEKTRFFKESVEYLGFIVSKDGTKSDPEKVKAIQEYPEPDCVYKVRSFLGLA FT SYYRVFIKDFAAIARPITDILKGENGSVSKHMSKKIPVEFNETQRNAFQRLRNILASED FT VILKYPDFKKPFDLTTDASASGIGAVLSQEGRPITMISRTLKQPEQNYATNERELLAIV FT WALGKLQNFLYGSREINIFTDHQPLTFAVADRNTNAKIKRWKSYIDQHNAKVFYKPGKE FT NFVADALSRQNLNALQNEPQSDAATIHSELSLTYTVETTDKPLNCFRNQIILEAARFPL FT KRNLVLFRSKSRHLISFTDKSWLLKTLKEVVNPDVVNAIHCDLPTLASFQHDLIAHFPA FT TQFRHCKNVVLDITDKNEQIEIVTAEHNRAHRAAQENIKQVLRDYYFPKMGSLAKEVVA FT NCRVCTQAKYDRHPKKQELGETPIPSYTGEMVHIDIFSTDRKLFLTCIDKFSKYAIVQP FT VVSRTIVDITAPLLQIINLFPNIKTVYCDNEPAFNSETVTSMLKNSFGIDIVNAPPLHS FT SSNGQVERFHSTLAEIARCLKLDKKTNDTVELILRATIEYNKTVHSVTRERPIEVVHPG FT AHERCLEIKARLVKAQQDSIGRNNPSRQNRVFEVGERVFVKNNKRLGNKLTPLCTEQKV FT QADLGTSVLIKGRVVHKDNLK" FT SO_feature CDS ; SO:0000316:join(567..568,5551..7000) FT SO_feature start_codon ; SO:0000318:1..3 FT /name="gypsy\env" FT /db_xref="FLYBASE:FBgn0014964" FT /translation=" FT MFTLMMFIPLVVANARITDFSHANYIPVLDGDVLVFEQRDLLKHSSNLSE FT YASMIDETQKLSESFPHSHMRKLLEVDTDHLRTLLSVLKVHHRIARSLDF FT LGTALKVVAGTPDATDLFKIKITEAQLVESNSRQIAINSETQKQINKLTD FT TINKVINARKGDLVDTPHLYEALLARNRMLSTEIQNLILTITLVKSNIIN FT PTILDHADLKPLVEQDTPIVSLIEASKIRVLQSENSIHILIAYPRVKFSC FT KKVAVYPVSHQHTILRLDEDTLAECEHDTFAVTGCTDTTHFTFCERSRRE FT TCVRSLHAGNAAQCHTQPSHLREINPVDDGVVIINEAAAHVSTDGSPETL FT IEGTYLVTFERTATINGSEFVNLRKTLSKQPGIVRSPLLNIVGHDPVLSI FT PLLHRMSNENLHSIQNLMDDVESEGSPRLWFVAGVVLNFGLIGSLALYLA FT LRRRRASREIQRTIDTFNMTEDGHKLEGGVVNN" XX CC Derived from M12927 (g157583) (Rel. 44, Last updated, Version 6). CC Takis Benos and Michael Ashburner, 20-Aug-1997. CC Any changes to original sequence record are annotated in an FT line. CC [See also:AF033821; alignments in /alignments/gypsy] XX SQ Sequence 7469 BP; 2301 A; 1808 C; 1602 G; 1758 T; 0 other; AGTTAACAAC TAACAATGTA TTGCTTCGTA GCAACTAAGT AGCTTTGTAT GAACAATGCT 60 GACGCGCCAG AATTGGGTTC AACGCTCCAC GCGAAGAATG CCTGGCAGCG GAAAGCTGAC 120 ACTTCCTACC GGGAGTGTTG CTTCACGCTG CAAGAAATGC TGAGTCGGCT TGCCGACTTG 180 TGGCGGCGCG ATGCATTGCT CGAGGGTAAA CTTAGTTTTC AATATTGTCT TCTACTCAGT 240 TCAAATCTTG TGTCGAAATA AACCACAGCT TGCTCCGGCT CATTGCCGTT AAACATCATT 300 GTTCTTATTT ACAATCAAAT CGCTATCGCC ACAAGGCTAG TGATAATAAC TAAGGGGGCG 360 AAGTCAAGCC CTCCAACCTA ATCTCCATAA ACAGTGTCTA AGACGAACCT CAGCGAAAGA 420 AGGAAGATCT CTAGACCTAC TGGAAATAAC ATAACTCTGG ACCTATTGGA ACTTATATAA 480 TTGGCGCCCA ACCAACAATC TGAACCCACC AATCTAATTT AACACACTTT GTCAGGCGAC 540 AAACAGGGTA GTTAAGTTAG AAAAGCATGT AAGTTTTACA AGACACTTCT TTGACGCAAT 600 CAAGAAATTT ACGAGTGAAA AAAAAAAAAA AAAAAAGTTG TGTATCTGGC CACGTAATAA 660 GTGTGCGTTG AATTTATTCG CAAAAACATT GCATATTTTC GGCAAAGTAA AATTTTGTTG 720 CATACCTTAT CAAAAAATAA GTGCTGCATA CTTTTTAGAG AAACCAAATA ATTTTTTATT 780 GCATACCCGT TTTTAATAAA ATACATTGCA TACCCTCTTT TAATAAAAAA TATTGCATAC 840 TTTGACGAAA CAAATTTTCG TTGCATACCC AATAAAAGAT TATTATATTG CATACCCGTT 900 TTTAATAAAA TACATTGCAT ACCCTCTTTT AATAAAAAAT ATTGCATACG TTGACGAAAC 960 AAATTTTCGT TGCATACCCA ATAAAAGATT ATTATATTGC ATACCTTTTC TTGCCATACC 1020 ATTTAGCCGA TCAATTGTGC TCGGCAACAG TATATTTGTG GTGTGCCAAC CAACAACCAA 1080 TGAGTTGGGC ACATAACTAC AGAAAGGTTA AGGTCGAATA CGAAAGCGAG GATAGCTGGG 1140 AGGAGGAGCA AGTAGGCCAA GCATTAGGTC GGCCGTTAGA TAGTGCCACG GTAGATATTA 1200 CCATGGACCC CAATCAGATT CAAGCTCTTA TCGACAATGC TGTCAGACAG GCATTGTCGC 1260 AACAGCAATC CCAATTTCAG ACACAACTCA ATTCCCTAGC TGCGCGGGTA CAGAGTTTGC 1320 AGGTGGAAGC ACCGCAAATC AAGATTTACG AAAAAGTCTC TGTTAACCCC GATGTTAGGT 1380 GCGACATTCC CCTTGACATA ATAAAGTCTG TACCAGAGTT CTCCGGTACC CAAGACGAGT 1440 ATGTGGCCTG GAGACAATCG GCCATATACG CCTACGAGCT CTTCAAACCA TACAATGGCA 1500 GCAGTGCCCA TTATCAGGCT GTTGCCATAT TAAGGAATAA AATCCGTGGC GCAGCCGGGG 1560 CTTTACTGGT CTCCCACAAT ACGGTATTGA ACTTCGATGC TATTTTGGCC AGACTAGACT 1620 GCACGTACTC GGACAAAACA TCCTTACGCC TGTTGAGGCA AGGATTGGAA ATGGTTAGGC 1680 AAGGAGACCT ACCACTAATG CAATACTACG ATGAAGTTGA AAAGAAGCTA ACGCTTGTCA 1740 CTAACAAAAT CGTAATGACG CATGAACAAG AGGGTGCTGA CCTGCTTAAC GCTGAGGTCA 1800 GAGCCGACGC CCTGCATGCT TTTATTTCGG GGCTCAAAAA GGCCCTCAGA GCTGTGGTCT 1860 TCCCGGCCCA ACCAAAAGAC CTGCCATCTG CACTGGCTTT AGCTAGAGAA GCAGAGGCAA 1920 GCATAGAGAG AAGCATGTTC GCTAACTCCT ACGCCAAGGC CGTAGAGGAG CGAGCGCATT 1980 CGGGGGCAAA CGGCAAGAGC CGTTTCCAGG GGAAGCCAAA TAAAGAAGAA CAGGGACAGG 2040 ACAGGAATCC CCACTTCACC AAACGCCCCA AAAATAACGG ACAAACCAAC AAGGACACTC 2100 AGGCGCAAGC ACCCCAGCCA ATGGAGGTCG ATTCATCCTC CAGGTTTAGG CAGCGTACTG 2160 AACATTATCA GAATCATCCT AACGAGTCGA ACGCGTTTAA GAGGAGAAAT TCCTCAGAAC 2220 GCTCAACAGG ACCGAGACGA CAACGTCTGA ATAACGTTGT CCAAGAGGCC CCTAAACAAA 2280 AGGACCCCAA AGAAGAGTAT GAAAAAACAG CAAAGGCTGC AGTCGAGGAA ATCGACAGCG 2340 AAAATGAGTA CGCTCCCAGT GACGACTCGT TGAATTTTTT AGGGGGCGCT CCCGGTTGCC 2400 GTTCATTGAA CGACGGCTGG CTGGGAGAAC CTTAAAGATG CTAATCGATA CCGACGCGGC 2460 AAAAAACTAC ATTAGGCCCG TAAAGGAGCT GAAAAATGTA ATGCCGGTCG CCAGCCCTTT 2520 CTCGGTGAGC TCAATACACG GCTCCACCGA AATCAAACAC AAATGCTTGA TGAAAGTCTT 2580 CAAGCACATC TCCCCATTTT TTCTTTTGGA TTCTCTCAAT GCGTTCGACG CTATCATAGG 2640 CTTGGACCTG TTAACACAGG CCGGGGTAAA ACTCAACCTT GCAGAGGACT CCTTAGAATA 2700 CCAGGGCATC GCTGAAAAGC TTCATTATTT CAGCTGCCCC AGTGTAAATT TCACTGATGT 2760 AAACGATATT GTTGTACCTG ACTCCGTTAA AAAGGAGTTC AAGGACACAA TAATAAGGAG 2820 GAAGAAAGCT TTCTCCACAA CAAATGAAGC TCTTCCTTTT AACACCGCTG TCACTGCCAC 2880 AATTCGGACA GTTGACAATG AACCGGTGTA CTCAAGAGCG TACCCAACTC TTATGGGTGT 2940 CTCCGACTTT GTGAACAACG AGGTCAAACA ACTGCTGAAA GACGGCATTA TCAGGCCCTC 3000 AAGGTCTCCC TATAACAGCC CGACCTGGGT TGTTGACAAA AAGGGGACCG ACGCCTTCGG 3060 GAACCCAAAC AAGAGGTTGG TCATTGACTT CAGGAAGCTA AATGAGAAAA CTATTCCTGA 3120 CCGGTACCCG ATGCCTAGCA TTCCCATGAT TCTAGCGAAT CTGGGCAAGG CAAAGTTCTT 3180 CACTACCCTT GATCTTAAGT CAGGGTATCA TCAAATTTAC CTCGCGGAAC ACGACCGCGA 3240 GAAGACATCG TTCTCGGTGA ATGGTGGTAA ATACGAGTTT TGCCGTCTAC CGTTCGGCTT 3300 GAGAAATGCA AGCAGCATTT TTCAAAGAGC CCTAGACGAT GTGCTTAGAG AGCAAATCGG 3360 GAAGATATGT TACGTCTATG TAGATGACGT CATAATTTTC TCTGAAAACG AGTCCGACCA 3420 TGTCCGCCAC ATCGATACAG TACTAAAATG CCTGATCGAT GCCAACATGA GAGTAAGCCA 3480 GGAGAAAACT AGATTCTTTA AAGAGAGTGT AGAATACCTC GGCTTTATTG TCAGTAAGGA 3540 CGGAACTAAA TCCGATCCAG AGAAGGTGAA GGCCATTCAG GAGTACCCTG AACCAGACTG 3600 CGTTTACAAG GTTAGGTCCT TCCTTGGTTT AGCCAGCTAC TACAGAGTCT TCATCAAAGA 3660 CTTTGCTGCC ATAGCCCGCC CGATCACCGA TATCCTAAAA GGGGAAAATG GTTCGGTGAG 3720 CAAACACATG TCTAAAAAAA TTCCTGTTGA GTTTAATGAA ACTCAACGCA ACGCGTTCCA 3780 AAGACTGCGA AACATACTAG CATCCGAGGA TGTCATACTC AAATACCCCG ACTTTAAAAA 3840 GCCTTTTGAC CTTACTACAG ATGCTTCGGC AAGTGGTATC GGTGCAGTCC TATCCCAGGA 3900 GGGCAGGCCA ATCACCATGA TATCGCGTAC CCTTAAACAG CCCGAGCAGA ACTACGCCAC 3960 AAACGAAAGG GAATTGCTGG CGATTGTATG GGCCCTAGGT AAGTTGCAGA ACTTCCTGTA 4020 TGGCTCTAGG GAGATTAATA TATTTACCGA CCATCAACCC CTCACTTTCG CTGTTGCCGA 4080 CAGGAACACG AATGCCAAGA TAAAGAGGTG GAAATCTTAC ATAGACCAGC ATAATGCCAA 4140 GGTTTTCTAC AAACCTGGCA AAGAAAATTT CGTGGCAGAC GCCCTCTCTA GGCAGAATCT 4200 GAATGCCTTA CAAAACGAAC CCCAATCAGA CGCTGCGACC ATTCACAGTG AGCTCTCCCT 4260 GACCTACACG GTCGAGACAA CAGACAAACC GTTAAATTGC TTCAGGAACC AGATCATTCT 4320 GGAGGCAGCA CGTTTTCCGC TCAAACGAAA CCTGGTGCTC TTTCGAAGCA AATCTCGCCA 4380 CTTAATCAGC TTTACTGATA AAAGTTGGCT ATTAAAAACA CTTAAGGAGG TGGTAAACCC 4440 TGACGTCGTG AACGCTATTC ACTGCGACCT GCCCACTCTG GCAAGCTTCC AACACGACCT 4500 CATTGCCCAC TTTCCAGCCA CCCAATTTCG TCACTGTAAG AATGTCGTGT TAGACATAAC 4560 CGACAAAAAC GAACAGATCG AAATCGTCAC TGCCGAGCAC AACCGCGCTC ACAGAGCCGC 4620 ACAAGAAAAC ATTAAACAAG TCCTTCGGGA TTATTACTTT CCCAAAATGG GCAGTTTAGC 4680 TAAAGAAGTA GTAGCTAATT GTAGGGTCTG CACCCAAGCA AAGTATGACA GGCACCCGAA 4740 AAAGCAAGAG CTCGGGGAAA CGCCCATACC CAGCTATACA GGTGAGATGG TGCATATTGA 4800 CATATTCTCA ACCGACAGGA AGCTATTCCT GACGTGTATT GACAAATTTT CTAAATATGC 4860 AATAGTGCAA CCAGTGGTGT CTAGAACAAT AGTGGACATC ACAGCACCCC TGTTGCAGAT 4920 CATTAACCTG TTCCCCAATA TCAAAACGGT CTATTGTGAC AATGAGCCCG CATTTAACTC 4980 AGAAACTGTC ACCTCAATGC TCAAGAACAG CTTCGGCATT GACATAGTAA ATGCGCCCCC 5040 ACTCCACAGC TCATCCAATG GCCAAGTTGA ACGGTTCCAC AGCACATTGG CAGAAATCGC 5100 CAGGTGCCTG AAGTTGGACA AAAAAACGAA TGACACAGTA GAACTAATCT TGAGGGCGAC 5160 GATAGAATAT AACAAAACCG TGCACTCAGT TACTCGTGAG AGACCAATTG AGGTGGTTCA 5220 CCCAGGGGCC CACGAGCGCT GCCTAGAAAT CAAGGCAAGA TTAGTAAAGG CTCAGCAAGA 5280 CAGCATCGGA AGAAACAACC CTTCCCGACA AAACCGCGTG TTTGAGGTGG GAGAACGCGT 5340 GTTTGTAAAA AACAACAAGA GGTTAGGAAA TAAGCTAACT CCACTATGCA CCGAGCAAAA 5400 AGTGCAGGCA GACTTGGGAA CGTCTGTTCT TATTAAGGGG AGGGTGGTCC ACAAGGACAA 5460 CCTCAAGTAG ACATTCCCTC TACAGTTAGG TAGTAAGTTA TGTCAAGGAA AATCCGAGCA 5520 CTGTAGTATC ACCTTGTCTT TAATTTCCAG GTTCACCCTC ATGATGTTCA TACCCTTGGT 5580 AGTAGCGAAT GCTCGGATCA CCGACTTTTC GCATGCCAAC TACATTCCTG TGTTAGATGG 5640 GGATGTGCTG GTGTTTGAAC AGCGTGACCT CTTGAAACAT TCGAGTAACC TTTCCGAGTA 5700 CGCTAGTATG ATAGATGAAA CACAGAAACT GTCCGAGTCC TTTCCCCACT CACATATGCG 5760 TAAGTTGCTA GAGGTCGATA CTGACCATCT TAGAACCTTG TTGTCCGTTC TCAAAGTCCA 5820 CCATAGGATA GCTAGGAGTC TAGATTTCTT AGGTACAGCC TTAAAGGTTG TGGCGGGTAC 5880 TCCCGATGCC ACGGACCTCT TTAAAATTAA GATCACAGAG GCCCAACTAG TAGAATCTAA 5940 TTCCAGGCAG ATAGCTATAA ACTCCGAAAC CCAGAAACAG ATAAATAAGT TAACTGACAC 6000 CATCAATAAG GTGATCAATG CCCGTAAAGG CGACTTGGTT GACACTCCAC ACTTATATGA 6060 AGCACTACTA GCAAGAAATA GGATGCTGTC TACAGAAATT CAAAATTTAA TTCTCACTAT 6120 TACTTTGGTC AAATCAAACA TTATAAATCC CACAATTCTT GATCATGCCG ACTTGAAGCC 6180 TCTTGTAGAA CAGGATACCC CAATTGTCAG CTTAATAGAA GCATCTAAGA TCAGGGTCCT 6240 CCAGTCCGAG AATAGCATTC ATATTTTAAT TGCCTATCCT AGAGTCAAGT TCAGTTGCAA 6300 GAAAGTCGCC GTCTACCCTG TATCTCACCA ACACACCATC TTGCGCCTCG ACGAAGACAC 6360 TTTGGCCGAA TGCGAACATG ACACCTTTGC GGTCACCGGA TGCACAGACA CCACACACTT 6420 CACGTTCTGC GAGCGGTCTC GGCGCGAAAC TTGCGTGCGC TCACTCCATG CTGGAAACGC 6480 TGCTCAATGC CACACTCAAC CCAGCCACTT GCGAGAAATA AACCCCGTAG ATGATGGCGT 6540 TGTGATTATC AACGAAGCCG CAGCTCACGT TAGCACTGAT GGCAGCCCCG AAACACTGAT 6600 AGAGGGAACC TACCTGGTAA CCTTCGAGCG AACGGCAACC ATCAACGGCT CTGAATTCGT 6660 AAATCTAAGG AAAACACTAA GCAAGCAGCC AGGCATCGTG CGTTCACCAC TACTTAACAT 6720 CGTCGGCCAC GACCCTGTGC TCAGTATACC TCTGCTACAC CGGATGAGTA ACGAAAACCT 6780 ACATTCCATC CAAAACCTTA TGGATGACGT GGAATCTGAA GGCTCGCCCA GACTCTGGTT 6840 CGTGGCTGGT GTGGTCCTAA ACTTCGGCTT GATTGGCTCT CTCGCCCTTT ATCTGGCATT 6900 AAGGAGAAGA CGAGCCTCTA GGGAGATACA GCGCACCATC GATACTTTCA ACATGACCGA 6960 GGACGGTCAT AAACTTGAGG GGGGAGTAGT TAACAACTAA CAATGTATTG CTTCGTAGCA 7020 ACTAAGTAGC TTTGTATGAA CAATGCTGAC GCGCCAGAAT TGGGTTCAAC GCTCCACGCG 7080 AAGAATGCCT GGCAGCGGAA AGCTGACACT TCCTACCGGG AGTGTTGCTT CACGCTGCAA 7140 GAAATGCTGA GTCGGCTTGC CGACTTGTGG CGGCGCGATG CATTGCTCGA GGGTAAACTT 7200 AGTTTTCAAT ATTGTCTTCT ACTCAGTTCA AATCTTGTGT CGAAATAAAC CACAGCTTGC 7260 TCCGGCTCAT TGCCGTTAAA CATCATTGTT CTTATTTACA ATCAAATCGC TATCGCCACA 7320 AGGCTAGTGA TAATAACTAA GGGGGCGAAG TCAAGCCCTC CAACCTAATC TCCATAAACA 7380 GTGTCTAAGA CGAACCTCAG CGAAAGAAGG AAGATCTCTA GACCTACTGG AAATAACATA 7440 ACTCTGGACC TATTGGAACT TATATAATT 7469 // ID DMHFL1 standard; DNA; INV; 2959 BP. XX AC M69216; XX DR FLYBASE; FBte0000154; Dmel\hobo. XX SY synonym: H-element XX XX FT source M69216:1..2959 FT SO_feature terminal_inverted_repeat ; SO:0000481:1..12 FT SO_feature terminal_inverted_repeat ; SO:0000481:2948..2959 FT SO_feature TATA_box ; SO:0000174:107..112 FT SO_feature polyA_signal_sequence ; SO:0000551:2382..2394 FT SO_feature CDS ; SO:0000316:316..2292 FT SO_feature start_codon ; SO:0000318:1..3 FT /name="Dmel\hobo\T" FT /db_xref="FLYBASE:FBgn0014191" FT /translation=" FT MAPYIMIVEFLCLWSSVSAVNCPFFVFYDAITSLLGFSIIWKPKEKVTIM FT AEAADFVKNKINNGTYSVANKHKGKSVIWSILCDILKEDETVLDGWLFCR FT QCQKVLKFLHKNTSNLSRHKCCLTLRRPTELKIVSENDKKVAIEKCTQWV FT VQDCRPFSAVTGAGFKNLVKFFLQIGAIYGEQVDVDDLLPDPTTLSRKAK FT SDAEEKRSLISSEIKKAVDSGRASATVDMWTDQYVQRNFLGITFHYEKEF FT KLCDMILGLKSMNFQKSTAENILMKIKGLFSEFNVENIDNVKFVTDRGAN FT IKKALEGNTRLNCSSHLLSNVLEKSFNEANELKKIVKSCKKIVKYCKKSN FT LQHTLETTLKSACPTRWNSNYKMMKSILDNWRSVDKILGEADIHVDFNKS FT SLKVVVDILGDFERIFKKLQTSSSPSICFVLPSISKILELCEPNILDLSA FT AALLKERILENIRKIWMANLSIWHKAAFFLYPPAAHLQEEDILEIKVFCI FT SQIQVPISYTLSLESTETPRTPETPETPESLESPNLFPKKNKTISSENEF FT FFPKLVTESNSNFNESPLDEIERYIRQRVPLSQNFEVIEWWKNNANLYPQ FT LSKLALKLLSIPASSAAAERVFSLAGNIITEKRNRLCPKSVDSLLFLHSY FT YKNLNNSQ" XX CC Derived from M69216 (g157606) (Rel. 41, Last updated, Version 3). CC Takis Benos and Michael Ashburner, 20-Aug-1997. CC Any changes to original sequence record are annotated in an FT line. CC CDS annotation from Lynn Crosby's annotation 'H-element.v004'. XX SQ Sequence 2959 BP; 994 A; 541 C; 571 G; 853 T; 0 other; CAGAGAACTG CAAGGGTGGC ACTTTTTTAC CACTCGACTC ACACCCTACA ATTTTGTGTG 60 CGGGTGCTAC TCGCCACGCA CATCGCGGGT ACTTACAAAC ACACAGTATA AATCTGAACA 120 TGCAGACAAG ACACCCCGTT GTGTGCGCAC CCGAATCAAT ACGGTGTTTT GCGTCGCGGG 180 TGCCGCTCAC ACAGTGCCTA AAAAGGGATG AGTGAGAAAA ACACTTGTGG GTATACCGTT 240 AAACACATGG GTGTTTCCAA AAATACTCGG GTGTTTCCAA AAATACTCGA GTGGTCTCGT 300 AGGTAGTCGA GTCAAATGGC GCCATACATA ATGATTGTTG AGTTCTTGTG TCTTTGGTCC 360 AGTGTCTCGG CTGTTAATTG CCCCTTTTTT GTTTTTTACG ATGCAATTAC TAGCTTGTTA 420 GGATTCAGTA TTATTTGGAA GCCAAAGGAA AAGGTCACAA TAATGGCAGA AGCGGCTGAT 480 TTCGTTAAAA ATAAAATTAA CAATGGAACA TACTCAGTTG CCAATAAACA TAAAGGAAAA 540 AGTGTTATTT GGAGCATTTT ATGTGACATT TTAAAGGAAG ATGAAACTGT TCTGGACGGA 600 TGGCTGTTCT GCAGGCAATG CCAGAAAGTG CTCAAATTTT TACACAAAAA CACCTCCAAT 660 TTATCCCGCC ATAAATGTTG TCTAACATTA AGACGACCAA CGGAATTAAA AATTGTTTCG 720 GAAAACGACA AGAAAGTAGC TATTGAAAAA TGCACCCAAT GGGTTGTCCA AGATTGTCGG 780 CCGTTTTCTG CAGTAACCGG AGCCGGATTT AAAAATTTGG TGAAGTTTTT CCTACAAATC 840 GGCGCTATCT ATGGGGAACA GGTAGACGTC GATGACTTAC TACCTGATCC AACAACATTA 900 AGTCGGAAGG CCAAATCGGA TGCAGAAGAG AAGAGGAGTC TAATCTCGTC CGAGATAAAA 960 AAAGCTGTGG ATAGCGGAAG AGCAAGTGCG ACCGTCGACA TGTGGACTGA CCAGTATGTC 1020 CAAAGAAACT TTTTGGGCAT CACTTTCCAT TACGAAAAAG AATTTAAACT TTGTGACATG 1080 ATTTTGGGAC TAAAATCGAT GAATTTTCAA AAATCGACTG CCGAAAACAT TTTAATGAAA 1140 ATTAAAGGTT TATTTTCGGA ATTCAATGTT GAGAACATTG ATAATGTTAA GTTTGTGACT 1200 GACAGGGGAG CAAATATAAA AAAGGCTTTA GAGGGCAATA CCCGTTTAAA TTGTAGCAGT 1260 CACCTGTTGT CAAATGTTTT AGAAAAATCG TTTAACGAGG CCAATGAACT CAAAAAAATT 1320 GTGAAATCAT GCAAAAAAAT CGTGAAGTAC TGCAAAAAAT CAAATTTGCA GCATACTCTA 1380 GAAACCACTT TGAAAAGCGC CTGTCCGACT AGATGGAACT CCAACTACAA AATGATGAAG 1440 TCCATTCTGG ATAACTGGCG TAGTGTGGAT AAAATATTAG GTGAAGCTGA TATCCATGTA 1500 GATTTTAATA AATCATCTTT AAAAGTTGTG GTAGATATTC TAGGAGACTT TGAACGAATA 1560 TTTAAGAAGT TGCAAACATC TAGCTCACCA TCTATATGCT TCGTATTGCC ATCCATCTCT 1620 AAAATTTTAG AATTATGCGA GCCGAATATT TTAGACCTTT CTGCAGCAGC ATTGCTTAAG 1680 GAAAGAATTT TGGAAAATAT TCGTAAGATT TGGATGGCAA ATCTAAGCAT ATGGCATAAG 1740 GCGGCATTTT TTTTATATCC ACCCGCAGCA CATCTTCAGG AAGAAGATAT TCTTGAAATA 1800 AAGGTGTTTT GCATTTCACA AATTCAAGTC CCAATTTCAT ACACATTAAG CTTAGAATCT 1860 ACAGAAACTC CAAGAACTCC AGAAACTCCA GAAACTCCAG AAAGTCTAGA AAGTCCAAAC 1920 TTATTTCCAA AAAAAAACAA AACAATATCT TCTGAAAACG AATTCTTCTT CCCAAAGTTA 1980 GTAACTGAGT CTAATTCCAA CTTCAATGAA TCTCCATTAG ATGAAATTGA ACGATATATT 2040 AGACAAAGAG TTCCATTGTC TCAAAATTTT GAAGTAATTG AGTGGTGGAA AAATAACGCA 2100 AACTTATACC CTCAGTTGTC AAAGTTAGCA TTAAAACTTT TATCAATACC AGCCAGTAGC 2160 GCAGCAGCTG AAAGAGTGTT TTCCCTAGCA GGTAATATAA TAACAGAAAA GCGAAATAGA 2220 TTATGCCCAA AATCTGTAGA TAGCCTCCTT TTTTTGCATT CCTATTACAA AAACCTAAAC 2280 AACTCGCAAT AGATATTCCT TCTTATAAGT ATATTTTATA TTATTAATTC TTATTATTTG 2340 CTTAATTTTT GTATAAGTGT TAAGTATTAA GTATAAGTAT TAATTAATAA TATATAAGAT 2400 TGTTATTTGT TAAGACATTA GATGCAAAAT CCTAAAAATG TGAAAGTAAT GAAGTTCCTT 2460 ATATTTAATA GATACTTTTT AAGCCCACTA TGTTTTTATT ATTTAGATTG AGACATTAAA 2520 AAACGTAAAA ATCAACAAAT GCCGTCTTTA ATTGCAATTA CTTTATGTGT TTGAAATGGG 2580 AGGCACCCAT TGAGTCCATC AAAGAGCAAA GACATGAGCA CAAAAATTTT CTTGGGTATT 2640 CCCTTTTACC CTTCATTTCT TATACCCGTC ACGCTTCCAC CCATACAAAT TTTAGGCGTA 2700 CAAAAAATGA CCAGAGAACT GCAGCCCGCA TACAAAAAAT GACCTGCGGC CGATCGTTGA 2760 CTGTGCGTCC ACTCACCCAT ACGGCTCTTG CGCAGCAGGC CTCGGGTGGT TTTTTTACTC 2820 GTAACAAAAA CACAACGTCG GTAAAACACT CGAGTATTTT GTGTTGCCGC AAGTAGGGTG 2880 TCAAAAAAAA CGGGGTGCCT AGAGTACCGA GTGTTTATCG GGTGGACGTA GAGTGCGAGT 2940 GGCGGGCTGC AGTTCTCTG 2959 // ID DMTHB1 standard; DNA; INV; 1653 BP. XX AC X01748; XX DR FLYBASE; FBte0000414; Dmel\HB. XX FT source X01748:189..1841 FT SO_feature terminal_inverted_repeat ; SO:0000481:1..31 FT SO_feature terminal_inverted_repeat ; SO:0000481:1622..1653 FT SO_feature CDS ; SO:0000316:387..534 FT /name="Dmel\HB\T" FT /db_xref="FLYBASE:FBgn0044055" FT /db_xref="SPTREMBL:Q27293" FT /db_xref="NCBI_PROTEIN:CAA25884.1" FT /translation="MLILKLRKEGKTYKDIQKTLKCSAKMVSNAIKYKWKPENRGTKHK FT TTDIEDRRIVSYSKVYRFASFRDIKSELNLGISDVTIRRRLLNQNFSARSPRKVPLPSP FT RHIKARLSLAKTYLNWPVSKWRNILWTDGSKIMLFGGTGSLQYI" XX CC Derived from X01748 (g8693) (Rel. 49, Last updated, Version 3). CC Takis Benos and Michael Ashburner, 20-Aug-1997. CC Any changes to original sequence record are annotated in an FT line. XX SQ Sequence 1653 BP; 568 A; 288 C; 302 G; 495 T; 0 other; ATGTACAGCT GTGTTCAGAA AAATAGCAGT GCGAAGGAAA CTAAGTAATA CAAAGGTATT 60 TTTCCATGTC CCTTTTCGGA ATCGACTTTT TATTCCTCTT ATTTTTGTTA AATGGAATGT 120 GTAGATAGGG AAAAAAAGAA AATCCGGTCA GTTTTTCTTG TTATCCTTTT TTTATTTACA 180 TTCTTGAGCA AAATCACAAT TTTTAGGCTG TTCATAAGAA TAGCAGTGTC TGGTTCTGAC 240 CAACGTAAAG TCCCGAAATG ATCAATATTT TCTAAAAAGT GAGTTTGGTT AAGTTAATTC 300 GTATATTTAA AAGGACAATA AATTAAAAAA ATTAAAAAAA TTTTATTTTA GTGGGTAGAG 360 GACAGCACTA CTCCCAGGGG AAAAGAATGT TAATTCTTAA GCTTAGAAAG GAAGGAAAAA 420 CATATAAGGA CATTCAAAAA ACCCTTAAAT GTTCTGCCAA AATGGTATCC AATGCCATTA 480 AATATAAATG GAAGCCCGAA AACCGTGGTA CCAAACATAA AACCACAGAT ATAGAGGATC 540 GACGCATTGT TTCTTACAGC AAAGTCTATC GTTTTGCATC CTTTAGGGAC ATAAAGTCTG 600 AGCTGAACTT GGGAATCAGC GACGTTACTA TTCGTAGACG ACTACTGAAT CAAAATTTCA 660 GTGCGAGGAG TCCACGAAAG GTTCCCCTAC CTAGCCCAAG GCATATTAAG GCAAGGTTAA 720 GCTTAGCTAA AACCTACCTA AACTGGCCAG TCTCCAAATG GCGTAATATC CTTTGGACTG 780 ATGGGTCAAA AATCATGCTA TTTGGTGGAA CTGGTTCACT ACAGTATATC TGACGACCTC 840 CAAACACGGA GTATCACCCA AAACACCCAG TGAAGACTTT CAATCACGGT GGACCTAAAA 900 TCATGGTATG GGCTTGTTTT TTTTATAATG GTATGAGTCA TGCTATGGAT TATGATTTAT 960 GGTATTATAG ACCAAAACGC ATATGTAAAT ATACTTAGTG ATGTCTTATT GTCATATTCT 1020 GAATAAAATA TACCCTTAAA ATGGACATTC CAACAGGATA ATGATCAGAA ACGCAGATGT 1080 AAATCGGCTA AGAATAGGTT CACCCAAAAT AGAATAGATG CAATGCCGTG GCAAGCACCA 1140 CCTTCCCATT TAAACCCGAT TGAAAACCTG TATGGGGACA TTAAACAGTT TGTGTCGAAG 1200 AAGTCCCCGA CGTCTAAGAC TCAGATTTGG CAAGTTGTGC AGGATACATG GGCAAAAATT 1260 CCTCCCAAAC CTTGCTAGGA CTTGGTGGAC TTCATGCCGC GTGGGTGTAA GGCTGTGCTG 1320 GCTAACAAAG GCTATCCAGC CAAGTATTAG GCCCGAATTA ACATATTAAA AAGAAAAACT 1380 AAGTTCGTTC TAGGTCAAGT TAAATTTTGT TACTATTTTT TCATAGCACT GCTATTTTAT 1440 TGAACACCAG AATTTCTGCC TATTTATTGT TTTAATCTAT ATTTTCGAAA CTATTGAAGA 1500 AATAAAAGTG AAACATTTGT TAAATTGTTT GAAATGAAAT ACCTAATGAT ATTATTAAAA 1560 AAAAATTCCC ATTAAAACTG TAAATCATAG GAATTTTTTA TCTTAAACTC TGAAGTCCAA 1620 AGCACTGCTA TTATTCTGAA CACAGCTGTA CAT 1653 // ID DM06920 standard; DNA; INV; 6083 BP. XX AC U06920; XX DR FLYBASE; FBte0000143; Dmel\HeT-A. XX FT source U06920:1015..7097 FT SO_feature five_prime_UTR ; SO:0000204:1..731 FT SO_feature three_prime_UTR ; SO:0000205:3497..6083 FT SO_feature polyA_sequence ; SO:0000610:6077..6083 FT SO_feature CDS ; SO:0000316:732..3497 FT SO_feature start_codon ; SO:0000318:1..3 FT /name="Dmel\HeT-A\gag" FT /db_xref="FLYBASE:FBgn0016662" FT /db_xref="REMTREMBL:AAC17188" FT /db_xref="NCBI_PROTEIN:AAC17188.3" FT /translation="MSMSDNLFSDDEVLSISSSPEQRSSPFYLNISPMSHGSDNSQINT FT VIINSKKLPSNQADISLKNSSGAAIKIVNSLSHKKKENTNVNNAQKDPLSLTNTTASTC FT GAKSSISEGKLSSPPSTSHTYEGKLLTKLTHTHTDFRGAKTSDAMGSFPSLSHSDNSIE FT KNLSSSTKIGPNASSPPSHAHTHTSKSTDISLESRSKHPALANTDARSIKANANDNGEI FT FSSLIQIDERKQEERPCTTINAFWSIFKPKPDVTKLSLKRKPTNPTKNTGKKCISPHKK FT SAYLCPSAQDDLNLNLNPKSSAKPTVVNLPAARILSRPAAKRDLFKSSSSRSPDEQPMS FT FSEVVAGTGSIFAAPCVPAPLTKTPGKRTNDDLDCSNFKTPNKKLCATSNFVTPSIFPP FT LITPVFKSKAAQSVYEESKARNGPPPPALACSINASARSAAAPPGIAPLPPHNTDAELP FT PWKIVPQSRRAPPILVNDVKEIVPLLEKLNYTAGVSSYTTRAIEGNGVRIQAKDMTAYN FT KIKEVLVANGLPLFTNQPKSERGFRVIIRHLHHSTPCSWIVEELLKLGFQARFVRNMTN FT PATGGPMRMFEVEIVMAKDGSHDKILSLKQIGGQRVDIERKNRTREPVQCYRCQGFRHA FT KNSCMRPPRCMKCAGEHLSSCCTKPRTTPATCVNCSGQHISAYKGCPAYKAEKQKLAAN FT NVDINKIRTIKDATNNFYKRQGPPLRNNTPRLPHSSAILSKSIAEARQEAARKSMLNPF FT RQNINDRRPRFSSHDTAIQKRLNKWRRNTNKIPKKGRIALKDNAKPRPAHRTSNPAQRH FT LEDYQDMLRRERSEENDQESEKGTPNTKQVGNDSPPTTSRAARASFKPRIIDDTTPSPK FT ICNPNSQKGLLDDPTTSLANRVDNLEKKIDILMALIIQGRNNNLDMDTSN" XX CC Derived from U06920.2 (Rel. 67, Last updated, Version 14). CC Michael Ashburner, 26-Jan-2002. CC Any changes to original sequence record are annotated in an FT line. XX SQ Sequence 6083 BP; 2199 A; 1545 C; 1033 G; 1306 T; 0 other; TAAATAAATA AAATAAATTA AACAATTAAC TAAATAATTA AATAACTAAA ATTAATAATA 60 TAATCCGTTC GCTTGCCAAA GACTCTCACG CGCATAACTA ATTAAAATCG ATTTTCAAGT 120 TGACAAATAA ATGGTTTAAA ATTGTCCTCA GGCTGCAAAG AAAAGCCGCG GCAACAATAA 180 ACATTTAGTG ACACGCGAAA AGCGAACATT TGATTAGTGT AATACTTGTG CAAACCGACA 240 AGCTGCCGCC ATAACAAAAC GGAGACGAAG AATCATAAAG AACAAAAGCT AAATCCACCA 300 GCATAGCAAA AATAAATTAA CAAATAAAAT AAAAGCAAAT TTAAATAACA TAATAAATTA 360 AACTTATTTA ATAAACCAAT TAATTTTAAT TAATTCAATT AAACGCTAAA TCTACATAAT 420 ACTCCACGCG CAAATTAATT GAAATCGTCT TTCTAGTTAA TAAATTAAAA GTTTAAAAAT 480 TGTCTCCGGC CGCAAAATTT GAACCGCGAC GATAAAAACA TTTAATTGAC AAACAAAAAG 540 CGAACAATTA TTCAGTGAAC TATTTGTGCA AAATTGACAA GCAGACGCCA TAATTAAAAG 600 GAGAAGAAGC CAAAAGACGA AGAGAAGAAA GCAACCAGAA GAACTCAAAG AAGAAAAGGA 660 GGAAAGCCCA ATTAAAGAAA GCCAGGGTAT TTATACCTTA CACTTATCGT TTAATATAAC 720 AAAAACCCAA CATGTCCATG TCCGACAACC TTTTTTCTGA CGATGAGGTA CTTTCAATTT 780 CCTCAAGCCC AGAACAGCGA TCTTCTCCGT TCTACCTCAA TATATCGCCC ATGTCCCACG 840 GATCAGACAA TTCTCAGATT AATACAGTCA TCATTAATTC GAAGAAATTG CCCTCAAATC 900 AAGCAGACAT AAGTTTAAAA AACTCTTCTG GGGCTGCTAT AAAAATTGTT AATTCCCTTT 960 CACACAAGAA GAAAGAGAAC ACAAACGTTA ATAATGCCCA AAAAGACCCC CTCTCACTCA 1020 CCAATACTAC TGCAAGCACT TGTGGCGCCA AAAGCAGCAT CTCAGAGGGG AAATTGTCTT 1080 CTCCTCCGTC CACCTCACAC ACATATGAGG GGAAATTACT CACAAAACTT ACTCACACAC 1140 ACACAGACTT TAGAGGCGCC AAAACGAGCG ATGCAATGGG AAGTTTCCCC TCTCTCTCGC 1200 ACAGCGACAA TAGCATAGAG AAAAATCTGA GTTCTTCCAC CAAAATTGGA CCAAACGCTT 1260 CTTCCCCTCC TTCTCATGCA CACACTCACA CTAGCAAATC CACTGATATA AGCTTAGAAA 1320 GCCGCTCAAA ACATCCCGCG CTTGCCAATA CGGACGCACG CTCTATAAAA GCCAATGCTA 1380 ATGACAATGG GGAAATTTTC TCCTCACTTA TACAAATTGA CGAACGCAAG CAAGAGGAAA 1440 GGCCTTGCAC AACTATCAAC GCTTTTTGGT CTATTTTTAA ACCCAAGCCG GACGTTACTA 1500 AACTAAGTCT AAAGAGGAAA CCCACCAATC CCACTAAAAA CACTGGGAAA AAATGCATCT 1560 CCCCTCATAA AAAGAGCGCT TATTTATGCC CTTCCGCTCA GGATGATTTA AATTTAAATT 1620 TAAACCCCAA ATCTAGCGCC AAGCCCACTG TGGTGAATTT ACCAGCTGCC CGCATCCTAA 1680 GCCGGCCTGC AGCCAAGCGG GATTTATTTA AATCATCATC CTCCCGAAGC CCAGACGAGC 1740 AGCCTATGAG TTTTTCGGAA GTGGTCGCTG GCACGGGTTC AATTTTTGCG GCACCCTGTG 1800 TCCCGGCACC TTTAACGAAA ACTCCAGGCA AGCGGACAAA CGACGATCTG GACTGCTCCA 1860 ACTTTAAGAC GCCCAATAAA AAATTATGCG CGACTTCCAA CTTTGTAACT CCCAGCATTT 1920 TTCCGCCGCT CATCACTCCC GTTTTCAAGA GCAAGGCAGC TCAATCTGTT TACGAGGAAT 1980 CCAAAGCCAG AAATGGACCC CCCCCGCCGG CCCTCGCCTG CAGCATCAAT GCCTCTGCTC 2040 GCAGCGCAGC GGCGCCACCC GGGATCGCCC CCCTACCCCC TCATAATACA GATGCAGAGC 2100 TGCCTCCATG GAAAATCGTG CCCCAGAGCC GTAGAGCACC TCCTATACTC GTCAATGATG 2160 TAAAGGAAAT TGTACCTCTA CTGGAAAAGC TGAACTACAC AGCAGGAGTC TCCAGCTATA 2220 CTACTAGGGC TATAGAAGGA AACGGGGTCA GGATACAGGC AAAGGACATG ACCGCCTATA 2280 ACAAAATTAA AGAAGTCCTG GTGGCCAACG GACTTCCTTT ATTCACCAAC CAGCCCAAGT 2340 CCGAGAGAGG CTTCCGAGTC ATCATCAGAC ATCTCCACCA CTCCACACCA TGCTCGTGGA 2400 TAGTCGAGGA ACTGCTGAAG CTCGGATTCC AAGCGCGATT CGTCAGAAAT ATGACGAATC 2460 CGGCTACAGG TGGCCCCATG CGAATGTTTG AAGTGGAGAT CGTCATGGCC AAAGACGGCA 2520 GTCATGACAA AATACTCTCA CTCAAACAAA TCGGTGGGCA AAGGGTGGAC ATTGAAAGGA 2580 AAAACAGGAC ACGGGAGCCA GTCCAGTGCT ACAGATGCCA AGGCTTCAGG CATGCCAAAA 2640 ACTCTTGCAT GAGGCCGCCA AGATGCATGA AATGCGCTGG CGAACACCTG TCTTCCTGTT 2700 GCACCAAACC AAGAACCACC CCCGCCACCT GCGTAAATTG CTCTGGGCAG CATATTAGCG 2760 CGTACAAAGG ATGCCCTGCA TATAAGGCGG AAAAACAAAA GCTGGCGGCA AACAACGTTG 2820 ACATAAACAA AATAAGAACA ATCAAAGACG CAACAAATAA CTTTTATAAA CGTCAAGGCC 2880 CCCCTCTACG CAACAACACC CCTCGGCTAC CGCACAGCTC AGCAATCCTG AGCAAATCAA 2940 TTGCCGAAGC TCGCCAGGAG GCAGCCAGAA AGTCGATGTT AAATCCATTC CGACAAAATA 3000 TAAACGACAG AAGACCACGA TTCTCCTCCC ACGACACGGC CATTCAGAAG CGTCTGAATA 3060 AATGGCGCCG AAACACCAAC AAAATACCCA AAAAGGGTAG GATAGCCTTA AAGGATAATG 3120 CAAAGCCACG ACCGGCACAT AGGACAAGTA ACCCAGCGCA AAGACATCTG GAGGACTACC 3180 AGGACATGCT CCGAAGGGAA AGGAGTGAAG AAAACGACCA GGAATCTGAG AAGGGCACCC 3240 CCAATACCAA GCAGGTCGGC AATGACAGCC CTCCGACCAC GAGCAGAGCA GCCAGAGCCA 3300 GCTTTAAGCC AAGAATCATT GACGATACCA CGCCATCGCC AAAAATCTGC AATCCCAACT 3360 CACAAAAAGG CCTCTTGGAC GACCCCACAA CAAGCTTAGC TAATAGAGTC GACAATTTAG 3420 AAAAGAAAAT TGACATTTTA ATGGCCTTAA TCATACAAGG AAGAAATAAC AATCTTGACA 3480 TGGATACATC CAATTAATCT TACAACTACT TATATATTCT TTAATAAATA TATCCAATAG 3540 AAAAGCGCAC GTCGGTCTGC TTTTAAAATC CTTCACCGTC ATCACCTTCC TCGACGGAGC 3600 CTAATTTATT GGAAAAATAA ATCAATTATA TGTTGGCACA AAAATGTAAA CACACACTCA 3660 CCTAAACGCA CCCGGACGAA CAAGCCTATG ACAACGCACT CCAGCTGATC TGTAAGAAAC 3720 AAAAAATATG AATAGATAGA TCGATATGAA AAGGATATGT GCGGCAGAAA CATGATGAGC 3780 AAAAGGCGAC TCGCTGCAGC AACTTATGCA CAACGTCACT TACCTGAAAT TTCTTGCCGT 3840 ACGATCTCCT GTAGTATCCC TTATCACAGC TGCAATCTAC TTGCAATGCT GCACTGCAAT 3900 AAACGTACTA CAAAAGCTGC ATACGTTTTG ATCAGGACAC CTCGTGCGGA CGTGCTAAAA 3960 AAAATTTCCT TTCTGCTGCT CTTATTGACG CTAAAACCTT AAAACCTACA AACAAAACAA 4020 TTAAATAATA ACAAATCAAA TAAGACAACC AAATAATACA CTTACCTCAT TGACTGCAGC 4080 TAAATCGCTG ACCCACATTC AGTGCAGCCG ACAGCAGGAG ACGGGCCCGC AAAAGCAAAA 4140 CAAAATCGCC AATTTTGCGA TTATAAACAC GAAAAATTGA CAATTTTGCG ATGCCGTCTC 4200 CGCCTCCTGA TGCCACTGCA TTGACAAGCA TCACTAGCGA GGAGCTGACA CCACACCAAA 4260 AAGCTGTAAA ATCCGTCCAC AAATTGTATA TTTTGCCTCA GTGTCGTATC TGCAATGTTT 4320 TTCCGATAAC CTGTAAGGAA AGAAAAATTA ATAAGAAAAT TATACAAAAT TAATTAAGGA 4380 CGACAGAAAA TAGCAAACCA GACAGGCAAA TTAACAGATA CAAATATGAG ACTCCATCCT 4440 GCTGCCGACA CACAAGTAAA TCCTTCAACT CGACAACAGG AGACGGGCCT TGCAAAAGCA 4500 AAACAAAATC GCCAACTTTT GCGATTATAA ATACAAAAAA TTGACAATTT TGCAACGCCG 4560 TCTCCACCTC CTGTTGCCAC TGCATTAATA AGGATCACCA GCGCGGCGTG ACGCCACACT 4620 AAAAGGCTGC AAAATCCGTC CACAAAATGT ATACTTTTCC TCAGTACAAT ACTTTCTAAT 4680 GAACTTCCGC CAACCTGCAA TGAAAAGAAA AGAAATAGGT ATATAAAACA AAACAAACAA 4740 AAGGACAACC TAAAATTAGC AAACCAGACA GGCATACTAG TAGATGCTAA TATGCAGCTC 4800 CATCCTACTG ACGACAACCA CGCAACTCCT TTCTCCAAGA CCGCAAATAC TGAAACAAGG 4860 AAGCACAAGC TAATACTGGG AATTATTTAT TTAAACAAAA ATACTTATCT AATTGCCAAT 4920 TCGACGACTC CAAATCCGCG GCTAACCGGC GGCGATGGCC CATAAATAAA GGGCCTCCTA 4980 ATTAATTACA AAATGTACCT GAAAAACATA AAATTAACGC AACTATAATT AACGCAATTA 5040 ATAAATCAAA TAAATACAAG TATAATACTT ACCTCCAAGC AAACGTACCT GAAAAACAAA 5100 ACCAAAAAAA AAATTAATGC AATAAATAAA TCAAATAAAT ACAAACATAA TACTTACCTC 5160 CAATTTACCT CCCAGCCAAT CTACCTGAAA AACATAATCT AATACAATCT CAAAAACAAA 5220 TAACAAATGT AATACTTACC AAATTTTAAT TTTGTATTCA TTTCCATGAC CCCAACGCTG 5280 CAACTGTCCT CGGCAACAAT TCCTGTTCCG GCGGCTCCAT GCTGCCAATC CTGACGCACT 5340 GGCCACAAGA CGCGGCGCTG CTGGCAATCT CTCGATGAAC AACCGATCTA CAATTTCCAT 5400 GACGACTCCT CTGTCACGAT GAGACAGAAG ACACCACCAA CGCCAGCAGC TCCAAAACAA 5460 TACAACAACG GCCGCGCGGA ACCCATCTTC AGAATTCCCT CTTCCTGACG ACCGGCGAAC 5520 GAGTTCTGGA ATAAACAATG TATTAATTGC AAACATCTAC CGATGAGGGT AGAAGAGATA 5580 CTCACCAAAC GACTGCGGCG CGGGAACAAA CTAACTGCAA CGCCGGCCGG ACCTATTTGT 5640 TGCAAGTGGC GCGCATCCAG CGCCTGCAAC ATGCCCCAGC CCAAGTACAC AACTACTTAC 5700 CTGCAACGTC GCCAGAGGCT CCCAGCGAAT CGGTGCTTCC GTCCTTCTGG CGGGGGTACC 5760 TGAAAAGAAA CAAATTAAAC AATATTAATC CTAAATTTCA ATGTTTTTTG TAAAATAATT 5820 TAAATTGTTA AATGTAAACA AGCCTTGCAA TATGTTAATG TTACCAGTCC ATGCTACTGT 5880 CTAAAAGCCA AGAATACAAA AAATACTAAT TATAAACTAA CTCACCACGC CCAACCCCCA 5940 AACTCACCCC ATGCAATGTT AAACCTATAA ATTCAAATAA TTGTACCTAT ATATTGCACA 6000 TACTGTAATC AAAGGCAAAA TAAATCGTGG ATGCGGAACA GAATTTACTC TGTCTCCGTA 6060 CCTCCACCAG CAAAGTTAAA AAA 6083 // ID DMIFACA standard; DNA; INV; 5371 BP. XX AC M14954; XX DR FLYBASE; FBte0000133; Dmel\I-element. XX FT source M14954:100..5470 FT SO_feature CDS ; SO:0000316:187..1467 FT SO_feature start_codon ; SO:0000318:1..3 FT /name="Dmel\I-element\gag" FT /db_xref="FLYBASE:FBgn0020417" FT /db_xref="SPTREMBL:Q24362" FT /db_xref="NCBI_PROTEIN:AAA70221.1" FT /translation="MTDPPNIYKITSKTYQSQLGEPKFIIIKRNDNNSFERTSPFIIKK FT SVDFACGGEVEGCKRTRDGNLLIKTKNELQARKLLKLTKIADEDVTASEHKTLNFSKGV FT IYCNDLRHIDEDTILQELKPQKVSEVKKIMKRQNPNSNSDTNNITLVETGLIIITFESH FT KLPEIVRIGYETVRVRDYIPLPLRCKKCLRFGHPTPICKSVETCINCSETKHTNDGEKC FT TNEKNCLNCRNNPELDHQHSPIDRKCPTFIKNQELTAIKTTQKVDHKTAQHIYFERHGF FT QTKNTYAKTLTNGTTQRTTNTPSPNIHTNTTQSQQQNPHHTPKSAAQNTSAKTPTTEPA FT KTTLLSNQPHQHHHHHSYDKLEDMDTDYTPTRKPSTTYSSQLTEDLKIKIFPKDKSNNL FT SINLKASKLKAKAHKNKHTNNSDSESI" FT SO_feature CDS ; SO:0000316:1938..5195 FT SO_feature start_codon ; SO:0000318:1..3 FT /name="Dmel\I-element\RTase" FT /db_xref="FLYBASE:FBgn0020418" FT /db_xref="SPTREMBL:Q24363" FT /db_xref="NCBI_PROTEIN:AAA70222.1" FT /translation="MAPSWGSPTTNKRGKITHRFIDNMHLILLNDKSPTHFSTHNTYTH FT IDLTLCSPILAPHAKWKILNDLHGSDHFPIITTLFPTTNPQKFYRPFFKLKEANWEQFN FT ALTHQTNKKYPTSHNVNKEAALINRIILYSANLSIPQTSPNTHPYRVPWWNKHLDQLRK FT EKQLAWKKLNRTITVDNILDYRRKNAIFRYELKKRKKEASSSFTSTIHPTTPSSKIWAN FT IRRFCGLNPAKQIHAITNPVNNETTLASNEIANIFAQHFSDLSGDWNFSEEFRNNKYRN FT NIHLYTPSPIAQTIEENITYLELSSALQTLKGCAPGLNRISYQMIKNSSHTTKNRITKL FT FNEIFNSHIPQAYKTSLIIPILKPNTDKTKTSSYRPISLNCCIAKILDKIIAKRLWWLV FT TYNNLINDKQFGFKKGKSTSDCLLYVDYLITKSKMHTSLVTLDFSRAFDRVGVHSIIQQ FT LQEWKTGPKIIKYIKNFMSNRKITVRVGPHTSSPLPLFNGIPQGSPISVILFLIAFNKL FT SNIISLHKEIKFNAYADDFFLIINFNKNTNTNFNLDNLFDDIENWCSYSGASLSLSKCQ FT HLHICRKRHCTCKISCNNFQIPSVTSLKILGITLNNKYKWNTHINLLLPKLHNKLNIIK FT CLSSLKFNCNTHTLLNVAKATIIAKLEYGLFLYGHAPKSILNKIKTPFNSAIRLALGAY FT RSTPINNLLYESNTPPLEMKRDLQIAKLSQNLILSKNTPIHKFLKPKKANKKKTSTIDR FT TIKLSLELNLPYKPIKLHKNKPPWTLPNLIDTSLRIHKKEQTSPDQYRKLYEHTKNNLK FT THNFIFTDGSKINYTISFAITTETDVLKYGILPPYSSVLTSETIAILEAIELTKNRRGK FT FIICSDSLSAVDSIQNTNNNSFYPSRIRSLITQHAPKIKIMWIPGHSGIKGNELADQAA FT KSASSMPLILTPNINTTDIKKHLKADLATKQKEHIINCSPWYQSINTNTSHPCDYLKQS FT HPNWTRLDQIKIIRLRLGHTNITHQHYLNPNSIPTCPFCQGDISLNHIFNSCPSLLQTK FT QDIFNNTNPLDLLSKPNPDNIQKLILFLKKTKLYHKI" XX CC Derived from M14954 (g157749) (Rel. 44, Last updated, Version 2). CC Takis Benos and Michael Ashburner, 20-Aug-1997. CC Any changes to original sequence record are annotated in an FT line. XX SQ Sequence 5371 BP; 2176 A; 1446 C; 606 G; 1143 T; 0 other; CATTACCACT TCAACCTCCG AAGAGATAAG TCGTGCCTCT CAGTCTAAAG CCTCGCTTCG 60 CGTAAGCCCA AAACTCTTAT CAGCAAAATC TTGATAAACA AATATCAACC ACAAAGAGAA 120 AATAAAAAAC TTAACAACAA AAACAACAAT ACCGCTAATC CGGGCTCAAG CCCTTAACCA 180 ACAATCATGA CAGACCCACC AAACATTTAC AAAATCACTT CAAAAACATA CCAATCCCAA 240 TTAGGCGAAC CTAAATTTAT AATTATTAAA AGAAATGACA ACAACTCTTT CGAAAGAACT 300 TCACCATTCA TCATAAAAAA ATCGGTGGAC TTTGCCTGTG GAGGAGAAGT TGAGGGATGC 360 AAACGTACAA GAGACGGCAA CCTGCTAATA AAAACCAAAA ATGAATTACA AGCCAGAAAA 420 CTCCTAAAAC TAACAAAAAT TGCAGATGAG GATGTAACAG CAAGTGAACA TAAAACATTA 480 AACTTCTCTA AGGGAGTTAT TTACTGTAAC GACCTTAGAC ACATCGACGA AGACACAATT 540 CTACAAGAAC TAAAACCACA AAAAGTATCT GAAGTTAAAA AAATAATGAA ACGGCAAAAC 600 CCCAACTCTA ACTCCGACAC CAACAACATC ACATTAGTTG AAACTGGACT CATAATTATA 660 ACCTTTGAAT CGCATAAGCT CCCCGAGATA GTACGAATCG GGTACGAAAC AGTCCGAGTA 720 CGAGACTATA TCCCACTCCC ACTTCGATGC AAAAAATGCC TCCGCTTCGG TCATCCAACA 780 CCCATATGCA AAAGTGTAGA AACTTGCATC AATTGCTCTG AAACAAAACA CACAAACGAC 840 GGAGAAAAAT GCACAAACGA AAAAAACTGC TTAAATTGCC GAAATAACCC AGAACTTGAC 900 CATCAACACA GCCCAATTGA CCGCAAATGC CCTACGTTCA TAAAAAACCA GGAATTAACA 960 GCAATTAAAA CCACACAAAA AGTTGACCAT AAAACGGCCC AACACATATA TTTCGAACGT 1020 CACGGCTTCC AAACGAAAAA CACCTACGCC AAAACACTTA CAAACGGCAC AACCCAGAGG 1080 ACAACAAACA CTCCATCACC TAATATTCAC ACAAACACAA CCCAATCACA ACAACAAAAT 1140 CCGCACCACA CACCCAAATC AGCAGCACAA AACACTTCAG CTAAGACACC AACAACTGAA 1200 CCAGCCAAAA CAACCTTACT ATCCAACCAA CCACACCAAC ACCACCACCA CCACAGCTAC 1260 GACAAACTAG AAGACATGGA TACCGACTAC ACACCTACCA GAAAACCATC TACGACATAC 1320 TCATCACAAC TCACAGAAGA CCTAAAAATA AAAATCTTCC CTAAAGATAA GTCCAATAAC 1380 CTATCCATAA ACCTTAAAGC ATCAAAACTA AAGGCCAAAG CCCACAAAAA CAAGCACACT 1440 AACAACAGCG ACAGCGAATC CATATAGAAC TCTACACAAA ACCCTAACCG TTAACACTAC 1500 CTTTAAGTAA GTTATAAGCT TTAATTTTCT CACAAATGTC CCTAACTATA ATCCAATGGA 1560 ATCTAAAAGG ATATCTAAAC AACTACAGCC ATCTCCTTAT TCTAATCAAA AAATACTCCC 1620 CCCACATAAT TTCCCTCCAA GAAACCCATA TACAATACAC TAATAACATT CCAACCCCAA 1680 TAAACTACAA ACTATTAACA AATATTGCCA CCAACAGATT TGGGGGGCGT ACGACTACTA 1740 GTGCATAAGT CAATACAACA CACTGTCCTC AACATAACAA TCGATATAGA AGCAATAGCC 1800 ATAAATATAG AATCTAAACT TAAATTAAAC ATATTTTCCA CATACATTTC TCCGACCAAA 1860 AACATAACTA ACCAGACACT CCATAACACA TTTAACATAC AACAAACACC CTCTCTAATT 1920 ACGGGAGATT TTAATGGATG GCACCATCCT GGGGCTCCCC AACAACAAAT AAACGAGGAA 1980 AAATAACTCA TAGATTCATT GACAACATGC ACCTTATCCT GTTAAACGAC AAATCTCCCA 2040 CACACTTTTC AACACACAAT ACATACACAC ACATAGACCT CACACTCTGC TCTCCAATCC 2100 TAGCCCCCCA CGCCAAGTGG AAAATACTAA ACGATCTTCA CGGTAGCGAC CATTTCCCTA 2160 TTATCACAAC ACTATTCCCA ACAACCAATC CACAAAAATT CTACAGACCC TTTTTTAAAC 2220 TCAAAGAAGC CAACTGGGAA CAGTTCAACG CTCTTACCCA CCAAACCAAC AAGAAATACC 2280 CCACCTCCCA CAACGTAAAC AAAGAAGCCG CTCTAATCAA TAGAATCATC CTTTATAGCG 2340 CAAACCTCTC CATCCCACAA ACCTCACCTA ACACACATCC ATACAGGGTT CCATGGTGGA 2400 ATAAACACCT CGACCAATTA CGTAAAGAAA AACAACTTGC CTGGAAAAAA TTAAACCGCA 2460 CAATTACTGT TGACAACATT CTAGACTATA GACGCAAAAA CGCAATATTT AGATACGAAC 2520 TAAAAAAGAG GAAAAAAGAA GCTTCCAGCT CTTTCACCTC AACCATCCAT CCCACTACTC 2580 CCTCATCCAA AATATGGGCC AATATAAGAC GCTTCTGCGG ACTTAACCCA GCAAAACAAA 2640 TTCATGCCAT CACAAACCCA GTAAATAACG AGACTACATT GGCTAGCAAC GAAATTGCTA 2700 ACATATTCGC ACAACATTTC TCTGACCTCT CCGGCGACTG GAACTTCTCA GAGGAGTTCC 2760 GGAACAATAA ATATAGAAAT AACATACATC TCTACACCCC CTCTCCAATA GCCCAAACCA 2820 TAGAAGAGAA CATAACGTAT CTAGAACTTA GCTCAGCACT ACAAACATTA AAAGGATGTG 2880 CTCCAGGACT AAATAGAATC TCGTATCAAA TGATCAAAAA TAGCTCCCAC ACAACAAAAA 2940 ACCGAATAAC GAAACTATTT AATGAAATAT TCAATAGCCA CATACCTCAA GCCTACAAAA 3000 CAAGCCTAAT CATCCCAATC CTTAAGCCAA ACACCGACAA AACGAAAACT TCCTCATACC 3060 GACCCATCTC CCTCAACTGC TGTATAGCAA AGATACTTGA TAAAATAATT GCGAAAAGAC 3120 TCTGGTGGCT AGTGACATAT AACAACCTAA TTAACGACAA ACAATTCGGG TTCAAAAAAG 3180 GCAAATCGAC TTCGGACTGT CTACTCTATG TAGACTATCT CATAACGAAG TCAAAAATGC 3240 ACACCTCCCT CGTCACTCTT GATTTTTCAA GAGCCTTCGA TCGAGTAGGT GTGCACTCCA 3300 TAATCCAGCA ATTGCAGGAA TGGAAAACGG GTCCCAAAAT AATAAAATAC ATTAAAAACT 3360 TCATGAGCAA CAGAAAAATA ACTGTCCGCG TCGGTCCGCA TACATCAAGC CCGTTACCCC 3420 TATTCAACGG AATCCCCCAA GGTTCACCCA TATCCGTAAT ACTTTTCCTC ATAGCATTCA 3480 ACAAATTATC CAACATCATA TCCCTACATA AAGAAATTAA ATTCAACGCA TATGCCGACG 3540 ACTTCTTCCT TATAATAAAT TTCAACAAAA ACACAAATAC AAATTTCAAC TTAGACAATC 3600 TATTCGACGA TATAGAAAAT TGGTGCTCCT ACTCAGGGGC ATCGCTTTCC CTATCCAAAT 3660 GTCAACACCT CCACATATGC AGAAAACGTC ACTGCACATG CAAGATAAGC TGCAACAACT 3720 TCCAAATTCC TAGCGTTACG TCCTTAAAAA TTCTAGGAAT AACCTTAAAC AACAAATACA 3780 AATGGAACAC ACACATAAAC CTACTTCTAC CCAAACTACA CAACAAGCTA AATATAATAA 3840 AATGCCTATC TAGTCTTAAA TTTAACTGCA ACACGCATAC ACTACTTAAT GTCGCAAAAG 3900 CAACAATTAT AGCCAAACTA GAGTATGGTT TGTTTCTGTA CGGCCATGCT CCCAAAAGCA 3960 TTTTAAACAA AATAAAAACA CCGTTTAACT CCGCTATCCG TCTAGCTCTC GGCGCATATC 4020 GCTCTACCCC AATAAATAAC TTACTTTACG AATCGAATAC TCCCCCCTTA GAAATGAAAC 4080 GAGACCTTCA AATAGCCAAA CTATCCCAAA ACCTAATCCT CTCCAAAAAC ACACCAATAC 4140 ATAAGTTCTT AAAGCCTAAA AAAGCTAATA AGAAAAAAAC ATCAACAATA GACCGAACAA 4200 TCAAACTTAG CCTAGAACTT AATCTACCCT ACAAACCAAT AAAACTCCAT AAAAACAAAC 4260 CACCATGGAC CCTCCCCAAT CTAATAGACA CGTCACTTAG AATCCATAAG AAAGAACAAA 4320 CATCTCCAGA CCAATACAGA AAATTATACG AACACACAAA GAATAACCTC AAAACACACA 4380 ATTTCATATT CACTGACGGT TCAAAAATTA ATTACACAAT ATCATTCGCC ATTACAACGG 4440 AGACAGACGT CTTGAAATAC GGCATACTGC CCCCATATTC ATCCGTCCTC ACCTCCGAAA 4500 CAATCGCCAT CCTAGAAGCA ATAGAACTTA CTAAAAACCG AAGAGGCAAA TTTATTATCT 4560 GCTCCGACTC CCTATCAGCA GTAGATTCAA TTCAAAACAC AAATAATAAC AGCTTTTACC 4620 CAAGCAGAAT ACGATCGCTA ATAACGCAAC ACGCACCTAA AATTAAAATA ATGTGGATTC 4680 CTGGCCATTC AGGAATAAAA GGAAATGAAT TAGCCGATCA AGCTGCAAAA TCAGCAAGCA 4740 GTATGCCACT TATCCTCACC CCAAACATAA ATACCACAGA TATAAAAAAA CACCTTAAAG 4800 CCGACCTTGC GACAAAACAG AAAGAACACA TAATAAACTG CAGTCCATGG TACCAATCTA 4860 TTAACACGAA CACCTCACAC CCATGCGATT ACCTTAAACA ATCCCACCCA AATTGGACCA 4920 GACTCGACCA AATAAAAATA ATACGACTTC GACTAGGACA CACAAACATA ACCCACCAAC 4980 ACTACCTAAA TCCCAATTCA ATACCAACTT GCCCGTTTTG CCAAGGTGAT ATTTCTTTAA 5040 ACCACATATT TAACTCATGC CCATCCCTCC TACAAACCAA GCAAGATATA TTTAACAACA 5100 CCAACCCTCT AGACCTTCTT AGCAAACCCA ATCCAGATAA CATACAAAAA CTCATACTTT 5160 TCCTCAAAAA AACTAAATTA TACCACAAAA TCTAAAAACA AAACAGGCAT TTGTACATAA 5220 CAAGCCAGCA ATTAGTTACC AAATTAGATA TTAACTAAAT TAAGATATAA TAACATTGTA 5280 AATAAATATA GCTGTAAGCC CCGTAGCTAA TGCTATACTA TCTAAGTTAG TCTAGTTTTG 5340 TAAACTATTC TATCTATCAT AATAATAATA A 5371 // ID DMLINEJA standard; DNA; INV; 5020 BP. XX AC M22874; XX DR FLYBASE; FBte0000088; Dmel\jockey. XX SY synonym: wallaby SY synonym: sancho XX FT source M22874:115..5134 FT SO_feature CDS ; SO:0000316:300..2051 FT SO_feature start_codon ; SO:0000318:1..3 FT /name="Dmel\jockey\gag" FT /db_xref="FLYBASE:FBgn0020297" FT /db_xref="SWISS-PROT:P21330" FT /db_xref="NCBI_PROTEIN:AAA28674.1" FT /translation="ISIALYGISIKTIDIMENSFAQSRPSNGCDKFEKMRKVAGVEPGE FT LRSQLRASCAVVSPNLEGMPTQSAVSSLMVTISSNTNASVTCTISNVQANMICTPTYTD FT CTTVTTSICPTTPYDNGLPTPLSSLPNKPSKANCPFQAHDRTVNRKRKGVSQPPLPILT FT PSPSRKTKRQATMPLNEEASTSTAAALNNNRFALLSAEAENMEQDVSDADSDIEDSAAR FT DGGGQSAKYSKPPAICVPSVSDPVTLERALNLSTGSSNYYIRISRFGVSRIYTANPDAF FT RTAVKELNKLNCQFWHHQLKEEKPYRVVLKGIHANVPSSQIEQAFSDHGYEVLNIYCPR FT KSDWKNIQVNEDDNEATKNFKTRQNLFYINLKQGPNVKESLKITRLGRYRVTVERATRR FT KELLQCQRCQIFGHSKNYCAQDPICGKCSGPHMTGFALCISDVCLCINCGGDHVSTDKS FT CPVRAEKAKKLKPRSRLPMTNNIATLKPPQRSSSGYIPAEALRTNISYADIARRNTTQS FT RARATVQAEVIPTSDNSLNNKFMTLDNSIRAINTRMDELFKLIHETVEANKAFRELVQV FT LITRIPK" FT SO_feature CDS ; SO:0000316:2048..4798 FT SO_feature start_codon ; SO:0000318:1..3 FT /name="Dmel\jockey\pol" FT /db_xref="FLYBASE:FBgn0015952" FT /db_xref="SWISS-PROT:P21328" FT /db_xref="NCBI_PROTEIN:AAA28675.1" FT /translation="MTQPTLKIGLWNARGLTRGSEELRIFLSDHDIDVMLTTETHMRVG FT QRIYLPGYLMYHAHHPSGNSRGGSAVIIKSRLCHSPLTPISTNDRQIARVHLQTSVGTV FT TVAAVYLPPAERWIVDDFKSMFAALGNKFIAGGDYNAKHAWWGNPRSCPRGKMLQEVIA FT HGQYQVLATGEPTFYSYNPLLTPSALDFFITCGYGMGRLDVQTLQELSSDHLPILAVLH FT ATPLKKPQRVRLLAHNADINIFKTHLEQLSEVNMQILEAVDIDNATSLFMSKLSEAAQL FT AAPRNRHEVEAFRPLQLPSSILALLRLKRRVRKEYARTGDPRMQQIHSRLANCLHKALA FT RRKQAQIDTFLDNLGADASTNYSLWRITKRFKAQPTPKSAIKNPSGGWCRTSLEKTEVF FT ANNLEQRFTPYNYAPESLCRQVEEYLESPFQMSLPLSAVTLEEVKNLIAKLPLKKAPGE FT DLLDNRTIRLLPDQALQFLALIFNSVLDVGYFPKAWKSASIIMIHKTGKTPTDVDSYRP FT TSLLPSLGKIMERLILNRLLTCKDVTKAIPKFQFGFRLQHGTPEQLHRVVNFALEAMEN FT KEYAVGAFLDIQQAFDRVWHPGLLYKAKRLFPPQLYLVVKSFLEERTFHVSVDGYKSSI FT KPIAAGVPQGSVLGPTLYSVFASDMPTHTPVTEVDEEDVLIATYADDTAVLTKSKSILA FT ATSGLQEYLDAFQQWAENWNVRINAEKCANVTFANRTGSCPGVSLNGRLIRHHQAYKYL FT GITLDRKLTFSRHITNIQQAFRTKVARMSWLIAPRNKLSLGCKVNIYKSILAPCLFYGL FT QVYGIAAKSHLNKIRILQAKTLRRISGAPWYMRTRDIERDLKVPKLGDKLQNIAQKYME FT RLNVHPNSLARKLGTAAVVNADPRTRVKRRLKRHHPHDLPNLVLT" XX CC Derived from M22874 (g157823) (Rel. 47, Last updated, Version 5). CC Takis Benos and Michael Ashburner, 20-Aug-1997. CC Any changes to original sequence record are annotated in an FT line. XX SQ Sequence 5020 BP; 1527 A; 1198 C; 1055 G; 1240 T; 0 other; AAAAATCATT CACATGGGAG ATGAGCAATC GAGTGGACGT GTTCACAGAA GTCGCGAGAT 60 AAAACAAAAA CGTAATTGTG ATCCATCACA AACATCTGCG CAGATCGTGT GCTTATCTCA 120 CAAACAAAAT CTATTTTTAG TCACTGCATA ACGGTGACGG CTTCGGTTCG CGAAACTTAT 180 CAGCAACTAG CAATTTCTAA GCTGTGTTGT TTTTGCCCCT CGCCCTGCGC GCTGCGCAAG 240 CGGGAGGTTG TTACAATTTA CCTTACAAGT AAACCGGTAA ATCTTATCGT GTTTAGTAAA 300 TATCAATTGC ATTATACGGC ATAAGTATAA AGACAATTGA TATAATGGAG AATTCATTTG 360 CTCAATCGCG ACCTAGCAAT GGGTGCGATA AATTTGAGAA AATGAGGAAA GTAGCAGGTG 420 TTGAGCCAGG AGAATTACGC TCCCAACTCC GCGCCAGCTG TGCAGTTGTT TCCCCTAACC 480 TGGAAGGTAT GCCAACTCAA TCTGCGGTCT CCAGCTTAAT GGTGACAATC AGCAGCAACA 540 CCAATGCAAG TGTTACCTGC ACTATTTCTA ACGTACAGGC CAACATGATC TGTACTCCTA 600 CATACACTGA TTGCACAACC GTGACCACTA GCATTTGCCC AACTACGCCT TATGACAATG 660 GACTGCCGAC ACCTCTGTCA TCACTGCCCA ATAAGCCATC TAAAGCGAAT TGCCCCTTTC 720 AAGCACATGA TCGTACTGTC AACAGGAAAC GAAAAGGCGT GTCTCAGCCC CCATTACCTA 780 TCCTCACCCC TTCTCCAAGC CGTAAAACTA AAAGGCAGGC CACTATGCCA CTCAATGAGG 840 AGGCCTCTAC CTCCACTGCA GCAGCATTAA ATAACAATCG CTTCGCGCTT TTGTCCGCTG 900 AAGCGGAGAA TATGGAGCAA GACGTGTCGG ATGCTGATTC TGACATTGAA GACTCTGCTG 960 CCCGAGATGG TGGTGGACAA TCCGCTAAAT ATAGCAAACC CCCAGCCATA TGCGTACCAA 1020 GTGTAAGCGA TCCGGTCACC TTGGAACGGG CTCTCAATCT GAGCACCGGC TCCTCAAACT 1080 ACTACATCCG CATTTCTAGA TTTGGTGTAT CCAGAATCTA TACAGCCAAC CCTGATGCTT 1140 TCCGCACCGC TGTAAAAGAA CTAAATAAGT TAAATTGTCA ATTCTGGCAT CACCAACTTA 1200 AAGAAGAAAA ACCCTACAGA GTAGTGCTTA AAGGAATCCA TGCTAATGTT CCTAGTTCGC 1260 AGATAGAACA AGCATTTAGT GATCACGGCT ATGAGGTCCT TAATATCTAT TGCCCCAGAA 1320 AGTCTGACTG GAAGAACATT CAGGTAAACG AAGATGATAA TGAAGCTACA AAAAACTTCA 1380 AAACTAGACA AAATTTGTTT TATATTAATC TTAAACAAGG CCCGAATGTT AAAGAGTCTC 1440 TTAAGATAAC TCGACTTGGC AGATACAGAG TCACTGTTGA GCGCGCTACA CGTAGAAAAG 1500 AACTGCTACA ATGTCAAAGA TGCCAAATTT TTGGACACTC TAAGAACTAT TGCGCCCAGG 1560 ATCCTATTTG TGGTAAATGT AGTGGTCCCC ATATGACCGG GTTCGCTTTG TGCATAAGTG 1620 ACGTATGTCT GTGTATAAAT TGTGGTGGTG ATCATGTCTC GACAGACAAA AGCTGCCCTG 1680 TCAGAGCAGA GAAAGCCAAG AAGCTAAAAC CAAGGTCCAG GCTACCGATG ACTAATAATA 1740 TTGCCACACT CAAACCTCCA CAACGTTCTT CAAGCGGTTA CATACCAGCT GAGGCATTAA 1800 GAACCAACAT CTCTTATGCT GATATTGCTC GACGCAACAC GACTCAATCT AGGGCTCGTG 1860 CTACTGTGCA GGCTGAAGTT ATACCAACGT CGGACAATAG CCTTAACAAT AAATTTATGA 1920 CGTTAGACAA CTCCATTCGG GCCATCAATA CGAGAATGGA CGAACTATTT AAGCTTATAC 1980 ACGAAACTGT AGAGGCTAAT AAAGCTTTCA GAGAACTGGT TCAGGTTCTA ATTACACGTA 2040 TTCCTAAATG ACTCAACCAA CCTTAAAAAT CGGATTGTGG AACGCTCGCG GATTAACAAG 2100 GGGCTCTGAG GAGCTTCGGA TATTCCTCAG CGATCACGAT ATAGACGTAA TGCTTACCAC 2160 GGAAACACAC ATGCGAGTTG GTCAGCGCAT CTATCTCCCA GGGTATCTTA TGTATCACGC 2220 CCACCACCCC AGTGGTAACA GTAGAGGTGG CTCTGCAGTC ATCATAAAAT CTAGACTTTG 2280 TCACAGCCCT CTGACACCTA TCTCTACTAA TGACAGGCAG ATAGCGAGAG TGCACCTGCA 2340 AACATCGGTT GGGACCGTCA CTGTAGCTGC TGTTTATCTA CCTCCAGCAG AAAGATGGAT 2400 AGTAGATGAC TTCAAATCCA TGTTTGCTGC GTTAGGCAAC AAATTTATTG CTGGTGGTGA 2460 TTACAATGCC AAACATGCAT GGTGGGGGAA CCCAAGATCC TGTCCTAGAG GTAAAATGTT 2520 GCAAGAAGTC ATTGCACATG GGCAATACCA AGTTCTGGCT ACGGGCGAAC CCACTTTCTA 2580 CTCTTACAAC CCTTTGTTAA CACCATCAGC CCTTGATTTT TTTATAACCT GTGGGTACGG 2640 CATGGGCAGG CTAGATGTAC AAACTCTCCA GGAACTCTCG TCGGACCATC TTCCTATTCT 2700 GGCTGTATTG CACGCTACGC CGTTAAAGAA ACCACAACGC GTACGACTAC TTGCCCATAA 2760 TGCTGACATA AACATATTCA AAACCCATCT TGAACAGCTG AGTGAGGTAA ATATGCAAAT 2820 TCTGGAGGCG GTGGACATTG ATAATGCCAC AAGCCTTTTC ATGAGCAAAC TAAGTGAGGC 2880 TGCTCAGCTT GCTGCACCGA GAAATCGGCA TGAAGTAGAG GCCTTCAGAC CACTTCAACT 2940 TCCTTCCAGT ATATTGGCAC TGCTCAGGCT AAAACGAAGA GTTCGAAAAG AATATGCTAG 3000 AACAGGTGAT CCCCGCATGC AACAGATCCA CAGTAGACTG GCCAACTGCC TGCATAAGGC 3060 CCTTGCTCGA AGAAAGCAGG CCCAAATAGA TACCTTCTTG GATAACTTGG GTGCTGACGC 3120 GAGCACAAAT TACTCACTGT GGCGTATCAC GAAACGGTTC AAAGCTCAGC CCACCCCAAA 3180 ATCAGCAATC AAAAATCCGT CTGGTGGCTG GTGTCGCACT AGCTTGGAAA AAACTGAAGT 3240 GTTCGCTAAC AACCTTGAGC AACGTTTTAC ACCCTATAAC TATGCACCGG AAAGTCTCTG 3300 TCGTCAGGTT GAAGAATACT TGGAATCGCC CTTTCAAATG AGCCTGCCTC TGAGTGCTGT 3360 CACACTGGAA GAAGTGAAGA ATTTAATAGC CAAGCTGCCA CTTAAGAAAG CTCCTGGAGA 3420 AGATCTTCTT GATAATAGAA CCATTAGACT TCTCCCAGAT CAAGCATTGC AGTTCCTTGC 3480 CTTAATATTC AACAGCGTTC TTGATGTTGG CTACTTTCCG AAAGCTTGGA AATCGGCGAG 3540 CATAATTATG ATCCATAAGA CTGGAAAAAC ACCGACAGAC GTTGACTCGT ACAGGCCCAC 3600 CAGCTTACTC CCATCTCTGG GTAAAATTAT GGAGAGGCTG ATCCTAAACA GGCTGCTCAC 3660 ATGCAAGGAT GTTACCAAAG CGATTCCCAA ATTTCAGTTT GGCTTCCGGT TGCAGCACGG 3720 TACTCCTGAG CAACTACATA GAGTAGTGAA CTTTGCTCTG GAAGCTATGG AAAACAAGGA 3780 GTATGCAGTA GGTGCCTTTC TTGATATTCA ACAGGCATTT GACAGAGTCT GGCACCCTGG 3840 GCTCCTGTAC AAAGCGAAGA GGCTGTTCCC GCCGCAGCTA TATTTGGTTG TTAAAAGTTT 3900 CCTGGAAGAA CGCACATTCC ACGTCTCTGT TGATGGGTAC AAATCATCAA TCAAGCCAAT 3960 TGCAGCTGGA GTTCCTCAAG GAAGCGTTCT TGGCCCAACC CTATACTCAG TTTTTGCTTC 4020 GGACATGCCT ACTCACACAC CAGTCACAGA GGTAGACGAA GAAGATGTGC TCATAGCCAC 4080 CTACGCTGAC GATACTGCTG TGCTCACGAA AAGTAAAAGT ATCCTGGCTG CCACTTCTGG 4140 TCTACAGGAA TACCTGGATG CATTCCAGCA ATGGGCTGAG AACTGGAATG TGCGCATCAA 4200 CGCTGAGAAG TGTGCCAATG TGACGTTCGC CAACCGAACA GGTAGCTGTC CGGGTGTCAG 4260 TCTGAATGGA AGACTGATCA GACACCATCA GGCTTATAAA TACCTTGGTA TTACCCTCGA 4320 TAGGAAGCTC ACCTTCAGCA GGCACATCAC AAATATTCAG CAAGCGTTCA GGACCAAGGT 4380 TGCTCGGATG TCTTGGCTCA TTGCACCACG CAACAAACTG TCGCTTGGCT GCAAGGTCAA 4440 TATTTACAAG TCCATATTGG CCCCCTGCCT GTTCTACGGC CTGCAGGTAT ACGGCATTGC 4500 TGCGAAGAGT CACCTTAATA AGATCCGGAT TTTACAGGCG AAGACCTTAA GAAGAATTTC 4560 GGGGGCTCCT TGGTATATGA GAACAAGAGA CATCGAACGC GACCTCAAGG TGCCCAAATT 4620 AGGAGACAAG CTCCAGAACA TCGCCCAAAA ATATATGGAA AGGCTTAATG TACACCCCAA 4680 CAGCCTAGCA AGGAAGCTAG GAACTGCAGC TGTGGTCAAT GCTGACCCTC GGACTAGAGT 4740 CAAAAGAAGA CTCAAGCGAC ACCACCCTCA TGACCTCCCT AACCTGGTTT TGACCTAGAA 4800 AGTCTTAGTT TTAAAATTCA TTAGAATAAT CAAATAAATA ATAATTACTA TGTTATATCA 4860 ACTATTATAA TTCTCCCTAT CATTTTTAGA TTAAAAATCT GTTAGTCTTA AGTAACCAAG 4920 ACACATTGTA AAATAAAATA ATTTAAGCAG ATCAAATTAA GTTGCCGCAT GGGTAACAGT 4980 GCGTTGATCA AATAATAAAA ACATCATAAA AAAAAAAAAA 5020 // ID DMTRDNA standard; DNA; INV; 1435 BP. XX AC X80025; XX DR FLYBASE; FBte0000670; Dmel\hopper. XX SY synonym: M4 XX FT source X80025:1..1435 FT SO_feature terminal_inverted_repeat ; SO:0000481:1..33 FT SO_feature terminal_inverted_repeat ; SO:0000481:1403..1435 XX CC Derived from X80025 (g510507) (Rel. 44, Last updated, Version 11). CC Takis Benos and Michael Ashburner, 20-Aug-1997. CC Any changes to original sequence record are annotated in an FT line. XX SQ Sequence 1435 BP; 456 A; 265 C; 212 G; 502 T; 0 other; CACTATGGGG CATTTGGCCT GTTTTTTTTA CAAAAATTAA TACCTCCTAA ACTATTGGAG 60 ATATTTGGAT GAATTTTTTT TTATGCGTTA CACATGCCTC CAGGAATATT TTGGAAAAGT 120 GGGCGTGCCC CAACTCCGCC CCATTTTTTT TTTTTTTTTT TTTTTTTTTT AATAATATAT 180 TTTTAAAGTT TATTTTTAAT TTCAATAATG TATAATTCAT AACCGTCTTC CTCTTCACAA 240 TCAGTAGAGT CTGAAGAATT TTTATCAGGT TCAAATTCGC AAGCTAACAT TTCAATGACT 300 TCTGGTGGAA GAGATAGTCG CTTATGTTTT CGCCTCTTTA AATTTATTGA TGATATTATG 360 GGATCCGAAG TATCCATTGC TCTGTAAAAG ACATCTGCGA AGCTACTAAT AGTTTTTGCC 420 GTGGCTGGCT TCAACAAAAG AATTTTAAGT ATGGCTGCAA GATCCCGCAG GCAGCACTTC 480 CGTGCAGCTT GAACCAAAAG ACGTTCGTTG TGTTTCTGCG CCCTTACGAG TTCATCTGCT 540 TGCTGTCTTG GGCCACTCAA ATTTTTTAAA TAATATGACG TTTTCGGGAG TCCAACTAAT 600 TTCCTTTCCT ATTTATTTTT CTCCTTTACC TTCAGGACTA GGTGTTCTTC TAACCAATTT 660 GAAAAAAATT TTAAAAATTC ATATATTTTT CGATTGCATT TTCTCCAATT TCGTAAAAGA 720 TTGACTGAAA TCATTCGTTA TTATTATTAT TAGTTAATCG TTTATTAAAG TCTAGCTTGC 780 TATCAGAAAA ATGCCCACTG ATAAAAGTGC AAATAGAATT TTCCTTTTGA CGAACACCCT 840 TTTGCGTGCG CCACACTTCC AGCAGGGCAG CATTGGAAAT CGAGATATTG CTCCCTAAAA 900 AATGAAATTT CTCAAAAAAC CGCAAAAAAC GCACATAGAG ACTACCTGAT ATGAGTTAGG 960 AATTGAACAC ACTACAACAT GGATATAAAC ACTTACTGAA CAAATTTGAA CAAATTGTTG 1020 TAGCTCTATT CAAAGTTGAA AATTTTTTCA AACAACTACA TCTTGACACC ACTTGTTAAA 1080 TGTACAAATT GTTAGAAATA GGCGCACACA ATAAACAATA TATTAATAAC AACACATAAT 1140 AAGAACCTAA AGATTGATTA TCCATTTCAA ATTATACTCT CCTTCTTCTT CTTTTTAAAT 1200 TTTAACACTT TGAAAGTTAA GCTAAATTTT GTGCGCAAAG CAGCCACGTG GTATATGCTC 1260 GCAACAGCCG ACTTTAACAG CTGTTATTAT AACAGTGCAT TGTTAAATTA ACTTATGCGG 1320 GCTATATCAT AACAGTTTAA CGTATTTCCA ATGTATTAAT ACTAAAATAC TTCAAATTTG 1380 CATACTTGTG AAAAACACAT TATTGTAAAA AAAACAGGCC AAATGCCCCA TAGTG 1435 // ID DMRTMGD1 standard; DNA; INV; 7480 BP. XX AC X59545; XX DR FLYBASE; FBte0000015; Dmel\mdg1. XX FT source X59545:1..7480 FT SO_feature five_prime_LTR ; SO:0000425:1..441 FT SO_feature three_prime_LTR ; SO:0000426:7039..7480 FT SO_feature CDS ; SO:0000316:548..923 FT SO_feature CDS ; SO:0000316:1327..1557 FT SO_feature CDS ; SO:0000316:1749..3062 FT SO_feature CDS ; SO:0000316:2987..6673 XX CC Derived from X59545 (g8507) (Rel. 49, Last updated, Version 4). CC Takis Benos and Michael Ashburner, 20-Aug-1997. CC Any changes to original sequence record are annotated in an FT line. XX SQ Sequence 7480 BP; 3067 A; 1298 C; 1235 G; 1880 T; 0 other; TGTAGTATAT ACGAATATAA TAACAATAAT AATAACAATA ATAATAATAA TATTAATAAT 60 AATTATAATA TGAATCATAA TAATAAGTCA ACTAATAAGT AAACTTAGGA CCACCCTAAT 120 TCCTTAGGGT CACCCTAGTA GATCTTTAGA TACACCCTAA TACTAAATAT GCGAATTCAG 180 GATGTACGCC TTTAGGGGTC GGACTCGACT CCCATTGGTT ATCGAGTATG AACTTCATAC 240 ATACATATTG CAGAATTTGC TAGTGTCAGC ACTTGGCTGT CACAAGAGAT CTCCCTGTAG 300 ACCACACTAA GATCAGTTAT AAATCAGGAA TAGATCTGGA ATGTACACTC GCTTAATAAA 360 AACCAAATAA AGATAAAATG ACCAACTGCG TTTTGAGACT TTATTAACTA CATCAGAAGT 420 ATTAGAATTC AAATTAACTA CATGGCGACC GTGACAAAGG ATCGTTATAA GTTGTAGCAG 480 AAGCTAAAGG AAACCGCTTG TGATAATTTT CAACTTCGAT GCTCATCCAC CAAGACGGCG 540 GCAATTATGA AGAAAAAAGC GATCTGAGTG AGTAGAGTGT CAGTGTGATG GGAAAAAACA 600 GGGGCGGAGT TCGACATAAT ATAAAAAAGA GAATAGCGCA CATAAAGTGG CTATTATATA 660 CGAACACTCC ACCACCCCAA TGGTCGAAAG CTCAAAAACT ACAAGCTGAG CTAGACCACT 720 GTGTCGAATA TCTCAAGAAA AAAATCCCCA CCACACGCGC TCACTCAGAA AATCAAATAA 780 AATCGTTAAC AATTAACAAA ACTCCAACTC CCAATCCGAA AAGCCTGCCT GTTTTCAAGA 840 AAAGATGCCC GAACGACTGC GAGGGACCAC TGTTCACACC GCATTGTGAA CATACGTGCA 900 GACATTGCAG CTCCACCACA TAACCCCTAA ATGAGGAAAT CATCATCAAC GTGGTGAGCA 960 GCCCGCTCAT TACGTCATCG AGGGAGTGTC AGCGTGCCAA CCCGGCGACG ACCAGATGAC 1020 GCAGGAGGGT CAGAGTGAAG CAAATAGGAG CTGAAAAATA AAATATTTTT TTTGTTGCCC 1080 TGCGTGGCAC ACCCTCGATG CACTGCGCTG CATATTAATA TTACACAAAA TATTGTAACA 1140 TTGAGCGGAA CTTTTTCTGC CCGATGAGAA GAATGGCCCG TAAAGCCATA CACCAACTAG 1200 GTAGGAAAAT GTAACTATAT TGAACAAAAA AAAAAAAAAT CAAAACAACA TATTTTTAAA 1260 GTAAAATAAA CCAAAACCCA AAAATAAAAA AAAAAAAAAA AAAAAAAAAA ATAAAAATAT 1320 ACAAAAATGG GTTGGTTTGG ATCTGACGAT AGTCAGACAA AAGATAATAC GGCCAATGTG 1380 GTCAATAACT TAAAAATAGT CGACCATACA GATGACATTC AGTCACTGTG GTTACTCCTT 1440 TTGATCATGA CGATCGTAAC AGTCGCTCAG TTTATATTAA CGCTATATGT TAAGCATAAC 1500 AAGATAATAA AGAGGCGTTA TATAGGCAAA GCAGAGAATA GTTTGGATAA AATTTGAAAA 1560 AAAAAAAAAA AAAAAAAAAA AAAAAAACAT CCGAGATGTA TTTTGAATTA AGATGATCTA 1620 AAATTTTTAT TTTTAATATC AGAAAACTAG AATGAAAAAA AAAAAAAAAG ATTATTGAAG 1680 AAACCTATTT GAGAGAGGCC AAAATTTATA AAGTTCGATT GCATAGATAA ATCCATAGTA 1740 TTCTTTAAAT GGACTGGCAA GAAATACAAA ACGAGCTTAA AGAAATTAAA ACAACTTTTG 1800 ACAAGTCTTA TAAATGCATG ACACCAAATA GAGAAGTGCA ACAAGACACT CTCAACAAGC 1860 ATGCGCAGAT ATTGGTAAGA TGCTTTAATG GAGCACGCCA ATTAATTTAC AGAGAAAGGA 1920 AAAGATTAAC AAAAAATCAT TTATCACAAG CAGTAAAATT TCTAAACAGG TTCCGTGAGA 1980 ACTTGTTAAA CGTCAAGTAC AGACACAACT TAAATATTAC AATCCCAACG ATTTTAAGCA 2040 CACCTATAGT GGCTGAGATC GGTGAGGATA TCGAAAGTGT AGGAGAATCA GAAATAGAAA 2100 TAAAAGAAGA GGATCTCCAC GATCTTGCAA TTCCAGCGGT AATAACATTA CCCGAATTAC 2160 TTGAAGAAGA ACTTTCAGAT TCAAATACAG GAATAAGAAT ACAGGAAACG GACAAAATGA 2220 CAGACTCTGC CGCAACAGCA AGGGAATATG TGCGACAAAT TTCGTCCACA ATACCTGAGT 2280 TTGACGGCAA AAAGTTAAAC TTGAATAGAT TCCTCACGGC TCTCCGGCTG ATAGATCTGA 2340 CAAAAGGAGA TCAGGAGATG CTAGCGGTTG AGGTAATCAA GACAAAGATA CTTGGTCCAT 2400 TATCACACAA AGTTGAAAAT GAAAAGACCA TTATCGGTAT AATAAATCTA TTAAAAGCAT 2460 CAGTTAAAGG CGAATCGCCC GATGTCATCA AAGCAAAAAT GCTTAGTACA CAACAGCGCG 2520 GCAAAACTGC AGCGCAATAT ACCACGGAGA TAGAAAACCT ACGTGGGTTG CTCGAAGCAG 2580 CCTATATAGA TGATGGTTTA GATTCCAACA ATGCAGACAA ATTCGCTACA AAGGAAGCCA 2640 TATCTGCAAT GACCAAGAAC TGTGGGCACG ATAAGCTCAA AACCATATTG GAAGCTGGAA 2700 ATTTCAACAC GATGAATAGC GTGATTGAAA AATACATACA CTGCAGTACA GAAATGACCG 2760 GCAATTCAAA TAGTGTATTA TTCTATAATA ATAGAGGACA CTATCGAGGT AATAATTACC 2820 GAGGAAATTA CCAAAACAGA GGTAATGGCC GAGGAAATTA TAACTCCTAC AATAACAACT 2880 ATAGAGGCAG AGGTGGTTAC CATGGTGGAA ACAGAGGACG AGGTGGTAAC CAAAATTATA 2940 ATAGAGGTGG AGGTTACTCA AGAGGTAACC AAAACCATAA CTATAAAACA AGTCATGCCC 3000 ACAATGTCCG AAACATACAA TCGGAAAACG AACATACCCC CTTGAGCGAC AATCTACAAT 3060 AAAATTATAC AAAATTAATC TCAATTTAAG CATTTTTATA CGATTGAAGA ATATGAGTAC 3120 CAATTCATGG GTAACTCTTT TAATAGATAC AGGTGCAGAA ATTTCCCTGC TTAAATGCAG 3180 AAACAATAAT CTTAACGATT TAAATCCAAA AAATACAACA AATATATCAG GAATAGGGCA 3240 AGGGACAATT CAGTCTCTAG GTACACTACA TTTAGAAATG TGTATTGCTA ATGCAGCAAT 3300 ACCATATGAA TTCCATATCG TACCTAACAA TTTTCCTATA CCAGGGGATG GTATAATTGG 3360 CTTGGATTTC ATTAAGAAAT ACAATTGTAT TTTGGAATTC CACGACCAAG AAGATTGGTT 3420 CACTTTGAGG CCCAAAAATT TCAGGAACAT AAACATTCCT ATTATACATA CACTAGATAA 3480 TGAAATAATT TTGCCAGCTA GATCAGAAGT GATTCGAAAG ATTCAACTAA CATCTACTGA 3540 CACACATGTT CTCATTCCCA ACCAAGAATT ACAACCTAGC ATAATAATCG CAAGTGCACT 3600 CGTAAACACT CAGAACGTTT TGATTCGAAT TATTAATACA ACTGAAAAAG ACGCTATAGT 3660 TAGTAGCGCA AATATAAAAA GCGAATCATT GGATGATTAT GATGTATACA ACGCAAATAT 3720 AGAAAATAGT GCACAAAGAA CTTCAGAAGT ATTAAAACTT CTTAAATTTC CATCGTTATT 3780 CAAAAGCGAT TTAACAAAAT TATGCACCGA ATATAGCGAT ATTTTTGGTC TTGAAACAGA 3840 AACCATATCA GCTAATAATT TTTACAAGCA AAAATTGAGA TTAAATGACA AAACTCCAGT 3900 CTATATCAAA AACTATAGAA TGCCAGAAAG TCAAAAACCA GAAATTCAAA GGCAAGTTGA 3960 CAAATTAATA AAAGATGGCA TTGTCGAACA ATCTATTTCA GAATATAATA GCCCTCTTCT 4020 CTTGGTACCC AAGAAATCAC TGCCTAACTC GGAGGAAAAG AGATGGCGAT TAGTAGTCGA 4080 TTATCGCCAA ATAAACAAGA AACTGCTAGC AGATAAATTC CCACTTCCAA GAATAGAAGA 4140 CATTCTTGAT CAATTAGGCC GAGCAAAATA TTTCTCGTGC CTAGACCTGA TGTCAGGATT 4200 TCATCAAATA GAATTAGACG AAAGGTCAAG AAATATAACA TCTTTCTCAA CTTCAACGGG 4260 AGCATACCGC TACACGCGAT TACCATTTGG TTTAAAAATA GCCCCAAATT CTTTTCAAAG 4320 AATGATGACC CTTGCATTTT CAGGTTTAAC GCCTTCGCAA GCATTTCTGT ATATGGATGA 4380 TTTAGTAGTC ATAGGCTGTT CTGAAAAGCA CATGCTTAAA AATCTAACCG ACGTTTTCAA 4440 ATTATGTAGG CAACATAATT TAAAATTACA TCCAGAAAAA TGCACTTTCT TTATGAAAGA 4500 GGTTACTTAT TTAGGTCACA AGTGTACTGA CAAAGGTATA TTGCCAGATG ACTCTAAATA 4560 TGAGGTAATA AAGAACTACC CCAAACCAGT AAACGCAGAC GAAGCTAGAC GCTTCGTGGC 4620 ATTTTGCAAT TATTACAGAA GATTTATTAA GAACTTTTCT GAGAAATCAC GCCACTTAAC 4680 GAGGCTTTGT AAAAAGAATG TTCCATTTGA ATGGACAAGC GAATGCAATG ATGTATTCGA 4740 ATATCTCAAA AGGAAATTAA TGAAACCAAC ACTCCTTCAG TACCCAGATT TCAGCAAACA 4800 ATTTTGCATA ACCACAGATG CTAGTAAACA AGCATGTGGA GCGGTACTAT CTCAAGACCA 4860 TAACGGTCAA CAGCTACCAG TGGCATACGC TTCAAGAAGC TTTACAAAAG GCGAAAGTAA 4920 TAAGTCCACT ACAGAGCAGG AGCTAGCAGC TATTCACTGG GCAATAAATC ACTTCAGACC 4980 ATACGTATAT GGTAGACATT TCTTAGTACA AAGTGACCAT AGGCCACTAT CATATCTTTT 5040 TTCAATGAGA AACCCCAGTT CAAAATTAAC CAGAATGAGA CTAGACTTGG AGGAGTTCGA 5100 ATTCACAGTA GAATATCTCA AGGGGAAAGA TAATCATGTC GCAGACGCAT TGTTCCGAAT 5160 AACAATCGGA GAACTTAAAG CAATAAATAG ACAGATACTA AAGGTAACAA CAAGATCAAC 5220 AACAAGACAG AAAAATACCT GCGCAGGTGA AAAATTGCAT GAACCAAATG AGAAAGAAAA 5280 TATAAAAATG CCCAATATCT ATCAGGTAAT CAATAACATT GATGCCAAAA AATATGTTAT 5340 ACTCAAAATA GACAAGCATA AGTGTTTGTT GAAAAGAGGA AAACAAATTA TAACACGTTT 5400 TGATATGACT AATTTTTATT CTAATGAAAT AATCGATTTA GATCAATTCT TTCAAAGGCT 5460 TAATGAAGAA GCAAGAATAA ATAGCATCAT TCAAACACAA TTGTCACCAA GTGAACAAAT 5520 CTTCGAATTT GTCACTATAA AGAACTTTAA AGAAAAGGGC AATAAAATAC TAAAAAATTT 5580 AAAAATAGCG CTATTAAACA AGGTGACTAA GATAGATAAA AATGATAAGG TTCAAATAAA 5640 AGCAATACTG TCTAAATATC ATGATGATCC ATCAGAAGGA GGCCATTCAG GAATTTCTAG 5700 AACCCTGAGG AAAATGAAAA ACTGTTGTTG TTGGCCACGA ATGACGAAGG CGATAAGTGA 5760 ATATGTTGAA ACATGTTTGA AATGTCAACA AGCCAAGACT ACGAAACATA CTAAAACACC 5820 GTTGACAATA ACAGAAACGC CAGCAACAGC ATTTGATAAA GTTTTGATAG ATACCATTGG 5880 TCCACTGCCA AGATCAGAAA ACGGAAATGA GTATGCTGTT ACTATCATTT GCGATTTAAC 5940 AAAATATTTG GTAACGGTAC CAATTCCAAA TAAAAGTGCA AAATCAGTTG CTAAGGCTAT 6000 ATTCGAAAAT TTTATTCTAA AGTACGGTCC AATGAAAACA ATCACAACGG ACATGGGAAC 6060 GGAATATAAA AACCAAATTA TAGACGACCT ATGCAAATAT ATGAAGATAA AAAACATTAC 6120 TTCAACAGCA CACCATCACC AGACATTAGG AACAGTAGAA CGAAGTCACA GAACTTTCAA 6180 CGAGTATGTT CGCTCATATA TATCTGTTGA CAAAACCGAT TGGGATATAT GGATACAATA 6240 TTTTACTTAT TGTTTCAACA CAACACCATC GGTAGTTCAT GAATATTGTC CATATGAATT 6300 AGTATTTGGA AGATTACCAA GACAGTTCAT AGATTTTAAC AGGATAGACA GAATAGATCC 6360 TATTTACAAC ATGGATGATT ATTCAAAAGA AGTTAAGCTA CGATTAGAAA TAGCATATAG 6420 AAGAGCTAAA AATATGTTAG ACAAGGCAAA AGCCGATAGA AAGATAAAAT ATGATAGAAA 6480 TATTAGTAAC TTTGAATTAA AGATAGGAGA TAAGATATTA CTTAAAAACG AAACGGGTCA 6540 TAAACTTGAC AATAATTATT TAGGACCATA TTTAGTTTCA GAAATAGGAG ATAATGACAA 6600 CATTACAATT ATAGGAAATA AAAATAAAAA ACAGATAGTC CATAAAGATA GGTTAAAAAT 6660 TTTTAATTCA TAATACATTT TGTTTGGTTG GCCAACCACA AATAAAAAAC CACAAATAAA 6720 AAACCACAAA TAAAAAACCA CAAATAAAAA ACCACAAATA AAAAACCACA AATAAAAAAC 6780 CACAAATAAA AAACCACAAA TAAAAAACCA CAAATAAAAA ACCACAAATA AAAAAACCAC 6840 AAATAAAATA AAAACCAATA AAAACATTAT AATACAAAAC TTTTACTTTG CAAAATATAA 6900 TGAAAATATA TATATTTTTT TTAATATCTC TTTAATCATT CATTTCAAAT ATTAATGTAC 6960 ATTTAAAAAA AAAAAAAAAA ATATTATATA CTTGAAAATA ACTTCATGTT ATTACGTTAT 7020 TTTTCAAAAG GAGGGAGATG TAGTATATAC GAATATAATA ACAATAATAA TAACAATAAT 7080 AATAATAATA TTAATAATAA TTATAATATG AATCATAATA ATAAGTCAAC TAATAAGTAA 7140 ACTTAGGACC ACCCTAATTC CTTAGGGTCA CCCTAGTAGA TCTTTAGATA CACCCTAATA 7200 CTAAATATGC GAATTCAGGA TGTACGCCTT TAGGGGTCGG ACTCGACTCC CATTGGTTAT 7260 CGAGTATGAA CTTCATACAT ACATATTGCA GAATTTGCTA GTGTCAGCAC TTGGCTGTCA 7320 CAAGAGATCT CCCTGTAGAC CACACTAAGA TCAGTTATAA ATCAGGAATA GATCTGGAAT 7380 GTACACTCGC TTAATAAAAA CCAAATAAAG ATAAAATGAC CAACTGCGTT TTGAGACTTT 7440 ATTAACTACA TCAGAAGTAT TAGAATTCAA ATTAACTACA 7480 // ID DMMDG3 standard; DNA; INV; 5519 BP. XX AC X95908; XX DR FLYBASE; FBte0000010; Dmel\mdg3. XX FT source X95908:1..5519 FT SO_feature five_prime_LTR ; SO:0000425:1..267 FT SO_feature three_prime_LTR ; SO:0000426:5253..5519 FT SO_feature transcription_start_site ; SO:0000315:178 FT SO_feature polyA_signal_sequence ; SO:0000551:5253..5519 FT SO_feature CDS ; SO:0000316:296..4780 FT /name="Dmel\mdg3\ORF" FT /db_xref="FLYBASE:FBgn0043882" FT /db_xref="SPTREMBL:Q94885" FT /db_xref="NCBI_PROTEIN:CAA65152.1" FT /translation="MDDKIILNDFSLTTLKDWLRILGQNTEGTKTELIARLQDIPTAVR FT GDCPPEHPQKNAPPGNDIFSSLDFQNCEINTDHVSVNAMNRKESTETGSERETNMFELQ FT QLRAELAEAKAMLNGTRSSLQFQEQQQPEQSKATVSSVIQTAQFTQAGATKENTTFHSP FT QRSNERAESQRFPVDALALAKETITDYDGKTCARAWITVVKNIARTFNIDDNHLRILLI FT TKLKGNAQVWLHAHPARLIEPIDNLLDQLSLTFGEQSSKAEIRRKFESRKWKTEENFCS FT YYDEKMALSNGINIDDDELLDQMIEGIPLQNFRTQARIQCFSTPSEMLRAFSNIRLPAR FT REPPVQPTDYKDAIRCANCNSRGHKADICKKPKREPGSCYACGQLGHLVAQCPTRKSVS FT SNNYVRWFKINFFENAYKPIISECLIDSGSPISIIKKSLINETMKLALVNTCYFGLNNC FT ILKTHGQTTCYVLKGSIKIYFRLIIVCDQSMRYNVILGRDFLTACNLNLDPYTLGMIAL FT RKPMEINKISMFTENDSPEKSLENEIVSPKSLENEIVSSQSLENEIVSPKSLENEIVSP FT KSFKNATISPKSLENKIVNQQHKETGPISLRDEIVNQQKNVSKSKLSEDEIVNTSKEIV FT SFKLPKDKNVYEQLNHNFDKEVLRICHVTESELEYKIGENVSNRLQLEFDRLFRNFYIN FT AKRPNEPTVRSEIQLCLKNPKPFSCSPRRLSYTEKDRLQKLLDEYLENGFIRPSDSEYA FT SPIVLVKKKTGDLRMCVDFRKLNKMTMKDNYPLPLIDDLLDRMNEKTVFTKLDLKNGFF FT HVHVKKESIKYTSFVTPLGQYEWLRMPFGLKNAPSVFQRFVNKIFADMIRENKVVVYMD FT DILLATENINEHLETLKEIFKRLVENKLELRIDKCEFMQSSIKYLGFIINKDGIMPNDK FT GIEAIKNFPIPNNVHTVQSFLGLCSYFRRFIKDFSRLAKPLHDILKKDKPFKFGSEEMI FT CFNMLKDKLIQSPVLAIYNHKHETELHCDASSSGFGAVLMQKKEDQKWHPVSFFSKRTT FT DIESKYHSFELETLAIVYSLRRFRVYLHWRTFKIVTDCNSLILTLSKKELNPRIARWAL FT EFQGYDFEIVHRAGSRMQHVDALSRCTNIMVIQTNSFEDNLVICQGKDTKLKEIRQLLE FT NTENKLYEMRNGIVYKKTNENRLLFYVPIEMEEQVLYKYHNELGHVGRDKMIEAIMKNY FT WFPNLKQKCSTHISNCLKCISFSPKTGKTEGFLHNIPKGNKPFEIIHIDHYGPVDLARP FT KKHILVIVDAFTKFVRLYATKTTNTKEVIQSLNDYFRAYSRPKCIISDRGACFTSGDFD FT SFLKECNVKHIKIATGSPQANGQVERINRSLGPMISKLIEPDQGLHWDLVLEKVEYTLN FT NTLHRSIKQYPSIMLFGLQQKGQIMDELKEKIEEIGETIEERDLESIRNKGEASQKIAQ FT AYNKEYVDKKRKRSGVFTKGTTSWLKILTQQQA" XX CC Derived from X95908 (e990667) (Rel. 49, Last updated, Version 3). CC Takis Benos and Michael Ashburner, 20-Aug-1997. CC Any changes to original sequence record are annotated in an FT line. XX SQ Sequence 5519 BP; 2078 A; 1005 C; 1029 G; 1407 T; 0 other; TGTAGTAGGC TGCACCTTCT ACCCTCTTCC TTTACTCTTA GTCATACATA CCTAATTATA 60 CATAGCCAAT CTAGTCATAA GCTTATACAC TCATACACCC ATCCTTAACA TACAAATATT 120 ATCGAGAAAC TTATCGACTA ATCGACTCGC CACTCTGCAG AGAGCGCGGC AGTCAGTCGC 180 TGTTGAACCA AGCTAAAGGA CAGATCAAAA ATAAAAGAGA CACGTGAAAT TGTATTAGAA 240 TATTAACTTC TGTAAACGGC GGCTAAAATC TCAGAAGTGG GATTAATAAT CCAAAATGGA 300 CGATAAAATC ATCCTGAACG ACTTTTCGCT GACAACCCTA AAAGATTGGC TACGTATTCT 360 GGGCCAAAAT ACGGAGGGCA CAAAAACCGA ATTAATCGCG AGGCTGCAAG ACATCCCAAC 420 GGCAGTTCGG GGCGATTGTC CACCGGAGCA CCCCCAGAAA AACGCTCCAC CAGGAAACGA 480 CATTTTTTCT TCACTGGATT TTCAGAATTG TGAAATTAAC ACCGATCACG TAAGTGTGAA 540 TGCGATGAAC AGAAAAGAAT CAACCGAAAC TGGCAGTGAG AGGGAGACAA ACATGTTCGA 600 GCTACAGCAA CTACGCGCAG AGCTAGCAGA AGCGAAGGCA ATGCTTAACG GAACACGATC 660 GAGCTTGCAG TTCCAAGAAC AACAACAACC AGAGCAAAGC AAGGCTACAG TTAGTTCCGT 720 TATCCAGACG GCGCAGTTTA CGCAGGCTGG CGCCACAAAA GAGAACACAA CATTTCACTC 780 GCCGCAGCGA TCCAACGAGA GAGCGGAGAG CCAGCGTTTT CCAGTTGATG CTCTCGCTCT 840 CGCCAAAGAG ACGATAACCG ATTACGATGG GAAAACTTGC GCGCGTGCCT GGATAACAGT 900 GGTCAAAAAT ATCGCACGCA CTTTCAACAT CGATGACAAC CATTTACGCA TCTTACTCAT 960 CACTAAACTT AAAGGAAACG CGCAAGTCTG GTTACATGCG CACCCTGCTC GATTGATCGA 1020 ACCAATTGAC AATTTGCTTG ATCAATTGTC ATTGACTTTT GGCGAGCAAT CATCCAAGGC 1080 TGAGATCCGG CGAAAATTCG AGAGTCGCAA GTGGAAAACC GAGGAGAATT TCTGCAGTTA 1140 TTACGACGAG AAGATGGCTC TCTCAAACGG GATAAACATC GACGACGACG AACTACTGGA 1200 CCAGATGATA GAGGGCATAC CGCTACAAAA TTTCCGTACC CAAGCACGGA TTCAATGCTT 1260 CTCTACTCCA TCGGAGATGC TACGCGCATT TTCGAACATC CGTTTGCCAG CTCGGAGGGA 1320 GCCACCTGTA CAGCCAACCG ACTACAAAGA TGCCATACGA TGCGCAAACT GTAATTCAAG 1380 AGGACACAAA GCTGACATCT GCAAGAAGCC CAAACGTGAA CCAGGTTCGT GCTACGCCTG 1440 TGGACAACTT GGACACCTGG TGGCACAATG TCCCACAAGG AAGAGCGTTT CATCTAATAA 1500 TTATGTAAGA TGGTTTAAAA TTAATTTTTT TGAAAATGCT TATAAGCCCA TAATTTCAGA 1560 ATGCCTCATA GACTCTGGCA GTCCTATATC TATCATTAAA AAGTCACTTA TTAACGAGAC 1620 AATGAAGTTA GCCCTAGTTA ATACTTGCTA TTTTGGTTTA AACAACTGTA TTCTCAAAAC 1680 ACATGGACAA ACCACATGTT ATGTTTTGAA AGGATCAATA AAAATATATT TTCGTTTAAT 1740 CATTGTTTGC GACCAGTCTA TGAGGTATAA TGTTATTCTC GGCAGAGATT TTTTAACTGC 1800 ATGCAATTTA AATTTAGACC CGTACACCTT GGGAATGATT GCGTTGAGAA AACCCATGGA 1860 AATAAACAAA ATATCAATGT TTACTGAAAA TGATAGTCCT GAGAAATCTT TAGAAAATGA 1920 AATTGTTAGT CCAAAATCGT TAGAGAATGA AATTGTTAGT TCACAATCGT TAGAAAATGA 1980 AATTGTTAGC CCCAAATCGT TAGAGAATGA AATTGTTAGT CCAAAATCGT TTAAAAATGC 2040 AACTATTAGT CCGAAATCGT TAGAAAATAA AATCGTTAAT CAACAGCATA AAGAAACTGG 2100 TCCAATATCG TTAAGAGATG AAATAGTTAA TCAACAAAAG AATGTCAGTA AATCAAAATT 2160 ATCAGAAGAT GAAATTGTTA ACACTTCAAA AGAAATCGTT AGTTTTAAAT TGCCAAAAGA 2220 TAAAAACGTT TACGAACAAT TAAATCACAA CTTTGATAAG GAAGTACTAA GAATATGTCA 2280 TGTAACTGAA AGTGAGTTAG AATACAAAAT AGGAGAAAAT GTTAGCAATA GGTTACAACT 2340 AGAATTCGAT AGGTTGTTTA GAAATTTTTA TATAAATGCA AAAAGGCCAA ATGAACCGAC 2400 AGTTAGAAGT GAAATACAAT TGTGTTTGAA AAACCCGAAA CCGTTTAGCT GTTCTCCTAG 2460 GAGGCTTTCA TACACAGAAA AAGACAGGTT ACAAAAACTA TTAGACGAAT ATTTGGAAAA 2520 CGGATTTATA CGACCAAGCG ACTCGGAATA TGCATCGCCT ATTGTTTTAG TGAAAAAGAA 2580 AACTGGAGAC TTACGTATGT GCGTCGACTT TAGAAAACTT AATAAAATGA CAATGAAAGA 2640 CAACTATCCT CTACCTCTTA TAGATGACTT GTTAGATAGA ATGAATGAGA AAACTGTTTT 2700 CACCAAACTC GATCTTAAAA ACGGTTTTTT CCACGTGCAT GTTAAAAAAG AATCAATAAA 2760 ATACACCTCT TTCGTTACAC CATTAGGCCA ATACGAGTGG CTGCGAATGC CATTTGGCCT 2820 CAAAAACGCC CCGTCTGTGT TCCAAAGATT TGTTAACAAA ATTTTTGCGG ATATGATTAG 2880 AGAAAACAAA GTAGTAGTAT ATATGGACGA CATTCTATTG GCAACCGAAA ATATAAACGA 2940 ACACTTAGAA ACGTTGAAAG AAATTTTTAA AAGATTAGTT GAAAATAAAC TTGAATTAAG 3000 AATAGACAAA TGTGAGTTTA TGCAATCAAG TATAAAATAT CTTGGGTTCA TAATAAATAA 3060 AGACGGCATA ATGCCCAATG ACAAAGGAAT CGAGGCAATA AAAAATTTCC CAATACCTAA 3120 TAATGTTCAT ACAGTACAAA GTTTTTTGGG ATTATGCTCA TATTTTCGAC GGTTTATAAA 3180 AGATTTTTCT AGACTAGCTA AACCATTGCA TGACATTCTA AAAAAAGATA AACCGTTCAA 3240 ATTTGGTAGT GAAGAAATGA TTTGTTTTAA TATGTTAAAA GATAAATTAA TACAGTCACC 3300 GGTCTTAGCT ATATACAACC ATAAACACGA AACAGAATTG CATTGTGATG CAAGTTCTTC 3360 TGGATTCGGT GCTGTACTTA TGCAAAAGAA GGAGGACCAG AAATGGCACC CAGTTTCATT 3420 CTTTTCAAAA CGGACAACAG ATATTGAATC AAAATACCAC AGTTTCGAGT TAGAAACTTT 3480 AGCCATTGTT TATTCGTTAC GTAGATTTAG AGTTTATCTT CATTGGAGGA CATTTAAAAT 3540 AGTCACCGAC TGCAACTCAT TAATTTTGAC CCTAAGCAAA AAAGAGCTAA ACCCTAGGAT 3600 AGCCAGGTGG GCTTTAGAAT TCCAAGGTTA TGATTTTGAA ATTGTGCATA GGGCAGGTAG 3660 CCGCATGCAA CATGTTGACG CACTGAGTAG GTGTACAAAT ATTATGGTAA TACAAACAAA 3720 CAGTTTCGAA GATAATCTAG TTATATGTCA AGGGAAAGAT ACAAAATTAA AAGAAATCAG 3780 GCAATTGTTA GAAAACACAG AAAATAAATT GTATGAGATG AGAAATGGTA TAGTTTACAA 3840 AAAGACAAAT GAAAATAGAT TGCTGTTCTA CGTTCCGATA GAAATGGAAG AACAAGTGTT 3900 ATACAAATAT CACAACGAAC TTGGACACGT AGGAAGAGAC AAAATGATAG AAGCTATAAT 3960 GAAAAACTAT TGGTTTCCAA ATTTAAAACA GAAGTGTAGC ACACATATCA GCAACTGTTT 4020 AAAATGTATT TCATTCAGTC CCAAAACAGG AAAAACAGAA GGATTTCTAC ACAACATACC 4080 TAAGGGAAAC AAACCTTTTG AAATAATCCA TATTGACCAT TATGGTCCAG TAGACTTGGC 4140 TAGACCGAAG AAACATATTC TAGTGATAGT AGATGCATTC ACAAAGTTTG TCAGACTATA 4200 CGCAACAAAA ACTACGAACA CAAAAGAAGT CATACAATCG TTAAATGACT ACTTCAGAGC 4260 ATACAGTAGG CCTAAGTGTA TCATATCAGA TAGAGGAGCA TGTTTCACGT CTGGCGATTT 4320 TGACTCATTT TTGAAAGAAT GCAATGTTAA ACACATAAAA ATTGCAACAG GATCGCCACA 4380 AGCCAACGGT CAAGTTGAAC GTATAAACCG AAGTCTTGGT CCAATGATTA GCAAGTTAAT 4440 TGAACCTGAT CAAGGTCTAC ACTGGGACTT AGTCTTAGAA AAGGTCGAAT ATACCCTGAA 4500 CAATACACTA CACCGCAGCA TTAAACAGTA TCCTAGCATA ATGTTATTTG GGTTACAACA 4560 AAAAGGACAA ATTATGGATG AGTTAAAAGA AAAAATTGAG GAAATTGGAG AAACGATTGA 4620 AGAAAGAGAT TTAGAAAGTA TTAGAAATAA AGGCGAGGCA AGTCAGAAAA TAGCACAAGC 4680 ATACAATAAA GAATATGTTG ACAAAAAACG AAAACGATCA GGAGTGTTCA CAAAAGGCAC 4740 TACGTCATGG TTAAAAATTT TGACTCAACA ACAGGCATAG CTAAGAAGTT AATTCCAAAG 4800 CATAAAGGAC CCTATGTCAT AAGCAAAGTT CTCAAAAATG ATCGCTTCCT TCTGGAAGAT 4860 GTTGATGGAT TTCAAATTTC TCGCAATCCT TACCGGGGTG TATGGAGCAT ACAGAATATA 4920 AAACACTGGC AAAGAAAAAT TAAGAGTCTA CAAAATAGAA AGTATAATTT GAGAAACTCT 4980 GTACAAAATA GAAAGTATAA TTTGAGAAAC TCTGTACAAA ATAGAAAGTA TAATTTAAGA 5040 AACTCTGTAC GAAATCGAAA GTATAATTTA AGAAGCAATT GTAAAACAAA GAAAACAAAC 5100 AAGAAGAAAA GAAAACCAAA AAAATGTTTA AGACCGTTCA AAAGTATCTC CACTAAGAAG 5160 AATAAAATAA GAAACAGGAC CCTTAGCTTT AAGAAACGTT AATTGTTATA AAATCCTACG 5220 ATCGGGAGAT CTAGTTGTCA GGACGGCCGA GTTGTAGTAG GCTGCTCCTT CTACCCTCTT 5280 CCTTTACTCT TAGTCATACA TACCTAATTA TACATAGCCA ATCTAGTCAT AAGCTTATAC 5340 ACTCATACAC CCATCCTTAA CATACAAATA TTATCGAGAA ACTTATCGAC TAATCGACTC 5400 GCCACTCTGC AGAGAGCGCG GCAGTCAGTC GCTGTTGAAC CAAGCTAAAG GACAGATCAA 5460 AAATAAAAGA GACACGTGAA ATTGTATTAG AATATTAACT TCTGTAAACG GCGGCTAAA 5519 // ID DMDM11 standard; DNA; INV; 5461 BP. XX AC X14037; AC X15066; XX DR FLYBASE; FBte0000042; Dmel\micropia. XX FT source join(X14037:5..3664,X15066:3534..3593,X14037:3721..5461) FT SO_feature five_prime_LTR ; SO:0000425:1..476 FT SO_feature three_prime_LTR ; SO:0000426:4957..5461 FT SO_feature primer_binding_site ; SO:0005850:477..489 FT /bound_moiety="tRNA-leu" FT SO_feature primer_binding_site ; SO:0005850:4939..4956 FT SO_feature CDS ; SO:0000316:540..4415 FT /name="Dmel\micropia\polyprotein" FT /db_xref="FLYBASE:FBgn0043876" FT /translation=" FT MQNRNLAELVKIMQKTPAREQQPSYDVKLPKFNPDAACVEAAKWCSTTDI FT ILTEHPLKGSKLITALSNCMEGTASQWLTQISYQGMTWQEFQELFLQRFE FT TEETPAATFLNLLNSRPTAAECYAVYASRLVTQLTTKWRNMEIEEIAVTT FT VLAHMANIDSRLQRVLFTSNVRTRSKLQAELKAFTFDKKRHARDDNLGPD FT QKNRKASPVVCHFCSKPGRRIAECRSKMRQDRRAKPQREKSNVTCYRCGQ FT PGHFSNQCPKNGTAAKQDVTQQKTVNQCCVTEPKGSLHQRGEIYPICFDS FT GAECSLIKDDISSKLSGKRINNTVMIKGIGGGSVCSTLQILSEVTINENI FT MEILFHVVPNEEMRNDILIGREILKQGFYVILTSDNFKVVKSKTVNNCSV FT TERSFTLSDIDTELVDNEKAQLIELLEKHSTSFTNGIPHTRVNTGEMKIR FT LIDPTKTVQRRPYRLSPEEREVVRMQVSELIRCNIVRPSCSPFASPMLLV FT KKKNGTDRLCVDFRELNSNTISDKYPLPLISDQIARLRGANYFTCLDMAS FT GFHQIPIHPESVEYTAFVPDGLKNAPSVFQRTVINALGDLANSFVIVYMD FT DIMVVSPTKELALERLKTVLNVLTKAGFTFNLAKCSFLKTTVQYLGYEVR FT AGEIRPNVRKIASLSSLPPPQTVSGVRQFIGLASYFRKFVSGFSQLMKPL FT YSLSSGSGKITWSAELEEIRLKVVTILTNEPALVIFDPQYPIELHTDASA FT CGYGAILLHRIESKPHVIEYFSKTTTSVESRYHSYELETLAVVKAVKHFR FT HYLIGREFVVYTDCNSLKASRTKIDLTPRVHRWWAYLQSFNFEIQYREGK FT RMAHVDFLSRNPLSPEHILSINKIPEKRVNLSEISSTWLLAEQRLDLEII FT EIVNKLESDELAENLAKTYDLRKGVLYRKVQRRGRTSYLPVVPRAFKWSV FT INQVHESIMHLGWQKTLDKVYQYYWFAKMNKYVRKFVSNCITCRSVKSSS FT GKVQAELHSIPKTSIPWHTIHIDITGKLSGKSDLKEYVIVQIDAYTKFVY FT LYHTLKIDAESCVNAMKSSISLFGVPDRIIADQGRCFTSSKFSEFCVSQK FT VELHLIATGMSRANGQVERVMETLKNLLSVVESSQRSWQDALGEVQLALN FT CTISRATDASPLEMLIGKQARPLGLVPPCETECEIDLATVRAHATENMNS FT LASYDKSRFDSSRAAVDKHHVGDYVLLRNEERHQTKLDPKFRGPFLVTEV FT LEGDRYTLKSLTSNRSFKYCHESIKMPDAEIPNELNENVEQ" XX CC Sequence assembled by Lynn Crosby (FlyBase), 'micropia.v006'. CC Any changes to original sequence record are annotated in an FT line. XX SQ Sequence 5461 BP; 1679 A; 1051 C; 1264 G; 1467 T; 0 other; TGTCGTGGCG AAAATAATGA GTATGCGTGT AGTCGCTGTT TACTTCTTCT CCATGTTCCC 60 TTTGCTATTA TGCGTGTTCC TATTTATGAA CACGTGGCGA AAATAATAAA TGCGTGTAGT 120 CGCCGTTTAC TTCTTCTCCA TGTTCCCTTT GCTATTATGC GTGTTCCTAT TTATTGTCAA 180 TGTGTGAGGA TGAATAGATG AATTATCTAT GAACGGGATT TTGCAAAAAC GACTTGCGCT 240 GCTTGGTTAG AAAGGGAAAA CTATATAATG AAAAGGGAAT GCCAAAAATT GAGAAGAGAC 300 AAAGCAGGCT GCACGAAGCT GGAGTGAGGG CATTAATCGT GGAGAAGCCA AAGCAGACGC 360 AAGTGGACTC GTTGACTGCG CACAGCTGCA TAAAATTATA TAGTAAAAAG AGATTTGAGC 420 GACGCTGATA TGGACGGACG GACGGACGCG AGGCCCCTGA TATTCTTAAC CCGACATCAG 480 AAGTGGGATC TGTGCCACAC CCTGCATTTT CTGAGGATCA GTGGCGTGCA GTAGTGGAAA 540 TGCAAAATCG GAATTTGGCT GAACTTGTAA AAATCATGCA AAAGACGCCG GCACGTGAGC 600 AGCAACCTAG TTATGATGTT AAGCTACCCA AATTTAACCC TGATGCTGCA TGCGTAGAGG 660 CAGCAAAGTG GTGTTCAACA ACCGATATAA TTCTAACTGA GCACCCCCTT AAAGGAAGTA 720 AATTGATCAC GGCACTAAGT AACTGCATGG AGGGAACTGC ATCTCAGTGG CTAACACAAA 780 TCTCGTACCA GGGTATGACT TGGCAAGAGT TCCAGGAATT ATTTCTGCAG CGCTTTGAAA 840 CCGAAGAGAC GCCGGCCGCT ACGTTTTTAA ATTTACTCAA CAGCCGCCCG ACTGCCGCCG 900 AATGTTACGC GGTGTATGCG AGTCGGCTGG TGACGCAGCT GACTACAAAG TGGCGGAATA 960 TGGAAATAGA AGAAATTGCC GTTACAACTG TTCTTGCGCA TATGGCAAAC ATTGACAGTC 1020 GTTTGCAGCG CGTCCTCTTC ACATCCAATG TGCGTACCAG AAGTAAGCTA CAGGCGGAGT 1080 TAAAAGCGTT TACGTTCGAC AAGAAGCGAC ATGCTCGAGA TGACAACCTT GGACCTGACC 1140 AGAAGAACCG TAAGGCATCG CCAGTTGTAT GCCACTTCTG TTCAAAGCCG GGACGTCGAA 1200 TTGCTGAATG CCGAAGTAAA ATGCGACAAG ATAGACGGGC GAAACCGCAG CGTGAAAAAT 1260 CAAATGTTAC GTGCTATCGG TGCGGCCAAC CGGGACATTT CTCCAACCAG TGCCCGAAAA 1320 ACGGAACTGC AGCCAAACAA GATGTGACTC AACAGAAGAC TGTTAACCAA TGTTGTGTGA 1380 CTGAGCCAAA GGGAAGCTTG CATCAACGAG GTGAGATCTA TCCAATTTGT TTCGATTCCG 1440 GTGCAGAGTG CTCCCTTATT AAAGACGACA TTAGCAGTAA GTTATCTGGT AAACGTATAA 1500 ACAATACTGT AATGATAAAA GGCATTGGTG GTGGCAGTGT GTGCAGTACA TTGCAAATCT 1560 TGAGTGAAGT CACTATAAAC GAAAATATTA TGGAAATATT ATTTCATGTA GTCCCGAACG 1620 AGGAAATGAG GAATGATATT CTGATAGGGC GAGAAATACT TAAACAAGGC TTTTATGTAA 1680 TTTTGACATC CGATAATTTT AAAGTTGTAA AATCAAAAAC TGTTAATAAT TGTTCCGTTA 1740 CTGAGCGATC GTTTACTTTG TCCGATATTG ACACCGAATT AGTCGACAAT GAGAAAGCTC 1800 AATTAATTGA GTTACTTGAA AAGCACTCGA CTTCATTTAC CAACGGGATA CCTCATACTC 1860 GAGTAAATAC AGGCGAAATG AAAATCCGTT TGATTGATCC AACTAAAACT GTTCAGCGCC 1920 GACCTTACAG ACTTAGCCCC GAAGAGAGAG AAGTAGTGCG AATGCAGGTG AGCGAATTGA 1980 TAAGATGTAA TATTGTTCGC CCAAGTTGCT CTCCCTTTGC TAGCCCCATG TTGCTCGTCA 2040 AAAAGAAGAA CGGAACCGAC CGTCTATGTG TTGATTTTAG AGAGCTAAAC TCGAACACGA 2100 TTTCGGATAA ATACCCCTTG CCGCTTATCA GCGATCAAAT TGCTAGACTT CGCGGAGCAA 2160 ATTATTTCAC ATGCCTGGAT ATGGCAAGTG GTTTCCACCA AATCCCGATT CACCCTGAAT 2220 CCGTGGAATA TACTGCATTT GTGCCCGACG GCCTCAAAAA TGCGCCATCT GTTTTCCAGC 2280 GCACAGTCAT AAATGCACTT GGTGACCTTG CTAACTCTTT TGTAATCGTT TACATGGACG 2340 ACATAATGGT AGTATCGCCA ACCAAGGAAT TGGCTTTGGA AAGGTTAAAA ACTGTTTTGA 2400 ATGTTCTTAC AAAGGCTGGT TTTACCTTTA ACCTTGCTAA ATGCAGTTTT CTCAAAACAA 2460 CGGTTCAGTA TTTAGGCTAT GAAGTGCGAG CGGGAGAAAT TCGTCCGAAT GTGCGAAAGA 2520 TAGCTTCTTT AAGCTCCTTG CCTCCTCCTC AAACTGTCTC CGGCGTTAGA CAATTCATTG 2580 GCTTGGCCTC TTACTTTCGC AAATTCGTGT CTGGATTCTC CCAACTTATG AAACCATTGT 2640 ATTCACTTTC GTCTGGTAGC GGCAAGATTA CATGGAGCGC TGAGCTGGAA GAGATCAGAC 2700 TTAAAGTTGT GACGATCCTC ACAAATGAGC CTGCTCTGGT AATCTTCGAC CCGCAATATC 2760 CTATTGAGTT GCACACTGAT GCAAGTGCCT GTGGATATGG AGCGATACTT TTGCACCGTA 2820 TAGAAAGTAA GCCCCATGTA ATCGAATACT TCAGCAAAAC AACTACCTCT GTTGAATCTA 2880 GATATCACTC CTACGAGCTG GAAACCTTGG CAGTGGTAAA AGCCGTTAAA CATTTTCGCC 2940 ATTACCTAAT TGGCCGTGAG TTCGTTGTCT ATACAGACTG CAATTCATTA AAAGCTTCTC 3000 GCACAAAAAT AGATTTAACC CCCAGAGTTC ACCGCTGGTG GGCCTACTTA CAATCGTTTA 3060 ATTTCGAAAT TCAGTATAGA GAGGGTAAGC GTATGGCTCA TGTGGATTTC CTATCAAGAA 3120 ATCCTTTATC ACCCGAACAC ATTTTGTCAA TAAACAAGAT TCCCGAAAAA CGAGTAAATC 3180 TGTCTGAAAT TTCAAGTACT TGGCTTCTTG CTGAGCAACG GTTAGACCTT GAGATAATAG 3240 AAATTGTTAA CAAATTGGAG TCAGATGAAT TAGCCGAAAA CTTGGCCAAA ACGTATGATT 3300 TGCGAAAAGG TGTATTATAT CGCAAGGTCC AAAGACGAGG TAGAACAAGT TATTTACCAG 3360 TTGTACCCAG AGCTTTCAAA TGGTCAGTAA TTAACCAGGT ACACGAGTCG ATAATGCATT 3420 TAGGGTGGCA AAAGACACTT GATAAAGTGT ACCAGTATTA TTGGTTCGCT AAAATGAACA 3480 AGTATGTTCG AAAATTTGTT TCAAACTGCA TAACTTGTAG ATCAGTGAAA TCATCTTCCG 3540 GGAAGGTTCA GGCGGAACTT CATTCCATTC CGAAGACAAG TATACCGTGG CACACCATCC 3600 ACATAGATAT AACGGGGAAA TTAAGTGGCA AGAGCGATTT GAAGGAGTAT GTCATTGTTC 3660 AGATCGATGC CTATACAAAG TTTGTTTATC TGTATCACAC CTTAAAGATA GATGCCGAAA 3720 GCTGTGTTAA TGCTATGAAA TCTTCCATAT CCTTATTTGG AGTACCAGAT CGCATTATCG 3780 CCGACCAGGG CAGATGTTTT ACTAGCTCTA AGTTTTCAGA GTTTTGCGTA TCGCAGAAAG 3840 TTGAACTTCA CTTGATTGCT ACGGGAATGA GCCGTGCAAA TGGGCAAGTG GAACGGGTGA 3900 TGGAAACACT GAAAAATTTG TTGTCAGTGG TAGAATCAAG TCAACGATCG TGGCAGGACG 3960 CACTTGGCGA AGTCCAACTT GCACTGAATT GTACAATTTC TCGTGCCACT GATGCAAGTC 4020 CGTTAGAAAT GTTAATTGGT AAACAGGCTC GACCCCTTGG ATTAGTTCCC CCATGTGAGA 4080 CCGAATGTGA AATAGATTTG GCAACTGTTA GAGCTCATGC GACAGAAAAT ATGAATTCCT 4140 TAGCGTCTTA CGACAAATCC CGATTTGATA GCAGTAGAGC AGCCGTTGAC AAACACCACG 4200 TAGGTGACTA TGTGCTATTG AGGAATGAAG AAAGACACCA AACTAAGTTA GATCCGAAAT 4260 TCAGAGGACC GTTTTTGGTA ACTGAAGTAT TAGAGGGTGA CAGGTATACA CTAAAGTCGT 4320 TGACGAGTAA CCGATCGTTC AAGTATTGCC ATGAATCAAT CAAAATGCCG GATGCAGAAA 4380 TCCCGAATGA GTTAAACGAG AATGTAGAGC AATAGCTGAA ATATAGAAAC AGTTGAATGA 4440 AAAGAAAAGC CCGCCAATGA GTTCTTTTGT GAACGAGAGA TATCCGTCTA GGTGAGACGA 4500 TGAATTGTGA GTTATCCGTC TAGGTGAGAC GATGAATTGT GAGTTATCCG TCTAGGTGAG 4560 ACGATGAATT GTCAGTTATC CGTCAGGTGA GACGATGAAT TGTGAGTTAT CCGTCCAGGA 4620 GAGACGATGA GTTTGGATTG AATTAATAAT CAAGTGTGTG TGAACTGGCG GAAGATCGAT 4680 ATATAGAAAT CGATAAATGA TAATGTTAAG ATAAGTTGTG AGCTGATGTA TTACTGATCA 4740 ATGGAACTGA ATATGAAAAT AGAATAAGTT ATCCCAGCAA CAGTGAAATA AGAGCTGTTT 4800 TGTTTCTTCA CAGAATTAAG ATTTAAGAAA TACACCTGAT AAAGTCAAAC TAATGAAATT 4860 AAATGTTATT GAATAGTGAT GAAAGTAGGT GATCTTGATA TCTTGGTATC TCGGTATCAA 4920 AAGCTTACAC GAGGACGTGA AATGTCAGAA TGGCCGTGTC GTGGCGAAAA TAATGAGTAT 4980 GCGTGTAGTC GCTGTTTACT TCTTCTCCAT GTTCCCTTTG CTATTATGCG TGTTCCTATT 5040 TATGAACACG TGGCGAAAAT AATGAATGCG CGTAGTCCGG TTTACTTCTT CTCCATGTTC 5100 CCTTTGCTAT TATGCGTGTT CCTATTTATT GTCAATGTGT GAGGATGAAT AGATGAATTA 5160 TCTATGAACG GGATTTTGCA AAAACGAGAG CGATAGAGCT GTTGCTGAAC GTGGCCACTT 5220 GCGCTGCTTG GTTAGAAAGG GAAAACTATA TAATGAAAAG GGAATGCCAA AAATTGAGAA 5280 GAGACAAAGC AGGCTGCACG AAACTGGAGT GAGGGCATTA ATCGTGGAGA AGCCAAAGCA 5340 GACGCAAGTG GACTCGTTGA CTGCGCACAG CTGCATAAAA TTATATAGTA AAAAGAGATT 5400 TGAGCGACGC TGATATGGAC GGACGGACGG ACGCGAGGCC CCTGATATTC TTAACCCGAC 5460 A 5461 // ID PPI251 standard; DNA; SYN; 2907 BP. XX AC X06779; V01520; X69493; XX DR FLYBASE; FBte0000037; Dmel\P-element. XX FT source X06779:996..3902 FT SO_feature terminal_inverted_repeat ; SO:0000481:1..31 FT SO_feature terminal_inverted_repeat ; SO:0000481:2877..2907 FT SO_feature CDS ; SO:0000316:join(153..442,501..1168,1222..1947,2138..2709) FT /name="Dmel\P\T" FT /db_xref="FLYBASE:FBgn0013311" FT /translation=" FT MKYCKFCCKAVTGVKLIHVPKCAIKRKLWEQSLGCSLGENSQICDTHFND FT SQWKAAPAKGQTFKRRRLNADAVPSKVIEPEPEKIKEGYTSGSTQTESCS FT LFNENKSLREKIRTLEYEMRRLEQQLRESQQLEESLRKIFTDTQIRILKN FT GGQRATFNSDDISTAICLHTAGPRAYNHLYKKGFPLPSRTTLYRWLSDVD FT IKRGCLDVVIDLMDSDGVDDADKLCVLAFDEMKVAAAFEYDSSADIVYEP FT SDYVQLAIVRGLKKSWKQPVFFDFNTRMDPDTLNNILRKLHRKGYLVVAI FT VSDLGTGNQKLWTELGISESKTWFSHPADDHLKIFVFSDTPHLIKLVRNH FT YVDSGLTINGKKLTKKTIQEALHLCNKSDLSILFKINENHINVRSLAKQK FT VKLATQLFSNTTASSIRRCYSLGYDIENATETADFFKLMNDWFDIFNSKL FT STSNCIECSQPYGKQLDIQNDILNRMSEIMRTGILDKPKRLPFQKGIIVN FT NASLDGLYKYLQENFSMQYILTSRLNQDIVEHFFGSMRSRGGQFDHPTPL FT QFKYRLRKYIIARNTEMLRNSGNIEEDNSESWLNLDFSSKENENKSKDDE FT PVDDEPVDEMLSNIDFTEMDELTEDAMEYIAGYVIKKLRISDKVKENLTF FT TYVDEVSHGGLIKPSEKFQEKLKELECIFLHYTNNNNFEITNNVKEKLIL FT AARNVDVDKQVKSFYFKIRIYFRIKYFNKKIEIKNQKQKLIGNSKLLKIK FT L" FT SO_feature CDS ; SO:0000316:join(153..442,501..1168,1222..1994) FT /db_xref="FLYBASE:FBgnXXXXXXX" FT /translation=" FT MKYCKFCCKAVTGVKLIHVPKCAIKRKLWEQSLGCSLGENSQICDTHFND FT SQWKAAPAKGQTFKRRRLNADAVPSKVIEPEPEKIKEGYTSGSTQTESCS FT LFNENKSLREKIRTLEYEMRRLEQQLRESQQLEESLRKIFTDTQIRILKN FT GGQRATFNSDDISTAICLHTAGPRAYNHLYKKGFPLPSRTTLYRWLSDVD FT IKRGCLDVVIDLMDSDGVDDADKLCVLAFDEMKVAAAFEYDSSADIVYEP FT SDYVQLAIVRGLKKSWKQPVFFDFNTRMDPDTLNNILRKLHRKGYLVVAI FT VSDLGTGNQKLWTELGISESKTWFSHPADDHLKIFVFSDTPHLIKLVRNH FT YVDSGLTINGKKLTKKTIQEALHLCNKSDLSILFKINENHINVRSLAKQK FT VKLATQLFSNTTASSIRRCYSLGYDIENATETADFFKLMNDWFDIFNSKL FT STSNCIECSQPYGKQLDIQNDILNRMSEIMRTGILDKPKRLPFQKGIIVN FT NASLDGLYKYLQENFSMQYILTSRLNQDIVEHFFGSMRSRGGQFDHPTPL FT QFKYRLRKYIIGMTNLKECVNKNVIP" FT SO_feature intron ; SO:0000188:443..500 FT SO_feature intron ; SO:0000188:1169..1221 FT SO_feature intron ; SO:0000188:1948..2137 XX CC Derived from X06779 (g58305) (Rel. 49, Last updated, Version 8). CC Takis Benos and Michael Ashburner, 20-Aug-1997. CC Any changes to original sequence record are annotated in an FT line. CC CDS annotation from Lynn Crosby's annotation 'P-element.v010'. XX SQ Sequence 2907 BP; 989 A; 491 C; 582 G; 845 T; 0 other; CATGATGAAA TAACATAAGG TGGTCCCGTC GAAAGCCGAA GCTTACCGAA GTATACACTT 60 AAATTCAGTG CACGTTTGCT TGTTGAGAGG AAAGGTTGTG TGCGGACGAA TTTTTTTTTG 120 AAAACATTAA CCCTTACGTG GAATAAAAAA AAATGAAATA TTGCAAATTT TGCTGCAAAG 180 CTGTGACTGG AGTAAAATTA ATTCACGTGC CGAAGTGTGC TATTAAGAGA AAATTGTGGG 240 AGCAGAGCCT TGGGTGCAGC CTTGGTGAAA ACTCCCAAAT TTGTGATACC CACTTTAATG 300 ATTCGCAGTG GAAGGCTGCA CCTGCAAAAG GTCAGACATT TAAAAGGAGG CGACTCAACG 360 CAGATGCCGT ACCTAGTAAA GTGATAGAGC CTGAACCAGA AAAGATAAAA GAAGGCTATA 420 CCAGTGGGAG TACACAAACA GAGTAAGTTT GAATAGTAAA AAAAATCATT TATGTAAACA 480 ATAACGTGAC TGTGCGTTAG GTCCTGTTCA TTGTTTAATG AAAATAAGAG CTTGAGGGAA 540 AAAATTCGTA CTTTGGAGTA CGAAATGCGT CGTTTAGAGC AGCAGCTGAG GGAGTCTCAA 600 CAGTTGGAGG AGTCTCTACG CAAAATCTTC ACGGACACGC AGATACGGAT ACTGAAGAAT 660 GGTGGACAAA GAGCTACGTT CAATTCCGAC GACATTTCTA CAGCTATTTG TCTCCACACC 720 GCAGGCCCTC GAGCGTATAA CCATCTGTAC AAAAAAGGAT TTCCTTTGCC CAGTCGTACG 780 ACTTTGTACA GATGGTTATC AGATGTGGAC ATAAAAAGAG GATGTTTGGA TGTGGTCATA 840 GACCTAATGG ACAGTGATGG AGTTGATGAC GCCGACAAGC TTTGCGTACT CGCTTTCGAC 900 GAGATGAAGG TCGCTGCTGC CTTCGAGTAT GACAGCTCTG CTGATATTGT TTACGAGCCA 960 AGCGACTATG TCCAACTGGC TATTGTTCGT GGTCTAAAAA AATCGTGGAA GCAGCCAGTT 1020 TTTTTCGATT TTAATACCCG AATGGACCCG GATACTCTTA ACAATATATT AAGGAAACTG 1080 CATAGGAAAG GATATTTAGT AGTTGCTATT GTATCCGATT TAGGTACCGG AAACCAAAAG 1140 CTATGGACAG AGCTCGGTAT ATCAGAATGT AAGTTTCGTA TATTACAAAA ATCAGATAAT 1200 CCTTGAAATT CCATTTTTTA GCAAAAACCT GGTTTAGCCA TCCTGCAGAT GACCATTTAA 1260 AGATTTTCGT TTTTTCGGAT ACGCCACATT TAATTAAGTT AGTCCGTAAC CACTATGTGG 1320 ATTCCGGATT AACAATAAAT GGGAAAAAAT TAACAAAAAA AACAATTCAG GAGGCACTTC 1380 ATCTTTGCAA CAAGTCCGAT CTGTCTATCC TCTTTAAAAT TAATGAAAAT CACATTAATG 1440 TTCGATCGCT CGCAAAACAG AAGGTTAAAT TGGCTACCCA GCTGTTTTCG AATACCACCG 1500 CTAGCTCGAT CAGACGCTGC TATTCATTGG GGTATGACAT TGAAAATGCC ACCGAAACTG 1560 CGGACTTCTT CAAATTGATG AATGATTGGT TCGACATTTT TAATTCTAAA TTGTCCACAT 1620 CCAATTGCAT TGAGTGCTCG CAACCTTATG GCAAGCAGTT GGATATACAG AATGATATTT 1680 TGAATCGAAT GTCGGAAATT ATGCGAACAG GAATTCTGGA TAAACCCAAA AGGCTCCCAT 1740 TTCAAAAAGG TATCATTGTG AATAATGCTT CGCTTGATGG CTTGTATAAA TATTTGCAAG 1800 AAAACTTCAG TATGCAATAC ATATTAACAA GCCGTCTCAA CCAAGACATT GTGGAGCATT 1860 TTTTTGGCAG CATGCGATCG AGAGGTGGAC AATTCGACCA TCCCACTCCA CTGCAGTTTA 1920 AGTATAGGTT AAGAAAATAT ATAATAGGTA TGACAAATTT AAAAGAATGC GTAAACAAAA 1980 ATGTAATTCC ATGATTTATA ATTGTTTAAT GTTTAGCTAT ATGTTTCAGG AAAGTTTCAG 2040 TTGAGAATGT AGGTAGTTAT GTGCTGTCTA TTGTGTTTTG TCTTTTATCT GTTTCTTTTC 2100 ATTTTATTAT TTAATCATTA TCCTTTTGCT TATCCAGCCA GGAATACAGA AATGTTAAGA 2160 AATTCGGGAA ATATCGAAGA GGACAACTCT GAAAGCTGGC TTAATTTAGA TTTCAGTTCT 2220 AAAGAAAACG AAAATAAAAG TAAAGATGAT GAGCCTGTCG ATGATGAGCC TGTCGATGAG 2280 ATGTTAAGCA ATATAGATTT CACCGAAATG GATGAGTTGA CGGAGGATGC GATGGAATAT 2340 ATCGCGGGCT ATGTCATTAA AAAATTGAGA ATCAGTGACA AAGTAAAAGA AAATTTGACA 2400 TTTACATACG TCGACGAGGT GTCTCACGGC GGACTTATTA AGCCGTCCGA AAAATTTCAA 2460 GAGAAGTTAA AAGAGCTAGA ATGTATTTTT TTGCATTATA CAAATAATAA TAATTTTGAA 2520 ATTACAAATA ATGTAAAGGA AAAATTAATA TTAGCAGCGC GAAACGTCGA TGTTGATAAA 2580 CAAGTAAAAT CTTTTTATTT TAAAATTAGA ATATATTTTA GAATTAAGTA CTTCAACAAA 2640 AAAATTGAAA TTAAAAATCA AAAACAAAAG TTAATTGGAA ACTCCAAATT ATTAAAAATA 2700 AAACTTTAAA AATAATTTCG TCTAATTAAT ATTATGAGTT AATTCAAACC CCACGGACAT 2760 GCTAAGGGTT AATCAACAAT CATATCGCTG TCTCACTCAG ACTCAATACG ACACTCAGAA 2820 TACTATTCCT TTCACTCGCA CTTATTGCAA GCATACGTTA AGTGGATGTC TCTTGCCGAC 2880 GGGACCACCT TATGTTATTT CATCATG 2907 // ID DMPOGOR11 standard; DNA; INV; 2121 BP. XX AC X59837; S90749; XX DR FLYBASE; FBte0000568; Dmel\pogo. XX FT source X59837:1..2121 FT SO_feature terminal_inverted_repeat ; SO:0000481:1..21 FT SO_feature terminal_inverted_repeat ; SO:0000481:2101..2121 FT SO_feature intron ; SO:0000188:1438..1541 XX CC Derived from X59837 (g8354) (Rel. 45, Last updated, Version 10). CC Takis Benos and Michael Ashburner, 20-Aug-1997. CC Any changes to original sequence record are annotated in an FT line. CC K. O'Hare, Personal communication to FlyBase, 1 May 2000. CC This is probably complete element. XX SQ Sequence 2121 BP; 724 A; 353 C; 399 G; 645 T; 0 other; CAGTATAATT CGCTTAGCTG CATCGATAGT TAGCTGCATC GGCAAGATAT CTGCATTATT 60 TTTCCATTTT TTTGTGTGAA TAGAAAATTT GTACGAAAAT TCATACGTTT GCTGCATCGC 120 AGATAACAGC CTTTTTAACT TAAGTGCATC ATATCAGCTG TTTTTTTTGC CAATTTCAAT 180 GAATATCATC AAAGTTAGCT GCGCCATCTA TGAATCATTT TTGCATATCT AAAAGATGCA 240 AGAATGCCAA CTCGTTTCAG TATCTGCGCA TGTCCGTTTT TGTTTTTGCT TTGATCGTGA 300 TTTTTGTGTT TTTGTTTCTT ATGGCACAAA GTTATTAAAA TGGGTAAAAC AAAGCGTGTC 360 GTTGGACTAA CACTAAAGGA AAAGCTTCAA ATAATCGAGT TAGTGACCAA CAAAGTGGAC 420 AAAAAGGAAA TTTGTGCCAA GTTCAAATGC GACAGATCCA CAGTCAACCG CATTTTACAA 480 AAAACAAATG AAATTCATGA AGCTGTGGCC GCGTCAGGTT TAAAAAGAAA GCGTCAAAGA 540 AAAGGAGCGC ACGACTTAGT AGAAGAAGCC TTATACATTT GGTTCGGACA GCAGGAATCA 600 AAGAACGTAA TTCTTGACCG GCACGTCATA TTAGCAAAAG CGAAAGAATT TTGCCAAAAA 660 TTTAACGACG CCTTTGAACC TGACGCCAGC TGGCTTTGGC GCTGGCGCAA GCGCCACAAT 720 ATAAAGTATG GCAAAATACA CGGCGAAACT GCTACAAATG ATTCCGTATC AGCAAATGAG 780 TACAAAAATG ATATTTTGCC AGGATTGCTT AAAGGTTATA ACCCAGAAGA CATTTTTAAC 840 GCTGACGAAA CTGCACTCTT TTATAAAGCA ATGCCGAATG CGACATTTTT TACTTGTGGA 900 AAGCAATTAA ATGGCCAGAA ATCTCAGAGA GTGAGACTTA CTTTGCTGTT TATATGCAAT 960 GCAACTGGGA CATACAAAAA AACTTTTGTA ATCGGCAGAT CTAAATCGCC ACGATGCTTC 1020 AAGAATGCTA ATGTGCCCAT TCCGTACTAT GCAAATAAGA AGGCCTGGAT GACTAAGGAT 1080 CTCTGGCGAA AAATAATGAC AGGATTTGAC GAAGAAATGA AAAAGCAAAA TCGAAAGATT 1140 TTACTCTTCA TCGACAATGC AACTAGTCAC ACGACTGTCA AGGACTTCGA AAACATAAAA 1200 TTGTGCTTCA TGCCACCAAA CGCAACGGCT CTACTTCAAC CTCTGGACCA AGGTATTATC 1260 CACTCATTCA AATTAGAGTA TAGGCGTATT TTGGTCAAAC AGCAGCTCAT TGCTGTTAAT 1320 TGTGGTAAAT CTACTGTGGA ATTTTTAAAA TCATTATCGT TATTGGATGC TCTATATTTT 1380 GTCAACCAAG GATGGAAGAA TGTTAAAATG TTAACTATTC AGAATTGTTT TAAAAAGGTA 1440 AGATGGGATT ATTATTGATA TGTATCTCAA ATAACGAATT TATTATTTTC AGGCTGGATT 1500 TAAGTTCAGT TTTGAAAATG AAGACACCAT TGCTGAAAAA GACAAACAAT GCGTAGAAGT 1560 TGACATTGTA TCGAATATTA ATTGGAATGA ATATGCCAAT GTTGATGCAG ATGAGGCTTG 1620 CCATGGTCAA TTAGATGATG ATGAAATCGT GCGCTCTTTA GTTCAAGATG CAAAAACCAG 1680 CGATAACGAA GAAAGCCATA GTGATGAAGA TGTGGACGAT ACTGAGCGTC CTACTTTTAA 1740 GGATGGGTTT GCAGCAATTA AGGCTTTAAA GTCCATTTTT ATGCGAAACA ATAATGATGA 1800 GTTTTTGCAA AACTTGAATT CTATGGAAGA CAAGCTGTTT AATTTACATA TAAACTCAGC 1860 TGTATTGCAA AAAAAAATTA CTGACTATTT TTAAGTTAGT TTTAAAAAGT GTTTTAATCA 1920 ATTCACCATC ACTTAAATTT ATATGTCGAT CTTACTTATC ATTAAGAATG AAATTATCAG 1980 TTCCTTTTAT GTTTAACATT GTTATAAAGA AATAAATTCT TTATTTTTCC TTAAAAAAAA 2040 AAATTAAGTT AGCTGCATTT TTAAGTTACC TGCATCGAGG CATTGTGCAA AGTACTCGAG 2100 GCAGCTAAGC GAATTATACT G 2121 // ID DMRER1DM standard; DNA; INV; 5356 BP. XX AC X51968; XX DR FLYBASE; FBte0000118; Dmel\R1A1-element. XX FT source X51968:1..5356 FT SO_feature CDS ; SO:0000316:319..1731 FT /name="Dmel\R1A1-element\ORF1" FT /db_xref="FLYBASE:FBgn0044825" FT /db_xref="SWISS-PROT:P16424" FT /db_xref="NCBI_PROTEIN:CAA36226.1" FT /translation="PVSASIRLLDSSKGGATIGATPMESDSSVSALSGSSASKVSRRGR FT RRSHLASKSSAPTQAKLVALASNGVPEPVGVLEEAFSSLEDARAATSNAANDAAPPAAA FT PAVDHTVAPDVSTAAKIAATTATAATAAARAGQAAMMAELSATQRMVRNSFRSLGGVDT FT EELSCAISRYDELVMALMLRCGELETRLAMPPPPPPPSKANTTAANAPQMPQVAPIAAP FT RTTKVRETWSAVVKCDDPALSGKAIAEKVRTMVAPSLGVRVHEVRELPSRWWCDHSYSS FT VGELQKVMASKRFAELGLNVARNAAEKPKVIVYDVDTAIGPEEFMQELHENNFDSEMTL FT AQFKKSVHLVTKAWSATDGATVNVTLEVDDRAMAKLDVGRVYIKWFSFRCRSQVRTYAC FT HRCVGFDHKVSECRQKESVCRQCGQQGHTAAKCQNPVDCRNCRHRGQPSGHYMLSNACP FT IYGALLARVQARH" FT SO_feature CDS ; SO:0000316:1728..4790 FT /name="Dmel\R1A1-element\ORF2" FT /db_xref="FLYBASE:FBgn0044824" FT /db_xref="SWISS-PROT:P16425" FT /db_xref="NCBI_PROTEIN:CAA36227.1" FT /translation="TLMFSFIQANCGRGRAATIELGVRLRRSESMFALVQEPYLGGDEM FT DVLPEGMRVFTDRRGKAAILVDHQEAICMPVETLTTDYGVCLVVKGSFGSIFLCAAYCQ FT FDAPLEPYLRYMDAVLLQASRTPAILGLDANAVSPMWLSKLSRHAEGQANYRRGELLSE FT WMLEARVAALNQSTEVYTFDNHRATSDIDVTIVNEAASMWATYEWRVDEWELSDHNIIT FT VVAEPTTARSVESIAPVPSWNFSNARWRLFKEEMVSRIAELPENFSESPLDQQVSTLRS FT IVHSVCDTALGRKLTRSPSRRARWWTADLCAARREVRRLRRLLQDGRRRDDDAAVELVV FT VELRRASAYYKKLIGRAKMDDWKRFVGDHADDPWGRVYKICRGRRKCTEIGCLRVNGEL FT ITDWGDCARVLLRNFFPVAESEAPTAIAEEVPPALEVFEVDTCVARLKSRRSPGLDGIN FT GTICKAVWRAIPEHLASLFSRCIRLGYFPAEWKCPRVVSLLKGPDKDKCEPSSYRGICL FT LPVFGKVLEAIMVNRVREVLPEGCRWQFGFRQGRCVEDAWRHVKSSVGASAAQYVLGTF FT VDFKGAFDNVEWSAALSRLADLGCREMGLWQSFFSGRRAVIRSSSGTVEVPVTRGCPQG FT SISGPFIWDILMDVLLQRLQPYCQLSAYADDLLLLVEGNSRAVLEEKGAQLMSIVETWG FT AEVGDCLSTSKTVIMLLKGALRRAPTVRFAGRNLPYVRSCRYLGITVSEGMKFLTHIAS FT LRQRMTGVVGALARVLRADWGFSPRARRTIYDGLMAPCVLFGAPVWYDTAEQVAAQRRL FT ASCQRLILLGCLSVCRTVSTVALQVLGGAPPLDLAAKLLAIKYKLKRGFPLEENDWLYG FT EDIACLSWEQRKTRLEECLIQSWQNRWDDDSEPGRVTHRFIPYVTLAYRDPSFGFSMRT FT SFLLTGHGSFNAFLHGRALSDTTACACGDPYEDWMHILCACPLYADLRDLDGLGVQRLG FT ENWIFEGILDDQEKTQRLAMFAEEVFLRRRAL" XX CC Derived from X51968 (g8429) (Rel. 23, Last updated, Version 1). CC Takis Benos and Michael Ashburner, 20-Aug-1997. CC Any changes to original sequence record are annotated in an FT line. XX SQ Sequence 5356 BP; 1213 A; 1340 C; 1634 G; 1169 T; 0 other; CGGACGTGTT TTCGTTGCGC TCGTGGACAT AGTGCGAAGA ACTTTGTTTT CCGTATTTGG 60 AAGTATACGG AATAAATAAT TTAGTGTTCC GTGGAAGTGG TGCGCAAATT TTCGCGAATT 120 AAAAACAAGC GGTTTGGAAG TAATTGACAA TAAATTATTG GAAATTTTCC ACTCCGCACG 180 TGTTGAGCGG CGGAGCTTGC GGGTGAGCTT TTCGAACAGC TGAGAGAAGC TTATTGGTGG 240 TAGTCACCGC TAAGGATTGT GTCTTGGGAC AGCTTAGTGC ACTCTACCAA TAGGTGGAGC 300 TATCACCATA GCAACTAGCC CGTGTCAGCG AGCATACGAT TGCTGGACTC GTCAAAAGGA 360 GGAGCCACCA TCGGAGCAAC GCCGATGGAG AGCGACAGCA GTGTGAGTGC CTTGAGCGGA 420 AGCAGTGCCT CAAAGGTGTC AAGACGAGGC AGGCGTAGGA GCCATCTGGC CTCCAAGAGC 480 TCGGCGCCAA CGCAGGCGAA ACTGGTTGCC CTGGCCTCGA ATGGAGTGCC GGAACCCGTT 540 GGTGTGCTGG AGGAGGCGTT TTCGTCGCTG GAGGATGCCC GGGCGGCTAC GTCAAACGCT 600 GCCAACGATG CTGCCCCCCC CGCTGCTGCC CCCGCTGTTG ATCACACTGT TGCCCCTGAT 660 GTTTCCACTG CTGCTAAAAT CGCTGCCACC ACTGCCACCG CTGCCACCGC TGCCGCCCGT 720 GCTGGGCAAG CAGCCATGAT GGCAGAGCTG TCGGCCACCC AGCGCATGGT GCGAAACAGT 780 TTCCGCAGCC TAGGAGGCGT AGACACGGAA GAGCTCTCGT GTGCCATCAG CCGCTATGAT 840 GAGCTGGTGA TGGCATTAAT GCTCCGGTGT GGAGAACTGG AGACGCGGCT CGCTATGCCA 900 CCACCGCCGC CGCCGCCGTC CAAGGCGAAC ACTACTGCCG CCAATGCTCC CCAGATGCCT 960 CAGGTTGCAC CCATCGCTGC CCCGCGGACA ACCAAGGTTC GTGAGACGTG GTCAGCGGTG 1020 GTGAAGTGCG ACGACCCTGC GCTATCGGGG AAAGCCATAG CCGAAAAGGT GCGGACGATG 1080 GTTGCACCCT CCCTCGGAGT CAGAGTACAC GAGGTACGTG AGCTGCCGTC GAGGTGGTGG 1140 TGCGATCATT CGTACTCTTC GGTTGGAGAG CTGCAGAAGG TGATGGCATC GAAAAGATTC 1200 GCAGAACTTG GACTGAATGT GGCACGGAAC GCGGCCGAGA AGCCGAAGGT CATAGTCTAT 1260 GACGTCGACA CAGCCATCGG CCCAGAAGAG TTCATGCAGG AGCTTCACGA GAACAACTTC 1320 GACAGTGAAA TGACTCTGGC CCAGTTCAAA AAGTCGGTGC ACCTGGTGAC CAAGGCGTGG 1380 TCGGCTACTG ACGGTGCCAC CGTAAACGTG ACGCTAGAGG TAGACGACCG GGCGATGGCG 1440 AAACTTGATG TAGGACGTGT CTACATTAAG TGGTTTTCGT TCCGATGCCG ATCGCAAGTC 1500 CGCACCTATG CCTGCCACAG ATGTGTGGGT TTCGACCACA AGGTTAGTGA ATGCAGGCAG 1560 AAGGAGAGTG TTTGCCGCCA GTGCGGGCAA CAAGGCCACA CCGCGGCAAA GTGCCAAAAC 1620 CCGGTGGACT GCCGGAACTG CCGTCACAGA GGGCAACCTT CGGGGCATTA TATGCTCTCG 1680 AATGCTTGCC CGATATACGG AGCGTTGTTA GCGAGGGTGC AAGCTAGACA CTAATGTTTA 1740 GCTTCATCCA AGCGAACTGT GGCCGAGGCA GAGCTGCGAC CATCGAGCTC GGAGTCCGAC 1800 TCAGGAGATC GGAGTCAATG TTTGCTCTGG TGCAGGAGCC GTATCTTGGC GGGGATGAAA 1860 TGGATGTGCT GCCTGAAGGA ATGAGGGTTT TCACCGACCG GCGAGGGAAG GCAGCCATCC 1920 TAGTGGATCA TCAGGAAGCC ATCTGCATGC CAGTGGAAAC TCTCACCACA GATTATGGCG 1980 TATGTCTGGT CGTTAAAGGG AGTTTTGGCT CAATCTTCCT TTGCGCCGCA TACTGCCAGT 2040 TCGATGCACC TCTGGAACCG TACCTCCGGT ACATGGATGC GGTCCTGCTG CAGGCCAGCA 2100 GAACCCCCGC AATCCTGGGC CTCGACGCGA ATGCAGTGTC CCCCATGTGG CTTAGCAAAC 2160 TCTCTCGTCA TGCCGAGGGG CAAGCTAACT ACAGACGGGG TGAGCTGCTG TCTGAGTGGA 2220 TGCTGGAGGC AAGAGTCGCC GCCCTAAACC AGTCAACAGA GGTGTACACG TTCGATAATC 2280 ACAGAGCGAC TAGTGATATC GACGTGACAA TCGTCAATGA AGCAGCATCT ATGTGGGCCA 2340 CATATGAGTG GAGAGTGGAC GAGTGGGAAT TGAGTGACCA CAACATCATT ACTGTTGTGG 2400 CCGAACCAAC TACCGCGCGC TCAGTTGAGA GCATAGCTCC TGTGCCGTCC TGGAACTTCT 2460 CCAATGCACG TTGGCGATTG TTCAAGGAGG AAATGGTGAG TAGAATAGCC GAACTTCCGG 2520 AAAACTTTTC AGAGTCGCCG TTGGACCAGC AAGTTTCGAC CCTGCGCAGT ATAGTACATA 2580 GTGTATGTGA TACTGCGCTA GGAAGGAAGT TGACTCGATC GCCCAGCAGG AGAGCACGTT 2640 GGTGGACTGC CGACCTCTGC GCTGCAAGGC GCGAAGTCCG AAGACTTCGT CGCCTGCTCC 2700 AAGATGGAAG GCGTCGAGAT GACGATGCCG CTGTAGAGCT TGTAGTGGTC GAGCTGAGGC 2760 GTGCCTCAGC CTACTACAAG AAGCTCATTG GAAGGGCGAA GATGGATGAC TGGAAACGCT 2820 TCGTGGGAGA TCATGCCGAC GACCCATGGG GGCGCGTCTA CAAGATTTGC CGAGGTCGCA 2880 GGAAGTGCAC GGAGATTGGG TGCCTCCGCG TGAATGGCGA GCTGATCACT GATTGGGGTG 2940 ACTGCGCACG AGTGCTCCTC CGCAATTTTT TCCCAGTTGC GGAGTCCGAA GCACCGACTG 3000 CCATCGCGGA GGAAGTCCCA CCGGCCCTCG AAGTATTCGA GGTTGATACA TGTGTTGCCC 3060 GGCTGAAGAG CAGGCGCTCT CCCGGGTTGG ACGGCATCAA TGGCACTATC TGCAAGGCAG 3120 TCTGGCGCGC CATACCCGAG CACCTAGCAT CATTGTTTTC CCGATGCATC CGATTGGGAT 3180 ACTTTCCAGC CGAGTGGAAG TGCCCACGAG TTGTCTCGTT GCTCAAAGGG CCAGATAAGG 3240 ACAAGTGTGA GCCCTCCTCA TACAGAGGAA TATGCTTGCT ACCAGTCTTT GGAAAGGTGC 3300 TCGAGGCCAT CATGGTGAAT CGTGTGAGAG AAGTTCTTCC GGAAGGCTGC AGATGGCAAT 3360 TCGGATTTCG CCAAGGACGA TGTGTGGAGG ATGCTTGGAG GCACGTGAAG AGCAGTGTTG 3420 GCGCCAGCGC GGCGCAATAC GTGCTCGGCA CATTCGTGGA CTTCAAAGGA GCATTCGACA 3480 ACGTCGAATG GAGTGCTGCA CTCAGCCGAC TAGCCGACTT GGGATGCCGG GAAATGGGCT 3540 TGTGGCAGAG CTTTTTCTCC GGCCGAAGAG CAGTGATCCG AAGCAGTTCC GGTACTGTGG 3600 AGGTACCGGT AACTAGAGGC TGCCCGCAGG GATCAATCAG CGGCCCATTT ATCTGGGACA 3660 TACTGATGGA TGTACTGCTT CAGCGTCTCC AGCCGTATTG CCAGCTGAGT GCATACGCGG 3720 ATGACTTGCT GCTTCTCGTC GAGGGAAATT CCCGAGCTGT GCTAGAGGAA AAAGGAGCGC 3780 AACTAATGTC CATCGTAGAA ACGTGGGGAG CGGAAGTTGG CGATTGCCTC TCGACCAGCA 3840 AGACGGTAAT CATGCTGCTG AAAGGTGCCT TGAGACGTGC GCCTACGGTG AGGTTTGCTG 3900 GACGGAACCT TCCGTATGTG CGTAGCTGTC GGTACCTTGG CATCACGGTC AGTGAAGGAA 3960 TGAAATTCCT CACGCACATA GCTTCGCTTC GCCAGCGGAT GACAGGAGTC GTTGGAGCAT 4020 TGGCGCGTGT GCTTCGAGCC GACTGGGGCT TCAGTCCTCG AGCCAGGCGG ACCATATATG 4080 ACGGACTCAT GGCACCTTGT GTGCTGTTTG GTGCCCCGGT ATGGTATGAC ACCGCGGAAC 4140 AAGTAGCTGC CCAGAGGCGA CTAGCCTCCT GCCAGAGGCT AATCCTGCTT GGATGCCTTT 4200 CGGTATGCCG AACAGTATCC ACAGTGGCAC TGCAGGTACT TGGTGGAGCT CCCCCGCTTG 4260 ATCTGGCTGC TAAGTTATTA GCGATCAAAT ACAAGCTAAA ACGTGGATTC CCGCTGGAGG 4320 AGAACGACTG GCTTTACGGC GAGGACATTG CGTGTCTTAG CTGGGAGCAG AGGAAGACTC 4380 GCCTAGAGGA GTGTTTAATC CAGAGTTGGC AGAACAGATG GGACGATGAC AGCGAACCAG 4440 GACGGGTGAC GCATAGGTTT ATCCCATACG TCACTCTTGC CTATCGGGAT CCAAGTTTTG 4500 GATTCTCGAT GAGGACGTCT TTCCTGCTTA CAGGGCACGG GTCGTTCAAT GCATTTTTGC 4560 ACGGGAGAGC CCTCAGCGAT ACCACTGCTT GCGCATGTGG AGATCCATAT GAGGACTGGA 4620 TGCATATCTT GTGCGCTTGC CCCCTATATG CAGATCTGCG GGACCTAGAT GGACTTGGAG 4680 TGCAGCGCCT TGGCGAAAAC TGGATCTTCG AGGGAATCCT GGATGATCAA GAGAAGACTC 4740 AACGGCTGGC AATGTTTGCG GAAGAAGTGT TCCTGAGGAG GAGGGCCCTT TAGCTCAACA 4800 TCTCTGCCGT GTGGTTAGCG GGCGAGAATA CTACCACAGT CCGCTGTTGC TTGTCGTAAG 4860 AGACGACTAA TACAGCGATA GGATTCCTCT AACCCTGCTT GTCGGAGCAA AAGGGGGAGG 4920 CCCACCGAGC CTCTTTTCGG TACCACGGGT TGAGCAGCTA TCCAAGACTG CTCATTGAGG 4980 TAGGCCCCCT GGTGGGAGTA TCGTGGTGGC TGTGGTTGGT ACCCATATCG CGGGTAGAGC 5040 CTTCATGCTC GACGTTTGAG TTACGGTGCT AGTTGCGCAA AACTCGGGTG CTGTGACCCA 5100 GAGATCAGTA GAGATTTTAG GTAGATCTCG CTCCTCAGCA AGGGGGAGTG CTTGCCCGGC 5160 AAGCAAGTAC TCGAATTGCT ACCGGGGTGG TCGCTATGTA CATAGCTATA GCTTCTAGTC 5220 CGGGACGCTT GTCTGGCGTA TCCAGACACA TGCACCATAT GCTCACTTGT GGGCGTATAG 5280 GGTGCCGTGG TTGTAATCCC TTCAGTGTGG AACACGCCAC GTAAAATAAG TTCGGAGGGA 5340 TCCGAAAAGC ATACAT 5356 // ID DMRER2DM standard; DNA; INV; 3607 BP. XX AC X51967; XX DR FLYBASE; FBte0000030; Dmel\R2-element. XX FT source X51967:1..3607 FT SO_feature CDS ; SO:0000316:181..3351 FT /name="Dmel\R2-element\ORF" FT /db_xref="FLYBASE:FBgn0016699" FT /db_xref="SWISS-PROT:P16423" FT /db_xref="NCBI_PROTEIN:CAA36225.1" FT /translation="FERKNFSDGLVPQRKFIHIGTTSTNNEPRIPLHNLMTTRPSVDIF FT PEDQYEPNAAATLSRVPCTVCGRSFNSKRGLGVHMRSRHPDELDEERRRVDIKARWSDE FT EKWMMARKEVELTANGCKHINKQLAVYFANRSVEAIKKLRQRGDYKEKIEQIRGQSALA FT PEVANLTIRRRPSRSEQDHQVTTSETTPITPFEQSNREILRTLRGYSPVECHSKWRAQE FT LQTIIDRAHLEGKETTLQCLSLYLLGIFPAQGVRHTLTRPPRRPRNRRESRRQQYAVVQ FT RNWDKHKGRCIKSLLNGTDESVMPSQEIMVPYWREVMTQPSPSSCSGEVIQMDHSLERV FT WSAITEQDLRASRVSLSSSPGPDGITPKSAREVPSGIMLRIMNLILWCGNLPHSIRLAR FT TVFIPKTVTAKRPQDFRPISVPSVLVRQLNAILATRLNSSINWDPRQRGFLPTDGCADN FT ATIVDLVLRHSHKHFRSCYIANLDVSKAFDSLSHASIYDTLRAYGAPKGFVDYVQNTYE FT GGGTSLNGDGWSSEEFVPARGVKQGDPLSPILFNLVMDRLLRTLPSEIGAKVGNAITNA FT AAFADDLVLFAETRMGLQVLLDKTLDFLSIVGLKLNADKCFTVGIKGQPKQKCTVLEAQ FT SFYVGSSEIPSLKRTDEWKYLGINFTATGRVRCNPAEDIGPKLQRLTKAPLKPQQRLFA FT LRTVLIPQLYHKLALGSVAIGVLRKTDKLIRYYVRRWLNLPLDVPIAFVHAPPKSGGLG FT IPSLRWVAPMLRLRRLSNIKWPHLTQNEVASSFLEAEKQRARDRLLAEQNELLSRPAIE FT KYWANKLYLSVDGSGLREGGHYGPQHGWVSQPTRLLTGKEYMDGIRLRINALPTKSRTT FT RGRHELERQCRAGCDAPETTNHIMQKCYRSHGRRVARHNCVVNRIKRGLEERGCVVIVE FT PSLQCESGLNKPDLVALRQNHIDVIDTQIVTDGHSMDDAHQRKINRYDRPDIRTELRRR FT FEAAGDIEFHSATLNWRGIWSGQSVKRLIAKGLLSKYDSHIISVQVMRGSLGCFKQFMY FT LSGFSRDWT" XX CC Derived from X51967 (g8432) (Rel. 24, Last updated, Version 1). CC Takis Benos and Michael Ashburner, 20-Aug-1997. CC Any changes to original sequence record are annotated in an FT line. XX SQ Sequence 3607 BP; 1064 A; 818 C; 900 G; 825 T; 0 other; TTGGGGATCA TGGGGTATTT GAGAGCAGAG GGGGAGTATT CTTCTGTAAT TCGTAAGTCA 60 TATCATATGA TGTGCGGAAG GGGAATTTTA CTCTGTAACT CACAAGTCTC TCCTTTACTC 120 AAGTCGACTC AAAACCTCCT CGTGGTGGTC CCGGTAATGC TAAACTCGTT TAGCAGCTAA 180 TTTGAGCGGA AAAACTTTTC CGATGGGCTG GTTCCCCAGA GGAAATTTAT TCATATTGGA 240 ACTACAAGCA CAAATAACGA GCCTCGGATA CCTTTACACA ATCTGATGAC GACCCGACCC 300 TCCGTGGATA TCTTCCCGGA GGACCAATAT GAACCAAACG CAGCGGCTAC TCTATCTAGG 360 GTTCCCTGCA CAGTATGTGG CCGGTCCTTT AACAGCAAGA GAGGACTCGG TGTTCACATG 420 CGATCTCGGC ACCCAGACGA ACTTGATGAA GAACGTCGAC GTGTCGATAT AAAGGCAAGA 480 TGGAGTGATG AAGAGAAGTG GATGATGGCG AGAAAGGAGG TTGAGCTCAC AGCAAATGGA 540 TGTAAACACA TAAACAAGCA ACTAGCGGTG TATTTTGCAA ACCGCAGCGT CGAAGCCATC 600 AAAAAGCTAA GACAGAGGGG CGATTATAAG GAGAAAATAG AGCAGATAAG AGGGCAATCA 660 GCTCTCGCCC CGGAAGTTGC TAATCTAACC ATAAGGCGCC GCCCTAGTAG AAGTGAGCAA 720 GACCACCAAG TAACAACATC GGAAACAACT CCAATCACTC CCTTCGAACA GTCGAACAGG 780 GAAATTTTGC GGACACTACG CGGGTATAGC CCCGTAGAAT GCCATTCCAA ATGGAGAGCC 840 CAAGAGTTGC AAACTATCAT TGATAGGGCA CATCTCGAGG GAAAGGAAAC CACTCTCCAA 900 TGCTTATCGC TATATCTCCT GGGAATTTTT CCGGCACAGG GTGTACGACA CACACTGACG 960 AGACCTCCTC GGAGACCTCG GAACAGGAGA GAAAGCAGAA GGCAGCAGTA CGCTGTCGTC 1020 CAGCGTAACT GGGATAAGCA TAAAGGAAGA TGCATCAAGT CCTTGCTAAA TGGAACTGAT 1080 GAGTCGGTAA TGCCAAGCCA AGAAATAATG GTTCCCTACT GGAGAGAAGT AATGACTCAG 1140 CCTAGCCCAA GCTCTTGCAG TGGAGAAGTG ATACAAATGG ATCACTCGCT TGAGAGGGTA 1200 TGGTCTGCTA TTACAGAGCA GGACCTTCGG GCGTCAAGAG TCTCATTATC CTCGTCTCCG 1260 GGGCCTGACG GGATAACTCC AAAATCTGCC AGGGAGGTGC CGTCAGGTAT TATGCTGCGC 1320 ATAATGAACC TAATTCTATG GTGCGGTAAT CTACCACACT CCATACGACT GGCCAGAACC 1380 GTCTTCATCC CGAAGACGGT GACGGCGAAG CGACCGCAAG ACTTTCGTCC AATATCAGTG 1440 CCTTCAGTCC TGGTAAGACA GCTAAATGCA ATATTGGCAA CCCGGTTGAA CTCATCAATC 1500 AATTGGGACC CGCGCCAGCG GGGCTTCTTA CCAACCGACG GATGCGCCGA TAATGCGACG 1560 ATAGTCGACT TAGTCTTGAG GCATAGCCAT AAGCACTTTA GATCTTGCTA CATCGCAAAT 1620 TTAGATGTAA GCAAGGCATT TGATTCTCTA TCACATGCAT CTATATACGA CACCTTACGT 1680 GCTTATGGTG CGCCAAAGGG CTTCGTTGAC TACGTACAGA ACACGTACGA GGGCGGTGGT 1740 ACCAGTCTCA ATGGGGACGG TTGGAGTTCA GAGGAATTCG TCCCTGCTAG AGGAGTGAAG 1800 CAGGGTGACC CTTTGTCTCC TATTCTATTT AACTTGGTAA TGGACAGGTT ACTTAGAACC 1860 TTACCCAGCG AAATTGGTGC CAAAGTCGGA AATGCCATTA CTAACGCGGC CGCGTTTGCA 1920 GATGATTTGG TACTATTTGC GGAAACTCGG ATGGGGCTTC AAGTATTGTT GGACAAGACG 1980 TTGGATTTTC TATCTATCGT CGGCCTCAAA CTTAATGCCG ACAAATGTTT TACCGTTGGC 2040 ATTAAGGGCC AGCCGAAACA GAAGTGTACC GTGTTAGAGG CACAGAGCTT CTACGTAGGC 2100 TCGAGTGAGA TTCCATCACT GAAGCGCACG GACGAGTGGA AGTACTTAGG CATCAACTTC 2160 ACTGCAACCG GGAGGGTTCG ATGCAATCCG GCCGAGGACA TTGGTCCAAA GCTACAAAGA 2220 TTGACAAAGG CCCCCCTCAA ACCACAACAG AGGTTGTTCG CCCTTCGGAC TGTCCTTATC 2280 CCACAGCTCT ACCACAAGTT AGCCCTTGGG AGTGTGGCGA TAGGCGTCCT AAGAAAAACT 2340 GATAAACTTA TAAGATATTA TGTGCGAAGA TGGCTAAATC TTCCGCTGGA TGTGCCGATA 2400 GCATTTGTTC ATGCACCCCC AAAAAGTGGA GGTCTCGGAA TTCCATCACT AAGATGGGTA 2460 GCTCCAATGT TAAGGCTAAG ACGCTTGAGT AACATTAAAT GGCCTCACCT CACGCAAAAC 2520 GAGGTAGCCA GCTCTTTCCT CGAAGCCGAA AAACAACGGG CCCGAGATAG ATTATTAGCT 2580 GAACAAAATG AACTGTTATC GCGTCCGGCA ATAGAAAAAT ATTGGGCGAA CAAGTTGTAC 2640 CTCTCAGTTG ATGGTAGCGG ACTCCGTGAA GGCGGCCATT ATGGCCCGCA ACACGGGTGG 2700 GTTAGTCAAC CCACGCGTTT ATTAACAGGA AAGGAATATA TGGACGGTAT TCGTCTGCGG 2760 ATAAATGCCC TACCCACAAA GTCTCGTACT ACAAGGGGAA GGCACGAATT GGAACGACAG 2820 TGTCGTGCAG GATGTGATGC TCCCGAAACA ACAAACCACA TAATGCAAAA ATGCTACCGC 2880 TCGCATGGGA GGCGGGTAGC TAGACACAAC TGCGTAGTAA ATCGAATCAA GCGGGGACTT 2940 GAGGAGAGAG GCTGCGTGGT CATTGTTGAA CCAAGTCTGC AGTGCGAATC CGGCCTTAAT 3000 AAACCAGACC TGGTGGCACT ACGACAAAAT CACATTGATG TGATCGACAC ACAAATTGTG 3060 ACAGACGGAC ACTCTATGGA TGATGCGCAC CAGCGCAAAA TCAATAGATA CGACAGACCG 3120 GACATACGAA CTGAATTGCG TCGCAGATTC GAAGCCGCAG GTGACATTGA ATTCCATTCT 3180 GCCACCCTGA ACTGGAGGGG GATCTGGAGT GGTCAATCCG TTAAAAGATT GATAGCAAAG 3240 GGTCTCCTCA GCAAATATGA TAGTCATATC ATTAGCGTCC AGGTTATGAG AGGCAGTCTC 3300 GGTTGTTTTA AACAGTTCAT GTACCTGAGC GGGTTTTCCC GAGATTGGAC TTAGCTAAAT 3360 CGTTTGGTTC AAAACATTTG CTTGCTGTCT TGGCATAACA TCAATAAAGG CATAAACATC 3420 GCAAAATAAT GGTTATAATT AAATGGCTAT GAGGATGGTT TTAGTACGTA GGCGTTGCGG 3480 AACTTCGGTT CATATAGAGC AATGAATCGT GCATGCTAGG AAAACTGACC ACACACAGTG 3540 TTGGCAGACC TAGTATCTTT CGAAGATTTC CATACCTCCG CGATCAAAAA AAAAAAAAAA 3600 AAAAAAA 3607 // ID DM33463 standard; DNA; INV; 1736 BP. XX AC U33463; XX DR FLYBASE; FBte0001005; Dmel\S-element. XX FT source U33463:37..1772 FT SO_feature terminal_inverted_repeat ; SO:0000481:1..234 FT SO_feature terminal_inverted_repeat ; SO:0000481:1503..1736 FT SO_feature CDS ; SO:0000316:404..1441 FT SO_feature start_codon ; SO:0000318:1..3 FT /name="Dmel\S-element\T" FT /db_xref="FLYBASE:FBgn0044019" FT /db_xref="REMTREMBL:AAC47095" FT /db_xref="NCBI_PROTEIN:AAC47095.1" FT /translation="MPGKRLAFEVTQLIYYNHQLGKSIPELVEIFSVSRKTVYNILNRX FT XKEGRLEPKSGGGCKTKINKRVDRLIMRKAIANPRISVRSLAQDIREECHLTVSHETVR FT QVILRHRYSSRVARKKPLLSEINIEKRHSFAVSMMDHAEEYWDDVIFCDETKMMLFYND FT GPSRVWRKPLSALETQNIIPTIKFGKLSVMIWGCISSHGVGKLAFIESTMNAVQYLDIL FT KTNLKASAEKFGLFSNNKPNFKFYQDNDPKHKEYNVRNWLLYNCGKVIDTPPQSPDLNP FT IENLWAYLKKKVAKRGPKTRQQLMAAIIEEWEKIPLEYDLKKLIHSMKKRLQLVAKANG FT GHTKY" XX CC Derived from U33463 (g1006788) (Rel. 47, Last updated, Version 5). CC Takis Benos and Michael Ashburner, 20-Aug-1997. CC Any changes to original sequence record are annotated in an FT line. XX SQ Sequence 1736 BP; 600 A; 287 C; 300 G; 545 T; 4 other; CAGTTTGTCA AGAAACTGTT TACACACCGC AAAATAAGTA GAATTTTTGA CTTTAAAGGC 60 CAAAATTAAG GGTTTTTTGC TTAATTAAAC GCAATTTTTT TATGAAATAT AATTAAACAA 120 TATTTATTTT ACTTATAAAT TAAAAAACAA ATTCAATATA TCAAATATAC AAGAAAATAA 180 ACAACAAATT TCTTGTTTAC ACACTTTTGA GAGTGCCAAG AAACTCTTTA CACAGTTTTG 240 GGTTCCTACT TTGTTTTGCT CTTTTTCTTA GAAACAATCT CATTTTTCCG TTATTTTTGT 300 CTTATGCATT CCTTTTTACA ACGCTTCTAT TGCAATTTTT TCACTTTGCT TGTGAAATTT 360 TGTTGATCTA ACGTGCTTAA AGCGAATTAT TAAATTTAAT GAAATGCCTG GAAAGAGATT 420 GGCTTTTGAA GTGACCCAGC TAATATACTA TAACCACCAG TTGGGAAAAT CTATTCCTGA 480 ATTAGTAGAA ATATTTTCCG TATCCCGTAA AACCGTCTAT AATATTTTAA ATCGTNNNNA 540 AAAAGAGGGC AGGCTTGAAC CTAAGAGTGG TGGTGGGTGT AAAACGAAAA TTAACAAGCG 600 AGTAGACCGC CTTATTATGC GAAAAGCGAT TGCGAACCCC CGAATCTCGG TCAGATCACT 660 TGCTCAGGAT ATCAGGGAAG AATGTCACCT AACTGTATCA CACGAAACTG TGCGCCAAGT 720 CATCCTACGC CATAGGTACT CTTCAAGAGT TGCAAGAAAA AAGCCTTTGC TATCAGAGAT 780 CAATATTGAA AAGCGTCATT CATTCGCTGT GAGCATGATG GATCATGCGG AAGAGTACTG 840 GGATGACGTC ATATTTTGTG ACGAAACAAA AATGATGCTC TTTTATAACG ATGGGCCAAG 900 CAGAGTATGG CGCAAACCGT TGAGTGCGCT AGAAACACAA AATATAATTC CAACAATCAA 960 ATTTGGAAAA TTGTCAGTGA TGATTTGGGG CTGTATTTCC AGCCATGGAG TGGGCAAACT 1020 AGCCTTTATT GAAAGCACTA TGAATGCCGT GCAATATCTA GATATTTTAA AAACAAATTT 1080 GAAGGCCAGT GCAGAAAAAT TTGGTTTGTT TAGCAACAAC AAGCCAAATT TTAAGTTTTA 1140 TCAGGACAAT GATCCCAAAC ATAAAGAGTA CAATGTACGC AACTGGCTAC TCTATAACTG 1200 TGGCAAGGTG ATCGATACGC CCCCTCAGAG TCCTGATCTA AACCCCATTG AAAATTTGTG 1260 GGCCTACTTA AAGAAGAAGG TTGCAAAAAG GGGCCCCAAA ACTCGACAAC AACTCATGGC 1320 TGCGATAATC GAAGAGTGGG AAAAGATCCC GCTTGAATAT GACCTAAAAA AACTCATACA 1380 TTCCATGAAA AAAAGGCTTC AACTTGTAGC CAAAGCCAAT GGGGGTCATA CTAAATACTA 1440 AAACTTTTCA AATATTATCA AAATAATTAA AAAATTTAGG ATTAAACTTA GGTTTAGTGT 1500 TTTGTGTAAA GAGTTTCTTG ACACTCTCAA AAGTGTGTAA ACTTGAAATT TGTTGTTTAT 1560 TTTCTTGTAT ATTTGATATA TTGAATTTGT TTTTTAATTT ATAAGTAAAA TAAATATTGT 1620 TTAATTATAT TTCATAAAAA AATTGCGTTT AATTAAGCGA AAAACCCTTA ATTTTGACCT 1680 TTAAAGTCAA AAATTCTACT TATTTTACGG TGTGTAAACA GTTTCTTGAC AAACTG 1736 // ID SPRINGER standard; DNA; INV; 7546 BP. XX AC AF364549; XX DR FLYBASE; FBte0000333; Dmel\springer. XX FT source AF364549:1..7546 FT SO_feature five_prime_LTR ; SO:0000425:1..403 FT SO_feature three_prime_LTR ; SO:0000426:7143..7546 FT SO_feature CDS ; SO:0000316:1058..2422 FT SO_feature start_codon ; SO:0000318:1..3 FT /name="Dmel\springer\gag" FT /db_xref="FLYBASE:FBgn0044343" FT /db_xref="SPTREMBL:Q967T6" FT /db_xref="NCBI_PROTEIN:AAK52057.1" FT /translation="MSESFRQYRNSKKCASDSESESDDSTENSVRKNTPTNAFTAYKMS FT LETEQIKALIRALQEQALESQRREADLRKTIQDLAGQVAAIQIAPARAEAPPIKVYRPV FT EITGLVPCGETLDAVKCLPDFMGTQETYVSWRQAANAAYHMFRKYEDSSRHYQAVVIIR FT SKVKGPADAVLSSFGTILNFDAIISRLDFTYSDKRPIHVIEQELGTLRQGSLTLLQYYD FT EVEKKLTLLTNKATMSYEASAATVLCEKFRDDALRVFVSGLRRNLTDVLFAAKPKDMPS FT ALALAQEVESNHERYTFATSFARSQEDRDHKQYPKVQERQRAPPQAGSQGSAGKNPHFT FT KQHRAQVHSAPRSDRMARENMPEPMDVDPSLSRMQPSHAPAYPKSKPAASGRSVPPKRQ FT RVNHVAQASDDLDKVYNTAASSAAVKVDDDSILEYDSDTINFLGESPCYPSSDEE" FT SO_feature CDS ; SO:0000316:2434..5475 FT SO_feature start_codon ; SO:0000318:1..3 FT /name="Dmel\springer\pol" FT /db_xref="FLYBASE:FBgn0044342" FT /db_xref="SPTREMBL:Q967T5" FT /db_xref="NCBI_PROTEIN:AAK52055.1" FT /translation="MKLLIDTGAAKNFIRPFKGLKGVRPVQSPFTIHSIHGVTTITKKC FT FVSIFNLKATFFLLPDLTSFDAIVGLDLLKQAGASLCLASGKLKWGSGAEQIDFHTCPD FT VNFTKVDCSDAPPLIKDAFLKMLGNRKKAFADPNEALPYNTSVVATIRTVDEEPIYAKL FT YPYPMGAADFVNGEIQELLKNGIIQKSKSPYNNPIWVVDKKGTDDAGNKKMRLVLDFRK FT LNERTVPDRYPMPNISMILGNLGKAKYFTTLDLKSGYHQITLAERDREKTAFAVNGGKY FT EFRRLPFGLRNAASIFQRTIDDILREQIGKFCYVYVDDVIIFSEDENDHVKHVDWVLKS FT LYDANMRISAEKSRFFKKSVSFLGFIVTNNGAATDPEKVKAIKEFPEPKNVFEVRSFLG FT LASYYRCFIKDFASIARPISDILKGENGSVSRHRSRSIQVEFSEAQQRAFEKLRNILAS FT EDVILRYPDYKKAFDLTTDASAYGIGAVLSQEGRPITMISRTLSDREVNYATNERELLA FT IVWALAKLRHYLYAVKEINIFTDHQPLTFAVSESNPNAKIKRWKARIDESGARIFYKPG FT RNNLVADALSRQQLNVVEEQEPESCAATIHSELSLTHTIESTDKPVNCFQNQIILEEAR FT SHWKRTFILFGNKRRHSINFSCKQALLEELANIIIPNGVNAFHCDLHTLALIQDDVVRQ FT FPATKFWHCKNRVTDIFAMQERKEILTVEHNRAHRSAQENVKQVLSEYYFPKMTKLASE FT IAANCKTCAKAKYDRHPKKQELGETPVPTHVGEILHIDIFSTDKKYFLTCVDKFSKFAM FT VQPILSRTIEDLKAPLLQLMNVFPKAKTIYCDNEPSLKSQTIVAMLENHFGVSISNAPP FT LHSVSNGQVERFHSTLIELARCLKIDKGISDTVELVLLATARYNMSIHSVINKKPAEVM FT RADPDDPHTDVQEKIKNAQILTRKRENASRQNRVFQVGDKVLVKSNRRLGNKLTPLCEE FT KTIEADLGTTVLIKGRVVHKDNLK" FT SO_feature CDS ; SO:0000316:5870..7147 FT SO_feature start_codon ; SO:0000318:1..3 FT /name="Dmel\springer\env" FT /db_xref="FLYBASE:FBgn0044344" FT /db_xref="SPTREMBL:Q967T4" FT /db_xref="NCBI_PROTEIN:AAK52056.1" FT /translation="MLDMFPQSHMKKLLSVDIAHLRDMLDSLSIHHRVARSLDFLGTAL FT KVVAGTPDAEDFEKVKFTEARLVDAHNSQIEINTKTQVRINELTDTINKLLKISKSAQI FT DTGHLYETLSTRNRIIVMELQNLMLTITLAKINVVSPNFLDHADLESIWGEEPTNTPIR FT EILSVASVKVLQSLNILHFIIKFPKIIMACNKVTILPVVHHDTVLRLKDNVVAECNREI FT RTVKNCSITPGATFCQLSSVSSCAQELHAGVVAHCDAQQSDLHPITYVDEGIIVINDRP FT ALVRVDNGTAIHIRGTHLITFIESAMVNETVFFNHDMVQNRAPGVANSPVLNISMKHEV FT LSLPYLHRLSEKNLEQIRNFEKDVDGYRLSQIALVAGAIFCALICIGLTWQRTTRAKKS FT TAQLKEVLAQIGSAEGGLNLEEGIVN" XX CC Derived from BACR06P08 by Sue Celniker, 29 March 2001. CC Michael Ashburner, 9-Apr-2001. CC Any changes to original sequence record are annotated in an FT line. XX SQ Sequence 7546 BP; 2131 A; 1909 C; 1712 G; 1794 T; 0 other; AGTTAACTAA GTTAACCGGA CTGATCGTCC GCACACCAGC ACCGGTCAAA CTGCTGACCA 60 AGCATTTGGC CGGAAGCTCA TGCATAGCCG GCAGAAGCTC TGCGCATTGG CAGAGGCCGC 120 TATGATGTTT TTCCCTTTGT TAGCTTATAG TCAGTTTGAT TTTGTATTCA ATAAAGAGCG 180 CATCGCGCCT TCAATCAACT CCAGCTACTG CTGTTATCAT TGAATTGGTT GGCTAGCCTT 240 AAGGGCAGTC AACAACGGAG AGACGTTCTC CCACCATATC TCCCAATCTA GGAGAAGAGG 300 TCTGCGGCAA CCGCCCTGCC TCCCAGTGAC AGAAGAACCC CCCGTTACCT GCAACCTACG 360 CCGGAGACCG CGGCGAGGGA CCTGCACCTT ATATTTAATT AATTGGCACC CAACTCCAGG 420 AACCCACACC ACTACCCTGA ATCATGTAAG TGGGATTCTC AACTTAAACA CTACTCCAAA 480 CTGCGTCTAG AATTTTAAAA TATTTGGGAT GTTTGTGCGA GTTACATAAA TAAATTAAGA 540 AAATCGGCAT TTCCACTACA ATAAACGTTT ATATGTGTTG CGAATTAAGA TTATGTTACT 600 GTTATGAAGT TTAAATATCG AATTTTGATT TGTGGTTGAC TTTGCAATCC ATATTGTGTG 660 CATTTCATTC CGCCTTCGCA CATCCGCGGG ACACTGTCGT TTCATTCGAA ATTTAATTCG 720 CTACATTGGC TTCACAGCCC TTTCAAGCTT TGTTGTTTTT GACCCACTCC ACTTCGCTAC 780 CCGATACTGG CGCATGCATT GCTGTGACAA TTTTGTGCCT TTTATTTATC TCTTTGTCTT 840 TGCTGTGGCA ATTTTTGTCT TTGGATATTT GTTTGCCTTA TTGGAGACCC GCTCCCCGCA 900 GGCCCTTCAC CTTATCGTTA CTTAGCTGGA CAGTGGCTCT GCTCGTTGAG TCTTCGTCCA 960 ATGCCTTCAA AGCGGCGACT CAGCCCCCGC GACCCCCTTG CCGTACTGTT TGGCCCCACG 1020 GGCACAACGG CCTGAGTATT CACATACATA GCTACCCATG AGCGAGTCAT TCCGACAATA 1080 TAGGAATTCT AAAAAGTGCG CTAGCGACTC AGAGTCCGAA AGCGACGATT CGACAGAAAA 1140 CTCTGTACGT AAAAACACCC CAACTAACGC ATTCACTGCA TATAAAATGT CCCTCGAAAC 1200 GGAACAAATT AAAGCTCTCA TAAGGGCATT ACAAGAGCAA GCCTTAGAGA GTCAACGCAG 1260 GGAGGCTGAC TTGCGTAAAA CAATTCAAGA TCTGGCCGGC CAGGTCGCGG CCATACAGAT 1320 TGCCCCTGCC CGGGCAGAAG CTCCCCCAAT CAAAGTTTAC AGACCAGTAG AAATCACCGG 1380 ACTGGTCCCT TGTGGGGAAA CATTGGATGC CGTTAAATGT CTTCCAGACT TTATGGGGAC 1440 ACAGGAGACA TACGTCTCCT GGCGGCAAGC GGCAAATGCC GCTTACCATA TGTTCAGGAA 1500 ATATGAGGAT AGTTCGCGGC ACTATCAAGC TGTGGTCATC ATCAGGAGCA AAGTTAAAGG 1560 CCCTGCTGAT GCAGTTCTGT CGTCCTTTGG GACTATACTG AATTTCGATG CGATCATAAG 1620 TCGCCTCGAT TTCACGTATA GTGACAAACG CCCGATACAC GTTATCGAGC AGGAGCTAGG 1680 CACCCTCAGA CAGGGAAGCC TGACGCTCCT CCAGTATTAT GATGAGGTCG AGAAAAAACT 1740 CACCTTACTC ACCAATAAGG CGACTATGTC TTATGAAGCG TCGGCAGCAA CGGTGCTGTG 1800 TGAGAAGTTC CGAGATGATG CTTTGAGAGT TTTTGTCTCG GGGCTCAGGC GCAACCTCAC 1860 AGACGTGCTA TTCGCGGCAA AGCCTAAGGA CATGCCGTCA GCGCTCGCCC TGGCGCAAGA 1920 AGTAGAGTCC AATCATGAGC GGTACACTTT TGCAACTTCA TTTGCACGAA GCCAAGAGGA 1980 TAGGGACCAC AAGCAATATC CCAAAGTGCA GGAGCGCCAA CGGGCCCCCC CACAAGCCGG 2040 CTCGCAGGGA AGTGCTGGGA AGAACCCGCA CTTTACTAAG CAGCATAGAG CACAGGTGCA 2100 CTCCGCTCCA CGTAGCGACC GAATGGCCCG AGAAAACATG CCAGAACCCA TGGACGTTGA 2160 CCCGTCGTTG TCCAGGATGC AGCCATCTCA CGCCCCGGCT TACCCGAAAT CGAAGCCGGC 2220 CGCGTCTGGC CGTTCGGTCC CACCAAAAAG GCAAAGGGTC AACCATGTTG CCCAGGCCTC 2280 TGATGATTTG GACAAGGTTT ATAACACCGC AGCCTCCAGT GCAGCAGTTA AAGTCGACGA 2340 CGATTCCATC CTAGAGTACG ACTCGGATAC CATTAATTTT TTAGGGGAAA GTCCCTGCTA 2400 CCCGTCATCA GACGAAGAGT AGCGGGGATC GACATGAAAC TACTGATTGA TACGGGCGCG 2460 GCAAAAAATT TTATCCGACC ATTTAAGGGG TTGAAAGGCG TCCGCCCGGT GCAGTCCCCA 2520 TTTACAATCC ATTCGATTCA TGGTGTGACT ACAATAACTA AGAAATGTTT CGTGTCCATT 2580 TTTAATCTTA AAGCTACCTT TTTTTTATTA CCAGACTTGA CCTCCTTTGA CGCGATCGTT 2640 GGCCTAGACC TGTTAAAACA GGCCGGCGCG TCACTTTGCC TAGCTTCCGG CAAGCTCAAA 2700 TGGGGCTCCG GAGCAGAGCA AATTGACTTT CATACTTGCC CCGATGTCAA TTTCACCAAA 2760 GTAGATTGCT CGGACGCACC GCCCTTAATT AAGGATGCTT TTTTAAAAAT GCTCGGGAAT 2820 AGGAAAAAAG CTTTTGCTGA TCCTAATGAG GCTCTTCCTT ACAATACGTC GGTGGTAGCC 2880 ACCATCCGGA CGGTTGATGA GGAGCCCATT TATGCCAAGT TATACCCATA TCCCATGGGA 2940 GCAGCTGACT TCGTCAACGG CGAAATTCAG GAACTGCTTA AAAATGGCAT AATCCAAAAG 3000 TCAAAGTCCC CCTACAATAA CCCAATATGG GTCGTAGACA AAAAGGGCAC TGACGATGCG 3060 GGCAATAAAA AAATGCGCTT GGTGCTGGAC TTTCGAAAAC TTAACGAAAG GACGGTACCA 3120 GACAGATACC CCATGCCAAA TATCTCTATG ATATTGGGGA ATCTCGGCAA GGCCAAATAC 3180 TTCACGACCC TCGATCTGAA GTCTGGCTAC CACCAAATCA CGCTCGCAGA ACGCGACCGT 3240 GAAAAGACAG CGTTCGCAGT AAACGGAGGG AAGTATGAGT TCCGAAGGCT GCCATTCGGA 3300 CTCAGGAATG CTGCAAGCAT CTTCCAAAGA ACAATTGACG ATATTCTGCG AGAGCAGATC 3360 GGAAAGTTCT GCTACGTTTA CGTCGATGAC GTCATCATCT TTTCGGAAGA TGAAAACGAC 3420 CATGTCAAGC ATGTAGATTG GGTTCTGAAG AGCCTGTACG ACGCTAACAT GAGAATATCG 3480 GCAGAAAAGT CACGTTTTTT TAAGAAAAGC GTGAGCTTCC TGGGGTTCAT CGTCACCAAC 3540 AATGGGGCGG CGACTGACCC AGAAAAGGTT AAGGCCATAA AGGAATTTCC GGAACCCAAA 3600 AACGTATTTG AGGTAAGGTC ATTCTTGGGC TTAGCCAGCT ATTATCGTTG CTTTATCAAA 3660 GACTTCGCAT CAATAGCTAG GCCCATTTCA GACATATTGA AGGGCGAGAA CGGTAGTGTT 3720 AGCCGACACA GGTCCAGGAG TATCCAGGTA GAATTTTCCG AAGCGCAACA ACGTGCCTTC 3780 GAAAAGCTAC GCAATATCCT GGCGTCTGAG GACGTCATCC TGAGATACCC TGATTACAAA 3840 AAAGCGTTTG ATCTAACGAC AGACGCTTCG GCCTACGGCA TTGGCGCAGT GCTGTCCCAG 3900 GAGGGACGTC CCATTACAAT GATCTCAAGG ACATTGTCTG ACAGAGAGGT TAACTATGCT 3960 ACCAACGAAA GGGAGCTGTT AGCCATAGTC TGGGCACTGG CTAAGTTGCG GCACTACCTG 4020 TATGCGGTTA AAGAGATAAA CATCTTTACC GATCACCAAC CTCTGACGTT CGCGGTATCG 4080 GAGTCCAATC CGAACGCCAA AATTAAGAGA TGGAAAGCAC GCATCGACGA GTCCGGCGCA 4140 CGAATTTTTT ACAAGCCTGG GAGAAACAAC CTCGTTGCAG ATGCCCTCTC GAGACAACAA 4200 CTCAACGTTG TTGAAGAGCA AGAACCGGAG TCGTGCGCGG CCACGATTCA CAGCGAACTT 4260 TCGCTTACGC ACACGATCGA GTCCACGGAC AAACCCGTGA ATTGCTTCCA GAACCAGATA 4320 ATTTTGGAAG AGGCGCGCTC CCATTGGAAA CGCACTTTTA TATTATTTGG GAATAAGAGG 4380 CGGCACTCGA TCAATTTCTC GTGCAAACAA GCTTTGCTGG AGGAACTCGC CAACATCATT 4440 ATCCCTAATG GTGTAAACGC CTTCCACTGT GATCTTCACA CGCTGGCGCT AATCCAGGAC 4500 GACGTAGTTC GACAGTTTCC AGCCACGAAA TTCTGGCATT GTAAGAATAG GGTCACCGAC 4560 ATCTTCGCGA TGCAGGAGAG AAAAGAAATC CTCACCGTCG AGCACAACAG AGCTCACAGG 4620 TCGGCCCAAG AAAACGTGAA ACAAGTACTC TCCGAGTACT ACTTCCCGAA AATGACCAAA 4680 TTGGCGAGCG AAATAGCAGC CAATTGCAAA ACTTGCGCAA AGGCGAAGTA TGACAGACAT 4740 CCGAAGAAGC AGGAGCTCGG TGAGACACCA GTCCCGACCC ACGTAGGAGA AATATTGCAC 4800 ATCGATATTT TCTCAACGGA TAAAAAATAC TTTCTCACCT GTGTTGACAA GTTTTCTAAA 4860 TTCGCCATGG TACAGCCGAT TCTGTCTAGA ACCATAGAAG ATTTGAAAGC ACCCCTTTTA 4920 CAACTTATGA ATGTTTTCCC CAAAGCCAAA ACCATCTACT GCGACAATGA ACCATCATTG 4980 AAATCGCAGA CAATAGTGGC TATGCTGGAA AACCATTTTG GCGTCAGCAT TTCGAATGCA 5040 CCGCCCCTAC ATAGCGTCTC AAACGGACAG GTGGAACGAT TCCACAGCAC GTTAATTGAG 5100 CTCGCCAGAT GCCTAAAAAT CGACAAAGGC ATAAGTGACA CAGTGGAATT GGTCTTGCTG 5160 GCCACAGCCA GATATAACAT GTCCATCCAC TCCGTCATCA ATAAAAAACC GGCCGAAGTC 5220 ATGCGGGCAG ATCCGGACGA TCCACATACC GATGTCCAAG AAAAAATCAA AAACGCCCAG 5280 ATTTTGACAA GAAAACGAGA GAACGCTTCT CGGCAGAACA GAGTGTTCCA GGTCGGCGAC 5340 AAAGTCCTAG TAAAGTCAAA CAGACGATTA GGCAACAAAC TTACTCCTTT ATGTGAGGAG 5400 AAGACCATCG AGGCAGACTT GGGGACCACA GTCCTTATTA AAGGGAGGGT GGTCCATAAA 5460 GACAACCTCA AGTGACCCAA GCAGAGCCTA GCCGCGGCTC CCTCGGAGGC ACACTTTTAT 5520 TCCTCCAATT TGTAGCCACT CGGCATAAGT TTTTTCATTG TTTTTATAGC CGCTTGGCAT 5580 AAGTTTTTTA TTTTTTAGCC ACTTGGCATA TTTTTTATAT ATTTTCGCTA TTATTGGTGG 5640 TGGGCAACTC CATTCCGAAC AAGTAATAAT TTATCACACA CGTTACAGGT CGCTCCCAAC 5700 CCTTCTTCTT TGTTTCCTGG CCACGACATC GGCCCACATT ACTGACTATT CCCGAGCGAA 5760 TTACATTCCC GTCATTGACG GTAAAGTCTT AGTCTGGGAG GAATTCGCCT ATGTCAGACA 5820 CTCGGCTAAC CTCTCCGAGT ATAGGCGGGT AATTGACGAA ACCGACAGCA TGCTCGATAT 5880 GTTCCCCCAG TCCCATATGA AGAAGCTCCT GAGCGTTGAT ATCGCTCACC TCCGTGACAT 5940 GCTTGATTCT TTGAGCATCC ATCACAGAGT GGCAAGGAGC CTAGACTTCT TGGGAACTGC 6000 GTTAAAGGTT GTCGCAGGGA CACCTGACGC GGAAGACTTC GAGAAAGTCA AGTTCACTGA 6060 AGCGCGGCTT GTTGATGCAC ACAATAGCCA AATCGAAATA AACACCAAAA CACAAGTTCG 6120 AATTAACGAA CTCACTGATA CCATAAATAA ACTTTTAAAA ATTTCCAAAA GCGCTCAGAT 6180 TGATACAGGT CACCTGTATG AAACGCTTTC TACTCGCAAC AGAATCATTG TAATGGAATT 6240 GCAAAACTTA ATGCTCACTA TAACCCTCGC TAAAATTAAC GTAGTGAGTC CAAACTTCTT 6300 GGACCACGCA GATCTGGAGA GTATTTGGGG CGAGGAGCCC ACCAACACCC CCATAAGGGA 6360 GATTTTGTCC GTTGCGTCTG TAAAAGTCCT ACAATCCCTT AACATCTTAC ACTTTATTAT 6420 TAAATTCCCC AAGATTATCA TGGCGTGCAA CAAAGTCACT ATCCTTCCAG TGGTACACCA 6480 CGATACGGTG TTAAGGTTGA AAGATAATGT GGTAGCAGAG TGCAACAGAG AAATACGCAC 6540 AGTAAAGAAT TGCTCCATAA CACCAGGGGC AACATTTTGC CAGTTATCTT CAGTGAGCTC 6600 GTGTGCGCAG GAGCTCCACG CTGGGGTCGT AGCACATTGC GACGCACAGC AGAGTGATCT 6660 ACATCCGATC ACCTACGTCG ACGAAGGAAT AATCGTCATC AATGACAGAC CAGCACTCGT 6720 GCGTGTGGAC AATGGAACGG CCATCCACAT TAGAGGCACG CACCTCATAA CATTCATTGA 6780 GAGTGCCATG GTCAACGAGA CCGTCTTCTT TAATCATGAC ATGGTCCAGA ATAGGGCGCC 6840 GGGAGTGGCT AATTCCCCAG TCCTTAATAT CTCGATGAAA CACGAGGTCC TGAGCCTCCC 6900 ATACCTTCAC CGTTTAAGTG AAAAGAACTT GGAGCAAATC AGGAACTTCG AGAAGGACGT 6960 CGACGGATAC CGACTAAGTC AGATAGCGTT AGTTGCGGGA GCAATTTTCT GCGCTCTTAT 7020 CTGCATCGGT TTAACCTGGC AGCGAACCAC TAGGGCCAAG AAATCTACAG CCCAACTGAA 7080 GGAAGTTCTC GCCCAAATAG GGTCAGCCGA GGGCGGCCTT AATCTTGAGG AGGGAATAGT 7140 TAACTAAGTT AACCGGACTG ATCGTCCGCA CACCAGCACC GGTCAAACTG CTGACCAAGC 7200 ATTTGGCCGG AAGCTCATGC ATAGCCGGCA GAAGCTCTGC GCATTGGCAG AGGCCGCTAT 7260 GATGTTTTTC CCTTTGTTAG CTTATAGTCA GTTTGATTTT GTATTCAATA AAGAGCGCAT 7320 CGCGCCTTCA ATCAACTCCA GCTACTGCTG TTATCATTGA ATTGGTTGGC TAGCCTTAAG 7380 GGCAGTCAAC AACGGAGAGA CGTTCTCCCA CCATATCTCC CAATCTAGGA GAAGAGGTCT 7440 GCGGCAACCG CCCTGCCTCC CAGTGACAGA AGAACCCCCC GTTACCTGCA ACCTACGCCG 7500 GAGACCGCGG CGAGGGACCT GCACCTTATA TTTAATTAAT TTAACT 7546 // ID TARTC standard; DNA; INV; 11124 BP. XX AC AY600955; XX DR FLYBASE; FBte0001208; Dmel\TART-C. XX FT source AY600955:1..11124 FT SO_feature non_LTR_retrotransposon ; SO:0000189 CC telomeric retrotransposon FT SO_feature direct_repeat ; SO:0000314:1..331 FT SO_feature direct_repeat ; SO:0000314:10383..10713 FT SO_feature five_prime_UTR ; SO:0000204:1..205 FT SO_feature three_prime_UTR ; SO:0000205:6629..11102 FT SO_feature non_LTR_retrotransposon_polymeric_tract ; SO:0000433:11103..11124 CC derived from polyA tail of RNA transposition intermediate FT SO_feature CDS ; SO:0000316:206..3349 FT SO_feature start_codon ; SO:0000318:1..3 FT /name="Dmel\TART-element\gag" FT /db_xref="FLYBASE:FBgn0014071" FT /db_xref="NCBI_PROTEIN:AAT12844.1" FT /db_xref="SPTREMBL:Q6J4U8" FT /translation="MDGHNGDINEGWATVLSISSDDSNQLSSPPSIIVSSLDTTPTSN FT ETTIVRRSLHNPKADMKSYRFENIVLNENKNTILPDPLFVDKCGNTANTTEANEKKPA FT NSPFPISIIKNLSTSSPLTHVDTPTQEDDASAFNTLKAAKTARIIFPTHTQIKPAKPS FT PPSKELSTNSAPKTLSYTDKITVTQKNLPDKTHVDRPTQDDDINATKASKTAKIISTQ FT LHLRETKPTQPAKDPSPRTQKPIANKAAETLTHTDKLIASQNLVPAKTHINSPTQYND FT TNATNALKTAKINFSSHSHQSEIKPTQSAKNISPLTQKQFTSESAGTHTHTDKHKNTA FT SQNLFSAKTHINSPTQHNDTSAATASKTAKLILSPHSHLSETKPTQPALSPSPLSQKQ FT ITSIAAKTLTHTNKHTASQNFIPAKTHINIPTQYNDTNATKALKTAKAASPSHTYSRQ FT TKPIKPAINALHAAQDTNPSPAISAVTYTDKPTATQNIFPVKTFAELIRENAKRSPTP FT IENPPQAKHDSAALGRPPTAARKNLNKTLISPKTPGKRRGDCLDEGLLQTSNKKVRIR FT DDFSDDDLGVTNLLSETPLFKSKAAIKIRQDSRRESLQKSAEMDTAPAISPSNAAADP FT DLPPWKTVPASRKPPSIFLSNIQQIIPLIEKLNYKAGVNSFTTKSELGNNIRIQAKTM FT DAYNAIQNVLLEANIPLHSHQPKSAKGFQIVIRHLHQSTPTKWIESQLQDIGIATKFI FT RAMQFRDTRNPMRIHEVEVVPKADGSHLKVLLIKSLGGQTVKVERKRVSKDPTQCHRC FT QCFGHTKNYCRNPFKCMKCGQLHASVSCTKPKNLPATCANCNGSHVSSYKGCPVFQEA FT KQRLSINKIQSLHSQPTHLQTPRNKHPYPKPTHIQTPLNKQPYTHPLPRTLVNNTKLP FT AKRIQGKKISQRNLSINKRLNRIRTLDRKPRNETSPPTTSKKVLASLEESRKNPNSAL FT NPANTHLTHFRPPPLAQNIPNDESKELSGEQYLLNRIEGMEKKLNNLLEIVTRLLSQG FT KDCPKSPKNPFRDPIFV" FT SO_feature CDS ; SO:0000316:3350..6628 FT SO_feature start_codon ; SO:0000318:1..3 FT /name="Dmel\TART-element\pol" FT /db_xref="FLYBASE:FBgn0014072" FT /db_xref="NCBI_PROTEIN:AAT12845.1" FT /db_xref="SPTREMBL:Q6J4U7" FT /translation="MLFLVTSEVTFPMTRECNRDILKIAFWNAGGINNKIDELKLFIL FT NIDAHIIIVTETRLDNNSTKLELPGYFTYLAQNPASSKRGGVATIVNSSLRHMALEPI FT EKECIQSAPIVLLPENNRRSEMIVIASVYCPPSLSWSPHHFTDVLNFAEKTMGGQTKL FT ILCGDWNAKHRQWGCIRACQRGAALYDAIQADSMAEIVATGSATHFPHDTRKSPSAID FT FSICKRLGRYEKRISSSAHLSSDHLPILLEINLDIKTISLQKQNNNILKKTTNIELFK FT NVLERKILLNTEIRVAEDINDAINIFIKNIKDSAAESTPSPRIPDNHRRRYGQANRNS FT HTLTLDENTSRLLEEKRIQSRIFKATRTNEDKTKLKAAENRLKKVIKILREKRINEQI FT EGIDTNNPDRMRKIWRLLSEGKKMNQPNFPLKLETKKGPKWTKTIKETTEAFVSHLEG FT RFKPNKIVPDYHIDKVNTGLRIIKESMLTERHNLNKNPHNQPITLNELNEEIKNLKNS FT KAPGKDLITNQLIKTLPTKATLYLILIYNSILRLGYYPEAWKHAQVKMILKPGKSSNE FT PKSYRPISLLSGLSKMFERLLLKRLFRVDLFKKAIPLHQFGFRKEHGTEQQIARVTQF FT ILEAFERKEYCSAVFLDISEAFDRVWHEGLLLKLAKILPYNLYIILESYLTNRTFEVK FT DQAGETSRTGQIGAGVPQGSNLGPLLYSIFSSDMPLPYIYRPSPTQRIMLSTYADDTI FT VLSSDTLATAATRNNENYLKTFSDWADKWGISVNAAKTGHVIFTLKNDLPTNSMNVKI FT KGQTIKKESKQSYLGVTLDSKLTLSSHVTKLLGKYSTAYRKLTWILNGRSKLPTKTKI FT LILKSVLSPIWQYAIAAWGPLVTDAQIRRVQVEENRKIRDICRAGRYTRNQTIRDLFG FT VKTVEEFYQQAMHRFSETIKSHPNIAVRRILSRHYIPNRLERSRQRYFKMTNDHITQK FT QTGLALSPKLLKIPDIDDCRTVKKRSEREKIRQMHLTELPTLLRLEEEEEELKRIKKQ FT EEREKRERENQKWPPDRWCELEINRYNKQYRKGDLTRQEVIEKFRGQPLNVQRIILPD FT YEGD" XX CC A PNTR (Perfect Non-Terminal Repeat) is a perfect direct repeat partially CC overlapping the UTRs (annotated as "direct_repeat ; SO:0000314"). CC Distinguishing characteristics of PNTR’s are that the 3’ repeat terminates CC upstream of the 3’ end of the element and that the 5’ PNTR extends a short CC distance into ORF-1. The 5’ ends of TART-C elements are variable and the CC minimal size for functionality has not been determined. Thus, this CC canonical sequence, AY600955, may be 5’ truncated within the 5’ PNTR (M-L CC Pardue, 2009). XX CC Derived from AY600955, Michael Ashburner, 6-Apr-2004; updated Jan-2009 as CC per Mary-Lou Pardue and Greg DeBaryshe. CC Any changes to original sequence record are annotated in an FT line. XX SQ Sequence 11124 BP; 3774 A; 2893 C; 2173 G; 2284 T; 0 other; AAGCTTCGCG GGATATCGAT AACAATCAGG TGGTTAAAAA TACTATAACA TCGAGTACCA 60 GCCGTGTTTT TCCTGTCGAT TTATCGAAGT CCAACAGCCC GCCTTCGCTC CGAACACAAA 120 TCGGCAAGTC AGTAGCTTTT TTAACCCGGC AGTGGCGCCT GTGCAGCAGC TATTTAAAGT 180 GAAAAACACG AAACGCAACA ACAAAATGGA CGGCCATAAT GGAGACATAA ATGAAGGATG 240 GGCAACAGTA CTATCTATCT CGTCGGATGA TAGTAACCAA CTTTCGTCGC CGCCGTCAAT 300 TATAGTCTCA TCGCTGGACA CCACGCCAAC GTCAAACGAA ACCACCATAG TAAGAAGAAG 360 CCTACACAAC CCAAAAGCTG ACATGAAATC TTACAGATTT GAAAATATTG TATTAAATGA 420 AAATAAAAAT ACCATATTGC CAGATCCTTT ATTTGTTGAT AAATGCGGAA ATACTGCTAA 480 TACCACAGAA GCCAATGAAA AAAAGCCTGC CAATAGCCCC TTCCCCATTT CCATTATCAA 540 GAATCTTAGC ACTTCCTCGC CACTAACACA TGTAGACACG CCTACACAAG AAGATGACGC 600 CAGTGCATTC AATACATTGA AAGCAGCCAA AACAGCTAGA ATAATTTTTC CCACACACAC 660 ACAGATAAAG CCCGCCAAAC CCTCGCCCCC TTCCAAAGAA TTAAGCACAA ACTCAGCACC 720 CAAAACTCTT AGCTACACAG ACAAAATTAC AGTAACACAG AAAAATCTAC CCGACAAAAC 780 ACATGTAGAC AGACCTACAC AAGATGACGA CATTAATGCA ACCAAAGCAT CAAAAACCGC 840 CAAAATAATT TCTACACAGT TACACCTACG TGAAACCAAG CCAACACAGC CCGCCAAAGA 900 CCCCTCACCC CGCACCCAAA AGCCTATTGC AAACAAAGCA GCCGAGACAC TCACCCACAC 960 AGACAAACTC ATAGCATCAC AAAACCTAGT TCCCGCCAAA ACACATATAA ACTCCCCCAC 1020 ACAATATAAC GACACTAATG CAACCAATGC ATTAAAAACC GCTAAAATAA ATTTCTCTTC 1080 ACACTCACAC CAAAGTGAAA TCAAGCCAAC ACAGTCCGCC AAAAACATTT CACCCCTCAC 1140 ACAAAAGCAA TTCACAAGCG AATCAGCCGG GACACACACC CATACAGACA AACACAAAAA 1200 CACAGCATCA CAAAATCTCT TTTCCGCCAA AACACACATT AACTCACCCA CACAACATAA 1260 CGACACTAGT GCAGCCACAG CATCAAAAAC CGCTAAATTA ATTCTCTCCC CACACTCACA 1320 CCTAAGTGAA ACCAAGCCCA CACAGCCCGC TTTAAGCCCC TCGCCCCTCT CCCAGAAGCA 1380 AATAACAAGC ATAGCAGCCA AGACACTCAC CCACACAAAC AAACACACAG CATCACAAAA 1440 CTTTATTCCC GCCAAAACAC ATATAAACAT ACCCACACAA TATAACGACA CCAATGCAAC 1500 CAAAGCATTA AAAACCGCAA AAGCAGCTTC TCCCTCCCAC ACATACTCAC GTCAGACAAA 1560 ACCAATAAAG CCCGCCATAA ACGCATTGCA TGCCGCCCAA GACACAAACC CAAGCCCAGC 1620 AATCAGTGCT GTCACTTACA CAGACAAACC CACAGCTACT CAGAATATTT TTCCTGTCAA 1680 AACTTTTGCA GAGCTGATTA GAGAAAATGC AAAACGCTCA CCAACTCCAA TCGAAAATCC 1740 CCCTCAAGCA AAACATGACT CTGCCGCCCT CGGACGCCCT CCGACTGCAG CTAGAAAAAA 1800 TCTAAATAAA ACACTGATTT CTCCTAAAAC TCCTGGGAAG CGCCGTGGGG ACTGTCTTGA 1860 TGAAGGCCTA CTTCAAACCT CTAACAAAAA GGTTAGAATA CGCGACGACT TCTCTGATGA 1920 TGATCTGGGG GTCACAAACC TACTCTCTGA AACACCCTTA TTCAAAAGCA AAGCAGCTAT 1980 TAAGATTCGG CAAGACTCGA GAAGAGAATC CCTGCAGAAG TCAGCTGAAA TGGACACAGC 2040 TCCAGCAATA AGTCCCTCAA ACGCAGCAGC CGATCCCGAC CTACCGCCCT GGAAAACTGT 2100 TCCAGCTAGC AGAAAACCAC CATCAATCTT CCTGTCCAAT ATACAGCAGA TTATCCCGCT 2160 AATAGAAAAA CTAAACTATA AAGCCGGGGT AAATAGCTTT ACTACCAAGT CTGAACTTGG 2220 CAACAATATT AGAATCCAGG CTAAAACGAT GGACGCCTAC AATGCAATTC AGAATGTCCT 2280 CCTTGAAGCA AACATTCCCC TACACTCTCA CCAGCCAAAG AGTGCAAAGG GCTTCCAAAT 2340 TGTAATTAGG CACCTCCACC AGTCAACCCC GACCAAATGG ATTGAAAGCC AACTTCAAGA 2400 CATCGGTATA GCTACAAAAT TTATCAGGGC AATGCAGTTT AGGGACACGA GAAATCCTAT 2460 GCGCATCCAT GAGGTTGAGG TTGTACCCAA GGCTGACGGC AGCCATCTTA AGGTCCTGCT 2520 AATAAAATCC CTTGGAGGAC AAACGGTCAA GGTCGAAAGG AAACGGGTAT CGAAGGATCC 2580 TACACAATGC CACCGCTGCC AATGCTTTGG ACACACAAAA AATTATTGCA GAAACCCGTT 2640 TAAATGTATG AAATGTGGCC AGCTGCACGC CTCGGTCTCA TGCACCAAAC CCAAAAACCT 2700 TCCGGCTACT TGTGCAAACT GCAATGGAAG CCACGTTAGC AGCTATAAAG GATGTCCTGT 2760 TTTCCAAGAA GCAAAGCAAA GACTATCTAT CAACAAAATT CAATCCCTTC ACTCACAACC 2820 CACCCACCTT CAGACCCCCC GCAATAAACA TCCCTACCCA AAACCCACCC ACATTCAGAC 2880 GCCCCTCAAT AAGCAGCCCT ACACACACCC CCTCCCTCGC ACATTAGTAA ACAACACAAA 2940 ACTACCTGCC AAAAGAATCC AAGGAAAGAA GATATCGCAA AGGAATCTAT CTATAAATAA 3000 ACGCTTAAAC AGAATCAGGA CATTGGACAG AAAACCGAGG AATGAGACAA GCCCGCCGAC 3060 AACTAGCAAA AAGGTCTTGG CCTCTCTAGA AGAAAGCAGA AAAAACCCAA ATAGCGCCCT 3120 AAACCCGGCC AACACCCATC TCACTCATTT CCGCCCACCA CCATTAGCAC AAAATATTCC 3180 TAATGACGAA TCTAAGGAGC TGAGTGGGGA GCAATACCTT TTAAATCGCA TTGAAGGGAT 3240 GGAAAAGAAG CTCAACAACC TTCTTGAAAT CGTCACCCGC CTACTAAGCC AAGGAAAAGA 3300 CTGTCCAAAG TCTCCAAAAA ATCCTTTCCG AGATCCAATC TTCGTTTAAA TGCTCTTTCT 3360 AGTAACATCA GAAGTGACGT TTCCTATGAC TCGGGAGTGC AACAGGGACA TCCTTAAAAT 3420 CGCTTTCTGG AATGCTGGTG GGATCAACAA TAAAATAGAT GAGCTTAAGC TGTTCATTCT 3480 AAATATTGAT GCCCACATAA TCATAGTCAC CGAAACTAGA CTAGACAACA ATTCTACCAA 3540 ACTAGAGCTG CCAGGATATT TCACATACTT AGCCCAAAAT CCTGCCTCTA GCAAGAGAGG 3600 AGGAGTCGCC ACGATAGTAA ACAGTAGTCT CCGCCACATG GCCTTAGAAC CGATTGAAAA 3660 GGAATGCATA CAGAGTGCCC CAATAGTATT ACTGCCTGAA AACAACAGAC GCAGCGAAAT 3720 GATTGTAATA GCATCTGTCT ACTGTCCGCC TTCGCTAAGC TGGTCGCCCC ACCATTTTAC 3780 TGACGTTCTC AATTTTGCTG AGAAAACTAT GGGAGGGCAG ACTAAGCTCA TTCTATGTGG 3840 CGACTGGAAC GCAAAACATA GACAATGGGG TTGTATACGC GCCTGCCAAC GTGGCGCCGC 3900 ACTCTACGAT GCAATTCAAG CAGACTCCAT GGCTGAAATC GTCGCGACTG GCAGCGCTAC 3960 ACATTTCCCG CACGATACAA GGAAAAGCCC GTCAGCAATA GACTTCTCGA TATGTAAACG 4020 GCTTGGCAGG TATGAAAAAA GAATCTCCTC AAGTGCACAC CTATCCTCAG ACCATCTTCC 4080 CATATTACTT GAGATAAACC TAGATATAAA AACCATCTCC CTGCAAAAAC AAAACAACAA 4140 TATCCTCAAG AAAACAACGA ACATTGAGCT CTTTAAGAAC GTTCTAGAAA GGAAGATACT 4200 TCTAAACACT GAGATAAGGG TAGCAGAAGA CATAAATGAC GCCATAAACA TCTTTATTAA 4260 AAACATCAAG GACTCGGCTG CTGAATCAAC TCCCTCCCCA AGAATTCCTG ATAACCACAG 4320 AAGAAGATAT GGGCAAGCTA ACAGAAATAG TCATACGCTC ACACTAGACG AAAACACAAG 4380 CAGATTGCTG GAAGAAAAAC GTATACAAAG TAGAATTTTT AAAGCTACTA GAACGAACGA 4440 GGACAAAACT AAACTAAAAG CAGCTGAAAA TCGACTTAAA AAAGTAATCA AAATCTTAAG 4500 AGAAAAGAGA ATCAATGAGC AAATTGAAGG AATTGACACA AATAACCCGG ACAGAATGAG 4560 GAAAATTTGG AGGCTGCTGA GTGAAGGGAA AAAAATGAAT CAACCCAACT TTCCCCTCAA 4620 ATTAGAAACC AAAAAAGGCC CTAAATGGAC TAAAACAATT AAGGAGACAA CAGAAGCGTT 4680 TGTCTCCCAC CTGGAAGGAA GATTCAAGCC AAATAAAATT GTACCTGATT ACCACATAGA 4740 TAAGGTTAAC ACCGGACTAA GAATAATTAA GGAAAGCATG CTAACAGAAC GACATAATCT 4800 AAACAAAAAC CCCCATAACC AACCCATTAC GCTAAACGAA TTAAATGAAG AAATAAAAAA 4860 CTTAAAGAAT AGCAAAGCAC CTGGTAAAGA CCTTATAACA AACCAGCTCA TAAAAACCCT 4920 ACCGACTAAA GCTACCCTGT ACCTTATCCT AATCTATAAC TCCATACTTA GATTAGGATA 4980 CTACCCTGAA GCCTGGAAAC ATGCACAGGT AAAAATGATC CTGAAGCCAG GGAAAAGCTC 5040 AAACGAGCCG AAGTCATACA GGCCGATTAG TCTACTCTCG GGACTCTCTA AAATGTTTGA 5100 AAGACTACTC CTAAAAAGAC TTTTTAGGGT AGATCTATTC AAAAAAGCCA TACCACTGCA 5160 CCAATTTGGC TTCAGAAAAG AGCACGGAAC TGAGCAGCAA ATAGCCAGGG TCACCCAGTT 5220 CATCCTCGAG GCCTTCGAGC GGAAGGAATA CTGCTCAGCG GTTTTCCTTG ACATCTCTGA 5280 GGCCTTTGAT AGGGTATGGC ACGAAGGCCT TTTACTTAAA TTAGCTAAGA TCCTACCTTA 5340 CAACCTATAC ATTATACTGG AGAGCTACCT TACAAATAGA ACGTTCGAAG TTAAAGACCA 5400 AGCAGGAGAG ACTTCGAGAA CAGGACAAAT AGGCGCAGGA GTGCCTCAAG GAAGCAATCT 5460 CGGACCACTA CTTTACTCTA TCTTCTCCTC TGACATGCCC CTCCCATATA TCTACCGCCC 5520 TTCACCAACA CAAAGAATTA TGCTCTCAAC ATACGCAGAC GACACTATAG TCCTCAGCTC 5580 AGACACACTA GCAACTGCCG CCACAAGAAA CAACGAAAAC TACCTCAAGA CATTTTCGGA 5640 CTGGGCGGAC AAATGGGGTA TCTCAGTAAA CGCTGCTAAA ACCGGACATG TCATTTTTAC 5700 ATTAAAAAAC GACTTACCTA CAAACTCAAT GAATGTGAAG ATCAAGGGTC AAACAATAAA 5760 GAAGGAAAGC AAGCAATCAT ACCTTGGGGT AACCCTTGAT AGCAAGCTAA CCCTTAGCTC 5820 TCACGTCACA AAGCTATTGG GTAAATACTC TACAGCCTAC AGAAAATTGA CATGGATCCT 5880 AAACGGAAGA AGTAAACTCC CTACTAAAAC TAAGATACTG ATCCTTAAAT CAGTTTTATC 5940 ACCAATATGG CAGTATGCCA TAGCAGCTTG GGGTCCCCTT GTGACAGATG CACAGATAAG 6000 GAGGGTCCAG GTTGAGGAAA ACAGAAAAAT AAGAGACATA TGTAGAGCGG GAAGATATAC 6060 GAGAAACCAA ACTATAAGGG ACCTTTTTGG CGTCAAAACA GTAGAAGAAT TCTATCAACA 6120 GGCTATGCAC AGGTTCTCAG AAACTATAAA ATCGCACCCA AATATAGCTG TTCGCAGGAT 6180 TCTCTCTAGG CACTATATCC CGAACAGACT AGAAAGAAGC AGGCAGAGGT ACTTTAAAAT 6240 GACAAATGAT CATATCACGC AAAAGCAGAC TGGACTTGCC CTCTCACCTA AACTCTTAAA 6300 AATCCCTGAT ATAGATGACT GCAGAACCGT AAAAAAGCGT AGCGAGAGAG AGAAAATAAG 6360 ACAAATGCAT CTAACTGAAC TCCCCACCTT GCTGAGACTA GAGGAAGAGG AGGAAGAGCT 6420 CAAAAGAATA AAAAAACAGG AAGAAAGGGA AAAAAGAGAA AGGGAAAACC AAAAGTGGCC 6480 TCCAGATAGA TGGTGCGAAT TGGAAATAAA CCGATATAAT AAACAATATA GAAAGGGCGA 6540 CCTAACCAGG CAGGAAGTTA TAGAAAAATT CAGAGGGCAA CCATTAAATG TACAACGAAT 6600 AATCCTACCC GACTATGAAG GGGACTAAAA TTAAATCAAA ACAAACCAGG ACAGGAGCAG 6660 AAGGCAGAAA TAATCAAAAC TGGCGGAAGG GGTGGCAAAA TATTGAAAAG AGAGGAAAGA 6720 AATATAAAAA GGCTAAAGGC TAAGTTACAG GTTACATAAA AAGGGAAATC TGCTTATAGA 6780 TATTATGGTA AAATTAACTT AACTAAACAC CTACTGGTTA ACAAAATAAT TATGCCTGCA 6840 TGGCACAAGC TGCGTACTCA AATCATTTCT CCTGACGCTA TTGAAAATCC ATCTTTACTT 6900 TCCAACCGAG GGACTTGCGA CTGCGGTCTT TCCGCCTTAT TGGCTCCTTA TGGATCCATC 6960 TGCTGCCGTA TTGGGCGACA CACCAGCGCT CCAACCTAAA AGAGAGATAA CATGTTTTAA 7020 TTCACTTTCC TTTTCTTATA ACTAAATCAC AACAACAGCA ACAGCGCATC GGGCGACTGA 7080 CAAAAGCATT AGCTCACCAA GTCAGCAACA ACAGCAGCAG CAAGACCAGA ATCAGTTGAG 7140 GAGGAGGCCT GGTGGTGTGC TGAACATTTC GCCGCCCACA CCCACCATTT CTGTAGGCCT 7200 GTATGACCCT GAGCCCAACG CCGGCATGGC AAATCCGGTC TTCCTGAGGA GGCGGGGCTC 7260 TAGTGTTAGG CGCGCTTTTG CCCCAAAAGC AACAACGACA GCGGCAGTAG GGTCGGCGCC 7320 CCCTGCGTGA CCGAGTCCAT CTTAGCAATC GGTCCTTTTG GCGGTGTTAT GCCGACGCGG 7380 CGGTCGCGCT TATGAGGACT GCCTGCAATG CTTGGCCATG AGACGGCGTC ATCGACAACA 7440 TTTCAATCAC GCTCAGCTGG TTGACCGGGG GCAACATGCT TGCCATGCAG CAACAATGGT 7500 GCATGCAGTC CAGCATGCAG CAACAACAAC AATATTGGCA GCAGCAGACT AATGTTTCGC 7560 AGCAGATTCC ATCTGGCAAC TTCCGACGAC CAGACTCCTC GCTTGGCCCC TGGAGACTCG 7620 CTCTGGAAAA AAAAAGAAAG AAGCATGGAT TAGTTTTTTT TTTTCCCTTT AGCTATTGGA 7680 TTAAATTTCT TTCCTGGACA ACCGGCGCCT TCATGCAGAT GACGCTGGAC TGCGGCGATT 7740 CTTTCCCTCC AGCCACAGAT GGGAAGCTCA CATCATGGCA TATATGCGGC ATCGTGCTAA 7800 TCAGCTCCCC ATGCTGAGCG AGATCTTGAT GCGGCGATGC ACTCACTAGC GAGCAGCGGG 7860 AACAGCATAC AGCGTCAGCA ACAGCAGGAA GAGACTTTGT AGCAGAAGCC TTTCGGCATT 7920 CTCCGACGAC CCGACTCCTC GATCGGGGTC AGGCAAATTC TCCTGGACCG ACAAATTTTC 7980 CCGGCGTTTC GTCCTGGAAT AAGGAAGGAA GCACGGATTA ATTTCTCCCC TTCAGCTTAC 8040 GACCCTTCTC ACCAACAGCA GCAACTACAA CAACATCGGC AGCAGACGAC TTGCAGCTGC 8100 TTGGCTCACC TAATGCGACA GCAATAATCC CGGCAAGGCC AGAAACGGCA CCGAGCAGAA 8160 GCACGACAGG GTGAAGAACA ACATGCCGCC CACGTCCACC AATCCGGAAG CCCTGCATTA 8220 GGGGTCTGAA GCGCCATTAA CTGGAGGATC CGGCAGCGTA TGCCTACGCA GAAGCGGGGC 8280 GTCGTAAATC CGGTGGCCGG AATAGCGCCT TGAACAGCAT GCTGTGTATG TTTGCCCCAA 8340 AAGCAGAAAC TGCCGCAGCA AAGGAACCGC AAGCAGGATC ATCACTCGTG GCAAACTGGC 8400 GTATTCCTGT TGAAGACGCG GGACTGCGGC GCATTCTTCC TTTCCAACCG GGGGCTTTAG 8460 CGCTGCGGTA TTTCTGCTTT CACGGCTCCA TTTGCTGCTG CATCTGACGC CTCATCAGCG 8520 CTCCTCCCTG AAAGAAAGAG AATATGTATT AGTTTTCTTT CCATTCCTTA CAATCTCTCT 8580 CACCAAACCT CCACGACACA ACAACAGCAG CAGAAACAGG TCTAGCCCAC AATGGCAGCA 8640 GCTACAGCAA TCAGCAGAAG CAAGGCCGGC AAAAGCAACA ACAAAAGCCC TCTCTGAAAG 8700 CCCGGATGTG GAGACTGAAG CGCCGGAAAC TTGAGGATCC GCCCCCGATG CACGCCCACC 8760 AACAATAAGC TGGAGGAGAA GTTACTGAAG CATGGGAAGC AGCACCAGGG GTCGCATACG 8820 CAGCGTCAGG GCTTTGCGAA CCAGATGAAT GAGGAGAGAC TGGAACAGCA TAACATCAGC 8880 GGCAGCAACA ACAGCGCCAC GAGGGTCAGC GGCGTCTGCA TGGCTGTGTC CAAAACAACT 8940 CCAATTCAAC TGCTGTATGA TGCAGCGCAC CAGCGGCTTT CACAGGGACC GTCTGAAACG 9000 CTTGGCAGGA GCCGGCTGAA GGCCTGGGCG AAGACACTGG AGACACCAAT GCGGCTCCTT 9060 TCGGCCGACG GCAACAGGCT TGCCATGCAA TAAGAACAGT AAATCCTGAA ATAACAGCAG 9120 AAGATACAGA CGTCCAAATT GCGAACACTG ACGCCAGCCC TCACCTGAAC GACTCACTGT 9180 GCAGCAGCAG CAACATCAGC ACCGATGCCC TCAGCATCGG CAGCAGAGGG TGTTTTTGGC 9240 CTTTGACAAT TCCCTGCGAC TTGACTTCTT CTTGGCATCT GGTCAATCAT CACGTGCCAG 9300 CAAACAGTGG CTTGTCACCC TGGAAGAAAG AAGACTGGAT TAGCTTCTCC CCTTCTAATA 9360 CATTTTGTGT GTTGAAATGC ATCAGGCGGC GACACACTCA CCAGCAACAG CAGCAACAAC 9420 ACCAGCGGCA CCGGTAGCAG GAAATGGATC CTCAGCAAAA ACCATCGGCA CTTTCAGACG 9480 TCCCGTACTC CTCGCCTGGC CCTGGCCGGT AACAGGGGCT TGTTAGATGG AGAAGACGAC 9540 GGTCATCCGA CGGACAGCAG CCTGAAGATG GAAGCAGGCC TACGCTGCCC ACCTCTCCGA 9600 TGCCTGCAGC AGCAACGGCA GCGGCTCATA AATGCAAACT GGCGCCAGCC CTCGGCTCTT 9660 CGGGCTCATG TAGGCGGTGA CACACTCACT AGCAGCTAAA ACAGCAACGG CGGAATTAGT 9720 AGAAGCAATG TTTTGCCGCA GCTGCCAGAT GGCATACTCC TAGCTTGGCC CCTGCCCAAA 9780 CCGTATTGGA CCGGCAAATG ATTCGACAAT CCGATCTGGA AAAAATAAGT ATTGATTAAT 9840 TTTTCCCCCA CAGATTGGTA TAAAATTGCA TTTACGGCCA ACCGGCTTCT TCCTGTTGAT 9900 GACGTCACGC TGCGCCGCAT GCTTTTCGCC AGCCACAGTT GGAATGCATG CATTGGGGTT 9960 GACGGTCCGG ATGGGCCGTT GCCTGTTATA TGCTGGCATC TCCGCAGCGG CGTTGTGAGC 10020 AACGACACTG AAAGCAACAA TAATATTGTT AATTACTGCT CAAAACTATA ACACATTTAA 10080 TCACTTACAC AATTTACACA CGCTTCCTGC CTAGGAGTTG TGGGACCAGC TACCGATAAT 10140 GCCAACAATA CCGGGAAACG CGTCGCGGGA CATCGATAAC AATTTGGCGG TTAAAATGCT 10200 AGAACATCGA GTACCAGACA TGTTTTTCCT GCCGATATAT CGAAGCCCAA TAGCCGCCAA 10260 CGCTCAAAAC ATAAATCGGA GTGTGAGACC AGATACTGAA GCCGTTAAAA GCTTTTACCG 10320 GCATCGGTAG CTGGTCTCAC ACTCCGATTT AAATTTGGAG CGTTGGCGGG CTGTTTGACG 10380 CGAAGCTTCG CGGGATATCG ATAACAATCA GGTGGTTAAA AATACTATAA CATCGAGTAC 10440 CAGCCGTGTT TTTCCTGTCG ATTTATCGAA GTCCAACAGC CCGCCTTCGC TCCGAACACA 10500 AATCGGCAAG TCAGTAGCTT TTTTAACCCG GCAGTGGCGC CTGTGCAGCA GCTATTTAAA 10560 GTGAAAAACA CGAAACGCAA CAACAAAATG GACGGCCATA ATGGAGACAT AAATGAAGGA 10620 TGGGCAACAG TACTATCTAT CTCGTCGGAT GATAGTAACC AACTTTCGTC GCCGCCGTCA 10680 ATTATAGTCT CATCGCTGGA CACCACGCCA ACGCCTGTCT AATGCAAATC AACTTACATA 10740 TTACTCTAAA ATCTACTTAT AACTGTCCCC TCTAATGATA AGCAATTTTT ATGTTTACTT 10800 TAAACTTAAA CCGATACCTT AAACTATGGC GCGCAAAATG ACTACCAAGA AATCTAAAAC 10860 TGTAAATTGT TGCAAACTAT TTCTCCTAGT AATGTTAAAT TTAAATGCGC GCATAACCGC 10920 AGCCAAGTTA ACCAAAAATG TCACTCGTAA ATGTAATTCC TAAATTAACA CTTGTAACTA 10980 AGCGCGTATA AATACCGCAA ATCCAAAAAT GTAAATATGC CATAAATTGT TACTATATAT 11040 TTTTAAAAAA GAAAAATCAG AGTACAATAA AAATGCCAGC GTCTATTAGG CGTTGAAAAT 11100 TTAAAAAAAA AAAAAAAAAA AAAA 11124 // ID AY561850 standard; DNA; INV; 13424 BP. XX AC AY561850; XX DR FLYBASE; FBte0001206; Dmel\TART-A. XX FT source AY561850:1..13424 FT SO_feature non_LTR_retrotransposon ; SO:0000189 CC telomeric retrotransposon FT SO_feature direct_repeat ; SO:0000314:1..1850 FT SO_feature direct_repeat ; SO:0000314:11179..13028 FT SO_feature five_prime_UTR ; SO:0000204:1..1759 FT SO_feature three_prime_UTR ; SO:0000205:7953..13411 FT SO_feature non_LTR_retrotransposon_polymeric_tract ; SO:0000433:13412..13424 CC derived from polyA tail of RNA transposition intermediate FT SO_feature CDS ; SO:0000316:1760..4672 FT SO_feature start_codon ; SO:0000318:1..3 FT /db_xref="FLYBASE:FBgnXXXXXXX" FT /db_xref="GI:45594384" FT /db_xref="NCBI_PROTEIN:AAS68533.1" FT /translation="MDGQNVNQSGGWASVLSISSDDGNCSSSPPSAIVSSLDTTPTSN FT ETTIVRRSLYQTNADMKSYDFENIVLNENKNTILPDPLFVDKCGSTANTTEANEKQPA FT DSPFPISISKNFSTSSPLTHVDTPTQEDDASAFNTLKAAKTARIIFPTHTQIEPAKPS FT PPSKELSSNSAPKTLSYTDKITATQKNFPTKTHVDTPTQDDDTNATKASKTAQIDSSH FT SQLHETKPTQPAKNPSPLTQKLTTNKTAKTHTHTDKPTASQNLFPTKTHINSPTQYND FT TNASTASKDGKINLSSHSHLRETKPTQPAKNPSPLSQKQITSIAANTLTHTNKHTASQ FT NFIPAKTHINIPTQYNDTNATKALKTAKPASPSHTYSRQTKPIKPAINALHPAQDTNP FT SPAISAVTYTDKPTATQNIFPAKTFAELVRENAKRSQTAMQNPPHAKHDSAALGRLPS FT AARKNLTKTLSSPKTPGKRRGDCLDEGLLQTSNKKVRIRDDFSDDDLGVTNLLSETPI FT FKSKVAIKIRQDSRRESLQKSVEMDTAPAISPSNTAAEPDLPPWKTVPASRKPPSIFL FT SNIQQIIPLIEKLNYKAGVNSFTTKSELGNNIRIQAKTMDAYKAIQNVLLGANIPLHS FT HQPKSAKGFQIVIRHLHQSTPTKWIESQLQDIGIATKFIRAMQFRDTRNPMRIHEVEV FT VPKADGSHLKVLLLKSLGGQTVKVERKRVSKDPTQCHRCQCFGHTKNYCRNPFKCMKC FT GQLHATVSCTKPKNLPATCANCNGSHVSSYKGCPAFQEAKQRLSINKIQSLHSQPTHL FT QTPRNKHPYPKPTHFQTPRNKQSYTHPPPRTTVNNTKLPAKRIQGKKLSQRNISINKR FT LNRIRAFDKKPRKETSPPTTSKKVLASLEESSKNPNSVLNPANTHLTHFCPPPITQDI FT PNDEPTEPSQEQYLLNRIEGMEKKLNNLLEIVTRLLNQGRECPKSPKNPFRDPILI" FT SO_feature CDS ; SO:0000316:4710..7952 FT SO_feature start_codon ; SO:0000318:1..3 FT /db_xref="FLYBASE:FBgnXXXXXXX" FT /db_xref="GI:45594385" FT /db_xref="NCBI_PROTEIN:AAS68534.1" FT /translation="MTRACNRDILKIAFWNAGGINNKIDELKLFILNIDAHIVIVTET FT RLDNKSTKLELPGYFTYLAQNPVSSKRGGVATIVNSSIRHMALEPIEKECIQSAPIVL FT LPENNRRSEMIVIASVYCPPSLSWSPHHFTDVLNFAEKTLGGQTKFILCGDWNAKHRQ FT WGCTRACQRGTALYEAVQADPMAEIIATGCATHFPHDTRKNPSAIDFSICKGLGRLEK FT RISSSADLSSDHLPILLEINLDTSTLFLQKQNNNILKKTTNIELFKTVLERKILLNTE FT IRVAEDINDAINIFIKNIKDSADESTPSPRIPDNLRRMHGQANRNSHTLTLDENTSRL FT LEEKRILSRIFKATRTDEDKAKLKAAENRLKKAVKILREKRINKQIEGIDTKNPDRMR FT KMWRLLDEGKKTNQPNFPLKLETKRGPKWTKTIKETTEAFVSHLEGRFKPNNNVPDYH FT INTVNSGLRTIKESMLTERYDVNKNPCNQPITLKELNDEIKNLKNSKAPGKDLITNQL FT IKTLPTKATLYLILIYNSILRIGYYPDAWKHAQVKMILKPGKSVNDPKSYRPISLLSG FT LSKMFERLLLKRLFRVDLFKKAIPLHQFGFRKEHGTEQQIARVTQFILEAFERKEYCS FT AVFLDISEAFDRVWHEGLLLKLAKILPYNLYIILESYLTNRTFEVKDQAGETSRAGQI FT GAGVPQGSNLGPILYSIFSSDMPLPHIYHPSPTERIMLSTYADDTIVLSSDILATAAT FT RNNENYLKTFSDWADKWGISVNAAKTGHVIYTLKNDIPTNLKTMKIKGQAIKKESKQS FT YLGVILDSKLTLSPHVTKVVGKYLTAYRKMSWILNERSKLPTNTKMLILKSVLSPIWQ FT YAIAAWGPLVTDAQIRRIQVEENRKMRDICRAGRYTKNQTIRDRYCVKTVEEFYQQAV FT HRFSETTKSHPNVAVRRIFSRHYIPNRLERSRQRYLKMTMDHITQKQTGLTLSPKLLK FT IPDLDDCRTLKKRSEREKIRQTHLTELPTLLRLEEEEAELKRIKKQEERERRERENQK FT WPPDRWCELEINRYNKKYRNGDLTRQEIIEKFRGQPLNVQRIILPDYEGD" XX CC A PNTR (Perfect Non-Terminal Repeat) is a perfect direct repeat partially CC overlapping the UTRs (annotated as "direct_repeat ; SO:0000314"). CC Distinguishing characteristics of PNTR’s are that the 3’ repeat terminates CC upstream of the 3’ end of the element and that the 5’ PNTR extends a short CC distance into ORF-1. The 5’ ends of TART-A elements are variable and the CC minimal size for functionality has not been determined. Thus, this CC canonical sequence, AY561850, may be 5’ truncated within the 5’ PNTR (M-L CC Pardue, 2009). XX CC Derived from AY561850, Michael Ashburner, 6-Apr-2004; updated Jan-2009 as CC per Mary-Lou Pardue and Greg DeBaryshe. CC Any changes to original sequence record are annotated in an FT line. XX SQ Sequence 13424 BP; 4373 A; 3415 C; 2870 G; 2766 T; 0 other; CACGCTTTTT GGCCCCTGGC CGATCTTCAT ATATCTCAAA TCGACGGCTG CTTTTACCCT 60 GGAAAAAAAA AAAGGAGCTT GGGTTATATT GAACTACACT AGGCGGCGAC ACACTCACCA 120 GCAGCAGCCA GAACAACAAC AGCGGCAGAA GTAGCAGGAA ATTATCTCAC TGCAAAATCC 180 AATTGGCACT TTCCGAAGTC CGTATTTCTC GCCTGGCCCC TGGCCAGTAA CAGGGGCCTG 240 TGCGACGGAG ATGACGACGA TGATCTGCCC TGTGGACGGC CTCAAGAAGG AATCGGCCCT 300 GTACTGCCCA CCTGACCTGT GCCAGGATAG CAGCAATGTC AGCGGACCAT GGATGGAAGA 360 GGCGGCACTG GCGACGGTCC TCAGTTTTGC GGTTTCCGCG GGGCGTAGGC GCAGTAATCG 420 GCGGCAGCAA CAGTGGCGGC AGCAGAAGGG AATGTGTATC TGCAGTCGCC GAATGGCAAT 480 TTCCTGCCCA GCTGTAATGG ACCGCCAAAT GTTTTTTGGC ATGTCGACCT GTAAGAAAGA 540 AGCAAGGATA AGTTTTTTCT TTACAAGATT GTATATGAAT TTGTATTTAC GGACAACTGG 600 CTTGTTTCCT GTCGACGATA AATGGCGCTT CATGTTTTCA CTCTGCCAAA ATCTGAGTGC 660 AAGCATCGGG GCTGACGGGC CGAATTTGCT GATGCCTTGT ACATGCTAGC ATCTTTATGC 720 CGCCGTGTAA TTTTGCGACA GCAAAACACA TGATGGAGAA GACGAAGGTG ATCGATGGCG 780 CCCGGATGAC GGATGCAGGC CCGTGCTACC CACTGGTCCG TTGCCAGGAC AGCAGCGTTT 840 CAATTATGCG AACAGAGGCA CTGGAGCCAC TTCTCAGGCG ATAGGGATCA TGAGGCGACG 900 ACAACTCGCC AGCAGCAGTA ACAACAACAG CGGCAGCAGC GATCTCGGAC TTGCTGAACA 960 TTGCGGCTTT TTCCCAGCCT GGACCGTCAT CACAAACGCT CTCAAAGATC GGTGCGCCTG 1020 CAGCCTACGG AAGCGTACAA CTGCCCAAAG TCGTGCTATT GCATAATGTT AGGTGTCCTG 1080 GCTGCTCCGG CGGATGAGCT CCACCCGATT GAGAGAGGTA AGAAGGCCCA GCAAGTCGCC 1140 CTTAAATAAA AGAAACAAGC ATTAGACTCG GCTGAAATTG TAACATCAGT CAGACTGTAC 1200 TCACGCATGC ACTTAGACAA ACCGAAGCCT ATTCTATTGA CGACGCGGAC TCCAACACAT 1260 GTTTTCCTCC ACAAAAGGCT GTGAGTGCAC CAAAGTTGAC GGGCCACGCC GGCCGATGCT 1320 TGCTGCATAC CGGCATCTCC GCAGCAGCGA CGTTACAAGC ACCACTAAAA TTAGAAAGAG 1380 GCTTACTATA GGCAAAGCGC AGAAAAACAA ATATTACAAT AAGAAATAGC ACGCGATTTT 1440 TCTGCTTCGT TTCCGCTTGG TACAAGTGAG ACCATTCTCC CTATATGCCA TTCTAGTATA 1500 TTTGCCCGAT AAGCGATATG CTGGCGGCAA AAAAAAAAGA TAATAGCCGA TAAGCCCGCC 1560 AAAAAAAAAG CGCGAAATAT CGATAACGAG CTGGCACGAA AATTGCTGGC ATATCGATCA 1620 ACCGCTGTGT CTTTGAGCTA TCGAAAAAGC CCGCCTACGC GCCTAGCCCA AATTTGCAAG 1680 TCAGTTGAGA TTATAAAACC GACAGAGGCG CGCGCGCAAC AGTAGCTAAA AGTGAAGCCA 1740 GCAGCAACAA CAACAACTAA TGGACGGCCA GAACGTGAAC CAAAGCGGAG GATGGGCATC 1800 GGTTTTATCC ATCTCATCGG ACGATGGTAA CTGCTCATCC TCGCCGCCAT CAGCTATAGT 1860 CTCATCGCTG GATACCACGC CAACGTCAAA TGAAACCACC ATAGTAAGAA GAAGCCTATA 1920 TCAAACAAAT GCCGACATGA AATCTTACGA TTTTGAAAAT ATTGTATTAA ATGAAAATAA 1980 AAATACCATA TTGCCAGACC CTTTATTTGT TGATAAATGC GGGAGTACTG CTAATACCAC 2040 AGAAGCCAAT GAAAAACAGC CTGCCGATAG CCCCTTCCCC ATTTCCATAA GCAAAAATTT 2100 TAGCACTTCC TCGCCACTAA CACATGTAGA CACGCCTACA CAAGAAGATG ACGCCAGTGC 2160 ATTTAATACA TTGAAAGCAG CCAAAACAGC TAGAATAATT TTTCCCACAC ACACACAGAT 2220 AGAGCCCGCC AAACCCTCGC CCCCCTCCAA AGAATTAAGC TCAAACTCAG CACCCAAAAC 2280 TCTTAGCTAC ACAGACAAAA TTACAGCAAC ACAGAAAAAT TTCCCCACTA AAACACATGT 2340 AGACACACCT ACACAAGACG ATGACACTAA TGCAACCAAA GCATCAAAAA CCGCCCAAAT 2400 AGATTCATCA CACTCACAAC TACATGAAAC CAAGCCAACA CAGCCCGCCA AAAACCCTTC 2460 ACCCCTCACC CAAAAGCTAA CCACAAACAA AACAGCCAAG ACACACACAC ACACAGACAA 2520 ACCGACAGCG TCACAAAATC TTTTTCCCAC CAAAACACAT ATAAACTCAC CCACACAATA 2580 TAACGACACT AATGCAAGCA CAGCATCAAA AGACGGTAAA ATAAACCTCT CTTCACACTC 2640 ACACTTACGT GAAACCAAGC CAACACAGCC CGCCAAAAAC CCCTCACCCC TCTCCCAGAA 2700 GCAAATAACA AGCATAGCAG CCAATACACT CACCCACACA AACAAACACA CAGCATCACA 2760 AAACTTTATT CCCGCCAAAA CACATATAAA CATACCCACA CAATATAACG ACACCAATGC 2820 AACCAAAGCA TTAAAAACCG CAAAACCAGC TTCTCCCTCC CACACATACT CACGCCAGAC 2880 AAAACCAATA AAGCCCGCCA TAAACGCATT GCATCCCGCC CAAGACACAA ACCCAAGTCC 2940 AGCAATCAGT GCTGTCACTT ACACAGACAA ACCCACAGCT ACTCAGAATA TTTTTCCTGC 3000 CAAAACTTTT GCAGAGCTGG TGAGAGAAAA TGCTAAACGC TCACAAACTG CAATGCAAAA 3060 TCCCCCTCAT GCAAAACATG ACTCTGCCGC CCTCGGACGC TTACCGAGTG CAGCTAGAAA 3120 AAACCTAACT AAAACACTGA GTTCTCCTAA AACTCCTGGG AAGCGCCGCG GGGACTGTTT 3180 GGATGAGGGC TTACTTCAAA CCTCTAACAA AAAGGTTAGA ATACGCGACG ACTTCTCTGA 3240 TGATGATCTG GGGGTCACAA ATCTACTCTC CGAAACACCC ATATTCAAAA GCAAAGTAGC 3300 TATTAAAATT CGGCAAGACT CAAGAAGAGA ATCCCTGCAG AAGTCAGTTG AAATGGACAC 3360 AGCACCAGCA ATTAGTCCCT CAAACACAGC AGCTGAGCCC GACCTACCGC CCTGGAAAAC 3420 TGTTCCAGCT AGCAGAAAAC CACCATCAAT CTTCTTGTCC AATATTCAGC AGATTATCCC 3480 GCTAATAGAA AAACTAAACT ATAAAGCCGG GGTAAATAGC TTTACTACCA AATCTGAACT 3540 TGGCAACAAT ATTAGAATCC AGGCTAAAAC GATGGATGCC TATAAAGCAA TTCAGAATGT 3600 CCTCCTTGGG GCAAACATTC CCCTACACTC TCACCAGCCA AAGAGCGCAA AGGGCTTCCA 3660 AATTGTAATT AGGCACCTCC ACCAGTCAAC CCCGACCAAA TGGATTGAAA GCCAACTTCA 3720 AGACATCGGT ATAGCTACAA AATTCATCAG GGCAATGCAG TTTAGGGACA CGAGAAATCC 3780 TATGCGCATT CATGAGGTTG AGGTTGTACC CAAGGCTGAC GGCAGCCATC TCAAGGTCCT 3840 GCTACTAAAA TCCCTTGGAG GTCAAACGGT CAAGGTTGAA AGGAAACGGG TATCGAAGGA 3900 TCCCACACAA TGTCATCGCT GCCAATGTTT TGGGCATACA AAAAATTATT GTAGAAACCC 3960 GTTTAAATGT ATGAAATGTG GCCAGCTGCA CGCCACGGTT TCTTGCACTA AACCCAAAAA 4020 CCTTCCGGCT ACTTGTGCAA ACTGCAATGG AAGCCACGTA AGCAGCTATA AAGGATGTCC 4080 TGCTTTCCAA GAAGCAAAGC AAAGACTATC TATCAACAAA ATTCAATCCC TACACTCACA 4140 ACCCACGCAC CTTCAGACCC CCCGCAATAA ACATCCCTAC CCAAAACCCA CCCACTTTCA 4200 GACGCCCCGC AATAAGCAGT CCTACACACA CCCCCCTCCT CGAACAACAG TAAACAACAC 4260 AAAATTACCT GCCAAAAGAA TCCAAGGAAA AAAGTTATCG CAAAGGAACA TATCTATAAA 4320 TAAACGCTTA AATAGAATTA GGGCTTTTGA CAAGAAACCG AGAAAGGAGA CAAGCCCGCC 4380 GACAACTAGC AAAAAGGTAC TGGCCTCCCT AGAAGAAAGC AGCAAAAACC CAAACAGCGT 4440 CCTAAACCCA GCCAACACCC ATCTCACTCA TTTCTGTCCA CCCCCAATAA CACAAGATAT 4500 CCCTAATGAC GAACCCACGG AGCCGAGTCA GGAGCAATAC CTTCTAAATC GTATTGAAGG 4560 GATGGAAAAG AAGCTCAACA ATCTCCTGGA AATCGTCACC CGCCTACTAA ACCAAGGAAG 4620 AGAGTGTCCA AAATCTCCAA AAAATCCTTT CCGAGATCCA ATCCTCATTT AAACGCTCTT 4680 GCTAGTAGCA TCAGAAAGTG ACGTATCTTA TGACTCGGGC GTGCAACAGG GATATCCTTA 4740 AAATTGCTTT CTGGAACGCT GGTGGGATCA ATAATAAAAT AGACGAGCTC AAACTGTTCA 4800 TTCTAAATAT TGATGCCCAC ATAGTCATAG TCACTGAAAC CAGACTTGAC AACAAATCGA 4860 CCAAACTAGA ACTTCCAGGA TATTTCACAT ACTTAGCCCA AAATCCTGTT TCTAGCAAGA 4920 GAGGAGGAGT CGCCACTATA GTAAACAGCA GTATCCGACA CATGGCCTTA GAACCGATTG 4980 AAAAAGAATG CATACAGAGC GCCCCAATAG TCTTGCTGCC TGAAAACAAC AGACGCAGCG 5040 AAATGATAGT AATAGCATCT GTCTACTGTC CGCCTTCGCT AAGCTGGTCG CCCCACCACT 5100 TTACTGACGT TCTCAATTTT GCCGAGAAAA CTCTGGGAGG GCAGACAAAG TTCATTCTAT 5160 GTGGCGACTG GAATGCAAAA CACAGGCAAT GGGGTTGTAC CCGCGCCTGT CAACGCGGCA 5220 CCGCACTCTA CGAAGCAGTT CAAGCAGATC CCATGGCTGA GATTATTGCT ACCGGCTGTG 5280 CGACACATTT CCCGCACGAC ACACGGAAAA ACCCGTCAGC AATAGATTTC TCCATATGCA 5340 AAGGACTGGG CAGGCTCGAA AAGAGAATTT CCTCAAGTGC GGACTTATCT TCAGACCACC 5400 TTCCCATCCT GCTTGAGATC AACTTAGATA CAAGCACCCT CTTTCTGCAA AAGCAAAACA 5460 ATAACATCCT CAAGAAAACT ACGAACATTG AGCTCTTTAA GACTGTTCTT GAAAGAAAGA 5520 TACTTCTTAA TACGGAGATA AGAGTAGCAG AAGACATAAA TGACGCCATA AATATCTTTA 5580 TCAAAAACAT CAAGGACTCG GCTGATGAAT CAACTCCCTC CCCAAGAATC CCTGACAACC 5640 TCAGAAGAAT GCATGGACAA GCTAACAGAA ATAGTCACAC CCTCACACTA GACGAAAACA 5700 CAAGCAGATT GTTGGAAGAA AAACGGATAC TAAGTAGAAT TTTTAAAGCT ACTAGAACGG 5760 ACGAGGACAA AGCTAAACTA AAAGCAGCTG AAAATCGACT AAAAAAAGCG GTAAAGATCT 5820 TGAGAGAAAA GAGAATTAAT AAACAAATTG AAGGAATAGA CACGAAAAAC CCGGACAGAA 5880 TGAGGAAAAT GTGGAGACTG CTAGATGAAG GAAAAAAGAC AAACCAACCG AACTTTCCCC 5940 TCAAACTGGA AACCAAAAGA GGCCCCAAAT GGACAAAAAC GATAAAGGAG ACAACAGAAG 6000 CATTTGTTTC CCACTTAGAA GGAAGATTTA AGCCAAATAA CAACGTACCT GATTACCACA 6060 TAAATACAGT TAACTCTGGA CTAAGAACAA TTAAAGAAAG CATGTTAACA GAAAGATATG 6120 ATGTAAACAA GAATCCCTGT AACCAACCTA TCACACTAAA GGAATTAAAT GACGAAATAA 6180 AAAACTTAAA GAATAGTAAA GCACCGGGAA AAGACCTTAT AACAAACCAA CTTATAAAAA 6240 CCCTACCGAC TAAAGCTACA CTGTACCTTA TCCTAATCTA TAACTCTATA CTTAGAATTG 6300 GATACTACCC AGACGCCTGG AAACATGCCC AAGTGAAAAT GATCTTAAAA CCAGGGAAAA 6360 GTGTGAACGA CCCGAAGTCA TATAGGCCGA TCAGTCTACT CTCGGGACTC TCTAAAATGT 6420 TTGAAAGACT ACTTCTAAAA AGACTTTTTA GGGTAGATCT ATTCAAAAAA GCCATACCAC 6480 TGCACCAATT TGGCTTCAGA AAAGAGCACG GAACTGAGCA GCAAATAGCC AGGGTCACCC 6540 AGTTCATCCT CGAGGCCTTT GAGCGAAAGG AATACTGCTC AGCGGTTTTC CTTGACATCT 6600 CTGAGGCTTT CGATAGGGTC TGGCACGAAG GCCTTTTACT TAAACTAGCT AAAATATTAC 6660 CATACAACCT ATACATTATT CTCGAAAGCT ACCTTACAAA CAGAACATTT GAAGTTAAAG 6720 ACCAAGCTGG AGAGACTTCG AGAGCAGGAC AAATAGGCGC AGGGGTGCCC CAAGGAAGCA 6780 ACCTTGGACC CATACTGTAC TCTATCTTCT CCTCAGACAT GCCACTCCCA CACATATACC 6840 ACCCCTCCCC AACAGAAAGA ATTATGCTCT CAACATACGC AGACGACACT ATAGTACTCA 6900 GCTCAGACAT ACTAGCAACT GCTGCCACAA GAAACAACGA AAACTACCTC AAGACATTTT 6960 CGGACTGGGC AGACAAATGG GGTATCTCAG TAAATGCTGC TAAAACAGGA CATGTCATTT 7020 ATACATTAAA AAACGACATA CCTACAAATC TAAAGACCAT GAAGATTAAG GGTCAAGCAA 7080 TAAAAAAGGA AAGCAAGCAA TCATACCTTG GCGTAATCCT TGATAGCAAG CTAACACTTA 7140 GTCCTCACGT CACGAAGGTA GTAGGTAAAT ACTTGACAGC CTATAGAAAA ATGTCATGGA 7200 TCTTAAATGA AAGAAGCAAA CTCCCTACTA ATACTAAGAT GCTGATCCTC AAATCAGTTC 7260 TATCGCCAAT ATGGCAGTAT GCCATAGCAG CCTGGGGTCC CCTTGTGACA GATGCACAGA 7320 TAAGACGGAT ACAAGTTGAG GAAAACAGAA AAATGAGAGA CATATGCAGA GCGGGAAGAT 7380 ACACGAAAAA CCAAACTATA AGGGACCGCT ACTGTGTCAA AACAGTAGAA GAGTTCTATC 7440 AACAGGCTGT CCACAGGTTC TCAGAAACTA CAAAATCGCA CCCTAATGTA GCTGTTCGCA 7500 GGATATTCTC TAGGCACTAT ATCCCGAACA GACTAGAAAG AAGCAGGCAG AGGTACTTGA 7560 AAATGACAAT GGACCATATC ACGCAAAAAC AGACTGGACT GACCCTCTCA CCTAAACTCT 7620 TAAAAATCCC TGATCTAGAT GACTGCAGAA CCTTAAAAAA GCGAAGCGAG AGAGAGAAAA 7680 TAAGACAAAC GCATCTAACT GAACTCCCCA CCCTGCTGAG ACTAGAGGAA GAGGAGGCAG 7740 AGCTCAAAAG AATAAAAAAA CAGGAAGAGA GGGAAAGAAG GGAAAGGGAA AACCAAAAGT 7800 GGCCTCCAGA TAGGTGGTGT GAACTGGAAA TAAACCGATA TAATAAAAAA TATAGAAATG 7860 GCGATCTAAC CAGGCAGGAA ATTATAGAAA AATTCCGAGG GCAACCATTA AATGTACAAC 7920 GAATAATCCT ACCCGACTAC GAAGGTGACT AAAAGTAAAT CAAAACAAAC TAGGGTCGGA 7980 GCATAAAGCA GAAATAATTA ACCTGGCGGA AGGGGCGGCA AAAATATTTA AAAGAAAGGA 8040 AATAAATACA AAAAGGCTAA AGGCTAAGTT ACAGGTTACA TAAAAAGGGA AATGTGCTTA 8100 TAGATATAAT GGTAAAATTA ACTTAACTAA ACACCTACTG GAAAACAAAA CCATGATGGC 8160 TGCGTACTTA AAACGTTTCT CCTGGCGCGA TTGAAAATCC ATCTTTCCTA TCCAACCGAG 8220 GGATCTGCGA CTGCGGCCTT CTGCCGTTCG GCTCCTGATG GATCCATCTG CTGCTGGAAT 8280 GGGTGCCACA CCGGCGCTCC AACCTAAAAG AAAGATAATA TGTCTTAGTT TTCTTTCCCT 8340 TTTTCTCATA AAAAACAAAA GCTCATCTGG AGTCTGATAA TAGCTTTAGC TCACCAAGAC 8400 AGCAAAAACA ACAGCATCAA GGCCAGCAAC AGTGGAGGCA GAGACCAAGC GGTTTGCTGA 8460 ACATTTCGCT GCCCACACCC ACCATTCCTG GAGGCTCTGA ATGAGGGAGC TGAAGCCTCT 8520 GAAAATTGAA GATCCTACTC CAATGTGACA CTTTCGGCTC CGAGCTCAAC GCCGGCGCTG 8580 CAAATCCGGC GTTATAAGGA AAGGGTGCTC CAGCTTGTGG AGTGGTCTTT CCCCAGAGGC 8640 AGCAGCAGCA GCAACGCCAG CGGCAATTGG CGACCTCTGC GTAGCCGAGT CAATCCCGTT 8700 ATCGGTCCGT CTGGCGATGC GTTTCCGACG CGGCGGTATG CGTCCATAGG GACCGCCTAG 8760 AATGCTTGGC CAGGAGACAG CAGTAGACCT GGGCGTGGGC GTCACCAGCA ACATGGTAGC 8820 CATGCGCAGT CAATTGGCCG GTGGCAACAA TCTTGCCATG CAGCAATAGC GGCGCATGCT 8880 ACCCTTGGAG CGACGTCAAC AGCTACATAT TTTTCAACAG TGTAGCGCGA CCTTTAGGCG 8940 CCTACACCTA CACCAGCAGC AGCGATATTG GCAGTAGCAG CATTTAATGT CTTGCAGCAG 9000 TTTCCATTTG ACAACTTCCG ACGACCAGAC TCCTCGCTTG GCCCCTGGCG ATTCGCCCTG 9060 GAAGAAAGAA AGAAGCATGG ATTAGTCAAA TATCAAAGCA CAACAAGCAT GCACGAAATC 9120 TTCGCAACAA GGACTATTCC AAGGCAAGCG ATGGTGTGTT CTTTGGCTCT ACATATATCG 9180 TTGAAATCCG TCTCCAACTG CCGCGAGTCA CCCACGACTT CCACTCCCTG CAGACGGACG 9240 TAATGCACTA CGATGTGTAA ATTTTCCGGA TCCAAGTGAA CGCCAGGCGG AAGAGGATTC 9300 CCTGGATGTG AAGGATCACA AACTGCTGCT TTTTCAAGAG TCCCCATTTA ACAACTTCCG 9360 ACGACCAGAC TCCTCGCTTG GCCCCTGGCG ATTCGCCCTG AAAGAAAGAA AGAAGCATGG 9420 ATTAGTCAAA TACCAAAGCA CAACAAGCAT GCACGAAATC TGCGCAACAA GGACTATTCC 9480 AAGGCAAGCG ATGACGGACG GAATGCACTA CTATGTGTAA ATTTTCCGGA TCCAAGTGAA 9540 CGCCAGGCGG AAGAGGATTC CCTGGATGTG AAGGATCACA AACTGCTGCT TCTTCAAGAG 9600 GTAACCGGCC TCATTTCCAC TTGGGTCACA TCGATTGTGG AGGAAGCCGA TTGGGACTTT 9660 GAGCGAGCCC TAAAATTGTT CATTCAGAAG AACGCTGATC ACGAAATCCC AGATCTAGCA 9720 TTCGCCTAGA ATATGTGATC TCGTTGGACT GCGTGCTGGA CTGCGGCGCA TGCTTTCCCT 9780 CCCGCCAGAG ACGGGATGCG CGCATCAGGA TCGACGGGAC AGACCGGCCG ACGCCTGGCT 9840 TCACGTCGGC ATCTATGCGA CGACGTGATA ATCAGCTTCA CAGTACCTGC GGATGAGGGC 9900 ACAGGCGCCA GTCCTCTGCC TAGCGACACA TACACCAACA GCAACATCTA AAACAGTCGC 9960 AGTAGATGCA GGGAATTTTC TTGCTGCATT CTCCAACTGG AAAAATCCGA CGGCCCAACT 10020 CCTAGCTTAG CCCGGCCAAT CTTCTTGGAC TGGCAAACGA TGTGATGAAT CGTCCTGGAA 10080 GAAAGAAGCA TGGATTATTT CTTCATACAC AGCTTGTCTA CTAAAATGCA TTTCCCGGCA 10140 AACTGGCACT GGGGCGTTGA AAATACGACA CTACTCACCA AACAGCAGCA AAAACAACAG 10200 CATCGGCAGC AGGCGACCAG CAGCTGCTTT GGCTCACCCA ATGCGACAGC AATATCTGCG 10260 CATGGCCAGC AACATGCAGC AAGCAAAAGA CCGGCATGGT GGTGAACAAC ATATCGCTCA 10320 CGCCCAACGA TCTGGAAGCC CTGAGCTAGG GAACTGAGTA TCCGCCAGCG GATACTTATG 10380 CAGCGGCGAG GCGTCGGAAA TCCGATAGCC GGAAGAGAGG CCGGAGCAGC ATGTTGGGCA 10440 TTTTCGCCCC AGTAGCAGCT GCTGGGGCAG CAAGGGCAGA GGTAGCAGTG TCAGCGCTCC 10500 TGGTAAACCG GCCTTTTCTG TTGAAGACGC GGGACTGCGG CGCAATTGTT CCTGCCAACC 10560 GGGAGTTCTC TGCGCCTGAG GTCCTGTTGT GCTTCAGCGG CTCCATCTGC TGTTGCATCT 10620 GGCGCTTCTC CAACTTTCCT CCCTGAAAGA AGAGAATATT AGTAGGAGCA TGAGACCAAC 10680 AACAGCCCTA GCTTACCACG TCAGCGGAAA CAGCAACTGC AGAAGCCCGG TAACTTTCTG 10740 ATAATATGCA GCAATAAGAG CGGCTGGATC AGCATGTTGT GTAGCTTGGC CCCAGAAGCA 10800 GCAGCTGCGG TACCAAAGGC AGCGGAAGCA GGGTCAACAT AGTCTGCTAT GCTGTGTCCA 10860 TACTAGCATA GTCAAGTCAG CGGTGGTGAC GTTGCCGCAG CAGCTGATCC ACAGGGTACG 10920 GCCTGGAATG TTTTGTCAGA GACGGCAGTG GCCTGGGCGT ATTAGTCAGA TACGCCAACA 10980 ACATGATACC CATGCGCAAC CATTCTTCCG GTGGCGGCAT GCTCGTAAAG TAGCGGCGGC 11040 GCATGCATCT CTCGAAGCAG CAGCAGCAAC AGAGGCGTCT CATAAGTGCA TGCGCAGCAG 11100 CGGTAGCAGC GGTGGTGGCA GCAGCAGGGA GATTTCATTG CTGCAGTCGC CAAATTACAT 11160 GCATCCTACG ACTCGACTCA CGCTTTTTGG CCCCTGGCCG ATCTTCATAT ATCTCAAATC 11220 GACGGCTGCT TTTACCCTGG AAAAAAAAAA AGGAGCTTGG GTTATATTGA ACTACACTAG 11280 GCGGCGACAC ACTCACCAGC AGCAGCCAGA ACAACAACAG CGGCAGAAGT AGCAGGAAAT 11340 TATCTCACTG CAAAATCCAA TTGGCACTTT CCGAAGTCCG TATTTCTCGC CTGGCCCCTG 11400 GCCAGTAACA GGGGCCTGTG CGACGGAGAT GACGACGATG ATCTGCCCTG TGGACGGCCT 11460 CAAGAAGGAA TCGGCCCTGT ACTGCCCACC TGACCTGTGC CAGGATAGCA GCAATGTCAG 11520 CGGACCATGG ATGGAAGAGG CGGCACTGGC GACGGTCCTC AGTTTTGCGG TTTCCGCGGG 11580 GCGTAGGCGC AGTAATCGGC GGCAGCAACA GTGGCGGCAG CAGAAGGGAA TGTGTATCTG 11640 CAGTCGCCGA ATGGCAATTT CCTGCCCAGC TGTAATGGAC CGACAAATGT TTTTTGGCAT 11700 GTCGACCTGT AAGAAAGAAG CAAGGATAAG TTTTTTCTTT ACAAGATTGT ATATGAATTT 11760 GTATTTACGG ACAACTGGCT TGTTTCCTGT CGACGATAAA TGGCGCTTCA TGTTTTCACT 11820 CTGCCAAAAT CTGAGTGCAA GCATCGGGGC TGACGGGCCG AATTTGCTGA TGCCTTGTAC 11880 ATGCTAGCAT CTTTATGCCG CCGTGTAATT TTGCGACAGC AAAACACATG ATGGAGAAGA 11940 CGAAGGTGAT CGATGGCGCC CGGATGACGG ATGCAGGCCC GTGCTACCCA CTGGTCCGTT 12000 GCCAGGACAG CAGCGTTTCA ATTATGCGAA CAGAGGCACT GGAGCCACTT CTCAGGCGAT 12060 AGGGATCATG AGGCGACGAC AACTCGCCAG CAGCAGTAAC AACAACAGCG GCAGCAGCGA 12120 TCTCGGACTT GCTGAACATT GCGGCTTTTT CCCAGCCTGG ACCGTCATCA CAAACGCTCT 12180 CAAAGATCGG TGCGCCTGCA GCCTACGGAA GCGTACAACT GCCCAAAGTC GTGCTATTGC 12240 ATAATGTTAG GTGTCCTGGC TGCTCCGGCG GATGAGCTCC ACCCGATTGA GAGAGGTAAG 12300 AAGGCCCAGC AAGTCGCCCT TAAATAAAAG AAACAAGCAT TAGACTCGGC TGAAATTGTA 12360 ACATCAGTCA GACTGTACTC ACGCATGCAC TTAGACAAAC CGAAGCCTAT TCTATTGACG 12420 ACGCGGACTC CAACACATGT TTTCCTCCAC AAAAGGCTGT GAGTGCACCA AAGTTGACGG 12480 GCCACGCCGG CCGATGCTTG CTGCATACCG GCATCTCCGC AGCAGCGACG TTACAAGCAC 12540 CACTAAAATT AGAAAGAGGC TTACTATAGG CAAAGCGCAG AAAAACAAAT ATTACAATAA 12600 GAAATAGCAC GCGATTTTTC TGCTTCGTTT CCGCTTGGTA CAAGTGAGAC CATTCTCCCT 12660 ATATGCCATT CTAGTATATT TGCCCGATAA GCGATATGCT GGCGGCAAAA AAAAAAGATA 12720 ATAGCCGATA AGCCCGCCAA AAAAAAAGCG CGAAATATCG ATAACGAGCT GGCACGAAAA 12780 TTGCTGGCAT ATCGATCAAC CGCTGTGTCT TTGAGCTATC GAAAAAGCCC GCCTACGCGC 12840 CTAGCCCAAA TTTGCAAGTC AGTTGAGATT ATAAAACCGA CAGAGGCGCG CGCCGAACAG 12900 TAGCTAAAAG TGAAGCCAGC AGCAACAACA ACAACTAATG GACGGCCAGA ACGTGAACCA 12960 AAGCGGAGGA TGGGCATTGG TCTTATCCAT CTCATCGGAC GATGGTAACT GCTCATCCTT 13020 GCCGCCATAG TCTCATCGCT GGATATCAAG TCATCGCTCA ACTATACCTT AAAATTACTC 13080 ACCAAAACTC TTTTCTCCTT TTCCATAAGA TAAAGTAAAG TAAAGTAATG TAAAGTAAAG 13140 TAAAGTAAAT TAAAGTAAAG TAAAGTAACG TAAAGTAACA TAATATTTAA ATTTAAATTC 13200 TACACTTGAA CAATGGCGCG CAAAACTGCC GCAATGTAAT TCAAAAATGT CTCCCGCAAA 13260 TTTAAAACAT AGATTAATAC TTGTAAGTAT GGCGCGCATA TCTGCGGCCA AGAAATCCGA 13320 AAATGTAATT TGCCACAAAT TGTCACTATA TATTTTTAAG CAAAAATCAG AGGACAATAA 13380 ATGCCAACGT CATTAGACGT TGAAAATATT CAAAAAAAAA AAAA 13424 // ID DM14101 standard; DNA; INV; 10654 BP. XX AC U14101; XX DR FLYBASE; FBte0001207; Dmel\TART-B. XX FT source U14101:1..10654 FT SO_feature non_LTR_retrotransposon ; SO:0000189 CC telomeric retrotransposon FT SO_feature direct_repeat ; SO:0000314:1..1046 FT SO_feature direct_repeat ; SO:0000314:9031..10076 FT SO_feature five_prime_UTR ; SO:0000204:1..961 FT SO_feature three_prime_UTR ; SO:0000205:7386..10637 FT SO_feature polyA_signal_sequence ; SO:0000551:10479..10484 FT SO_feature polyA_signal_sequence ; SO:0000551:10600..10605 FT SO_feature non_LTR_retrotransposon_polymeric_tract ; SO:0000433:10638..10654 CC derived from polyA tail of RNA transposition intermediate FT SO_feature CDS ; SO:0000316:962..4093 FT SO_feature start_codon ; SO:0000318:1..3 FT /name="Dmel\TART-element\gag" FT /db_xref="FLYBASE:FBgn0014071" FT /db_xref="SPTREMBL:Q23999" FT /db_xref="GI:603663" FT /db_xref="NCBI_PROTEIN:AAC46493.1" FT /translation="MDGHNGDQSEGWATVLSISSDDSNSLSSPPSIIVSSLDTTPTSHE FT TTIVRRSLYQTNADMKSYDFENIVLNENKNTILPDPLFVDKCGSTANTTEANEKKPANS FT PFPISISKNFSTSSPLTHVDTPTQEDDASAFNTLKAAKTARIIFPTHTHIKPTKPSPPS FT KELSTNSALKTLSYTDKITGTQKNLPDKTHVDTPTQDDDINATKASKTAKIISTQTHLG FT ETKPIQPAKDPSPRTQKPIAHKADETLTHTDKLTASQNLVPAKTHINTPTQYNDTNATN FT ALKTAKINFSSHSHQSEIKPTQSAKNISPLTQKQFTSESAGTHTHTDKHKNTASQNLFS FT AKTHINSPTQHNYTSAATASKTAKLILSPHSHLSETKPTQPALSPSPLSQKQITSIAAK FT TLTHTNKHTASQNFIPAKTHINIPTQYNDTNATKALKTAKAASPSHTYSRQTKPIKSAI FT NALHPAQDTNPSPAISAVTYTDKPTATQNIFPVKTFAELVRENAKRLPTPMQNSHQAKN FT DSAALGRPPTAARKNLNKTLISPKTPGKRRGDCLDEGLLQTSNKKVRIRDDFSDDDLGV FT TNLLSETPLFKSKAAIKIRQDSRRDSLQKSAEMDTAPAISPSNTAADSDLPPWKTVPAS FT RKPPSIFLSNIQQIIPLIEKLNYKAGVNSFTTKSELGNNIRIQAKTMDAHNAIQNVLLE FT ANIPLHSHQPKSAKGFQIVIRHLHQSTPTKWIESQLQDIGIATKFIRAMQFRDTRNPMR FT IHEVEVVPKADGSHLKVLLLKSLGGQTVKVERKRVSKDPTQCHRCQCFGHTKNYCRNPF FT KCMKCGQLHATVSCTKPKNLPATCANCNGSHVSSYKGCPAFQEAKQRLSINKIQSLHSQ FT PTHLQTPRNKHPYPKPTHLQTPRNKQPYTHPLPRTSVNNTKLPAKRIQGKKISQRNLSI FT NKRLHRMKKPRKETSPPTTSKKVLASLEESRKNPNSVLNPANTHLTHFRPPPLAQNIPN FT DEPKELSGEQYLLNRIEGMEKKINNLLEIVTRLLRQGKDCPKSPKNPFRDPIFV" FT SO_feature CDS ; SO:0000316:4131..7385 FT SO_feature start_codon ; SO:0000318:1..3 FT /name="Dmel\TART-element\pol" FT /db_xref="FLYBASE:FBgn0014072" FT /db_xref="REMTREMBL:AAC46494" FT /db_xref="GI:603664" FT /db_xref="NCBI_PROTEIN:AAC46494.1" FT /translation="MTRADNRDILKIAFWNAGGINNKIDELKLFILNIDAHIIIVTETR FT LDNNSTKLELPGYFTYLAQNPVSSKRGGVATIVNSSIRHMALKPIEKECIQSAPIVLLP FT ENNRRSEMIVIASVYCPPSLRWLPHHFTDVLNFAEKTLGGQTKFILCGDWNAKHRQWGC FT TRACQRGTALYEAVQADSTAEIIATGCATHFPHDTRKNPSAIDFSICKGLGRFEKRISS FT GADLSSDHLPILLEINLDTNTLFLQKQNNNILKKNTNIELFKKVLERKILLNTEIRVAE FT DINDAISTFMKNIKDSAAESTPSPRIRDNPRRRHRQANRNSHTLALDENTSRLLEEKRI FT LSRVFKATKNYEDKAKLKAAENRLKKAIKILRENRINEQVEGIDTSNPDRMRKMWKLLD FT EGKRTNQPNFPLKLETQKGPKWTKTIKETTETFVSHLEGRFKPNNNVPDYHIDRVNTGL FT RIIKESMLTERHNLNKNPHNQPITLKELNDEIKNLKNSKAPGKDLITNQLIKTLPTKAT FT LYLILIYNSILRLGYYPEAWKHAQVKMILKPGKSANEPRSYRPISLLSGLSKIFERLLL FT KRLFKVDLFKKAIPLHQFGFRKEHGSEQQIARVTQFILEAFERKEYCSAVFLDISEAFD FT RVWHEGLLLKLAKILPYNLYIILESYLTNRTFEVKDQAGETSRTGQIGAGVPQGSNLGP FT LLYSIFSSDMPLPYIYRPSPTERIMLSTYADDTIVLSSDTLATAATRNNENYLKSFSDW FT ADKWGISVNAAKTGHVIFTLKNDLPTSLRTMKIKGQVIKIESKQSYLGVILDSKLTLSS FT HVTKLMGKYTTAYRKMTWILNRRSKLPTKTKMLILKSVLSPIWQYAIAAWGPLVTDAQI FT RRIQVEENRKMRDICRAGRYTSNQTIRDRYGIKTVEEFYQQALHRFSETIKSHPNIAVR FT RIFTRHYIPNRLERSRQRYLKMTNEHITQKQTGQTLSPKLLKIPDLNDCRTLKKRNERD FT KIRQTHLIELPTLLRLEEEEEELRRIKKQEERERREKETQKWPPDRWCELEINLYNKQY FT RRGDLTRQEIIQKFRGQPLNVQRIILPDYKGDQEHN" XX CC A PNTR (Perfect Non-Terminal Repeat) is a perfect direct repeat partially CC overlapping the UTRs (annotated as "direct_repeat ; SO:0000314"). CC Distinguishing characteristics of PNTR’s are that the 3’ repeat terminates CC upstream of the 3’ end of the element and that the 5’ PNTR extends a short CC distance into ORF-1. The 5’ ends of TART-B elements are variable and the CC minimal size for functionality has not been determined. Thus, this CC canonical sequence, U14101, may be 5’ truncated within the 5’ PNTR (M-L CC Pardue, 2009). XX CC Derived from U14101 (g603662) (Rel. 42, Last updated, Version 1). CC Takis Benos and Michael Ashburner, 20-Aug-1997; updated Jan-2009 as per CC Mary-Lou Pardue and Greg DeBaryshe. CC Any changes to original sequence record are annotated in an FT line. XX SQ Sequence 10654 BP; 3669 A; 2717 C; 2036 G; 2232 T; 0 other; GATCCGGCCG GATGGCAGCT CGACGACGGT AGCAGGCCAC CATGCCCGCC AGCCCGCAGC 60 TAGGATAGCA GCAACATCAG CGTCTTATTA ACGCGAACGG CGGCACTGGC CCTTAGCTGA 120 CCAGCTGCAA CAACATCAGC GACGCAGTCT CCACCAGCAG CAACAACAGC AGCGGCGCTT 180 GCGACAGCAG CAGCAGGGAA TGGTTCTGCC GCAGTCGCCT ATTGCTGCCT ATAAAGAGCA 240 TTCCTTGCCA ATTGGCTTTC TGTACGACGA CGATGATCCT GCGGACAAAT CCACCTTTCC 300 GGACGCCTGA GTATTATGGC GAGCCTGCTG ATCATTGTTT CTCCGACTCC TTACTTGACC 360 ACTGGACAAT CATACAATCA CCGGCTTTTC ACATCTGGAA GAAAGAAACC TGGATTAGTA 420 TTTGCCCTTC AGATTTGTAT GAAACTGCAT TTCTGGCCAA CCGGAGTGTT TCCTGCAGAC 480 GACGCTGGAC TGCGACGCAC TTTTTTCTAC CAACACAGAT GGGACGCTTG CATCAGATCT 540 GACGGGCCAG ACTGGCCGAT GCCTGGTACA CGATGGCATC TCCGCGGCGG CGAGATGTGC 600 AGCGACGCTG AAAGCAATAA TAATTCTTTT ACTTTGCAGT ATCAAAAATG AGAAGCCACA 660 TCACAATTTA CATCAGCAAA AATTACACGT GATATCTTTT TCTTTTGCCT AGGAGTAGTG 720 AGACCTGCTA CCAAAATGAC CAGTAATACC GGCTAACGGA AGCGAGATAT CGATAATCAT 780 TCTGGCGGTA AAATAGCCAG AACATCGATA ACCAGCTGTG CATTTTCCCT TCGATTTATC 840 GAAGTCAAAT AGCCCGCCTA GGCTATCGGA CCGGATCGGC AAGTCAGTAG TGATTAAAAA 900 TCCGGCAGAG GCGCCTGTGC AGCAGCTACC CAAAGTGAAC ACGACGAAAC GCAACAACAA 960 AATGGACGGA CATAATGGAG ATCAAAGTGA AGGATGGGCA ACAGTGCTAT CTATCTCCTC 1020 GGATGATAGT AACTCCTTGT CGTCGCCGCC GTCTATAATA GTTTCATCGC TGGACACCAC 1080 GCCAACTTCG CACGAAACCA CCATAGTAAG AAGAAGCCTA TATCAAACAA ATGCTGACAT 1140 GAAATCTTAC GATTTTGAAA ATATTGTATT AAATGAGAAT AAAAATACCA TATTGCCAGA 1200 CCCTTTATTT GTTGATAAAT GCGGGAGTAC TGCTAATACC ACAGAAGCCA ATGAAAAAAA 1260 GCCTGCCAAT AGCCCCTTCC CCATTTCCAT TAGCAAGAAT TTTAGCACTT CCTCGCCACT 1320 AACACATGTA GACACGCCTA CACAAGAAGA TGACGCCAGT GCGTTCAATA CATTGAAAGC 1380 AGCTAAAACA GCTAGAATAA TTTTTCCCAC ACACACACAT ATAAAGCCCA CCAAACCCTC 1440 GCCCCCCTCC AAAGAATTAA GCACAAACTC AGCACTAAAA ACTCTCAGCT ACACAGACAA 1500 AATAACAGGA ACACAGAAAA ATCTACCCGA CAAAACACAT GTAGACACAC CTACACAAGA 1560 TGACGACATT AATGCAACCA AAGCATCAAA AACCGCTAAA ATAATTTCTA CACAGACACA 1620 CCTAGGTGAA ACCAAGCCAA TACAGCCCGC CAAAGACCCC TCACCCCGCA CCCAAAAGCC 1680 TATTGCACAC AAAGCTGACG AGACACTTAC CCACACAGAC AAACTCACAG CATCACAAAA 1740 CCTCGTTCCC GCCAAAACAC ATATAAACAC ACCCACACAA TATAACGACA CTAATGCAAC 1800 CAATGCATTA AAAACCGCTA AAATAAATTT CTCTTCACAC TCACACCAAA GTGAAATCAA 1860 GCCAACACAG TCCGCCAAAA ACATTTCACC CCTCACACAA AAGCAATTCA CAAGCGAATC 1920 AGCCGGGACA CACACCCATA CAGACAAACA CAAAAACACA GCATCACAAA ATCTCTTTTC 1980 CGCCAAAACA CACATTAACT CACCCACACA ACATAACTAC ACTAGTGCAG CCACAGCATC 2040 AAAAACCGCT AAATTAATTC TCTCCCCACA CTCACACCTA AGTGAAACCA AGCCAACACA 2100 GCCCGCTTTA AGCCCCTCGC CCCTCTCCCA GAAGCAAATA ACAAGCATAG CAGCCAAGAC 2160 ACTCACCCAC ACAAACAAAC ACACAGCATC ACAAAACTTT ATTCCCGCCA AAACACATAT 2220 AAACATACCC ACACAATATA ACGACACCAA TGCAACCAAA GCATTAAAAA CCGCAAAAGC 2280 AGCTTCTCCC TCCCACACAT ACTCACGTCA GACAAAACCA ATAAAGTCCG CCATAAACGC 2340 ATTGCATCCC GCCCAAGACA CAAACCCAAG CCCAGCAATC AGTGCTGTCA CTTACACAGA 2400 CAAACCCACA GCTACTCAGA ATATTTTTCC TGTCAAAACT TTTGCAGAGC TGGTTAGGGA 2460 AAATGCAAAA CGCTTACCAA CTCCAATGCA GAATTCCCAT CAAGCTAAAA ATGACTCTGC 2520 CGCTCTCGGA CGCCCCCCGA CTGCAGCTAG AAAAAATCTA AATAAAACAC TGATTTCTCC 2580 TAAAACTCCT GGGAAGCGCC GTGGGGACTG TCTTGATGAA GGCCTACTAC AAACCTCTAA 2640 CAAAAAGGTT AGAATACGCG ATGACTTCTC TGACGATGAT CTTGGGGTCA CAAATCTACT 2700 CTCTGAAACA CCCTTATTCA AAAGCAAAGC AGCTATCAAG ATCCGGCAAG ACTCGAGAAG 2760 AGATTCCCTG CAGAAGTCAG CCGAAATGGA CACAGCTCCA GCAATTAGTC CCTCAAACAC 2820 AGCAGCCGAT TCCGACCTAC CGCCCTGGAA AACTGTTCCA GCTAGCAGAA AACCACCATC 2880 AATCTTCTTG TCCAATATAC AGCAGATTAT CCCGCTAATA GAAAAACTAA ACTATAAAGC 2940 CGGGGTAAAT AGCTTTACCA CCAAATCTGA ACTTGGCAAC AATATTAGAA TCCAGGCTAA 3000 AACGATGGAC GCCCACAATG CAATTCAGAA TGTTCTCCTT GAGGCAAATA TTCCCCTACA 3060 CTCCCACCAG CCAAAGAGTG CAAAGGGCTT CCAAATTGTA ATTAGGCACC TCCACCAGTC 3120 AACCCCGACC AAATGGATTG AAAGCCAACT TCAAGACATC GGTATAGCTA CAAAATTTAT 3180 CAGGGCAATG CAGTTTAGGG ACACGAGAAA TCCTATGCGC ATTCATGAGG TTGAAGTTGT 3240 ACCCAAGGCT GACGGCAGCC ATCTCAAGGT CCTGCTACTA AAATCCCTTG GAGGTCAAAC 3300 GGTCAAGGTT GAAAGGAAAC GGGTATCGAA GGATCCCACA CAATGTCATC GCTGCCAATG 3360 TTTTGGGCAC ACAAAAAATT ATTGTAGAAA CCCGTTTAAA TGTATGAAAT GTGGCCAGCT 3420 GCACGCCACG GTTTCATGCA CTAAACCCAA AAACCTTCCG GCTACTTGTG CAAACTGCAA 3480 TGGAAGCCAC GTAAGCAGCT ATAAAGGATG TCCCGCTTTC CAAGAAGCAA AGCAAAGACT 3540 ATCTATCAAC AAAATTCAAT CCCTACACTC ACAACCCACG CACCTTCAGA CCCCCCGCAA 3600 TAAACATCCC TACCCAAAAC CCACCCACCT TCAGACGCCC CGCAATAAGC AGCCCTACAC 3660 ACACCCCCTC CCTCGCACAT CAGTAAACAA CACAAAACTA CCTGCCAAAA GAATCCAAGG 3720 AAAGAAGATA TCGCAAAGGA ATCTATCTAT AAACAAACGC TTACACAGAA TGAAAAAACC 3780 GAGGAAGGAG ACAAGCCCGC CGACAACTAG CAAAAAGGTC TTGGCCTCTC TAGAAGAAAG 3840 CAGAAAAAAC CCAAATAGCG TCCTAAACCC GGCCAACACC CATCTCACTC ATTTCCGCCC 3900 ACCCCCTTTA GCACAAAATA TTCCTAATGA CGAACCTAAG GAGCTGAGTG GGGAGCAATA 3960 CCTTCTAAAT CGCATTGAAG GGATGGAAAA GAAGATCAAC AACCTTCTTG AAATCGTCAC 4020 CCGCCTACTA AGACAAGGAA AAGACTGTCC AAAGTCTCCA AAAAATCCTT TCCGAGATCC 4080 AATCTTCGTG TAAATGCTCT TTCTAGTAAC ATCAGAAAGT GACGTTTCCT ATGACTCGGG 4140 CTGACAACAG GGACATCCTT AAAATCGCTT TCTGGAATGC TGGTGGGATT AACAATAAAA 4200 TAGATGAGCT TAAGCTGTTC ATTCTAAATA TTGATGCCCA CATAATCATA GTCACCGAAA 4260 CTAGACTAGA CAACAATTCT ACCAAACTAG AGCTGCCAGG ATATTTCACA TACTTAGCCC 4320 AAAATCCTGT CTCTAGCAAG AGAGGAGGGG TCGCTACTAT AGTAAACAGC AGTATCCGAC 4380 ACATGGCCCT AAAACCGATC GAAAAAGAAT GCATACAAAG CGCCCCAATA GTCCTGCTGC 4440 CTGAAAACAA CAGACGCAGC GAAATGATAG TAATAGCATC TGTCTACTGT CCGCCCTCGC 4500 TAAGGTGGTT GCCCCACCAC TTTACTGACG TTCTCAATTT TGCAGAGAAA ACTTTAGGAG 4560 GGCAGACCAA GTTTATCCTA TGTGGCGACT GGAATGCAAA ACATAGACAA TGGGGTTGTA 4620 CACGCGCCTG CCAACGTGGC ACCGCACTCT ACGAAGCAGT CCAAGCCGAC TCCACTGCAG 4680 AGATCATTGC CACTGGCTGT GCTACACATT TCCCACATGA CACAAGAAAA AACCCGTCAG 4740 CAATAGATTT CTCCATTTGC AAAGGGCTTG GCAGGTTTGA AAAAAGAATT TCTTCAGGGG 4800 CGGATCTATC CTCAGACCAT CTTCCCATCT TGTTAGAGAT AAACCTAGAC ACAAACACCC 4860 TCTTCTTGCA AAAACAAAAC AACAATATAC TCAAGAAAAA TACAAACATC GAGCTGTTTA 4920 AGAAAGTTCT AGAAAGAAAG ATACTATTAA ACACTGAGAT AAGGGTAGCA GAAGATATAA 4980 ATGACGCCAT AAGCACCTTT ATGAAAAACA TCAAGGACTC GGCTGCGGAA TCAACTCCCT 5040 CCCCAAGAAT ACGTGACAAC CCCAGAAGAA GACATAGGCA AGCCAACAGA AACAGTCATA 5100 CCCTCGCACT AGACGAAAAC ACAAGCAGAC TGCTTGAGGA AAAACGCATA TTAAGTAGAG 5160 TTTTCAAAGC TACCAAAAAT TACGAGGACA AAGCTAAACT AAAGGCAGCT GAAAACCGAC 5220 TAAAAAAAGC GATAAAAATA TTGAGAGAAA ACAGAATCAA TGAGCAAGTT GAAGGAATAG 5280 ATACAAGTAA CCCGGACAGA ATGAGAAAAA TGTGGAAACT GCTAGATGAA GGGAAAAGGA 5340 CAAATCAGCC TAATTTTCCC CTCAAATTAG AAACCCAAAA AGGACCCAAA TGGACAAAAA 5400 CGATTAAGGA GACAACAGAA ACATTTGTCT CCCACTTGGA AGGAAGATTT AAGCCAAACA 5460 ATAATGTACC TGATTACCAC ATAGATAGAG TCAATACTGG ACTAAGAATA ATTAAGGAAA 5520 GCATGCTAAC TGAACGACAT AATCTGAACA AAAACCCCCA TAACCAACCT ATTACTCTAA 5580 AGGAATTAAA TGACGAAATA AAAAACTTAA AGAATAGTAA AGCACCGGGA AAAGACCTTA 5640 TAACAAACCA GCTAATAAAA ACCCTACCGA CTAAAGCTAC CCTTTACCTT ATCCTAATCT 5700 ATAACTCCAT ACTTAGACTA GGATACTACC CAGAAGCCTG GAAACATGCG CAGGTAAAAA 5760 TGATTCTCAA GCCAGGGAAA AGTGCAAACG AGCCAAGGTC ATATAGGCCG ATTAGCCTAC 5820 TCTCGGGACT CTCAAAAATC TTTGAAAGAC TACTCTTAAA AAGACTTTTT AAGGTAGATT 5880 TATTCAAAAA AGCTATTCCT CTGCACCAAT TTGGCTTTAG AAAAGAACAC GGATCGGAGC 5940 AGCAAATAGC CAGGGTCACC CAGTTCATTC TTGAGGCCTT CGAGAGAAAG GAATACTGCT 6000 CCGCGGTCTT CCTTGACATC TCTGAGGCTT TCGACAGGGT ATGGCACGAA GGCCTTTTAC 6060 TTAAATTAGC TAAGATCCTA CCTTACAACT TGTACATTAT ACTGGAGAGC TACCTAACAA 6120 ATAGAACGTT CGAAGTTAAA GACCAAGCTG GAGAGACTTC GAGAACAGGA CAAATTGGTG 6180 CTGGTGTGCC TCAAGGAAGC AATCTTGGAC CACTACTCTA CTCTATCTTC TCCTCAGACA 6240 TGCCCCTTCC ATATATCTAC CGCCCCTCAC CAACAGAAAG AATCATGCTC TCAACATACG 6300 CAGACGACAC TATAGTCCTC AGCTCAGACA CACTAGCAAC TGCCGCTACA AGAAACAACG 6360 AAAACTACCT CAAGTCATTC TCGGACTGGG CGGACAAATG GGGTATATCA GTAAACGCTG 6420 CTAAAACCGG ACATGTCATT TTTACATTAA AAAACGACTT ACCTACAAGT CTAAGGACTA 6480 TGAAGATCAA GGGTCAAGTA ATAAAGATTG AAAGCAAACA ATCATACCTT GGCGTAATCC 6540 TTGACAGCAA GCTAACCCTC AGCTCCCACG TCACAAAGCT GATGGGCAAA TACACTACAG 6600 CCTACAGAAA AATGACATGG ATTCTAAACA GAAGAAGCAA ACTCCCTACC AAGACTAAAA 6660 TGCTGATCCT TAAGTCAGTC CTTTCACCAA TATGGCAGTA TGCCATAGCA GCTTGGGGTC 6720 CCCTTGTGAC GGATGCACAG ATAAGACGGA TCCAAGTCGA GGAAAATAGG AAAATGAGAG 6780 ACATATGCAG AGCGGGTAGA TACACGAGCA ACCAAACTAT AAGGGACCGC TATGGAATCA 6840 AAACAGTAGA AGAATTCTAT CAACAGGCAC TCCACAGGTT CTCAGAAACA ATAAAATCTC 6900 ACCCAAATAT AGCTGTACGC AGGATATTCA CAAGGCACTA TATCCCGAAC AGACTAGAAA 6960 GAAGCAGGCA GAGGTACTTG AAAATGACAA ATGAACACAT CACGCAAAAA CAGACTGGAC 7020 AAACACTCTC ACCTAAACTC CTAAAAATCC CTGATCTAAA TGACTGCAGA ACCCTTAAAA 7080 AGCGGAATGA AAGAGATAAA ATAAGGCAAA CCCATCTAAT TGAACTCCCC ACCCTGCTGA 7140 GACTAGAGGA AGAAGAGGAA GAGCTTAGAA GAATAAAAAA ACAGGAAGAG AGGGAAAGAA 7200 GGGAAAAGGA AACCCAAAAG TGGCCTCCAG ACAGATGGTG TGAATTAGAA ATTAACCTAT 7260 ATAATAAGCA ATATAGAAGG GGCGATCTAA CCAGGCAGGA AATCATACAA AAATTTAGAG 7320 GACAACCACT AAATGTACAG AGGATAATTT TACCCGACTA TAAAGGAGAC CAGGAACACA 7380 ATTAAAAGTA AATCATGGGA AAGCAGGGGA AAAAAAACAG AAGTAACAAA ATGGCGGAAG 7440 GGGTGGCAAA ATATATATAA AAATAAGAAA AGATAGAAAT AAAAAGGCTA AAGGCTCACT 7500 TACAGGTTAA TTCAAAAGGG AAACGTGCTT ACATATCTAA TGGTAAAAAC TAACTTATAA 7560 CACCTACTGG ATGACATAGT GAGGATGCCA CAGGTTGCGC ACTTGAATCA CGCTTTCCTG 7620 GCGAGATTGT TAAGGCATCA CCGGGATCCC GTCTCTCTTT CCTAACTGGA GGACTCATGC 7680 CTGAAATCTT TTCCGCTTCA CCGGCACCTG ATGGCCATAT CTGCTACTGC GCCTTGCGTC 7740 CACGGACGCT CCTTCCTGAA AGAAAGAGAA TTTGTTTTAG TTTTCCTTTC TCTTCTTAAA 7800 AATATAACAA AAACAGCAGC AGTAGCCGAC CAACAACATA CTTAGCTTAC CAAGGCAGCA 7860 GCAATGATAC CAACAGAAGC CCTACAGTGT GCTGAACAAT ATGCCGCCCA CGCCCACCAC 7920 TTCTGGAACT CAGGAATGGG GGGTACGGAA TGCCGGAAAC TGGAGGATTC GCCTCAAATG 7980 TTACGCTTAC ATCTTTGAGC AAATCGCCTG CCTCCTCGTC TAACGGCCCG GCGTCTTGGT 8040 ACGCCCAGAA GTAGCAGCGG TAGCAGGATT AGCAGCCTCC ACAGAGATAT GTTCATCCCA 8100 GCATCAGTCC AGTTGGCATT GTGATGCCGC CGTAGCGTAC GCCCTCAGAG ACCCGACTGG 8160 AATCCCAGGA CAAGAGACGG CAGCACGCCT GGGCTTAGGC GCGGGACAAC ATGCAGAGAT 8220 TCGTCAATGA GAATGGCGGC ACTGGAATCA CCTTTCAGCT GAGCGGGATA ATGAGTCGGC 8280 AACGCACCGC ACTATCAGCA GCAATAACAA CATCGGCAGA TGACCTGGAA GAAAGGAAAA 8340 AACATGTATC AGTCTTTTCT TTTCTTTTTT TTTCCCATTA GCATGCGTTT TTAAATTCCA 8400 TTCCTGAAAA CCGGCGTTTT CCTGTAAAAG ACACTGGACG GCGGCGTTTG TTTTAAATGC 8460 AAAGATTGGA TGCTTGCATC AGGGCTGACG TCCTTGAATA GCCGATGCCT TGTAATTGCC 8520 TGCATAGCCG CGGAGGTCCT GATGACGGAT GCTGGCCTGT ATTTGGCCAC CACTCCGATG 8580 CCATGACAGC AGCAACAGCA GCGGTTTTTG CAAATGAGAG GGATCAGGAG GCGGCAACAC 8640 ATTCACCCGT AGCAGCAACA ACAAGCAGTG GTAGCATCAG CAGGGAGTCT TCTCGCCACA 8700 ATAGCCATTT GGAAATTTCT CGACGACCCG ACTTCCTGCT TGGCCCATGG TCAATCACAC 8760 TGGACCAGTT AACAGCGGCG TTTTACCCTG GAAGAAAGAA AACTTGTATT ATTCATTCCC 8820 TTTTCTCTCA CAGTTGGGTA TTTAAGTGCA TTCCTGGCCA ACCTAGCGTG TCTCCTGGCA 8880 ATGACGTCGG ACTCAACGCA TGCTTCCCTT CCGACACAGT AAGGATGTTC GCATCTGGGC 8940 TGACGGGCCA GGCCGGTCCG TTGCCATACA TGCTAGCGTT TCCGCGGCGG CGTAGTGAAC 9000 ATCAAACCGT ATAATGGCGA AGACGACGAT GATCCGGCCG GATGGCAGCT CGACGACGGT 9060 AGCAGGCCAC CATGCCCGCC AGCCCGCAGC TAGGATAGCA GCAACATCAG CGTCTTATTA 9120 ACGCGAACGG CGGCACTGGC CCTTAGCTGA CCAGCTGCAA CAACATCAGC GACGCAGTCT 9180 CCACCAGCAG CAACAACAGC AGCGGCGCTT GCGACAGCAG CAGCAGGGAA TGGTTCTGCC 9240 GCAGTCGCCT ATTGCTGCCT ATAAAGAGCA TTCCTTGCCA ATTGGCTTTC TGTACGACGA 9300 CGATGATCCT GCGGACAAAT CCACCTTTCC GGACGCCTGA GTATTATGGC GAGCCTGCTG 9360 ATCATTGTTT CTCCGACTCC TTACTTGACC ACTGGACAAT CATACAATCA CCGGCTTTTC 9420 ACATCTGGAA GAAAGAAACC TGGATTAGTA TTTGCCCTTC AGATTTGTAT GAAACTGCAT 9480 TTCTGGCCAA CCGGAGTGTT TCCTGCAGAC GACGCTGGAC TGCGACGCAC TTTTTTCTAC 9540 CAACACAGAT GGGACGCTTG CATCAGATCT GACGGGCCAG ACTGGCCGAT GCCTGGTACA 9600 CGATGGCATC TCCGCGGCGG CGAGATGTGC AGCGACGCTG AAAGCAATAA TAATTCTTTT 9660 ACTTTGCAGT ATCAAAAATG AGAAGCCACA TCACAATTTA CATCAGCAAA AATTACACGT 9720 GATATCTTTT TCTTTTGCCT AGGAGTAGTG AGACCTGCTA CCAAAATGAC CAGTAATACC 9780 GGCTAACGGA AGCGAGATAT CGATAATCAT TCTGGCGGTA AAATAGCCAG AACATCGATA 9840 ACCAGCTGTG CATTTTCCCT TCGATTTATC GAAGTCAAAT AGCCCGCCTA GGCTATCGGA 9900 CCGGATCGGC AAGTCAGTAG TGATTAAAAA TCCGGCAGAG GCGCCTGTGC AGCAGCTACC 9960 CAAAGTGAAC ACGACGAAAC GCAACAACAA AATGGACGGA CATAATGGAG ATCAAAGTGA 10020 AGGATGGGCA ACAGTGCTAT CTATCTCCTC GGATGATAGT AACTCCTTGT CGTCGCTGCA 10080 TATATAAAAT AATAAATTTC TTAAAATAAT TTCATCGCTG GATTCCTGCG CCACCATAAA 10140 TTACTTATAG AATACACTTA ACACTGTACC CACTAATGCT AAAAATTTTC TTATACAATT 10200 TTACTTTAAA GCTAAAACTA CTTAAACTAT GGCGCGTAAA ACGGCCGTCA AAAATATCCA 10260 AAAATTGTAC TTGCCATAAA CAAATTCTAA CATAATGTAA ATCCTAAATC GTAAAATCAT 10320 GGCGAACATA ACCGCCGCCA AGCAAATCAA AAAATGTTCC TAGAAATTGT AAATCTTAAA 10380 CCTACTTCTC TAACTAAAGC GCGCACAACT GCCGCTGATC CGAAATTGTA AAATGCCATA 10440 AATTGTAACT ATATATTTTA TAAAAAAAAT CAGAGTACAA TAAAATGACA GCGCCGAAAG 10500 GCACTGAAAA TATTTAAAAA AAAAAAAAAC TGCCGCTGAT CCGAAATTGT AAAATGCCAT 10560 AAATTGTAAC TATATATTTT ATAAAAAAAA TCAGAGTACA ATAAAATGAC AGCGCCGAAA 10620 GGCACTGAAA ATATTTAAAA AAAAAAAAAA AAAA 10654 // ID TIRANT standard; DNA; INV; 8526 BP. XX AC nnnnnnnn; XX DR FLYBASE; FBte0000179; Dmel\Tirant. XX SY synonym: prygun XX FT source X93507:1..2484 FT SO_feature five_prime_LTR ; SO:0000425:1..417 FT SO_feature three_prime_LTR ; SO:0000426:8109..8526 FT SO_feature CDS ; SO:0000316:1866..2999 FT SO_feature CDS ; SO:0000316:3239..6505 FT SO_feature CDS ; SO:0000316:6683..8146 XX CC Sequence identified by REPBASE: CC http://www.girinst.org/server/RepBase/RepBase6.6.embl/drorep.ref CC Assembled and annotated by Josh Kaminker & Michael Ashburner. CC REPBASE states this to be a consensus sequence. CC This replaces that from X93507 in versions previous to 4.8. XX SQ Sequence 8526 BP; 2961 A; 2097 C; 1384 G; 2084 T; 0 other; GGAGTTACCA CCCCACCCCC TAAACCCCCA CGCCTCTAAA CAAATCATCG GACACTCAAC 60 CGGGAAGACG GCAACTGGAA CACCGCATCC GGCCGAATGC TGACATTCCG GCCGAATGCT 120 GACATTACAC AAAAGTCGCA CTGCAACATT GTCCCCAGCT AGCCAGCCAC ATGCCGAGTC 180 GGCATGTTCA TTATGCTTAC AATTAAGAAC CTATGTACTT ATGTATAAGA CGAAAACGGA 240 GGACTCGAGT AGCCACTCTC TGACAATAAA CTTGATACTG ATTTTGAACT TCAAGAAAGT 300 CAGTCGTATT CTTTATTGGA AATCTTCACA CTACAACTAT CTGCTGAAAC TTAAAAACCT 360 TCATACATTT ACACATCATA TCTTCACAAA AGGCTCCACC CTCGATCACG GACTTAACTG 420 GCGCAGCCGG TAGGATGTCC TACCTATTAA TAATTACCTA CCTGTAAGTA AACATGTAAG 480 AAACGAAACA AACTATATGC AAGATGTCGA CTGAAAGTGA CTAGGAACAA ATTTTTATAA 540 AACAAAATTG AAGTTGTGAA GTACCAAATG AAACTCAAAC ATATATTCAA ACACAGGAAA 600 AAAAAAGAGA GAGGAAAAAT GTAAAATAAA TAAATATACA AAAAAAAGTG CAAGTGTACC 660 GTACTGCCGC GCTGACGTGG AATCTATCGC TGATCATCAC GCCATCGGTA TGTCCATACT 720 CTGCCGAACG TCATAATTTT TTTAAAAAAG TGCAAGTGTA CCGTACTGCC GCACTGACGT 780 GGAATCTATC GCTGATCATC ACGCCATCGG TATGTCCATA CTCTGCCGAA CGTCATAATT 840 TTTATAAAAA AGTGCAAGTG TACCGTACTG CCGCGCTGAC GTGGAATCTA TCGCTGATCA 900 TCACGCCATC GGTATGTCCA TACTCTGCCA AACGTCATAA TTTTTATAAA AAAGTGCAAG 960 TGTACCGTAC TGCCGCGCTG ACGTGGAATC TATCGCTGAT CATCACGCCA TCGGTATGTC 1020 CATACTCTGC CAAACGTCAT AATTTTTATA AAAAAAGTGC AAGTGTACCG TACTGCTGCG 1080 CTGACGTGGA ATCTATCGCT GATCACCACG CCATCGGTAT GTCCATACTC TGCCAAACGT 1140 CATAAGTTTT TATAAAAAAA AAGAGTGCAA GTGTACCGTA CTGCCGCGCT GACGTGGAAT 1200 CTATCGCTGA TCATCACGTC ATCGGCACTT ACATACGCTG GCCAACGCAT CGCCAAAGCC 1260 TCTATATACA CTTATATATG TGAGCATACA ATATCAACTA CAATCCAATA CATCCACGTA 1320 CTGTACCGCC TCGTTGGCAT GGAATCAAAC GCTGATCACC ATGCCACCGT GGTAAACAAA 1380 CAAAGCACCA AAGCCTCTCT AATACATTGT ACACTCAAAA CGCACACTGC CATACGTCGG 1440 CGAAAAATCA AAACATAAGC AAAAATCATT TCAAACCAAG CGAGGCTCAT TCTGCGTACC 1500 ACAACGACAA CGACACTGCA TGTGTAGTGG CGCACCCATG TCTGGGTAGC CGAGGTAAGG 1560 GGAAAACGCT TGAGTATCGT CAAGTGTTCT TGCCTTTCAC TCTTCTACAA TGGGTTGCTA 1620 CGCTCATGTA TTGCACATTC AAAATAACCA AAACAAATGT ACTAAAGAAG TCGACATATA 1680 CAGATATATT TTGTTTCCTT TCATTGTGTA ATTTTGTATA TCAAACAAAT ACTAATACCA 1740 ATCACATTGC AGAATATAAA AGGGAAAATA TAAAGCCAAA GACAGACACC CATACACTCT 1800 AGTAAACAAG AAATTTGTTC ATTATTTTTC AATCATACAT AATATACTAA GTAACCTCAA 1860 ATTTAATGTC AAAAAAGTTC GTTTACAACC TTAGGAAAAC TACACGTTCA GTTGTTGGAG 1920 TTCCACCAAA CACTAATAGG CCCCCACATC CCGTTAGACG TCCTGACTCC CTTCTCCCGA 1980 TTTCGGAAGA ACCCAAATCA ATATCTTCCC AAACCCCCAA TATGGACTCG GGAAACGATT 2040 CTGCCCGCCC CACTCCATCC CCTCTGGCGC CCACTGTCAG TGGTATTAGC TCCTTAATTT 2100 CAACTACGTT CAAGCCTAAA GATATCATGG CATTTGTTGA GCATTTGCCA ACCTTTGATG 2160 GTACACCTCG TCTATTGGAC AGGTTTATCA CTAGCGTAGA AGAAATCCTG ATGCTCATCA 2220 GGGGAGCTGA CCAAACACCG TATGGCCTGC TTACTCTGAG GACCATCAGG AACAAAATCA 2280 TTGATAGGGC CGACGAAGCC TTGGAACTGG CAAATACCCC CTTGGTTTGG GATGAGATTA 2340 AAAGCAATCT CATCCGCCTC TACTCGAGCA AGAAAAGCGA GGCCAACTTG TTAAGCGAGC 2400 TTAACACATT TTCGGACAAC CTGACCTTGG GCCAACTGTT CTTTGGTATA TCAAAGGTGA 2460 GAAGCCAACT CTTCTCCATA CTCAAAAACA GCGAACACAA CAACACTGTT GTAGATGCAA 2520 AAAAGGTTGT CTACAACGAG GTTTGTCTCA ATGCTTTTAT GACTGGTTTG AAGGAACCTC 2580 TCAAGACTTT CGTCAGGATA AAGTCCCCTT CTACACTTGA ACAGGCGTAC GAGCAATGCC 2640 AAATAGAGCA GACCTTATAT AGGGCACAAA ACAAGCGAAC CAACAGACCA GAGCAGGGAC 2700 CCAATGGATC AGACAATAAA ACCTACCGAA ATAGCTACGA CAGCAATTAC CGCAGCGGAC 2760 GTAACGACCG AAATGACCGT AGGGGACCCT ACTCTAACTC TAACTCTAAC TCTAACTCTG 2820 GCCAAAATAG ACCATTTAAT TCACACAATC GCACACCCCA ATCCGGCACC AAGGACAACC 2880 GGGCCAATAC ATCAAACCCC TTTCGAGCAC CTTCACATAG TTTGAATAAT ATAGAGGAGA 2940 ACCCTCAACC TGATTCGAAT TTTCAGCAAA CGGCCTCGGG AAACCAACAG GGTACATAAG 3000 CCCAGCCACG CACAACCCCT CGCTTCCTTT TATAAAAATC AAACTATCCC AGACAAACCC 3060 CCTGAAGTTT TTAATTGACA CAGGCTCTAC ACACTCCTTC ATCGACCCAA AATATGTCGA 3120 CCCTAGGAAC TGTGTGACCT TAGATACGCC CATAACACTC AAAACAGCCC TGAACAGTTT 3180 TAAAATATAT CAAAACGTCT CTATACCATT TCCACCGGAA TTCCAAATCA CGGGCAAAAT 3240 GACCCTTCTA CCTTTCAAGT TCCACTCTTA TTTTGACGGA TTGATAGGAA TGGACTTATT 3300 ATCTTACCTA AAAACAGAAA TAGATTTACT TAACCTAAAT CTAAAAACCC CAAGTACCAT 3360 TATACCCTTA TGGACCCACA GTAACTCAAC TTCAAACGTA TTTAATATCT CTGGACATAC 3420 GAAAACTATT TTGCCACTAC CAGTGGAAAC CAAACAGGGC GACTTCTACA TCGATTCAAT 3480 TACAATCAAT GATGACTTAA TAATATCAGA CGGGATTTAT AATGCCCAAA ACAATATTGC 3540 TAATTTCGTT ATCACAAACT ATAGCGAGAG GGATCAGTTA TTGTACCTCG AGAGCCCGAT 3600 AAAAGGCATG CCATACTCCA CGGCCAACAA TGTTGAACTT TTCAGTATCA CTTCAGACAC 3660 CCCACAGCCC CAAAACTCCG CAGCGTCGTT ACAAGCCCTT GGCGTCGATC ACCTCTCCTC 3720 TGAAGAGAAA CAAAGCCTAC TTTCACTTTG CAAAAGTTAT CTAGATATCT TCTACAATGA 3780 AGACAAATCA TTGACCTTCA CCAACAAGAT TACACACACG ATTAAAACCA CGGACGACAC 3840 CCCCATTCAT ACAAAATCTT ATAGATATCC TTACATTCAT AAAGAGGAGG TCAAAAAACA 3900 AATAGAGGCA ATGTTAAATC AGGACATTAT CAAATCCAGT TATTCCCCGT GGAGCGCCCC 3960 CGTCTGGGTC GTCCCAAAGA AAATCACTCC TACGGGAGAG CAAAAATGGC GTCTAGTTAT 4020 CGATTATAGA AAACTCAACG AGAAGACTAT ATCCGATAGA TATCCAATAC CTAACATCGC 4080 GGATATCTTA GACAGATTGG GCAAAGCCAA ATATTTCTCC ACACTTGATC TGGCAAGTGG 4140 ATTCCATCAG ATAGAAATGA ATCCCGACGA CACACCCAAA ACTGCATTTA CAGTAGAGGG 4200 GGGCCACTAC GAGTTCATTA GAATGCCGTT TGGCCTCAAA AATGCCCCAG CCACATTCCA 4260 AAGGGTGATG GACAATATTT TTGGAGACCT TATCGGAACT ATCTGCCTAG TTTACCTAGA 4320 TGATATAATA ATTTTCTCAA CCTCCTTACA AGAACACTTC ATACACTTGA AAACTATTTT 4380 TGGAAGACTC AGATCTGCCA ACTTTAAAGT CCAACTCACA AAATCCTACT TCCTCAGGCG 4440 GGAGACAGAA TTCCTTGGCC ACATCGTTTC ACAAGAAGGT GTTAGGCCAA ATCCCAATAA 4500 GATCGAAGCT ATAAAAAACT TTCCATGTCC CCACAGTAAA AAGTCAATTA AGTCTTTCCT 4560 AGGCTTGTTG GGATATTACA GAAAATTTAT CAGAGATTTT GCGAGACTTA CCCAACCCAT 4620 GACACAAAAA TTAAGGGGAA ACAATAAATC GATCATAATA GATGATGAAT TCAAAAAGGC 4680 CTTTGAATAT TGCAAAACCT TACTGTCTAA CGACCCAATC CTCCAATACC CGGACTTTAC 4740 AAAACCTTTC ACACTAACCA CGGACGCAAG TAATTTCGCA ATAGGAGCTG TCCTATCCCA 4800 AGGTCCGGTG CATAGTGATA GGCCCGTATG TTTTGCTAGT AGAACCTTGT CGGCTGCGGA 4860 AACAAATTAT TCCACAATTG AGAAGGAAAT GCTGGCCATT ATATGGGCGG TCCAATACTT 4920 CAGACCCTAC CTCTTTGGCA GGAGATTCAC TATAATCACC GATCACAAAC CACTAACTTG 4980 GTTAATGAAT TTCAAACAAC CAAATTCTAA AATAGTTAGG TGGAGACTCC AGCTTCAGGA 5040 GTACGATTTC GAAGTCGTCT ACAAGAAAGG CTCTCAAAAT GTAATTGCTG ATGCTCTCAG 5100 TAGACCAGAG GCCTCTGTCA ACCATAACGA AGCCCTATCA ATTCCTCAAA ATGTTTGCCC 5160 CATCTCAGAG AAACCCCTTA ATGATTTTAA TATTCAGCTC CTGTTCAAAA TAACCCCAGA 5220 TACAAATAAC GCCACACTGA CCCCGTTTAA ACACAAACTT AGGAGGGAAT TCTGTAAACC 5280 CAATTTTCAG TATGACGACG TAGTTTGCAT TCTTAGGCAG TCGTTAAAAC CAAACAAGAC 5340 ATGCGCGGTA TTTGCCCCCG ACCACATTTT TCAAATGGTG GAACAAGCCT ACCAAACCTA 5400 CTTCTCAGCC CACAGTCAAT TTAAACTCAT TAGATGTTTG ATCTTCCTCC CCGAAATTAC 5460 TGATAGTACG GAGATCGAAA AAATTATAAC CGACTATCAC TATAATAGTA ACCATCGAGG 5520 GATCGATGAA ACATATTTAC ACATAAAACG ACAACAGTTC TTCCCACATA TGAAGGAGAG 5580 AATAACTCAG TTAATTCGAA AATGTGAAAC ATGTTTAAAA TTAAAATACG ACAGACAACC 5640 TCAAAAGATC ACTTACCAAA TATCCGAACT ACCTTCAAAA CCGTTGGACA TCTTACATAT 5700 AGACATTTAT ACTATTAACA AAAATTATAA CCTTACTATT ATCGATAAAT TTTCTAAATT 5760 TGCGGCTGCC TACCCTATAA CTAATAGGAA TTGCATTAAC GTAGTTAAAG CCTTAAAACA 5820 TTTCATTTCC CAATTTGGTA TTCCCAAAAA GCTGATCTAT GATCAGGGAG CAGAATTCGC 5880 TAGCGATATG TTCAATAAGT TCTGCACTCA ATTTAACATT GACCTACACG TTACGTCCTT 5940 TCAACAATCC TCTAGTAACT CTCCCGTTGA ACGGCTTCAC TCGACACTAA CTGAGATTTA 6000 CAGAATAATA CTTGACGTCA GGAAACAACA GAAACTCAGT AGCGAGCATG ACGAGATAAT 6060 GTCCGAAACC CTAATCACAT ATAATAACGC TATTCATTCT GCAACTAAAC ATACCCCCTT 6120 TGAACTATTT AACGGACGTA CTCATATATT CAACCAAACA ATCCAGTTCA ATAACGAACA 6180 CGACTACTTA ACGAAATTAA ATGAATTTCG CGAGAAGTTG TACCCCCTCA TCACGGACAA 6240 ACTTTCAAAT GACGTAGTTA GGAGAACCCT AAAATTAAAT GAAACCCGAA CAGACCCCGT 6300 AGACCTACAA CCAGACACTT TAGTCCTTAG GAAGGAAAAC AGACGTAATA AGATTACACC 6360 CAGGTTTTCG ATTCACAAAG TCAAACACGA CAAAGGTCAT ACATTGATAA CTGCTAGGAA 6420 TCAAAAACTA CACAAATCAA AAATTCGAAA AACAGTTTTG AAAAAAGACA AAAGCAACAA 6480 CGTACCCAAC ACTGATAATA ACTGACCCCA CTACCTCTTA ACTTACCATT TCAGGTTCAC 6540 CCTTGTGCCA ACTCAGGCTA TCCATGTCCA TTATTTAAAT GATAACGCCC CTATAGCCAA 6600 GATAGAACTA GGGAAAGCCT TACTAATTGA GAGGTACAAA ATAATTAGTC ATGTAATCAA 6660 CCTACAAGAC TACAGCAGAT GTATGGAACA ATTCCATCTG ACCATTAATA AATTTAACCC 6720 CGATTCCACG TTGACGGACT CCGTCACAAT TTTAAAAACC AAATTAACCC AAGCCCAAGT 6780 AAAGCTCAAA GCCCTTACAC CTTCATATAG AAACAAACGG GGTTTGATTA ACGGATTGGG 6840 GAGTCTAGTA AAGGTGGTTA CCGGCAACAT GGATGCCAAC GACAATAAAG AAATACATGA 6900 AGAACTTGAC AATATAAAGA AAAATTCCGA AGTCAGTAAC GACAATCTCC AAAAACAAGT 6960 AATGTTTAAC AACGAAATAC TTATCCGGTT CGAAAATATC ACGGACCATA TAAATAATGA 7020 ACAAATTTTG ATAAGTAAAT TCTTTGATAC CTCACAAAAC AAAATATACA AACACTTAAA 7080 CTTACAAGAT ACCCTTCTGG AAGAAATACA ATATTTAAAT AGGATTAATT ATAACATAGA 7140 ATTATTCATT AACCACCTAA ACGACATAAC AGAAAGTATG CTATTGGCGA AAATAAATAT 7200 AATTCCCAAG TTCATCCTAA ATGAACAAGA AATGGATAAA ATAAAAACAA TACTGGAAAA 7260 ACAAAATATC ACAGTCAAAA ATGAACAAAG TATATACAAT TTCCTACAAA TGAATACACT 7320 AAATTACGAA CAAAAGATTA TTTTTAATAT CAAAGTCCCA ATTTTTAAAC AACCTTTTCA 7380 TACCCTCGCC AGACTAGTTC CATTACCAAT AAATAACACA TATTTTGTAA TAACCCCAAA 7440 TTACCTAGCT TATAATATTA ATAATAAGAA ATTTCATATG ACCCGTAAAT GCCCCAAACT 7500 GGATAATACA TTCTTGTGCG ACGAGAACTT CTACGTTGAT ACACCACAGA ACAACACATG 7560 CCTGGAACAC CTTTTGAACG GAGAAAACAG TTCCTGCGAT GTACGGGAAA CCGGCCCCAT 7620 CACCGACGTG TTCGAGGCAG AGAGAGGTTA CATCTTCGCA TTCAACGTGA ACAAACTGAA 7680 GGTATCCCTA ACAAACGGCT CCGAGCTCTC AATAATGGGG TCAGCCATCA TCAGATACAT 7740 TAACGAAACA ATACAGATTA ACGGTATCGA TTACGACGGC ACGGTTGACA CGTTCCCTGA 7800 ACAGACGGAT TTTGATCTTC CCCCCATGCG AAAAGTAACT AGGAATACCA CTATTACGGT 7860 ACTAAGCCTA GAAAAACTGC ACCTCGAAGC CACCCAAACA ATGGATAAAA TCCTGGCCGT 7920 CCATCACAAT ACTATACAGC ACACCTGGAC ACTCTACACT CTGCTCGGAT TGGTAACGTT 7980 CCTAGCAGTC ATCTTATGGC TGCACCGACG AACGAAACAC ATCGTCCACA TCCACGAGGA 8040 TCATCACGTA CCAATCTACG CGTCATCCAT ACCTTCGCTA TGGCCGTCAC TTCGAACTGG 8100 GGGGGGAGGA GTTACCACCC CACCCCCTAA ACCCCCACGC CTCTAAACAA ATCATCGGAC 8160 ACTCAACCGG GAAGACGGCA ACTGGAACAC CGCATCCGGC CGAATGCTGA CATTCCGGCC 8220 GAATGCTGAC ATTACACAAA AGTCGCACTG CAACATTGTC CCCAGCTAGC CAGCCACATG 8280 CCGAGTCGGC ATGTTCATTA TGCTTACAAT TAAGAACCTA TGTACTTATG TATAAGACGA 8340 AAACGGAGGA CTCGAGTAGC CACTCTCTGA CAATAAACTT GATACTGATT TTGAACTTCA 8400 AGAAAGTCAG TCGTATTCTT TATTGGAAAT CTTCACACTA CAACTATCTG CTGAAACTTA 8460 AAAACCTTCA TACATTTACA CATCATATCT TCACAAAAGG CTCCACCCTC GATCACGGAC 8520 TTAACT 8526 // ID DMBLPP standard; DNA; INV; 5034 BP. XX AC Z27119; XX DR FLYBASE; FBte0000660; Dmel\flea. XX SY synonym: blastopia SY synonym: Kermit XX FT source Z27119:372..5405 FT SO_feature five_prime_LTR ; SO:0000425:1..275 FT SO_feature three_prime_LTR ; SO:0000426:4757..5034 FT SO_feature polyA_site ; SO:0000553:5006..5011 FT SO_feature polyA_site ; SO:0000553:5019..5024 FT SO_feature CDS ; SO:0000316:760..4761 FT /name="Dmel\flea\polyprotein" FT /db_xref="FLYBASE:FBgn0043491" FT /db_xref="SPTREMBL:Q24262" FT /db_xref="NCBI_PROTEIN:CAA81643.1" FT /translation="MFTRTPPTNKKLNTDQIQAILENESEDESRKEKMNEEDQKLAPVG FT EAEAKKQNKDASAKVEEKFEQMMNTLTQSMLAKSKQEGQVIIAAEKFEKVVSDCDGKSI FT PIKKWFEIFEKNAEAYELSEKQKYVQARSKMIGSAELFLESECVSGYTELKELLIEEFS FT GSYNSAVIHKKLQDRKKKREETLHDYLLQMKKIAALGEVETVALITHIVNGLDIKKEYK FT GAMLRCKTLKELKQEFEIYESLNIVDKPNIQPKPKQITQGVKADHCFNCGSREHKRKDC FT TLPTKCFSCNQEGHISSKCPEKVNSMRIHVDSARTKPVIINGIIINCLVDTGSDVTIIK FT EAIFKKMKDVDLNRTATVLRGLGNASTQPIGCFRALIKTDQVEASHNVLVVHDSKFSCD FT GIVGHDFISKFRLICSAEGYTFLDLEADKKQAVEYSQMFNICEESSFTVAPQYREDVER FT MIERTYETPPKQIKQCPVELKIIPDGVIKPFRHGHTRLSEEEAIAVKKQVEEWVEQSIV FT RKSTSNVASRIVVVRKKDGTLRVCVDYRKLNTMVLMDCFPVPIMEEVLEKLQSAKWFTT FT MDLQNGFFHVAVEEASKPYTAFVTREGLFEFNKAPFGFKNSPAAFIRFVQFIFQELINS FT NIMQLYMDDIIVYAATPEECMEKTEMVLKRAAEFGLKIKWKKCNFMQRRIHFLGHIIEG FT GQICPGKEKTSAVNSFGTPQNVKAVQGFLGLTGFFRKFIPGYAQIARPLTDLLKKDAIF FT NIGPVEQQSVNKLKEILVNEPVLRIYSREAETELHTDASKDGLGAVLLQKFEGSFHPVC FT FWSRKTTKAESNRHSYYLEVKAAYLALKKFRHYLLGVPFKLVTDCVAFKQTTKKADVPR FT EVGPWILYMQDFNFQPEHRAGERMRHVDFLSRHPQACMMITSELTARIKKSQQNDDSIR FT AILEILKDRLFQPYKLKGGLLYSMVNGNELLVVPALMEREVIQSAHEVGHLSLQKTMHS FT IQQQFFYFLIWEYKVKKLISNCIKCIIHSKKLGKQEGYLNCIDKGDAPLHTLHIDHLGP FT MDSSAKQYKYILATVDAFSKFVWLFPTKSTGQEEVVKRLTDWSNIFGFPKRIVSDKGTA FT FTSGAFEQFMSSHNVEHVCTTTGVARGNGQIERVNRLILAIISKLSSDEPSKWYKYVPE FT VQKAINCHVHSSLKLSPFEVMFGTKMYTRVEDRLLELLQEEVVCQFNEDRYEMRQLVKR FT NIEQAQKDYKRNYDKKRRAEYKYKAGDLVAIKRTQFVAGRKMASGYLGPYEVTGVKDNG FT RYDVKKAANVEGPNVTSTSCDNMKLWKYIAENADLLSSGSDDDDQEGRM" XX CC Derived from Z27119 (g415797) (Rel. 50, Last updated, Version 6). CC Takis Benos and Michael Ashburner, 20-Aug-1997. CC Any changes to original sequence record are annotated in an FT line. XX SQ Sequence 5034 BP; 1719 A; 938 C; 1145 G; 1232 T; 0 other; TGTAACATGA GTAAGGCTGA AGGCTGGCAA CAACCCGGTT GGCAGCGCTG TTGAGCAGCA 60 ACATGATTGT CGGAAATCCA AGTTATCGAC AATCAGTCAT CGAAGGACGA TCGCAGGCAG 120 CAGTAGAGGC GAGTGGAAGT CAGCGTTGCA GTCAGTCGAG TTCTCAGCAG CAGTCGTTCG 180 GTCCACAAAC TAAGAAATAC TTTATATAAT TACCGCATTT AGAATTAAAC TAATAATTAA 240 ATTAATAATA AACAATAATA ATAAACAATC TTACATGGGG GCTCGTCCAG TCCTAAATCG 300 GTTATATGAA GGTGCAGTTG TTTAAAGAAA AAAGACATTG TTGTGTGCGT GGGTATAGTC 360 TTTAAAACGT TGTAAAGTTG TGGCTATATC TATTGCATTT AAAGTTGGAA AAATCAGTTG 420 TACAGATTTT GTTTGAACAC AAGTCGGTAA AAGTCGGGAA AGCTGCTAGA GAGAACTGAT 480 AAAGTTGAAA TTGTCGTGTG CGTGGATTTA GTCTTTAAAG TTGTAAAGTT ATGGCTACGT 540 CTACTGCATT GAAAGTTGAA AAAATCGATT GAACTCATAC AGACTCAAGT CGTTTTGCTG 600 TTGTGGAATT TAAAACAATT AAATTGCAAA GGTGGTGAAA TTCGTTTCTA ACGAAAATCA 660 AAATTTGTCT TTTAACCGGT GGCGCCGTCT GCAAAATCGA CTACCGTCGC GCCGTTAGAA 720 CATTGTCGTT GTTTGCTGGT GTTAGTGCCT TGTCGCGGAA TGTTCACACG TACACCACCT 780 ACAAATAAAA AACTTAACAC CGACCAAATA CAAGCAATTC TAGAGAACGA AAGCGAGGAC 840 GAAAGCAGAA AAGAAAAAAT GAACGAAGAA GATCAAAAGT TGGCGCCTGT AGGAGAAGCA 900 GAGGCAAAGA AGCAGAATAA AGACGCTAGT GCTAAAGTCG AAGAGAAATT TGAACAAATG 960 ATGAATACTC TAACCCAGAG CATGTTGGCA AAATCTAAAC AAGAGGGGCA AGTAATTATC 1020 GCTGCAGAAA AATTTGAAAA AGTTGTAAGT GACTGTGATG GCAAATCAAT TCCTATTAAA 1080 AAATGGTTTG AAATTTTTGA GAAAAATGCC GAGGCATATG AACTTTCGGA GAAACAAAAA 1140 TATGTTCAAG CCAGAAGTAA GATGATTGGA TCAGCAGAAC TTTTCTTAGA ATCTGAATGT 1200 GTCAGTGGAT ACACTGAACT CAAAGAGTTA CTAATTGAAG AATTTTCAGG CAGCTATAAT 1260 AGCGCCGTTA TTCACAAAAA GTTGCAAGAC AGGAAGAAGA AGAGGGAGGA AACTCTACAC 1320 GACTATTTGT TACAAATGAA GAAAATAGCA GCCTTAGGTG AAGTTGAAAC AGTTGCTTTG 1380 ATAACTCATA TCGTAAACGG CCTCGACATT AAAAAGGAGT ATAAGGGTGC TATGCTCCGT 1440 TGTAAAACTC TTAAGGAATT AAAGCAAGAA TTCGAAATCT ACGAGAGTCT GAATATTGTT 1500 GACAAGCCGA ATATTCAACC AAAACCAAAG CAAATTACAC AAGGTGTAAA AGCAGATCAC 1560 TGCTTCAACT GTGGTTCGAG GGAACACAAA CGAAAGGATT GTACACTTCC TACCAAATGT 1620 TTCAGCTGTA ATCAAGAGGG CCATATCTCA AGCAAGTGTC CGGAAAAAGT AAACAGCATG 1680 CGCATTCACG TTGATAGTGC ACGAACAAAG CCAGTAATCA TAAATGGGAT TATCATCAAC 1740 TGTCTGGTGG ACACAGGATC AGATGTGACC ATAATTAAAG AAGCTATATT CAAGAAGATG 1800 AAAGATGTTG ATTTAAACCG CACTGCAACA GTATTGCGAG GTTTGGGAAA TGCCTCAACA 1860 CAGCCGATTG GATGCTTCAG AGCATTAATC AAGACCGACC AGGTGGAAGC AAGCCACAAC 1920 GTTTTAGTCG TCCACGATTC TAAATTCAGT TGCGATGGAA TAGTGGGACA CGATTTTATC 1980 AGCAAGTTTC GTCTTATCTG TAGTGCAGAA GGCTATACTT TTCTTGACCT GGAAGCAGAT 2040 AAAAAACAAG CGGTTGAGTA TTCCCAAATG TTTAATATTT GTGAAGAATC TTCTTTTACA 2100 GTTGCACCAC AATACCGAGA AGACGTTGAA CGCATGATAG AGAGAACATA CGAAACACCA 2160 CCCAAGCAGA TAAAGCAATG TCCAGTCGAA CTCAAAATTA TTCCTGATGG CGTGATTAAA 2220 CCCTTTCGCC ATGGACACAC CCGACTATCT GAAGAAGAAG CTATAGCTGT AAAGAAGCAG 2280 GTAGAGGAAT GGGTCGAGCA GTCAATCGTC CGTAAATCTA CATCAAATGT TGCCAGTCGC 2340 ATAGTCGTTG TCAGGAAAAA GGATGGTACC CTACGCGTTT GCGTGGACTA TAGAAAATTG 2400 AACACCATGG TTCTGATGGA TTGTTTTCCG GTACCCATAA TGGAGGAGGT GCTTGAAAAA 2460 CTGCAGAGTG CCAAATGGTT TACAACCATG GACTTACAGA ACGGATTTTT TCATGTGGCC 2520 GTAGAAGAAG CCAGCAAGCC GTACACAGCA TTTGTTACCC GAGAAGGCTT ATTCGAGTTT 2580 AACAAAGCGC CCTTTGGTTT TAAGAATTCC CCAGCAGCGT TTATACGGTT CGTTCAATTT 2640 ATTTTTCAAG AACTAATCAA TTCCAATATA ATGCAGCTAT ATATGGATGA CATAATTGTA 2700 TATGCCGCTA CCCCAGAAGA ATGCATGGAA AAGACGGAAA TGGTACTTAA GAGAGCTGCA 2760 GAATTTGGTC TAAAAATAAA ATGGAAGAAG TGCAACTTTA TGCAGAGGCG AATTCATTTC 2820 CTGGGACATA TTATCGAAGG TGGACAAATA TGCCCTGGAA AAGAGAAAAC ATCAGCAGTG 2880 AATTCCTTTG GAACACCTCA GAATGTAAAA GCCGTTCAAG GATTTCTGGG TCTCACAGGA 2940 TTCTTCAGAA AATTCATACC TGGATACGCC CAAATTGCGA GACCACTGAC GGACCTATTA 3000 AAAAAAGATG CCATTTTCAA CATTGGACCA GTAGAGCAGC AGTCGGTGAA TAAGCTGAAA 3060 GAGATTCTGG TAAACGAACC AGTATTGAGG ATCTACTCAC GAGAAGCAGA AACCGAACTT 3120 CATACAGATG CCTCTAAGGA CGGGTTAGGA GCCGTTTTAT TGCAGAAGTT CGAAGGCAGT 3180 TTTCACCCAG TCTGCTTTTG GAGCAGAAAA ACTACAAAAG CCGAATCAAA TCGTCATAGT 3240 TATTACCTTG AAGTAAAAGC CGCATACTTA GCTCTGAAAA AGTTCAGACA CTATTTATTG 3300 GGAGTCCCTT TCAAGCTCGT CACGGACTGT GTCGCATTTA AACAGACAAC AAAAAAAGCA 3360 GATGTCCCAA GAGAAGTTGG CCCATGGATT CTCTATATGC AGGATTTTAA TTTTCAACCC 3420 GAACATCGTG CAGGAGAAAG AATGAGACAC GTTGATTTTT TAAGCCGCCA TCCCCAAGCA 3480 TGCATGATGA TAACATCCGA GTTGACAGCA CGTATTAAAA AGTCGCAGCA GAACGATGAT 3540 TCAATTAGAG CAATCCTGGA AATTCTAAAA GATCGTCTAT TCCAACCCTA CAAGCTAAAA 3600 GGTGGCCTGT TGTATAGTAT GGTCAATGGC AATGAACTAC TGGTTGTCCC TGCACTAATG 3660 GAGAGGGAGG TGATTCAAAG CGCACATGAA GTTGGCCATT TGTCGTTGCA AAAGACGATG 3720 CATAGCATAC AGCAGCAATT TTTTTATTTC CTCATTTGGG AATACAAGGT AAAAAAGCTA 3780 ATTTCTAACT GTATAAAATG TATCATCCAC AGCAAAAAGT TGGGAAAGCA GGAGGGATAT 3840 CTAAATTGCA TAGATAAAGG AGACGCACCG TTGCACACAC TACACATCGA TCATTTGGGG 3900 CCAATGGATT CATCGGCCAA ACAGTATAAA TACATTCTGG CAACAGTCGA TGCGTTTTCA 3960 AAGTTTGTCT GGTTATTCCC AACCAAATCA ACCGGACAGG AAGAAGTGGT CAAGAGGCTG 4020 ACCGACTGGT CAAACATTTT TGGTTTCCCT AAGCGAATTG TTAGCGACAA AGGAACGGCC 4080 TTTACGAGTG GTGCGTTCGA ACAATTTATG AGCAGCCATA ACGTGGAACA CGTCTGCACA 4140 ACTACTGGAG TGGCCAGAGG CAACGGCCAG ATAGAACGAG TAAATCGTTT AATTTTGGCA 4200 ATAATATCAA AGCTGTCTTC AGACGAACCG TCGAAGTGGT ACAAATATGT GCCTGAGGTA 4260 CAAAAGGCGA TCAACTGTCA CGTGCATTCA TCACTGAAGC TGTCACCATT TGAGGTCATG 4320 TTTGGCACCA AGATGTACAC CCGAGTTGAG GATCGGTTAC TGGAACTGCT CCAAGAAGAA 4380 GTGGTCTGTC AATTCAACGA GGACCGCTAT GAGATGAGAC AGCTGGTAAA ACGCAACATC 4440 GAGCAGGCGC AGAAGGACTA CAAGCGCAAT TACGACAAAA AGCGCCGAGC TGAATACAAA 4500 TACAAAGCAG GTGATCTGGT TGCAATTAAA AGGACCCAAT TTGTAGCTGG CCGCAAGATG 4560 GCAAGCGGGT ATTTAGGTCC ATACGAAGTC ACAGGGGTCA AAGACAATGG CAGATATGAC 4620 GTTAAAAAAG CAGCAAACGT CGAAGGACCC AATGTCACAT CCACCAGCTG TGACAACATG 4680 AAGTTGTGGA AGTACATAGC CGAAAATGCA GACCTATTGT CATCCGGGTC GGATGATGAT 4740 GATCAGGAGG GCCGAATGTA ACATGGAGTA AGGCTGAAGG CTGGCAACAA CCCGGTTGGC 4800 AGCGCTGTTG AGCAGCAACA TGATTGTCGG AAATCGAAGT TATCGACAAT CAGTCATCGA 4860 AGGAACGATC GCAAGGCAGC AGTGGAGTAG GAGTGGAAGT CAGCGTTGCA GTCAGTCGTG 4920 TTCTCAGCAG CAGTTCGTTC GGTCACAAAC TAAGAATACT TTATATAATT ACCGCATTTA 4980 GAATTAAACT AATAATTAAA TTAATAATAA ACAATAATAA TAAACAATCT TACA 5034 // ID OPUS standard; DNA; INV; 7521 BP. XX AC AY180918; XX DR FLYBASE; FBte0000918; Dmel\opus. XX SY synonym: nomad SY synonym: yoyo XX FT source AY180918:1..7521 FT SO_feature five_prime_LTR ; SO:0000425:1..518 FT SO_feature three_prime_LTR ; SO:0000426:7004..7521 FT SO_feature CDS ; SO:0000316:1578..2831 FT /name="Dmel\opus\gag" FT /db_xref="FLYBASE:FBgn0025876" FT /db_xref="SPTREMBL:Q8I7Q0" FT /db_xref="NCBI_PROTEIN:AAN87270.1" FT /translation="MEETLRALSESLNALTNVVTGIKEDIKKNNDRLAILEQERGNAD FT PTVDQPQPLVRARTEYELREISVLPDCVKELQAFEGRQEAYLSWINRAQSILTEYDLI FT KTRPLYRAIVLHIRQKIRGHADMALAAYGVQDDDWDDIKRVLALHYADKRDLRTLEHE FT LGAMCQGSRPLDRFYMDVNGHLSLILNNLKARNHPREVVNALIETYRDKALDVFIRGV FT GRDCSKHLLVRSPKNLPEAYSFCMGLQNVMSRNFTAQNYQPSGAPRFAGPYQHQARPP FT FRTPFSPGSGRFSQNSYRTQGPRQAIKMESNRSGQSYQSGYSGRQEEGSGIKRMSEGN FT NPFQKAQRLYHMELAPPPLAPAASGDNQGRSHEGYYDDESQAVERSNNYPPQKNVEGV FT TDAPHNLETEGGANFMTNASPVYRT" FT SO_feature CDS ; SO:0000316:2972..5983 FT /name="Dmel\opus\pol" FT /db_xref="FLYBASE:FBgn0025875" FT /db_xref="SPTREMBL:Q8I7P9" FT /db_xref="NCBI_PROTEIN:AAN87271.1" FT /translation="MITHRLVGKFFKPLGNDSDITFFVLPNLHSFDGIIGDDTLKDLK FT AIVDRKNNCLIITPGIKIPLLARASINVNPLLAAEHPDGTQEILNSLLGEFPRIFEPP FT LSGMSVETAVKAEIRTNTQDPIYAKSYPYPVNMRGEVERQIDELLQDGIIRPSNSPYN FT SPIWIVPKKPKPNGEKQYRMVVDFKRLNTVTIPDTYPIPDINATLASLGNAKYFTTLD FT LTSGFHQIHMKESDIPKTAFSTLNGKYEFLRLPFGLKNAPAIFQRMIDDILREHIGKV FT CYVYIDDIIVFSEDYDTHWKNLRLVLASLSKANLQVNLEKSHFLDTQVEFLGYIVTAD FT GIKADPKKVRAISEMPPPTSVKELKRFLGMTSYYRKFIQDYAKVAKPLTNLTRGLYAN FT IKSSQSSKVPITLDETALQSFNDLKSILCSSEILAFPCFTKPFHLTTDASNWAIGAVL FT SQDDQGRDRPIAYISRSLNKTEENYATIEKEMLAIIWSLDNLRAYLYGAGTIKVYTDH FT QPLTFALGNRNFNAKLKRWKARIEEYNCELIYKPGKSNVVADALSRIPPQLNQLSTDL FT DANPEDDMQSLATAHSALHDSSRLIPHVESPINVFKNQLIFDTTRSKYLCEHPFPGYT FT RHLIPLKDGSLADLTNSLQSCLRPVIINGVKIPEAHLQRFQSICLANFLLYKIRITQR FT LVADVSGAEEICEIIEKEHRRAHRGPTEIRLQLLEKYYFPRMSSTIRLQTSSCQCCKL FT YKYERHPNKPNLQPTPIPNYPCEILHIDIFALEKRLYLSCIDKFSKFAKLFHLQSKAS FT VHLRETLVEALHYFTAPKVLVSDNERGLLCPTVLNYLRSLDIDLYYAPTQKSEVNGQV FT ERFHSTFLEIYRCLKDELPTFKPVELVHIAVDRYNTSVHSVTNRKPADVFFDRSSRVN FT YQGLTDFRRQTLEDIKGLIEYKQIRGNMARNKNRDEPKSYGPGDEVFVANKQIKTKEK FT ARFRCEKVQEDNKITVKTRSGKIFHKSDLRN" XX CC Sequence from P1 DS01219.2:861..8381 provided by Guochon Liao CC Berkeley Drosophila Genome Project. XX SQ Sequence 7521 BP; 2322 A; 1740 C; 1677 G; 1782 T; 0 other; AGTTAAGAAC CCTCTTCTTG CGCTCTTCGT CAGGACTCAC CAGCGCTCGG CTCTCGTGTT 60 TTCGGGCCCC GTCAGCAGGC GACTCGGGGC CTGTCTAGTA ACATGTTCGT GTAAGTTACG 120 AACCCTCTTC TTGCGATCTT CGTCAGGACT CACCAGCGCT CGGCTCTCGT GTTTTCGGGC 180 CCCGTCAGCA GGCGACTCGG GGCCTGTCTA GGAACATGTT TGTGTATGTG TGCATTCGGA 240 ACAAGTGCCG TTGGTCGCAC TCAGGGTGAG GGGTCAACGG GGGAAGCGGA TATAAAAGCA 300 GCGGGGCGGG AGAAGAGGTC CCAGTCTCGA ACGGACACAT AACGGAACCG CTAGCAGATC 360 GCGAACTGAA TCTTAAAATA AAGCTAATCG TAAACTCGAA CCCTCTTAAC TATCTTGACT 420 ATTATTTGGA GAACCACAGC ATGTTGGTTG TCATATCAAG GTGAGGTATG CGGCAGCGAG 480 TGCCGAGAAC CCTGATGCAA GTGGAACTTG CGTTAACTGG CGCCCGAACA GGGACCGGCA 540 ATGTCCGGCC GATAAAAGTG ATACGAAAAA ATTGTGGAAA TTTGTGCGTA AAAATAGTGG 600 TGGTGTGCAT AAGTCAGATT AAGATCTGAA ATCCATAAAT GAAAAAGAAG TGCTGCGTGA 660 GCTGTGTATA AAATGATAAA ATAGCAATTA CCCGCTGCCG GGGGGAACTA CGCCCATCCC 720 GGGGCGCAAC AAATATTGCA TAATTCAATA AAAGGTGTAA AATTTCTAAA ATAAAAATGT 780 AAACCTATGT TGCGCCAAGA CCTAATTTAA ATTAATAAAA CAACGACCCG CTACCGGAGG 840 ACGCCACGTC GCCCATGCCG AGCGCAAAAG TTGTACGATA CCTATAACAT AATTAAAACA 900 CGATCAACCC ACTGCGGCGG TACGGCTTGT GGGAAAATTT TTTTTTTTTT CTCTCCTTGC 960 CAATTCGCGA GTGCAAAAGA TTGTGTATAA TAAACCAATA ATTAACCATT GCAGCAGTTT 1020 ACCTGCGGCA GTACGAGTAA TATGAGCGCC CAGAGTGATA AGGTGGTGTG TGGCAGCTTG 1080 TTGGATACGT TAAGTGGTGT GGAATGCACC CAAAAAAAAC CGCCCAACAA GTTGTGTGGC 1140 GGCCGTACCT TAGTAGGCAA CCAGCCAAAA GGGATACTAC GGAACCACCG TGCCCAGTGC 1200 CGAAATAAAT TAGAGGTCAT CAATAAAAAA CTGTAACAGC ACGCACGCAA GGAAAAAATA 1260 TTGCAAAATG GAATAGCGCA CAAAAATTGT ATAAACACAT GCACAACACC ACAATTCAAA 1320 GGAAAACAAA ATATTCATGC TGTAGGGGTA CAACCTAAAC GACGAAAACT AATAAAGAGC 1380 ATACAAGGGT GAGTGAAATA TTTCATTAAA CTTTATTGCC ATATTTGCTA AATTTAGAGA 1440 AATAAAGAAA AAGCAAAGAA GAACAGATAT TCTTTTTTAT CGGGTTAAAA CCGTTGTCTC 1500 ACATTTCCGT AAAGTAATAA CGAATTCTGT TGCCTTGAAA GCTTCCTGCA TCTTTCCAAC 1560 GCAAACTAAA AATCAAAATG GAAGAGACCC TGCGTGCTCT TAGCGAGTCC CTCAATGCCC 1620 TGACCAACGT GGTGACAGGC ATTAAGGAAG ATATTAAGAA AAATAATGAT AGGTTGGCTA 1680 TTTTAGAACA GGAGCGCGGG AACGCTGACC CTACGGTCGA CCAACCGCAA CCCCTGGTGC 1740 GCGCACGCAC CGAGTATGAG CTGAGAGAGA TATCGGTCCT CCCTGACTGC GTCAAAGAAC 1800 TGCAGGCGTT CGAAGGACGG CAGGAGGCTT ACCTGTCTTG GATAAACAGG GCACAGTCAA 1860 TACTGACCGA ATATGACTTG ATTAAAACCA GACCCCTGTA TAGGGCAATT GTCTTGCATA 1920 TTAGACAGAA AATAAGGGGA CACGCCGACA TGGCCTTGGC GGCCTATGGC GTCCAAGACG 1980 ACGATTGGGA CGACATAAAA CGAGTCTTGG CGCTGCATTA CGCAGACAAA CGAGACTTAC 2040 GTACGCTTGA GCATGAGCTT GGCGCTATGT GCCAAGGTTC TAGACCACTA GATAGGTTCT 2100 ATATGGACGT TAATGGCCAT CTCTCGTTGA TCTTAAATAA CTTGAAGGCC AGAAACCACC 2160 CTCGTGAAGT AGTCAACGCT TTGATAGAAA CCTATAGAGA CAAGGCTTTG GATGTTTTTA 2220 TCCGAGGAGT GGGGAGAGAT TGTTCCAAAC ACTTACTTGT CCGCAGCCCG AAGAATCTAC 2280 CAGAGGCTTA CTCTTTTTGT ATGGGATTGC AGAATGTAAT GTCAAGAAAT TTCACAGCTC 2340 AGAACTATCA ACCGTCAGGT GCCCCAAGAT TCGCAGGCCC ATATCAACAT CAGGCCAGGC 2400 CACCGTTCCG AACCCCTTTT TCTCCTGGTT CAGGCAGATT TTCGCAAAAC TCCTACAGAA 2460 CTCAGGGTCC TAGACAGGCC ATAAAAATGG AATCCAATCG GTCGGGTCAA TCTTACCAAT 2520 CAGGATACAG TGGTCGCCAG GAAGAAGGCT CCGGTATTAA GAGAATGTCC GAAGGAAACA 2580 ACCCATTCCA AAAGGCACAA AGATTGTACC ACATGGAATT GGCACCACCC CCGCTAGCCC 2640 CGGCGGCTAG TGGAGATAAC CAAGGACGTT CACACGAGGG TTACTATGAT GACGAGTCTC 2700 AAGCTGTCGA GAGAAGCAAC AATTATCCTC CGCAGAAAAA CGTGGAAGGA GTTACAGATG 2760 CTCCACATAA CCTTGAGACT GAGGGAGGGG CAAATTTTAT GACCAACGCC TCTCCAGTGT 2820 ACCGTACTTA GAGTATGCTA CGGAGAGGGG AGAAAGGCTG AAGTTTTTGA TCGACACGGG 2880 GGCGAACAAA AACTTTATTA GCCGAAGACT TGCAGCCGGG TGTACCACAG TCCGTAAACC 2940 CTTCTCCGTA CTGTCCGCTG CGGGTAACAT CATGATAACG CACCGCCTAG TTGGTAAATT 3000 CTTCAAACCA CTAGGGAACG ACTCGGATAT TACCTTTTTC GTACTACCGA ATTTACATTC 3060 CTTTGATGGT ATCATTGGCG ACGATACTCT CAAAGACTTA AAAGCCATAG TGGATAGGAA 3120 AAACAATTGT TTGATAATAA CCCCAGGAAT TAAAATCCCT CTTTTGGCGA GAGCTTCAAT 3180 AAACGTTAAC CCGCTACTCG CCGCCGAACA CCCAGATGGT ACACAAGAAA TTTTGAATTC 3240 CCTTCTCGGG GAATTTCCCC GCATCTTCGA GCCCCCCTTA TCTGGAATGT CCGTGGAGAC 3300 GGCCGTCAAG GCTGAAATCC GGACAAACAC ACAAGACCCG ATCTATGCTA AAAGTTATCC 3360 TTACCCAGTC AACATGCGCG GAGAAGTCGA ACGTCAAATC GATGAACTGC TGCAGGACGG 3420 TATAATTCGA CCCTCTAATA GCCCTTACAA TTCCCCTATC TGGATAGTCC CGAAGAAACC 3480 TAAACCAAAC GGAGAAAAAC AATATCGCAT GGTAGTCGAT TTCAAGCGGT TAAATACCGT 3540 CACCATACCC GACACTTACC CCATCCCAGA TATAAACGCT ACGCTAGCCA GCCTTGGCAA 3600 TGCCAAATAC TTTACCACCC TAGATTTGAC TTCTGGATTC CATCAAATCC ACATGAAGGA 3660 AAGCGACATT CCAAAGACAG CTTTCTCTAC TCTAAATGGA AAGTACGAGT TCCTCCGTCT 3720 ACCATTCGGT TTGAAGAATG CACCTGCAAT CTTCCAAAGA ATGATCGATG ATATTTTGCG 3780 CGAGCATATT GGCAAGGTCT GCTACGTTTA TATTGACGAT ATCATCGTCT TCAGTGAAGA 3840 TTATGACACA CACTGGAAAA ATCTCCGATT GGTATTAGCG AGTTTATCAA AAGCTAACCT 3900 CCAAGTGAAC CTTGAGAAGT CGCATTTTTT AGACACGCAG GTAGAATTTT TAGGATATAT 3960 CGTCACGGCC GATGGCATTA AGGCAGATCC GAAAAAGGTC AGAGCGATTA GCGAAATGCC 4020 TCCTCCGACC TCTGTTAAGG AGTTAAAAAG ATTTCTAGGC ATGACCTCGT ACTACAGGAA 4080 GTTCATTCAG GACTATGCGA AGGTAGCAAA GCCCCTTACA AACTTGACGC GTGGATTGTA 4140 CGCTAATATA AAGTCTTCAC AATCAAGCAA AGTGCCAATT ACATTAGACG AGACGGCCCT 4200 ACAGTCTTTT AATGATTTAA AATCAATTCT CTGTTCTTCT GAAATACTGG CGTTCCCATG 4260 TTTCACTAAA CCTTTCCATC TAACCACGGA CGCTTCTAAC TGGGCCATCG GAGCTGTCCT 4320 CTCACAGGAC GACCAGGGTA GAGATAGGCC GATAGCGTAC ATTTCCCGTT CATTAAATAA 4380 GACGGAGGAA AACTACGCTA CTATCGAAAA GGAAATGCTC GCGATAATTT GGTCATTGGA 4440 CAATCTTCGG GCTTACTTAT ATGGCGCTGG TACTATTAAA GTATATACTG ACCATCAACC 4500 TCTAACGTTT GCCCTAGGCA ACAGAAATTT CAATGCGAAG CTAAAACGCT GGAAGGCTCG 4560 TATAGAGGAA TACAACTGCG AACTCATCTA CAAGCCTGGG AAATCTAATG TGGTGGCTGA 4620 CGCGCTTTCA CGCATTCCGC CTCAGCTTAA CCAGTTGAGC ACCGATTTAG ATGCTAATCC 4680 CGAGGATGAC ATGCAGTCTT TGGCTACTGC CCATAGCGCT TTACATGACA GTTCACGATT 4740 GATTCCCCAC GTTGAATCTC CAATCAACGT TTTCAAGAAT CAACTCATTT TTGACACAAC 4800 CAGGTCAAAA TACTTATGCG AGCACCCGTT CCCAGGTTAT ACTCGCCATC TGATTCCTCT 4860 CAAAGACGGA TCACTTGCCG ATTTAACCAA CTCGTTACAA TCGTGTCTAC GACCTGTAAT 4920 AATTAACGGC GTCAAAATCC CGGAAGCACA TTTGCAACGC TTTCAGTCCA TCTGCTTAGC 4980 GAATTTTCTT TTATACAAAA TTCGGATAAC GCAGCGCCTA GTGGCGGACG TGTCTGGCGC 5040 AGAGGAAATT TGTGAAATAA TTGAAAAAGA ACACCGTAGA GCACATAGGG GCCCTACGGA 5100 GATTCGTCTC CAACTTTTAG AAAAATATTA TTTCCCGCGA ATGTCCAGTA CGATCCGTCT 5160 GCAAACTTCC TCATGTCAGT GTTGCAAACT CTACAAGTAC GAGAGACACC CTAACAAACC 5220 AAACCTACAA CCTACGCCAA TTCCTAACTA CCCATGTGAA ATACTTCACA TCGACATTTT 5280 TGCGCTCGAA AAAAGGTTAT ACCTAAGTTG TATTGACAAA TTTAGCAAGT TTGCCAAACT 5340 TTTCCATCTG CAGTCAAAAG CATCTGTGCA TTTGCGAGAA ACTTTGGTGG AGGCCCTACA 5400 TTACTTCACC GCCCCTAAGG TCTTGGTTTC GGATAACGAG CGAGGGTTGT TATGCCCCAC 5460 AGTGCTCAAC TATCTTCGGT CTCTAGATAT CGATCTGTAT TATGCTCCAA CCCAGAAGAG 5520 CGAAGTAAAT GGTCAAGTCG AGAGATTCCA CTCTACGTTC CTAGAAATTT ATCGTTGCCT 5580 TAAAGATGAG CTCCCTACCT TCAAACCCGT TGAGCTGGTA CACATAGCAG TGGACCGCTA 5640 CAACACTTCC GTTCACTCGG TAACGAATCG AAAACCAGCA GACGTTTTTT TCGACCGCTC 5700 GTCAAGGGTA AACTATCAGG GTCTGACAGA TTTCCGGCGG CAGACTTTAG AGGACATCAA 5760 GGGCTTAATT GAGTATAAGC AAATTAGAGG TAATATGGCT CGGAATAAAA ATAGGGACGA 5820 GCCAAAGTCT TATGGGCCGG GAGATGAAGT TTTTGTTGCA AATAAGCAAA TAAAAACAAA 5880 GGAAAAAGCG AGGTTCAGAT GCGAAAAGGT ACAGGAAGAC AACAAGATAA CAGTTAAAAC 5940 CAGATCAGGA AAAATTTTCC ACAAATCTGA TCTAAGAAAT TGAGACGTGG CTTTCACATT 6000 TAAAAAAGAA ACGCGAAAAA GAATAACGAA AGTAATAAAA GTACGTTGTG GCAGCTAATG 6060 AAATATTCCA CCCATGCATA CCCTATATAA AAAAAACATT AATAAAAAAA AAAAAAAAAA 6120 AAAAAAAAAA AAAAAAAAAT GAGTTAAGAA ATACAAAAAG AAATACAAAA AAAACTATAA 6180 AAAAAATAAT ATAAAAAAAT ACAGATTATA AGAAATAAGA AATAAGAAAT ATAAAAAAAT 6240 AAAAATATAA GTACACAAAA TGTACCGTAC CCCCACACAC TACGTAGTCT TAGAACAACT 6300 TAGACGACCA GATATTTACG AATTGTCTTT TTGTAAGCGC GATTTCTGCA TGCGGCGCAA 6360 ATCCCGCTCA CTGGACTGGC TGGGGTCGGC TTGGAAATGG GTAGCTGGAT CTCCAGATGC 6420 TGCTGATTGG AACGCCGTCT TGGCCGCGCA AGCGACGGCT TCGAGGAACT GCAAAAACTG 6480 GAGGAGGCTA GCTGTATCCC TCGGCTACTG AAGTAACCAA CGAGTGGTTA AGCAAGTCGA 6540 CGATGGAATG CTCCTCCTGA CCAACTTCAA CGGAACTCTA AGAACGGCTG CAGAGAACTA 6600 CGACCTGATC GGCTCCTTTA TCATCCAATT CGACAATGAG ACGATAATGG TCAACGGTCA 6660 AAACTATTCC AGTTACTCGG TCAGTCATCT AATGGCGATG CCGGCCGTGT TGAGCCACAT 6720 AACGGCCAGC AACTTTCAAC TTTCTCTGGA ATACGTCCAC GACGTGAGCA TGAAGAATTT 6780 GGAAAAGATG TCCAACATGG CGAGTGAGCT ACTAGCCTCT CTTCTCACCG AGGCGGCACT 6840 CGCAATCTGC ATATTCCTAG GCTTTTATTT CCTATGGAAG AAGCTGATGT CCACCAAAGG 6900 CATGCCCGAT GTCCGCGAGA TTGCCGCAAA CTTAGAAGCA TTGGGCCAAA CCGAGCTGAA 6960 CAAGGCTCAC TAATCTGCGG GACGCAGATC TTGAGGGGGG AGGAGTTAAG AACCCTCTTC 7020 TTGCGCTCTT CGTCAGGACT CACCAGCGCT CGGCTCTCGT GTTTTCGGGC CCCGTCAGCA 7080 GGCGACTCGG GGCCTGTCTA GTAACATGTT CGTGTAAGTT ACGAACCCTC TTCTTGCGAT 7140 CTTCGTCAGG ACTCACCAGC GCTCGGCTCT CGTGTTTTCG GGCCCCGTCA GCAGGCGACT 7200 CGGGGCCTGT CTAGGAACAT GTTTGTGTAT GTGTGCATTC GGAACAAGTG CCGTTGGTCG 7260 CACTCAGGGT GAGGGGTCAA CGGGGGAAGC GGATATAAAA GCAGCGGGGC GGGAGAAGAG 7320 GTCCCAGTCT CGAACGGACA CATAACGGAA CCGCTAGCAG ATCGCGAACT GAATCTTAAA 7380 ATAAAGCTAA TCGTAAACTC GAACCCTCTT AACTATCTTG ACTATTATTT GGAGAACCAC 7440 AGCATGTTGG TTGTCATATC AAGGTGAGGT ATGCGGCAGC GAGTGCCGAG AACCCTGATG 7500 CAAGTGGAAC TTGCGTTAAC T 7521 // ID DM_ROO standard; DNA; INV; 9092 BP. XX AC AY180917; XX DR FLYBASE; FBte0000100; Dmel\roo. XX SY synonym: B104 XX FT source AY180917:1..9092 FT SO_feature five_prime_LTR ; SO:0000425:1..429 FT SO_feature three_prime_LTR ; SO:0000426:8665..9092 FT SO_feature CDS ; SO:0000316:1275..8357 FT /name="Dmel\roo\ORF" FT /db_xref="FLYBASE:FBgn0043856" FT /db_xref="NCBI_PROTEIN:AAN87269.1" FT /translation="MMSEKTIQFLKKQSEIILEIRKLEVKPTLTDVEILKLNELQKCF FT IANHSNLLKIGVVDHEYFNAKQYDLIMMVLEKIKNKNEKIKGESVENTFPKSNTVPKS FT NPPPTLNLEMRGHPEKEGIAQNNALKVEQAFRNNVGQFRVYLEDTSKLIDSSPDFLKI FT RKNKIEFLWHKIDNLIEQVNSRFESSLFEEEISELEFDKQNILTAINSRLSGTINKAE FT MSTVVKAEELPTLPKIQIPTFFGDSKEWDLFNELFTELIHVREDLSPSLKFNYLKSAL FT KGEARNVVTHLLLGSGENYEATWEFLTKRYENKRNIFSDHMNRLMDMPNLNLESNKQI FT KTFIDTINESIYIIKLKAQLPEDVDAIFAHIILRKFNKESLNLYESHVKKTKEIQALS FT DVMDFLEQRLNSISSFSQEVKPVKKMINNNKNKNYSDNCAYCKLPGHYLIQCHKFKIM FT NPAERSDWVRKNGICLRCLRHPFGKKCISEQLCSTCRKPHHTLLHFAGHNPEKVNTCR FT TTGQALLATALIQVKSRYGGFEQLRALIDSGSQSTIISEESAQILKLKKFRSHTEISG FT VSSTGTCISKHKAVISIRNSPKNLEIEAIILPKLMKALPVNTINVDQKKWKNFKLADP FT DFNKPGRIDLIIGADVYTHILQNGVIKIDGLLGQKTDFGWIVSGCKKSKGKETIVATT FT IEIKELDRYWEVEEEEKDDIESEICENKFIKTTKKDSDGRYIVSIPFKEDVTLGDSKK FT QAIARYMNLEKKLKRNEKLKVDYTKFMNEYMDLGHMIEVSDEGKYFLPHQAVIRDSSL FT TTKLRVVFDASAKTTNNKSLNDIMWVGPRVQKDIFDIIIKWRKWEFVVSADIEKMYRQ FT IKIDNNDQKYQYILWRNSPKEKIKTYKLTTVTYGTASAPYLATRVLVDIADKCKNQVI FT SAIIRNDFYMDDLMTGADSVEEANKLITLIPHELQKVGFNLRKWISNNSKILTTVEDT FT GDNKVLNIIENECVKTLGLKWEPQKDLFKFSVNCNDESKNINKRVVLSTLAKIFDPLG FT WLAPVTVSGKLFIQKLWINKSEWDQELSIEDKNYWEKYKENLLLLENIRIPRWINSNS FT SSVIQIHGFADASEKAYAAVVYAKVGPHVNIIASKSRVNPIKNRKTIPKLELCAAHLL FT SELIQRLKGSIDNIMEIYAWSDSTITLAWINSGQSKIKFIKRRTDDIRKLKNTEWNHV FT KSEDNPADLASRGVDSNQLINCDFWWKGPKWLADPKELWPRQQSVEEPVLINTVLNDK FT IDDPIYELIERYSSIEKLIRIIAYINRFVQMKTRNKAYSSIISVKEIRIAETVVIKKQ FT QEYQFRQEIKCLKIKKEIKTNNKILSLNPFLDKGGVLRVGGRLQNSNAEFNVKHPIIL FT EKCHLTSLLIKNAHKETLHGGINLMRNYIQRKYWIFGLKNSLKKYLRECVTCARYKQN FT TAQQIMGNLPKYRVTMTFPFLNTGIDYAGPYYVKCSKNRGQKTFKGYVAVFVCMATKA FT IHLEMVSDLTSDAFLAALRRFIARRGKCSNIYSDNGTNFVGAARKLDQELFNAIQENI FT TIAAQLEKDRIDWHFIPPAGPHFGGIWEAGVKSMKYHLKRIIGDTIFTYEEMSTLLCQ FT IEACLNSRPLYTIVSEKDQQEVLTPGHFLIGRPPLEIVEPMEDEKIGNLDRWRLIQKI FT KKDFWVKWKSEYLHTLQQRNKWKKEIPNIEEGQIVLLKDENCHPARWPLGKVEKVHKG FT NDDKVRVAKVKMQEGYITRPITKICPLEGIKSVDKNEADQEPKRRTRATSGMSKIGII FT MAMLLFVLSCQVSSALPKDIAPRYSIDKINKTSAIYLDPLGDVEIVSTSWNLVIYYKM FT DPYFKMLTKGNALIQSMRKVCERLHSFEEQCSLVLDNMQSQLSELEENNKLFMMQSRS FT RSKRAPFEFMGSLYHILFGIMDEDDREQLEENMKNLLDNQNNLDKLIQKQTSVVDSTS FT NLLKRTTEDVNSNFRSMQIRIENMTEVLKENYYVYKESIKFFMITKQLHSLIEEGEKI FT QAGIISLLIDINHGRLNTNILRPNQLKKEIAKIQQSLSENLVIPGKRSGTELKEVYTL FT LTARGLFIDDKLIISAKVPLFSRHPSKLFRLIPVPIRNEDRIIMVHTTSEYLIYNFEI FT DSYHIMTEATLNQCQKWQLNKRICKGSWPWNSANDNACEIQPLKPDKAANCIYKTVVD FT SKSYWVELEKKSSWLFKVPANSKVRLQCTGSQIELFDLPQQGVLSIAPYCTARTDDKI FT LVAHHNIQSESEELLSTPYIGEVSGVPKIIWDPLKLSILNHTEEFERLNNEIKFMKEN FT HQKLKDLHFHHISGHAGLIIALILMIVLIIYFIRKCAVQQRMQAITFAGPLPVLXX" XX CC Sequence from P1 sequence DS00941:20448..29535 provided by CC Guochun Liao, Berkeley Drosophila Genome Project. XX SQ Sequence 9092 BP; 3468 A; 1442 C; 1710 G; 2472 T; 0 other; TGTTCACACA TGAACACGAA TATATTTAAA GACTTACAAT TTTGGGCTCC GTTCATATCT 60 TATGTAAATG AATCGAGAGC GATAAATTAT ATTTAGGATT TTGTTATCTA AGGCGACATG 120 GGTGCATTGC TCAAAAACAT GTAATTTAAG TGCACACTAC ATGAGTCAGT CACTTGAGAT 180 CGTTCCCCGC CTCCTAAAAT AGTCCCTTAG TGGGAGACCA CAGATAAGGT CCTCGCCGCT 240 CAAGATAGGC AGATGTGCCC GAGCGTGGGA CCTCGATAAG GCGGGGACTA TTTACGTAGG 300 CCTCTGCGTA GGCCATTTAC TTTAAGATGC GATTCTCATG TCACCTATTT AAACCGAAGA 360 TATTTCCAAA TAAAATCAGT TTTTTTACAA AAACTCAACG AGTAAAGTCT TCTTATTTGG 420 GATTTTACAT TTGGTCAATC GAGCCTTTAA TCGACTCTGC AGTTTCCCCC TACCAAAGGT 480 AAGGAACTCA GAGAAAGGCC AGCTCCTTTA AGCATCTTAC AGCTAAAGGT AGCAAAAATA 540 AGTGACTCTT GTTTCCCCCT ACCAAAGGTA AGGAACAGAG TATAAATATA AAAAGCAAAA 600 GATACAAAAG AATCTTTTAT GTTTTAAAAC AAGCACCTTA TAGTCTATAG CTAAAGGTTG 660 CTTTGTGTAC CATTATAAAT TGTGGTAAGG CGTGCTTGAG GCCATACATC AGCAATTGTG 720 AAATTAAAAA GTGCATAACA AAAGTGCCTT ATAAATGCTC TAATAGCATT AAATCAGCTC 780 ATAAATAGAG TGCAGTGTAT ATGCCATAAG AGCATAAATT AAATAAAAAG TGCCTGAAAA 840 CAGTGCCTTA TAAATGCTCT AATAGCATTA AATCAGCTCA TAAATAGAGT GCAGTGTATA 900 TGCCAAAAGA GCATAAATGC CGAAATAAAT GGCTAAAAAA CAAAAAATCT GACTGGACTA 960 CAAAAATAAT AAAACGTGCC AAAAAAAAAA AAAAAATCAT CTTTAAACAT CGACGGAGCC 1020 TTAAAGAAGA GAAGGAAGTC AAATTCAAAG GAGCCTCTAC CAGCAGCAGA AGCAGCAACA 1080 ACAGCAGCAG CAGAAGCAGC AACAGCAGTA GCAACAGCAG CAACAACAGC AGCAACAGCA 1140 GCAGCAACAA CAACGACATC AGCTAAGTCA AAACAAGAAT TTTCTGTTTA TCCAAACACA 1200 CATATATATA TAAATACATA TAAAATACAT ATACACGTAC TATATATATT AAGAAATTAC 1260 AAAAAATTTT CAAAATGATG TCAGAAAAGA CTATTCAATT CCTTAAGAAG CAGTCCGAAA 1320 TTATTTTGGA AATTAGAAAG TTGGAAGTAA AACCAACATT AACAGATGTA GAAATTCTAA 1380 AATTAAATGA GCTTCAAAAA TGTTTCATTG CTAATCATAG CAATTTGTTA AAGATCGGCG 1440 TTGTCGATCA TGAATATTTT AACGCGAAGC AGTATGATTT AATAATGATG GTGTTAGAAA 1500 AAATTAAAAA TAAAAATGAA AAAATTAAGG GCGAGTCGGT AGAAAACACT TTCCCTAAAT 1560 CAAACACTGT CCCTAAATCA AACCCTCCCC CTACATTAAA CCTTGAAATG CGTGGTCACC 1620 CTGAAAAAGA GGGTATAGCA CAAAACAACG CTTTAAAAGT AGAGCAGGCA TTTCGTAATA 1680 ATGTTGGCCA ATTTCGAGTA TATCTAGAAG ATACGTCTAA ACTAATAGAC AGTAGTCCAG 1740 ATTTCCTTAA AATAAGGAAA AATAAAATTG AATTTTTATG GCATAAAATA GATAACCTGA 1800 TTGAACAGGT GAATAGTCGT TTTGAGAGTT CGCTATTCGA AGAAGAAATT AGCGAACTTG 1860 AATTTGACAA ACAAAATATT CTTACAGCCA TTAATAGTCG ACTCAGTGGC ACAATAAATA 1920 AAGCTGAAAT GTCGACGGTT GTTAAGGCGG AGGAGTTACC AACCCTGCCT AAAATACAGA 1980 TTCCCACCTT CTTTGGTGAT TCCAAAGAAT GGGATCTTTT TAATGAACTC TTTACAGAGC 2040 TCATACATGT GAGAGAGGAT CTCAGTCCTT CTCTCAAATT TAATTATCTA AAGTCAGCAT 2100 TAAAAGGAGA AGCCAGAAAT GTGGTTACTC ATTTACTGCT CGGCTCTGGA GAAAATTATG 2160 AAGCCACTTG GGAGTTTTTG ACCAAGCGAT ATGAGAATAA AAGAAACATA TTCTCAGATC 2220 ATATGAATAG GCTTATGGAT ATGCCAAATT TAAATTTAGA ATCCAATAAG CAAATAAAGA 2280 CATTTATTGA CACGATTAAC GAGTCAATTT ATATTATAAA ATTAAAGGCA CAATTACCAG 2340 AAGATGTGGA TGCAATTTTC GCTCACATAA TTCTTCGGAA ATTCAATAAA GAATCACTCA 2400 ATTTATATGA AAGCCATGTT AAAAAGACAA AAGAAATACA GGCACTTTCT GATGTCATGG 2460 ACTTTTTAGA GCAAAGGCTC AATTCTATAT CATCATTCTC ACAGGAAGTA AAACCTGTAA 2520 AGAAAATGAT TAATAATAAC AAGAATAAAA ATTATAGTGA CAATTGTGCA TATTGCAAAC 2580 TACCAGGGCA TTATTTAATT CAATGCCATA AATTTAAAAT AATGAATCCA GCAGAACGGT 2640 CTGACTGGGT AAGAAAAAAT GGGATTTGCC TAAGATGTCT GAGGCATCCG TTTGGTAAAA 2700 AATGTATAAG CGAGCAGCTT TGTTCGACTT GTCGTAAACC TCACCACACG TTACTTCACT 2760 TTGCAGGTCA TAATCCAGAA AAAGTGAATA CGTGTAGAAC AACAGGTCAA GCCTTGTTGG 2820 CCACGGCCTT GATTCAAGTA AAGTCGAGGT ATGGAGGCTT TGAACAATTA AGAGCATTGA 2880 TTGATAGTGG CTCTCAAAGC ACAATTATTT CAGAAGAGTC TGCACAGATT CTAAAATTGA 2940 AAAAATTTCG GTCTCATACT GAAATAAGTG GAGTATCTTC CACAGGAACG TGCATCTCCA 3000 AGCACAAAGC GGTTATTTCG ATAAGAAATT CTCCGAAAAA TTTAGAAATT GAAGCAATTA 3060 TTCTCCCAAA ACTTATGAAG GCACTTCCAG TCAACACGAT TAATGTTGAT CAGAAAAAAT 3120 GGAAGAACTT TAAATTAGCC GACCCCGATT TTAATAAACC GGGTCGCATT GATTTAATCA 3180 TTGGAGCAGA CGTATATACT CACATTCTGC AAAATGGAGT TATAAAAATA GACGGTCTCC 3240 TTGGGCAAAA AACTGATTTC GGGTGGATAG TTTCTGGATG TAAAAAATCC AAAGGAAAAG 3300 AAACCATTGT AGCCACAACA ATAGAAATAA AAGAGTTAGA TCGCTACTGG GAAGTGGAAG 3360 AAGAAGAAAA AGATGATATC GAGTCTGAAA TCTGTGAAAA TAAATTTATC AAAACGACAA 3420 AAAAAGATTC AGATGGGCGA TACATTGTGT CAATTCCATT CAAGGAGGAT GTCACCTTAG 3480 GAGATTCAAA GAAACAAGCG ATAGCTCGTT ACATGAATCT GGAGAAAAAA CTAAAAAGAA 3540 ATGAAAAACT TAAGGTTGAC TACACTAAAT TCATGAATGA ATACATGGAT TTAGGACACA 3600 TGATTGAAGT GAGTGATGAA GGCAAATATT TTTTACCGCA CCAGGCAGTG ATTAGAGATT 3660 CAAGCCTTAC GACCAAATTG AGAGTAGTTT TTGATGCTTC AGCAAAAACT ACGAATAACA 3720 AAAGTTTGAA CGACATAATG TGGGTTGGGC CACGAGTTCA AAAAGATATT TTTGACATTA 3780 TTATTAAATG GAGAAAATGG GAATTTGTTG TTTCGGCAGA CATTGAAAAG ATGTACCGAC 3840 AAATTAAAAT AGATAATAAT GATCAAAAAT ATCAATATAT TTTATGGAGA AATTCTCCAA 3900 AAGAAAAAAT TAAAACATAT AAATTAACCA CAGTCACTTA CGGAACTGCA TCTGCACCAT 3960 ATTTGGCTAC CAGGGTTCTG GTAGATATTG CAGATAAATG TAAAAACCAA GTTATTAGTG 4020 CAATAATTAG GAATGATTTC TATATGGATG ACCTAATGAC TGGAGCTGAT TCGGTAGAAG 4080 AAGCTAATAA ATTAATAACA TTAATTCCCC ATGAATTGCA GAAAGTTGGA TTCAACTTAA 4140 GGAAATGGAT TTCCAACAAT TCCAAAATAT TAACCACTGT GGAGGACACA GGGGACAATA 4200 AGGTTCTCAA TATTATCGAA AATGAATGTG TTAAAACTTT AGGACTAAAA TGGGAACCTC 4260 AAAAGGATTT ATTTAAGTTC AGCGTAAATT GTAATGATGA ATCAAAAAAT ATAAATAAGC 4320 GCGTTGTGTT ATCAACGCTA GCAAAAATAT TTGATCCGTT AGGATGGTTG GCACCAGTCA 4380 CGGTTTCAGG AAAACTTTTT ATTCAAAAAC TTTGGATAAA TAAAAGTGAA TGGGATCAGG 4440 AATTATCCAT AGAAGATAAA AATTATTGGG AAAAATATAA AGAAAATTTA TTATTGTTAG 4500 AGAATATTCG AATCCCAAGG TGGATTAATT CAAACAGTTC TTCAGTCATT CAGATTCACG 4560 GATTTGCGGA CGCCTCCGAA AAAGCATATG CTGCAGTAGT CTATGCTAAA GTAGGACCTC 4620 ATGTTAATAT AATAGCTAGC AAAAGTAGAG TCAACCCTAT AAAAAATAGG AAGACAATTC 4680 CCAAACTCGA GCTGTGTGCA GCTCACCTGC TTAGTGAATT AATCCAAAGA CTAAAAGGAT 4740 CAATTGACAA TATAATGGAG ATCTATGCTT GGAGTGATTC CACGATTACC TTAGCATGGA 4800 TTAACAGTGG TCAAAGTAAG ATCAAATTTA TAAAAAGAAG AACGGATGAC ATTCGGAAAT 4860 TAAAAAATAC TGAATGGAAT CATGTTAAGT CAGAGGATAA TCCAGCAGAT TTAGCATCCA 4920 GGGGAGTGGA TTCTAACCAG TTGATCAACT GTGATTTTTG GTGGAAAGGT CCGAAATGGC 4980 TAGCAGACCC AAAAGAACTT TGGCCTCGGC AGCAGTCTGT AGAAGAACCT GTCTTAATAA 5040 ATACGGTATT AAATGACAAA ATAGATGATC CTATTTACGA ATTAATAGAA AGGTATTCCA 5100 GTATAGAAAA ACTTATACGT ATAATAGCAT ACATAAATAG ATTCGTGCAG ATGAAAACAA 5160 GAAATAAAGC CTATTCATCA ATTATTTCAG TAAAGGAGAT AAGAATAGCG GAAACAGTTG 5220 TTATTAAGAA ACAACAAGAA TACCAGTTTA GGCAAGAGAT AAAGTGCCTT AAAATCAAAA 5280 AGGAAATCAA GACAAATAAT AAAATATTGT CATTGAATCC ATTTTTGGAC AAGGGTGGGG 5340 TTCTAAGAGT TGGAGGAAGA TTGCAAAATT CCAATGCAGA ATTTAATGTT AAACATCCAA 5400 TCATTTTAGA AAAATGCCAC CTAACAAGCT TATTAATAAA AAATGCTCAT AAGGAAACAT 5460 TGCATGGAGG GATAAACCTA ATGCGAAACT ATATCCAAAG AAAGTATTGG ATTTTCGGGT 5520 TGAAAAATTC GTTGAAAAAG TATTTAAGAG AATGTGTAAC GTGTGCAAGG TATAAACAAA 5580 ATACAGCTCA GCAAATAATG GGTAACTTGC CAAAATATAG AGTGACGATG ACATTCCCGT 5640 TTCTTAATAC TGGAATAGAT TACGCAGGTC CTTATTATGT TAAATGTTCA AAAAATCGTG 5700 GCCAAAAAAC ATTTAAAGGA TACGTTGCTG TATTCGTTTG CATGGCCACC AAAGCCATAC 5760 ACTTAGAAAT GGTAAGCGAT CTAACTTCAG ACGCATTTTT AGCAGCACTC AGAAGATTTA 5820 TTGCTAGACG GGGAAAATGT TCCAATATCT ATTCAGACAA CGGAACAAAT TTTGTAGGAG 5880 CTGCAAGAAA ATTAGATCAA GAGTTATTTA ATGCAATACA AGAAAATATA ACGATTGCAG 5940 CGCAACTTGA AAAGGACAGG ATTGATTGGC ATTTTATTCC CCCGGCAGGA CCTCACTTCG 6000 GAGGTATTTG GGAAGCTGGA GTTAAGTCAA TGAAATACCA TTTAAAGCGT ATAATCGGCG 6060 ACACTATTTT TACTTATGAA GAAATGTCAA CTCTTTTATG TCAAATAGAA GCATGCTTAA 6120 ATTCAAGGCC ATTATACACT ATAGTTAGTG AGAAGGACCA ACAAGAAGTT TTAACACCAG 6180 GTCATTTTTT AATTGGAAGA CCACCTTTAG AAATAGTCGA ACCAATGGAA GATGAAAAAA 6240 TCGGAAATTT GGATAGGTGG AGACTTATCC AAAAAATAAA GAAAGATTTC TGGGTTAAGT 6300 GGAAAAGTGA ATATTTGCAT ACGCTCCAGC AAAGGAATAA ATGGAAAAAG GAAATTCCTA 6360 ATATAGAAGA AGGGCAAATA GTTTTATTAA AGGATGAGAA TTGTCATCCT GCAAGATGGC 6420 CTTTAGGAAA GGTGGAAAAG GTGCATAAGG GGAATGATGA TAAGGTCCGA GTGGCTAAAG 6480 TAAAGATGCA GGAAGGATAT ATCACTAGAC CCATTACTAA AATTTGTCCC TTGGAAGGAA 6540 TAAAGTCTGT TGACAAAAAT GAGGCTGACC AAGAGCCAAA AAGACGAACT AGAGCGACAT 6600 CGGGAATGTC CAAGATCGGA ATCATTATGG CAATGTTGTT GTTTGTGTTA AGTTGTCAAG 6660 TTTCTAGCGC ATTACCTAAA GATATAGCAC CAAGATATTC TATAGACAAA ATAAATAAAA 6720 CCTCAGCAAT ATATCTAGAC CCGCTAGGAG ATGTTGAGAT TGTGAGTACT TCTTGGAATT 6780 TGGTTATCTA TTATAAAATG GATCCATATT TTAAAATGTT AACAAAGGGT AATGCGCTTA 6840 TACAAAGTAT GAGGAAAGTT TGCGAAAGAC TTCATAGCTT TGAAGAGCAA TGTAGTCTAG 6900 TCTTAGATAA TATGCAAAGT CAGTTATCGG AACTTGAAGA AAACAATAAA TTGTTTATGA 6960 TGCAGTCTAG ATCTAGAAGC AAGCGTGCTC CTTTCGAATT TATGGGTTCC TTGTATCATA 7020 TTTTATTTGG TATAATGGAT GAAGATGATA GAGAGCAATT AGAAGAAAAT ATGAAGAATT 7080 TGTTAGATAA CCAGAACAAC CTTGATAAAC TAATTCAAAA ACAAACATCT GTGGTTGATT 7140 CAACTTCTAA TCTATTAAAG AGAACAACAG AAGATGTTAA CTCCAATTTT AGAAGTATGC 7200 AAATAAGAAT TGAGAACATG ACAGAAGTTC TTAAAGAAAA TTATTATGTT TATAAGGAAT 7260 CAATAAAATT CTTTATGATT ACGAAACAGC TACACTCATT GATTGAAGAA GGCGAAAAAA 7320 TTCAAGCAGG CATTATAAGC CTGTTGATTG ATATTAATCA CGGTAGGCTA AATACAAATA 7380 TTCTCAGGCC AAATCAGCTT AAAAAAGAAA TTGCCAAAAT TCAGCAGAGT CTTTCAGAGA 7440 ACCTAGTAAT TCCAGGAAAA CGGTCAGGTA CGGAACTTAA GGAGGTGTAT ACACTGTTAA 7500 CAGCCAGGGG TTTATTCATC GACGATAAAT TGATCATTAG TGCAAAAGTG CCTCTGTTTA 7560 GCAGGCATCC ATCCAAATTG TTCAGGCTTA TTCCGGTGCC AATTCGAAAT GAAGATCGGA 7620 TAATAATGGT GCATACAACG TCCGAATATT TAATTTATAA TTTTGAGATA GATTCCTATC 7680 ACATAATGAC GGAAGCCACA TTAAATCAAT GTCAGAAATG GCAACTAAAT AAGAGAATAT 7740 GCAAAGGAAG TTGGCCCTGG AATTCAGCGA ATGATAATGC ATGTGAGATT CAGCCTCTAA 7800 AGCCAGATAA AGCGGCGAAC TGCATCTATA AAACAGTAGT CGACTCTAAA AGTTACTGGG 7860 TAGAGTTAGA AAAGAAAAGT AGTTGGTTGT TTAAGGTTCC TGCGAATTCA AAAGTCCGTC 7920 TGCAATGTAC TGGCTCTCAA ATTGAATTGT TTGATTTGCC TCAGCAAGGA GTTTTAAGCA 7980 TTGCGCCATA TTGTACGGCA AGAACCGACG ATAAAATTCT AGTTGCCCAC CATAACATTC 8040 AGTCCGAAAG TGAAGAATTA TTATCAACAC CTTATATAGG AGAAGTTAGT GGAGTGCCGA 8100 AGATTATTTG GGATCCGCTG AAACTATCAA TATTAAATCA TACTGAGGAA TTTGAACGAT 8160 TGAATAATGA AATTAAATTT ATGAAAGAGA ACCATCAAAA ATTGAAAGAT TTACATTTCC 8220 ATCATATTTC CGGACATGCT GGATTAATTA TTGCTTTAAT ACTAATGATA GTATTAATAA 8280 TATATTTCAT ACGGAAATGT GCTGTGCAAC AAAGAATGCA AGCAATAACC TTTGCAGGTC 8340 CGTTGCCAGT ACTATAAATA TCAATAGTAA ATAAACAATA AAATAATATA ACAAATAAAA 8400 ATATACAGTC CACTAATAGA AAATGTACTT CTACATAGAA AAAGCAAAAT GTTTAAAATA 8460 AGTTAATTAA GTACAAATTG TTGAATTAAA AATAATATAA ACCATAATTG TAATCCAATA 8520 AAATTAAAAG CCAGAAAAAC TAGGCCCATT GAAATCTTAG TTGCAAAATA AATGAACATA 8580 TATCAAATAA ATACAGTCCA CTACTGTTAT AAATGCAACT AATATACTAA TGTACATCTC 8640 AGCTTTGCTG GCCCTTTGGC AGAATGTTCA CACATGAACA CGAATATATT TAAAGACTTA 8700 CAATTTTGGG CTCCGTTCAT ATCTTATGTA AATGAATCGA GAGCGATAAA TTATATTTAG 8760 GATTTTGTTA TCTAAGGCGA CATGGGTGCA TTGCTCAAAA ACATGTAATT TAAGTGCACA 8820 CTACATGAGT CAGTCACTTG AGATCGTTCC CCGCCTCCTA AAATAGTCCC TTAGTGGGAG 8880 ACCACAGATA AGGTCCTCGC CGCTCAAGAT AGGCAGATGT GCCCGAGCGT GGGACCTCGA 8940 TAAGGCGGGG ACTATTTACG TAGGCCTCTG CGTAGGCCAT TTACTTTAAG ATGCGATTCT 9000 CATGTCACCT ATTTAAACCG AAGATATTTC CAAATAAAAT CAGTTTCTTA CAAAAACTCA 9060 ACGAGTAAAG TCTTCTCATT TGGGATTTTA CA 9092 // ID BLOOD standard; DNA; INV; 7410 BP. XX AC AY180916; XX DR FLYBASE; FBte0000279; Dmel\blood. XX FT source AY180916:1..7410 FT SO_feature five_prime_LTR ; SO:0000425:1..398 FT SO_feature three_prime_LTR ; SO:0000426:7011..7410 FT SO_feature CDS ; SO:0000316:966..1271 FT /name="Dmel\blood\sORF" FT /db_xref="FLYBASE:FBgn0045863" FT /db_xref="NCBI_PROTEIN:AAN87266.1" FT /translation="MSTKQTFEHPAPVEQRDLPSIKEVIEVDPSAGPKPLTIQEYKAR FT TAAREQPPKKKRGGRRIKLLSARRLNIELLKTATNEEDRQRYKERLAAINQQLRGAK" FT SO_feature CDS ; SO:0000316:1863..3116 FT /name="Dmel\blood\ORF1" FT /db_xref="FLYBASE:FBgn0045865" FT /db_xref="NCBI_PROTEIN:AAN87267.1" FT /translation="MEWLNLTISINNIRDAFDKSYKCINKTALIKTQTLIFHIKVLIT FT QYNTLQNLIVTNKSKLTEEHKVQCFKVLSSFGKRLHNTSVRHSIIIEVPTELTKIAEF FT DESQLRDLDESQPLEDLDIESDIESIEELKFNTVQPNTRNMANALEAQRAYVKQVSAT FT VPDFDGKKLHLNRFVTALKLTDLTKGDQETLAVEVIKTKIIGPLNYKVEHATTIQAII FT TILQANVKGESPDVIKAKLINAQQRGKTASQYVTEIDSMRKQLEAAYIDGGLDADNAD FT KFATKESISAMTKNCANEALKMILTAGTFSTFNDAMEKYLHCSTEITGNSNTVLFYNG FT NNRRGNYNAYYRGRGRNNYNHNYNQNYNQGYNNNNRGRGGYRGHGNNRDGGNRRGNQS FT QNNNNNRNVRNVQSENSQTPLSDQQ" FT SO_feature CDS ; SO:0000316:3749..6733 FT /name="Dmel\blood\ORF2" FT /db_xref="FLYBASE:FBgn0045864" FT /db_xref="NCBI_PROTEIN:AAN87268.1" FT /translation="MKDYDIFTTPVEKENRTEEILKQLRFPKQFNNELTKLCTEFSDI FT FGLETEPISANNFYKQKLRLGEKTPVYIKNYRMADSQKPEIARQVKKLIDDGIVEPSM FT SEYNSPLLLVPKKPLPNSTEKRWRLAVDYRQINKKLLSDKFPLPRIEDILDQLGRAKY FT FSCLDLMSGFHQIELEKRYRDITSFSTANGSYRFTRLPYGLKVAPNSFQRRMTLAFSG FT LEPSQAFLYMDDLVVIGCSEKHMLKNLTNVFELCRRHNLKLHPGKCSFFMKEVTYLGH FT KCTDKGILPDDTKYEVIEKYPIPTDADSARRFVAFCNYYRRFIKNFSDHSRHLTRLCK FT KNVQFEWTAECNDAFEYLKTELMKPTLLQYPDFGKEFCITTDASKQACGAVLTQDHNG FT QQLPVAYASRMFTQGESNKSTTEQELTAIHWAINHFRPYIYGKHFMVKSDHRPLSYLF FT SMKNPSSKLTRMRLDLEEYDFTVEYLKGKDNHIADALSRITIKDLKTINREILKVTTR FT SKAKQENSCKDEAIVKIQEEKEQTIEKPKVYEVVNNNDTKKYVLIKIDKHKCLLKRGK FT TIVSRFDVDDLYSNETFDLNQFFQRLISKAGMHKITKMRISPSEQMFQFVSLNEFKIK FT GNRVLEKVELAILQKVIIIDKNDEAQIKEILTKFHDDPIEGGHTGISRTQSKIKRFYY FT WPQMTKTISKYVKTCLKCQQAKITTHTKTPLTLMPTPATAFDTVLIDTIGPLPKSEDG FT NEYAVTIICDLTKFLVTIPTPNKSAKTVAKAIFELFVLKYGPMKTFITDQGTEYKNSL FT MNELCKYMHIENLTSSAHHHQTLGTIERSHRTFNEYIRSYISVNKSDWDIWLPYFTYC FT FNTTPSIVHDYCPYELVFGRLPRQFKDFSKINKIDPIYNLDDYSKELKCRLELSYNRA FT RRMLEKAKADRKLRYDRNTNNFELKIGDKVLLRKETGHKLDKRYEGPYDVVDIGINDN FT ITIKTGSKKQQIVHKDRLKKHK" XX CC Sequence from P1 (complement)DS03023:69372..76782 provided by Guochon Liao, CC Berkeley Drosophila Genome Project. XX SQ Sequence 7410 BP; 2840 A; 1403 C; 1328 G; 1839 T; 0 other; TGTAGTATGT GCATATATCG AGGGTACACT GTACCTATAA GTACACAGCA ACACTTAGTT 60 GCATTGCATA AATAAATGTC TCAAGTGAGC GTGATATAAG ATCACCCATT TATGCTTTAA 120 GCTAAGTCAG CATCCCCACG CTGGCCGCTG GCCATATATG CGCATAAGCT CTCTCTCTCT 180 CTCTCTTATA CATATATATA TACGCTGCTC TTCTGCCGCT GTCGACGGCG GCGCAGTCGC 240 AGTATTTAGG TAAGATTAGA CACTCTGTAG AGGTTAAGCG GGCAGAACCG TTTCTGCTAC 300 TCGAAGAGAT AAGAAGAAAT AAAAAGGTGC CTGACGGCTG CACCCAACTG CAAGGAAAAC 360 ACGTGTTCTC AATTGGTGGC ATATATTGGT TTATTACATG GCGACCGTGA GGCAGGAGCC 420 TGCGATCTGA GGACTACTGA GGAAATGCTG CTAATATTGC CGATTTGATT TGGGAATTCT 480 AAACAGCGAC AACAGGTGTG AGAAGCAGGC CGCCCCTTAC ACCAGTGCGG GAGACCTAGA 540 GACGGGACAC TGATGAAAAA AAAAGAAACA AAAATACTGA GTGAGTAGAG TGTGGTAATG 600 GGCAAACGCG GATGTCAGGA AATCAAAAAT AAAGGTATAG CACATATTAA GTGGCTATGA 660 TATACAAATA AAACACCGCC CCCATGGGCA ACGGCACAGA AATTAACTGC CGAATTAGAC 720 TTTCTGAAAG AAAACCTCCA GCAAAGAAAG CCGAATACCA CAACTCACTC AGCAAAAATA 780 GAAATAATCA ATGAAGAAAT AACTGAAAAT TCAACATCAC CCAAGCCGAA AAGACCCGAC 840 GTCTGCATGA AAGACTGCCC TCGACCATTG TAAGCCGCAA CAGCAATTAG CACGGCATCC 900 TGCGAGGGTA GGATTAGGAT AAAGGATAAA GGATTCCACC GGCGCGCCGC ACATGACAAC 960 AGCGAATGTC TACCAAGCAG ACGTTCGAAC ACCCTGCTCC TGTCGAGCAA AGGGATCTGC 1020 CAAGTATCAA AGAGGTAATA GAGGTAGATC CGTCCGCGGG ACCAAAGCCC TTGACCATAC 1080 AAGAGTACAA GGCACGGACT GCAGCGAGGG AGCAGCCACC TAAAAAGAAG AGGGGTGGCC 1140 GCCGGATTAA GTTGCTCAGC GCCCGGAGGC TCAACATCGA ACTACTGAAG ACGGCAACTA 1200 ATGAGGAAGA CCGGCAGCGC TACAAAGAGC GCCTTGCAGC CATCAATCAA CAACTTCGTG 1260 GTGCGAAGTA AAGCGGCGGG CTGCGTTATA CGCCATAGCC TCAACCGCCC AAATATTATA 1320 TTAATGTTGT CGATGCGGTT TCCGCTGCAA CAAAATTACT AACTTATCAG GGACCCATTT 1380 CATAACTAAC ACATTATACT CAGTCCTAAA CTTAAAATAA GTAATAATAT TGTAAAATTG 1440 CAAATTGCAA CCGATGTAAA CTGAGTATAA TGAATTCATC TATCAAGTAA AAATATGTTT 1500 AACAACAGTT TAGACCTATT AAAATTTCGA GCTATATTTA TATCTGATCG AGATAACAAT 1560 AATTGACCAA TTCTCAAAGT TAAAATTCTA TTTGTACTTT TGATATACAA ATAAAGACTA 1620 ATTTTCCCCA TATCAAAATG GGACATAAGT CGTGGATACA ACCCCACAGT TAAATTCAAT 1680 GTACTTACTA TTTTTGATTT TAGTTATCCT ATCAGCCTTT TTACCTTGGC CTTAAAACTT 1740 TATCAGTTTC ACACAAGATC GTTGAAAAGA CTTACATGAG TCGAGCCAAT GATTTAGACA 1800 AAATCTAATA GAAACTACAC CAAAAAGGTA CAAGGTCGAT TACATCGCTA AAAGGTACAT 1860 ACATGGAATG GCTAAACTTA ACCATATCCA TAAACAATAT TAGAGATGCT TTTGATAAAT 1920 CCTATAAATG TATTAATAAA ACCGCGCTGA TCAAAACTCA GACGCTTATT TTTCACATAA 1980 AGGTATTGAT AACACAATAC AACACATTAC AAAACCTAAT AGTAACAAAC AAAAGCAAAC 2040 TCACTGAAGA ACATAAAGTC CAATGCTTCA AAGTTCTCAG TTCATTTGGT AAAAGACTAC 2100 ATAATACCAG CGTTAGACAC AGTATTATAA TAGAAGTCCC AACAGAACTA ACCAAAATAG 2160 CAGAATTCGA CGAAAGCCAG TTAAGAGACT TGGACGAGTC GCAGCCGTTA GAAGATTTAG 2220 ATATCGAAAG CGATATCGAA TCAATAGAAG AATTAAAATT TAATACCGTA CAACCAAATA 2280 CAAGAAACAT GGCCAACGCA TTAGAAGCTC AGAGAGCATA CGTTAAACAG GTATCTGCCA 2340 CAGTACCTGA TTTCGATGGT AAGAAACTCC ATTTAAACAG GTTTGTGACA GCACTTAAGT 2400 TGACGGATCT AACTAAAGGA GATCAAGAAA CTTTAGCAGT AGAGGTCATA AAGACCAAAA 2460 TTATTGGCCC ATTAAACTAT AAAGTAGAAC ATGCGACAAC GATACAGGCA ATAATTACCA 2520 TATTGCAGGC AAACGTAAAA GGCGAATCGC CTGACGTTAT AAAGGCCAAA TTAATAAATG 2580 CCCAACAAAG AGGCAAGACC GCGTCTCAGT ATGTTACAGA AATAGACAGT ATGCGTAAGC 2640 AGCTCGAGGC AGCTTACATA GACGGCGGAT TAGACGCCGA TAATGCTGAC AAATTCGCGA 2700 CTAAAGAGTC GATATCAGCA ATGACCAAAA ACTGTGCCAA CGAGGCACTT AAAATGATCT 2760 TAACTGCAGG TACATTTAGT ACATTCAACG ACGCAATGGA AAAATACCTA CATTGCAGTA 2820 CAGAAATAAC CGGCAATTCA AATACAGTCT TATTCTATAA TGGGAATAAT AGACGTGGTA 2880 ATTATAATGC CTACTATCGT GGTAGAGGCA GAAATAATTA TAACCATAAT TATAACCAGA 2940 ATTATAACCA AGGTTATAAT AATAACAACA GAGGTCGCGG AGGCTACCGC GGCCACGGTA 3000 ATAACAGAGA CGGAGGTAAC CGAAGGGGTA ACCAAAGTCA GAATAATAAT AACAACCGAA 3060 ATGTGCGTAA CGTACAATCG GAAAACAGCC AGACCCCCTT AAGCGATCAA CAGTAAAAGT 3120 GTTTAAAGTA AACCTAAATC TGAGTATTTT CATTAAGACA AAAAACCATG AAACAAACAC 3180 AGTTCTTACA TTACTAATAG ACACAGGTGC AGAAATTTCA TTGCTAAAAG CCAAAGCAAA 3240 GGAATATAAT AATATAAATT TCAGTAATAT ATCAAATATT ACAGGTATTG GGCAAGGAAC 3300 CATACAGTCT ATAGGTACAG TAGATCTTGA CATACGCATT CAGGATGTTC TAGTGCCACA 3360 TGAATTTCAT GTAGTACCTG AGAATTTTCC GATACCATGC GATGGCATAA TCGGAATAGA 3420 TTTTATCAAG AAATACAATT GCGTATTAGA GTTTCAAAAT AACAAAGACT GGTTCACAAT 3480 AAGACCCAAT AACTTCAGTA GACAGATTAG TGTACCAATT ACACATAACT TAGACTCCAA 3540 CACACTCTTA TTGCCAGCTA GATGCGAAGT AATCAGACAA GTCAAATTAC TCACTAACGA 3600 AAAAACGGTG GTAGTACCAA ATCAGGAGCT GCAACCAGGT ATAATAGTAG CAAGCACCAT 3660 TGCCGATAGC AAAAACGCAT TGATTCGCAT TATAAATACA AATAATAAAG ACGCCATAAT 3720 AGATAGCGCG AAGATCAAAT GCGAATCAAT GAAAGACTAT GACATTTTTA CAACACCAGT 3780 AGAAAAGGAA AATAGAACTG AAGAAATTTT AAAACAATTA AGATTCCCTA AACAATTCAA 3840 TAATGAACTA ACTAAGTTAT GCACCGAGTT TAGCGATATT TTTGGTCTAG AAACAGAACC 3900 AATATCGGCT AACAATTTCT ACAAACAAAA ACTCAGATTA GGGGAAAAAA CACCGGTCTA 3960 TATAAAAAAC TATCGCATGG CAGATAGCCA AAAACCAGAA ATCGCCAGAC AGGTAAAAAA 4020 ATTAATAGAT GATGGAATAG TTGAACCATC AATGTCTGAA TATAATAGTC CATTACTTTT 4080 GGTTCCAAAG AAACCACTTC CGAATTCCAC GGAAAAAAGA TGGCGATTAG CAGTTGACTA 4140 TCGTCAAATA AATAAGAAAC TATTATCAGA CAAATTTCCA CTTCCAAGAA TAGAAGATAT 4200 TCTTGATCAA TTAGGAAGAG CAAAGTATTT TTCATGTCTC GACCTAATGT CTGGATTCCA 4260 CCAGATAGAA CTAGAAAAAA GGTATAGAGA TATAACGTCA TTTTCAACAG CCAATGGCTC 4320 ATATCGCTTC ACGCGATTAC CATACGGACT GAAAGTAGCA CCAAACTCCT TCCAACGTAG 4380 GATGACACTT GCATTTTCTG GTCTTGAACC ATCGCAAGCA TTTCTATATA TGGATGACTT 4440 AGTAGTAATA GGTTGTTCAG AAAAACATAT GCTCAAAAAT TTGACTAACG TATTCGAGCT 4500 ATGTAGACGA CATAATTTGA AACTACATCC AGGGAAATGT TCTTTCTTTA TGAAAGAAGT 4560 AACATATTTG GGTCACAAAT GTACCGATAA AGGTATACTC CCAGATGACA CCAAATATGA 4620 AGTTATAGAA AAATATCCTA TACCAACAGA TGCCGACAGT GCTAGGCGTT TCGTAGCCTT 4680 CTGTAATTAT TACAGACGTT TCATTAAAAA TTTTTCTGAT CATTCACGCC ACTTAACGAG 4740 GCTTTGTAAA AAGAATGTTC AATTCGAATG GACAGCAGAA TGCAATGATG CATTCGAATA 4800 CCTTAAAACA GAATTAATGA AACCAACATT ACTACAGTAC CCAGATTTCG GTAAAGAATT 4860 TTGCATAACA ACCGATGCTA GTAAACAGGC ATGCGGAGCG GTACTTACAC AAGATCACAA 4920 TGGTCAACAA CTTCCAGTGG CATACGCTTC AAGAATGTTC ACTCAAGGTG AAAGTAATAA 4980 GTCCACTACA GAACAAGAAT TAACGGCCAT TCATTGGGCC ATAAATCATT TTCGACCATA 5040 CATATATGGC AAGCATTTCA TGGTAAAAAG CGATCATAGA CCATTGTCAT ACCTATTCTC 5100 TATGAAAAAT CCAAGTTCAA AACTCACTCG TATGAGGCTG GATTTAGAAG AGTATGACTT 5160 TACTGTAGAA TATCTTAAGG GGAAAGATAA CCATATTGCG GACGCCTTGT CTCGCATAAC 5220 AATAAAAGAT CTGAAAACAA TCAACAGAGA AATATTAAAA GTTACCACCA GATCAAAAGC 5280 TAAACAGGAA AATTCCTGTA AGGACGAAGC AATAGTCAAA ATACAAGAGG AAAAAGAGCA 5340 AACAATAGAA AAGCCCAAAG TCTATGAAGT TGTCAATAAT AATGACACAA AGAAATATGT 5400 TTTAATCAAA ATAGATAAAC ACAAGTGTTT ATTAAAACGA GGAAAAACAA TTGTTTCACG 5460 CTTTGATGTT GATGACTTGT ATTCTAATGA AACATTTGAT CTAAATCAAT TCTTTCAAAG 5520 GCTTATTTCA AAAGCCGGAA TGCATAAAAT AACAAAAATG CGAATATCAC CAAGCGAACA 5580 GATGTTCCAA TTTGTATCAC TAAATGAATT TAAAATAAAG GGCAACCGAG TACTCGAAAA 5640 AGTAGAACTA GCTATTCTAC AAAAGGTGAT AATTATAGAC AAAAATGACG AAGCTCAGAT 5700 TAAAGAAATT TTGACAAAAT TCCATGATGA TCCTATAGAA GGAGGCCACA CTGGTATTTC 5760 GCGAACCCAG TCAAAAATCA AAAGATTTTA TTATTGGCCC CAGATGACCA AGACAATCTC 5820 AAAGTATGTA AAGACTTGTT TGAAATGTCA ACAAGCCAAA ATTACAACAC ATACGAAAAC 5880 TCCATTAACA TTGATGCCAA CGCCAGCAAC AGCATTTGAT ACTGTTTTAA TTGATACCAT 5940 TGGTCCACTA CCGAAATCGG AAGACGGAAA TGAGTATGCA GTTACAATCA TATGCGATCT 6000 AACCAAGTTT TTAGTAACTA TTCCAACACC AAATAAAAGT GCTAAAACAG TTGCAAAGGC 6060 TATATTTGAA TTATTTGTAC TGAAGTACGG TCCAATGAAG ACGTTCATTA CAGATCAAGG 6120 TACGGAATAC AAAAATTCAC TTATGAATGA ATTATGCAAA TATATGCATA TAGAAAATCT 6180 AACATCTAGC GCTCACCATC ATCAAACTTT AGGAACAATA GAAAGAAGCC ACCGAACTTT 6240 TAATGAATAT ATACGTTCAT ACATATCGGT TAACAAAAGT GATTGGGACA TTTGGTTACC 6300 ATATTTCACT TATTGCTTCA ATACAACACC CTCAATAGTC CATGACTATT GCCCATACGA 6360 ACTAGTATTT GGCAGACTAC CCAGACAATT CAAAGATTTC AGTAAGATAA ACAAAATAGA 6420 CCCAATATAC AACTTAGACG ACTACTCTAA AGAGCTTAAA TGCAGACTAG AATTGTCGTA 6480 CAACAGAGCA AGAAGAATGT TAGAAAAAGC AAAAGCGGAT AGAAAATTAA GATATGATAG 6540 GAATACAAAT AATTTCGAAT TAAAAATAGG AGATAAAGTA TTACTTAGAA AAGAAACAGG 6600 TCATAAGTTA GATAAAAGAT ATGAAGGTCC TTATGACGTA GTAGATATAG GAATAAATGA 6660 CAATATAACC ATTAAAACAG GAAGTAAGAA ACAACAAATA GTACATAAAG ATAGGCTAAA 6720 AAAGCACAAA TAGAATGAAA AAAAAAAAGG GCAATCAATG CCAAACCTTT CATAATAAAA 6780 CTTAAATAAC GGCCTGATCA GCCAAAACAA TATAACAAAG ACATAGACAT AATCGAATTT 6840 TTATTAATTC AAAATACATA CATATTTTTT CTTTATTCAT TTAAAAATTC TATATCATAA 6900 ATAATGTTAA TTCATTAAAA ATAATATTTA AGTAATTTTT ATTTTATAAT GGTAATATAG 6960 TTGATAGAAA ATAACTTCAT TTCTTTACGT TATTTTAAAA AAGAGGGGAG GTGTAGTATG 7020 TGCATATATC GAGGGTACAC TGTACCTATA AGTACACAGC AACACTTAGT TGCATTGCAT 7080 AAATAAATGT CTCAAGTGAG CGTGATATAA GATCACCCAT TTATGCTTTA AGCTAAGTCA 7140 GCATCCCCAC GCTGGCCGCT GGCCATATAT GCGCATAAGC TCTCTCTCTC TCTCTCTTAT 7200 ACATATATAT ATACGCTGCT CTTCTGCCGC TGTCGACGGC GGCGCAGTCG CAGTATTTAG 7260 GTAAGATTAG ACACTCTGTA GAGGTTAAGC GGGCAGAACC GTTTCTGCTA CTCGAAGAGA 7320 TAAGAAGAAA TAAAAAGGTG GCCTGACGGC TGCACCCAAC TGCAAGGAAA ACACGTGTTC 7380 TCAATTGGTG GCATATATTG GTTTATTACA 7410 // ID DMZAM standard; DNA; INV; 8435 BP. XX AC AJ000387; XX DR FLYBASE; FBte0000217; Dmel\ZAM. XX FT source AJ000387:1..8435 FT SO_feature five_prime_LTR ; SO:0000425:1..473 FT SO_feature three_prime_LTR ; SO:0000426:7963..8435 FT SO_feature CDS ; SO:0000316:join(494..531,6387..8004) FT SO_feature start_codon ; SO:0000318:1..3 FT /name="Dmel\ZAM\env" FT /db_xref="FLYBASE:FBgn0024272" FT /db_xref="SPTREMBL:O46113" FT /db_xref="NCBI_PROTEIN:CAA04048.1" FT /translation="MENTLLNLLLVLLSCHGAYQSIFIHNFNSTNLLAKVPVGKTLVIG FT NYKKISHIIDLSEYTNCIEKLYHTIDTLRQDETLTDSISILNAKLAQTQSKIDALTPFS FT RHKRGLINGLGSLVKVVTGNMDANDAKNIETEINHLKSQSTTISDNFEIQNSFNDEVQL FT RFKNLTRHINNEQNLIKNFFENTQNTIYTKIYNNEEEIKKLQYINRLNYNIDLLVSHLS FT DIIESTLLAKINVIPKLILDKTEITKIKQIFKTQNYTIKSEQHIYNLLKMNALNYQNKI FT IFSIKIPIFLSCNYEMARLIPLPINSTQFVIAPKYLIYNNKSNSMFSTMYKCPVIEEQF FT VCEIDSINNLKNNTCLGHLIQNKTSYCDIKETGLTTDVFEPEKGFILVFNGNNLPIISS FT NQTITSINGSAIIKYNNCTLKINEINYDNRAVSTEEHPDFFLPPMRKLIKNATINILTL FT ERLHLDTLTTSNKLLVVAAGNSRHSTTLYILFTVSLVAVILTWTLRRDTHIFHTGPDHI FT LPIVAPPIPPSMAFAPNWGGRSYRPIGTIHHPSL" FT SO_feature CDS ; SO:0000316:1789..2820 FT SO_feature start_codon ; SO:0000318:1..3 FT /name="Dmel\ZAM\gag" FT /db_xref="FLYBASE:FBgn0024271" FT /db_xref="SPTREMBL:O46114" FT /db_xref="NCBI_PROTEIN:CAA04049.1" FT /translation="MSKKLTQTIKQTTRSVLESHTFPKRVTRSVSKTNTLPVIRESTPL FT PPLQPINMDSGNASVGNSAPVTPTVSGFSSIATALSATDILAFVKELPTFDGTPGQLDK FT YITSVEEIIMLIRGTDQTPYGLLTLRAIRNKIVGRADEALNLANTKLIWDDIKSNLLRL FT YSSKKSEATLLGELQSLPDNLTLGQLFFGLSRIRSQLISITSNSGQSATIIEAKKTLYD FT EVCLNAFISRIREPLKTVIRLKDPKTIETAYELCQGERARYQNRNPYPPTQNNTERRTN FT NYNNNNNNNHRDNNNRNNVTRLTPKTTQTITQTPIPNIVNQTTATELVTRLKIIKQIMG FT YTT" FT SO_feature CDS ; SO:0000316:<2795..6448 FT SO_feature start_codon ; SO:0000318:1..3 FT /name="Dmel\ZAM\pol" FT /db_xref="FLYBASE:FBgn0024270" FT /db_xref="SPTREMBL:O46115" FT /db_xref="NCBI_PROTEIN:CAA04050.1" FT /translation="NKLWATQHRRRKTHPTLPYQLKFSGTRLRNPTGYINPTTHATSLP FT YITLNLQQKFPLSFLIDTGSNNSFIDPESANQLECTILPTSTSITTALNSFKIEEKAIF FT PMPPEFKTEGQITLLKFKFHSYFNGLIGMDLLSHLEAKVDLVNLQLVTSKSTLPIFLYT FT NQASKIFNIPAYSKVILPLPVKTNHGEFYCCTTQLNNELSLSEGLYKSNNNIANVEISN FT QSDSDKLLYLEYPLETIPYNKNDHIELFNISATPLNNDTPQAPLHILTEHLNPEEKTAL FT TTLCKQFRDIFYNPETPLTFTNKITHSIPTIDNTPIHTKSYRYPFVHKTEVKKQIESML FT DQQIIRSSHSPWSAPVWVVPKKLDGTGNRKWRLVIDYRKLNDKTISDRYPIPNINDILD FT SIGKAKYFSTLDLTSGFHQIEMNPKDIAKTAFTVEGGHYEFTRMPFGLKNAPATFQRVM FT DSVLGDLNGTICLFYLDDIIIFSPSLQKHLLDIKMVFEKLRAANFKLQPSKSEFLRKEI FT EFLGHIVTQDGVKPNPNKISAIKKFPCPTNRRAIKSFLGLLGYYRKFIRDFARITKPMT FT KQLKGKRQVTTDKDFVDAFEQCKTLLSNDPILIHPDFEKPFILTTDASNFALGAVLSQG FT SLQNDRPVCFASRTLSDTEVNYSTIEKEMLAIIWAVKYFRPYIYGVKFTIVTDHKPLIW FT LMNFKEPNSKIIRWRLQLMEYNFEIIHKKGSQNVIADALSRADPNLNYNETLTVKPCPT FT SEKPINEFNTQLILEIDTNTSYQTTTPFKQKIRKKYSQPCFDFDNIVKILKGTLKPNRI FT CAFLADDNNSALIEKAFSTYFAHKKHFKIIRCKSLLHEIVGNPEQNKFIQEYHTNSNHR FT GIDETFLHLKRETYFPNMKNKISELIRNCETCLKLKYDRQPQNIVFETPETPSKPLDII FT HIDIYTINNNFNLTIIDKFSKFAAVYPIPNRNGINCIKAIKNFFSQFGLPKKLIHDQGV FT EFCNDIFRKFCSQYNILLHVTSFQQSSSNSPVERLHSSLTEIYRIILDTRKKHKLPTDH FT EEIMSETVITYNNAIHSTTKHTPFELFNGRTHLFEKTIIPNNEHDYLNKLNTFQDKLYS FT EIKEKLSTNTQQRIEKLNTSRVEPTTVQPNSTIFRKENRRNKLTPRFSLHRTAKDKGKT FT LVTTRNQKIHKSKIRKISKPPNDLSLSTCIPDLAMGHTNLSSSTTSIAPTS" XX CC Derived from AJ000387 (e1237231) ((Rel. 54, Last updated, Version 1). CC Takis Benos and Michael Ashburner, 19-Jan-1998. CC Any changes to original sequence record are annotated in an FT line. XX SQ Sequence 8435 BP; 3286 A; 2055 C; 1151 G; 1943 T; 0 other; AGTTACCGAC CCATCGGTAC CATACACCAC CCCTCCCTCT AAGCCACCAC GCCTACACAA 60 GTAGAAGACA TCGAACCGGG AAGCTTTGCG ATACAAAGTT GCAGCATAAA CATCAACAAC 120 GGGTCAGACG CCGACATCCG CCCAAAATGC TGACACCACA TCCTTTTCGC TCAGACAGAA 180 CAACGCATAC AATTCCATAT ACATACGTAT AAACATACTC ATACTTTCTG CTGTGTCAGA 240 TACTTTATTT CTAAGAACTT TAACATTGTA ATACATACAC ACATATTCAC TGTTAGCCCA 300 TTTAAGACGA AGAATAAAGA CGACCACAGT CGAGTGCAAG CAGCAAACAC TTGTAGACGT 360 ACATAATCTC CGATCAAAAT TCTCCCAAGA CGACCGTGGC TACGTTCTGG ACCCGCATAA 420 CTCCTCTATC TTTCTGAGTG ATAATACCTC CGCAAGACTC CCCGGAGGTA ACTGGCGCAG 480 CCGGAAAACT GGAATGGAAA ATACTTTATT AAACCTTCTA TTAGTTCTAT TGTAAGTAGT 540 TGTGGAAAAA GAGTGAGAAT GAAGTGCAGA AATGTCTAAA AGTGATTACA ACAAAAATCC 600 TAATACAATA CATAAACCGC CTTAACAAAC ATACAAAACA CGCATATAAA AAAAAAAAAA 660 AAAAAAAAAA GAAAAAAAAA AACCCAAAAC TTAAAAATGC CGTAACCGCG AAACATGATA 720 TGCGTTGTAC TTGTGTGAAA TCAATCGCTG ATAGTCACTG CCGAAGTTTA TTAAGGCCAA 780 GTACCATATC ATTACTTTCA TGTTTACATA CATATATATG CCCCACAATT AAAACAACAT 840 ACACACACAC AAATATTTCA AATGCAAAAA AAAAAAAAAG AATGTAGTGT ACCTGCGTGG 900 CATCAATCGC TGATAAACCA CTGCCGAAAT ATTAAAGGCC CGGTACTACA TCACAAAACA 960 CGTATATATG CAACAAAAAT ATACACAACA AAACCATATA TACAAACGTG TATGAGTGAC 1020 GTGTAATGTA CTTGTGTGAA ATCAATCGCT GATAATCACT GCCGAAGCTT AGTAAGGCCA 1080 AGTACCACAT CATTACTAAC ATGTGTACAT ATATATATAT GCAAAACAAT TAAAACAACA 1140 TACACACACA CAAATATTTC AAATGCAAAA AAAAAAAAAA AAGAGGAAAT GTTGTGTACC 1200 TGCGTGGCAT CAATCGCTGA TAAACCACTG CCGAAATATT AAAGGCCCGG TACTACATCA 1260 CAAAACACGT ATATATGCAA CAAAAATATA CACAACAAAA CCATATATAC AAACGTGTAT 1320 GAGTGACGTG TAATGTACTT GTGTGAAATC AATCGCTGAT AATCACTGCC GAAGCTTAGT 1380 AAGGCCAAGT ACCACATCAT TACTAACATG TGTACATATA TATATGCAAA CCACCAAAAC 1440 AAATACATAT ACACATACAA ACACTCCAAA AAAAAAAACA AATAATACTA TATGAACGGC 1500 GAAGCGTATG TTTTCTAAGG CTGGATACAA AACCACAAAA CCAAATATAA ATTGCACACC 1560 TTAATAAAGA AAAGAACAAA AATGATAATA AACAAAAGAA ATTTTTTTTG GAACATGCAC 1620 CCATACTCTC ACTCTTTCAA CACAAATAAA GTATTCAAAT TATACATACA TACAATAATA 1680 CCACTATATT ACAGAAATTA ACGCACAAGA AAACACACAC ACTATCCAAC AACAAACAAG 1740 TAATTAAGAG TTATTAAGTA CATTGTAAAC TACATATTTT TATCTTAAAT GTCAAAGAAA 1800 TTAACACAAA CTATTAAACA AACAACTCGC TCCGTGTTAG AATCACACAC ATTTCCCAAA 1860 AGAGTTACAC GATCAGTTTC GAAAACAAAC ACCCTCCCCG TAATAAGAGA AAGCACCCCC 1920 TTACCGCCCC TTCAACCTAT AAATATGGAT TCGGGCAACG CCTCCGTAGG TAATTCCGCC 1980 CCCGTAACAC CTACTGTCAG TGGCTTTAGC AGTATTGCTA CGGCACTTAG TGCCACCGAT 2040 ATTTTAGCCT TCGTTAAAGA ACTTCCGACC TTCGATGGTA CTCCAGGCCA ACTCGACAAA 2100 TATATAACTA GCGTTGAGGA AATAATCATG CTCATTAGGG GTACCGACCA AACTCCGTAC 2160 GGACTTCTGA CACTCAGGGC AATTAGGAAT AAAATAGTTG GAAGAGCAGA CGAAGCTCTA 2220 AACCTAGCCA ACACCAAACT TATATGGGAC GATATCAAAA GTAACCTACT ACGTTTATAC 2280 TCTAGCAAGA AAAGCGAAGC TACCCTCTTA GGCGAGCTCC AATCTCTCCC AGATAACCTA 2340 ACCCTAGGGC AATTGTTCTT CGGCTTATCG AGGATTAGGA GCCAACTTAT ATCCATTACT 2400 TCCAATAGTG GACAGTCGGC CACAATCATC GAAGCCAAGA AAACACTATA TGACGAAGTC 2460 TGTTTAAACG CCTTCATCTC AAGAATTAGA GAACCACTTA AAACAGTCAT CAGATTGAAA 2520 GACCCCAAGA CTATCGAAAC AGCTTACGAG CTATGTCAAG GAGAAAGGGC TCGTTACCAG 2580 AACAGAAACC CATATCCCCC AACACAAAAC AACACCGAAC GACGAACTAA CAACTACAAT 2640 AACAATAACA ACAACAATCA CAGAGACAAC AACAACCGCA ACAACGTAAC TCGTCTTACA 2700 CCCAAAACCA CTCAAACCAT TACTCAAACC CCAATTCCCA ATATCGTCAA TCAAACAACG 2760 GCAACAGAAC TAGTAACCCG TTTAAAGATA ATAAAACAAA TTATGGGCTA CACAACATAG 2820 AAGAAGAAAA ACTCACCCAA CACTGCCTTA CCAACTTAAA TTTTCAGGCA CCCGCCTCAG 2880 GAACCCAACA GGATACATAA ATCCTACCAC ACATGCAACA TCCCTTCCAT ACATAACTCT 2940 AAACCTCCAA CAAAAATTCC CTTTATCATT TCTTATCGAT ACAGGATCCA ATAACTCCTT 3000 CATTGACCCA GAATCTGCAA ACCAACTAGA GTGCACAATT CTACCAACAT CCACTTCAAT 3060 TACAACAGCA TTAAATAGTT TCAAAATTGA AGAAAAGGCA ATATTCCCAA TGCCACCCGA 3120 GTTCAAAACC GAAGGTCAAA TTACCCTACT TAAATTCAAA TTTCACTCTT ATTTCAATGG 3180 CCTCATAGGA ATGGACCTAT TATCACACCT AGAAGCAAAA GTAGACCTAG TAAACTTACA 3240 ACTAGTAACT TCAAAGTCTA CACTCCCAAT ATTCTTATAC ACTAACCAGG CTTCAAAAAT 3300 TTTTAACATC CCCGCCTACA GTAAAGTTAT CTTACCACTA CCAGTAAAGA CTAATCATGG 3360 GGAATTCTAT TGTTGTACTA CACAACTAAA TAATGAGTTA TCGTTGTCAG AAGGACTATA 3420 TAAATCAAAC AATAATATTG CCAATGTCGA AATCTCTAAC CAATCCGACT CAGATAAACT 3480 ATTATACCTA GAATACCCCC TAGAAACCAT TCCATACAAT AAAAACGACC ATATAGAGCT 3540 CTTTAATATA TCAGCTACAC CTCTTAATAA CGATACCCCT CAAGCCCCAT TACATATCCT 3600 CACAGAACAC CTCAATCCAG AGGAAAAAAC AGCCTTAACA ACCCTATGTA AACAATTTCG 3660 CGACATATTC TACAACCCAG AAACACCATT AACTTTTACC AACAAAATCA CACACTCCAT 3720 CCCAACCATA GATAACACTC CTATCCACAC AAAATCCTAC AGATACCCTT TTGTCCATAA 3780 AACAGAAGTC AAAAAACAAA TCGAATCCAT GTTAGACCAA CAAATTATTA GATCTAGCCA 3840 CTCCCCTTGG AGCGCCCCGG TGTGGGTGGT CCCAAAAAAA CTAGACGGGA CAGGGAACAG 3900 GAAATGGCGA CTTGTAATAG ACTACCGGAA ACTCAACGAC AAAACCATTT CGGACAGATA 3960 CCCCATCCCA AACATAAATG ACATATTAGA TAGCATAGGC AAAGCAAAAT ATTTCTCAAC 4020 GCTCGACCTA ACTAGCGGTT TTCATCAAAT CGAGATGAAT CCAAAAGATA TCGCCAAAAC 4080 AGCCTTTACA GTCGAAGGGG GTCACTACGA ATTCACACGG ATGCCCTTCG GCTTAAAAAA 4140 CGCACCGGCT ACCTTTCAAC GGGTTATGGA CAGCGTTCTT GGCGATCTCA ACGGCACCAT 4200 TTGCCTATTC TATCTTGACG ATATTATAAT TTTCTCGCCT TCCCTACAAA AACACCTGTT 4260 GGACATAAAA ATGGTATTCG AAAAACTCAG AGCGGCAAAC TTTAAACTAC AACCTTCAAA 4320 ATCAGAATTC CTAAGGAAAG AGATAGAATT TCTAGGCCAC ATAGTCACAC AAGACGGAGT 4380 TAAACCAAAC CCGAACAAAA TAAGTGCGAT CAAAAAATTT CCTTGCCCCA CCAACAGAAG 4440 AGCTATCAAA TCTTTTCTCG GGTTACTGGG TTATTATAGG AAGTTTATAA GAGACTTTGC 4500 ACGAATAACG AAGCCCATGA CTAAACAATT GAAAGGGAAA AGACAAGTTA CTACAGACAA 4560 AGACTTTGTA GACGCATTCG AACAGTGCAA AACTCTTCTG TCCAATGACC CAATACTCAT 4620 ACACCCAGAC TTCGAAAAAC CATTCATTCT TACTACGGAT GCTAGTAACT TCGCGTTAGG 4680 AGCCGTACTA TCTCAAGGCT CCTTACAAAA CGATAGACCT GTATGTTTTG CCAGCAGGAC 4740 CCTCTCCGAC ACCGAAGTCA ACTATTCAAC CATAGAAAAA GAAATGTTGG CAATAATATG 4800 GGCAGTAAAA TACTTCAGAC CATATATTTA TGGCGTAAAA TTTACTATTG TTACAGATCA 4860 CAAGCCACTA ATATGGCTTA TGAATTTCAA AGAACCCAAC TCAAAAATAA TTCGTTGGAG 4920 ACTCCAACTC ATGGAATACA ATTTTGAAAT AATTCACAAG AAAGGTTCAC AAAATGTAAT 4980 TGCAGACGCC TTAAGTAGAG CGGACCCAAA TTTAAACTAC AACGAAACAC TGACTGTTAA 5040 GCCTTGCCCC ACATCCGAAA AACCTATTAA CGAATTTAAC ACGCAACTCA TACTAGAAAT 5100 AGATACAAAT ACGTCTTACC AAACTACAAC ACCATTTAAA CAAAAGATTA GGAAAAAATA 5160 TTCACAGCCT TGCTTCGATT TCGATAATAT TGTTAAAATC TTGAAAGGAA CCCTAAAACC 5220 TAACAGGATT TGCGCATTCT TGGCGGACGA TAATAATTCC GCATTAATCG AAAAAGCATT 5280 CTCAACGTAT TTTGCACATA AAAAACACTT TAAAATTATC AGATGCAAAT CACTTCTCCA 5340 CGAAATCGTA GGAAACCCCG AACAAAACAA ATTCATTCAG GAATATCACA CTAACAGCAA 5400 CCACAGAGGC ATAGACGAAA CATTCCTTCA CCTCAAACGA GAAACCTACT TCCCCAATAT 5460 GAAAAACAAA ATCTCTGAAT TAATTAGGAA TTGCGAAACC TGTCTAAAAC TCAAATACGA 5520 CAGGCAACCA CAAAATATAG TATTTGAAAC CCCAGAAACC CCATCGAAAC CCCTCGACAT 5580 AATACACATA GACATCTATA CTATTAACAA TAATTTTAAC CTGACAATCA TAGACAAATT 5640 CTCAAAATTC GCAGCTGTCT ACCCCATCCC AAATAGAAAC GGCATCAATT GCATCAAAGC 5700 AATCAAAAAT TTTTTCAGTC AATTCGGACT ACCCAAAAAA CTAATACACG ACCAAGGAGT 5760 AGAATTTTGC AACGACATAT TTCGAAAGTT TTGCTCTCAA TATAATATAC TTCTCCATGT 5820 CACATCCTTC CAGCAATCTT CAAGTAATTC TCCAGTAGAA CGTTTACACT CCTCTTTGAC 5880 AGAGATTTAC AGAATAATAC TAGACACACG GAAAAAACAC AAATTACCTA CAGACCACGA 5940 AGAAATAATG TCAGAAACTG TAATAACATA TAACAACGCA ATCCACTCCA CCACCAAACA 6000 CACCCCTTTT GAACTTTTTA ATGGTAGGAC CCATTTATTC GAGAAAACAA TAATACCCAA 6060 TAATGAGCAT GACTATTTAA ATAAACTAAA TACGTTCCAA GACAAACTAT ACTCCGAAAT 6120 AAAAGAAAAA TTGTCCACAA ACACCCAACA AAGGATAGAA AAGCTAAACA CAAGCAGAGT 6180 AGAACCAACA ACAGTACAAC CTAACAGCAC AATTTTCAGA AAAGAAAACA GGAGAAATAA 6240 ATTAACACCA CGGTTTTCCT TACACAGAAC AGCAAAAGAC AAAGGAAAAA CTCTAGTAAC 6300 CACAAGAAAT CAAAAAATCC ACAAATCAAA AATTAGGAAA ATATCCAAAC CTCCAAATGA 6360 CTTAAGCCTT TCCACCTGCA TTCCAGATCT TGCCATGGGG CATACCAATC TATCTTCATC 6420 CACAACTTCA ATAGCACCAA CCTCCTAGCA AAAGTGCCGG TAGGGAAAAC ACTCGTGATA 6480 GGAAACTATA AAAAAATTAG CCACATAATC GATCTGTCCG AATACACCAA CTGTATTGAA 6540 AAATTATACC ACACCATCGA TACCCTAAGA CAAGATGAAA CACTCACCGA TTCTATATCA 6600 ATACTAAATG CTAAACTGGC CCAAACTCAA AGTAAAATAG ACGCACTAAC ACCCTTTTCA 6660 CGCCACAAAA GAGGTCTTAT TAACGGGTTA GGTAGTTTAG TCAAAGTCGT CACCGGCAAC 6720 ATGGACGCCA ATGATGCAAA GAATATAGAA ACAGAAATTA ACCACTTAAA AAGCCAGTCC 6780 ACCACTATCT CAGATAACTT CGAAATACAG AACTCGTTCA ATGATGAAGT TCAACTACGG 6840 TTCAAAAACT TAACAAGACA CATTAACAAT GAACAGAATT TGATTAAAAA CTTCTTCGAA 6900 AACACTCAAA ATACAATTTA CACAAAAATA TACAACAACG AAGAAGAAAT AAAGAAACTA 6960 CAATATATAA ATAGGCTTAA CTACAATATA GATTTATTAG TTAGCCACCT AAGCGACATT 7020 ATAGAAAGTA CACTGCTTGC CAAAATTAAT GTTATCCCAA AACTCATCTT AGACAAGACA 7080 GAAATAACCA AAATCAAACA AATTTTTAAA ACACAAAACT ACACAATAAA ATCCGAGCAA 7140 CACATTTATA ACCTCTTAAA AATGAACGCA CTCAATTACC AAAACAAAAT AATTTTTAGT 7200 ATCAAAATTC CTATTTTTTT AAGTTGTAAC TACGAAATGG CAAGATTAAT TCCACTTCCA 7260 ATAAATTCCA CACAATTTGT AATAGCACCT AAGTACTTAA TATATAATAA CAAAAGTAAC 7320 AGCATGTTTT CAACTATGTA TAAATGTCCT GTAATAGAAG AACAATTCGT CTGCGAAATC 7380 GACTCCATCA ATAATCTTAA AAATAATACT TGCCTGGGAC ACCTTATCCA AAATAAGACC 7440 AGCTACTGCG ACATAAAGGA AACGGGACTC ACGACTGATG TGTTCGAACC GGAAAAAGGC 7500 TTCATACTTG TATTTAACGG GAACAACCTC CCAATCATCT CCTCCAACCA GACCATAACT 7560 AGTATCAATG GATCAGCTAT AATAAAGTAT AACAATTGCA CATTAAAAAT CAATGAAATA 7620 AACTACGACA ACAGGGCGGT ATCAACAGAA GAGCACCCCG ACTTCTTCCT ACCACCAATG 7680 CGGAAACTAA TAAAAAATGC CACTATCAAC ATACTCACCT TGGAAAGACT TCACCTGGAT 7740 ACACTCACAA CATCCAATAA GCTACTGGTC GTCGCCGCAG GAAACTCTCG ACACTCGACA 7800 ACCTTGTATA TCCTCTTCAC CGTATCCCTA GTCGCCGTAA TACTCACCTG GACACTTCGA 7860 AGGGACACCC ACATCTTCCA TACCGGGCCC GACCACATTC TTCCAATCGT CGCTCCACCA 7920 ATTCCTCCGT CTATGGCCTT CGCTCCAAAC TGGGGGGGGA GGAGTTACCG ACCCATCGGT 7980 ACCATACACC ACCCCTCCCT CTAAGCCACC ACGCCTACAC AAGTAGAAGA CATCGAACCG 8040 GGAAGCTTTG CGATACAAAG TTGCAGCATA AACATCAACA ACGGGTCAGA CGCCGACATC 8100 CGCCCAAAAT GCTGACACCA CATCCTTTTC GCTCAGACAG AACAACGCAT ACAATTCCAT 8160 ATACATACGT ATAAACATAC TCATACTTTC TGCTGTGTCA GATACTTTAT TTCTAAGAAC 8220 TTTAACATTG TAATACATAC ACACATATTC ACTGTTAGCC TATTTAAGAC GAAGAATAAA 8280 GACGACCACA GTCGAGTGCA AGCAGCAAAC ACTTGTAGAC GTACATAATC TCCGATCAAA 8340 ATTCTCCCAA GACGACCGTG GCTACGTTCT GGACCCGCAT AACTCCTCTA TCTTTCTGAG 8400 TGATAATACC TCCGCAAGAC TCCCCGGAGG TAACT 8435 // ID DME010298 standard; DNA; INV; 8507 BP. XX AC AJ010298; XX DR FLYBASE; FBte0000359; Dmel\GATE. XX SY synonym: Batumi XX FT source AJ010298:1..8507 FT SO_feature five_prime_LTR ; SO:0000425:1..272 FT SO_feature three_prime_LTR ; SO:0000426:8236..8507 FT SO_feature polyA_signal_sequence ; SO:0000551:158..163 FT SO_feature polyA_signal_sequence ; SO:0000551:8383..8398 FT SO_feature primer_binding_site ; SO:0005850:276..293 FT SO_feature RR_tract ; SO:0000435:8236..8507 FT SO_feature CDS ; SO:0000316:1741..6456 FT /name="Dmel\GATE\polyprotein" FT /db_xref="FLYBASE:FBgn0044067" FT /db_xref="SPTREMBL:O76925" FT /db_xref="NCBI_PROTEIN:CAA09069.1" FT /translation="MPIGDDKKKLSADKPRSIFSPQGPKSPRIPSISVKTPAQISDDCA FT TPSKATVQRTAKNMAASDLALAKFISVSDAQANLRLRSTLRNPQLQPSRCLASVATKSE FT AYGTRLKRIRPLLRVPCVSRRAAASGMPILRASYSYCYSVYERCVAQLVDKIEQGHFSV FT HPKRTLRPRPTFPLAVGCLHAIQEFSQVTIFAGRFPDLLHAIYINNPRLTPFEKLFHLN FT AKTSGDAHAIVSISPLTKRGFSSAWENLIERFENKRLLVNSQLKILFNVQSIPQESGAA FT LKVMQSTVQGCLTALELSGINTENWDCLLEYLCSSKLPKITLSLWEQSLHKKADIPTWG FT ELNTFLTERHRTLEAIDDVRPSVPSQSHSKAMNSSGPSRDGKLASDLCNKENHPVRVCR FT VFSKWSVDDRSAYIKRKQLCLNYFAKGHQLRECKDRQSFTWWPASHVVAPKQPLFQQFK FT PFKSCKPNFRYSGQFRSKRASRCSKLFCHGSRAILLGSAIINSSHLGTNFKARALIDSG FT SEATFITEPLFNLIRLPFQVVQAQVSGLNQTVAAQFKNAAVSPSDLRLGRVAVGDDGLC FT PPSTSRKSAFLPNSAKFLRDLPDFPLADPKFYESAPIDVLIRSPHPASVLLSGAKTNIC FT GSLLGQETIFRWVLTGPVSASAQSRIPLFRHRSPTRTIIHWTNSSQNLGRWRIYQQSCK FT RIRFHVRERVGKCLRRHQCGKYVVTLPFRDPEHIGCGLGHSRSWALAQFLKNEQRLKKD FT EALKARYDSVIQEYLDLKHMRQVLPTHDCNAYYMPHHAVLKPESVTTKLRVVFNASSPS FT SNGTSLNDILHAGPVLQSDLTVQILKWRDFRYVFSADIQKMYRQIWVDPKHTPFQRILF FT RNNRGEIRDFELKTVTFGVNCAPLLAIRVLQQLAADEELSHPKASNVIRNFMYVDDVLA FT GADSTEEAQLMVHELRDALNSSSSRQRWLSKRPLQRQVLSQIAKLFDPAGWLAPFIVRA FT KIFMQEIWLQELGWDENVPNDLFQRWLNFLQSYSVFEQIRIPRWLSFHPDFKVEHHGFC FT DASQKAYGAAIYVRGEVGSAIMVQLLTAKTRVAPVKTVSLPRLELCGALLLSEMAAAII FT PQMPTINSKLYCWTDSTIVLAWLSKPACQWTTFVANRETKIAQATKTENWSHVQSEHNP FT ADLASRGVSLQDLADSQLWWHGPTWLQNPRNQWPTQVNAPVTDLEKRALKVHLAKAPSE FT ELLARFSKLEKALRVLAYVYRFIQRCRKQTSPSDVHLLATEIAAAERFLISNTQRREFP FT VEYHCLSEKRPVPSSSAILSMNPFLDPQGLIRACGRVAASESPQYNERHPVILPYNCLL FT SRLLAKFTHRTTLHGGNQLMVRLIRSKYWIPRIKNLMKAVVNSCKVCVIHKRRLQSQLM FT GVLPKERASFSRPFTVSAWITPVRDIKNYTGRACVITKGYVLVFVCFSTKAIHLEPTSD FT LTTEKFLAAFSRFVSRRGCPRQVQSDNGKTFVGAATLLSRDFLQAVKESVTNAYIHQEM FT QWQLFSGGTQYGRPLGSRRKKLQDAILQMHGHTKIHVRRTLHALGKNRSVP" XX CC Derived from AJ010298 (e1315889) (Rel. 56, Last updated, Version 1). CC Takis Benos and Michael Ashburner, 08-Sept-1998. CC Any changes to original sequence record are annotated in an FT line. XX SQ Sequence 8507 BP; 2245 A; 2251 C; 1836 G; 2175 T; 0 other; TGTTCAAGTT ACGCTCACCC GCTGTCACCC GCTGTCACCC GCTCTCCGCT CCCTCTTACG 60 CTCTCCCGCT CTTCACCTCA GAGTCTCCAA GGAGTCCTCG GGCTTGGGAT AGCCTAACTA 120 ATTAGAATAA GCATCAGTGT AAAAACTAAC CACGCTGAAT AAACATACGC CCGGTCGCCG 180 CGCAATTACG AAAAGTCTAG TGTTTGCTTT CCTTCGAGTG TTTCTTTTCA GCATATTTGA 240 ATTCAGGACA GCCATCCCCC TACATCCCAA CATTTTGGTC CTTCGAGCCG GATCACCTGG 300 ATTTTCAAGT TTGTCCACCA GCGAACAAAT TATAAGATAA GTACGAAATT TCCATTCCTT 360 TTAATTGCCG GTCTGCAGCA AAAGGTTCGA AAATCCAATT TCGTTCAATT TGCTGTAAGA 420 TTTATTGTCA AATCTAACGG ATTTCTCCGA CAAAAGGCAA TTAAAGAAAA GTACTTATCC 480 AATCTCACGG GCGCCGCATA TTACTCGCCG TTCTCCGTTC TCCTTTCACC CTCATTCGTG 540 AAAATTTCTA AAGTCCAAAT GGGCGAATAT ATTTAAATAT TAATCCAGTG CGATAATGCA 600 AAATTCCAAA TGTGAAAAAG TGAATAATTT GTGCCAAGTT CAGTGAAACT TTCTAAGTCC 660 AAAGCTCTGC CAAAATTGGC AAAAATTCTG TTCTCGTTTC ACTGTGTCAA AGCGAAGCCA 720 AACTTCTTTT CGCAACACAT TTTTGCTTTA ACTCCGCAGT CCACTTAATA CCATTTGCTT 780 TGCTATCGAA GAATACCACA ACGAAACAAA CAACACCATA CCCTCTGGCC ATTCAAATAA 840 CATATTAATT AACATTTCCG CAGTTCCATA TCTCTTACAT CAACATATAC CTACTCCATA 900 CTCTTGCATA TATTCACATC TTACACAATA TATCCTCACC ATATATTACA TATATTACAT 960 CAACATATAA TATCCACATA TATTACCGAC ATACATTGCG CATATTATCA GCATTCCTTT 1020 AACGTATACC AAAGTTTAAA TTCGATCCCG TCGGCAAATC CAACCACAAA TAAAATTTAT 1080 TCCAAGTGCC GACGCGGAAA GGCGTTTTCT TTTCCATCAA TTTTTTCCGT AAATTTCCAA 1140 ATTAATTTCC GAGCAATAAA TTAAAAGCGG TTTTTTCTTT TTTTTTAACA AATAACTTAT 1200 TGTTGAAAAC ATTTATTAAA TTATTAAAAA TTATATAAAT AATACGACCG CCAAATACAA 1260 GTCGTTCACC CGACAAATAT TTTTTCCTGT ATTGCTTGGA TATTAATTTG TGTTTGTTTT 1320 AGAAGTACTT ACAACGCGGA GAAAAGACTC CAAATCCACC ATTCCATTTT CTCCGTTTCC 1380 AGTTATAAAC AAAAAAATAA ATAAAATTTT CTTCCTTCTA ATAAACATTT TATTTTACCG 1440 TGTTCACATT CCAAGTGTTC CAACCGTAAA TAAGGTGGAC CTAATTACCA TAAATCACAG 1500 GTCATTTATA CAATTCGCTG TTCACTCCGA GTCACCTGTC CAATTAGTCT AAACTACGGC 1560 GTTTCCACTT CGCAAATTCA ACACCACTTT CTCACCCATT ACATCCTATA CGGTCCTTTT 1620 CCGCTGCTTT ATACCGTTCA CGGCAGGAAG CTTAAATTTA TTAAGTGGAA TCTGTCTACT 1680 TTTTCAAAAG TGTGACCGGG CTCCAAAAAC GCTTCCCTTC CATTTCGTAT TTCTTCGATT 1740 ATGCCCATCG GGGACGATAA GAAGAAATTG TCCGCTGACA AACCCAGGTC TATTTTTTCA 1800 CCACAAGGGC CCAAGAGTCC AAGAATCCCA AGCATTTCGG TGAAAACGCC TGCGCAGATT 1860 TCCGACGACT GTGCCACTCC ATCCAAAGCC ACAGTACAGC GCACAGCTAA AAATATGGCT 1920 GCTTCCGATC TAGCGCTAGC CAAATTCATT TCGGTTTCTG ACGCTCAAGC GAATTTGAGG 1980 CTCAGATCAA CACTCCGGAA TCCGCAGCTC CAACCGTCAC GATGCTTAGC GTCCGTCGCG 2040 ACCAAGTCCG AAGCCTATGG GACAAGGTTG AAAAGAATTC GACCTCTGCT CAGAGTGCCT 2100 TGTGTCAGCA GGCGAGCGGC AGCAAGCGGC ATGCCTATTC TCAGGGCTAG TTACAGTTAT 2160 TGCTATTCAG TCTATGAAAG GTGTGTTGCC CAGCTCGTTG ATAAAATCGA GCAGGGGCAC 2220 TTCTCAGTCC ATCCCAAGCG AACGCTGCGG CCCAGGCCTA CATTTCCTCT GGCTGTCGGT 2280 TGCCTCCATG CGATACAGGA GTTTTCGCAG GTGACTATCT TCGCTGGCCG CTTTCCGGAT 2340 CTTTTACACG CCATTTATAT TAATAATCCA CGGCTGACTC CGTTCGAAAA GTTATTCCAC 2400 TTAAATGCCA AAACAAGTGG CGACGCGCAT GCCATAGTTT CGATTTCGCC TCTCACCAAA 2460 CGAGGGTTTT CCTCTGCGTG GGAAAACCTA ATAGAGCGTT TCGAAAATAA ACGATTGTTG 2520 GTAAACAGTC AATTGAAAAT ACTGTTTAAT GTGCAGTCGA TACCACAGGA ATCTGGGGCG 2580 GCCTTGAAGG TAATGCAAAG TACTGTTCAA GGTTGCTTGA CTGCCTTAGA ACTGTCAGGC 2640 ATCAACACTG AGAACTGGGA CTGCCTGCTG GAATATCTGT GTTCATCCAA GCTCCCGAAG 2700 ATAACTCTCT CCTTATGGGA GCAGTCTCTA CATAAGAAAG CCGACATCCC GACATGGGGA 2760 GAACTGAACA CCTTCCTCAC AGAACGTCAT CGAACCCTAG AGGCCATCGA TGATGTGAGA 2820 CCGTCCGTAC CAAGTCAGTC GCACTCCAAA GCGATGAACT CAAGTGGGCC CTCTAGAGAT 2880 GGCAAGCTGG CGTCCGACTT GTGCAACAAG GAAAACCATC CTGTCCGTGT ATGTCGCGTT 2940 TTCTCCAAAT GGTCGGTTGA CGACCGGTCA GCCTACATTA AACGGAAGCA GTTATGCTTA 3000 AACTACTTTG CAAAGGGACA TCAGCTTCGT GAGTGCAAAG ATCGACAAAG TTTTACTTGG 3060 TGGCCGGCAT CACACGTTGT TGCACCGAAA CAACCTCTTT TCCAGCAATT CAAGCCCTTC 3120 AAATCCTGCA AGCCCAATTT CCGCTACTCA GGCCAATTTC GTTCCAAACG AGCAAGCCGG 3180 TGTTCAAAAT TATTTTGCCA CGGCTCAAGA GCTATCCTTC TTGGCAGTGC CATAATCAAT 3240 AGTTCCCATC TTGGCACTAA CTTTAAGGCA CGCGCCCTGA TCGACTCCGG ATCAGAGGCG 3300 ACATTCATAA CCGAGCCACT GTTCAATCTA ATTAGATTGC CATTCCAGGT GGTTCAAGCC 3360 CAAGTCTCGG GCTTAAACCA AACAGTAGCT GCTCAGTTCA AGAACGCTGC AGTTTCACCA 3420 TCCGATCTCC GACTAGGCCG CGTTGCAGTT GGAGACGACG GCCTATGTCC TCCCTCAACT 3480 AGCCGGAAAT CTGCCTTCCT ACCCAATTCC GCAAAATTTC TTCGGGATCT TCCCGATTTT 3540 CCACTGGCGG ATCCAAAATT CTATGAGAGC GCCCCAATAG ATGTACTTAT CCGGAGCCCA 3600 CATCCTGCTT CGGTGCTTCT GAGTGGAGCA AAAACCAACA TCTGTGGCTC TCTCTTGGGG 3660 CAAGAGACCA TTTTCCGCTG GGTACTAACT GGGCCAGTGT CAGCCTCAGC CCAAAGCAGG 3720 ATTCCTCTTT TTCGACACAG ATCTCCCACG CGTACGATAA TTCACTGGAC AAACTCCTCA 3780 CAAAATTTGG GGAGGTGGAG GATATACCAA CAAAGTTGCA AAAGAATCCG ATTCCATGTG 3840 CGAGAACGGG TTGGTAAATG CTTACGACGA CACCAGTGCG GCAAATATGT CGTTACTCTG 3900 CCTTTTCGCG ACCCAGAACA TATCGGTTGC GGGCTAGGGC ATTCTAGGTC TTGGGCGTTG 3960 GCTCAGTTCT TGAAGAATGA GCAGCGTCTA AAAAAAGATG AGGCCTTGAA AGCGAGATAC 4020 GATTCGGTGA TCCAGGAATA TCTCGACTTA AAGCACATGC GACAAGTTCT GCCTACCCAT 4080 GATTGCAACG CCTATTATAT GCCACATCAC GCCGTCTTAA AACCGGAGAG TGTAACTACT 4140 AAACTCCGTG TAGTATTCAA TGCCTCCAGC CCTTCATCGA ATGGTACCAG TTTAAATGAT 4200 ATCCTTCATG CTGGCCCTGT CTTGCAGTCC GACTTGACAG TGCAAATTCT GAAGTGGCGC 4260 GATTTCCGAT ACGTGTTCAG TGCCGATATT CAAAAAATGT ATCGGCAGAT CTGGGTAGAT 4320 CCGAAACACA CTCCATTCCA GCGAATACTT TTCCGTAACA ATAGAGGGGA AATCAGAGAT 4380 TTCGAATTGA AAACAGTAAC CTTTGGAGTC AATTGCGCGC CCTTGCTGGC GATCCGAGTA 4440 CTGCAGCAGC TAGCAGCTGA CGAAGAACTC AGCCATCCAA AAGCTAGCAA TGTCATTCGA 4500 AATTTCATGT ATGTGGATGA TGTTTTAGCC GGAGCGGACT CTACGGAAGA AGCTCAGCTC 4560 ATGGTGCACG AGCTCCGAGA CGCTCTGAAT TCTTCTTCGT CCCGCCAGAG ATGGCTATCG 4620 AAACGTCCTT TACAACGCCA AGTCCTGTCC CAAATTGCCA AATTGTTCGA CCCTGCAGGC 4680 TGGTTAGCAC CGTTTATCGT TCGAGCTAAA ATTTTCATGC AGGAGATTTG GCTACAGGAG 4740 CTTGGGTGGG ACGAAAACGT TCCAAATGAC CTTTTTCAGC GATGGCTTAA TTTTCTCCAA 4800 AGTTATTCGG TTTTCGAGCA GATACGCATT CCACGCTGGC TATCGTTTCA TCCAGATTTC 4860 AAGGTCGAGC ATCATGGCTT TTGCGATGCA TCGCAAAAGG CTTATGGCGC CGCAATATAT 4920 GTCCGCGGAG AAGTGGGCAG CGCCATTATG GTGCAACTCC TAACCGCCAA AACCCGGGTA 4980 GCACCAGTCA AAACGGTTTC GCTCCCAAGA CTCGAGCTCT GCGGAGCGTT ATTGCTTTCC 5040 GAAATGGCTG CAGCCATCAT TCCGCAGATG CCTACGATTA ACTCCAAACT TTACTGTTGG 5100 ACGGACTCCA CCATAGTGCT TGCATGGTTA AGCAAGCCAG CATGCCAGTG GACCACATTT 5160 GTAGCCAATA GGGAGACGAA GATCGCCCAG GCCACAAAAA CAGAGAATTG GTCTCATGTT 5220 CAATCTGAGC ATAATCCAGC AGACCTGGCA AGTAGAGGAG TTTCCCTCCA AGATCTAGCC 5280 GATAGCCAGT TATGGTGGCA CGGACCGACT TGGTTGCAAA ATCCACGCAA CCAATGGCCT 5340 ACTCAGGTCA ACGCTCCGGT GACCGACCTG GAGAAGCGTG CTCTAAAAGT CCATCTCGCG 5400 AAAGCTCCTT CTGAAGAGTT GTTGGCACGT TTCTCCAAGC TAGAGAAAGC TCTACGAGTC 5460 CTTGCCTATG TTTATCGCTT CATTCAGCGG TGCAGGAAGC AGACATCTCC ATCTGATGTT 5520 CATCTACTGG CCACTGAAAT CGCCGCCGCC GAGCGGTTCC TAATTTCGAA CACTCAACGC 5580 AGAGAATTCC CTGTGGAATA TCACTGCCTA AGTGAAAAGC GTCCAGTGCC AAGTTCAAGT 5640 GCCATCCTAA GCATGAACCC GTTTCTAGAT CCGCAAGGAC TGATCAGGGC ATGCGGCCGT 5700 GTGGCGGCTT CCGAAAGCCC TCAATACAAT GAACGCCATC CAGTGATTCT TCCGTATAAC 5760 TGCCTGCTTT CTCGCCTCCT TGCGAAGTTC ACGCATCGCA CAACTCTCCA TGGTGGTAAC 5820 CAGTTAATGG TGCGCCTCAT CCGGTCGAAA TACTGGATTC CGAGAATCAA GAACCTGATG 5880 AAAGCAGTGG TAAATTCGTG CAAAGTATGT GTGATCCACA AAAGGCGGTT GCAAAGCCAA 5940 CTGATGGGTG TCCTGCCCAA AGAAAGAGCA TCGTTCTCCC GACCATTCAC GGTATCGGCA 6000 TGGATTACGC CGGTCCGCGA TATAAAGAAC TATACGGGAA GAGCATGTGT TATTACAAAG 6060 GGGTATGTGT TAGTTTTTGT TTGTTTCTCC ACCAAGGCCA TCCACTTAGA GCCTACATCT 6120 GACTTAACGA CCGAGAAGTT TCTTGCCGCT TTCTCTCGTT TTGTATCCAG GAGAGGGTGT 6180 CCACGTCAAG TCCAGTCAGA CAATGGCAAA ACCTTTGTTG GCGCTGCCAC CCTGCTTTCC 6240 CGCGATTTCC TTCAAGCCGT AAAAGAGTCG GTGACGAATG CCTATATTCA TCAAGAGATG 6300 CAATGGCAAT TATTCTCCGG GGGCACCCAA TATGGGAGGC CTTTGGGAAG CAGGCGTAAA 6360 AAGCTTCAAG ACGCTATTTT ACAAATGCAC GGCCACACGA AAATACACGT TCGAAGAACT 6420 CTCCACGCTC TTGGCAAAAA TAGAAGCGTG CCTTAACTCC AGGCCGCTCT CTCCTATGTC 6480 TGAAGATCCG ACAGACTTGC TGGCTCTGAC GCCAGGGCAT TTCCTTGTCG GGGGACCCCT 6540 TATGTCCACG GTGGAACCCG AAGTAAAGGG GGAAACGAAA TCCCTTCTTA ATCGGTGGCA 6600 GCATTTGAAG GCTCTCCATC AGCAGTTCCG TGTGCGATGG AAAGAAGAGT ACCTCAAAGA 6660 ACTCCACAAG CGTTCTAAAT GGCAGGTCCC GTGAACTTCG AGCTAAAATA CTCGTGCATG 6720 TGGAGCAGCG TGTGGTGGGA TCGGTCGCAC TTCTTGCAAC GATCACCGCT TCGGCAGTCT 6780 CCCGTGGAAT GCTCGTGAGC GAGGCAATTG GCGCTAGTAT GTTGGTAATG AGGACTGCTC 6840 GCAAACGCTT TTCAGCGCTG AGCTTTAGGA ACCTCGCGCA CGTCCGAAGA GGATGGATTA 6900 CCGCGGCAGA CTCGGCATCG GTAGGATTTA ATACCTCGGG TACGTCTGCT CTCCACGGCA 6960 CGACCTGCGT GCGTTTTGTT GACGAGGAGC CATGTGCGCG TAGTCGAATG TCGAAAGGAG 7020 ATCGAAAACG AAATGAAAAA TAACGGATGA TTAGTGATAG TGAACTACAA CTAAGGACGA 7080 GAGGAGAGAC CTATTATTGT GGAGATTCGG AACTCCGTCG GCAAAAGCAC CTTTTTTGCC 7140 ACTGGACGTT TAATAACTCC ACGTGCAGTA CGGATGTTTA CTACACGACG TTGCCGTCAG 7200 CTCCTGGGAA AACAGACTCA ATTCTGCCGA GCCGCCACTC ATTAGAGGGC AAGTTGTCGT 7260 CCTTGATGAC GACTGTTGAG TTACGGGGTT TGGACTGTCA CCGTCTCCGC TCCCTCTTAC 7320 GTTCTCCACT CCCTCTTACG CTCTCCCGCT CTTCACCACA GAGTCTCCGA GGAGTCTCTG 7380 GCGCTTGGGA GAACCCAACG CATTAGAATA AGTTTTAGTG TAAAACTAAC CACGATCAAT 7440 AAAACATACG CCCGGTGCCC GCGCTAATTC TACAAGTCTT CGAGTGTTTT TTCGAGTGGT 7500 CTTTTTTTCA GCAAACTAGG AACTTTCCAG GACCAGCACC CCCCATCACC CCAACAACGA 7560 CCATGTCATC GATGGCGTCG CCAACCGGCG CCAACCCTGC AAGCAGCTTC GGCCTCGTCC 7620 CAACGTTCCC GCCGGCACAA TCCGCCAACT CAGCGTAGGA GTTCACCGCC ACGACGACCG 7680 GAATCGACGA CGCCAGGCCC ATCACTCTCG TCGCCGCTGC AACGCCACAG CGTGAACATC 7740 CTTCCCACAG CGCTGGTCAA GATGGAGACC GGGACGAAGA CCTTCAGACC GCAGCACTCA 7800 TCGATCCGTG CAGCCCCATG AGCTGCATCG ACGCTTCGTT GGCGTCAGCC TTTAAGCTTT 7860 CGATGACCAA TGTTGGCGAC GAGAAGGTCT GCACGACGAC GATTCGCTCC AGGATCGACG 7920 CGAACACGAA GCTCGAGGTC GTGCTCAAGA TCGAGCCCAG GGTGCGGATC CGTACACCTG 7980 TCCGGGCATT GAGCGACACC GTAGTGTCCA AGTACAGGGA CATCATGCTG GCGGATGACG 8040 GGTTCCATCG GCCTGCTACC GTATCCATGG TCTTAGGAGC AGACATTTAT CCTAAGGTTA 8100 TCCAATCCGG ATTCCTGACC TTCGACGAGG GAATGCCGGT CGCTCAAAAG ACCGTGTTTG 8160 GGTGGATCGT GTCCGGTGCC TGCAGCTTGC CTAGATGGCT ATGTTGCAAC CCCAGTGATT 8220 GCAAGGGGGG CGGAATGTTC AAGTTACGCT CACCCGCTGT CACCCGCTGT CACCCGCTCT 8280 CCGCTCCCTC TTACGCTCTC CCGCTCTTCA CCTCAGAGTC TCCAAGGAGT CCTCGGGCTT 8340 GGGATAGCCT AACTAATTAG AATAAGCATC AGTGTAAAAA CTAACCACGC TGAATAAACA 8400 TACGCCCGGT CGCCGCGCAA TTACGAAAAG TCTAGTGTTT GCTTTCCTTC GAGTGTTTCT 8460 TTTCAGCATA TTTGAATTCA GGACAGCCAT CCCCCTACAT CCCAACA 8507 // ID ROXELEMENT standard; DNA; INV; 4740 BP. XX AC AF237761; XX XX DR FLYBASE; FBte0001160; Dmel\X-element. XX SY synonym: BS2 XX FT source AF237761:1..4740 FT SO_feature CDS ; SO:0000316:322..1827 FT SO_feature start_codon ; SO:0000318:1..3 FT /name="Dmel\X-element\ORF1" FT /db_xref="FLYBASE:FBgn0041613" FT /db_xref="SPTREMBL:Q9NBX5" FT /db_xref="NCBI_PROTEIN:AAF81410.1" FT /translation="MNTLNETAAADESLDTAFLSSPQCAAPQRFQKIKRKSRASPETER FT KKPKSTIGKQGENPSATEPRYGGNSNRFGLLAHLTADKQVGNEIGDLYDQPSTSHQAAI FT AAAKRDAASAGTTSSAKRAQSKPPPIVMEGVDDVYLMMQSIENIVDLEKIEARASMSGV FT LRLYAADANTFRTIVNWLEIEEYEFHCYQLKEDRPYRVCVKGLHHSTLHHQIKDELEKI FT GHKVLDIHTPLRRNEPGTSKASPVNMFFLNIAAAANNKEILAVKALCHMRVVIEPLRKR FT NAIVQCHRCQQIGHTAKYCRKAHICVKCAGEHPAKDCTRPRIELCTCYNCGGQHPANYK FT GCSKLQAFLQRSRPRSGVAGRTEVSDRPTPRGLAGGKEIPSSRGGISYADVARGSIHHK FT QPMSLTHQQQKQKQQPYDGSPSRQRSRSRTRASRGTLQRSTDASSSIEAILQTLNENIN FT SLRSIQEKQMELMMMMMKQQQQQSHQQGQIINLLTALQARQAP" FT SO_feature CDS ; SO:0000316:1827..4553 FT SO_feature start_codon ; SO:0000318:1..3 FT /name="Dmel\X-element\ORF2" FT /db_xref="FLYBASE:FBgn0041612" FT /db_xref="SPTREMBL:Q9NBX4" FT /db_xref="NCBI_PROTEIN:AAF81411.1" FT /translation="MMPLRILVWNADGVSTKLPEVECFVRRHEIDVLLLSETHCKGAET FT PKLFGFVAYTANDPSGGNAKGGAAILIKNSLAHFPLTPIATAKVQLAPAVIETALGPIS FT FGAVYCPPRFAWTTDEFKDILEEFQTKFIVAGDWNASHWLWGAGRSNQRGIALANLVLN FT SEVDSLATGGPTRYPYGCRGSPGYIDFALTKGVLGIHANISAVVELSSDHLPLVITLDA FT GAISYPKMERLITRRTNLEVFQSQLESTLPLNTAINSGQDVDDAIELLTNNIKSAARLA FT TRSISRQPAADRIPIPREILLLIAEKRRLRTRWMRSRHPSDKTEWNRALSRLRCALVLH FT KAAWFDERLANTGVESEATHSLWKATRAIKRRCTRKAPLVDSNGTWCRTDLGQAEVFAA FT HLAERFQPFKLASLQQVEETQDQLNQALQMDMPITPFEPCEVAEVIVRQSNNKAPGHDV FT ICNATLKALPRQAILYITLVFNAIVRLQYFPYQWKLGIISMIHKPGKPEREPASYRPIS FT LLPSISKVFERLIAVRIVSIMEAQGITPEHQFGFRAGHCTVEQLHRVVEQILTAYDSKE FT YCNSLFLDIREAFDRVWHIGLQLKIKQTLPAPYFGLLKSYLEGRRFAVRFHSAISTEHN FT VAAGVPQGSVLGPLLYCLYSHDMPQPDVSLYGKSMLATFADDVCVTYRSRCEHDAADGI FT QDFAYRFSEWARRWNIGINSSKSNNVCFTLKRRTPPPVYIEEVPVPQPNAAKYLGVLLD FT RRLTFSKHVTDIRTRLRAKVAKHYWLLSSRSKLSLSNKLTIYKQILAPNWKYGCQIWGL FT ACDSHIKRIQAIQNKVARLITGCEWFVRNTTLHRDLKLATVFDEINKHSSRYHDRLERH FT RNRLASALNRSRPPRRLNRRQPRDLITRSPLTRVRRS" XX SQ Sequence 4740 BP; 1336 A; 1215 C; 1183 G; 1006 T; 0 other; AATGTTAAAT AAAGGTTCGT GTCTAACAAT ACGCACCTGA CAAAGTGGAT TAAGTGAAAT 60 TAGTTTTCGC GGTAATAAAC TTATGGACAA GACCAGAATA CTGGCACACA TAGCAAATAG 120 TGACCCCCCA AGTCACTAAC AGTGAAATAA TAGTGAAACG AAAACATTTT CATTCAAAAA 180 TACAAAGTTA AGTTTCTCGA ACTGGGGCTC CGCTGCCCAG CTGCCACGCG ATCGCACAAA 240 CAGCTGTTTG CGAGCTTAAA GCTTTCTATC CCAGGGTTCA AGTTTTGGCT AGAACCCTGG 300 TGATTTGGTG CACACTTCAA TATGAACACT TTAAATGAAA CCGCTGCGGC TGATGAATCG 360 TTGGATACTG CGTTTCTCTC GAGCCCCCAA TGTGCTGCCC CGCAGCGCTT TCAAAAAATA 420 AAGCGAAAGT CTCGTGCTTC TCCGGAGACT GAAAGGAAAA AACCCAAATC AACCATCGGC 480 AAACAAGGGG AAAACCCTTC GGCTACAGAA CCTAGATATG GCGGCAATTC AAACCGATTT 540 GGTTTACTTG CGCATCTCAC AGCTGACAAA CAAGTAGGCA ATGAAATTGG CGATCTGTAT 600 GACCAGCCCA GTACCAGTCA TCAAGCTGCA ATTGCTGCCG CTAAGCGGGA TGCAGCCTCC 660 GCTGGTACCA CTAGCTCAGC CAAAAGAGCG CAGTCCAAAC CACCTCCTAT AGTAATGGAG 720 GGAGTGGACG ACGTATACCT GATGATGCAG AGCATCGAAA ATATAGTGGA CCTAGAAAAG 780 ATTGAGGCTA GGGCGTCAAT GAGCGGTGTC CTAAGGCTTT ACGCGGCTGA CGCTAATACA 840 TTTCGCACCA TAGTGAACTG GCTCGAGATC GAAGAGTATG AGTTCCACTG CTACCAGCTT 900 AAAGAGGACA GGCCTTACAG GGTATGCGTG AAAGGCCTGC ACCACAGTAC GCTACATCAC 960 CAAATCAAGG ATGAGCTGGA AAAGATCGGG CACAAGGTTC TCGATATTCA CACACCGCTT 1020 AGGCGAAACG AACCGGGTAC CTCAAAAGCG TCGCCAGTCA ATATGTTCTT CCTAAATATT 1080 GCTGCTGCGG CAAACAATAA GGAGATCCTG GCGGTAAAGG CACTATGCCA TATGAGAGTA 1140 GTTATTGAGC CTCTCCGCAA GCGTAACGCT ATTGTCCAGT GCCATCGTTG TCAGCAGATT 1200 GGCCACACAG CCAAATACTG CCGTAAGGCC CACATTTGTG TGAAATGTGC CGGCGAACAC 1260 CCAGCCAAGG ACTGTACCAG GCCACGCATC GAGCTGTGCA CTTGCTACAA CTGTGGCGGC 1320 CAGCATCCTG CAAACTATAA AGGTTGCAGC AAGCTACAAG CGTTCCTGCA GCGATCCAGA 1380 CCCAGAAGTG GAGTGGCTGG AAGAACAGAA GTAAGCGATC GACCAACTCC ACGGGGCTTA 1440 GCTGGAGGTA AGGAGATCCC CTCTTCTCGA GGCGGAATAT CTTATGCAGA TGTGGCTAGA 1500 GGGTCCATTC ACCACAAGCA ACCAATGAGC CTGACGCACC AGCAACAGAA GCAAAAGCAA 1560 CAGCCCTATG ATGGAAGCCC CAGTCGTCAA AGGAGCCGCA GCCGGACAAG GGCGTCTAGG 1620 GGTACACTCC AGCGCTCGAC GGATGCTAGC AGCAGCATTG AAGCCATCCT GCAGACGCTT 1680 AATGAGAACA TTAATTCTTT GCGCTCGATT CAAGAGAAGC AAATGGAATT AATGATGATG 1740 ATGATGAAGC AACAGCAACA ACAGTCACAT CAGCAGGGGC AGATTATCAA TCTGCTCACT 1800 GCTCTCCAAG CGCGTCAAGC GCCATAATGA TGCCGCTGCG CATCCTAGTG TGGAACGCCG 1860 ACGGCGTATC CACGAAGTTG CCTGAAGTAG AGTGCTTCGT GCGACGTCAC GAAATCGATG 1920 TATTACTGCT CAGCGAGACA CACTGCAAGG GGGCAGAGAC GCCTAAGCTA TTCGGATTTG 1980 TAGCCTACAC TGCCAATGAT CCGAGTGGTG GCAACGCCAA AGGCGGAGCA GCTATCTTAA 2040 TCAAAAATAG CCTTGCCCAC TTTCCGCTAA CACCAATAGC CACTGCCAAG GTGCAACTTG 2100 CGCCGGCGGT TATTGAAACG GCACTTGGTC CTATAAGCTT TGGAGCGGTC TACTGCCCAC 2160 CGAGATTTGC ATGGACTACG GACGAGTTTA AGGACATTTT GGAAGAGTTC CAGACGAAGT 2220 TCATTGTTGC AGGCGATTGG AACGCGTCCC ACTGGCTCTG GGGTGCGGGA AGGAGCAACC 2280 AAAGAGGCAT TGCATTAGCG AATCTCGTCC TAAATTCGGA GGTGGACTCG CTAGCAACAG 2340 GAGGACCAAC AAGATACCCG TACGGCTGTA GAGGCTCACC AGGGTACATC GATTTTGCAC 2400 TGACAAAGGG TGTGCTGGGC ATCCACGCTA ACATAAGTGC GGTTGTTGAG CTTAGCTCCG 2460 ACCACCTGCC TCTGGTAATT ACGCTGGATG CGGGGGCAAT ATCCTACCCT AAGATGGAGC 2520 GGCTTATCAC TAGGCGTACT AACCTGGAGG TATTCCAATC GCAACTGGAG TCCACACTGC 2580 CCCTCAACAC TGCCATAAAC TCTGGACAGG ACGTTGATGA TGCTATCGAA CTGCTCACCA 2640 ACAATATCAA GTCAGCAGCT AGATTGGCAA CTCGCAGCAT ATCTCGGCAG CCCGCGGCAG 2700 ATCGAATCCC AATACCCAGG GAGATCCTGC TGCTTATAGC TGAGAAGAGG CGCTTACGCA 2760 CTAGGTGGAT GAGGTCTCGG CACCCGTCGG ACAAAACGGA ATGGAACCGA GCTCTGAGTA 2820 GGCTCCGATG CGCGTTGGTG CTGCACAAAG CCGCATGGTT CGACGAAAGG CTTGCCAATA 2880 CCGGAGTCGA AAGCGAAGCG ACGCATTCGC TGTGGAAGGC CACGCGCGCA ATCAAAAGGC 2940 GTTGCACGAG GAAGGCGCCT CTAGTCGATA GCAACGGGAC ATGGTGTCGG ACCGACTTGG 3000 GACAAGCGGA GGTATTCGCT GCGCACCTCG CCGAGCGATT TCAACCATTC AAGCTTGCCA 3060 GCCTGCAACA GGTTGAAGAA ACTCAGGACC AGCTGAACCA AGCGCTTCAA ATGGATATGC 3120 CAATCACGCC GTTTGAACCC TGCGAGGTAG CCGAAGTCAT TGTGCGCCAG AGTAACAACA 3180 AAGCACCTGG ACATGACGTC ATCTGCAACG CCACATTGAA GGCCCTGCCC AGACAAGCGA 3240 TCCTCTACAT AACGTTGGTT TTCAACGCTA TTGTGAGGTT GCAATACTTC CCTTATCAGT 3300 GGAAGCTCGG GATAATCTCC ATGATCCACA AACCTGGCAA GCCGGAAAGG GAGCCCGCCT 3360 CCTACCGGCC GATCAGTCTC CTCCCTTCAA TTTCGAAGGT GTTTGAGAGA CTGATTGCTG 3420 TCCGGATTGT AAGCATTATG GAAGCCCAGG GGATTACCCC TGAGCACCAG TTCGGTTTCC 3480 GTGCTGGCCA CTGTACTGTC GAGCAGCTCC ATCGAGTCGT CGAGCAAATT CTGACTGCCT 3540 ACGACAGTAA GGAATATTGT AACAGCCTCT TCTTGGACAT TCGAGAAGCG TTTGATCGAG 3600 TGTGGCACAT TGGACTCCAA CTGAAAATCA AGCAGACGCT GCCTGCCCCA TATTTTGGGT 3660 TGCTGAAATC GTACCTGGAA GGAAGGAGGT TCGCTGTGCG CTTTCATTCA GCAATTTCCA 3720 CCGAGCACAA CGTGGCAGCT GGTGTTCCAC AAGGTAGTGT CCTCGGCCCC CTGCTCTACT 3780 GCCTGTATAG CCACGACATG CCGCAGCCAG ATGTAAGCCT TTACGGGAAA TCTATGTTGG 3840 CCACATTTGC CGATGACGTG TGCGTCACCT ACAGGTCCCG ATGCGAGCAC GACGCAGCCG 3900 ATGGTATCCA GGACTTTGCA TACCGGTTCT CGGAATGGGC AAGACGATGG AATATTGGCA 3960 TCAATAGCAG TAAATCCAAC AACGTCTGCT TCACTTTAAA GCGGAGAACG CCACCGCCCG 4020 TCTACATCGA GGAAGTCCCC GTACCACAGC CGAACGCAGC AAAGTACCTT GGAGTGCTTC 4080 TGGATCGCAG ACTCACATTT TCCAAGCATG TGACCGACAT CAGAACGCGC CTACGTGCTA 4140 AGGTGGCGAA GCACTACTGG CTACTTTCTT CGCGCAGTAA ATTGTCGCTA TCCAACAAGC 4200 TGACAATTTA CAAACAGATC CTAGCACCAA ACTGGAAGTA TGGGTGCCAA ATCTGGGGCT 4260 TAGCCTGCGA CAGCCACATC AAAAGGATCC AGGCTATTCA AAATAAGGTA GCAAGACTCA 4320 TCACCGGCTG CGAGTGGTTT GTTCGAAACA CCACCCTGCA CAGAGACCTG AAACTCGCAA 4380 CGGTATTTGA CGAAATAAAC AAGCACTCGA GCAGATACCA TGACAGGCTG GAGCGCCACA 4440 GAAATCGGCT GGCCAGCGCT TTAAACAGAT CTCGCCCACC AAGGAGGCTC AATAGAAGGC 4500 AACCGAGGGA TCTCATTACC CGATCTCCTT TGACAAGGGT CCGCAGAAGC TGACGCTTAT 4560 CTTAAATCCT ATTTGTTATA TGTGATTGTT ATGTAATTGT AGTTAAATTA CTGTAAATTT 4620 GAAAAAGCTA ACTATAGTTA GCCGGCGAGC CCAAATGGGC TGAATTAATA GATAAGAAGG 4680 ACACAAAGGG GCTTCAAGAC TTCCCCGTAT GCCTTAATAA ATAAATTAAA TAAAAAAAAA 4740 //