comparison test-data/transposon_sequence_set_v9.5.embl.txt @ 0:3c8c9911cf2a draft

planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/embl2fa commit 6e5860cedc0ed0bc807ff64f752e62355c1b19d4
author artbio
date Sun, 13 Nov 2022 00:23:23 +0000
parents
children
comparison
equal deleted inserted replaced
-1:000000000000 0:3c8c9911cf2a
1
2 ID DME9736 standard; DNA; INV; 7411 BP.
3 XX
4 AC AJ009736;
5 XX
6 DR FLYBASE; FBte0000104; Dmel\Idefix.
7 XX
8 FT source AJ009736:1..7411
9 FT SO_feature five_prime_LTR ; SO:0000425:1..600
10 FT SO_feature three_prime_LTR ; SO:0000426:6841..7411
11 FT SO_feature CDS ; SO:0000316:<988..2031
12 FT /name="Dmel\Idefix\gag"
13 FT /db_xref="FLYBASE:FBgn0027381"
14 FT /db_xref="SPTREMBL:O96739"
15 FT /db_xref="NCBI_PROTEIN:CAA08806.1"
16 FT /translation="ARKLKDIMAVPQLSETHLNQLLNQIKELNYYDGAPGKLSGFVNQV
17 FT EQLLSLYPTQEARQAHVIYGAVKRLLVDSALEVVTQERANTWLDMKKALAMAFKDHRPY
18 FT VTLIRQLEDISYPGSICKFIEKLETQYWIMFDKLELESDHVDKSNYTEMLNKTVKSVID
19 FT RKLPDRIYMSLARKDIDTIYKLKQASMELGLYDAIPENHRSNRTEMNKRRNRGNYNQNN
20 FT NQKYYNNRNHNYSNYYPSMNQNHNTQPPQNPTQPMTNQNQYSPRFIPNNQRGNYYAFRR
21 FT DLTQAQQNNPLNNTLNFQPSTSNNINRQGPVKRQRESQSDQSRMDVNFHQAASDTQMIE
22 FT KDIQVPM"
23 FT SO_feature CDS ; SO:0000316:<1950..5402
24 FT /name="Dmel\Idefix\pol"
25 FT /db_xref="FLYBASE:FBgn0027380"
26 FT /db_xref="SPTREMBL:O96740"
27 FT /db_xref="NCBI_PROTEIN:CAA08807.1"
28 FT /translation="PKQDGCKFSSSCLGHSNDREGHTSPYVKIIHHNKNYKGMIDTGSS
29 FT INIIRENFENLEEKEENLIVYTIKGPITLKRSIIIKPTSVCPSAQKFYIHKFSDNYDFL
30 FT LGRKYLEDTKAKIDYANETVTLGSKVFKFLYEEKKGETASKCLDPQEKNDSALVDRTKP
31 FT KMQKVKTAPKCLKPKHQQQKKETALPKCLISNVVKDTVDNDVTHLDPMSVDNDIVNFAI
32 FT NNELRECNEYRLEHLNAEEVECLKKFLYEYRDIQYKEGENLTFTSTIKHVIQTQHEDPV
33 FT YRKPYKYPQSVDQEVNKQIKEMIEQGIVRKSKSPYCSPIWVVPKKADASGKQKFRLVVD
34 FT YRNLNEITVNDKFPIPRMDEILDKLGRCQYFTTIDLAKGFHQIQMDENSIAKTAFSTKH
35 FT GHYEYTRMPFGLKNAPATFQRCMNNLLEDLIYKDCLVYLDDIIVYSTPLEEHILSLKKV
36 FT FEKLRDANLKLQLDKCEFMKKETEFLGHIVTTNGIKPNPNKTKAITNFPLPKTPKQIKS
37 FT FLGLCGFYRKFIPNFAKIVKPMTLKLKKGAIIDTKCKEYIESFEKLKVLITSDPILIYP
38 FT DFSKPFSLTTDASNVAIGAVLSQNHKPVCYASRTLNEHEINYATIEKELLAIVWATKYF
39 FT RSYLFGRPFEVLSDHKPLVWLNNIKEPNMKLQRWKIKLNEFDYKIKYLPGKENHVADAL
40 FT SRTKIEVMVGEVANSADATIHSAIEDNLNYIPITERPINYFSRQIEIEKGDNDTTSVQH
41 FT LFQKLKIKIVYKEMTPELAKNLIKEYVCTKKSAIYFPNDEDFLIFQRAFTEIISPNNFT
42 FT KLLRCTTKLIDILTYAEFKDLILKKHKELLHPGIEKTINLFKEEYYYPDSQKLIQTIIN
43 FT ECQICYLAKTEHQTQMTYETTPEIFNTREKYMIDFYLTGNQIFLSCIDIYSKFASLVEL
44 FT KSRDWLEAKRAITKIFNDMGKPQEIKADKDSAFMCLALQNWLRSEGVQISISTSKNGIS
45 FT DIERFHKTVNEKLRIIGSQQNVEDRCTKFERILYIYNHKTKHNSTKRFPADIFLYAGSP
46 FT DFNVQQNKIDRIEYLNKNRHDFEVDIKYRQAPLVKSKITNPFKKTGRIGQVDDKHFEET
47 FT NRGRKIVHYKSKFKKQKKFNKSKYDNSRPTKEAQSTQHTSNNA"
48 FT SO_feature CDS ; SO:0000316:5248..6780
49 FT /name="Dmel\Idefix\env"
50 FT /db_xref="FLYBASE:FBgn0027382"
51 FT /db_xref="SPTREMBL:O96741"
52 FT /db_xref="NCBI_PROTEIN:CAA08808.1"
53 FT /translation="MINISKKQIVAGRSFTISQNLRNRKSLIRANMIIPDQPKKHKVHN
54 FT ILLIMLSCILSLIITVKCNNIEVNPVNAKNGYLIFQTGTMEIPTSYEYHYLSINITKTM
55 FT LMFEDIVSEANNYPNVPQIQYLVDKLKREINGLRIISRSKRGLLNVVGKAYKYLFGTLD
56 FT EDDREELEEKINNMSEDSVKTHDLNTILDVINSGIDIINKLKVDKEQHQQIAVLIFNLE
57 FT QFTEYIEDIELGLQLTRLGIFNPRLLKHDYLKHVNSEKMLKIKTSTWLKTDTNEILIIS
58 FT HIPSEVTKVPIFQIVPYPDEHNYILTEQIFDKFYIFDNQVFHKDTNRDIFDKCIIGIIK
59 FT QEQTQCKYIKTHKNYQINYIEPNILLTWNIPETAVNQDCTHNKILISGNNIIKIKNCTI
60 FT QIDEFLISNNLADFTQTIYITNNVTRLEPINHLQTREMIETHVKHYNFFQIICITTFVI
61 FT MIISLTLYVAYKFKNIPKKIIVNIVSKKNTRTLKIMSMKIFNKEIILPYTQI"
62 XX
63 CC Derived from AJ009736 (e1371475) (Rel. 58, Last updated, Version 1).
64 CC Takis Benos and Michael Ashburner, 1-Feb-1999.
65 CC Any changes to original sequence record are annotated in an FT line.
66 XX
67 SQ Sequence 7411 BP; 3047 A; 1363 C; 1109 G; 1892 T; 0 other;
68 GTGACATATC CATAAGTCCC TAAGACTTAA GCATATGCCT ACATACTAAT ACACTTACAA 60
69 CACATACACC CCAATACAAC ATACACTACT CCGGATGTAC CCAACAGATA CCAGATAAGA 120
70 ATAAGATTGT TATATGATCC TCGAGAATGG AAAAAACCCC AATTCTAGAT AAGTCACCCA 180
71 CTGGTAGACT AAACATCCGT CCCCTAATTT AAACAATTCC TTGCTTAAGC CTCACCCCAT 240
72 CGTCACATTC CCACGTTCAA AGCTCGGAGC CGCAATCCCG AAAAACAAAA GTATCGATTT 300
73 CAATAAACAA ATTATAAGAA TCTAAGAGCA CTTGTATCCA AGAGCAAATG CACTTGAATC 360
74 CAAGAGAAAC GCAAAGCTTT TTCTCTTTAC GATCAGAATC CTAAAGTCTA AAGTCCATAT 420
75 TAGAAAAGCT CGATACCGAG GCTTGAACGT CAACCAAATC AGAATAATTA TCAGAGTTCA 480
76 GTTTGAGACC TAATTGTAAA AGGTTCGGTG TTCTTCTCAA ATAAAAAGAT TGTAATCATT 540
77 TAGTGAAATA AAAATTATAT TTTTTTCACT TATAAATATT GCAAGTATTT AATTGGCGCA 600
78 GTCGGTTAGG ATCCAATAAA ATAAAAGAGT CCTTTTAGTA CGGTACTGAT CAACTGAAGG 660
79 ATATGCTATA CGACTAGCTA TCCAAGATCA GCGAATTAAA ATAGTGATTC AAAAATATTT 720
80 TTTAATCCGC AAAAGAATCT ACGTGAAAGT AGTATTCAAA ATAAAATCCC GTGCGGTCGG 780
81 AAACAAAAAT TAATTTAAAT TTTTTAATTC CGAAACTTAA AACCAAGTTT AAAGAAAACT 840
82 TAAAATCAAG AAAACTTAAA ACCAAGTTTA AAGAAAACTT AAAATCAAGA AAACTTAAAA 900
83 CCAAGTTTAA AGAAAACTTA AAATCAAGAA AACTTAAAAC CAAGTTTAAA GAAAACTCAA 960
84 AATCAAGAAA ACTTAAAGCC AAAATAAGCT AGAAAACTAA AAGACATCAT GGCAGTCCCA 1020
85 CAACTCTCAG AAACACACCT AAACCAACTG CTAAACCAAA TCAAAGAATT AAACTACTAC 1080
86 GATGGCGCAC CTGGCAAATT ATCTGGATTC GTCAACCAAG TGGAACAACT GCTCAGTTTA 1140
87 TACCCAACAC AGGAAGCAAG ACAGGCACAC GTCATATATG GAGCAGTGAA GCGGTTATTA 1200
88 GTGGATTCAG CCTTAGAAGT CGTAACCCAG GAAAGAGCTA ACACATGGCT GGACATGAAG 1260
89 AAAGCACTGG CAATGGCATT CAAAGACCAT AGACCTTATG TAACTCTCAT CAGACAATTA 1320
90 GAAGACATAT CATACCCAGG AAGTATCTGT AAGTTTATAG AAAAATTAGA AACACAATAC 1380
91 TGGATTATGT TCGATAAGTT AGAATTAGAA AGTGACCATG TTGATAAATC GAATTATACC 1440
92 GAAATGTTAA ACAAAACTGT TAAATCAGTA ATAGATCGAA AACTGCCGGA TAGAATTTAT 1500
93 ATGTCTTTGG CACGTAAAGA TATTGATACA ATTTATAAAT TAAAACAAGC ATCAATGGAA 1560
94 TTAGGCCTTT ATGATGCTAT TCCAGAAAAT CACCGTTCTA ATAGAACAGA AATGAATAAA 1620
95 CGTAGGAACA GGGGAAACTA TAATCAAAAT AATAATCAAA AATATTACAA TAATAGAAAT 1680
96 CACAACTACA GTAATTATTA TCCTAGCATG AATCAGAATC ATAATACACA ACCACCTCAG 1740
97 AATCCGACTC AACCTATGAC AAATCAAAAC CAATATTCAC CGCGTTTCAT ACCGAATAAT 1800
98 CAAAGAGGGA ATTATTATGC ATTTAGACGA GACTTAACAC AAGCTCAGCA GAACAACCCA 1860
99 CTTAATAACA CCCTTAACTT CCAACCTTCG ACATCGAATA ATATTAACAG ACAAGGGCCA 1920
100 GTAAAAAGAC AACGCGAGAG TCAGAGTGAC CAAAGCAGGA TGGATGTAAA TTTTCATCAA 1980
101 GCTGCCTCGG ACACTCAAAT GATAGAGAAG GACATACAAG TCCCTATGTA AAAATAATTC 2040
102 ATCATAATAA AAATTATAAG GGAATGATCG ATACAGGATC ATCAATTAAC ATCATAAGAG 2100
103 AAAATTTTGA GAACTTAGAA GAAAAGGAAG AAAACCTAAT AGTATACACT ATTAAAGGAC 2160
104 CAATAACACT AAAGAGAAGT ATAATAATAA AACCTACTTC AGTATGTCCG TCTGCTCAAA 2220
105 AATTCTACAT TCACAAATTT TCTGATAACT ATGATTTCTT GTTAGGTCGA AAGTATTTAG 2280
106 AAGATACAAA AGCTAAAATA GATTATGCTA ACGAAACAGT AACACTAGGC TCAAAAGTAT 2340
107 TTAAGTTTCT CTATGAAGAA AAGAAGGGCG AGACCGCATC CAAATGCCTT GACCCACAAG 2400
108 AAAAGAATGA TTCCGCTCTA GTGGACAGAA CCAAACCAAA AATGCAAAAG GTTAAGACCG 2460
109 CACCTAAGTG CCTTAAACCA AAGCATCAAC AGCAGAAGAA AGAGACCGCA TTACCCAAAT 2520
110 GCCTCATTTC AAATGTTGTT AAAGACACAG TGGACAATGA TGTAACACAT CTCGATCCCA 2580
111 TGTCCGTTGA CAACGATATA GTCAACTTCG CGATTAACAA TGAGTTACGC GAATGTAACG 2640
112 AGTATAGACT CGAACACTTA AATGCAGAGG AAGTTGAATG TTTAAAGAAG TTCCTATACG 2700
113 AATATAGAGA CATTCAGTAC AAAGAGGGCG AAAATTTGAC CTTCACCAGT ACTATTAAAC 2760
114 ATGTCATCCA GACTCAACAC GAAGACCCAG TATACCGTAA ACCCTACAAG TACCCTCAAA 2820
115 GCGTTGACCA AGAAGTTAAC AAACAAATTA AAGAAATGAT AGAACAAGGG ATTGTTCGCA 2880
116 AATCGAAGTC CCCTTATTGT TCTCCTATTT GGGTGGTCCC CAAGAAGGCA GACGCCTCTG 2940
117 GGAAACAAAA ATTCAGGTTG GTAGTCGATT ACAGGAACCT AAATGAGATA ACTGTTAACG 3000
118 ACAAATTTCC CATTCCCCGA ATGGATGAGA TATTGGACAA ACTAGGTAGA TGCCAATACT 3060
119 TTACCACTAT AGATCTAGCC AAGGGTTTTC ACCAAATCCA AATGGATGAA AATTCTATTG 3120
120 CAAAAACAGC TTTTTCAACT AAGCATGGGC ATTATGAATA TACTCGTATG CCCTTTGGTT 3180
121 TAAAAAACGC TCCAGCTACT TTTCAGAGAT GCATGAATAA TCTTCTGGAA GATTTAATCT 3240
122 ACAAAGACTG TTTAGTCTAT TTAGACGATA TTATTGTTTA TTCCACTCCA TTGGAAGAAC 3300
123 ACATTTTATC CCTAAAGAAA GTCTTTGAAA AACTGAGAGA CGCTAATTTA AAGTTGCAAC 3360
124 TAGATAAATG TGAATTCATG AAGAAAGAAA CTGAATTCCT AGGACACATC GTCACAACAA 3420
125 ATGGCATCAA ACCAAATCCA AATAAAACTA AAGCAATTAC AAATTTTCCA TTACCCAAGA 3480
126 CACCTAAGCA AATAAAATCA TTTTTGGGAT TATGTGGATT CTATCGCAAG TTTATTCCTA 3540
127 ACTTTGCCAA AATAGTTAAA CCCATGACCC TCAAATTAAA GAAAGGTGCT ATAATAGACA 3600
128 CCAAATGTAA AGAATACATC GAATCATTTG AAAAATTAAA AGTTTTGATA ACTTCAGACC 3660
129 CGATATTAAT CTATCCTGAT TTTTCAAAAC CTTTTTCTTT GACAACTGAT GCTAGCAACG 3720
130 TAGCTATTGG TGCAGTGTTA TCACAAAATC ACAAGCCAGT TTGTTATGCC AGTAGAACGC 3780
131 TAAACGAACA TGAAATCAAC TATGCTACGA TTGAAAAAGA ATTGTTAGCT ATAGTTTGGG 3840
132 CTACAAAATA TTTCAGGTCA TACTTATTCG GCAGACCATT TGAAGTATTA AGTGATCACA 3900
133 AGCCACTGGT ATGGCTCAAC AACATTAAAG AACCAAACAT GAAATTGCAA AGATGGAAAA 3960
134 TAAAACTTAA TGAATTCGAT TATAAAATCA AATATCTTCC AGGCAAAGAA AACCATGTCG 4020
135 CGGATGCTCT TTCCCGCACG AAAATAGAAG TTATGGTTGG CGAGGTCGCA AATAGCGCAG 4080
136 ACGCAACTAT ACACAGTGCC ATTGAAGATA ATCTAAATTA CATACCCATA ACAGAAAGAC 4140
137 CAATAAATTA CTTCTCTAGA CAAATAGAGA TAGAAAAAGG CGATAACGAT ACAACAAGTG 4200
138 TACAACATTT GTTTCAAAAA TTAAAGATTA AGATAGTCTA TAAAGAAATG ACACCTGAAC 4260
139 TCGCCAAAAA CCTCATTAAG GAATATGTGT GCACCAAAAA GAGTGCAATT TATTTCCCTA 4320
140 ATGACGAAGA TTTTCTGATC TTCCAGAGAG CGTTTACCGA AATTATAAGC CCTAACAATT 4380
141 TCACAAAACT CTTGAGATGT ACCACAAAGT TAATTGATAT ACTAACGTAT GCAGAATTCA 4440
142 AAGATTTAAT CTTAAAGAAA CATAAGGAAC TTTTACATCC GGGTATAGAA AAAACAATCA 4500
143 ATTTATTTAA AGAAGAATAT TACTATCCTG ATAGTCAAAA GCTTATTCAA ACCATTATCA 4560
144 ATGAATGTCA AATTTGTTAT CTAGCAAAAA CGGAACATCA AACACAAATG ACATATGAGA 4620
145 CTACACCAGA AATATTTAAC ACAAGAGAAA AATACATGAT AGATTTTTAT CTCACAGGAA 4680
146 ACCAGATCTT CTTATCTTGC ATTGATATCT ATTCGAAATT TGCATCACTA GTTGAATTAA 4740
147 AAAGTAGAGA TTGGCTAGAA GCAAAAAGAG CCATTACTAA AATATTCAAT GACATGGGAA 4800
148 AACCGCAAGA AATTAAAGCA GACAAAGACT CAGCTTTTAT GTGTTTAGCC TTACAAAATT 4860
149 GGTTAAGATC TGAAGGTGTA CAAATTTCTA TAAGCACTAG CAAAAATGGT ATATCTGATA 4920
150 TAGAAAGATT CCACAAGACC GTAAACGAAA AGCTAAGAAT CATTGGTAGC CAACAAAATG 4980
151 TTGAAGATAG GTGCACAAAA TTCGAAAGAA TTCTATACAT ATACAATCAC AAAACTAAAC 5040
152 ATAATAGTAC TAAAAGATTT CCAGCAGACA TTTTCCTATA TGCAGGCAGT CCAGATTTTA 5100
153 ATGTACAACA AAACAAAATC GATAGGATAG AATACCTCAA TAAGAATAGA CACGATTTTG 5160
154 AAGTTGATAT AAAATATAGA CAAGCCCCAC TTGTAAAAAG TAAAATAACC AATCCATTTA 5220
155 AAAAGACAGG AAGAATTGGA CAAGTAGATG ATAAACATTT CGAAGAACAA AATCGTGGCA 5280
156 GGAAGATCGT TCACTATAAG TCAAAATTTA AGAAACAGAA AAAGTTTAAT AAGAGCAAAT 5340
157 ATGATAATTC CAGACCAACC AAAGAAGCAC AAAGTACACA ACATACTTCT AATAATGCTT 5400
158 AGTTGCATAC TATCACTTAT CATCACGGTC AAGTGCAACA ATATAGAAGT AAATCCAGTA 5460
159 AACGCGAAAA ATGGATACCT TATATTCCAA ACAGGAACAA TGGAAATTCC AACCAGCTAT 5520
160 GAATACCATT ATTTAAGCAT AAACATAACA AAGACAATGC TCATGTTCGA AGATATAGTA 5580
161 AGTGAAGCAA ACAACTATCC TAATGTACCA CAAATACAAT ATTTAGTCGA CAAATTAAAA 5640
162 CGAGAAATAA ATGGGTTAAG AATTATTAGT CGAAGTAAAA GAGGTCTTTT AAACGTAGTA 5700
163 GGAAAAGCAT ACAAATACTT ATTCGGCACA TTAGATGAGG ATGACAGAGA AGAGTTAGAA 5760
164 GAAAAAATAA ACAACATGTC AGAAGACTCT GTAAAAACCC ATGACCTAAA CACGATTCTA 5820
165 GATGTAATCA ATAGTGGTAT AGATATAATT AATAAGCTCA AAGTAGATAA AGAACAACAC 5880
166 CAACAAATTG CGGTACTAAT ATTTAACCTA GAGCAATTTA CAGAATATAT AGAAGACATA 5940
167 GAATTGGGTC TGCAATTAAC CAGACTAGGA ATTTTCAATC CAAGATTACT AAAGCATGAC 6000
168 TATTTAAAAC ATGTAAATTC AGAAAAAATG CTAAAGATAA AAACGTCAAC CTGGCTTAAA 6060
169 ACAGACACGA ACGAAATTTT GATTATTTCC CATATTCCTA GCGAAGTTAC TAAAGTTCCA 6120
170 ATATTCCAAA TTGTTCCGTA CCCAGATGAA CATAATTATA TTCTAACCGA GCAAATATTC 6180
171 GATAAATTCT ACATATTTGA TAACCAAGTA TTCCATAAAG ATACCAATAG GGATATATTC 6240
172 GACAAATGTA TTATTGGAAT CATCAAACAA GAGCAAACTC AATGCAAATA TATTAAAACA 6300
173 CATAAAAATT ACCAAATAAA TTATATAGAA CCAAATATAC TATTAACATG GAATATTCCT 6360
174 GAAACAGCTG TTAACCAAGA CTGTACACAC AATAAAATAT TAATTTCAGG AAACAACATC 6420
175 ATTAAAATTA AAAATTGTAC CATACAAATA GATGAATTCT TAATCTCTAA TAATCTAGCA 6480
176 GACTTTACAC AAACAATTTA TATCACCAAC AATGTAACAC GTCTAGAACC AATAAATCAC 6540
177 TTACAAACGA GAGAAATGAT AGAAACCCAT GTAAAACACT ATAACTTTTT TCAAATTATA 6600
178 TGCATTACAA CGTTCGTCAT AATGATAATT AGTTTGACTC TGTATGTAGC ATATAAGTTT 6660
179 AAAAATATAC CTAAGAAAAT TATTGTCAAT ATCGTAAGCA AAAAGAACAC ACGCACCTTG 6720
180 AAAATAATGT CAATGAAAAT ATTCAACAAG GAAATAATAT TACCTTATAC CCAAATTTAA 6780
181 CGACCTGAGG ACAGGCCAAA TTCAAAGGTT GGGGGAGTGA CATATCCATA AGTCCCTAAG 6840
182 ACTTAAGCAT ATGCCTACAT ACTAATACAC TTACAACACA TACACCCCAA TACAACATAC 6900
183 ACTACTCCGG ATGTACCCAA CAGATACCAG ATAAGAATAA GATTGTTATA TGATCCTCGA 6960
184 GAATGGAAAA AACCCCAATT CTAGATAAGT CACCCACTGG TAGACTAAAC ATCCGTTCCC 7020
185 CTAATTTAAA CAATTCCTTG CTTAAGCCTC ACCCCATCGT CACATTCCCA CGTTCAAAGC 7080
186 TCGGAGCCGC AATCCCGAAA AACAAAAGTA TCGATTTCAA TAAACAAATT ATAAGAATCT 7140
187 AAGAGCACTT GTATCCAAGA GCAAATGCAC TTGAATCCAA GAGAAACGCA AAGCTTTTTC 7200
188 TCTTTACGAT CAGAATCCTA AAGTCTAAAG TCCATATTAG AAAAGCTCGA TACCGAGGCT 7260
189 TGAACGTCAA CCAAATCAGA ATAATTATCA GAGTTCAGTT TGAGACCTAA TTGTAAAAGG 7320
190 TTCGGTGTTC TTCTCAAATA AAAAGATTGT AATCATTTAG TGAAATAAAA ATTATATTTT 7380
191 TTTCACTTAT AAATATTGCA AGTATTTAAT T 7411
192 //
193 ID DMIS176 standard; DNA; INV; 7439 BP.
194 XX
195 AC X01472; J01060; J01061;
196 XX
197 DR FLYBASE; FBte0000109; Dmel\17.6.
198 XX
199 FT source X01472:1..7439
200 FT SO_feature five_prime_LTR ; SO:0000425:1..512
201 FT SO_feature three_prime_LTR ; SO:0000426:6928..7439
202 FT SO_feature TATA_box ; SO:0000174:372..377
203 FT SO_feature TATA_box ; SO:0000174:7271..7277
204 FT SO_feature primer_binding_site ; SO:0005850:511..529
205 FT SO_feature polyA_signal_sequence ; SO:0000551:372..377
206 FT SO_feature polyA_signal_sequence ; SO:0000551:7299.7304
207 FT SO_feature RR_tract ; SO:0000435:6917..6927
208 FT SO_feature CDS ; SO:0000316:1074..2393
209 FT /name="Dmel\17.6\gag"
210 FT /db_xref="FLYBASE:FBgn0044339"
211 FT /db_xref="SWISS-PROT:P04282"
212 FT /db_xref="NCBI_PROTEIN:CAA25701.1"
213 FT /translation="MAQEPAIVPPLSDSNMTQVAYQIGNVEKFNGDPGSLYTFVSRIDY
214 FT ILALYATGDERQQQIIFGHIERSISGEVMRCIGAYDMYTWQQLRRQLVLNYKPQTPNHV
215 FT LLEEFRKTPFRGNVRAFLEEAESRRQTLTSKLELEQDLEEKTFYLKLIKSSIESLIEKL
216 FT PTHIYLRINNHNIPDLRSLINLLQEKGMYEQINHTSTHVQKQNFSDKPQKSFNQNTNQS
217 FT NNIRKYPTPFLHYNSPIPYQAPQIYQTPPTNNPLYRHPIPYHPNPNNVFQPSQQNNVFQ
218 FT PSQQNNAFQPNQRTNFTSRPIFNTNRNNAFDQNRFGQQPQYQNQQSTQNSSSYVPNRPI
219 FT KRLRPANSGQTGMSVDETLYQEDAFYQQCVPYDYFYYPTYDHSDYYPENQYQIDENNQN
220 FT LQRTQQLQQINTDETNNDNQEPNVEQAENFQPQALENPNI"
221 FT SO_feature CDS ; SO:0000316:2345..5518
222 FT /name="Dmel\17.6\pol"
223 FT /db_xref="FLYBASE:FBgn0014453"
224 FT /db_xref="SWISS-PROT:P04323"
225 FT /db_xref="NCBI_PROTEIN:CAA25702.1"
226 FT /translation="TGRKFSATSLGKPQYITIKYKENNLKCLIDTGSTVNMTSKNIFDL
227 FT PIQNTSTFIHTSNGPLIVNKSIIIPSKILFPTTNEFLLHPFSENYDLLLGRKLLAEAKA
228 FT TISYRDQEVTLYNNKYKLIEGIATHEQSHFQNVNMIPDTMLRQPNKISPILESDLYRLE
229 FT HLNNEEKQRLCALLQKYHDIQYHEGDKLTFTNQTKHTINTKHNLPLYSKYSYPQAYEQE
230 FT VESQIQDMLNQGIIRTSNSPYNSPIWVVPKKQDASGKQKFRIVIDYRKLNEITVGDRHP
231 FT IPNMDEILGKLGRCNYFTTIDLAKGFHQIEMDPESVSKTAFSTKHGHYEYLRMPFGLKN
232 FT APATFQRCMNDILRPLLNKHCLVYLDDIIVFSTSLDEHLQSLGLVFEKLAKANLKLQLD
233 FT KCEFLKQETTFLGHVLTPDGIKPNPEKIEAIQKYPIPTKPKEIKAFLGLTGYYRKFIPN
234 FT FADIAKPMTKCLKKNMKIDTTNPEYDSAFKKLKYLISEDPILKVPDFTKKFTLTTDASD
235 FT VALGAVLSQDGHPLSYISRTLNEHEINYSTIEKELLAIVWATKTFRHYLLGRHFEISSD
236 FT HQPLSWLYRMKDPNSKLTRWRVKLSEFDFDIKYIKGKENCVADALSRIKLEETYLSEQT
237 FT QHSAEEDNSDLIFITERPLNTFNRQVIFSKGPPDIKVTKYFKKHITQIFYDIMTREKAE
238 FT QYLIDHFCGKKSALYIESDADFEVIQAAHKLAINTKYTKILRSTILLKNITTYAEFKEL
239 FT ILTAHEKLLHPGIQKTTKLFGETYYFPNSQLLIQNIINECSICNLAKTEHRNTDMPTKT
240 FT TPKPEHCREKFMIDIYSSEGKHYVSCIDIYSKFATLEEIKTKDWIECKNALMRIFNQLG
241 FT KPKLLKADRDGAFSSLALKRWLESEEVELQLNTTKTGVADIERLHKTINEKIRIIKTSD
242 FT DEETKLSKMETVLNIYNHKTKHDTTGQTPAHIFLYAGQPILDTQQNKENKINKINNDRV
243 FT EYEVDTRYRKGPLQKGKLENPFKPTKNVEQTDSDHYKITNRNRITHYYKTQFKKRKKNN
244 FT QLSISQAPGT"
245 FT SO_feature CDS ; SO:0000316:5488..6903
246 FT /name="17.6\env"
247 FT /db_xref="FLYBASE:FBgn0027624"
248 FT /db_xref="SWISS-PROT:P04283"
249 FT /db_xref="NCBI_PROTEIN:CAA25703.1"
250 FT /translation="SALNFTGTWHLITLLLMLITTVHGQQIEINNIDTNHGYLLFSDKP
251 FT VQIPSSFEHHCLRINLTEIDTIADYFEQRLRTDYHAPQVKFLYNKMRRELAGIALRHRN
252 FT KRGLINIVGSVFKYLFGTLDENDRVDIQRKLETNAHNSVNLHELNDAIQLINDGMQKIQ
253 FT NYENNSNIINSLLYELMQFTEYIEDVEMGMQLSRLGLFNPKLLNYDKLENVNSQNILNI
254 FT KTSTWINYNDNQLLIISHIPINFSLINTVKIIPYPDSNGYQLEYTDTQSYFERENKVYN
255 FT NENKEINNECVTNIIKHLKPICNFESIHTDEIIKYIEPNTIVTWNLTQTSLKQNCQNSF
256 FT NNIKIKGNKMIKVTQCKIEINSIILSENLFKPEIDLTPLYTPLNITKIKTVKHNDINEM
257 FT ISQNNITLYIFMTTVIIILILLYLYLRYVSFNPFMMLYAKLKLRKNQNQNTAQQIEMED
258 FT VPLPLLYPSIPAQV"
259 XX
260 CC Derived from X01472 (g8142) (Rel. 36, Last updated, Version 2).
261 CC Takis Benos and Michael Ashburner, 20-Aug-1997.
262 CC Any changes to original sequence record are annotated in an FT line.
263 XX
264 SQ Sequence 7439 BP; 2985 A; 1512 C; 1048 G; 1894 T; 0 other;
265 AGTGACATAT TCACATACAA AACCACATAA CATAGAGTAA ACATATTGAA AAGCCGCATA 60
266 CGTAAACAAT AAGTGACCAC CATGCTAATG TGGATCAAAT AACAAAAATA TCCACTCTGC 120
267 ATTTTGACAC CCCCATACTG TATGCCATCT GCGCAGTATG CATTCTAATA AACAAATTCT 180
268 TTGACAGCGG CACTTAGCCA TTCTTGTAAA CAAATCTTAA AGTCTGCCTG CTCTCTCTGA 240
269 GGCTTCTCCT CCACTTAAGA ATCCAAGAGC AATGCTCTCC CAAAAACACT AACATATTCT 300
270 TTAAGCAAGC ACAGAGGCTT CTCCTCATTT TCACTTTCAT TTGATTTTCA GTCTTAAGCT 360
271 GAACGTTAAT CAATAAACAA CACAATCGAT ACCGAAATTT TGATTCGTTT TATTTTGGCA 420
272 AAACTCAATT TTCAGCGTTG GTCTTAGTTC ATATTCGGAA CGGTCCATTT AATAGACTCA 480
273 AAACTATTTA TTGCAACCAT TTATTTGCAA TTGGCGCAGT CGATGTGATC AGTGTTAAAG 540
274 TTCCTTGATG CGGTAACCAG ATTTGCCAAT TCCTGTGTTC TTTTTGTTCT CTGACAAAAG 600
275 TACCACGATA ACGGGCACCC ACGTGACGGT TAATATCGCT TTAAGTTTTT AATTAAACCT 660
276 CGACAATAAA GTGAAACCGA AAAATCACAA TTTGCCTAAA CAAACCTGAA TTTATTATCA 720
277 GGAAGACGCT ATTGAATTTG TGAGAGGCTG TAAATCCAAT TGGTTACCTC AAAGACCCAC 780
278 GAAAAAGCTA TAGTGCAACC CTTGCGAAAA TCAAAACCTA TCTTAAAAAA AAAAAAAAAA 840
279 TATAAATAAT AAATTAATAA GCGAAAATTA AAACGTATTA AAAGTAAGAA TAATAAATAA 900
280 ATAAGTGAAA ATTCTATATG ATAAAAATTA AAAATAAGAA TAATAAATAA AAAGACAACA 960
281 TTTTAAATTA AACAATATTA AAAAAATATA AAAATATTAA AAACTATATT AAAAAAAAAA 1020
282 AAAAAACAAA AAAACAAAAA AAAAAAAATA AATAAATAAT CCAAAAATCA AAAATGGCTC 1080
283 AAGAACCAGC AATTGTGCCA CCACTATCAG ACAGCAACAT GACCCAGGTT GCCTACCAGA 1140
284 TTGGCAATGT GGAGAAATTC AACGGTGATC CAGGCTCACT ATACACCTTT GTGAGTCGAA 1200
285 TTGATTACAT ACTGGCTCTT TATGCTACCG GAGATGAACG CCAACAGCAG ATCATATTTG 1260
286 GGCATATTGA ACGCAGCATC AGCGGAGAAG TTATGCGCTG CATTGGAGCC TATGACATGT 1320
287 ACACCTGGCA GCAGCTTAGA AGACAATTGG TACTCAACTA TAAACCCCAG ACCCCTAACC 1380
288 ACGTTCTTTT AGAAGAGTTT CGAAAGACCC CATTTCGAGG CAATGTACGA GCATTCCTGG 1440
289 AAGAAGCAGA AAGCCGCAGA CAAACACTTA CTAGTAAGCT TGAATTAGAG CAAGATCTTG 1500
290 AAGAAAAGAC TTTTTATTTG AAATTAATAA AATCCAGTAT AGAATCACTA ATTGAAAAAT 1560
291 TACCTACACA CATTTATTTA AGAATAAATA ACCACAACAT ACCAGATTTG CGATCACTTA 1620
292 TAAACCTTTT ACAAGAGAAG GGCATGTACG AACAAATAAA TCATACAAGT ACACATGTCC 1680
293 AAAAACAAAA TTTCTCTGAT AAGCCACAAA AGTCCTTTAA TCAAAATACT AATCAGTCTA 1740
294 ACAATATCAG AAAATATCCA ACACCTTTCC TACATTATAA TTCACCAATA CCATATCAAG 1800
295 CTCCACAAAT TTATCAAACA CCACCAACTA ATAACCCACT TTATCGTCAT CCAATACCCT 1860
296 ACCACCCTAA TCCAAACAAT GTTTTTCAAC CAAGCCAACA AAACAATGTT TTCCAACCAA 1920
297 GCCAACAAAA CAATGCTTTT CAACCAAATC AACGAACAAA CTTTACATCT CGACCAATTT 1980
298 TTAACACCAA TCGAAACAAT GCATTCGATC AGAATAGGTT CGGACAACAA CCCCAATATC 2040
299 AAAATCAACA ATCAACACAA AATTCAAGTT CCTATGTACC CAATCGACCA ATAAAACGAT 2100
300 TAAGACCAGC TAATAGTGGA CAGACTGGGA TGAGTGTTGA CGAAACATTA TATCAAGAGG 2160
301 ACGCTTTTTA TCAGCAGTGT GTTCCATATG ACTATTTTTA TTATCCAACT TACGACCATT 2220
302 CAGACTATTA TCCAGAAAAT CAATATCAAA TTGACGAAAA CAACCAAAAT TTACAAAGAA 2280
303 CACAACAGTT ACAGCAGATT AATACAGACG AGACAAACAA TGACAACCAA GAACCCAATG 2340
304 TTGAACAGGC CGAAAATTTT CAGCCACAAG CCTTGGAAAA CCCCAATATA TAACAATTAA 2400
305 ATACAAAGAA AATAATTTGA AATGCCTTAT TGATACCGGA TCAACAGTTA ACATGACATC 2460
306 TAAAAATATA TTTGATTTAC CAATCCAGAA TACTAGTACT TTTATTCATA CCAGCAATGG 2520
307 ACCGCTCATT GTCAACAAAA GTATAATCAT ACCTTCAAAG ATTTTGTTCC CAACAACAAA 2580
308 TGAATTTTTA TTGCACCCTT TCTCTGAGAA TTACGATCTT TTATTAGGAA GAAAACTTTT 2640
309 AGCAGAAGCA AAAGCAACAA TAAGTTACCG CGATCAAGAG GTAACTCTTT ACAACAACAA 2700
310 ATACAAATTA ATAGAAGGAA TAGCAACACA TGAACAGAGT CATTTTCAAA ATGTAAATAT 2760
311 GATACCTGAC ACCATGCTCA GACAGCCAAA TAAAATTTCA CCCATTTTAG AATCAGACCT 2820
312 ATACAGATTG GAACATTTAA ATAACGAAGA AAAACAAAGA TTGTGCGCAC TCCTGCAGAA 2880
313 ATACCATGAC ATACAGTACC ATGAAGGTGA TAAGTTGACA TTTACTAATC AAACCAAACA 2940
314 TACTATCAAT ACAAAGCACA ATCTACCACT TTACTCTAAA TACAGTTACC CACAGGCTTA 3000
315 TGAACAGGAG GTCGAAAGCC AAATACAAGA TATGCTAAAT CAAGGTATTA TACGTACCAG 3060
316 TAATTCACCT TACAATAGCC CCATCTGGGT GGTTCCAAAG AAACAAGATG CATCAGGCAA 3120
317 ACAGAAATTT AGAATTGTAA TAGACTACCG AAAATTAAAT GAAATAACAG TAGGAGACAG 3180
318 ACACCCAATC CCAAACATGG ACGAAATCTT GGGAAAATTG GGCAGATGTA ATTACTTCAC 3240
319 AACTATAGAC TTGGCAAAGG GTTTCCACCA GATCGAAATG GATCCAGAAT CAGTTTCAAA 3300
320 GACAGCCTTT TCTACCAAGC ACGGTCATTA TGAATATTTG CGCATGCCAT TCGGATTAAA 3360
321 AAACGCGCCA GCCACCTTTC AACGGTGCAT GAATGATATT TTAAGACCAC TCTTAAACAA 3420
322 ACACTGTCTT GTGTATTTGG ACGACATAAT TGTATTCTCG ACATCCCTTG ATGAACACCT 3480
323 GCAATCGCTC GGACTAGTTT TCGAAAAATT AGCAAAAGCC AACCTTAAAT TACAACTTGA 3540
324 CAAATGTGAG TTTCTCAAGC AAGAAACCAC ATTTTTAGGA CATGTTCTAA CACCAGATGG 3600
325 AATAAAACCA AACCCTGAAA AAATTGAAGC CATTCAAAAA TATCCAATTC CCACTAAACC 3660
326 AAAAGAAATA AAAGCTTTTC TTGGACTGAC AGGATATTAT CGTAAATTTA TTCCAAACTT 3720
327 TGCAGACATA GCCAAACCCA TGACTAAGTG TTTAAAAAAG AACATGAAAA TTGACACTAC 3780
328 CAACCCAGAA TATGACTCTG CATTTAAAAA ATTAAAATAT CTAATATCAG AAGACCCAAT 3840
329 TCTTAAAGTA CCCGACTTTA CAAAGAAATT CACTTTAACC ACAGACGCAA GTGATGTCGC 3900
330 TTTGGGGGCA GTACTGTCAC AAGATGGACA CCCACTTAGC TACATTAGCC GAACACTTAA 3960
331 TGAACACGAA ATAAATTACA GCACAATTGA AAAAGAACTC TTAGCAATTG TATGGGCGAC 4020
332 AAAGACTTTT CGACACTACC TACTTGGAAG ACACTTTGAA ATATCCAGTG ACCATCAACC 4080
333 ATTGAGCTGG TTGTACCGTA TGAAAGACCC AAATTCAAAA CTGACCCGAT GGAGAGTAAA 4140
334 ATTATCCGAA TTCGATTTTG ATATAAAATA TATAAAAGGA AAAGAAAATT GCGTGGCGGA 4200
335 TGCTCTGTCC AGAATAAAAC TTGAGGAGAC ATATTTGAGC GAACAAACCC AACATAGTGC 4260
336 AGAAGAGGAC AATAGTGATT TAATTTTTAT TACAGAAAGA CCTCTAAATA CATTTAACAG 4320
337 ACAAGTTATA TTTTCAAAAG GACCACCAGA CATTAAAGTT ACGAAATATT TCAAAAAACA 4380
338 CATCACCCAA ATATTTTACG ACATTATGAC CAGGGAAAAA GCCGAACAAT ATTTGATAGA 4440
339 CCATTTTTGT GGTAAGAAAA GTGCGTTGTA TATTGAGAGT GACGCTGATT TCGAAGTCAT 4500
340 TCAAGCCGCA CATAAATTAG CCATAAACAC CAAATATACA AAAATCCTGC GTAGCACGAT 4560
341 TTTGTTAAAA AACATAACCA CTTATGCGGA ATTTAAGGAA TTGATCTTGA CTGCTCATGA 4620
342 AAAACTTCTA CACCCAGGCA TACAGAAAAC TACTAAACTT TTCGGAGAAA CTTACTATTT 4680
343 CCCTAATAGC CAGCTACTTA TTCAGAATAT AATAAATGAG TGCAGTATTT GCAATCTGGC 4740
344 AAAAACAGAG CACCGAAATA CAGACATGCC AACGAAAACC ACACCCAAAC CAGAACATTG 4800
345 CCGCGAAAAA TTCATGATAG ACATTTACTC ATCCGAAGGC AAACATTACG TTAGTTGCAT 4860
346 AGACATTTAT TCGAAATTTG CCACATTAGA AGAAATAAAA ACAAAAGACT GGATAGAATG 4920
347 CAAAAACGCG CTTATGCGCA TATTCAACCA GCTTGGCAAG CCAAAGTTAC TAAAGGCGGA 4980
348 CAGAGACGGC GCATTTTCCA GTTTAGCCCT CAAGAGATGG CTGGAGAGTG AGGAAGTCGA 5040
349 ATTGCAGCTT AACACAACAA AAACTGGTGT GGCGGACATA GAAAGACTAC ATAAAACAAT 5100
350 TAATGAAAAG ATTCGCATAA TCAAAACATC CGATGACGAA GAAACCAAAT TGAGCAAAAT 5160
351 GGAAACAGTA CTTAACATAT ACAATCATAA AACCAAACAC GACACCACTG GACAGACCCC 5220
352 TGCACACATA TTTCTCTACG CTGGACAACC AATATTAGAT ACCCAACAAA ACAAAGAAAA 5280
353 CAAAATAAAC AAAATAAATA ATGACAGAGT GGAGTACGAA GTCGACACAA GATACAGAAA 5340
354 AGGTCCACTA CAGAAAGGCA AATTAGAAAA TCCTTTTAAG CCAACAAAAA ATGTGGAGCA 5400
355 GACTGACTCT GATCATTATA AAATTACTAA TAGAAATAGA ATTACTCACT ACTACAAAAC 5460
356 ACAATTCAAA AAACGAAAGA AAAATAATCA GCTCTCAATT TCACAGGCAC CTGGCACTTG 5520
357 ATAACATTGC TGCTGATGCT GATCACAACA GTTCATGGAC AACAAATTGA AATTAATAAT 5580
358 ATTGACACAA ACCACGGATA TCTCCTTTTT TCTGATAAAC CAGTCCAGAT ACCATCATCC 5640
359 TTTGAACATC ATTGCTTGAG AATCAATTTA ACTGAAATAG ACACCATAGC TGATTATTTT 5700
360 GAGCAAAGAC TACGTACCGA CTACCATGCA CCCCAGGTCA AATTTTTATA CAACAAAATG 5760
361 AGAAGAGAAC TAGCTGGAAT AGCCTTGCGA CATAGAAATA AACGGGGACT TATTAACATT 5820
362 GTAGGTTCAG TTTTTAAATA CCTATTTGGC ACACTTGACG AAAATGATCG AGTGGATATA 5880
363 CAGAGGAAAC TTGAAACAAA CGCCCATAAC TCGGTAAATT TACATGAACT CAATGACGCT 5940
364 ATTCAATTAA TAAATGACGG AATGCAAAAG ATACAGAATT ATGAAAACAA CAGCAACATC 6000
365 ATTAACAGTC TTTTATATGA ACTCATGCAG TTTACAGAAT ACATAGAAGA TGTGGAAATG 6060
366 GGAATGCAGC TTTCCAGACT CGGTCTATTT AATCCCAAAC TACTAAACTA CGATAAACTT 6120
367 GAGAATGTAA ACAGCCAAAA TATTTTAAAC ATTAAAACAT CCACTTGGAT TAATTACAAT 6180
368 GATAACCAAT TATTAATCAT ATCTCACATA CCTATTAACT TTTCATTAAT AAATACAGTA 6240
369 AAAATAATCC CTTACCCAGA CTCGAACGGC TATCAGCTAG AATACACAGA CACACAATCA 6300
370 TATTTTGAAA GAGAAAATAA AGTTTACAAT AACGAAAATA AAGAAATAAA CAATGAGTGT 6360
371 GTCACCAACA TTATTAAACA TTTAAAACCA ATTTGTAATT TTGAGTCAAT CCACACAGAT 6420
372 GAAATAATAA AATACATAGA ACCAAACACA ATTGTAACCT GGAATTTAAC CCAAACAAGT 6480
373 CTCAAACAAA ATTGTCAAAA TTCATTTAAT AATATAAAAA TAAAAGGAAA CAAAATGATA 6540
374 AAAGTAACCC AATGTAAAAT AGAAATCAAT AGCATAATTC TAAGTGAAAA TCTCTTTAAA 6600
375 CCAGAAATAG ATTTGACACC ATTATACACA CCACTTAACA TAACAAAAAT AAAAACTGTT 6660
376 AAACACAACG ACATTAATGA AATGATTTCA CAAAACAATA TTACACTTTA CATATTTATG 6720
377 ACTACTGTCA TCATTATACT TATTTTATTG TACTTATATT TAAGATACGT ATCATTTAAC 6780
378 CCATTCATGA TGCTGTATGC AAAACTAAAA TTAAGAAAAA ATCAAAATCA AAACACAGCA 6840
379 CAACAAATAG AAATGGAAGA CGTTCCATTA CCCCTACTAT ATCCATCAAT CCCAGCCCAA 6900
380 GTATAGGCTT CTCTTTAAGG GAAGGGAAGT GACATATTCA CATACAAAAC CACATAACGT 6960
381 AGAGTAAACA TATTGAAAAG CCGCATACGT CAACAATAAG TGACCACCAT GCTAATGTGG 7020
382 ATCAAATAAC AAAAATATCC ACTCTGCATT TTGACACCCC CATACTGTAT GCCATCTGCG 7080
383 CAGTATGCAT TCTAATAAAC AAATTCTTTG ACAGCGGCAC TTAGCCATTC TTGTAAACAA 7140
384 ATCTTAAAGT CTGCCTGCTC TCTCTGAGGC TTCTCCTCCA CTTAAGAATC CAAGAGCAAT 7200
385 GCTCTCCCAA AAACACTAAC ATATTCTTTA AGCAAGCACA GAGGCTTCTC CTCATTTTCA 7260
386 CTTTCATTTG ATTTTCAGTC TTAAGCTGAA CGTTAATCAA TAAACAACAC AATCGATACC 7320
387 GAAATTTTGA TTCGTTTTAT TTTGGCAAAA CTCAATTTTC AGCGTTGGTC TTAGTTCATA 7380
388 TTCGGAACGG TCCATTTAAT AGACTCAAAA CTATTTATTG CAACCATTTA TTTGCAATT 7439
389 //
390 ID DMTN1731 standard; DNA; INV; 4648 BP.
391 XX
392 AC X07656;
393 XX
394 DR FLYBASE; FBte0000003; Dmel\1731.
395 XX
396 FT source X07656:1..4648
397 FT SO_feature five_prime_LTR ; SO:0000425:1..336
398 FT SO_feature three_prime_LTR ; SO:0000426:4313..4648
399 FT SO_feature TATA_box ; SO:0000174:110..116
400 FT SO_feature primer_binding_site ; SO:0005850:342..352
401 FT SO_feature CDS ; SO:0000316:431..1252
402 FT /name="Dmel\1731\gag"
403 FT /db_xref="FLYBASE:FBgn0020768"
404 FT /db_xref="REMTREMBL:CAA30502"
405 FT /db_xref="NCBI_PROTEIN:CAA30502.1"
406 FT /translation="MSNLYQIDKLEDGSYETWSIQMRSVLVHACLWKVVSGESVKPEVD
407 FT TGGAWQSQDEKALATIILSVKSSQLGYVKGCLTAAEAWKVLQDVHQPKGPLRTVMLYKK
408 FT LLSKRLLEGQSISSHIKEFKEIFDALDAVEIGITEKLRSVVLLSSLPESFENFVVAIET
409 FT RDDVPLFDALCIKLIEEDTRRGGAEQQREKQTESAKAFTAVHKPQAPAREARPSAKKRK
410 FT DVVCYNCGERRHFKANCRREKVNKESATQEQCSLLNALDSGGFWQNTVVSR"
411 FT SO_feature CDS ; SO:0000316:1203..4151
412 FT /name="Dmel\1731\RTase"
413 FT /db_xref="FLYBASE:FBgn0012032"
414 FT /db_xref="REMTREMBL:CAA30503"
415 FT /db_xref="NCBI_PROTEIN:CAA30503.1"
416 FT /translation="MRWIVVVFGKTQWCLDSGATSHMCCDRSVFTEFEEHTEKISLAGN
417 FT GFLLAKGIGTVKLKTDLCTLVLNNVLFVPDLNGNFMSVSRAAQYKCFVNFGPHYADVIQ
418 FT EGERILRVMRAGNLYMFQGKHNSCFAAVDADGSLWHKRNGHLNTSSLQEMVRKKMVYGV
419 FT EKVVFKPDAVCKTCMLAKIHVQPFPKTTRSRAEELLDMIHSDLCGPFSTPSLAGSKYFL
420 FT TFIDDKSRRIFVYFLRKKDEVFTKFVEFKKLVERQTGRKIKCIRSDNGGEFVNNVFDDY
421 FT LKAHGIARQLTIPHTPQQNGVAERANRTLVEMARCMLLQSELGEALWAEAINTAVYLRN
422 FT RSTSRALQSKTPMEEWTGKIPAVSHLRVFGAIAVALDKGVHKGKFESKGKEYRMIGYSI
423 FT AAKGYRLFDKEKRCVIEKQDVLFDESGSLVNHGNTIEFQFPATDDPEPQSDSNAREGDD
424 FT TEPVGSSDDYESAAEAEEAEVHVGPGRPKIVRTGRPGRPKKQYNVLGVLMASDVEIPKS
425 FT YEEAINSQYSAKWEEAMGLEYKALLANETWKLADLPRNRRCVACKWVYSLKRDVSGRIE
426 FT RFKARLVAKGCSQKFGVDYFETFSPVCRLESVRLILALAAEMQLYLHHMDVCTAYLNSE
427 FT LKDTVYMKQPQGFTDAANPDQVLLLRKAIYGLKQSGREWNSKLDGVLKDLGFKACNHEP
428 FT CLYQQSGQGNLMLILVYVDDLILACQSREDMEDLKAKISESFECTDKGPLHLFLGMEVQ
429 FT RDGDLGEITLGHSQYIKELLRDYGSENCRPATTPLDAGHQVLCAGEQCQKVDAGQYQST
430 FT IGELMWLGLTTRPDMLHSVAKLAQRNQDPHSEHMVAVKHILRYLASTVDVKLHYQKCGQ
431 FT AFTGFVDADWGGDRLDRKSYTGYVFFLSGGPVSWRSEKQQSVALSSTEAEYMALTTACK
432 FT EAIALRRLIVEIVCGDLKTPTVMHGDNLKCAAQLAKNPVHHSRTKHIDIRYH"
433 XX
434 CC Derived from X07656 (g8700) (Rel. 36, Last updated, Version 6).
435 CC Takis Benos and Michael Ashburner, 20-Aug-1997.
436 CC Any changes to original sequence record are annotated in an FT line.
437 XX
438 SQ Sequence 4648 BP; 1316 A; 880 C; 1268 G; 1184 T; 0 other;
439 TGTTGAATAT AGGCAATGCC CACATGTGTG TTGAATATAG GCAATTTCCA CATGTGCATA 60
440 TGTAATTTTG TATGAGAACA TACATACATA CACATGAACT GTATGTATGT ATATATATTA 120
441 GCAAATAAGC AGCCGCATGA AGGTGGCATT TTTATGTGTA TCAGTTTCAG TTTCAAATAA 180
442 AACTTCTTCG TGTTCGGACA CGCGGCTCAA GACTTTTTAT TTCGCGTTTA CTCTTTCAGC 240
443 CTTTGCTCTC AATTCGCTGA GTTTGGGTGA AGATTAGGAT CTTCCCATTA TGATTGTCAG 300
444 TGTTCCACAC TTGGAGCACC TTTTCAATAA ACAACAGGTT AATGGGCCCA GCGCCCTAGG 360
445 AGCTGCCTAA AGGAGAAACG TGTAGTGAAA CTCAGGAGTT AGATTTTGGA GTCTACTCAA 420
446 GATTGCCGGA ATGAGTAACC TGTATCAGAT CGATAAGCTG GAGGATGGAT CCTATGAAAC 480
447 GTGGAGCATC CAGATGCGTT CAGTGTTGGT GCACGCATGT TTGTGGAAGG TGGTTTCAGG 540
448 AGAGTCCGTG AAACCTGAGG TTGATACTGG AGGTGCTTGG CAATCCCAAG ATGAAAAAGC 600
449 ATTGGCCACG ATCATCTTGA GTGTGAAGTC TTCGCAACTT GGTTATGTAA AAGGGTGTCT 660
450 CACTGCGGCT GAGGCATGGA AAGTTTTACA GGATGTCCAC CAGCCGAAAG GGCCGTTACG 720
451 AACGGTCATG CTGTATAAGA AGTTGCTGAG CAAACGTCTG TTGGAAGGGC AGAGTATATC 780
452 GTCACATATT AAAGAATTTA AGGAAATCTT TGATGCCCTT GATGCGGTGG AAATTGGTAT 840
453 CACCGAGAAA TTGCGCAGTG TTGTTTTGCT GTCGAGCCTT CCAGAGAGTT TCGAGAATTT 900
454 CGTTGTCGCC ATTGAGACGC GCGACGACGT GCCGCTTTTC GATGCTCTAT GTATAAAGCT 960
455 GATCGAGGAA GACACGAGAA GGGGAGGAGC GGAGCAGCAG AGAGAAAAAC AAACGGAGAG 1020
456 CGCAAAGGCA TTTACTGCAG TACATAAGCC ACAGGCGCCG GCGAGAGAAG CTCGGCCGAG 1080
457 CGCAAAGAAG AGGAAAGACG TAGTTTGTTA TAACTGTGGA GAGCGTAGGC ATTTTAAAGC 1140
458 GAACTGTCGT CGCGAGAAAG TAAACAAAGA GAGCGCGACA CAAGAACAAT GCAGTTTGTT 1200
459 AAATGCGCTG GATAGTGGTG GTTTTTGGCA AAACACAGTG GTGTCTCGAT AGCGGGGCTA 1260
460 CCAGTCACAT GTGCTGTGAC AGAAGTGTTT TTACTGAGTT TGAAGAGCAC ACTGAAAAAA 1320
461 TTAGTCTTGC TGGAAATGGA TTCCTACTAG CAAAGGGCAT AGGAACAGTG AAGCTGAAGA 1380
462 CTGATTTATG TACTCTGGTA TTGAATAACG TACTCTTCGT CCCAGATTTG AACGGCAACT 1440
463 TTATGTCAGT CAGCCGTGCA GCTCAGTATA AATGTTTTGT CAATTTTGGA CCACATTACG 1500
464 CTGACGTCAT TCAGGAAGGC GAGCGAATAC TGCGTGTAAT GAGAGCTGGT AATTTATATA 1560
465 TGTTTCAAGG GAAACATAAC AGTTGTTTTG CGGCCGTTGA TGCTGATGGT TCACTATGGC 1620
466 ATAAAAGGAA TGGCCATTTG AATACAAGCA GCCTACAGGA GATGGTGAGG AAGAAGATGG 1680
467 TGTACGGTGT TGAAAAGGTC GTTTTCAAAC CAGACGCAGT ATGCAAGACG TGCATGCTGG 1740
468 CAAAAATCCA TGTGCAACCA TTTCCGAAGA CAACGAGGAG CAGAGCTGAG GAGCTGTTGG 1800
469 ATATGATCCA TTCAGACCTG TGCGGGCCAT TTAGCACACC GTCACTTGCT GGATCAAAGT 1860
470 ACTTTCTCAC TTTCATAGAC GACAAGTCCA GGCGGATTTT TGTATATTTC TTGCGGAAGA 1920
471 AGGACGAAGT CTTCACTAAG TTTGTCGAGT TTAAGAAACT GGTCGAGCGA CAAACAGGTA 1980
472 GAAAGATAAA ATGTATCCGG AGCGATAATG GTGGTGAGTT CGTCAATAAT GTTTTTGATG 2040
473 ACTATTTAAA GGCACATGGG ATCGCTAGAC AGCTGACTAT TCCACACACT CCCCAACAAA 2100
474 ATGGAGTTGC AGAACGAGCC AACCGCACGC TAGTAGAAAT GGCTAGGTGC ATGTTGCTGC 2160
475 AATCGGAGTT GGGTGAGGCT CTATGGGCTG AGGCGATAAA CACTGCGGTG TATCTGAGGA 2220
476 ACCGATCAAC GAGCAGAGCA TTACAAAGCA AAACCCCTAT GGAAGAGTGG ACCGGAAAAA 2280
477 TACCAGCAGT GAGCCACTTG AGGGTTTTTG GTGCCATAGC AGTGGCATTG GACAAAGGAG 2340
478 TCCATAAAGG CAAATTCGAA TCCAAAGGAA AGGAATATCG TATGATTGGA TATTCAATAG 2400
479 CTGCTAAGGG GTACCGTCTG TTTGACAAAG AGAAGCGGTG TGTGATCGAG AAGCAAGATG 2460
480 TCCTTTTTGA TGAGTCTGGT AGTTTGGTAA ATCATGGAAA TACCATTGAG TTCCAGTTTC 2520
481 CCGCAACTGA TGACCCGGAG CCGCAGAGTG ATTCGAATGC ACGGGAAGGT GACGATACAG 2580
482 AACCCGTGGG CAGCAGCGAC GACTATGAGA GTGCAGCTGA GGCAGAAGAA GCTGAAGTAC 2640
483 ATGTGGGGCC TGGACGGCCA AAGATTGTTC GGACGGGCAG ACCAGGGCGC CCGAAGAAGC 2700
484 AATACAATGT ACTTGGCGTG TTGATGGCTA GCGACGTCGA AATTCCCAAG TCCTATGAGG 2760
485 AGGCCATCAA TTCGCAGTAT TCTGCAAAGT GGGAAGAGGC AATGGGCCTG GAGTACAAGG 2820
486 CGCTACTTGC AAATGAGACA TGGAAGCTGG CTGACTTACC AAGAAATCGC CGGTGTGTGG 2880
487 CTTGCAAGTG GGTGTATTCC CTGAAACGAG ACGTCTCTGG TAGAATTGAG CGCTTCAAGG 2940
488 CACGACTAGT AGCAAAGGGG TGTTCGCAGA AGTTCGGAGT GGACTACTTC GAGACTTTTT 3000
489 CACCCGTGTG CAGGCTCGAG AGTGTGAGGC TCATTTTGGC ATTGGCAGCA GAGATGCAAT 3060
490 TGTACTTGCA TCACATGGAC GTATGCACGG CGTACTTAAA TAGCGAGCTA AAGGATACTG 3120
491 TGTACATGAA GCAGCCCCAA GGGTTCACAG ATGCTGCTAA TCCCGACCAG GTGTTATTGC 3180
492 TGAGGAAGGC AATATACGGC TTGAAGCAGT CAGGCAGAGA GTGGAACTCC AAGCTCGACG 3240
493 GTGTTCTAAA AGACTTGGGA TTTAAGGCCT GTAATCATGA ACCATGTCTT TATCAGCAAA 3300
494 GTGGTCAAGG TAATCTGATG CTCATCTTAG TATATGTTGA TGATTTAATT CTAGCGTGCC 3360
495 AGTCAAGAGA AGATATGGAG GATCTGAAAG CCAAGATTTC AGAGTCTTTC GAGTGCACGG 3420
496 ACAAGGGTCC ACTGCATTTG TTCTTAGGCA TGGAGGTGCA ACGAGATGGC GACCTTGGAG 3480
497 AAATCACTTT GGGCCATTCG CAATATATCA AGGAACTATT GCGGGATTAT GGCAGCGAGA 3540
498 ACTGTAGACC AGCGACGACA CCTTTGGATG CAGGGCATCA AGTTTTGTGC GCGGGTGAGC 3600
499 AGTGCCAGAA GGTCGACGCA GGGCAGTATC AGTCTACAAT TGGTGAGCTA ATGTGGCTTG 3660
500 GGCTTACTAC CAGACCAGAC ATGCTACATT CGGTGGCGAA GTTGGCTCAG AGGAATCAGG 3720
501 ACCCGCATTC TGAGCACATG GTGGCTGTGA AGCACATCCT CCGGTACTTG GCGTCAACTG 3780
502 TGGACGTCAA GCTGCATTAT CAAAAGTGCG GTCAGGCATT TACCGGCTTT GTGGATGCAG 3840
503 ATTGGGGAGG CGACCGTTTG GACCGAAAGT CATACACAGG GTATGTGTTT TTCCTGTCTG 3900
504 GCGGACCAGT ATCATGGAGG TCCGAGAAGC AGCAGAGCGT GGCGTTGAGC AGTACTGAAG 3960
505 CCGAGTATAT GGCTCTGACC ACGGCTTGCA AGGAAGCTAT AGCTTTACGA AGGCTAATAG 4020
506 TGGAGATCGT ATGCGGTGAT CTGAAGACCC CGACGGTTAT GCATGGCGAC AACCTGAAGT 4080
507 GCGCAGCACA GTTAGCGAAG AACCCGGTTC ATCACTCTAG GACGAAGCAC ATCGACATTC 4140
508 GATATCATTA GAGAAGTCAT GAAAGAGGGT CACGTTGTGT TAGAGTACAC TTCTACGAAT 4200
509 GAGATGATAG CAGACATTAT GACAAAGAAT CTTTCAAAGG GAAAGCATAA TGGGTTTATG 4260
510 AAAATGTTAA ATTTGTTTTA ATTTTTGTAA ACATGTTGGC ATTGAGGAAG GCTGTTGAAT 4320
511 ATAGGCAATG CCCACATGTG TGTTGAATAT AGGCAATTTC CACATGTGCA TATGTAATTT 4380
512 TGTATGAGAA CATACATACA TACACATGAA CTATATGTAT GTATATATAT TAGTAAATAA 4440
513 GCAGCCGCAT GAAGCTGGCA TTTTTATGTG TATCAGTTTC AGTTTCAAAT AAAACTTCTT 4500
514 CGTGTTCGGA CGCTCGGCTC AAGACTTTTT ATTTCGCGTT TACTCATTCG GCCTTTGCTC 4560
515 TCAATGCGCT GAGTTTGGGT GAAGATTAGG ATCTTCCCAT TATGGTTGTC AGTGTTCCAC 4620
516 ACTGGGAGCA CCTTTTCAAC AAACCACA 4648
517 //
518 ID DMIS297 standard; DNA; INV; 6995 BP.
519 XX
520 AC X03431;
521 XX
522 DR FLYBASE; FBte0000675; Dmel\297.
523 XX
524 FT source X03431:1..6995
525 FT SO_feature five_prime_LTR ; SO:0000425:1..414
526 FT SO_feature three_prime_LTR ; SO:0000426:6582..6995
527 FT SO_feature TATA_box ; SO:0000174:276..282
528 FT SO_feature TATA_box ; SO:0000174:6857..6863
529 FT SO_feature polyA_signal_sequence ; SO:0000551:304..309
530 FT SO_feature polyA_signal_sequence ; SO:0000551:6885..6890
531 FT SO_feature primer_binding_site ; SO:0005850:414..431
532 FT SO_feature RR_tract ; SO:0000435:6571..6581
533 FT SO_feature CDS ; SO:0000316:803..2047
534 FT SO_feature start_codon ; SO:0000318:1..3
535 FT /name="Dmel\297\gag"
536 FT /db_xref="FLYBASE:FBgn0044338"
537 FT /db_xref="SWISS-PROT:P20828"
538 FT /db_xref="NCBI_PROTEIN:CAA27159.1"
539 FT /translation="MSQPIIALSDINLAEARRQLKDIMPFKGDPETLHTFISRVDYVIS
540 FT LYQTNDVRQQRILLGAIERNLDGQITRSLGLPNVEDWPTLKARLIAEFKIQTPNYKLLE
541 FT NFRETPYRGSLRAFCEEAERRRQLLISKLHLEGNQSDFLIYIQGIKESIKILIRKLPIQ
542 FT LFTILAHHDITDLRSLITIAQNEGIYEEHINFEFYEKPEYRNKNSNSNQNSKTQKFNTN
543 FT VQTQNRPSYSQYSQPFQPNFNQYIQPFRPSYTQQITNNPPMWHAPNYFRPNQYINPQPI
544 FT IQKNHFQQYPNKAQFPQTTHFRGNTYPRLQQPSTYKNTNFPITKRLRPSDSEQTKMSID
545 FT EIRFQDAHEFEQVQPNYYEQQYFNQNQYNPYQNHSFINEGQQQVQFVQINNKQNQNNSE
546 FT LNENFRLTVPENTNT"
547 FT SO_feature CDS ; SO:0000316:<1999..5178
548 FT /name="Dmel\297\pol"
549 FT /db_xref="FLYBASE:FBgn0027622"
550 FT /db_xref="SWISS-PROT:P20825"
551 FT /db_xref="NCBI_PROTEIN:CAB57796.1"
552 FT /translation="TKRKFSVNSSGKYEYIKIVYKGRSYKCLLDTGSTINMINENIFCL
553 FT PIQNSRCEVLTSNGPITLNDLIMLPRNSIFKKTEPFYVHRFSNNYDMLIGRKLLKNAQS
554 FT VINYKNDTVTLFDQTYKLITSESERNQNLYIQRTPESIASSDQESIKKLDFSQFRLDHL
555 FT NQEETFKLKGLLNKFRNLEYKEGEKLTFTNTIKHVLNTTHNSPIYSKQYPLAQTHEIEV
556 FT ENQVQEMLNQGLIRESNSPYNSPTWVVPKKPDASGANKYRVVIDYRKLNEITIPDRYPI
557 FT PNMDEILGKLGKCQYFTTIDLAKGFHQIEMDEESISKTAFSTKSGHYEYLRMPFGLRNA
558 FT PATFQRCMNNILRPLLNKHCLVYLDDIIIFSTSLTEHLNSIQLVFTKLADANLKLQLDK
559 FT CEFLKKEANFLGHIVTPDGIKPNPIKVKAIVSYPIPTKDKEIRAFLGLTGYYRKFIPNY
560 FT ADIAKPMTSCLKKRTKIDTQKLEYIEAFEKLKALIIRDPILQLPDFEKKFVLTTDASNL
561 FT ALGAVLSQNGHPISFISRTLNDHELNYSAIEKELLAIVWATKTFRHYLLGRQFLIASDH
562 FT QPLRWLHNLKEPGAKLERWRVRLSEYQFKIDYIKGKENSVADALSRIKIEENHHSEATQ
563 FT HSAEEDNSNLIHLTEKPINYFKKQIIFIKSDKNKVEHSKIFGNSITTIQYDVMTLEKAK
564 FT QILLDHFIHRNITIYIESDVDFEIVQRAHIEIVNTTYTKVIRSLFLLKNVGSYAEFKEI
565 FT ILQSHEKLLHPGIQKMTKLFKENHFFPNSQLLIQNIINECNICNLAKTEHRNTKMPLKI
566 FT TPNPEHCREKFVVDIYSSEGKHYISCIDIYSKFATLEQIKTKDWIECRNALMRIFNQLG
567 FT KPKLLKADRDGAFSSLALKRWLEEEEVELQLNTAKNGVADVERLHKTINEKIRIINSSD
568 FT DEEVKLSKIETILYTYNQKIKHDTTGQRPAQIFLYAGHPILDTQKIKEKKIEKINEDRR
569 FT EFNIDTNYRKGPLQKGKLENPFKPTKNVEQTDPDHYKITNRNRVTHYYKTQFKKQKKNN
570 FT KLSISQAPGTR"
571 FT SO_feature CDS ; SO:0000316:5145..6560
572 FT SO_feature start_codon ; SO:0000318:1..3
573 FT /name="297\env"
574 FT /db_xref="FLYBASE:FBgn0027623"
575 FT /db_xref="SWISS-PROT:P20829"
576 FT /db_xref="NCBI_PROTEIN:CAB57797.1"
577 FT /translation="TLNFTGTWYPITLLFILITAVHGQQIQINNIDTNHGYLLFSDKPV
578 FT QIPSSFEHHSLKINLTEIDIVVDYFEQRLRTDYHAPQINFLYNKIKRELARITLKHRNK
579 FT RGFINIVGSGFKYLFGTLDENDRVEIQKKLEINVHNSVKLHELNDAIRLINDGMQKIQN
580 FT YENNHTIIDSLLFELMQFTEYIEDLEMAMQLSRLGLFNPKLLNYDKLENVNSQNILNIK
581 FT TSTWINYNDNQVLIISHIPIYLSLISTIKIIPYPDSNGYQLDYTDTQSYFEKENKVYNT
582 FT ENKEVKNECVTNIIKHLNPICNFKPVHTNEIIKYIEPNTIVTWNLTQTILNQNCQNSIN
583 FT KIKIEGNKMIRVTQCKIEINNINFSETLLEPEIDLTPLYTPLNITKIKIVKHNDIIEMI
584 FT SENNITLYIQMIIVIIALILLYSYLRYVSFKPFMMLYAKLKIRKNQNQNTPQQTEIEEI
585 FT PFPTLYPSIPAQV"
586 XX
587 CC Derived from X03431 (g8146) (Rel. 36, Last updated, Version 2).
588 CC Takis Benos and Michael Ashburner, 20-Aug-1997.
589 CC Any changes to original sequence record are annotated in an FT line.
590 XX
591 SQ Sequence 6995 BP; 2811 A; 1356 C; 972 G; 1856 T; 0 other;
592 AGTGACGTAT TTGGGTGGTC CAAACCAGCC ACTTCCATTA TTTCAAAGAA ATCAGTAATG 60
593 CACTCTAGTA ATTTTCCATA ACTGTATCCC AGCTGCGCAG ACTCGTTTAT CTTTTGCAGC 120
594 GCAGCGTTCT TTGTAAACAT CCTAAAGACC TGCCTAAGCA GATTTGACTG CCCTCTTTCA 180
595 ACGCTACCTA ATCTTAAGAA CCCAAGAGCG AGGCTCTCCC GAAATACAAA TATTGTTCAA 240
596 ATACTGAGGC TTCTCCTCAA TCCAATTTGC ATTTGATTTT TAGTCTTAAG CTGAGATCCA 300
597 AAGAATAAAG TCGTGAAACT ATTTCTCCTA AAAACTATTT TTTATTTCTT GGCGTTGTCC 360
598 TTAGTCAACT GACGGGACAT TAGTTCGACT CATAAATAAA ACAACAATTT TACTGGCGCA 420
599 GTCGGTAGGA TACAAAAGTA TCCGAAAAAA AAGAACCTTC GAATGGAAAA TAAGTTAAAT 480
600 TTTATAGTCC TGTGCTCGAA ACATCTCCCA AAATAAATTC GTGAAAACTC TTCAACTTCA 540
601 ATTATAATTC CAATTCGGTT ATCCAATAAT AAGTGGAAGT GAAATACGAA ACAAAAATAT 600
602 TAAGTCCAAA GGCAACTAAG TTTTAAAACC AACATATAAA AATAAAAAAT TAAAACAATA 660
603 TAGAATTTTA ATAATACAAC ACAAAAATTT ACAAAACAAA AAAACAAACA AGTGAAACTA 720
604 GAAAGCTTAA AAATAATAAT AACATTGAAT CCGAAACAAA ACAAAAAAAT AAAACACAAA 780
605 AGTTAAAAAT TTTACAATAA AAATGTCACA ACCAATTATT GCGCTGAGCG ACATAAACCT 840
606 TGCCGAAGCC CGTCGGCAGC TTAAAGACAT TATGCCATTC AAGGGTGATC CAGAAACCCT 900
607 TCACACCTTT ATCAGCAGAG TGGATTACGT AATTTCGCTC TACCAAACAA ATGATGTCCG 960
608 ACAACAGAGG ATTCTACTGG GAGCCATCGA AAGGAACTTG GACGGACAAA TTACACGATC 1020
609 TTTGGGACTT CCGAACGTCG AAGATTGGCC TACCCTTAAA GCAAGACTCA TCGCGGAATT 1080
610 TAAAATTCAA ACACCAAACT ACAAACTTCT GGAGAACTTC AGGGAGACAC CATACAGAGG 1140
611 AAGCCTAAGA GCATTCTGCG AAGAAGCGGA GAGACGACGT CAATTACTAA TTTCGAAACT 1200
612 ACACCTGGAA GGTAACCAAT CGGATTTTCT TATTTATATT CAGGGTATTA AAGAATCTAT 1260
613 TAAGATACTG ATAAGGAAAC TACCAATACA ATTATTCACT ATTTTAGCCC ATCACGATAT 1320
614 TACAGACTTA AGATCCTTAA TTACCATTGC ACAAAATGAG GGAATTTATG AAGAACACAT 1380
615 TAATTTTGAA TTTTATGAAA AACCAGAATA TCGTAATAAA AATTCAAATT CTAACCAGAA 1440
616 TTCGAAAACA CAAAAATTCA ATACAAATGT TCAAACTCAA AATCGACCAA GTTACTCACA 1500
617 ATATTCCCAA CCCTTCCAAC CTAATTTTAA TCAATACATT CAACCATTTA GACCTAGCTA 1560
618 TACACAGCAG ATAACTAACA ACCCACCCAT GTGGCACGCA CCTAATTATT TCAGACCCAA 1620
619 CCAATACATA AACCCACAAC CCATTATTCA AAAAAATCAT TTCCAACAAT ATCCCAACAA 1680
620 AGCCCAATTT CCCCAAACAA CGCATTTTAG AGGAAATACA TACCCTCGAC TACAACAACC 1740
621 CTCTACATAT AAAAATACTA ACTTCCCGAT TACTAAACGA CTAAGACCAT CGGACAGTGA 1800
622 ACAAACTAAA ATGTCTATTG ACGAAATTAG ATTCCAAGAC GCGCATGAAT TCGAACAAGT 1860
623 CCAACCTAAT TATTACGAGC AACAGTATTT TAACCAAAAT CAATACAATC CGTATCAAAA 1920
624 TCATAGCTTC ATTAATGAAG GGCAACAACA AGTTCAATTT GTACAAATTA ATAACAAACA 1980
625 AAACCAAAAT AATTCTGAAC TAAACGAAAA TTTTCGGTTA ACAGTTCCGG AAAATACGAA 2040
626 TACATAAAAA TAGTATACAA AGGGCGTTCA TACAAATGCC TTCTAGACAC AGGATCAACA 2100
627 ATTAATATGA TCAATGAAAA TATATTTTGT CTTCCCATTC AAAATAGTAG ATGTGAAGTT 2160
628 TTAACATCAA ATGGCCCTAT TACCTTGAAC GACTTGATTA TGTTACCCAG AAATAGTATT 2220
629 TTCAAAAAAA CCGAACCATT TTATGTGCAC AGATTTTCTA ATAATTACGA TATGCTAATT 2280
630 GGCAGAAAAT TGTTGAAAAA TGCTCAATCA GTTATTAATT ACAAAAATGA TACAGTTACC 2340
631 CTTTTTGATC AAACATACAA ATTAATTACT TCAGAATCCG AAAGAAACCA AAATTTGTAT 2400
632 ATCCAAAGGA CACCAGAATC AATTGCAAGC TCAGATCAGG AATCAATAAA AAAATTAGAT 2460
633 TTTTCACAGT TTCGATTAGA TCACCTAAAT CAGGAGGAAA CTTTTAAGTT AAAAGGCTTG 2520
634 TTAAATAAAT TTAGAAATCT TGAATATAAG GAGGGAGAGA AATTAACATT TACAAATACA 2580
635 ATTAAACACG TACTAAATAC AACACATAAC TCCCCAATTT ATTCGAAACA ATACCCACTT 2640
636 GCGCAAACAC ACGAAATCGA AGTAGAAAAC CAAGTACAGG AAATGCTGAA TCAGGGATTA 2700
637 ATTAGGGAAA GTAATTCTCC ATACAATAGT CCTACTTGGG TCGTACCAAA GAAACCGGAT 2760
638 GCTTCTGGTG CAAATAAGTA CAGGGTAGTA ATTGATTATA GAAAGCTAAA TGAAATAACC 2820
639 ATACCTGACA GATATCCAAT TCCAAATATG GACGAAATTC TTGGCAAACT GGGTAAATGC 2880
640 CAATATTTTA CAACGATCGA TCTGGCAAAG GGATTTCATC AAATAGAAAT GGACGAAGAA 2940
641 TCAATTTCTA AAACTGCATT CTCCACAAAA AGCGGTCATT ACGAATACCT TCGAATGCCA 3000
642 TTTGGCCTTA GGAATGCACC CGCTACTTTT CAAAGGTGCA TGAATAATAT CCTTCGACCG 3060
643 TTGCTTAACA AACACTGTTT GGTGTATCTG GATGATATTA TAATTTTTTC AACATCCCTT 3120
644 ACAGAACATT TAAATTCAAT ACAATTAGTT TTTACAAAGC TTGCAGATGC AAATTTAAAA 3180
645 TTGCAACTAG ACAAATGTGA GTTCTTAAAA AAGGAAGCTA ACTTTCTTGG TCACATAGTT 3240
646 ACCCCTGATG GTATTAAACC AAATCCTATT AAAGTTAAAG CCATAGTTTC ATACCCAATT 3300
647 CCGACAAAAG ATAAAGAGAT AAGAGCTTTC CTTGGATTAA CAGGTTATTA TCGCAAATTT 3360
648 ATTCCAAATT ACGCAGACAT AGCAAAACCC ATGACCAGCT GCTTAAAAAA AAGGACAAAG 3420
649 ATAGATACAC AAAAACTTGA GTACATAGAG GCATTCGAAA AACTTAAGGC TTTGATAATT 3480
650 CGTGACCCAA TTTTACAATT ACCTGATTTT GAAAAGAAAT TTGTTTTAAC CACAGATGCA 3540
651 AGTAACTTGG CCCTCGGGGC TGTCCTTTCT CAAAACGGTC ATCCTATATC TTTTATTAGT 3600
652 AGAACACTTA ACGATCACGA ATTAAATTAC AGTGCTATCG AAAAAGAATT ACTTGCCATA 3660
653 GTTTGGGCCA CAAAAACTTT TCGACATTAT TTACTAGGAC GACAATTTCT CATTGCCAGT 3720
654 GACCATCAAC CTCTTAGATG GCTTCATAAC TTAAAGGAAC CAGGTGCTAA GTTAGAAAGA 3780
655 TGGAGAGTTA GATTAAGCGA ATACCAATTT AAAATAGATT ATATTAAAGG GAAAGAAAAT 3840
656 TCAGTTGCCG ATGCATTATC AAGAATTAAA ATTGAAGAAA ATCATCATAG TGAAGCTACT 3900
657 CAACATAGTG CAGAAGAGGA CAATAGCAAC CTTATTCATT TAACAGAAAA ACCAATAAAT 3960
658 TATTTCAAAA AACAAATAAT CTTTATTAAA TCCGATAAAA ATAAAGTAGA GCATTCAAAA 4020
659 ATATTCGGTA ACTCCATTAC CACAATTCAA TATGACGTAA TGACACTTGA AAAGGCCAAA 4080
660 CAAATTTTAC TCGATCACTT TATCCATAGA AACATTACCA TTTATATTGA GAGCGATGTA 4140
661 GATTTTGAAA TCGTTCAAAG AGCACACATA GAAATTGTTA ATACCACCTA CACAAAAGTA 4200
662 ATTCGCAGTC TTTTCCTATT AAAGAACGTT GGTTCATACG CCGAATTCAA AGAAATCATA 4260
663 CTTCAATCAC ATGAAAAACT TTTACACCCT GGTATACAGA AAATGACAAA ATTATTTAAA 4320
664 GAAAATCACT TCTTTCCAAA TAGCCAACTA TTAATTCAGA ATATAATAAA CGAATGCAAC 4380
665 ATATGCAATT TGGCCAAAAC AGAACATAGA AACACCAAAA TGCCTTTAAA AATCACACCC 4440
666 AACCCGGAAC ATTGCCGAGA AAAATTTGTA GTAGATATTT ATTCATCTGA GGGAAAACAT 4500
667 TACATCAGTT GCATTGATAT TTATTCTAAA TTCGCTACAC TTGAGCAAAT TAAAACTAAG 4560
668 GATTGGATAG AATGCAGAAA CGCATTAATG CGCATTTTTA ATCAACTAGG AAAACCCAAA 4620
669 TTATTAAAGG CAGACAGAGA CGGAGCTTTC TCCAGTTTAG CTTTAAAGCG ATGGCTTGAA 4680
670 GAAGAAGAAG TCGAATTACA GCTCAATACA GCAAAAAACG GAGTAGCAGA CGTCGAAAGA 4740
671 TTACACAAAA CAATAAATGA AAAAATTCGT ATAATCAATT CATCTGATGA TGAAGAAGTA 4800
672 AAATTAAGCA AGATAGAAAC AATCCTCTAC ACATACAACC AAAAAATTAA ACATGACACT 4860
673 ACTGGACAGA GACCTGCTCA AATTTTCTTA TACGCTGGGC ATCCCATATT AGACACTCAA 4920
674 AAAATTAAAG AGAAGAAAAT AGAGAAAATA AATGAAGACA GACGGGAATT TAATATTGAC 4980
675 ACTAATTACA GAAAAGGTCC ACTACAGAAA GGCAAATTAG AAAACCCATT TAAACCAACC 5040
676 AAAAATGTAG AACAGACAGA CCCTGACCAT TACAAAATCA CTAATAGAAA TAGAGTTACG 5100
677 CACTACTACA AAACACAATT CAAAAAACAA AAGAAAAATA ATAAACTCTC AATTTCACAG 5160
678 GCACCTGGTA CCCGATAACA CTATTGTTTA TACTGATCAC AGCTGTTCAT GGACAACAAA 5220
679 TTCAAATTAA TAATATTGAC ACCAACCACG GATATCTCCT TTTTTCTGAT AAGCCAGTAC 5280
680 AGATACCATC CTCCTTTGAA CATCACTCCT TAAAAATCAA TTTAACTGAA ATAGACATCG 5340
681 TGGTTGACTA TTTTGAGCAA AGACTACGAA CCGATTACCA TGCACCCCAG ATCAATTTTT 5400
682 TATACAATAA AATAAAAAGA GAACTAGCCA GAATAACCCT GAAACATAGA AACAAACGGG 5460
683 GTTTTATTAA CATTGTGGGT TCAGGTTTTA AATACCTATT TGGAACACTA GATGAAAATG 5520
684 ATCGAGTCGA AATACAGAAA AAACTTGAAA TCAACGTCCA TAACTCAGTA AAATTACATG 5580
685 AACTCAACGA CGCCATACGA TTGATAAATG ACGGAATGCA AAAAATACAG AATTATGAAA 5640
686 ATAACCACAC CATCATTGAC AGTCTTTTGT TCGAACTAAT GCAGTTTACG GAATACATAG 5700
687 AAGATTTGGA AATGGCTATG CAGCTTTCCA GACTTGGACT GTTTAACCCC AAATTACTAA 5760
688 ACTACGACAA ACTTGAAAAT GTGAACAGCC AAAACATTTT GAACATTAAA ACATCCACTT 5820
689 GGATTAACTA CAATGATAAC CAAGTATTAA TCATATCCCA CATACCCATT TACCTTTCAC 5880
690 TAATAAGCAC AATTAAAATA ATTCCTTACC CAGACTCCAA CGGCTATCAG CTAGATTACA 5940
691 CAGACACACA ATCATATTTT GAAAAAGAAA ATAAAGTTTA TAATACCGAA AATAAAGAAG 6000
692 TAAAAAATGA ATGTGTCACC AATATTATTA AACACTTAAA TCCAATTTGT AATTTTAAGC 6060
693 CAGTACACAC GAACGAAATA ATAAAATACA TAGAACCAAA CACAATTGTA ACTTGGAACT 6120
694 TAACCCAAAC AATTCTTAAC CAAAATTGCC AAAATTCAAT TAATAAAATA AAAATAGAAG 6180
695 GAAACAAAAT GATAAGAGTA ACGCAATGCA AAATAGAAAT CAATAATATA AATTTTAGTG 6240
696 AAACTCTGTT AGAACCAGAA ATAGATTTGA CACCACTATA CACACCACTT AATATAACAA 6300
697 AAATAAAAAT TGTAAAACAC AACGACATTA TTGAGATGAT TTCAGAGAAC AATATTACAC 6360
698 TTTACATACA AATGATCATT GTAATAATCG CACTAATTTT GTTGTACTCA TATTTAAGAT 6420
699 ATGTATCATT TAAACCATTT ATGATGTTGT ATGCAAAACT TAAAATAAGA AAAAATCAAA 6480
700 ATCAAAACAC ACCACAACAA ACAGAAATAG AAGAAATTCC ATTTCCCACA CTATATCCAT 6540
701 CAATCCCAGC CCAAGTATAG GCTTCTCTTT AAGGGAAGGG GAGTGACGTA TTTGGGTGGT 6600
702 CCAAACCAGC CACTTCCATT ATTTCAAAGA AATCAGTAAT GCACTCTAGT AATTTTCCAT 6660
703 AACTGTATCC CAGCTGCGCA GACTCGTTTA TCTTTTGCAG CGCAGCGTTC TTTGTAAACA 6720
704 TCCTAAAGAC CTGCCTAAGC AGATTTGACT GCCCTCTTTC AACGCTACCT AATCTTAAGA 6780
705 ACCCAAGAGC GAGGCTCTCC CGAAATACAA ATATTGTTCA AATACTGAGG CTTCTCCTCA 6840
706 ATCCAATTTG CATTTGATTT TTAGTCTTAA GCTGAGATCC AAAGAATAAA GTCGTGAAAC 6900
707 TATTTCTCCT AAAAACTATT TTTTATTTCT TGGCGTTGTC CTTAGTCAAC TGACGGGACA 6960
708 TTAGTTCGAC TCATAAATAA AACAACAATT TTACT 6995
709 //
710 ID DM23420 standard; DNA; INV; 6126 BP.
711 XX
712 AC U23420;
713 XX
714 DR FLYBASE; FBte0000266; Dmel\3S18.
715 XX
716 SY synonym: BEL
717 XX
718 FT source U23420:1..6126
719 FT SO_feature five_prime_LTR ; SO:0000425:1..361
720 FT SO_feature three_prime_LTR ; SO:0000426:5766..6126
721 FT SO_feature CDS ; SO:0000316:919..5742
722 FT SO_feature start_codon ; SO:0000318:1..3
723 FT /name="Dmel\3S18\ORF"
724 FT /db_xref="FLYBASE:FBgn0044337"
725 FT /db_xref="REMTREMBL:AAB03640"
726 FT /db_xref="NCBI_PROTEIN:AAB03640.1"
727 FT /translation="MFIGSIASNSSLTDCQRFHYLKSYLAGDALALVKHIPVTNDNYRE
728 FT AWERLEQRYNKQSLIIRSFLNSFMSLPSAINSNIGTVRKIADGADEVIRGLRALNCEER
729 FT DPWLIFILLSKLDSDTRQAWAQCAESEEKGVTINRFLKFLTSRCDTLEAFELTRSTQAR
730 FT RAATTHHADTHPRREEPKCTSCQQNHQLFKCPQFIALDIASRRDFLKSRKLCFNCLSPA
731 FT HMVGNCTSRHTCRICRRKHHTLVHGSSQPIQNGNNIDTASVDSRDRPAVSHAGSTIGHN
732 FT QPLAREGHRLGSETPAENNFTHHTLENIPAAGSQTLLPTILADVIDAWGNTTTCRLLLD
733 FT TGSTITLASESFVQRIGVRRTHARISILGLAANSAGVTRGRAHIKLRSRHSGQTVELVS
734 FT FILTSLTSSLPAQVIDTSSSTWRQICELPLADPTFCTPGAIDVIVGSDQLWSLYTGDRK
735 FT HFGNDFPIALNTVFGWILAGSYSAFDDHPTSAVTHHADLDTMVRSFMEMDSIQPNQALL
736 FT DASDPTERHFAATHKRSTDGVYVVEYPFKEKAPPIDSTLPQAINRFFSLERKFRRYPEL
737 FT KQQYEAFLDDYLQRGHMEKLTSAQVEESPDTCFYLPHHAVIKLDSLTTKCRVVFDGSGK
738 FT DSSGVSLNDRLHIGPPIQRDLFGVCLRFRQHQYVLCADVEKMFRGIKVFKPHTNFQRIV
739 FT WRTTENEPLLHFRLLTVTYGLAPSPFLAVRVLKQLADDHGHEYPAAAHALLHDAYVDDI
740 FT PTGANTFEELMILKDELIALLDKGKFKLRKWSSNSWRLLKSLPEEDRCFEPIQLLNKSA
741 FT ADSPVKVLGIQWNPGKDVLYLNLKGCDATISPTKRELLSQLSRIYDPLGLVAPVTVLLK
742 FT LIFQESWTSVLQWDDPIPESLRTRWRALVEDLPALTQCQVPRYIASPFRDVQLHGFADA
743 FT SSHAYGAVVYARVAVGCSFQVTLVAAKTRVAPIKPVSIPRLELNAALLLSRLLSIVKTS
744 FT LTIPLFSTSCWTDSEIVLHWLSAPPRRWNTYVCNRTSEILSDFPRSCWNHVRTEDNPAD
745 FT CASRGLHPSKLLEHRLWWKGPSWLATPTSEWPPSTSKFSVSSSFDVNTEERAIKPTTLH
746 FT NFPDESIHELLIHKFSTWTRLIRVSSYCHRFIHTLRSHHRNSAPFLTSEELLDAQRRLI
747 FT RHVQQKSFAREYEQLENRRQLNAKSHLIRFSPFLDDYGVMRVGGRIEQSTLNYNAKHPI
748 FT LIPKDTPLAGLLVRHFHVSYLHTGVDATFTNLRQQYWILGARNLVRKAVFQCKSCFLQR
749 FT KGTSNQIMGELPIPRVQASRCFQHTGLDYAGPIAIKESKGRTPRIGKAWFSIFVCLTTK
750 FT ALHIEVVSELTTQAFIAAFQRFIARRAKPTDLYSDNGTTFHGGKKTLDDMRRLAIQQAK
751 FT DEELAGFFANEGISWHFIPPSAPHFGGMWEAGVRSIKLHMKRILGSKALTFEELSTVLT
752 FT QIEAILNSRPLCPTGDNSLDPLTPAHFLTGSPYTALPEPCRLDMQVNRLERWNQLQAMV
753 FT QGFWKRWHMEYLTSLHERTKWHLETENLKIDTLVVLKEPNLPPSKWILGRITAVHAGID
754 FT NKVRVVTVKTAHGLYKRPIAKIAVLPLC"
755 XX
756 CC Derived from U23420 (g733531) (Rel. 48, Last updated, Version 3).
757 CC Takis Benos and Michael Ashburner, 20-Aug-1997.
758 CC Any changes to original sequence record are annotated in an FT line.
759 XX
760 SQ Sequence 6126 BP; 1623 A; 1556 C; 1346 G; 1601 T; 0 other;
761 TGTTTGGGAA CGAGACACCC TGTATACGCG AACAAGTCAC CCTTTATCTT TATTTACATT 60
762 CTTATTTGTC TGCAGCTTCA TCGGAGCTTA TCAGCGGAAT CAATGTAAGC ATCGCACCGC 120
763 TGTAATTGTC CGCGAGCTTG CCCAGTACTT TTCCAAACTT CTAACTCCCT TCTAACTGTA 180
764 ACTTGTTTAC GTCTTATGCT AGACTAATCG TATGGCGTGA TTACAGCCAA AGCTGAAGTC 240
765 AGTCACAATT TTGATCTGCG AGAAAACGTA CGCATCGGTG TCGAAATAAT TAATATTAAG 300
766 TGTCTGAACT TAACCAATAA ATGAAAATTA ACAGTAACAC TGGCGGTTTT ATTTATAAAC 360
767 ATAAAAATTG GTCCTTCGAG CCGGATAACC GGAAGTGCGT TTCGTTCGGG CATTTGATTT 420
768 TGATTATTGG CCTTTTGGCA AACGATAATC TATAGATTCC TACATCGTGT AGAATCGTTC 480
769 CCTTCTTTCG ACCACCATGC GGAGTGTGAT TCAACAACGG GGCTTCTGCA AAAGCCAAAT 540
770 TACTCGTGCG CATAATAATG CCTTAAAATT TGTTGATGAC ATTCACTCAG TGCAAACAAT 600
771 AGTTGTCCGC CTGGCGCAAC TACAGGAAAA TTATTTGCGG TTCGTACGGC TCTCGGAAGA 660
772 GCTGTATGCA TTTCAATCGG AAGCCGATTG GGAGAACCCT GACGAGGATT TTGACGCATA 720
773 TGAGGACAAA CATTATGCTA CACACGCTAT TCTCAGCAAT ACTTTGGAGG AGTTGAGACG 780
774 GGATGTCACC TCAAACAGTA TTGATGCCAC AGTTCAAGCG CAGGCACACC CCAGAGAAGT 840
775 CATGTCGATT TTCAGTTCGA GAGAATTAAA CTTCCGACTT TTTCTGGAAA TTATGAGGAC 900
776 TGGAAACATT TTTCGGACAT GTTTATTGGA TCGATTGCTT CCAATTCGAG CCTGACGGAT 960
777 TGCCAACGAT TTCATTATTT AAAATCGTAC CTTGCCGGAG ACGCGCTTGC ATTAGTTAAA 1020
778 CATATTCCAG TTACTAATGA CAACTATCGG GAAGCATGGG AGCGGCTGGA ACAGCGATAT 1080
779 AACAAACAAT CGCTAATTAT TCGATCGTTC TTAAACAGTT TCATGAGCCT TCCGAGTGCT 1140
780 ATAAATTCAA ATATCGGCAC AGTGCGGAAA ATTGCCGATG GTGCAGACGA AGTTATTCGT 1200
781 GGTCTACGAG CTCTTAATTG CGAAGAGAGG GATCCCTGGC TAATTTTCAT TCTACTTTCA 1260
782 AAATTAGATA GCGATACCCG CCAAGCCTGG GCTCAGTGCG CAGAATCCGA GGAAAAAGGT 1320
783 GTGACCATCA ACCGATTCTT GAAATTTCTC ACATCACGCT GCGATACGTT GGAGGCTTTT 1380
784 GAATTAACTC GATCAACCCA AGCTCGACGC GCAGCTACCA CGCACCACGC AGACACGCAT 1440
785 CCAAGACGGG AAGAGCCGAA GTGCACATCG TGCCAGCAGA ATCACCAACT GTTTAAGTGT 1500
786 CCTCAATTCA TCGCACTCGA CATTGCATCT CGCCGAGACT TCCTCAAATC AAGAAAGCTC 1560
787 TGTTTCAATT GCCTCAGCCC GGCTCATATG GTGGGCAACT GTACATCGAG GCATACTTGT 1620
788 CGGATCTGCC GCCGCAAGCA TCATACTTTG GTTCATGGCT CGTCGCAGCC AATTCAAAAT 1680
789 GGCAACAACA TTGACACAGC AAGTGTTGAC AGCCGCGATC GACCAGCAGT CTCACATGCG 1740
790 GGATCTACAA TTGGCCACAA TCAACCGCTA GCTCGAGAAG GTCATCGCTT GGGAAGCGAG 1800
791 ACTCCCGCGG AAAACAACTT TACGCATCAT ACTCTGGAGA ATATTCCGGC GGCTGGTTCT 1860
792 CAGACTCTGT TGCCAACCAT CCTTGCTGAC GTCATCGACG CCTGGGGAAA CACTACAACC 1920
793 TGCAGGCTGC TCCTGGACAC TGGATCTACA ATAACCTTGG CATCGGAATC ATTTGTTCAG 1980
794 CGAATAGGCG TGCGTCGAAC GCACGCACGG ATTTCTATTC TCGGTCTCGC CGCCAACAGC 2040
795 GCGGGCGTTA CCCGAGGACG CGCACATATC AAGCTGCGCT CTCGTCATTC GGGCCAAACT 2100
796 GTCGAATTGG TCTCGTTCAT TCTCACCTCG CTGACGTCAT CACTTCCTGC CCAAGTTATT 2160
797 GACACCTCAT CCTCTACGTG GAGGCAAATC TGCGAGCTTC CTTTGGCAGA CCCAACGTTC 2220
798 TGCACACCTG GAGCAATCGA TGTCATTGTT GGATCGGATC AACTTTGGTC TCTATACACA 2280
799 GGAGATCGGA AACACTTTGG TAACGACTTT CCTATCGCTC TCAATACTGT ATTTGGTTGG 2340
800 ATTCTTGCAG GCTCTTACTC TGCATTCGAT GATCACCCTA CTTCTGCGGT TACTCATCAC 2400
801 GCGGACCTAG ACACGATGGT TCGTTCATTC ATGGAGATGG ACAGCATTCA GCCTAACCAG 2460
802 GCTCTCCTGG ACGCCAGCGA TCCCACAGAG CGTCATTTTG CTGCCACACA CAAGCGCTCG 2520
803 ACGGACGGGG TGTACGTCGT CGAGTATCCC TTCAAGGAAA AGGCACCGCC TATTGATTCG 2580
804 ACCTTGCCAC AGGCCATCAA TCGCTTCTTC TCGCTGGAAC GCAAATTTCG TCGGTATCCA 2640
805 GAATTGAAGC AGCAGTACGA AGCTTTCCTG GACGACTACT TGCAACGTGG ACATATGGAA 2700
806 AAACTGACCT CGGCTCAGGT TGAAGAGTCC CCAGACACCT GCTTCTATTT GCCGCACCAC 2760
807 GCTGTCATCA AACTGGACAG TCTGACTACC AAATGTCGTG TAGTTTTTGA TGGATCAGGA 2820
808 AAAGACAGCT CTGGAGTATC GCTCAATGAC AGACTACATA TTGGTCCACC GATTCAACGC 2880
809 GATCTTTTTG GCGTTTGTCT ACGCTTCCGG CAGCACCAAT ATGTTTTATG TGCAGATGTC 2940
810 GAAAAGATGT TTCGAGGCAT TAAAGTCTTT AAGCCACACA CCAATTTTCA GCGCATTGTT 3000
811 TGGCGCACGA CTGAGAATGA ACCTCTGCTT CATTTTCGCC TGCTGACGGT TACCTACGGA 3060
812 TTGGCACCGT CACCATTTCT GGCTGTTCGA GTTCTAAAGC AACTTGCCGA CGATCATGGC 3120
813 CATGAATACC CTGCAGCAGC TCACGCTCTT CTGCACGATG CCTATGTGGA CGATATCCCG 3180
814 ACAGGCGCCA ACACATTCGA GGAGCTTATG ATTCTCAAGG ACGAGCTTAT AGCCCTCTTG 3240
815 GATAAGGGAA AATTCAAGCT ACGCAAATGG AGTTCTAATA GTTGGCGTCT TCTGAAATCA 3300
816 TTACCAGAGG AAGATAGATG TTTTGAACCT ATCCAGCTCC TCAACAAATC AGCTGCGGAT 3360
817 TCACCTGTCA AAGTTCTTGG TATCCAATGG AACCCTGGGA AGGACGTCCT GTATCTCAAC 3420
818 CTAAAGGGAT GCGATGCGAC CATTTCTCCG ACGAAAAGAG AACTCTTGTC TCAGCTATCA 3480
819 AGAATTTATG ATCCGCTTGG ACTGGTAGCG CCGGTCACAG TTCTACTCAA GCTAATCTTC 3540
820 CAAGAAAGCT GGACAAGTGT CCTGCAGTGG GACGACCCCA TACCTGAAAG TCTACGTACG 3600
821 CGCTGGAGAG CCTTAGTAGA GGATTTGCCA GCACTTACGC AATGCCAAGT ACCACGGTAT 3660
822 ATTGCGTCAC CATTTCGAGA TGTTCAACTA CACGGATTCG CCGACGCATC CTCGCACGCC 3720
823 TACGGTGCGG TAGTTTACGC TCGAGTTGCA GTTGGATGCA GCTTTCAAGT AACTCTGGTT 3780
824 GCCGCCAAAA CACGGGTGGC CCCGATCAAG CCCGTATCAA TTCCACGTTT GGAGCTAAAC 3840
825 GCTGCGTTAC TTCTATCTCG ATTGCTTTCT ATTGTCAAAA CATCACTAAC AATTCCTCTT 3900
826 TTCAGCACGA GCTGCTGGAC AGATTCAGAA ATTGTGCTAC ACTGGCTTTC AGCTCCCCCT 3960
827 CGACGGTGGA ACACCTACGT CTGCAACCGA ACTTCTGAGA TATTGAGCGA CTTTCCCCGT 4020
828 AGCTGCTGGA ACCATGTTCG CACGGAAGAC AATCCTGCAG ATTGTGCTTC CCGAGGACTT 4080
829 CATCCGTCAA AGCTTCTGGA GCATCGACTG TGGTGGAAAG GTCCGTCTTG GCTGGCCACA 4140
830 CCCACCTCTG AGTGGCCACC TTCTACAAGC AAGTTCAGCG TATCTTCAAG TTTCGATGTC 4200
831 AACACCGAAG AACGAGCCAT AAAGCCCACG ACTCTACATA ACTTTCCTGA TGAAAGTATA 4260
832 CACGAGTTAC TCATCCACAA ATTCTCAACC TGGACGCGTC TTATAAGGGT ATCTAGCTAC 4320
833 TGTCATCGCT TTATTCACAC TCTTCGATCC CATCATAGGA ATTCGGCACC ATTCCTTACG 4380
834 TCTGAAGAGT TGCTGGACGC ACAGCGCCGA CTTATTCGAC ATGTGCAACA AAAATCCTTT 4440
835 GCCAGAGAAT ATGAGCAGCT AGAGAATCGA CGCCAGCTTA ACGCTAAATC GCATCTTATC 4500
836 CGGTTTTCTC CGTTTCTGGA TGATTATGGA GTAATGCGAG TCGGTGGGAG AATCGAGCAA 4560
837 TCTACACTCA ACTATAACGC CAAGCACCCG ATTCTGATAC CTAAAGATAC ACCACTAGCT 4620
838 GGACTCCTGG TTCGACATTT TCATGTCTCC TATCTGCACA CTGGAGTTGA TGCAACGTTC 4680
839 ACCAATCTTC GTCAGCAGTA CTGGATTCTG GGAGCCCGCA ATCTCGTCAG AAAGGCAGTC 4740
840 TTCCAATGCA AATCCTGTTT TCTTCAACGA AAGGGCACAA GCAACCAGAT CATGGGAGAG 4800
841 CTACCAATTC CTCGAGTTCA AGCTAGCCGC TGCTTTCAAC ACACAGGGCT GGACTACGCT 4860
842 GGACCGATCG CAATCAAGGA ATCAAAGGGA AGAACTCCAC GCATCGGAAA GGCATGGTTT 4920
843 TCTATTTTCG TGTGTCTCAC TACAAAGGCA CTTCACATCG AGGTTGTTAG TGAGCTAACT 4980
844 ACACAGGCTT TCATCGCAGC CTTTCAACGA TTCATTGCCC GCCGAGCGAA GCCTACTGAC 5040
845 CTGTATTCGG ATAATGGAAC AACATTTCAT GGAGGCAAGA AAACTTTGGA TGACATGAGA 5100
846 CGTCTGGCCA TTCAACAAGC CAAAGATGAG GAACTAGCAG GATTCTTTGC CAATGAAGGG 5160
847 ATTTCTTGGC ACTTTATACC CCCGTCTGCT CCACATTTTG GAGGGATGTG GGAAGCTGGA 5220
848 GTTCGCTCAA TTAAACTCCA TATGAAACGA ATACTTGGAT CAAAGGCTTT AACGTTTGAG 5280
849 GAGCTCTCTA CTGTCCTGAC CCAAATTGAA GCTATCCTGA ATTCACGCCC GCTGTGCCCA 5340
850 ACTGGGGATA ATTCTTTGGA TCCACTGACG CCTGCTCATT TTTTGACTGG ATCTCCGTAT 5400
851 ACTGCATTGC CTGAACCCTG TCGTCTGGAT ATGCAAGTCA ATCGATTGGA GAGGTGGAAT 5460
852 CAGCTGCAAG CCATGGTTCA AGGCTTTTGG AAAAGGTGGC ATATGGAATA CCTGACATCT 5520
853 CTTCATGAGC GGACAAAGTG GCATCTGGAA ACCGAGAATC TGAAGATCGA CACACTGGTA 5580
854 GTACTCAAGG AGCCCAATCT ACCGCCCTCT AAATGGATTC TTGGCCGCAT CACAGCAGTG 5640
855 CACGCAGGAA TCGACAACAA GGTCCGAGTC GTTACAGTGA AGACTGCTCA CGGATTATAC 5700
856 AAACGCCCAA TTGCCAAAAT CGCTGTACTG CCTCTCTGCT GAACAACCGT TCAGGGGGGC 5760
857 CGGTATGTTT GGGAACGAGA CACCCTGTAT ACGCGAACAA GTCACCCTTT ATCTTTATTT 5820
858 ACATTCTTAT TTGTCTGCAG CTTCATCGGA GCTTATCAGC GGAATCAATG TAAGCATCGC 5880
859 ACCGCTGTAA TTGTCCGCGA GCTTGCCCAG TACTTTTCCA AACTTCTAAC TCCCTTCTAA 5940
860 CTGTAACTTG TTTACGTCTT ATGCTAGACT AATCGTATGG CGTGATTACA GCCAAAGCTG 6000
861 AAGTCAGTCA CAATTTTGAT CTGCGAGAAA ACGTACGCAT CGGTGTCGAA ATAATTAATA 6060
862 TTAAGTGTCT GAACTTAACC AATAAATGAA AATTAACAGT AACACTGGCG GTTTTATTTA 6120
863 TAAACA 6126
864 //
865 ID 412 standard; DNA; INV; 7567 BP.
866 XX
867 AC nnnnnnnn;
868 XX
869 DR FLYBASE; FBte0000007; Dmel\412.
870 XX
871 SY synonym: mdg2
872 XX
873 FT source nnnnnnnn:1..7567
874 FT SO_feature five_prime_LTR ; SO:0000425:1..514
875 FT SO_feature three_prime_LTR ; SO:0000426:7054..7567
876 FT SO_feature CDS ; SO:0000316:679..1044
877 FT SO_feature CDS ; SO:0000316:1408..1722
878 FT SO_feature CDS ; SO:0000316:1888..3243
879 FT SO_feature CDS ; SO:0000316:3864..6866
880 XX
881 CC Berkeley Drosophila Genome Project.
882 XX
883 SQ Sequence 7567 BP; 2982 A; 1367 C; 1323 G; 1895 T; 0 other;
884 TGTAGTATGT GCCTATGCAA TATTAAGAAC AATTAAATAA AATAGCATAT TAACTTATGG 60
885 CAGCACTTTG TTGCTATGTT TATGTTTATG TTTATGCACG CAGTTAGGCC AGGGCGGATG 120
886 TAACATGATC ACCCACTCGA AGGCCACAAA GTATAAGTGC ATTGCCCAAT CGAAGGCAAA 180
887 AAGTATAAGT GCATGGTCAG CATTCACACG CCGACCAAAT ACATATTACA TACGTACATA 240
888 CATATCTCGC TCTCCCGATA AGCCTAGATA TATAAGATAT ACATAAGAAC GCCGCTCCGC 300
889 TGCTGGCGTA CCCGGCAGCG CAGCTACGCG GATTAGCCTA AGTCCAAATA TATAAAAAAC 360
890 TGTAAAATCG GAGAGACTCT GTAGACGTTG AGCTGACAGA ACCATTTCTG CCTACTCTAA 420
891 AATCAAAAGA AGAAATTGAA TAAATATATG TCAGCCCGAC GGCTGCCTTA AACTTAAAAC 480
892 GGACTTGTGT TCTTAATTGG AGTTCATCAT TACATGGCGA CCGTGACAGT CGTCCAACGC 540
893 TGGACGAATT GACCAAAGCT GGTGAAAACA AAGGAACAAA GGAACACTGG ACTGGAAGAA 600
894 GACTGGACTA ATTAAATGGA ACTGCAAAAA CCAAGGAAAA ATCTGAGTGA GTAGAGTTCT 660
895 ATTGAGTATG GGCAAACACC GTGGCGGTTT GAAAACTAAG CTGAATAAAC GTATAGCCCA 720
896 CGTAAGGTGG CTAATATACG GTCAGCAAAC GCCACCGGTT TGGTCGAAAG CTCTAAAGCT 780
897 ACATGCAGAG CTAGACCACT TGTTGCAATA TCAGCAAGAA TTAAAGACCC ATAAGCTCGA 840
898 GAAAACTCAC TCAGATAATA TTAAAAATAT ACCCACAATT AATGAAGTTC CAAAATACCA 900
899 GGCATGTCCA GCACCAGCAC CAGCATTAAC AAAACCAAAG AAGTCCTGCC CCCCTGGCTG 960
900 CGAAGGAATC TGGAGTCCCC ACTGCCTGGG GACTTGTGAG CGACCATCGA CGTCTTCAGC 1020
901 GGCGAAGAAA TAGACAGCAG CGAGGGAGTG TCAGCGTGCC ACCCCCGGCG ACGCCCAGCT 1080
902 GACACCCAAC AAATAGACAG CAGCGAGGGA GTGTCAGCGT GCCACCCCCG GCGACGCCCA 1140
903 GCTGACACCT GATGAGCATC ATCAACAGCA GAATATAATA ATAAATATAT ATAAATATAA 1200
904 AGTAAATATA AAATATATAT AGATAAGAAA AATTGTAAGA AATATTGTAA AACGGAGCAT 1260
905 ATACTATTAT GCCCTGTTAA CCCAATATGG CCCGTGAAGC CATAGCTAGA ATCAGGCAGG 1320
906 CAACAATGTA AAATACAATT TTTTTTTACT CTTGCGAACA TTGAAAGATT TTATAAATAG 1380
907 ATAATTCCAA ACATAAATGT CTATAGAGAC AAATGAAATA AGTAAAACTG AAAATAAAAG 1440
908 TATATACAAA GGAAATTTTC TATTCTATTC TCCAAAATAT AAAATTAGTA TACCCAAAAT 1500
909 GGGTCTAATA GACACTAAAA CTGTGGACTC TACAGCCAAT GTAATAAATA AAGTAGAAGT 1560
910 CCAAAATGCA GACTTGTTCT GGATAACCAT AATACTAATT GTAATTGCAT TAATTATGGT 1620
911 ATCCAATGCA TTAATAAAAA TATACAAACT GCATAACAAG TGTCTTAAGA AACGATACCG 1680
912 TAGCACTGCT AACGGTATAG ATAATATTTA AGGAAGATCT TTAATAAAGT CAATTATGAA 1740
913 TGAAAATATG AGAAAAATTA TATGAAAAAA AAAAATAATA AATAAAAAAA AAATATAAAA 1800
914 CGTAATATTG AATTTATCTA CATTAAAAAA AAATATATAC AAATGAATAA ATTTGAAGTT 1860
915 ATGAGTATAC CACAGCATGG ACTGGGAAAA GCTTGTTGAT CAGATAAAAG ATCAAAATGA 1920
916 AAATTTCAGA AAATCCTATA AGTGCTTAAC GCAAAACAGA TCAACACAAG CTGTAACAAT 1980
917 CAATAGGAAT GCCCAAGTCT TGGTAAATAG TTATAATGAA ATCAGAGAGT TGATCCAACA 2040
918 AAATAGAAAG AATTTGGAAC GCAAACAGTG TGCTAAGGCT TTGAACCTAC TGGTGACATT 2100
919 AAGAGAAAAA TTAATATTTA TAAAAAATAA ATTCAGTCTC CAGATAGAAA TTCCAACCAT 2160
920 AGTAAACACC CCACTAAGAA TAAATTTGAA TGAAGACAGC ACTAACTCTG ACGAGGAAGA 2220
921 TAGGACTATA GTCAAGGAAG ACATTAAAGA GGAAGATCTT CACGATCTAA CTATACCAGC 2280
922 AAAATTAATG CTGAAGAACG ACGATAAAAC AAATAACGCA GCCGACTCCG AAAATAACTT 2340
923 AACCATGGCA GAAGAAGCAG CTGCCATTAG GTCTTACATT AGGGAAGTCG CCTGCACAGT 2400
924 GCCAGAATTT GATGGGCAAA AGATCCATTT ACAAAGATTC ATTAAGGCAA TCAAATTGGT 2460
925 AGACCTAGCT AAGGGACCAT TTGAAGACAT TGCAGTTGAG GTCATTAAGT CAAAAATAGT 2520
926 TGGCACAATT TTGAACTCAG TTGACAATGA AACGACAATT CCAGCAATTA TAAACAAATT 2580
927 GCAGAAAGTA GTTGTCGGTG AGACATCCAG TAATGTCAAA GCAAAGCTAG CAACAGTTCA 2640
928 GCAGAGAGGT AAAACTGCAA CGCAATTTAC CGCTGAAGTT GATAGCCTGA GAAAACTTTT 2700
929 AGAAGCTTCC TATATCGATG AGGGTATACC TCTAGAACAT GCCACTGGTC TAAGCACCAA 2760
930 AGAGGCAATT GAAACCATGA TACATCGTGC TGAGCACGAA AGTATCAAAA CAGTACTGGA 2820
931 AGCAGGGACT TGCACCACTA TGGATGCAGC GATAAGCGCA TACATAAGAA CGAGTACAAG 2880
932 AGTTACCGGT GACATCAATA AAGTGATGTA CTTTAGAGGT AACAGACCCA ATAGAGGATA 2940
933 CGGAAATGCC AATAGAGGTA GTAACCGCGG TAGAGGCTTT AATAACAATA GTATTAGAGG 3000
934 CAACTACCAT AACGGTTACC AAAATAACGG TTACCAAAAT AACGGTTACC AGAATAACGG 3060
935 TTATCAAAAC CGCTATAATG GAAATAATAA CCGTTATAAT GGCTATAACA GAGGCCGTTA 3120
936 TAATGGAAAC AGAGGCCGTA ACAACAGTCA GAACAACTAC AACAGAAACA ATGCCAATGT 3180
937 ACGAGTAATC CAAGAACAGG GAAACTCGCA ACAGCCTTTA GGTACTCAGT AGAAGAAGAT 3240
938 CGTAGAGTAT ACACCATCAA TTATAATCTC AACATATTTT CTACATTCAT TCATGCCAAA 3300
939 ACAGGCGTAA AACTAGTTTT TCTACTTGAT ACAGGTGCAG ATATCTCTAT TCTCAAAGAG 3360
940 AACTCTGACA AATTTTCTAA TATTCAAATA ACCAATAAAA TAAACATTCA AGGCATAGGC 3420
941 CAACAGAAAA TTCAGTCTCG AGGACAGACT TTTATTGAGA TACAGACAGG TAAATACGTT 3480
942 ATCCCACACG ATTTTCATTT AGTAGATAAA AACTTTCCAA TACCGTGTGA TGGAATAATC 3540
943 GGAATAGATT TCATAAAAAA ATATAATTGC CAAATCGATT TAAACCAAGA AGAAGATTGG 3600
944 TTTATAATTA GACCAAACAA TTTGAAATTT CCAATATATA TTCCCATAGC ATACAGCTCT 3660
945 GGTATTAACA CAACGTTATT ACCAGCAAGA TCCCAAGTTG TCCGAAGATT AATAGTATCA 3720
946 TCAAAAGATG ATAACATTTT AATTCCAAAC CAGGAAATTC AAACTGGTAT TTATGTTGCA 3780
947 AATACAATCG CAACATCAAG TAATACATTT GTCCGAATTT TAAATACAAC CGATTCCGAC 3840
948 CAATTAGTCA ATATGGACAC TCTAAAATAT GAGCCACTTT CGAACTACAA TGTAGTTCAG 3900
949 GCAAATAGTG AACACAGAAA TAAAACTGTC TTATCTCAAT TAAAGAAAAA TTTCCCCGAA 3960
950 TTGTTTAAAT CACAATTAGA AAATATATGC AGCGAATATA TAGATATATT TGCATTAGAA 4020
951 TCAGAACCTA TAACAGTTAA TAATTTGTAT AAACAACAGT TGAGATTAAA AGATGATGAG 4080
952 CCAGTATACA CGAAAAATTA TAGAAGTCCT CATAGTCAAG TGGAAGAAAT ACAAGCCCAA 4140
953 GTTCAGAAAT TAATAAAAGA TAAAATAGTT GAACCATCAG TTTCACAGTA CAATAGCCCT 4200
954 TTGCTATTAG TACCCAAAAA GTCAAGCCCG AATTCTGATA AAAAGAAATG GAGATTAGTA 4260
955 ATAGACTATC GCCAAATTAA TAAGAAACTT TTAGCTGACA AATTTCCACT ACCGAGAATA 4320
956 GATGATATTT TGGACCAACT TGGTCGAGCA AAATATTTCT CCTGCCTTGA TTTAATGTCA 4380
957 GGTTTTCATC AAATCGAACT GGATGAAGGC TCGAGAGATA TAACATCTTT CTCAACCAGC 4440
958 AATGGCTCAT ATCGTTTCAC GCGATTGCCA TTTGGCTTAA AAATAGCGCC TAATTCATTC 4500
959 CAAAGAATGA TGACTATAGC ATTCTCCGGA ATAGAACCGT CTCAAGCATT CCTTTATATG 4560
960 GATGACTTAA TAGTCATAGG TTGTTCCGAA AAACATATGC TTAAAAACCT CACTGAAGTT 4620
961 TTTGGTAAAT GCAGGGAATA CAACCTAAAG TTACATCCTG AAAAATGTTC ATTTTTCATG 4680
962 CATGAAGTCA CATTTTTGGG ACACAAATGC ACAGACAAAG GAATTTTGCC GGATGACAAA 4740
963 AAATATGATG TCATTCAGAA CTACCCAGTT CCACATGATG CGGACAGCGC TAGACGTTTT 4800
964 GTAGCATTTT GCAATTACTA CAGACGTTTT ATCAAAAATT TCGCCGACTA TTCGCGGCAC 4860
965 ATAACAAGAT TATGTAAAAA GAATGTTCCA TTCGAGTGGA CAGATGAATG TCAAAAAGCA 4920
966 TTCATACATT TAAAATCTCA GCTAATTAAC CCAACACTCT TGCAGTACCC AGACTTCAGC 4980
967 AAAGAATTTT GCATAACAAC AGATGCAAGC AAGCAAGCGT GTGGCGCAGT TTTAACTCAA 5040
968 AACCATAATG GCCACCAACT CCCAGTTGCT TATGCATCCA GAGCTTTTAC GAAAGGTGAA 5100
969 AGCAATAAGA GTACAACAGA ACAAGAGTTA GCAGCAATTC ATTGGGCAAT AATACATTTC 5160
970 AGACCATACA TTTACGGAAA ACATTTCACT GTGAAAACAG ACCATAGACC ATTGACATAT 5220
971 TTATTCTCGA TGGTGAACCC CAGCTCTAAA TTAACTAGAA TAAGGCTTGA ACTAGAGGAA 5280
972 TATAATTTTA CAGTAGAGTA TCTAAAGGGC AAGGACAATC ATGTAGCAGA TGCGTTATCA 5340
973 AGAATAACCA TCAAAGAGCT AAAAGATATA ACTGGAAATA TATTAAAAGT CACTACAAGA 5400
974 TTTCAAAGTA GACAAAAATC CTGCGCAGGA AAAGAACAAT TGGATTTGCA AAAGCAAACC 5460
975 AAAGAAATAG CTTCAGAGCC CAACGTATAC GAAGTCATAA CAAATGACGA GGTACGAAAA 5520
976 GTAGTGACAT TGCAATTGAA TGACTCGATA TGTTTATTTA AACATGGAAA GAAAATTATT 5580
977 GCAAGATATG ATGTTGGTGA TCTTTATACT AATGGAATTC TTGATTTAGA TCAATTTCTC 5640
978 CAAAGGCTTG AATTGCAGGC CGGTATATAT GATATCAGCC AAATCAAAAT GGCACCGTGG 5700
979 AAAAAAATCT TTGAACACGT TTCAATAGAT AAATTTAAAA ATATGGGCAA TAAAATATTA 5760
980 AAGAATTTAA AAGTAGCGCT ACTTAACCCG GTGACCCAAA TAAATAATGA AAAAGAAAAA 5820
981 GAAGCTATAT TGTCTACATT ACATGATGAT CCAATACAAG GAGGGCATAC AGGCATTACA 5880
982 AAAACCTTGG CCAAGGTCAA AAGACATTAT TACTGGAAAA ATATGAGTAA ATACATAAAA 5940
983 GAGTACGTAA GAAAATGTCA AAAATGCCAA AAAGCAAAAA CAACAAAGCA CACAAAGACT 6000
984 CCAATGACGA TAACTGAAAC ACCAGAACAT GCTTTCGATA GAGTTGTTGT GGACACAATT 6060
985 GGTCCACTAC CCAAGTCAGA AAATGGTAAC GAGTACGCAG TCACTCTCAT ATGTGATTTA 6120
986 ACCAAGTACT TAGTTGCCAT ACCAATAGCA AATAAAAGCG CAAAAACAGT CGCAAAAGCT 6180
987 ATATTTGAAT CTTTTATTCT AAAGTACGGT CCAATGAAGA CGTTCATAAC GGACATGGGA 6240
988 ACAGAGTATA AGAATTCAAT AATTACTGAC CTGTGTAAAT ATTTGAAAAT AAAAAATATA 6300
989 ACATCAACAG CTCATCACCA CCAGACAGTT GGAGTAGTAG AAAGAAGTCA TAGAACCTTA 6360
990 AACGAGTATA TACGATCCTA CATATCGACG GACAAAACCG ATTGGGACGT ATGGCTTCAA 6420
991 TATTTCGTAT ACTGCTTCAA CACGACCCAA TCTATGGTAC ATAATTATTG TCCATATGAA 6480
992 TTAGTTTTCG GTAGAACAAG TAATTTACCA AAACATTTTA ATAAACTACA TAGCATAGAA 6540
993 CCAATATATA ACATAGATGA TTACGCTAAG GAGAGTAAAT ATAGGTTAGA GGTAGCATAT 6600
994 GCTCGAGCAA GAAAACTTCT CGAAGCACAC AAAGAAAAAA ATAAAGAAAA TTATGACTTA 6660
995 AAAATAAAAG ACATAGAATT AGAAGTAGGA GATAAAGTTT TACTAAGAAA TGAGGTAGGT 6720
996 CATAAATTAG ACTTTAAATA TACGGGGCCC TATAAGATAG AAAGCATAGG AGATAATAAC 6780
997 AATATTACGC TACTTACTAA TAAAAACAAA AAACAAATAG TTCATAAAGA TAGATTAAAG 6840
998 AAATTTCATT CATGATTGAA TTTAAACTTA TATTTTCCTT AATCATTTAC ACAAATTTTC 6900
999 CATACACTAC GTATATTTTT ATCTTTGCAT TATAAAATCA ACTATTGTTG TTCAAACAAA 6960
1000 AACACAAACA AAATAAAAAT AAAAATAAAA TAATTTGCAT TTAATAATCA AAATAACTTC 7020
1001 ACTAGGTTAC GTTATTTTTC AAAAGGAGGG AGATGTAGTA TGTGCCTATG CAATATTAAG 7080
1002 AACAATTAAA TAAAATAGCA TATTAACTTA TGGCAGCACT TTGTTGCTAT GTTTATGTTT 7140
1003 ATGTTTATGC ACGCAGTTAG GCCAGGGCGG ATGTAACATG ATCACCCACT CGAAGGCCAC 7200
1004 AAAGTATAAG TGCATTGCCC AATCGAAGGC AAAAAGTATA AGTGCATGGT CAGCATTCAC 7260
1005 ACGCCGACCA AATACATATT ACATACGTAC ATACATATCT CGCTCTCCCG ATAAGCCTAG 7320
1006 ATATATAAGA TATACATAAG AACGCCGCTC CGCTGCTGGC GTACCCGGCA GCGCAGCTAC 7380
1007 GCGGATTAGC CTAAGTCCAA ATATATAAAA AACTGTAAAA TCGGAGAGAC TCTGTAGACG 7440
1008 TTGAGCTGAC AGAACCATTT CTGCCTACTC TAAAATCAAA AGAAGAAATT GAATAAATAT 7500
1009 ATGTCAGCCC GACGGCTGCC TTAAACTTAA AACGGACTTG TGTTCTTAAT TGGAGTTCAT 7560
1010 CATTACA 7567
1011 //
1012 ID DMAURA standard; DNA; INV; 4581 BP.
1013 XX
1014 AC nnnnnnnn;
1015 XX
1016 DR FLYBASE; FBte0000112; Dmel\aurora-element.
1017 XX
1018 FT source nnnnnnnn:1..4581
1019 FT SO_feature five_prime_LTR ; SO:0000425:1..324
1020 FT SO_feature three_prime_LTR ; SO:0000426:4258..4581
1021 FT SO_feature transcription_start_site ; SO:0000315:191..196
1022 FT SO_feature polyA_signal_sequence ; SO:0000551:4482..4487
1023 FT SO_feature primer_binding_site ; SO:0005850:331..346
1024 FT SO_feature RR_tract ; SO:0000435:4247..4256
1025 XX
1026 CC Composite sequence derived from AB022762, X70361 and X70362
1027 CC Assembly based on strategy described in PMID: 10333568
1028 CC Defective element with incomplete ORFs
1029 CC Casey Bergman, 21-June-2016.
1030 XX
1031 SQ Sequence 4581 BP; 1102 A; 1074 C; 1456 G; 949 T; 0 other;
1032 TGTCGCGGAT CGAATATTGT TATCGATAGG CTCTAGTTAG TATTTTTGAG AAGTCCGAAT 60
1033 GTGGAAGGAT TTGTAAGCCC ATATGTGTCT GGGCACGTTG TTTTTGGCCA TTGTAAATTA 120
1034 CCGGGAAAAT TTAGCTTTTC ATTGTCGTGT AAGAGTTGGA GGACACACTG CGGTGAGCTA 180
1035 ATAAGTTAAG TTAGTTGCAA TTGTGAAACA TTGAATTCTT CAAGAATAAA ACGTGTTCTA 240
1036 CTACCACGGA TTAGTCTGCC CTTTCTTTCG GGAACCAATG TGTGGGGTAG CCGTTTAAGG 300
1037 CAACTCCCTG GACGCACGAC GACAACCTTT TATTCGCAGT CCTAGGGCGA CTGCAGGGGC 360
1038 AACTTGCGCT GGAATGACGG TTTAGACGGC CAGCTAGAGA GTTGCCGGAG CTGGAGTGAC 420
1039 GGTTTAGACG GCCAGCGAGG AGGATTTGTG TGAGCGCAGC CAGCGCTACG TACCGGCAGA 480
1040 GGAGTCGCAG TCAGCGACAT AGAGGGACGC AGCCAGCGTC GAACGCCGGT ACGAAAGGGT 540
1041 CGCAGCCAGC GACAAGGAGA CGCAAGAAGC GTCATTTGTG GAGACCGCAG CCAAGCATCC 600
1042 GTGGCCGCAG CCAGCGGCAC GAGGCGTCAG AGACGCCATT TCGGACGCGC AGAGGCGCCG 660
1043 CCATTTTTGG AGCTGGGAAA GATGCAGCAT TCCCCCAGGA AGAGTGCCCG GCTGAACGGA 720
1044 GGGGAAGTCA CCCCTATAAC AACAGTGAGT CAGCAGCCAG CCAGTAGTGG AGCAGGAACT 780
1045 CGGACGCGGG TGAACATCAC GGCGGCGTCG ATTCCTTGCC CGGCCACTAC GGTGACTACA 840
1046 GTAGCTTCCC AACCTAGAAG TACTGCTGTC ACAGCTGCGA GTTCAGTACC GGAGGTGAAC 900
1047 CAGCCCCTCG TGTTGGAACT CATGGAGAGG ATCGCAGCGT TGGAGAGGGA GCTGGAGAAG 960
1048 ACTAGATCCC TAGAAAGTGT GAGCACCGCC AATTGCGCGC CAATCGCAGT TGGCCCAAGC 1020
1049 GCAGTTGGCG CCAACAGTGG AGCGTCGGGG CGGCCGCCAT TTTGGAGCGG CCAGCTAATA 1080
1050 CCCACATCTA ACGGAGAGGC CTTACATAAC GGGGACTGGG CCAGGCATGC TGCAACGATT 1140
1051 GCGCCCTTTC CCACTGTAGT CCACTTCAGC GCGTGGCTAC AGGAGTACGC AAACGTGGTG 1200
1052 TGCACGGTTT TGGACGTCGA GGGAAAGGAG CCGAGGCGTC GACTTCTACA TGCAAGCGTC 1260
1053 GACCATAATG AATGCGATCA ACAGGATGAT CGGCATGGAG GTTGTCCCAT CTGTGGAGGA 1320
1054 CAGCATGAAA TATTGAACTG CAGAAAATTT ATTGGAGCTT CGCCACAGGA AAGGTGGAGC 1380
1055 AATGTGAAGA GGCATCGGCT CTGCTTCAAT TGCCTGCGAA GCGGGCACAC GGCTAGATCC 1440
1056 TGCTATACGC AAGGTGAGTG CCAGGTTAAT GGATGCCGAA GGGAGCATCA CCGTCTGCTA 1500
1057 CATGGTGCGG ACGGAGGAAC GAAGGCCGCT GCAGCGAGGT GGCTTCAGAC GCCACGAAGG 1560
1058 GAACCAGCAG CCAGCAGTTT CCAGACGCAG CCTAAAGGGG AGGCCTTCGC TACGAGATGG 1620
1059 TCACAGGGAC CAGGAGAGGA ACCGGCAGCC AGCCGTTCCA AGCAACAGTC TGGAGAGAGG 1680
1060 AGCTCCACGT GAAGCGGGAG CGCCCATGCA GAGGAATTTG AGCTGCGTTG ACGCCGAAGG 1740
1061 AGGCCGTCTA CTGTTCCGTA TACTGCCGGT TACGCTGTAC GGAGCGGGGC GAAAGGTGGA 1800
1062 TACATATGCG CTCCTAGATG AGGGATCCTC CGTCACGATG ATCGATGACG AACTACGAAG 1860
1063 GGATCTTGGA GTGCAAGGAG AGCGTCGGCA GCTAAATATC CAATGGTTTG GTGGTAAGGC 1920
1064 AACCAGAGAG CCTACCAACG TGGTGAGTCC GAAGATAAGT GGAGTTGGAA AGCCCACTCG 1980
1065 CCATGTATTG AGAAACGTTT ATGCCGTTTC GAGCTTGAGT TTGCCGATGC AGACATTGAG 2040
1066 CCGACGAGAT GTCCAGGGCG TGCACAGGGA TGCGCGTCTG CCCGATGAAG CCTTACAGCA 2100
1067 ACGTGGTGCC GAAGCTGCTC ATCGGTCTGG ATCACGGACA TCTGGGGTTG CCACTTAGGA 2160
1068 CGAGGCGGTT CGCTCGAGAG GGACCGTATG CGGCCGCAAC CGAGCTGGGC TGGGTTGTGT 2220
1069 TTGGGCCTGT AAGTGGGCAA CCGACCACGC CGTCACCGAG GTCCTGCCTA CTTGCCGTGT 2280
1070 CAGTGGATGA CGCGATGGAG AAGATGGTGG AGGACTATTT CGACATGGAG AACTTTGGAG 2340
1071 TGAAGACCGC GCCGCCGGTC GCAGCCAGCG ACGATGTCCG GGCCCAAAGG ATACTCGAAG 2400
1072 ACACCACGGT GAAAGTGGGG CGTCGCTACC AGACGGGATT ACTCTGGAAG GACGACCACG 2460
1073 TTGTGCTGCC ACCGAGATAT GAGGACGACG ACGTGCAAGT GAGCTTCGTG AGTGCGAGGA 2520
1074 CGAAGTGTGC CCCAATGAGA ACGATGACGA TCCCACGGCT GGAGCTGCAA GCAGCAGTTC 2580
1075 TTGGAACCAG GCTGATGAAC ACTGTCAAGG AGGAGCACAG TGTGGTCATC ACGGACCTGG 2640
1076 TGTTATGGAC GGACTCTAAG ACGGTGCTGA GATGGATCGG CAGCACCCAC CGCCGCTGAC 2700
1077 AATGCGGCTG ATGATGCGAC GCGGTCGCAG AAAAGGAGTC GACCTTAGCC AGGAATCAAG 2760
1078 GTGGCTAAGA GGACCTGCAT TTTTGATGCA GCCAGCAGCC AGCTGGCCGG GGTCTGAGGA 2820
1079 AGGAACTGAG CGTGTTCCAG ATGTCCCTGA TGAAGAAGAG ATGCCCAGTG AGTTTGCATT 2880
1080 AGTTGCGGTA GACGATTTTG TCATTCCGTT TCAGAGATTC TCGAGCTTCA GTCGCCTGGT 2940
1081 GAGGACCACA GCCTGGGTCC TACGGTTTGC GCGCTGGTGC CGCAAACAGC GAAACGATCT 3000
1082 CGAGGAATAC GGCCTTACCG CAGCCAGAAT GTAAGGCCGC CGGAACCGCA CTGTGCATCC 3060
1083 CGTACAGTGC GAGGAGGGCC GTATTACTGT CACACAGGCA CAGTCTGACG GAGCTGATTG 3120
1084 TGAGAGACTT CCACGCCAGG ATGAAGCATC AAAATGTGGA TGCTACGATC GCGGAGATCC 3180
1085 GGACAATGTT CTGGGTCACA AAGATGAGGC GTGTGATGCG GAGAGTCATC TCATCGTGCA 3240
1086 ACGAGTGCAA GTTGCAGCGA GCGCGGCCGA TGCCGCCGAT AATGGGACCC CATCCGGAAG 3300
1087 ACAAACTGGA TGCGGGTGGA TGGCCATTCA AATACACAGG ACTGGACTAC TTTGGGCCAC 3360
1088 TGCTGGTGAC TGTGTCCCGT CACAAGGAGA AGCTTGGGTC GCCTTGTTTA CGTGTTTGAC 3420
1089 GACAAGGGCG ATTCACCTGG AGCTGGCGCA TGACCTGTCG ACGGATTCCT GCATAATTGC 3480
1090 GATCAGGAAC TTCGTCTGCC GTAGAGGGCC AGTATATAGA CTGCGCAGCG ATAACGGCAA 3540
1091 GAACTTCGTG GGAGCTGACA GGGAAGCCAG GCGCTTTGGC GACGTATTCG AGATGGAGAA 3600
1092 GCTTCAGAGT GAGTTGACAA GCAGAAGCAT TGAATGGGTG TTTAATTGTC CAGCGAACCC 3660
1093 GTCTGAGGGC GGAGTTTGGG AGCGCATGGT GCAGTGCGTC AAGAGAGTAC TGCGTCATAC 3720
1094 CCAGAAGGAA GTTGCGCCGA GGGACCATGT ATTGGAGAGT TTCCTGATTG AGGCGGAGAA 3780
1095 TATTGTAAAC TCGCGTCCGC TCACCCACTT GCCTGTGGAT GTGGACCAGG AGGCGCCGTT 3840
1096 GACGCCAAAC GATCTTCTCA AGGGAGTAGC CAATCTGCCG GATACGCCTG GATTGGATGC 3900
1097 GGAGCTGCCC AAGGAAGGTA CTACGAGGAA GCAGTGGAGA ATTTCTCGCC TGCTACGAGA 3960
1098 CCGTTTCTGG AGGAAGTGGG TCATGGAGTA CCTGCCTACG CTTGTGCGCC GCGAGAAGTG 4020
1099 GTGCCGACGA ACGGAGCCCA TCCACCAGGG TGATGTGGTC TTCGTCTGCG ATCCTGCCTT 4080
1100 GGCCCGACGA GAGTGCCGCA AGGGTATCGT GGAGGAGATC TACAGCGGAG CTGATGGAGT 4140
1101 TGTCAGACGC GCTAAGGTGC GCGTGAACGA AAACGGCCTA TCTAGGACAA TGATGCGACC 4200
1102 CGTCTCTAAA CTTGCAGTTA TGGATTTGAG TGAAGCGGTT CTTCACGGGG TCGGGGATGT 4260
1103 CGCGGATCGA ATATTGTTAT CGATAGGCTC TAGTTAGTAT TTTTGAGAAG TCCGAATGTG 4320
1104 GAAGGATTTG TAAGCCCATA TGTGTCTGGG CACGTTGTTT TTGGCCATTG TAAATTACCG 4380
1105 GGAAAATTTA GCTTTTCATT GTCGTGTAAG AGTTGGAGGA CACACTGCGG TGAGCTAATA 4440
1106 AGTTAAGTTA GTTGCAATTG TGAAACATTG AATTCTTCCA GAATAAAACG TGTTCTACTA 4500
1107 CCACGGATTA GTCTGCCCTT TCTTTCGGGA ACCAATGTGT GGGGTAGCCG TTTAAGGCAA 4560
1108 CTCCCTGGAC GCACGACGAC A 4581
1109 //
1110 ID DMBARI1 standard; DNA; INV; 1728 BP.
1111 XX
1112 AC X67681; S55767;
1113 XX
1114 DR FLYBASE; FBte0000034; Dmel\Bari1.
1115 XX
1116 FT source X67681:1..1728
1117 FT SO_feature terminal_inverted_repeat ; SO:0000481:1..28
1118 FT SO_feature terminal_inverted_repeat ; SO:0000481:1701..1728
1119 FT SO_feature CDS ; SO:0000316:379..1398
1120 FT /name="Dmel\Bari1\ORF"
1121 FT /db_xref="FLYBASE:FBgn0043784"
1122 FT /db_xref="SPTREMBL:Q24258"
1123 FT /db_xref="NCBI_PROTEIN:CAA47913.1"
1124 FT /translation="MPKTKELTVEARAGIVARFKAGTPAAKIAEIYQISRRTVYYLIKK
1125 FT FDTVGTLKNKKRSGRKPVLDQRQCRQILGVVAKNPSASPVKIALESKNTIGKQVSSSTI
1126 FT RRRLKEADFKTYVVRKTIEITPTNKTKRLRFALEYVKKPLDFWFNILWTDESAFQYQGS
1127 FT YSKHFMHLKNNQKHLAAQPTNRFGGGTVMFWGCLSYYGFGDLVPIEGTLNQNGYLLILN
1128 FT NHAFTSGNRLFPTTEWILQQDNAPCHKGRIPTKFLNDLNLAVLPWPPQSPDLNIIENVW
1129 FT AFIKNQRTIDKNRKREGAIIEIAEIWSKLTLEFAQTLVRSIPKRLQAVIDAKGGVTKY"
1130 XX
1131 CC Derived from X67681 (g7640) (Rel. 36, Last updated, Version 6).
1132 CC Takis Benos and Michael Ashburner, 20-Aug-1997.
1133 CC Any changes to original sequence record are annotated in an FT line.
1134 XX
1135 SQ Sequence 1728 BP; 596 A; 291 C; 332 G; 509 T; 0 other;
1136 ACAGTCATGG TCAAAATTAT TTTCACAAAG TGCATTTTTG TGCATGGGTC ACAAACAGTT 60
1137 GCTTGTGCAG CAAGTGGGGG GAGGTGAAAT GCAAAAAAAC TTTTGCTTTT GCAAATTCAA 120
1138 ACCTATGCAG AGTCAGATGA AAGAAGAATT GAAAAAATAA CTGTTCCTAT GCGCAAGGAA 180
1139 GAGGCAAATG AAGAGATCTT TATCAGTTGT CAGAAGTATT TGCACACGGT TTCGTCGCAT 240
1140 CACAATTATT TTCACAACGC AATTTCTTCT TCAGTGATTG GTTTAGAGTG ACAAGTGCCG 300
1141 GTTTGTTTGC TTAAATACAT TTAAATTATT GAATAAAAAT TAGATTTAAT CATTTTCCTA 360
1142 TTACAGTTAT TAAATAAAAT GCCCAAAACA AAAGAGTTAA CAGTTGAGGC CCGGGCTGGT 420
1143 ATTGTTGCTA GGTTTAAAGC CGGTACACCT GCGGCCAAAA TAGCTGAAAT ATATCAAATT 480
1144 TCGCGTAGAA CTGTCTACTA CTTAATAAAA AAGTTTGATA CAGTTGGCAC ATTAAAAAAT 540
1145 AAAAAAAGAT CAGGCCGAAA ACCTGTGCTG GACCAAAGGC AATGCAGGCA AATACTTGGA 600
1146 GTTGTGGCGA AGAATCCTAG TGCCAGTCCG GTAAAAATTG CCTTAGAATC AAAAAATACA 660
1147 ATTGGCAAAC AAGTTAGTAG TTCTACAATT CGTCGCAGGC TAAAAGAAGC TGATTTTAAG 720
1148 ACATACGTTG TTCGCAAAAC GATTGAGATC ACACCAACCA ACAAAACAAA ACGTCTTCGA 780
1149 TTTGCGTTGG AATATGTTAA GAAGCCTCTT GACTTTTGGT TTAATATTTT ATGGACTGAT 840
1150 GAGTCTGCAT TTCAGTACCA GGGGTCATAC AGCAAGCATT TTATGCATTT GAAAAATAAT 900
1151 CAAAAGCATT TGGCAGCCCA GCCAACCAAT AGATTTGGTG GGGGCACAGT CATGTTTTGG 960
1152 GGATGTCTTT CCTATTATGG ATTCGGAGAC TTGGTACCGA TAGAAGGAAC TTTAAATCAG 1020
1153 AACGGATACC TTCTTATCTT AAACAACCAT GCTTTTACGT CTGGAAATAG ACTTTTTCCA 1080
1154 ACTACTGAAT GGATTCTTCA GCAGGACAAT GCTCCATGCC ATAAGGGTAG GATACCAACA 1140
1155 AAATTTTTAA ACGACCTTAA TCTGGCGGTT CTTCCGTGGC CCCCCCAAAG CCCAGACCTT 1200
1156 AATATCATTG AAAACGTTTG GGCTTTTATT AAAAACCAAC GAACTATTGA TAAAAATAGA 1260
1157 AAACGAGAGG GAGCCATCAT TGAAATAGCG GAGATTTGGT CCAAATTGAC ATTAGAATTT 1320
1158 GCACAAACTT TGGTAAGGTC AATACCAAAA AGACTTCAAG CAGTTATTGA TGCCAAAGGT 1380
1159 GGTGTTACAA AATATTAGTA TTGTATTTAT ATAAAATAAA GAAATTCTTA TGTTGAAATT 1440
1160 AGATGTTAAG CTGAAATTTA CTAAATTAAG TTGAGTGAAA ATACTTTTGA AGCGCAATAA 1500
1161 ACATGTGAAA ATACTATTGA CAACTTGCAT GCATATTTTC TTTTGCTTTA AGCTTTGTAC 1560
1162 TATGAACCGT TATCTTTCGT ATTTCTTTTC GACTACCTTC TGCATAGATC AAGCTAAGCG 1620
1163 ATAAGAACTA TTTCAGGCAA ATCGGACAAC AACAAGAAGA AATATAACAA AAAGAAGTTG 1680
1164 AAGTTTGCAA ATATTGTGCG TTGTGAAAAT ACTTTTGACC ACCTCTGT 1728
1165 //
1166 ID BS standard; DNA; INV; 5142 BP.
1167 XX
1168 AC nnnnnnnn;
1169 XX
1170 DR FLYBASE; FBte0000780; Dmel\BS.
1171 XX
1172 FT source nnnnnnnn:1..5142
1173 FT SO_feature CDS ; SO:0000316:341..2248
1174 FT SO_feature CDS ; SO:0000316:2245..2965
1175 XX
1176 CC Sequence identified by REPBASE:
1177 CC http://www.girinst.org/server/RepBase/RepBase6.6.embl/drorep.ref
1178 CC Assembled and annotated by Josh Kaminker & Michael Ashburner.
1179 CC REPBASE states this to be a consensus sequence.
1180 CC This replaces that from complement(X77571:651..5776) in versions
1181 CC previous to 4.8.
1182 XX
1183 SQ Sequence 5142 BP; 1652 A; 1222 C; 1075 G; 1193 T; 0 other;
1184 AAATCTGCAT TCATAGAGAT CGGTTGTGTC GCGCGTATGC AAAAGTGATC TATTTTGCTT 60
1185 TATTGTTGCA ATTTCTTGGG TGCTTAAAAT AGCACTCACC AGTACATTCG GGCGCTGCTT 120
1186 CGTGCGGTGT CGGCATCTGG CCAACAACAA AAAGCGTTAA TCGAAGTGCG GTGTAGCTAC 180
1187 GATACCTGCC CTTCGGGCAA CTTATTCCCC TCACCCCGCG CAAAGCCGCT GAAGGGGGCA 240
1188 ATAAAATCTA TGCTTATCAG CAAAACTGAT CCGTATTTGA TCTGTTTTGT GGTCAGTTAA 300
1189 GCAAGCTATT TTGTAAATAT TAAGAATTAT TATTAAGACA ATGGATGAGA ACAATTCTGA 360
1190 TGACACCCAG CTTTTAAATA AGCAGAGTAA CCATAGAACA ATGTTCTCAA TAGCTGGCAA 420
1191 ATTACCTCAC GAGATTAGAA ACGAGTGCCG ATCAGCAATT CAACGCTTTA CAAGCAGCGT 480
1192 AACTCAAAGC AGTAGCGTCA CCACAACAAC GGTGACATTT ACTAGTGCCA ATAACAGCAC 540
1193 CATATATACA ATGGCAAATG CCGCAATAAG CAGCCCGTGC CTTGGAACAA GATCCACTCA 600
1194 CCAGGAAAGT TCCACATTGA TAAACTCCGG AATCGTAGAA GATAATCTCA GCGATGCTGC 660
1195 CAGAAGGTTA TTAAATGACC AAAATCAGAG AGCGGGTAAA AGGAAAAATG GAAAGCCCTT 720
1196 GTCCCCCATC TCCAACCCGA AAAGAGGGAG TAGCAGCCAA GTTTTACACT CGCCCCCTAC 780
1197 GACTAGCCTG AAGATAAGCT CTAATAATAG GTTTGCCATT CTGGACACGG ATATTTCTAC 840
1198 TAACGAAGAA AGCGTGGAAG GCATGATGAT AGAGGGTGCT GATATTGACA GTGCCCATAT 900
1199 GGATGATTCT CAACTCGATG GTTCCAATAC TGGTCGAAAC TTGCAGGAAA CACACAATAC 960
1200 AGCCAATCAA CTTAATGATC ACAAAAAACC ACCACAAATT GTTGTAAATA TCAGAAACTT 1020
1201 GAATGATCTG TTTGAGCTTA TAAAAGAAAA GACAAGCTTA GATAACGTTG TCGTTAAAGC 1080
1202 TAATCAAGGG GAAACGGTCA GAATATTTCC AAAAGACAGC GACACTTACA GGAAAATAGT 1140
1203 GAGCCATATG GATGACATTG GTATTCAGTT TCACACTTAC CAAATGCTGA CAGATAAGCC 1200
1204 ACACAGAATT GTAGTAAGGG ACTTACATCA CAGTACATCA AACAAAGACA TAACCGCCGA 1260
1205 TCTGAAATGT TTAGGCTACG AAGTGCTCCA CATTCACAAC CCTAGTTCTA GGACTAATAA 1320
1206 GGACGAAAAA CTAAACATCT TTTTCATTAA TATAAAGCCC TGTGCAAAAA TTAATGAAAT 1380
1207 TTACCATGTC AAGACCCTTT GCCGACAGAA AATACGGATT GAAAGGATGA GAAAGTCTTC 1440
1208 TGAAATTGCG CAATGTCGTC GTTGTCAGGA GTACGGCCAT ACAGCTAAAT ACTGCCGCAG 1500
1209 ACACCCAAAT TGTGCCAGAT GTGGCGAAAA TCACCAAACC ATGCAATGCA CCCGACCGAT 1560
1210 AGACGCACTG CCCACATGTT ACCATTGCTC TGAAAATCAT ACGGCTAGCT TCAAAGGTTG 1620
1211 CCTAAAGTAT CAGGAGCTTC TTCGCAGATC TATGGGGCCT GCAAGAAATG GAAACAGGTT 1680
1212 AAATAAGAAC ACCCATCATC ACTCTCCTAG AGACCGGCAA GAGCTTCCTG CCTTGCAGCC 1740
1213 CAATTACCGC AAGAACAACA CCCAATCAAC AGTACAGCAG TTATCGACAC AACCACAGCT 1800
1214 TAATTTTGCC CAAAGCCAAC CATCTATAGG CACTGGTGGA AACAGAGCAG TATCCTATGC 1860
1215 TACAGTAGTA AAAGGATACC CAAAAATAGC GCCCTCCAAG GACGGACCAG CCCAGCGTCA 1920
1216 ACGCTTAAAC AACCCACAAA CGAAACAAAT ACTGCAGCAA CACCGATCGA ATACACAGCA 1980
1217 GAATAACTCA TCTGATGTGC AAGTATTCTT ACAACAGCAA CAACAACAGT TTCTGGAATG 2040
1218 GCAACAGCAG ATCCAACAAC AACAACACCA ACAGTTTCTT ATGTGGTTGC AACAGCAGCA 2100
1219 GCAAGAACAA CTACAGTATA AAAGCCAAAC CAATCAACGA CTGGAAAAGC TTGAAAAAAT 2160
1220 GGTTCTTGAA CTAGCGAATA TGTTAAAAGA ATGGGCTGGG AGTGAACTTA AGCCCCAGCT 2220
1221 CTTTAACAAC GTCTCAGCCT CCCTATGAAT CCACTAAAGA TTCTTATTTG GAATGCTAAC 2280
1222 GGCATTTCAA GAAAAGCCAA AGATGTTGAG CTGTTCGCGC ACAACAAAAA GATAGACATC 2340
1223 CTTCTTGTGA CTGAACTAAG ACTCAAAAGA GGGGAAACTG TAAAGATATA TGGATATGCG 2400
1224 TACTATCCAG CATATAGGCC ATCCCTTAAT AATAATAGTG TTGGCGGAGT AGCGGTGTTC 2460
1225 GTGAGGACAA CTCTTCGCCA CTTTCCACAA AGGGTCATTG AGACACGCCA CATACAATTG 2520
1226 TCATCAGTAA AAGTAGCCAC AGGACTCGGG GACCTGCAGT TTAGCGCTAT TTACTGCTCC 2580
1227 CCAAGTACTA GAATCGAGGA AAGACATTTT ACTGACATAA TACGCGCCTG CGGCCAAAGG 2640
1228 TACTTGGTAG GTGGCGACTG GAATGCCCGC CACTGGCTTT GGGGCGACAC TTGCAATTCA 2700
1229 CCTCGCGGGC GGGAACTAGC AGAAGCCTTG TCCGTGACTG GAGCTAAGAT CCTCGCAACT 2760
1230 GGCTCTCCGA CAAGGTATCC GTATGTGCCC AGCCATACGC CCTCATGCAT AGATTTCGCA 2820
1231 GTGTATCATG GTATACCAGA CCACCTAGCA ACTATAACAC AAAGCTGGGA CTTGGATTCT 2880
1232 GATCACTTGC CTCTTATCAT TAGCATTGAG ACAGACAGTA TTCATGTCAA TCCAAGTCCC 2940
1233 AGGCTAGTCA CCAAACACAC TGACCTCCTT GCCTTTAGCC GACAATTGGA GAGCCTTATT 3000
1234 TCGCTGAACA CCACGCTTAA TTCTGGTGAG GAAATTGAAA TGGCTGTTGA CAACCTAACT 3060
1235 GAAAGCATAC ATAGGGCCGC GGCTGTCTCT ACTTCTCCCG TCCCTCGGAT AGGCACCACA 3120
1236 TATGGGATAG TCTTGACAAG AGAGGCTAGA GAGCTTCTGA CACAGAAAAG AAGACTCCGA 3180
1237 AGGCGAGCAA TCCGATCTCA AGACCCCTGG GACCGACTTT TATGGAACCG TGCTGCAAAG 3240
1238 CAACTACGAA ACGTCCTCAG AGAACTTCGA AGCAACTTTT TTGAGCAGAA ACTAGCTAGT 3300
1239 ATGGACTACA CAGTGGATGC TGGATACTCG CTATGGAAAT GCACCAAGTC CCTTAAAAGA 3360
1240 CAGCCGTTTA GACAGGTTCC TATAAGGTGT CCGGGAGGCG AACTTGCTAA AAATGAAGAG 3420
1241 GAGCAGGCTA ATTGTTTTGC AAATCATCTG GAGACAAGGT TCACCCACTT CCAATTCGCT 3480
1242 ACAACGGAGC AGTATCAAGA GACGCTTGAT AGCCTAGAGA CACCTCTGCA AATGTCACTA 3540
1243 CCCATTAAGC CCATCAGGGT TGAGGAAATT GTCGAAGCTA TCAAATCTCT TCCGTTAAAG 3600
1244 AAGTCTCCTG GCATCGACAA CGTTTGCAAT GCCACACTAA AAGCACTACC TGTTCGAGCA 3660
1245 ATTCTCTACT TGGCGCTGAT ATATAATGCC ATACTCAGGG TGCAGTTTTT CCCAAAGCAG 3720
1246 TGGAAAATGG CAGCAATCCT AATGATACAT AAGCCTGGTA AACCTGAAGA GAGCCCTGAA 3780
1247 TCGTACCGAC CCATAAGTCT TTTATCTTCG CTATCCAAGC TATGGGAACG ACTGATTGCC 3840
1248 AACAGATTAA ATGACATTAT GACCGAGCGT CGTATCCTGC CGGATCATCA GTTTGGCTTT 3900
1249 CGTCAGGGAC ACAGTACTGT GGAGCAGGTA CACAGACTGA CAAAACATAT CCTTCAGGCC 3960
1250 TTTGATGATA AGGAATACTG CAATGCTGTG TTCATTGACA TGCAACAGGC ATTCGATAGG 4020
1251 GTCTGGCATG ACGGCCTTAT CAGCAAAGTT AAAAAGTTAT TCCCAGCACC ATACTATGGA 4080
1252 GTCCTAAAAT CATACTTGGA AGATCGGAGA TTCATGGTCA GGGTCAGAAA CTCCTACTCG 4140
1253 ATTCCCCGCG TTATGAGAGC TGGAGTTCCG CAGGGCAGCG TACTGGGACC GTTGCTCTAC 4200
1254 TCAGTATTTA CTGCAGATCT GCCCTGCCCA AACGCCTATC ATATGGCAGA TCCCAGGAAG 4260
1255 GCCCTTCTTG CTACGTACGC TGACGATATT GCCCTGCTGT ACAGCTCTAA TTGTTGCAAC 4320
1256 GAGGCAGCAA GGGGTCTCCA AGAGTACCTC ACCACTCTGG CTGCATGGTG CAAAAGATGG 4380
1257 AATTTAAAGG TCAATCCGCA AAAGACCATC AATCCCTGCT TCACCTTGAA GACCTTAAGT 4440
1258 CCCGTCACCG CACCCATAGA GCTGGAAGGT GTAATCCTAG ATCAACCTTC ACAGGCTAAG 4500
1259 TACCTCGGGA TTACCCTTGA TAAACGGTTG ACTTTCGGCC CGCACCTGAA AGCTACGACT 4560
1260 CGGAGATGTT ATCAAAGGAT GCAACAACTT CGATGGCTGT TAAACAGAAA AAGCACCATG 4620
1261 ACACTGAGAG CCAAAAGAGC AGTCTACGTC CACTGCGTAG CCCCGATCTG GCTGTACGGA 4680
1262 ATACAGATCT GGGGTATCGC AGCAAAATCC AACTACAACC GCATTCAGGT ATTGCAAAAT 4740
1263 CGTGCCATGC GTGCAATTAC AGACTGCCCA TACTATGTAC GTGGCACTAC CCTTCACCGT 4800
1264 GATCTGAATC TTCATACAGT GGAAGAGCAG ATCTCCAGGC ACACCAGCAG ATATAGTGAT 4860
1265 AGACTAAGAC GACACCACAG TATACTTGCT AGACGCTTAC TCCCTGCTAG GCCTCTAAGG 4920
1266 AGATTAAAAA GGAAGGGTTT CGCCAAAACA CTTGGACAAC CCTAAAGACC CCCTCGAAAT 4980
1267 ATGAGACAAA GTTGTAAGTC CTCACATGAT TAGTGAGAGG TTTGGTTCTA TCTTTTATAT 5040
1268 GTTAATTGCG CTGTTATGTT ACTGTTATTG CATTGTATTG ATTCATCGCT TCTAAATAAA 5100
1269 TAATAAAAAA AAAAAAAAAA AAAAAAAAAA AAAAAAAAAA AA 5142
1270 //
1271 ID DMU89994 standard; DNA; INV; 6411 BP.
1272 XX
1273 AC U89994;
1274 XX
1275 DR FLYBASE; FBte0000739; Dmel\Burdock.
1276 XX
1277 FT source U89994:1..6411
1278 FT SO_feature five_prime_LTR ; SO:0000425:1..275
1279 FT SO_feature three_prime_LTR ; SO:0000426:6136..6411
1280 FT SO_feature CDS ; SO:0000316:564..2057
1281 FT SO_feature start_codon ; SO:0000318:1..3
1282 FT /name="Dmel\Burdock\gag"
1283 FT /db_xref="FLYBASE:FBgn0043782"
1284 FT /db_xref="SPTREMBL:O01350"
1285 FT /db_xref="NCBI_PROTEIN:AAB50147.1"
1286 FT /translation="MSDSDNLLDNLVSSLNKWSAHQASRQNSAEKNNKSSDNWWSKTKT
1287 FT TSEMEFEAQLKAIVESAVAGALAVQKQSFEKQLQEMNERIGKLTVNTPEVETYVDAEIR
1288 FT PGVVCSEPLDILKSLPDFDGKSETYVSWRKAAHVAFKVFKDYEGSSTFYQALGIMRNKI
1289 FT KGPANTVLASFNTPLHFKAMISRLDFTYSDKRPIYLIEQELSTLRQGDMTLTEFYDEVE
1290 FT KKLTLLTNKTIMTFDSALAMSLNEKYRTDALRVFVTGAKKSLSDILFAKGPKDLPTALA
1291 FT LAQEVESNHERYQFALIYSKNIGDRGQKIEQRHSDKDRNSIMPMQTKNPYFSKRQVHTY
1292 FT DNQERQDPVQLTNPDVSMRSRRTGNFGQTPFPTQGNIWPSQQQNSWPSQQQYSWPSQQQ
1293 FT NSFRTQNQFASQPQQQNTSQAQGHFGYAQASKRPTSGSARFTGPKQQRINYLPHEKGQC
1294 FT EEDTDGYQKEAEAEVDDYEDELVNYDHVHFLATNPCYRT"
1295 FT SO_feature CDS ; SO:0000316:<1994..5119
1296 FT SO_feature start_codon ; SO:0000318:1..3
1297 FT /name="Dmel\Burdock\pol"
1298 FT /db_xref="FLYBASE:FBgn0043781"
1299 FT /db_xref="SPTREMBL:O01351"
1300 FT /db_xref="NCBI_PROTEIN:AAB50148.1"
1301 FT /translation="GRTSELRSCSFFSHKSLLPYIEREIAGRTIKLLIDTGASKNYIQP
1302 FT LPELKNIMPVQNKFTVKSLHGCNTVKQKCFIKLFNTSVQFFILPSLSSFDAIIGLDLLK
1303 FT QGNATLDFKNKTLNINNEVESIQFLRCDSVNFANIENIVVPNQISNKFHTMLRNRLAVF
1304 FT AEPEEALPYNTNIVATIRTEDDQPIYSKLYPYPMGVSDFVNKETHALLKDGIIRPSSSP
1305 FT YNNPVWVVDKKGTDEEGNTKKRLVIDFRKLNLKTIDDKYPIPNVVWILSNLGKARFFTT
1306 FT LDLKSAFHQILLAEKDRAKTAFSVGNGKYEFCRLPFGLKNAPSIFQRAIDDVVRDRIGK
1307 FT SCYVYVDDVIIFSNGIEDHVNDVAWVLDRLSGANMRVSKEKSFFFKESVEYLGFMVSSG
1308 FT GITTSPSKVEAIQKYNQPTNLFSVRSFLGLASYYRCFIKDFASIARPLTDILKGENGKV
1309 FT SASQSKKIPISFDERQCSAFEKLKNVLVSENVMLLYPDYRKAFDLTTDASAFGLGAVLS
1310 FT QDGKPVTMISRTLQDRELNFATNERELLAIVWALKSLRNYLYGVKNLNIFTDHQPLTYA
1311 FT VSDRNPNAKIKRWKAFIDEHNAKIFYKPGKETYVADALSRQAIHVLEDEPQSDIATIHS
1312 FT EISLTFTIETIDKPVNCFRNQIVIDEGTADSTRTFVIFGSKTRHLIQFLDKETLIGRIR
1313 FT DVVKPDVVNAIHCELPVLAFIQNSLVNDFPATTFRHTMKMVSDIFNQTEQREIVSLEHN
1314 FT RAHRAAQENVKQILQYYFFPKMSQIAATFVSNCLVCQKAKYDRHPQKQILGRTPIPSHV
1315 FT GETLHIDIFSTGRNYFLTCIDKFSKFAIVQPIGSRTITDLEPAIMQLMNFFPHSKTIFC
1316 FT DNEPSINSESIKSLLKNRFNVDIANAPPLHSTSNGQVERFHSTLLEIARCLKLDSGMND
1317 FT TVNLILQATIEYNKTVHSVTNRRPIDIIHSTPPELANEIVEMVNEAQEKQLRRENVTRR
1318 FT DRTFEVGETVMVKQNNRLGNKLTPRYREELIEADLGTTVLIKGRVVHKDNLR"
1319 XX
1320 CC Derived from U89994 (g1905850) (Rel. 51, Last updated, Version 1).
1321 CC Takis Benos and Michael Ashburner, 20-Aug-1997.
1322 CC Any changes to original sequence record are annotated in an FT line.
1323 XX
1324 SQ Sequence 6411 BP; 2219 A; 1259 C; 1204 G; 1729 T; 0 other;
1325 AGTTAACACA ATCACAAAAC ACCCGAAATA TAGTCGTAAG CCTCAAGTGC TTTTCCCATC 60
1326 TATAGATCGA GCTTTACCTA TAAGAAACTG TAACTTGTTA AGCTTTAGAG ATAAGAACTC 120
1327 TTGCTATACT TAAGTCAGTC GATTTTGGAA GATTAGAAGC GTCGGTCATC GCCACGTACT 180
1328 TACTATTCGT CTCATTAAGT GCAGACCGCG CAAGCCTATT GTAATTAATA AACTTACGCT 240
1329 AATAAATATA TGGAAAATCT ACTAAAATGA TAATTGGCGC CCAAACGGAT ATAAAAACCT 300
1330 ACGATAACTG AATAATTATA AATAAATAAC AAAAGGAGGA TCCGGAGACA AAACCAGCGG 360
1331 CTTTGGCTAA TTAACTCTAA CCTAAGAAAT AAAAATTTGC TGATTACATA AAATATAATA 420
1332 TTAATTACTA AGACCATCTA CCTTAAAATT GTTTGTTAAT CACTATTATT ATATTGTAAG 480
1333 TATAACGCTT ATTGAACGAA TTAAAAATAT TATTATTATT ATTATATTAT AACCTATGCA 540
1334 AAGAGTATTG ATAATAAAAA TACATGAGTG ACAGTGATAA CCTTTTAGAC AACCTAGTGT 600
1335 CAAGCTTAAA TAAATGGTCA GCGCACCAGG CAAGTAGGCA AAACAGTGCA GAAAAAAATA 660
1336 ATAAGTCATC AGATAATTGG TGGTCAAAAA CAAAGACAAC TAGCGAAATG GAATTTGAAG 720
1337 CTCAGTTAAA AGCGATCGTA GAGAGTGCTG TTGCCGGTGC GCTCGCAGTC CAAAAACAAT 780
1338 CATTTGAAAA GCAATTGCAG GAGATGAATG AGCGAATCGG GAAATTAACA GTGAACACCC 840
1339 CAGAGGTGGA AACTTATGTA GATGCTGAAA TTAGACCAGG TGTTGTCTGT AGCGAGCCTC 900
1340 TAGATATACT TAAATCTCTG CCAGATTTTG ATGGCAAAAG TGAAACATAT GTGTCGTGGA 960
1341 GAAAAGCGGC TCATGTCGCT TTTAAAGTTT TCAAAGATTA CGAGGGAAGT TCAACATTTT 1020
1342 ACCAAGCTCT TGGTATTATG CGAAATAAAA TAAAAGGTCC AGCGAATACA GTATTGGCTT 1080
1343 CTTTTAATAC TCCGTTACAT TTCAAAGCAA TGATCAGCCG TCTTGATTTC ACATATTCTG 1140
1344 ACAAAAGGCC GATCTATCTA ATCGAACAAG AGCTATCAAC TTTGCGACAG GGAGACATGA 1200
1345 CTCTTACTGA ATTCTACGAT GAAGTCGAGA AAAAACTGAC CCTACTTACC AACAAGACAA 1260
1346 TAATGACATT TGATAGTGCC TTGGCGATGT CACTGAATGA AAAGTACAGG ACGGACGCGT 1320
1347 TACGTGTATT TGTAACCGGA GCTAAGAAAT CGTTGAGCGA CATTCTTTTT GCAAAAGGTC 1380
1348 CAAAAGATTT ACCAACTGCT CTCGCTTTAG CGCAAGAGGT CGAGTCGAAC CATGAGCGTT 1440
1349 ACCAATTCGC CCTTATTTAT TCTAAAAATA TTGGAGACAG GGGTCAGAAA ATCGAACAAA 1500
1350 GGCACAGCGA TAAGGATAGA AACTCAATCA TGCCCATGCA AACTAAAAAC CCATATTTTA 1560
1351 GCAAGCGTCA GGTGCATACT TATGATAACC AGGAAAGACA AGATCCAGTC CAGTTAACAA 1620
1352 ATCCTGATGT ATCCATGCGA TCTAGAAGAA CTGGAAATTT TGGACAAACT CCATTTCCGA 1680
1353 CTCAGGGAAA TATTTGGCCA TCCCAACAGC AAAATTCTTG GCCATCTCAA CAACAATATT 1740
1354 CTTGGCCATC CCAACAACAA AATTCATTTC GAACACAAAA TCAATTCGCA TCGCAACCCC 1800
1355 AACAGCAAAA CACAAGTCAG GCTCAGGGAC ATTTTGGGTA TGCGCAAGCA TCAAAAAGAC 1860
1356 CAACGAGTGG CAGTGCAAGG TTTACAGGGC CAAAACAGCA GAGGATCAAC TACTTACCTC 1920
1357 ATGAGAAAGG TCAATGTGAG GAAGATACAG ACGGTTATCA AAAGGAGGCA GAAGCGGAGG 1980
1358 TTGATGATTA TGAGGACGAA CTAGTGAATT ACGATCATGT TCATTTTTTA GCCACAAATC 2040
1359 CCTGCTACCG TACATAGAAA GAGAGATAGC AGGGAGAACC ATAAAACTTT TGATTGACAC 2100
1360 CGGGGCTTCG AAAAATTACA TACAGCCCCT CCCTGAATTA AAAAACATAA TGCCGGTACA 2160
1361 AAATAAATTC ACGGTAAAAT CGCTTCATGG TTGCAACACC GTCAAACAGA AATGCTTTAT 2220
1362 TAAGCTATTT AACACATCTG TTCAATTCTT TATTCTTCCA AGTCTCTCTA GTTTTGACGC 2280
1363 AATAATAGGA CTTGACCTTT TGAAACAGGG AAATGCAACG TTAGATTTTA AGAACAAAAC 2340
1364 GTTGAATATC AACAATGAAG TGGAATCTAT TCAGTTTTTG AGATGTGACA GCGTAAATTT 2400
1365 CGCCAACATA GAGAATATTG TGGTTCCAAA TCAGATATCT AATAAATTCC ATACAATGCT 2460
1366 TCGAAACCGA TTGGCCGTCT TTGCGGAACC GGAAGAAGCA CTGCCGTATA ATACCAACAT 2520
1367 TGTTGCCACA ATACGTACTG AGGACGACCA ACCCATTTAC TCAAAACTCT ATCCGTACCC 2580
1368 CATGGGCGTA TCGGATTTTG TGAATAAGGA GACACATGCT TTGTTAAAGG ACGGAATTAT 2640
1369 CAGGCCCTCG TCGTCACCTT ACAACAATCC GGTTTGGGTA GTCGATAAAA AAGGTACAGA 2700
1370 TGAAGAGGGA AATACTAAGA AAAGGTTGGT TATAGATTTT AGAAAACTAA ATTTAAAAAC 2760
1371 AATCGACGAC AAGTACCCTA TACCAAACGT AGTATGGATC TTGTCAAATT TGGGAAAAGC 2820
1372 CAGATTCTTT ACAACCCTTG ACCTTAAATC GGCGTTTCAC CAAATTCTGC TCGCAGAAAA 2880
1373 GGATAGAGCG AAAACTGCCT TTTCAGTAGG AAATGGAAAA TACGAGTTTT GCCGTTTGCC 2940
1374 GTTTGGCTTG AAAAATGCCC CAAGTATTTT TCAACGTGCT ATTGATGATG TTGTTAGGGA 3000
1375 CCGTATAGGA AAGTCATGTT ACGTTTACGT TGACGACGTA ATAATATTTT CAAACGGAAT 3060
1376 TGAGGACCAC GTAAACGACG TTGCTTGGGT ACTAGACAGA CTGTCTGGGG CAAACATGAG 3120
1377 GGTTTCTAAA GAGAAATCGT TTTTCTTCAA GGAAAGCGTC GAGTATCTCG GATTCATGGT 3180
1378 GTCAAGTGGA GGTATCACAA CCAGTCCTAG CAAAGTAGAG GCTATTCAGA AATATAATCA 3240
1379 ACCTACTAAT CTGTTTAGTG TTCGATCGTT TTTAGGGCTA GCAAGTTATT ACCGCTGCTT 3300
1380 TATTAAGGAC TTCGCCTCTA TTGCTAGACC ACTCACTGAC ATTCTGAAGG GTGAAAACGG 3360
1381 AAAGGTTTCC GCAAGCCAGT CTAAAAAGAT ACCAATTTCT TTCGATGAAA GACAATGTTC 3420
1382 TGCTTTTGAG AAGCTTAAAA ATGTTCTTGT CTCCGAAAAT GTAATGTTAT TGTATCCCGA 3480
1383 TTATAGAAAA GCCTTTGACT TAACAACAGA CGCTTCGGCT TTTGGCCTGG GGGCAGTCTT 3540
1384 ATCACAGGAT GGCAAGCCTG TTACAATGAT TTCGAGAACT TTACAGGATA GAGAACTTAA 3600
1385 TTTCGCAACA AATGAACGAG AACTTTTGGC CATCGTTTGG GCTTTAAAGT CTCTTAGGAA 3660
1386 CTATCTATAT GGTGTCAAAA ACTTAAACAT TTTTACAGAT CACCAGCCGT TAACATACGC 3720
1387 CGTGTCAGAT AGGAATCCAA ATGCAAAAAT CAAGAGATGG AAGGCGTTTA TAGACGAACA 3780
1388 TAATGCTAAA ATTTTCTATA AACCTGGCAA GGAGACCTAT GTTGCCGATG CACTATCCAG 3840
1389 GCAGGCTATT CATGTCCTAG AGGACGAACC CCAGTCAGAC ATTGCAACAA TACATAGCGA 3900
1390 AATTTCATTG ACTTTTACAA TCGAAACTAT CGACAAGCCG GTTAACTGTT TTAGAAACCA 3960
1391 AATTGTGATA GATGAGGGCA CCGCAGACTC AACTCGAACT TTTGTTATTT TCGGAAGCAA 4020
1392 GACAAGGCAT CTAATACAGT TTCTAGACAA AGAGACCTTA ATCGGAAGAA TTCGTGATGT 4080
1393 GGTTAAGCCG GATGTAGTGA ATGCGATACA CTGCGAATTA CCTGTACTAG CTTTCATTCA 4140
1394 AAACAGTCTT GTAAATGACT TTCCAGCAAC AACCTTCCGA CACACTATGA AAATGGTCAG 4200
1395 CGACATTTTT AATCAAACTG AGCAACGGGA AATAGTGTCT TTGGAGCACA ACAGAGCGCA 4260
1396 TAGGGCAGCA CAGGAGAATG TAAAACAAAT TCTTCAATAC TACTTTTTCC CTAAAATGTC 4320
1397 ACAAATAGCC GCTACCTTTG TTTCTAACTG CTTGGTTTGT CAAAAAGCCA AATACGACCG 4380
1398 CCATCCGCAA AAGCAAATCC TCGGGAGAAC ACCTATTCCG TCACATGTAG GCGAGACATT 4440
1399 GCATATTGAT ATATTTTCTA CGGGCAGGAA TTACTTTTTG ACATGTATTG ACAAATTTTC 4500
1400 CAAATTCGCT ATTGTGCAAC CAATCGGCTC TCGAACGATA ACTGATTTAG AACCTGCAAT 4560
1401 TATGCAACTA ATGAACTTTT TTCCCCATTC AAAGACAATA TTTTGTGACA ATGAACCGTC 4620
1402 CATAAATTCC GAGTCAATCA AGTCACTTTT GAAAAATCGT TTTAATGTTG ACATAGCGAA 4680
1403 CGCACCTCCA CTTCATAGTA CCTCAAACGG ACAGGTTGAA AGGTTTCACA GCACGCTTTT 4740
1404 AGAAATAGCT CGATGCCTGA AACTTGACAG TGGAATGAAT GATACAGTCA ACCTTATTCT 4800
1405 TCAGGCAACA ATAGAATACA ATAAGACGGT GCACTCAGTC ACCAATAGAA GACCGATCGA 4860
1406 CATTATTCAT TCAACTCCTC CCGAATTGGC TAACGAGATA GTAGAAATGG TTAACGAAGC 4920
1407 TCAGGAAAAA CAGCTAAGAA GAGAAAATGT AACAAGACGA GACAGAACCT TTGAGGTGGG 4980
1408 AGAAACCGTC ATGGTAAAAC AAAACAATCG CTTGGGAAAT AAACTAACCC CACGGTATAG 5040
1409 GGAAGAACTA ATCGAAGCAG ACCTCGGGAC AACGGTCCTC ATAAAAGGGA GGGTCGTTCA 5100
1410 TAAAGATAAT CTACGCTAGG TTTAGTATTT CTTTTCCTTT TGTGACCATC GCCAAGTTAG 5160
1411 CAAAATACAA ACGTGAAATC TGAACACTAG TAAAAGAGTT TGCAAACATT TTTCAATTAA 5220
1412 ATATTTGTCA AATCCTTCTT ATTTAATCTT TAAACATTTT GTATTATTTC CGCTTCATCC 5280
1413 TCTTTAGAAA ATTTTAAAGG TATGTGATGA AATGCTAGAC CCGAATGATT TGAAAACTTA 5340
1414 AAGTCCACGC AACCACAAAT ATTTCCTGAA ACTACCATAG AAAATAAATG CATTACCAAA 5400
1415 ACGGCATAAT AACAGTATAG CGCACTCACT CTAATTAGAT TTCAAATTCC CGATTAAAAA 5460
1416 AAAAATAAAA CACTAATGTT ATCAATACCC TTTCCTGATT CTGTTCAACT AAAATAGGAA 5520
1417 AATCAATACT TGCAATCAAT AAGCGTTTTA CTACATACTT TAATATCAAA ATATCTGAAT 5580
1418 GAACTTTATT ATAAAATTAT AATTGTTATA CTTAATTATT GTCAAAACTT TAGTATTAAA 5640
1419 ACTGTAACTA CCTCTTAAGT AGATGAGAAG AGTAGAAGAG GGAATTAAGA TCTATCAACG 5700
1420 TAGTATCTGC TAAAGACGTA AAGATGCGGC AACTATTTCT GCGCCTGGGT ACTGAAACGA 5760
1421 CGAACTGAAT AATATCTGCC ATCAGACGCC AACCAGAGTG CGTTCAACAC ATACGTTTTG 5820
1422 ATGGTCAACT AGTTCAACCA ACATCAGCAT CATCGTCGTC AACAAGTCGA CGGTTACAAT 5880
1423 AAAGATTTTT TCCAAGTTCG CTACGATCAT CTCCAGAACC TTGTTGCGAA CCCATGACAT 5940
1424 GGAGAATCAG CAGCATTTAC GAACTTCTCG GATCATCCAG ACACGCAGAG CTGCCTTCCC 6000
1425 TTCGATGGTT TAACGCAGTA CCAGGTTGGC AGTATGGGAA CTTAGTGCAC AACCAATGTT 6060
1426 ACCCGTAAGA TCCGCTTTCA AATAGATTTG CCAATTGTAA AAAGTCTGTG GACAGCCTTC 6120
1427 GTCTTAGAAG GGGAGGAGTT AACACAATCA CAAAACACCC GAAATATAGT CGTAAGCCTC 6180
1428 AAGTGCTTTT CCCATCTATA GATCGAGCTT TACCTATAAG AAACTGTAAC TTGTTAAGCT 6240
1429 TTAGAGATAA GAACTCTTGC TATACTTAAG TCAGTCGATT TTGGAAGATT AGAAGCGTCG 6300
1430 GTCATCGCCA CGTACTTACT ATTCGTCTCA TTAAGTGCAG ACCGCGCAAG CCTATTGTAA 6360
1431 TTAATAAACT TACGCTAATA AATATATGGA AAATCTACTA AAATGATAAT T 6411
1432 //
1433 ID DMCOPIA standard; DNA; INV; 5143 BP.
1434 XX
1435 AC X02599;
1436 XX
1437 DR FLYBASE; FBte0000023; Dmel\copia.
1438 XX
1439 FT source X02599:21..5163
1440 FT SO_feature five_prime_LTR ; SO:0000425:1..276
1441 FT SO_feature three_prime_LTR ; SO:0000426:4867..5143
1442 FT SO_feature polyA_signal_sequence ; SO:0000551:1990..1999
1443 FT SO_feature polyA_signal_sequence ; SO:0000551:5063..5073
1444 FT SO_feature primer_binding_site ; SO:0005850:277..291
1445 FT /bound_moiety="tRNA:M-i-RB"
1446 FT SO_feature CDS ; SO:0000316:432..4661
1447 FT /name="Dmel\copia\GIP"
1448 FT /db_xref="FLYBASE:FBgn0013437"
1449 FT /db_xref="SWISS-PROT:P04146"
1450 FT /db_xref="NCBI_PROTEIN:CAA26444.1"
1451 FT /translation="MDKAKRNIKPFDGEKYAIWKFRIRALLAEQDVLKVVDGLMPNEVD
1452 FT DSWKKAERCAKSTIIEYLSDSFLNFATSDITARQILENLDAVYERKSLASQLALRKRLL
1453 FT SLKLSSEMSLLSHFHIFDELISELLAAGAKIEEMDKISHLLITLPSCYDGIITAIETLS
1454 FT EENLTLAFVKNRLLDQEIKIKNDHNDTSKKVMNAIVHNNNNTYKNNLFKNRVTKPKKIF
1455 FT KGNSKYKVKCHHCGREGHIKKDCFHYKRILNNKNKENEKQVQTATSHGIAFMVKEVNNT
1456 FT SVMDNCGFVLDSGASDHLINDESLYTDSVEVVPPLKIAVAKQGEFIYATKRGIVRLRND
1457 FT HEITLEDVLFCKEAAGNLMSVKRLQEAGMSIEFDKSGVTISKNGLMVVKNSGMLNNVPV
1458 FT INFQAYSINAKHKNNFRLWHERFGHISDGKLLEIKRKNMFSDQSLLNNLELSCEICEPC
1459 FT LNGKQARLPFKQLKDKTHIKRPLFVVHSDVCGPITPVTLDDKNYFVIFVDQFTHYCVTY
1460 FT LIKYKSDVFSMFQDFVAKSEAHFNLKVVYLYIDNGREYLSNEMRQFCVKKGISYHLTVP
1461 FT HTPQLNGVSERMIRTITEKARTMVSGAKLDKSFWGEAVLTATYLINRIPSRALVDSSKT
1462 FT PYEMWHNKKPYLKHLRVFGATVYVHIKNKQGKFDDKSFKSIFVGYEPNGFKLWDAVNEK
1463 FT FIVARDVVVDETNMVNSRAVKFETVFLKDSKESENKNFPNDSRKIIQTEFPNESKECDN
1464 FT IQFLKDSKESENKNFPNDSRKIIQTEFPNESKECDNIQFLKDSKESNKYFLNESKKRKR
1465 FT DDHLNESKGSGNPNESRESETAEHLKEIGIDNPTKNDGIEIINRRSERLKTKPQISYNE
1466 FT EDNSLNKVVLNAHTIFNDVPNSFDEIQYRDDKSSWEEAINTELNAHKINNTWTITKRPE
1467 FT NKNIVDSRWVFSVKYNELGNPIRYKARLVARGFTQKYQIDYEETFAPVARISSFRFILS
1468 FT LVIQYNLKVHQMDVKTAFLNGTLKEEIYMRLPQGISCNSDNVCKLNKAIYGLKQAARCW
1469 FT FEVFEQALKECEFVNSSVDRCIYILDKGNINENIYVLLYVDDVVIATGDMTRMNNFKRY
1470 FT LMEKFRMTDLNEIKHFIGIRIEMQEDKIYLSQSAYVKKILSKFNMENCNAVSTPLPSKI
1471 FT NYELLNSDEDCNTPCRSLIGCLMYIMLCTRPDLTTAVNILSRYSSKNNSELWQNLKRVL
1472 FT RYLKGTIDMKLIFKKNLAFENKIIGYVDSDWAGSEIDRKSTTGYLFKMFDFNLICWNTK
1473 FT RQNSVAASSTEAEYMALFEAVREALWLKFLLTSINIKLENPIKIYEDNQGCISIANNPS
1474 FT CHKRAKHIDIKYHFAREQVQNNVICLEYIPTENQLADIFTKPLPAARFVELRDKLGLLQ
1475 FT DDQSNAE"
1476 FT SO_feature CDS ; SO:0000316:join(432..1605,4555..4661)
1477 FT /name="Dmel\copia\GIP-RB"
1478 FT /db_xref="FLYBASE:FBgnXXXXXXX"
1479 FT /db_xref="SWISS-PROT:P04146"
1480 FT /db_xref="NCBI_PROTEIN:CAA26445.1"
1481 FT /translation="MDKAKRNIKPFDGEKYAIWKFRIRALLAEQDVLKVVDGLMPNEVD
1482 FT DSWKKAERCAKSTIIEYLSDSFLNFATSDITARQILENLDAVYERKSLASQLALRKRLL
1483 FT SLKLSSEMSLLSHFHIFDELISELLAAGAKIEEMDKISHLLITLPSCYDGIITAIETLS
1484 FT EENLTLAFVKNRLLDQEIKIKNDHNDTSKKVMNAIVHNNNNTYKNNLFKNRVTKPKKIF
1485 FT KGNSKYKVKCHHCGREGHIKKDCFHYKRILNNKNKENEKQVQTATSHGIAFMVKEVNNT
1486 FT SVMDNCGFVLDSGASDHLINDESLYTDSVEVVPPLKIAVAKQGEFIYATKRGIVRLRND
1487 FT HEITLEDVLFCKEAAGNLMSVKRLQEAGMSIEFDKSGVTISKNGLMVVKNSENQLADIF
1488 FT TKPLPAARFVELRDKLGLLQDDQSNAE"
1489 XX
1490 CC Derived from X02599 (g7740) (Rel. 49, Last updated, Version 4).
1491 CC Takis Benos and Michael Ashburner, 20-Aug-1997.
1492 CC Any changes to original sequence record are annotated in an FT line.
1493 XX
1494 SQ Sequence 5143 BP; 1874 A; 727 C; 971 G; 1571 T; 0 other;
1495 TGTTGGAATA TACTATTCAA CCTACAAAAA TAACGTTAAA CAACACTACT TTATATTTGA 60
1496 TATGAATGGC CACACCTTTT ATGCCATAAA ACATATTGTA AGAGAATACC ACTCTTTTTA 120
1497 TTCCTTCTTT CCTTCTTGTA CGTTTTTTGC TGTGAGTAGG TCGTGGTGCT GGTGTTGCAG 180
1498 TTGAAATAAC TTAAAATATA AATCATAAAA CTCAAACATA AACTTGACTA TTTATTTATT 240
1499 TATTAAGAAA GGAAATATAA ATTATAAATT ACAACAGGTT ATGGGCCCAG TCCATGCCTA 300
1500 ATAAACAATT AAATTGTGAA TTAAAGATTG TGAAAATAAA TTGTGAAATA GCATTTTTTC 360
1501 ACATTCTTGT GAAATAGCTT TTTTTTTCAC ATTCTTGTGA AATTATTTCC TTCTCAGAAT 420
1502 TTGAGTGAAA AATGGACAAG GCTAAACGTA ATATTAAGCC GTTTGATGGC GAGAAGTACG 480
1503 CGATTTGGAA ATTTAGAATT AGGGCTCTTT TAGCCGAGCA AGATGTGCTT AAAGTAGTTG 540
1504 ATGGTTTAAT GCCTAACGAG GTAGATGACT CCTGGAAAAA GGCAGAGCGT TGTGCAAAAA 600
1505 GTACAATAAT AGAGTACCTA AGCGACTCGT TTTTAAATTT CGCAACAAGC GACATTACGG 660
1506 CGCGTCAGAT TCTTGAGAAT TTGGACGCCG TTTATGAACG AAAAAGTTTG GCGTCGCAAC 720
1507 TGGCGCTGCG AAAACGTTTG CTTTCTCTGA AGCTATCGAG TGAGATGTCA CTATTAAGCC 780
1508 ATTTTCATAT TTTTGACGAA CTTATAAGTG AATTGTTGGC AGCTGGTGCA AAAATAGAAG 840
1509 AGATGGATAA AATTTCTCAT CTACTGATCA CATTGCCTTC GTGTTACGAT GGAATTATTA 900
1510 CAGCGATAGA GACATTATCT GAAGAAAATT TGACATTGGC GTTTGTGAAA AATAGATTGC 960
1511 TGGATCAAGA AATTAAAATT AAAAATGACC ACAACGATAC AAGCAAGAAA GTTATGAACG 1020
1512 CGATCGTGCA CAACAATAAT AACACTTATA AAAATAATTT GTTTAAAAAT CGGGTAACTA 1080
1513 AACCAAAGAA AATATTCAAG GGAAATTCAA AGTATAAAGT CAAGTGTCAC CACTGTGGCA 1140
1514 GAGAAGGCCA CATTAAAAAA GATTGTTTCC ATTATAAAAG AATATTAAAT AATAAAAATA 1200
1515 AAGAAAATGA AAAACAAGTT CAAACTGCAA CATCACACGG CATTGCGTTT ATGGTAAAAG 1260
1516 AAGTGAATAA TACTTCAGTG ATGGACAACT GCGGGTTTGT CCTTGATTCT GGTGCTAGTG 1320
1517 ACCATCTTAT AAATGATGAG TCGCTGTATA CCGACAGTGT GGAGGTTGTG CCTCCACTTA 1380
1518 AGATTGCAGT GGCCAAGCAA GGCGAATTTA TTTATGCCAC TAAGCGTGGT ATTGTCCGAC 1440
1519 TACGGAATGA CCATGAGATT ACACTGGAGG ATGTACTCTT TTGTAAGGAA GCTGCTGGTA 1500
1520 ATTTGATGTC CGTAAAGCGT CTCCAAGAGG CAGGAATGTC GATCGAATTT GACAAAAGCG 1560
1521 GTGTAACCAT TTCGAAAAAT GGGTTAATGG TTGTCAAAAA TTCAGGTATG TTAAACAATG 1620
1522 TACCTGTGAT CAATTTTCAA GCATATTCTA TAAATGCTAA GCATAAAAAT AATTTTCGTT 1680
1523 TATGGCATGA GAGGTTTGGC CATATAAGCG ATGGCAAATT ATTAGAAATA AAACGAAAGA 1740
1524 ATATGTTTAG TGATCAAAGT CTTCTAAACA ACTTAGAGTT ATCATGTGAA ATTTGTGAAC 1800
1525 CCTGTTTAAA TGGTAAACAG GCAAGACTTC CTTTTAAACA ATTGAAAGAT AAGACCCATA 1860
1526 TTAAAAGACC ACTTTTTGTA GTACACTCAG ATGTCTGTGG GCCTATTACT CCAGTTACTT 1920
1527 TAGATGATAA AAATTATTTT GTGATCTTTG TTGATCAGTT TACACATTAT TGTGTAACTT 1980
1528 ATTTAATTAA ATATAAATCT GATGTGTTTA GCATGTTTCA AGATTTTGTA GCCAAGAGTG 2040
1529 AAGCTCATTT TAATTTAAAG GTTGTGTACT TATACATTGA CAATGGTAGA GAATACTTGT 2100
1530 CAAATGAGAT GAGACAATTT TGTGTTAAGA AAGGAATTTC TTATCACTTA ACAGTGCCAC 2160
1531 ATACACCTCA GTTAAATGGT GTTTCTGAGA GAATGATAAG AACCATTACG GAAAAAGCTC 2220
1532 GAACCATGGT TAGTGGTGCA AAGCTAGATA AAAGCTTTTG GGGCGAAGCA GTATTAACTG 2280
1533 CTACTTATTT AATCAACAGA ATTCCTAGTA GAGCACTTGT TGATAGTTCA AAGACCCCAT 2340
1534 ATGAGATGTG GCACAATAAG AAGCCATACT TAAAACATTT GAGAGTGTTT GGTGCAACTG 2400
1535 TTTATGTGCA TATTAAAAAC AAACAAGGAA AGTTTGATGA TAAATCATTT AAAAGTATTT 2460
1536 TTGTGGGCTA TGAACCCAAT GGTTTTAAGT TGTGGGATGC TGTAAATGAA AAATTTATTG 2520
1537 TCGCAAGAGA TGTTGTTGTC GATGAAACCA ATATGGTTAA TTCTAGAGCT GTTAAATTTG 2580
1538 AAACAGTGTT CCTGAAAGAT AGTAAGGAAA GTGAAAATAA AAATTTTCCG AATGACAGTA 2640
1539 GGAAAATAAT ACAAACAGAA TTCCCGAATG AGAGTAAGGA ATGCGACAAC ATACAATTCC 2700
1540 TGAAAGATAG TAAGGAAAGT GAAAATAAAA ATTTTCCGAA TGACAGTAGG AAAATAATAC 2760
1541 AAACAGAATT CCCGAATGAG AGTAAGGAAT GCGACAACAT ACAATTCCTG AAAGATAGTA 2820
1542 AGGAAAGTAA TAAATATTTT CTGAATGAGA GTAAGAAAAG AAAGCGAGAT GATCACCTGA 2880
1543 ATGAAAGTAA GGGATCAGGC AACCCGAATG AGAGTAGGGA AAGTGAAACA GCAGAGCACT 2940
1544 TAAAAGAAAT TGGAATTGAT AATCCAACTA AAAATGATGG CATAGAAATT ATTAATAGAA 3000
1545 GAAGTGAGAG ATTAAAGACT AAGCCTCAGA TATCCTATAA TGAAGAGGAT AATAGTCTAA 3060
1546 ATAAAGTTGT TCTAAATGCT CACACTATAT TTAACGATGT CCCAAATTCA TTTGATGAAA 3120
1547 TTCAATATAG GGATGATAAA TCTTCTTGGG AAGAAGCCAT CAATACAGAG TTAAATGCTC 3180
1548 ATAAAATTAA TAATACTTGG ACAATTACAA AAAGGCCTGA AAACAAAAAT ATTGTAGATA 3240
1549 GCAGATGGGT ATTTTCTGTT AAATATAATG AACTTGGAAA TCCAATTAGA TACAAAGCTA 3300
1550 GATTGGTTGC ACGAGGATTC ACTCAAAAAT ACCAAATAGA CTATGAAGAG ACATTTGCTC 3360
1551 CTGTAGCTAG AATTTCAAGT TTCCGATTTA TATTGTCATT AGTAATACAG TATAACTTGA 3420
1552 AAGTCCATCA AATGGATGTA AAAACAGCTT TCTTAAATGG CACGTTAAAA GAGGAAATTT 3480
1553 ATATGAGACT TCCTCAAGGT ATATCGTGTA ATAGTGACAA TGTGTGTAAA TTGAATAAGG 3540
1554 CAATTTACGG ACTCAAGCAA GCGGCTAGAT GCTGGTTTGA AGTATTTGAG CAAGCATTGA 3600
1555 AAGAGTGTGA GTTTGTAAAC TCTTCAGTTG ATCGCTGTAT ATATATTTTA GACAAAGGTA 3660
1556 ACATCAATGA AAACATATAT GTATTATTAT ATGTAGATGA TGTGGTTATA GCTACAGGAG 3720
1557 ATATGACAAG AATGAATAAC TTCAAAAGGT ATTTAATGGA AAAGTTTAGG ATGACTGACC 3780
1558 TAAATGAAAT AAAACATTTT ATTGGAATTA GGATAGAGAT GCAGGAAGAT AAAATCTATT 3840
1559 TAAGCCAATC TGCATATGTT AAAAAAATTT TAAGTAAATT TAACATGGAA AATTGTAATG 3900
1560 CAGTTAGTAC TCCTTTACCT AGTAAAATAA ATTATGAATT ACTTAATTCA GATGAAGACT 3960
1561 GCAATACCCC ATGCCGTAGC CTCATAGGAT GTTTAATGTA CATAATGCTT TGTACACGCC 4020
1562 CAGATTTAAC TACTGCAGTA AATATCTTGA GCAGATATAG TAGCAAAAAT AACTCCGAAT 4080
1563 TATGGCAGAA CTTAAAAAGA GTTCTTAGAT ATTTGAAGGG CACTATCGAT ATGAAATTGA 4140
1564 TTTTTAAAAA GAACTTGGCA TTTGAAAATA AAATTATTGG TTATGTGGAT TCTGATTGGG 4200
1565 CTGGTAGTGA AATTGATAGA AAAAGTACAA CAGGGTATTT ATTCAAAATG TTTGATTTTA 4260
1566 ATCTCATTTG TTGGAATACA AAGAGACAGA ACTCAGTAGC AGCCTCATCA ACTGAAGCTG 4320
1567 AGTATATGGC CCTATTTGAA GCCGTGAGAG AAGCTCTATG GCTTAAATTT TTATTAACTA 4380
1568 GTATTAACAT TAAACTAGAA AACCCCATTA AAATTTACGA AGACAATCAA GGCTGTATTA 4440
1569 GCATAGCAAA CAACCCCTCA TGTCATAAAC GAGCTAAACA TATTGATATT AAATATCATT 4500
1570 TTGCCAGAGA GCAAGTTCAG AATAATGTGA TTTGTCTTGA GTATATTCCT ACAGAGAATC 4560
1571 AACTGGCTGA CATATTTACA AAACCGTTGC CTGCTGCGAG ATTTGTGGAG TTACGAGACA 4620
1572 AATTGGGTTT GCTGCAAGAC GACCAATCGA ATGCTGAATG AAATTTTTAT ATATATTTTT 4680
1573 CAAATTTAAA TTCCTGTAAA CATATTTTGT TACAATGATC TGATCGGGTT TTTCTGGGTT 4740
1574 TTCCCCGTAT CCTCGCAGCA AATGCTGGAT CAGTTAACAC TTCCCAGAAT GCACACCACC 4800
1575 CACATTTGAT AGTTACTAAT GAATATTATT GTTATGTTTT TAATTATAGA CGTTATTTTT 4860
1576 GAGGGGGCGT GTTGGAATAT ACTATTCAAC CTACAAAAAT AACGTTAAAC AACACTACTT 4920
1577 TATATTTGAT ATGAATGGCC ACACCTTTTA TGCCATAAAA CATATTGTAA GAGAATACCA 4980
1578 CTCTTTTTAT TCCTTCTTTC CTTCTTGTAC GTTTTTTGCT GTGAGTAGGT CGTGGTGCTG 5040
1579 GTGTTGCAGT TGAAATAACT TAAAATATAA ATCATAAAAC TCAAACATAA ACTTGACTAT 5100
1580 TTATTTATTA TTAAGAAAGG AAAATAAATT ATAAATTACA ACA 5143
1581 //
1582 ID DMW1DOC standard; DNA; INV; 4725 BP.
1583 XX
1584 AC X17551;
1585 XX
1586 DR FLYBASE; FBte0000341; Dmel\Doc.
1587 XX
1588 FT source X17551:1..4725
1589 FT SO_feature CDS ; SO:0000316:213..1910
1590 FT /name="Dmel\Doc\gag"
1591 FT /db_xref="FLYBASE:FBgn0024789"
1592 FT /db_xref="SPTREMBL:Q04134"
1593 FT /db_xref="NCBI_PROTEIN:CAA35586.1"
1594 FT /translation="MNQNDIRSQRQCEQDERRLSLQRNNAYFSFVSPQIGDRAPSPSTN
1595 FT SKLLPSANDRPRSCSPSLPASAHKSWSEETASPTPLLSQRQTTVPGNCNTAITSAVTSL
1596 FT ATATTSTSSAAQLIIAVPAVNNSAALTVCNNNNARKEESKQKQKSISTVQTGMDRYIQI
1597 FT KRKLSPQNNKAGNQPKINRTNNGNENSAVNNSNRYAILADSATEQPNEKTVGEPKKTRP
1598 FT PPIFIREQSTNALVNKLVALIGDSKFHIIPLKKGNIHEIKLQIQTEADHRIVTKYLNDA
1599 FT GKNYYTYQLKSCKGLQVVLKGIEATVTPAEIIEALKAKNFSAKTAINILNKDKVPQPLF
1600 FT KIELEPELQALKKNEVHPIYNLQYLLHRRITVEEPHKRINPVQCTNCQEYGHTKAYCTL
1601 FT KSVCVVCSEPHTTANCPKNKDDKSVKKCSNCGEKHTANYRGCVVYKELKSRLNKRIATA
1602 FT HTYNKVNFYSPQPIFQPPLTVPSTTPTISFASALKSGLEVPAPPTRTAHSEHTPTNIQQ
1603 FT TQQSGIEAMMLSLQQSMKDFMTFMQNTLQELMKNQNILIQLLVSSKSP"
1604 FT SO_feature CDS ; SO:0000316:1910..4576
1605 FT /name="Dmel\Doc\RTase"
1606 FT /db_xref="FLYBASE:FBgn0024790"
1607 FT /db_xref="SPTREMBL:Q04135"
1608 FT /db_xref="NCBI_PROTEIN:CAA35587.1"
1609 FT /translation="MASLRISLWNANGVSRHTQELTQFIYEKNIDVMLLSETHLTNKNN
1610 FT FHIPGYLFYGTNHPDGKAHGGTGILIRNRIKHHHLNNFDKNYLQSTSIALQLNNGSTTL
1611 FT AAVYCPPRFPISEDQFMEFFNTLGDRFIAAGDYNAKHTHWGSRLVSPKGKQLYNALTKP
1612 FT ENKLDYVSPGKPTYWPADPRKIPDLIDFAITKHVPRNMVTAEALADLSSDHSPVFLNML
1613 FT TRPHIVDPPYRLTNFRTNWPRYQKYVCSHIELTTALSTKEDIDKSTETLENILVSAAKA
1614 FT STPPVTYAKPNYIKTNREIERLVLDKRRLRRDWQSNRSPITKHMLKIATRRLTNALKQE
1615 FT EKNSQRSYIEQLSPTSTKYPLWRAHRNLKTPIAPIMPLRSPSGTWFRSDEERASAFADH
1616 FT LQNVFRPNPSTNTFILPPLIAANLDPQEPFEFRPCELAKVIKEQLNPRKSPGYDLITPR
1617 FT MLIELPKCAILHICLLFNAIAKLGYFPQKWKKSTIVMIPKPGKDKTQPSSYRPISLLTC
1618 FT LSKLFEKMLLLRISPHLRINNTLPTHQFGFREKHGTIEQVNRITSEIRTAFEHREYCTA
1619 FT IFLDVAQAFDRVWLDGLLFKIIKLLPQNTHKLLKSYLYNRVFAIRCDTSTSRDCAIEAG
1620 FT VPQGSVLGPILYTLYTADFPIDYNLTTSTFADDTAILSRSKCPIKATALLSRHLTSVER
1621 FT WLADWRISINVQKCKQVTFTLNKQTCPPLVLNNICIPQADEVTYLGVHLDRRLTWRKHI
1622 FT EAKSKHLKLKARNLHWLINARSPLSLEFKALLYNSVLKPIWTYGSELWGNASRSNIDII
1623 FT QRAQSRILRIITGAPWYLRNENIHRDLKIKLVIEVIAEKKTKYNEKLTTHTNPLARKLI
1624 FT RVCSQSRLHRNDLPAQQ"
1625 XX
1626 CC Derived from X17551 (g8821) (Rel. 29, Last updated, Version 2).
1627 CC Takis Benos and Michael Ashburner, 20-Aug-1997.
1628 CC Any changes to original sequence record are annotated in an FT line.
1629 XX
1630 SQ Sequence 4725 BP; 1647 A; 1192 C; 822 G; 1064 T; 0 other;
1631 GACATTCGGC ATTCCACAGT CTTCGGGTGG AGACGTGTTT CTTTCAAGCT ACGAATAGCA 60
1632 AGTTCTAAAA ACTACAACAG TATAGTGAAA GTTAAACACA AAGTGTAAAG TGCAGTTTGC 120
1633 ACAACTAACA ATTATTGACT ATAGTAATTA TTTACTAAAA TAAATAATTA TTCCATATTG 180
1634 TTCTGGTAAT TGTTATATGT GGACTTAGAA CAATGAATCA AAACGACATA CGTTCTCAGC 240
1635 GACAATGTGA ACAAGACGAG CGCCGGCTCT CTTTACAACG CAACAATGCA TACTTTTCTT 300
1636 TCGTCTCACC GCAAATCGGT GATCGAGCAC CCTCACCTTC AACTAACTCG AAACTTTTGC 360
1637 CCTCAGCGAA CGACAGACCG CGTTCTTGCT CTCCCTCTCT GCCTGCTTCG GCTCACAAGT 420
1638 CGTGGAGCGA AGAGACCGCC TCTCCTACCC CGCTCCTCTC GCAGCGCCAA ACGACCGTCC 480
1639 CGGGTAACTG TAACACTGCA ATAACGAGTG CAGTGACCTC ACTGGCAACT GCCACAACAT 540
1640 CAACTTCGTC AGCGGCCCAA CTAATTATCG CTGTGCCAGC TGTAAATAAT TCAGCAGCAC 600
1641 TGACCGTTTG CAACAACAAT AATGCACGTA AAGAAGAATC AAAACAAAAG CAGAAGTCGA 660
1642 TTTCGACTGT GCAGACTGGC ATGGATCGCT ACATCCAAAT CAAGAGAAAG CTCAGCCCTC 720
1643 AAAACAATAA GGCAGGTAAT CAACCCAAAA TCAATCGAAC CAACAACGGC AATGAAAACT 780
1644 CTGCAGTAAA TAATTCAAAC CGATATGCTA TCTTGGCTGA TTCTGCGACC GAACAACCCA 840
1645 ACGAAAAAAC GGTAGGGGAA CCAAAAAAGA CCAGGCCTCC ACCAATTTTC ATACGAGAAC 900
1646 AAAGTACAAA TGCACTTGTA AATAAACTCG TTGCTTTGAT TGGTGACAGC AAGTTCCACA 960
1647 TTATCCCACT TAAAAAAGGA AATATTCATG AAATAAAACT ACAGATCCAA ACAGAAGCAG 1020
1648 ACCACCGTAT AGTGACTAAA TACCTAAATG ATGCTGGTAA AAACTACTAC ACATACCAAT 1080
1649 TAAAAAGTTG CAAAGGGCTA CAGGTAGTAC TTAAGGGCAT TGAAGCAACA GTGACACCAG 1140
1650 CTGAGATAAT TGAGGCTCTG AAGGCCAAAA ACTTTTCTGC AAAGACAGCT ATTAATATTT 1200
1651 TAAACAAAGA CAAAGTTCCG CAGCCACTAT TCAAAATAGA ACTCGAACCA GAGCTCCAGG 1260
1652 CACTAAAGAA AAACGAAGTG CACCCAATAT ACAATTTACA GTACTTGCTA CATCGGAGGA 1320
1653 TCACCGTGGA GGAGCCGCAC AAACGTATCA ATCCAGTTCA ATGTACTAAT TGCCAAGAAT 1380
1654 ACGGCCACAC CAAGGCATAC TGCACCCTTA AGTCCGTATG TGTTGTCTGT AGCGAACCTC 1440
1655 ATACTACCGC AAACTGCCCC AAAAACAAGG ACGATAAGTC TGTGAAGAAA TGCAGTAACT 1500
1656 GCGGGGAAAA ACATACTGCA AACTACAGAG GCTGTGTGGT GTACAAAGAA TTGAAGAGCC 1560
1657 GCCTAAACAA ACGTATTGCC ACAGCACATA CATACAACAA AGTCAATTTC TACTCTCCGC 1620
1658 AACCGATTTT TCAACCACCC CTAACTGTCC CAAGCACTAC TCCAACAATT TCTTTCGCTA 1680
1659 GCGCCCTAAA ATCCGGACTA GAAGTGCCCG CCCCACCGAC AAGAACTGCT CATTCCGAAC 1740
1660 ATACACCGAC AAACATCCAA CAAACACAAC AAAGTGGCAT CGAAGCTATG ATGCTATCCC 1800
1661 TACAGCAAAG CATGAAAGAC TTCATGACGT TCATGCAAAA TACTTTGCAA GAGCTCATGA 1860
1662 AAAACCAAAA TATCCTGATT CAACTTCTTG TATCTTCAAA ATCCCCATAA TGGCTTCCCT 1920
1663 ACGGATATCT CTGTGGAACG CAAATGGCGT TTCACGGCAT ACACAAGAGC TCACACAGTT 1980
1664 CATTTACGAA AAAAACATCG ACGTAATGCT ACTATCAGAA ACGCACCTCA CAAATAAAAA 2040
1665 CAATTTTCAT ATACCAGGAT ACTTGTTCTA TGGTACAAAT CATCCAGATG GTAAAGCTCA 2100
1666 TGGAGGCACT GGAATACTCA TCAGAAATCG CATAAAACAC CACCACTTAA ACAATTTTGA 2160
1667 CAAAAACTAC TTACAATCTA CGTCCATAGC CTTACAACTC AACAATGGTT CAACGACTCT 2220
1668 AGCCGCAGTC TACTGCCCAC CGCGCTTTCC AATCTCTGAG GATCAATTCA TGGAATTCTT 2280
1669 TAACACACTA GGTGACAGGT TCATCGCAGC GGGTGACTAT AACGCCAAGC ACACCCATTG 2340
1670 GGGATCTCGA CTTGTGTCGC CAAAGGGTAA GCAATTGTAC AATGCGCTTA CGAAGCCAGA 2400
1671 AAACAAGCTA GACTATGTAT CCCCGGGTAA GCCTACATAC TGGCCAGCAG ACCCAAGAAA 2460
1672 AATCCCAGAC CTGATCGATT TTGCAATTAC TAAACATGTC CCCCGCAACA TGGTCACCGC 2520
1673 CGAAGCACTA GCAGATTTAT CATCAGATCA CTCACCTGTT TTTCTAAATA TGCTAACTCG 2580
1674 CCCCCACATC GTCGACCCAC CGTATAGACT CACAAATTTT AGAACAAACT GGCCAAGGTA 2640
1675 TCAAAAGTAT GTCTGTTCAC ACATAGAACT AACGACGGCA TTATCTACAA AGGAGGATAT 2700
1676 AGACAAGTCA ACGGAAACTC TTGAAAACAT TTTAGTTTCG GCTGCAAAGG CTTCAACCCC 2760
1677 GCCAGTGACG TATGCAAAAC CAAACTACAT CAAAACTAAT CGCGAAATCG AGCGGCTGGT 2820
1678 ATTAGATAAA CGACGCCTAC GAAGGGATTG GCAGTCTAAT AGATCACCAA TTACTAAGCA 2880
1679 CATGCTTAAG ATAGCCACAC GCAGGCTTAC CAATGCTCTC AAACAAGAGG AAAAAAACAG 2940
1680 CCAACGTTCA TATATCGAGC AACTCTCTCC CACCAGCACT AAGTACCCTC TTTGGAGAGC 3000
1681 TCACAGAAAC CTAAAGACTC CAATAGCGCC AATTATGCCA CTCCGAAGTC CCTCTGGCAC 3060
1682 CTGGTTTCGA AGTGATGAAG AAAGAGCCAG TGCTTTCGCT GACCATTTAC AAAATGTATT 3120
1683 CCGACCAAAT CCCTCTACCA ACACATTTAT TCTCCCTCCT TTAATAGCAG CCAATCTAGA 3180
1684 TCCTCAAGAA CCCTTTGAAT TCCGACCATG TGAACTAGCA AAGGTTATCA AAGAGCAACT 3240
1685 GAACCCAAGA AAATCGCCTG GCTACGACCT AATAACTCCA AGAATGCTCA TTGAACTCCC 3300
1686 AAAGTGTGCT ATTCTTCACA TCTGCCTGTT GTTCAACGCA ATCGCCAAGC TTGGATACTT 3360
1687 CCCTCAAAAA TGGAAAAAGT CGACCATAGT AATGATTCCA AAGCCAGGAA AAGATAAAAC 3420
1688 GCAGCCATCA TCATATAGAC CGATAAGCTT ACTAACATGT CTTTCAAAGC TGTTTGAAAA 3480
1689 AATGCTACTC CTTCGGATTA GCCCTCATCT TAGAATAAAC AACACACTTC CAACACATCA 3540
1690 ATTTGGCTTT AGAGAAAAAC ATGGAACCAT CGAACAGGTC AACCGAATCA CGTCAGAAAT 3600
1691 TCGTACTGCT TTTGAACATC GAGAATACTG CACAGCCATT TTTCTAGACG TCGCGCAGGC 3660
1692 ATTTGACAGA GTGTGGCTCG ATGGACTTTT GTTTAAAATA ATCAAGCTGT TGCCCCAAAA 3720
1693 CACACATAAG CTACTGAAGT CATACCTATA TAACAGAGTG TTTGCAATAA GATGCGATAC 3780
1694 AAGCACTTCA CGCGATTGCG CAATCGAAGC TGGAGTGCCG CAAGGCAGTG TACTGGGTCC 3840
1695 AATCTTATAC ACCCTGTATA CGGCGGATTT CCCCATAGAC TACAATCTAA CAACCTCCAC 3900
1696 GTTCGCTGAT GATACCGCGA TACTCAGTCG CTCGAAATGC CCAATAAAAG CCACGGCACT 3960
1697 CCTATCCCGA CACTTAACAT CTGTAGAACG ATGGCTTGCC GACTGGAGAA TTTCAATAAA 4020
1698 TGTTCAAAAA TGCAAGCAGG TTACCTTTAC CTTAAACAAA CAAACATGCC CACCACTGGT 4080
1699 CTTGAATAAC ATATGCATTC CACAAGCCGA CGAGGTAACA TATCTGGGAG TTCATCTGGA 4140
1700 CAGGCGGCTC ACTTGGCGCA AACATATAGA AGCCAAATCG AAACATCTTA AACTTAAAGC 4200
1701 AAGGAACCTC CACTGGCTCA TAAATGCTCG CTCTCCACTT AGTCTGGAGT TCAAAGCTCT 4260
1702 TCTATACAAC TCCGTCTTAA AACCTATCTG GACTTATGGC TCCGAGCTGT GGGGCAACGC 4320
1703 ATCCAGAAGT AACATAGACA TTATTCAGCG AGCACAGTCA AGAATTCTGA GAATTATCAC 4380
1704 TGGAGCGCCG TGGTACCTTC GAAACGAAAA CATACACAGA GACCTAAAAA TCAAATTAGT 4440
1705 AATCGAAGTA ATAGCTGAGA AAAAAACGAA GTATAACGAA AAGCTGACCA CCCATACAAA 4500
1706 TCCCCTCGCA AGAAAACTAA TCCGAGTATG CAGTCAAAGC CGGCTGCACC GCAACGACCT 4560
1707 CCCAGCCCAG CAATAAACTT ATTAGGGCAT TAATGAAAAA AAAAAACTAT CACTAAGTGA 4620
1708 AAGTTAATTA AGTTAGATTA AGATTTGAAC ACTTATTGTT AGTCTCTTAA CACAAAGGGA 4680
1709 AGATTCAATA AATAATAAAA ATTAAAAAAA AAAAAAAAAA AAAAA 4725
1710 //
1711 ID F standard; DNA; INV; 4708 BP.
1712 XX
1713 AC AC005198;
1714 XX
1715 DR FLYBASE; FBte0000005; Dmel\F-element.
1716 XX
1717 SY synonym: Jiminy
1718 XX
1719 FT source AC005198:38639..43358
1720 FT SO_feature CDS ; SO:0000316:192..1880
1721 FT /name="Dmel\F-element\gag-r"
1722 FT /db_xref="FLYBASE:FBgn0041632"
1723 FT /db_xref="TREMBL:P91787"
1724 FT /translation="MSQNDTRAQRQREHDERRLSIQRNNAYFSYVSPTIPNADIERSI
1725 FT THSPGNLLLPTNQERARSCSPALLAPTEAPLPPTTTAGEGPAARSASSSAAPAHGLTK
1726 FT SAKAKPLAINGTAALPAKQNENVNKKAGSTWQTGMDRYITIKRKLSPENSDLGNKPKN
1727 FT TRDNSTLIKNVAPANTNRFALLVDTAEDVPLGSVDIEPKKTKPPPIYIREKSTSRLVN
1728 FT TLIGLIGKDSFHIIPLVRGTINEIKLQTKTEDDYRKVTNYFTAQKIGFYTYQLKSSKG
1729 FT LQVVLKGIESDVTPEEITEALKEKGFYAKNVFNIKNRNRQPQPLFKIELEPENKPPRK
1730 FT NEVHPIYKLQLLLHRRITVEEPHKRNAPVQCTNCQEYGHTRSYCTLRPVCVVCGDLHD
1731 FT SKQCQINKENACEKKCNNCGGNHTANYRGCPIYKELKIRLHKRMNTARAHQGSATLIP
1732 FT SETNPEVIFSKAASFAPWPTFNTNKTTFANVLKSGMTPPTQNSRTPHEVHTKLDTQQN
1733 FT YHPAAQQETKTEAMMQALQQSMMEFMTFMKTTIQDMMRNQNLLIQMLVAQQSNK"
1734 FT SO_feature CDS ; SO:0000316:1880..4561
1735 FT /name="Dmel\F-element\RTase"
1736 FT /db_xref="FLYBASE:FBgn0041633"
1737 FT /db_xref="TREMBL:Q24335"
1738 FT /translation="MATLRIATWNANGVSQRKLELAQFLHEKHIDVMLLSETHLTSKY
1739 FT NFQIRDYHFYGTNHPDGKAHGGTAILIRNRMKHHFYKEFAENHLQATSINIQLDDNTL
1740 FT LTLAAVYCPPRFTVLEAQFLDFFQALGPHFIAAGDYNAKHTHWGSRLVNPKGKQLYKT
1741 FT IIKATNKLDHVSPGSPTYWPSDLNKLPDLIDFAVTKNISRSLVKAECLPDLSSDHSPV
1742 FT LIHLRRYAENVKPPTRLTSSKTNWLRYKKYISSHIELSPKLNTESDIESCTCALQSIL
1743 FT TAAALTATPKITNNTINSKKTNVQIEQLVHVKRRLRREWQSSRSPTAKQKLKVATRKL
1744 FT ANALKQEEDDDQRRYIEQLTPTGTKQKSLWRAHSTLRPPTETVLPIKNSSGGWARSDE
1745 FT DRANTFAAHLQNVFTPNQATSTFALPSYPVNRHQQHTPIVFRPKEITKIIKDNLSPKK
1746 FT SPGYDLITPEMIIQLPHSAVRYITKLFNAITKLGYFPQRWKMMKIIMIPKPGKNHTVA
1747 FT SSYRPISLLSCISKLFEKCLLIRLNQHQTYHNIIPAHQFGFRESHGTIEQVNRITTEI
1748 FT RTAFEYREYCTAVFLDVSQAFDKVWLDGLMFKIKISLPESTHKLLKSYLYDRKFAVRC
1749 FT NTATSTVHTIEAGVPQGSVLGPTLYLIYTADIPTNSRLTVSTFADDTAILSRSRSPIQ
1750 FT ATAQLALYLIDIKKWLSDWRIKVNEQKCKHVTFTLNRQDCPPLLLNSIPLPKADEVTY
1751 FT LGVHLDRRLTWRRHIEAKKTQLKLKANNLHWLINSGSPLSLDHKVLLYNSILKPIWTY
1752 FT GSQLWGNASNSNIDIIQRAQSKILRTITGAPWYVRSENIQRDLNIPSVTNAITELKEK
1753 FT YL"
1754 XX
1755 CC K. O'Hare, Personal communication to FlyBase, 1 May 2000.
1756 CC CDS2 translation from M17214; AC005198 has a 1-bp deletion.
1757 XX
1758 SQ Sequence 4708 BP; 1618 A; 1242 C; 857 G; 991 T; 0 other;
1759 AATCAATTAA TCAATTCGAT CGCCGACGTG TGAAGACGTT TTTATCGTGC TCCGCACAAA 60
1760 ATCGGTTGTT TTGAGTGAAG TGAACGCCAA ATAAAATAAA CTAAATAAAA AATCTGAAAG 120
1761 CGAAAGAGAC GCTCTATGCG ATGCAAGATC GCTTAAATAC ATAGTGAATT GTTATCTTAA 180
1762 ATAATAAAAC TATGAGTCAG AATGACACTC GCGCCCAGCG TCAGCGCGAG CATGACGAAC 240
1763 GCCGACTCTC AATTCAGCGC AACAACGCGT ACTTCTCCTA CGTCTCACCG ACAATCCCAA 300
1764 ACGCAGACAT CGAGCGGTCA ATAACCCATA GCCCAGGAAA CCTTCTTCTA CCAACAAATC 360
1765 AAGAAAGAGC GCGCTCCTGC TCTCCCGCTC TATTGGCTCC GACAGAAGCC CCGCTACCTC 420
1766 CAACAACAAC AGCTGGAGAG GGACCGGCAG CCCGCTCTGC CTCGTCATCG GCTGCACCCG 480
1767 CTCACGGTCT GACTAAGTCA GCGAAAGCAA AACCGCTAGC AATAAACGGT ACTGCTGCAC 540
1768 TGCCAGCAAA ACAAAACGAA AACGTAAACA AAAAAGCTGG GTCGACCTGG CAGACTGGAA 600
1769 TGGACCGCTA CATTACAATA AAGCGAAAGC TCAGCCCGGA AAATTCAGAT TTGGGAAACA 660
1770 AGCCGAAAAA TACACGCGAT AACTCTACCT TGATCAAAAA TGTAGCCCCT GCAAATACCA 720
1771 ACAGATTTGC CTTGCTGGTA GATACCGCTG AGGACGTGCC GCTGGGATCC GTTGATATCG 780
1772 AACCGAAGAA AACAAAGCCT CCGCCAATAT ACATCCGCGA GAAGAGCACA AGCCGTCTTG 840
1773 TAAATACTTT GATTGGCCTT ATTGGGAAAG ATAGCTTTCA TATAATTCCC CTCGTAAGAG 900
1774 GTACTATCAA CGAAATCAAA CTTCAGACGA AAACGGAGGA CGACTACAGA AAAGTCACAA 960
1775 ACTATTTTAC CGCACAAAAA ATAGGCTTCT ACACCTACCA GCTTAAAAGC AGCAAGGGCC 1020
1776 TGCAAGTAGT CCTGAAGGGC ATTGAGTCTG ATGTTACGCC CGAAGAGATA ACTGAGGCGC 1080
1777 TAAAGGAAAA GGGATTTTAC GCCAAAAACG TGTTCAATAT CAAAAACAGA AACAGGCAGC 1140
1778 CCCAACCACT CTTCAAGATT GAGCTTGAAC CAGAAAACAA GCCTCCTAGA AAAAACGAGG 1200
1779 TTCACCCAAT TTACAAACTC CAGCTCCTTT TGCACCGTAG GATCACGGTA GAAGAGCCGC 1260
1780 ACAAACGCAA CGCTCCTGTA CAATGTACAA ACTGCCAAGA GTATGGCCAC ACGAGGTCAT 1320
1781 ATTGTACACT TCGCCCGGTG TGCGTAGTCT GTGGAGATCT CCACGACTCC AAACAGTGTC 1380
1782 AAATTAACAA AGAAAATGCA TGCGAGAAAA AATGTAATAA CTGCGGGGGC AATCACACAG 1440
1783 CAAACTACAG AGGCTGTCCA ATCTACAAAG AGCTGAAAAT CCGTCTTCAC AAAAGAATGA 1500
1784 ACACGGCGCG GGCACACCAA GGATCAGCTA CCCTGATACC ATCAGAGACA AATCCTGAAG 1560
1785 TAATTTTCTC GAAAGCAGCT AGTTTCGCTC CCTGGCCTAC ATTCAACACT AACAAGACAA 1620
1786 CATTTGCTAA CGTTTTAAAA TCAGGTATGA CGCCTCCAAC CCAAAACTCC CGAACTCCAC 1680
1787 ATGAAGTGCA CACAAAATTA GACACACAAC AAAACTATCA CCCAGCTGCG CAGCAGGAAA 1740
1788 CAAAAACTGA AGCTATGATG CAAGCCTTAC AACAGAGCAT GATGGAATTT ATGACATTTA 1800
1789 TGAAGACCAC CATTCAAGAC ATGATGCGTA ATCAAAACCT TTTGATACAA ATGCTTGTAG 1860
1790 CCCAACAATC AAATAAATAA TGGCTACCTT ACGCATAGCT ACGTGGAACG CCAATGGCGT 1920
1791 CTCACAGCGC AAACTTGAGC TAGCTCAATT CCTACATGAG AAGCATATCG ACGTAATGCT 1980
1792 TCTTTCGGAA ACTCATCTCA CAAGCAAATA CAATTTTCAA ATAAGAGACT ACCATTTCTA 2040
1793 CGGTACAAAT CATCCCGACG GAAAAGCACA CGGTGGCACC GCCATACTCA TAAGGAACCG 2100
1794 TATGAAGCAC CACTTTTACA AAGAATTTGC GGAAAATCAT CTTCAGGCCA CATCTATCAA 2160
1795 CATTCAGCTG GATGACAACA CTCTCCTTAC ACTAGCGGCC GTATACTGCC CCCCCCGTTT 2220
1796 CACAGTATTA GAAGCTCAAT TCCTGGATTT CTTCCAAGCA CTAGGGCCAC ACTTCATTGC 2280
1797 AGCAGGCGAC TACAACGCTA AACATACTCA CTGGGGATCG CGACTTGTGA ACCCAAAAGG 2340
1798 AAAACAGCTT TATAAGACGA TAATAAAAGC CACTAATAAA CTTGACCATG TTTCCCCCGG 2400
1799 GAGTCCTACA TACTGGCCAT CAGACCTCAA TAAGCTGCCA GACCTGATCG ACTTCGCAGT 2460
1800 TACGAAAAAT ATTTCCCGCA GTTTGGTTAA AGCTGAATGT CTGCCGGATC TCTCATCTGA 2520
1801 TCACTCGCCT GTACTAATTC ACCTCCGCCG ATACGCAGAA AACGTGAAAC CACCAACCAG 2580
1802 ATTGACCTCT AGCAAAACAA ACTGGCTCAG GTATAAAAAA TATATAAGTT CACATATTGA 2640
1803 GCTAAGCCCA AAACTCAATA CTGAATCTGA TATAGAGAGC TGCACGTGTG CATTGCAATC 2700
1804 CATCCTTACT GCAGCAGCTC TTACTGCAAC ACCCAAAATA ACAAATAATA CAATTAATTC 2760
1805 AAAAAAGACC AACGTACAAA TCGAGCAACT CGTCCACGTA AAACGTCGCT TACGCAGAGA 2820
1806 ATGGCAATCT TCCAGATCCC CAACTGCAAA ACAAAAGCTA AAAGTAGCCA CACGGAAACT 2880
1807 GGCCAACGCT CTGAAACAAG AAGAGGACGA CGATCAGCGC CGATACATAG AGCAACTCAC 2940
1808 ACCAACAGGC ACAAAACAAA AGTCACTGTG GCGAGCCCAC TCAACTCTTC GCCCACCGAC 3000
1809 TGAAACCGTT TTGCCGATAA GGAATTCATC AGGTGGCTGG GCCCGTAGTG ATGAAGACAG 3060
1810 AGCCAACACA TTTGCCGCTC ACCTACAAAA TGTGTTCACG CCAAACCAGG CTACTAGCAC 3120
1811 ATTCGCGCTA CCGTCCTATC CCGTAAACCG CCATCAGCAA CACACCCCAA TTGTGTTTCG 3180
1812 TCCTAAAGAA ATAACTAAAA TAATCAAAGA CAATCTCAGC CCGAAAAAAT CCCCCGGCTA 3240
1813 CGACCTTATA ACACCGGAAA TGATCATCCA GCTGCCACAT TCTGCAGTTC GCTACATAAC 3300
1814 CAAGCTCTTT AATGCCATCA CCAAACTTGG TTACTTTCCA CAACGATGGA AGATGATGAA 3360
1815 GATCATAATG ATTCCAAAGC CTGGTAAGAA CCACACAGTC GCTTCATCTT ACAGACCAAT 3420
1816 AAGTCTACTC TCATGCATTT CGAAACTATT CGAAAAATGC CTGCTGATCC GACTTAATCA 3480
1817 ACATCTGATA TACCACAATA TAATCCCAGC CCACCAATTT GGATTTCGCG AAAGCCACGG 3540
1818 AACCATTGAA CAGGTGAATC GTATTACAAC GGAAATAAGA ACTGCATTTG AATATCGCGA 3600
1819 ATACTGTACA GCAGTATTTT TAGACGTATC CCAAGCATTC GACAAAGTCT GGCTCGACGG 3660
1820 CCTAATGTTT AAAATTAAAA CATCCCTACC CGAAAGCACA CACAAACTTC TAAAGTCTTA 3720
1821 CCTCTATGAC AGAAAGTTTG CAGTGCGGTG CAACACTGCC ACTTCCACTG TTCATACAAT 3780
1822 TGAGGCTGGA GTCCCCCAAG GCAGCGTTCT TGGGCCAACC TTATACCTCA TCTATACAGC 3840
1823 CGACATCCCT ACAAATAGTC GCTTAACGGT ATCCACATTT GCCGACGATA CAGCTATCCT 3900
1824 TAGCCGTTCA AGGTCCCCTA TCCAAGCTAC AGCACAGTTG GCACTGTACC TCATCGACAT 3960
1825 TGAGAAGTGG CTCTCTGACT GGCGAATAAA AGTAAACGAG CAAAAATGCA AGCACGTGAC 4020
1826 GTTTACGCTA AACAGACAAG ACTGTCCTCC GCTCTTGTTG AACAGCATAC CACTCCCGAA 4080
1827 AGCAGACGAG GTAACGTACC TAGGAGTACA CCTAGACAGA AGACTCACAT GGCGCAGGCA 4140
1828 CATTGAAGCC AAAAAAACCC AACTTAAACT CAAAGCCAAC AACTTACACT GGCTCATCAA 4200
1829 CTCTGGTTCT CCGCTCAGCC TAGATCACAA GGTCTTGCTC TACAATTCTA TATTGAAACC 4260
1830 AATCTGGACC TATGGCTCAC AGTTATGGGG CAATGCCAGC AACAGCAATA TTGACATCAT 4320
1831 TCAGCGAGCA CAATCAAAGA TTCTGAGAAC CATCACTGGG GCACCGTGGT ACGTTCGGAG 4380
1832 TGAAAACATC CAAAGAGACT TAAATATCCC ATCAGTTACC AACGCAATCA CGGAACTTAA 4440
1833 GGAAAAATAC CATAGCAAGC TTCACACGCA CCCCAACCAC CTAGCGCGAG GTCTAATCCA 4500
1834 GCTCAGCAGC CGTTCCCGTC TCCGGCGAAA GGACCTACCA ACCCAGCGAA TAAATTATTA 4560
1835 GGGCCGTTTA AACATAGAAC AGTTGGAAAA ATAATACAAC TGTTCAAAAA ATACTTGTTA 4620
1836 TAGTTAAGAT TTTTAAACTT ATTGTTAGTT CTTATACAAG AAGATTCAAT AAATAAAAGC 4680
1837 AAAGTAAAAT AAAAAAAAAA AAAAAAAA 4708
1838 //
1839 ID FB standard; DNA; INV; 4347 BP.
1840 XX
1841 AC X51937;
1842 AC X15469;
1843 XX
1844 DR FLYBASE; FBte0000466; Dmel\NOF.
1845 XX
1846 FT source join(X15469:94..1010,X51937:1..3430)
1847 FT SO_feature CDS ; SO:0000316:797..3874
1848 FT /name="Dmel\NOF\ORF"
1849 FT /db_xref="FLYBASE:FBgn0044029"
1850 FT /db_xref="SWISS-PROT:P16320"
1851 FT /db_xref="NCBI_PROTEIN:CAA36201.1"
1852 FT /translation="IQQLDTSANLTLNSTFPDDDPEFQITEASKNGPLPILYFNLELDL
1853 FT ELWRSIAPKKDQKTEKLQPNWTDTMAKLIYKKVPLPCAFNFRKAKLSDKVDNIWLRIEG
1854 FT YCNDCSSILKGHCLVKPDEQCGIMISVSVPDTRGIPHNKKRRCTGSRRLEIGNELILKK
1855 FT AALWRKEATDNMNDDDPEPSYIPNLPTLRKLREEATNRHLGITKDRDPVSSLYLKKYEG
1856 FT ELAGCILDIGLDEFFCIYCTGTQVKTYASRIKTIRKISIDATGSVVLPIQKPNGDSSYV
1857 FT FLYQIVMEGDDSIFPVFQMLSAKHDTASIQFWLSRFISKSGHFPLEVVSDFSLALLNGI
1858 FT SLSFNECRIATYIKKCFHSLLMEERTDLPPCYIRLDIAHLIKMICRKNVFKSKLPNLKD
1859 FT FYTRCIGLATTCETKDSFAELIKSVLIVALSQSSGEDEKGDILSSYRNEKYLLARIATF
1860 FT TAPDHKETIEDNCIPEDQEEIDEDVTDFISNIKIAAEEEALNCNSVNCRPNPYFLPELM
1861 FT PPLIKLCKYFVLWTNVMKEKFCSKYDVGSSALVEAYFKDLKNTDMSIFHRPVRADKFVV
1862 FT QHIRCIEAVCKLERAAMKRKTVKTPSFIKENAPKKMCSKETKGFLEEILEESEVEYLLQ
1863 FT EENWKVKNKTIKPTEGNDAEDNDTDDENKEMDLSEQPKEKPRGKYLKKCPNVELLYNRP
1864 FT HRRKQDEILHNGGSMGPVWIGKQLLQFKNTCPFDSLVEILSTAYIDNFYYKSLLDDFYT
1865 FT DNLTIELVKKYAVEGVSSSLYCDRGLVLKSFFDEKHQIIKCDANIGSFIEKALNGVPSA
1866 FT SSHRTHIKNNHDCRNQKYIHHRLEVIDVEKVGHLDVQEVVIPFIDEFFARTDGECKICG
1867 FT GQQILERQPGPHVILDIEFAMDAFHQIHHNGLPGTTTLLQVPEEILIQEKKYILSGAIE
1868 FT YVPAMGGEIGHYIAYCRRVIGSWEVHNDMCRQWKKFSALNTKMTLHILIYTRKN"
1869 XX
1870 CC Derived from X15469 (g7962) (Rel. 36, Last updated, Version 3).
1871 CC Derived from X51937 (g8297) (Rel. 44, Last updated, Version 6).
1872 CC Takis Benos and Michael Ashburner, 25-Aug-1997.
1873 CC Any changes to original sequence record are annotated in an FT line.
1874 XX
1875 SQ Sequence 4347 BP; 1461 A; 775 C; 885 G; 1226 T; 0 other;
1876 TATATTCTAT TGCCCACCAT ATAAACACGT GCCACTTTCC TAGTTTTAGG ATCTGCCTAC 60
1877 ATAACACGTG CAGACGCACA GGTGTTTCTG GGTTTATATA GACCAAAAAT TGGTTCCGAT 120
1878 TGCCAATCTT GTAATTTACA GTTTACCAGG TAATTACATA ATTTTCAAAC CTCACTTTAT 180
1879 GATAGGGTCC AATTTTTTAC CTGTGACAAA GTGTTAAATT TTTTAAGAAT GGGTTTTTCA 240
1880 TGGCAGGTCA GAATCCTCTA TAAAATCTAA AACACTTGTC GGTATTTGAA AATCGCTCTC 300
1881 CTCCTTGATT CTCATATTAG GTGTAAAAGA TAAATCCGGA ACTCATAATT AAAATATTTT 360
1882 TTATGTGAAA AAGTTGTGCG CGATTTTAAC TACGCTTACC CAGTGCTGGA AAAGTTAAAG 420
1883 TTGTTTTGTT TTTCAAAGAA AGTGAAAGTT GCTAAGCACG AACTTAAGAA ATCTGAGTGA 480
1884 TTGTGTTAAA TTTATTTGAA TCCTTGTGAA TTTTGTTGAC AGTCTTTTTA AAGACTTGCA 540
1885 AAATTTTCAT ATTATTCGGT TCTTGCTTTT ATTTTTATAC AACGCGTTTT TCCTTTAGGC 600
1886 ATACCTTTAT ACATTTACAG TGTAAACAAC AGTGTAAAAC GTGTAAATCA GTGCAAAATA 660
1887 GTTTTTTTTA TTTACTCCAT AAAAAATAAG TGTTACTGTC AGGATGCCGG CCAAACCGCA 720
1888 AGTCGATGGT CACACCTTAG TGGATGCATT TTGCTGCGCG AATATTTTTA CGGAGACTGG 780
1889 AGCTCTTAAG CCAAGAAGCG ATAAAGTTTG GATGGATATA AGCAACCAAT TGAAAGGAGC 840
1890 GATCAGCGCG AAGACGCTTA ATTTCTACGC CAGAATCAAT AGGAATAACA TGATAACTGT 900
1891 GGTTAAAGAA CGATGTGGAA TTCAACAGCT GGATACTAGT GCCAATTTAA CTTTAAATAG 960
1892 CACATTTCCT GATGATGACC CGGAGTTCCA GATCACCGAA GCTTCAAAAA ATGGACCATT 1020
1893 GCCTATTTTG TACTTTAACC TGGAGTTGGA CCTGGAATTG TGGAGATCAA TTGCCCCCAA 1080
1894 AAAGGATCAA AAAACTGAAA AACTGCAACC TAACTGGACG GATACTATGG CAAAGTTGAT 1140
1895 ATACAAAAAA GTTCCTCTTC CGTGTGCATT TAATTTTAGA AAAGCTAAAC TTTCCGACAA 1200
1896 AGTGGATAAT ATTTGGCTAC GAATTGAAGG CTATTGCAAT GACTGCAGCT CAATTTTAAA 1260
1897 GGGACATTGC CTTGTGAAAC CCGATGAACA ATGCGGCATA ATGATATCTG TTTCAGTACC 1320
1898 GGACACACGA GGTATACCTC ATAATAAAAA ACGACGGTGC ACTGGATCGA GACGACTTGA 1380
1899 AATTGGGAAC GAGTTGATTT TAAAAAAAGC TGCATTGTGG AGGAAGGAAG CCACCGACAA 1440
1900 CATGAATGAT GACGACCCAG AACCGAGTTA CATACCAAAT TTACCAACCC TTCGGAAACT 1500
1901 TCGTGAAGAG GCAACTAACA GACACCTAGG AATTACCAAG GATCGGGATC CAGTTTCATC 1560
1902 ATTATACCTT AAAAAGTATG AGGGTGAATT GGCTGGATGC ATTCTTGACA TTGGATTGGA 1620
1903 TGAATTTTTC TGCATATACT GCACAGGAAC CCAAGTAAAA ACATATGCAT CAAGGATAAA 1680
1904 AACTATTAGA AAGATTTCTA TTGACGCAAC TGGAAGCGTG GTGTTACCCA TCCAAAAACC 1740
1905 AAACGGTGAC TCTAGTTATG TTTTTCTGTA CCAAATTGTA ATGGAGGGTG ACGACAGTAT 1800
1906 ATTTCCAGTT TTTCAGATGC TGTCGGCTAA ACATGACACA GCCAGCATAC AGTTTTGGTT 1860
1907 AAGCAGATTT ATATCAAAGT CGGGGCATTT TCCACTGGAG GTTGTATCTG ATTTTTCCTT 1920
1908 GGCATTGCTA AATGGAATAA GCTTAAGCTT TAATGAGTGT AGGATTGCGA CGTATATAAA 1980
1909 AAAATGTTTC CACAGCCTTT TGATGGAGGA ACGGACGGAT CTGCCACCCT GCTATATTCG 2040
1910 ACTTGACATC GCCCACCTAA TTAAAATGAT ATGCCGGAAG AACGTCTTCA AAAGTAAATT 2100
1911 ACCGAACCTC AAGGATTTTT ATACTAGATG TATTGGTCTT GCAACAACGT GTGAGACAAA 2160
1912 GGACAGTTTT GCGGAATTAA TTAAATCAGT ACTGATTGTC GCACTGAGCC AATCCTCAGG 2220
1913 GGAAGATGAA AAAGGAGACA TTCTTTCAAG TTACAGGAAT GAAAAGTATC TGCTCGCCAG 2280
1914 AATAGCTACA TTTACTGCCC CGGATCACAA GGAGACCATT GAGGACAACT GCATACCAGA 2340
1915 GGACCAGGAG GAAATTGACG AGGATGTTAC GGACTTTATC TCTAATATTA AAATCGCTGC 2400
1916 CGAAGAAGAA GCGTTAAATT GCAATTCGGT CAACTGTCGG CCAAATCCGT ATTTCCTACC 2460
1917 TGAGCTAATG CCACCATTAA TTAAGTTGTG CAAATATTTT GTTTTATGGA CAAACGTGAT 2520
1918 GAAGGAAAAG TTCTGTTCCA AATATGATGT CGGCTCTTCG GCTCTTGTGG AAGCCTATTT 2580
1919 CAAGGATTTA AAAAACACGG ACATGAGCAT ATTCCACCGA CCAGTGAGAG CGGATAAATT 2640
1920 CGTGGTGCAA CATATCCGAT GCATCGAAGC TGTTTGCAAG CTGGAACGAG CCGCGATGAA 2700
1921 ACGCAAGACC GTTAAAACTC CCAGCTTTAT AAAAGAAAAC GCTCCTAAGA AAATGTGCAG 2760
1922 TAAGGAAACC AAGGGATTTC TGGAGGAAAT ACTTGAAGAA AGCGAAGTGG AATACCTTTT 2820
1923 ACAAGAAGAA AACTGGAAGG TGAAGAATAA AACAATAAAG CCCACGGAAG GAAATGATGC 2880
1924 TGAAGACAAC GACACTGATG ATGAAAACAA GGAAATGGAT TTAAGTGAAC AGCCCAAAGA 2940
1925 AAAACCAAGG GGAAAATATC TCAAAAAATG CCCCAATGTG GAGTTATTAT ACAATCGACC 3000
1926 ACATCGAAGG AAACAGGACG AAATTTTGCA TAATGGTGGA TCAATGGGAC CCGTCTGGAT 3060
1927 TGGCAAACAA TTATTGCAAT TCAAAAATAC TTGTCCGTTT GACTCTCTAG TGGAAATATT 3120
1928 GTCGACCGCA TACATAGACA ATTTTTATTA CAAAAGCCTA TTGGATGATT TCTACACTGA 3180
1929 CAACTTGACG ATAGAATTGG TGAAAAAGTA TGCCGTCGAG GGAGTTTCGT CCAGTCTCTA 3240
1930 CTGCGACAGA GGTCTGGTCC TAAAAAGTTT TTTTGATGAA AAACACCAGA TTATAAAATG 3300
1931 CGACGCAAAT ATTGGGTCTT TTATTGAAAA AGCGCTGAAT GGAGTACCCA GTGCGTCAAG 3360
1932 TCATCGGACC CATATAAAAA ACAACCATGA TTGCAGGAAC CAAAAATATA TCCACCATCG 3420
1933 GCTGGAGGTT ATAGATGTCG AAAAAGTTGG CCACCTCGAC GTCCAGGAGG TAGTGATCCC 3480
1934 CTTTATTGAT GAGTTTTTTG CAAGAACTGA TGGAGAATGT AAAATATGCG GTGGACAACA 3540
1935 GATCCTTGAA AGGCAGCCAG GACCGCATGT CATACTTGAT ATAGAATTTG CAATGGATGC 3600
1936 TTTTCATCAA ATTCATCATA ACGGTTTACC AGGAACGACC ACTTTACTTC AAGTGCCGGA 3660
1937 GGAAATTTTA ATACAGGAAA AGAAATATAT TTTAAGTGGT GCCATCGAAT ATGTTCCTGC 3720
1938 GATGGGAGGG GAAATTGGAC ATTACATTGC ATATTGCCGC AGAGTCATTG GATCTTGGGA 3780
1939 AGTGCACAAC GATATGTGCA GGCAATGGAA AAAGTTCTCA GCTCTAAATA CCAAAATGAC 3840
1940 ACTCCACATT TTGATATACA CCCGGAAAAA TTAATGTTTA TTTTTAAGCC TTGTTTAAAA 3900
1941 GTGTAAAAAA TATTTGTTGT TAAAAATTAC AATCTTAAGT CCTTTGCAAA CGTTGTTTAA 3960
1942 AAATAAAATT AAATTAATTA TTTTACAAAA CTTAACCCTT TTTCACTTTT ATACCTAATA 4020
1943 TAAAGAGGTC CGTAAAGTAT CAAGGAGGAG AGCGATTTTC AAATACCGAC AAGTGTTTTA 4080
1944 GATTTTATAG AGGATTCTGA CCTGCCATGA AAAACCCATT CTTAAAAAAT TTAACACTTT 4140
1945 GTCACAGGTA AAAAATTGGA CCCTATCATA AAGTGAGGTT TGAAAATTAT GTAATTACCT 4200
1946 GGTAAACTGT AAATTACAAG ATTGGCAATC GGAACCAATT TTTGGTCTAT ATAAACCCAG 4260
1947 AAACACCTGT GCGTCTGCAC GTGTTATGTA GGCAGATCCT AAAACTAGGA AAGTGGCACG 4320
1948 TGTTTATATG GTGGGCAATA GAATTTA 4347
1949 //
1950 ID DMTNFB standard; DNA; INV; 1106 BP.
1951 XX
1952 AC V00246; J01084;
1953 XX
1954 DR FLYBASE; FBte0000288; Dmel\FB.
1955 XX
1956 FT source V00246:1..1106
1957 XX
1958 CC Derived from V00246 (g8708) (Rel. 36, Last updated, Version 3).
1959 CC Josh Kaminker 2 Aug 2002.
1960 CC Any changes to original sequence record are annotated in an FT line.
1961 XX
1962 SQ Sequence 1106 BP; 340 A; 228 C; 119 G; 419 T; 0 other;
1963 AGCTCAAAGA AGCTGGGGTC GGAAAAATCG AATTTTTGAA ATTTGAAAGC TGGAATCGTT 60
1964 TGCCCATTTT TTGCCCATGT TTGCCCACCA ATTAGTTTTT TTTGCCCACG TCCAGTTTTT 120
1965 GAGATATGGA TTTTCGAAAA AGTTCGAAAA TGTTCGAAAA TCAAAAATTT CGCTTTTTTC 180
1966 AAATTTTTTT TTTTTTAAAT CGCAATAACA TCGTTTGCCC ACGTTTGCCC ACCCTTTAGA 240
1967 ATTTTGAAAA AATTTATACT TTAGAAAATA TAAGGCTTTT AAGTTTACCT CGGTCTAATC 300
1968 AGAGAGTAAA TCGTTTGCCC ATCTCTTAAA ACCAAATATT ATCAACAAAA AACGTTTGCC 360
1969 CAACCATTAT TATTAGTTTT TATCGTTTGC CCACCCTTTA AAAAACCTTT AACAAAATTT 420
1970 TTTTTTCGAT TGCCCACACT TGAAATACAA CCAATTTCGT TAGCCCACCT CTTCAAAATA 480
1971 AATATTTCCA ATAAAAAACG TTTTCCCACC ATTTAAAAAT AAATAATTTC GATTGCCCAT 540
1972 CCTTCAAAAT TCATTTTAAC GTTTGCCCAC CCTTTAAAAT TTGTTTTTTT CGTTTGCCCA 600
1973 CTCTTAAAAC TAAATAATTT CGATTGCCCA CCTTTTAAAA CTAAATAATT TCGTTTGCCC 660
1974 ATCCTTTAAA ATTCATTTTT AACGTTTGCC CACCCTTTAA AAATAAATTA TTTCGTTTGC 720
1975 CCACCCTTTA AAATTTGTTT TTTTCGTTTG CCCACTCTTA AAACTAAATA ATTTCGATTG 780
1976 CCCACCTTTT AAAACTAAAT AATTTCGTTT GCCCATCCTT TAAAATTCAT TTTAACGTTT 840
1977 GCCCACCCTT TAAAAATAAA TTATTTCGTT TGCCCACCCT TTAAAAGTTT TTTTTTTTCG 900
1978 TTTGCCCACT CTTAAAACTA AATAATTTCG ATTGCCCACC TTTTAAAACT AAATAATTTC 960
1979 GTTTGCCCAT CCTTTAAAAT TCATTTTTAA CGTTTGCCCA CCCTTTAAAA TTTGTTTTGT 1020
1980 AAGATGTGGC GCCAATTCAG ATATTTTAGG ATCGGCGGAT AGAAGCACTT ACTTATATGA 1080
1981 TGATGATGAA CATACATAGA CATAAT 1106
1982 //
1983 ID DMREPG standard; DNA; INV; 4346 BP.
1984 XX
1985 AC X06950;
1986 XX
1987 DR FLYBASE; FBte0000657; Dmel\G-element.
1988 XX
1989 FT source X06950:1..4346
1990 FT SO_feature CDS ; SO:0000316:220..951
1991 FT /name="Dmel\G-element\ORF0"
1992 FT /db_xref="FLYBASE:FBgnXXXXXXX"
1993 FT SO_feature CDS ; SO:0000316:819..1539
1994 FT /name="Dmel\G-element\ORF1"
1995 FT /db_xref="FLYBASE:FBgnXXXXXXX"
1996 FT SO_feature CDS ; SO:0000316:join(1530..1858,1866..1973,1982..2719,2727..3008,3012..3800,3806..3991,4006..4095)
1997 FT /name="Dmel\G-element\ORF2"
1998 FT /db_xref="FLYBASE:FBgnXXXXXXX"
1999 XX
2000 CC Derived from X06950 (g8427) (Rel. 16, Last updated, Version 1).
2001 CC Takis Benos and Michael Ashburner, 20-Aug-1997.
2002 CC Any changes to original sequence record are annotated in an FT line.
2003 XX
2004 SQ Sequence 4346 BP; 1215 A; 1356 C; 959 G; 816 T; 0 other;
2005 ACAGTCGCGA TCGAACACTC AACGAGTGCA GACGTGCCTA CGGACCGACG GCAAGTTATT 60
2006 TTCGTGCTCA AAGTCCCGCT ACTCTAAAAC CGCTACGTAG TGTCGCGAGA TTTCTTCGCG 120
2007 CACCGTGATT GGTTCAGCCG GCGAACCTTA CGGTATCGCT ACCACTACCA ACGCACTCGT 180
2008 GCGTGCGTGT TATCGGTATC AACAGTTACA TTCGGCTAAA GTTACTGCGA ACAACTCAGC 240
2009 AGCAGCCACG TGCTGAGGCT GGTACACCAA CAAACGGTTC CTACCGTGCC CTCCTCCCCT 300
2010 CCTTCCCTAC TCCGGGACAA CATGGACTGG CAAGCCCCCC CGCGACCCAC CAAGCTGACC 360
2011 AAAGTGCCTA GAAAGAAGGC GCTCAAAGAG GCGCCAGGAG AAGGTGAAAG CAGCTGCTCA 420
2012 AGCGATAGCA GCTCCTCGGA GTCAGAGCCT GGGGAAGTCA AGCGCAAAGC AGCGAGCAGA 480
2013 GACGCTAAGG AAGCCGCCGA CAACGTGCCC AACACCAGCG CAGCTCTGCG CAAGAAGCTG 540
2014 GAAAATAACT CCTTCGCCCT TCTGTCCAGC ACTGAGGACG AAGACGATGA CGACGACAAC 600
2015 ACCGACAACG AGCAGCAAAC CCCTGTTGGG GAATCTGCTC CAAAAACCAT GAAAAAACCC 660
2016 AACCCGACCC CGAAGACCAT CAAGCCACCC CCGATCTACA TCCCAGACGT GACCAACATC 720
2017 TCAGCCCTTG TCAGGATGAT TACGACTCTC GTCGGTGCCC ACAAGGAATT CTCGTACAAA 780
2018 ACTGAGAGAA ACAACAATGT ACGAGTAATG ATGCCTGACA AGGAATCCTA CTCAGCCTTT 840
2019 CGTCAGCAGC TTGTGACCCA GAACAAAAGG CACCGCACAT TTCAACTGTC AGGGACCTGC 900
2020 ACAACCCAAT TGGCAAAAAA TCAAAGGAAC CCCTGGGGAT CTTCTTTGTA AACCTGGAAC 960
2021 CTGCGAGCAA CAATACAGAC ATCTACAAAC TCAAGAGAAT CTGCAGGTCG GTCGTCACCG 1020
2022 TTGAGCCGCC TCTGAAATTC AACGATGTTC CGCAGTGCTT CAGATGTCAA GGGTTCGGAC 1080
2023 ACACCCAGCG CTACTGCTTT TTAGAGTTTC GCTGCGTCAA GTGTGGTGGC CTCCACGACT 1140
2024 CCAGGGCGTG TGAAAAAAAG GAAGACGAGA AAGCATGCTG CCTACACTGT CAAGCCGACC 1200
2025 ATCCAGCGTC GTTCAAAGGG TGCCCCGCGT ATAAGAAGGC AAAGGCTCAA CAAGCTCCTA 1260
2026 AACCCAAAGC AAGGAGCATG GAAAGCAACA ACAAGCCCTC CTTTGAGCTC CCAAATATTA 1320
2027 CAAACGGTAT GAGCTATAGA GACGCGCTAA GTGGCACACG CAAGTCCCAA GCAAGCACTC 1380
2028 CCCCACCGAC ACCCCCAACC CCACCTGAAG CCCCACAACC TAACCACATG GAGGCTATGT 1440
2029 TCACTCGATT TGAGAGCCTG GTCGAAAGAA TGATGGAGAA GATGTTTGCT CAGGTGACGC 1500
2030 AGCTTGTTGC TTCCATCCTC AACAGCAAGT CATGCAAATA AGTCTCAACA TAGTCTTCTG 1560
2031 GAACGCGAAC GGCTTGCAGA GAAGCAAAGC CGAAGTTGAG CACACCATCA AAACCGACAA 1620
2032 CATCGATATT TTATTGGTCT CAGAATCCCA TTTTTGCCCC AGATCCCACT TCATCATCTC 1680
2033 CGGTTACGAC CTCATCACAG CCAACCACCC ATCAGGTAGA GCTCGAGGAG GAGCGGCCAT 1740
2034 GCTCATCAAA AGCGGCATAC AGTTCACTGA ACTGCCTGCG ATACAGGAGG ATTGGGCACA 1800
2035 GTGTGCAGTG GCCAGAGTCA ATAGCCTACA GGGAGATATT ACGGTTGGAG CGGTTTACTT 1860
2036 CCACCCCCAG GCACGCGATT ACAGAGACTC ACCTGCATGA GTTCTTCGAG TCCCTCGGAA 1920
2037 CTCGCTTCAT TGCAGCCGGA GACTTCAATG CAAAGCACTC CTGGTGGGGG TCCGCACAAA 1980
2038 CAACCCCAAA GGCAAAACGC TCCACAAGTA CCTGATGCGC AAAAACTTGG ACTGCCACTC 2040
2039 TACTGGAGAG CCCACACACT GGCCCTCGGA CCCTTCTAAG CAGCCGGATC TGCTGGACAT 2100
2040 CGCGATCTGC AAAGGCATAG GTCGTGCCAA ACTCGTCTGC ACTACATACG ACAGGCTCGT 2160
2041 ATCGGACCAC AGCGCCGTCA ACCTGCTCCT CAACATCCCT GTCCTCAGGA AGACGCCGCT 2220
2042 CCGTAGACTC ACGGGGAATC GCACCAATGC CCCCAAGTTC ACGTTCTGGA TGCTCTCCTC 2280
2043 CCTAAACCCA GACCCAGACC TCTCCACTCC AGGCAATATA GGCGCGGCCA TCGAAAAACT 2340
2044 GAACAAGGAG ATGCACAACG CCGCTGAGTT TGCGAACCCT CCTCCTCCTA CAACCCCGAG 2400
2045 AACTCCCGCA AGAGACCTGC ATTTGTGGTC CCCAGAAATC GCCGCCCTCG TGGCCGAGAA 2460
2046 GAGACGCCTC AGACGAGTAT GGTTCCTCTC GCGTAACCCC AGGGACAAGA CAGCGCTCAA 2520
2047 TCGCGCCTCC AAGGAACTCA AGGACAAACT AACCACCCTA CGCCAAGACT CGTTTCAACG 2580
2048 ATTCCTTGAA GATCTGGAAC CTGGAGACCC GCAGCACAAC CTGTGGATCG TCACGCGGCA 2640
2049 CATCAAAAGA CCCGCCAAGA AAATGGTACC AGTGCGTACA GCAGACTGCT CCTGGTGTCG 2700
2050 GTCTGAGGCA GAAAGAGCCG AAGCTTGCTG ACCACCTTCG CTCTGCCTTC ACTCCGTTTG 2760
2051 ACCGATGCAC AGCTGCAGAG CAAGCTGACA CCATCAGAGC TGTTGAAAGC CCATGTGCTC 2820
2052 CAGGACCTGC AATTCAGCCC GTCGCACCAG AGGAGATCGC GCAGGAAATT GCCTCGCTCA 2880
2053 GAAACGGCAA GTCTCCCGGC CCTGATCGCA TCGACGCTAC TGCGTTAAAA ATGTTGCCCA 2940
2054 CATTCTGCTC ACAGCTGCTT GCCAACATTT TTAACAGCTG CTTCCGGCTA GGGTATTTCC 3000
2055 CAAAACAATA GAAACGCGCC GAAGTGATTA CCATCCCCAA GCCCGGCAAA CCTGAAGCCA 3060
2056 ATCTTGCCTC CTATCGTCCG ATAAGTCTGC TGGCAATCCT CTCCAAAATA CTCGAAAGAG 3120
2057 TATTTCTGCG CAGAGTGCTG CCAGTACTGG ATGAGGCTGG TTTGATCCCC GATCACCAGT 3180
2058 TTGGCTTCAG GCGCTCCCAC GGAACACCAG AGCAATGCCA CCGGCTTGTA GAGCAAATTT 3240
2059 TGGAGGCCTT CGAAAGGAAG CAATACTGCT GCGCCGTCAT GCTGGATGTG AAGCAGGCCT 3300
2060 TCGACAAAGT CTGGCACCCT GGACTCCACT ATAAAATCAA GACTCACCTT CCCGGATCCC 3360
2061 ACTTCGCCTT CCTCAAATCA TTCACTGAGG GTAGAGAGTT CCAAGTTTGC TGCGGAACAG 3420
2062 CGACCAGCAC GCCTAGGCCG ATAAGAGCCG GAGTACCCCA AGGCAGCGTC CTTGGACCAA 3480
2063 TACTGTACAC ACTCTACACA GCAGACCTTC CTATCACACC CTCCCGGAGC CTAACAGTGG 3540
2064 CCACATATGC CGATGACACC GCCTTCCTAG CCTCCGCCTC AGACCCCCAA GAAGCATCAA 3600
2065 CCATCATTCT AAGCCAGCTG GATGCCCTCG ACCCATGGTT GAAACGATGG ACCATTGCCG 3660
2066 TGAACGCAGA CAAATCCTCC CAAACCACTT TCTCCCTGCG CAGAGGAGAC TGCCCCCCAG 3720
2067 TCACGCTCAA CGGGGAAACT ATTCCAACCT CAAGTTCCCC GAAATACCTT GGATTGACTC 3780
2068 TAGACCGGAG GCTCACTTGG CACACCAGGC TGACCTGCGC CTCAAGCAAC TCCACTGGCT 3840
2069 CATCGGGAAA AGGTCCAAAC TTAGGGAAAA CCTTAAACTC CTCCTGTACA AGGCCATCCT 3900
2070 GAAGCCAATT TGGACTTATG GGATTCAGCT GTGGGGCACT GCCAGCATCT CAAACCGCAA 3960
2071 CCGCATACAG CGCTTCCAGA ACAAGTGCCT GAGTCAATCG CTGACGCTCA CCCATACCAT 4020
2072 GAAAACTCCG TTATCCACAA GGAGCTTGGA ATGCCATGGG TAGCAGAGGA GATCTCCCGC 4080
2073 TTCAGCGAGA GATACGCTAA ACGACTGGAC AACCACCCTA ACCATCTGGC TATTAACCTC 4140
2074 CTGGACAACA GTGAAACCAT CAGACGCCTC CAGAGGAAAC ACCCGCTTGA TCTCCACCAC 4200
2075 CTATAACCCA CAACAATGAA CCCCCGACCA ATCTACAACT TTGTAATCCC TTAAGTTAAT 4260
2076 GCCCCCCCCA CCCAAACATT TAATTATTGT CCACATGGAC AGATTTTAAA TTAATACATA 4320
2077 GATCGCTAAA AAAAAAAAAA AAAAAA 4346
2078 //
2079 ID DMGYPF1A standard; DNA; INV; 7469 BP.
2080 XX
2081 AC M12927;
2082 XX
2083 DR FLYBASE; FBte0000021; Dmel\gypsy.
2084 XX
2085 SY synonym: mdg4
2086 XX
2087 FT source M12927:1..7469
2088 FT SO_feature five_prime_LTR ; SO:0000425:1..482
2089 FT SO_feature three_prime_LTR ; SO:0000426:6841..7411
2090 FT SO_feature polyA_site ; SO:0000553:7277..7280
2091 FT SO_feature primer_binding_site ; SO:0005850:482..492
2092 FT /bound_moiety="tRNA:lys2"
2093 FT SO_feature CDS ; SO:0000316:1080..2435
2094 FT SO_feature start_codon ; SO:0000318:1..3
2095 FT /name="Dmel\gypsy\gag"
2096 FT /db_xref="FLYBASE:FBgn0014965"
2097 FT /db_xref="SWISS-PROT:P10405"
2098 FT /db_xref="NCBI_PROTEIN:AAA70218.1"
2099 FT /translation="MSWAHNYRKVKVEYESEDSWEEEQVGQALGRPLDSATVDITMDPN
2100 FT QIQALIDNAVRQALSQQQSQFQTQLNSLAARVQSLQVEAPQIKIYEKVSVNPDVRCDIP
2101 FT LDIIKSVPEFSGTQDEYVAWRQSAIYAYELFKPYNGSSAHYQAVAILRNKIRGAAGALL
2102 FT VSHNTVLNFDAILARLDCTYSDKTSLRLLRQGLEMVRQGDLPLMQYYDEVEKKLTLVTN
2103 FT KIVMTHEQEGADLLNAEVRADALHAFISGLKKALRAVVFPAQPKDLPSALALAREAEAS
2104 FT IERSMFANSYAKAVEERAHSGANGKSRFQGKPNKEEQGQDRNPHFTKRPKNNGQTNKDT
2105 FT QAQAPQPMEVDSSSRFRQRTEHYQNHPNESNAFKRRNSSERSTGPRRQRLNNVVQEAPK
2106 FT QKDPKEEYEKTAKAAVEEIDSENEYAPSDDSLNFLGGAPGCRSLNDGWLGEP"
2107 FT SO_feature CDS ; SO:0000316:2438..5470
2108 FT SO_feature start_codon ; SO:0000318:1..3
2109 FT /name="Dmel\gypsy\pol"
2110 FT /db_xref="FLYBASE:FBgn0014966"
2111 FT /db_xref="SWISS-PROT:P10401"
2112 FT /db_xref="NCBI_PROTEIN:AAA70219.1"
2113 FT /translation="MLIDTDAAKNYIRPVKELKNVMPVASPFSVSSIHGSTEIKHKCLM
2114 FT KVFKHISPFFLLDSLNAFDAIIGLDLLTQAGVKLNLAEDSLEYQGIAEKLHYFSCPSVN
2115 FT FTDVNDIVVPDSVKKEFKDTIIRRKKAFSTTNEALPFNTAVTATIRTVDNEPVYSRAYP
2116 FT TLMGVSDFVNNEVKQLLKDGIIRPSRSPYNSPTWVVDKKGTDAFGNPNKRLVIDFRKLN
2117 FT EKTIPDRYPMPSIPMILANLGKAKFFTTLDLKSGYHQIYLAEHDREKTSFSVNGGKYEF
2118 FT CRLPFGLRNASSIFQRALDDVLREQIGKICYVYVDDVIIFSENESDHVRHIDTVLKCLI
2119 FT DANMRVSQEKTRFFKESVEYLGFIVSKDGTKSDPEKVKAIQEYPEPDCVYKVRSFLGLA
2120 FT SYYRVFIKDFAAIARPITDILKGENGSVSKHMSKKIPVEFNETQRNAFQRLRNILASED
2121 FT VILKYPDFKKPFDLTTDASASGIGAVLSQEGRPITMISRTLKQPEQNYATNERELLAIV
2122 FT WALGKLQNFLYGSREINIFTDHQPLTFAVADRNTNAKIKRWKSYIDQHNAKVFYKPGKE
2123 FT NFVADALSRQNLNALQNEPQSDAATIHSELSLTYTVETTDKPLNCFRNQIILEAARFPL
2124 FT KRNLVLFRSKSRHLISFTDKSWLLKTLKEVVNPDVVNAIHCDLPTLASFQHDLIAHFPA
2125 FT TQFRHCKNVVLDITDKNEQIEIVTAEHNRAHRAAQENIKQVLRDYYFPKMGSLAKEVVA
2126 FT NCRVCTQAKYDRHPKKQELGETPIPSYTGEMVHIDIFSTDRKLFLTCIDKFSKYAIVQP
2127 FT VVSRTIVDITAPLLQIINLFPNIKTVYCDNEPAFNSETVTSMLKNSFGIDIVNAPPLHS
2128 FT SSNGQVERFHSTLAEIARCLKLDKKTNDTVELILRATIEYNKTVHSVTRERPIEVVHPG
2129 FT AHERCLEIKARLVKAQQDSIGRNNPSRQNRVFEVGERVFVKNNKRLGNKLTPLCTEQKV
2130 FT QADLGTSVLIKGRVVHKDNLK"
2131 FT SO_feature CDS ; SO:0000316:join(567..568,5551..7000)
2132 FT SO_feature start_codon ; SO:0000318:1..3
2133 FT /name="gypsy\env"
2134 FT /db_xref="FLYBASE:FBgn0014964"
2135 FT /translation="
2136 FT MFTLMMFIPLVVANARITDFSHANYIPVLDGDVLVFEQRDLLKHSSNLSE
2137 FT YASMIDETQKLSESFPHSHMRKLLEVDTDHLRTLLSVLKVHHRIARSLDF
2138 FT LGTALKVVAGTPDATDLFKIKITEAQLVESNSRQIAINSETQKQINKLTD
2139 FT TINKVINARKGDLVDTPHLYEALLARNRMLSTEIQNLILTITLVKSNIIN
2140 FT PTILDHADLKPLVEQDTPIVSLIEASKIRVLQSENSIHILIAYPRVKFSC
2141 FT KKVAVYPVSHQHTILRLDEDTLAECEHDTFAVTGCTDTTHFTFCERSRRE
2142 FT TCVRSLHAGNAAQCHTQPSHLREINPVDDGVVIINEAAAHVSTDGSPETL
2143 FT IEGTYLVTFERTATINGSEFVNLRKTLSKQPGIVRSPLLNIVGHDPVLSI
2144 FT PLLHRMSNENLHSIQNLMDDVESEGSPRLWFVAGVVLNFGLIGSLALYLA
2145 FT LRRRRASREIQRTIDTFNMTEDGHKLEGGVVNN"
2146 XX
2147 CC Derived from M12927 (g157583) (Rel. 44, Last updated, Version 6).
2148 CC Takis Benos and Michael Ashburner, 20-Aug-1997.
2149 CC Any changes to original sequence record are annotated in an FT line.
2150 CC [See also:AF033821; alignments in /alignments/gypsy]
2151 XX
2152 SQ Sequence 7469 BP; 2301 A; 1808 C; 1602 G; 1758 T; 0 other;
2153 AGTTAACAAC TAACAATGTA TTGCTTCGTA GCAACTAAGT AGCTTTGTAT GAACAATGCT 60
2154 GACGCGCCAG AATTGGGTTC AACGCTCCAC GCGAAGAATG CCTGGCAGCG GAAAGCTGAC 120
2155 ACTTCCTACC GGGAGTGTTG CTTCACGCTG CAAGAAATGC TGAGTCGGCT TGCCGACTTG 180
2156 TGGCGGCGCG ATGCATTGCT CGAGGGTAAA CTTAGTTTTC AATATTGTCT TCTACTCAGT 240
2157 TCAAATCTTG TGTCGAAATA AACCACAGCT TGCTCCGGCT CATTGCCGTT AAACATCATT 300
2158 GTTCTTATTT ACAATCAAAT CGCTATCGCC ACAAGGCTAG TGATAATAAC TAAGGGGGCG 360
2159 AAGTCAAGCC CTCCAACCTA ATCTCCATAA ACAGTGTCTA AGACGAACCT CAGCGAAAGA 420
2160 AGGAAGATCT CTAGACCTAC TGGAAATAAC ATAACTCTGG ACCTATTGGA ACTTATATAA 480
2161 TTGGCGCCCA ACCAACAATC TGAACCCACC AATCTAATTT AACACACTTT GTCAGGCGAC 540
2162 AAACAGGGTA GTTAAGTTAG AAAAGCATGT AAGTTTTACA AGACACTTCT TTGACGCAAT 600
2163 CAAGAAATTT ACGAGTGAAA AAAAAAAAAA AAAAAAGTTG TGTATCTGGC CACGTAATAA 660
2164 GTGTGCGTTG AATTTATTCG CAAAAACATT GCATATTTTC GGCAAAGTAA AATTTTGTTG 720
2165 CATACCTTAT CAAAAAATAA GTGCTGCATA CTTTTTAGAG AAACCAAATA ATTTTTTATT 780
2166 GCATACCCGT TTTTAATAAA ATACATTGCA TACCCTCTTT TAATAAAAAA TATTGCATAC 840
2167 TTTGACGAAA CAAATTTTCG TTGCATACCC AATAAAAGAT TATTATATTG CATACCCGTT 900
2168 TTTAATAAAA TACATTGCAT ACCCTCTTTT AATAAAAAAT ATTGCATACG TTGACGAAAC 960
2169 AAATTTTCGT TGCATACCCA ATAAAAGATT ATTATATTGC ATACCTTTTC TTGCCATACC 1020
2170 ATTTAGCCGA TCAATTGTGC TCGGCAACAG TATATTTGTG GTGTGCCAAC CAACAACCAA 1080
2171 TGAGTTGGGC ACATAACTAC AGAAAGGTTA AGGTCGAATA CGAAAGCGAG GATAGCTGGG 1140
2172 AGGAGGAGCA AGTAGGCCAA GCATTAGGTC GGCCGTTAGA TAGTGCCACG GTAGATATTA 1200
2173 CCATGGACCC CAATCAGATT CAAGCTCTTA TCGACAATGC TGTCAGACAG GCATTGTCGC 1260
2174 AACAGCAATC CCAATTTCAG ACACAACTCA ATTCCCTAGC TGCGCGGGTA CAGAGTTTGC 1320
2175 AGGTGGAAGC ACCGCAAATC AAGATTTACG AAAAAGTCTC TGTTAACCCC GATGTTAGGT 1380
2176 GCGACATTCC CCTTGACATA ATAAAGTCTG TACCAGAGTT CTCCGGTACC CAAGACGAGT 1440
2177 ATGTGGCCTG GAGACAATCG GCCATATACG CCTACGAGCT CTTCAAACCA TACAATGGCA 1500
2178 GCAGTGCCCA TTATCAGGCT GTTGCCATAT TAAGGAATAA AATCCGTGGC GCAGCCGGGG 1560
2179 CTTTACTGGT CTCCCACAAT ACGGTATTGA ACTTCGATGC TATTTTGGCC AGACTAGACT 1620
2180 GCACGTACTC GGACAAAACA TCCTTACGCC TGTTGAGGCA AGGATTGGAA ATGGTTAGGC 1680
2181 AAGGAGACCT ACCACTAATG CAATACTACG ATGAAGTTGA AAAGAAGCTA ACGCTTGTCA 1740
2182 CTAACAAAAT CGTAATGACG CATGAACAAG AGGGTGCTGA CCTGCTTAAC GCTGAGGTCA 1800
2183 GAGCCGACGC CCTGCATGCT TTTATTTCGG GGCTCAAAAA GGCCCTCAGA GCTGTGGTCT 1860
2184 TCCCGGCCCA ACCAAAAGAC CTGCCATCTG CACTGGCTTT AGCTAGAGAA GCAGAGGCAA 1920
2185 GCATAGAGAG AAGCATGTTC GCTAACTCCT ACGCCAAGGC CGTAGAGGAG CGAGCGCATT 1980
2186 CGGGGGCAAA CGGCAAGAGC CGTTTCCAGG GGAAGCCAAA TAAAGAAGAA CAGGGACAGG 2040
2187 ACAGGAATCC CCACTTCACC AAACGCCCCA AAAATAACGG ACAAACCAAC AAGGACACTC 2100
2188 AGGCGCAAGC ACCCCAGCCA ATGGAGGTCG ATTCATCCTC CAGGTTTAGG CAGCGTACTG 2160
2189 AACATTATCA GAATCATCCT AACGAGTCGA ACGCGTTTAA GAGGAGAAAT TCCTCAGAAC 2220
2190 GCTCAACAGG ACCGAGACGA CAACGTCTGA ATAACGTTGT CCAAGAGGCC CCTAAACAAA 2280
2191 AGGACCCCAA AGAAGAGTAT GAAAAAACAG CAAAGGCTGC AGTCGAGGAA ATCGACAGCG 2340
2192 AAAATGAGTA CGCTCCCAGT GACGACTCGT TGAATTTTTT AGGGGGCGCT CCCGGTTGCC 2400
2193 GTTCATTGAA CGACGGCTGG CTGGGAGAAC CTTAAAGATG CTAATCGATA CCGACGCGGC 2460
2194 AAAAAACTAC ATTAGGCCCG TAAAGGAGCT GAAAAATGTA ATGCCGGTCG CCAGCCCTTT 2520
2195 CTCGGTGAGC TCAATACACG GCTCCACCGA AATCAAACAC AAATGCTTGA TGAAAGTCTT 2580
2196 CAAGCACATC TCCCCATTTT TTCTTTTGGA TTCTCTCAAT GCGTTCGACG CTATCATAGG 2640
2197 CTTGGACCTG TTAACACAGG CCGGGGTAAA ACTCAACCTT GCAGAGGACT CCTTAGAATA 2700
2198 CCAGGGCATC GCTGAAAAGC TTCATTATTT CAGCTGCCCC AGTGTAAATT TCACTGATGT 2760
2199 AAACGATATT GTTGTACCTG ACTCCGTTAA AAAGGAGTTC AAGGACACAA TAATAAGGAG 2820
2200 GAAGAAAGCT TTCTCCACAA CAAATGAAGC TCTTCCTTTT AACACCGCTG TCACTGCCAC 2880
2201 AATTCGGACA GTTGACAATG AACCGGTGTA CTCAAGAGCG TACCCAACTC TTATGGGTGT 2940
2202 CTCCGACTTT GTGAACAACG AGGTCAAACA ACTGCTGAAA GACGGCATTA TCAGGCCCTC 3000
2203 AAGGTCTCCC TATAACAGCC CGACCTGGGT TGTTGACAAA AAGGGGACCG ACGCCTTCGG 3060
2204 GAACCCAAAC AAGAGGTTGG TCATTGACTT CAGGAAGCTA AATGAGAAAA CTATTCCTGA 3120
2205 CCGGTACCCG ATGCCTAGCA TTCCCATGAT TCTAGCGAAT CTGGGCAAGG CAAAGTTCTT 3180
2206 CACTACCCTT GATCTTAAGT CAGGGTATCA TCAAATTTAC CTCGCGGAAC ACGACCGCGA 3240
2207 GAAGACATCG TTCTCGGTGA ATGGTGGTAA ATACGAGTTT TGCCGTCTAC CGTTCGGCTT 3300
2208 GAGAAATGCA AGCAGCATTT TTCAAAGAGC CCTAGACGAT GTGCTTAGAG AGCAAATCGG 3360
2209 GAAGATATGT TACGTCTATG TAGATGACGT CATAATTTTC TCTGAAAACG AGTCCGACCA 3420
2210 TGTCCGCCAC ATCGATACAG TACTAAAATG CCTGATCGAT GCCAACATGA GAGTAAGCCA 3480
2211 GGAGAAAACT AGATTCTTTA AAGAGAGTGT AGAATACCTC GGCTTTATTG TCAGTAAGGA 3540
2212 CGGAACTAAA TCCGATCCAG AGAAGGTGAA GGCCATTCAG GAGTACCCTG AACCAGACTG 3600
2213 CGTTTACAAG GTTAGGTCCT TCCTTGGTTT AGCCAGCTAC TACAGAGTCT TCATCAAAGA 3660
2214 CTTTGCTGCC ATAGCCCGCC CGATCACCGA TATCCTAAAA GGGGAAAATG GTTCGGTGAG 3720
2215 CAAACACATG TCTAAAAAAA TTCCTGTTGA GTTTAATGAA ACTCAACGCA ACGCGTTCCA 3780
2216 AAGACTGCGA AACATACTAG CATCCGAGGA TGTCATACTC AAATACCCCG ACTTTAAAAA 3840
2217 GCCTTTTGAC CTTACTACAG ATGCTTCGGC AAGTGGTATC GGTGCAGTCC TATCCCAGGA 3900
2218 GGGCAGGCCA ATCACCATGA TATCGCGTAC CCTTAAACAG CCCGAGCAGA ACTACGCCAC 3960
2219 AAACGAAAGG GAATTGCTGG CGATTGTATG GGCCCTAGGT AAGTTGCAGA ACTTCCTGTA 4020
2220 TGGCTCTAGG GAGATTAATA TATTTACCGA CCATCAACCC CTCACTTTCG CTGTTGCCGA 4080
2221 CAGGAACACG AATGCCAAGA TAAAGAGGTG GAAATCTTAC ATAGACCAGC ATAATGCCAA 4140
2222 GGTTTTCTAC AAACCTGGCA AAGAAAATTT CGTGGCAGAC GCCCTCTCTA GGCAGAATCT 4200
2223 GAATGCCTTA CAAAACGAAC CCCAATCAGA CGCTGCGACC ATTCACAGTG AGCTCTCCCT 4260
2224 GACCTACACG GTCGAGACAA CAGACAAACC GTTAAATTGC TTCAGGAACC AGATCATTCT 4320
2225 GGAGGCAGCA CGTTTTCCGC TCAAACGAAA CCTGGTGCTC TTTCGAAGCA AATCTCGCCA 4380
2226 CTTAATCAGC TTTACTGATA AAAGTTGGCT ATTAAAAACA CTTAAGGAGG TGGTAAACCC 4440
2227 TGACGTCGTG AACGCTATTC ACTGCGACCT GCCCACTCTG GCAAGCTTCC AACACGACCT 4500
2228 CATTGCCCAC TTTCCAGCCA CCCAATTTCG TCACTGTAAG AATGTCGTGT TAGACATAAC 4560
2229 CGACAAAAAC GAACAGATCG AAATCGTCAC TGCCGAGCAC AACCGCGCTC ACAGAGCCGC 4620
2230 ACAAGAAAAC ATTAAACAAG TCCTTCGGGA TTATTACTTT CCCAAAATGG GCAGTTTAGC 4680
2231 TAAAGAAGTA GTAGCTAATT GTAGGGTCTG CACCCAAGCA AAGTATGACA GGCACCCGAA 4740
2232 AAAGCAAGAG CTCGGGGAAA CGCCCATACC CAGCTATACA GGTGAGATGG TGCATATTGA 4800
2233 CATATTCTCA ACCGACAGGA AGCTATTCCT GACGTGTATT GACAAATTTT CTAAATATGC 4860
2234 AATAGTGCAA CCAGTGGTGT CTAGAACAAT AGTGGACATC ACAGCACCCC TGTTGCAGAT 4920
2235 CATTAACCTG TTCCCCAATA TCAAAACGGT CTATTGTGAC AATGAGCCCG CATTTAACTC 4980
2236 AGAAACTGTC ACCTCAATGC TCAAGAACAG CTTCGGCATT GACATAGTAA ATGCGCCCCC 5040
2237 ACTCCACAGC TCATCCAATG GCCAAGTTGA ACGGTTCCAC AGCACATTGG CAGAAATCGC 5100
2238 CAGGTGCCTG AAGTTGGACA AAAAAACGAA TGACACAGTA GAACTAATCT TGAGGGCGAC 5160
2239 GATAGAATAT AACAAAACCG TGCACTCAGT TACTCGTGAG AGACCAATTG AGGTGGTTCA 5220
2240 CCCAGGGGCC CACGAGCGCT GCCTAGAAAT CAAGGCAAGA TTAGTAAAGG CTCAGCAAGA 5280
2241 CAGCATCGGA AGAAACAACC CTTCCCGACA AAACCGCGTG TTTGAGGTGG GAGAACGCGT 5340
2242 GTTTGTAAAA AACAACAAGA GGTTAGGAAA TAAGCTAACT CCACTATGCA CCGAGCAAAA 5400
2243 AGTGCAGGCA GACTTGGGAA CGTCTGTTCT TATTAAGGGG AGGGTGGTCC ACAAGGACAA 5460
2244 CCTCAAGTAG ACATTCCCTC TACAGTTAGG TAGTAAGTTA TGTCAAGGAA AATCCGAGCA 5520
2245 CTGTAGTATC ACCTTGTCTT TAATTTCCAG GTTCACCCTC ATGATGTTCA TACCCTTGGT 5580
2246 AGTAGCGAAT GCTCGGATCA CCGACTTTTC GCATGCCAAC TACATTCCTG TGTTAGATGG 5640
2247 GGATGTGCTG GTGTTTGAAC AGCGTGACCT CTTGAAACAT TCGAGTAACC TTTCCGAGTA 5700
2248 CGCTAGTATG ATAGATGAAA CACAGAAACT GTCCGAGTCC TTTCCCCACT CACATATGCG 5760
2249 TAAGTTGCTA GAGGTCGATA CTGACCATCT TAGAACCTTG TTGTCCGTTC TCAAAGTCCA 5820
2250 CCATAGGATA GCTAGGAGTC TAGATTTCTT AGGTACAGCC TTAAAGGTTG TGGCGGGTAC 5880
2251 TCCCGATGCC ACGGACCTCT TTAAAATTAA GATCACAGAG GCCCAACTAG TAGAATCTAA 5940
2252 TTCCAGGCAG ATAGCTATAA ACTCCGAAAC CCAGAAACAG ATAAATAAGT TAACTGACAC 6000
2253 CATCAATAAG GTGATCAATG CCCGTAAAGG CGACTTGGTT GACACTCCAC ACTTATATGA 6060
2254 AGCACTACTA GCAAGAAATA GGATGCTGTC TACAGAAATT CAAAATTTAA TTCTCACTAT 6120
2255 TACTTTGGTC AAATCAAACA TTATAAATCC CACAATTCTT GATCATGCCG ACTTGAAGCC 6180
2256 TCTTGTAGAA CAGGATACCC CAATTGTCAG CTTAATAGAA GCATCTAAGA TCAGGGTCCT 6240
2257 CCAGTCCGAG AATAGCATTC ATATTTTAAT TGCCTATCCT AGAGTCAAGT TCAGTTGCAA 6300
2258 GAAAGTCGCC GTCTACCCTG TATCTCACCA ACACACCATC TTGCGCCTCG ACGAAGACAC 6360
2259 TTTGGCCGAA TGCGAACATG ACACCTTTGC GGTCACCGGA TGCACAGACA CCACACACTT 6420
2260 CACGTTCTGC GAGCGGTCTC GGCGCGAAAC TTGCGTGCGC TCACTCCATG CTGGAAACGC 6480
2261 TGCTCAATGC CACACTCAAC CCAGCCACTT GCGAGAAATA AACCCCGTAG ATGATGGCGT 6540
2262 TGTGATTATC AACGAAGCCG CAGCTCACGT TAGCACTGAT GGCAGCCCCG AAACACTGAT 6600
2263 AGAGGGAACC TACCTGGTAA CCTTCGAGCG AACGGCAACC ATCAACGGCT CTGAATTCGT 6660
2264 AAATCTAAGG AAAACACTAA GCAAGCAGCC AGGCATCGTG CGTTCACCAC TACTTAACAT 6720
2265 CGTCGGCCAC GACCCTGTGC TCAGTATACC TCTGCTACAC CGGATGAGTA ACGAAAACCT 6780
2266 ACATTCCATC CAAAACCTTA TGGATGACGT GGAATCTGAA GGCTCGCCCA GACTCTGGTT 6840
2267 CGTGGCTGGT GTGGTCCTAA ACTTCGGCTT GATTGGCTCT CTCGCCCTTT ATCTGGCATT 6900
2268 AAGGAGAAGA CGAGCCTCTA GGGAGATACA GCGCACCATC GATACTTTCA ACATGACCGA 6960
2269 GGACGGTCAT AAACTTGAGG GGGGAGTAGT TAACAACTAA CAATGTATTG CTTCGTAGCA 7020
2270 ACTAAGTAGC TTTGTATGAA CAATGCTGAC GCGCCAGAAT TGGGTTCAAC GCTCCACGCG 7080
2271 AAGAATGCCT GGCAGCGGAA AGCTGACACT TCCTACCGGG AGTGTTGCTT CACGCTGCAA 7140
2272 GAAATGCTGA GTCGGCTTGC CGACTTGTGG CGGCGCGATG CATTGCTCGA GGGTAAACTT 7200
2273 AGTTTTCAAT ATTGTCTTCT ACTCAGTTCA AATCTTGTGT CGAAATAAAC CACAGCTTGC 7260
2274 TCCGGCTCAT TGCCGTTAAA CATCATTGTT CTTATTTACA ATCAAATCGC TATCGCCACA 7320
2275 AGGCTAGTGA TAATAACTAA GGGGGCGAAG TCAAGCCCTC CAACCTAATC TCCATAAACA 7380
2276 GTGTCTAAGA CGAACCTCAG CGAAAGAAGG AAGATCTCTA GACCTACTGG AAATAACATA 7440
2277 ACTCTGGACC TATTGGAACT TATATAATT 7469
2278 //
2279 ID DMHFL1 standard; DNA; INV; 2959 BP.
2280 XX
2281 AC M69216;
2282 XX
2283 DR FLYBASE; FBte0000154; Dmel\hobo.
2284 XX
2285 SY synonym: H-element
2286 XX
2287 XX
2288 FT source M69216:1..2959
2289 FT SO_feature terminal_inverted_repeat ; SO:0000481:1..12
2290 FT SO_feature terminal_inverted_repeat ; SO:0000481:2948..2959
2291 FT SO_feature TATA_box ; SO:0000174:107..112
2292 FT SO_feature polyA_signal_sequence ; SO:0000551:2382..2394
2293 FT SO_feature CDS ; SO:0000316:316..2292
2294 FT SO_feature start_codon ; SO:0000318:1..3
2295 FT /name="Dmel\hobo\T"
2296 FT /db_xref="FLYBASE:FBgn0014191"
2297 FT /translation="
2298 FT MAPYIMIVEFLCLWSSVSAVNCPFFVFYDAITSLLGFSIIWKPKEKVTIM
2299 FT AEAADFVKNKINNGTYSVANKHKGKSVIWSILCDILKEDETVLDGWLFCR
2300 FT QCQKVLKFLHKNTSNLSRHKCCLTLRRPTELKIVSENDKKVAIEKCTQWV
2301 FT VQDCRPFSAVTGAGFKNLVKFFLQIGAIYGEQVDVDDLLPDPTTLSRKAK
2302 FT SDAEEKRSLISSEIKKAVDSGRASATVDMWTDQYVQRNFLGITFHYEKEF
2303 FT KLCDMILGLKSMNFQKSTAENILMKIKGLFSEFNVENIDNVKFVTDRGAN
2304 FT IKKALEGNTRLNCSSHLLSNVLEKSFNEANELKKIVKSCKKIVKYCKKSN
2305 FT LQHTLETTLKSACPTRWNSNYKMMKSILDNWRSVDKILGEADIHVDFNKS
2306 FT SLKVVVDILGDFERIFKKLQTSSSPSICFVLPSISKILELCEPNILDLSA
2307 FT AALLKERILENIRKIWMANLSIWHKAAFFLYPPAAHLQEEDILEIKVFCI
2308 FT SQIQVPISYTLSLESTETPRTPETPETPESLESPNLFPKKNKTISSENEF
2309 FT FFPKLVTESNSNFNESPLDEIERYIRQRVPLSQNFEVIEWWKNNANLYPQ
2310 FT LSKLALKLLSIPASSAAAERVFSLAGNIITEKRNRLCPKSVDSLLFLHSY
2311 FT YKNLNNSQ"
2312 XX
2313 CC Derived from M69216 (g157606) (Rel. 41, Last updated, Version 3).
2314 CC Takis Benos and Michael Ashburner, 20-Aug-1997.
2315 CC Any changes to original sequence record are annotated in an FT line.
2316 CC CDS annotation from Lynn Crosby's annotation 'H-element.v004'.
2317 XX
2318 SQ Sequence 2959 BP; 994 A; 541 C; 571 G; 853 T; 0 other;
2319 CAGAGAACTG CAAGGGTGGC ACTTTTTTAC CACTCGACTC ACACCCTACA ATTTTGTGTG 60
2320 CGGGTGCTAC TCGCCACGCA CATCGCGGGT ACTTACAAAC ACACAGTATA AATCTGAACA 120
2321 TGCAGACAAG ACACCCCGTT GTGTGCGCAC CCGAATCAAT ACGGTGTTTT GCGTCGCGGG 180
2322 TGCCGCTCAC ACAGTGCCTA AAAAGGGATG AGTGAGAAAA ACACTTGTGG GTATACCGTT 240
2323 AAACACATGG GTGTTTCCAA AAATACTCGG GTGTTTCCAA AAATACTCGA GTGGTCTCGT 300
2324 AGGTAGTCGA GTCAAATGGC GCCATACATA ATGATTGTTG AGTTCTTGTG TCTTTGGTCC 360
2325 AGTGTCTCGG CTGTTAATTG CCCCTTTTTT GTTTTTTACG ATGCAATTAC TAGCTTGTTA 420
2326 GGATTCAGTA TTATTTGGAA GCCAAAGGAA AAGGTCACAA TAATGGCAGA AGCGGCTGAT 480
2327 TTCGTTAAAA ATAAAATTAA CAATGGAACA TACTCAGTTG CCAATAAACA TAAAGGAAAA 540
2328 AGTGTTATTT GGAGCATTTT ATGTGACATT TTAAAGGAAG ATGAAACTGT TCTGGACGGA 600
2329 TGGCTGTTCT GCAGGCAATG CCAGAAAGTG CTCAAATTTT TACACAAAAA CACCTCCAAT 660
2330 TTATCCCGCC ATAAATGTTG TCTAACATTA AGACGACCAA CGGAATTAAA AATTGTTTCG 720
2331 GAAAACGACA AGAAAGTAGC TATTGAAAAA TGCACCCAAT GGGTTGTCCA AGATTGTCGG 780
2332 CCGTTTTCTG CAGTAACCGG AGCCGGATTT AAAAATTTGG TGAAGTTTTT CCTACAAATC 840
2333 GGCGCTATCT ATGGGGAACA GGTAGACGTC GATGACTTAC TACCTGATCC AACAACATTA 900
2334 AGTCGGAAGG CCAAATCGGA TGCAGAAGAG AAGAGGAGTC TAATCTCGTC CGAGATAAAA 960
2335 AAAGCTGTGG ATAGCGGAAG AGCAAGTGCG ACCGTCGACA TGTGGACTGA CCAGTATGTC 1020
2336 CAAAGAAACT TTTTGGGCAT CACTTTCCAT TACGAAAAAG AATTTAAACT TTGTGACATG 1080
2337 ATTTTGGGAC TAAAATCGAT GAATTTTCAA AAATCGACTG CCGAAAACAT TTTAATGAAA 1140
2338 ATTAAAGGTT TATTTTCGGA ATTCAATGTT GAGAACATTG ATAATGTTAA GTTTGTGACT 1200
2339 GACAGGGGAG CAAATATAAA AAAGGCTTTA GAGGGCAATA CCCGTTTAAA TTGTAGCAGT 1260
2340 CACCTGTTGT CAAATGTTTT AGAAAAATCG TTTAACGAGG CCAATGAACT CAAAAAAATT 1320
2341 GTGAAATCAT GCAAAAAAAT CGTGAAGTAC TGCAAAAAAT CAAATTTGCA GCATACTCTA 1380
2342 GAAACCACTT TGAAAAGCGC CTGTCCGACT AGATGGAACT CCAACTACAA AATGATGAAG 1440
2343 TCCATTCTGG ATAACTGGCG TAGTGTGGAT AAAATATTAG GTGAAGCTGA TATCCATGTA 1500
2344 GATTTTAATA AATCATCTTT AAAAGTTGTG GTAGATATTC TAGGAGACTT TGAACGAATA 1560
2345 TTTAAGAAGT TGCAAACATC TAGCTCACCA TCTATATGCT TCGTATTGCC ATCCATCTCT 1620
2346 AAAATTTTAG AATTATGCGA GCCGAATATT TTAGACCTTT CTGCAGCAGC ATTGCTTAAG 1680
2347 GAAAGAATTT TGGAAAATAT TCGTAAGATT TGGATGGCAA ATCTAAGCAT ATGGCATAAG 1740
2348 GCGGCATTTT TTTTATATCC ACCCGCAGCA CATCTTCAGG AAGAAGATAT TCTTGAAATA 1800
2349 AAGGTGTTTT GCATTTCACA AATTCAAGTC CCAATTTCAT ACACATTAAG CTTAGAATCT 1860
2350 ACAGAAACTC CAAGAACTCC AGAAACTCCA GAAACTCCAG AAAGTCTAGA AAGTCCAAAC 1920
2351 TTATTTCCAA AAAAAAACAA AACAATATCT TCTGAAAACG AATTCTTCTT CCCAAAGTTA 1980
2352 GTAACTGAGT CTAATTCCAA CTTCAATGAA TCTCCATTAG ATGAAATTGA ACGATATATT 2040
2353 AGACAAAGAG TTCCATTGTC TCAAAATTTT GAAGTAATTG AGTGGTGGAA AAATAACGCA 2100
2354 AACTTATACC CTCAGTTGTC AAAGTTAGCA TTAAAACTTT TATCAATACC AGCCAGTAGC 2160
2355 GCAGCAGCTG AAAGAGTGTT TTCCCTAGCA GGTAATATAA TAACAGAAAA GCGAAATAGA 2220
2356 TTATGCCCAA AATCTGTAGA TAGCCTCCTT TTTTTGCATT CCTATTACAA AAACCTAAAC 2280
2357 AACTCGCAAT AGATATTCCT TCTTATAAGT ATATTTTATA TTATTAATTC TTATTATTTG 2340
2358 CTTAATTTTT GTATAAGTGT TAAGTATTAA GTATAAGTAT TAATTAATAA TATATAAGAT 2400
2359 TGTTATTTGT TAAGACATTA GATGCAAAAT CCTAAAAATG TGAAAGTAAT GAAGTTCCTT 2460
2360 ATATTTAATA GATACTTTTT AAGCCCACTA TGTTTTTATT ATTTAGATTG AGACATTAAA 2520
2361 AAACGTAAAA ATCAACAAAT GCCGTCTTTA ATTGCAATTA CTTTATGTGT TTGAAATGGG 2580
2362 AGGCACCCAT TGAGTCCATC AAAGAGCAAA GACATGAGCA CAAAAATTTT CTTGGGTATT 2640
2363 CCCTTTTACC CTTCATTTCT TATACCCGTC ACGCTTCCAC CCATACAAAT TTTAGGCGTA 2700
2364 CAAAAAATGA CCAGAGAACT GCAGCCCGCA TACAAAAAAT GACCTGCGGC CGATCGTTGA 2760
2365 CTGTGCGTCC ACTCACCCAT ACGGCTCTTG CGCAGCAGGC CTCGGGTGGT TTTTTTACTC 2820
2366 GTAACAAAAA CACAACGTCG GTAAAACACT CGAGTATTTT GTGTTGCCGC AAGTAGGGTG 2880
2367 TCAAAAAAAA CGGGGTGCCT AGAGTACCGA GTGTTTATCG GGTGGACGTA GAGTGCGAGT 2940
2368 GGCGGGCTGC AGTTCTCTG 2959
2369 //
2370 ID DMTHB1 standard; DNA; INV; 1653 BP.
2371 XX
2372 AC X01748;
2373 XX
2374 DR FLYBASE; FBte0000414; Dmel\HB.
2375 XX
2376 FT source X01748:189..1841
2377 FT SO_feature terminal_inverted_repeat ; SO:0000481:1..31
2378 FT SO_feature terminal_inverted_repeat ; SO:0000481:1622..1653
2379 FT SO_feature CDS ; SO:0000316:387..534
2380 FT /name="Dmel\HB\T"
2381 FT /db_xref="FLYBASE:FBgn0044055"
2382 FT /db_xref="SPTREMBL:Q27293"
2383 FT /db_xref="NCBI_PROTEIN:CAA25884.1"
2384 FT /translation="MLILKLRKEGKTYKDIQKTLKCSAKMVSNAIKYKWKPENRGTKHK
2385 FT TTDIEDRRIVSYSKVYRFASFRDIKSELNLGISDVTIRRRLLNQNFSARSPRKVPLPSP
2386 FT RHIKARLSLAKTYLNWPVSKWRNILWTDGSKIMLFGGTGSLQYI"
2387 XX
2388 CC Derived from X01748 (g8693) (Rel. 49, Last updated, Version 3).
2389 CC Takis Benos and Michael Ashburner, 20-Aug-1997.
2390 CC Any changes to original sequence record are annotated in an FT line.
2391 XX
2392 SQ Sequence 1653 BP; 568 A; 288 C; 302 G; 495 T; 0 other;
2393 ATGTACAGCT GTGTTCAGAA AAATAGCAGT GCGAAGGAAA CTAAGTAATA CAAAGGTATT 60
2394 TTTCCATGTC CCTTTTCGGA ATCGACTTTT TATTCCTCTT ATTTTTGTTA AATGGAATGT 120
2395 GTAGATAGGG AAAAAAAGAA AATCCGGTCA GTTTTTCTTG TTATCCTTTT TTTATTTACA 180
2396 TTCTTGAGCA AAATCACAAT TTTTAGGCTG TTCATAAGAA TAGCAGTGTC TGGTTCTGAC 240
2397 CAACGTAAAG TCCCGAAATG ATCAATATTT TCTAAAAAGT GAGTTTGGTT AAGTTAATTC 300
2398 GTATATTTAA AAGGACAATA AATTAAAAAA ATTAAAAAAA TTTTATTTTA GTGGGTAGAG 360
2399 GACAGCACTA CTCCCAGGGG AAAAGAATGT TAATTCTTAA GCTTAGAAAG GAAGGAAAAA 420
2400 CATATAAGGA CATTCAAAAA ACCCTTAAAT GTTCTGCCAA AATGGTATCC AATGCCATTA 480
2401 AATATAAATG GAAGCCCGAA AACCGTGGTA CCAAACATAA AACCACAGAT ATAGAGGATC 540
2402 GACGCATTGT TTCTTACAGC AAAGTCTATC GTTTTGCATC CTTTAGGGAC ATAAAGTCTG 600
2403 AGCTGAACTT GGGAATCAGC GACGTTACTA TTCGTAGACG ACTACTGAAT CAAAATTTCA 660
2404 GTGCGAGGAG TCCACGAAAG GTTCCCCTAC CTAGCCCAAG GCATATTAAG GCAAGGTTAA 720
2405 GCTTAGCTAA AACCTACCTA AACTGGCCAG TCTCCAAATG GCGTAATATC CTTTGGACTG 780
2406 ATGGGTCAAA AATCATGCTA TTTGGTGGAA CTGGTTCACT ACAGTATATC TGACGACCTC 840
2407 CAAACACGGA GTATCACCCA AAACACCCAG TGAAGACTTT CAATCACGGT GGACCTAAAA 900
2408 TCATGGTATG GGCTTGTTTT TTTTATAATG GTATGAGTCA TGCTATGGAT TATGATTTAT 960
2409 GGTATTATAG ACCAAAACGC ATATGTAAAT ATACTTAGTG ATGTCTTATT GTCATATTCT 1020
2410 GAATAAAATA TACCCTTAAA ATGGACATTC CAACAGGATA ATGATCAGAA ACGCAGATGT 1080
2411 AAATCGGCTA AGAATAGGTT CACCCAAAAT AGAATAGATG CAATGCCGTG GCAAGCACCA 1140
2412 CCTTCCCATT TAAACCCGAT TGAAAACCTG TATGGGGACA TTAAACAGTT TGTGTCGAAG 1200
2413 AAGTCCCCGA CGTCTAAGAC TCAGATTTGG CAAGTTGTGC AGGATACATG GGCAAAAATT 1260
2414 CCTCCCAAAC CTTGCTAGGA CTTGGTGGAC TTCATGCCGC GTGGGTGTAA GGCTGTGCTG 1320
2415 GCTAACAAAG GCTATCCAGC CAAGTATTAG GCCCGAATTA ACATATTAAA AAGAAAAACT 1380
2416 AAGTTCGTTC TAGGTCAAGT TAAATTTTGT TACTATTTTT TCATAGCACT GCTATTTTAT 1440
2417 TGAACACCAG AATTTCTGCC TATTTATTGT TTTAATCTAT ATTTTCGAAA CTATTGAAGA 1500
2418 AATAAAAGTG AAACATTTGT TAAATTGTTT GAAATGAAAT ACCTAATGAT ATTATTAAAA 1560
2419 AAAAATTCCC ATTAAAACTG TAAATCATAG GAATTTTTTA TCTTAAACTC TGAAGTCCAA 1620
2420 AGCACTGCTA TTATTCTGAA CACAGCTGTA CAT 1653
2421 //
2422 ID DM06920 standard; DNA; INV; 6083 BP.
2423 XX
2424 AC U06920;
2425 XX
2426 DR FLYBASE; FBte0000143; Dmel\HeT-A.
2427 XX
2428 FT source U06920:1015..7097
2429 FT SO_feature five_prime_UTR ; SO:0000204:1..731
2430 FT SO_feature three_prime_UTR ; SO:0000205:3497..6083
2431 FT SO_feature polyA_sequence ; SO:0000610:6077..6083
2432 FT SO_feature CDS ; SO:0000316:732..3497
2433 FT SO_feature start_codon ; SO:0000318:1..3
2434 FT /name="Dmel\HeT-A\gag"
2435 FT /db_xref="FLYBASE:FBgn0016662"
2436 FT /db_xref="REMTREMBL:AAC17188"
2437 FT /db_xref="NCBI_PROTEIN:AAC17188.3"
2438 FT /translation="MSMSDNLFSDDEVLSISSSPEQRSSPFYLNISPMSHGSDNSQINT
2439 FT VIINSKKLPSNQADISLKNSSGAAIKIVNSLSHKKKENTNVNNAQKDPLSLTNTTASTC
2440 FT GAKSSISEGKLSSPPSTSHTYEGKLLTKLTHTHTDFRGAKTSDAMGSFPSLSHSDNSIE
2441 FT KNLSSSTKIGPNASSPPSHAHTHTSKSTDISLESRSKHPALANTDARSIKANANDNGEI
2442 FT FSSLIQIDERKQEERPCTTINAFWSIFKPKPDVTKLSLKRKPTNPTKNTGKKCISPHKK
2443 FT SAYLCPSAQDDLNLNLNPKSSAKPTVVNLPAARILSRPAAKRDLFKSSSSRSPDEQPMS
2444 FT FSEVVAGTGSIFAAPCVPAPLTKTPGKRTNDDLDCSNFKTPNKKLCATSNFVTPSIFPP
2445 FT LITPVFKSKAAQSVYEESKARNGPPPPALACSINASARSAAAPPGIAPLPPHNTDAELP
2446 FT PWKIVPQSRRAPPILVNDVKEIVPLLEKLNYTAGVSSYTTRAIEGNGVRIQAKDMTAYN
2447 FT KIKEVLVANGLPLFTNQPKSERGFRVIIRHLHHSTPCSWIVEELLKLGFQARFVRNMTN
2448 FT PATGGPMRMFEVEIVMAKDGSHDKILSLKQIGGQRVDIERKNRTREPVQCYRCQGFRHA
2449 FT KNSCMRPPRCMKCAGEHLSSCCTKPRTTPATCVNCSGQHISAYKGCPAYKAEKQKLAAN
2450 FT NVDINKIRTIKDATNNFYKRQGPPLRNNTPRLPHSSAILSKSIAEARQEAARKSMLNPF
2451 FT RQNINDRRPRFSSHDTAIQKRLNKWRRNTNKIPKKGRIALKDNAKPRPAHRTSNPAQRH
2452 FT LEDYQDMLRRERSEENDQESEKGTPNTKQVGNDSPPTTSRAARASFKPRIIDDTTPSPK
2453 FT ICNPNSQKGLLDDPTTSLANRVDNLEKKIDILMALIIQGRNNNLDMDTSN"
2454 XX
2455 CC Derived from U06920.2 (Rel. 67, Last updated, Version 14).
2456 CC Michael Ashburner, 26-Jan-2002.
2457 CC Any changes to original sequence record are annotated in an FT line.
2458 XX
2459 SQ Sequence 6083 BP; 2199 A; 1545 C; 1033 G; 1306 T; 0 other;
2460 TAAATAAATA AAATAAATTA AACAATTAAC TAAATAATTA AATAACTAAA ATTAATAATA 60
2461 TAATCCGTTC GCTTGCCAAA GACTCTCACG CGCATAACTA ATTAAAATCG ATTTTCAAGT 120
2462 TGACAAATAA ATGGTTTAAA ATTGTCCTCA GGCTGCAAAG AAAAGCCGCG GCAACAATAA 180
2463 ACATTTAGTG ACACGCGAAA AGCGAACATT TGATTAGTGT AATACTTGTG CAAACCGACA 240
2464 AGCTGCCGCC ATAACAAAAC GGAGACGAAG AATCATAAAG AACAAAAGCT AAATCCACCA 300
2465 GCATAGCAAA AATAAATTAA CAAATAAAAT AAAAGCAAAT TTAAATAACA TAATAAATTA 360
2466 AACTTATTTA ATAAACCAAT TAATTTTAAT TAATTCAATT AAACGCTAAA TCTACATAAT 420
2467 ACTCCACGCG CAAATTAATT GAAATCGTCT TTCTAGTTAA TAAATTAAAA GTTTAAAAAT 480
2468 TGTCTCCGGC CGCAAAATTT GAACCGCGAC GATAAAAACA TTTAATTGAC AAACAAAAAG 540
2469 CGAACAATTA TTCAGTGAAC TATTTGTGCA AAATTGACAA GCAGACGCCA TAATTAAAAG 600
2470 GAGAAGAAGC CAAAAGACGA AGAGAAGAAA GCAACCAGAA GAACTCAAAG AAGAAAAGGA 660
2471 GGAAAGCCCA ATTAAAGAAA GCCAGGGTAT TTATACCTTA CACTTATCGT TTAATATAAC 720
2472 AAAAACCCAA CATGTCCATG TCCGACAACC TTTTTTCTGA CGATGAGGTA CTTTCAATTT 780
2473 CCTCAAGCCC AGAACAGCGA TCTTCTCCGT TCTACCTCAA TATATCGCCC ATGTCCCACG 840
2474 GATCAGACAA TTCTCAGATT AATACAGTCA TCATTAATTC GAAGAAATTG CCCTCAAATC 900
2475 AAGCAGACAT AAGTTTAAAA AACTCTTCTG GGGCTGCTAT AAAAATTGTT AATTCCCTTT 960
2476 CACACAAGAA GAAAGAGAAC ACAAACGTTA ATAATGCCCA AAAAGACCCC CTCTCACTCA 1020
2477 CCAATACTAC TGCAAGCACT TGTGGCGCCA AAAGCAGCAT CTCAGAGGGG AAATTGTCTT 1080
2478 CTCCTCCGTC CACCTCACAC ACATATGAGG GGAAATTACT CACAAAACTT ACTCACACAC 1140
2479 ACACAGACTT TAGAGGCGCC AAAACGAGCG ATGCAATGGG AAGTTTCCCC TCTCTCTCGC 1200
2480 ACAGCGACAA TAGCATAGAG AAAAATCTGA GTTCTTCCAC CAAAATTGGA CCAAACGCTT 1260
2481 CTTCCCCTCC TTCTCATGCA CACACTCACA CTAGCAAATC CACTGATATA AGCTTAGAAA 1320
2482 GCCGCTCAAA ACATCCCGCG CTTGCCAATA CGGACGCACG CTCTATAAAA GCCAATGCTA 1380
2483 ATGACAATGG GGAAATTTTC TCCTCACTTA TACAAATTGA CGAACGCAAG CAAGAGGAAA 1440
2484 GGCCTTGCAC AACTATCAAC GCTTTTTGGT CTATTTTTAA ACCCAAGCCG GACGTTACTA 1500
2485 AACTAAGTCT AAAGAGGAAA CCCACCAATC CCACTAAAAA CACTGGGAAA AAATGCATCT 1560
2486 CCCCTCATAA AAAGAGCGCT TATTTATGCC CTTCCGCTCA GGATGATTTA AATTTAAATT 1620
2487 TAAACCCCAA ATCTAGCGCC AAGCCCACTG TGGTGAATTT ACCAGCTGCC CGCATCCTAA 1680
2488 GCCGGCCTGC AGCCAAGCGG GATTTATTTA AATCATCATC CTCCCGAAGC CCAGACGAGC 1740
2489 AGCCTATGAG TTTTTCGGAA GTGGTCGCTG GCACGGGTTC AATTTTTGCG GCACCCTGTG 1800
2490 TCCCGGCACC TTTAACGAAA ACTCCAGGCA AGCGGACAAA CGACGATCTG GACTGCTCCA 1860
2491 ACTTTAAGAC GCCCAATAAA AAATTATGCG CGACTTCCAA CTTTGTAACT CCCAGCATTT 1920
2492 TTCCGCCGCT CATCACTCCC GTTTTCAAGA GCAAGGCAGC TCAATCTGTT TACGAGGAAT 1980
2493 CCAAAGCCAG AAATGGACCC CCCCCGCCGG CCCTCGCCTG CAGCATCAAT GCCTCTGCTC 2040
2494 GCAGCGCAGC GGCGCCACCC GGGATCGCCC CCCTACCCCC TCATAATACA GATGCAGAGC 2100
2495 TGCCTCCATG GAAAATCGTG CCCCAGAGCC GTAGAGCACC TCCTATACTC GTCAATGATG 2160
2496 TAAAGGAAAT TGTACCTCTA CTGGAAAAGC TGAACTACAC AGCAGGAGTC TCCAGCTATA 2220
2497 CTACTAGGGC TATAGAAGGA AACGGGGTCA GGATACAGGC AAAGGACATG ACCGCCTATA 2280
2498 ACAAAATTAA AGAAGTCCTG GTGGCCAACG GACTTCCTTT ATTCACCAAC CAGCCCAAGT 2340
2499 CCGAGAGAGG CTTCCGAGTC ATCATCAGAC ATCTCCACCA CTCCACACCA TGCTCGTGGA 2400
2500 TAGTCGAGGA ACTGCTGAAG CTCGGATTCC AAGCGCGATT CGTCAGAAAT ATGACGAATC 2460
2501 CGGCTACAGG TGGCCCCATG CGAATGTTTG AAGTGGAGAT CGTCATGGCC AAAGACGGCA 2520
2502 GTCATGACAA AATACTCTCA CTCAAACAAA TCGGTGGGCA AAGGGTGGAC ATTGAAAGGA 2580
2503 AAAACAGGAC ACGGGAGCCA GTCCAGTGCT ACAGATGCCA AGGCTTCAGG CATGCCAAAA 2640
2504 ACTCTTGCAT GAGGCCGCCA AGATGCATGA AATGCGCTGG CGAACACCTG TCTTCCTGTT 2700
2505 GCACCAAACC AAGAACCACC CCCGCCACCT GCGTAAATTG CTCTGGGCAG CATATTAGCG 2760
2506 CGTACAAAGG ATGCCCTGCA TATAAGGCGG AAAAACAAAA GCTGGCGGCA AACAACGTTG 2820
2507 ACATAAACAA AATAAGAACA ATCAAAGACG CAACAAATAA CTTTTATAAA CGTCAAGGCC 2880
2508 CCCCTCTACG CAACAACACC CCTCGGCTAC CGCACAGCTC AGCAATCCTG AGCAAATCAA 2940
2509 TTGCCGAAGC TCGCCAGGAG GCAGCCAGAA AGTCGATGTT AAATCCATTC CGACAAAATA 3000
2510 TAAACGACAG AAGACCACGA TTCTCCTCCC ACGACACGGC CATTCAGAAG CGTCTGAATA 3060
2511 AATGGCGCCG AAACACCAAC AAAATACCCA AAAAGGGTAG GATAGCCTTA AAGGATAATG 3120
2512 CAAAGCCACG ACCGGCACAT AGGACAAGTA ACCCAGCGCA AAGACATCTG GAGGACTACC 3180
2513 AGGACATGCT CCGAAGGGAA AGGAGTGAAG AAAACGACCA GGAATCTGAG AAGGGCACCC 3240
2514 CCAATACCAA GCAGGTCGGC AATGACAGCC CTCCGACCAC GAGCAGAGCA GCCAGAGCCA 3300
2515 GCTTTAAGCC AAGAATCATT GACGATACCA CGCCATCGCC AAAAATCTGC AATCCCAACT 3360
2516 CACAAAAAGG CCTCTTGGAC GACCCCACAA CAAGCTTAGC TAATAGAGTC GACAATTTAG 3420
2517 AAAAGAAAAT TGACATTTTA ATGGCCTTAA TCATACAAGG AAGAAATAAC AATCTTGACA 3480
2518 TGGATACATC CAATTAATCT TACAACTACT TATATATTCT TTAATAAATA TATCCAATAG 3540
2519 AAAAGCGCAC GTCGGTCTGC TTTTAAAATC CTTCACCGTC ATCACCTTCC TCGACGGAGC 3600
2520 CTAATTTATT GGAAAAATAA ATCAATTATA TGTTGGCACA AAAATGTAAA CACACACTCA 3660
2521 CCTAAACGCA CCCGGACGAA CAAGCCTATG ACAACGCACT CCAGCTGATC TGTAAGAAAC 3720
2522 AAAAAATATG AATAGATAGA TCGATATGAA AAGGATATGT GCGGCAGAAA CATGATGAGC 3780
2523 AAAAGGCGAC TCGCTGCAGC AACTTATGCA CAACGTCACT TACCTGAAAT TTCTTGCCGT 3840
2524 ACGATCTCCT GTAGTATCCC TTATCACAGC TGCAATCTAC TTGCAATGCT GCACTGCAAT 3900
2525 AAACGTACTA CAAAAGCTGC ATACGTTTTG ATCAGGACAC CTCGTGCGGA CGTGCTAAAA 3960
2526 AAAATTTCCT TTCTGCTGCT CTTATTGACG CTAAAACCTT AAAACCTACA AACAAAACAA 4020
2527 TTAAATAATA ACAAATCAAA TAAGACAACC AAATAATACA CTTACCTCAT TGACTGCAGC 4080
2528 TAAATCGCTG ACCCACATTC AGTGCAGCCG ACAGCAGGAG ACGGGCCCGC AAAAGCAAAA 4140
2529 CAAAATCGCC AATTTTGCGA TTATAAACAC GAAAAATTGA CAATTTTGCG ATGCCGTCTC 4200
2530 CGCCTCCTGA TGCCACTGCA TTGACAAGCA TCACTAGCGA GGAGCTGACA CCACACCAAA 4260
2531 AAGCTGTAAA ATCCGTCCAC AAATTGTATA TTTTGCCTCA GTGTCGTATC TGCAATGTTT 4320
2532 TTCCGATAAC CTGTAAGGAA AGAAAAATTA ATAAGAAAAT TATACAAAAT TAATTAAGGA 4380
2533 CGACAGAAAA TAGCAAACCA GACAGGCAAA TTAACAGATA CAAATATGAG ACTCCATCCT 4440
2534 GCTGCCGACA CACAAGTAAA TCCTTCAACT CGACAACAGG AGACGGGCCT TGCAAAAGCA 4500
2535 AAACAAAATC GCCAACTTTT GCGATTATAA ATACAAAAAA TTGACAATTT TGCAACGCCG 4560
2536 TCTCCACCTC CTGTTGCCAC TGCATTAATA AGGATCACCA GCGCGGCGTG ACGCCACACT 4620
2537 AAAAGGCTGC AAAATCCGTC CACAAAATGT ATACTTTTCC TCAGTACAAT ACTTTCTAAT 4680
2538 GAACTTCCGC CAACCTGCAA TGAAAAGAAA AGAAATAGGT ATATAAAACA AAACAAACAA 4740
2539 AAGGACAACC TAAAATTAGC AAACCAGACA GGCATACTAG TAGATGCTAA TATGCAGCTC 4800
2540 CATCCTACTG ACGACAACCA CGCAACTCCT TTCTCCAAGA CCGCAAATAC TGAAACAAGG 4860
2541 AAGCACAAGC TAATACTGGG AATTATTTAT TTAAACAAAA ATACTTATCT AATTGCCAAT 4920
2542 TCGACGACTC CAAATCCGCG GCTAACCGGC GGCGATGGCC CATAAATAAA GGGCCTCCTA 4980
2543 ATTAATTACA AAATGTACCT GAAAAACATA AAATTAACGC AACTATAATT AACGCAATTA 5040
2544 ATAAATCAAA TAAATACAAG TATAATACTT ACCTCCAAGC AAACGTACCT GAAAAACAAA 5100
2545 ACCAAAAAAA AAATTAATGC AATAAATAAA TCAAATAAAT ACAAACATAA TACTTACCTC 5160
2546 CAATTTACCT CCCAGCCAAT CTACCTGAAA AACATAATCT AATACAATCT CAAAAACAAA 5220
2547 TAACAAATGT AATACTTACC AAATTTTAAT TTTGTATTCA TTTCCATGAC CCCAACGCTG 5280
2548 CAACTGTCCT CGGCAACAAT TCCTGTTCCG GCGGCTCCAT GCTGCCAATC CTGACGCACT 5340
2549 GGCCACAAGA CGCGGCGCTG CTGGCAATCT CTCGATGAAC AACCGATCTA CAATTTCCAT 5400
2550 GACGACTCCT CTGTCACGAT GAGACAGAAG ACACCACCAA CGCCAGCAGC TCCAAAACAA 5460
2551 TACAACAACG GCCGCGCGGA ACCCATCTTC AGAATTCCCT CTTCCTGACG ACCGGCGAAC 5520
2552 GAGTTCTGGA ATAAACAATG TATTAATTGC AAACATCTAC CGATGAGGGT AGAAGAGATA 5580
2553 CTCACCAAAC GACTGCGGCG CGGGAACAAA CTAACTGCAA CGCCGGCCGG ACCTATTTGT 5640
2554 TGCAAGTGGC GCGCATCCAG CGCCTGCAAC ATGCCCCAGC CCAAGTACAC AACTACTTAC 5700
2555 CTGCAACGTC GCCAGAGGCT CCCAGCGAAT CGGTGCTTCC GTCCTTCTGG CGGGGGTACC 5760
2556 TGAAAAGAAA CAAATTAAAC AATATTAATC CTAAATTTCA ATGTTTTTTG TAAAATAATT 5820
2557 TAAATTGTTA AATGTAAACA AGCCTTGCAA TATGTTAATG TTACCAGTCC ATGCTACTGT 5880
2558 CTAAAAGCCA AGAATACAAA AAATACTAAT TATAAACTAA CTCACCACGC CCAACCCCCA 5940
2559 AACTCACCCC ATGCAATGTT AAACCTATAA ATTCAAATAA TTGTACCTAT ATATTGCACA 6000
2560 TACTGTAATC AAAGGCAAAA TAAATCGTGG ATGCGGAACA GAATTTACTC TGTCTCCGTA 6060
2561 CCTCCACCAG CAAAGTTAAA AAA 6083
2562 //
2563 ID DMIFACA standard; DNA; INV; 5371 BP.
2564 XX
2565 AC M14954;
2566 XX
2567 DR FLYBASE; FBte0000133; Dmel\I-element.
2568 XX
2569 FT source M14954:100..5470
2570 FT SO_feature CDS ; SO:0000316:187..1467
2571 FT SO_feature start_codon ; SO:0000318:1..3
2572 FT /name="Dmel\I-element\gag"
2573 FT /db_xref="FLYBASE:FBgn0020417"
2574 FT /db_xref="SPTREMBL:Q24362"
2575 FT /db_xref="NCBI_PROTEIN:AAA70221.1"
2576 FT /translation="MTDPPNIYKITSKTYQSQLGEPKFIIIKRNDNNSFERTSPFIIKK
2577 FT SVDFACGGEVEGCKRTRDGNLLIKTKNELQARKLLKLTKIADEDVTASEHKTLNFSKGV
2578 FT IYCNDLRHIDEDTILQELKPQKVSEVKKIMKRQNPNSNSDTNNITLVETGLIIITFESH
2579 FT KLPEIVRIGYETVRVRDYIPLPLRCKKCLRFGHPTPICKSVETCINCSETKHTNDGEKC
2580 FT TNEKNCLNCRNNPELDHQHSPIDRKCPTFIKNQELTAIKTTQKVDHKTAQHIYFERHGF
2581 FT QTKNTYAKTLTNGTTQRTTNTPSPNIHTNTTQSQQQNPHHTPKSAAQNTSAKTPTTEPA
2582 FT KTTLLSNQPHQHHHHHSYDKLEDMDTDYTPTRKPSTTYSSQLTEDLKIKIFPKDKSNNL
2583 FT SINLKASKLKAKAHKNKHTNNSDSESI"
2584 FT SO_feature CDS ; SO:0000316:1938..5195
2585 FT SO_feature start_codon ; SO:0000318:1..3
2586 FT /name="Dmel\I-element\RTase"
2587 FT /db_xref="FLYBASE:FBgn0020418"
2588 FT /db_xref="SPTREMBL:Q24363"
2589 FT /db_xref="NCBI_PROTEIN:AAA70222.1"
2590 FT /translation="MAPSWGSPTTNKRGKITHRFIDNMHLILLNDKSPTHFSTHNTYTH
2591 FT IDLTLCSPILAPHAKWKILNDLHGSDHFPIITTLFPTTNPQKFYRPFFKLKEANWEQFN
2592 FT ALTHQTNKKYPTSHNVNKEAALINRIILYSANLSIPQTSPNTHPYRVPWWNKHLDQLRK
2593 FT EKQLAWKKLNRTITVDNILDYRRKNAIFRYELKKRKKEASSSFTSTIHPTTPSSKIWAN
2594 FT IRRFCGLNPAKQIHAITNPVNNETTLASNEIANIFAQHFSDLSGDWNFSEEFRNNKYRN
2595 FT NIHLYTPSPIAQTIEENITYLELSSALQTLKGCAPGLNRISYQMIKNSSHTTKNRITKL
2596 FT FNEIFNSHIPQAYKTSLIIPILKPNTDKTKTSSYRPISLNCCIAKILDKIIAKRLWWLV
2597 FT TYNNLINDKQFGFKKGKSTSDCLLYVDYLITKSKMHTSLVTLDFSRAFDRVGVHSIIQQ
2598 FT LQEWKTGPKIIKYIKNFMSNRKITVRVGPHTSSPLPLFNGIPQGSPISVILFLIAFNKL
2599 FT SNIISLHKEIKFNAYADDFFLIINFNKNTNTNFNLDNLFDDIENWCSYSGASLSLSKCQ
2600 FT HLHICRKRHCTCKISCNNFQIPSVTSLKILGITLNNKYKWNTHINLLLPKLHNKLNIIK
2601 FT CLSSLKFNCNTHTLLNVAKATIIAKLEYGLFLYGHAPKSILNKIKTPFNSAIRLALGAY
2602 FT RSTPINNLLYESNTPPLEMKRDLQIAKLSQNLILSKNTPIHKFLKPKKANKKKTSTIDR
2603 FT TIKLSLELNLPYKPIKLHKNKPPWTLPNLIDTSLRIHKKEQTSPDQYRKLYEHTKNNLK
2604 FT THNFIFTDGSKINYTISFAITTETDVLKYGILPPYSSVLTSETIAILEAIELTKNRRGK
2605 FT FIICSDSLSAVDSIQNTNNNSFYPSRIRSLITQHAPKIKIMWIPGHSGIKGNELADQAA
2606 FT KSASSMPLILTPNINTTDIKKHLKADLATKQKEHIINCSPWYQSINTNTSHPCDYLKQS
2607 FT HPNWTRLDQIKIIRLRLGHTNITHQHYLNPNSIPTCPFCQGDISLNHIFNSCPSLLQTK
2608 FT QDIFNNTNPLDLLSKPNPDNIQKLILFLKKTKLYHKI"
2609 XX
2610 CC Derived from M14954 (g157749) (Rel. 44, Last updated, Version 2).
2611 CC Takis Benos and Michael Ashburner, 20-Aug-1997.
2612 CC Any changes to original sequence record are annotated in an FT line.
2613 XX
2614 SQ Sequence 5371 BP; 2176 A; 1446 C; 606 G; 1143 T; 0 other;
2615 CATTACCACT TCAACCTCCG AAGAGATAAG TCGTGCCTCT CAGTCTAAAG CCTCGCTTCG 60
2616 CGTAAGCCCA AAACTCTTAT CAGCAAAATC TTGATAAACA AATATCAACC ACAAAGAGAA 120
2617 AATAAAAAAC TTAACAACAA AAACAACAAT ACCGCTAATC CGGGCTCAAG CCCTTAACCA 180
2618 ACAATCATGA CAGACCCACC AAACATTTAC AAAATCACTT CAAAAACATA CCAATCCCAA 240
2619 TTAGGCGAAC CTAAATTTAT AATTATTAAA AGAAATGACA ACAACTCTTT CGAAAGAACT 300
2620 TCACCATTCA TCATAAAAAA ATCGGTGGAC TTTGCCTGTG GAGGAGAAGT TGAGGGATGC 360
2621 AAACGTACAA GAGACGGCAA CCTGCTAATA AAAACCAAAA ATGAATTACA AGCCAGAAAA 420
2622 CTCCTAAAAC TAACAAAAAT TGCAGATGAG GATGTAACAG CAAGTGAACA TAAAACATTA 480
2623 AACTTCTCTA AGGGAGTTAT TTACTGTAAC GACCTTAGAC ACATCGACGA AGACACAATT 540
2624 CTACAAGAAC TAAAACCACA AAAAGTATCT GAAGTTAAAA AAATAATGAA ACGGCAAAAC 600
2625 CCCAACTCTA ACTCCGACAC CAACAACATC ACATTAGTTG AAACTGGACT CATAATTATA 660
2626 ACCTTTGAAT CGCATAAGCT CCCCGAGATA GTACGAATCG GGTACGAAAC AGTCCGAGTA 720
2627 CGAGACTATA TCCCACTCCC ACTTCGATGC AAAAAATGCC TCCGCTTCGG TCATCCAACA 780
2628 CCCATATGCA AAAGTGTAGA AACTTGCATC AATTGCTCTG AAACAAAACA CACAAACGAC 840
2629 GGAGAAAAAT GCACAAACGA AAAAAACTGC TTAAATTGCC GAAATAACCC AGAACTTGAC 900
2630 CATCAACACA GCCCAATTGA CCGCAAATGC CCTACGTTCA TAAAAAACCA GGAATTAACA 960
2631 GCAATTAAAA CCACACAAAA AGTTGACCAT AAAACGGCCC AACACATATA TTTCGAACGT 1020
2632 CACGGCTTCC AAACGAAAAA CACCTACGCC AAAACACTTA CAAACGGCAC AACCCAGAGG 1080
2633 ACAACAAACA CTCCATCACC TAATATTCAC ACAAACACAA CCCAATCACA ACAACAAAAT 1140
2634 CCGCACCACA CACCCAAATC AGCAGCACAA AACACTTCAG CTAAGACACC AACAACTGAA 1200
2635 CCAGCCAAAA CAACCTTACT ATCCAACCAA CCACACCAAC ACCACCACCA CCACAGCTAC 1260
2636 GACAAACTAG AAGACATGGA TACCGACTAC ACACCTACCA GAAAACCATC TACGACATAC 1320
2637 TCATCACAAC TCACAGAAGA CCTAAAAATA AAAATCTTCC CTAAAGATAA GTCCAATAAC 1380
2638 CTATCCATAA ACCTTAAAGC ATCAAAACTA AAGGCCAAAG CCCACAAAAA CAAGCACACT 1440
2639 AACAACAGCG ACAGCGAATC CATATAGAAC TCTACACAAA ACCCTAACCG TTAACACTAC 1500
2640 CTTTAAGTAA GTTATAAGCT TTAATTTTCT CACAAATGTC CCTAACTATA ATCCAATGGA 1560
2641 ATCTAAAAGG ATATCTAAAC AACTACAGCC ATCTCCTTAT TCTAATCAAA AAATACTCCC 1620
2642 CCCACATAAT TTCCCTCCAA GAAACCCATA TACAATACAC TAATAACATT CCAACCCCAA 1680
2643 TAAACTACAA ACTATTAACA AATATTGCCA CCAACAGATT TGGGGGGCGT ACGACTACTA 1740
2644 GTGCATAAGT CAATACAACA CACTGTCCTC AACATAACAA TCGATATAGA AGCAATAGCC 1800
2645 ATAAATATAG AATCTAAACT TAAATTAAAC ATATTTTCCA CATACATTTC TCCGACCAAA 1860
2646 AACATAACTA ACCAGACACT CCATAACACA TTTAACATAC AACAAACACC CTCTCTAATT 1920
2647 ACGGGAGATT TTAATGGATG GCACCATCCT GGGGCTCCCC AACAACAAAT AAACGAGGAA 1980
2648 AAATAACTCA TAGATTCATT GACAACATGC ACCTTATCCT GTTAAACGAC AAATCTCCCA 2040
2649 CACACTTTTC AACACACAAT ACATACACAC ACATAGACCT CACACTCTGC TCTCCAATCC 2100
2650 TAGCCCCCCA CGCCAAGTGG AAAATACTAA ACGATCTTCA CGGTAGCGAC CATTTCCCTA 2160
2651 TTATCACAAC ACTATTCCCA ACAACCAATC CACAAAAATT CTACAGACCC TTTTTTAAAC 2220
2652 TCAAAGAAGC CAACTGGGAA CAGTTCAACG CTCTTACCCA CCAAACCAAC AAGAAATACC 2280
2653 CCACCTCCCA CAACGTAAAC AAAGAAGCCG CTCTAATCAA TAGAATCATC CTTTATAGCG 2340
2654 CAAACCTCTC CATCCCACAA ACCTCACCTA ACACACATCC ATACAGGGTT CCATGGTGGA 2400
2655 ATAAACACCT CGACCAATTA CGTAAAGAAA AACAACTTGC CTGGAAAAAA TTAAACCGCA 2460
2656 CAATTACTGT TGACAACATT CTAGACTATA GACGCAAAAA CGCAATATTT AGATACGAAC 2520
2657 TAAAAAAGAG GAAAAAAGAA GCTTCCAGCT CTTTCACCTC AACCATCCAT CCCACTACTC 2580
2658 CCTCATCCAA AATATGGGCC AATATAAGAC GCTTCTGCGG ACTTAACCCA GCAAAACAAA 2640
2659 TTCATGCCAT CACAAACCCA GTAAATAACG AGACTACATT GGCTAGCAAC GAAATTGCTA 2700
2660 ACATATTCGC ACAACATTTC TCTGACCTCT CCGGCGACTG GAACTTCTCA GAGGAGTTCC 2760
2661 GGAACAATAA ATATAGAAAT AACATACATC TCTACACCCC CTCTCCAATA GCCCAAACCA 2820
2662 TAGAAGAGAA CATAACGTAT CTAGAACTTA GCTCAGCACT ACAAACATTA AAAGGATGTG 2880
2663 CTCCAGGACT AAATAGAATC TCGTATCAAA TGATCAAAAA TAGCTCCCAC ACAACAAAAA 2940
2664 ACCGAATAAC GAAACTATTT AATGAAATAT TCAATAGCCA CATACCTCAA GCCTACAAAA 3000
2665 CAAGCCTAAT CATCCCAATC CTTAAGCCAA ACACCGACAA AACGAAAACT TCCTCATACC 3060
2666 GACCCATCTC CCTCAACTGC TGTATAGCAA AGATACTTGA TAAAATAATT GCGAAAAGAC 3120
2667 TCTGGTGGCT AGTGACATAT AACAACCTAA TTAACGACAA ACAATTCGGG TTCAAAAAAG 3180
2668 GCAAATCGAC TTCGGACTGT CTACTCTATG TAGACTATCT CATAACGAAG TCAAAAATGC 3240
2669 ACACCTCCCT CGTCACTCTT GATTTTTCAA GAGCCTTCGA TCGAGTAGGT GTGCACTCCA 3300
2670 TAATCCAGCA ATTGCAGGAA TGGAAAACGG GTCCCAAAAT AATAAAATAC ATTAAAAACT 3360
2671 TCATGAGCAA CAGAAAAATA ACTGTCCGCG TCGGTCCGCA TACATCAAGC CCGTTACCCC 3420
2672 TATTCAACGG AATCCCCCAA GGTTCACCCA TATCCGTAAT ACTTTTCCTC ATAGCATTCA 3480
2673 ACAAATTATC CAACATCATA TCCCTACATA AAGAAATTAA ATTCAACGCA TATGCCGACG 3540
2674 ACTTCTTCCT TATAATAAAT TTCAACAAAA ACACAAATAC AAATTTCAAC TTAGACAATC 3600
2675 TATTCGACGA TATAGAAAAT TGGTGCTCCT ACTCAGGGGC ATCGCTTTCC CTATCCAAAT 3660
2676 GTCAACACCT CCACATATGC AGAAAACGTC ACTGCACATG CAAGATAAGC TGCAACAACT 3720
2677 TCCAAATTCC TAGCGTTACG TCCTTAAAAA TTCTAGGAAT AACCTTAAAC AACAAATACA 3780
2678 AATGGAACAC ACACATAAAC CTACTTCTAC CCAAACTACA CAACAAGCTA AATATAATAA 3840
2679 AATGCCTATC TAGTCTTAAA TTTAACTGCA ACACGCATAC ACTACTTAAT GTCGCAAAAG 3900
2680 CAACAATTAT AGCCAAACTA GAGTATGGTT TGTTTCTGTA CGGCCATGCT CCCAAAAGCA 3960
2681 TTTTAAACAA AATAAAAACA CCGTTTAACT CCGCTATCCG TCTAGCTCTC GGCGCATATC 4020
2682 GCTCTACCCC AATAAATAAC TTACTTTACG AATCGAATAC TCCCCCCTTA GAAATGAAAC 4080
2683 GAGACCTTCA AATAGCCAAA CTATCCCAAA ACCTAATCCT CTCCAAAAAC ACACCAATAC 4140
2684 ATAAGTTCTT AAAGCCTAAA AAAGCTAATA AGAAAAAAAC ATCAACAATA GACCGAACAA 4200
2685 TCAAACTTAG CCTAGAACTT AATCTACCCT ACAAACCAAT AAAACTCCAT AAAAACAAAC 4260
2686 CACCATGGAC CCTCCCCAAT CTAATAGACA CGTCACTTAG AATCCATAAG AAAGAACAAA 4320
2687 CATCTCCAGA CCAATACAGA AAATTATACG AACACACAAA GAATAACCTC AAAACACACA 4380
2688 ATTTCATATT CACTGACGGT TCAAAAATTA ATTACACAAT ATCATTCGCC ATTACAACGG 4440
2689 AGACAGACGT CTTGAAATAC GGCATACTGC CCCCATATTC ATCCGTCCTC ACCTCCGAAA 4500
2690 CAATCGCCAT CCTAGAAGCA ATAGAACTTA CTAAAAACCG AAGAGGCAAA TTTATTATCT 4560
2691 GCTCCGACTC CCTATCAGCA GTAGATTCAA TTCAAAACAC AAATAATAAC AGCTTTTACC 4620
2692 CAAGCAGAAT ACGATCGCTA ATAACGCAAC ACGCACCTAA AATTAAAATA ATGTGGATTC 4680
2693 CTGGCCATTC AGGAATAAAA GGAAATGAAT TAGCCGATCA AGCTGCAAAA TCAGCAAGCA 4740
2694 GTATGCCACT TATCCTCACC CCAAACATAA ATACCACAGA TATAAAAAAA CACCTTAAAG 4800
2695 CCGACCTTGC GACAAAACAG AAAGAACACA TAATAAACTG CAGTCCATGG TACCAATCTA 4860
2696 TTAACACGAA CACCTCACAC CCATGCGATT ACCTTAAACA ATCCCACCCA AATTGGACCA 4920
2697 GACTCGACCA AATAAAAATA ATACGACTTC GACTAGGACA CACAAACATA ACCCACCAAC 4980
2698 ACTACCTAAA TCCCAATTCA ATACCAACTT GCCCGTTTTG CCAAGGTGAT ATTTCTTTAA 5040
2699 ACCACATATT TAACTCATGC CCATCCCTCC TACAAACCAA GCAAGATATA TTTAACAACA 5100
2700 CCAACCCTCT AGACCTTCTT AGCAAACCCA ATCCAGATAA CATACAAAAA CTCATACTTT 5160
2701 TCCTCAAAAA AACTAAATTA TACCACAAAA TCTAAAAACA AAACAGGCAT TTGTACATAA 5220
2702 CAAGCCAGCA ATTAGTTACC AAATTAGATA TTAACTAAAT TAAGATATAA TAACATTGTA 5280
2703 AATAAATATA GCTGTAAGCC CCGTAGCTAA TGCTATACTA TCTAAGTTAG TCTAGTTTTG 5340
2704 TAAACTATTC TATCTATCAT AATAATAATA A 5371
2705 //
2706 ID DMLINEJA standard; DNA; INV; 5020 BP.
2707 XX
2708 AC M22874;
2709 XX
2710 DR FLYBASE; FBte0000088; Dmel\jockey.
2711 XX
2712 SY synonym: wallaby
2713 SY synonym: sancho
2714 XX
2715 FT source M22874:115..5134
2716 FT SO_feature CDS ; SO:0000316:300..2051
2717 FT SO_feature start_codon ; SO:0000318:1..3
2718 FT /name="Dmel\jockey\gag"
2719 FT /db_xref="FLYBASE:FBgn0020297"
2720 FT /db_xref="SWISS-PROT:P21330"
2721 FT /db_xref="NCBI_PROTEIN:AAA28674.1"
2722 FT /translation="ISIALYGISIKTIDIMENSFAQSRPSNGCDKFEKMRKVAGVEPGE
2723 FT LRSQLRASCAVVSPNLEGMPTQSAVSSLMVTISSNTNASVTCTISNVQANMICTPTYTD
2724 FT CTTVTTSICPTTPYDNGLPTPLSSLPNKPSKANCPFQAHDRTVNRKRKGVSQPPLPILT
2725 FT PSPSRKTKRQATMPLNEEASTSTAAALNNNRFALLSAEAENMEQDVSDADSDIEDSAAR
2726 FT DGGGQSAKYSKPPAICVPSVSDPVTLERALNLSTGSSNYYIRISRFGVSRIYTANPDAF
2727 FT RTAVKELNKLNCQFWHHQLKEEKPYRVVLKGIHANVPSSQIEQAFSDHGYEVLNIYCPR
2728 FT KSDWKNIQVNEDDNEATKNFKTRQNLFYINLKQGPNVKESLKITRLGRYRVTVERATRR
2729 FT KELLQCQRCQIFGHSKNYCAQDPICGKCSGPHMTGFALCISDVCLCINCGGDHVSTDKS
2730 FT CPVRAEKAKKLKPRSRLPMTNNIATLKPPQRSSSGYIPAEALRTNISYADIARRNTTQS
2731 FT RARATVQAEVIPTSDNSLNNKFMTLDNSIRAINTRMDELFKLIHETVEANKAFRELVQV
2732 FT LITRIPK"
2733 FT SO_feature CDS ; SO:0000316:2048..4798
2734 FT SO_feature start_codon ; SO:0000318:1..3
2735 FT /name="Dmel\jockey\pol"
2736 FT /db_xref="FLYBASE:FBgn0015952"
2737 FT /db_xref="SWISS-PROT:P21328"
2738 FT /db_xref="NCBI_PROTEIN:AAA28675.1"
2739 FT /translation="MTQPTLKIGLWNARGLTRGSEELRIFLSDHDIDVMLTTETHMRVG
2740 FT QRIYLPGYLMYHAHHPSGNSRGGSAVIIKSRLCHSPLTPISTNDRQIARVHLQTSVGTV
2741 FT TVAAVYLPPAERWIVDDFKSMFAALGNKFIAGGDYNAKHAWWGNPRSCPRGKMLQEVIA
2742 FT HGQYQVLATGEPTFYSYNPLLTPSALDFFITCGYGMGRLDVQTLQELSSDHLPILAVLH
2743 FT ATPLKKPQRVRLLAHNADINIFKTHLEQLSEVNMQILEAVDIDNATSLFMSKLSEAAQL
2744 FT AAPRNRHEVEAFRPLQLPSSILALLRLKRRVRKEYARTGDPRMQQIHSRLANCLHKALA
2745 FT RRKQAQIDTFLDNLGADASTNYSLWRITKRFKAQPTPKSAIKNPSGGWCRTSLEKTEVF
2746 FT ANNLEQRFTPYNYAPESLCRQVEEYLESPFQMSLPLSAVTLEEVKNLIAKLPLKKAPGE
2747 FT DLLDNRTIRLLPDQALQFLALIFNSVLDVGYFPKAWKSASIIMIHKTGKTPTDVDSYRP
2748 FT TSLLPSLGKIMERLILNRLLTCKDVTKAIPKFQFGFRLQHGTPEQLHRVVNFALEAMEN
2749 FT KEYAVGAFLDIQQAFDRVWHPGLLYKAKRLFPPQLYLVVKSFLEERTFHVSVDGYKSSI
2750 FT KPIAAGVPQGSVLGPTLYSVFASDMPTHTPVTEVDEEDVLIATYADDTAVLTKSKSILA
2751 FT ATSGLQEYLDAFQQWAENWNVRINAEKCANVTFANRTGSCPGVSLNGRLIRHHQAYKYL
2752 FT GITLDRKLTFSRHITNIQQAFRTKVARMSWLIAPRNKLSLGCKVNIYKSILAPCLFYGL
2753 FT QVYGIAAKSHLNKIRILQAKTLRRISGAPWYMRTRDIERDLKVPKLGDKLQNIAQKYME
2754 FT RLNVHPNSLARKLGTAAVVNADPRTRVKRRLKRHHPHDLPNLVLT"
2755 XX
2756 CC Derived from M22874 (g157823) (Rel. 47, Last updated, Version 5).
2757 CC Takis Benos and Michael Ashburner, 20-Aug-1997.
2758 CC Any changes to original sequence record are annotated in an FT line.
2759 XX
2760 SQ Sequence 5020 BP; 1527 A; 1198 C; 1055 G; 1240 T; 0 other;
2761 AAAAATCATT CACATGGGAG ATGAGCAATC GAGTGGACGT GTTCACAGAA GTCGCGAGAT 60
2762 AAAACAAAAA CGTAATTGTG ATCCATCACA AACATCTGCG CAGATCGTGT GCTTATCTCA 120
2763 CAAACAAAAT CTATTTTTAG TCACTGCATA ACGGTGACGG CTTCGGTTCG CGAAACTTAT 180
2764 CAGCAACTAG CAATTTCTAA GCTGTGTTGT TTTTGCCCCT CGCCCTGCGC GCTGCGCAAG 240
2765 CGGGAGGTTG TTACAATTTA CCTTACAAGT AAACCGGTAA ATCTTATCGT GTTTAGTAAA 300
2766 TATCAATTGC ATTATACGGC ATAAGTATAA AGACAATTGA TATAATGGAG AATTCATTTG 360
2767 CTCAATCGCG ACCTAGCAAT GGGTGCGATA AATTTGAGAA AATGAGGAAA GTAGCAGGTG 420
2768 TTGAGCCAGG AGAATTACGC TCCCAACTCC GCGCCAGCTG TGCAGTTGTT TCCCCTAACC 480
2769 TGGAAGGTAT GCCAACTCAA TCTGCGGTCT CCAGCTTAAT GGTGACAATC AGCAGCAACA 540
2770 CCAATGCAAG TGTTACCTGC ACTATTTCTA ACGTACAGGC CAACATGATC TGTACTCCTA 600
2771 CATACACTGA TTGCACAACC GTGACCACTA GCATTTGCCC AACTACGCCT TATGACAATG 660
2772 GACTGCCGAC ACCTCTGTCA TCACTGCCCA ATAAGCCATC TAAAGCGAAT TGCCCCTTTC 720
2773 AAGCACATGA TCGTACTGTC AACAGGAAAC GAAAAGGCGT GTCTCAGCCC CCATTACCTA 780
2774 TCCTCACCCC TTCTCCAAGC CGTAAAACTA AAAGGCAGGC CACTATGCCA CTCAATGAGG 840
2775 AGGCCTCTAC CTCCACTGCA GCAGCATTAA ATAACAATCG CTTCGCGCTT TTGTCCGCTG 900
2776 AAGCGGAGAA TATGGAGCAA GACGTGTCGG ATGCTGATTC TGACATTGAA GACTCTGCTG 960
2777 CCCGAGATGG TGGTGGACAA TCCGCTAAAT ATAGCAAACC CCCAGCCATA TGCGTACCAA 1020
2778 GTGTAAGCGA TCCGGTCACC TTGGAACGGG CTCTCAATCT GAGCACCGGC TCCTCAAACT 1080
2779 ACTACATCCG CATTTCTAGA TTTGGTGTAT CCAGAATCTA TACAGCCAAC CCTGATGCTT 1140
2780 TCCGCACCGC TGTAAAAGAA CTAAATAAGT TAAATTGTCA ATTCTGGCAT CACCAACTTA 1200
2781 AAGAAGAAAA ACCCTACAGA GTAGTGCTTA AAGGAATCCA TGCTAATGTT CCTAGTTCGC 1260
2782 AGATAGAACA AGCATTTAGT GATCACGGCT ATGAGGTCCT TAATATCTAT TGCCCCAGAA 1320
2783 AGTCTGACTG GAAGAACATT CAGGTAAACG AAGATGATAA TGAAGCTACA AAAAACTTCA 1380
2784 AAACTAGACA AAATTTGTTT TATATTAATC TTAAACAAGG CCCGAATGTT AAAGAGTCTC 1440
2785 TTAAGATAAC TCGACTTGGC AGATACAGAG TCACTGTTGA GCGCGCTACA CGTAGAAAAG 1500
2786 AACTGCTACA ATGTCAAAGA TGCCAAATTT TTGGACACTC TAAGAACTAT TGCGCCCAGG 1560
2787 ATCCTATTTG TGGTAAATGT AGTGGTCCCC ATATGACCGG GTTCGCTTTG TGCATAAGTG 1620
2788 ACGTATGTCT GTGTATAAAT TGTGGTGGTG ATCATGTCTC GACAGACAAA AGCTGCCCTG 1680
2789 TCAGAGCAGA GAAAGCCAAG AAGCTAAAAC CAAGGTCCAG GCTACCGATG ACTAATAATA 1740
2790 TTGCCACACT CAAACCTCCA CAACGTTCTT CAAGCGGTTA CATACCAGCT GAGGCATTAA 1800
2791 GAACCAACAT CTCTTATGCT GATATTGCTC GACGCAACAC GACTCAATCT AGGGCTCGTG 1860
2792 CTACTGTGCA GGCTGAAGTT ATACCAACGT CGGACAATAG CCTTAACAAT AAATTTATGA 1920
2793 CGTTAGACAA CTCCATTCGG GCCATCAATA CGAGAATGGA CGAACTATTT AAGCTTATAC 1980
2794 ACGAAACTGT AGAGGCTAAT AAAGCTTTCA GAGAACTGGT TCAGGTTCTA ATTACACGTA 2040
2795 TTCCTAAATG ACTCAACCAA CCTTAAAAAT CGGATTGTGG AACGCTCGCG GATTAACAAG 2100
2796 GGGCTCTGAG GAGCTTCGGA TATTCCTCAG CGATCACGAT ATAGACGTAA TGCTTACCAC 2160
2797 GGAAACACAC ATGCGAGTTG GTCAGCGCAT CTATCTCCCA GGGTATCTTA TGTATCACGC 2220
2798 CCACCACCCC AGTGGTAACA GTAGAGGTGG CTCTGCAGTC ATCATAAAAT CTAGACTTTG 2280
2799 TCACAGCCCT CTGACACCTA TCTCTACTAA TGACAGGCAG ATAGCGAGAG TGCACCTGCA 2340
2800 AACATCGGTT GGGACCGTCA CTGTAGCTGC TGTTTATCTA CCTCCAGCAG AAAGATGGAT 2400
2801 AGTAGATGAC TTCAAATCCA TGTTTGCTGC GTTAGGCAAC AAATTTATTG CTGGTGGTGA 2460
2802 TTACAATGCC AAACATGCAT GGTGGGGGAA CCCAAGATCC TGTCCTAGAG GTAAAATGTT 2520
2803 GCAAGAAGTC ATTGCACATG GGCAATACCA AGTTCTGGCT ACGGGCGAAC CCACTTTCTA 2580
2804 CTCTTACAAC CCTTTGTTAA CACCATCAGC CCTTGATTTT TTTATAACCT GTGGGTACGG 2640
2805 CATGGGCAGG CTAGATGTAC AAACTCTCCA GGAACTCTCG TCGGACCATC TTCCTATTCT 2700
2806 GGCTGTATTG CACGCTACGC CGTTAAAGAA ACCACAACGC GTACGACTAC TTGCCCATAA 2760
2807 TGCTGACATA AACATATTCA AAACCCATCT TGAACAGCTG AGTGAGGTAA ATATGCAAAT 2820
2808 TCTGGAGGCG GTGGACATTG ATAATGCCAC AAGCCTTTTC ATGAGCAAAC TAAGTGAGGC 2880
2809 TGCTCAGCTT GCTGCACCGA GAAATCGGCA TGAAGTAGAG GCCTTCAGAC CACTTCAACT 2940
2810 TCCTTCCAGT ATATTGGCAC TGCTCAGGCT AAAACGAAGA GTTCGAAAAG AATATGCTAG 3000
2811 AACAGGTGAT CCCCGCATGC AACAGATCCA CAGTAGACTG GCCAACTGCC TGCATAAGGC 3060
2812 CCTTGCTCGA AGAAAGCAGG CCCAAATAGA TACCTTCTTG GATAACTTGG GTGCTGACGC 3120
2813 GAGCACAAAT TACTCACTGT GGCGTATCAC GAAACGGTTC AAAGCTCAGC CCACCCCAAA 3180
2814 ATCAGCAATC AAAAATCCGT CTGGTGGCTG GTGTCGCACT AGCTTGGAAA AAACTGAAGT 3240
2815 GTTCGCTAAC AACCTTGAGC AACGTTTTAC ACCCTATAAC TATGCACCGG AAAGTCTCTG 3300
2816 TCGTCAGGTT GAAGAATACT TGGAATCGCC CTTTCAAATG AGCCTGCCTC TGAGTGCTGT 3360
2817 CACACTGGAA GAAGTGAAGA ATTTAATAGC CAAGCTGCCA CTTAAGAAAG CTCCTGGAGA 3420
2818 AGATCTTCTT GATAATAGAA CCATTAGACT TCTCCCAGAT CAAGCATTGC AGTTCCTTGC 3480
2819 CTTAATATTC AACAGCGTTC TTGATGTTGG CTACTTTCCG AAAGCTTGGA AATCGGCGAG 3540
2820 CATAATTATG ATCCATAAGA CTGGAAAAAC ACCGACAGAC GTTGACTCGT ACAGGCCCAC 3600
2821 CAGCTTACTC CCATCTCTGG GTAAAATTAT GGAGAGGCTG ATCCTAAACA GGCTGCTCAC 3660
2822 ATGCAAGGAT GTTACCAAAG CGATTCCCAA ATTTCAGTTT GGCTTCCGGT TGCAGCACGG 3720
2823 TACTCCTGAG CAACTACATA GAGTAGTGAA CTTTGCTCTG GAAGCTATGG AAAACAAGGA 3780
2824 GTATGCAGTA GGTGCCTTTC TTGATATTCA ACAGGCATTT GACAGAGTCT GGCACCCTGG 3840
2825 GCTCCTGTAC AAAGCGAAGA GGCTGTTCCC GCCGCAGCTA TATTTGGTTG TTAAAAGTTT 3900
2826 CCTGGAAGAA CGCACATTCC ACGTCTCTGT TGATGGGTAC AAATCATCAA TCAAGCCAAT 3960
2827 TGCAGCTGGA GTTCCTCAAG GAAGCGTTCT TGGCCCAACC CTATACTCAG TTTTTGCTTC 4020
2828 GGACATGCCT ACTCACACAC CAGTCACAGA GGTAGACGAA GAAGATGTGC TCATAGCCAC 4080
2829 CTACGCTGAC GATACTGCTG TGCTCACGAA AAGTAAAAGT ATCCTGGCTG CCACTTCTGG 4140
2830 TCTACAGGAA TACCTGGATG CATTCCAGCA ATGGGCTGAG AACTGGAATG TGCGCATCAA 4200
2831 CGCTGAGAAG TGTGCCAATG TGACGTTCGC CAACCGAACA GGTAGCTGTC CGGGTGTCAG 4260
2832 TCTGAATGGA AGACTGATCA GACACCATCA GGCTTATAAA TACCTTGGTA TTACCCTCGA 4320
2833 TAGGAAGCTC ACCTTCAGCA GGCACATCAC AAATATTCAG CAAGCGTTCA GGACCAAGGT 4380
2834 TGCTCGGATG TCTTGGCTCA TTGCACCACG CAACAAACTG TCGCTTGGCT GCAAGGTCAA 4440
2835 TATTTACAAG TCCATATTGG CCCCCTGCCT GTTCTACGGC CTGCAGGTAT ACGGCATTGC 4500
2836 TGCGAAGAGT CACCTTAATA AGATCCGGAT TTTACAGGCG AAGACCTTAA GAAGAATTTC 4560
2837 GGGGGCTCCT TGGTATATGA GAACAAGAGA CATCGAACGC GACCTCAAGG TGCCCAAATT 4620
2838 AGGAGACAAG CTCCAGAACA TCGCCCAAAA ATATATGGAA AGGCTTAATG TACACCCCAA 4680
2839 CAGCCTAGCA AGGAAGCTAG GAACTGCAGC TGTGGTCAAT GCTGACCCTC GGACTAGAGT 4740
2840 CAAAAGAAGA CTCAAGCGAC ACCACCCTCA TGACCTCCCT AACCTGGTTT TGACCTAGAA 4800
2841 AGTCTTAGTT TTAAAATTCA TTAGAATAAT CAAATAAATA ATAATTACTA TGTTATATCA 4860
2842 ACTATTATAA TTCTCCCTAT CATTTTTAGA TTAAAAATCT GTTAGTCTTA AGTAACCAAG 4920
2843 ACACATTGTA AAATAAAATA ATTTAAGCAG ATCAAATTAA GTTGCCGCAT GGGTAACAGT 4980
2844 GCGTTGATCA AATAATAAAA ACATCATAAA AAAAAAAAAA 5020
2845 //
2846 ID DMTRDNA standard; DNA; INV; 1435 BP.
2847 XX
2848 AC X80025;
2849 XX
2850 DR FLYBASE; FBte0000670; Dmel\hopper.
2851 XX
2852 SY synonym: M4
2853 XX
2854 FT source X80025:1..1435
2855 FT SO_feature terminal_inverted_repeat ; SO:0000481:1..33
2856 FT SO_feature terminal_inverted_repeat ; SO:0000481:1403..1435
2857 XX
2858 CC Derived from X80025 (g510507) (Rel. 44, Last updated, Version 11).
2859 CC Takis Benos and Michael Ashburner, 20-Aug-1997.
2860 CC Any changes to original sequence record are annotated in an FT line.
2861 XX
2862 SQ Sequence 1435 BP; 456 A; 265 C; 212 G; 502 T; 0 other;
2863 CACTATGGGG CATTTGGCCT GTTTTTTTTA CAAAAATTAA TACCTCCTAA ACTATTGGAG 60
2864 ATATTTGGAT GAATTTTTTT TTATGCGTTA CACATGCCTC CAGGAATATT TTGGAAAAGT 120
2865 GGGCGTGCCC CAACTCCGCC CCATTTTTTT TTTTTTTTTT TTTTTTTTTT AATAATATAT 180
2866 TTTTAAAGTT TATTTTTAAT TTCAATAATG TATAATTCAT AACCGTCTTC CTCTTCACAA 240
2867 TCAGTAGAGT CTGAAGAATT TTTATCAGGT TCAAATTCGC AAGCTAACAT TTCAATGACT 300
2868 TCTGGTGGAA GAGATAGTCG CTTATGTTTT CGCCTCTTTA AATTTATTGA TGATATTATG 360
2869 GGATCCGAAG TATCCATTGC TCTGTAAAAG ACATCTGCGA AGCTACTAAT AGTTTTTGCC 420
2870 GTGGCTGGCT TCAACAAAAG AATTTTAAGT ATGGCTGCAA GATCCCGCAG GCAGCACTTC 480
2871 CGTGCAGCTT GAACCAAAAG ACGTTCGTTG TGTTTCTGCG CCCTTACGAG TTCATCTGCT 540
2872 TGCTGTCTTG GGCCACTCAA ATTTTTTAAA TAATATGACG TTTTCGGGAG TCCAACTAAT 600
2873 TTCCTTTCCT ATTTATTTTT CTCCTTTACC TTCAGGACTA GGTGTTCTTC TAACCAATTT 660
2874 GAAAAAAATT TTAAAAATTC ATATATTTTT CGATTGCATT TTCTCCAATT TCGTAAAAGA 720
2875 TTGACTGAAA TCATTCGTTA TTATTATTAT TAGTTAATCG TTTATTAAAG TCTAGCTTGC 780
2876 TATCAGAAAA ATGCCCACTG ATAAAAGTGC AAATAGAATT TTCCTTTTGA CGAACACCCT 840
2877 TTTGCGTGCG CCACACTTCC AGCAGGGCAG CATTGGAAAT CGAGATATTG CTCCCTAAAA 900
2878 AATGAAATTT CTCAAAAAAC CGCAAAAAAC GCACATAGAG ACTACCTGAT ATGAGTTAGG 960
2879 AATTGAACAC ACTACAACAT GGATATAAAC ACTTACTGAA CAAATTTGAA CAAATTGTTG 1020
2880 TAGCTCTATT CAAAGTTGAA AATTTTTTCA AACAACTACA TCTTGACACC ACTTGTTAAA 1080
2881 TGTACAAATT GTTAGAAATA GGCGCACACA ATAAACAATA TATTAATAAC AACACATAAT 1140
2882 AAGAACCTAA AGATTGATTA TCCATTTCAA ATTATACTCT CCTTCTTCTT CTTTTTAAAT 1200
2883 TTTAACACTT TGAAAGTTAA GCTAAATTTT GTGCGCAAAG CAGCCACGTG GTATATGCTC 1260
2884 GCAACAGCCG ACTTTAACAG CTGTTATTAT AACAGTGCAT TGTTAAATTA ACTTATGCGG 1320
2885 GCTATATCAT AACAGTTTAA CGTATTTCCA ATGTATTAAT ACTAAAATAC TTCAAATTTG 1380
2886 CATACTTGTG AAAAACACAT TATTGTAAAA AAAACAGGCC AAATGCCCCA TAGTG 1435
2887 //
2888 ID DMRTMGD1 standard; DNA; INV; 7480 BP.
2889 XX
2890 AC X59545;
2891 XX
2892 DR FLYBASE; FBte0000015; Dmel\mdg1.
2893 XX
2894 FT source X59545:1..7480
2895 FT SO_feature five_prime_LTR ; SO:0000425:1..441
2896 FT SO_feature three_prime_LTR ; SO:0000426:7039..7480
2897 FT SO_feature CDS ; SO:0000316:548..923
2898 FT SO_feature CDS ; SO:0000316:1327..1557
2899 FT SO_feature CDS ; SO:0000316:1749..3062
2900 FT SO_feature CDS ; SO:0000316:2987..6673
2901 XX
2902 CC Derived from X59545 (g8507) (Rel. 49, Last updated, Version 4).
2903 CC Takis Benos and Michael Ashburner, 20-Aug-1997.
2904 CC Any changes to original sequence record are annotated in an FT line.
2905 XX
2906 SQ Sequence 7480 BP; 3067 A; 1298 C; 1235 G; 1880 T; 0 other;
2907 TGTAGTATAT ACGAATATAA TAACAATAAT AATAACAATA ATAATAATAA TATTAATAAT 60
2908 AATTATAATA TGAATCATAA TAATAAGTCA ACTAATAAGT AAACTTAGGA CCACCCTAAT 120
2909 TCCTTAGGGT CACCCTAGTA GATCTTTAGA TACACCCTAA TACTAAATAT GCGAATTCAG 180
2910 GATGTACGCC TTTAGGGGTC GGACTCGACT CCCATTGGTT ATCGAGTATG AACTTCATAC 240
2911 ATACATATTG CAGAATTTGC TAGTGTCAGC ACTTGGCTGT CACAAGAGAT CTCCCTGTAG 300
2912 ACCACACTAA GATCAGTTAT AAATCAGGAA TAGATCTGGA ATGTACACTC GCTTAATAAA 360
2913 AACCAAATAA AGATAAAATG ACCAACTGCG TTTTGAGACT TTATTAACTA CATCAGAAGT 420
2914 ATTAGAATTC AAATTAACTA CATGGCGACC GTGACAAAGG ATCGTTATAA GTTGTAGCAG 480
2915 AAGCTAAAGG AAACCGCTTG TGATAATTTT CAACTTCGAT GCTCATCCAC CAAGACGGCG 540
2916 GCAATTATGA AGAAAAAAGC GATCTGAGTG AGTAGAGTGT CAGTGTGATG GGAAAAAACA 600
2917 GGGGCGGAGT TCGACATAAT ATAAAAAAGA GAATAGCGCA CATAAAGTGG CTATTATATA 660
2918 CGAACACTCC ACCACCCCAA TGGTCGAAAG CTCAAAAACT ACAAGCTGAG CTAGACCACT 720
2919 GTGTCGAATA TCTCAAGAAA AAAATCCCCA CCACACGCGC TCACTCAGAA AATCAAATAA 780
2920 AATCGTTAAC AATTAACAAA ACTCCAACTC CCAATCCGAA AAGCCTGCCT GTTTTCAAGA 840
2921 AAAGATGCCC GAACGACTGC GAGGGACCAC TGTTCACACC GCATTGTGAA CATACGTGCA 900
2922 GACATTGCAG CTCCACCACA TAACCCCTAA ATGAGGAAAT CATCATCAAC GTGGTGAGCA 960
2923 GCCCGCTCAT TACGTCATCG AGGGAGTGTC AGCGTGCCAA CCCGGCGACG ACCAGATGAC 1020
2924 GCAGGAGGGT CAGAGTGAAG CAAATAGGAG CTGAAAAATA AAATATTTTT TTTGTTGCCC 1080
2925 TGCGTGGCAC ACCCTCGATG CACTGCGCTG CATATTAATA TTACACAAAA TATTGTAACA 1140
2926 TTGAGCGGAA CTTTTTCTGC CCGATGAGAA GAATGGCCCG TAAAGCCATA CACCAACTAG 1200
2927 GTAGGAAAAT GTAACTATAT TGAACAAAAA AAAAAAAAAT CAAAACAACA TATTTTTAAA 1260
2928 GTAAAATAAA CCAAAACCCA AAAATAAAAA AAAAAAAAAA AAAAAAAAAA ATAAAAATAT 1320
2929 ACAAAAATGG GTTGGTTTGG ATCTGACGAT AGTCAGACAA AAGATAATAC GGCCAATGTG 1380
2930 GTCAATAACT TAAAAATAGT CGACCATACA GATGACATTC AGTCACTGTG GTTACTCCTT 1440
2931 TTGATCATGA CGATCGTAAC AGTCGCTCAG TTTATATTAA CGCTATATGT TAAGCATAAC 1500
2932 AAGATAATAA AGAGGCGTTA TATAGGCAAA GCAGAGAATA GTTTGGATAA AATTTGAAAA 1560
2933 AAAAAAAAAA AAAAAAAAAA AAAAAAACAT CCGAGATGTA TTTTGAATTA AGATGATCTA 1620
2934 AAATTTTTAT TTTTAATATC AGAAAACTAG AATGAAAAAA AAAAAAAAAG ATTATTGAAG 1680
2935 AAACCTATTT GAGAGAGGCC AAAATTTATA AAGTTCGATT GCATAGATAA ATCCATAGTA 1740
2936 TTCTTTAAAT GGACTGGCAA GAAATACAAA ACGAGCTTAA AGAAATTAAA ACAACTTTTG 1800
2937 ACAAGTCTTA TAAATGCATG ACACCAAATA GAGAAGTGCA ACAAGACACT CTCAACAAGC 1860
2938 ATGCGCAGAT ATTGGTAAGA TGCTTTAATG GAGCACGCCA ATTAATTTAC AGAGAAAGGA 1920
2939 AAAGATTAAC AAAAAATCAT TTATCACAAG CAGTAAAATT TCTAAACAGG TTCCGTGAGA 1980
2940 ACTTGTTAAA CGTCAAGTAC AGACACAACT TAAATATTAC AATCCCAACG ATTTTAAGCA 2040
2941 CACCTATAGT GGCTGAGATC GGTGAGGATA TCGAAAGTGT AGGAGAATCA GAAATAGAAA 2100
2942 TAAAAGAAGA GGATCTCCAC GATCTTGCAA TTCCAGCGGT AATAACATTA CCCGAATTAC 2160
2943 TTGAAGAAGA ACTTTCAGAT TCAAATACAG GAATAAGAAT ACAGGAAACG GACAAAATGA 2220
2944 CAGACTCTGC CGCAACAGCA AGGGAATATG TGCGACAAAT TTCGTCCACA ATACCTGAGT 2280
2945 TTGACGGCAA AAAGTTAAAC TTGAATAGAT TCCTCACGGC TCTCCGGCTG ATAGATCTGA 2340
2946 CAAAAGGAGA TCAGGAGATG CTAGCGGTTG AGGTAATCAA GACAAAGATA CTTGGTCCAT 2400
2947 TATCACACAA AGTTGAAAAT GAAAAGACCA TTATCGGTAT AATAAATCTA TTAAAAGCAT 2460
2948 CAGTTAAAGG CGAATCGCCC GATGTCATCA AAGCAAAAAT GCTTAGTACA CAACAGCGCG 2520
2949 GCAAAACTGC AGCGCAATAT ACCACGGAGA TAGAAAACCT ACGTGGGTTG CTCGAAGCAG 2580
2950 CCTATATAGA TGATGGTTTA GATTCCAACA ATGCAGACAA ATTCGCTACA AAGGAAGCCA 2640
2951 TATCTGCAAT GACCAAGAAC TGTGGGCACG ATAAGCTCAA AACCATATTG GAAGCTGGAA 2700
2952 ATTTCAACAC GATGAATAGC GTGATTGAAA AATACATACA CTGCAGTACA GAAATGACCG 2760
2953 GCAATTCAAA TAGTGTATTA TTCTATAATA ATAGAGGACA CTATCGAGGT AATAATTACC 2820
2954 GAGGAAATTA CCAAAACAGA GGTAATGGCC GAGGAAATTA TAACTCCTAC AATAACAACT 2880
2955 ATAGAGGCAG AGGTGGTTAC CATGGTGGAA ACAGAGGACG AGGTGGTAAC CAAAATTATA 2940
2956 ATAGAGGTGG AGGTTACTCA AGAGGTAACC AAAACCATAA CTATAAAACA AGTCATGCCC 3000
2957 ACAATGTCCG AAACATACAA TCGGAAAACG AACATACCCC CTTGAGCGAC AATCTACAAT 3060
2958 AAAATTATAC AAAATTAATC TCAATTTAAG CATTTTTATA CGATTGAAGA ATATGAGTAC 3120
2959 CAATTCATGG GTAACTCTTT TAATAGATAC AGGTGCAGAA ATTTCCCTGC TTAAATGCAG 3180
2960 AAACAATAAT CTTAACGATT TAAATCCAAA AAATACAACA AATATATCAG GAATAGGGCA 3240
2961 AGGGACAATT CAGTCTCTAG GTACACTACA TTTAGAAATG TGTATTGCTA ATGCAGCAAT 3300
2962 ACCATATGAA TTCCATATCG TACCTAACAA TTTTCCTATA CCAGGGGATG GTATAATTGG 3360
2963 CTTGGATTTC ATTAAGAAAT ACAATTGTAT TTTGGAATTC CACGACCAAG AAGATTGGTT 3420
2964 CACTTTGAGG CCCAAAAATT TCAGGAACAT AAACATTCCT ATTATACATA CACTAGATAA 3480
2965 TGAAATAATT TTGCCAGCTA GATCAGAAGT GATTCGAAAG ATTCAACTAA CATCTACTGA 3540
2966 CACACATGTT CTCATTCCCA ACCAAGAATT ACAACCTAGC ATAATAATCG CAAGTGCACT 3600
2967 CGTAAACACT CAGAACGTTT TGATTCGAAT TATTAATACA ACTGAAAAAG ACGCTATAGT 3660
2968 TAGTAGCGCA AATATAAAAA GCGAATCATT GGATGATTAT GATGTATACA ACGCAAATAT 3720
2969 AGAAAATAGT GCACAAAGAA CTTCAGAAGT ATTAAAACTT CTTAAATTTC CATCGTTATT 3780
2970 CAAAAGCGAT TTAACAAAAT TATGCACCGA ATATAGCGAT ATTTTTGGTC TTGAAACAGA 3840
2971 AACCATATCA GCTAATAATT TTTACAAGCA AAAATTGAGA TTAAATGACA AAACTCCAGT 3900
2972 CTATATCAAA AACTATAGAA TGCCAGAAAG TCAAAAACCA GAAATTCAAA GGCAAGTTGA 3960
2973 CAAATTAATA AAAGATGGCA TTGTCGAACA ATCTATTTCA GAATATAATA GCCCTCTTCT 4020
2974 CTTGGTACCC AAGAAATCAC TGCCTAACTC GGAGGAAAAG AGATGGCGAT TAGTAGTCGA 4080
2975 TTATCGCCAA ATAAACAAGA AACTGCTAGC AGATAAATTC CCACTTCCAA GAATAGAAGA 4140
2976 CATTCTTGAT CAATTAGGCC GAGCAAAATA TTTCTCGTGC CTAGACCTGA TGTCAGGATT 4200
2977 TCATCAAATA GAATTAGACG AAAGGTCAAG AAATATAACA TCTTTCTCAA CTTCAACGGG 4260
2978 AGCATACCGC TACACGCGAT TACCATTTGG TTTAAAAATA GCCCCAAATT CTTTTCAAAG 4320
2979 AATGATGACC CTTGCATTTT CAGGTTTAAC GCCTTCGCAA GCATTTCTGT ATATGGATGA 4380
2980 TTTAGTAGTC ATAGGCTGTT CTGAAAAGCA CATGCTTAAA AATCTAACCG ACGTTTTCAA 4440
2981 ATTATGTAGG CAACATAATT TAAAATTACA TCCAGAAAAA TGCACTTTCT TTATGAAAGA 4500
2982 GGTTACTTAT TTAGGTCACA AGTGTACTGA CAAAGGTATA TTGCCAGATG ACTCTAAATA 4560
2983 TGAGGTAATA AAGAACTACC CCAAACCAGT AAACGCAGAC GAAGCTAGAC GCTTCGTGGC 4620
2984 ATTTTGCAAT TATTACAGAA GATTTATTAA GAACTTTTCT GAGAAATCAC GCCACTTAAC 4680
2985 GAGGCTTTGT AAAAAGAATG TTCCATTTGA ATGGACAAGC GAATGCAATG ATGTATTCGA 4740
2986 ATATCTCAAA AGGAAATTAA TGAAACCAAC ACTCCTTCAG TACCCAGATT TCAGCAAACA 4800
2987 ATTTTGCATA ACCACAGATG CTAGTAAACA AGCATGTGGA GCGGTACTAT CTCAAGACCA 4860
2988 TAACGGTCAA CAGCTACCAG TGGCATACGC TTCAAGAAGC TTTACAAAAG GCGAAAGTAA 4920
2989 TAAGTCCACT ACAGAGCAGG AGCTAGCAGC TATTCACTGG GCAATAAATC ACTTCAGACC 4980
2990 ATACGTATAT GGTAGACATT TCTTAGTACA AAGTGACCAT AGGCCACTAT CATATCTTTT 5040
2991 TTCAATGAGA AACCCCAGTT CAAAATTAAC CAGAATGAGA CTAGACTTGG AGGAGTTCGA 5100
2992 ATTCACAGTA GAATATCTCA AGGGGAAAGA TAATCATGTC GCAGACGCAT TGTTCCGAAT 5160
2993 AACAATCGGA GAACTTAAAG CAATAAATAG ACAGATACTA AAGGTAACAA CAAGATCAAC 5220
2994 AACAAGACAG AAAAATACCT GCGCAGGTGA AAAATTGCAT GAACCAAATG AGAAAGAAAA 5280
2995 TATAAAAATG CCCAATATCT ATCAGGTAAT CAATAACATT GATGCCAAAA AATATGTTAT 5340
2996 ACTCAAAATA GACAAGCATA AGTGTTTGTT GAAAAGAGGA AAACAAATTA TAACACGTTT 5400
2997 TGATATGACT AATTTTTATT CTAATGAAAT AATCGATTTA GATCAATTCT TTCAAAGGCT 5460
2998 TAATGAAGAA GCAAGAATAA ATAGCATCAT TCAAACACAA TTGTCACCAA GTGAACAAAT 5520
2999 CTTCGAATTT GTCACTATAA AGAACTTTAA AGAAAAGGGC AATAAAATAC TAAAAAATTT 5580
3000 AAAAATAGCG CTATTAAACA AGGTGACTAA GATAGATAAA AATGATAAGG TTCAAATAAA 5640
3001 AGCAATACTG TCTAAATATC ATGATGATCC ATCAGAAGGA GGCCATTCAG GAATTTCTAG 5700
3002 AACCCTGAGG AAAATGAAAA ACTGTTGTTG TTGGCCACGA ATGACGAAGG CGATAAGTGA 5760
3003 ATATGTTGAA ACATGTTTGA AATGTCAACA AGCCAAGACT ACGAAACATA CTAAAACACC 5820
3004 GTTGACAATA ACAGAAACGC CAGCAACAGC ATTTGATAAA GTTTTGATAG ATACCATTGG 5880
3005 TCCACTGCCA AGATCAGAAA ACGGAAATGA GTATGCTGTT ACTATCATTT GCGATTTAAC 5940
3006 AAAATATTTG GTAACGGTAC CAATTCCAAA TAAAAGTGCA AAATCAGTTG CTAAGGCTAT 6000
3007 ATTCGAAAAT TTTATTCTAA AGTACGGTCC AATGAAAACA ATCACAACGG ACATGGGAAC 6060
3008 GGAATATAAA AACCAAATTA TAGACGACCT ATGCAAATAT ATGAAGATAA AAAACATTAC 6120
3009 TTCAACAGCA CACCATCACC AGACATTAGG AACAGTAGAA CGAAGTCACA GAACTTTCAA 6180
3010 CGAGTATGTT CGCTCATATA TATCTGTTGA CAAAACCGAT TGGGATATAT GGATACAATA 6240
3011 TTTTACTTAT TGTTTCAACA CAACACCATC GGTAGTTCAT GAATATTGTC CATATGAATT 6300
3012 AGTATTTGGA AGATTACCAA GACAGTTCAT AGATTTTAAC AGGATAGACA GAATAGATCC 6360
3013 TATTTACAAC ATGGATGATT ATTCAAAAGA AGTTAAGCTA CGATTAGAAA TAGCATATAG 6420
3014 AAGAGCTAAA AATATGTTAG ACAAGGCAAA AGCCGATAGA AAGATAAAAT ATGATAGAAA 6480
3015 TATTAGTAAC TTTGAATTAA AGATAGGAGA TAAGATATTA CTTAAAAACG AAACGGGTCA 6540
3016 TAAACTTGAC AATAATTATT TAGGACCATA TTTAGTTTCA GAAATAGGAG ATAATGACAA 6600
3017 CATTACAATT ATAGGAAATA AAAATAAAAA ACAGATAGTC CATAAAGATA GGTTAAAAAT 6660
3018 TTTTAATTCA TAATACATTT TGTTTGGTTG GCCAACCACA AATAAAAAAC CACAAATAAA 6720
3019 AAACCACAAA TAAAAAACCA CAAATAAAAA ACCACAAATA AAAAACCACA AATAAAAAAC 6780
3020 CACAAATAAA AAACCACAAA TAAAAAACCA CAAATAAAAA ACCACAAATA AAAAAACCAC 6840
3021 AAATAAAATA AAAACCAATA AAAACATTAT AATACAAAAC TTTTACTTTG CAAAATATAA 6900
3022 TGAAAATATA TATATTTTTT TTAATATCTC TTTAATCATT CATTTCAAAT ATTAATGTAC 6960
3023 ATTTAAAAAA AAAAAAAAAA ATATTATATA CTTGAAAATA ACTTCATGTT ATTACGTTAT 7020
3024 TTTTCAAAAG GAGGGAGATG TAGTATATAC GAATATAATA ACAATAATAA TAACAATAAT 7080
3025 AATAATAATA TTAATAATAA TTATAATATG AATCATAATA ATAAGTCAAC TAATAAGTAA 7140
3026 ACTTAGGACC ACCCTAATTC CTTAGGGTCA CCCTAGTAGA TCTTTAGATA CACCCTAATA 7200
3027 CTAAATATGC GAATTCAGGA TGTACGCCTT TAGGGGTCGG ACTCGACTCC CATTGGTTAT 7260
3028 CGAGTATGAA CTTCATACAT ACATATTGCA GAATTTGCTA GTGTCAGCAC TTGGCTGTCA 7320
3029 CAAGAGATCT CCCTGTAGAC CACACTAAGA TCAGTTATAA ATCAGGAATA GATCTGGAAT 7380
3030 GTACACTCGC TTAATAAAAA CCAAATAAAG ATAAAATGAC CAACTGCGTT TTGAGACTTT 7440
3031 ATTAACTACA TCAGAAGTAT TAGAATTCAA ATTAACTACA 7480
3032 //
3033 ID DMMDG3 standard; DNA; INV; 5519 BP.
3034 XX
3035 AC X95908;
3036 XX
3037 DR FLYBASE; FBte0000010; Dmel\mdg3.
3038 XX
3039 FT source X95908:1..5519
3040 FT SO_feature five_prime_LTR ; SO:0000425:1..267
3041 FT SO_feature three_prime_LTR ; SO:0000426:5253..5519
3042 FT SO_feature transcription_start_site ; SO:0000315:178
3043 FT SO_feature polyA_signal_sequence ; SO:0000551:5253..5519
3044 FT SO_feature CDS ; SO:0000316:296..4780
3045 FT /name="Dmel\mdg3\ORF"
3046 FT /db_xref="FLYBASE:FBgn0043882"
3047 FT /db_xref="SPTREMBL:Q94885"
3048 FT /db_xref="NCBI_PROTEIN:CAA65152.1"
3049 FT /translation="MDDKIILNDFSLTTLKDWLRILGQNTEGTKTELIARLQDIPTAVR
3050 FT GDCPPEHPQKNAPPGNDIFSSLDFQNCEINTDHVSVNAMNRKESTETGSERETNMFELQ
3051 FT QLRAELAEAKAMLNGTRSSLQFQEQQQPEQSKATVSSVIQTAQFTQAGATKENTTFHSP
3052 FT QRSNERAESQRFPVDALALAKETITDYDGKTCARAWITVVKNIARTFNIDDNHLRILLI
3053 FT TKLKGNAQVWLHAHPARLIEPIDNLLDQLSLTFGEQSSKAEIRRKFESRKWKTEENFCS
3054 FT YYDEKMALSNGINIDDDELLDQMIEGIPLQNFRTQARIQCFSTPSEMLRAFSNIRLPAR
3055 FT REPPVQPTDYKDAIRCANCNSRGHKADICKKPKREPGSCYACGQLGHLVAQCPTRKSVS
3056 FT SNNYVRWFKINFFENAYKPIISECLIDSGSPISIIKKSLINETMKLALVNTCYFGLNNC
3057 FT ILKTHGQTTCYVLKGSIKIYFRLIIVCDQSMRYNVILGRDFLTACNLNLDPYTLGMIAL
3058 FT RKPMEINKISMFTENDSPEKSLENEIVSPKSLENEIVSSQSLENEIVSPKSLENEIVSP
3059 FT KSFKNATISPKSLENKIVNQQHKETGPISLRDEIVNQQKNVSKSKLSEDEIVNTSKEIV
3060 FT SFKLPKDKNVYEQLNHNFDKEVLRICHVTESELEYKIGENVSNRLQLEFDRLFRNFYIN
3061 FT AKRPNEPTVRSEIQLCLKNPKPFSCSPRRLSYTEKDRLQKLLDEYLENGFIRPSDSEYA
3062 FT SPIVLVKKKTGDLRMCVDFRKLNKMTMKDNYPLPLIDDLLDRMNEKTVFTKLDLKNGFF
3063 FT HVHVKKESIKYTSFVTPLGQYEWLRMPFGLKNAPSVFQRFVNKIFADMIRENKVVVYMD
3064 FT DILLATENINEHLETLKEIFKRLVENKLELRIDKCEFMQSSIKYLGFIINKDGIMPNDK
3065 FT GIEAIKNFPIPNNVHTVQSFLGLCSYFRRFIKDFSRLAKPLHDILKKDKPFKFGSEEMI
3066 FT CFNMLKDKLIQSPVLAIYNHKHETELHCDASSSGFGAVLMQKKEDQKWHPVSFFSKRTT
3067 FT DIESKYHSFELETLAIVYSLRRFRVYLHWRTFKIVTDCNSLILTLSKKELNPRIARWAL
3068 FT EFQGYDFEIVHRAGSRMQHVDALSRCTNIMVIQTNSFEDNLVICQGKDTKLKEIRQLLE
3069 FT NTENKLYEMRNGIVYKKTNENRLLFYVPIEMEEQVLYKYHNELGHVGRDKMIEAIMKNY
3070 FT WFPNLKQKCSTHISNCLKCISFSPKTGKTEGFLHNIPKGNKPFEIIHIDHYGPVDLARP
3071 FT KKHILVIVDAFTKFVRLYATKTTNTKEVIQSLNDYFRAYSRPKCIISDRGACFTSGDFD
3072 FT SFLKECNVKHIKIATGSPQANGQVERINRSLGPMISKLIEPDQGLHWDLVLEKVEYTLN
3073 FT NTLHRSIKQYPSIMLFGLQQKGQIMDELKEKIEEIGETIEERDLESIRNKGEASQKIAQ
3074 FT AYNKEYVDKKRKRSGVFTKGTTSWLKILTQQQA"
3075 XX
3076 CC Derived from X95908 (e990667) (Rel. 49, Last updated, Version 3).
3077 CC Takis Benos and Michael Ashburner, 20-Aug-1997.
3078 CC Any changes to original sequence record are annotated in an FT line.
3079 XX
3080 SQ Sequence 5519 BP; 2078 A; 1005 C; 1029 G; 1407 T; 0 other;
3081 TGTAGTAGGC TGCACCTTCT ACCCTCTTCC TTTACTCTTA GTCATACATA CCTAATTATA 60
3082 CATAGCCAAT CTAGTCATAA GCTTATACAC TCATACACCC ATCCTTAACA TACAAATATT 120
3083 ATCGAGAAAC TTATCGACTA ATCGACTCGC CACTCTGCAG AGAGCGCGGC AGTCAGTCGC 180
3084 TGTTGAACCA AGCTAAAGGA CAGATCAAAA ATAAAAGAGA CACGTGAAAT TGTATTAGAA 240
3085 TATTAACTTC TGTAAACGGC GGCTAAAATC TCAGAAGTGG GATTAATAAT CCAAAATGGA 300
3086 CGATAAAATC ATCCTGAACG ACTTTTCGCT GACAACCCTA AAAGATTGGC TACGTATTCT 360
3087 GGGCCAAAAT ACGGAGGGCA CAAAAACCGA ATTAATCGCG AGGCTGCAAG ACATCCCAAC 420
3088 GGCAGTTCGG GGCGATTGTC CACCGGAGCA CCCCCAGAAA AACGCTCCAC CAGGAAACGA 480
3089 CATTTTTTCT TCACTGGATT TTCAGAATTG TGAAATTAAC ACCGATCACG TAAGTGTGAA 540
3090 TGCGATGAAC AGAAAAGAAT CAACCGAAAC TGGCAGTGAG AGGGAGACAA ACATGTTCGA 600
3091 GCTACAGCAA CTACGCGCAG AGCTAGCAGA AGCGAAGGCA ATGCTTAACG GAACACGATC 660
3092 GAGCTTGCAG TTCCAAGAAC AACAACAACC AGAGCAAAGC AAGGCTACAG TTAGTTCCGT 720
3093 TATCCAGACG GCGCAGTTTA CGCAGGCTGG CGCCACAAAA GAGAACACAA CATTTCACTC 780
3094 GCCGCAGCGA TCCAACGAGA GAGCGGAGAG CCAGCGTTTT CCAGTTGATG CTCTCGCTCT 840
3095 CGCCAAAGAG ACGATAACCG ATTACGATGG GAAAACTTGC GCGCGTGCCT GGATAACAGT 900
3096 GGTCAAAAAT ATCGCACGCA CTTTCAACAT CGATGACAAC CATTTACGCA TCTTACTCAT 960
3097 CACTAAACTT AAAGGAAACG CGCAAGTCTG GTTACATGCG CACCCTGCTC GATTGATCGA 1020
3098 ACCAATTGAC AATTTGCTTG ATCAATTGTC ATTGACTTTT GGCGAGCAAT CATCCAAGGC 1080
3099 TGAGATCCGG CGAAAATTCG AGAGTCGCAA GTGGAAAACC GAGGAGAATT TCTGCAGTTA 1140
3100 TTACGACGAG AAGATGGCTC TCTCAAACGG GATAAACATC GACGACGACG AACTACTGGA 1200
3101 CCAGATGATA GAGGGCATAC CGCTACAAAA TTTCCGTACC CAAGCACGGA TTCAATGCTT 1260
3102 CTCTACTCCA TCGGAGATGC TACGCGCATT TTCGAACATC CGTTTGCCAG CTCGGAGGGA 1320
3103 GCCACCTGTA CAGCCAACCG ACTACAAAGA TGCCATACGA TGCGCAAACT GTAATTCAAG 1380
3104 AGGACACAAA GCTGACATCT GCAAGAAGCC CAAACGTGAA CCAGGTTCGT GCTACGCCTG 1440
3105 TGGACAACTT GGACACCTGG TGGCACAATG TCCCACAAGG AAGAGCGTTT CATCTAATAA 1500
3106 TTATGTAAGA TGGTTTAAAA TTAATTTTTT TGAAAATGCT TATAAGCCCA TAATTTCAGA 1560
3107 ATGCCTCATA GACTCTGGCA GTCCTATATC TATCATTAAA AAGTCACTTA TTAACGAGAC 1620
3108 AATGAAGTTA GCCCTAGTTA ATACTTGCTA TTTTGGTTTA AACAACTGTA TTCTCAAAAC 1680
3109 ACATGGACAA ACCACATGTT ATGTTTTGAA AGGATCAATA AAAATATATT TTCGTTTAAT 1740
3110 CATTGTTTGC GACCAGTCTA TGAGGTATAA TGTTATTCTC GGCAGAGATT TTTTAACTGC 1800
3111 ATGCAATTTA AATTTAGACC CGTACACCTT GGGAATGATT GCGTTGAGAA AACCCATGGA 1860
3112 AATAAACAAA ATATCAATGT TTACTGAAAA TGATAGTCCT GAGAAATCTT TAGAAAATGA 1920
3113 AATTGTTAGT CCAAAATCGT TAGAGAATGA AATTGTTAGT TCACAATCGT TAGAAAATGA 1980
3114 AATTGTTAGC CCCAAATCGT TAGAGAATGA AATTGTTAGT CCAAAATCGT TTAAAAATGC 2040
3115 AACTATTAGT CCGAAATCGT TAGAAAATAA AATCGTTAAT CAACAGCATA AAGAAACTGG 2100
3116 TCCAATATCG TTAAGAGATG AAATAGTTAA TCAACAAAAG AATGTCAGTA AATCAAAATT 2160
3117 ATCAGAAGAT GAAATTGTTA ACACTTCAAA AGAAATCGTT AGTTTTAAAT TGCCAAAAGA 2220
3118 TAAAAACGTT TACGAACAAT TAAATCACAA CTTTGATAAG GAAGTACTAA GAATATGTCA 2280
3119 TGTAACTGAA AGTGAGTTAG AATACAAAAT AGGAGAAAAT GTTAGCAATA GGTTACAACT 2340
3120 AGAATTCGAT AGGTTGTTTA GAAATTTTTA TATAAATGCA AAAAGGCCAA ATGAACCGAC 2400
3121 AGTTAGAAGT GAAATACAAT TGTGTTTGAA AAACCCGAAA CCGTTTAGCT GTTCTCCTAG 2460
3122 GAGGCTTTCA TACACAGAAA AAGACAGGTT ACAAAAACTA TTAGACGAAT ATTTGGAAAA 2520
3123 CGGATTTATA CGACCAAGCG ACTCGGAATA TGCATCGCCT ATTGTTTTAG TGAAAAAGAA 2580
3124 AACTGGAGAC TTACGTATGT GCGTCGACTT TAGAAAACTT AATAAAATGA CAATGAAAGA 2640
3125 CAACTATCCT CTACCTCTTA TAGATGACTT GTTAGATAGA ATGAATGAGA AAACTGTTTT 2700
3126 CACCAAACTC GATCTTAAAA ACGGTTTTTT CCACGTGCAT GTTAAAAAAG AATCAATAAA 2760
3127 ATACACCTCT TTCGTTACAC CATTAGGCCA ATACGAGTGG CTGCGAATGC CATTTGGCCT 2820
3128 CAAAAACGCC CCGTCTGTGT TCCAAAGATT TGTTAACAAA ATTTTTGCGG ATATGATTAG 2880
3129 AGAAAACAAA GTAGTAGTAT ATATGGACGA CATTCTATTG GCAACCGAAA ATATAAACGA 2940
3130 ACACTTAGAA ACGTTGAAAG AAATTTTTAA AAGATTAGTT GAAAATAAAC TTGAATTAAG 3000
3131 AATAGACAAA TGTGAGTTTA TGCAATCAAG TATAAAATAT CTTGGGTTCA TAATAAATAA 3060
3132 AGACGGCATA ATGCCCAATG ACAAAGGAAT CGAGGCAATA AAAAATTTCC CAATACCTAA 3120
3133 TAATGTTCAT ACAGTACAAA GTTTTTTGGG ATTATGCTCA TATTTTCGAC GGTTTATAAA 3180
3134 AGATTTTTCT AGACTAGCTA AACCATTGCA TGACATTCTA AAAAAAGATA AACCGTTCAA 3240
3135 ATTTGGTAGT GAAGAAATGA TTTGTTTTAA TATGTTAAAA GATAAATTAA TACAGTCACC 3300
3136 GGTCTTAGCT ATATACAACC ATAAACACGA AACAGAATTG CATTGTGATG CAAGTTCTTC 3360
3137 TGGATTCGGT GCTGTACTTA TGCAAAAGAA GGAGGACCAG AAATGGCACC CAGTTTCATT 3420
3138 CTTTTCAAAA CGGACAACAG ATATTGAATC AAAATACCAC AGTTTCGAGT TAGAAACTTT 3480
3139 AGCCATTGTT TATTCGTTAC GTAGATTTAG AGTTTATCTT CATTGGAGGA CATTTAAAAT 3540
3140 AGTCACCGAC TGCAACTCAT TAATTTTGAC CCTAAGCAAA AAAGAGCTAA ACCCTAGGAT 3600
3141 AGCCAGGTGG GCTTTAGAAT TCCAAGGTTA TGATTTTGAA ATTGTGCATA GGGCAGGTAG 3660
3142 CCGCATGCAA CATGTTGACG CACTGAGTAG GTGTACAAAT ATTATGGTAA TACAAACAAA 3720
3143 CAGTTTCGAA GATAATCTAG TTATATGTCA AGGGAAAGAT ACAAAATTAA AAGAAATCAG 3780
3144 GCAATTGTTA GAAAACACAG AAAATAAATT GTATGAGATG AGAAATGGTA TAGTTTACAA 3840
3145 AAAGACAAAT GAAAATAGAT TGCTGTTCTA CGTTCCGATA GAAATGGAAG AACAAGTGTT 3900
3146 ATACAAATAT CACAACGAAC TTGGACACGT AGGAAGAGAC AAAATGATAG AAGCTATAAT 3960
3147 GAAAAACTAT TGGTTTCCAA ATTTAAAACA GAAGTGTAGC ACACATATCA GCAACTGTTT 4020
3148 AAAATGTATT TCATTCAGTC CCAAAACAGG AAAAACAGAA GGATTTCTAC ACAACATACC 4080
3149 TAAGGGAAAC AAACCTTTTG AAATAATCCA TATTGACCAT TATGGTCCAG TAGACTTGGC 4140
3150 TAGACCGAAG AAACATATTC TAGTGATAGT AGATGCATTC ACAAAGTTTG TCAGACTATA 4200
3151 CGCAACAAAA ACTACGAACA CAAAAGAAGT CATACAATCG TTAAATGACT ACTTCAGAGC 4260
3152 ATACAGTAGG CCTAAGTGTA TCATATCAGA TAGAGGAGCA TGTTTCACGT CTGGCGATTT 4320
3153 TGACTCATTT TTGAAAGAAT GCAATGTTAA ACACATAAAA ATTGCAACAG GATCGCCACA 4380
3154 AGCCAACGGT CAAGTTGAAC GTATAAACCG AAGTCTTGGT CCAATGATTA GCAAGTTAAT 4440
3155 TGAACCTGAT CAAGGTCTAC ACTGGGACTT AGTCTTAGAA AAGGTCGAAT ATACCCTGAA 4500
3156 CAATACACTA CACCGCAGCA TTAAACAGTA TCCTAGCATA ATGTTATTTG GGTTACAACA 4560
3157 AAAAGGACAA ATTATGGATG AGTTAAAAGA AAAAATTGAG GAAATTGGAG AAACGATTGA 4620
3158 AGAAAGAGAT TTAGAAAGTA TTAGAAATAA AGGCGAGGCA AGTCAGAAAA TAGCACAAGC 4680
3159 ATACAATAAA GAATATGTTG ACAAAAAACG AAAACGATCA GGAGTGTTCA CAAAAGGCAC 4740
3160 TACGTCATGG TTAAAAATTT TGACTCAACA ACAGGCATAG CTAAGAAGTT AATTCCAAAG 4800
3161 CATAAAGGAC CCTATGTCAT AAGCAAAGTT CTCAAAAATG ATCGCTTCCT TCTGGAAGAT 4860
3162 GTTGATGGAT TTCAAATTTC TCGCAATCCT TACCGGGGTG TATGGAGCAT ACAGAATATA 4920
3163 AAACACTGGC AAAGAAAAAT TAAGAGTCTA CAAAATAGAA AGTATAATTT GAGAAACTCT 4980
3164 GTACAAAATA GAAAGTATAA TTTGAGAAAC TCTGTACAAA ATAGAAAGTA TAATTTAAGA 5040
3165 AACTCTGTAC GAAATCGAAA GTATAATTTA AGAAGCAATT GTAAAACAAA GAAAACAAAC 5100
3166 AAGAAGAAAA GAAAACCAAA AAAATGTTTA AGACCGTTCA AAAGTATCTC CACTAAGAAG 5160
3167 AATAAAATAA GAAACAGGAC CCTTAGCTTT AAGAAACGTT AATTGTTATA AAATCCTACG 5220
3168 ATCGGGAGAT CTAGTTGTCA GGACGGCCGA GTTGTAGTAG GCTGCTCCTT CTACCCTCTT 5280
3169 CCTTTACTCT TAGTCATACA TACCTAATTA TACATAGCCA ATCTAGTCAT AAGCTTATAC 5340
3170 ACTCATACAC CCATCCTTAA CATACAAATA TTATCGAGAA ACTTATCGAC TAATCGACTC 5400
3171 GCCACTCTGC AGAGAGCGCG GCAGTCAGTC GCTGTTGAAC CAAGCTAAAG GACAGATCAA 5460
3172 AAATAAAAGA GACACGTGAA ATTGTATTAG AATATTAACT TCTGTAAACG GCGGCTAAA 5519
3173 //
3174 ID DMDM11 standard; DNA; INV; 5461 BP.
3175 XX
3176 AC X14037;
3177 AC X15066;
3178 XX
3179 DR FLYBASE; FBte0000042; Dmel\micropia.
3180 XX
3181 FT source join(X14037:5..3664,X15066:3534..3593,X14037:3721..5461)
3182 FT SO_feature five_prime_LTR ; SO:0000425:1..476
3183 FT SO_feature three_prime_LTR ; SO:0000426:4957..5461
3184 FT SO_feature primer_binding_site ; SO:0005850:477..489
3185 FT /bound_moiety="tRNA-leu"
3186 FT SO_feature primer_binding_site ; SO:0005850:4939..4956
3187 FT SO_feature CDS ; SO:0000316:540..4415
3188 FT /name="Dmel\micropia\polyprotein"
3189 FT /db_xref="FLYBASE:FBgn0043876"
3190 FT /translation="
3191 FT MQNRNLAELVKIMQKTPAREQQPSYDVKLPKFNPDAACVEAAKWCSTTDI
3192 FT ILTEHPLKGSKLITALSNCMEGTASQWLTQISYQGMTWQEFQELFLQRFE
3193 FT TEETPAATFLNLLNSRPTAAECYAVYASRLVTQLTTKWRNMEIEEIAVTT
3194 FT VLAHMANIDSRLQRVLFTSNVRTRSKLQAELKAFTFDKKRHARDDNLGPD
3195 FT QKNRKASPVVCHFCSKPGRRIAECRSKMRQDRRAKPQREKSNVTCYRCGQ
3196 FT PGHFSNQCPKNGTAAKQDVTQQKTVNQCCVTEPKGSLHQRGEIYPICFDS
3197 FT GAECSLIKDDISSKLSGKRINNTVMIKGIGGGSVCSTLQILSEVTINENI
3198 FT MEILFHVVPNEEMRNDILIGREILKQGFYVILTSDNFKVVKSKTVNNCSV
3199 FT TERSFTLSDIDTELVDNEKAQLIELLEKHSTSFTNGIPHTRVNTGEMKIR
3200 FT LIDPTKTVQRRPYRLSPEEREVVRMQVSELIRCNIVRPSCSPFASPMLLV
3201 FT KKKNGTDRLCVDFRELNSNTISDKYPLPLISDQIARLRGANYFTCLDMAS
3202 FT GFHQIPIHPESVEYTAFVPDGLKNAPSVFQRTVINALGDLANSFVIVYMD
3203 FT DIMVVSPTKELALERLKTVLNVLTKAGFTFNLAKCSFLKTTVQYLGYEVR
3204 FT AGEIRPNVRKIASLSSLPPPQTVSGVRQFIGLASYFRKFVSGFSQLMKPL
3205 FT YSLSSGSGKITWSAELEEIRLKVVTILTNEPALVIFDPQYPIELHTDASA
3206 FT CGYGAILLHRIESKPHVIEYFSKTTTSVESRYHSYELETLAVVKAVKHFR
3207 FT HYLIGREFVVYTDCNSLKASRTKIDLTPRVHRWWAYLQSFNFEIQYREGK
3208 FT RMAHVDFLSRNPLSPEHILSINKIPEKRVNLSEISSTWLLAEQRLDLEII
3209 FT EIVNKLESDELAENLAKTYDLRKGVLYRKVQRRGRTSYLPVVPRAFKWSV
3210 FT INQVHESIMHLGWQKTLDKVYQYYWFAKMNKYVRKFVSNCITCRSVKSSS
3211 FT GKVQAELHSIPKTSIPWHTIHIDITGKLSGKSDLKEYVIVQIDAYTKFVY
3212 FT LYHTLKIDAESCVNAMKSSISLFGVPDRIIADQGRCFTSSKFSEFCVSQK
3213 FT VELHLIATGMSRANGQVERVMETLKNLLSVVESSQRSWQDALGEVQLALN
3214 FT CTISRATDASPLEMLIGKQARPLGLVPPCETECEIDLATVRAHATENMNS
3215 FT LASYDKSRFDSSRAAVDKHHVGDYVLLRNEERHQTKLDPKFRGPFLVTEV
3216 FT LEGDRYTLKSLTSNRSFKYCHESIKMPDAEIPNELNENVEQ"
3217 XX
3218 CC Sequence assembled by Lynn Crosby (FlyBase), 'micropia.v006'.
3219 CC Any changes to original sequence record are annotated in an FT line.
3220 XX
3221 SQ Sequence 5461 BP; 1679 A; 1051 C; 1264 G; 1467 T; 0 other;
3222 TGTCGTGGCG AAAATAATGA GTATGCGTGT AGTCGCTGTT TACTTCTTCT CCATGTTCCC 60
3223 TTTGCTATTA TGCGTGTTCC TATTTATGAA CACGTGGCGA AAATAATAAA TGCGTGTAGT 120
3224 CGCCGTTTAC TTCTTCTCCA TGTTCCCTTT GCTATTATGC GTGTTCCTAT TTATTGTCAA 180
3225 TGTGTGAGGA TGAATAGATG AATTATCTAT GAACGGGATT TTGCAAAAAC GACTTGCGCT 240
3226 GCTTGGTTAG AAAGGGAAAA CTATATAATG AAAAGGGAAT GCCAAAAATT GAGAAGAGAC 300
3227 AAAGCAGGCT GCACGAAGCT GGAGTGAGGG CATTAATCGT GGAGAAGCCA AAGCAGACGC 360
3228 AAGTGGACTC GTTGACTGCG CACAGCTGCA TAAAATTATA TAGTAAAAAG AGATTTGAGC 420
3229 GACGCTGATA TGGACGGACG GACGGACGCG AGGCCCCTGA TATTCTTAAC CCGACATCAG 480
3230 AAGTGGGATC TGTGCCACAC CCTGCATTTT CTGAGGATCA GTGGCGTGCA GTAGTGGAAA 540
3231 TGCAAAATCG GAATTTGGCT GAACTTGTAA AAATCATGCA AAAGACGCCG GCACGTGAGC 600
3232 AGCAACCTAG TTATGATGTT AAGCTACCCA AATTTAACCC TGATGCTGCA TGCGTAGAGG 660
3233 CAGCAAAGTG GTGTTCAACA ACCGATATAA TTCTAACTGA GCACCCCCTT AAAGGAAGTA 720
3234 AATTGATCAC GGCACTAAGT AACTGCATGG AGGGAACTGC ATCTCAGTGG CTAACACAAA 780
3235 TCTCGTACCA GGGTATGACT TGGCAAGAGT TCCAGGAATT ATTTCTGCAG CGCTTTGAAA 840
3236 CCGAAGAGAC GCCGGCCGCT ACGTTTTTAA ATTTACTCAA CAGCCGCCCG ACTGCCGCCG 900
3237 AATGTTACGC GGTGTATGCG AGTCGGCTGG TGACGCAGCT GACTACAAAG TGGCGGAATA 960
3238 TGGAAATAGA AGAAATTGCC GTTACAACTG TTCTTGCGCA TATGGCAAAC ATTGACAGTC 1020
3239 GTTTGCAGCG CGTCCTCTTC ACATCCAATG TGCGTACCAG AAGTAAGCTA CAGGCGGAGT 1080
3240 TAAAAGCGTT TACGTTCGAC AAGAAGCGAC ATGCTCGAGA TGACAACCTT GGACCTGACC 1140
3241 AGAAGAACCG TAAGGCATCG CCAGTTGTAT GCCACTTCTG TTCAAAGCCG GGACGTCGAA 1200
3242 TTGCTGAATG CCGAAGTAAA ATGCGACAAG ATAGACGGGC GAAACCGCAG CGTGAAAAAT 1260
3243 CAAATGTTAC GTGCTATCGG TGCGGCCAAC CGGGACATTT CTCCAACCAG TGCCCGAAAA 1320
3244 ACGGAACTGC AGCCAAACAA GATGTGACTC AACAGAAGAC TGTTAACCAA TGTTGTGTGA 1380
3245 CTGAGCCAAA GGGAAGCTTG CATCAACGAG GTGAGATCTA TCCAATTTGT TTCGATTCCG 1440
3246 GTGCAGAGTG CTCCCTTATT AAAGACGACA TTAGCAGTAA GTTATCTGGT AAACGTATAA 1500
3247 ACAATACTGT AATGATAAAA GGCATTGGTG GTGGCAGTGT GTGCAGTACA TTGCAAATCT 1560
3248 TGAGTGAAGT CACTATAAAC GAAAATATTA TGGAAATATT ATTTCATGTA GTCCCGAACG 1620
3249 AGGAAATGAG GAATGATATT CTGATAGGGC GAGAAATACT TAAACAAGGC TTTTATGTAA 1680
3250 TTTTGACATC CGATAATTTT AAAGTTGTAA AATCAAAAAC TGTTAATAAT TGTTCCGTTA 1740
3251 CTGAGCGATC GTTTACTTTG TCCGATATTG ACACCGAATT AGTCGACAAT GAGAAAGCTC 1800
3252 AATTAATTGA GTTACTTGAA AAGCACTCGA CTTCATTTAC CAACGGGATA CCTCATACTC 1860
3253 GAGTAAATAC AGGCGAAATG AAAATCCGTT TGATTGATCC AACTAAAACT GTTCAGCGCC 1920
3254 GACCTTACAG ACTTAGCCCC GAAGAGAGAG AAGTAGTGCG AATGCAGGTG AGCGAATTGA 1980
3255 TAAGATGTAA TATTGTTCGC CCAAGTTGCT CTCCCTTTGC TAGCCCCATG TTGCTCGTCA 2040
3256 AAAAGAAGAA CGGAACCGAC CGTCTATGTG TTGATTTTAG AGAGCTAAAC TCGAACACGA 2100
3257 TTTCGGATAA ATACCCCTTG CCGCTTATCA GCGATCAAAT TGCTAGACTT CGCGGAGCAA 2160
3258 ATTATTTCAC ATGCCTGGAT ATGGCAAGTG GTTTCCACCA AATCCCGATT CACCCTGAAT 2220
3259 CCGTGGAATA TACTGCATTT GTGCCCGACG GCCTCAAAAA TGCGCCATCT GTTTTCCAGC 2280
3260 GCACAGTCAT AAATGCACTT GGTGACCTTG CTAACTCTTT TGTAATCGTT TACATGGACG 2340
3261 ACATAATGGT AGTATCGCCA ACCAAGGAAT TGGCTTTGGA AAGGTTAAAA ACTGTTTTGA 2400
3262 ATGTTCTTAC AAAGGCTGGT TTTACCTTTA ACCTTGCTAA ATGCAGTTTT CTCAAAACAA 2460
3263 CGGTTCAGTA TTTAGGCTAT GAAGTGCGAG CGGGAGAAAT TCGTCCGAAT GTGCGAAAGA 2520
3264 TAGCTTCTTT AAGCTCCTTG CCTCCTCCTC AAACTGTCTC CGGCGTTAGA CAATTCATTG 2580
3265 GCTTGGCCTC TTACTTTCGC AAATTCGTGT CTGGATTCTC CCAACTTATG AAACCATTGT 2640
3266 ATTCACTTTC GTCTGGTAGC GGCAAGATTA CATGGAGCGC TGAGCTGGAA GAGATCAGAC 2700
3267 TTAAAGTTGT GACGATCCTC ACAAATGAGC CTGCTCTGGT AATCTTCGAC CCGCAATATC 2760
3268 CTATTGAGTT GCACACTGAT GCAAGTGCCT GTGGATATGG AGCGATACTT TTGCACCGTA 2820
3269 TAGAAAGTAA GCCCCATGTA ATCGAATACT TCAGCAAAAC AACTACCTCT GTTGAATCTA 2880
3270 GATATCACTC CTACGAGCTG GAAACCTTGG CAGTGGTAAA AGCCGTTAAA CATTTTCGCC 2940
3271 ATTACCTAAT TGGCCGTGAG TTCGTTGTCT ATACAGACTG CAATTCATTA AAAGCTTCTC 3000
3272 GCACAAAAAT AGATTTAACC CCCAGAGTTC ACCGCTGGTG GGCCTACTTA CAATCGTTTA 3060
3273 ATTTCGAAAT TCAGTATAGA GAGGGTAAGC GTATGGCTCA TGTGGATTTC CTATCAAGAA 3120
3274 ATCCTTTATC ACCCGAACAC ATTTTGTCAA TAAACAAGAT TCCCGAAAAA CGAGTAAATC 3180
3275 TGTCTGAAAT TTCAAGTACT TGGCTTCTTG CTGAGCAACG GTTAGACCTT GAGATAATAG 3240
3276 AAATTGTTAA CAAATTGGAG TCAGATGAAT TAGCCGAAAA CTTGGCCAAA ACGTATGATT 3300
3277 TGCGAAAAGG TGTATTATAT CGCAAGGTCC AAAGACGAGG TAGAACAAGT TATTTACCAG 3360
3278 TTGTACCCAG AGCTTTCAAA TGGTCAGTAA TTAACCAGGT ACACGAGTCG ATAATGCATT 3420
3279 TAGGGTGGCA AAAGACACTT GATAAAGTGT ACCAGTATTA TTGGTTCGCT AAAATGAACA 3480
3280 AGTATGTTCG AAAATTTGTT TCAAACTGCA TAACTTGTAG ATCAGTGAAA TCATCTTCCG 3540
3281 GGAAGGTTCA GGCGGAACTT CATTCCATTC CGAAGACAAG TATACCGTGG CACACCATCC 3600
3282 ACATAGATAT AACGGGGAAA TTAAGTGGCA AGAGCGATTT GAAGGAGTAT GTCATTGTTC 3660
3283 AGATCGATGC CTATACAAAG TTTGTTTATC TGTATCACAC CTTAAAGATA GATGCCGAAA 3720
3284 GCTGTGTTAA TGCTATGAAA TCTTCCATAT CCTTATTTGG AGTACCAGAT CGCATTATCG 3780
3285 CCGACCAGGG CAGATGTTTT ACTAGCTCTA AGTTTTCAGA GTTTTGCGTA TCGCAGAAAG 3840
3286 TTGAACTTCA CTTGATTGCT ACGGGAATGA GCCGTGCAAA TGGGCAAGTG GAACGGGTGA 3900
3287 TGGAAACACT GAAAAATTTG TTGTCAGTGG TAGAATCAAG TCAACGATCG TGGCAGGACG 3960
3288 CACTTGGCGA AGTCCAACTT GCACTGAATT GTACAATTTC TCGTGCCACT GATGCAAGTC 4020
3289 CGTTAGAAAT GTTAATTGGT AAACAGGCTC GACCCCTTGG ATTAGTTCCC CCATGTGAGA 4080
3290 CCGAATGTGA AATAGATTTG GCAACTGTTA GAGCTCATGC GACAGAAAAT ATGAATTCCT 4140
3291 TAGCGTCTTA CGACAAATCC CGATTTGATA GCAGTAGAGC AGCCGTTGAC AAACACCACG 4200
3292 TAGGTGACTA TGTGCTATTG AGGAATGAAG AAAGACACCA AACTAAGTTA GATCCGAAAT 4260
3293 TCAGAGGACC GTTTTTGGTA ACTGAAGTAT TAGAGGGTGA CAGGTATACA CTAAAGTCGT 4320
3294 TGACGAGTAA CCGATCGTTC AAGTATTGCC ATGAATCAAT CAAAATGCCG GATGCAGAAA 4380
3295 TCCCGAATGA GTTAAACGAG AATGTAGAGC AATAGCTGAA ATATAGAAAC AGTTGAATGA 4440
3296 AAAGAAAAGC CCGCCAATGA GTTCTTTTGT GAACGAGAGA TATCCGTCTA GGTGAGACGA 4500
3297 TGAATTGTGA GTTATCCGTC TAGGTGAGAC GATGAATTGT GAGTTATCCG TCTAGGTGAG 4560
3298 ACGATGAATT GTCAGTTATC CGTCAGGTGA GACGATGAAT TGTGAGTTAT CCGTCCAGGA 4620
3299 GAGACGATGA GTTTGGATTG AATTAATAAT CAAGTGTGTG TGAACTGGCG GAAGATCGAT 4680
3300 ATATAGAAAT CGATAAATGA TAATGTTAAG ATAAGTTGTG AGCTGATGTA TTACTGATCA 4740
3301 ATGGAACTGA ATATGAAAAT AGAATAAGTT ATCCCAGCAA CAGTGAAATA AGAGCTGTTT 4800
3302 TGTTTCTTCA CAGAATTAAG ATTTAAGAAA TACACCTGAT AAAGTCAAAC TAATGAAATT 4860
3303 AAATGTTATT GAATAGTGAT GAAAGTAGGT GATCTTGATA TCTTGGTATC TCGGTATCAA 4920
3304 AAGCTTACAC GAGGACGTGA AATGTCAGAA TGGCCGTGTC GTGGCGAAAA TAATGAGTAT 4980
3305 GCGTGTAGTC GCTGTTTACT TCTTCTCCAT GTTCCCTTTG CTATTATGCG TGTTCCTATT 5040
3306 TATGAACACG TGGCGAAAAT AATGAATGCG CGTAGTCCGG TTTACTTCTT CTCCATGTTC 5100
3307 CCTTTGCTAT TATGCGTGTT CCTATTTATT GTCAATGTGT GAGGATGAAT AGATGAATTA 5160
3308 TCTATGAACG GGATTTTGCA AAAACGAGAG CGATAGAGCT GTTGCTGAAC GTGGCCACTT 5220
3309 GCGCTGCTTG GTTAGAAAGG GAAAACTATA TAATGAAAAG GGAATGCCAA AAATTGAGAA 5280
3310 GAGACAAAGC AGGCTGCACG AAACTGGAGT GAGGGCATTA ATCGTGGAGA AGCCAAAGCA 5340
3311 GACGCAAGTG GACTCGTTGA CTGCGCACAG CTGCATAAAA TTATATAGTA AAAAGAGATT 5400
3312 TGAGCGACGC TGATATGGAC GGACGGACGG ACGCGAGGCC CCTGATATTC TTAACCCGAC 5460
3313 A 5461
3314 //
3315 ID PPI251 standard; DNA; SYN; 2907 BP.
3316 XX
3317 AC X06779; V01520; X69493;
3318 XX
3319 DR FLYBASE; FBte0000037; Dmel\P-element.
3320 XX
3321 FT source X06779:996..3902
3322 FT SO_feature terminal_inverted_repeat ; SO:0000481:1..31
3323 FT SO_feature terminal_inverted_repeat ; SO:0000481:2877..2907
3324 FT SO_feature CDS ; SO:0000316:join(153..442,501..1168,1222..1947,2138..2709)
3325 FT /name="Dmel\P\T"
3326 FT /db_xref="FLYBASE:FBgn0013311"
3327 FT /translation="
3328 FT MKYCKFCCKAVTGVKLIHVPKCAIKRKLWEQSLGCSLGENSQICDTHFND
3329 FT SQWKAAPAKGQTFKRRRLNADAVPSKVIEPEPEKIKEGYTSGSTQTESCS
3330 FT LFNENKSLREKIRTLEYEMRRLEQQLRESQQLEESLRKIFTDTQIRILKN
3331 FT GGQRATFNSDDISTAICLHTAGPRAYNHLYKKGFPLPSRTTLYRWLSDVD
3332 FT IKRGCLDVVIDLMDSDGVDDADKLCVLAFDEMKVAAAFEYDSSADIVYEP
3333 FT SDYVQLAIVRGLKKSWKQPVFFDFNTRMDPDTLNNILRKLHRKGYLVVAI
3334 FT VSDLGTGNQKLWTELGISESKTWFSHPADDHLKIFVFSDTPHLIKLVRNH
3335 FT YVDSGLTINGKKLTKKTIQEALHLCNKSDLSILFKINENHINVRSLAKQK
3336 FT VKLATQLFSNTTASSIRRCYSLGYDIENATETADFFKLMNDWFDIFNSKL
3337 FT STSNCIECSQPYGKQLDIQNDILNRMSEIMRTGILDKPKRLPFQKGIIVN
3338 FT NASLDGLYKYLQENFSMQYILTSRLNQDIVEHFFGSMRSRGGQFDHPTPL
3339 FT QFKYRLRKYIIARNTEMLRNSGNIEEDNSESWLNLDFSSKENENKSKDDE
3340 FT PVDDEPVDEMLSNIDFTEMDELTEDAMEYIAGYVIKKLRISDKVKENLTF
3341 FT TYVDEVSHGGLIKPSEKFQEKLKELECIFLHYTNNNNFEITNNVKEKLIL
3342 FT AARNVDVDKQVKSFYFKIRIYFRIKYFNKKIEIKNQKQKLIGNSKLLKIK
3343 FT L"
3344 FT SO_feature CDS ; SO:0000316:join(153..442,501..1168,1222..1994)
3345 FT /db_xref="FLYBASE:FBgnXXXXXXX"
3346 FT /translation="
3347 FT MKYCKFCCKAVTGVKLIHVPKCAIKRKLWEQSLGCSLGENSQICDTHFND
3348 FT SQWKAAPAKGQTFKRRRLNADAVPSKVIEPEPEKIKEGYTSGSTQTESCS
3349 FT LFNENKSLREKIRTLEYEMRRLEQQLRESQQLEESLRKIFTDTQIRILKN
3350 FT GGQRATFNSDDISTAICLHTAGPRAYNHLYKKGFPLPSRTTLYRWLSDVD
3351 FT IKRGCLDVVIDLMDSDGVDDADKLCVLAFDEMKVAAAFEYDSSADIVYEP
3352 FT SDYVQLAIVRGLKKSWKQPVFFDFNTRMDPDTLNNILRKLHRKGYLVVAI
3353 FT VSDLGTGNQKLWTELGISESKTWFSHPADDHLKIFVFSDTPHLIKLVRNH
3354 FT YVDSGLTINGKKLTKKTIQEALHLCNKSDLSILFKINENHINVRSLAKQK
3355 FT VKLATQLFSNTTASSIRRCYSLGYDIENATETADFFKLMNDWFDIFNSKL
3356 FT STSNCIECSQPYGKQLDIQNDILNRMSEIMRTGILDKPKRLPFQKGIIVN
3357 FT NASLDGLYKYLQENFSMQYILTSRLNQDIVEHFFGSMRSRGGQFDHPTPL
3358 FT QFKYRLRKYIIGMTNLKECVNKNVIP"
3359 FT SO_feature intron ; SO:0000188:443..500
3360 FT SO_feature intron ; SO:0000188:1169..1221
3361 FT SO_feature intron ; SO:0000188:1948..2137
3362 XX
3363 CC Derived from X06779 (g58305) (Rel. 49, Last updated, Version 8).
3364 CC Takis Benos and Michael Ashburner, 20-Aug-1997.
3365 CC Any changes to original sequence record are annotated in an FT line.
3366 CC CDS annotation from Lynn Crosby's annotation 'P-element.v010'.
3367 XX
3368 SQ Sequence 2907 BP; 989 A; 491 C; 582 G; 845 T; 0 other;
3369 CATGATGAAA TAACATAAGG TGGTCCCGTC GAAAGCCGAA GCTTACCGAA GTATACACTT 60
3370 AAATTCAGTG CACGTTTGCT TGTTGAGAGG AAAGGTTGTG TGCGGACGAA TTTTTTTTTG 120
3371 AAAACATTAA CCCTTACGTG GAATAAAAAA AAATGAAATA TTGCAAATTT TGCTGCAAAG 180
3372 CTGTGACTGG AGTAAAATTA ATTCACGTGC CGAAGTGTGC TATTAAGAGA AAATTGTGGG 240
3373 AGCAGAGCCT TGGGTGCAGC CTTGGTGAAA ACTCCCAAAT TTGTGATACC CACTTTAATG 300
3374 ATTCGCAGTG GAAGGCTGCA CCTGCAAAAG GTCAGACATT TAAAAGGAGG CGACTCAACG 360
3375 CAGATGCCGT ACCTAGTAAA GTGATAGAGC CTGAACCAGA AAAGATAAAA GAAGGCTATA 420
3376 CCAGTGGGAG TACACAAACA GAGTAAGTTT GAATAGTAAA AAAAATCATT TATGTAAACA 480
3377 ATAACGTGAC TGTGCGTTAG GTCCTGTTCA TTGTTTAATG AAAATAAGAG CTTGAGGGAA 540
3378 AAAATTCGTA CTTTGGAGTA CGAAATGCGT CGTTTAGAGC AGCAGCTGAG GGAGTCTCAA 600
3379 CAGTTGGAGG AGTCTCTACG CAAAATCTTC ACGGACACGC AGATACGGAT ACTGAAGAAT 660
3380 GGTGGACAAA GAGCTACGTT CAATTCCGAC GACATTTCTA CAGCTATTTG TCTCCACACC 720
3381 GCAGGCCCTC GAGCGTATAA CCATCTGTAC AAAAAAGGAT TTCCTTTGCC CAGTCGTACG 780
3382 ACTTTGTACA GATGGTTATC AGATGTGGAC ATAAAAAGAG GATGTTTGGA TGTGGTCATA 840
3383 GACCTAATGG ACAGTGATGG AGTTGATGAC GCCGACAAGC TTTGCGTACT CGCTTTCGAC 900
3384 GAGATGAAGG TCGCTGCTGC CTTCGAGTAT GACAGCTCTG CTGATATTGT TTACGAGCCA 960
3385 AGCGACTATG TCCAACTGGC TATTGTTCGT GGTCTAAAAA AATCGTGGAA GCAGCCAGTT 1020
3386 TTTTTCGATT TTAATACCCG AATGGACCCG GATACTCTTA ACAATATATT AAGGAAACTG 1080
3387 CATAGGAAAG GATATTTAGT AGTTGCTATT GTATCCGATT TAGGTACCGG AAACCAAAAG 1140
3388 CTATGGACAG AGCTCGGTAT ATCAGAATGT AAGTTTCGTA TATTACAAAA ATCAGATAAT 1200
3389 CCTTGAAATT CCATTTTTTA GCAAAAACCT GGTTTAGCCA TCCTGCAGAT GACCATTTAA 1260
3390 AGATTTTCGT TTTTTCGGAT ACGCCACATT TAATTAAGTT AGTCCGTAAC CACTATGTGG 1320
3391 ATTCCGGATT AACAATAAAT GGGAAAAAAT TAACAAAAAA AACAATTCAG GAGGCACTTC 1380
3392 ATCTTTGCAA CAAGTCCGAT CTGTCTATCC TCTTTAAAAT TAATGAAAAT CACATTAATG 1440
3393 TTCGATCGCT CGCAAAACAG AAGGTTAAAT TGGCTACCCA GCTGTTTTCG AATACCACCG 1500
3394 CTAGCTCGAT CAGACGCTGC TATTCATTGG GGTATGACAT TGAAAATGCC ACCGAAACTG 1560
3395 CGGACTTCTT CAAATTGATG AATGATTGGT TCGACATTTT TAATTCTAAA TTGTCCACAT 1620
3396 CCAATTGCAT TGAGTGCTCG CAACCTTATG GCAAGCAGTT GGATATACAG AATGATATTT 1680
3397 TGAATCGAAT GTCGGAAATT ATGCGAACAG GAATTCTGGA TAAACCCAAA AGGCTCCCAT 1740
3398 TTCAAAAAGG TATCATTGTG AATAATGCTT CGCTTGATGG CTTGTATAAA TATTTGCAAG 1800
3399 AAAACTTCAG TATGCAATAC ATATTAACAA GCCGTCTCAA CCAAGACATT GTGGAGCATT 1860
3400 TTTTTGGCAG CATGCGATCG AGAGGTGGAC AATTCGACCA TCCCACTCCA CTGCAGTTTA 1920
3401 AGTATAGGTT AAGAAAATAT ATAATAGGTA TGACAAATTT AAAAGAATGC GTAAACAAAA 1980
3402 ATGTAATTCC ATGATTTATA ATTGTTTAAT GTTTAGCTAT ATGTTTCAGG AAAGTTTCAG 2040
3403 TTGAGAATGT AGGTAGTTAT GTGCTGTCTA TTGTGTTTTG TCTTTTATCT GTTTCTTTTC 2100
3404 ATTTTATTAT TTAATCATTA TCCTTTTGCT TATCCAGCCA GGAATACAGA AATGTTAAGA 2160
3405 AATTCGGGAA ATATCGAAGA GGACAACTCT GAAAGCTGGC TTAATTTAGA TTTCAGTTCT 2220
3406 AAAGAAAACG AAAATAAAAG TAAAGATGAT GAGCCTGTCG ATGATGAGCC TGTCGATGAG 2280
3407 ATGTTAAGCA ATATAGATTT CACCGAAATG GATGAGTTGA CGGAGGATGC GATGGAATAT 2340
3408 ATCGCGGGCT ATGTCATTAA AAAATTGAGA ATCAGTGACA AAGTAAAAGA AAATTTGACA 2400
3409 TTTACATACG TCGACGAGGT GTCTCACGGC GGACTTATTA AGCCGTCCGA AAAATTTCAA 2460
3410 GAGAAGTTAA AAGAGCTAGA ATGTATTTTT TTGCATTATA CAAATAATAA TAATTTTGAA 2520
3411 ATTACAAATA ATGTAAAGGA AAAATTAATA TTAGCAGCGC GAAACGTCGA TGTTGATAAA 2580
3412 CAAGTAAAAT CTTTTTATTT TAAAATTAGA ATATATTTTA GAATTAAGTA CTTCAACAAA 2640
3413 AAAATTGAAA TTAAAAATCA AAAACAAAAG TTAATTGGAA ACTCCAAATT ATTAAAAATA 2700
3414 AAACTTTAAA AATAATTTCG TCTAATTAAT ATTATGAGTT AATTCAAACC CCACGGACAT 2760
3415 GCTAAGGGTT AATCAACAAT CATATCGCTG TCTCACTCAG ACTCAATACG ACACTCAGAA 2820
3416 TACTATTCCT TTCACTCGCA CTTATTGCAA GCATACGTTA AGTGGATGTC TCTTGCCGAC 2880
3417 GGGACCACCT TATGTTATTT CATCATG 2907
3418 //
3419 ID DMPOGOR11 standard; DNA; INV; 2121 BP.
3420 XX
3421 AC X59837; S90749;
3422 XX
3423 DR FLYBASE; FBte0000568; Dmel\pogo.
3424 XX
3425 FT source X59837:1..2121
3426 FT SO_feature terminal_inverted_repeat ; SO:0000481:1..21
3427 FT SO_feature terminal_inverted_repeat ; SO:0000481:2101..2121
3428 FT SO_feature intron ; SO:0000188:1438..1541
3429 XX
3430 CC Derived from X59837 (g8354) (Rel. 45, Last updated, Version 10).
3431 CC Takis Benos and Michael Ashburner, 20-Aug-1997.
3432 CC Any changes to original sequence record are annotated in an FT line.
3433 CC K. O'Hare, Personal communication to FlyBase, 1 May 2000.
3434 CC This is probably complete element.
3435 XX
3436 SQ Sequence 2121 BP; 724 A; 353 C; 399 G; 645 T; 0 other;
3437 CAGTATAATT CGCTTAGCTG CATCGATAGT TAGCTGCATC GGCAAGATAT CTGCATTATT 60
3438 TTTCCATTTT TTTGTGTGAA TAGAAAATTT GTACGAAAAT TCATACGTTT GCTGCATCGC 120
3439 AGATAACAGC CTTTTTAACT TAAGTGCATC ATATCAGCTG TTTTTTTTGC CAATTTCAAT 180
3440 GAATATCATC AAAGTTAGCT GCGCCATCTA TGAATCATTT TTGCATATCT AAAAGATGCA 240
3441 AGAATGCCAA CTCGTTTCAG TATCTGCGCA TGTCCGTTTT TGTTTTTGCT TTGATCGTGA 300
3442 TTTTTGTGTT TTTGTTTCTT ATGGCACAAA GTTATTAAAA TGGGTAAAAC AAAGCGTGTC 360
3443 GTTGGACTAA CACTAAAGGA AAAGCTTCAA ATAATCGAGT TAGTGACCAA CAAAGTGGAC 420
3444 AAAAAGGAAA TTTGTGCCAA GTTCAAATGC GACAGATCCA CAGTCAACCG CATTTTACAA 480
3445 AAAACAAATG AAATTCATGA AGCTGTGGCC GCGTCAGGTT TAAAAAGAAA GCGTCAAAGA 540
3446 AAAGGAGCGC ACGACTTAGT AGAAGAAGCC TTATACATTT GGTTCGGACA GCAGGAATCA 600
3447 AAGAACGTAA TTCTTGACCG GCACGTCATA TTAGCAAAAG CGAAAGAATT TTGCCAAAAA 660
3448 TTTAACGACG CCTTTGAACC TGACGCCAGC TGGCTTTGGC GCTGGCGCAA GCGCCACAAT 720
3449 ATAAAGTATG GCAAAATACA CGGCGAAACT GCTACAAATG ATTCCGTATC AGCAAATGAG 780
3450 TACAAAAATG ATATTTTGCC AGGATTGCTT AAAGGTTATA ACCCAGAAGA CATTTTTAAC 840
3451 GCTGACGAAA CTGCACTCTT TTATAAAGCA ATGCCGAATG CGACATTTTT TACTTGTGGA 900
3452 AAGCAATTAA ATGGCCAGAA ATCTCAGAGA GTGAGACTTA CTTTGCTGTT TATATGCAAT 960
3453 GCAACTGGGA CATACAAAAA AACTTTTGTA ATCGGCAGAT CTAAATCGCC ACGATGCTTC 1020
3454 AAGAATGCTA ATGTGCCCAT TCCGTACTAT GCAAATAAGA AGGCCTGGAT GACTAAGGAT 1080
3455 CTCTGGCGAA AAATAATGAC AGGATTTGAC GAAGAAATGA AAAAGCAAAA TCGAAAGATT 1140
3456 TTACTCTTCA TCGACAATGC AACTAGTCAC ACGACTGTCA AGGACTTCGA AAACATAAAA 1200
3457 TTGTGCTTCA TGCCACCAAA CGCAACGGCT CTACTTCAAC CTCTGGACCA AGGTATTATC 1260
3458 CACTCATTCA AATTAGAGTA TAGGCGTATT TTGGTCAAAC AGCAGCTCAT TGCTGTTAAT 1320
3459 TGTGGTAAAT CTACTGTGGA ATTTTTAAAA TCATTATCGT TATTGGATGC TCTATATTTT 1380
3460 GTCAACCAAG GATGGAAGAA TGTTAAAATG TTAACTATTC AGAATTGTTT TAAAAAGGTA 1440
3461 AGATGGGATT ATTATTGATA TGTATCTCAA ATAACGAATT TATTATTTTC AGGCTGGATT 1500
3462 TAAGTTCAGT TTTGAAAATG AAGACACCAT TGCTGAAAAA GACAAACAAT GCGTAGAAGT 1560
3463 TGACATTGTA TCGAATATTA ATTGGAATGA ATATGCCAAT GTTGATGCAG ATGAGGCTTG 1620
3464 CCATGGTCAA TTAGATGATG ATGAAATCGT GCGCTCTTTA GTTCAAGATG CAAAAACCAG 1680
3465 CGATAACGAA GAAAGCCATA GTGATGAAGA TGTGGACGAT ACTGAGCGTC CTACTTTTAA 1740
3466 GGATGGGTTT GCAGCAATTA AGGCTTTAAA GTCCATTTTT ATGCGAAACA ATAATGATGA 1800
3467 GTTTTTGCAA AACTTGAATT CTATGGAAGA CAAGCTGTTT AATTTACATA TAAACTCAGC 1860
3468 TGTATTGCAA AAAAAAATTA CTGACTATTT TTAAGTTAGT TTTAAAAAGT GTTTTAATCA 1920
3469 ATTCACCATC ACTTAAATTT ATATGTCGAT CTTACTTATC ATTAAGAATG AAATTATCAG 1980
3470 TTCCTTTTAT GTTTAACATT GTTATAAAGA AATAAATTCT TTATTTTTCC TTAAAAAAAA 2040
3471 AAATTAAGTT AGCTGCATTT TTAAGTTACC TGCATCGAGG CATTGTGCAA AGTACTCGAG 2100
3472 GCAGCTAAGC GAATTATACT G 2121
3473 //
3474 ID DMRER1DM standard; DNA; INV; 5356 BP.
3475 XX
3476 AC X51968;
3477 XX
3478 DR FLYBASE; FBte0000118; Dmel\R1A1-element.
3479 XX
3480 FT source X51968:1..5356
3481 FT SO_feature CDS ; SO:0000316:319..1731
3482 FT /name="Dmel\R1A1-element\ORF1"
3483 FT /db_xref="FLYBASE:FBgn0044825"
3484 FT /db_xref="SWISS-PROT:P16424"
3485 FT /db_xref="NCBI_PROTEIN:CAA36226.1"
3486 FT /translation="PVSASIRLLDSSKGGATIGATPMESDSSVSALSGSSASKVSRRGR
3487 FT RRSHLASKSSAPTQAKLVALASNGVPEPVGVLEEAFSSLEDARAATSNAANDAAPPAAA
3488 FT PAVDHTVAPDVSTAAKIAATTATAATAAARAGQAAMMAELSATQRMVRNSFRSLGGVDT
3489 FT EELSCAISRYDELVMALMLRCGELETRLAMPPPPPPPSKANTTAANAPQMPQVAPIAAP
3490 FT RTTKVRETWSAVVKCDDPALSGKAIAEKVRTMVAPSLGVRVHEVRELPSRWWCDHSYSS
3491 FT VGELQKVMASKRFAELGLNVARNAAEKPKVIVYDVDTAIGPEEFMQELHENNFDSEMTL
3492 FT AQFKKSVHLVTKAWSATDGATVNVTLEVDDRAMAKLDVGRVYIKWFSFRCRSQVRTYAC
3493 FT HRCVGFDHKVSECRQKESVCRQCGQQGHTAAKCQNPVDCRNCRHRGQPSGHYMLSNACP
3494 FT IYGALLARVQARH"
3495 FT SO_feature CDS ; SO:0000316:1728..4790
3496 FT /name="Dmel\R1A1-element\ORF2"
3497 FT /db_xref="FLYBASE:FBgn0044824"
3498 FT /db_xref="SWISS-PROT:P16425"
3499 FT /db_xref="NCBI_PROTEIN:CAA36227.1"
3500 FT /translation="TLMFSFIQANCGRGRAATIELGVRLRRSESMFALVQEPYLGGDEM
3501 FT DVLPEGMRVFTDRRGKAAILVDHQEAICMPVETLTTDYGVCLVVKGSFGSIFLCAAYCQ
3502 FT FDAPLEPYLRYMDAVLLQASRTPAILGLDANAVSPMWLSKLSRHAEGQANYRRGELLSE
3503 FT WMLEARVAALNQSTEVYTFDNHRATSDIDVTIVNEAASMWATYEWRVDEWELSDHNIIT
3504 FT VVAEPTTARSVESIAPVPSWNFSNARWRLFKEEMVSRIAELPENFSESPLDQQVSTLRS
3505 FT IVHSVCDTALGRKLTRSPSRRARWWTADLCAARREVRRLRRLLQDGRRRDDDAAVELVV
3506 FT VELRRASAYYKKLIGRAKMDDWKRFVGDHADDPWGRVYKICRGRRKCTEIGCLRVNGEL
3507 FT ITDWGDCARVLLRNFFPVAESEAPTAIAEEVPPALEVFEVDTCVARLKSRRSPGLDGIN
3508 FT GTICKAVWRAIPEHLASLFSRCIRLGYFPAEWKCPRVVSLLKGPDKDKCEPSSYRGICL
3509 FT LPVFGKVLEAIMVNRVREVLPEGCRWQFGFRQGRCVEDAWRHVKSSVGASAAQYVLGTF
3510 FT VDFKGAFDNVEWSAALSRLADLGCREMGLWQSFFSGRRAVIRSSSGTVEVPVTRGCPQG
3511 FT SISGPFIWDILMDVLLQRLQPYCQLSAYADDLLLLVEGNSRAVLEEKGAQLMSIVETWG
3512 FT AEVGDCLSTSKTVIMLLKGALRRAPTVRFAGRNLPYVRSCRYLGITVSEGMKFLTHIAS
3513 FT LRQRMTGVVGALARVLRADWGFSPRARRTIYDGLMAPCVLFGAPVWYDTAEQVAAQRRL
3514 FT ASCQRLILLGCLSVCRTVSTVALQVLGGAPPLDLAAKLLAIKYKLKRGFPLEENDWLYG
3515 FT EDIACLSWEQRKTRLEECLIQSWQNRWDDDSEPGRVTHRFIPYVTLAYRDPSFGFSMRT
3516 FT SFLLTGHGSFNAFLHGRALSDTTACACGDPYEDWMHILCACPLYADLRDLDGLGVQRLG
3517 FT ENWIFEGILDDQEKTQRLAMFAEEVFLRRRAL"
3518 XX
3519 CC Derived from X51968 (g8429) (Rel. 23, Last updated, Version 1).
3520 CC Takis Benos and Michael Ashburner, 20-Aug-1997.
3521 CC Any changes to original sequence record are annotated in an FT line.
3522 XX
3523 SQ Sequence 5356 BP; 1213 A; 1340 C; 1634 G; 1169 T; 0 other;
3524 CGGACGTGTT TTCGTTGCGC TCGTGGACAT AGTGCGAAGA ACTTTGTTTT CCGTATTTGG 60
3525 AAGTATACGG AATAAATAAT TTAGTGTTCC GTGGAAGTGG TGCGCAAATT TTCGCGAATT 120
3526 AAAAACAAGC GGTTTGGAAG TAATTGACAA TAAATTATTG GAAATTTTCC ACTCCGCACG 180
3527 TGTTGAGCGG CGGAGCTTGC GGGTGAGCTT TTCGAACAGC TGAGAGAAGC TTATTGGTGG 240
3528 TAGTCACCGC TAAGGATTGT GTCTTGGGAC AGCTTAGTGC ACTCTACCAA TAGGTGGAGC 300
3529 TATCACCATA GCAACTAGCC CGTGTCAGCG AGCATACGAT TGCTGGACTC GTCAAAAGGA 360
3530 GGAGCCACCA TCGGAGCAAC GCCGATGGAG AGCGACAGCA GTGTGAGTGC CTTGAGCGGA 420
3531 AGCAGTGCCT CAAAGGTGTC AAGACGAGGC AGGCGTAGGA GCCATCTGGC CTCCAAGAGC 480
3532 TCGGCGCCAA CGCAGGCGAA ACTGGTTGCC CTGGCCTCGA ATGGAGTGCC GGAACCCGTT 540
3533 GGTGTGCTGG AGGAGGCGTT TTCGTCGCTG GAGGATGCCC GGGCGGCTAC GTCAAACGCT 600
3534 GCCAACGATG CTGCCCCCCC CGCTGCTGCC CCCGCTGTTG ATCACACTGT TGCCCCTGAT 660
3535 GTTTCCACTG CTGCTAAAAT CGCTGCCACC ACTGCCACCG CTGCCACCGC TGCCGCCCGT 720
3536 GCTGGGCAAG CAGCCATGAT GGCAGAGCTG TCGGCCACCC AGCGCATGGT GCGAAACAGT 780
3537 TTCCGCAGCC TAGGAGGCGT AGACACGGAA GAGCTCTCGT GTGCCATCAG CCGCTATGAT 840
3538 GAGCTGGTGA TGGCATTAAT GCTCCGGTGT GGAGAACTGG AGACGCGGCT CGCTATGCCA 900
3539 CCACCGCCGC CGCCGCCGTC CAAGGCGAAC ACTACTGCCG CCAATGCTCC CCAGATGCCT 960
3540 CAGGTTGCAC CCATCGCTGC CCCGCGGACA ACCAAGGTTC GTGAGACGTG GTCAGCGGTG 1020
3541 GTGAAGTGCG ACGACCCTGC GCTATCGGGG AAAGCCATAG CCGAAAAGGT GCGGACGATG 1080
3542 GTTGCACCCT CCCTCGGAGT CAGAGTACAC GAGGTACGTG AGCTGCCGTC GAGGTGGTGG 1140
3543 TGCGATCATT CGTACTCTTC GGTTGGAGAG CTGCAGAAGG TGATGGCATC GAAAAGATTC 1200
3544 GCAGAACTTG GACTGAATGT GGCACGGAAC GCGGCCGAGA AGCCGAAGGT CATAGTCTAT 1260
3545 GACGTCGACA CAGCCATCGG CCCAGAAGAG TTCATGCAGG AGCTTCACGA GAACAACTTC 1320
3546 GACAGTGAAA TGACTCTGGC CCAGTTCAAA AAGTCGGTGC ACCTGGTGAC CAAGGCGTGG 1380
3547 TCGGCTACTG ACGGTGCCAC CGTAAACGTG ACGCTAGAGG TAGACGACCG GGCGATGGCG 1440
3548 AAACTTGATG TAGGACGTGT CTACATTAAG TGGTTTTCGT TCCGATGCCG ATCGCAAGTC 1500
3549 CGCACCTATG CCTGCCACAG ATGTGTGGGT TTCGACCACA AGGTTAGTGA ATGCAGGCAG 1560
3550 AAGGAGAGTG TTTGCCGCCA GTGCGGGCAA CAAGGCCACA CCGCGGCAAA GTGCCAAAAC 1620
3551 CCGGTGGACT GCCGGAACTG CCGTCACAGA GGGCAACCTT CGGGGCATTA TATGCTCTCG 1680
3552 AATGCTTGCC CGATATACGG AGCGTTGTTA GCGAGGGTGC AAGCTAGACA CTAATGTTTA 1740
3553 GCTTCATCCA AGCGAACTGT GGCCGAGGCA GAGCTGCGAC CATCGAGCTC GGAGTCCGAC 1800
3554 TCAGGAGATC GGAGTCAATG TTTGCTCTGG TGCAGGAGCC GTATCTTGGC GGGGATGAAA 1860
3555 TGGATGTGCT GCCTGAAGGA ATGAGGGTTT TCACCGACCG GCGAGGGAAG GCAGCCATCC 1920
3556 TAGTGGATCA TCAGGAAGCC ATCTGCATGC CAGTGGAAAC TCTCACCACA GATTATGGCG 1980
3557 TATGTCTGGT CGTTAAAGGG AGTTTTGGCT CAATCTTCCT TTGCGCCGCA TACTGCCAGT 2040
3558 TCGATGCACC TCTGGAACCG TACCTCCGGT ACATGGATGC GGTCCTGCTG CAGGCCAGCA 2100
3559 GAACCCCCGC AATCCTGGGC CTCGACGCGA ATGCAGTGTC CCCCATGTGG CTTAGCAAAC 2160
3560 TCTCTCGTCA TGCCGAGGGG CAAGCTAACT ACAGACGGGG TGAGCTGCTG TCTGAGTGGA 2220
3561 TGCTGGAGGC AAGAGTCGCC GCCCTAAACC AGTCAACAGA GGTGTACACG TTCGATAATC 2280
3562 ACAGAGCGAC TAGTGATATC GACGTGACAA TCGTCAATGA AGCAGCATCT ATGTGGGCCA 2340
3563 CATATGAGTG GAGAGTGGAC GAGTGGGAAT TGAGTGACCA CAACATCATT ACTGTTGTGG 2400
3564 CCGAACCAAC TACCGCGCGC TCAGTTGAGA GCATAGCTCC TGTGCCGTCC TGGAACTTCT 2460
3565 CCAATGCACG TTGGCGATTG TTCAAGGAGG AAATGGTGAG TAGAATAGCC GAACTTCCGG 2520
3566 AAAACTTTTC AGAGTCGCCG TTGGACCAGC AAGTTTCGAC CCTGCGCAGT ATAGTACATA 2580
3567 GTGTATGTGA TACTGCGCTA GGAAGGAAGT TGACTCGATC GCCCAGCAGG AGAGCACGTT 2640
3568 GGTGGACTGC CGACCTCTGC GCTGCAAGGC GCGAAGTCCG AAGACTTCGT CGCCTGCTCC 2700
3569 AAGATGGAAG GCGTCGAGAT GACGATGCCG CTGTAGAGCT TGTAGTGGTC GAGCTGAGGC 2760
3570 GTGCCTCAGC CTACTACAAG AAGCTCATTG GAAGGGCGAA GATGGATGAC TGGAAACGCT 2820
3571 TCGTGGGAGA TCATGCCGAC GACCCATGGG GGCGCGTCTA CAAGATTTGC CGAGGTCGCA 2880
3572 GGAAGTGCAC GGAGATTGGG TGCCTCCGCG TGAATGGCGA GCTGATCACT GATTGGGGTG 2940
3573 ACTGCGCACG AGTGCTCCTC CGCAATTTTT TCCCAGTTGC GGAGTCCGAA GCACCGACTG 3000
3574 CCATCGCGGA GGAAGTCCCA CCGGCCCTCG AAGTATTCGA GGTTGATACA TGTGTTGCCC 3060
3575 GGCTGAAGAG CAGGCGCTCT CCCGGGTTGG ACGGCATCAA TGGCACTATC TGCAAGGCAG 3120
3576 TCTGGCGCGC CATACCCGAG CACCTAGCAT CATTGTTTTC CCGATGCATC CGATTGGGAT 3180
3577 ACTTTCCAGC CGAGTGGAAG TGCCCACGAG TTGTCTCGTT GCTCAAAGGG CCAGATAAGG 3240
3578 ACAAGTGTGA GCCCTCCTCA TACAGAGGAA TATGCTTGCT ACCAGTCTTT GGAAAGGTGC 3300
3579 TCGAGGCCAT CATGGTGAAT CGTGTGAGAG AAGTTCTTCC GGAAGGCTGC AGATGGCAAT 3360
3580 TCGGATTTCG CCAAGGACGA TGTGTGGAGG ATGCTTGGAG GCACGTGAAG AGCAGTGTTG 3420
3581 GCGCCAGCGC GGCGCAATAC GTGCTCGGCA CATTCGTGGA CTTCAAAGGA GCATTCGACA 3480
3582 ACGTCGAATG GAGTGCTGCA CTCAGCCGAC TAGCCGACTT GGGATGCCGG GAAATGGGCT 3540
3583 TGTGGCAGAG CTTTTTCTCC GGCCGAAGAG CAGTGATCCG AAGCAGTTCC GGTACTGTGG 3600
3584 AGGTACCGGT AACTAGAGGC TGCCCGCAGG GATCAATCAG CGGCCCATTT ATCTGGGACA 3660
3585 TACTGATGGA TGTACTGCTT CAGCGTCTCC AGCCGTATTG CCAGCTGAGT GCATACGCGG 3720
3586 ATGACTTGCT GCTTCTCGTC GAGGGAAATT CCCGAGCTGT GCTAGAGGAA AAAGGAGCGC 3780
3587 AACTAATGTC CATCGTAGAA ACGTGGGGAG CGGAAGTTGG CGATTGCCTC TCGACCAGCA 3840
3588 AGACGGTAAT CATGCTGCTG AAAGGTGCCT TGAGACGTGC GCCTACGGTG AGGTTTGCTG 3900
3589 GACGGAACCT TCCGTATGTG CGTAGCTGTC GGTACCTTGG CATCACGGTC AGTGAAGGAA 3960
3590 TGAAATTCCT CACGCACATA GCTTCGCTTC GCCAGCGGAT GACAGGAGTC GTTGGAGCAT 4020
3591 TGGCGCGTGT GCTTCGAGCC GACTGGGGCT TCAGTCCTCG AGCCAGGCGG ACCATATATG 4080
3592 ACGGACTCAT GGCACCTTGT GTGCTGTTTG GTGCCCCGGT ATGGTATGAC ACCGCGGAAC 4140
3593 AAGTAGCTGC CCAGAGGCGA CTAGCCTCCT GCCAGAGGCT AATCCTGCTT GGATGCCTTT 4200
3594 CGGTATGCCG AACAGTATCC ACAGTGGCAC TGCAGGTACT TGGTGGAGCT CCCCCGCTTG 4260
3595 ATCTGGCTGC TAAGTTATTA GCGATCAAAT ACAAGCTAAA ACGTGGATTC CCGCTGGAGG 4320
3596 AGAACGACTG GCTTTACGGC GAGGACATTG CGTGTCTTAG CTGGGAGCAG AGGAAGACTC 4380
3597 GCCTAGAGGA GTGTTTAATC CAGAGTTGGC AGAACAGATG GGACGATGAC AGCGAACCAG 4440
3598 GACGGGTGAC GCATAGGTTT ATCCCATACG TCACTCTTGC CTATCGGGAT CCAAGTTTTG 4500
3599 GATTCTCGAT GAGGACGTCT TTCCTGCTTA CAGGGCACGG GTCGTTCAAT GCATTTTTGC 4560
3600 ACGGGAGAGC CCTCAGCGAT ACCACTGCTT GCGCATGTGG AGATCCATAT GAGGACTGGA 4620
3601 TGCATATCTT GTGCGCTTGC CCCCTATATG CAGATCTGCG GGACCTAGAT GGACTTGGAG 4680
3602 TGCAGCGCCT TGGCGAAAAC TGGATCTTCG AGGGAATCCT GGATGATCAA GAGAAGACTC 4740
3603 AACGGCTGGC AATGTTTGCG GAAGAAGTGT TCCTGAGGAG GAGGGCCCTT TAGCTCAACA 4800
3604 TCTCTGCCGT GTGGTTAGCG GGCGAGAATA CTACCACAGT CCGCTGTTGC TTGTCGTAAG 4860
3605 AGACGACTAA TACAGCGATA GGATTCCTCT AACCCTGCTT GTCGGAGCAA AAGGGGGAGG 4920
3606 CCCACCGAGC CTCTTTTCGG TACCACGGGT TGAGCAGCTA TCCAAGACTG CTCATTGAGG 4980
3607 TAGGCCCCCT GGTGGGAGTA TCGTGGTGGC TGTGGTTGGT ACCCATATCG CGGGTAGAGC 5040
3608 CTTCATGCTC GACGTTTGAG TTACGGTGCT AGTTGCGCAA AACTCGGGTG CTGTGACCCA 5100
3609 GAGATCAGTA GAGATTTTAG GTAGATCTCG CTCCTCAGCA AGGGGGAGTG CTTGCCCGGC 5160
3610 AAGCAAGTAC TCGAATTGCT ACCGGGGTGG TCGCTATGTA CATAGCTATA GCTTCTAGTC 5220
3611 CGGGACGCTT GTCTGGCGTA TCCAGACACA TGCACCATAT GCTCACTTGT GGGCGTATAG 5280
3612 GGTGCCGTGG TTGTAATCCC TTCAGTGTGG AACACGCCAC GTAAAATAAG TTCGGAGGGA 5340
3613 TCCGAAAAGC ATACAT 5356
3614 //
3615 ID DMRER2DM standard; DNA; INV; 3607 BP.
3616 XX
3617 AC X51967;
3618 XX
3619 DR FLYBASE; FBte0000030; Dmel\R2-element.
3620 XX
3621 FT source X51967:1..3607
3622 FT SO_feature CDS ; SO:0000316:181..3351
3623 FT /name="Dmel\R2-element\ORF"
3624 FT /db_xref="FLYBASE:FBgn0016699"
3625 FT /db_xref="SWISS-PROT:P16423"
3626 FT /db_xref="NCBI_PROTEIN:CAA36225.1"
3627 FT /translation="FERKNFSDGLVPQRKFIHIGTTSTNNEPRIPLHNLMTTRPSVDIF
3628 FT PEDQYEPNAAATLSRVPCTVCGRSFNSKRGLGVHMRSRHPDELDEERRRVDIKARWSDE
3629 FT EKWMMARKEVELTANGCKHINKQLAVYFANRSVEAIKKLRQRGDYKEKIEQIRGQSALA
3630 FT PEVANLTIRRRPSRSEQDHQVTTSETTPITPFEQSNREILRTLRGYSPVECHSKWRAQE
3631 FT LQTIIDRAHLEGKETTLQCLSLYLLGIFPAQGVRHTLTRPPRRPRNRRESRRQQYAVVQ
3632 FT RNWDKHKGRCIKSLLNGTDESVMPSQEIMVPYWREVMTQPSPSSCSGEVIQMDHSLERV
3633 FT WSAITEQDLRASRVSLSSSPGPDGITPKSAREVPSGIMLRIMNLILWCGNLPHSIRLAR
3634 FT TVFIPKTVTAKRPQDFRPISVPSVLVRQLNAILATRLNSSINWDPRQRGFLPTDGCADN
3635 FT ATIVDLVLRHSHKHFRSCYIANLDVSKAFDSLSHASIYDTLRAYGAPKGFVDYVQNTYE
3636 FT GGGTSLNGDGWSSEEFVPARGVKQGDPLSPILFNLVMDRLLRTLPSEIGAKVGNAITNA
3637 FT AAFADDLVLFAETRMGLQVLLDKTLDFLSIVGLKLNADKCFTVGIKGQPKQKCTVLEAQ
3638 FT SFYVGSSEIPSLKRTDEWKYLGINFTATGRVRCNPAEDIGPKLQRLTKAPLKPQQRLFA
3639 FT LRTVLIPQLYHKLALGSVAIGVLRKTDKLIRYYVRRWLNLPLDVPIAFVHAPPKSGGLG
3640 FT IPSLRWVAPMLRLRRLSNIKWPHLTQNEVASSFLEAEKQRARDRLLAEQNELLSRPAIE
3641 FT KYWANKLYLSVDGSGLREGGHYGPQHGWVSQPTRLLTGKEYMDGIRLRINALPTKSRTT
3642 FT RGRHELERQCRAGCDAPETTNHIMQKCYRSHGRRVARHNCVVNRIKRGLEERGCVVIVE
3643 FT PSLQCESGLNKPDLVALRQNHIDVIDTQIVTDGHSMDDAHQRKINRYDRPDIRTELRRR
3644 FT FEAAGDIEFHSATLNWRGIWSGQSVKRLIAKGLLSKYDSHIISVQVMRGSLGCFKQFMY
3645 FT LSGFSRDWT"
3646 XX
3647 CC Derived from X51967 (g8432) (Rel. 24, Last updated, Version 1).
3648 CC Takis Benos and Michael Ashburner, 20-Aug-1997.
3649 CC Any changes to original sequence record are annotated in an FT line.
3650 XX
3651 SQ Sequence 3607 BP; 1064 A; 818 C; 900 G; 825 T; 0 other;
3652 TTGGGGATCA TGGGGTATTT GAGAGCAGAG GGGGAGTATT CTTCTGTAAT TCGTAAGTCA 60
3653 TATCATATGA TGTGCGGAAG GGGAATTTTA CTCTGTAACT CACAAGTCTC TCCTTTACTC 120
3654 AAGTCGACTC AAAACCTCCT CGTGGTGGTC CCGGTAATGC TAAACTCGTT TAGCAGCTAA 180
3655 TTTGAGCGGA AAAACTTTTC CGATGGGCTG GTTCCCCAGA GGAAATTTAT TCATATTGGA 240
3656 ACTACAAGCA CAAATAACGA GCCTCGGATA CCTTTACACA ATCTGATGAC GACCCGACCC 300
3657 TCCGTGGATA TCTTCCCGGA GGACCAATAT GAACCAAACG CAGCGGCTAC TCTATCTAGG 360
3658 GTTCCCTGCA CAGTATGTGG CCGGTCCTTT AACAGCAAGA GAGGACTCGG TGTTCACATG 420
3659 CGATCTCGGC ACCCAGACGA ACTTGATGAA GAACGTCGAC GTGTCGATAT AAAGGCAAGA 480
3660 TGGAGTGATG AAGAGAAGTG GATGATGGCG AGAAAGGAGG TTGAGCTCAC AGCAAATGGA 540
3661 TGTAAACACA TAAACAAGCA ACTAGCGGTG TATTTTGCAA ACCGCAGCGT CGAAGCCATC 600
3662 AAAAAGCTAA GACAGAGGGG CGATTATAAG GAGAAAATAG AGCAGATAAG AGGGCAATCA 660
3663 GCTCTCGCCC CGGAAGTTGC TAATCTAACC ATAAGGCGCC GCCCTAGTAG AAGTGAGCAA 720
3664 GACCACCAAG TAACAACATC GGAAACAACT CCAATCACTC CCTTCGAACA GTCGAACAGG 780
3665 GAAATTTTGC GGACACTACG CGGGTATAGC CCCGTAGAAT GCCATTCCAA ATGGAGAGCC 840
3666 CAAGAGTTGC AAACTATCAT TGATAGGGCA CATCTCGAGG GAAAGGAAAC CACTCTCCAA 900
3667 TGCTTATCGC TATATCTCCT GGGAATTTTT CCGGCACAGG GTGTACGACA CACACTGACG 960
3668 AGACCTCCTC GGAGACCTCG GAACAGGAGA GAAAGCAGAA GGCAGCAGTA CGCTGTCGTC 1020
3669 CAGCGTAACT GGGATAAGCA TAAAGGAAGA TGCATCAAGT CCTTGCTAAA TGGAACTGAT 1080
3670 GAGTCGGTAA TGCCAAGCCA AGAAATAATG GTTCCCTACT GGAGAGAAGT AATGACTCAG 1140
3671 CCTAGCCCAA GCTCTTGCAG TGGAGAAGTG ATACAAATGG ATCACTCGCT TGAGAGGGTA 1200
3672 TGGTCTGCTA TTACAGAGCA GGACCTTCGG GCGTCAAGAG TCTCATTATC CTCGTCTCCG 1260
3673 GGGCCTGACG GGATAACTCC AAAATCTGCC AGGGAGGTGC CGTCAGGTAT TATGCTGCGC 1320
3674 ATAATGAACC TAATTCTATG GTGCGGTAAT CTACCACACT CCATACGACT GGCCAGAACC 1380
3675 GTCTTCATCC CGAAGACGGT GACGGCGAAG CGACCGCAAG ACTTTCGTCC AATATCAGTG 1440
3676 CCTTCAGTCC TGGTAAGACA GCTAAATGCA ATATTGGCAA CCCGGTTGAA CTCATCAATC 1500
3677 AATTGGGACC CGCGCCAGCG GGGCTTCTTA CCAACCGACG GATGCGCCGA TAATGCGACG 1560
3678 ATAGTCGACT TAGTCTTGAG GCATAGCCAT AAGCACTTTA GATCTTGCTA CATCGCAAAT 1620
3679 TTAGATGTAA GCAAGGCATT TGATTCTCTA TCACATGCAT CTATATACGA CACCTTACGT 1680
3680 GCTTATGGTG CGCCAAAGGG CTTCGTTGAC TACGTACAGA ACACGTACGA GGGCGGTGGT 1740
3681 ACCAGTCTCA ATGGGGACGG TTGGAGTTCA GAGGAATTCG TCCCTGCTAG AGGAGTGAAG 1800
3682 CAGGGTGACC CTTTGTCTCC TATTCTATTT AACTTGGTAA TGGACAGGTT ACTTAGAACC 1860
3683 TTACCCAGCG AAATTGGTGC CAAAGTCGGA AATGCCATTA CTAACGCGGC CGCGTTTGCA 1920
3684 GATGATTTGG TACTATTTGC GGAAACTCGG ATGGGGCTTC AAGTATTGTT GGACAAGACG 1980
3685 TTGGATTTTC TATCTATCGT CGGCCTCAAA CTTAATGCCG ACAAATGTTT TACCGTTGGC 2040
3686 ATTAAGGGCC AGCCGAAACA GAAGTGTACC GTGTTAGAGG CACAGAGCTT CTACGTAGGC 2100
3687 TCGAGTGAGA TTCCATCACT GAAGCGCACG GACGAGTGGA AGTACTTAGG CATCAACTTC 2160
3688 ACTGCAACCG GGAGGGTTCG ATGCAATCCG GCCGAGGACA TTGGTCCAAA GCTACAAAGA 2220
3689 TTGACAAAGG CCCCCCTCAA ACCACAACAG AGGTTGTTCG CCCTTCGGAC TGTCCTTATC 2280
3690 CCACAGCTCT ACCACAAGTT AGCCCTTGGG AGTGTGGCGA TAGGCGTCCT AAGAAAAACT 2340
3691 GATAAACTTA TAAGATATTA TGTGCGAAGA TGGCTAAATC TTCCGCTGGA TGTGCCGATA 2400
3692 GCATTTGTTC ATGCACCCCC AAAAAGTGGA GGTCTCGGAA TTCCATCACT AAGATGGGTA 2460
3693 GCTCCAATGT TAAGGCTAAG ACGCTTGAGT AACATTAAAT GGCCTCACCT CACGCAAAAC 2520
3694 GAGGTAGCCA GCTCTTTCCT CGAAGCCGAA AAACAACGGG CCCGAGATAG ATTATTAGCT 2580
3695 GAACAAAATG AACTGTTATC GCGTCCGGCA ATAGAAAAAT ATTGGGCGAA CAAGTTGTAC 2640
3696 CTCTCAGTTG ATGGTAGCGG ACTCCGTGAA GGCGGCCATT ATGGCCCGCA ACACGGGTGG 2700
3697 GTTAGTCAAC CCACGCGTTT ATTAACAGGA AAGGAATATA TGGACGGTAT TCGTCTGCGG 2760
3698 ATAAATGCCC TACCCACAAA GTCTCGTACT ACAAGGGGAA GGCACGAATT GGAACGACAG 2820
3699 TGTCGTGCAG GATGTGATGC TCCCGAAACA ACAAACCACA TAATGCAAAA ATGCTACCGC 2880
3700 TCGCATGGGA GGCGGGTAGC TAGACACAAC TGCGTAGTAA ATCGAATCAA GCGGGGACTT 2940
3701 GAGGAGAGAG GCTGCGTGGT CATTGTTGAA CCAAGTCTGC AGTGCGAATC CGGCCTTAAT 3000
3702 AAACCAGACC TGGTGGCACT ACGACAAAAT CACATTGATG TGATCGACAC ACAAATTGTG 3060
3703 ACAGACGGAC ACTCTATGGA TGATGCGCAC CAGCGCAAAA TCAATAGATA CGACAGACCG 3120
3704 GACATACGAA CTGAATTGCG TCGCAGATTC GAAGCCGCAG GTGACATTGA ATTCCATTCT 3180
3705 GCCACCCTGA ACTGGAGGGG GATCTGGAGT GGTCAATCCG TTAAAAGATT GATAGCAAAG 3240
3706 GGTCTCCTCA GCAAATATGA TAGTCATATC ATTAGCGTCC AGGTTATGAG AGGCAGTCTC 3300
3707 GGTTGTTTTA AACAGTTCAT GTACCTGAGC GGGTTTTCCC GAGATTGGAC TTAGCTAAAT 3360
3708 CGTTTGGTTC AAAACATTTG CTTGCTGTCT TGGCATAACA TCAATAAAGG CATAAACATC 3420
3709 GCAAAATAAT GGTTATAATT AAATGGCTAT GAGGATGGTT TTAGTACGTA GGCGTTGCGG 3480
3710 AACTTCGGTT CATATAGAGC AATGAATCGT GCATGCTAGG AAAACTGACC ACACACAGTG 3540
3711 TTGGCAGACC TAGTATCTTT CGAAGATTTC CATACCTCCG CGATCAAAAA AAAAAAAAAA 3600
3712 AAAAAAA 3607
3713 //
3714 ID DM33463 standard; DNA; INV; 1736 BP.
3715 XX
3716 AC U33463;
3717 XX
3718 DR FLYBASE; FBte0001005; Dmel\S-element.
3719 XX
3720 FT source U33463:37..1772
3721 FT SO_feature terminal_inverted_repeat ; SO:0000481:1..234
3722 FT SO_feature terminal_inverted_repeat ; SO:0000481:1503..1736
3723 FT SO_feature CDS ; SO:0000316:404..1441
3724 FT SO_feature start_codon ; SO:0000318:1..3
3725 FT /name="Dmel\S-element\T"
3726 FT /db_xref="FLYBASE:FBgn0044019"
3727 FT /db_xref="REMTREMBL:AAC47095"
3728 FT /db_xref="NCBI_PROTEIN:AAC47095.1"
3729 FT /translation="MPGKRLAFEVTQLIYYNHQLGKSIPELVEIFSVSRKTVYNILNRX
3730 FT XKEGRLEPKSGGGCKTKINKRVDRLIMRKAIANPRISVRSLAQDIREECHLTVSHETVR
3731 FT QVILRHRYSSRVARKKPLLSEINIEKRHSFAVSMMDHAEEYWDDVIFCDETKMMLFYND
3732 FT GPSRVWRKPLSALETQNIIPTIKFGKLSVMIWGCISSHGVGKLAFIESTMNAVQYLDIL
3733 FT KTNLKASAEKFGLFSNNKPNFKFYQDNDPKHKEYNVRNWLLYNCGKVIDTPPQSPDLNP
3734 FT IENLWAYLKKKVAKRGPKTRQQLMAAIIEEWEKIPLEYDLKKLIHSMKKRLQLVAKANG
3735 FT GHTKY"
3736 XX
3737 CC Derived from U33463 (g1006788) (Rel. 47, Last updated, Version 5).
3738 CC Takis Benos and Michael Ashburner, 20-Aug-1997.
3739 CC Any changes to original sequence record are annotated in an FT line.
3740 XX
3741 SQ Sequence 1736 BP; 600 A; 287 C; 300 G; 545 T; 4 other;
3742 CAGTTTGTCA AGAAACTGTT TACACACCGC AAAATAAGTA GAATTTTTGA CTTTAAAGGC 60
3743 CAAAATTAAG GGTTTTTTGC TTAATTAAAC GCAATTTTTT TATGAAATAT AATTAAACAA 120
3744 TATTTATTTT ACTTATAAAT TAAAAAACAA ATTCAATATA TCAAATATAC AAGAAAATAA 180
3745 ACAACAAATT TCTTGTTTAC ACACTTTTGA GAGTGCCAAG AAACTCTTTA CACAGTTTTG 240
3746 GGTTCCTACT TTGTTTTGCT CTTTTTCTTA GAAACAATCT CATTTTTCCG TTATTTTTGT 300
3747 CTTATGCATT CCTTTTTACA ACGCTTCTAT TGCAATTTTT TCACTTTGCT TGTGAAATTT 360
3748 TGTTGATCTA ACGTGCTTAA AGCGAATTAT TAAATTTAAT GAAATGCCTG GAAAGAGATT 420
3749 GGCTTTTGAA GTGACCCAGC TAATATACTA TAACCACCAG TTGGGAAAAT CTATTCCTGA 480
3750 ATTAGTAGAA ATATTTTCCG TATCCCGTAA AACCGTCTAT AATATTTTAA ATCGTNNNNA 540
3751 AAAAGAGGGC AGGCTTGAAC CTAAGAGTGG TGGTGGGTGT AAAACGAAAA TTAACAAGCG 600
3752 AGTAGACCGC CTTATTATGC GAAAAGCGAT TGCGAACCCC CGAATCTCGG TCAGATCACT 660
3753 TGCTCAGGAT ATCAGGGAAG AATGTCACCT AACTGTATCA CACGAAACTG TGCGCCAAGT 720
3754 CATCCTACGC CATAGGTACT CTTCAAGAGT TGCAAGAAAA AAGCCTTTGC TATCAGAGAT 780
3755 CAATATTGAA AAGCGTCATT CATTCGCTGT GAGCATGATG GATCATGCGG AAGAGTACTG 840
3756 GGATGACGTC ATATTTTGTG ACGAAACAAA AATGATGCTC TTTTATAACG ATGGGCCAAG 900
3757 CAGAGTATGG CGCAAACCGT TGAGTGCGCT AGAAACACAA AATATAATTC CAACAATCAA 960
3758 ATTTGGAAAA TTGTCAGTGA TGATTTGGGG CTGTATTTCC AGCCATGGAG TGGGCAAACT 1020
3759 AGCCTTTATT GAAAGCACTA TGAATGCCGT GCAATATCTA GATATTTTAA AAACAAATTT 1080
3760 GAAGGCCAGT GCAGAAAAAT TTGGTTTGTT TAGCAACAAC AAGCCAAATT TTAAGTTTTA 1140
3761 TCAGGACAAT GATCCCAAAC ATAAAGAGTA CAATGTACGC AACTGGCTAC TCTATAACTG 1200
3762 TGGCAAGGTG ATCGATACGC CCCCTCAGAG TCCTGATCTA AACCCCATTG AAAATTTGTG 1260
3763 GGCCTACTTA AAGAAGAAGG TTGCAAAAAG GGGCCCCAAA ACTCGACAAC AACTCATGGC 1320
3764 TGCGATAATC GAAGAGTGGG AAAAGATCCC GCTTGAATAT GACCTAAAAA AACTCATACA 1380
3765 TTCCATGAAA AAAAGGCTTC AACTTGTAGC CAAAGCCAAT GGGGGTCATA CTAAATACTA 1440
3766 AAACTTTTCA AATATTATCA AAATAATTAA AAAATTTAGG ATTAAACTTA GGTTTAGTGT 1500
3767 TTTGTGTAAA GAGTTTCTTG ACACTCTCAA AAGTGTGTAA ACTTGAAATT TGTTGTTTAT 1560
3768 TTTCTTGTAT ATTTGATATA TTGAATTTGT TTTTTAATTT ATAAGTAAAA TAAATATTGT 1620
3769 TTAATTATAT TTCATAAAAA AATTGCGTTT AATTAAGCGA AAAACCCTTA ATTTTGACCT 1680
3770 TTAAAGTCAA AAATTCTACT TATTTTACGG TGTGTAAACA GTTTCTTGAC AAACTG 1736
3771 //
3772 ID SPRINGER standard; DNA; INV; 7546 BP.
3773 XX
3774 AC AF364549;
3775 XX
3776 DR FLYBASE; FBte0000333; Dmel\springer.
3777 XX
3778 FT source AF364549:1..7546
3779 FT SO_feature five_prime_LTR ; SO:0000425:1..403
3780 FT SO_feature three_prime_LTR ; SO:0000426:7143..7546
3781 FT SO_feature CDS ; SO:0000316:1058..2422
3782 FT SO_feature start_codon ; SO:0000318:1..3
3783 FT /name="Dmel\springer\gag"
3784 FT /db_xref="FLYBASE:FBgn0044343"
3785 FT /db_xref="SPTREMBL:Q967T6"
3786 FT /db_xref="NCBI_PROTEIN:AAK52057.1"
3787 FT /translation="MSESFRQYRNSKKCASDSESESDDSTENSVRKNTPTNAFTAYKMS
3788 FT LETEQIKALIRALQEQALESQRREADLRKTIQDLAGQVAAIQIAPARAEAPPIKVYRPV
3789 FT EITGLVPCGETLDAVKCLPDFMGTQETYVSWRQAANAAYHMFRKYEDSSRHYQAVVIIR
3790 FT SKVKGPADAVLSSFGTILNFDAIISRLDFTYSDKRPIHVIEQELGTLRQGSLTLLQYYD
3791 FT EVEKKLTLLTNKATMSYEASAATVLCEKFRDDALRVFVSGLRRNLTDVLFAAKPKDMPS
3792 FT ALALAQEVESNHERYTFATSFARSQEDRDHKQYPKVQERQRAPPQAGSQGSAGKNPHFT
3793 FT KQHRAQVHSAPRSDRMARENMPEPMDVDPSLSRMQPSHAPAYPKSKPAASGRSVPPKRQ
3794 FT RVNHVAQASDDLDKVYNTAASSAAVKVDDDSILEYDSDTINFLGESPCYPSSDEE"
3795 FT SO_feature CDS ; SO:0000316:2434..5475
3796 FT SO_feature start_codon ; SO:0000318:1..3
3797 FT /name="Dmel\springer\pol"
3798 FT /db_xref="FLYBASE:FBgn0044342"
3799 FT /db_xref="SPTREMBL:Q967T5"
3800 FT /db_xref="NCBI_PROTEIN:AAK52055.1"
3801 FT /translation="MKLLIDTGAAKNFIRPFKGLKGVRPVQSPFTIHSIHGVTTITKKC
3802 FT FVSIFNLKATFFLLPDLTSFDAIVGLDLLKQAGASLCLASGKLKWGSGAEQIDFHTCPD
3803 FT VNFTKVDCSDAPPLIKDAFLKMLGNRKKAFADPNEALPYNTSVVATIRTVDEEPIYAKL
3804 FT YPYPMGAADFVNGEIQELLKNGIIQKSKSPYNNPIWVVDKKGTDDAGNKKMRLVLDFRK
3805 FT LNERTVPDRYPMPNISMILGNLGKAKYFTTLDLKSGYHQITLAERDREKTAFAVNGGKY
3806 FT EFRRLPFGLRNAASIFQRTIDDILREQIGKFCYVYVDDVIIFSEDENDHVKHVDWVLKS
3807 FT LYDANMRISAEKSRFFKKSVSFLGFIVTNNGAATDPEKVKAIKEFPEPKNVFEVRSFLG
3808 FT LASYYRCFIKDFASIARPISDILKGENGSVSRHRSRSIQVEFSEAQQRAFEKLRNILAS
3809 FT EDVILRYPDYKKAFDLTTDASAYGIGAVLSQEGRPITMISRTLSDREVNYATNERELLA
3810 FT IVWALAKLRHYLYAVKEINIFTDHQPLTFAVSESNPNAKIKRWKARIDESGARIFYKPG
3811 FT RNNLVADALSRQQLNVVEEQEPESCAATIHSELSLTHTIESTDKPVNCFQNQIILEEAR
3812 FT SHWKRTFILFGNKRRHSINFSCKQALLEELANIIIPNGVNAFHCDLHTLALIQDDVVRQ
3813 FT FPATKFWHCKNRVTDIFAMQERKEILTVEHNRAHRSAQENVKQVLSEYYFPKMTKLASE
3814 FT IAANCKTCAKAKYDRHPKKQELGETPVPTHVGEILHIDIFSTDKKYFLTCVDKFSKFAM
3815 FT VQPILSRTIEDLKAPLLQLMNVFPKAKTIYCDNEPSLKSQTIVAMLENHFGVSISNAPP
3816 FT LHSVSNGQVERFHSTLIELARCLKIDKGISDTVELVLLATARYNMSIHSVINKKPAEVM
3817 FT RADPDDPHTDVQEKIKNAQILTRKRENASRQNRVFQVGDKVLVKSNRRLGNKLTPLCEE
3818 FT KTIEADLGTTVLIKGRVVHKDNLK"
3819 FT SO_feature CDS ; SO:0000316:5870..7147
3820 FT SO_feature start_codon ; SO:0000318:1..3
3821 FT /name="Dmel\springer\env"
3822 FT /db_xref="FLYBASE:FBgn0044344"
3823 FT /db_xref="SPTREMBL:Q967T4"
3824 FT /db_xref="NCBI_PROTEIN:AAK52056.1"
3825 FT /translation="MLDMFPQSHMKKLLSVDIAHLRDMLDSLSIHHRVARSLDFLGTAL
3826 FT KVVAGTPDAEDFEKVKFTEARLVDAHNSQIEINTKTQVRINELTDTINKLLKISKSAQI
3827 FT DTGHLYETLSTRNRIIVMELQNLMLTITLAKINVVSPNFLDHADLESIWGEEPTNTPIR
3828 FT EILSVASVKVLQSLNILHFIIKFPKIIMACNKVTILPVVHHDTVLRLKDNVVAECNREI
3829 FT RTVKNCSITPGATFCQLSSVSSCAQELHAGVVAHCDAQQSDLHPITYVDEGIIVINDRP
3830 FT ALVRVDNGTAIHIRGTHLITFIESAMVNETVFFNHDMVQNRAPGVANSPVLNISMKHEV
3831 FT LSLPYLHRLSEKNLEQIRNFEKDVDGYRLSQIALVAGAIFCALICIGLTWQRTTRAKKS
3832 FT TAQLKEVLAQIGSAEGGLNLEEGIVN"
3833 XX
3834 CC Derived from BACR06P08 by Sue Celniker, 29 March 2001.
3835 CC Michael Ashburner, 9-Apr-2001.
3836 CC Any changes to original sequence record are annotated in an FT line.
3837 XX
3838 SQ Sequence 7546 BP; 2131 A; 1909 C; 1712 G; 1794 T; 0 other;
3839 AGTTAACTAA GTTAACCGGA CTGATCGTCC GCACACCAGC ACCGGTCAAA CTGCTGACCA 60
3840 AGCATTTGGC CGGAAGCTCA TGCATAGCCG GCAGAAGCTC TGCGCATTGG CAGAGGCCGC 120
3841 TATGATGTTT TTCCCTTTGT TAGCTTATAG TCAGTTTGAT TTTGTATTCA ATAAAGAGCG 180
3842 CATCGCGCCT TCAATCAACT CCAGCTACTG CTGTTATCAT TGAATTGGTT GGCTAGCCTT 240
3843 AAGGGCAGTC AACAACGGAG AGACGTTCTC CCACCATATC TCCCAATCTA GGAGAAGAGG 300
3844 TCTGCGGCAA CCGCCCTGCC TCCCAGTGAC AGAAGAACCC CCCGTTACCT GCAACCTACG 360
3845 CCGGAGACCG CGGCGAGGGA CCTGCACCTT ATATTTAATT AATTGGCACC CAACTCCAGG 420
3846 AACCCACACC ACTACCCTGA ATCATGTAAG TGGGATTCTC AACTTAAACA CTACTCCAAA 480
3847 CTGCGTCTAG AATTTTAAAA TATTTGGGAT GTTTGTGCGA GTTACATAAA TAAATTAAGA 540
3848 AAATCGGCAT TTCCACTACA ATAAACGTTT ATATGTGTTG CGAATTAAGA TTATGTTACT 600
3849 GTTATGAAGT TTAAATATCG AATTTTGATT TGTGGTTGAC TTTGCAATCC ATATTGTGTG 660
3850 CATTTCATTC CGCCTTCGCA CATCCGCGGG ACACTGTCGT TTCATTCGAA ATTTAATTCG 720
3851 CTACATTGGC TTCACAGCCC TTTCAAGCTT TGTTGTTTTT GACCCACTCC ACTTCGCTAC 780
3852 CCGATACTGG CGCATGCATT GCTGTGACAA TTTTGTGCCT TTTATTTATC TCTTTGTCTT 840
3853 TGCTGTGGCA ATTTTTGTCT TTGGATATTT GTTTGCCTTA TTGGAGACCC GCTCCCCGCA 900
3854 GGCCCTTCAC CTTATCGTTA CTTAGCTGGA CAGTGGCTCT GCTCGTTGAG TCTTCGTCCA 960
3855 ATGCCTTCAA AGCGGCGACT CAGCCCCCGC GACCCCCTTG CCGTACTGTT TGGCCCCACG 1020
3856 GGCACAACGG CCTGAGTATT CACATACATA GCTACCCATG AGCGAGTCAT TCCGACAATA 1080
3857 TAGGAATTCT AAAAAGTGCG CTAGCGACTC AGAGTCCGAA AGCGACGATT CGACAGAAAA 1140
3858 CTCTGTACGT AAAAACACCC CAACTAACGC ATTCACTGCA TATAAAATGT CCCTCGAAAC 1200
3859 GGAACAAATT AAAGCTCTCA TAAGGGCATT ACAAGAGCAA GCCTTAGAGA GTCAACGCAG 1260
3860 GGAGGCTGAC TTGCGTAAAA CAATTCAAGA TCTGGCCGGC CAGGTCGCGG CCATACAGAT 1320
3861 TGCCCCTGCC CGGGCAGAAG CTCCCCCAAT CAAAGTTTAC AGACCAGTAG AAATCACCGG 1380
3862 ACTGGTCCCT TGTGGGGAAA CATTGGATGC CGTTAAATGT CTTCCAGACT TTATGGGGAC 1440
3863 ACAGGAGACA TACGTCTCCT GGCGGCAAGC GGCAAATGCC GCTTACCATA TGTTCAGGAA 1500
3864 ATATGAGGAT AGTTCGCGGC ACTATCAAGC TGTGGTCATC ATCAGGAGCA AAGTTAAAGG 1560
3865 CCCTGCTGAT GCAGTTCTGT CGTCCTTTGG GACTATACTG AATTTCGATG CGATCATAAG 1620
3866 TCGCCTCGAT TTCACGTATA GTGACAAACG CCCGATACAC GTTATCGAGC AGGAGCTAGG 1680
3867 CACCCTCAGA CAGGGAAGCC TGACGCTCCT CCAGTATTAT GATGAGGTCG AGAAAAAACT 1740
3868 CACCTTACTC ACCAATAAGG CGACTATGTC TTATGAAGCG TCGGCAGCAA CGGTGCTGTG 1800
3869 TGAGAAGTTC CGAGATGATG CTTTGAGAGT TTTTGTCTCG GGGCTCAGGC GCAACCTCAC 1860
3870 AGACGTGCTA TTCGCGGCAA AGCCTAAGGA CATGCCGTCA GCGCTCGCCC TGGCGCAAGA 1920
3871 AGTAGAGTCC AATCATGAGC GGTACACTTT TGCAACTTCA TTTGCACGAA GCCAAGAGGA 1980
3872 TAGGGACCAC AAGCAATATC CCAAAGTGCA GGAGCGCCAA CGGGCCCCCC CACAAGCCGG 2040
3873 CTCGCAGGGA AGTGCTGGGA AGAACCCGCA CTTTACTAAG CAGCATAGAG CACAGGTGCA 2100
3874 CTCCGCTCCA CGTAGCGACC GAATGGCCCG AGAAAACATG CCAGAACCCA TGGACGTTGA 2160
3875 CCCGTCGTTG TCCAGGATGC AGCCATCTCA CGCCCCGGCT TACCCGAAAT CGAAGCCGGC 2220
3876 CGCGTCTGGC CGTTCGGTCC CACCAAAAAG GCAAAGGGTC AACCATGTTG CCCAGGCCTC 2280
3877 TGATGATTTG GACAAGGTTT ATAACACCGC AGCCTCCAGT GCAGCAGTTA AAGTCGACGA 2340
3878 CGATTCCATC CTAGAGTACG ACTCGGATAC CATTAATTTT TTAGGGGAAA GTCCCTGCTA 2400
3879 CCCGTCATCA GACGAAGAGT AGCGGGGATC GACATGAAAC TACTGATTGA TACGGGCGCG 2460
3880 GCAAAAAATT TTATCCGACC ATTTAAGGGG TTGAAAGGCG TCCGCCCGGT GCAGTCCCCA 2520
3881 TTTACAATCC ATTCGATTCA TGGTGTGACT ACAATAACTA AGAAATGTTT CGTGTCCATT 2580
3882 TTTAATCTTA AAGCTACCTT TTTTTTATTA CCAGACTTGA CCTCCTTTGA CGCGATCGTT 2640
3883 GGCCTAGACC TGTTAAAACA GGCCGGCGCG TCACTTTGCC TAGCTTCCGG CAAGCTCAAA 2700
3884 TGGGGCTCCG GAGCAGAGCA AATTGACTTT CATACTTGCC CCGATGTCAA TTTCACCAAA 2760
3885 GTAGATTGCT CGGACGCACC GCCCTTAATT AAGGATGCTT TTTTAAAAAT GCTCGGGAAT 2820
3886 AGGAAAAAAG CTTTTGCTGA TCCTAATGAG GCTCTTCCTT ACAATACGTC GGTGGTAGCC 2880
3887 ACCATCCGGA CGGTTGATGA GGAGCCCATT TATGCCAAGT TATACCCATA TCCCATGGGA 2940
3888 GCAGCTGACT TCGTCAACGG CGAAATTCAG GAACTGCTTA AAAATGGCAT AATCCAAAAG 3000
3889 TCAAAGTCCC CCTACAATAA CCCAATATGG GTCGTAGACA AAAAGGGCAC TGACGATGCG 3060
3890 GGCAATAAAA AAATGCGCTT GGTGCTGGAC TTTCGAAAAC TTAACGAAAG GACGGTACCA 3120
3891 GACAGATACC CCATGCCAAA TATCTCTATG ATATTGGGGA ATCTCGGCAA GGCCAAATAC 3180
3892 TTCACGACCC TCGATCTGAA GTCTGGCTAC CACCAAATCA CGCTCGCAGA ACGCGACCGT 3240
3893 GAAAAGACAG CGTTCGCAGT AAACGGAGGG AAGTATGAGT TCCGAAGGCT GCCATTCGGA 3300
3894 CTCAGGAATG CTGCAAGCAT CTTCCAAAGA ACAATTGACG ATATTCTGCG AGAGCAGATC 3360
3895 GGAAAGTTCT GCTACGTTTA CGTCGATGAC GTCATCATCT TTTCGGAAGA TGAAAACGAC 3420
3896 CATGTCAAGC ATGTAGATTG GGTTCTGAAG AGCCTGTACG ACGCTAACAT GAGAATATCG 3480
3897 GCAGAAAAGT CACGTTTTTT TAAGAAAAGC GTGAGCTTCC TGGGGTTCAT CGTCACCAAC 3540
3898 AATGGGGCGG CGACTGACCC AGAAAAGGTT AAGGCCATAA AGGAATTTCC GGAACCCAAA 3600
3899 AACGTATTTG AGGTAAGGTC ATTCTTGGGC TTAGCCAGCT ATTATCGTTG CTTTATCAAA 3660
3900 GACTTCGCAT CAATAGCTAG GCCCATTTCA GACATATTGA AGGGCGAGAA CGGTAGTGTT 3720
3901 AGCCGACACA GGTCCAGGAG TATCCAGGTA GAATTTTCCG AAGCGCAACA ACGTGCCTTC 3780
3902 GAAAAGCTAC GCAATATCCT GGCGTCTGAG GACGTCATCC TGAGATACCC TGATTACAAA 3840
3903 AAAGCGTTTG ATCTAACGAC AGACGCTTCG GCCTACGGCA TTGGCGCAGT GCTGTCCCAG 3900
3904 GAGGGACGTC CCATTACAAT GATCTCAAGG ACATTGTCTG ACAGAGAGGT TAACTATGCT 3960
3905 ACCAACGAAA GGGAGCTGTT AGCCATAGTC TGGGCACTGG CTAAGTTGCG GCACTACCTG 4020
3906 TATGCGGTTA AAGAGATAAA CATCTTTACC GATCACCAAC CTCTGACGTT CGCGGTATCG 4080
3907 GAGTCCAATC CGAACGCCAA AATTAAGAGA TGGAAAGCAC GCATCGACGA GTCCGGCGCA 4140
3908 CGAATTTTTT ACAAGCCTGG GAGAAACAAC CTCGTTGCAG ATGCCCTCTC GAGACAACAA 4200
3909 CTCAACGTTG TTGAAGAGCA AGAACCGGAG TCGTGCGCGG CCACGATTCA CAGCGAACTT 4260
3910 TCGCTTACGC ACACGATCGA GTCCACGGAC AAACCCGTGA ATTGCTTCCA GAACCAGATA 4320
3911 ATTTTGGAAG AGGCGCGCTC CCATTGGAAA CGCACTTTTA TATTATTTGG GAATAAGAGG 4380
3912 CGGCACTCGA TCAATTTCTC GTGCAAACAA GCTTTGCTGG AGGAACTCGC CAACATCATT 4440
3913 ATCCCTAATG GTGTAAACGC CTTCCACTGT GATCTTCACA CGCTGGCGCT AATCCAGGAC 4500
3914 GACGTAGTTC GACAGTTTCC AGCCACGAAA TTCTGGCATT GTAAGAATAG GGTCACCGAC 4560
3915 ATCTTCGCGA TGCAGGAGAG AAAAGAAATC CTCACCGTCG AGCACAACAG AGCTCACAGG 4620
3916 TCGGCCCAAG AAAACGTGAA ACAAGTACTC TCCGAGTACT ACTTCCCGAA AATGACCAAA 4680
3917 TTGGCGAGCG AAATAGCAGC CAATTGCAAA ACTTGCGCAA AGGCGAAGTA TGACAGACAT 4740
3918 CCGAAGAAGC AGGAGCTCGG TGAGACACCA GTCCCGACCC ACGTAGGAGA AATATTGCAC 4800
3919 ATCGATATTT TCTCAACGGA TAAAAAATAC TTTCTCACCT GTGTTGACAA GTTTTCTAAA 4860
3920 TTCGCCATGG TACAGCCGAT TCTGTCTAGA ACCATAGAAG ATTTGAAAGC ACCCCTTTTA 4920
3921 CAACTTATGA ATGTTTTCCC CAAAGCCAAA ACCATCTACT GCGACAATGA ACCATCATTG 4980
3922 AAATCGCAGA CAATAGTGGC TATGCTGGAA AACCATTTTG GCGTCAGCAT TTCGAATGCA 5040
3923 CCGCCCCTAC ATAGCGTCTC AAACGGACAG GTGGAACGAT TCCACAGCAC GTTAATTGAG 5100
3924 CTCGCCAGAT GCCTAAAAAT CGACAAAGGC ATAAGTGACA CAGTGGAATT GGTCTTGCTG 5160
3925 GCCACAGCCA GATATAACAT GTCCATCCAC TCCGTCATCA ATAAAAAACC GGCCGAAGTC 5220
3926 ATGCGGGCAG ATCCGGACGA TCCACATACC GATGTCCAAG AAAAAATCAA AAACGCCCAG 5280
3927 ATTTTGACAA GAAAACGAGA GAACGCTTCT CGGCAGAACA GAGTGTTCCA GGTCGGCGAC 5340
3928 AAAGTCCTAG TAAAGTCAAA CAGACGATTA GGCAACAAAC TTACTCCTTT ATGTGAGGAG 5400
3929 AAGACCATCG AGGCAGACTT GGGGACCACA GTCCTTATTA AAGGGAGGGT GGTCCATAAA 5460
3930 GACAACCTCA AGTGACCCAA GCAGAGCCTA GCCGCGGCTC CCTCGGAGGC ACACTTTTAT 5520
3931 TCCTCCAATT TGTAGCCACT CGGCATAAGT TTTTTCATTG TTTTTATAGC CGCTTGGCAT 5580
3932 AAGTTTTTTA TTTTTTAGCC ACTTGGCATA TTTTTTATAT ATTTTCGCTA TTATTGGTGG 5640
3933 TGGGCAACTC CATTCCGAAC AAGTAATAAT TTATCACACA CGTTACAGGT CGCTCCCAAC 5700
3934 CCTTCTTCTT TGTTTCCTGG CCACGACATC GGCCCACATT ACTGACTATT CCCGAGCGAA 5760
3935 TTACATTCCC GTCATTGACG GTAAAGTCTT AGTCTGGGAG GAATTCGCCT ATGTCAGACA 5820
3936 CTCGGCTAAC CTCTCCGAGT ATAGGCGGGT AATTGACGAA ACCGACAGCA TGCTCGATAT 5880
3937 GTTCCCCCAG TCCCATATGA AGAAGCTCCT GAGCGTTGAT ATCGCTCACC TCCGTGACAT 5940
3938 GCTTGATTCT TTGAGCATCC ATCACAGAGT GGCAAGGAGC CTAGACTTCT TGGGAACTGC 6000
3939 GTTAAAGGTT GTCGCAGGGA CACCTGACGC GGAAGACTTC GAGAAAGTCA AGTTCACTGA 6060
3940 AGCGCGGCTT GTTGATGCAC ACAATAGCCA AATCGAAATA AACACCAAAA CACAAGTTCG 6120
3941 AATTAACGAA CTCACTGATA CCATAAATAA ACTTTTAAAA ATTTCCAAAA GCGCTCAGAT 6180
3942 TGATACAGGT CACCTGTATG AAACGCTTTC TACTCGCAAC AGAATCATTG TAATGGAATT 6240
3943 GCAAAACTTA ATGCTCACTA TAACCCTCGC TAAAATTAAC GTAGTGAGTC CAAACTTCTT 6300
3944 GGACCACGCA GATCTGGAGA GTATTTGGGG CGAGGAGCCC ACCAACACCC CCATAAGGGA 6360
3945 GATTTTGTCC GTTGCGTCTG TAAAAGTCCT ACAATCCCTT AACATCTTAC ACTTTATTAT 6420
3946 TAAATTCCCC AAGATTATCA TGGCGTGCAA CAAAGTCACT ATCCTTCCAG TGGTACACCA 6480
3947 CGATACGGTG TTAAGGTTGA AAGATAATGT GGTAGCAGAG TGCAACAGAG AAATACGCAC 6540
3948 AGTAAAGAAT TGCTCCATAA CACCAGGGGC AACATTTTGC CAGTTATCTT CAGTGAGCTC 6600
3949 GTGTGCGCAG GAGCTCCACG CTGGGGTCGT AGCACATTGC GACGCACAGC AGAGTGATCT 6660
3950 ACATCCGATC ACCTACGTCG ACGAAGGAAT AATCGTCATC AATGACAGAC CAGCACTCGT 6720
3951 GCGTGTGGAC AATGGAACGG CCATCCACAT TAGAGGCACG CACCTCATAA CATTCATTGA 6780
3952 GAGTGCCATG GTCAACGAGA CCGTCTTCTT TAATCATGAC ATGGTCCAGA ATAGGGCGCC 6840
3953 GGGAGTGGCT AATTCCCCAG TCCTTAATAT CTCGATGAAA CACGAGGTCC TGAGCCTCCC 6900
3954 ATACCTTCAC CGTTTAAGTG AAAAGAACTT GGAGCAAATC AGGAACTTCG AGAAGGACGT 6960
3955 CGACGGATAC CGACTAAGTC AGATAGCGTT AGTTGCGGGA GCAATTTTCT GCGCTCTTAT 7020
3956 CTGCATCGGT TTAACCTGGC AGCGAACCAC TAGGGCCAAG AAATCTACAG CCCAACTGAA 7080
3957 GGAAGTTCTC GCCCAAATAG GGTCAGCCGA GGGCGGCCTT AATCTTGAGG AGGGAATAGT 7140
3958 TAACTAAGTT AACCGGACTG ATCGTCCGCA CACCAGCACC GGTCAAACTG CTGACCAAGC 7200
3959 ATTTGGCCGG AAGCTCATGC ATAGCCGGCA GAAGCTCTGC GCATTGGCAG AGGCCGCTAT 7260
3960 GATGTTTTTC CCTTTGTTAG CTTATAGTCA GTTTGATTTT GTATTCAATA AAGAGCGCAT 7320
3961 CGCGCCTTCA ATCAACTCCA GCTACTGCTG TTATCATTGA ATTGGTTGGC TAGCCTTAAG 7380
3962 GGCAGTCAAC AACGGAGAGA CGTTCTCCCA CCATATCTCC CAATCTAGGA GAAGAGGTCT 7440
3963 GCGGCAACCG CCCTGCCTCC CAGTGACAGA AGAACCCCCC GTTACCTGCA ACCTACGCCG 7500
3964 GAGACCGCGG CGAGGGACCT GCACCTTATA TTTAATTAAT TTAACT 7546
3965 //
3966 ID TARTC standard; DNA; INV; 11124 BP.
3967 XX
3968 AC AY600955;
3969 XX
3970 DR FLYBASE; FBte0001208; Dmel\TART-C.
3971 XX
3972 FT source AY600955:1..11124
3973 FT SO_feature non_LTR_retrotransposon ; SO:0000189
3974 CC telomeric retrotransposon
3975 FT SO_feature direct_repeat ; SO:0000314:1..331
3976 FT SO_feature direct_repeat ; SO:0000314:10383..10713
3977 FT SO_feature five_prime_UTR ; SO:0000204:1..205
3978 FT SO_feature three_prime_UTR ; SO:0000205:6629..11102
3979 FT SO_feature non_LTR_retrotransposon_polymeric_tract ; SO:0000433:11103..11124
3980 CC derived from polyA tail of RNA transposition intermediate
3981 FT SO_feature CDS ; SO:0000316:206..3349
3982 FT SO_feature start_codon ; SO:0000318:1..3
3983 FT /name="Dmel\TART-element\gag"
3984 FT /db_xref="FLYBASE:FBgn0014071"
3985 FT /db_xref="NCBI_PROTEIN:AAT12844.1"
3986 FT /db_xref="SPTREMBL:Q6J4U8"
3987 FT /translation="MDGHNGDINEGWATVLSISSDDSNQLSSPPSIIVSSLDTTPTSN
3988 FT ETTIVRRSLHNPKADMKSYRFENIVLNENKNTILPDPLFVDKCGNTANTTEANEKKPA
3989 FT NSPFPISIIKNLSTSSPLTHVDTPTQEDDASAFNTLKAAKTARIIFPTHTQIKPAKPS
3990 FT PPSKELSTNSAPKTLSYTDKITVTQKNLPDKTHVDRPTQDDDINATKASKTAKIISTQ
3991 FT LHLRETKPTQPAKDPSPRTQKPIANKAAETLTHTDKLIASQNLVPAKTHINSPTQYND
3992 FT TNATNALKTAKINFSSHSHQSEIKPTQSAKNISPLTQKQFTSESAGTHTHTDKHKNTA
3993 FT SQNLFSAKTHINSPTQHNDTSAATASKTAKLILSPHSHLSETKPTQPALSPSPLSQKQ
3994 FT ITSIAAKTLTHTNKHTASQNFIPAKTHINIPTQYNDTNATKALKTAKAASPSHTYSRQ
3995 FT TKPIKPAINALHAAQDTNPSPAISAVTYTDKPTATQNIFPVKTFAELIRENAKRSPTP
3996 FT IENPPQAKHDSAALGRPPTAARKNLNKTLISPKTPGKRRGDCLDEGLLQTSNKKVRIR
3997 FT DDFSDDDLGVTNLLSETPLFKSKAAIKIRQDSRRESLQKSAEMDTAPAISPSNAAADP
3998 FT DLPPWKTVPASRKPPSIFLSNIQQIIPLIEKLNYKAGVNSFTTKSELGNNIRIQAKTM
3999 FT DAYNAIQNVLLEANIPLHSHQPKSAKGFQIVIRHLHQSTPTKWIESQLQDIGIATKFI
4000 FT RAMQFRDTRNPMRIHEVEVVPKADGSHLKVLLIKSLGGQTVKVERKRVSKDPTQCHRC
4001 FT QCFGHTKNYCRNPFKCMKCGQLHASVSCTKPKNLPATCANCNGSHVSSYKGCPVFQEA
4002 FT KQRLSINKIQSLHSQPTHLQTPRNKHPYPKPTHIQTPLNKQPYTHPLPRTLVNNTKLP
4003 FT AKRIQGKKISQRNLSINKRLNRIRTLDRKPRNETSPPTTSKKVLASLEESRKNPNSAL
4004 FT NPANTHLTHFRPPPLAQNIPNDESKELSGEQYLLNRIEGMEKKLNNLLEIVTRLLSQG
4005 FT KDCPKSPKNPFRDPIFV"
4006 FT SO_feature CDS ; SO:0000316:3350..6628
4007 FT SO_feature start_codon ; SO:0000318:1..3
4008 FT /name="Dmel\TART-element\pol"
4009 FT /db_xref="FLYBASE:FBgn0014072"
4010 FT /db_xref="NCBI_PROTEIN:AAT12845.1"
4011 FT /db_xref="SPTREMBL:Q6J4U7"
4012 FT /translation="MLFLVTSEVTFPMTRECNRDILKIAFWNAGGINNKIDELKLFIL
4013 FT NIDAHIIIVTETRLDNNSTKLELPGYFTYLAQNPASSKRGGVATIVNSSLRHMALEPI
4014 FT EKECIQSAPIVLLPENNRRSEMIVIASVYCPPSLSWSPHHFTDVLNFAEKTMGGQTKL
4015 FT ILCGDWNAKHRQWGCIRACQRGAALYDAIQADSMAEIVATGSATHFPHDTRKSPSAID
4016 FT FSICKRLGRYEKRISSSAHLSSDHLPILLEINLDIKTISLQKQNNNILKKTTNIELFK
4017 FT NVLERKILLNTEIRVAEDINDAINIFIKNIKDSAAESTPSPRIPDNHRRRYGQANRNS
4018 FT HTLTLDENTSRLLEEKRIQSRIFKATRTNEDKTKLKAAENRLKKVIKILREKRINEQI
4019 FT EGIDTNNPDRMRKIWRLLSEGKKMNQPNFPLKLETKKGPKWTKTIKETTEAFVSHLEG
4020 FT RFKPNKIVPDYHIDKVNTGLRIIKESMLTERHNLNKNPHNQPITLNELNEEIKNLKNS
4021 FT KAPGKDLITNQLIKTLPTKATLYLILIYNSILRLGYYPEAWKHAQVKMILKPGKSSNE
4022 FT PKSYRPISLLSGLSKMFERLLLKRLFRVDLFKKAIPLHQFGFRKEHGTEQQIARVTQF
4023 FT ILEAFERKEYCSAVFLDISEAFDRVWHEGLLLKLAKILPYNLYIILESYLTNRTFEVK
4024 FT DQAGETSRTGQIGAGVPQGSNLGPLLYSIFSSDMPLPYIYRPSPTQRIMLSTYADDTI
4025 FT VLSSDTLATAATRNNENYLKTFSDWADKWGISVNAAKTGHVIFTLKNDLPTNSMNVKI
4026 FT KGQTIKKESKQSYLGVTLDSKLTLSSHVTKLLGKYSTAYRKLTWILNGRSKLPTKTKI
4027 FT LILKSVLSPIWQYAIAAWGPLVTDAQIRRVQVEENRKIRDICRAGRYTRNQTIRDLFG
4028 FT VKTVEEFYQQAMHRFSETIKSHPNIAVRRILSRHYIPNRLERSRQRYFKMTNDHITQK
4029 FT QTGLALSPKLLKIPDIDDCRTVKKRSEREKIRQMHLTELPTLLRLEEEEEELKRIKKQ
4030 FT EEREKRERENQKWPPDRWCELEINRYNKQYRKGDLTRQEVIEKFRGQPLNVQRIILPD
4031 FT YEGD"
4032 XX
4033 CC A PNTR (Perfect Non-Terminal Repeat) is a perfect direct repeat partially
4034 CC overlapping the UTRs (annotated as "direct_repeat ; SO:0000314").
4035 CC Distinguishing characteristics of PNTR’s are that the 3’ repeat terminates
4036 CC upstream of the 3’ end of the element and that the 5’ PNTR extends a short
4037 CC distance into ORF-1. The 5’ ends of TART-C elements are variable and the
4038 CC minimal size for functionality has not been determined. Thus, this
4039 CC canonical sequence, AY600955, may be 5’ truncated within the 5’ PNTR (M-L
4040 CC Pardue, 2009).
4041 XX
4042 CC Derived from AY600955, Michael Ashburner, 6-Apr-2004; updated Jan-2009 as
4043 CC per Mary-Lou Pardue and Greg DeBaryshe.
4044 CC Any changes to original sequence record are annotated in an FT line.
4045 XX
4046 SQ Sequence 11124 BP; 3774 A; 2893 C; 2173 G; 2284 T; 0 other;
4047 AAGCTTCGCG GGATATCGAT AACAATCAGG TGGTTAAAAA TACTATAACA TCGAGTACCA 60
4048 GCCGTGTTTT TCCTGTCGAT TTATCGAAGT CCAACAGCCC GCCTTCGCTC CGAACACAAA 120
4049 TCGGCAAGTC AGTAGCTTTT TTAACCCGGC AGTGGCGCCT GTGCAGCAGC TATTTAAAGT 180
4050 GAAAAACACG AAACGCAACA ACAAAATGGA CGGCCATAAT GGAGACATAA ATGAAGGATG 240
4051 GGCAACAGTA CTATCTATCT CGTCGGATGA TAGTAACCAA CTTTCGTCGC CGCCGTCAAT 300
4052 TATAGTCTCA TCGCTGGACA CCACGCCAAC GTCAAACGAA ACCACCATAG TAAGAAGAAG 360
4053 CCTACACAAC CCAAAAGCTG ACATGAAATC TTACAGATTT GAAAATATTG TATTAAATGA 420
4054 AAATAAAAAT ACCATATTGC CAGATCCTTT ATTTGTTGAT AAATGCGGAA ATACTGCTAA 480
4055 TACCACAGAA GCCAATGAAA AAAAGCCTGC CAATAGCCCC TTCCCCATTT CCATTATCAA 540
4056 GAATCTTAGC ACTTCCTCGC CACTAACACA TGTAGACACG CCTACACAAG AAGATGACGC 600
4057 CAGTGCATTC AATACATTGA AAGCAGCCAA AACAGCTAGA ATAATTTTTC CCACACACAC 660
4058 ACAGATAAAG CCCGCCAAAC CCTCGCCCCC TTCCAAAGAA TTAAGCACAA ACTCAGCACC 720
4059 CAAAACTCTT AGCTACACAG ACAAAATTAC AGTAACACAG AAAAATCTAC CCGACAAAAC 780
4060 ACATGTAGAC AGACCTACAC AAGATGACGA CATTAATGCA ACCAAAGCAT CAAAAACCGC 840
4061 CAAAATAATT TCTACACAGT TACACCTACG TGAAACCAAG CCAACACAGC CCGCCAAAGA 900
4062 CCCCTCACCC CGCACCCAAA AGCCTATTGC AAACAAAGCA GCCGAGACAC TCACCCACAC 960
4063 AGACAAACTC ATAGCATCAC AAAACCTAGT TCCCGCCAAA ACACATATAA ACTCCCCCAC 1020
4064 ACAATATAAC GACACTAATG CAACCAATGC ATTAAAAACC GCTAAAATAA ATTTCTCTTC 1080
4065 ACACTCACAC CAAAGTGAAA TCAAGCCAAC ACAGTCCGCC AAAAACATTT CACCCCTCAC 1140
4066 ACAAAAGCAA TTCACAAGCG AATCAGCCGG GACACACACC CATACAGACA AACACAAAAA 1200
4067 CACAGCATCA CAAAATCTCT TTTCCGCCAA AACACACATT AACTCACCCA CACAACATAA 1260
4068 CGACACTAGT GCAGCCACAG CATCAAAAAC CGCTAAATTA ATTCTCTCCC CACACTCACA 1320
4069 CCTAAGTGAA ACCAAGCCCA CACAGCCCGC TTTAAGCCCC TCGCCCCTCT CCCAGAAGCA 1380
4070 AATAACAAGC ATAGCAGCCA AGACACTCAC CCACACAAAC AAACACACAG CATCACAAAA 1440
4071 CTTTATTCCC GCCAAAACAC ATATAAACAT ACCCACACAA TATAACGACA CCAATGCAAC 1500
4072 CAAAGCATTA AAAACCGCAA AAGCAGCTTC TCCCTCCCAC ACATACTCAC GTCAGACAAA 1560
4073 ACCAATAAAG CCCGCCATAA ACGCATTGCA TGCCGCCCAA GACACAAACC CAAGCCCAGC 1620
4074 AATCAGTGCT GTCACTTACA CAGACAAACC CACAGCTACT CAGAATATTT TTCCTGTCAA 1680
4075 AACTTTTGCA GAGCTGATTA GAGAAAATGC AAAACGCTCA CCAACTCCAA TCGAAAATCC 1740
4076 CCCTCAAGCA AAACATGACT CTGCCGCCCT CGGACGCCCT CCGACTGCAG CTAGAAAAAA 1800
4077 TCTAAATAAA ACACTGATTT CTCCTAAAAC TCCTGGGAAG CGCCGTGGGG ACTGTCTTGA 1860
4078 TGAAGGCCTA CTTCAAACCT CTAACAAAAA GGTTAGAATA CGCGACGACT TCTCTGATGA 1920
4079 TGATCTGGGG GTCACAAACC TACTCTCTGA AACACCCTTA TTCAAAAGCA AAGCAGCTAT 1980
4080 TAAGATTCGG CAAGACTCGA GAAGAGAATC CCTGCAGAAG TCAGCTGAAA TGGACACAGC 2040
4081 TCCAGCAATA AGTCCCTCAA ACGCAGCAGC CGATCCCGAC CTACCGCCCT GGAAAACTGT 2100
4082 TCCAGCTAGC AGAAAACCAC CATCAATCTT CCTGTCCAAT ATACAGCAGA TTATCCCGCT 2160
4083 AATAGAAAAA CTAAACTATA AAGCCGGGGT AAATAGCTTT ACTACCAAGT CTGAACTTGG 2220
4084 CAACAATATT AGAATCCAGG CTAAAACGAT GGACGCCTAC AATGCAATTC AGAATGTCCT 2280
4085 CCTTGAAGCA AACATTCCCC TACACTCTCA CCAGCCAAAG AGTGCAAAGG GCTTCCAAAT 2340
4086 TGTAATTAGG CACCTCCACC AGTCAACCCC GACCAAATGG ATTGAAAGCC AACTTCAAGA 2400
4087 CATCGGTATA GCTACAAAAT TTATCAGGGC AATGCAGTTT AGGGACACGA GAAATCCTAT 2460
4088 GCGCATCCAT GAGGTTGAGG TTGTACCCAA GGCTGACGGC AGCCATCTTA AGGTCCTGCT 2520
4089 AATAAAATCC CTTGGAGGAC AAACGGTCAA GGTCGAAAGG AAACGGGTAT CGAAGGATCC 2580
4090 TACACAATGC CACCGCTGCC AATGCTTTGG ACACACAAAA AATTATTGCA GAAACCCGTT 2640
4091 TAAATGTATG AAATGTGGCC AGCTGCACGC CTCGGTCTCA TGCACCAAAC CCAAAAACCT 2700
4092 TCCGGCTACT TGTGCAAACT GCAATGGAAG CCACGTTAGC AGCTATAAAG GATGTCCTGT 2760
4093 TTTCCAAGAA GCAAAGCAAA GACTATCTAT CAACAAAATT CAATCCCTTC ACTCACAACC 2820
4094 CACCCACCTT CAGACCCCCC GCAATAAACA TCCCTACCCA AAACCCACCC ACATTCAGAC 2880
4095 GCCCCTCAAT AAGCAGCCCT ACACACACCC CCTCCCTCGC ACATTAGTAA ACAACACAAA 2940
4096 ACTACCTGCC AAAAGAATCC AAGGAAAGAA GATATCGCAA AGGAATCTAT CTATAAATAA 3000
4097 ACGCTTAAAC AGAATCAGGA CATTGGACAG AAAACCGAGG AATGAGACAA GCCCGCCGAC 3060
4098 AACTAGCAAA AAGGTCTTGG CCTCTCTAGA AGAAAGCAGA AAAAACCCAA ATAGCGCCCT 3120
4099 AAACCCGGCC AACACCCATC TCACTCATTT CCGCCCACCA CCATTAGCAC AAAATATTCC 3180
4100 TAATGACGAA TCTAAGGAGC TGAGTGGGGA GCAATACCTT TTAAATCGCA TTGAAGGGAT 3240
4101 GGAAAAGAAG CTCAACAACC TTCTTGAAAT CGTCACCCGC CTACTAAGCC AAGGAAAAGA 3300
4102 CTGTCCAAAG TCTCCAAAAA ATCCTTTCCG AGATCCAATC TTCGTTTAAA TGCTCTTTCT 3360
4103 AGTAACATCA GAAGTGACGT TTCCTATGAC TCGGGAGTGC AACAGGGACA TCCTTAAAAT 3420
4104 CGCTTTCTGG AATGCTGGTG GGATCAACAA TAAAATAGAT GAGCTTAAGC TGTTCATTCT 3480
4105 AAATATTGAT GCCCACATAA TCATAGTCAC CGAAACTAGA CTAGACAACA ATTCTACCAA 3540
4106 ACTAGAGCTG CCAGGATATT TCACATACTT AGCCCAAAAT CCTGCCTCTA GCAAGAGAGG 3600
4107 AGGAGTCGCC ACGATAGTAA ACAGTAGTCT CCGCCACATG GCCTTAGAAC CGATTGAAAA 3660
4108 GGAATGCATA CAGAGTGCCC CAATAGTATT ACTGCCTGAA AACAACAGAC GCAGCGAAAT 3720
4109 GATTGTAATA GCATCTGTCT ACTGTCCGCC TTCGCTAAGC TGGTCGCCCC ACCATTTTAC 3780
4110 TGACGTTCTC AATTTTGCTG AGAAAACTAT GGGAGGGCAG ACTAAGCTCA TTCTATGTGG 3840
4111 CGACTGGAAC GCAAAACATA GACAATGGGG TTGTATACGC GCCTGCCAAC GTGGCGCCGC 3900
4112 ACTCTACGAT GCAATTCAAG CAGACTCCAT GGCTGAAATC GTCGCGACTG GCAGCGCTAC 3960
4113 ACATTTCCCG CACGATACAA GGAAAAGCCC GTCAGCAATA GACTTCTCGA TATGTAAACG 4020
4114 GCTTGGCAGG TATGAAAAAA GAATCTCCTC AAGTGCACAC CTATCCTCAG ACCATCTTCC 4080
4115 CATATTACTT GAGATAAACC TAGATATAAA AACCATCTCC CTGCAAAAAC AAAACAACAA 4140
4116 TATCCTCAAG AAAACAACGA ACATTGAGCT CTTTAAGAAC GTTCTAGAAA GGAAGATACT 4200
4117 TCTAAACACT GAGATAAGGG TAGCAGAAGA CATAAATGAC GCCATAAACA TCTTTATTAA 4260
4118 AAACATCAAG GACTCGGCTG CTGAATCAAC TCCCTCCCCA AGAATTCCTG ATAACCACAG 4320
4119 AAGAAGATAT GGGCAAGCTA ACAGAAATAG TCATACGCTC ACACTAGACG AAAACACAAG 4380
4120 CAGATTGCTG GAAGAAAAAC GTATACAAAG TAGAATTTTT AAAGCTACTA GAACGAACGA 4440
4121 GGACAAAACT AAACTAAAAG CAGCTGAAAA TCGACTTAAA AAAGTAATCA AAATCTTAAG 4500
4122 AGAAAAGAGA ATCAATGAGC AAATTGAAGG AATTGACACA AATAACCCGG ACAGAATGAG 4560
4123 GAAAATTTGG AGGCTGCTGA GTGAAGGGAA AAAAATGAAT CAACCCAACT TTCCCCTCAA 4620
4124 ATTAGAAACC AAAAAAGGCC CTAAATGGAC TAAAACAATT AAGGAGACAA CAGAAGCGTT 4680
4125 TGTCTCCCAC CTGGAAGGAA GATTCAAGCC AAATAAAATT GTACCTGATT ACCACATAGA 4740
4126 TAAGGTTAAC ACCGGACTAA GAATAATTAA GGAAAGCATG CTAACAGAAC GACATAATCT 4800
4127 AAACAAAAAC CCCCATAACC AACCCATTAC GCTAAACGAA TTAAATGAAG AAATAAAAAA 4860
4128 CTTAAAGAAT AGCAAAGCAC CTGGTAAAGA CCTTATAACA AACCAGCTCA TAAAAACCCT 4920
4129 ACCGACTAAA GCTACCCTGT ACCTTATCCT AATCTATAAC TCCATACTTA GATTAGGATA 4980
4130 CTACCCTGAA GCCTGGAAAC ATGCACAGGT AAAAATGATC CTGAAGCCAG GGAAAAGCTC 5040
4131 AAACGAGCCG AAGTCATACA GGCCGATTAG TCTACTCTCG GGACTCTCTA AAATGTTTGA 5100
4132 AAGACTACTC CTAAAAAGAC TTTTTAGGGT AGATCTATTC AAAAAAGCCA TACCACTGCA 5160
4133 CCAATTTGGC TTCAGAAAAG AGCACGGAAC TGAGCAGCAA ATAGCCAGGG TCACCCAGTT 5220
4134 CATCCTCGAG GCCTTCGAGC GGAAGGAATA CTGCTCAGCG GTTTTCCTTG ACATCTCTGA 5280
4135 GGCCTTTGAT AGGGTATGGC ACGAAGGCCT TTTACTTAAA TTAGCTAAGA TCCTACCTTA 5340
4136 CAACCTATAC ATTATACTGG AGAGCTACCT TACAAATAGA ACGTTCGAAG TTAAAGACCA 5400
4137 AGCAGGAGAG ACTTCGAGAA CAGGACAAAT AGGCGCAGGA GTGCCTCAAG GAAGCAATCT 5460
4138 CGGACCACTA CTTTACTCTA TCTTCTCCTC TGACATGCCC CTCCCATATA TCTACCGCCC 5520
4139 TTCACCAACA CAAAGAATTA TGCTCTCAAC ATACGCAGAC GACACTATAG TCCTCAGCTC 5580
4140 AGACACACTA GCAACTGCCG CCACAAGAAA CAACGAAAAC TACCTCAAGA CATTTTCGGA 5640
4141 CTGGGCGGAC AAATGGGGTA TCTCAGTAAA CGCTGCTAAA ACCGGACATG TCATTTTTAC 5700
4142 ATTAAAAAAC GACTTACCTA CAAACTCAAT GAATGTGAAG ATCAAGGGTC AAACAATAAA 5760
4143 GAAGGAAAGC AAGCAATCAT ACCTTGGGGT AACCCTTGAT AGCAAGCTAA CCCTTAGCTC 5820
4144 TCACGTCACA AAGCTATTGG GTAAATACTC TACAGCCTAC AGAAAATTGA CATGGATCCT 5880
4145 AAACGGAAGA AGTAAACTCC CTACTAAAAC TAAGATACTG ATCCTTAAAT CAGTTTTATC 5940
4146 ACCAATATGG CAGTATGCCA TAGCAGCTTG GGGTCCCCTT GTGACAGATG CACAGATAAG 6000
4147 GAGGGTCCAG GTTGAGGAAA ACAGAAAAAT AAGAGACATA TGTAGAGCGG GAAGATATAC 6060
4148 GAGAAACCAA ACTATAAGGG ACCTTTTTGG CGTCAAAACA GTAGAAGAAT TCTATCAACA 6120
4149 GGCTATGCAC AGGTTCTCAG AAACTATAAA ATCGCACCCA AATATAGCTG TTCGCAGGAT 6180
4150 TCTCTCTAGG CACTATATCC CGAACAGACT AGAAAGAAGC AGGCAGAGGT ACTTTAAAAT 6240
4151 GACAAATGAT CATATCACGC AAAAGCAGAC TGGACTTGCC CTCTCACCTA AACTCTTAAA 6300
4152 AATCCCTGAT ATAGATGACT GCAGAACCGT AAAAAAGCGT AGCGAGAGAG AGAAAATAAG 6360
4153 ACAAATGCAT CTAACTGAAC TCCCCACCTT GCTGAGACTA GAGGAAGAGG AGGAAGAGCT 6420
4154 CAAAAGAATA AAAAAACAGG AAGAAAGGGA AAAAAGAGAA AGGGAAAACC AAAAGTGGCC 6480
4155 TCCAGATAGA TGGTGCGAAT TGGAAATAAA CCGATATAAT AAACAATATA GAAAGGGCGA 6540
4156 CCTAACCAGG CAGGAAGTTA TAGAAAAATT CAGAGGGCAA CCATTAAATG TACAACGAAT 6600
4157 AATCCTACCC GACTATGAAG GGGACTAAAA TTAAATCAAA ACAAACCAGG ACAGGAGCAG 6660
4158 AAGGCAGAAA TAATCAAAAC TGGCGGAAGG GGTGGCAAAA TATTGAAAAG AGAGGAAAGA 6720
4159 AATATAAAAA GGCTAAAGGC TAAGTTACAG GTTACATAAA AAGGGAAATC TGCTTATAGA 6780
4160 TATTATGGTA AAATTAACTT AACTAAACAC CTACTGGTTA ACAAAATAAT TATGCCTGCA 6840
4161 TGGCACAAGC TGCGTACTCA AATCATTTCT CCTGACGCTA TTGAAAATCC ATCTTTACTT 6900
4162 TCCAACCGAG GGACTTGCGA CTGCGGTCTT TCCGCCTTAT TGGCTCCTTA TGGATCCATC 6960
4163 TGCTGCCGTA TTGGGCGACA CACCAGCGCT CCAACCTAAA AGAGAGATAA CATGTTTTAA 7020
4164 TTCACTTTCC TTTTCTTATA ACTAAATCAC AACAACAGCA ACAGCGCATC GGGCGACTGA 7080
4165 CAAAAGCATT AGCTCACCAA GTCAGCAACA ACAGCAGCAG CAAGACCAGA ATCAGTTGAG 7140
4166 GAGGAGGCCT GGTGGTGTGC TGAACATTTC GCCGCCCACA CCCACCATTT CTGTAGGCCT 7200
4167 GTATGACCCT GAGCCCAACG CCGGCATGGC AAATCCGGTC TTCCTGAGGA GGCGGGGCTC 7260
4168 TAGTGTTAGG CGCGCTTTTG CCCCAAAAGC AACAACGACA GCGGCAGTAG GGTCGGCGCC 7320
4169 CCCTGCGTGA CCGAGTCCAT CTTAGCAATC GGTCCTTTTG GCGGTGTTAT GCCGACGCGG 7380
4170 CGGTCGCGCT TATGAGGACT GCCTGCAATG CTTGGCCATG AGACGGCGTC ATCGACAACA 7440
4171 TTTCAATCAC GCTCAGCTGG TTGACCGGGG GCAACATGCT TGCCATGCAG CAACAATGGT 7500
4172 GCATGCAGTC CAGCATGCAG CAACAACAAC AATATTGGCA GCAGCAGACT AATGTTTCGC 7560
4173 AGCAGATTCC ATCTGGCAAC TTCCGACGAC CAGACTCCTC GCTTGGCCCC TGGAGACTCG 7620
4174 CTCTGGAAAA AAAAAGAAAG AAGCATGGAT TAGTTTTTTT TTTTCCCTTT AGCTATTGGA 7680
4175 TTAAATTTCT TTCCTGGACA ACCGGCGCCT TCATGCAGAT GACGCTGGAC TGCGGCGATT 7740
4176 CTTTCCCTCC AGCCACAGAT GGGAAGCTCA CATCATGGCA TATATGCGGC ATCGTGCTAA 7800
4177 TCAGCTCCCC ATGCTGAGCG AGATCTTGAT GCGGCGATGC ACTCACTAGC GAGCAGCGGG 7860
4178 AACAGCATAC AGCGTCAGCA ACAGCAGGAA GAGACTTTGT AGCAGAAGCC TTTCGGCATT 7920
4179 CTCCGACGAC CCGACTCCTC GATCGGGGTC AGGCAAATTC TCCTGGACCG ACAAATTTTC 7980
4180 CCGGCGTTTC GTCCTGGAAT AAGGAAGGAA GCACGGATTA ATTTCTCCCC TTCAGCTTAC 8040
4181 GACCCTTCTC ACCAACAGCA GCAACTACAA CAACATCGGC AGCAGACGAC TTGCAGCTGC 8100
4182 TTGGCTCACC TAATGCGACA GCAATAATCC CGGCAAGGCC AGAAACGGCA CCGAGCAGAA 8160
4183 GCACGACAGG GTGAAGAACA ACATGCCGCC CACGTCCACC AATCCGGAAG CCCTGCATTA 8220
4184 GGGGTCTGAA GCGCCATTAA CTGGAGGATC CGGCAGCGTA TGCCTACGCA GAAGCGGGGC 8280
4185 GTCGTAAATC CGGTGGCCGG AATAGCGCCT TGAACAGCAT GCTGTGTATG TTTGCCCCAA 8340
4186 AAGCAGAAAC TGCCGCAGCA AAGGAACCGC AAGCAGGATC ATCACTCGTG GCAAACTGGC 8400
4187 GTATTCCTGT TGAAGACGCG GGACTGCGGC GCATTCTTCC TTTCCAACCG GGGGCTTTAG 8460
4188 CGCTGCGGTA TTTCTGCTTT CACGGCTCCA TTTGCTGCTG CATCTGACGC CTCATCAGCG 8520
4189 CTCCTCCCTG AAAGAAAGAG AATATGTATT AGTTTTCTTT CCATTCCTTA CAATCTCTCT 8580
4190 CACCAAACCT CCACGACACA ACAACAGCAG CAGAAACAGG TCTAGCCCAC AATGGCAGCA 8640
4191 GCTACAGCAA TCAGCAGAAG CAAGGCCGGC AAAAGCAACA ACAAAAGCCC TCTCTGAAAG 8700
4192 CCCGGATGTG GAGACTGAAG CGCCGGAAAC TTGAGGATCC GCCCCCGATG CACGCCCACC 8760
4193 AACAATAAGC TGGAGGAGAA GTTACTGAAG CATGGGAAGC AGCACCAGGG GTCGCATACG 8820
4194 CAGCGTCAGG GCTTTGCGAA CCAGATGAAT GAGGAGAGAC TGGAACAGCA TAACATCAGC 8880
4195 GGCAGCAACA ACAGCGCCAC GAGGGTCAGC GGCGTCTGCA TGGCTGTGTC CAAAACAACT 8940
4196 CCAATTCAAC TGCTGTATGA TGCAGCGCAC CAGCGGCTTT CACAGGGACC GTCTGAAACG 9000
4197 CTTGGCAGGA GCCGGCTGAA GGCCTGGGCG AAGACACTGG AGACACCAAT GCGGCTCCTT 9060
4198 TCGGCCGACG GCAACAGGCT TGCCATGCAA TAAGAACAGT AAATCCTGAA ATAACAGCAG 9120
4199 AAGATACAGA CGTCCAAATT GCGAACACTG ACGCCAGCCC TCACCTGAAC GACTCACTGT 9180
4200 GCAGCAGCAG CAACATCAGC ACCGATGCCC TCAGCATCGG CAGCAGAGGG TGTTTTTGGC 9240
4201 CTTTGACAAT TCCCTGCGAC TTGACTTCTT CTTGGCATCT GGTCAATCAT CACGTGCCAG 9300
4202 CAAACAGTGG CTTGTCACCC TGGAAGAAAG AAGACTGGAT TAGCTTCTCC CCTTCTAATA 9360
4203 CATTTTGTGT GTTGAAATGC ATCAGGCGGC GACACACTCA CCAGCAACAG CAGCAACAAC 9420
4204 ACCAGCGGCA CCGGTAGCAG GAAATGGATC CTCAGCAAAA ACCATCGGCA CTTTCAGACG 9480
4205 TCCCGTACTC CTCGCCTGGC CCTGGCCGGT AACAGGGGCT TGTTAGATGG AGAAGACGAC 9540
4206 GGTCATCCGA CGGACAGCAG CCTGAAGATG GAAGCAGGCC TACGCTGCCC ACCTCTCCGA 9600
4207 TGCCTGCAGC AGCAACGGCA GCGGCTCATA AATGCAAACT GGCGCCAGCC CTCGGCTCTT 9660
4208 CGGGCTCATG TAGGCGGTGA CACACTCACT AGCAGCTAAA ACAGCAACGG CGGAATTAGT 9720
4209 AGAAGCAATG TTTTGCCGCA GCTGCCAGAT GGCATACTCC TAGCTTGGCC CCTGCCCAAA 9780
4210 CCGTATTGGA CCGGCAAATG ATTCGACAAT CCGATCTGGA AAAAATAAGT ATTGATTAAT 9840
4211 TTTTCCCCCA CAGATTGGTA TAAAATTGCA TTTACGGCCA ACCGGCTTCT TCCTGTTGAT 9900
4212 GACGTCACGC TGCGCCGCAT GCTTTTCGCC AGCCACAGTT GGAATGCATG CATTGGGGTT 9960
4213 GACGGTCCGG ATGGGCCGTT GCCTGTTATA TGCTGGCATC TCCGCAGCGG CGTTGTGAGC 10020
4214 AACGACACTG AAAGCAACAA TAATATTGTT AATTACTGCT CAAAACTATA ACACATTTAA 10080
4215 TCACTTACAC AATTTACACA CGCTTCCTGC CTAGGAGTTG TGGGACCAGC TACCGATAAT 10140
4216 GCCAACAATA CCGGGAAACG CGTCGCGGGA CATCGATAAC AATTTGGCGG TTAAAATGCT 10200
4217 AGAACATCGA GTACCAGACA TGTTTTTCCT GCCGATATAT CGAAGCCCAA TAGCCGCCAA 10260
4218 CGCTCAAAAC ATAAATCGGA GTGTGAGACC AGATACTGAA GCCGTTAAAA GCTTTTACCG 10320
4219 GCATCGGTAG CTGGTCTCAC ACTCCGATTT AAATTTGGAG CGTTGGCGGG CTGTTTGACG 10380
4220 CGAAGCTTCG CGGGATATCG ATAACAATCA GGTGGTTAAA AATACTATAA CATCGAGTAC 10440
4221 CAGCCGTGTT TTTCCTGTCG ATTTATCGAA GTCCAACAGC CCGCCTTCGC TCCGAACACA 10500
4222 AATCGGCAAG TCAGTAGCTT TTTTAACCCG GCAGTGGCGC CTGTGCAGCA GCTATTTAAA 10560
4223 GTGAAAAACA CGAAACGCAA CAACAAAATG GACGGCCATA ATGGAGACAT AAATGAAGGA 10620
4224 TGGGCAACAG TACTATCTAT CTCGTCGGAT GATAGTAACC AACTTTCGTC GCCGCCGTCA 10680
4225 ATTATAGTCT CATCGCTGGA CACCACGCCA ACGCCTGTCT AATGCAAATC AACTTACATA 10740
4226 TTACTCTAAA ATCTACTTAT AACTGTCCCC TCTAATGATA AGCAATTTTT ATGTTTACTT 10800
4227 TAAACTTAAA CCGATACCTT AAACTATGGC GCGCAAAATG ACTACCAAGA AATCTAAAAC 10860
4228 TGTAAATTGT TGCAAACTAT TTCTCCTAGT AATGTTAAAT TTAAATGCGC GCATAACCGC 10920
4229 AGCCAAGTTA ACCAAAAATG TCACTCGTAA ATGTAATTCC TAAATTAACA CTTGTAACTA 10980
4230 AGCGCGTATA AATACCGCAA ATCCAAAAAT GTAAATATGC CATAAATTGT TACTATATAT 11040
4231 TTTTAAAAAA GAAAAATCAG AGTACAATAA AAATGCCAGC GTCTATTAGG CGTTGAAAAT 11100
4232 TTAAAAAAAA AAAAAAAAAA AAAA 11124
4233 //
4234 ID AY561850 standard; DNA; INV; 13424 BP.
4235 XX
4236 AC AY561850;
4237 XX
4238 DR FLYBASE; FBte0001206; Dmel\TART-A.
4239 XX
4240 FT source AY561850:1..13424
4241 FT SO_feature non_LTR_retrotransposon ; SO:0000189
4242 CC telomeric retrotransposon
4243 FT SO_feature direct_repeat ; SO:0000314:1..1850
4244 FT SO_feature direct_repeat ; SO:0000314:11179..13028
4245 FT SO_feature five_prime_UTR ; SO:0000204:1..1759
4246 FT SO_feature three_prime_UTR ; SO:0000205:7953..13411
4247 FT SO_feature non_LTR_retrotransposon_polymeric_tract ; SO:0000433:13412..13424
4248 CC derived from polyA tail of RNA transposition intermediate
4249 FT SO_feature CDS ; SO:0000316:1760..4672
4250 FT SO_feature start_codon ; SO:0000318:1..3
4251 FT /db_xref="FLYBASE:FBgnXXXXXXX"
4252 FT /db_xref="GI:45594384"
4253 FT /db_xref="NCBI_PROTEIN:AAS68533.1"
4254 FT /translation="MDGQNVNQSGGWASVLSISSDDGNCSSSPPSAIVSSLDTTPTSN
4255 FT ETTIVRRSLYQTNADMKSYDFENIVLNENKNTILPDPLFVDKCGSTANTTEANEKQPA
4256 FT DSPFPISISKNFSTSSPLTHVDTPTQEDDASAFNTLKAAKTARIIFPTHTQIEPAKPS
4257 FT PPSKELSSNSAPKTLSYTDKITATQKNFPTKTHVDTPTQDDDTNATKASKTAQIDSSH
4258 FT SQLHETKPTQPAKNPSPLTQKLTTNKTAKTHTHTDKPTASQNLFPTKTHINSPTQYND
4259 FT TNASTASKDGKINLSSHSHLRETKPTQPAKNPSPLSQKQITSIAANTLTHTNKHTASQ
4260 FT NFIPAKTHINIPTQYNDTNATKALKTAKPASPSHTYSRQTKPIKPAINALHPAQDTNP
4261 FT SPAISAVTYTDKPTATQNIFPAKTFAELVRENAKRSQTAMQNPPHAKHDSAALGRLPS
4262 FT AARKNLTKTLSSPKTPGKRRGDCLDEGLLQTSNKKVRIRDDFSDDDLGVTNLLSETPI
4263 FT FKSKVAIKIRQDSRRESLQKSVEMDTAPAISPSNTAAEPDLPPWKTVPASRKPPSIFL
4264 FT SNIQQIIPLIEKLNYKAGVNSFTTKSELGNNIRIQAKTMDAYKAIQNVLLGANIPLHS
4265 FT HQPKSAKGFQIVIRHLHQSTPTKWIESQLQDIGIATKFIRAMQFRDTRNPMRIHEVEV
4266 FT VPKADGSHLKVLLLKSLGGQTVKVERKRVSKDPTQCHRCQCFGHTKNYCRNPFKCMKC
4267 FT GQLHATVSCTKPKNLPATCANCNGSHVSSYKGCPAFQEAKQRLSINKIQSLHSQPTHL
4268 FT QTPRNKHPYPKPTHFQTPRNKQSYTHPPPRTTVNNTKLPAKRIQGKKLSQRNISINKR
4269 FT LNRIRAFDKKPRKETSPPTTSKKVLASLEESSKNPNSVLNPANTHLTHFCPPPITQDI
4270 FT PNDEPTEPSQEQYLLNRIEGMEKKLNNLLEIVTRLLNQGRECPKSPKNPFRDPILI"
4271 FT SO_feature CDS ; SO:0000316:4710..7952
4272 FT SO_feature start_codon ; SO:0000318:1..3
4273 FT /db_xref="FLYBASE:FBgnXXXXXXX"
4274 FT /db_xref="GI:45594385"
4275 FT /db_xref="NCBI_PROTEIN:AAS68534.1"
4276 FT /translation="MTRACNRDILKIAFWNAGGINNKIDELKLFILNIDAHIVIVTET
4277 FT RLDNKSTKLELPGYFTYLAQNPVSSKRGGVATIVNSSIRHMALEPIEKECIQSAPIVL
4278 FT LPENNRRSEMIVIASVYCPPSLSWSPHHFTDVLNFAEKTLGGQTKFILCGDWNAKHRQ
4279 FT WGCTRACQRGTALYEAVQADPMAEIIATGCATHFPHDTRKNPSAIDFSICKGLGRLEK
4280 FT RISSSADLSSDHLPILLEINLDTSTLFLQKQNNNILKKTTNIELFKTVLERKILLNTE
4281 FT IRVAEDINDAINIFIKNIKDSADESTPSPRIPDNLRRMHGQANRNSHTLTLDENTSRL
4282 FT LEEKRILSRIFKATRTDEDKAKLKAAENRLKKAVKILREKRINKQIEGIDTKNPDRMR
4283 FT KMWRLLDEGKKTNQPNFPLKLETKRGPKWTKTIKETTEAFVSHLEGRFKPNNNVPDYH
4284 FT INTVNSGLRTIKESMLTERYDVNKNPCNQPITLKELNDEIKNLKNSKAPGKDLITNQL
4285 FT IKTLPTKATLYLILIYNSILRIGYYPDAWKHAQVKMILKPGKSVNDPKSYRPISLLSG
4286 FT LSKMFERLLLKRLFRVDLFKKAIPLHQFGFRKEHGTEQQIARVTQFILEAFERKEYCS
4287 FT AVFLDISEAFDRVWHEGLLLKLAKILPYNLYIILESYLTNRTFEVKDQAGETSRAGQI
4288 FT GAGVPQGSNLGPILYSIFSSDMPLPHIYHPSPTERIMLSTYADDTIVLSSDILATAAT
4289 FT RNNENYLKTFSDWADKWGISVNAAKTGHVIYTLKNDIPTNLKTMKIKGQAIKKESKQS
4290 FT YLGVILDSKLTLSPHVTKVVGKYLTAYRKMSWILNERSKLPTNTKMLILKSVLSPIWQ
4291 FT YAIAAWGPLVTDAQIRRIQVEENRKMRDICRAGRYTKNQTIRDRYCVKTVEEFYQQAV
4292 FT HRFSETTKSHPNVAVRRIFSRHYIPNRLERSRQRYLKMTMDHITQKQTGLTLSPKLLK
4293 FT IPDLDDCRTLKKRSEREKIRQTHLTELPTLLRLEEEEAELKRIKKQEERERRERENQK
4294 FT WPPDRWCELEINRYNKKYRNGDLTRQEIIEKFRGQPLNVQRIILPDYEGD"
4295 XX
4296 CC A PNTR (Perfect Non-Terminal Repeat) is a perfect direct repeat partially
4297 CC overlapping the UTRs (annotated as "direct_repeat ; SO:0000314").
4298 CC Distinguishing characteristics of PNTR’s are that the 3’ repeat terminates
4299 CC upstream of the 3’ end of the element and that the 5’ PNTR extends a short
4300 CC distance into ORF-1. The 5’ ends of TART-A elements are variable and the
4301 CC minimal size for functionality has not been determined. Thus, this
4302 CC canonical sequence, AY561850, may be 5’ truncated within the 5’ PNTR (M-L
4303 CC Pardue, 2009).
4304 XX
4305 CC Derived from AY561850, Michael Ashburner, 6-Apr-2004; updated Jan-2009 as
4306 CC per Mary-Lou Pardue and Greg DeBaryshe.
4307 CC Any changes to original sequence record are annotated in an FT line.
4308 XX
4309 SQ Sequence 13424 BP; 4373 A; 3415 C; 2870 G; 2766 T; 0 other;
4310 CACGCTTTTT GGCCCCTGGC CGATCTTCAT ATATCTCAAA TCGACGGCTG CTTTTACCCT 60
4311 GGAAAAAAAA AAAGGAGCTT GGGTTATATT GAACTACACT AGGCGGCGAC ACACTCACCA 120
4312 GCAGCAGCCA GAACAACAAC AGCGGCAGAA GTAGCAGGAA ATTATCTCAC TGCAAAATCC 180
4313 AATTGGCACT TTCCGAAGTC CGTATTTCTC GCCTGGCCCC TGGCCAGTAA CAGGGGCCTG 240
4314 TGCGACGGAG ATGACGACGA TGATCTGCCC TGTGGACGGC CTCAAGAAGG AATCGGCCCT 300
4315 GTACTGCCCA CCTGACCTGT GCCAGGATAG CAGCAATGTC AGCGGACCAT GGATGGAAGA 360
4316 GGCGGCACTG GCGACGGTCC TCAGTTTTGC GGTTTCCGCG GGGCGTAGGC GCAGTAATCG 420
4317 GCGGCAGCAA CAGTGGCGGC AGCAGAAGGG AATGTGTATC TGCAGTCGCC GAATGGCAAT 480
4318 TTCCTGCCCA GCTGTAATGG ACCGCCAAAT GTTTTTTGGC ATGTCGACCT GTAAGAAAGA 540
4319 AGCAAGGATA AGTTTTTTCT TTACAAGATT GTATATGAAT TTGTATTTAC GGACAACTGG 600
4320 CTTGTTTCCT GTCGACGATA AATGGCGCTT CATGTTTTCA CTCTGCCAAA ATCTGAGTGC 660
4321 AAGCATCGGG GCTGACGGGC CGAATTTGCT GATGCCTTGT ACATGCTAGC ATCTTTATGC 720
4322 CGCCGTGTAA TTTTGCGACA GCAAAACACA TGATGGAGAA GACGAAGGTG ATCGATGGCG 780
4323 CCCGGATGAC GGATGCAGGC CCGTGCTACC CACTGGTCCG TTGCCAGGAC AGCAGCGTTT 840
4324 CAATTATGCG AACAGAGGCA CTGGAGCCAC TTCTCAGGCG ATAGGGATCA TGAGGCGACG 900
4325 ACAACTCGCC AGCAGCAGTA ACAACAACAG CGGCAGCAGC GATCTCGGAC TTGCTGAACA 960
4326 TTGCGGCTTT TTCCCAGCCT GGACCGTCAT CACAAACGCT CTCAAAGATC GGTGCGCCTG 1020
4327 CAGCCTACGG AAGCGTACAA CTGCCCAAAG TCGTGCTATT GCATAATGTT AGGTGTCCTG 1080
4328 GCTGCTCCGG CGGATGAGCT CCACCCGATT GAGAGAGGTA AGAAGGCCCA GCAAGTCGCC 1140
4329 CTTAAATAAA AGAAACAAGC ATTAGACTCG GCTGAAATTG TAACATCAGT CAGACTGTAC 1200
4330 TCACGCATGC ACTTAGACAA ACCGAAGCCT ATTCTATTGA CGACGCGGAC TCCAACACAT 1260
4331 GTTTTCCTCC ACAAAAGGCT GTGAGTGCAC CAAAGTTGAC GGGCCACGCC GGCCGATGCT 1320
4332 TGCTGCATAC CGGCATCTCC GCAGCAGCGA CGTTACAAGC ACCACTAAAA TTAGAAAGAG 1380
4333 GCTTACTATA GGCAAAGCGC AGAAAAACAA ATATTACAAT AAGAAATAGC ACGCGATTTT 1440
4334 TCTGCTTCGT TTCCGCTTGG TACAAGTGAG ACCATTCTCC CTATATGCCA TTCTAGTATA 1500
4335 TTTGCCCGAT AAGCGATATG CTGGCGGCAA AAAAAAAAGA TAATAGCCGA TAAGCCCGCC 1560
4336 AAAAAAAAAG CGCGAAATAT CGATAACGAG CTGGCACGAA AATTGCTGGC ATATCGATCA 1620
4337 ACCGCTGTGT CTTTGAGCTA TCGAAAAAGC CCGCCTACGC GCCTAGCCCA AATTTGCAAG 1680
4338 TCAGTTGAGA TTATAAAACC GACAGAGGCG CGCGCGCAAC AGTAGCTAAA AGTGAAGCCA 1740
4339 GCAGCAACAA CAACAACTAA TGGACGGCCA GAACGTGAAC CAAAGCGGAG GATGGGCATC 1800
4340 GGTTTTATCC ATCTCATCGG ACGATGGTAA CTGCTCATCC TCGCCGCCAT CAGCTATAGT 1860
4341 CTCATCGCTG GATACCACGC CAACGTCAAA TGAAACCACC ATAGTAAGAA GAAGCCTATA 1920
4342 TCAAACAAAT GCCGACATGA AATCTTACGA TTTTGAAAAT ATTGTATTAA ATGAAAATAA 1980
4343 AAATACCATA TTGCCAGACC CTTTATTTGT TGATAAATGC GGGAGTACTG CTAATACCAC 2040
4344 AGAAGCCAAT GAAAAACAGC CTGCCGATAG CCCCTTCCCC ATTTCCATAA GCAAAAATTT 2100
4345 TAGCACTTCC TCGCCACTAA CACATGTAGA CACGCCTACA CAAGAAGATG ACGCCAGTGC 2160
4346 ATTTAATACA TTGAAAGCAG CCAAAACAGC TAGAATAATT TTTCCCACAC ACACACAGAT 2220
4347 AGAGCCCGCC AAACCCTCGC CCCCCTCCAA AGAATTAAGC TCAAACTCAG CACCCAAAAC 2280
4348 TCTTAGCTAC ACAGACAAAA TTACAGCAAC ACAGAAAAAT TTCCCCACTA AAACACATGT 2340
4349 AGACACACCT ACACAAGACG ATGACACTAA TGCAACCAAA GCATCAAAAA CCGCCCAAAT 2400
4350 AGATTCATCA CACTCACAAC TACATGAAAC CAAGCCAACA CAGCCCGCCA AAAACCCTTC 2460
4351 ACCCCTCACC CAAAAGCTAA CCACAAACAA AACAGCCAAG ACACACACAC ACACAGACAA 2520
4352 ACCGACAGCG TCACAAAATC TTTTTCCCAC CAAAACACAT ATAAACTCAC CCACACAATA 2580
4353 TAACGACACT AATGCAAGCA CAGCATCAAA AGACGGTAAA ATAAACCTCT CTTCACACTC 2640
4354 ACACTTACGT GAAACCAAGC CAACACAGCC CGCCAAAAAC CCCTCACCCC TCTCCCAGAA 2700
4355 GCAAATAACA AGCATAGCAG CCAATACACT CACCCACACA AACAAACACA CAGCATCACA 2760
4356 AAACTTTATT CCCGCCAAAA CACATATAAA CATACCCACA CAATATAACG ACACCAATGC 2820
4357 AACCAAAGCA TTAAAAACCG CAAAACCAGC TTCTCCCTCC CACACATACT CACGCCAGAC 2880
4358 AAAACCAATA AAGCCCGCCA TAAACGCATT GCATCCCGCC CAAGACACAA ACCCAAGTCC 2940
4359 AGCAATCAGT GCTGTCACTT ACACAGACAA ACCCACAGCT ACTCAGAATA TTTTTCCTGC 3000
4360 CAAAACTTTT GCAGAGCTGG TGAGAGAAAA TGCTAAACGC TCACAAACTG CAATGCAAAA 3060
4361 TCCCCCTCAT GCAAAACATG ACTCTGCCGC CCTCGGACGC TTACCGAGTG CAGCTAGAAA 3120
4362 AAACCTAACT AAAACACTGA GTTCTCCTAA AACTCCTGGG AAGCGCCGCG GGGACTGTTT 3180
4363 GGATGAGGGC TTACTTCAAA CCTCTAACAA AAAGGTTAGA ATACGCGACG ACTTCTCTGA 3240
4364 TGATGATCTG GGGGTCACAA ATCTACTCTC CGAAACACCC ATATTCAAAA GCAAAGTAGC 3300
4365 TATTAAAATT CGGCAAGACT CAAGAAGAGA ATCCCTGCAG AAGTCAGTTG AAATGGACAC 3360
4366 AGCACCAGCA ATTAGTCCCT CAAACACAGC AGCTGAGCCC GACCTACCGC CCTGGAAAAC 3420
4367 TGTTCCAGCT AGCAGAAAAC CACCATCAAT CTTCTTGTCC AATATTCAGC AGATTATCCC 3480
4368 GCTAATAGAA AAACTAAACT ATAAAGCCGG GGTAAATAGC TTTACTACCA AATCTGAACT 3540
4369 TGGCAACAAT ATTAGAATCC AGGCTAAAAC GATGGATGCC TATAAAGCAA TTCAGAATGT 3600
4370 CCTCCTTGGG GCAAACATTC CCCTACACTC TCACCAGCCA AAGAGCGCAA AGGGCTTCCA 3660
4371 AATTGTAATT AGGCACCTCC ACCAGTCAAC CCCGACCAAA TGGATTGAAA GCCAACTTCA 3720
4372 AGACATCGGT ATAGCTACAA AATTCATCAG GGCAATGCAG TTTAGGGACA CGAGAAATCC 3780
4373 TATGCGCATT CATGAGGTTG AGGTTGTACC CAAGGCTGAC GGCAGCCATC TCAAGGTCCT 3840
4374 GCTACTAAAA TCCCTTGGAG GTCAAACGGT CAAGGTTGAA AGGAAACGGG TATCGAAGGA 3900
4375 TCCCACACAA TGTCATCGCT GCCAATGTTT TGGGCATACA AAAAATTATT GTAGAAACCC 3960
4376 GTTTAAATGT ATGAAATGTG GCCAGCTGCA CGCCACGGTT TCTTGCACTA AACCCAAAAA 4020
4377 CCTTCCGGCT ACTTGTGCAA ACTGCAATGG AAGCCACGTA AGCAGCTATA AAGGATGTCC 4080
4378 TGCTTTCCAA GAAGCAAAGC AAAGACTATC TATCAACAAA ATTCAATCCC TACACTCACA 4140
4379 ACCCACGCAC CTTCAGACCC CCCGCAATAA ACATCCCTAC CCAAAACCCA CCCACTTTCA 4200
4380 GACGCCCCGC AATAAGCAGT CCTACACACA CCCCCCTCCT CGAACAACAG TAAACAACAC 4260
4381 AAAATTACCT GCCAAAAGAA TCCAAGGAAA AAAGTTATCG CAAAGGAACA TATCTATAAA 4320
4382 TAAACGCTTA AATAGAATTA GGGCTTTTGA CAAGAAACCG AGAAAGGAGA CAAGCCCGCC 4380
4383 GACAACTAGC AAAAAGGTAC TGGCCTCCCT AGAAGAAAGC AGCAAAAACC CAAACAGCGT 4440
4384 CCTAAACCCA GCCAACACCC ATCTCACTCA TTTCTGTCCA CCCCCAATAA CACAAGATAT 4500
4385 CCCTAATGAC GAACCCACGG AGCCGAGTCA GGAGCAATAC CTTCTAAATC GTATTGAAGG 4560
4386 GATGGAAAAG AAGCTCAACA ATCTCCTGGA AATCGTCACC CGCCTACTAA ACCAAGGAAG 4620
4387 AGAGTGTCCA AAATCTCCAA AAAATCCTTT CCGAGATCCA ATCCTCATTT AAACGCTCTT 4680
4388 GCTAGTAGCA TCAGAAAGTG ACGTATCTTA TGACTCGGGC GTGCAACAGG GATATCCTTA 4740
4389 AAATTGCTTT CTGGAACGCT GGTGGGATCA ATAATAAAAT AGACGAGCTC AAACTGTTCA 4800
4390 TTCTAAATAT TGATGCCCAC ATAGTCATAG TCACTGAAAC CAGACTTGAC AACAAATCGA 4860
4391 CCAAACTAGA ACTTCCAGGA TATTTCACAT ACTTAGCCCA AAATCCTGTT TCTAGCAAGA 4920
4392 GAGGAGGAGT CGCCACTATA GTAAACAGCA GTATCCGACA CATGGCCTTA GAACCGATTG 4980
4393 AAAAAGAATG CATACAGAGC GCCCCAATAG TCTTGCTGCC TGAAAACAAC AGACGCAGCG 5040
4394 AAATGATAGT AATAGCATCT GTCTACTGTC CGCCTTCGCT AAGCTGGTCG CCCCACCACT 5100
4395 TTACTGACGT TCTCAATTTT GCCGAGAAAA CTCTGGGAGG GCAGACAAAG TTCATTCTAT 5160
4396 GTGGCGACTG GAATGCAAAA CACAGGCAAT GGGGTTGTAC CCGCGCCTGT CAACGCGGCA 5220
4397 CCGCACTCTA CGAAGCAGTT CAAGCAGATC CCATGGCTGA GATTATTGCT ACCGGCTGTG 5280
4398 CGACACATTT CCCGCACGAC ACACGGAAAA ACCCGTCAGC AATAGATTTC TCCATATGCA 5340
4399 AAGGACTGGG CAGGCTCGAA AAGAGAATTT CCTCAAGTGC GGACTTATCT TCAGACCACC 5400
4400 TTCCCATCCT GCTTGAGATC AACTTAGATA CAAGCACCCT CTTTCTGCAA AAGCAAAACA 5460
4401 ATAACATCCT CAAGAAAACT ACGAACATTG AGCTCTTTAA GACTGTTCTT GAAAGAAAGA 5520
4402 TACTTCTTAA TACGGAGATA AGAGTAGCAG AAGACATAAA TGACGCCATA AATATCTTTA 5580
4403 TCAAAAACAT CAAGGACTCG GCTGATGAAT CAACTCCCTC CCCAAGAATC CCTGACAACC 5640
4404 TCAGAAGAAT GCATGGACAA GCTAACAGAA ATAGTCACAC CCTCACACTA GACGAAAACA 5700
4405 CAAGCAGATT GTTGGAAGAA AAACGGATAC TAAGTAGAAT TTTTAAAGCT ACTAGAACGG 5760
4406 ACGAGGACAA AGCTAAACTA AAAGCAGCTG AAAATCGACT AAAAAAAGCG GTAAAGATCT 5820
4407 TGAGAGAAAA GAGAATTAAT AAACAAATTG AAGGAATAGA CACGAAAAAC CCGGACAGAA 5880
4408 TGAGGAAAAT GTGGAGACTG CTAGATGAAG GAAAAAAGAC AAACCAACCG AACTTTCCCC 5940
4409 TCAAACTGGA AACCAAAAGA GGCCCCAAAT GGACAAAAAC GATAAAGGAG ACAACAGAAG 6000
4410 CATTTGTTTC CCACTTAGAA GGAAGATTTA AGCCAAATAA CAACGTACCT GATTACCACA 6060
4411 TAAATACAGT TAACTCTGGA CTAAGAACAA TTAAAGAAAG CATGTTAACA GAAAGATATG 6120
4412 ATGTAAACAA GAATCCCTGT AACCAACCTA TCACACTAAA GGAATTAAAT GACGAAATAA 6180
4413 AAAACTTAAA GAATAGTAAA GCACCGGGAA AAGACCTTAT AACAAACCAA CTTATAAAAA 6240
4414 CCCTACCGAC TAAAGCTACA CTGTACCTTA TCCTAATCTA TAACTCTATA CTTAGAATTG 6300
4415 GATACTACCC AGACGCCTGG AAACATGCCC AAGTGAAAAT GATCTTAAAA CCAGGGAAAA 6360
4416 GTGTGAACGA CCCGAAGTCA TATAGGCCGA TCAGTCTACT CTCGGGACTC TCTAAAATGT 6420
4417 TTGAAAGACT ACTTCTAAAA AGACTTTTTA GGGTAGATCT ATTCAAAAAA GCCATACCAC 6480
4418 TGCACCAATT TGGCTTCAGA AAAGAGCACG GAACTGAGCA GCAAATAGCC AGGGTCACCC 6540
4419 AGTTCATCCT CGAGGCCTTT GAGCGAAAGG AATACTGCTC AGCGGTTTTC CTTGACATCT 6600
4420 CTGAGGCTTT CGATAGGGTC TGGCACGAAG GCCTTTTACT TAAACTAGCT AAAATATTAC 6660
4421 CATACAACCT ATACATTATT CTCGAAAGCT ACCTTACAAA CAGAACATTT GAAGTTAAAG 6720
4422 ACCAAGCTGG AGAGACTTCG AGAGCAGGAC AAATAGGCGC AGGGGTGCCC CAAGGAAGCA 6780
4423 ACCTTGGACC CATACTGTAC TCTATCTTCT CCTCAGACAT GCCACTCCCA CACATATACC 6840
4424 ACCCCTCCCC AACAGAAAGA ATTATGCTCT CAACATACGC AGACGACACT ATAGTACTCA 6900
4425 GCTCAGACAT ACTAGCAACT GCTGCCACAA GAAACAACGA AAACTACCTC AAGACATTTT 6960
4426 CGGACTGGGC AGACAAATGG GGTATCTCAG TAAATGCTGC TAAAACAGGA CATGTCATTT 7020
4427 ATACATTAAA AAACGACATA CCTACAAATC TAAAGACCAT GAAGATTAAG GGTCAAGCAA 7080
4428 TAAAAAAGGA AAGCAAGCAA TCATACCTTG GCGTAATCCT TGATAGCAAG CTAACACTTA 7140
4429 GTCCTCACGT CACGAAGGTA GTAGGTAAAT ACTTGACAGC CTATAGAAAA ATGTCATGGA 7200
4430 TCTTAAATGA AAGAAGCAAA CTCCCTACTA ATACTAAGAT GCTGATCCTC AAATCAGTTC 7260
4431 TATCGCCAAT ATGGCAGTAT GCCATAGCAG CCTGGGGTCC CCTTGTGACA GATGCACAGA 7320
4432 TAAGACGGAT ACAAGTTGAG GAAAACAGAA AAATGAGAGA CATATGCAGA GCGGGAAGAT 7380
4433 ACACGAAAAA CCAAACTATA AGGGACCGCT ACTGTGTCAA AACAGTAGAA GAGTTCTATC 7440
4434 AACAGGCTGT CCACAGGTTC TCAGAAACTA CAAAATCGCA CCCTAATGTA GCTGTTCGCA 7500
4435 GGATATTCTC TAGGCACTAT ATCCCGAACA GACTAGAAAG AAGCAGGCAG AGGTACTTGA 7560
4436 AAATGACAAT GGACCATATC ACGCAAAAAC AGACTGGACT GACCCTCTCA CCTAAACTCT 7620
4437 TAAAAATCCC TGATCTAGAT GACTGCAGAA CCTTAAAAAA GCGAAGCGAG AGAGAGAAAA 7680
4438 TAAGACAAAC GCATCTAACT GAACTCCCCA CCCTGCTGAG ACTAGAGGAA GAGGAGGCAG 7740
4439 AGCTCAAAAG AATAAAAAAA CAGGAAGAGA GGGAAAGAAG GGAAAGGGAA AACCAAAAGT 7800
4440 GGCCTCCAGA TAGGTGGTGT GAACTGGAAA TAAACCGATA TAATAAAAAA TATAGAAATG 7860
4441 GCGATCTAAC CAGGCAGGAA ATTATAGAAA AATTCCGAGG GCAACCATTA AATGTACAAC 7920
4442 GAATAATCCT ACCCGACTAC GAAGGTGACT AAAAGTAAAT CAAAACAAAC TAGGGTCGGA 7980
4443 GCATAAAGCA GAAATAATTA ACCTGGCGGA AGGGGCGGCA AAAATATTTA AAAGAAAGGA 8040
4444 AATAAATACA AAAAGGCTAA AGGCTAAGTT ACAGGTTACA TAAAAAGGGA AATGTGCTTA 8100
4445 TAGATATAAT GGTAAAATTA ACTTAACTAA ACACCTACTG GAAAACAAAA CCATGATGGC 8160
4446 TGCGTACTTA AAACGTTTCT CCTGGCGCGA TTGAAAATCC ATCTTTCCTA TCCAACCGAG 8220
4447 GGATCTGCGA CTGCGGCCTT CTGCCGTTCG GCTCCTGATG GATCCATCTG CTGCTGGAAT 8280
4448 GGGTGCCACA CCGGCGCTCC AACCTAAAAG AAAGATAATA TGTCTTAGTT TTCTTTCCCT 8340
4449 TTTTCTCATA AAAAACAAAA GCTCATCTGG AGTCTGATAA TAGCTTTAGC TCACCAAGAC 8400
4450 AGCAAAAACA ACAGCATCAA GGCCAGCAAC AGTGGAGGCA GAGACCAAGC GGTTTGCTGA 8460
4451 ACATTTCGCT GCCCACACCC ACCATTCCTG GAGGCTCTGA ATGAGGGAGC TGAAGCCTCT 8520
4452 GAAAATTGAA GATCCTACTC CAATGTGACA CTTTCGGCTC CGAGCTCAAC GCCGGCGCTG 8580
4453 CAAATCCGGC GTTATAAGGA AAGGGTGCTC CAGCTTGTGG AGTGGTCTTT CCCCAGAGGC 8640
4454 AGCAGCAGCA GCAACGCCAG CGGCAATTGG CGACCTCTGC GTAGCCGAGT CAATCCCGTT 8700
4455 ATCGGTCCGT CTGGCGATGC GTTTCCGACG CGGCGGTATG CGTCCATAGG GACCGCCTAG 8760
4456 AATGCTTGGC CAGGAGACAG CAGTAGACCT GGGCGTGGGC GTCACCAGCA ACATGGTAGC 8820
4457 CATGCGCAGT CAATTGGCCG GTGGCAACAA TCTTGCCATG CAGCAATAGC GGCGCATGCT 8880
4458 ACCCTTGGAG CGACGTCAAC AGCTACATAT TTTTCAACAG TGTAGCGCGA CCTTTAGGCG 8940
4459 CCTACACCTA CACCAGCAGC AGCGATATTG GCAGTAGCAG CATTTAATGT CTTGCAGCAG 9000
4460 TTTCCATTTG ACAACTTCCG ACGACCAGAC TCCTCGCTTG GCCCCTGGCG ATTCGCCCTG 9060
4461 GAAGAAAGAA AGAAGCATGG ATTAGTCAAA TATCAAAGCA CAACAAGCAT GCACGAAATC 9120
4462 TTCGCAACAA GGACTATTCC AAGGCAAGCG ATGGTGTGTT CTTTGGCTCT ACATATATCG 9180
4463 TTGAAATCCG TCTCCAACTG CCGCGAGTCA CCCACGACTT CCACTCCCTG CAGACGGACG 9240
4464 TAATGCACTA CGATGTGTAA ATTTTCCGGA TCCAAGTGAA CGCCAGGCGG AAGAGGATTC 9300
4465 CCTGGATGTG AAGGATCACA AACTGCTGCT TTTTCAAGAG TCCCCATTTA ACAACTTCCG 9360
4466 ACGACCAGAC TCCTCGCTTG GCCCCTGGCG ATTCGCCCTG AAAGAAAGAA AGAAGCATGG 9420
4467 ATTAGTCAAA TACCAAAGCA CAACAAGCAT GCACGAAATC TGCGCAACAA GGACTATTCC 9480
4468 AAGGCAAGCG ATGACGGACG GAATGCACTA CTATGTGTAA ATTTTCCGGA TCCAAGTGAA 9540
4469 CGCCAGGCGG AAGAGGATTC CCTGGATGTG AAGGATCACA AACTGCTGCT TCTTCAAGAG 9600
4470 GTAACCGGCC TCATTTCCAC TTGGGTCACA TCGATTGTGG AGGAAGCCGA TTGGGACTTT 9660
4471 GAGCGAGCCC TAAAATTGTT CATTCAGAAG AACGCTGATC ACGAAATCCC AGATCTAGCA 9720
4472 TTCGCCTAGA ATATGTGATC TCGTTGGACT GCGTGCTGGA CTGCGGCGCA TGCTTTCCCT 9780
4473 CCCGCCAGAG ACGGGATGCG CGCATCAGGA TCGACGGGAC AGACCGGCCG ACGCCTGGCT 9840
4474 TCACGTCGGC ATCTATGCGA CGACGTGATA ATCAGCTTCA CAGTACCTGC GGATGAGGGC 9900
4475 ACAGGCGCCA GTCCTCTGCC TAGCGACACA TACACCAACA GCAACATCTA AAACAGTCGC 9960
4476 AGTAGATGCA GGGAATTTTC TTGCTGCATT CTCCAACTGG AAAAATCCGA CGGCCCAACT 10020
4477 CCTAGCTTAG CCCGGCCAAT CTTCTTGGAC TGGCAAACGA TGTGATGAAT CGTCCTGGAA 10080
4478 GAAAGAAGCA TGGATTATTT CTTCATACAC AGCTTGTCTA CTAAAATGCA TTTCCCGGCA 10140
4479 AACTGGCACT GGGGCGTTGA AAATACGACA CTACTCACCA AACAGCAGCA AAAACAACAG 10200
4480 CATCGGCAGC AGGCGACCAG CAGCTGCTTT GGCTCACCCA ATGCGACAGC AATATCTGCG 10260
4481 CATGGCCAGC AACATGCAGC AAGCAAAAGA CCGGCATGGT GGTGAACAAC ATATCGCTCA 10320
4482 CGCCCAACGA TCTGGAAGCC CTGAGCTAGG GAACTGAGTA TCCGCCAGCG GATACTTATG 10380
4483 CAGCGGCGAG GCGTCGGAAA TCCGATAGCC GGAAGAGAGG CCGGAGCAGC ATGTTGGGCA 10440
4484 TTTTCGCCCC AGTAGCAGCT GCTGGGGCAG CAAGGGCAGA GGTAGCAGTG TCAGCGCTCC 10500
4485 TGGTAAACCG GCCTTTTCTG TTGAAGACGC GGGACTGCGG CGCAATTGTT CCTGCCAACC 10560
4486 GGGAGTTCTC TGCGCCTGAG GTCCTGTTGT GCTTCAGCGG CTCCATCTGC TGTTGCATCT 10620
4487 GGCGCTTCTC CAACTTTCCT CCCTGAAAGA AGAGAATATT AGTAGGAGCA TGAGACCAAC 10680
4488 AACAGCCCTA GCTTACCACG TCAGCGGAAA CAGCAACTGC AGAAGCCCGG TAACTTTCTG 10740
4489 ATAATATGCA GCAATAAGAG CGGCTGGATC AGCATGTTGT GTAGCTTGGC CCCAGAAGCA 10800
4490 GCAGCTGCGG TACCAAAGGC AGCGGAAGCA GGGTCAACAT AGTCTGCTAT GCTGTGTCCA 10860
4491 TACTAGCATA GTCAAGTCAG CGGTGGTGAC GTTGCCGCAG CAGCTGATCC ACAGGGTACG 10920
4492 GCCTGGAATG TTTTGTCAGA GACGGCAGTG GCCTGGGCGT ATTAGTCAGA TACGCCAACA 10980
4493 ACATGATACC CATGCGCAAC CATTCTTCCG GTGGCGGCAT GCTCGTAAAG TAGCGGCGGC 11040
4494 GCATGCATCT CTCGAAGCAG CAGCAGCAAC AGAGGCGTCT CATAAGTGCA TGCGCAGCAG 11100
4495 CGGTAGCAGC GGTGGTGGCA GCAGCAGGGA GATTTCATTG CTGCAGTCGC CAAATTACAT 11160
4496 GCATCCTACG ACTCGACTCA CGCTTTTTGG CCCCTGGCCG ATCTTCATAT ATCTCAAATC 11220
4497 GACGGCTGCT TTTACCCTGG AAAAAAAAAA AGGAGCTTGG GTTATATTGA ACTACACTAG 11280
4498 GCGGCGACAC ACTCACCAGC AGCAGCCAGA ACAACAACAG CGGCAGAAGT AGCAGGAAAT 11340
4499 TATCTCACTG CAAAATCCAA TTGGCACTTT CCGAAGTCCG TATTTCTCGC CTGGCCCCTG 11400
4500 GCCAGTAACA GGGGCCTGTG CGACGGAGAT GACGACGATG ATCTGCCCTG TGGACGGCCT 11460
4501 CAAGAAGGAA TCGGCCCTGT ACTGCCCACC TGACCTGTGC CAGGATAGCA GCAATGTCAG 11520
4502 CGGACCATGG ATGGAAGAGG CGGCACTGGC GACGGTCCTC AGTTTTGCGG TTTCCGCGGG 11580
4503 GCGTAGGCGC AGTAATCGGC GGCAGCAACA GTGGCGGCAG CAGAAGGGAA TGTGTATCTG 11640
4504 CAGTCGCCGA ATGGCAATTT CCTGCCCAGC TGTAATGGAC CGACAAATGT TTTTTGGCAT 11700
4505 GTCGACCTGT AAGAAAGAAG CAAGGATAAG TTTTTTCTTT ACAAGATTGT ATATGAATTT 11760
4506 GTATTTACGG ACAACTGGCT TGTTTCCTGT CGACGATAAA TGGCGCTTCA TGTTTTCACT 11820
4507 CTGCCAAAAT CTGAGTGCAA GCATCGGGGC TGACGGGCCG AATTTGCTGA TGCCTTGTAC 11880
4508 ATGCTAGCAT CTTTATGCCG CCGTGTAATT TTGCGACAGC AAAACACATG ATGGAGAAGA 11940
4509 CGAAGGTGAT CGATGGCGCC CGGATGACGG ATGCAGGCCC GTGCTACCCA CTGGTCCGTT 12000
4510 GCCAGGACAG CAGCGTTTCA ATTATGCGAA CAGAGGCACT GGAGCCACTT CTCAGGCGAT 12060
4511 AGGGATCATG AGGCGACGAC AACTCGCCAG CAGCAGTAAC AACAACAGCG GCAGCAGCGA 12120
4512 TCTCGGACTT GCTGAACATT GCGGCTTTTT CCCAGCCTGG ACCGTCATCA CAAACGCTCT 12180
4513 CAAAGATCGG TGCGCCTGCA GCCTACGGAA GCGTACAACT GCCCAAAGTC GTGCTATTGC 12240
4514 ATAATGTTAG GTGTCCTGGC TGCTCCGGCG GATGAGCTCC ACCCGATTGA GAGAGGTAAG 12300
4515 AAGGCCCAGC AAGTCGCCCT TAAATAAAAG AAACAAGCAT TAGACTCGGC TGAAATTGTA 12360
4516 ACATCAGTCA GACTGTACTC ACGCATGCAC TTAGACAAAC CGAAGCCTAT TCTATTGACG 12420
4517 ACGCGGACTC CAACACATGT TTTCCTCCAC AAAAGGCTGT GAGTGCACCA AAGTTGACGG 12480
4518 GCCACGCCGG CCGATGCTTG CTGCATACCG GCATCTCCGC AGCAGCGACG TTACAAGCAC 12540
4519 CACTAAAATT AGAAAGAGGC TTACTATAGG CAAAGCGCAG AAAAACAAAT ATTACAATAA 12600
4520 GAAATAGCAC GCGATTTTTC TGCTTCGTTT CCGCTTGGTA CAAGTGAGAC CATTCTCCCT 12660
4521 ATATGCCATT CTAGTATATT TGCCCGATAA GCGATATGCT GGCGGCAAAA AAAAAAGATA 12720
4522 ATAGCCGATA AGCCCGCCAA AAAAAAAGCG CGAAATATCG ATAACGAGCT GGCACGAAAA 12780
4523 TTGCTGGCAT ATCGATCAAC CGCTGTGTCT TTGAGCTATC GAAAAAGCCC GCCTACGCGC 12840
4524 CTAGCCCAAA TTTGCAAGTC AGTTGAGATT ATAAAACCGA CAGAGGCGCG CGCCGAACAG 12900
4525 TAGCTAAAAG TGAAGCCAGC AGCAACAACA ACAACTAATG GACGGCCAGA ACGTGAACCA 12960
4526 AAGCGGAGGA TGGGCATTGG TCTTATCCAT CTCATCGGAC GATGGTAACT GCTCATCCTT 13020
4527 GCCGCCATAG TCTCATCGCT GGATATCAAG TCATCGCTCA ACTATACCTT AAAATTACTC 13080
4528 ACCAAAACTC TTTTCTCCTT TTCCATAAGA TAAAGTAAAG TAAAGTAATG TAAAGTAAAG 13140
4529 TAAAGTAAAT TAAAGTAAAG TAAAGTAACG TAAAGTAACA TAATATTTAA ATTTAAATTC 13200
4530 TACACTTGAA CAATGGCGCG CAAAACTGCC GCAATGTAAT TCAAAAATGT CTCCCGCAAA 13260
4531 TTTAAAACAT AGATTAATAC TTGTAAGTAT GGCGCGCATA TCTGCGGCCA AGAAATCCGA 13320
4532 AAATGTAATT TGCCACAAAT TGTCACTATA TATTTTTAAG CAAAAATCAG AGGACAATAA 13380
4533 ATGCCAACGT CATTAGACGT TGAAAATATT CAAAAAAAAA AAAA 13424
4534 //
4535 ID DM14101 standard; DNA; INV; 10654 BP.
4536 XX
4537 AC U14101;
4538 XX
4539 DR FLYBASE; FBte0001207; Dmel\TART-B.
4540 XX
4541 FT source U14101:1..10654
4542 FT SO_feature non_LTR_retrotransposon ; SO:0000189
4543 CC telomeric retrotransposon
4544 FT SO_feature direct_repeat ; SO:0000314:1..1046
4545 FT SO_feature direct_repeat ; SO:0000314:9031..10076
4546 FT SO_feature five_prime_UTR ; SO:0000204:1..961
4547 FT SO_feature three_prime_UTR ; SO:0000205:7386..10637
4548 FT SO_feature polyA_signal_sequence ; SO:0000551:10479..10484
4549 FT SO_feature polyA_signal_sequence ; SO:0000551:10600..10605
4550 FT SO_feature non_LTR_retrotransposon_polymeric_tract ; SO:0000433:10638..10654
4551 CC derived from polyA tail of RNA transposition intermediate
4552 FT SO_feature CDS ; SO:0000316:962..4093
4553 FT SO_feature start_codon ; SO:0000318:1..3
4554 FT /name="Dmel\TART-element\gag"
4555 FT /db_xref="FLYBASE:FBgn0014071"
4556 FT /db_xref="SPTREMBL:Q23999"
4557 FT /db_xref="GI:603663"
4558 FT /db_xref="NCBI_PROTEIN:AAC46493.1"
4559 FT /translation="MDGHNGDQSEGWATVLSISSDDSNSLSSPPSIIVSSLDTTPTSHE
4560 FT TTIVRRSLYQTNADMKSYDFENIVLNENKNTILPDPLFVDKCGSTANTTEANEKKPANS
4561 FT PFPISISKNFSTSSPLTHVDTPTQEDDASAFNTLKAAKTARIIFPTHTHIKPTKPSPPS
4562 FT KELSTNSALKTLSYTDKITGTQKNLPDKTHVDTPTQDDDINATKASKTAKIISTQTHLG
4563 FT ETKPIQPAKDPSPRTQKPIAHKADETLTHTDKLTASQNLVPAKTHINTPTQYNDTNATN
4564 FT ALKTAKINFSSHSHQSEIKPTQSAKNISPLTQKQFTSESAGTHTHTDKHKNTASQNLFS
4565 FT AKTHINSPTQHNYTSAATASKTAKLILSPHSHLSETKPTQPALSPSPLSQKQITSIAAK
4566 FT TLTHTNKHTASQNFIPAKTHINIPTQYNDTNATKALKTAKAASPSHTYSRQTKPIKSAI
4567 FT NALHPAQDTNPSPAISAVTYTDKPTATQNIFPVKTFAELVRENAKRLPTPMQNSHQAKN
4568 FT DSAALGRPPTAARKNLNKTLISPKTPGKRRGDCLDEGLLQTSNKKVRIRDDFSDDDLGV
4569 FT TNLLSETPLFKSKAAIKIRQDSRRDSLQKSAEMDTAPAISPSNTAADSDLPPWKTVPAS
4570 FT RKPPSIFLSNIQQIIPLIEKLNYKAGVNSFTTKSELGNNIRIQAKTMDAHNAIQNVLLE
4571 FT ANIPLHSHQPKSAKGFQIVIRHLHQSTPTKWIESQLQDIGIATKFIRAMQFRDTRNPMR
4572 FT IHEVEVVPKADGSHLKVLLLKSLGGQTVKVERKRVSKDPTQCHRCQCFGHTKNYCRNPF
4573 FT KCMKCGQLHATVSCTKPKNLPATCANCNGSHVSSYKGCPAFQEAKQRLSINKIQSLHSQ
4574 FT PTHLQTPRNKHPYPKPTHLQTPRNKQPYTHPLPRTSVNNTKLPAKRIQGKKISQRNLSI
4575 FT NKRLHRMKKPRKETSPPTTSKKVLASLEESRKNPNSVLNPANTHLTHFRPPPLAQNIPN
4576 FT DEPKELSGEQYLLNRIEGMEKKINNLLEIVTRLLRQGKDCPKSPKNPFRDPIFV"
4577 FT SO_feature CDS ; SO:0000316:4131..7385
4578 FT SO_feature start_codon ; SO:0000318:1..3
4579 FT /name="Dmel\TART-element\pol"
4580 FT /db_xref="FLYBASE:FBgn0014072"
4581 FT /db_xref="REMTREMBL:AAC46494"
4582 FT /db_xref="GI:603664"
4583 FT /db_xref="NCBI_PROTEIN:AAC46494.1"
4584 FT /translation="MTRADNRDILKIAFWNAGGINNKIDELKLFILNIDAHIIIVTETR
4585 FT LDNNSTKLELPGYFTYLAQNPVSSKRGGVATIVNSSIRHMALKPIEKECIQSAPIVLLP
4586 FT ENNRRSEMIVIASVYCPPSLRWLPHHFTDVLNFAEKTLGGQTKFILCGDWNAKHRQWGC
4587 FT TRACQRGTALYEAVQADSTAEIIATGCATHFPHDTRKNPSAIDFSICKGLGRFEKRISS
4588 FT GADLSSDHLPILLEINLDTNTLFLQKQNNNILKKNTNIELFKKVLERKILLNTEIRVAE
4589 FT DINDAISTFMKNIKDSAAESTPSPRIRDNPRRRHRQANRNSHTLALDENTSRLLEEKRI
4590 FT LSRVFKATKNYEDKAKLKAAENRLKKAIKILRENRINEQVEGIDTSNPDRMRKMWKLLD
4591 FT EGKRTNQPNFPLKLETQKGPKWTKTIKETTETFVSHLEGRFKPNNNVPDYHIDRVNTGL
4592 FT RIIKESMLTERHNLNKNPHNQPITLKELNDEIKNLKNSKAPGKDLITNQLIKTLPTKAT
4593 FT LYLILIYNSILRLGYYPEAWKHAQVKMILKPGKSANEPRSYRPISLLSGLSKIFERLLL
4594 FT KRLFKVDLFKKAIPLHQFGFRKEHGSEQQIARVTQFILEAFERKEYCSAVFLDISEAFD
4595 FT RVWHEGLLLKLAKILPYNLYIILESYLTNRTFEVKDQAGETSRTGQIGAGVPQGSNLGP
4596 FT LLYSIFSSDMPLPYIYRPSPTERIMLSTYADDTIVLSSDTLATAATRNNENYLKSFSDW
4597 FT ADKWGISVNAAKTGHVIFTLKNDLPTSLRTMKIKGQVIKIESKQSYLGVILDSKLTLSS
4598 FT HVTKLMGKYTTAYRKMTWILNRRSKLPTKTKMLILKSVLSPIWQYAIAAWGPLVTDAQI
4599 FT RRIQVEENRKMRDICRAGRYTSNQTIRDRYGIKTVEEFYQQALHRFSETIKSHPNIAVR
4600 FT RIFTRHYIPNRLERSRQRYLKMTNEHITQKQTGQTLSPKLLKIPDLNDCRTLKKRNERD
4601 FT KIRQTHLIELPTLLRLEEEEEELRRIKKQEERERREKETQKWPPDRWCELEINLYNKQY
4602 FT RRGDLTRQEIIQKFRGQPLNVQRIILPDYKGDQEHN"
4603 XX
4604 CC A PNTR (Perfect Non-Terminal Repeat) is a perfect direct repeat partially
4605 CC overlapping the UTRs (annotated as "direct_repeat ; SO:0000314").
4606 CC Distinguishing characteristics of PNTR’s are that the 3’ repeat terminates
4607 CC upstream of the 3’ end of the element and that the 5’ PNTR extends a short
4608 CC distance into ORF-1. The 5’ ends of TART-B elements are variable and the
4609 CC minimal size for functionality has not been determined. Thus, this
4610 CC canonical sequence, U14101, may be 5’ truncated within the 5’ PNTR (M-L
4611 CC Pardue, 2009).
4612 XX
4613 CC Derived from U14101 (g603662) (Rel. 42, Last updated, Version 1).
4614 CC Takis Benos and Michael Ashburner, 20-Aug-1997; updated Jan-2009 as per
4615 CC Mary-Lou Pardue and Greg DeBaryshe.
4616 CC Any changes to original sequence record are annotated in an FT line.
4617 XX
4618 SQ Sequence 10654 BP; 3669 A; 2717 C; 2036 G; 2232 T; 0 other;
4619 GATCCGGCCG GATGGCAGCT CGACGACGGT AGCAGGCCAC CATGCCCGCC AGCCCGCAGC 60
4620 TAGGATAGCA GCAACATCAG CGTCTTATTA ACGCGAACGG CGGCACTGGC CCTTAGCTGA 120
4621 CCAGCTGCAA CAACATCAGC GACGCAGTCT CCACCAGCAG CAACAACAGC AGCGGCGCTT 180
4622 GCGACAGCAG CAGCAGGGAA TGGTTCTGCC GCAGTCGCCT ATTGCTGCCT ATAAAGAGCA 240
4623 TTCCTTGCCA ATTGGCTTTC TGTACGACGA CGATGATCCT GCGGACAAAT CCACCTTTCC 300
4624 GGACGCCTGA GTATTATGGC GAGCCTGCTG ATCATTGTTT CTCCGACTCC TTACTTGACC 360
4625 ACTGGACAAT CATACAATCA CCGGCTTTTC ACATCTGGAA GAAAGAAACC TGGATTAGTA 420
4626 TTTGCCCTTC AGATTTGTAT GAAACTGCAT TTCTGGCCAA CCGGAGTGTT TCCTGCAGAC 480
4627 GACGCTGGAC TGCGACGCAC TTTTTTCTAC CAACACAGAT GGGACGCTTG CATCAGATCT 540
4628 GACGGGCCAG ACTGGCCGAT GCCTGGTACA CGATGGCATC TCCGCGGCGG CGAGATGTGC 600
4629 AGCGACGCTG AAAGCAATAA TAATTCTTTT ACTTTGCAGT ATCAAAAATG AGAAGCCACA 660
4630 TCACAATTTA CATCAGCAAA AATTACACGT GATATCTTTT TCTTTTGCCT AGGAGTAGTG 720
4631 AGACCTGCTA CCAAAATGAC CAGTAATACC GGCTAACGGA AGCGAGATAT CGATAATCAT 780
4632 TCTGGCGGTA AAATAGCCAG AACATCGATA ACCAGCTGTG CATTTTCCCT TCGATTTATC 840
4633 GAAGTCAAAT AGCCCGCCTA GGCTATCGGA CCGGATCGGC AAGTCAGTAG TGATTAAAAA 900
4634 TCCGGCAGAG GCGCCTGTGC AGCAGCTACC CAAAGTGAAC ACGACGAAAC GCAACAACAA 960
4635 AATGGACGGA CATAATGGAG ATCAAAGTGA AGGATGGGCA ACAGTGCTAT CTATCTCCTC 1020
4636 GGATGATAGT AACTCCTTGT CGTCGCCGCC GTCTATAATA GTTTCATCGC TGGACACCAC 1080
4637 GCCAACTTCG CACGAAACCA CCATAGTAAG AAGAAGCCTA TATCAAACAA ATGCTGACAT 1140
4638 GAAATCTTAC GATTTTGAAA ATATTGTATT AAATGAGAAT AAAAATACCA TATTGCCAGA 1200
4639 CCCTTTATTT GTTGATAAAT GCGGGAGTAC TGCTAATACC ACAGAAGCCA ATGAAAAAAA 1260
4640 GCCTGCCAAT AGCCCCTTCC CCATTTCCAT TAGCAAGAAT TTTAGCACTT CCTCGCCACT 1320
4641 AACACATGTA GACACGCCTA CACAAGAAGA TGACGCCAGT GCGTTCAATA CATTGAAAGC 1380
4642 AGCTAAAACA GCTAGAATAA TTTTTCCCAC ACACACACAT ATAAAGCCCA CCAAACCCTC 1440
4643 GCCCCCCTCC AAAGAATTAA GCACAAACTC AGCACTAAAA ACTCTCAGCT ACACAGACAA 1500
4644 AATAACAGGA ACACAGAAAA ATCTACCCGA CAAAACACAT GTAGACACAC CTACACAAGA 1560
4645 TGACGACATT AATGCAACCA AAGCATCAAA AACCGCTAAA ATAATTTCTA CACAGACACA 1620
4646 CCTAGGTGAA ACCAAGCCAA TACAGCCCGC CAAAGACCCC TCACCCCGCA CCCAAAAGCC 1680
4647 TATTGCACAC AAAGCTGACG AGACACTTAC CCACACAGAC AAACTCACAG CATCACAAAA 1740
4648 CCTCGTTCCC GCCAAAACAC ATATAAACAC ACCCACACAA TATAACGACA CTAATGCAAC 1800
4649 CAATGCATTA AAAACCGCTA AAATAAATTT CTCTTCACAC TCACACCAAA GTGAAATCAA 1860
4650 GCCAACACAG TCCGCCAAAA ACATTTCACC CCTCACACAA AAGCAATTCA CAAGCGAATC 1920
4651 AGCCGGGACA CACACCCATA CAGACAAACA CAAAAACACA GCATCACAAA ATCTCTTTTC 1980
4652 CGCCAAAACA CACATTAACT CACCCACACA ACATAACTAC ACTAGTGCAG CCACAGCATC 2040
4653 AAAAACCGCT AAATTAATTC TCTCCCCACA CTCACACCTA AGTGAAACCA AGCCAACACA 2100
4654 GCCCGCTTTA AGCCCCTCGC CCCTCTCCCA GAAGCAAATA ACAAGCATAG CAGCCAAGAC 2160
4655 ACTCACCCAC ACAAACAAAC ACACAGCATC ACAAAACTTT ATTCCCGCCA AAACACATAT 2220
4656 AAACATACCC ACACAATATA ACGACACCAA TGCAACCAAA GCATTAAAAA CCGCAAAAGC 2280
4657 AGCTTCTCCC TCCCACACAT ACTCACGTCA GACAAAACCA ATAAAGTCCG CCATAAACGC 2340
4658 ATTGCATCCC GCCCAAGACA CAAACCCAAG CCCAGCAATC AGTGCTGTCA CTTACACAGA 2400
4659 CAAACCCACA GCTACTCAGA ATATTTTTCC TGTCAAAACT TTTGCAGAGC TGGTTAGGGA 2460
4660 AAATGCAAAA CGCTTACCAA CTCCAATGCA GAATTCCCAT CAAGCTAAAA ATGACTCTGC 2520
4661 CGCTCTCGGA CGCCCCCCGA CTGCAGCTAG AAAAAATCTA AATAAAACAC TGATTTCTCC 2580
4662 TAAAACTCCT GGGAAGCGCC GTGGGGACTG TCTTGATGAA GGCCTACTAC AAACCTCTAA 2640
4663 CAAAAAGGTT AGAATACGCG ATGACTTCTC TGACGATGAT CTTGGGGTCA CAAATCTACT 2700
4664 CTCTGAAACA CCCTTATTCA AAAGCAAAGC AGCTATCAAG ATCCGGCAAG ACTCGAGAAG 2760
4665 AGATTCCCTG CAGAAGTCAG CCGAAATGGA CACAGCTCCA GCAATTAGTC CCTCAAACAC 2820
4666 AGCAGCCGAT TCCGACCTAC CGCCCTGGAA AACTGTTCCA GCTAGCAGAA AACCACCATC 2880
4667 AATCTTCTTG TCCAATATAC AGCAGATTAT CCCGCTAATA GAAAAACTAA ACTATAAAGC 2940
4668 CGGGGTAAAT AGCTTTACCA CCAAATCTGA ACTTGGCAAC AATATTAGAA TCCAGGCTAA 3000
4669 AACGATGGAC GCCCACAATG CAATTCAGAA TGTTCTCCTT GAGGCAAATA TTCCCCTACA 3060
4670 CTCCCACCAG CCAAAGAGTG CAAAGGGCTT CCAAATTGTA ATTAGGCACC TCCACCAGTC 3120
4671 AACCCCGACC AAATGGATTG AAAGCCAACT TCAAGACATC GGTATAGCTA CAAAATTTAT 3180
4672 CAGGGCAATG CAGTTTAGGG ACACGAGAAA TCCTATGCGC ATTCATGAGG TTGAAGTTGT 3240
4673 ACCCAAGGCT GACGGCAGCC ATCTCAAGGT CCTGCTACTA AAATCCCTTG GAGGTCAAAC 3300
4674 GGTCAAGGTT GAAAGGAAAC GGGTATCGAA GGATCCCACA CAATGTCATC GCTGCCAATG 3360
4675 TTTTGGGCAC ACAAAAAATT ATTGTAGAAA CCCGTTTAAA TGTATGAAAT GTGGCCAGCT 3420
4676 GCACGCCACG GTTTCATGCA CTAAACCCAA AAACCTTCCG GCTACTTGTG CAAACTGCAA 3480
4677 TGGAAGCCAC GTAAGCAGCT ATAAAGGATG TCCCGCTTTC CAAGAAGCAA AGCAAAGACT 3540
4678 ATCTATCAAC AAAATTCAAT CCCTACACTC ACAACCCACG CACCTTCAGA CCCCCCGCAA 3600
4679 TAAACATCCC TACCCAAAAC CCACCCACCT TCAGACGCCC CGCAATAAGC AGCCCTACAC 3660
4680 ACACCCCCTC CCTCGCACAT CAGTAAACAA CACAAAACTA CCTGCCAAAA GAATCCAAGG 3720
4681 AAAGAAGATA TCGCAAAGGA ATCTATCTAT AAACAAACGC TTACACAGAA TGAAAAAACC 3780
4682 GAGGAAGGAG ACAAGCCCGC CGACAACTAG CAAAAAGGTC TTGGCCTCTC TAGAAGAAAG 3840
4683 CAGAAAAAAC CCAAATAGCG TCCTAAACCC GGCCAACACC CATCTCACTC ATTTCCGCCC 3900
4684 ACCCCCTTTA GCACAAAATA TTCCTAATGA CGAACCTAAG GAGCTGAGTG GGGAGCAATA 3960
4685 CCTTCTAAAT CGCATTGAAG GGATGGAAAA GAAGATCAAC AACCTTCTTG AAATCGTCAC 4020
4686 CCGCCTACTA AGACAAGGAA AAGACTGTCC AAAGTCTCCA AAAAATCCTT TCCGAGATCC 4080
4687 AATCTTCGTG TAAATGCTCT TTCTAGTAAC ATCAGAAAGT GACGTTTCCT ATGACTCGGG 4140
4688 CTGACAACAG GGACATCCTT AAAATCGCTT TCTGGAATGC TGGTGGGATT AACAATAAAA 4200
4689 TAGATGAGCT TAAGCTGTTC ATTCTAAATA TTGATGCCCA CATAATCATA GTCACCGAAA 4260
4690 CTAGACTAGA CAACAATTCT ACCAAACTAG AGCTGCCAGG ATATTTCACA TACTTAGCCC 4320
4691 AAAATCCTGT CTCTAGCAAG AGAGGAGGGG TCGCTACTAT AGTAAACAGC AGTATCCGAC 4380
4692 ACATGGCCCT AAAACCGATC GAAAAAGAAT GCATACAAAG CGCCCCAATA GTCCTGCTGC 4440
4693 CTGAAAACAA CAGACGCAGC GAAATGATAG TAATAGCATC TGTCTACTGT CCGCCCTCGC 4500
4694 TAAGGTGGTT GCCCCACCAC TTTACTGACG TTCTCAATTT TGCAGAGAAA ACTTTAGGAG 4560
4695 GGCAGACCAA GTTTATCCTA TGTGGCGACT GGAATGCAAA ACATAGACAA TGGGGTTGTA 4620
4696 CACGCGCCTG CCAACGTGGC ACCGCACTCT ACGAAGCAGT CCAAGCCGAC TCCACTGCAG 4680
4697 AGATCATTGC CACTGGCTGT GCTACACATT TCCCACATGA CACAAGAAAA AACCCGTCAG 4740
4698 CAATAGATTT CTCCATTTGC AAAGGGCTTG GCAGGTTTGA AAAAAGAATT TCTTCAGGGG 4800
4699 CGGATCTATC CTCAGACCAT CTTCCCATCT TGTTAGAGAT AAACCTAGAC ACAAACACCC 4860
4700 TCTTCTTGCA AAAACAAAAC AACAATATAC TCAAGAAAAA TACAAACATC GAGCTGTTTA 4920
4701 AGAAAGTTCT AGAAAGAAAG ATACTATTAA ACACTGAGAT AAGGGTAGCA GAAGATATAA 4980
4702 ATGACGCCAT AAGCACCTTT ATGAAAAACA TCAAGGACTC GGCTGCGGAA TCAACTCCCT 5040
4703 CCCCAAGAAT ACGTGACAAC CCCAGAAGAA GACATAGGCA AGCCAACAGA AACAGTCATA 5100
4704 CCCTCGCACT AGACGAAAAC ACAAGCAGAC TGCTTGAGGA AAAACGCATA TTAAGTAGAG 5160
4705 TTTTCAAAGC TACCAAAAAT TACGAGGACA AAGCTAAACT AAAGGCAGCT GAAAACCGAC 5220
4706 TAAAAAAAGC GATAAAAATA TTGAGAGAAA ACAGAATCAA TGAGCAAGTT GAAGGAATAG 5280
4707 ATACAAGTAA CCCGGACAGA ATGAGAAAAA TGTGGAAACT GCTAGATGAA GGGAAAAGGA 5340
4708 CAAATCAGCC TAATTTTCCC CTCAAATTAG AAACCCAAAA AGGACCCAAA TGGACAAAAA 5400
4709 CGATTAAGGA GACAACAGAA ACATTTGTCT CCCACTTGGA AGGAAGATTT AAGCCAAACA 5460
4710 ATAATGTACC TGATTACCAC ATAGATAGAG TCAATACTGG ACTAAGAATA ATTAAGGAAA 5520
4711 GCATGCTAAC TGAACGACAT AATCTGAACA AAAACCCCCA TAACCAACCT ATTACTCTAA 5580
4712 AGGAATTAAA TGACGAAATA AAAAACTTAA AGAATAGTAA AGCACCGGGA AAAGACCTTA 5640
4713 TAACAAACCA GCTAATAAAA ACCCTACCGA CTAAAGCTAC CCTTTACCTT ATCCTAATCT 5700
4714 ATAACTCCAT ACTTAGACTA GGATACTACC CAGAAGCCTG GAAACATGCG CAGGTAAAAA 5760
4715 TGATTCTCAA GCCAGGGAAA AGTGCAAACG AGCCAAGGTC ATATAGGCCG ATTAGCCTAC 5820
4716 TCTCGGGACT CTCAAAAATC TTTGAAAGAC TACTCTTAAA AAGACTTTTT AAGGTAGATT 5880
4717 TATTCAAAAA AGCTATTCCT CTGCACCAAT TTGGCTTTAG AAAAGAACAC GGATCGGAGC 5940
4718 AGCAAATAGC CAGGGTCACC CAGTTCATTC TTGAGGCCTT CGAGAGAAAG GAATACTGCT 6000
4719 CCGCGGTCTT CCTTGACATC TCTGAGGCTT TCGACAGGGT ATGGCACGAA GGCCTTTTAC 6060
4720 TTAAATTAGC TAAGATCCTA CCTTACAACT TGTACATTAT ACTGGAGAGC TACCTAACAA 6120
4721 ATAGAACGTT CGAAGTTAAA GACCAAGCTG GAGAGACTTC GAGAACAGGA CAAATTGGTG 6180
4722 CTGGTGTGCC TCAAGGAAGC AATCTTGGAC CACTACTCTA CTCTATCTTC TCCTCAGACA 6240
4723 TGCCCCTTCC ATATATCTAC CGCCCCTCAC CAACAGAAAG AATCATGCTC TCAACATACG 6300
4724 CAGACGACAC TATAGTCCTC AGCTCAGACA CACTAGCAAC TGCCGCTACA AGAAACAACG 6360
4725 AAAACTACCT CAAGTCATTC TCGGACTGGG CGGACAAATG GGGTATATCA GTAAACGCTG 6420
4726 CTAAAACCGG ACATGTCATT TTTACATTAA AAAACGACTT ACCTACAAGT CTAAGGACTA 6480
4727 TGAAGATCAA GGGTCAAGTA ATAAAGATTG AAAGCAAACA ATCATACCTT GGCGTAATCC 6540
4728 TTGACAGCAA GCTAACCCTC AGCTCCCACG TCACAAAGCT GATGGGCAAA TACACTACAG 6600
4729 CCTACAGAAA AATGACATGG ATTCTAAACA GAAGAAGCAA ACTCCCTACC AAGACTAAAA 6660
4730 TGCTGATCCT TAAGTCAGTC CTTTCACCAA TATGGCAGTA TGCCATAGCA GCTTGGGGTC 6720
4731 CCCTTGTGAC GGATGCACAG ATAAGACGGA TCCAAGTCGA GGAAAATAGG AAAATGAGAG 6780
4732 ACATATGCAG AGCGGGTAGA TACACGAGCA ACCAAACTAT AAGGGACCGC TATGGAATCA 6840
4733 AAACAGTAGA AGAATTCTAT CAACAGGCAC TCCACAGGTT CTCAGAAACA ATAAAATCTC 6900
4734 ACCCAAATAT AGCTGTACGC AGGATATTCA CAAGGCACTA TATCCCGAAC AGACTAGAAA 6960
4735 GAAGCAGGCA GAGGTACTTG AAAATGACAA ATGAACACAT CACGCAAAAA CAGACTGGAC 7020
4736 AAACACTCTC ACCTAAACTC CTAAAAATCC CTGATCTAAA TGACTGCAGA ACCCTTAAAA 7080
4737 AGCGGAATGA AAGAGATAAA ATAAGGCAAA CCCATCTAAT TGAACTCCCC ACCCTGCTGA 7140
4738 GACTAGAGGA AGAAGAGGAA GAGCTTAGAA GAATAAAAAA ACAGGAAGAG AGGGAAAGAA 7200
4739 GGGAAAAGGA AACCCAAAAG TGGCCTCCAG ACAGATGGTG TGAATTAGAA ATTAACCTAT 7260
4740 ATAATAAGCA ATATAGAAGG GGCGATCTAA CCAGGCAGGA AATCATACAA AAATTTAGAG 7320
4741 GACAACCACT AAATGTACAG AGGATAATTT TACCCGACTA TAAAGGAGAC CAGGAACACA 7380
4742 ATTAAAAGTA AATCATGGGA AAGCAGGGGA AAAAAAACAG AAGTAACAAA ATGGCGGAAG 7440
4743 GGGTGGCAAA ATATATATAA AAATAAGAAA AGATAGAAAT AAAAAGGCTA AAGGCTCACT 7500
4744 TACAGGTTAA TTCAAAAGGG AAACGTGCTT ACATATCTAA TGGTAAAAAC TAACTTATAA 7560
4745 CACCTACTGG ATGACATAGT GAGGATGCCA CAGGTTGCGC ACTTGAATCA CGCTTTCCTG 7620
4746 GCGAGATTGT TAAGGCATCA CCGGGATCCC GTCTCTCTTT CCTAACTGGA GGACTCATGC 7680
4747 CTGAAATCTT TTCCGCTTCA CCGGCACCTG ATGGCCATAT CTGCTACTGC GCCTTGCGTC 7740
4748 CACGGACGCT CCTTCCTGAA AGAAAGAGAA TTTGTTTTAG TTTTCCTTTC TCTTCTTAAA 7800
4749 AATATAACAA AAACAGCAGC AGTAGCCGAC CAACAACATA CTTAGCTTAC CAAGGCAGCA 7860
4750 GCAATGATAC CAACAGAAGC CCTACAGTGT GCTGAACAAT ATGCCGCCCA CGCCCACCAC 7920
4751 TTCTGGAACT CAGGAATGGG GGGTACGGAA TGCCGGAAAC TGGAGGATTC GCCTCAAATG 7980
4752 TTACGCTTAC ATCTTTGAGC AAATCGCCTG CCTCCTCGTC TAACGGCCCG GCGTCTTGGT 8040
4753 ACGCCCAGAA GTAGCAGCGG TAGCAGGATT AGCAGCCTCC ACAGAGATAT GTTCATCCCA 8100
4754 GCATCAGTCC AGTTGGCATT GTGATGCCGC CGTAGCGTAC GCCCTCAGAG ACCCGACTGG 8160
4755 AATCCCAGGA CAAGAGACGG CAGCACGCCT GGGCTTAGGC GCGGGACAAC ATGCAGAGAT 8220
4756 TCGTCAATGA GAATGGCGGC ACTGGAATCA CCTTTCAGCT GAGCGGGATA ATGAGTCGGC 8280
4757 AACGCACCGC ACTATCAGCA GCAATAACAA CATCGGCAGA TGACCTGGAA GAAAGGAAAA 8340
4758 AACATGTATC AGTCTTTTCT TTTCTTTTTT TTTCCCATTA GCATGCGTTT TTAAATTCCA 8400
4759 TTCCTGAAAA CCGGCGTTTT CCTGTAAAAG ACACTGGACG GCGGCGTTTG TTTTAAATGC 8460
4760 AAAGATTGGA TGCTTGCATC AGGGCTGACG TCCTTGAATA GCCGATGCCT TGTAATTGCC 8520
4761 TGCATAGCCG CGGAGGTCCT GATGACGGAT GCTGGCCTGT ATTTGGCCAC CACTCCGATG 8580
4762 CCATGACAGC AGCAACAGCA GCGGTTTTTG CAAATGAGAG GGATCAGGAG GCGGCAACAC 8640
4763 ATTCACCCGT AGCAGCAACA ACAAGCAGTG GTAGCATCAG CAGGGAGTCT TCTCGCCACA 8700
4764 ATAGCCATTT GGAAATTTCT CGACGACCCG ACTTCCTGCT TGGCCCATGG TCAATCACAC 8760
4765 TGGACCAGTT AACAGCGGCG TTTTACCCTG GAAGAAAGAA AACTTGTATT ATTCATTCCC 8820
4766 TTTTCTCTCA CAGTTGGGTA TTTAAGTGCA TTCCTGGCCA ACCTAGCGTG TCTCCTGGCA 8880
4767 ATGACGTCGG ACTCAACGCA TGCTTCCCTT CCGACACAGT AAGGATGTTC GCATCTGGGC 8940
4768 TGACGGGCCA GGCCGGTCCG TTGCCATACA TGCTAGCGTT TCCGCGGCGG CGTAGTGAAC 9000
4769 ATCAAACCGT ATAATGGCGA AGACGACGAT GATCCGGCCG GATGGCAGCT CGACGACGGT 9060
4770 AGCAGGCCAC CATGCCCGCC AGCCCGCAGC TAGGATAGCA GCAACATCAG CGTCTTATTA 9120
4771 ACGCGAACGG CGGCACTGGC CCTTAGCTGA CCAGCTGCAA CAACATCAGC GACGCAGTCT 9180
4772 CCACCAGCAG CAACAACAGC AGCGGCGCTT GCGACAGCAG CAGCAGGGAA TGGTTCTGCC 9240
4773 GCAGTCGCCT ATTGCTGCCT ATAAAGAGCA TTCCTTGCCA ATTGGCTTTC TGTACGACGA 9300
4774 CGATGATCCT GCGGACAAAT CCACCTTTCC GGACGCCTGA GTATTATGGC GAGCCTGCTG 9360
4775 ATCATTGTTT CTCCGACTCC TTACTTGACC ACTGGACAAT CATACAATCA CCGGCTTTTC 9420
4776 ACATCTGGAA GAAAGAAACC TGGATTAGTA TTTGCCCTTC AGATTTGTAT GAAACTGCAT 9480
4777 TTCTGGCCAA CCGGAGTGTT TCCTGCAGAC GACGCTGGAC TGCGACGCAC TTTTTTCTAC 9540
4778 CAACACAGAT GGGACGCTTG CATCAGATCT GACGGGCCAG ACTGGCCGAT GCCTGGTACA 9600
4779 CGATGGCATC TCCGCGGCGG CGAGATGTGC AGCGACGCTG AAAGCAATAA TAATTCTTTT 9660
4780 ACTTTGCAGT ATCAAAAATG AGAAGCCACA TCACAATTTA CATCAGCAAA AATTACACGT 9720
4781 GATATCTTTT TCTTTTGCCT AGGAGTAGTG AGACCTGCTA CCAAAATGAC CAGTAATACC 9780
4782 GGCTAACGGA AGCGAGATAT CGATAATCAT TCTGGCGGTA AAATAGCCAG AACATCGATA 9840
4783 ACCAGCTGTG CATTTTCCCT TCGATTTATC GAAGTCAAAT AGCCCGCCTA GGCTATCGGA 9900
4784 CCGGATCGGC AAGTCAGTAG TGATTAAAAA TCCGGCAGAG GCGCCTGTGC AGCAGCTACC 9960
4785 CAAAGTGAAC ACGACGAAAC GCAACAACAA AATGGACGGA CATAATGGAG ATCAAAGTGA 10020
4786 AGGATGGGCA ACAGTGCTAT CTATCTCCTC GGATGATAGT AACTCCTTGT CGTCGCTGCA 10080
4787 TATATAAAAT AATAAATTTC TTAAAATAAT TTCATCGCTG GATTCCTGCG CCACCATAAA 10140
4788 TTACTTATAG AATACACTTA ACACTGTACC CACTAATGCT AAAAATTTTC TTATACAATT 10200
4789 TTACTTTAAA GCTAAAACTA CTTAAACTAT GGCGCGTAAA ACGGCCGTCA AAAATATCCA 10260
4790 AAAATTGTAC TTGCCATAAA CAAATTCTAA CATAATGTAA ATCCTAAATC GTAAAATCAT 10320
4791 GGCGAACATA ACCGCCGCCA AGCAAATCAA AAAATGTTCC TAGAAATTGT AAATCTTAAA 10380
4792 CCTACTTCTC TAACTAAAGC GCGCACAACT GCCGCTGATC CGAAATTGTA AAATGCCATA 10440
4793 AATTGTAACT ATATATTTTA TAAAAAAAAT CAGAGTACAA TAAAATGACA GCGCCGAAAG 10500
4794 GCACTGAAAA TATTTAAAAA AAAAAAAAAC TGCCGCTGAT CCGAAATTGT AAAATGCCAT 10560
4795 AAATTGTAAC TATATATTTT ATAAAAAAAA TCAGAGTACA ATAAAATGAC AGCGCCGAAA 10620
4796 GGCACTGAAA ATATTTAAAA AAAAAAAAAA AAAA 10654
4797 //
4798 ID TIRANT standard; DNA; INV; 8526 BP.
4799 XX
4800 AC nnnnnnnn;
4801 XX
4802 DR FLYBASE; FBte0000179; Dmel\Tirant.
4803 XX
4804 SY synonym: prygun
4805 XX
4806 FT source X93507:1..2484
4807 FT SO_feature five_prime_LTR ; SO:0000425:1..417
4808 FT SO_feature three_prime_LTR ; SO:0000426:8109..8526
4809 FT SO_feature CDS ; SO:0000316:1866..2999
4810 FT SO_feature CDS ; SO:0000316:3239..6505
4811 FT SO_feature CDS ; SO:0000316:6683..8146
4812 XX
4813 CC Sequence identified by REPBASE:
4814 CC http://www.girinst.org/server/RepBase/RepBase6.6.embl/drorep.ref
4815 CC Assembled and annotated by Josh Kaminker & Michael Ashburner.
4816 CC REPBASE states this to be a consensus sequence.
4817 CC This replaces that from X93507 in versions previous to 4.8.
4818 XX
4819 SQ Sequence 8526 BP; 2961 A; 2097 C; 1384 G; 2084 T; 0 other;
4820 GGAGTTACCA CCCCACCCCC TAAACCCCCA CGCCTCTAAA CAAATCATCG GACACTCAAC 60
4821 CGGGAAGACG GCAACTGGAA CACCGCATCC GGCCGAATGC TGACATTCCG GCCGAATGCT 120
4822 GACATTACAC AAAAGTCGCA CTGCAACATT GTCCCCAGCT AGCCAGCCAC ATGCCGAGTC 180
4823 GGCATGTTCA TTATGCTTAC AATTAAGAAC CTATGTACTT ATGTATAAGA CGAAAACGGA 240
4824 GGACTCGAGT AGCCACTCTC TGACAATAAA CTTGATACTG ATTTTGAACT TCAAGAAAGT 300
4825 CAGTCGTATT CTTTATTGGA AATCTTCACA CTACAACTAT CTGCTGAAAC TTAAAAACCT 360
4826 TCATACATTT ACACATCATA TCTTCACAAA AGGCTCCACC CTCGATCACG GACTTAACTG 420
4827 GCGCAGCCGG TAGGATGTCC TACCTATTAA TAATTACCTA CCTGTAAGTA AACATGTAAG 480
4828 AAACGAAACA AACTATATGC AAGATGTCGA CTGAAAGTGA CTAGGAACAA ATTTTTATAA 540
4829 AACAAAATTG AAGTTGTGAA GTACCAAATG AAACTCAAAC ATATATTCAA ACACAGGAAA 600
4830 AAAAAAGAGA GAGGAAAAAT GTAAAATAAA TAAATATACA AAAAAAAGTG CAAGTGTACC 660
4831 GTACTGCCGC GCTGACGTGG AATCTATCGC TGATCATCAC GCCATCGGTA TGTCCATACT 720
4832 CTGCCGAACG TCATAATTTT TTTAAAAAAG TGCAAGTGTA CCGTACTGCC GCACTGACGT 780
4833 GGAATCTATC GCTGATCATC ACGCCATCGG TATGTCCATA CTCTGCCGAA CGTCATAATT 840
4834 TTTATAAAAA AGTGCAAGTG TACCGTACTG CCGCGCTGAC GTGGAATCTA TCGCTGATCA 900
4835 TCACGCCATC GGTATGTCCA TACTCTGCCA AACGTCATAA TTTTTATAAA AAAGTGCAAG 960
4836 TGTACCGTAC TGCCGCGCTG ACGTGGAATC TATCGCTGAT CATCACGCCA TCGGTATGTC 1020
4837 CATACTCTGC CAAACGTCAT AATTTTTATA AAAAAAGTGC AAGTGTACCG TACTGCTGCG 1080
4838 CTGACGTGGA ATCTATCGCT GATCACCACG CCATCGGTAT GTCCATACTC TGCCAAACGT 1140
4839 CATAAGTTTT TATAAAAAAA AAGAGTGCAA GTGTACCGTA CTGCCGCGCT GACGTGGAAT 1200
4840 CTATCGCTGA TCATCACGTC ATCGGCACTT ACATACGCTG GCCAACGCAT CGCCAAAGCC 1260
4841 TCTATATACA CTTATATATG TGAGCATACA ATATCAACTA CAATCCAATA CATCCACGTA 1320
4842 CTGTACCGCC TCGTTGGCAT GGAATCAAAC GCTGATCACC ATGCCACCGT GGTAAACAAA 1380
4843 CAAAGCACCA AAGCCTCTCT AATACATTGT ACACTCAAAA CGCACACTGC CATACGTCGG 1440
4844 CGAAAAATCA AAACATAAGC AAAAATCATT TCAAACCAAG CGAGGCTCAT TCTGCGTACC 1500
4845 ACAACGACAA CGACACTGCA TGTGTAGTGG CGCACCCATG TCTGGGTAGC CGAGGTAAGG 1560
4846 GGAAAACGCT TGAGTATCGT CAAGTGTTCT TGCCTTTCAC TCTTCTACAA TGGGTTGCTA 1620
4847 CGCTCATGTA TTGCACATTC AAAATAACCA AAACAAATGT ACTAAAGAAG TCGACATATA 1680
4848 CAGATATATT TTGTTTCCTT TCATTGTGTA ATTTTGTATA TCAAACAAAT ACTAATACCA 1740
4849 ATCACATTGC AGAATATAAA AGGGAAAATA TAAAGCCAAA GACAGACACC CATACACTCT 1800
4850 AGTAAACAAG AAATTTGTTC ATTATTTTTC AATCATACAT AATATACTAA GTAACCTCAA 1860
4851 ATTTAATGTC AAAAAAGTTC GTTTACAACC TTAGGAAAAC TACACGTTCA GTTGTTGGAG 1920
4852 TTCCACCAAA CACTAATAGG CCCCCACATC CCGTTAGACG TCCTGACTCC CTTCTCCCGA 1980
4853 TTTCGGAAGA ACCCAAATCA ATATCTTCCC AAACCCCCAA TATGGACTCG GGAAACGATT 2040
4854 CTGCCCGCCC CACTCCATCC CCTCTGGCGC CCACTGTCAG TGGTATTAGC TCCTTAATTT 2100
4855 CAACTACGTT CAAGCCTAAA GATATCATGG CATTTGTTGA GCATTTGCCA ACCTTTGATG 2160
4856 GTACACCTCG TCTATTGGAC AGGTTTATCA CTAGCGTAGA AGAAATCCTG ATGCTCATCA 2220
4857 GGGGAGCTGA CCAAACACCG TATGGCCTGC TTACTCTGAG GACCATCAGG AACAAAATCA 2280
4858 TTGATAGGGC CGACGAAGCC TTGGAACTGG CAAATACCCC CTTGGTTTGG GATGAGATTA 2340
4859 AAAGCAATCT CATCCGCCTC TACTCGAGCA AGAAAAGCGA GGCCAACTTG TTAAGCGAGC 2400
4860 TTAACACATT TTCGGACAAC CTGACCTTGG GCCAACTGTT CTTTGGTATA TCAAAGGTGA 2460
4861 GAAGCCAACT CTTCTCCATA CTCAAAAACA GCGAACACAA CAACACTGTT GTAGATGCAA 2520
4862 AAAAGGTTGT CTACAACGAG GTTTGTCTCA ATGCTTTTAT GACTGGTTTG AAGGAACCTC 2580
4863 TCAAGACTTT CGTCAGGATA AAGTCCCCTT CTACACTTGA ACAGGCGTAC GAGCAATGCC 2640
4864 AAATAGAGCA GACCTTATAT AGGGCACAAA ACAAGCGAAC CAACAGACCA GAGCAGGGAC 2700
4865 CCAATGGATC AGACAATAAA ACCTACCGAA ATAGCTACGA CAGCAATTAC CGCAGCGGAC 2760
4866 GTAACGACCG AAATGACCGT AGGGGACCCT ACTCTAACTC TAACTCTAAC TCTAACTCTG 2820
4867 GCCAAAATAG ACCATTTAAT TCACACAATC GCACACCCCA ATCCGGCACC AAGGACAACC 2880
4868 GGGCCAATAC ATCAAACCCC TTTCGAGCAC CTTCACATAG TTTGAATAAT ATAGAGGAGA 2940
4869 ACCCTCAACC TGATTCGAAT TTTCAGCAAA CGGCCTCGGG AAACCAACAG GGTACATAAG 3000
4870 CCCAGCCACG CACAACCCCT CGCTTCCTTT TATAAAAATC AAACTATCCC AGACAAACCC 3060
4871 CCTGAAGTTT TTAATTGACA CAGGCTCTAC ACACTCCTTC ATCGACCCAA AATATGTCGA 3120
4872 CCCTAGGAAC TGTGTGACCT TAGATACGCC CATAACACTC AAAACAGCCC TGAACAGTTT 3180
4873 TAAAATATAT CAAAACGTCT CTATACCATT TCCACCGGAA TTCCAAATCA CGGGCAAAAT 3240
4874 GACCCTTCTA CCTTTCAAGT TCCACTCTTA TTTTGACGGA TTGATAGGAA TGGACTTATT 3300
4875 ATCTTACCTA AAAACAGAAA TAGATTTACT TAACCTAAAT CTAAAAACCC CAAGTACCAT 3360
4876 TATACCCTTA TGGACCCACA GTAACTCAAC TTCAAACGTA TTTAATATCT CTGGACATAC 3420
4877 GAAAACTATT TTGCCACTAC CAGTGGAAAC CAAACAGGGC GACTTCTACA TCGATTCAAT 3480
4878 TACAATCAAT GATGACTTAA TAATATCAGA CGGGATTTAT AATGCCCAAA ACAATATTGC 3540
4879 TAATTTCGTT ATCACAAACT ATAGCGAGAG GGATCAGTTA TTGTACCTCG AGAGCCCGAT 3600
4880 AAAAGGCATG CCATACTCCA CGGCCAACAA TGTTGAACTT TTCAGTATCA CTTCAGACAC 3660
4881 CCCACAGCCC CAAAACTCCG CAGCGTCGTT ACAAGCCCTT GGCGTCGATC ACCTCTCCTC 3720
4882 TGAAGAGAAA CAAAGCCTAC TTTCACTTTG CAAAAGTTAT CTAGATATCT TCTACAATGA 3780
4883 AGACAAATCA TTGACCTTCA CCAACAAGAT TACACACACG ATTAAAACCA CGGACGACAC 3840
4884 CCCCATTCAT ACAAAATCTT ATAGATATCC TTACATTCAT AAAGAGGAGG TCAAAAAACA 3900
4885 AATAGAGGCA ATGTTAAATC AGGACATTAT CAAATCCAGT TATTCCCCGT GGAGCGCCCC 3960
4886 CGTCTGGGTC GTCCCAAAGA AAATCACTCC TACGGGAGAG CAAAAATGGC GTCTAGTTAT 4020
4887 CGATTATAGA AAACTCAACG AGAAGACTAT ATCCGATAGA TATCCAATAC CTAACATCGC 4080
4888 GGATATCTTA GACAGATTGG GCAAAGCCAA ATATTTCTCC ACACTTGATC TGGCAAGTGG 4140
4889 ATTCCATCAG ATAGAAATGA ATCCCGACGA CACACCCAAA ACTGCATTTA CAGTAGAGGG 4200
4890 GGGCCACTAC GAGTTCATTA GAATGCCGTT TGGCCTCAAA AATGCCCCAG CCACATTCCA 4260
4891 AAGGGTGATG GACAATATTT TTGGAGACCT TATCGGAACT ATCTGCCTAG TTTACCTAGA 4320
4892 TGATATAATA ATTTTCTCAA CCTCCTTACA AGAACACTTC ATACACTTGA AAACTATTTT 4380
4893 TGGAAGACTC AGATCTGCCA ACTTTAAAGT CCAACTCACA AAATCCTACT TCCTCAGGCG 4440
4894 GGAGACAGAA TTCCTTGGCC ACATCGTTTC ACAAGAAGGT GTTAGGCCAA ATCCCAATAA 4500
4895 GATCGAAGCT ATAAAAAACT TTCCATGTCC CCACAGTAAA AAGTCAATTA AGTCTTTCCT 4560
4896 AGGCTTGTTG GGATATTACA GAAAATTTAT CAGAGATTTT GCGAGACTTA CCCAACCCAT 4620
4897 GACACAAAAA TTAAGGGGAA ACAATAAATC GATCATAATA GATGATGAAT TCAAAAAGGC 4680
4898 CTTTGAATAT TGCAAAACCT TACTGTCTAA CGACCCAATC CTCCAATACC CGGACTTTAC 4740
4899 AAAACCTTTC ACACTAACCA CGGACGCAAG TAATTTCGCA ATAGGAGCTG TCCTATCCCA 4800
4900 AGGTCCGGTG CATAGTGATA GGCCCGTATG TTTTGCTAGT AGAACCTTGT CGGCTGCGGA 4860
4901 AACAAATTAT TCCACAATTG AGAAGGAAAT GCTGGCCATT ATATGGGCGG TCCAATACTT 4920
4902 CAGACCCTAC CTCTTTGGCA GGAGATTCAC TATAATCACC GATCACAAAC CACTAACTTG 4980
4903 GTTAATGAAT TTCAAACAAC CAAATTCTAA AATAGTTAGG TGGAGACTCC AGCTTCAGGA 5040
4904 GTACGATTTC GAAGTCGTCT ACAAGAAAGG CTCTCAAAAT GTAATTGCTG ATGCTCTCAG 5100
4905 TAGACCAGAG GCCTCTGTCA ACCATAACGA AGCCCTATCA ATTCCTCAAA ATGTTTGCCC 5160
4906 CATCTCAGAG AAACCCCTTA ATGATTTTAA TATTCAGCTC CTGTTCAAAA TAACCCCAGA 5220
4907 TACAAATAAC GCCACACTGA CCCCGTTTAA ACACAAACTT AGGAGGGAAT TCTGTAAACC 5280
4908 CAATTTTCAG TATGACGACG TAGTTTGCAT TCTTAGGCAG TCGTTAAAAC CAAACAAGAC 5340
4909 ATGCGCGGTA TTTGCCCCCG ACCACATTTT TCAAATGGTG GAACAAGCCT ACCAAACCTA 5400
4910 CTTCTCAGCC CACAGTCAAT TTAAACTCAT TAGATGTTTG ATCTTCCTCC CCGAAATTAC 5460
4911 TGATAGTACG GAGATCGAAA AAATTATAAC CGACTATCAC TATAATAGTA ACCATCGAGG 5520
4912 GATCGATGAA ACATATTTAC ACATAAAACG ACAACAGTTC TTCCCACATA TGAAGGAGAG 5580
4913 AATAACTCAG TTAATTCGAA AATGTGAAAC ATGTTTAAAA TTAAAATACG ACAGACAACC 5640
4914 TCAAAAGATC ACTTACCAAA TATCCGAACT ACCTTCAAAA CCGTTGGACA TCTTACATAT 5700
4915 AGACATTTAT ACTATTAACA AAAATTATAA CCTTACTATT ATCGATAAAT TTTCTAAATT 5760
4916 TGCGGCTGCC TACCCTATAA CTAATAGGAA TTGCATTAAC GTAGTTAAAG CCTTAAAACA 5820
4917 TTTCATTTCC CAATTTGGTA TTCCCAAAAA GCTGATCTAT GATCAGGGAG CAGAATTCGC 5880
4918 TAGCGATATG TTCAATAAGT TCTGCACTCA ATTTAACATT GACCTACACG TTACGTCCTT 5940
4919 TCAACAATCC TCTAGTAACT CTCCCGTTGA ACGGCTTCAC TCGACACTAA CTGAGATTTA 6000
4920 CAGAATAATA CTTGACGTCA GGAAACAACA GAAACTCAGT AGCGAGCATG ACGAGATAAT 6060
4921 GTCCGAAACC CTAATCACAT ATAATAACGC TATTCATTCT GCAACTAAAC ATACCCCCTT 6120
4922 TGAACTATTT AACGGACGTA CTCATATATT CAACCAAACA ATCCAGTTCA ATAACGAACA 6180
4923 CGACTACTTA ACGAAATTAA ATGAATTTCG CGAGAAGTTG TACCCCCTCA TCACGGACAA 6240
4924 ACTTTCAAAT GACGTAGTTA GGAGAACCCT AAAATTAAAT GAAACCCGAA CAGACCCCGT 6300
4925 AGACCTACAA CCAGACACTT TAGTCCTTAG GAAGGAAAAC AGACGTAATA AGATTACACC 6360
4926 CAGGTTTTCG ATTCACAAAG TCAAACACGA CAAAGGTCAT ACATTGATAA CTGCTAGGAA 6420
4927 TCAAAAACTA CACAAATCAA AAATTCGAAA AACAGTTTTG AAAAAAGACA AAAGCAACAA 6480
4928 CGTACCCAAC ACTGATAATA ACTGACCCCA CTACCTCTTA ACTTACCATT TCAGGTTCAC 6540
4929 CCTTGTGCCA ACTCAGGCTA TCCATGTCCA TTATTTAAAT GATAACGCCC CTATAGCCAA 6600
4930 GATAGAACTA GGGAAAGCCT TACTAATTGA GAGGTACAAA ATAATTAGTC ATGTAATCAA 6660
4931 CCTACAAGAC TACAGCAGAT GTATGGAACA ATTCCATCTG ACCATTAATA AATTTAACCC 6720
4932 CGATTCCACG TTGACGGACT CCGTCACAAT TTTAAAAACC AAATTAACCC AAGCCCAAGT 6780
4933 AAAGCTCAAA GCCCTTACAC CTTCATATAG AAACAAACGG GGTTTGATTA ACGGATTGGG 6840
4934 GAGTCTAGTA AAGGTGGTTA CCGGCAACAT GGATGCCAAC GACAATAAAG AAATACATGA 6900
4935 AGAACTTGAC AATATAAAGA AAAATTCCGA AGTCAGTAAC GACAATCTCC AAAAACAAGT 6960
4936 AATGTTTAAC AACGAAATAC TTATCCGGTT CGAAAATATC ACGGACCATA TAAATAATGA 7020
4937 ACAAATTTTG ATAAGTAAAT TCTTTGATAC CTCACAAAAC AAAATATACA AACACTTAAA 7080
4938 CTTACAAGAT ACCCTTCTGG AAGAAATACA ATATTTAAAT AGGATTAATT ATAACATAGA 7140
4939 ATTATTCATT AACCACCTAA ACGACATAAC AGAAAGTATG CTATTGGCGA AAATAAATAT 7200
4940 AATTCCCAAG TTCATCCTAA ATGAACAAGA AATGGATAAA ATAAAAACAA TACTGGAAAA 7260
4941 ACAAAATATC ACAGTCAAAA ATGAACAAAG TATATACAAT TTCCTACAAA TGAATACACT 7320
4942 AAATTACGAA CAAAAGATTA TTTTTAATAT CAAAGTCCCA ATTTTTAAAC AACCTTTTCA 7380
4943 TACCCTCGCC AGACTAGTTC CATTACCAAT AAATAACACA TATTTTGTAA TAACCCCAAA 7440
4944 TTACCTAGCT TATAATATTA ATAATAAGAA ATTTCATATG ACCCGTAAAT GCCCCAAACT 7500
4945 GGATAATACA TTCTTGTGCG ACGAGAACTT CTACGTTGAT ACACCACAGA ACAACACATG 7560
4946 CCTGGAACAC CTTTTGAACG GAGAAAACAG TTCCTGCGAT GTACGGGAAA CCGGCCCCAT 7620
4947 CACCGACGTG TTCGAGGCAG AGAGAGGTTA CATCTTCGCA TTCAACGTGA ACAAACTGAA 7680
4948 GGTATCCCTA ACAAACGGCT CCGAGCTCTC AATAATGGGG TCAGCCATCA TCAGATACAT 7740
4949 TAACGAAACA ATACAGATTA ACGGTATCGA TTACGACGGC ACGGTTGACA CGTTCCCTGA 7800
4950 ACAGACGGAT TTTGATCTTC CCCCCATGCG AAAAGTAACT AGGAATACCA CTATTACGGT 7860
4951 ACTAAGCCTA GAAAAACTGC ACCTCGAAGC CACCCAAACA ATGGATAAAA TCCTGGCCGT 7920
4952 CCATCACAAT ACTATACAGC ACACCTGGAC ACTCTACACT CTGCTCGGAT TGGTAACGTT 7980
4953 CCTAGCAGTC ATCTTATGGC TGCACCGACG AACGAAACAC ATCGTCCACA TCCACGAGGA 8040
4954 TCATCACGTA CCAATCTACG CGTCATCCAT ACCTTCGCTA TGGCCGTCAC TTCGAACTGG 8100
4955 GGGGGGAGGA GTTACCACCC CACCCCCTAA ACCCCCACGC CTCTAAACAA ATCATCGGAC 8160
4956 ACTCAACCGG GAAGACGGCA ACTGGAACAC CGCATCCGGC CGAATGCTGA CATTCCGGCC 8220
4957 GAATGCTGAC ATTACACAAA AGTCGCACTG CAACATTGTC CCCAGCTAGC CAGCCACATG 8280
4958 CCGAGTCGGC ATGTTCATTA TGCTTACAAT TAAGAACCTA TGTACTTATG TATAAGACGA 8340
4959 AAACGGAGGA CTCGAGTAGC CACTCTCTGA CAATAAACTT GATACTGATT TTGAACTTCA 8400
4960 AGAAAGTCAG TCGTATTCTT TATTGGAAAT CTTCACACTA CAACTATCTG CTGAAACTTA 8460
4961 AAAACCTTCA TACATTTACA CATCATATCT TCACAAAAGG CTCCACCCTC GATCACGGAC 8520
4962 TTAACT 8526
4963 //
4964 ID DMBLPP standard; DNA; INV; 5034 BP.
4965 XX
4966 AC Z27119;
4967 XX
4968 DR FLYBASE; FBte0000660; Dmel\flea.
4969 XX
4970 SY synonym: blastopia
4971 SY synonym: Kermit
4972 XX
4973 FT source Z27119:372..5405
4974 FT SO_feature five_prime_LTR ; SO:0000425:1..275
4975 FT SO_feature three_prime_LTR ; SO:0000426:4757..5034
4976 FT SO_feature polyA_site ; SO:0000553:5006..5011
4977 FT SO_feature polyA_site ; SO:0000553:5019..5024
4978 FT SO_feature CDS ; SO:0000316:760..4761
4979 FT /name="Dmel\flea\polyprotein"
4980 FT /db_xref="FLYBASE:FBgn0043491"
4981 FT /db_xref="SPTREMBL:Q24262"
4982 FT /db_xref="NCBI_PROTEIN:CAA81643.1"
4983 FT /translation="MFTRTPPTNKKLNTDQIQAILENESEDESRKEKMNEEDQKLAPVG
4984 FT EAEAKKQNKDASAKVEEKFEQMMNTLTQSMLAKSKQEGQVIIAAEKFEKVVSDCDGKSI
4985 FT PIKKWFEIFEKNAEAYELSEKQKYVQARSKMIGSAELFLESECVSGYTELKELLIEEFS
4986 FT GSYNSAVIHKKLQDRKKKREETLHDYLLQMKKIAALGEVETVALITHIVNGLDIKKEYK
4987 FT GAMLRCKTLKELKQEFEIYESLNIVDKPNIQPKPKQITQGVKADHCFNCGSREHKRKDC
4988 FT TLPTKCFSCNQEGHISSKCPEKVNSMRIHVDSARTKPVIINGIIINCLVDTGSDVTIIK
4989 FT EAIFKKMKDVDLNRTATVLRGLGNASTQPIGCFRALIKTDQVEASHNVLVVHDSKFSCD
4990 FT GIVGHDFISKFRLICSAEGYTFLDLEADKKQAVEYSQMFNICEESSFTVAPQYREDVER
4991 FT MIERTYETPPKQIKQCPVELKIIPDGVIKPFRHGHTRLSEEEAIAVKKQVEEWVEQSIV
4992 FT RKSTSNVASRIVVVRKKDGTLRVCVDYRKLNTMVLMDCFPVPIMEEVLEKLQSAKWFTT
4993 FT MDLQNGFFHVAVEEASKPYTAFVTREGLFEFNKAPFGFKNSPAAFIRFVQFIFQELINS
4994 FT NIMQLYMDDIIVYAATPEECMEKTEMVLKRAAEFGLKIKWKKCNFMQRRIHFLGHIIEG
4995 FT GQICPGKEKTSAVNSFGTPQNVKAVQGFLGLTGFFRKFIPGYAQIARPLTDLLKKDAIF
4996 FT NIGPVEQQSVNKLKEILVNEPVLRIYSREAETELHTDASKDGLGAVLLQKFEGSFHPVC
4997 FT FWSRKTTKAESNRHSYYLEVKAAYLALKKFRHYLLGVPFKLVTDCVAFKQTTKKADVPR
4998 FT EVGPWILYMQDFNFQPEHRAGERMRHVDFLSRHPQACMMITSELTARIKKSQQNDDSIR
4999 FT AILEILKDRLFQPYKLKGGLLYSMVNGNELLVVPALMEREVIQSAHEVGHLSLQKTMHS
5000 FT IQQQFFYFLIWEYKVKKLISNCIKCIIHSKKLGKQEGYLNCIDKGDAPLHTLHIDHLGP
5001 FT MDSSAKQYKYILATVDAFSKFVWLFPTKSTGQEEVVKRLTDWSNIFGFPKRIVSDKGTA
5002 FT FTSGAFEQFMSSHNVEHVCTTTGVARGNGQIERVNRLILAIISKLSSDEPSKWYKYVPE
5003 FT VQKAINCHVHSSLKLSPFEVMFGTKMYTRVEDRLLELLQEEVVCQFNEDRYEMRQLVKR
5004 FT NIEQAQKDYKRNYDKKRRAEYKYKAGDLVAIKRTQFVAGRKMASGYLGPYEVTGVKDNG
5005 FT RYDVKKAANVEGPNVTSTSCDNMKLWKYIAENADLLSSGSDDDDQEGRM"
5006 XX
5007 CC Derived from Z27119 (g415797) (Rel. 50, Last updated, Version 6).
5008 CC Takis Benos and Michael Ashburner, 20-Aug-1997.
5009 CC Any changes to original sequence record are annotated in an FT line.
5010 XX
5011 SQ Sequence 5034 BP; 1719 A; 938 C; 1145 G; 1232 T; 0 other;
5012 TGTAACATGA GTAAGGCTGA AGGCTGGCAA CAACCCGGTT GGCAGCGCTG TTGAGCAGCA 60
5013 ACATGATTGT CGGAAATCCA AGTTATCGAC AATCAGTCAT CGAAGGACGA TCGCAGGCAG 120
5014 CAGTAGAGGC GAGTGGAAGT CAGCGTTGCA GTCAGTCGAG TTCTCAGCAG CAGTCGTTCG 180
5015 GTCCACAAAC TAAGAAATAC TTTATATAAT TACCGCATTT AGAATTAAAC TAATAATTAA 240
5016 ATTAATAATA AACAATAATA ATAAACAATC TTACATGGGG GCTCGTCCAG TCCTAAATCG 300
5017 GTTATATGAA GGTGCAGTTG TTTAAAGAAA AAAGACATTG TTGTGTGCGT GGGTATAGTC 360
5018 TTTAAAACGT TGTAAAGTTG TGGCTATATC TATTGCATTT AAAGTTGGAA AAATCAGTTG 420
5019 TACAGATTTT GTTTGAACAC AAGTCGGTAA AAGTCGGGAA AGCTGCTAGA GAGAACTGAT 480
5020 AAAGTTGAAA TTGTCGTGTG CGTGGATTTA GTCTTTAAAG TTGTAAAGTT ATGGCTACGT 540
5021 CTACTGCATT GAAAGTTGAA AAAATCGATT GAACTCATAC AGACTCAAGT CGTTTTGCTG 600
5022 TTGTGGAATT TAAAACAATT AAATTGCAAA GGTGGTGAAA TTCGTTTCTA ACGAAAATCA 660
5023 AAATTTGTCT TTTAACCGGT GGCGCCGTCT GCAAAATCGA CTACCGTCGC GCCGTTAGAA 720
5024 CATTGTCGTT GTTTGCTGGT GTTAGTGCCT TGTCGCGGAA TGTTCACACG TACACCACCT 780
5025 ACAAATAAAA AACTTAACAC CGACCAAATA CAAGCAATTC TAGAGAACGA AAGCGAGGAC 840
5026 GAAAGCAGAA AAGAAAAAAT GAACGAAGAA GATCAAAAGT TGGCGCCTGT AGGAGAAGCA 900
5027 GAGGCAAAGA AGCAGAATAA AGACGCTAGT GCTAAAGTCG AAGAGAAATT TGAACAAATG 960
5028 ATGAATACTC TAACCCAGAG CATGTTGGCA AAATCTAAAC AAGAGGGGCA AGTAATTATC 1020
5029 GCTGCAGAAA AATTTGAAAA AGTTGTAAGT GACTGTGATG GCAAATCAAT TCCTATTAAA 1080
5030 AAATGGTTTG AAATTTTTGA GAAAAATGCC GAGGCATATG AACTTTCGGA GAAACAAAAA 1140
5031 TATGTTCAAG CCAGAAGTAA GATGATTGGA TCAGCAGAAC TTTTCTTAGA ATCTGAATGT 1200
5032 GTCAGTGGAT ACACTGAACT CAAAGAGTTA CTAATTGAAG AATTTTCAGG CAGCTATAAT 1260
5033 AGCGCCGTTA TTCACAAAAA GTTGCAAGAC AGGAAGAAGA AGAGGGAGGA AACTCTACAC 1320
5034 GACTATTTGT TACAAATGAA GAAAATAGCA GCCTTAGGTG AAGTTGAAAC AGTTGCTTTG 1380
5035 ATAACTCATA TCGTAAACGG CCTCGACATT AAAAAGGAGT ATAAGGGTGC TATGCTCCGT 1440
5036 TGTAAAACTC TTAAGGAATT AAAGCAAGAA TTCGAAATCT ACGAGAGTCT GAATATTGTT 1500
5037 GACAAGCCGA ATATTCAACC AAAACCAAAG CAAATTACAC AAGGTGTAAA AGCAGATCAC 1560
5038 TGCTTCAACT GTGGTTCGAG GGAACACAAA CGAAAGGATT GTACACTTCC TACCAAATGT 1620
5039 TTCAGCTGTA ATCAAGAGGG CCATATCTCA AGCAAGTGTC CGGAAAAAGT AAACAGCATG 1680
5040 CGCATTCACG TTGATAGTGC ACGAACAAAG CCAGTAATCA TAAATGGGAT TATCATCAAC 1740
5041 TGTCTGGTGG ACACAGGATC AGATGTGACC ATAATTAAAG AAGCTATATT CAAGAAGATG 1800
5042 AAAGATGTTG ATTTAAACCG CACTGCAACA GTATTGCGAG GTTTGGGAAA TGCCTCAACA 1860
5043 CAGCCGATTG GATGCTTCAG AGCATTAATC AAGACCGACC AGGTGGAAGC AAGCCACAAC 1920
5044 GTTTTAGTCG TCCACGATTC TAAATTCAGT TGCGATGGAA TAGTGGGACA CGATTTTATC 1980
5045 AGCAAGTTTC GTCTTATCTG TAGTGCAGAA GGCTATACTT TTCTTGACCT GGAAGCAGAT 2040
5046 AAAAAACAAG CGGTTGAGTA TTCCCAAATG TTTAATATTT GTGAAGAATC TTCTTTTACA 2100
5047 GTTGCACCAC AATACCGAGA AGACGTTGAA CGCATGATAG AGAGAACATA CGAAACACCA 2160
5048 CCCAAGCAGA TAAAGCAATG TCCAGTCGAA CTCAAAATTA TTCCTGATGG CGTGATTAAA 2220
5049 CCCTTTCGCC ATGGACACAC CCGACTATCT GAAGAAGAAG CTATAGCTGT AAAGAAGCAG 2280
5050 GTAGAGGAAT GGGTCGAGCA GTCAATCGTC CGTAAATCTA CATCAAATGT TGCCAGTCGC 2340
5051 ATAGTCGTTG TCAGGAAAAA GGATGGTACC CTACGCGTTT GCGTGGACTA TAGAAAATTG 2400
5052 AACACCATGG TTCTGATGGA TTGTTTTCCG GTACCCATAA TGGAGGAGGT GCTTGAAAAA 2460
5053 CTGCAGAGTG CCAAATGGTT TACAACCATG GACTTACAGA ACGGATTTTT TCATGTGGCC 2520
5054 GTAGAAGAAG CCAGCAAGCC GTACACAGCA TTTGTTACCC GAGAAGGCTT ATTCGAGTTT 2580
5055 AACAAAGCGC CCTTTGGTTT TAAGAATTCC CCAGCAGCGT TTATACGGTT CGTTCAATTT 2640
5056 ATTTTTCAAG AACTAATCAA TTCCAATATA ATGCAGCTAT ATATGGATGA CATAATTGTA 2700
5057 TATGCCGCTA CCCCAGAAGA ATGCATGGAA AAGACGGAAA TGGTACTTAA GAGAGCTGCA 2760
5058 GAATTTGGTC TAAAAATAAA ATGGAAGAAG TGCAACTTTA TGCAGAGGCG AATTCATTTC 2820
5059 CTGGGACATA TTATCGAAGG TGGACAAATA TGCCCTGGAA AAGAGAAAAC ATCAGCAGTG 2880
5060 AATTCCTTTG GAACACCTCA GAATGTAAAA GCCGTTCAAG GATTTCTGGG TCTCACAGGA 2940
5061 TTCTTCAGAA AATTCATACC TGGATACGCC CAAATTGCGA GACCACTGAC GGACCTATTA 3000
5062 AAAAAAGATG CCATTTTCAA CATTGGACCA GTAGAGCAGC AGTCGGTGAA TAAGCTGAAA 3060
5063 GAGATTCTGG TAAACGAACC AGTATTGAGG ATCTACTCAC GAGAAGCAGA AACCGAACTT 3120
5064 CATACAGATG CCTCTAAGGA CGGGTTAGGA GCCGTTTTAT TGCAGAAGTT CGAAGGCAGT 3180
5065 TTTCACCCAG TCTGCTTTTG GAGCAGAAAA ACTACAAAAG CCGAATCAAA TCGTCATAGT 3240
5066 TATTACCTTG AAGTAAAAGC CGCATACTTA GCTCTGAAAA AGTTCAGACA CTATTTATTG 3300
5067 GGAGTCCCTT TCAAGCTCGT CACGGACTGT GTCGCATTTA AACAGACAAC AAAAAAAGCA 3360
5068 GATGTCCCAA GAGAAGTTGG CCCATGGATT CTCTATATGC AGGATTTTAA TTTTCAACCC 3420
5069 GAACATCGTG CAGGAGAAAG AATGAGACAC GTTGATTTTT TAAGCCGCCA TCCCCAAGCA 3480
5070 TGCATGATGA TAACATCCGA GTTGACAGCA CGTATTAAAA AGTCGCAGCA GAACGATGAT 3540
5071 TCAATTAGAG CAATCCTGGA AATTCTAAAA GATCGTCTAT TCCAACCCTA CAAGCTAAAA 3600
5072 GGTGGCCTGT TGTATAGTAT GGTCAATGGC AATGAACTAC TGGTTGTCCC TGCACTAATG 3660
5073 GAGAGGGAGG TGATTCAAAG CGCACATGAA GTTGGCCATT TGTCGTTGCA AAAGACGATG 3720
5074 CATAGCATAC AGCAGCAATT TTTTTATTTC CTCATTTGGG AATACAAGGT AAAAAAGCTA 3780
5075 ATTTCTAACT GTATAAAATG TATCATCCAC AGCAAAAAGT TGGGAAAGCA GGAGGGATAT 3840
5076 CTAAATTGCA TAGATAAAGG AGACGCACCG TTGCACACAC TACACATCGA TCATTTGGGG 3900
5077 CCAATGGATT CATCGGCCAA ACAGTATAAA TACATTCTGG CAACAGTCGA TGCGTTTTCA 3960
5078 AAGTTTGTCT GGTTATTCCC AACCAAATCA ACCGGACAGG AAGAAGTGGT CAAGAGGCTG 4020
5079 ACCGACTGGT CAAACATTTT TGGTTTCCCT AAGCGAATTG TTAGCGACAA AGGAACGGCC 4080
5080 TTTACGAGTG GTGCGTTCGA ACAATTTATG AGCAGCCATA ACGTGGAACA CGTCTGCACA 4140
5081 ACTACTGGAG TGGCCAGAGG CAACGGCCAG ATAGAACGAG TAAATCGTTT AATTTTGGCA 4200
5082 ATAATATCAA AGCTGTCTTC AGACGAACCG TCGAAGTGGT ACAAATATGT GCCTGAGGTA 4260
5083 CAAAAGGCGA TCAACTGTCA CGTGCATTCA TCACTGAAGC TGTCACCATT TGAGGTCATG 4320
5084 TTTGGCACCA AGATGTACAC CCGAGTTGAG GATCGGTTAC TGGAACTGCT CCAAGAAGAA 4380
5085 GTGGTCTGTC AATTCAACGA GGACCGCTAT GAGATGAGAC AGCTGGTAAA ACGCAACATC 4440
5086 GAGCAGGCGC AGAAGGACTA CAAGCGCAAT TACGACAAAA AGCGCCGAGC TGAATACAAA 4500
5087 TACAAAGCAG GTGATCTGGT TGCAATTAAA AGGACCCAAT TTGTAGCTGG CCGCAAGATG 4560
5088 GCAAGCGGGT ATTTAGGTCC ATACGAAGTC ACAGGGGTCA AAGACAATGG CAGATATGAC 4620
5089 GTTAAAAAAG CAGCAAACGT CGAAGGACCC AATGTCACAT CCACCAGCTG TGACAACATG 4680
5090 AAGTTGTGGA AGTACATAGC CGAAAATGCA GACCTATTGT CATCCGGGTC GGATGATGAT 4740
5091 GATCAGGAGG GCCGAATGTA ACATGGAGTA AGGCTGAAGG CTGGCAACAA CCCGGTTGGC 4800
5092 AGCGCTGTTG AGCAGCAACA TGATTGTCGG AAATCGAAGT TATCGACAAT CAGTCATCGA 4860
5093 AGGAACGATC GCAAGGCAGC AGTGGAGTAG GAGTGGAAGT CAGCGTTGCA GTCAGTCGTG 4920
5094 TTCTCAGCAG CAGTTCGTTC GGTCACAAAC TAAGAATACT TTATATAATT ACCGCATTTA 4980
5095 GAATTAAACT AATAATTAAA TTAATAATAA ACAATAATAA TAAACAATCT TACA 5034
5096 //
5097 ID OPUS standard; DNA; INV; 7521 BP.
5098 XX
5099 AC AY180918;
5100 XX
5101 DR FLYBASE; FBte0000918; Dmel\opus.
5102 XX
5103 SY synonym: nomad
5104 SY synonym: yoyo
5105 XX
5106 FT source AY180918:1..7521
5107 FT SO_feature five_prime_LTR ; SO:0000425:1..518
5108 FT SO_feature three_prime_LTR ; SO:0000426:7004..7521
5109 FT SO_feature CDS ; SO:0000316:1578..2831
5110 FT /name="Dmel\opus\gag"
5111 FT /db_xref="FLYBASE:FBgn0025876"
5112 FT /db_xref="SPTREMBL:Q8I7Q0"
5113 FT /db_xref="NCBI_PROTEIN:AAN87270.1"
5114 FT /translation="MEETLRALSESLNALTNVVTGIKEDIKKNNDRLAILEQERGNAD
5115 FT PTVDQPQPLVRARTEYELREISVLPDCVKELQAFEGRQEAYLSWINRAQSILTEYDLI
5116 FT KTRPLYRAIVLHIRQKIRGHADMALAAYGVQDDDWDDIKRVLALHYADKRDLRTLEHE
5117 FT LGAMCQGSRPLDRFYMDVNGHLSLILNNLKARNHPREVVNALIETYRDKALDVFIRGV
5118 FT GRDCSKHLLVRSPKNLPEAYSFCMGLQNVMSRNFTAQNYQPSGAPRFAGPYQHQARPP
5119 FT FRTPFSPGSGRFSQNSYRTQGPRQAIKMESNRSGQSYQSGYSGRQEEGSGIKRMSEGN
5120 FT NPFQKAQRLYHMELAPPPLAPAASGDNQGRSHEGYYDDESQAVERSNNYPPQKNVEGV
5121 FT TDAPHNLETEGGANFMTNASPVYRT"
5122 FT SO_feature CDS ; SO:0000316:2972..5983
5123 FT /name="Dmel\opus\pol"
5124 FT /db_xref="FLYBASE:FBgn0025875"
5125 FT /db_xref="SPTREMBL:Q8I7P9"
5126 FT /db_xref="NCBI_PROTEIN:AAN87271.1"
5127 FT /translation="MITHRLVGKFFKPLGNDSDITFFVLPNLHSFDGIIGDDTLKDLK
5128 FT AIVDRKNNCLIITPGIKIPLLARASINVNPLLAAEHPDGTQEILNSLLGEFPRIFEPP
5129 FT LSGMSVETAVKAEIRTNTQDPIYAKSYPYPVNMRGEVERQIDELLQDGIIRPSNSPYN
5130 FT SPIWIVPKKPKPNGEKQYRMVVDFKRLNTVTIPDTYPIPDINATLASLGNAKYFTTLD
5131 FT LTSGFHQIHMKESDIPKTAFSTLNGKYEFLRLPFGLKNAPAIFQRMIDDILREHIGKV
5132 FT CYVYIDDIIVFSEDYDTHWKNLRLVLASLSKANLQVNLEKSHFLDTQVEFLGYIVTAD
5133 FT GIKADPKKVRAISEMPPPTSVKELKRFLGMTSYYRKFIQDYAKVAKPLTNLTRGLYAN
5134 FT IKSSQSSKVPITLDETALQSFNDLKSILCSSEILAFPCFTKPFHLTTDASNWAIGAVL
5135 FT SQDDQGRDRPIAYISRSLNKTEENYATIEKEMLAIIWSLDNLRAYLYGAGTIKVYTDH
5136 FT QPLTFALGNRNFNAKLKRWKARIEEYNCELIYKPGKSNVVADALSRIPPQLNQLSTDL
5137 FT DANPEDDMQSLATAHSALHDSSRLIPHVESPINVFKNQLIFDTTRSKYLCEHPFPGYT
5138 FT RHLIPLKDGSLADLTNSLQSCLRPVIINGVKIPEAHLQRFQSICLANFLLYKIRITQR
5139 FT LVADVSGAEEICEIIEKEHRRAHRGPTEIRLQLLEKYYFPRMSSTIRLQTSSCQCCKL
5140 FT YKYERHPNKPNLQPTPIPNYPCEILHIDIFALEKRLYLSCIDKFSKFAKLFHLQSKAS
5141 FT VHLRETLVEALHYFTAPKVLVSDNERGLLCPTVLNYLRSLDIDLYYAPTQKSEVNGQV
5142 FT ERFHSTFLEIYRCLKDELPTFKPVELVHIAVDRYNTSVHSVTNRKPADVFFDRSSRVN
5143 FT YQGLTDFRRQTLEDIKGLIEYKQIRGNMARNKNRDEPKSYGPGDEVFVANKQIKTKEK
5144 FT ARFRCEKVQEDNKITVKTRSGKIFHKSDLRN"
5145 XX
5146 CC Sequence from P1 DS01219.2:861..8381 provided by Guochon Liao
5147 CC Berkeley Drosophila Genome Project.
5148 XX
5149 SQ Sequence 7521 BP; 2322 A; 1740 C; 1677 G; 1782 T; 0 other;
5150 AGTTAAGAAC CCTCTTCTTG CGCTCTTCGT CAGGACTCAC CAGCGCTCGG CTCTCGTGTT 60
5151 TTCGGGCCCC GTCAGCAGGC GACTCGGGGC CTGTCTAGTA ACATGTTCGT GTAAGTTACG 120
5152 AACCCTCTTC TTGCGATCTT CGTCAGGACT CACCAGCGCT CGGCTCTCGT GTTTTCGGGC 180
5153 CCCGTCAGCA GGCGACTCGG GGCCTGTCTA GGAACATGTT TGTGTATGTG TGCATTCGGA 240
5154 ACAAGTGCCG TTGGTCGCAC TCAGGGTGAG GGGTCAACGG GGGAAGCGGA TATAAAAGCA 300
5155 GCGGGGCGGG AGAAGAGGTC CCAGTCTCGA ACGGACACAT AACGGAACCG CTAGCAGATC 360
5156 GCGAACTGAA TCTTAAAATA AAGCTAATCG TAAACTCGAA CCCTCTTAAC TATCTTGACT 420
5157 ATTATTTGGA GAACCACAGC ATGTTGGTTG TCATATCAAG GTGAGGTATG CGGCAGCGAG 480
5158 TGCCGAGAAC CCTGATGCAA GTGGAACTTG CGTTAACTGG CGCCCGAACA GGGACCGGCA 540
5159 ATGTCCGGCC GATAAAAGTG ATACGAAAAA ATTGTGGAAA TTTGTGCGTA AAAATAGTGG 600
5160 TGGTGTGCAT AAGTCAGATT AAGATCTGAA ATCCATAAAT GAAAAAGAAG TGCTGCGTGA 660
5161 GCTGTGTATA AAATGATAAA ATAGCAATTA CCCGCTGCCG GGGGGAACTA CGCCCATCCC 720
5162 GGGGCGCAAC AAATATTGCA TAATTCAATA AAAGGTGTAA AATTTCTAAA ATAAAAATGT 780
5163 AAACCTATGT TGCGCCAAGA CCTAATTTAA ATTAATAAAA CAACGACCCG CTACCGGAGG 840
5164 ACGCCACGTC GCCCATGCCG AGCGCAAAAG TTGTACGATA CCTATAACAT AATTAAAACA 900
5165 CGATCAACCC ACTGCGGCGG TACGGCTTGT GGGAAAATTT TTTTTTTTTT CTCTCCTTGC 960
5166 CAATTCGCGA GTGCAAAAGA TTGTGTATAA TAAACCAATA ATTAACCATT GCAGCAGTTT 1020
5167 ACCTGCGGCA GTACGAGTAA TATGAGCGCC CAGAGTGATA AGGTGGTGTG TGGCAGCTTG 1080
5168 TTGGATACGT TAAGTGGTGT GGAATGCACC CAAAAAAAAC CGCCCAACAA GTTGTGTGGC 1140
5169 GGCCGTACCT TAGTAGGCAA CCAGCCAAAA GGGATACTAC GGAACCACCG TGCCCAGTGC 1200
5170 CGAAATAAAT TAGAGGTCAT CAATAAAAAA CTGTAACAGC ACGCACGCAA GGAAAAAATA 1260
5171 TTGCAAAATG GAATAGCGCA CAAAAATTGT ATAAACACAT GCACAACACC ACAATTCAAA 1320
5172 GGAAAACAAA ATATTCATGC TGTAGGGGTA CAACCTAAAC GACGAAAACT AATAAAGAGC 1380
5173 ATACAAGGGT GAGTGAAATA TTTCATTAAA CTTTATTGCC ATATTTGCTA AATTTAGAGA 1440
5174 AATAAAGAAA AAGCAAAGAA GAACAGATAT TCTTTTTTAT CGGGTTAAAA CCGTTGTCTC 1500
5175 ACATTTCCGT AAAGTAATAA CGAATTCTGT TGCCTTGAAA GCTTCCTGCA TCTTTCCAAC 1560
5176 GCAAACTAAA AATCAAAATG GAAGAGACCC TGCGTGCTCT TAGCGAGTCC CTCAATGCCC 1620
5177 TGACCAACGT GGTGACAGGC ATTAAGGAAG ATATTAAGAA AAATAATGAT AGGTTGGCTA 1680
5178 TTTTAGAACA GGAGCGCGGG AACGCTGACC CTACGGTCGA CCAACCGCAA CCCCTGGTGC 1740
5179 GCGCACGCAC CGAGTATGAG CTGAGAGAGA TATCGGTCCT CCCTGACTGC GTCAAAGAAC 1800
5180 TGCAGGCGTT CGAAGGACGG CAGGAGGCTT ACCTGTCTTG GATAAACAGG GCACAGTCAA 1860
5181 TACTGACCGA ATATGACTTG ATTAAAACCA GACCCCTGTA TAGGGCAATT GTCTTGCATA 1920
5182 TTAGACAGAA AATAAGGGGA CACGCCGACA TGGCCTTGGC GGCCTATGGC GTCCAAGACG 1980
5183 ACGATTGGGA CGACATAAAA CGAGTCTTGG CGCTGCATTA CGCAGACAAA CGAGACTTAC 2040
5184 GTACGCTTGA GCATGAGCTT GGCGCTATGT GCCAAGGTTC TAGACCACTA GATAGGTTCT 2100
5185 ATATGGACGT TAATGGCCAT CTCTCGTTGA TCTTAAATAA CTTGAAGGCC AGAAACCACC 2160
5186 CTCGTGAAGT AGTCAACGCT TTGATAGAAA CCTATAGAGA CAAGGCTTTG GATGTTTTTA 2220
5187 TCCGAGGAGT GGGGAGAGAT TGTTCCAAAC ACTTACTTGT CCGCAGCCCG AAGAATCTAC 2280
5188 CAGAGGCTTA CTCTTTTTGT ATGGGATTGC AGAATGTAAT GTCAAGAAAT TTCACAGCTC 2340
5189 AGAACTATCA ACCGTCAGGT GCCCCAAGAT TCGCAGGCCC ATATCAACAT CAGGCCAGGC 2400
5190 CACCGTTCCG AACCCCTTTT TCTCCTGGTT CAGGCAGATT TTCGCAAAAC TCCTACAGAA 2460
5191 CTCAGGGTCC TAGACAGGCC ATAAAAATGG AATCCAATCG GTCGGGTCAA TCTTACCAAT 2520
5192 CAGGATACAG TGGTCGCCAG GAAGAAGGCT CCGGTATTAA GAGAATGTCC GAAGGAAACA 2580
5193 ACCCATTCCA AAAGGCACAA AGATTGTACC ACATGGAATT GGCACCACCC CCGCTAGCCC 2640
5194 CGGCGGCTAG TGGAGATAAC CAAGGACGTT CACACGAGGG TTACTATGAT GACGAGTCTC 2700
5195 AAGCTGTCGA GAGAAGCAAC AATTATCCTC CGCAGAAAAA CGTGGAAGGA GTTACAGATG 2760
5196 CTCCACATAA CCTTGAGACT GAGGGAGGGG CAAATTTTAT GACCAACGCC TCTCCAGTGT 2820
5197 ACCGTACTTA GAGTATGCTA CGGAGAGGGG AGAAAGGCTG AAGTTTTTGA TCGACACGGG 2880
5198 GGCGAACAAA AACTTTATTA GCCGAAGACT TGCAGCCGGG TGTACCACAG TCCGTAAACC 2940
5199 CTTCTCCGTA CTGTCCGCTG CGGGTAACAT CATGATAACG CACCGCCTAG TTGGTAAATT 3000
5200 CTTCAAACCA CTAGGGAACG ACTCGGATAT TACCTTTTTC GTACTACCGA ATTTACATTC 3060
5201 CTTTGATGGT ATCATTGGCG ACGATACTCT CAAAGACTTA AAAGCCATAG TGGATAGGAA 3120
5202 AAACAATTGT TTGATAATAA CCCCAGGAAT TAAAATCCCT CTTTTGGCGA GAGCTTCAAT 3180
5203 AAACGTTAAC CCGCTACTCG CCGCCGAACA CCCAGATGGT ACACAAGAAA TTTTGAATTC 3240
5204 CCTTCTCGGG GAATTTCCCC GCATCTTCGA GCCCCCCTTA TCTGGAATGT CCGTGGAGAC 3300
5205 GGCCGTCAAG GCTGAAATCC GGACAAACAC ACAAGACCCG ATCTATGCTA AAAGTTATCC 3360
5206 TTACCCAGTC AACATGCGCG GAGAAGTCGA ACGTCAAATC GATGAACTGC TGCAGGACGG 3420
5207 TATAATTCGA CCCTCTAATA GCCCTTACAA TTCCCCTATC TGGATAGTCC CGAAGAAACC 3480
5208 TAAACCAAAC GGAGAAAAAC AATATCGCAT GGTAGTCGAT TTCAAGCGGT TAAATACCGT 3540
5209 CACCATACCC GACACTTACC CCATCCCAGA TATAAACGCT ACGCTAGCCA GCCTTGGCAA 3600
5210 TGCCAAATAC TTTACCACCC TAGATTTGAC TTCTGGATTC CATCAAATCC ACATGAAGGA 3660
5211 AAGCGACATT CCAAAGACAG CTTTCTCTAC TCTAAATGGA AAGTACGAGT TCCTCCGTCT 3720
5212 ACCATTCGGT TTGAAGAATG CACCTGCAAT CTTCCAAAGA ATGATCGATG ATATTTTGCG 3780
5213 CGAGCATATT GGCAAGGTCT GCTACGTTTA TATTGACGAT ATCATCGTCT TCAGTGAAGA 3840
5214 TTATGACACA CACTGGAAAA ATCTCCGATT GGTATTAGCG AGTTTATCAA AAGCTAACCT 3900
5215 CCAAGTGAAC CTTGAGAAGT CGCATTTTTT AGACACGCAG GTAGAATTTT TAGGATATAT 3960
5216 CGTCACGGCC GATGGCATTA AGGCAGATCC GAAAAAGGTC AGAGCGATTA GCGAAATGCC 4020
5217 TCCTCCGACC TCTGTTAAGG AGTTAAAAAG ATTTCTAGGC ATGACCTCGT ACTACAGGAA 4080
5218 GTTCATTCAG GACTATGCGA AGGTAGCAAA GCCCCTTACA AACTTGACGC GTGGATTGTA 4140
5219 CGCTAATATA AAGTCTTCAC AATCAAGCAA AGTGCCAATT ACATTAGACG AGACGGCCCT 4200
5220 ACAGTCTTTT AATGATTTAA AATCAATTCT CTGTTCTTCT GAAATACTGG CGTTCCCATG 4260
5221 TTTCACTAAA CCTTTCCATC TAACCACGGA CGCTTCTAAC TGGGCCATCG GAGCTGTCCT 4320
5222 CTCACAGGAC GACCAGGGTA GAGATAGGCC GATAGCGTAC ATTTCCCGTT CATTAAATAA 4380
5223 GACGGAGGAA AACTACGCTA CTATCGAAAA GGAAATGCTC GCGATAATTT GGTCATTGGA 4440
5224 CAATCTTCGG GCTTACTTAT ATGGCGCTGG TACTATTAAA GTATATACTG ACCATCAACC 4500
5225 TCTAACGTTT GCCCTAGGCA ACAGAAATTT CAATGCGAAG CTAAAACGCT GGAAGGCTCG 4560
5226 TATAGAGGAA TACAACTGCG AACTCATCTA CAAGCCTGGG AAATCTAATG TGGTGGCTGA 4620
5227 CGCGCTTTCA CGCATTCCGC CTCAGCTTAA CCAGTTGAGC ACCGATTTAG ATGCTAATCC 4680
5228 CGAGGATGAC ATGCAGTCTT TGGCTACTGC CCATAGCGCT TTACATGACA GTTCACGATT 4740
5229 GATTCCCCAC GTTGAATCTC CAATCAACGT TTTCAAGAAT CAACTCATTT TTGACACAAC 4800
5230 CAGGTCAAAA TACTTATGCG AGCACCCGTT CCCAGGTTAT ACTCGCCATC TGATTCCTCT 4860
5231 CAAAGACGGA TCACTTGCCG ATTTAACCAA CTCGTTACAA TCGTGTCTAC GACCTGTAAT 4920
5232 AATTAACGGC GTCAAAATCC CGGAAGCACA TTTGCAACGC TTTCAGTCCA TCTGCTTAGC 4980
5233 GAATTTTCTT TTATACAAAA TTCGGATAAC GCAGCGCCTA GTGGCGGACG TGTCTGGCGC 5040
5234 AGAGGAAATT TGTGAAATAA TTGAAAAAGA ACACCGTAGA GCACATAGGG GCCCTACGGA 5100
5235 GATTCGTCTC CAACTTTTAG AAAAATATTA TTTCCCGCGA ATGTCCAGTA CGATCCGTCT 5160
5236 GCAAACTTCC TCATGTCAGT GTTGCAAACT CTACAAGTAC GAGAGACACC CTAACAAACC 5220
5237 AAACCTACAA CCTACGCCAA TTCCTAACTA CCCATGTGAA ATACTTCACA TCGACATTTT 5280
5238 TGCGCTCGAA AAAAGGTTAT ACCTAAGTTG TATTGACAAA TTTAGCAAGT TTGCCAAACT 5340
5239 TTTCCATCTG CAGTCAAAAG CATCTGTGCA TTTGCGAGAA ACTTTGGTGG AGGCCCTACA 5400
5240 TTACTTCACC GCCCCTAAGG TCTTGGTTTC GGATAACGAG CGAGGGTTGT TATGCCCCAC 5460
5241 AGTGCTCAAC TATCTTCGGT CTCTAGATAT CGATCTGTAT TATGCTCCAA CCCAGAAGAG 5520
5242 CGAAGTAAAT GGTCAAGTCG AGAGATTCCA CTCTACGTTC CTAGAAATTT ATCGTTGCCT 5580
5243 TAAAGATGAG CTCCCTACCT TCAAACCCGT TGAGCTGGTA CACATAGCAG TGGACCGCTA 5640
5244 CAACACTTCC GTTCACTCGG TAACGAATCG AAAACCAGCA GACGTTTTTT TCGACCGCTC 5700
5245 GTCAAGGGTA AACTATCAGG GTCTGACAGA TTTCCGGCGG CAGACTTTAG AGGACATCAA 5760
5246 GGGCTTAATT GAGTATAAGC AAATTAGAGG TAATATGGCT CGGAATAAAA ATAGGGACGA 5820
5247 GCCAAAGTCT TATGGGCCGG GAGATGAAGT TTTTGTTGCA AATAAGCAAA TAAAAACAAA 5880
5248 GGAAAAAGCG AGGTTCAGAT GCGAAAAGGT ACAGGAAGAC AACAAGATAA CAGTTAAAAC 5940
5249 CAGATCAGGA AAAATTTTCC ACAAATCTGA TCTAAGAAAT TGAGACGTGG CTTTCACATT 6000
5250 TAAAAAAGAA ACGCGAAAAA GAATAACGAA AGTAATAAAA GTACGTTGTG GCAGCTAATG 6060
5251 AAATATTCCA CCCATGCATA CCCTATATAA AAAAAACATT AATAAAAAAA AAAAAAAAAA 6120
5252 AAAAAAAAAA AAAAAAAAAT GAGTTAAGAA ATACAAAAAG AAATACAAAA AAAACTATAA 6180
5253 AAAAAATAAT ATAAAAAAAT ACAGATTATA AGAAATAAGA AATAAGAAAT ATAAAAAAAT 6240
5254 AAAAATATAA GTACACAAAA TGTACCGTAC CCCCACACAC TACGTAGTCT TAGAACAACT 6300
5255 TAGACGACCA GATATTTACG AATTGTCTTT TTGTAAGCGC GATTTCTGCA TGCGGCGCAA 6360
5256 ATCCCGCTCA CTGGACTGGC TGGGGTCGGC TTGGAAATGG GTAGCTGGAT CTCCAGATGC 6420
5257 TGCTGATTGG AACGCCGTCT TGGCCGCGCA AGCGACGGCT TCGAGGAACT GCAAAAACTG 6480
5258 GAGGAGGCTA GCTGTATCCC TCGGCTACTG AAGTAACCAA CGAGTGGTTA AGCAAGTCGA 6540
5259 CGATGGAATG CTCCTCCTGA CCAACTTCAA CGGAACTCTA AGAACGGCTG CAGAGAACTA 6600
5260 CGACCTGATC GGCTCCTTTA TCATCCAATT CGACAATGAG ACGATAATGG TCAACGGTCA 6660
5261 AAACTATTCC AGTTACTCGG TCAGTCATCT AATGGCGATG CCGGCCGTGT TGAGCCACAT 6720
5262 AACGGCCAGC AACTTTCAAC TTTCTCTGGA ATACGTCCAC GACGTGAGCA TGAAGAATTT 6780
5263 GGAAAAGATG TCCAACATGG CGAGTGAGCT ACTAGCCTCT CTTCTCACCG AGGCGGCACT 6840
5264 CGCAATCTGC ATATTCCTAG GCTTTTATTT CCTATGGAAG AAGCTGATGT CCACCAAAGG 6900
5265 CATGCCCGAT GTCCGCGAGA TTGCCGCAAA CTTAGAAGCA TTGGGCCAAA CCGAGCTGAA 6960
5266 CAAGGCTCAC TAATCTGCGG GACGCAGATC TTGAGGGGGG AGGAGTTAAG AACCCTCTTC 7020
5267 TTGCGCTCTT CGTCAGGACT CACCAGCGCT CGGCTCTCGT GTTTTCGGGC CCCGTCAGCA 7080
5268 GGCGACTCGG GGCCTGTCTA GTAACATGTT CGTGTAAGTT ACGAACCCTC TTCTTGCGAT 7140
5269 CTTCGTCAGG ACTCACCAGC GCTCGGCTCT CGTGTTTTCG GGCCCCGTCA GCAGGCGACT 7200
5270 CGGGGCCTGT CTAGGAACAT GTTTGTGTAT GTGTGCATTC GGAACAAGTG CCGTTGGTCG 7260
5271 CACTCAGGGT GAGGGGTCAA CGGGGGAAGC GGATATAAAA GCAGCGGGGC GGGAGAAGAG 7320
5272 GTCCCAGTCT CGAACGGACA CATAACGGAA CCGCTAGCAG ATCGCGAACT GAATCTTAAA 7380
5273 ATAAAGCTAA TCGTAAACTC GAACCCTCTT AACTATCTTG ACTATTATTT GGAGAACCAC 7440
5274 AGCATGTTGG TTGTCATATC AAGGTGAGGT ATGCGGCAGC GAGTGCCGAG AACCCTGATG 7500
5275 CAAGTGGAAC TTGCGTTAAC T 7521
5276 //
5277 ID DM_ROO standard; DNA; INV; 9092 BP.
5278 XX
5279 AC AY180917;
5280 XX
5281 DR FLYBASE; FBte0000100; Dmel\roo.
5282 XX
5283 SY synonym: B104
5284 XX
5285 FT source AY180917:1..9092
5286 FT SO_feature five_prime_LTR ; SO:0000425:1..429
5287 FT SO_feature three_prime_LTR ; SO:0000426:8665..9092
5288 FT SO_feature CDS ; SO:0000316:1275..8357
5289 FT /name="Dmel\roo\ORF"
5290 FT /db_xref="FLYBASE:FBgn0043856"
5291 FT /db_xref="NCBI_PROTEIN:AAN87269.1"
5292 FT /translation="MMSEKTIQFLKKQSEIILEIRKLEVKPTLTDVEILKLNELQKCF
5293 FT IANHSNLLKIGVVDHEYFNAKQYDLIMMVLEKIKNKNEKIKGESVENTFPKSNTVPKS
5294 FT NPPPTLNLEMRGHPEKEGIAQNNALKVEQAFRNNVGQFRVYLEDTSKLIDSSPDFLKI
5295 FT RKNKIEFLWHKIDNLIEQVNSRFESSLFEEEISELEFDKQNILTAINSRLSGTINKAE
5296 FT MSTVVKAEELPTLPKIQIPTFFGDSKEWDLFNELFTELIHVREDLSPSLKFNYLKSAL
5297 FT KGEARNVVTHLLLGSGENYEATWEFLTKRYENKRNIFSDHMNRLMDMPNLNLESNKQI
5298 FT KTFIDTINESIYIIKLKAQLPEDVDAIFAHIILRKFNKESLNLYESHVKKTKEIQALS
5299 FT DVMDFLEQRLNSISSFSQEVKPVKKMINNNKNKNYSDNCAYCKLPGHYLIQCHKFKIM
5300 FT NPAERSDWVRKNGICLRCLRHPFGKKCISEQLCSTCRKPHHTLLHFAGHNPEKVNTCR
5301 FT TTGQALLATALIQVKSRYGGFEQLRALIDSGSQSTIISEESAQILKLKKFRSHTEISG
5302 FT VSSTGTCISKHKAVISIRNSPKNLEIEAIILPKLMKALPVNTINVDQKKWKNFKLADP
5303 FT DFNKPGRIDLIIGADVYTHILQNGVIKIDGLLGQKTDFGWIVSGCKKSKGKETIVATT
5304 FT IEIKELDRYWEVEEEEKDDIESEICENKFIKTTKKDSDGRYIVSIPFKEDVTLGDSKK
5305 FT QAIARYMNLEKKLKRNEKLKVDYTKFMNEYMDLGHMIEVSDEGKYFLPHQAVIRDSSL
5306 FT TTKLRVVFDASAKTTNNKSLNDIMWVGPRVQKDIFDIIIKWRKWEFVVSADIEKMYRQ
5307 FT IKIDNNDQKYQYILWRNSPKEKIKTYKLTTVTYGTASAPYLATRVLVDIADKCKNQVI
5308 FT SAIIRNDFYMDDLMTGADSVEEANKLITLIPHELQKVGFNLRKWISNNSKILTTVEDT
5309 FT GDNKVLNIIENECVKTLGLKWEPQKDLFKFSVNCNDESKNINKRVVLSTLAKIFDPLG
5310 FT WLAPVTVSGKLFIQKLWINKSEWDQELSIEDKNYWEKYKENLLLLENIRIPRWINSNS
5311 FT SSVIQIHGFADASEKAYAAVVYAKVGPHVNIIASKSRVNPIKNRKTIPKLELCAAHLL
5312 FT SELIQRLKGSIDNIMEIYAWSDSTITLAWINSGQSKIKFIKRRTDDIRKLKNTEWNHV
5313 FT KSEDNPADLASRGVDSNQLINCDFWWKGPKWLADPKELWPRQQSVEEPVLINTVLNDK
5314 FT IDDPIYELIERYSSIEKLIRIIAYINRFVQMKTRNKAYSSIISVKEIRIAETVVIKKQ
5315 FT QEYQFRQEIKCLKIKKEIKTNNKILSLNPFLDKGGVLRVGGRLQNSNAEFNVKHPIIL
5316 FT EKCHLTSLLIKNAHKETLHGGINLMRNYIQRKYWIFGLKNSLKKYLRECVTCARYKQN
5317 FT TAQQIMGNLPKYRVTMTFPFLNTGIDYAGPYYVKCSKNRGQKTFKGYVAVFVCMATKA
5318 FT IHLEMVSDLTSDAFLAALRRFIARRGKCSNIYSDNGTNFVGAARKLDQELFNAIQENI
5319 FT TIAAQLEKDRIDWHFIPPAGPHFGGIWEAGVKSMKYHLKRIIGDTIFTYEEMSTLLCQ
5320 FT IEACLNSRPLYTIVSEKDQQEVLTPGHFLIGRPPLEIVEPMEDEKIGNLDRWRLIQKI
5321 FT KKDFWVKWKSEYLHTLQQRNKWKKEIPNIEEGQIVLLKDENCHPARWPLGKVEKVHKG
5322 FT NDDKVRVAKVKMQEGYITRPITKICPLEGIKSVDKNEADQEPKRRTRATSGMSKIGII
5323 FT MAMLLFVLSCQVSSALPKDIAPRYSIDKINKTSAIYLDPLGDVEIVSTSWNLVIYYKM
5324 FT DPYFKMLTKGNALIQSMRKVCERLHSFEEQCSLVLDNMQSQLSELEENNKLFMMQSRS
5325 FT RSKRAPFEFMGSLYHILFGIMDEDDREQLEENMKNLLDNQNNLDKLIQKQTSVVDSTS
5326 FT NLLKRTTEDVNSNFRSMQIRIENMTEVLKENYYVYKESIKFFMITKQLHSLIEEGEKI
5327 FT QAGIISLLIDINHGRLNTNILRPNQLKKEIAKIQQSLSENLVIPGKRSGTELKEVYTL
5328 FT LTARGLFIDDKLIISAKVPLFSRHPSKLFRLIPVPIRNEDRIIMVHTTSEYLIYNFEI
5329 FT DSYHIMTEATLNQCQKWQLNKRICKGSWPWNSANDNACEIQPLKPDKAANCIYKTVVD
5330 FT SKSYWVELEKKSSWLFKVPANSKVRLQCTGSQIELFDLPQQGVLSIAPYCTARTDDKI
5331 FT LVAHHNIQSESEELLSTPYIGEVSGVPKIIWDPLKLSILNHTEEFERLNNEIKFMKEN
5332 FT HQKLKDLHFHHISGHAGLIIALILMIVLIIYFIRKCAVQQRMQAITFAGPLPVLXX"
5333 XX
5334 CC Sequence from P1 sequence DS00941:20448..29535 provided by
5335 CC Guochun Liao, Berkeley Drosophila Genome Project.
5336 XX
5337 SQ Sequence 9092 BP; 3468 A; 1442 C; 1710 G; 2472 T; 0 other;
5338 TGTTCACACA TGAACACGAA TATATTTAAA GACTTACAAT TTTGGGCTCC GTTCATATCT 60
5339 TATGTAAATG AATCGAGAGC GATAAATTAT ATTTAGGATT TTGTTATCTA AGGCGACATG 120
5340 GGTGCATTGC TCAAAAACAT GTAATTTAAG TGCACACTAC ATGAGTCAGT CACTTGAGAT 180
5341 CGTTCCCCGC CTCCTAAAAT AGTCCCTTAG TGGGAGACCA CAGATAAGGT CCTCGCCGCT 240
5342 CAAGATAGGC AGATGTGCCC GAGCGTGGGA CCTCGATAAG GCGGGGACTA TTTACGTAGG 300
5343 CCTCTGCGTA GGCCATTTAC TTTAAGATGC GATTCTCATG TCACCTATTT AAACCGAAGA 360
5344 TATTTCCAAA TAAAATCAGT TTTTTTACAA AAACTCAACG AGTAAAGTCT TCTTATTTGG 420
5345 GATTTTACAT TTGGTCAATC GAGCCTTTAA TCGACTCTGC AGTTTCCCCC TACCAAAGGT 480
5346 AAGGAACTCA GAGAAAGGCC AGCTCCTTTA AGCATCTTAC AGCTAAAGGT AGCAAAAATA 540
5347 AGTGACTCTT GTTTCCCCCT ACCAAAGGTA AGGAACAGAG TATAAATATA AAAAGCAAAA 600
5348 GATACAAAAG AATCTTTTAT GTTTTAAAAC AAGCACCTTA TAGTCTATAG CTAAAGGTTG 660
5349 CTTTGTGTAC CATTATAAAT TGTGGTAAGG CGTGCTTGAG GCCATACATC AGCAATTGTG 720
5350 AAATTAAAAA GTGCATAACA AAAGTGCCTT ATAAATGCTC TAATAGCATT AAATCAGCTC 780
5351 ATAAATAGAG TGCAGTGTAT ATGCCATAAG AGCATAAATT AAATAAAAAG TGCCTGAAAA 840
5352 CAGTGCCTTA TAAATGCTCT AATAGCATTA AATCAGCTCA TAAATAGAGT GCAGTGTATA 900
5353 TGCCAAAAGA GCATAAATGC CGAAATAAAT GGCTAAAAAA CAAAAAATCT GACTGGACTA 960
5354 CAAAAATAAT AAAACGTGCC AAAAAAAAAA AAAAAATCAT CTTTAAACAT CGACGGAGCC 1020
5355 TTAAAGAAGA GAAGGAAGTC AAATTCAAAG GAGCCTCTAC CAGCAGCAGA AGCAGCAACA 1080
5356 ACAGCAGCAG CAGAAGCAGC AACAGCAGTA GCAACAGCAG CAACAACAGC AGCAACAGCA 1140
5357 GCAGCAACAA CAACGACATC AGCTAAGTCA AAACAAGAAT TTTCTGTTTA TCCAAACACA 1200
5358 CATATATATA TAAATACATA TAAAATACAT ATACACGTAC TATATATATT AAGAAATTAC 1260
5359 AAAAAATTTT CAAAATGATG TCAGAAAAGA CTATTCAATT CCTTAAGAAG CAGTCCGAAA 1320
5360 TTATTTTGGA AATTAGAAAG TTGGAAGTAA AACCAACATT AACAGATGTA GAAATTCTAA 1380
5361 AATTAAATGA GCTTCAAAAA TGTTTCATTG CTAATCATAG CAATTTGTTA AAGATCGGCG 1440
5362 TTGTCGATCA TGAATATTTT AACGCGAAGC AGTATGATTT AATAATGATG GTGTTAGAAA 1500
5363 AAATTAAAAA TAAAAATGAA AAAATTAAGG GCGAGTCGGT AGAAAACACT TTCCCTAAAT 1560
5364 CAAACACTGT CCCTAAATCA AACCCTCCCC CTACATTAAA CCTTGAAATG CGTGGTCACC 1620
5365 CTGAAAAAGA GGGTATAGCA CAAAACAACG CTTTAAAAGT AGAGCAGGCA TTTCGTAATA 1680
5366 ATGTTGGCCA ATTTCGAGTA TATCTAGAAG ATACGTCTAA ACTAATAGAC AGTAGTCCAG 1740
5367 ATTTCCTTAA AATAAGGAAA AATAAAATTG AATTTTTATG GCATAAAATA GATAACCTGA 1800
5368 TTGAACAGGT GAATAGTCGT TTTGAGAGTT CGCTATTCGA AGAAGAAATT AGCGAACTTG 1860
5369 AATTTGACAA ACAAAATATT CTTACAGCCA TTAATAGTCG ACTCAGTGGC ACAATAAATA 1920
5370 AAGCTGAAAT GTCGACGGTT GTTAAGGCGG AGGAGTTACC AACCCTGCCT AAAATACAGA 1980
5371 TTCCCACCTT CTTTGGTGAT TCCAAAGAAT GGGATCTTTT TAATGAACTC TTTACAGAGC 2040
5372 TCATACATGT GAGAGAGGAT CTCAGTCCTT CTCTCAAATT TAATTATCTA AAGTCAGCAT 2100
5373 TAAAAGGAGA AGCCAGAAAT GTGGTTACTC ATTTACTGCT CGGCTCTGGA GAAAATTATG 2160
5374 AAGCCACTTG GGAGTTTTTG ACCAAGCGAT ATGAGAATAA AAGAAACATA TTCTCAGATC 2220
5375 ATATGAATAG GCTTATGGAT ATGCCAAATT TAAATTTAGA ATCCAATAAG CAAATAAAGA 2280
5376 CATTTATTGA CACGATTAAC GAGTCAATTT ATATTATAAA ATTAAAGGCA CAATTACCAG 2340
5377 AAGATGTGGA TGCAATTTTC GCTCACATAA TTCTTCGGAA ATTCAATAAA GAATCACTCA 2400
5378 ATTTATATGA AAGCCATGTT AAAAAGACAA AAGAAATACA GGCACTTTCT GATGTCATGG 2460
5379 ACTTTTTAGA GCAAAGGCTC AATTCTATAT CATCATTCTC ACAGGAAGTA AAACCTGTAA 2520
5380 AGAAAATGAT TAATAATAAC AAGAATAAAA ATTATAGTGA CAATTGTGCA TATTGCAAAC 2580
5381 TACCAGGGCA TTATTTAATT CAATGCCATA AATTTAAAAT AATGAATCCA GCAGAACGGT 2640
5382 CTGACTGGGT AAGAAAAAAT GGGATTTGCC TAAGATGTCT GAGGCATCCG TTTGGTAAAA 2700
5383 AATGTATAAG CGAGCAGCTT TGTTCGACTT GTCGTAAACC TCACCACACG TTACTTCACT 2760
5384 TTGCAGGTCA TAATCCAGAA AAAGTGAATA CGTGTAGAAC AACAGGTCAA GCCTTGTTGG 2820
5385 CCACGGCCTT GATTCAAGTA AAGTCGAGGT ATGGAGGCTT TGAACAATTA AGAGCATTGA 2880
5386 TTGATAGTGG CTCTCAAAGC ACAATTATTT CAGAAGAGTC TGCACAGATT CTAAAATTGA 2940
5387 AAAAATTTCG GTCTCATACT GAAATAAGTG GAGTATCTTC CACAGGAACG TGCATCTCCA 3000
5388 AGCACAAAGC GGTTATTTCG ATAAGAAATT CTCCGAAAAA TTTAGAAATT GAAGCAATTA 3060
5389 TTCTCCCAAA ACTTATGAAG GCACTTCCAG TCAACACGAT TAATGTTGAT CAGAAAAAAT 3120
5390 GGAAGAACTT TAAATTAGCC GACCCCGATT TTAATAAACC GGGTCGCATT GATTTAATCA 3180
5391 TTGGAGCAGA CGTATATACT CACATTCTGC AAAATGGAGT TATAAAAATA GACGGTCTCC 3240
5392 TTGGGCAAAA AACTGATTTC GGGTGGATAG TTTCTGGATG TAAAAAATCC AAAGGAAAAG 3300
5393 AAACCATTGT AGCCACAACA ATAGAAATAA AAGAGTTAGA TCGCTACTGG GAAGTGGAAG 3360
5394 AAGAAGAAAA AGATGATATC GAGTCTGAAA TCTGTGAAAA TAAATTTATC AAAACGACAA 3420
5395 AAAAAGATTC AGATGGGCGA TACATTGTGT CAATTCCATT CAAGGAGGAT GTCACCTTAG 3480
5396 GAGATTCAAA GAAACAAGCG ATAGCTCGTT ACATGAATCT GGAGAAAAAA CTAAAAAGAA 3540
5397 ATGAAAAACT TAAGGTTGAC TACACTAAAT TCATGAATGA ATACATGGAT TTAGGACACA 3600
5398 TGATTGAAGT GAGTGATGAA GGCAAATATT TTTTACCGCA CCAGGCAGTG ATTAGAGATT 3660
5399 CAAGCCTTAC GACCAAATTG AGAGTAGTTT TTGATGCTTC AGCAAAAACT ACGAATAACA 3720
5400 AAAGTTTGAA CGACATAATG TGGGTTGGGC CACGAGTTCA AAAAGATATT TTTGACATTA 3780
5401 TTATTAAATG GAGAAAATGG GAATTTGTTG TTTCGGCAGA CATTGAAAAG ATGTACCGAC 3840
5402 AAATTAAAAT AGATAATAAT GATCAAAAAT ATCAATATAT TTTATGGAGA AATTCTCCAA 3900
5403 AAGAAAAAAT TAAAACATAT AAATTAACCA CAGTCACTTA CGGAACTGCA TCTGCACCAT 3960
5404 ATTTGGCTAC CAGGGTTCTG GTAGATATTG CAGATAAATG TAAAAACCAA GTTATTAGTG 4020
5405 CAATAATTAG GAATGATTTC TATATGGATG ACCTAATGAC TGGAGCTGAT TCGGTAGAAG 4080
5406 AAGCTAATAA ATTAATAACA TTAATTCCCC ATGAATTGCA GAAAGTTGGA TTCAACTTAA 4140
5407 GGAAATGGAT TTCCAACAAT TCCAAAATAT TAACCACTGT GGAGGACACA GGGGACAATA 4200
5408 AGGTTCTCAA TATTATCGAA AATGAATGTG TTAAAACTTT AGGACTAAAA TGGGAACCTC 4260
5409 AAAAGGATTT ATTTAAGTTC AGCGTAAATT GTAATGATGA ATCAAAAAAT ATAAATAAGC 4320
5410 GCGTTGTGTT ATCAACGCTA GCAAAAATAT TTGATCCGTT AGGATGGTTG GCACCAGTCA 4380
5411 CGGTTTCAGG AAAACTTTTT ATTCAAAAAC TTTGGATAAA TAAAAGTGAA TGGGATCAGG 4440
5412 AATTATCCAT AGAAGATAAA AATTATTGGG AAAAATATAA AGAAAATTTA TTATTGTTAG 4500
5413 AGAATATTCG AATCCCAAGG TGGATTAATT CAAACAGTTC TTCAGTCATT CAGATTCACG 4560
5414 GATTTGCGGA CGCCTCCGAA AAAGCATATG CTGCAGTAGT CTATGCTAAA GTAGGACCTC 4620
5415 ATGTTAATAT AATAGCTAGC AAAAGTAGAG TCAACCCTAT AAAAAATAGG AAGACAATTC 4680
5416 CCAAACTCGA GCTGTGTGCA GCTCACCTGC TTAGTGAATT AATCCAAAGA CTAAAAGGAT 4740
5417 CAATTGACAA TATAATGGAG ATCTATGCTT GGAGTGATTC CACGATTACC TTAGCATGGA 4800
5418 TTAACAGTGG TCAAAGTAAG ATCAAATTTA TAAAAAGAAG AACGGATGAC ATTCGGAAAT 4860
5419 TAAAAAATAC TGAATGGAAT CATGTTAAGT CAGAGGATAA TCCAGCAGAT TTAGCATCCA 4920
5420 GGGGAGTGGA TTCTAACCAG TTGATCAACT GTGATTTTTG GTGGAAAGGT CCGAAATGGC 4980
5421 TAGCAGACCC AAAAGAACTT TGGCCTCGGC AGCAGTCTGT AGAAGAACCT GTCTTAATAA 5040
5422 ATACGGTATT AAATGACAAA ATAGATGATC CTATTTACGA ATTAATAGAA AGGTATTCCA 5100
5423 GTATAGAAAA ACTTATACGT ATAATAGCAT ACATAAATAG ATTCGTGCAG ATGAAAACAA 5160
5424 GAAATAAAGC CTATTCATCA ATTATTTCAG TAAAGGAGAT AAGAATAGCG GAAACAGTTG 5220
5425 TTATTAAGAA ACAACAAGAA TACCAGTTTA GGCAAGAGAT AAAGTGCCTT AAAATCAAAA 5280
5426 AGGAAATCAA GACAAATAAT AAAATATTGT CATTGAATCC ATTTTTGGAC AAGGGTGGGG 5340
5427 TTCTAAGAGT TGGAGGAAGA TTGCAAAATT CCAATGCAGA ATTTAATGTT AAACATCCAA 5400
5428 TCATTTTAGA AAAATGCCAC CTAACAAGCT TATTAATAAA AAATGCTCAT AAGGAAACAT 5460
5429 TGCATGGAGG GATAAACCTA ATGCGAAACT ATATCCAAAG AAAGTATTGG ATTTTCGGGT 5520
5430 TGAAAAATTC GTTGAAAAAG TATTTAAGAG AATGTGTAAC GTGTGCAAGG TATAAACAAA 5580
5431 ATACAGCTCA GCAAATAATG GGTAACTTGC CAAAATATAG AGTGACGATG ACATTCCCGT 5640
5432 TTCTTAATAC TGGAATAGAT TACGCAGGTC CTTATTATGT TAAATGTTCA AAAAATCGTG 5700
5433 GCCAAAAAAC ATTTAAAGGA TACGTTGCTG TATTCGTTTG CATGGCCACC AAAGCCATAC 5760
5434 ACTTAGAAAT GGTAAGCGAT CTAACTTCAG ACGCATTTTT AGCAGCACTC AGAAGATTTA 5820
5435 TTGCTAGACG GGGAAAATGT TCCAATATCT ATTCAGACAA CGGAACAAAT TTTGTAGGAG 5880
5436 CTGCAAGAAA ATTAGATCAA GAGTTATTTA ATGCAATACA AGAAAATATA ACGATTGCAG 5940
5437 CGCAACTTGA AAAGGACAGG ATTGATTGGC ATTTTATTCC CCCGGCAGGA CCTCACTTCG 6000
5438 GAGGTATTTG GGAAGCTGGA GTTAAGTCAA TGAAATACCA TTTAAAGCGT ATAATCGGCG 6060
5439 ACACTATTTT TACTTATGAA GAAATGTCAA CTCTTTTATG TCAAATAGAA GCATGCTTAA 6120
5440 ATTCAAGGCC ATTATACACT ATAGTTAGTG AGAAGGACCA ACAAGAAGTT TTAACACCAG 6180
5441 GTCATTTTTT AATTGGAAGA CCACCTTTAG AAATAGTCGA ACCAATGGAA GATGAAAAAA 6240
5442 TCGGAAATTT GGATAGGTGG AGACTTATCC AAAAAATAAA GAAAGATTTC TGGGTTAAGT 6300
5443 GGAAAAGTGA ATATTTGCAT ACGCTCCAGC AAAGGAATAA ATGGAAAAAG GAAATTCCTA 6360
5444 ATATAGAAGA AGGGCAAATA GTTTTATTAA AGGATGAGAA TTGTCATCCT GCAAGATGGC 6420
5445 CTTTAGGAAA GGTGGAAAAG GTGCATAAGG GGAATGATGA TAAGGTCCGA GTGGCTAAAG 6480
5446 TAAAGATGCA GGAAGGATAT ATCACTAGAC CCATTACTAA AATTTGTCCC TTGGAAGGAA 6540
5447 TAAAGTCTGT TGACAAAAAT GAGGCTGACC AAGAGCCAAA AAGACGAACT AGAGCGACAT 6600
5448 CGGGAATGTC CAAGATCGGA ATCATTATGG CAATGTTGTT GTTTGTGTTA AGTTGTCAAG 6660
5449 TTTCTAGCGC ATTACCTAAA GATATAGCAC CAAGATATTC TATAGACAAA ATAAATAAAA 6720
5450 CCTCAGCAAT ATATCTAGAC CCGCTAGGAG ATGTTGAGAT TGTGAGTACT TCTTGGAATT 6780
5451 TGGTTATCTA TTATAAAATG GATCCATATT TTAAAATGTT AACAAAGGGT AATGCGCTTA 6840
5452 TACAAAGTAT GAGGAAAGTT TGCGAAAGAC TTCATAGCTT TGAAGAGCAA TGTAGTCTAG 6900
5453 TCTTAGATAA TATGCAAAGT CAGTTATCGG AACTTGAAGA AAACAATAAA TTGTTTATGA 6960
5454 TGCAGTCTAG ATCTAGAAGC AAGCGTGCTC CTTTCGAATT TATGGGTTCC TTGTATCATA 7020
5455 TTTTATTTGG TATAATGGAT GAAGATGATA GAGAGCAATT AGAAGAAAAT ATGAAGAATT 7080
5456 TGTTAGATAA CCAGAACAAC CTTGATAAAC TAATTCAAAA ACAAACATCT GTGGTTGATT 7140
5457 CAACTTCTAA TCTATTAAAG AGAACAACAG AAGATGTTAA CTCCAATTTT AGAAGTATGC 7200
5458 AAATAAGAAT TGAGAACATG ACAGAAGTTC TTAAAGAAAA TTATTATGTT TATAAGGAAT 7260
5459 CAATAAAATT CTTTATGATT ACGAAACAGC TACACTCATT GATTGAAGAA GGCGAAAAAA 7320
5460 TTCAAGCAGG CATTATAAGC CTGTTGATTG ATATTAATCA CGGTAGGCTA AATACAAATA 7380
5461 TTCTCAGGCC AAATCAGCTT AAAAAAGAAA TTGCCAAAAT TCAGCAGAGT CTTTCAGAGA 7440
5462 ACCTAGTAAT TCCAGGAAAA CGGTCAGGTA CGGAACTTAA GGAGGTGTAT ACACTGTTAA 7500
5463 CAGCCAGGGG TTTATTCATC GACGATAAAT TGATCATTAG TGCAAAAGTG CCTCTGTTTA 7560
5464 GCAGGCATCC ATCCAAATTG TTCAGGCTTA TTCCGGTGCC AATTCGAAAT GAAGATCGGA 7620
5465 TAATAATGGT GCATACAACG TCCGAATATT TAATTTATAA TTTTGAGATA GATTCCTATC 7680
5466 ACATAATGAC GGAAGCCACA TTAAATCAAT GTCAGAAATG GCAACTAAAT AAGAGAATAT 7740
5467 GCAAAGGAAG TTGGCCCTGG AATTCAGCGA ATGATAATGC ATGTGAGATT CAGCCTCTAA 7800
5468 AGCCAGATAA AGCGGCGAAC TGCATCTATA AAACAGTAGT CGACTCTAAA AGTTACTGGG 7860
5469 TAGAGTTAGA AAAGAAAAGT AGTTGGTTGT TTAAGGTTCC TGCGAATTCA AAAGTCCGTC 7920
5470 TGCAATGTAC TGGCTCTCAA ATTGAATTGT TTGATTTGCC TCAGCAAGGA GTTTTAAGCA 7980
5471 TTGCGCCATA TTGTACGGCA AGAACCGACG ATAAAATTCT AGTTGCCCAC CATAACATTC 8040
5472 AGTCCGAAAG TGAAGAATTA TTATCAACAC CTTATATAGG AGAAGTTAGT GGAGTGCCGA 8100
5473 AGATTATTTG GGATCCGCTG AAACTATCAA TATTAAATCA TACTGAGGAA TTTGAACGAT 8160
5474 TGAATAATGA AATTAAATTT ATGAAAGAGA ACCATCAAAA ATTGAAAGAT TTACATTTCC 8220
5475 ATCATATTTC CGGACATGCT GGATTAATTA TTGCTTTAAT ACTAATGATA GTATTAATAA 8280
5476 TATATTTCAT ACGGAAATGT GCTGTGCAAC AAAGAATGCA AGCAATAACC TTTGCAGGTC 8340
5477 CGTTGCCAGT ACTATAAATA TCAATAGTAA ATAAACAATA AAATAATATA ACAAATAAAA 8400
5478 ATATACAGTC CACTAATAGA AAATGTACTT CTACATAGAA AAAGCAAAAT GTTTAAAATA 8460
5479 AGTTAATTAA GTACAAATTG TTGAATTAAA AATAATATAA ACCATAATTG TAATCCAATA 8520
5480 AAATTAAAAG CCAGAAAAAC TAGGCCCATT GAAATCTTAG TTGCAAAATA AATGAACATA 8580
5481 TATCAAATAA ATACAGTCCA CTACTGTTAT AAATGCAACT AATATACTAA TGTACATCTC 8640
5482 AGCTTTGCTG GCCCTTTGGC AGAATGTTCA CACATGAACA CGAATATATT TAAAGACTTA 8700
5483 CAATTTTGGG CTCCGTTCAT ATCTTATGTA AATGAATCGA GAGCGATAAA TTATATTTAG 8760
5484 GATTTTGTTA TCTAAGGCGA CATGGGTGCA TTGCTCAAAA ACATGTAATT TAAGTGCACA 8820
5485 CTACATGAGT CAGTCACTTG AGATCGTTCC CCGCCTCCTA AAATAGTCCC TTAGTGGGAG 8880
5486 ACCACAGATA AGGTCCTCGC CGCTCAAGAT AGGCAGATGT GCCCGAGCGT GGGACCTCGA 8940
5487 TAAGGCGGGG ACTATTTACG TAGGCCTCTG CGTAGGCCAT TTACTTTAAG ATGCGATTCT 9000
5488 CATGTCACCT ATTTAAACCG AAGATATTTC CAAATAAAAT CAGTTTCTTA CAAAAACTCA 9060
5489 ACGAGTAAAG TCTTCTCATT TGGGATTTTA CA 9092
5490 //
5491 ID BLOOD standard; DNA; INV; 7410 BP.
5492 XX
5493 AC AY180916;
5494 XX
5495 DR FLYBASE; FBte0000279; Dmel\blood.
5496 XX
5497 FT source AY180916:1..7410
5498 FT SO_feature five_prime_LTR ; SO:0000425:1..398
5499 FT SO_feature three_prime_LTR ; SO:0000426:7011..7410
5500 FT SO_feature CDS ; SO:0000316:966..1271
5501 FT /name="Dmel\blood\sORF"
5502 FT /db_xref="FLYBASE:FBgn0045863"
5503 FT /db_xref="NCBI_PROTEIN:AAN87266.1"
5504 FT /translation="MSTKQTFEHPAPVEQRDLPSIKEVIEVDPSAGPKPLTIQEYKAR
5505 FT TAAREQPPKKKRGGRRIKLLSARRLNIELLKTATNEEDRQRYKERLAAINQQLRGAK"
5506 FT SO_feature CDS ; SO:0000316:1863..3116
5507 FT /name="Dmel\blood\ORF1"
5508 FT /db_xref="FLYBASE:FBgn0045865"
5509 FT /db_xref="NCBI_PROTEIN:AAN87267.1"
5510 FT /translation="MEWLNLTISINNIRDAFDKSYKCINKTALIKTQTLIFHIKVLIT
5511 FT QYNTLQNLIVTNKSKLTEEHKVQCFKVLSSFGKRLHNTSVRHSIIIEVPTELTKIAEF
5512 FT DESQLRDLDESQPLEDLDIESDIESIEELKFNTVQPNTRNMANALEAQRAYVKQVSAT
5513 FT VPDFDGKKLHLNRFVTALKLTDLTKGDQETLAVEVIKTKIIGPLNYKVEHATTIQAII
5514 FT TILQANVKGESPDVIKAKLINAQQRGKTASQYVTEIDSMRKQLEAAYIDGGLDADNAD
5515 FT KFATKESISAMTKNCANEALKMILTAGTFSTFNDAMEKYLHCSTEITGNSNTVLFYNG
5516 FT NNRRGNYNAYYRGRGRNNYNHNYNQNYNQGYNNNNRGRGGYRGHGNNRDGGNRRGNQS
5517 FT QNNNNNRNVRNVQSENSQTPLSDQQ"
5518 FT SO_feature CDS ; SO:0000316:3749..6733
5519 FT /name="Dmel\blood\ORF2"
5520 FT /db_xref="FLYBASE:FBgn0045864"
5521 FT /db_xref="NCBI_PROTEIN:AAN87268.1"
5522 FT /translation="MKDYDIFTTPVEKENRTEEILKQLRFPKQFNNELTKLCTEFSDI
5523 FT FGLETEPISANNFYKQKLRLGEKTPVYIKNYRMADSQKPEIARQVKKLIDDGIVEPSM
5524 FT SEYNSPLLLVPKKPLPNSTEKRWRLAVDYRQINKKLLSDKFPLPRIEDILDQLGRAKY
5525 FT FSCLDLMSGFHQIELEKRYRDITSFSTANGSYRFTRLPYGLKVAPNSFQRRMTLAFSG
5526 FT LEPSQAFLYMDDLVVIGCSEKHMLKNLTNVFELCRRHNLKLHPGKCSFFMKEVTYLGH
5527 FT KCTDKGILPDDTKYEVIEKYPIPTDADSARRFVAFCNYYRRFIKNFSDHSRHLTRLCK
5528 FT KNVQFEWTAECNDAFEYLKTELMKPTLLQYPDFGKEFCITTDASKQACGAVLTQDHNG
5529 FT QQLPVAYASRMFTQGESNKSTTEQELTAIHWAINHFRPYIYGKHFMVKSDHRPLSYLF
5530 FT SMKNPSSKLTRMRLDLEEYDFTVEYLKGKDNHIADALSRITIKDLKTINREILKVTTR
5531 FT SKAKQENSCKDEAIVKIQEEKEQTIEKPKVYEVVNNNDTKKYVLIKIDKHKCLLKRGK
5532 FT TIVSRFDVDDLYSNETFDLNQFFQRLISKAGMHKITKMRISPSEQMFQFVSLNEFKIK
5533 FT GNRVLEKVELAILQKVIIIDKNDEAQIKEILTKFHDDPIEGGHTGISRTQSKIKRFYY
5534 FT WPQMTKTISKYVKTCLKCQQAKITTHTKTPLTLMPTPATAFDTVLIDTIGPLPKSEDG
5535 FT NEYAVTIICDLTKFLVTIPTPNKSAKTVAKAIFELFVLKYGPMKTFITDQGTEYKNSL
5536 FT MNELCKYMHIENLTSSAHHHQTLGTIERSHRTFNEYIRSYISVNKSDWDIWLPYFTYC
5537 FT FNTTPSIVHDYCPYELVFGRLPRQFKDFSKINKIDPIYNLDDYSKELKCRLELSYNRA
5538 FT RRMLEKAKADRKLRYDRNTNNFELKIGDKVLLRKETGHKLDKRYEGPYDVVDIGINDN
5539 FT ITIKTGSKKQQIVHKDRLKKHK"
5540 XX
5541 CC Sequence from P1 (complement)DS03023:69372..76782 provided by Guochon Liao,
5542 CC Berkeley Drosophila Genome Project.
5543 XX
5544 SQ Sequence 7410 BP; 2840 A; 1403 C; 1328 G; 1839 T; 0 other;
5545 TGTAGTATGT GCATATATCG AGGGTACACT GTACCTATAA GTACACAGCA ACACTTAGTT 60
5546 GCATTGCATA AATAAATGTC TCAAGTGAGC GTGATATAAG ATCACCCATT TATGCTTTAA 120
5547 GCTAAGTCAG CATCCCCACG CTGGCCGCTG GCCATATATG CGCATAAGCT CTCTCTCTCT 180
5548 CTCTCTTATA CATATATATA TACGCTGCTC TTCTGCCGCT GTCGACGGCG GCGCAGTCGC 240
5549 AGTATTTAGG TAAGATTAGA CACTCTGTAG AGGTTAAGCG GGCAGAACCG TTTCTGCTAC 300
5550 TCGAAGAGAT AAGAAGAAAT AAAAAGGTGC CTGACGGCTG CACCCAACTG CAAGGAAAAC 360
5551 ACGTGTTCTC AATTGGTGGC ATATATTGGT TTATTACATG GCGACCGTGA GGCAGGAGCC 420
5552 TGCGATCTGA GGACTACTGA GGAAATGCTG CTAATATTGC CGATTTGATT TGGGAATTCT 480
5553 AAACAGCGAC AACAGGTGTG AGAAGCAGGC CGCCCCTTAC ACCAGTGCGG GAGACCTAGA 540
5554 GACGGGACAC TGATGAAAAA AAAAGAAACA AAAATACTGA GTGAGTAGAG TGTGGTAATG 600
5555 GGCAAACGCG GATGTCAGGA AATCAAAAAT AAAGGTATAG CACATATTAA GTGGCTATGA 660
5556 TATACAAATA AAACACCGCC CCCATGGGCA ACGGCACAGA AATTAACTGC CGAATTAGAC 720
5557 TTTCTGAAAG AAAACCTCCA GCAAAGAAAG CCGAATACCA CAACTCACTC AGCAAAAATA 780
5558 GAAATAATCA ATGAAGAAAT AACTGAAAAT TCAACATCAC CCAAGCCGAA AAGACCCGAC 840
5559 GTCTGCATGA AAGACTGCCC TCGACCATTG TAAGCCGCAA CAGCAATTAG CACGGCATCC 900
5560 TGCGAGGGTA GGATTAGGAT AAAGGATAAA GGATTCCACC GGCGCGCCGC ACATGACAAC 960
5561 AGCGAATGTC TACCAAGCAG ACGTTCGAAC ACCCTGCTCC TGTCGAGCAA AGGGATCTGC 1020
5562 CAAGTATCAA AGAGGTAATA GAGGTAGATC CGTCCGCGGG ACCAAAGCCC TTGACCATAC 1080
5563 AAGAGTACAA GGCACGGACT GCAGCGAGGG AGCAGCCACC TAAAAAGAAG AGGGGTGGCC 1140
5564 GCCGGATTAA GTTGCTCAGC GCCCGGAGGC TCAACATCGA ACTACTGAAG ACGGCAACTA 1200
5565 ATGAGGAAGA CCGGCAGCGC TACAAAGAGC GCCTTGCAGC CATCAATCAA CAACTTCGTG 1260
5566 GTGCGAAGTA AAGCGGCGGG CTGCGTTATA CGCCATAGCC TCAACCGCCC AAATATTATA 1320
5567 TTAATGTTGT CGATGCGGTT TCCGCTGCAA CAAAATTACT AACTTATCAG GGACCCATTT 1380
5568 CATAACTAAC ACATTATACT CAGTCCTAAA CTTAAAATAA GTAATAATAT TGTAAAATTG 1440
5569 CAAATTGCAA CCGATGTAAA CTGAGTATAA TGAATTCATC TATCAAGTAA AAATATGTTT 1500
5570 AACAACAGTT TAGACCTATT AAAATTTCGA GCTATATTTA TATCTGATCG AGATAACAAT 1560
5571 AATTGACCAA TTCTCAAAGT TAAAATTCTA TTTGTACTTT TGATATACAA ATAAAGACTA 1620
5572 ATTTTCCCCA TATCAAAATG GGACATAAGT CGTGGATACA ACCCCACAGT TAAATTCAAT 1680
5573 GTACTTACTA TTTTTGATTT TAGTTATCCT ATCAGCCTTT TTACCTTGGC CTTAAAACTT 1740
5574 TATCAGTTTC ACACAAGATC GTTGAAAAGA CTTACATGAG TCGAGCCAAT GATTTAGACA 1800
5575 AAATCTAATA GAAACTACAC CAAAAAGGTA CAAGGTCGAT TACATCGCTA AAAGGTACAT 1860
5576 ACATGGAATG GCTAAACTTA ACCATATCCA TAAACAATAT TAGAGATGCT TTTGATAAAT 1920
5577 CCTATAAATG TATTAATAAA ACCGCGCTGA TCAAAACTCA GACGCTTATT TTTCACATAA 1980
5578 AGGTATTGAT AACACAATAC AACACATTAC AAAACCTAAT AGTAACAAAC AAAAGCAAAC 2040
5579 TCACTGAAGA ACATAAAGTC CAATGCTTCA AAGTTCTCAG TTCATTTGGT AAAAGACTAC 2100
5580 ATAATACCAG CGTTAGACAC AGTATTATAA TAGAAGTCCC AACAGAACTA ACCAAAATAG 2160
5581 CAGAATTCGA CGAAAGCCAG TTAAGAGACT TGGACGAGTC GCAGCCGTTA GAAGATTTAG 2220
5582 ATATCGAAAG CGATATCGAA TCAATAGAAG AATTAAAATT TAATACCGTA CAACCAAATA 2280
5583 CAAGAAACAT GGCCAACGCA TTAGAAGCTC AGAGAGCATA CGTTAAACAG GTATCTGCCA 2340
5584 CAGTACCTGA TTTCGATGGT AAGAAACTCC ATTTAAACAG GTTTGTGACA GCACTTAAGT 2400
5585 TGACGGATCT AACTAAAGGA GATCAAGAAA CTTTAGCAGT AGAGGTCATA AAGACCAAAA 2460
5586 TTATTGGCCC ATTAAACTAT AAAGTAGAAC ATGCGACAAC GATACAGGCA ATAATTACCA 2520
5587 TATTGCAGGC AAACGTAAAA GGCGAATCGC CTGACGTTAT AAAGGCCAAA TTAATAAATG 2580
5588 CCCAACAAAG AGGCAAGACC GCGTCTCAGT ATGTTACAGA AATAGACAGT ATGCGTAAGC 2640
5589 AGCTCGAGGC AGCTTACATA GACGGCGGAT TAGACGCCGA TAATGCTGAC AAATTCGCGA 2700
5590 CTAAAGAGTC GATATCAGCA ATGACCAAAA ACTGTGCCAA CGAGGCACTT AAAATGATCT 2760
5591 TAACTGCAGG TACATTTAGT ACATTCAACG ACGCAATGGA AAAATACCTA CATTGCAGTA 2820
5592 CAGAAATAAC CGGCAATTCA AATACAGTCT TATTCTATAA TGGGAATAAT AGACGTGGTA 2880
5593 ATTATAATGC CTACTATCGT GGTAGAGGCA GAAATAATTA TAACCATAAT TATAACCAGA 2940
5594 ATTATAACCA AGGTTATAAT AATAACAACA GAGGTCGCGG AGGCTACCGC GGCCACGGTA 3000
5595 ATAACAGAGA CGGAGGTAAC CGAAGGGGTA ACCAAAGTCA GAATAATAAT AACAACCGAA 3060
5596 ATGTGCGTAA CGTACAATCG GAAAACAGCC AGACCCCCTT AAGCGATCAA CAGTAAAAGT 3120
5597 GTTTAAAGTA AACCTAAATC TGAGTATTTT CATTAAGACA AAAAACCATG AAACAAACAC 3180
5598 AGTTCTTACA TTACTAATAG ACACAGGTGC AGAAATTTCA TTGCTAAAAG CCAAAGCAAA 3240
5599 GGAATATAAT AATATAAATT TCAGTAATAT ATCAAATATT ACAGGTATTG GGCAAGGAAC 3300
5600 CATACAGTCT ATAGGTACAG TAGATCTTGA CATACGCATT CAGGATGTTC TAGTGCCACA 3360
5601 TGAATTTCAT GTAGTACCTG AGAATTTTCC GATACCATGC GATGGCATAA TCGGAATAGA 3420
5602 TTTTATCAAG AAATACAATT GCGTATTAGA GTTTCAAAAT AACAAAGACT GGTTCACAAT 3480
5603 AAGACCCAAT AACTTCAGTA GACAGATTAG TGTACCAATT ACACATAACT TAGACTCCAA 3540
5604 CACACTCTTA TTGCCAGCTA GATGCGAAGT AATCAGACAA GTCAAATTAC TCACTAACGA 3600
5605 AAAAACGGTG GTAGTACCAA ATCAGGAGCT GCAACCAGGT ATAATAGTAG CAAGCACCAT 3660
5606 TGCCGATAGC AAAAACGCAT TGATTCGCAT TATAAATACA AATAATAAAG ACGCCATAAT 3720
5607 AGATAGCGCG AAGATCAAAT GCGAATCAAT GAAAGACTAT GACATTTTTA CAACACCAGT 3780
5608 AGAAAAGGAA AATAGAACTG AAGAAATTTT AAAACAATTA AGATTCCCTA AACAATTCAA 3840
5609 TAATGAACTA ACTAAGTTAT GCACCGAGTT TAGCGATATT TTTGGTCTAG AAACAGAACC 3900
5610 AATATCGGCT AACAATTTCT ACAAACAAAA ACTCAGATTA GGGGAAAAAA CACCGGTCTA 3960
5611 TATAAAAAAC TATCGCATGG CAGATAGCCA AAAACCAGAA ATCGCCAGAC AGGTAAAAAA 4020
5612 ATTAATAGAT GATGGAATAG TTGAACCATC AATGTCTGAA TATAATAGTC CATTACTTTT 4080
5613 GGTTCCAAAG AAACCACTTC CGAATTCCAC GGAAAAAAGA TGGCGATTAG CAGTTGACTA 4140
5614 TCGTCAAATA AATAAGAAAC TATTATCAGA CAAATTTCCA CTTCCAAGAA TAGAAGATAT 4200
5615 TCTTGATCAA TTAGGAAGAG CAAAGTATTT TTCATGTCTC GACCTAATGT CTGGATTCCA 4260
5616 CCAGATAGAA CTAGAAAAAA GGTATAGAGA TATAACGTCA TTTTCAACAG CCAATGGCTC 4320
5617 ATATCGCTTC ACGCGATTAC CATACGGACT GAAAGTAGCA CCAAACTCCT TCCAACGTAG 4380
5618 GATGACACTT GCATTTTCTG GTCTTGAACC ATCGCAAGCA TTTCTATATA TGGATGACTT 4440
5619 AGTAGTAATA GGTTGTTCAG AAAAACATAT GCTCAAAAAT TTGACTAACG TATTCGAGCT 4500
5620 ATGTAGACGA CATAATTTGA AACTACATCC AGGGAAATGT TCTTTCTTTA TGAAAGAAGT 4560
5621 AACATATTTG GGTCACAAAT GTACCGATAA AGGTATACTC CCAGATGACA CCAAATATGA 4620
5622 AGTTATAGAA AAATATCCTA TACCAACAGA TGCCGACAGT GCTAGGCGTT TCGTAGCCTT 4680
5623 CTGTAATTAT TACAGACGTT TCATTAAAAA TTTTTCTGAT CATTCACGCC ACTTAACGAG 4740
5624 GCTTTGTAAA AAGAATGTTC AATTCGAATG GACAGCAGAA TGCAATGATG CATTCGAATA 4800
5625 CCTTAAAACA GAATTAATGA AACCAACATT ACTACAGTAC CCAGATTTCG GTAAAGAATT 4860
5626 TTGCATAACA ACCGATGCTA GTAAACAGGC ATGCGGAGCG GTACTTACAC AAGATCACAA 4920
5627 TGGTCAACAA CTTCCAGTGG CATACGCTTC AAGAATGTTC ACTCAAGGTG AAAGTAATAA 4980
5628 GTCCACTACA GAACAAGAAT TAACGGCCAT TCATTGGGCC ATAAATCATT TTCGACCATA 5040
5629 CATATATGGC AAGCATTTCA TGGTAAAAAG CGATCATAGA CCATTGTCAT ACCTATTCTC 5100
5630 TATGAAAAAT CCAAGTTCAA AACTCACTCG TATGAGGCTG GATTTAGAAG AGTATGACTT 5160
5631 TACTGTAGAA TATCTTAAGG GGAAAGATAA CCATATTGCG GACGCCTTGT CTCGCATAAC 5220
5632 AATAAAAGAT CTGAAAACAA TCAACAGAGA AATATTAAAA GTTACCACCA GATCAAAAGC 5280
5633 TAAACAGGAA AATTCCTGTA AGGACGAAGC AATAGTCAAA ATACAAGAGG AAAAAGAGCA 5340
5634 AACAATAGAA AAGCCCAAAG TCTATGAAGT TGTCAATAAT AATGACACAA AGAAATATGT 5400
5635 TTTAATCAAA ATAGATAAAC ACAAGTGTTT ATTAAAACGA GGAAAAACAA TTGTTTCACG 5460
5636 CTTTGATGTT GATGACTTGT ATTCTAATGA AACATTTGAT CTAAATCAAT TCTTTCAAAG 5520
5637 GCTTATTTCA AAAGCCGGAA TGCATAAAAT AACAAAAATG CGAATATCAC CAAGCGAACA 5580
5638 GATGTTCCAA TTTGTATCAC TAAATGAATT TAAAATAAAG GGCAACCGAG TACTCGAAAA 5640
5639 AGTAGAACTA GCTATTCTAC AAAAGGTGAT AATTATAGAC AAAAATGACG AAGCTCAGAT 5700
5640 TAAAGAAATT TTGACAAAAT TCCATGATGA TCCTATAGAA GGAGGCCACA CTGGTATTTC 5760
5641 GCGAACCCAG TCAAAAATCA AAAGATTTTA TTATTGGCCC CAGATGACCA AGACAATCTC 5820
5642 AAAGTATGTA AAGACTTGTT TGAAATGTCA ACAAGCCAAA ATTACAACAC ATACGAAAAC 5880
5643 TCCATTAACA TTGATGCCAA CGCCAGCAAC AGCATTTGAT ACTGTTTTAA TTGATACCAT 5940
5644 TGGTCCACTA CCGAAATCGG AAGACGGAAA TGAGTATGCA GTTACAATCA TATGCGATCT 6000
5645 AACCAAGTTT TTAGTAACTA TTCCAACACC AAATAAAAGT GCTAAAACAG TTGCAAAGGC 6060
5646 TATATTTGAA TTATTTGTAC TGAAGTACGG TCCAATGAAG ACGTTCATTA CAGATCAAGG 6120
5647 TACGGAATAC AAAAATTCAC TTATGAATGA ATTATGCAAA TATATGCATA TAGAAAATCT 6180
5648 AACATCTAGC GCTCACCATC ATCAAACTTT AGGAACAATA GAAAGAAGCC ACCGAACTTT 6240
5649 TAATGAATAT ATACGTTCAT ACATATCGGT TAACAAAAGT GATTGGGACA TTTGGTTACC 6300
5650 ATATTTCACT TATTGCTTCA ATACAACACC CTCAATAGTC CATGACTATT GCCCATACGA 6360
5651 ACTAGTATTT GGCAGACTAC CCAGACAATT CAAAGATTTC AGTAAGATAA ACAAAATAGA 6420
5652 CCCAATATAC AACTTAGACG ACTACTCTAA AGAGCTTAAA TGCAGACTAG AATTGTCGTA 6480
5653 CAACAGAGCA AGAAGAATGT TAGAAAAAGC AAAAGCGGAT AGAAAATTAA GATATGATAG 6540
5654 GAATACAAAT AATTTCGAAT TAAAAATAGG AGATAAAGTA TTACTTAGAA AAGAAACAGG 6600
5655 TCATAAGTTA GATAAAAGAT ATGAAGGTCC TTATGACGTA GTAGATATAG GAATAAATGA 6660
5656 CAATATAACC ATTAAAACAG GAAGTAAGAA ACAACAAATA GTACATAAAG ATAGGCTAAA 6720
5657 AAAGCACAAA TAGAATGAAA AAAAAAAAGG GCAATCAATG CCAAACCTTT CATAATAAAA 6780
5658 CTTAAATAAC GGCCTGATCA GCCAAAACAA TATAACAAAG ACATAGACAT AATCGAATTT 6840
5659 TTATTAATTC AAAATACATA CATATTTTTT CTTTATTCAT TTAAAAATTC TATATCATAA 6900
5660 ATAATGTTAA TTCATTAAAA ATAATATTTA AGTAATTTTT ATTTTATAAT GGTAATATAG 6960
5661 TTGATAGAAA ATAACTTCAT TTCTTTACGT TATTTTAAAA AAGAGGGGAG GTGTAGTATG 7020
5662 TGCATATATC GAGGGTACAC TGTACCTATA AGTACACAGC AACACTTAGT TGCATTGCAT 7080
5663 AAATAAATGT CTCAAGTGAG CGTGATATAA GATCACCCAT TTATGCTTTA AGCTAAGTCA 7140
5664 GCATCCCCAC GCTGGCCGCT GGCCATATAT GCGCATAAGC TCTCTCTCTC TCTCTCTTAT 7200
5665 ACATATATAT ATACGCTGCT CTTCTGCCGC TGTCGACGGC GGCGCAGTCG CAGTATTTAG 7260
5666 GTAAGATTAG ACACTCTGTA GAGGTTAAGC GGGCAGAACC GTTTCTGCTA CTCGAAGAGA 7320
5667 TAAGAAGAAA TAAAAAGGTG GCCTGACGGC TGCACCCAAC TGCAAGGAAA ACACGTGTTC 7380
5668 TCAATTGGTG GCATATATTG GTTTATTACA 7410
5669 //
5670 ID DMZAM standard; DNA; INV; 8435 BP.
5671 XX
5672 AC AJ000387;
5673 XX
5674 DR FLYBASE; FBte0000217; Dmel\ZAM.
5675 XX
5676 FT source AJ000387:1..8435
5677 FT SO_feature five_prime_LTR ; SO:0000425:1..473
5678 FT SO_feature three_prime_LTR ; SO:0000426:7963..8435
5679 FT SO_feature CDS ; SO:0000316:join(494..531,6387..8004)
5680 FT SO_feature start_codon ; SO:0000318:1..3
5681 FT /name="Dmel\ZAM\env"
5682 FT /db_xref="FLYBASE:FBgn0024272"
5683 FT /db_xref="SPTREMBL:O46113"
5684 FT /db_xref="NCBI_PROTEIN:CAA04048.1"
5685 FT /translation="MENTLLNLLLVLLSCHGAYQSIFIHNFNSTNLLAKVPVGKTLVIG
5686 FT NYKKISHIIDLSEYTNCIEKLYHTIDTLRQDETLTDSISILNAKLAQTQSKIDALTPFS
5687 FT RHKRGLINGLGSLVKVVTGNMDANDAKNIETEINHLKSQSTTISDNFEIQNSFNDEVQL
5688 FT RFKNLTRHINNEQNLIKNFFENTQNTIYTKIYNNEEEIKKLQYINRLNYNIDLLVSHLS
5689 FT DIIESTLLAKINVIPKLILDKTEITKIKQIFKTQNYTIKSEQHIYNLLKMNALNYQNKI
5690 FT IFSIKIPIFLSCNYEMARLIPLPINSTQFVIAPKYLIYNNKSNSMFSTMYKCPVIEEQF
5691 FT VCEIDSINNLKNNTCLGHLIQNKTSYCDIKETGLTTDVFEPEKGFILVFNGNNLPIISS
5692 FT NQTITSINGSAIIKYNNCTLKINEINYDNRAVSTEEHPDFFLPPMRKLIKNATINILTL
5693 FT ERLHLDTLTTSNKLLVVAAGNSRHSTTLYILFTVSLVAVILTWTLRRDTHIFHTGPDHI
5694 FT LPIVAPPIPPSMAFAPNWGGRSYRPIGTIHHPSL"
5695 FT SO_feature CDS ; SO:0000316:1789..2820
5696 FT SO_feature start_codon ; SO:0000318:1..3
5697 FT /name="Dmel\ZAM\gag"
5698 FT /db_xref="FLYBASE:FBgn0024271"
5699 FT /db_xref="SPTREMBL:O46114"
5700 FT /db_xref="NCBI_PROTEIN:CAA04049.1"
5701 FT /translation="MSKKLTQTIKQTTRSVLESHTFPKRVTRSVSKTNTLPVIRESTPL
5702 FT PPLQPINMDSGNASVGNSAPVTPTVSGFSSIATALSATDILAFVKELPTFDGTPGQLDK
5703 FT YITSVEEIIMLIRGTDQTPYGLLTLRAIRNKIVGRADEALNLANTKLIWDDIKSNLLRL
5704 FT YSSKKSEATLLGELQSLPDNLTLGQLFFGLSRIRSQLISITSNSGQSATIIEAKKTLYD
5705 FT EVCLNAFISRIREPLKTVIRLKDPKTIETAYELCQGERARYQNRNPYPPTQNNTERRTN
5706 FT NYNNNNNNNHRDNNNRNNVTRLTPKTTQTITQTPIPNIVNQTTATELVTRLKIIKQIMG
5707 FT YTT"
5708 FT SO_feature CDS ; SO:0000316:<2795..6448
5709 FT SO_feature start_codon ; SO:0000318:1..3
5710 FT /name="Dmel\ZAM\pol"
5711 FT /db_xref="FLYBASE:FBgn0024270"
5712 FT /db_xref="SPTREMBL:O46115"
5713 FT /db_xref="NCBI_PROTEIN:CAA04050.1"
5714 FT /translation="NKLWATQHRRRKTHPTLPYQLKFSGTRLRNPTGYINPTTHATSLP
5715 FT YITLNLQQKFPLSFLIDTGSNNSFIDPESANQLECTILPTSTSITTALNSFKIEEKAIF
5716 FT PMPPEFKTEGQITLLKFKFHSYFNGLIGMDLLSHLEAKVDLVNLQLVTSKSTLPIFLYT
5717 FT NQASKIFNIPAYSKVILPLPVKTNHGEFYCCTTQLNNELSLSEGLYKSNNNIANVEISN
5718 FT QSDSDKLLYLEYPLETIPYNKNDHIELFNISATPLNNDTPQAPLHILTEHLNPEEKTAL
5719 FT TTLCKQFRDIFYNPETPLTFTNKITHSIPTIDNTPIHTKSYRYPFVHKTEVKKQIESML
5720 FT DQQIIRSSHSPWSAPVWVVPKKLDGTGNRKWRLVIDYRKLNDKTISDRYPIPNINDILD
5721 FT SIGKAKYFSTLDLTSGFHQIEMNPKDIAKTAFTVEGGHYEFTRMPFGLKNAPATFQRVM
5722 FT DSVLGDLNGTICLFYLDDIIIFSPSLQKHLLDIKMVFEKLRAANFKLQPSKSEFLRKEI
5723 FT EFLGHIVTQDGVKPNPNKISAIKKFPCPTNRRAIKSFLGLLGYYRKFIRDFARITKPMT
5724 FT KQLKGKRQVTTDKDFVDAFEQCKTLLSNDPILIHPDFEKPFILTTDASNFALGAVLSQG
5725 FT SLQNDRPVCFASRTLSDTEVNYSTIEKEMLAIIWAVKYFRPYIYGVKFTIVTDHKPLIW
5726 FT LMNFKEPNSKIIRWRLQLMEYNFEIIHKKGSQNVIADALSRADPNLNYNETLTVKPCPT
5727 FT SEKPINEFNTQLILEIDTNTSYQTTTPFKQKIRKKYSQPCFDFDNIVKILKGTLKPNRI
5728 FT CAFLADDNNSALIEKAFSTYFAHKKHFKIIRCKSLLHEIVGNPEQNKFIQEYHTNSNHR
5729 FT GIDETFLHLKRETYFPNMKNKISELIRNCETCLKLKYDRQPQNIVFETPETPSKPLDII
5730 FT HIDIYTINNNFNLTIIDKFSKFAAVYPIPNRNGINCIKAIKNFFSQFGLPKKLIHDQGV
5731 FT EFCNDIFRKFCSQYNILLHVTSFQQSSSNSPVERLHSSLTEIYRIILDTRKKHKLPTDH
5732 FT EEIMSETVITYNNAIHSTTKHTPFELFNGRTHLFEKTIIPNNEHDYLNKLNTFQDKLYS
5733 FT EIKEKLSTNTQQRIEKLNTSRVEPTTVQPNSTIFRKENRRNKLTPRFSLHRTAKDKGKT
5734 FT LVTTRNQKIHKSKIRKISKPPNDLSLSTCIPDLAMGHTNLSSSTTSIAPTS"
5735 XX
5736 CC Derived from AJ000387 (e1237231) ((Rel. 54, Last updated, Version 1).
5737 CC Takis Benos and Michael Ashburner, 19-Jan-1998.
5738 CC Any changes to original sequence record are annotated in an FT line.
5739 XX
5740 SQ Sequence 8435 BP; 3286 A; 2055 C; 1151 G; 1943 T; 0 other;
5741 AGTTACCGAC CCATCGGTAC CATACACCAC CCCTCCCTCT AAGCCACCAC GCCTACACAA 60
5742 GTAGAAGACA TCGAACCGGG AAGCTTTGCG ATACAAAGTT GCAGCATAAA CATCAACAAC 120
5743 GGGTCAGACG CCGACATCCG CCCAAAATGC TGACACCACA TCCTTTTCGC TCAGACAGAA 180
5744 CAACGCATAC AATTCCATAT ACATACGTAT AAACATACTC ATACTTTCTG CTGTGTCAGA 240
5745 TACTTTATTT CTAAGAACTT TAACATTGTA ATACATACAC ACATATTCAC TGTTAGCCCA 300
5746 TTTAAGACGA AGAATAAAGA CGACCACAGT CGAGTGCAAG CAGCAAACAC TTGTAGACGT 360
5747 ACATAATCTC CGATCAAAAT TCTCCCAAGA CGACCGTGGC TACGTTCTGG ACCCGCATAA 420
5748 CTCCTCTATC TTTCTGAGTG ATAATACCTC CGCAAGACTC CCCGGAGGTA ACTGGCGCAG 480
5749 CCGGAAAACT GGAATGGAAA ATACTTTATT AAACCTTCTA TTAGTTCTAT TGTAAGTAGT 540
5750 TGTGGAAAAA GAGTGAGAAT GAAGTGCAGA AATGTCTAAA AGTGATTACA ACAAAAATCC 600
5751 TAATACAATA CATAAACCGC CTTAACAAAC ATACAAAACA CGCATATAAA AAAAAAAAAA 660
5752 AAAAAAAAAA GAAAAAAAAA AACCCAAAAC TTAAAAATGC CGTAACCGCG AAACATGATA 720
5753 TGCGTTGTAC TTGTGTGAAA TCAATCGCTG ATAGTCACTG CCGAAGTTTA TTAAGGCCAA 780
5754 GTACCATATC ATTACTTTCA TGTTTACATA CATATATATG CCCCACAATT AAAACAACAT 840
5755 ACACACACAC AAATATTTCA AATGCAAAAA AAAAAAAAAG AATGTAGTGT ACCTGCGTGG 900
5756 CATCAATCGC TGATAAACCA CTGCCGAAAT ATTAAAGGCC CGGTACTACA TCACAAAACA 960
5757 CGTATATATG CAACAAAAAT ATACACAACA AAACCATATA TACAAACGTG TATGAGTGAC 1020
5758 GTGTAATGTA CTTGTGTGAA ATCAATCGCT GATAATCACT GCCGAAGCTT AGTAAGGCCA 1080
5759 AGTACCACAT CATTACTAAC ATGTGTACAT ATATATATAT GCAAAACAAT TAAAACAACA 1140
5760 TACACACACA CAAATATTTC AAATGCAAAA AAAAAAAAAA AAGAGGAAAT GTTGTGTACC 1200
5761 TGCGTGGCAT CAATCGCTGA TAAACCACTG CCGAAATATT AAAGGCCCGG TACTACATCA 1260
5762 CAAAACACGT ATATATGCAA CAAAAATATA CACAACAAAA CCATATATAC AAACGTGTAT 1320
5763 GAGTGACGTG TAATGTACTT GTGTGAAATC AATCGCTGAT AATCACTGCC GAAGCTTAGT 1380
5764 AAGGCCAAGT ACCACATCAT TACTAACATG TGTACATATA TATATGCAAA CCACCAAAAC 1440
5765 AAATACATAT ACACATACAA ACACTCCAAA AAAAAAAACA AATAATACTA TATGAACGGC 1500
5766 GAAGCGTATG TTTTCTAAGG CTGGATACAA AACCACAAAA CCAAATATAA ATTGCACACC 1560
5767 TTAATAAAGA AAAGAACAAA AATGATAATA AACAAAAGAA ATTTTTTTTG GAACATGCAC 1620
5768 CCATACTCTC ACTCTTTCAA CACAAATAAA GTATTCAAAT TATACATACA TACAATAATA 1680
5769 CCACTATATT ACAGAAATTA ACGCACAAGA AAACACACAC ACTATCCAAC AACAAACAAG 1740
5770 TAATTAAGAG TTATTAAGTA CATTGTAAAC TACATATTTT TATCTTAAAT GTCAAAGAAA 1800
5771 TTAACACAAA CTATTAAACA AACAACTCGC TCCGTGTTAG AATCACACAC ATTTCCCAAA 1860
5772 AGAGTTACAC GATCAGTTTC GAAAACAAAC ACCCTCCCCG TAATAAGAGA AAGCACCCCC 1920
5773 TTACCGCCCC TTCAACCTAT AAATATGGAT TCGGGCAACG CCTCCGTAGG TAATTCCGCC 1980
5774 CCCGTAACAC CTACTGTCAG TGGCTTTAGC AGTATTGCTA CGGCACTTAG TGCCACCGAT 2040
5775 ATTTTAGCCT TCGTTAAAGA ACTTCCGACC TTCGATGGTA CTCCAGGCCA ACTCGACAAA 2100
5776 TATATAACTA GCGTTGAGGA AATAATCATG CTCATTAGGG GTACCGACCA AACTCCGTAC 2160
5777 GGACTTCTGA CACTCAGGGC AATTAGGAAT AAAATAGTTG GAAGAGCAGA CGAAGCTCTA 2220
5778 AACCTAGCCA ACACCAAACT TATATGGGAC GATATCAAAA GTAACCTACT ACGTTTATAC 2280
5779 TCTAGCAAGA AAAGCGAAGC TACCCTCTTA GGCGAGCTCC AATCTCTCCC AGATAACCTA 2340
5780 ACCCTAGGGC AATTGTTCTT CGGCTTATCG AGGATTAGGA GCCAACTTAT ATCCATTACT 2400
5781 TCCAATAGTG GACAGTCGGC CACAATCATC GAAGCCAAGA AAACACTATA TGACGAAGTC 2460
5782 TGTTTAAACG CCTTCATCTC AAGAATTAGA GAACCACTTA AAACAGTCAT CAGATTGAAA 2520
5783 GACCCCAAGA CTATCGAAAC AGCTTACGAG CTATGTCAAG GAGAAAGGGC TCGTTACCAG 2580
5784 AACAGAAACC CATATCCCCC AACACAAAAC AACACCGAAC GACGAACTAA CAACTACAAT 2640
5785 AACAATAACA ACAACAATCA CAGAGACAAC AACAACCGCA ACAACGTAAC TCGTCTTACA 2700
5786 CCCAAAACCA CTCAAACCAT TACTCAAACC CCAATTCCCA ATATCGTCAA TCAAACAACG 2760
5787 GCAACAGAAC TAGTAACCCG TTTAAAGATA ATAAAACAAA TTATGGGCTA CACAACATAG 2820
5788 AAGAAGAAAA ACTCACCCAA CACTGCCTTA CCAACTTAAA TTTTCAGGCA CCCGCCTCAG 2880
5789 GAACCCAACA GGATACATAA ATCCTACCAC ACATGCAACA TCCCTTCCAT ACATAACTCT 2940
5790 AAACCTCCAA CAAAAATTCC CTTTATCATT TCTTATCGAT ACAGGATCCA ATAACTCCTT 3000
5791 CATTGACCCA GAATCTGCAA ACCAACTAGA GTGCACAATT CTACCAACAT CCACTTCAAT 3060
5792 TACAACAGCA TTAAATAGTT TCAAAATTGA AGAAAAGGCA ATATTCCCAA TGCCACCCGA 3120
5793 GTTCAAAACC GAAGGTCAAA TTACCCTACT TAAATTCAAA TTTCACTCTT ATTTCAATGG 3180
5794 CCTCATAGGA ATGGACCTAT TATCACACCT AGAAGCAAAA GTAGACCTAG TAAACTTACA 3240
5795 ACTAGTAACT TCAAAGTCTA CACTCCCAAT ATTCTTATAC ACTAACCAGG CTTCAAAAAT 3300
5796 TTTTAACATC CCCGCCTACA GTAAAGTTAT CTTACCACTA CCAGTAAAGA CTAATCATGG 3360
5797 GGAATTCTAT TGTTGTACTA CACAACTAAA TAATGAGTTA TCGTTGTCAG AAGGACTATA 3420
5798 TAAATCAAAC AATAATATTG CCAATGTCGA AATCTCTAAC CAATCCGACT CAGATAAACT 3480
5799 ATTATACCTA GAATACCCCC TAGAAACCAT TCCATACAAT AAAAACGACC ATATAGAGCT 3540
5800 CTTTAATATA TCAGCTACAC CTCTTAATAA CGATACCCCT CAAGCCCCAT TACATATCCT 3600
5801 CACAGAACAC CTCAATCCAG AGGAAAAAAC AGCCTTAACA ACCCTATGTA AACAATTTCG 3660
5802 CGACATATTC TACAACCCAG AAACACCATT AACTTTTACC AACAAAATCA CACACTCCAT 3720
5803 CCCAACCATA GATAACACTC CTATCCACAC AAAATCCTAC AGATACCCTT TTGTCCATAA 3780
5804 AACAGAAGTC AAAAAACAAA TCGAATCCAT GTTAGACCAA CAAATTATTA GATCTAGCCA 3840
5805 CTCCCCTTGG AGCGCCCCGG TGTGGGTGGT CCCAAAAAAA CTAGACGGGA CAGGGAACAG 3900
5806 GAAATGGCGA CTTGTAATAG ACTACCGGAA ACTCAACGAC AAAACCATTT CGGACAGATA 3960
5807 CCCCATCCCA AACATAAATG ACATATTAGA TAGCATAGGC AAAGCAAAAT ATTTCTCAAC 4020
5808 GCTCGACCTA ACTAGCGGTT TTCATCAAAT CGAGATGAAT CCAAAAGATA TCGCCAAAAC 4080
5809 AGCCTTTACA GTCGAAGGGG GTCACTACGA ATTCACACGG ATGCCCTTCG GCTTAAAAAA 4140
5810 CGCACCGGCT ACCTTTCAAC GGGTTATGGA CAGCGTTCTT GGCGATCTCA ACGGCACCAT 4200
5811 TTGCCTATTC TATCTTGACG ATATTATAAT TTTCTCGCCT TCCCTACAAA AACACCTGTT 4260
5812 GGACATAAAA ATGGTATTCG AAAAACTCAG AGCGGCAAAC TTTAAACTAC AACCTTCAAA 4320
5813 ATCAGAATTC CTAAGGAAAG AGATAGAATT TCTAGGCCAC ATAGTCACAC AAGACGGAGT 4380
5814 TAAACCAAAC CCGAACAAAA TAAGTGCGAT CAAAAAATTT CCTTGCCCCA CCAACAGAAG 4440
5815 AGCTATCAAA TCTTTTCTCG GGTTACTGGG TTATTATAGG AAGTTTATAA GAGACTTTGC 4500
5816 ACGAATAACG AAGCCCATGA CTAAACAATT GAAAGGGAAA AGACAAGTTA CTACAGACAA 4560
5817 AGACTTTGTA GACGCATTCG AACAGTGCAA AACTCTTCTG TCCAATGACC CAATACTCAT 4620
5818 ACACCCAGAC TTCGAAAAAC CATTCATTCT TACTACGGAT GCTAGTAACT TCGCGTTAGG 4680
5819 AGCCGTACTA TCTCAAGGCT CCTTACAAAA CGATAGACCT GTATGTTTTG CCAGCAGGAC 4740
5820 CCTCTCCGAC ACCGAAGTCA ACTATTCAAC CATAGAAAAA GAAATGTTGG CAATAATATG 4800
5821 GGCAGTAAAA TACTTCAGAC CATATATTTA TGGCGTAAAA TTTACTATTG TTACAGATCA 4860
5822 CAAGCCACTA ATATGGCTTA TGAATTTCAA AGAACCCAAC TCAAAAATAA TTCGTTGGAG 4920
5823 ACTCCAACTC ATGGAATACA ATTTTGAAAT AATTCACAAG AAAGGTTCAC AAAATGTAAT 4980
5824 TGCAGACGCC TTAAGTAGAG CGGACCCAAA TTTAAACTAC AACGAAACAC TGACTGTTAA 5040
5825 GCCTTGCCCC ACATCCGAAA AACCTATTAA CGAATTTAAC ACGCAACTCA TACTAGAAAT 5100
5826 AGATACAAAT ACGTCTTACC AAACTACAAC ACCATTTAAA CAAAAGATTA GGAAAAAATA 5160
5827 TTCACAGCCT TGCTTCGATT TCGATAATAT TGTTAAAATC TTGAAAGGAA CCCTAAAACC 5220
5828 TAACAGGATT TGCGCATTCT TGGCGGACGA TAATAATTCC GCATTAATCG AAAAAGCATT 5280
5829 CTCAACGTAT TTTGCACATA AAAAACACTT TAAAATTATC AGATGCAAAT CACTTCTCCA 5340
5830 CGAAATCGTA GGAAACCCCG AACAAAACAA ATTCATTCAG GAATATCACA CTAACAGCAA 5400
5831 CCACAGAGGC ATAGACGAAA CATTCCTTCA CCTCAAACGA GAAACCTACT TCCCCAATAT 5460
5832 GAAAAACAAA ATCTCTGAAT TAATTAGGAA TTGCGAAACC TGTCTAAAAC TCAAATACGA 5520
5833 CAGGCAACCA CAAAATATAG TATTTGAAAC CCCAGAAACC CCATCGAAAC CCCTCGACAT 5580
5834 AATACACATA GACATCTATA CTATTAACAA TAATTTTAAC CTGACAATCA TAGACAAATT 5640
5835 CTCAAAATTC GCAGCTGTCT ACCCCATCCC AAATAGAAAC GGCATCAATT GCATCAAAGC 5700
5836 AATCAAAAAT TTTTTCAGTC AATTCGGACT ACCCAAAAAA CTAATACACG ACCAAGGAGT 5760
5837 AGAATTTTGC AACGACATAT TTCGAAAGTT TTGCTCTCAA TATAATATAC TTCTCCATGT 5820
5838 CACATCCTTC CAGCAATCTT CAAGTAATTC TCCAGTAGAA CGTTTACACT CCTCTTTGAC 5880
5839 AGAGATTTAC AGAATAATAC TAGACACACG GAAAAAACAC AAATTACCTA CAGACCACGA 5940
5840 AGAAATAATG TCAGAAACTG TAATAACATA TAACAACGCA ATCCACTCCA CCACCAAACA 6000
5841 CACCCCTTTT GAACTTTTTA ATGGTAGGAC CCATTTATTC GAGAAAACAA TAATACCCAA 6060
5842 TAATGAGCAT GACTATTTAA ATAAACTAAA TACGTTCCAA GACAAACTAT ACTCCGAAAT 6120
5843 AAAAGAAAAA TTGTCCACAA ACACCCAACA AAGGATAGAA AAGCTAAACA CAAGCAGAGT 6180
5844 AGAACCAACA ACAGTACAAC CTAACAGCAC AATTTTCAGA AAAGAAAACA GGAGAAATAA 6240
5845 ATTAACACCA CGGTTTTCCT TACACAGAAC AGCAAAAGAC AAAGGAAAAA CTCTAGTAAC 6300
5846 CACAAGAAAT CAAAAAATCC ACAAATCAAA AATTAGGAAA ATATCCAAAC CTCCAAATGA 6360
5847 CTTAAGCCTT TCCACCTGCA TTCCAGATCT TGCCATGGGG CATACCAATC TATCTTCATC 6420
5848 CACAACTTCA ATAGCACCAA CCTCCTAGCA AAAGTGCCGG TAGGGAAAAC ACTCGTGATA 6480
5849 GGAAACTATA AAAAAATTAG CCACATAATC GATCTGTCCG AATACACCAA CTGTATTGAA 6540
5850 AAATTATACC ACACCATCGA TACCCTAAGA CAAGATGAAA CACTCACCGA TTCTATATCA 6600
5851 ATACTAAATG CTAAACTGGC CCAAACTCAA AGTAAAATAG ACGCACTAAC ACCCTTTTCA 6660
5852 CGCCACAAAA GAGGTCTTAT TAACGGGTTA GGTAGTTTAG TCAAAGTCGT CACCGGCAAC 6720
5853 ATGGACGCCA ATGATGCAAA GAATATAGAA ACAGAAATTA ACCACTTAAA AAGCCAGTCC 6780
5854 ACCACTATCT CAGATAACTT CGAAATACAG AACTCGTTCA ATGATGAAGT TCAACTACGG 6840
5855 TTCAAAAACT TAACAAGACA CATTAACAAT GAACAGAATT TGATTAAAAA CTTCTTCGAA 6900
5856 AACACTCAAA ATACAATTTA CACAAAAATA TACAACAACG AAGAAGAAAT AAAGAAACTA 6960
5857 CAATATATAA ATAGGCTTAA CTACAATATA GATTTATTAG TTAGCCACCT AAGCGACATT 7020
5858 ATAGAAAGTA CACTGCTTGC CAAAATTAAT GTTATCCCAA AACTCATCTT AGACAAGACA 7080
5859 GAAATAACCA AAATCAAACA AATTTTTAAA ACACAAAACT ACACAATAAA ATCCGAGCAA 7140
5860 CACATTTATA ACCTCTTAAA AATGAACGCA CTCAATTACC AAAACAAAAT AATTTTTAGT 7200
5861 ATCAAAATTC CTATTTTTTT AAGTTGTAAC TACGAAATGG CAAGATTAAT TCCACTTCCA 7260
5862 ATAAATTCCA CACAATTTGT AATAGCACCT AAGTACTTAA TATATAATAA CAAAAGTAAC 7320
5863 AGCATGTTTT CAACTATGTA TAAATGTCCT GTAATAGAAG AACAATTCGT CTGCGAAATC 7380
5864 GACTCCATCA ATAATCTTAA AAATAATACT TGCCTGGGAC ACCTTATCCA AAATAAGACC 7440
5865 AGCTACTGCG ACATAAAGGA AACGGGACTC ACGACTGATG TGTTCGAACC GGAAAAAGGC 7500
5866 TTCATACTTG TATTTAACGG GAACAACCTC CCAATCATCT CCTCCAACCA GACCATAACT 7560
5867 AGTATCAATG GATCAGCTAT AATAAAGTAT AACAATTGCA CATTAAAAAT CAATGAAATA 7620
5868 AACTACGACA ACAGGGCGGT ATCAACAGAA GAGCACCCCG ACTTCTTCCT ACCACCAATG 7680
5869 CGGAAACTAA TAAAAAATGC CACTATCAAC ATACTCACCT TGGAAAGACT TCACCTGGAT 7740
5870 ACACTCACAA CATCCAATAA GCTACTGGTC GTCGCCGCAG GAAACTCTCG ACACTCGACA 7800
5871 ACCTTGTATA TCCTCTTCAC CGTATCCCTA GTCGCCGTAA TACTCACCTG GACACTTCGA 7860
5872 AGGGACACCC ACATCTTCCA TACCGGGCCC GACCACATTC TTCCAATCGT CGCTCCACCA 7920
5873 ATTCCTCCGT CTATGGCCTT CGCTCCAAAC TGGGGGGGGA GGAGTTACCG ACCCATCGGT 7980
5874 ACCATACACC ACCCCTCCCT CTAAGCCACC ACGCCTACAC AAGTAGAAGA CATCGAACCG 8040
5875 GGAAGCTTTG CGATACAAAG TTGCAGCATA AACATCAACA ACGGGTCAGA CGCCGACATC 8100
5876 CGCCCAAAAT GCTGACACCA CATCCTTTTC GCTCAGACAG AACAACGCAT ACAATTCCAT 8160
5877 ATACATACGT ATAAACATAC TCATACTTTC TGCTGTGTCA GATACTTTAT TTCTAAGAAC 8220
5878 TTTAACATTG TAATACATAC ACACATATTC ACTGTTAGCC TATTTAAGAC GAAGAATAAA 8280
5879 GACGACCACA GTCGAGTGCA AGCAGCAAAC ACTTGTAGAC GTACATAATC TCCGATCAAA 8340
5880 ATTCTCCCAA GACGACCGTG GCTACGTTCT GGACCCGCAT AACTCCTCTA TCTTTCTGAG 8400
5881 TGATAATACC TCCGCAAGAC TCCCCGGAGG TAACT 8435
5882 //
5883 ID DME010298 standard; DNA; INV; 8507 BP.
5884 XX
5885 AC AJ010298;
5886 XX
5887 DR FLYBASE; FBte0000359; Dmel\GATE.
5888 XX
5889 SY synonym: Batumi
5890 XX
5891 FT source AJ010298:1..8507
5892 FT SO_feature five_prime_LTR ; SO:0000425:1..272
5893 FT SO_feature three_prime_LTR ; SO:0000426:8236..8507
5894 FT SO_feature polyA_signal_sequence ; SO:0000551:158..163
5895 FT SO_feature polyA_signal_sequence ; SO:0000551:8383..8398
5896 FT SO_feature primer_binding_site ; SO:0005850:276..293
5897 FT SO_feature RR_tract ; SO:0000435:8236..8507
5898 FT SO_feature CDS ; SO:0000316:1741..6456
5899 FT /name="Dmel\GATE\polyprotein"
5900 FT /db_xref="FLYBASE:FBgn0044067"
5901 FT /db_xref="SPTREMBL:O76925"
5902 FT /db_xref="NCBI_PROTEIN:CAA09069.1"
5903 FT /translation="MPIGDDKKKLSADKPRSIFSPQGPKSPRIPSISVKTPAQISDDCA
5904 FT TPSKATVQRTAKNMAASDLALAKFISVSDAQANLRLRSTLRNPQLQPSRCLASVATKSE
5905 FT AYGTRLKRIRPLLRVPCVSRRAAASGMPILRASYSYCYSVYERCVAQLVDKIEQGHFSV
5906 FT HPKRTLRPRPTFPLAVGCLHAIQEFSQVTIFAGRFPDLLHAIYINNPRLTPFEKLFHLN
5907 FT AKTSGDAHAIVSISPLTKRGFSSAWENLIERFENKRLLVNSQLKILFNVQSIPQESGAA
5908 FT LKVMQSTVQGCLTALELSGINTENWDCLLEYLCSSKLPKITLSLWEQSLHKKADIPTWG
5909 FT ELNTFLTERHRTLEAIDDVRPSVPSQSHSKAMNSSGPSRDGKLASDLCNKENHPVRVCR
5910 FT VFSKWSVDDRSAYIKRKQLCLNYFAKGHQLRECKDRQSFTWWPASHVVAPKQPLFQQFK
5911 FT PFKSCKPNFRYSGQFRSKRASRCSKLFCHGSRAILLGSAIINSSHLGTNFKARALIDSG
5912 FT SEATFITEPLFNLIRLPFQVVQAQVSGLNQTVAAQFKNAAVSPSDLRLGRVAVGDDGLC
5913 FT PPSTSRKSAFLPNSAKFLRDLPDFPLADPKFYESAPIDVLIRSPHPASVLLSGAKTNIC
5914 FT GSLLGQETIFRWVLTGPVSASAQSRIPLFRHRSPTRTIIHWTNSSQNLGRWRIYQQSCK
5915 FT RIRFHVRERVGKCLRRHQCGKYVVTLPFRDPEHIGCGLGHSRSWALAQFLKNEQRLKKD
5916 FT EALKARYDSVIQEYLDLKHMRQVLPTHDCNAYYMPHHAVLKPESVTTKLRVVFNASSPS
5917 FT SNGTSLNDILHAGPVLQSDLTVQILKWRDFRYVFSADIQKMYRQIWVDPKHTPFQRILF
5918 FT RNNRGEIRDFELKTVTFGVNCAPLLAIRVLQQLAADEELSHPKASNVIRNFMYVDDVLA
5919 FT GADSTEEAQLMVHELRDALNSSSSRQRWLSKRPLQRQVLSQIAKLFDPAGWLAPFIVRA
5920 FT KIFMQEIWLQELGWDENVPNDLFQRWLNFLQSYSVFEQIRIPRWLSFHPDFKVEHHGFC
5921 FT DASQKAYGAAIYVRGEVGSAIMVQLLTAKTRVAPVKTVSLPRLELCGALLLSEMAAAII
5922 FT PQMPTINSKLYCWTDSTIVLAWLSKPACQWTTFVANRETKIAQATKTENWSHVQSEHNP
5923 FT ADLASRGVSLQDLADSQLWWHGPTWLQNPRNQWPTQVNAPVTDLEKRALKVHLAKAPSE
5924 FT ELLARFSKLEKALRVLAYVYRFIQRCRKQTSPSDVHLLATEIAAAERFLISNTQRREFP
5925 FT VEYHCLSEKRPVPSSSAILSMNPFLDPQGLIRACGRVAASESPQYNERHPVILPYNCLL
5926 FT SRLLAKFTHRTTLHGGNQLMVRLIRSKYWIPRIKNLMKAVVNSCKVCVIHKRRLQSQLM
5927 FT GVLPKERASFSRPFTVSAWITPVRDIKNYTGRACVITKGYVLVFVCFSTKAIHLEPTSD
5928 FT LTTEKFLAAFSRFVSRRGCPRQVQSDNGKTFVGAATLLSRDFLQAVKESVTNAYIHQEM
5929 FT QWQLFSGGTQYGRPLGSRRKKLQDAILQMHGHTKIHVRRTLHALGKNRSVP"
5930 XX
5931 CC Derived from AJ010298 (e1315889) (Rel. 56, Last updated, Version 1).
5932 CC Takis Benos and Michael Ashburner, 08-Sept-1998.
5933 CC Any changes to original sequence record are annotated in an FT line.
5934 XX
5935 SQ Sequence 8507 BP; 2245 A; 2251 C; 1836 G; 2175 T; 0 other;
5936 TGTTCAAGTT ACGCTCACCC GCTGTCACCC GCTGTCACCC GCTCTCCGCT CCCTCTTACG 60
5937 CTCTCCCGCT CTTCACCTCA GAGTCTCCAA GGAGTCCTCG GGCTTGGGAT AGCCTAACTA 120
5938 ATTAGAATAA GCATCAGTGT AAAAACTAAC CACGCTGAAT AAACATACGC CCGGTCGCCG 180
5939 CGCAATTACG AAAAGTCTAG TGTTTGCTTT CCTTCGAGTG TTTCTTTTCA GCATATTTGA 240
5940 ATTCAGGACA GCCATCCCCC TACATCCCAA CATTTTGGTC CTTCGAGCCG GATCACCTGG 300
5941 ATTTTCAAGT TTGTCCACCA GCGAACAAAT TATAAGATAA GTACGAAATT TCCATTCCTT 360
5942 TTAATTGCCG GTCTGCAGCA AAAGGTTCGA AAATCCAATT TCGTTCAATT TGCTGTAAGA 420
5943 TTTATTGTCA AATCTAACGG ATTTCTCCGA CAAAAGGCAA TTAAAGAAAA GTACTTATCC 480
5944 AATCTCACGG GCGCCGCATA TTACTCGCCG TTCTCCGTTC TCCTTTCACC CTCATTCGTG 540
5945 AAAATTTCTA AAGTCCAAAT GGGCGAATAT ATTTAAATAT TAATCCAGTG CGATAATGCA 600
5946 AAATTCCAAA TGTGAAAAAG TGAATAATTT GTGCCAAGTT CAGTGAAACT TTCTAAGTCC 660
5947 AAAGCTCTGC CAAAATTGGC AAAAATTCTG TTCTCGTTTC ACTGTGTCAA AGCGAAGCCA 720
5948 AACTTCTTTT CGCAACACAT TTTTGCTTTA ACTCCGCAGT CCACTTAATA CCATTTGCTT 780
5949 TGCTATCGAA GAATACCACA ACGAAACAAA CAACACCATA CCCTCTGGCC ATTCAAATAA 840
5950 CATATTAATT AACATTTCCG CAGTTCCATA TCTCTTACAT CAACATATAC CTACTCCATA 900
5951 CTCTTGCATA TATTCACATC TTACACAATA TATCCTCACC ATATATTACA TATATTACAT 960
5952 CAACATATAA TATCCACATA TATTACCGAC ATACATTGCG CATATTATCA GCATTCCTTT 1020
5953 AACGTATACC AAAGTTTAAA TTCGATCCCG TCGGCAAATC CAACCACAAA TAAAATTTAT 1080
5954 TCCAAGTGCC GACGCGGAAA GGCGTTTTCT TTTCCATCAA TTTTTTCCGT AAATTTCCAA 1140
5955 ATTAATTTCC GAGCAATAAA TTAAAAGCGG TTTTTTCTTT TTTTTTAACA AATAACTTAT 1200
5956 TGTTGAAAAC ATTTATTAAA TTATTAAAAA TTATATAAAT AATACGACCG CCAAATACAA 1260
5957 GTCGTTCACC CGACAAATAT TTTTTCCTGT ATTGCTTGGA TATTAATTTG TGTTTGTTTT 1320
5958 AGAAGTACTT ACAACGCGGA GAAAAGACTC CAAATCCACC ATTCCATTTT CTCCGTTTCC 1380
5959 AGTTATAAAC AAAAAAATAA ATAAAATTTT CTTCCTTCTA ATAAACATTT TATTTTACCG 1440
5960 TGTTCACATT CCAAGTGTTC CAACCGTAAA TAAGGTGGAC CTAATTACCA TAAATCACAG 1500
5961 GTCATTTATA CAATTCGCTG TTCACTCCGA GTCACCTGTC CAATTAGTCT AAACTACGGC 1560
5962 GTTTCCACTT CGCAAATTCA ACACCACTTT CTCACCCATT ACATCCTATA CGGTCCTTTT 1620
5963 CCGCTGCTTT ATACCGTTCA CGGCAGGAAG CTTAAATTTA TTAAGTGGAA TCTGTCTACT 1680
5964 TTTTCAAAAG TGTGACCGGG CTCCAAAAAC GCTTCCCTTC CATTTCGTAT TTCTTCGATT 1740
5965 ATGCCCATCG GGGACGATAA GAAGAAATTG TCCGCTGACA AACCCAGGTC TATTTTTTCA 1800
5966 CCACAAGGGC CCAAGAGTCC AAGAATCCCA AGCATTTCGG TGAAAACGCC TGCGCAGATT 1860
5967 TCCGACGACT GTGCCACTCC ATCCAAAGCC ACAGTACAGC GCACAGCTAA AAATATGGCT 1920
5968 GCTTCCGATC TAGCGCTAGC CAAATTCATT TCGGTTTCTG ACGCTCAAGC GAATTTGAGG 1980
5969 CTCAGATCAA CACTCCGGAA TCCGCAGCTC CAACCGTCAC GATGCTTAGC GTCCGTCGCG 2040
5970 ACCAAGTCCG AAGCCTATGG GACAAGGTTG AAAAGAATTC GACCTCTGCT CAGAGTGCCT 2100
5971 TGTGTCAGCA GGCGAGCGGC AGCAAGCGGC ATGCCTATTC TCAGGGCTAG TTACAGTTAT 2160
5972 TGCTATTCAG TCTATGAAAG GTGTGTTGCC CAGCTCGTTG ATAAAATCGA GCAGGGGCAC 2220
5973 TTCTCAGTCC ATCCCAAGCG AACGCTGCGG CCCAGGCCTA CATTTCCTCT GGCTGTCGGT 2280
5974 TGCCTCCATG CGATACAGGA GTTTTCGCAG GTGACTATCT TCGCTGGCCG CTTTCCGGAT 2340
5975 CTTTTACACG CCATTTATAT TAATAATCCA CGGCTGACTC CGTTCGAAAA GTTATTCCAC 2400
5976 TTAAATGCCA AAACAAGTGG CGACGCGCAT GCCATAGTTT CGATTTCGCC TCTCACCAAA 2460
5977 CGAGGGTTTT CCTCTGCGTG GGAAAACCTA ATAGAGCGTT TCGAAAATAA ACGATTGTTG 2520
5978 GTAAACAGTC AATTGAAAAT ACTGTTTAAT GTGCAGTCGA TACCACAGGA ATCTGGGGCG 2580
5979 GCCTTGAAGG TAATGCAAAG TACTGTTCAA GGTTGCTTGA CTGCCTTAGA ACTGTCAGGC 2640
5980 ATCAACACTG AGAACTGGGA CTGCCTGCTG GAATATCTGT GTTCATCCAA GCTCCCGAAG 2700
5981 ATAACTCTCT CCTTATGGGA GCAGTCTCTA CATAAGAAAG CCGACATCCC GACATGGGGA 2760
5982 GAACTGAACA CCTTCCTCAC AGAACGTCAT CGAACCCTAG AGGCCATCGA TGATGTGAGA 2820
5983 CCGTCCGTAC CAAGTCAGTC GCACTCCAAA GCGATGAACT CAAGTGGGCC CTCTAGAGAT 2880
5984 GGCAAGCTGG CGTCCGACTT GTGCAACAAG GAAAACCATC CTGTCCGTGT ATGTCGCGTT 2940
5985 TTCTCCAAAT GGTCGGTTGA CGACCGGTCA GCCTACATTA AACGGAAGCA GTTATGCTTA 3000
5986 AACTACTTTG CAAAGGGACA TCAGCTTCGT GAGTGCAAAG ATCGACAAAG TTTTACTTGG 3060
5987 TGGCCGGCAT CACACGTTGT TGCACCGAAA CAACCTCTTT TCCAGCAATT CAAGCCCTTC 3120
5988 AAATCCTGCA AGCCCAATTT CCGCTACTCA GGCCAATTTC GTTCCAAACG AGCAAGCCGG 3180
5989 TGTTCAAAAT TATTTTGCCA CGGCTCAAGA GCTATCCTTC TTGGCAGTGC CATAATCAAT 3240
5990 AGTTCCCATC TTGGCACTAA CTTTAAGGCA CGCGCCCTGA TCGACTCCGG ATCAGAGGCG 3300
5991 ACATTCATAA CCGAGCCACT GTTCAATCTA ATTAGATTGC CATTCCAGGT GGTTCAAGCC 3360
5992 CAAGTCTCGG GCTTAAACCA AACAGTAGCT GCTCAGTTCA AGAACGCTGC AGTTTCACCA 3420
5993 TCCGATCTCC GACTAGGCCG CGTTGCAGTT GGAGACGACG GCCTATGTCC TCCCTCAACT 3480
5994 AGCCGGAAAT CTGCCTTCCT ACCCAATTCC GCAAAATTTC TTCGGGATCT TCCCGATTTT 3540
5995 CCACTGGCGG ATCCAAAATT CTATGAGAGC GCCCCAATAG ATGTACTTAT CCGGAGCCCA 3600
5996 CATCCTGCTT CGGTGCTTCT GAGTGGAGCA AAAACCAACA TCTGTGGCTC TCTCTTGGGG 3660
5997 CAAGAGACCA TTTTCCGCTG GGTACTAACT GGGCCAGTGT CAGCCTCAGC CCAAAGCAGG 3720
5998 ATTCCTCTTT TTCGACACAG ATCTCCCACG CGTACGATAA TTCACTGGAC AAACTCCTCA 3780
5999 CAAAATTTGG GGAGGTGGAG GATATACCAA CAAAGTTGCA AAAGAATCCG ATTCCATGTG 3840
6000 CGAGAACGGG TTGGTAAATG CTTACGACGA CACCAGTGCG GCAAATATGT CGTTACTCTG 3900
6001 CCTTTTCGCG ACCCAGAACA TATCGGTTGC GGGCTAGGGC ATTCTAGGTC TTGGGCGTTG 3960
6002 GCTCAGTTCT TGAAGAATGA GCAGCGTCTA AAAAAAGATG AGGCCTTGAA AGCGAGATAC 4020
6003 GATTCGGTGA TCCAGGAATA TCTCGACTTA AAGCACATGC GACAAGTTCT GCCTACCCAT 4080
6004 GATTGCAACG CCTATTATAT GCCACATCAC GCCGTCTTAA AACCGGAGAG TGTAACTACT 4140
6005 AAACTCCGTG TAGTATTCAA TGCCTCCAGC CCTTCATCGA ATGGTACCAG TTTAAATGAT 4200
6006 ATCCTTCATG CTGGCCCTGT CTTGCAGTCC GACTTGACAG TGCAAATTCT GAAGTGGCGC 4260
6007 GATTTCCGAT ACGTGTTCAG TGCCGATATT CAAAAAATGT ATCGGCAGAT CTGGGTAGAT 4320
6008 CCGAAACACA CTCCATTCCA GCGAATACTT TTCCGTAACA ATAGAGGGGA AATCAGAGAT 4380
6009 TTCGAATTGA AAACAGTAAC CTTTGGAGTC AATTGCGCGC CCTTGCTGGC GATCCGAGTA 4440
6010 CTGCAGCAGC TAGCAGCTGA CGAAGAACTC AGCCATCCAA AAGCTAGCAA TGTCATTCGA 4500
6011 AATTTCATGT ATGTGGATGA TGTTTTAGCC GGAGCGGACT CTACGGAAGA AGCTCAGCTC 4560
6012 ATGGTGCACG AGCTCCGAGA CGCTCTGAAT TCTTCTTCGT CCCGCCAGAG ATGGCTATCG 4620
6013 AAACGTCCTT TACAACGCCA AGTCCTGTCC CAAATTGCCA AATTGTTCGA CCCTGCAGGC 4680
6014 TGGTTAGCAC CGTTTATCGT TCGAGCTAAA ATTTTCATGC AGGAGATTTG GCTACAGGAG 4740
6015 CTTGGGTGGG ACGAAAACGT TCCAAATGAC CTTTTTCAGC GATGGCTTAA TTTTCTCCAA 4800
6016 AGTTATTCGG TTTTCGAGCA GATACGCATT CCACGCTGGC TATCGTTTCA TCCAGATTTC 4860
6017 AAGGTCGAGC ATCATGGCTT TTGCGATGCA TCGCAAAAGG CTTATGGCGC CGCAATATAT 4920
6018 GTCCGCGGAG AAGTGGGCAG CGCCATTATG GTGCAACTCC TAACCGCCAA AACCCGGGTA 4980
6019 GCACCAGTCA AAACGGTTTC GCTCCCAAGA CTCGAGCTCT GCGGAGCGTT ATTGCTTTCC 5040
6020 GAAATGGCTG CAGCCATCAT TCCGCAGATG CCTACGATTA ACTCCAAACT TTACTGTTGG 5100
6021 ACGGACTCCA CCATAGTGCT TGCATGGTTA AGCAAGCCAG CATGCCAGTG GACCACATTT 5160
6022 GTAGCCAATA GGGAGACGAA GATCGCCCAG GCCACAAAAA CAGAGAATTG GTCTCATGTT 5220
6023 CAATCTGAGC ATAATCCAGC AGACCTGGCA AGTAGAGGAG TTTCCCTCCA AGATCTAGCC 5280
6024 GATAGCCAGT TATGGTGGCA CGGACCGACT TGGTTGCAAA ATCCACGCAA CCAATGGCCT 5340
6025 ACTCAGGTCA ACGCTCCGGT GACCGACCTG GAGAAGCGTG CTCTAAAAGT CCATCTCGCG 5400
6026 AAAGCTCCTT CTGAAGAGTT GTTGGCACGT TTCTCCAAGC TAGAGAAAGC TCTACGAGTC 5460
6027 CTTGCCTATG TTTATCGCTT CATTCAGCGG TGCAGGAAGC AGACATCTCC ATCTGATGTT 5520
6028 CATCTACTGG CCACTGAAAT CGCCGCCGCC GAGCGGTTCC TAATTTCGAA CACTCAACGC 5580
6029 AGAGAATTCC CTGTGGAATA TCACTGCCTA AGTGAAAAGC GTCCAGTGCC AAGTTCAAGT 5640
6030 GCCATCCTAA GCATGAACCC GTTTCTAGAT CCGCAAGGAC TGATCAGGGC ATGCGGCCGT 5700
6031 GTGGCGGCTT CCGAAAGCCC TCAATACAAT GAACGCCATC CAGTGATTCT TCCGTATAAC 5760
6032 TGCCTGCTTT CTCGCCTCCT TGCGAAGTTC ACGCATCGCA CAACTCTCCA TGGTGGTAAC 5820
6033 CAGTTAATGG TGCGCCTCAT CCGGTCGAAA TACTGGATTC CGAGAATCAA GAACCTGATG 5880
6034 AAAGCAGTGG TAAATTCGTG CAAAGTATGT GTGATCCACA AAAGGCGGTT GCAAAGCCAA 5940
6035 CTGATGGGTG TCCTGCCCAA AGAAAGAGCA TCGTTCTCCC GACCATTCAC GGTATCGGCA 6000
6036 TGGATTACGC CGGTCCGCGA TATAAAGAAC TATACGGGAA GAGCATGTGT TATTACAAAG 6060
6037 GGGTATGTGT TAGTTTTTGT TTGTTTCTCC ACCAAGGCCA TCCACTTAGA GCCTACATCT 6120
6038 GACTTAACGA CCGAGAAGTT TCTTGCCGCT TTCTCTCGTT TTGTATCCAG GAGAGGGTGT 6180
6039 CCACGTCAAG TCCAGTCAGA CAATGGCAAA ACCTTTGTTG GCGCTGCCAC CCTGCTTTCC 6240
6040 CGCGATTTCC TTCAAGCCGT AAAAGAGTCG GTGACGAATG CCTATATTCA TCAAGAGATG 6300
6041 CAATGGCAAT TATTCTCCGG GGGCACCCAA TATGGGAGGC CTTTGGGAAG CAGGCGTAAA 6360
6042 AAGCTTCAAG ACGCTATTTT ACAAATGCAC GGCCACACGA AAATACACGT TCGAAGAACT 6420
6043 CTCCACGCTC TTGGCAAAAA TAGAAGCGTG CCTTAACTCC AGGCCGCTCT CTCCTATGTC 6480
6044 TGAAGATCCG ACAGACTTGC TGGCTCTGAC GCCAGGGCAT TTCCTTGTCG GGGGACCCCT 6540
6045 TATGTCCACG GTGGAACCCG AAGTAAAGGG GGAAACGAAA TCCCTTCTTA ATCGGTGGCA 6600
6046 GCATTTGAAG GCTCTCCATC AGCAGTTCCG TGTGCGATGG AAAGAAGAGT ACCTCAAAGA 6660
6047 ACTCCACAAG CGTTCTAAAT GGCAGGTCCC GTGAACTTCG AGCTAAAATA CTCGTGCATG 6720
6048 TGGAGCAGCG TGTGGTGGGA TCGGTCGCAC TTCTTGCAAC GATCACCGCT TCGGCAGTCT 6780
6049 CCCGTGGAAT GCTCGTGAGC GAGGCAATTG GCGCTAGTAT GTTGGTAATG AGGACTGCTC 6840
6050 GCAAACGCTT TTCAGCGCTG AGCTTTAGGA ACCTCGCGCA CGTCCGAAGA GGATGGATTA 6900
6051 CCGCGGCAGA CTCGGCATCG GTAGGATTTA ATACCTCGGG TACGTCTGCT CTCCACGGCA 6960
6052 CGACCTGCGT GCGTTTTGTT GACGAGGAGC CATGTGCGCG TAGTCGAATG TCGAAAGGAG 7020
6053 ATCGAAAACG AAATGAAAAA TAACGGATGA TTAGTGATAG TGAACTACAA CTAAGGACGA 7080
6054 GAGGAGAGAC CTATTATTGT GGAGATTCGG AACTCCGTCG GCAAAAGCAC CTTTTTTGCC 7140
6055 ACTGGACGTT TAATAACTCC ACGTGCAGTA CGGATGTTTA CTACACGACG TTGCCGTCAG 7200
6056 CTCCTGGGAA AACAGACTCA ATTCTGCCGA GCCGCCACTC ATTAGAGGGC AAGTTGTCGT 7260
6057 CCTTGATGAC GACTGTTGAG TTACGGGGTT TGGACTGTCA CCGTCTCCGC TCCCTCTTAC 7320
6058 GTTCTCCACT CCCTCTTACG CTCTCCCGCT CTTCACCACA GAGTCTCCGA GGAGTCTCTG 7380
6059 GCGCTTGGGA GAACCCAACG CATTAGAATA AGTTTTAGTG TAAAACTAAC CACGATCAAT 7440
6060 AAAACATACG CCCGGTGCCC GCGCTAATTC TACAAGTCTT CGAGTGTTTT TTCGAGTGGT 7500
6061 CTTTTTTTCA GCAAACTAGG AACTTTCCAG GACCAGCACC CCCCATCACC CCAACAACGA 7560
6062 CCATGTCATC GATGGCGTCG CCAACCGGCG CCAACCCTGC AAGCAGCTTC GGCCTCGTCC 7620
6063 CAACGTTCCC GCCGGCACAA TCCGCCAACT CAGCGTAGGA GTTCACCGCC ACGACGACCG 7680
6064 GAATCGACGA CGCCAGGCCC ATCACTCTCG TCGCCGCTGC AACGCCACAG CGTGAACATC 7740
6065 CTTCCCACAG CGCTGGTCAA GATGGAGACC GGGACGAAGA CCTTCAGACC GCAGCACTCA 7800
6066 TCGATCCGTG CAGCCCCATG AGCTGCATCG ACGCTTCGTT GGCGTCAGCC TTTAAGCTTT 7860
6067 CGATGACCAA TGTTGGCGAC GAGAAGGTCT GCACGACGAC GATTCGCTCC AGGATCGACG 7920
6068 CGAACACGAA GCTCGAGGTC GTGCTCAAGA TCGAGCCCAG GGTGCGGATC CGTACACCTG 7980
6069 TCCGGGCATT GAGCGACACC GTAGTGTCCA AGTACAGGGA CATCATGCTG GCGGATGACG 8040
6070 GGTTCCATCG GCCTGCTACC GTATCCATGG TCTTAGGAGC AGACATTTAT CCTAAGGTTA 8100
6071 TCCAATCCGG ATTCCTGACC TTCGACGAGG GAATGCCGGT CGCTCAAAAG ACCGTGTTTG 8160
6072 GGTGGATCGT GTCCGGTGCC TGCAGCTTGC CTAGATGGCT ATGTTGCAAC CCCAGTGATT 8220
6073 GCAAGGGGGG CGGAATGTTC AAGTTACGCT CACCCGCTGT CACCCGCTGT CACCCGCTCT 8280
6074 CCGCTCCCTC TTACGCTCTC CCGCTCTTCA CCTCAGAGTC TCCAAGGAGT CCTCGGGCTT 8340
6075 GGGATAGCCT AACTAATTAG AATAAGCATC AGTGTAAAAA CTAACCACGC TGAATAAACA 8400
6076 TACGCCCGGT CGCCGCGCAA TTACGAAAAG TCTAGTGTTT GCTTTCCTTC GAGTGTTTCT 8460
6077 TTTCAGCATA TTTGAATTCA GGACAGCCAT CCCCCTACAT CCCAACA 8507
6078 //
6079 ID ROXELEMENT standard; DNA; INV; 4740 BP.
6080 XX
6081 AC AF237761;
6082 XX
6083 XX
6084 DR FLYBASE; FBte0001160; Dmel\X-element.
6085 XX
6086 SY synonym: BS2
6087 XX
6088 FT source AF237761:1..4740
6089 FT SO_feature CDS ; SO:0000316:322..1827
6090 FT SO_feature start_codon ; SO:0000318:1..3
6091 FT /name="Dmel\X-element\ORF1"
6092 FT /db_xref="FLYBASE:FBgn0041613"
6093 FT /db_xref="SPTREMBL:Q9NBX5"
6094 FT /db_xref="NCBI_PROTEIN:AAF81410.1"
6095 FT /translation="MNTLNETAAADESLDTAFLSSPQCAAPQRFQKIKRKSRASPETER
6096 FT KKPKSTIGKQGENPSATEPRYGGNSNRFGLLAHLTADKQVGNEIGDLYDQPSTSHQAAI
6097 FT AAAKRDAASAGTTSSAKRAQSKPPPIVMEGVDDVYLMMQSIENIVDLEKIEARASMSGV
6098 FT LRLYAADANTFRTIVNWLEIEEYEFHCYQLKEDRPYRVCVKGLHHSTLHHQIKDELEKI
6099 FT GHKVLDIHTPLRRNEPGTSKASPVNMFFLNIAAAANNKEILAVKALCHMRVVIEPLRKR
6100 FT NAIVQCHRCQQIGHTAKYCRKAHICVKCAGEHPAKDCTRPRIELCTCYNCGGQHPANYK
6101 FT GCSKLQAFLQRSRPRSGVAGRTEVSDRPTPRGLAGGKEIPSSRGGISYADVARGSIHHK
6102 FT QPMSLTHQQQKQKQQPYDGSPSRQRSRSRTRASRGTLQRSTDASSSIEAILQTLNENIN
6103 FT SLRSIQEKQMELMMMMMKQQQQQSHQQGQIINLLTALQARQAP"
6104 FT SO_feature CDS ; SO:0000316:1827..4553
6105 FT SO_feature start_codon ; SO:0000318:1..3
6106 FT /name="Dmel\X-element\ORF2"
6107 FT /db_xref="FLYBASE:FBgn0041612"
6108 FT /db_xref="SPTREMBL:Q9NBX4"
6109 FT /db_xref="NCBI_PROTEIN:AAF81411.1"
6110 FT /translation="MMPLRILVWNADGVSTKLPEVECFVRRHEIDVLLLSETHCKGAET
6111 FT PKLFGFVAYTANDPSGGNAKGGAAILIKNSLAHFPLTPIATAKVQLAPAVIETALGPIS
6112 FT FGAVYCPPRFAWTTDEFKDILEEFQTKFIVAGDWNASHWLWGAGRSNQRGIALANLVLN
6113 FT SEVDSLATGGPTRYPYGCRGSPGYIDFALTKGVLGIHANISAVVELSSDHLPLVITLDA
6114 FT GAISYPKMERLITRRTNLEVFQSQLESTLPLNTAINSGQDVDDAIELLTNNIKSAARLA
6115 FT TRSISRQPAADRIPIPREILLLIAEKRRLRTRWMRSRHPSDKTEWNRALSRLRCALVLH
6116 FT KAAWFDERLANTGVESEATHSLWKATRAIKRRCTRKAPLVDSNGTWCRTDLGQAEVFAA
6117 FT HLAERFQPFKLASLQQVEETQDQLNQALQMDMPITPFEPCEVAEVIVRQSNNKAPGHDV
6118 FT ICNATLKALPRQAILYITLVFNAIVRLQYFPYQWKLGIISMIHKPGKPEREPASYRPIS
6119 FT LLPSISKVFERLIAVRIVSIMEAQGITPEHQFGFRAGHCTVEQLHRVVEQILTAYDSKE
6120 FT YCNSLFLDIREAFDRVWHIGLQLKIKQTLPAPYFGLLKSYLEGRRFAVRFHSAISTEHN
6121 FT VAAGVPQGSVLGPLLYCLYSHDMPQPDVSLYGKSMLATFADDVCVTYRSRCEHDAADGI
6122 FT QDFAYRFSEWARRWNIGINSSKSNNVCFTLKRRTPPPVYIEEVPVPQPNAAKYLGVLLD
6123 FT RRLTFSKHVTDIRTRLRAKVAKHYWLLSSRSKLSLSNKLTIYKQILAPNWKYGCQIWGL
6124 FT ACDSHIKRIQAIQNKVARLITGCEWFVRNTTLHRDLKLATVFDEINKHSSRYHDRLERH
6125 FT RNRLASALNRSRPPRRLNRRQPRDLITRSPLTRVRRS"
6126 XX
6127 SQ Sequence 4740 BP; 1336 A; 1215 C; 1183 G; 1006 T; 0 other;
6128 AATGTTAAAT AAAGGTTCGT GTCTAACAAT ACGCACCTGA CAAAGTGGAT TAAGTGAAAT 60
6129 TAGTTTTCGC GGTAATAAAC TTATGGACAA GACCAGAATA CTGGCACACA TAGCAAATAG 120
6130 TGACCCCCCA AGTCACTAAC AGTGAAATAA TAGTGAAACG AAAACATTTT CATTCAAAAA 180
6131 TACAAAGTTA AGTTTCTCGA ACTGGGGCTC CGCTGCCCAG CTGCCACGCG ATCGCACAAA 240
6132 CAGCTGTTTG CGAGCTTAAA GCTTTCTATC CCAGGGTTCA AGTTTTGGCT AGAACCCTGG 300
6133 TGATTTGGTG CACACTTCAA TATGAACACT TTAAATGAAA CCGCTGCGGC TGATGAATCG 360
6134 TTGGATACTG CGTTTCTCTC GAGCCCCCAA TGTGCTGCCC CGCAGCGCTT TCAAAAAATA 420
6135 AAGCGAAAGT CTCGTGCTTC TCCGGAGACT GAAAGGAAAA AACCCAAATC AACCATCGGC 480
6136 AAACAAGGGG AAAACCCTTC GGCTACAGAA CCTAGATATG GCGGCAATTC AAACCGATTT 540
6137 GGTTTACTTG CGCATCTCAC AGCTGACAAA CAAGTAGGCA ATGAAATTGG CGATCTGTAT 600
6138 GACCAGCCCA GTACCAGTCA TCAAGCTGCA ATTGCTGCCG CTAAGCGGGA TGCAGCCTCC 660
6139 GCTGGTACCA CTAGCTCAGC CAAAAGAGCG CAGTCCAAAC CACCTCCTAT AGTAATGGAG 720
6140 GGAGTGGACG ACGTATACCT GATGATGCAG AGCATCGAAA ATATAGTGGA CCTAGAAAAG 780
6141 ATTGAGGCTA GGGCGTCAAT GAGCGGTGTC CTAAGGCTTT ACGCGGCTGA CGCTAATACA 840
6142 TTTCGCACCA TAGTGAACTG GCTCGAGATC GAAGAGTATG AGTTCCACTG CTACCAGCTT 900
6143 AAAGAGGACA GGCCTTACAG GGTATGCGTG AAAGGCCTGC ACCACAGTAC GCTACATCAC 960
6144 CAAATCAAGG ATGAGCTGGA AAAGATCGGG CACAAGGTTC TCGATATTCA CACACCGCTT 1020
6145 AGGCGAAACG AACCGGGTAC CTCAAAAGCG TCGCCAGTCA ATATGTTCTT CCTAAATATT 1080
6146 GCTGCTGCGG CAAACAATAA GGAGATCCTG GCGGTAAAGG CACTATGCCA TATGAGAGTA 1140
6147 GTTATTGAGC CTCTCCGCAA GCGTAACGCT ATTGTCCAGT GCCATCGTTG TCAGCAGATT 1200
6148 GGCCACACAG CCAAATACTG CCGTAAGGCC CACATTTGTG TGAAATGTGC CGGCGAACAC 1260
6149 CCAGCCAAGG ACTGTACCAG GCCACGCATC GAGCTGTGCA CTTGCTACAA CTGTGGCGGC 1320
6150 CAGCATCCTG CAAACTATAA AGGTTGCAGC AAGCTACAAG CGTTCCTGCA GCGATCCAGA 1380
6151 CCCAGAAGTG GAGTGGCTGG AAGAACAGAA GTAAGCGATC GACCAACTCC ACGGGGCTTA 1440
6152 GCTGGAGGTA AGGAGATCCC CTCTTCTCGA GGCGGAATAT CTTATGCAGA TGTGGCTAGA 1500
6153 GGGTCCATTC ACCACAAGCA ACCAATGAGC CTGACGCACC AGCAACAGAA GCAAAAGCAA 1560
6154 CAGCCCTATG ATGGAAGCCC CAGTCGTCAA AGGAGCCGCA GCCGGACAAG GGCGTCTAGG 1620
6155 GGTACACTCC AGCGCTCGAC GGATGCTAGC AGCAGCATTG AAGCCATCCT GCAGACGCTT 1680
6156 AATGAGAACA TTAATTCTTT GCGCTCGATT CAAGAGAAGC AAATGGAATT AATGATGATG 1740
6157 ATGATGAAGC AACAGCAACA ACAGTCACAT CAGCAGGGGC AGATTATCAA TCTGCTCACT 1800
6158 GCTCTCCAAG CGCGTCAAGC GCCATAATGA TGCCGCTGCG CATCCTAGTG TGGAACGCCG 1860
6159 ACGGCGTATC CACGAAGTTG CCTGAAGTAG AGTGCTTCGT GCGACGTCAC GAAATCGATG 1920
6160 TATTACTGCT CAGCGAGACA CACTGCAAGG GGGCAGAGAC GCCTAAGCTA TTCGGATTTG 1980
6161 TAGCCTACAC TGCCAATGAT CCGAGTGGTG GCAACGCCAA AGGCGGAGCA GCTATCTTAA 2040
6162 TCAAAAATAG CCTTGCCCAC TTTCCGCTAA CACCAATAGC CACTGCCAAG GTGCAACTTG 2100
6163 CGCCGGCGGT TATTGAAACG GCACTTGGTC CTATAAGCTT TGGAGCGGTC TACTGCCCAC 2160
6164 CGAGATTTGC ATGGACTACG GACGAGTTTA AGGACATTTT GGAAGAGTTC CAGACGAAGT 2220
6165 TCATTGTTGC AGGCGATTGG AACGCGTCCC ACTGGCTCTG GGGTGCGGGA AGGAGCAACC 2280
6166 AAAGAGGCAT TGCATTAGCG AATCTCGTCC TAAATTCGGA GGTGGACTCG CTAGCAACAG 2340
6167 GAGGACCAAC AAGATACCCG TACGGCTGTA GAGGCTCACC AGGGTACATC GATTTTGCAC 2400
6168 TGACAAAGGG TGTGCTGGGC ATCCACGCTA ACATAAGTGC GGTTGTTGAG CTTAGCTCCG 2460
6169 ACCACCTGCC TCTGGTAATT ACGCTGGATG CGGGGGCAAT ATCCTACCCT AAGATGGAGC 2520
6170 GGCTTATCAC TAGGCGTACT AACCTGGAGG TATTCCAATC GCAACTGGAG TCCACACTGC 2580
6171 CCCTCAACAC TGCCATAAAC TCTGGACAGG ACGTTGATGA TGCTATCGAA CTGCTCACCA 2640
6172 ACAATATCAA GTCAGCAGCT AGATTGGCAA CTCGCAGCAT ATCTCGGCAG CCCGCGGCAG 2700
6173 ATCGAATCCC AATACCCAGG GAGATCCTGC TGCTTATAGC TGAGAAGAGG CGCTTACGCA 2760
6174 CTAGGTGGAT GAGGTCTCGG CACCCGTCGG ACAAAACGGA ATGGAACCGA GCTCTGAGTA 2820
6175 GGCTCCGATG CGCGTTGGTG CTGCACAAAG CCGCATGGTT CGACGAAAGG CTTGCCAATA 2880
6176 CCGGAGTCGA AAGCGAAGCG ACGCATTCGC TGTGGAAGGC CACGCGCGCA ATCAAAAGGC 2940
6177 GTTGCACGAG GAAGGCGCCT CTAGTCGATA GCAACGGGAC ATGGTGTCGG ACCGACTTGG 3000
6178 GACAAGCGGA GGTATTCGCT GCGCACCTCG CCGAGCGATT TCAACCATTC AAGCTTGCCA 3060
6179 GCCTGCAACA GGTTGAAGAA ACTCAGGACC AGCTGAACCA AGCGCTTCAA ATGGATATGC 3120
6180 CAATCACGCC GTTTGAACCC TGCGAGGTAG CCGAAGTCAT TGTGCGCCAG AGTAACAACA 3180
6181 AAGCACCTGG ACATGACGTC ATCTGCAACG CCACATTGAA GGCCCTGCCC AGACAAGCGA 3240
6182 TCCTCTACAT AACGTTGGTT TTCAACGCTA TTGTGAGGTT GCAATACTTC CCTTATCAGT 3300
6183 GGAAGCTCGG GATAATCTCC ATGATCCACA AACCTGGCAA GCCGGAAAGG GAGCCCGCCT 3360
6184 CCTACCGGCC GATCAGTCTC CTCCCTTCAA TTTCGAAGGT GTTTGAGAGA CTGATTGCTG 3420
6185 TCCGGATTGT AAGCATTATG GAAGCCCAGG GGATTACCCC TGAGCACCAG TTCGGTTTCC 3480
6186 GTGCTGGCCA CTGTACTGTC GAGCAGCTCC ATCGAGTCGT CGAGCAAATT CTGACTGCCT 3540
6187 ACGACAGTAA GGAATATTGT AACAGCCTCT TCTTGGACAT TCGAGAAGCG TTTGATCGAG 3600
6188 TGTGGCACAT TGGACTCCAA CTGAAAATCA AGCAGACGCT GCCTGCCCCA TATTTTGGGT 3660
6189 TGCTGAAATC GTACCTGGAA GGAAGGAGGT TCGCTGTGCG CTTTCATTCA GCAATTTCCA 3720
6190 CCGAGCACAA CGTGGCAGCT GGTGTTCCAC AAGGTAGTGT CCTCGGCCCC CTGCTCTACT 3780
6191 GCCTGTATAG CCACGACATG CCGCAGCCAG ATGTAAGCCT TTACGGGAAA TCTATGTTGG 3840
6192 CCACATTTGC CGATGACGTG TGCGTCACCT ACAGGTCCCG ATGCGAGCAC GACGCAGCCG 3900
6193 ATGGTATCCA GGACTTTGCA TACCGGTTCT CGGAATGGGC AAGACGATGG AATATTGGCA 3960
6194 TCAATAGCAG TAAATCCAAC AACGTCTGCT TCACTTTAAA GCGGAGAACG CCACCGCCCG 4020
6195 TCTACATCGA GGAAGTCCCC GTACCACAGC CGAACGCAGC AAAGTACCTT GGAGTGCTTC 4080
6196 TGGATCGCAG ACTCACATTT TCCAAGCATG TGACCGACAT CAGAACGCGC CTACGTGCTA 4140
6197 AGGTGGCGAA GCACTACTGG CTACTTTCTT CGCGCAGTAA ATTGTCGCTA TCCAACAAGC 4200
6198 TGACAATTTA CAAACAGATC CTAGCACCAA ACTGGAAGTA TGGGTGCCAA ATCTGGGGCT 4260
6199 TAGCCTGCGA CAGCCACATC AAAAGGATCC AGGCTATTCA AAATAAGGTA GCAAGACTCA 4320
6200 TCACCGGCTG CGAGTGGTTT GTTCGAAACA CCACCCTGCA CAGAGACCTG AAACTCGCAA 4380
6201 CGGTATTTGA CGAAATAAAC AAGCACTCGA GCAGATACCA TGACAGGCTG GAGCGCCACA 4440
6202 GAAATCGGCT GGCCAGCGCT TTAAACAGAT CTCGCCCACC AAGGAGGCTC AATAGAAGGC 4500
6203 AACCGAGGGA TCTCATTACC CGATCTCCTT TGACAAGGGT CCGCAGAAGC TGACGCTTAT 4560
6204 CTTAAATCCT ATTTGTTATA TGTGATTGTT ATGTAATTGT AGTTAAATTA CTGTAAATTT 4620
6205 GAAAAAGCTA ACTATAGTTA GCCGGCGAGC CCAAATGGGC TGAATTAATA GATAAGAAGG 4680
6206 ACACAAAGGG GCTTCAAGAC TTCCCCGTAT GCCTTAATAA ATAAATTAAA TAAAAAAAAA 4740
6207 //