Dbfetch

ID   X07656; SV 1; linear; genomic DNA; STD; INV; 4648 BP.
XX
AC   X07656;
XX
DT   16-JUL-1988 (Rel. 16, Created)
DT   12-SEP-1993 (Rel. 36, Last updated, Version 6)
XX
DE   Drosophila melanogaster retrotransposon 1731 sequence
XX
KW   gag gene; pol gene; retrotransposon.
XX
OS   Drosophila melanogaster (fruit fly)
OC   Eukaryota; Metazoa; Ecdysozoa; Arthropoda; Hexapoda; Insecta; Pterygota;
OC   Neoptera; Holometabola; Diptera; Brachycera; Muscomorpha; Ephydroidea;
OC   Drosophilidae; Drosophila; Sophophora.
XX
RN   [1]
RP   1-4648
RA   Fourcade F.;
RT   ;
RL   Submitted (16-MAY-1988) to the INSDC.
RL   Fourcade F., VACNRS 1135 , Universite P. Et M. Curie Bat. A. 5 etage, 7
RL   Quai St. Bernard, 75005 Paris, France.
XX
RN   [2]
RX   DOI; 10.1093/nar/16.13.6113.
RX   PUBMED; 2456522.
RA   Fourcade F., D'Auriol L., Galibert F., Best-Belpomme M.;
RT   "Primary structure and functional organisation of drosophila 1731
RT   retrotransposon";
RL   Nucleic Acids Res. 16(13):6113-6125(1988).
XX
RN   [3]
RP   1-4648
RX   DOI; 10.1093/nar/19.20.5689.
RX   PUBMED; 1658740.
RA   Ziarczyk P., Best-Belpomme M.;
RT   "A short 5' region of the long terminal repeat is required for regulation
RT   by hormone and heat shock of Drosophila retrotransposon 1731";
RL   Nucleic Acids Res. 19(20):5689-5693(1991).
XX
DR   MD5; aef492175fa506af1daa2bd40f807343.
DR   EuropePMC; PMC1074743; 15817569.
DR   EuropePMC; PMC1383729; 12045146.
DR   EuropePMC; PMC155295; 11875027.
DR   EuropePMC; PMC1553205; 16882972.
DR   EuropePMC; PMC2996953; 20618961.
DR   EuropePMC; PMC311128; 11544196.
DR   FLYBASE; FBgn0012032; 1731\RTase.
DR   FLYBASE; FBgn0020768; 1731\gag.
XX
FH   Key             Location/Qualifiers
FH
FT   source          1..4648
FT                   /organism="Drosophila melanogaster"
FT                   /mol_type="genomic DNA"
FT                   /db_xref="taxon:7227"
FT   repeat_region   1..336
FT                   /note="5' LTR"
FT   regulatory      110..116
FT                   /note="pot. TATA-box"
FT                   /regulatory_class="promoter"
FT   CDS             431..1252
FT                   /note="gag polypeptide (AA 1-273)"
FT                   /db_xref="GOA:V9H1H4"
FT                   /db_xref="InterPro:IPR001878"
FT                   /db_xref="InterPro:IPR036875"
FT                   /db_xref="UniProtKB/TrEMBL:V9H1H4"
FT                   /protein_id="CAA30502.1"
FT                   /translation="MSNLYQIDKLEDGSYETWSIQMRSVLVHACLWKVVSGESVKPEVD
FT                   TGGAWQSQDEKALATIILSVKSSQLGYVKGCLTAAEAWKVLQDVHQPKGPLRTVMLYKK
FT                   LLSKRLLEGQSISSHIKEFKEIFDALDAVEIGITEKLRSVVLLSSLPESFENFVVAIET
FT                   RDDVPLFDALCIKLIEEDTRRGGAEQQREKQTESAKAFTAVHKPQAPAREARPSAKKRK
FT                   DVVCYNCGERRHFKANCRREKVNKESATQEQCSLLNALDSGGFWQNTVVSR"
FT   CDS             1203..4151
FT                   /note="pol polypeptide (AA 1-982)"
FT                   /db_xref="GOA:V9H104"
FT                   /db_xref="InterPro:IPR001584"
FT                   /db_xref="InterPro:IPR012337"
FT                   /db_xref="InterPro:IPR013103"
FT                   /db_xref="InterPro:IPR025724"
FT                   /db_xref="InterPro:IPR036397"
FT                   /db_xref="InterPro:IPR039537"
FT                   /db_xref="UniProtKB/TrEMBL:V9H104"
FT                   /protein_id="CAA30503.1"
FT                   /translation="MRWIVVVFGKTQWCLDSGATSHMCCDRSVFTEFEEHTEKISLAGN
FT                   GFLLAKGIGTVKLKTDLCTLVLNNVLFVPDLNGNFMSVSRAAQYKCFVNFGPHYADVIQ
FT                   EGERILRVMRAGNLYMFQGKHNSCFAAVDADGSLWHKRNGHLNTSSLQEMVRKKMVYGV
FT                   EKVVFKPDAVCKTCMLAKIHVQPFPKTTRSRAEELLDMIHSDLCGPFSTPSLAGSKYFL
FT                   TFIDDKSRRIFVYFLRKKDEVFTKFVEFKKLVERQTGRKIKCIRSDNGGEFVNNVFDDY
FT                   LKAHGIARQLTIPHTPQQNGVAERANRTLVEMARCMLLQSELGEALWAEAINTAVYLRN
FT                   RSTSRALQSKTPMEEWTGKIPAVSHLRVFGAIAVALDKGVHKGKFESKGKEYRMIGYSI
FT                   AAKGYRLFDKEKRCVIEKQDVLFDESGSLVNHGNTIEFQFPATDDPEPQSDSNAREGDD
FT                   TEPVGSSDDYESAAEAEEAEVHVGPGRPKIVRTGRPGRPKKQYNVLGVLMASDVEIPKS
FT                   YEEAINSQYSAKWEEAMGLEYKALLANETWKLADLPRNRRCVACKWVYSLKRDVSGRIE
FT                   RFKARLVAKGCSQKFGVDYFETFSPVCRLESVRLILALAAEMQLYLHHMDVCTAYLNSE
FT                   LKDTVYMKQPQGFTDAANPDQVLLLRKAIYGLKQSGREWNSKLDGVLKDLGFKACNHEP
FT                   CLYQQSGQGNLMLILVYVDDLILACQSREDMEDLKAKISESFECTDKGPLHLFLGMEVQ
FT                   RDGDLGEITLGHSQYIKELLRDYGSENCRPATTPLDAGHQVLCAGEQCQKVDAGQYQST
FT                   IGELMWLGLTTRPDMLHSVAKLAQRNQDPHSEHMVAVKHILRYLASTVDVKLHYQKCGQ
FT                   AFTGFVDADWGGDRLDRKSYTGYVFFLSGGPVSWRSEKQQSVALSSTEAEYMALTTACK
FT                   EAIALRRLIVEIVCGDLKTPTVMHGDNLKCAAQLAKNPVHHSRTKHIDIRYH"
FT   repeat_region   4313..4648
FT                   /note="3' LTR"
XX
SQ   Sequence 4648 BP; 1316 A; 880 C; 1268 G; 1184 T; 0 other;
     tgttgaatat aggcaatgcc cacatgtgtg ttgaatatag gcaatttcca catgtgcata        60
     tgtaattttg tatgagaaca tacatacata cacatgaact gtatgtatgt atatatatta       120
     gcaaataagc agccgcatga aggtggcatt tttatgtgta tcagtttcag tttcaaataa       180
     aacttcttcg tgttcggaca cgcggctcaa gactttttat ttcgcgttta ctctttcagc       240
     ctttgctctc aattcgctga gtttgggtga agattaggat cttcccatta tgattgtcag       300
     tgttccacac ttggagcacc ttttcaataa acaacaggtt aatgggccca gcgccctagg       360
     agctgcctaa aggagaaacg tgtagtgaaa ctcaggagtt agattttgga gtctactcaa       420
     gattgccgga atgagtaacc tgtatcagat cgataagctg gaggatggat cctatgaaac       480
     gtggagcatc cagatgcgtt cagtgttggt gcacgcatgt ttgtggaagg tggtttcagg       540
     agagtccgtg aaacctgagg ttgatactgg aggtgcttgg caatcccaag atgaaaaagc       600
     attggccacg atcatcttga gtgtgaagtc ttcgcaactt ggttatgtaa aagggtgtct       660
     cactgcggct gaggcatgga aagttttaca ggatgtccac cagccgaaag ggccgttacg       720
     aacggtcatg ctgtataaga agttgctgag caaacgtctg ttggaagggc agagtatatc       780
     gtcacatatt aaagaattta aggaaatctt tgatgccctt gatgcggtgg aaattggtat       840
     caccgagaaa ttgcgcagtg ttgttttgct gtcgagcctt ccagagagtt tcgagaattt       900
     cgttgtcgcc attgagacgc gcgacgacgt gccgcttttc gatgctctat gtataaagct       960
     gatcgaggaa gacacgagaa ggggaggagc ggagcagcag agagaaaaac aaacggagag      1020
     cgcaaaggca tttactgcag tacataagcc acaggcgccg gcgagagaag ctcggccgag      1080
     cgcaaagaag aggaaagacg tagtttgtta taactgtgga gagcgtaggc attttaaagc      1140
     gaactgtcgt cgcgagaaag taaacaaaga gagcgcgaca caagaacaat gcagtttgtt      1200
     aaatgcgctg gatagtggtg gtttttggca aaacacagtg gtgtctcgat agcggggcta      1260
     ccagtcacat gtgctgtgac agaagtgttt ttactgagtt tgaagagcac actgaaaaaa      1320
     ttagtcttgc tggaaatgga ttcctactag caaagggcat aggaacagtg aagctgaaga      1380
     ctgatttatg tactctggta ttgaataacg tactcttcgt cccagatttg aacggcaact      1440
     ttatgtcagt cagccgtgca gctcagtata aatgttttgt caattttgga ccacattacg      1500
     ctgacgtcat tcaggaaggc gagcgaatac tgcgtgtaat gagagctggt aatttatata      1560
     tgtttcaagg gaaacataac agttgttttg cggccgttga tgctgatggt tcactatggc      1620
     ataaaaggaa tggccatttg aatacaagca gcctacagga gatggtgagg aagaagatgg      1680
     tgtacggtgt tgaaaaggtc gttttcaaac cagacgcagt atgcaagacg tgcatgctgg      1740
     caaaaatcca tgtgcaacca tttccgaaga caacgaggag cagagctgag gagctgttgg      1800
     atatgatcca ttcagacctg tgcgggccat ttagcacacc gtcacttgct ggatcaaagt      1860
     actttctcac tttcatagac gacaagtcca ggcggatttt tgtatatttc ttgcggaaga      1920
     aggacgaagt cttcactaag tttgtcgagt ttaagaaact ggtcgagcga caaacaggta      1980
     gaaagataaa atgtatccgg agcgataatg gtggtgagtt cgtcaataat gtttttgatg      2040
     actatttaaa ggcacatggg atcgctagac agctgactat tccacacact ccccaacaaa      2100
     atggagttgc agaacgagcc aaccgcacgc tagtagaaat ggctaggtgc atgttgctgc      2160
     aatcggagtt gggtgaggct ctatgggctg aggcgataaa cactgcggtg tatctgagga      2220
     accgatcaac gagcagagca ttacaaagca aaacccctat ggaagagtgg accggaaaaa      2280
     taccagcagt gagccacttg agggtttttg gtgccatagc agtggcattg gacaaaggag      2340
     tccataaagg caaattcgaa tccaaaggaa aggaatatcg tatgattgga tattcaatag      2400
     ctgctaaggg gtaccgtctg tttgacaaag agaagcggtg tgtgatcgag aagcaagatg      2460
     tcctttttga tgagtctggt agtttggtaa atcatggaaa taccattgag ttccagtttc      2520
     ccgcaactga tgacccggag ccgcagagtg attcgaatgc acgggaaggt gacgatacag      2580
     aacccgtggg cagcagcgac gactatgaga gtgcagctga ggcagaagaa gctgaagtac      2640
     atgtggggcc tggacggcca aagattgttc ggacgggcag accagggcgc ccgaagaagc      2700
     aatacaatgt acttggcgtg ttgatggcta gcgacgtcga aattcccaag tcctatgagg      2760
     aggccatcaa ttcgcagtat tctgcaaagt gggaagaggc aatgggcctg gagtacaagg      2820
     cgctacttgc aaatgagaca tggaagctgg ctgacttacc aagaaatcgc cggtgtgtgg      2880
     cttgcaagtg ggtgtattcc ctgaaacgag acgtctctgg tagaattgag cgcttcaagg      2940
     cacgactagt agcaaagggg tgttcgcaga agttcggagt ggactacttc gagacttttt      3000
     cacccgtgtg caggctcgag agtgtgaggc tcattttggc attggcagca gagatgcaat      3060
     tgtacttgca tcacatggac gtatgcacgg cgtacttaaa tagcgagcta aaggatactg      3120
     tgtacatgaa gcagccccaa gggttcacag atgctgctaa tcccgaccag gtgttattgc      3180
     tgaggaaggc aatatacggc ttgaagcagt caggcagaga gtggaactcc aagctcgacg      3240
     gtgttctaaa agacttggga tttaaggcct gtaatcatga accatgtctt tatcagcaaa      3300
     gtggtcaagg taatctgatg ctcatcttag tatatgttga tgatttaatt ctagcgtgcc      3360
     agtcaagaga agatatggag gatctgaaag ccaagatttc agagtctttc gagtgcacgg      3420
     acaagggtcc actgcatttg ttcttaggca tggaggtgca acgagatggc gaccttggag      3480
     aaatcacttt gggccattcg caatatatca aggaactatt gcgggattat ggcagcgaga      3540
     actgtagacc agcgacgaca cctttggatg cagggcatca agttttgtgc gcgggtgagc      3600
     agtgccagaa ggtcgacgca gggcagtatc agtctacaat tggtgagcta atgtggcttg      3660
     ggcttactac cagaccagac atgctacatt cggtggcgaa gttggctcag aggaatcagg      3720
     acccgcattc tgagcacatg gtggctgtga agcacatcct ccggtacttg gcgtcaactg      3780
     tggacgtcaa gctgcattat caaaagtgcg gtcaggcatt taccggcttt gtggatgcag      3840
     attggggagg cgaccgtttg gaccgaaagt catacacagg gtatgtgttt ttcctgtctg      3900
     gcggaccagt atcatggagg tccgagaagc agcagagcgt ggcgttgagc agtactgaag      3960
     ccgagtatat ggctctgacc acggcttgca aggaagctat agctttacga aggctaatag      4020
     tggagatcgt atgcggtgat ctgaagaccc cgacggttat gcatggcgac aacctgaagt      4080
     gcgcagcaca gttagcgaag aacccggttc atcactctag gacgaagcac atcgacattc      4140
     gatatcatta gagaagtcat gaaagagggt cacgttgtgt tagagtacac ttctacgaat      4200
     gagatgatag cagacattat gacaaagaat ctttcaaagg gaaagcataa tgggtttatg      4260
     aaaatgttaa atttgtttta atttttgtaa acatgttggc attgaggaag gctgttgaat      4320
     ataggcaatg cccacatgtg tgttgaatat aggcaatttc cacatgtgca tatgtaattt      4380
     tgtatgagaa catacataca tacacatgaa ctatatgtat gtatatatat tagtaaataa      4440
     gcagccgcat gaagctggca tttttatgtg tatcagtttc agtttcaaat aaaacttctt      4500
     cgtgttcgga cgctcggctc aagacttttt atttcgcgtt tactcattcg gcctttgctc      4560
     tcaatgcgct gagtttgggt gaagattagg atcttcccat tatggttgtc agtgttccac      4620
     actgggagca ccttttcaac aaaccaca                                         4648
//