Unfortunately, due to a lack of commercial feasibility, the SkyBLAST service has been suspended as of December 1st, 2025.
All subscriptions for paid accounts have been paused. For further information or enquiries, please email [email protected]

PREDICTED: Drosophila takahashii uncharacterized protein


LOCUS       XM_070219045            4491 bp    mRNA    linear   INV 09-DEC-2024
DEFINITION  PREDICTED: Drosophila takahashii uncharacterized protein
            (LOC123003496), mRNA.
ACCESSION   XM_070219045
VERSION     XM_070219045.1
DBLINK      BioProject: PRJNA1194641
KEYWORDS    RefSeq; includes ab initio.
SOURCE      Drosophila takahashii
  ORGANISM  Drosophila takahashii
            Eukaryota; Metazoa; Ecdysozoa; Arthropoda; Hexapoda; Insecta;
            Pterygota; Neoptera; Endopterygota; Diptera; Brachycera;
            Muscomorpha; Ephydroidea; Drosophilidae; Drosophila; Sophophora.
COMMENT     MODEL REFSEQ:  This record is predicted by automated computational
            analysis. This record is derived from a genomic sequence
            (NC_091683) annotated using gene prediction method: Gnomon.
            Also see:
                Documentation of NCBI's Annotation Process
            
            ##Genome-Annotation-Data-START##
            Annotation Provider         :: NCBI RefSeq
            Annotation Status           :: Full annotation
            Annotation Name             :: GCF_030179915.1-RS_2024_12
            Annotation Pipeline         :: NCBI eukaryotic genome annotation
                                           pipeline
            Annotation Software Version :: 10.3
            Annotation Method           :: Gnomon; cmsearch; tRNAscan-SE
            Features Annotated          :: Gene; mRNA; CDS; ncRNA
            Annotation Date             :: 12/07/2024
            ##Genome-Annotation-Data-END##
            
            ##RefSeq-Attributes-START##
            ab initio :: 100% of CDS bases
            ##RefSeq-Attributes-END##
FEATURES             Location/Qualifiers
     source          1..4491
                     /organism="Drosophila takahashii"
                     /mol_type="mRNA"
                     /strain="IR98-3 E-12201"
                     /db_xref="taxon:29030"
                     /chromosome="X"
                     /sex="female"
                     /tissue_type="Whole fly"
                     /dev_stage="Adult fly"
                     /collected_by="Originally obtained from EHIME-Fly"
     gene            1..4491
                     /gene="LOC123003496"
                     /note="uncharacterized LOC123003496; Derived by automated
                     computational analysis using gene prediction method:
                     Gnomon. Supporting evidence includes similarity to: 11
                     Proteins"
                     /db_xref="GeneID:123003496"
     CDS             1..4491
                     /gene="LOC123003496"
                     /codon_start=1
                     /product="uncharacterized protein"
                     /protein_id="XP_070075146.1"
                     /db_xref="GeneID:123003496"
                     /translation="MSNEIAVAALARFITVSDRMSHFRATIETPGAAAPSVHTCKVRK
                     EQVRSLWDKAEKEFEACLDTISSLTTDEASDILATLHRKYEYCYSVYEELSVQLSELI
                     DRASSQQPLSSTDNQSAYIPSGCRLPPCDTEVFEGDYLKWPTFRDLFTAVYVNNTRLM
                     FLWDEMNAFLSDRYRTLEAIEDMKQSLGGPSTSKNSQVTKKLNSFEAKVSVKPKSCDL
                     CSKETHPVRLCPRFIQMAVEARENYIKKKQLCLNCFARGHQLRDCSSTHSCFVCRGRH
                     HTLLHRGNPFSNNPSSSGHARPRSDPPSGGSDIPDEHSNVQVCFASGSKAVLLGTAMI
                     DICHLGTHFRARALIDSGSEATFITERLFKLVNLPFRPIQAKVSGLNQTVSAQSTRLC
                     HFAIRSPTKPGLQLDTAAYVLPELAGRLPSHSIPQDILRDLPNLQWADPTFLQSSQID
                     VLIGADILPSVLLSGTKTNICGSLFGQETIFGWVLTGPVSMSTSNRVSAFTTQITKTS
                     EASLDKLLTKFWEVEDLPSKMVKESDSVCESHMREVSPTHNSPNYYLPHHAVIKPEST
                     TTKLRVVFNASSPSANGTSLNDVLHAGPVLQSDLTIQILKWRYFKYVFSADITKMYRQ
                     IWVDPKHTPFQRILFRNKEGDIRDYELKTVTFGVNCAPYLAIRVLKQLADDVVQQFPK
                     ASHIIRNFMYVDDVLAGSNSQQEAQLAIQELVTALNSAGFPLRKWTSNHKGVLKDIPN
                     EHLLHSEFLNIDAESTAKTLGIRWRATTDEFYFVPPEISVKSSYTKREVLSQIAKLFD
                     PAGWLAPFIVRAKTFMQEIWLQELGWDDNLPDEMSHRWQVFLQSYSDLDQIRIPRWVG
                     YQPQVKIELHGFCDASQKAYGAALYVRVEVGQQILTNLARVAPVKTVSLPRLELCGAL
                     LLADMASTILPNMLSKSSAIFCWTDSTIVLAWLKKPACSWTTFVANRVTKIAQATKIE
                     NWSHVRSEHNPADLASRGVSLQELGDSNLWWHGPQWFQLPKLQWPETSDPHPVTELEQ
                     RAVKVHFVKLPADDFLDRFSRLDKALRVLAYVQRFLNRCRKAPVSPDKQLSNREIREA
                     ERTYIILAQREEYALELRLLRSKRSIPASSPIANLFPFIDQQGLLRACGRLTASKVLQ
                     YDERHPVLLPYSCRLSRLLVQFTHQITLHGGNQLIVRLMRSKYWIPKVKNLVKGVVNS
                     CNMCTIYKKRLQTQLMGDFPTDRASFSRPFTYTGVDYAGKTIQGARRGCPQRVHSDNG
                     KTFVGASSLISRDFTQALKESVTNAYSHQGLVWRFIPPGAPHMGGLWEAGVKSFKTLF
                     NKSTSARKYTFEELSTLLAKIEACLNSRPLSPMSEDPTDLLALTPGHFLIGGPLLSTA
                     EPAIKGEAQSIINRWQHLKAQHQQFSSRWKEEYLKELHKRNKWLSPSRNLQVDDMVVI
                     KDDNLPSNDWRLGRIVAAIPGADTRVRVVDILTSRGTIQRPVHKLVLLPMEDKAISAL
                     PQ"
     misc_feature    547..>834
                     /gene="LOC123003496"
                     /note="Arginine methyltransferase-interacting protein,
                     contains RING Zn-finger [Posttranslational modification,
                     protein turnover, chaperones / Intracellular trafficking
                     and secretion]; Region: AIR1; COG5082"
                     /db_xref="CDD:227414"
     misc_feature    1018..1458
                     /gene="LOC123003496"
                     /note="Cellular and retroviral pepsin-like aspartate
                     proteases; Region: pepsin_retropepsin_like; cl11403"
                     /db_xref="CDD:472175"
     misc_feature    order(1048..1050,1054..1056,1060..1062,1129..1137)
                     /gene="LOC123003496"
                     /note="inhibitor binding site [active]"
                     /db_xref="CDD:133136"
     misc_feature    1048..1056
                     /gene="LOC123003496"
                     /note="catalytic motif [active]"
                     /db_xref="CDD:133136"
     misc_feature    1048..1050
                     /gene="LOC123003496"
                     /note="Catalytic residue [active]"
                     /db_xref="CDD:133136"
     misc_feature    order(1129..1140,1150..1161)
                     /gene="LOC123003496"
                     /note="Active site flap [active]"
                     /db_xref="CDD:133136"
     misc_feature    1654..2307
                     /gene="LOC123003496"
                     /note="Reverse transcriptase (RTs) in retrotransposons.
                     This subfamily represents the RT domain of a
                     multifunctional enzyme. C-terminal to the RT domain is a
                     domain homologous to aspartic proteinases (corresponding
                     to Merops family A17) encoded by...; Region: RT_pepA17;
                     cd01644"
                     /db_xref="CDD:238822"
     misc_feature    order(1849..1866,1966..1971,2074..2076,2080..2085,
                     2278..2283)
                     /gene="LOC123003496"
                     /note="putative active site [active]"
                     /db_xref="CDD:238822"
     misc_feature    order(1849..1866,1966..1968,2080..2082)
                     /gene="LOC123003496"
                     /note="putative NTP binding site [chemical binding]; other
                     site"
                     /db_xref="CDD:238822"
     misc_feature    1969..1971
                     /gene="LOC123003496"
                     /note="putative nucleic acid binding site [nucleotide
                     binding]; other site"
                     /db_xref="CDD:238822"
     misc_feature    2353..2820
                     /gene="LOC123003496"
                     /note="Pao retrotransposon peptidase; Region:
                     Peptidase_A17; pfam05380"
                     /db_xref="CDD:461634"
     misc_feature    3481..3642
                     /gene="LOC123003496"
                     /note="Integrase zinc binding domain; Region:
                     Integrase_H2C2; pfam17921"
                     /db_xref="CDD:465569"
     misc_feature    <3745..3909
                     /gene="LOC123003496"
                     /note="Integrase core domain; Region: rve; pfam00665"
                     /db_xref="CDD:459897"
     misc_feature    4171..4452
                     /gene="LOC123003496"
                     /note="Family of unknown function (DUF5641); Region:
                     DUF5641; pfam18701"
                     /db_xref="CDD:465838"
ORIGIN      
        1 atgagtaacg aaattgcagt tgcagccctc gcgcggttta tcacggtgtc cgaccgtatg
       61 agccatttca gagcgactat agaaactcca ggagctgccg ctccgtccgt ccacacctgc
      121 aaagtccgaa aagaacaagt ccgttcactc tgggacaaag ccgagaagga atttgaagct
      181 tgtctagaca cgatttccag ccttacgact gacgaggcgt cggatatttt ggcgactcta
      241 cacagaaaat atgaatattg ctattcggtg tacgaggagc tatcggttca gctcagcgag
      301 ttaattgacc gagccagttc acagcagccg ttgtcgagca ccgacaatca gtccgcgtac
      361 attccgtctg ggtgccggtt gcctccatgt gatacagaag tatttgaggg agactatctc
      421 aaatggccaa cattcaggga ccttttcact gccgtctacg tcaacaacac acgtctgatg
      481 ttcctatggg atgagatgaa cgcgttcctt agcgataggt atagaacctt agaagccatt
      541 gaggacatga agcagagtct tggtggtccg tcaacttcca aaaattccca agttacgaag
      601 aagcttaact cctttgaagc caaagtgagt gtcaaaccaa agagttgcga tttgtgctct
      661 aaggagactc acccagtgcg gttgtgccct cgcttcattc agatggcagt agaggcgcgg
      721 gaaaactaca taaaaaagaa gcagttatgc ttgaattgct tcgcgagagg ccatcagctc
      781 cgggattgtt ccagtacgca cagctgcttt gtatgccgag ggagacatca cacgcttttg
      841 catcgaggca acccattttc caacaatcca agttcctctg gacatgcgag acctagatcc
      901 gatcctccgt cgggaggctc agacattccg gatgaacact caaatgtaca agtctgtttt
      961 gcctcgggct caaaggcagt tctgttgggc acggcaatga ttgatatttg ccacctcggc
     1021 acccacttcc gagcacgcgc tttgatcgac tcgggatctg aagcgacgtt cataacggag
     1081 cgtcttttca agttggtcaa tctgccgttc cgccccattc aagctaaagt gtctggttta
     1141 aatcagaccg tttctgccca gtcaacaagg ctttgccatt tcgccattcg ttctcctact
     1201 aagccgggcc tgcagttaga caccgcagcg tatgttctgc cagaactagc aggcagatta
     1261 ccctcacatt ccattccaca agatatcctg agagatttgc caaaccttca atgggcagat
     1321 cccacatttc tccagagttc ccagatagac gttcttatcg gagctgatat tcttccatcc
     1381 gtgctgctga gtggcacaaa gaccaacatc tgcggatctc tttttgggca agagaccatc
     1441 ttcgggtggg tgctcactgg tccagtgtcc atgtccacga gcaaccgagt ctcagccttt
     1501 acgactcaaa ttacaaaaac aagtgaggca tccttagaca aacttcttac gaagttttgg
     1561 gaggtggaag atctaccatc aaaaatggta aaagagtccg attccgtctg cgaaagccat
     1621 atgagagagg tttcgcccac tcacaattct ccaaactact acctcccaca ccatgcggtt
     1681 ataaaacccg aaagcacgac cacgaaactc cgggtggtat tcaacgcttc cagcccgtca
     1741 gcaaatggga ctagcttgaa cgatgtgctt catgccggtc cagtcctcca atctgactta
     1801 acaattcaga ttttaaagtg gcgctatttc aagtatgttt ttagtgcaga catcacgaaa
     1861 atgtataggc agatctgggt cgatccaaag cacacgccct ttcaaaggat tcttttccga
     1921 aacaaggaag gtgacattcg agattacgag ctgaaaaccg taacattcgg tgtcaattgc
     1981 gcgccctatc tcgccatccg agtgctgaaa cagctggctg atgacgtcgt tcagcagttt
     2041 ccaaaagcca gtcatataat ccgcaacttc atgtatgttg atgacgtttt agcaggatcg
     2101 aattctcaac aagaagctca acttgccatc caggagttag taaccgcttt gaattcggcc
     2161 ggttttccgc ttagaaagtg gacttccaac cacaaggggg ttttaaagga catcccaaat
     2221 gagcatcttc tccattctga gttcctaaat attgatgccg aaagcacagc caaaaccctc
     2281 ggcattcgtt ggagagcaac caccgacgag ttctacttcg tgcccccaga aatatccgtc
     2341 aagtcctcct atactaaaag agaagttctc tcccagatcg caaagctatt cgatcccgct
     2401 ggatggcttg caccgttcat cgtccgggcc aaaactttta tgcaggagat ctggctgcaa
     2461 gagttaggct gggatgacaa ccttcccgac gaaatgagcc atagatggca agtgttcctg
     2521 caaagttatt ccgacctcga tcaaatccgt attccgagat gggtcggtta ccagccccag
     2581 gtaaaaatcg agcttcacgg gttctgtgac gcttcccaaa aagcctatgg ggcggcgctg
     2641 tatgtcaggg ttgaagtcgg tcagcagata ttgactaatc tggcccgggt tgcccctgtg
     2701 aaaactgtat ctctcccccg actcgagcta tgtggtgccc tattgctggc agatatggca
     2761 tctaccatcc ttccaaatat gctgtcaaaa agctctgcga ttttctgctg gacagattct
     2821 accattgtcc tggcatggtt aaagaaacca gcctgctcct ggaccacatt cgtagccaac
     2881 cgcgtaacca aaatagctca agctacaaag attgagaatt ggtcacatgt gcggtcagaa
     2941 cacaatcctg ccgacctagc tagtcgcggc gtgtccctgc aagagctggg cgatagcaac
     3001 ctctggtggc atgggcccca gtggtttcaa ttgcccaaac ttcaatggcc agaaacttcg
     3061 gatccacacc cagtcacgga attagagcag cgcgcggtga aggttcattt cgtaaagctc
     3121 cccgctgatg atttccttga ccgtttttcc agactagaca aggctttacg agtcctagct
     3181 tacgtccaaa ggttcctaaa tcgctgtcgt aaggctccgg taagtccgga taagcagctc
     3241 agtaatcggg agatccggga ggctgagagg acctacataa tacttgccca gcgtgaagag
     3301 tacgcgctcg agcttcgatt gttacgaagc aaaagatcca tacccgcatc aagcccaatt
     3361 gctaatttgt ttccatttat agaccaacag ggactcttaa gagcatgtgg ccgcttaact
     3421 gcctccaagg tcctgcagta tgacgagcgc catcctgtat tactcccgta cagctgtcgg
     3481 ttatctcgtc ttcttgtcca attcacgcac cagattacgc ttcatggcgg caaccaattg
     3541 atagtgcgcc tgatgcgatc caaatattgg attcctaaag tcaagaatct ggtaaagggc
     3601 gtggtgaatt catgcaatat gtgcaccatt tataagaaaa gactgcaaac ccaattgatg
     3661 ggcgattttc cgactgatcg agcctctttt tccaggccat ttacttacac cggcgtcgat
     3721 tacgccggta aaactataca gggagctaga agaggttgtc ctcagcgggt ccattccgac
     3781 aacggcaaaa cctttgttgg cgcctcaagt cttatttccc gtgactttac gcaagcacta
     3841 aaggagtcag tgaccaatgc gtatagccat cagggactcg tgtggcgttt cataccccca
     3901 ggagctcctc atatgggagg cctgtgggag gcaggagtaa agagttttaa aacgctgttt
     3961 aacaaatcca cgtccgctcg caagtataca ttcgaagagc tttccacgct tctggcaaag
     4021 attgaagcct gccttaattc cagaccactc tctccaatgt cagaggaccc gacagacttg
     4081 ctggcactga cgccaggcca ttttctgatc gggggaccgt tgctttccac ggcggagcct
     4141 gcaattaaag gcgaagccca gtcaatcata aatcgatggc aacatctcaa ggcccagcat
     4201 caacaattta gttcgcgatg gaaagaagag tatctaaagg aactccacaa gcgcaacaag
     4261 tggttgagtc catccagaaa tctgcaagtc gacgatatgg tagtcatcaa ggacgataat
     4321 ttgccatcaa atgactggcg gctcggcagg atcgtagctg ctatcccagg agctgatact
     4381 agagtacgcg tcgtagatat tcttacttct cgtggaacca tccaacgtcc ggtccacaaa
     4441 ctagtacttc ttcctatgga agacaaggca atctccgcac ttccgcaata a